diff --git "a/log/debug_0.log" "b/log/debug_0.log" --- "a/log/debug_0.log" +++ "b/log/debug_0.log" @@ -1,60040 +1,3 @@ -08/30/2021 13:13:56 - INFO - __main__ - Distributed environment: MULTI_GPU Backend: nccl -Num processes: 16 -Process index: 0 -Local process index: 0 -Device: cuda:0 -Use FP16 precision: True - -08/30/2021 13:13:57 - WARNING - huggingface_hub.repository - /home/leandro/codeparrot-small/./ is already a clone of https://huggingface.co/transformersbook/codeparrot-small. Make sure you pull the latest changes with `repo.git_pull()`. -08/30/2021 13:14:00 - WARNING - huggingface_hub.repository - Revision `zesty-violet-116` does not exist. Created and checked out branch `zesty-violet-116`. -08/30/2021 13:14:00 - WARNING - huggingface_hub.repository - M codeparrot_training.py -M requirements.txt - -08/30/2021 13:14:02 - INFO - datasets.load - Some files matched the pattern '*' at /home/leandro/codeparrot-train but don't have valid data file extensions: [PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/11/70/1170a8200f43dfa3902e9d41088229febdf4d7044d9d762dd5809685e5448b11'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/fa/f2/faf2e65a89fda5ec7a00a36b9fd6c4b2429f1249072b838f2a02d5d01fcaeb18'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b1/70/b1705347d88e73a7de652d1486a3eccda92e420e65a58917c88af635baf55ac8'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/17/89/178953ae530dc7960c803bd22a37026f4190b822b95145240537840bfc5a1ad1'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/37/9d/379db3f5d257369fd927b7395599ec2aef5cefcb57811a57281487da9fd58c5b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/8b/d9/8bd964dad421ed624f4bd5e4719e3e28f62d002b350d850e902688c9e9bcfd80'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1b/c7/1bc7cd472751ec9917bf55ce8b05b8ea467453335103f16c4551e94daefdbaf0'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1f/46/1f46dcfefd87339930fa912ec98a56b7b93c2f052d7f452f82c9c3d0043ffa43'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f9/91/f9915d283d95c3316a76922f129897823efd397287916e8f7af88ed7aaf517b0'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4c/10/4c10f31fa342f81c13b27e7ae0761b17729ee82f6e02824361e2cfcc4ab096c1'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/c0/0f/c00f0550d90e881145954ad24df7fdf512ffc3d63c50d2aa0c85774757d8f37d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/c3/d3/c3d3e55004ff21e36332b9612e385ba07c2610b832b4a94cca2d9fda372a9fb4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a2/17/a21791d67c018e486dde68b8956a16b8fa0c54af93dc3c6ec2c669da87861b02'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/9c/75/9c7526f2ec341f2d2483d9db25b2b2e9fe630b21b737fa7ebbc19965c6ee46b1'), PosixPath('/home/leandro/codeparrot-train/.git/logs/refs/heads/main'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/01/87/0187e92041e5ef1abe3190a48330ff50c7d5fc5ed1219c3bcbb465907430d34e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/37/f2/37f2a405d0e8c52b4a51f79b23f135bcb537eb3f61fe8a27a29ab63b74a37671'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/82/4c/824c9524070c36ed317c12b9b0e77f8b9460e8519ba32c6795a5a2e7232d088c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/44/18/44181da41968eab59b99558c2afd4d6f95397bc2b580622a96f2f9fb74f545b2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/5b/66/5b66654660bc52d66f5bf0e6a62e0b65a0dd2499ec316daed0432efb2c7a8d7b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/47/d1/47d1fedd443c4edfca241c00be8984a2157c668726cc06d92ad7e2704cb5c951'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/9c/83/9c83dabc6a7c8a9629093125ff70fc60f594b0b95cb56f2f12d2bd91352367c7'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/08/4a/084a245793d30784f6ae4f8b666624293bdab2d05a5e1eeadf20b7d9db444951'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/45/da/45da5a5e4acd37b6e288eb4045434fb6b4a8d77979ac61c8306ca9eca6d24128'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/44/10/4410ab4420ffe54105620e1f038b0f6b14afa88a8df9dcf63468f6a2c105d770'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/b9/14b9124b7b2ffa27d79dc210ae77b9b970e067ad7d3dc4d3eebc08671b770c16'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ca/00/ca00ed91ba94519faaba619e5eec6498215695acc6b3f760dc056967cefeea80'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f8/3b/f83b75420e369ae1d55e7009effe9f7a05577a31c19a8c02ce7f0b56b5dc8a87'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ba/5a/ba5ad5064f9ef5d1429abd4c4742cf37b56589c060ff3995e5331eb69fb9c1c5'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/prepare-commit-msg.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/0a/03/0a03d68d6dda083d189878113e864c580b9b5572e53d3e1684b93a9996c7699d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/54/10/5410ae89d1cf3ea5325b7e948fd4db3d352e44bbd2a6a5c813f77be0da958c80'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a9/73/a973fc07ce8ae881a878bf92c6c70583c08ea6bdb2ca2583002271f96dab9543'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2b/85/2b85d040d424bde044014147be3c4949a8d2b0e558c4f4c2c65aead5ece2cde9'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e6/f0/e6f0840fa125b6ad771b853937bd215b369bfb815ff521316cf6cb46fba66968'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/23/ee/23eed9f8512ca62c4b9b4fb28a84688ee550b75ec7658209f3cd5d82a2d4aa57'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a0/53/a05359f8e5ca97304272052f806034ebdca89a94f0d052b719b8b81dd8ddd868'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/21/e1/21e166aee17c30af55849b552e2eaa9c0641dc6cb0ac6386bd3f7797d8af2a9b'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-applypatch.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/70/b0/70b01a02ca2810cf2e74a43655979028b31de42c566bc65d8b749720d1b08fb2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/21/be/21be1bf5e86f5da2dbd83f0bb904a3d68d9abea09bbd5adab6a6873c53ed0112'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7d/04/7d049e95fe5200dc13c1451523e00fd08d37ffde2a863aa025f030f00d3d747b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/41/11/4111a00cda1b0988507f8b544a9e4da7bfb0bff35c13990c6fb1c360aa6a6688'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b9/d1/b9d1c713e023c821f98968ea670a01aa7127c1c915f3d7f6368616f17369e8f2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d5/98/d59884b54759159fcaf45b671dfe9ee2a7d7aea34f1cc7762a1c25499589efb9'), PosixPath('/home/leandro/codeparrot-train/.git/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/8e/81/8e81a5187b909a82581e8030a8008ffb9517519e477797b195bbcf422ef6e20c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1e/89/1e890b33c7f95f900932797f1ba2b15f1f1780926f744ea04e0a969bf270df1a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6b/f5/6bf5fd370b20157e47d88709fb5c8b572f1b682a1fdb80091900bfda70a36491'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/58/1458ee6ad39f24b25d2db9153ba9aa25f4ff2f16c2f624361a0186904a658a54'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-commit.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6b/ce/6bce0dd945b67accdd3077504bc286a26bdb4b03fbbf34d427c21582f3374994'), PosixPath('/home/leandro/codeparrot-train/.git/index'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d0/20/d02098784b5ee7b5d5206ee9cc52e881782d98fc90530322af1c5cb7d401f1fd'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7d/d3/7dd37fe8445ee2641f14179d5a2aa636780822347d880a401d41c90bfd5cfd68'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6f/bc/6fbcee1936749498486745c2dd217ee108f1a243f054dcb2591cfee772906fae'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7f/8d/7f8dc2a2357a3d91ecc5fa5f125c73181dfbe22524d853f672010513044c80f7'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/69/ef/69efdcdb035636e6a8cd18cfc4ef702f95730a381b5d86b36c10028b4df94090'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-push'), PosixPath('/home/leandro/codeparrot-train/.git/objects/pack/pack-67102b35e20edaa7f1ed9c266f37841cd38f158a.pack'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/26/99/2699022bd98f8d49f5505ab457b15dd31156713279335d0c28db1c99edc36894'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/fsmonitor-watchman.sample'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/post-update.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/db/d4/dbd4ddc668c0c838eecd756db64c9a3c2127d8e9bbc05b3fcba00b075854b24c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/fa/40/fa40f7fe8b2d031a32282dce9a40462d67eecff28203c1743fcace8ef4bb37e6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/bd/9b/bd9be9097633349b5ecd400375be5d511e812feadf983f3c2cbcba263a3a14ab'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/97/af/97af2a98400865661b26c3d5c0a3b6be51603452f459136bc9ab2568667ed199'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b4/2c/b42c05288d42233fb829266917ae1145a835f3ccf8e00ea21e5927f9528fb500'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6a/34/6a34d6e3ac6572933b2f66c74af568a0df3b91b94622dd4b7e5d5538c04071ff'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/05/9b/059bc5381874a28e5a467291be6ee44e3f667609290d74e5ed009be10329bdbb'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/28/29/28290f1947521e2d6c58ee18d83b864b5d95e1fad3b54ee817799991642488ec'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/8a/ae/8aae623a251bd31627554141be2150a5ffb8ddea900ae244fd8492cc03245b36'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/3d/35/3d354291d12d6be3833eda95bd0db307dcd26b5b4287a3f6ca33b3b51b2e46f2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/13/ae/13ae38510e10076edaa24cf051e6403a270c95febd0e2e9b9e052128d632fe36'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/85/28/8528503b464d6cbf8041e0a1481681d0bff4bb24f9d18230fe56c3bc99dfa2ab'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/post-commit'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ba/38/ba38a25c6b8dd335baf2c6cd925ca5b91668af93f7ecee2b120ad352f46a6565'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/77/13/77131f000b7ab27e1336a181a4e4188f31ed40cea3fdf98b6398b5bbddaa5c76'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/93/51/935137f4370f4f5c85ba6a157825fe6102edb991a46610fa9939e2960be9653d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/78/bb/78bbf19a9e7a29b17fa71e3d05842b9469e3187e938efd8c793ceadbdd38c709'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/55/cb/55cb3e32311273135568ef3da7960400d95f63dad586ccfe56996561277b483f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a7/9a/a79a92653692037bf2fd6de92d93429455cd31dc7f96513adb40277d11be891d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/96/84/9684f7bb635a937d6899902ad758fd565826bfe5b8ea42c296d791dd7089b0f9'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1c/5f/1c5f7b819a67cfca7be02b743fbf0dabf7d53a1c7ddf82e70e094d92973d95c7'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/0b/de/0bde10d6ad4055811339a7ed51fca332317529d6b5854a4b7ce90000e352aa33'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/5c/d6/5cd6e14ff3ac522a3a7bac22ef6ec299833c685a9c343d347fe21152e4173856'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ff/bc/ffbc64d8a248deb916c3ef209d2a18fc5de5c56a2cfa546a633cbfec31e6ccb2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/81/7c/817cc36de53f7c914d82e2536a5538c21330ef54662366733e45c76a3c770d06'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/3a/fc/3afc8a938123d0f8e566043d271b4c6a60e3df968b72d8939982a09527763aae'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/95/2e/952eaf2d8448261925753def51d58ff5af595d6469207db42abc0b17204640fb'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1d/b3/1db3132794e05cd2decef99af5f56073af4b4a27c33e3a0d0b4289e61b34c9dc'), PosixPath('/home/leandro/codeparrot-train/.git/info/exclude'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/44/b6/44b6239e61c700810037d9d8aa2fe706d7eaeb5766e492fad95411ad184490f5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/60/07/6007f21e5625708f4710d48386db1297bb1dbd26196ced77b305e7e35da0300d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2d/15/2d15883c4954ffcaafce389f10ccbad7c93e66fae3b7ca7db0a50343180cedf4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2e/b3/2eb3b4ea8f84ef14a84b43002a148d99df05f68c1cfc0c0f074572bda0e0e1ee'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/da/b9/dab942e6da72846fc60682ce21a8e8fa6bf3452a29abff69ec0750e058ab3b92'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/79/c1/79c13ad14568c659397387f3d0e1358393fb0041ff48ce9c98ad4f28df8cde4b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/22/c4/22c47cc7619654f7faafe250a2dd0cabae5520263e967245b8d5638215244239'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/94/e0/94e011d7b77e55164bb15d95c453fa1282d78e234ff378adb930d756bbd33f64'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b9/07/b907e571662c19245abd148afb306b5c6e411d24a5117e0bb4c182a56afb9b97'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/9d/a6/9da6dd8c62377fcfe1e95882a17aa711a8fcc38e02cf21cc1a678f22a9e50d39'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/03/bb/03bb832cf6fad7e4bc885cc1d9502cf312d2951a51afbd63fb6a90f53e49d096'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4a/54/4a54ecd83d3083585ddc7beb921140b2b2e5b4fb82dec9543ac0932c6136e84b'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/post-checkout'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/02/dd/02ddc3cc1a121d8e237578028f34a994a7548f0d086a1312133c3864dbff6b37'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/46/df/46df1517cd973f00262b495f82b10c46ec077a33bcfc83bade078a36590c6d0a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/04/64/04647e38d2a928e08abccf777e680adf7cb0066862374bd847c492de44cb047f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/43/98/439848f817f432ceefdf7e69a64b60dd99a75cc6fb26599a0ea5ac1167c3db4c'), PosixPath('/home/leandro/codeparrot-train/.git/objects/pack/pack-67102b35e20edaa7f1ed9c266f37841cd38f158a.idx'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7c/bf/7cbfb385a3bbebdb3eed3e154c80f0c9bf6b397aa702e5410339c2b1d74ae867'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/bd/9a/bd9af7b8106e0a773e5a12495aa88339995c2084c2f9a243733879eb73f595d8'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/63/77/6377867a616a0b6e8e3e3691c5cce9cd566773ec5bbd02f5a457edac8a0f24d4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/64/35/643576ec614d0ba328db99ae865b8f1321ec4f288164f76fd6746b3b83e34f19'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d7/c8/d7c88386b6a3c339c8a6d0beead12bf440477473df676886099ca289057fbace'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/0d/07/0d07213fb514be71d57406af05dafff0edd3c7506621df761c9453ff598d89c9'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/fc/eb/fcebafda8e3681732437c98581a30faedf7802c6b90c84394d2c42b792c32507'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/applypatch-msg.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/83/14830fec70eb2227647b241d9ff90addbc461cbdcddfe12e015028cefaba6f4e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ef/8b/ef8b57ab3924e70df4f4a37b6853205113144fa01ea6c0140bea3a21b14eafeb'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/98/de/98de114cefba6caad86991425c276e59a5ab4a3a1006d29f73ec5cede6233efd'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/87/fb/87fb4ab74dad4c0f520d49769333d5d1b010fcb9e8f30c8dab16430a5a0af9d2'), PosixPath('/home/leandro/codeparrot-train/.git/logs/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ed/ae/edae53c081ce347a58430f0930ce4fb318a9f62e15f85aa638a86c1666f70df4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/49/d8/49d89abc121b49ef8a540796b63edd68f67f679d6ad1b969d6637d852d59f79f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/87/f9/87f9d6d6889eb78e70ba55d2f959fa4e896bd3a78d02dd347792e30ddd730bf6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/bd/a8/bda8ae48acb883ddb225719c3584e3baa76887afb7198d76478af06e7f80572e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/08/26/0826780cd0e3d564882321e246176eac0fb695b706bc72c6022925075047a62e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4f/df/4fdfd51962dfc725568d88de53b29e285d52e858e849acb543101fe556779a42'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/4f/144f1231964ab251596b40abdd80f37fe7ce4ac7b2b31fc517b942cc24110341'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6b/3d/6b3d8a7164286112196af65658426d2faeda5c50fc381bdebf378f0226342d4e'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/update.sample'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-rebase.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/da/6e/da6e9d2f263cf7b0254b4c0a57483ed8ac9652d6f67a63d648e9d968c576d526'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6d/c7/6dc73c3794ad5c29870563658a7003cb2a6cfb0c1852c47037a6eda6cc3cf3a1'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/25/84/2584f186110af7310075f15e07ddadb9c50c26cafd4c66b2e2baaab040028c3b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4c/35/4c35db8d1672615cddac65cdf0a76ea9ca1ec9d1d8b18ce293be0df23ff694db'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a9/df/a9dfb7586f9a1bfaaa7175a2384e101f51513b0b98ce01eeaafe5a783cdbad96'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/3a/b5/3ab5c68d9424b10ca45197172baa495813eae7efa9b3914ea4e4afd0201995b5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4f/2c/4f2cb5d9fe3ef94da4aa3ec743d37b83c2347d6f1d3d4696a5c667ff9968ea38'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7f/4f/7f4fb07272574ef183fd21a911f45f989a941516a11fe1d71335954a54657e07'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/39/32/39325e24ddd711eacc61305d421e004de68e6f6d0b649ca695ad53d4dc53b47f'), PosixPath('/home/leandro/codeparrot-train/.git/logs/HEAD'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ee/25/ee25b95231437c8795fca58f4a4d95b2698995f29e7f264956f78670f37ea982'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/5f/34/5f342fc03b8d9c90aa9ff917ca3ff3edce748b6f0b55f61aadc9940ca53b45d5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b3/84/b3849196f2777c6e3fb662ae301ae63561db9aaff9bd2ac2f32ad02e9d26d399'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f1/a5/f1a543df8fe1562a57657011c09d45778915a202f279013041e4f08d6cb1b475'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1d/a5/1da55a92827ad63ee4eb1f5eabf14500459bf357c28b767756b80342024063d4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a2/af/a2af1215060dc01f13d389abee1fc25ff94ed84262c54dea264810a5bcc074fc'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ba/86/ba86bfbe83793efcb2e89df75179188dee67b96ace3e7f1628c133ce11fc361e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a0/cc/a0ccfd373c5bb31028d4b7abb80a9a328395361cc2ac4f7376f5b1f6e89d89d0'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-push.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/44/79/447953386aab39785c0f6c5e44b7310d433886fb73a1e40efe67c9620639e6fa'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2b/ac/2bac46edf98c75901284aff8296f80fea6701821000b205bd85aef8399124074'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e9/95/e995f5605e676fd577e4c78ee6bf43451324ddbcb04e841cf1dfce07c69dc1b6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2a/6b/2a6b5f923b286f640ad586bc295e653ec0db8e4c8487db1c25fa384e216b6ce5'), PosixPath('/home/leandro/codeparrot-train/.git/refs/heads/main'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/12/a7/12a785cd978d3ec0330adae618ad3103dd53f63c7c11b96a7a0d33254407aaa4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/50/83/5083522f9ebdb4c72e4e384dfd9bce8293d84dcdf0a7580cab1ce8e44f2880da'), PosixPath('/home/leandro/codeparrot-train/.git/config'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/33/27/3327f7692a61d984758a71929f4466af87f91a2db0a656321df0d331ef4def20'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4c/b0/4cb0db5e545856bfeb62f7fa15d3472b705ac8fdeb8c4a831727b730951f8902'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/77/63/7763fa2cb60958f8d28fc6bebc0105ed3614addd32296fe929b7262e4d62f58a'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/commit-msg.sample'), PosixPath('/home/leandro/codeparrot-train/.git/HEAD'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1c/6f/1c6ff13e754a4260b097390066ecc973302f45756b4151bbfb7efbb7b1ac9963'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/17/ba/17ba31d8c126b19d7dc4899e46ec476e059462beaf2364bf77471b2f920ddf37'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d5/74/d574d02117a4209d073c3d382e859fdf07d6e18ac38bed8a4d900c8c9975550c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/c0/8a/c08ad7d3c85ef3631747172211b65c70912bae157b55f922f1f70016bf7f64e6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/70/35/70353ba511fe03b0f820a7ef6156771de34ef20a404a1cc2c064033998de0f9f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/cf/84/cf84f4c64b1173bb12e281b88ca920c4c6d130c54214b5172bccbcc045fb2d0f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/69/63/6963f0671c853a7bb7ae245df7c1f07fd8db821e59e1ab83b74d07909e029111'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b7/d8/b7d84fc6c01ec6eb79187a7e252a3f033bfd1f2ba297d569e1bf507af9b50fa6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/32/d9/32d95bf48e9ba4ed480df0015326b0ed07647ce17e84a48a5a445db22bc5de4a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/15/95/159531500b1c473455d10fda2fb82f6ea7814500799e27eaf5f2be6f124f994c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/8f/8a/8f8a74c1e1fc4ee43110f74ae0cc01de863a0ceb3f2c4815cab1dc1efeb5339a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4f/5b/4f5b4ba86fe51a134d866d06e472bd6c6f9d1f122cb905c65cb7c0a35bf51acd'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/17/da/17dac3999cf0cb027901ecb382180aa9560b4bb2c5b839f3afc8cadc229962bf'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/de/af/deaf9432f8e1fdc2bd3b9078dc3996c536e661ebb379b81818ecfc70a360c923'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d0/e5/d0e599bab79fe0054313a92ab57e7a89c65c2fc45011168aa73c0fe000c4f689'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e0/49/e049a0f4444d560849ab8c2d893157b975d183f839984001f101046ca74b7978'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f8/46/f84677f7389798b5c74ff00760d08732db022e99f60dc77e5bb4d900aa80dc60'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/0f/70/0f704aab387aa4e2f0f4dd866d5f0888b25d0d0b61ef7881c38b918f22802ec2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b5/3e/b53e982e883c26c1a21db49bff0a27d8d628f4fc498715739936fa93bfb5353e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e3/62/e3627cc99f31126c54a8a4188ce59123e876c812bdbdc5cba35d2f76e369a385'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/post-merge'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/25/16/25162ca0d0fa0474f367ba4720b75f0cb10c70b3f62dd90cbb6e201773c99cb3'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e1/7a/e17a32eafebfa6f8d8b0edf6c0463c639f06a72fadae7907c9fd026f01136b98'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/00/33/0033a83827749523a25d0ef661ef307b27edc162ce38c44e25fd033e9a187c76'), PosixPath('/home/leandro/codeparrot-train/.git/description'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2d/31/2d3127f22a64cf04b4ab8fd23512d5b7d6373429e36ffd68b3f86d0dff4e2fdb'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/55/db/55dbc21eb4360618b60fc5eaa4ce705ea71bb1e8241237099cfe43c59ed5b2ed'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b8/ac/b8acca45caffd1db94c790f13ed8f1742b71d4f9cd3d242417e87bb150b6af20'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d6/ec/d6ecd24bfd9e0c2877dfa00417568e07d9f64a150c5518d471ff91ded60bf146'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/02/a0/02a07bbab0f2b514c1a9d5296ca8c1a843aca846fcde56fc810700ee416db1b4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/96/f9/96f9e109fe3ebce8c82610b0af4398170d678185b18ce5bc0384d84eb421ace5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/eb/34/eb344442f4771eb011e0e520b8b1666903717e5e8c59a5462fe80aa82401940a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/26/142694003d3fc3bc57e51dab9eaf07472e0f24a4b092d70159943ecc8c2496a4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2a/ff/2aff254f1288353b713d8e718915f8a2eba7d65097ed5f5d0df520a7058ddf71'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-receive.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2c/a7/2ca7213ba4af470b5f4caa0b4439992b7483c8b4d1cb977089f9b9abef1c7fba'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/80/61/8061f4f61c3955c90dab77a1553ac22e9d1ff604c229375be54a38e32ce6f8ca'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f3/5e/f35ec6ce622145756740be75b1fa969996e7e716ac0a15d9bbc4e86aed616000'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a7/6e/a76e8e4bbc39a74e4ff59e02aaf1404a8bc429f1033a216058b09f7e0ee3cd0c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/07/b9/07b951a7cc55afc0d48a47f0dbd9e06c7311279e4a747256b5dcfe11ba56690d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1c/2e/1c2e85e92de0f8a29ed6e534983e0051fa2c79e31013c11c7cc66f3f3f1e0155'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/09/c2/09c237a78f8a49d7840d8e5fc58e79db7e225b9904323f46791dce8fd0585332'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f0/f9/f0f92a74ef6e03d0c05ae2012d7e33242c3b091f3e01d2d8f942e68cf295f7a4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/eb/a4/eba49c7ea511320fd7040022951873a465016ddb72d078b958a4003c396ffb52'), PosixPath('/home/leandro/codeparrot-train/.git/packed-refs'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/62/03/6203a1aae8671a6a23849de3aa6aa3efec0e3fbe3275757643abfd63a9ee9af8')] -08/30/2021 13:14:02 - INFO - datasets.load - Some files matched the pattern '*' at /home/leandro/codeparrot-train but don't have valid data file extensions: [PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/11/70/1170a8200f43dfa3902e9d41088229febdf4d7044d9d762dd5809685e5448b11'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/fa/f2/faf2e65a89fda5ec7a00a36b9fd6c4b2429f1249072b838f2a02d5d01fcaeb18'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b1/70/b1705347d88e73a7de652d1486a3eccda92e420e65a58917c88af635baf55ac8'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/17/89/178953ae530dc7960c803bd22a37026f4190b822b95145240537840bfc5a1ad1'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/37/9d/379db3f5d257369fd927b7395599ec2aef5cefcb57811a57281487da9fd58c5b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/8b/d9/8bd964dad421ed624f4bd5e4719e3e28f62d002b350d850e902688c9e9bcfd80'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1b/c7/1bc7cd472751ec9917bf55ce8b05b8ea467453335103f16c4551e94daefdbaf0'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1f/46/1f46dcfefd87339930fa912ec98a56b7b93c2f052d7f452f82c9c3d0043ffa43'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f9/91/f9915d283d95c3316a76922f129897823efd397287916e8f7af88ed7aaf517b0'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4c/10/4c10f31fa342f81c13b27e7ae0761b17729ee82f6e02824361e2cfcc4ab096c1'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/c0/0f/c00f0550d90e881145954ad24df7fdf512ffc3d63c50d2aa0c85774757d8f37d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/c3/d3/c3d3e55004ff21e36332b9612e385ba07c2610b832b4a94cca2d9fda372a9fb4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a2/17/a21791d67c018e486dde68b8956a16b8fa0c54af93dc3c6ec2c669da87861b02'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/9c/75/9c7526f2ec341f2d2483d9db25b2b2e9fe630b21b737fa7ebbc19965c6ee46b1'), PosixPath('/home/leandro/codeparrot-train/.git/logs/refs/heads/main'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/01/87/0187e92041e5ef1abe3190a48330ff50c7d5fc5ed1219c3bcbb465907430d34e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/37/f2/37f2a405d0e8c52b4a51f79b23f135bcb537eb3f61fe8a27a29ab63b74a37671'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/82/4c/824c9524070c36ed317c12b9b0e77f8b9460e8519ba32c6795a5a2e7232d088c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/44/18/44181da41968eab59b99558c2afd4d6f95397bc2b580622a96f2f9fb74f545b2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/5b/66/5b66654660bc52d66f5bf0e6a62e0b65a0dd2499ec316daed0432efb2c7a8d7b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/47/d1/47d1fedd443c4edfca241c00be8984a2157c668726cc06d92ad7e2704cb5c951'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/9c/83/9c83dabc6a7c8a9629093125ff70fc60f594b0b95cb56f2f12d2bd91352367c7'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/08/4a/084a245793d30784f6ae4f8b666624293bdab2d05a5e1eeadf20b7d9db444951'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/45/da/45da5a5e4acd37b6e288eb4045434fb6b4a8d77979ac61c8306ca9eca6d24128'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/44/10/4410ab4420ffe54105620e1f038b0f6b14afa88a8df9dcf63468f6a2c105d770'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/b9/14b9124b7b2ffa27d79dc210ae77b9b970e067ad7d3dc4d3eebc08671b770c16'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ca/00/ca00ed91ba94519faaba619e5eec6498215695acc6b3f760dc056967cefeea80'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f8/3b/f83b75420e369ae1d55e7009effe9f7a05577a31c19a8c02ce7f0b56b5dc8a87'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ba/5a/ba5ad5064f9ef5d1429abd4c4742cf37b56589c060ff3995e5331eb69fb9c1c5'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/prepare-commit-msg.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/0a/03/0a03d68d6dda083d189878113e864c580b9b5572e53d3e1684b93a9996c7699d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/54/10/5410ae89d1cf3ea5325b7e948fd4db3d352e44bbd2a6a5c813f77be0da958c80'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a9/73/a973fc07ce8ae881a878bf92c6c70583c08ea6bdb2ca2583002271f96dab9543'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2b/85/2b85d040d424bde044014147be3c4949a8d2b0e558c4f4c2c65aead5ece2cde9'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e6/f0/e6f0840fa125b6ad771b853937bd215b369bfb815ff521316cf6cb46fba66968'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/23/ee/23eed9f8512ca62c4b9b4fb28a84688ee550b75ec7658209f3cd5d82a2d4aa57'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a0/53/a05359f8e5ca97304272052f806034ebdca89a94f0d052b719b8b81dd8ddd868'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/21/e1/21e166aee17c30af55849b552e2eaa9c0641dc6cb0ac6386bd3f7797d8af2a9b'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-applypatch.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/70/b0/70b01a02ca2810cf2e74a43655979028b31de42c566bc65d8b749720d1b08fb2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/21/be/21be1bf5e86f5da2dbd83f0bb904a3d68d9abea09bbd5adab6a6873c53ed0112'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7d/04/7d049e95fe5200dc13c1451523e00fd08d37ffde2a863aa025f030f00d3d747b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/41/11/4111a00cda1b0988507f8b544a9e4da7bfb0bff35c13990c6fb1c360aa6a6688'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b9/d1/b9d1c713e023c821f98968ea670a01aa7127c1c915f3d7f6368616f17369e8f2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d5/98/d59884b54759159fcaf45b671dfe9ee2a7d7aea34f1cc7762a1c25499589efb9'), PosixPath('/home/leandro/codeparrot-train/.git/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/8e/81/8e81a5187b909a82581e8030a8008ffb9517519e477797b195bbcf422ef6e20c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1e/89/1e890b33c7f95f900932797f1ba2b15f1f1780926f744ea04e0a969bf270df1a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6b/f5/6bf5fd370b20157e47d88709fb5c8b572f1b682a1fdb80091900bfda70a36491'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/58/1458ee6ad39f24b25d2db9153ba9aa25f4ff2f16c2f624361a0186904a658a54'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-commit.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6b/ce/6bce0dd945b67accdd3077504bc286a26bdb4b03fbbf34d427c21582f3374994'), PosixPath('/home/leandro/codeparrot-train/.git/index'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d0/20/d02098784b5ee7b5d5206ee9cc52e881782d98fc90530322af1c5cb7d401f1fd'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7d/d3/7dd37fe8445ee2641f14179d5a2aa636780822347d880a401d41c90bfd5cfd68'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6f/bc/6fbcee1936749498486745c2dd217ee108f1a243f054dcb2591cfee772906fae'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7f/8d/7f8dc2a2357a3d91ecc5fa5f125c73181dfbe22524d853f672010513044c80f7'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/69/ef/69efdcdb035636e6a8cd18cfc4ef702f95730a381b5d86b36c10028b4df94090'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-push'), PosixPath('/home/leandro/codeparrot-train/.git/objects/pack/pack-67102b35e20edaa7f1ed9c266f37841cd38f158a.pack'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/26/99/2699022bd98f8d49f5505ab457b15dd31156713279335d0c28db1c99edc36894'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/fsmonitor-watchman.sample'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/post-update.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/db/d4/dbd4ddc668c0c838eecd756db64c9a3c2127d8e9bbc05b3fcba00b075854b24c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/fa/40/fa40f7fe8b2d031a32282dce9a40462d67eecff28203c1743fcace8ef4bb37e6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/bd/9b/bd9be9097633349b5ecd400375be5d511e812feadf983f3c2cbcba263a3a14ab'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/97/af/97af2a98400865661b26c3d5c0a3b6be51603452f459136bc9ab2568667ed199'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b4/2c/b42c05288d42233fb829266917ae1145a835f3ccf8e00ea21e5927f9528fb500'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6a/34/6a34d6e3ac6572933b2f66c74af568a0df3b91b94622dd4b7e5d5538c04071ff'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/05/9b/059bc5381874a28e5a467291be6ee44e3f667609290d74e5ed009be10329bdbb'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/28/29/28290f1947521e2d6c58ee18d83b864b5d95e1fad3b54ee817799991642488ec'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/8a/ae/8aae623a251bd31627554141be2150a5ffb8ddea900ae244fd8492cc03245b36'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/3d/35/3d354291d12d6be3833eda95bd0db307dcd26b5b4287a3f6ca33b3b51b2e46f2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/13/ae/13ae38510e10076edaa24cf051e6403a270c95febd0e2e9b9e052128d632fe36'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/85/28/8528503b464d6cbf8041e0a1481681d0bff4bb24f9d18230fe56c3bc99dfa2ab'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/post-commit'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ba/38/ba38a25c6b8dd335baf2c6cd925ca5b91668af93f7ecee2b120ad352f46a6565'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/77/13/77131f000b7ab27e1336a181a4e4188f31ed40cea3fdf98b6398b5bbddaa5c76'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/93/51/935137f4370f4f5c85ba6a157825fe6102edb991a46610fa9939e2960be9653d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/78/bb/78bbf19a9e7a29b17fa71e3d05842b9469e3187e938efd8c793ceadbdd38c709'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/55/cb/55cb3e32311273135568ef3da7960400d95f63dad586ccfe56996561277b483f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a7/9a/a79a92653692037bf2fd6de92d93429455cd31dc7f96513adb40277d11be891d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/96/84/9684f7bb635a937d6899902ad758fd565826bfe5b8ea42c296d791dd7089b0f9'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1c/5f/1c5f7b819a67cfca7be02b743fbf0dabf7d53a1c7ddf82e70e094d92973d95c7'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/0b/de/0bde10d6ad4055811339a7ed51fca332317529d6b5854a4b7ce90000e352aa33'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/5c/d6/5cd6e14ff3ac522a3a7bac22ef6ec299833c685a9c343d347fe21152e4173856'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ff/bc/ffbc64d8a248deb916c3ef209d2a18fc5de5c56a2cfa546a633cbfec31e6ccb2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/81/7c/817cc36de53f7c914d82e2536a5538c21330ef54662366733e45c76a3c770d06'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/3a/fc/3afc8a938123d0f8e566043d271b4c6a60e3df968b72d8939982a09527763aae'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/95/2e/952eaf2d8448261925753def51d58ff5af595d6469207db42abc0b17204640fb'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1d/b3/1db3132794e05cd2decef99af5f56073af4b4a27c33e3a0d0b4289e61b34c9dc'), PosixPath('/home/leandro/codeparrot-train/.git/info/exclude'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/44/b6/44b6239e61c700810037d9d8aa2fe706d7eaeb5766e492fad95411ad184490f5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/60/07/6007f21e5625708f4710d48386db1297bb1dbd26196ced77b305e7e35da0300d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2d/15/2d15883c4954ffcaafce389f10ccbad7c93e66fae3b7ca7db0a50343180cedf4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2e/b3/2eb3b4ea8f84ef14a84b43002a148d99df05f68c1cfc0c0f074572bda0e0e1ee'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/da/b9/dab942e6da72846fc60682ce21a8e8fa6bf3452a29abff69ec0750e058ab3b92'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/79/c1/79c13ad14568c659397387f3d0e1358393fb0041ff48ce9c98ad4f28df8cde4b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/22/c4/22c47cc7619654f7faafe250a2dd0cabae5520263e967245b8d5638215244239'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/94/e0/94e011d7b77e55164bb15d95c453fa1282d78e234ff378adb930d756bbd33f64'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b9/07/b907e571662c19245abd148afb306b5c6e411d24a5117e0bb4c182a56afb9b97'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/9d/a6/9da6dd8c62377fcfe1e95882a17aa711a8fcc38e02cf21cc1a678f22a9e50d39'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/03/bb/03bb832cf6fad7e4bc885cc1d9502cf312d2951a51afbd63fb6a90f53e49d096'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4a/54/4a54ecd83d3083585ddc7beb921140b2b2e5b4fb82dec9543ac0932c6136e84b'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/post-checkout'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/02/dd/02ddc3cc1a121d8e237578028f34a994a7548f0d086a1312133c3864dbff6b37'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/46/df/46df1517cd973f00262b495f82b10c46ec077a33bcfc83bade078a36590c6d0a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/04/64/04647e38d2a928e08abccf777e680adf7cb0066862374bd847c492de44cb047f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/43/98/439848f817f432ceefdf7e69a64b60dd99a75cc6fb26599a0ea5ac1167c3db4c'), PosixPath('/home/leandro/codeparrot-train/.git/objects/pack/pack-67102b35e20edaa7f1ed9c266f37841cd38f158a.idx'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7c/bf/7cbfb385a3bbebdb3eed3e154c80f0c9bf6b397aa702e5410339c2b1d74ae867'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/bd/9a/bd9af7b8106e0a773e5a12495aa88339995c2084c2f9a243733879eb73f595d8'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/63/77/6377867a616a0b6e8e3e3691c5cce9cd566773ec5bbd02f5a457edac8a0f24d4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/64/35/643576ec614d0ba328db99ae865b8f1321ec4f288164f76fd6746b3b83e34f19'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d7/c8/d7c88386b6a3c339c8a6d0beead12bf440477473df676886099ca289057fbace'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/0d/07/0d07213fb514be71d57406af05dafff0edd3c7506621df761c9453ff598d89c9'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/fc/eb/fcebafda8e3681732437c98581a30faedf7802c6b90c84394d2c42b792c32507'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/applypatch-msg.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/83/14830fec70eb2227647b241d9ff90addbc461cbdcddfe12e015028cefaba6f4e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ef/8b/ef8b57ab3924e70df4f4a37b6853205113144fa01ea6c0140bea3a21b14eafeb'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/98/de/98de114cefba6caad86991425c276e59a5ab4a3a1006d29f73ec5cede6233efd'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/87/fb/87fb4ab74dad4c0f520d49769333d5d1b010fcb9e8f30c8dab16430a5a0af9d2'), PosixPath('/home/leandro/codeparrot-train/.git/logs/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ed/ae/edae53c081ce347a58430f0930ce4fb318a9f62e15f85aa638a86c1666f70df4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/49/d8/49d89abc121b49ef8a540796b63edd68f67f679d6ad1b969d6637d852d59f79f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/87/f9/87f9d6d6889eb78e70ba55d2f959fa4e896bd3a78d02dd347792e30ddd730bf6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/bd/a8/bda8ae48acb883ddb225719c3584e3baa76887afb7198d76478af06e7f80572e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/08/26/0826780cd0e3d564882321e246176eac0fb695b706bc72c6022925075047a62e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4f/df/4fdfd51962dfc725568d88de53b29e285d52e858e849acb543101fe556779a42'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/4f/144f1231964ab251596b40abdd80f37fe7ce4ac7b2b31fc517b942cc24110341'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6b/3d/6b3d8a7164286112196af65658426d2faeda5c50fc381bdebf378f0226342d4e'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/update.sample'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-rebase.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/da/6e/da6e9d2f263cf7b0254b4c0a57483ed8ac9652d6f67a63d648e9d968c576d526'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/6d/c7/6dc73c3794ad5c29870563658a7003cb2a6cfb0c1852c47037a6eda6cc3cf3a1'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/25/84/2584f186110af7310075f15e07ddadb9c50c26cafd4c66b2e2baaab040028c3b'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4c/35/4c35db8d1672615cddac65cdf0a76ea9ca1ec9d1d8b18ce293be0df23ff694db'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a9/df/a9dfb7586f9a1bfaaa7175a2384e101f51513b0b98ce01eeaafe5a783cdbad96'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/3a/b5/3ab5c68d9424b10ca45197172baa495813eae7efa9b3914ea4e4afd0201995b5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4f/2c/4f2cb5d9fe3ef94da4aa3ec743d37b83c2347d6f1d3d4696a5c667ff9968ea38'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/7f/4f/7f4fb07272574ef183fd21a911f45f989a941516a11fe1d71335954a54657e07'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/39/32/39325e24ddd711eacc61305d421e004de68e6f6d0b649ca695ad53d4dc53b47f'), PosixPath('/home/leandro/codeparrot-train/.git/logs/HEAD'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ee/25/ee25b95231437c8795fca58f4a4d95b2698995f29e7f264956f78670f37ea982'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/5f/34/5f342fc03b8d9c90aa9ff917ca3ff3edce748b6f0b55f61aadc9940ca53b45d5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b3/84/b3849196f2777c6e3fb662ae301ae63561db9aaff9bd2ac2f32ad02e9d26d399'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f1/a5/f1a543df8fe1562a57657011c09d45778915a202f279013041e4f08d6cb1b475'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1d/a5/1da55a92827ad63ee4eb1f5eabf14500459bf357c28b767756b80342024063d4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a2/af/a2af1215060dc01f13d389abee1fc25ff94ed84262c54dea264810a5bcc074fc'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/ba/86/ba86bfbe83793efcb2e89df75179188dee67b96ace3e7f1628c133ce11fc361e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a0/cc/a0ccfd373c5bb31028d4b7abb80a9a328395361cc2ac4f7376f5b1f6e89d89d0'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-push.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/44/79/447953386aab39785c0f6c5e44b7310d433886fb73a1e40efe67c9620639e6fa'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2b/ac/2bac46edf98c75901284aff8296f80fea6701821000b205bd85aef8399124074'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e9/95/e995f5605e676fd577e4c78ee6bf43451324ddbcb04e841cf1dfce07c69dc1b6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2a/6b/2a6b5f923b286f640ad586bc295e653ec0db8e4c8487db1c25fa384e216b6ce5'), PosixPath('/home/leandro/codeparrot-train/.git/refs/heads/main'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/12/a7/12a785cd978d3ec0330adae618ad3103dd53f63c7c11b96a7a0d33254407aaa4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/50/83/5083522f9ebdb4c72e4e384dfd9bce8293d84dcdf0a7580cab1ce8e44f2880da'), PosixPath('/home/leandro/codeparrot-train/.git/config'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/33/27/3327f7692a61d984758a71929f4466af87f91a2db0a656321df0d331ef4def20'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4c/b0/4cb0db5e545856bfeb62f7fa15d3472b705ac8fdeb8c4a831727b730951f8902'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/77/63/7763fa2cb60958f8d28fc6bebc0105ed3614addd32296fe929b7262e4d62f58a'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/commit-msg.sample'), PosixPath('/home/leandro/codeparrot-train/.git/HEAD'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1c/6f/1c6ff13e754a4260b097390066ecc973302f45756b4151bbfb7efbb7b1ac9963'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/17/ba/17ba31d8c126b19d7dc4899e46ec476e059462beaf2364bf77471b2f920ddf37'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d5/74/d574d02117a4209d073c3d382e859fdf07d6e18ac38bed8a4d900c8c9975550c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/c0/8a/c08ad7d3c85ef3631747172211b65c70912bae157b55f922f1f70016bf7f64e6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/70/35/70353ba511fe03b0f820a7ef6156771de34ef20a404a1cc2c064033998de0f9f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/cf/84/cf84f4c64b1173bb12e281b88ca920c4c6d130c54214b5172bccbcc045fb2d0f'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/69/63/6963f0671c853a7bb7ae245df7c1f07fd8db821e59e1ab83b74d07909e029111'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b7/d8/b7d84fc6c01ec6eb79187a7e252a3f033bfd1f2ba297d569e1bf507af9b50fa6'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/32/d9/32d95bf48e9ba4ed480df0015326b0ed07647ce17e84a48a5a445db22bc5de4a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/15/95/159531500b1c473455d10fda2fb82f6ea7814500799e27eaf5f2be6f124f994c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/8f/8a/8f8a74c1e1fc4ee43110f74ae0cc01de863a0ceb3f2c4815cab1dc1efeb5339a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/4f/5b/4f5b4ba86fe51a134d866d06e472bd6c6f9d1f122cb905c65cb7c0a35bf51acd'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/17/da/17dac3999cf0cb027901ecb382180aa9560b4bb2c5b839f3afc8cadc229962bf'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/de/af/deaf9432f8e1fdc2bd3b9078dc3996c536e661ebb379b81818ecfc70a360c923'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d0/e5/d0e599bab79fe0054313a92ab57e7a89c65c2fc45011168aa73c0fe000c4f689'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e0/49/e049a0f4444d560849ab8c2d893157b975d183f839984001f101046ca74b7978'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f8/46/f84677f7389798b5c74ff00760d08732db022e99f60dc77e5bb4d900aa80dc60'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/0f/70/0f704aab387aa4e2f0f4dd866d5f0888b25d0d0b61ef7881c38b918f22802ec2'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b5/3e/b53e982e883c26c1a21db49bff0a27d8d628f4fc498715739936fa93bfb5353e'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e3/62/e3627cc99f31126c54a8a4188ce59123e876c812bdbdc5cba35d2f76e369a385'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/post-merge'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/25/16/25162ca0d0fa0474f367ba4720b75f0cb10c70b3f62dd90cbb6e201773c99cb3'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/e1/7a/e17a32eafebfa6f8d8b0edf6c0463c639f06a72fadae7907c9fd026f01136b98'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/00/33/0033a83827749523a25d0ef661ef307b27edc162ce38c44e25fd033e9a187c76'), PosixPath('/home/leandro/codeparrot-train/.git/description'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2d/31/2d3127f22a64cf04b4ab8fd23512d5b7d6373429e36ffd68b3f86d0dff4e2fdb'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/55/db/55dbc21eb4360618b60fc5eaa4ce705ea71bb1e8241237099cfe43c59ed5b2ed'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/b8/ac/b8acca45caffd1db94c790f13ed8f1742b71d4f9cd3d242417e87bb150b6af20'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/d6/ec/d6ecd24bfd9e0c2877dfa00417568e07d9f64a150c5518d471ff91ded60bf146'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/02/a0/02a07bbab0f2b514c1a9d5296ca8c1a843aca846fcde56fc810700ee416db1b4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/96/f9/96f9e109fe3ebce8c82610b0af4398170d678185b18ce5bc0384d84eb421ace5'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/eb/34/eb344442f4771eb011e0e520b8b1666903717e5e8c59a5462fe80aa82401940a'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/14/26/142694003d3fc3bc57e51dab9eaf07472e0f24a4b092d70159943ecc8c2496a4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2a/ff/2aff254f1288353b713d8e718915f8a2eba7d65097ed5f5d0df520a7058ddf71'), PosixPath('/home/leandro/codeparrot-train/.git/hooks/pre-receive.sample'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/2c/a7/2ca7213ba4af470b5f4caa0b4439992b7483c8b4d1cb977089f9b9abef1c7fba'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/80/61/8061f4f61c3955c90dab77a1553ac22e9d1ff604c229375be54a38e32ce6f8ca'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f3/5e/f35ec6ce622145756740be75b1fa969996e7e716ac0a15d9bbc4e86aed616000'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/a7/6e/a76e8e4bbc39a74e4ff59e02aaf1404a8bc429f1033a216058b09f7e0ee3cd0c'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/07/b9/07b951a7cc55afc0d48a47f0dbd9e06c7311279e4a747256b5dcfe11ba56690d'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/1c/2e/1c2e85e92de0f8a29ed6e534983e0051fa2c79e31013c11c7cc66f3f3f1e0155'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/09/c2/09c237a78f8a49d7840d8e5fc58e79db7e225b9904323f46791dce8fd0585332'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/f0/f9/f0f92a74ef6e03d0c05ae2012d7e33242c3b091f3e01d2d8f942e68cf295f7a4'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/eb/a4/eba49c7ea511320fd7040022951873a465016ddb72d078b958a4003c396ffb52'), PosixPath('/home/leandro/codeparrot-train/.git/packed-refs'), PosixPath('/home/leandro/codeparrot-train/.git/lfs/objects/62/03/6203a1aae8671a6a23849de3aa6aa3efec0e3fbe3275757643abfd63a9ee9af8')] -08/30/2021 13:14:02 - WARNING - datasets.builder - Using custom data configuration codeparrot-train-3a26f48916bbb7e0 -08/30/2021 13:14:02 - DEBUG - datasets.utils.filelock - Attempting to acquire lock 139865678200064 on /home/leandro/.cache/huggingface/datasets/_home_leandro_.cache_huggingface_datasets_json_codeparrot-train-3a26f48916bbb7e0_0.0.0_e0dcb9fb097c37d83741a1ffd70553ea5e06cb0082872d4def076475be3ec67c.lock -08/30/2021 13:14:02 - DEBUG - datasets.utils.filelock - Lock 139865678200064 acquired on /home/leandro/.cache/huggingface/datasets/_home_leandro_.cache_huggingface_datasets_json_codeparrot-train-3a26f48916bbb7e0_0.0.0_e0dcb9fb097c37d83741a1ffd70553ea5e06cb0082872d4def076475be3ec67c.lock -08/30/2021 13:14:02 - DEBUG - datasets.utils.filelock - Attempting to release lock 139865678200064 on /home/leandro/.cache/huggingface/datasets/_home_leandro_.cache_huggingface_datasets_json_codeparrot-train-3a26f48916bbb7e0_0.0.0_e0dcb9fb097c37d83741a1ffd70553ea5e06cb0082872d4def076475be3ec67c.lock -08/30/2021 13:14:02 - DEBUG - datasets.utils.filelock - Lock 139865678200064 released on /home/leandro/.cache/huggingface/datasets/_home_leandro_.cache_huggingface_datasets_json_codeparrot-train-3a26f48916bbb7e0_0.0.0_e0dcb9fb097c37d83741a1ffd70553ea5e06cb0082872d4def076475be3ec67c.lock -08/30/2021 13:14:02 - INFO - datasets.load - Some files matched the pattern '*' at /home/leandro/codeparrot-valid but don't have valid data file extensions: [PosixPath('/home/leandro/codeparrot-valid/.git/objects/c6/7ccd65e0057c57364469d576a57387eaa57530'), PosixPath('/home/leandro/codeparrot-valid/.git/description'), PosixPath('/home/leandro/codeparrot-valid/.git/logs/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/post-commit'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/0b/0462e46b355e305d77ff3b85f3a01776e188ea'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/f3/fa800d7629eabb8ba09a504140b5a203d1341a'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/post-merge'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/update.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/info/exclude'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-rebase.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/prepare-commit-msg.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/packed-refs'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-applypatch.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-valid/.git/logs/refs/heads/main'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-receive.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/index'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/c9/b135a100a1770bcdc5ae26195bd4f7bd85a764'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/post-checkout'), PosixPath('/home/leandro/codeparrot-valid/.git/config'), PosixPath('/home/leandro/codeparrot-valid/.git/HEAD'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-commit.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/logs/HEAD'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/07/f0db3339ad9053dc95b284c4ae14e014efff89'), PosixPath('/home/leandro/codeparrot-valid/.git/refs/heads/main'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-push.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/5e/9d29c73e4d5b8ecb2b60628d17a791508a514f'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-push'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/fsmonitor-watchman.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/applypatch-msg.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/post-update.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/lfs/objects/43/23/432375a8140ca79af9fa62e3145815c0f7965af8026ed1847ce6e75a11f413fd'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/commit-msg.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/d7/b8c495dd9e6df27bfd6a47dad7e33da0850a5b')] -08/30/2021 13:14:02 - INFO - datasets.load - Some files matched the pattern '*' at /home/leandro/codeparrot-valid but don't have valid data file extensions: [PosixPath('/home/leandro/codeparrot-valid/.git/objects/c6/7ccd65e0057c57364469d576a57387eaa57530'), PosixPath('/home/leandro/codeparrot-valid/.git/description'), PosixPath('/home/leandro/codeparrot-valid/.git/logs/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/post-commit'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/0b/0462e46b355e305d77ff3b85f3a01776e188ea'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/f3/fa800d7629eabb8ba09a504140b5a203d1341a'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/post-merge'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/update.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/info/exclude'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-rebase.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/prepare-commit-msg.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/packed-refs'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-applypatch.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/refs/remotes/origin/HEAD'), PosixPath('/home/leandro/codeparrot-valid/.git/logs/refs/heads/main'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-receive.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/index'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/c9/b135a100a1770bcdc5ae26195bd4f7bd85a764'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/post-checkout'), PosixPath('/home/leandro/codeparrot-valid/.git/config'), PosixPath('/home/leandro/codeparrot-valid/.git/HEAD'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-commit.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/logs/HEAD'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/07/f0db3339ad9053dc95b284c4ae14e014efff89'), PosixPath('/home/leandro/codeparrot-valid/.git/refs/heads/main'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-push.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/5e/9d29c73e4d5b8ecb2b60628d17a791508a514f'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/pre-push'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/fsmonitor-watchman.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/applypatch-msg.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/post-update.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/lfs/objects/43/23/432375a8140ca79af9fa62e3145815c0f7965af8026ed1847ce6e75a11f413fd'), PosixPath('/home/leandro/codeparrot-valid/.git/hooks/commit-msg.sample'), PosixPath('/home/leandro/codeparrot-valid/.git/objects/d7/b8c495dd9e6df27bfd6a47dad7e33da0850a5b')] -08/30/2021 13:14:02 - WARNING - datasets.builder - Using custom data configuration codeparrot-valid-52bb4ddf73523afb -08/30/2021 13:14:02 - DEBUG - datasets.utils.filelock - Attempting to acquire lock 139865678180160 on /home/leandro/.cache/huggingface/datasets/_home_leandro_.cache_huggingface_datasets_json_codeparrot-valid-52bb4ddf73523afb_0.0.0_e0dcb9fb097c37d83741a1ffd70553ea5e06cb0082872d4def076475be3ec67c.lock -08/30/2021 13:14:02 - DEBUG - datasets.utils.filelock - Lock 139865678180160 acquired on /home/leandro/.cache/huggingface/datasets/_home_leandro_.cache_huggingface_datasets_json_codeparrot-valid-52bb4ddf73523afb_0.0.0_e0dcb9fb097c37d83741a1ffd70553ea5e06cb0082872d4def076475be3ec67c.lock -08/30/2021 13:14:02 - DEBUG - datasets.utils.filelock - Attempting to release lock 139865678180160 on /home/leandro/.cache/huggingface/datasets/_home_leandro_.cache_huggingface_datasets_json_codeparrot-valid-52bb4ddf73523afb_0.0.0_e0dcb9fb097c37d83741a1ffd70553ea5e06cb0082872d4def076475be3ec67c.lock -08/30/2021 13:14:02 - DEBUG - datasets.utils.filelock - Lock 139865678180160 released on /home/leandro/.cache/huggingface/datasets/_home_leandro_.cache_huggingface_datasets_json_codeparrot-valid-52bb4ddf73523afb_0.0.0_e0dcb9fb097c37d83741a1ffd70553ea5e06cb0082872d4def076475be3ec67c.lock -08/30/2021 13:14:28 - INFO - __main__ - Step 1: {'lr': 0.0, 'samples': 192, 'steps': 0, 'loss/train': 10.546818733215332} -08/30/2021 13:14:30 - INFO - root - Reducer buckets have been rebuilt in this iteration. -08/30/2021 13:14:30 - INFO - __main__ - Step 2: {'lr': 2.5e-07, 'samples': 384, 'steps': 1, 'loss/train': 10.525705337524414} -08/30/2021 13:14:30 - INFO - __main__ - Step 3: {'lr': 5e-07, 'samples': 576, 'steps': 2, 'loss/train': 10.52365493774414} -08/30/2021 13:14:31 - INFO - __main__ - Step 4: {'lr': 7.5e-07, 'samples': 768, 'steps': 3, 'loss/train': 10.503287315368652} -08/30/2021 13:14:31 - INFO - __main__ - Step 5: {'lr': 1e-06, 'samples': 960, 'steps': 4, 'loss/train': 10.504632949829102} -08/30/2021 13:14:32 - INFO - __main__ - Step 6: {'lr': 1.25e-06, 'samples': 1152, 'steps': 5, 'loss/train': 10.51413345336914} -08/30/2021 13:14:33 - INFO - __main__ - Step 7: {'lr': 1.5e-06, 'samples': 1344, 'steps': 6, 'loss/train': 10.520750999450684} -08/30/2021 13:14:33 - INFO - __main__ - Step 8: {'lr': 1.75e-06, 'samples': 1536, 'steps': 7, 'loss/train': 10.414685249328613} -08/30/2021 13:14:34 - INFO - __main__ - Step 9: {'lr': 2e-06, 'samples': 1728, 'steps': 8, 'loss/train': 10.404026985168457} -08/30/2021 13:14:34 - INFO - __main__ - Step 10: {'lr': 2.25e-06, 'samples': 1920, 'steps': 9, 'loss/train': 10.328200340270996} -08/30/2021 13:14:36 - INFO - __main__ - Step 11: {'lr': 2.5e-06, 'samples': 2112, 'steps': 10, 'loss/train': 10.321759223937988} -08/30/2021 13:14:36 - INFO - __main__ - Step 12: {'lr': 2.75e-06, 'samples': 2304, 'steps': 11, 'loss/train': 10.262408256530762} -08/30/2021 13:14:37 - INFO - __main__ - Step 13: {'lr': 3e-06, 'samples': 2496, 'steps': 12, 'loss/train': 10.278728485107422} -08/30/2021 13:14:37 - INFO - __main__ - Step 14: {'lr': 3.25e-06, 'samples': 2688, 'steps': 13, 'loss/train': 10.19308853149414} -08/30/2021 13:14:37 - INFO - __main__ - Step 15: {'lr': 3.5e-06, 'samples': 2880, 'steps': 14, 'loss/train': 10.08371353149414} -08/30/2021 13:14:39 - INFO - __main__ - Step 16: {'lr': 3.75e-06, 'samples': 3072, 'steps': 15, 'loss/train': 10.086686134338379} -08/30/2021 13:14:39 - INFO - __main__ - Step 17: {'lr': 4e-06, 'samples': 3264, 'steps': 16, 'loss/train': 9.986761093139648} -08/30/2021 13:14:40 - INFO - __main__ - Step 18: {'lr': 4.250000000000001e-06, 'samples': 3456, 'steps': 17, 'loss/train': 9.912551879882812} -08/30/2021 13:14:40 - INFO - __main__ - Step 19: {'lr': 4.5e-06, 'samples': 3648, 'steps': 18, 'loss/train': 9.928834915161133} -08/30/2021 13:14:40 - INFO - __main__ - Step 20: {'lr': 4.75e-06, 'samples': 3840, 'steps': 19, 'loss/train': 9.895331382751465} -08/30/2021 13:14:42 - INFO - __main__ - Step 21: {'lr': 5e-06, 'samples': 4032, 'steps': 20, 'loss/train': 9.97384262084961} -08/30/2021 13:14:42 - INFO - __main__ - Step 22: {'lr': 5.2500000000000006e-06, 'samples': 4224, 'steps': 21, 'loss/train': 9.905083656311035} -08/30/2021 13:14:43 - INFO - __main__ - Step 23: {'lr': 5.5e-06, 'samples': 4416, 'steps': 22, 'loss/train': 9.64094352722168} -08/30/2021 13:14:43 - INFO - __main__ - Step 24: {'lr': 5.75e-06, 'samples': 4608, 'steps': 23, 'loss/train': 9.791954040527344} -08/30/2021 13:14:44 - INFO - __main__ - Step 25: {'lr': 6e-06, 'samples': 4800, 'steps': 24, 'loss/train': 9.601712226867676} -08/30/2021 13:14:45 - INFO - __main__ - Step 26: {'lr': 6.25e-06, 'samples': 4992, 'steps': 25, 'loss/train': 9.53923225402832} -08/30/2021 13:14:46 - INFO - __main__ - Step 27: {'lr': 6.5e-06, 'samples': 5184, 'steps': 26, 'loss/train': 9.611143112182617} -08/30/2021 13:14:46 - INFO - __main__ - Step 28: {'lr': 6.75e-06, 'samples': 5376, 'steps': 27, 'loss/train': 9.653268814086914} -08/30/2021 13:14:46 - INFO - __main__ - Step 29: {'lr': 7e-06, 'samples': 5568, 'steps': 28, 'loss/train': 9.100192070007324} -08/30/2021 13:14:47 - INFO - __main__ - Step 30: {'lr': 7.250000000000001e-06, 'samples': 5760, 'steps': 29, 'loss/train': 9.508585929870605} -08/30/2021 13:14:49 - INFO - __main__ - Step 31: {'lr': 7.5e-06, 'samples': 5952, 'steps': 30, 'loss/train': 9.466412544250488} -08/30/2021 13:14:49 - INFO - __main__ - Step 32: {'lr': 7.75e-06, 'samples': 6144, 'steps': 31, 'loss/train': 9.346211433410645} -08/30/2021 13:14:49 - INFO - __main__ - Step 33: {'lr': 8e-06, 'samples': 6336, 'steps': 32, 'loss/train': 9.451282501220703} -08/30/2021 13:14:50 - INFO - __main__ - Step 34: {'lr': 8.25e-06, 'samples': 6528, 'steps': 33, 'loss/train': 9.759281158447266} -08/30/2021 13:14:50 - INFO - __main__ - Step 35: {'lr': 8.500000000000002e-06, 'samples': 6720, 'steps': 34, 'loss/train': 9.649574279785156} -08/30/2021 13:14:52 - INFO - __main__ - Step 36: {'lr': 8.750000000000001e-06, 'samples': 6912, 'steps': 35, 'loss/train': 9.331921577453613} -08/30/2021 13:14:53 - INFO - __main__ - Step 37: {'lr': 9e-06, 'samples': 7104, 'steps': 36, 'loss/train': 9.344559669494629} -08/30/2021 13:14:53 - INFO - __main__ - Step 38: {'lr': 9.25e-06, 'samples': 7296, 'steps': 37, 'loss/train': 9.458386421203613} -08/30/2021 13:14:53 - INFO - __main__ - Step 39: {'lr': 9.5e-06, 'samples': 7488, 'steps': 38, 'loss/train': 8.978026390075684} -08/30/2021 13:14:54 - INFO - __main__ - Step 40: {'lr': 9.75e-06, 'samples': 7680, 'steps': 39, 'loss/train': 9.016935348510742} -08/30/2021 13:14:55 - INFO - __main__ - Step 41: {'lr': 1e-05, 'samples': 7872, 'steps': 40, 'loss/train': 9.311957359313965} -08/30/2021 13:14:56 - INFO - __main__ - Step 42: {'lr': 1.025e-05, 'samples': 8064, 'steps': 41, 'loss/train': 9.269092559814453} -08/30/2021 13:14:56 - INFO - __main__ - Step 43: {'lr': 1.0500000000000001e-05, 'samples': 8256, 'steps': 42, 'loss/train': 9.038583755493164} -08/30/2021 13:14:56 - INFO - __main__ - Step 44: {'lr': 1.0749999999999999e-05, 'samples': 8448, 'steps': 43, 'loss/train': 8.843268394470215} -08/30/2021 13:14:57 - INFO - __main__ - Step 45: {'lr': 1.1e-05, 'samples': 8640, 'steps': 44, 'loss/train': 9.406013488769531} -08/30/2021 13:14:58 - INFO - __main__ - Step 46: {'lr': 1.1249999999999999e-05, 'samples': 8832, 'steps': 45, 'loss/train': 9.007134437561035} -08/30/2021 13:14:59 - INFO - __main__ - Step 47: {'lr': 1.15e-05, 'samples': 9024, 'steps': 46, 'loss/train': 9.294915199279785} -08/30/2021 13:14:59 - INFO - __main__ - Step 48: {'lr': 1.1750000000000001e-05, 'samples': 9216, 'steps': 47, 'loss/train': 9.259795188903809} -08/30/2021 13:15:00 - INFO - __main__ - Step 49: {'lr': 1.2e-05, 'samples': 9408, 'steps': 48, 'loss/train': 8.890713691711426} -08/30/2021 13:15:00 - INFO - __main__ - Step 50: {'lr': 1.2250000000000001e-05, 'samples': 9600, 'steps': 49, 'loss/train': 9.338799476623535} -08/30/2021 13:15:00 - INFO - __main__ - Step 51: {'lr': 1.25e-05, 'samples': 9792, 'steps': 50, 'loss/train': 8.270134925842285} -08/30/2021 13:15:02 - INFO - __main__ - Step 52: {'lr': 1.275e-05, 'samples': 9984, 'steps': 51, 'loss/train': 9.038247108459473} -08/30/2021 13:15:02 - INFO - __main__ - Step 53: {'lr': 1.3e-05, 'samples': 10176, 'steps': 52, 'loss/train': 8.898700714111328} -08/30/2021 13:15:03 - INFO - __main__ - Step 54: {'lr': 1.325e-05, 'samples': 10368, 'steps': 53, 'loss/train': 8.948592185974121} -08/30/2021 13:15:03 - INFO - __main__ - Step 55: {'lr': 1.35e-05, 'samples': 10560, 'steps': 54, 'loss/train': 9.279808044433594} -08/30/2021 13:15:03 - INFO - __main__ - Step 56: {'lr': 1.375e-05, 'samples': 10752, 'steps': 55, 'loss/train': 7.908687591552734} -08/30/2021 13:15:05 - INFO - __main__ - Step 57: {'lr': 1.4e-05, 'samples': 10944, 'steps': 56, 'loss/train': 8.963644981384277} -08/30/2021 13:15:05 - INFO - __main__ - Step 58: {'lr': 1.425e-05, 'samples': 11136, 'steps': 57, 'loss/train': 8.764342308044434} -08/30/2021 13:15:06 - INFO - __main__ - Step 59: {'lr': 1.4500000000000002e-05, 'samples': 11328, 'steps': 58, 'loss/train': 8.986572265625} -08/30/2021 13:15:06 - INFO - __main__ - Step 60: {'lr': 1.475e-05, 'samples': 11520, 'steps': 59, 'loss/train': 8.97697639465332} -08/30/2021 13:15:06 - INFO - __main__ - Step 61: {'lr': 1.5e-05, 'samples': 11712, 'steps': 60, 'loss/train': 8.946927070617676} -08/30/2021 13:15:08 - INFO - __main__ - Step 62: {'lr': 1.525e-05, 'samples': 11904, 'steps': 61, 'loss/train': 9.006952285766602} -08/30/2021 13:15:08 - INFO - __main__ - Step 63: {'lr': 1.55e-05, 'samples': 12096, 'steps': 62, 'loss/train': 8.8870849609375} -08/30/2021 13:15:09 - INFO - __main__ - Step 64: {'lr': 1.575e-05, 'samples': 12288, 'steps': 63, 'loss/train': 8.90562915802002} -08/30/2021 13:15:09 - INFO - __main__ - Step 65: {'lr': 1.6e-05, 'samples': 12480, 'steps': 64, 'loss/train': 8.861169815063477} -08/30/2021 13:15:09 - INFO - __main__ - Step 66: {'lr': 1.6250000000000002e-05, 'samples': 12672, 'steps': 65, 'loss/train': 8.712646484375} -08/30/2021 13:15:11 - INFO - __main__ - Step 67: {'lr': 1.65e-05, 'samples': 12864, 'steps': 66, 'loss/train': 8.782997131347656} -08/30/2021 13:15:12 - INFO - __main__ - Step 68: {'lr': 1.675e-05, 'samples': 13056, 'steps': 67, 'loss/train': 8.86316204071045} -08/30/2021 13:15:12 - INFO - __main__ - Step 69: {'lr': 1.7000000000000003e-05, 'samples': 13248, 'steps': 68, 'loss/train': 8.866331100463867} -08/30/2021 13:15:12 - INFO - __main__ - Step 70: {'lr': 1.7250000000000003e-05, 'samples': 13440, 'steps': 69, 'loss/train': 8.66346549987793} -08/30/2021 13:15:13 - INFO - __main__ - Step 71: {'lr': 1.7500000000000002e-05, 'samples': 13632, 'steps': 70, 'loss/train': 8.741483688354492} -08/30/2021 13:15:14 - INFO - __main__ - Step 72: {'lr': 1.7749999999999998e-05, 'samples': 13824, 'steps': 71, 'loss/train': 8.24655532836914} -08/30/2021 13:15:15 - INFO - __main__ - Step 73: {'lr': 1.8e-05, 'samples': 14016, 'steps': 72, 'loss/train': 8.648695945739746} -08/30/2021 13:15:15 - INFO - __main__ - Step 74: {'lr': 1.825e-05, 'samples': 14208, 'steps': 73, 'loss/train': 8.465259552001953} -08/30/2021 13:15:15 - INFO - __main__ - Step 75: {'lr': 1.85e-05, 'samples': 14400, 'steps': 74, 'loss/train': 8.739703178405762} -08/30/2021 13:15:16 - INFO - __main__ - Step 76: {'lr': 1.875e-05, 'samples': 14592, 'steps': 75, 'loss/train': 8.829558372497559} -08/30/2021 13:15:17 - INFO - __main__ - Step 77: {'lr': 1.9e-05, 'samples': 14784, 'steps': 76, 'loss/train': 7.585636615753174} -08/30/2021 13:15:18 - INFO - __main__ - Step 78: {'lr': 1.925e-05, 'samples': 14976, 'steps': 77, 'loss/train': 8.732975006103516} -08/30/2021 13:15:18 - INFO - __main__ - Step 79: {'lr': 1.95e-05, 'samples': 15168, 'steps': 78, 'loss/train': 8.731362342834473} -08/30/2021 13:15:19 - INFO - __main__ - Step 80: {'lr': 1.975e-05, 'samples': 15360, 'steps': 79, 'loss/train': 8.499696731567383} -08/30/2021 13:15:19 - INFO - __main__ - Step 81: {'lr': 2e-05, 'samples': 15552, 'steps': 80, 'loss/train': 9.014501571655273} -08/30/2021 13:15:19 - INFO - __main__ - Step 82: {'lr': 2.025e-05, 'samples': 15744, 'steps': 81, 'loss/train': 8.513715744018555} -08/30/2021 13:15:21 - INFO - __main__ - Step 83: {'lr': 2.05e-05, 'samples': 15936, 'steps': 82, 'loss/train': 8.84457778930664} -08/30/2021 13:15:21 - INFO - __main__ - Step 84: {'lr': 2.0750000000000003e-05, 'samples': 16128, 'steps': 83, 'loss/train': 8.340596199035645} -08/30/2021 13:15:22 - INFO - __main__ - Step 85: {'lr': 2.1000000000000002e-05, 'samples': 16320, 'steps': 84, 'loss/train': 8.586440086364746} -08/30/2021 13:15:22 - INFO - __main__ - Step 86: {'lr': 2.125e-05, 'samples': 16512, 'steps': 85, 'loss/train': 8.27778148651123} -08/30/2021 13:15:22 - INFO - __main__ - Step 87: {'lr': 2.1499999999999997e-05, 'samples': 16704, 'steps': 86, 'loss/train': 8.524147987365723} -08/30/2021 13:15:24 - INFO - __main__ - Step 88: {'lr': 2.175e-05, 'samples': 16896, 'steps': 87, 'loss/train': 8.412591934204102} -08/30/2021 13:15:25 - INFO - __main__ - Step 89: {'lr': 2.2e-05, 'samples': 17088, 'steps': 88, 'loss/train': 8.645748138427734} -08/30/2021 13:15:25 - INFO - __main__ - Step 90: {'lr': 2.225e-05, 'samples': 17280, 'steps': 89, 'loss/train': 8.578646659851074} -08/30/2021 13:15:25 - INFO - __main__ - Step 91: {'lr': 2.2499999999999998e-05, 'samples': 17472, 'steps': 90, 'loss/train': 8.59123420715332} -08/30/2021 13:15:26 - INFO - __main__ - Step 92: {'lr': 2.275e-05, 'samples': 17664, 'steps': 91, 'loss/train': 9.487090110778809} -08/30/2021 13:15:26 - INFO - __main__ - Step 93: {'lr': 2.3e-05, 'samples': 17856, 'steps': 92, 'loss/train': 8.676104545593262} -08/30/2021 13:15:26 - INFO - __main__ - Step 94: {'lr': 2.325e-05, 'samples': 18048, 'steps': 93, 'loss/train': 8.010075569152832} -08/30/2021 13:15:29 - INFO - __main__ - Step 95: {'lr': 2.3500000000000002e-05, 'samples': 18240, 'steps': 94, 'loss/train': 8.484045028686523} -08/30/2021 13:15:29 - INFO - __main__ - Step 96: {'lr': 2.375e-05, 'samples': 18432, 'steps': 95, 'loss/train': 8.230620384216309} -08/30/2021 13:15:29 - INFO - __main__ - Step 97: {'lr': 2.4e-05, 'samples': 18624, 'steps': 96, 'loss/train': 8.564264297485352} -08/30/2021 13:15:30 - INFO - __main__ - Step 98: {'lr': 2.425e-05, 'samples': 18816, 'steps': 97, 'loss/train': 8.579083442687988} -08/30/2021 13:15:30 - INFO - __main__ - Step 99: {'lr': 2.4500000000000003e-05, 'samples': 19008, 'steps': 98, 'loss/train': 8.529154777526855} -08/30/2021 13:15:32 - INFO - __main__ - Step 100: {'lr': 2.4750000000000002e-05, 'samples': 19200, 'steps': 99, 'loss/train': 8.343099594116211} -08/30/2021 13:15:32 - INFO - __main__ - Step 101: {'lr': 2.5e-05, 'samples': 19392, 'steps': 100, 'loss/train': 8.50272274017334} -08/30/2021 13:15:32 - INFO - __main__ - Step 102: {'lr': 2.525e-05, 'samples': 19584, 'steps': 101, 'loss/train': 8.26205825805664} -08/30/2021 13:15:33 - INFO - __main__ - Step 103: {'lr': 2.55e-05, 'samples': 19776, 'steps': 102, 'loss/train': 8.597186088562012} -08/30/2021 13:15:33 - INFO - __main__ - Step 104: {'lr': 2.575e-05, 'samples': 19968, 'steps': 103, 'loss/train': 8.398731231689453} -08/30/2021 13:15:35 - INFO - __main__ - Step 105: {'lr': 2.6e-05, 'samples': 20160, 'steps': 104, 'loss/train': 7.961066246032715} -08/30/2021 13:15:35 - INFO - __main__ - Step 106: {'lr': 2.625e-05, 'samples': 20352, 'steps': 105, 'loss/train': 8.320724487304688} -08/30/2021 13:15:35 - INFO - __main__ - Step 107: {'lr': 2.65e-05, 'samples': 20544, 'steps': 106, 'loss/train': 9.094656944274902} -08/30/2021 13:15:36 - INFO - __main__ - Step 108: {'lr': 2.675e-05, 'samples': 20736, 'steps': 107, 'loss/train': 8.722951889038086} -08/30/2021 13:15:36 - INFO - __main__ - Step 109: {'lr': 2.7e-05, 'samples': 20928, 'steps': 108, 'loss/train': 8.294156074523926} -08/30/2021 13:15:38 - INFO - __main__ - Step 110: {'lr': 2.725e-05, 'samples': 21120, 'steps': 109, 'loss/train': 8.313566207885742} -08/30/2021 13:15:38 - INFO - __main__ - Step 111: {'lr': 2.75e-05, 'samples': 21312, 'steps': 110, 'loss/train': 8.41221809387207} -08/30/2021 13:15:39 - INFO - __main__ - Step 112: {'lr': 2.775e-05, 'samples': 21504, 'steps': 111, 'loss/train': 8.197552680969238} -08/30/2021 13:15:39 - INFO - __main__ - Step 113: {'lr': 2.8e-05, 'samples': 21696, 'steps': 112, 'loss/train': 7.915801048278809} -08/30/2021 13:15:39 - INFO - __main__ - Step 114: {'lr': 2.8250000000000002e-05, 'samples': 21888, 'steps': 113, 'loss/train': 8.26795768737793} -08/30/2021 13:15:40 - INFO - __main__ - Step 115: {'lr': 2.85e-05, 'samples': 22080, 'steps': 114, 'loss/train': 8.088530540466309} -08/30/2021 13:15:41 - INFO - __main__ - Step 116: {'lr': 2.875e-05, 'samples': 22272, 'steps': 115, 'loss/train': 8.1422700881958} -08/30/2021 13:15:42 - INFO - __main__ - Step 117: {'lr': 2.9000000000000004e-05, 'samples': 22464, 'steps': 116, 'loss/train': 7.825667381286621} -08/30/2021 13:15:42 - INFO - __main__ - Step 118: {'lr': 2.9250000000000003e-05, 'samples': 22656, 'steps': 117, 'loss/train': 8.091445922851562} -08/30/2021 13:15:42 - INFO - __main__ - Step 119: {'lr': 2.95e-05, 'samples': 22848, 'steps': 118, 'loss/train': 8.04175853729248} -08/30/2021 13:15:43 - INFO - __main__ - Step 120: {'lr': 2.9749999999999998e-05, 'samples': 23040, 'steps': 119, 'loss/train': 8.295466423034668} -08/30/2021 13:15:44 - INFO - __main__ - Step 121: {'lr': 3e-05, 'samples': 23232, 'steps': 120, 'loss/train': 7.831602096557617} -08/30/2021 13:15:44 - INFO - __main__ - Step 122: {'lr': 3.025e-05, 'samples': 23424, 'steps': 121, 'loss/train': 7.929701328277588} -08/30/2021 13:15:45 - INFO - __main__ - Step 123: {'lr': 3.05e-05, 'samples': 23616, 'steps': 122, 'loss/train': 8.287981033325195} -08/30/2021 13:15:45 - INFO - __main__ - Step 124: {'lr': 3.075e-05, 'samples': 23808, 'steps': 123, 'loss/train': 8.041546821594238} -08/30/2021 13:15:45 - INFO - __main__ - Step 125: {'lr': 3.1e-05, 'samples': 24000, 'steps': 124, 'loss/train': 7.768130302429199} -08/30/2021 13:15:47 - INFO - __main__ - Step 126: {'lr': 3.125e-05, 'samples': 24192, 'steps': 125, 'loss/train': 8.019730567932129} -08/30/2021 13:15:47 - INFO - __main__ - Step 127: {'lr': 3.15e-05, 'samples': 24384, 'steps': 126, 'loss/train': 8.072555541992188} -08/30/2021 13:15:48 - INFO - __main__ - Step 128: {'lr': 3.175e-05, 'samples': 24576, 'steps': 127, 'loss/train': 7.807083606719971} -08/30/2021 13:15:48 - INFO - __main__ - Step 129: {'lr': 3.2e-05, 'samples': 24768, 'steps': 128, 'loss/train': 7.171544551849365} -08/30/2021 13:15:48 - INFO - __main__ - Step 130: {'lr': 3.2250000000000005e-05, 'samples': 24960, 'steps': 129, 'loss/train': 7.535074710845947} -08/30/2021 13:15:50 - INFO - __main__ - Step 131: {'lr': 3.2500000000000004e-05, 'samples': 25152, 'steps': 130, 'loss/train': 8.027023315429688} -08/30/2021 13:15:51 - INFO - __main__ - Step 132: {'lr': 3.275e-05, 'samples': 25344, 'steps': 131, 'loss/train': 7.754735469818115} -08/30/2021 13:15:51 - INFO - __main__ - Step 133: {'lr': 3.3e-05, 'samples': 25536, 'steps': 132, 'loss/train': 7.7708282470703125} -08/30/2021 13:15:51 - INFO - __main__ - Step 134: {'lr': 3.325e-05, 'samples': 25728, 'steps': 133, 'loss/train': 7.703486919403076} -08/30/2021 13:15:52 - INFO - __main__ - Step 135: {'lr': 3.35e-05, 'samples': 25920, 'steps': 134, 'loss/train': 7.797639846801758} -08/30/2021 13:15:53 - INFO - __main__ - Step 136: {'lr': 3.375e-05, 'samples': 26112, 'steps': 135, 'loss/train': 7.808203220367432} -08/30/2021 13:15:54 - INFO - __main__ - Step 137: {'lr': 3.4000000000000007e-05, 'samples': 26304, 'steps': 136, 'loss/train': 7.523798942565918} -08/30/2021 13:15:54 - INFO - __main__ - Step 138: {'lr': 3.4250000000000006e-05, 'samples': 26496, 'steps': 137, 'loss/train': 7.6538214683532715} -08/30/2021 13:15:54 - INFO - __main__ - Step 139: {'lr': 3.4500000000000005e-05, 'samples': 26688, 'steps': 138, 'loss/train': 7.683449745178223} -08/30/2021 13:15:55 - INFO - __main__ - Step 140: {'lr': 3.4750000000000004e-05, 'samples': 26880, 'steps': 139, 'loss/train': 7.692724227905273} -08/30/2021 13:15:55 - INFO - __main__ - Step 141: {'lr': 3.5000000000000004e-05, 'samples': 27072, 'steps': 140, 'loss/train': 7.852876663208008} -08/30/2021 13:15:57 - INFO - __main__ - Step 142: {'lr': 3.5249999999999996e-05, 'samples': 27264, 'steps': 141, 'loss/train': 7.375845909118652} -08/30/2021 13:15:57 - INFO - __main__ - Step 143: {'lr': 3.5499999999999996e-05, 'samples': 27456, 'steps': 142, 'loss/train': 7.803616523742676} -08/30/2021 13:15:58 - INFO - __main__ - Step 144: {'lr': 3.5749999999999995e-05, 'samples': 27648, 'steps': 143, 'loss/train': 8.747018814086914} -08/30/2021 13:15:58 - INFO - __main__ - Step 145: {'lr': 3.6e-05, 'samples': 27840, 'steps': 144, 'loss/train': 7.117000579833984} -08/30/2021 13:15:58 - INFO - __main__ - Step 146: {'lr': 3.625e-05, 'samples': 28032, 'steps': 145, 'loss/train': 7.414916038513184} -08/30/2021 13:16:01 - INFO - __main__ - Step 147: {'lr': 3.65e-05, 'samples': 28224, 'steps': 146, 'loss/train': 8.180768966674805} -08/30/2021 13:16:01 - INFO - __main__ - Step 148: {'lr': 3.675e-05, 'samples': 28416, 'steps': 147, 'loss/train': 7.569336891174316} -08/30/2021 13:16:02 - INFO - __main__ - Step 149: {'lr': 3.7e-05, 'samples': 28608, 'steps': 148, 'loss/train': 7.721749782562256} -08/30/2021 13:16:02 - INFO - __main__ - Step 150: {'lr': 3.725e-05, 'samples': 28800, 'steps': 149, 'loss/train': 9.089354515075684} -08/30/2021 13:16:02 - INFO - __main__ - Step 151: {'lr': 3.75e-05, 'samples': 28992, 'steps': 150, 'loss/train': 7.522524356842041} -08/30/2021 13:16:03 - INFO - __main__ - Step 152: {'lr': 3.775e-05, 'samples': 29184, 'steps': 151, 'loss/train': 6.467438220977783} -08/30/2021 13:16:04 - INFO - __main__ - Step 153: {'lr': 3.8e-05, 'samples': 29376, 'steps': 152, 'loss/train': 8.00661563873291} -08/30/2021 13:16:05 - INFO - __main__ - Step 154: {'lr': 3.825e-05, 'samples': 29568, 'steps': 153, 'loss/train': 8.649490356445312} -08/30/2021 13:16:05 - INFO - __main__ - Step 155: {'lr': 3.85e-05, 'samples': 29760, 'steps': 154, 'loss/train': 7.1845011711120605} -08/30/2021 13:16:06 - INFO - __main__ - Step 156: {'lr': 3.875e-05, 'samples': 29952, 'steps': 155, 'loss/train': 7.420681953430176} -08/30/2021 13:16:06 - INFO - __main__ - Step 157: {'lr': 3.9e-05, 'samples': 30144, 'steps': 156, 'loss/train': 7.687047004699707} -08/30/2021 13:16:06 - INFO - __main__ - Step 158: {'lr': 3.925e-05, 'samples': 30336, 'steps': 157, 'loss/train': 7.417532920837402} -08/30/2021 13:16:08 - INFO - __main__ - Step 159: {'lr': 3.95e-05, 'samples': 30528, 'steps': 158, 'loss/train': 7.372868537902832} -08/30/2021 13:16:08 - INFO - __main__ - Step 160: {'lr': 3.9750000000000004e-05, 'samples': 30720, 'steps': 159, 'loss/train': 7.476993560791016} -08/30/2021 13:16:09 - INFO - __main__ - Step 161: {'lr': 4e-05, 'samples': 30912, 'steps': 160, 'loss/train': 7.318636894226074} -08/30/2021 13:16:09 - INFO - __main__ - Step 162: {'lr': 4.025e-05, 'samples': 31104, 'steps': 161, 'loss/train': 6.126968860626221} -08/30/2021 13:16:09 - INFO - __main__ - Step 163: {'lr': 4.05e-05, 'samples': 31296, 'steps': 162, 'loss/train': 7.044919490814209} -08/30/2021 13:16:11 - INFO - __main__ - Step 164: {'lr': 4.075e-05, 'samples': 31488, 'steps': 163, 'loss/train': 7.408450126647949} -08/30/2021 13:16:11 - INFO - __main__ - Step 165: {'lr': 4.1e-05, 'samples': 31680, 'steps': 164, 'loss/train': 7.306212902069092} -08/30/2021 13:16:12 - INFO - __main__ - Step 166: {'lr': 4.125e-05, 'samples': 31872, 'steps': 165, 'loss/train': 7.709270000457764} -08/30/2021 13:16:12 - INFO - __main__ - Step 167: {'lr': 4.1500000000000006e-05, 'samples': 32064, 'steps': 166, 'loss/train': 8.131908416748047} -08/30/2021 13:16:12 - INFO - __main__ - Step 168: {'lr': 4.1750000000000005e-05, 'samples': 32256, 'steps': 167, 'loss/train': 7.362995624542236} -08/30/2021 13:16:14 - INFO - __main__ - Step 169: {'lr': 4.2000000000000004e-05, 'samples': 32448, 'steps': 168, 'loss/train': 7.193559646606445} -08/30/2021 13:16:14 - INFO - __main__ - Step 170: {'lr': 4.2250000000000004e-05, 'samples': 32640, 'steps': 169, 'loss/train': 7.005338191986084} -08/30/2021 13:16:15 - INFO - __main__ - Step 171: {'lr': 4.25e-05, 'samples': 32832, 'steps': 170, 'loss/train': 7.036742687225342} -08/30/2021 13:16:15 - INFO - __main__ - Step 172: {'lr': 4.275e-05, 'samples': 33024, 'steps': 171, 'loss/train': 7.050740718841553} -08/30/2021 13:16:15 - INFO - __main__ - Step 173: {'lr': 4.2999999999999995e-05, 'samples': 33216, 'steps': 172, 'loss/train': 6.541714191436768} -08/30/2021 13:16:16 - INFO - __main__ - Step 174: {'lr': 4.325e-05, 'samples': 33408, 'steps': 173, 'loss/train': 6.680890083312988} -08/30/2021 13:16:17 - INFO - __main__ - Step 175: {'lr': 4.35e-05, 'samples': 33600, 'steps': 174, 'loss/train': 8.720884323120117} -08/30/2021 13:16:18 - INFO - __main__ - Step 176: {'lr': 4.375e-05, 'samples': 33792, 'steps': 175, 'loss/train': 7.001683235168457} -08/30/2021 13:16:18 - INFO - __main__ - Step 177: {'lr': 4.4e-05, 'samples': 33984, 'steps': 176, 'loss/train': 7.472266674041748} -08/30/2021 13:16:19 - INFO - __main__ - Step 178: {'lr': 4.425e-05, 'samples': 34176, 'steps': 177, 'loss/train': 8.132484436035156} -08/30/2021 13:16:19 - INFO - __main__ - Step 179: {'lr': 4.45e-05, 'samples': 34368, 'steps': 178, 'loss/train': 7.092846393585205} -08/30/2021 13:16:20 - INFO - __main__ - Step 180: {'lr': 4.475e-05, 'samples': 34560, 'steps': 179, 'loss/train': 7.776556015014648} -08/30/2021 13:16:21 - INFO - __main__ - Step 181: {'lr': 4.4999999999999996e-05, 'samples': 34752, 'steps': 180, 'loss/train': 6.613148212432861} -08/30/2021 13:16:21 - INFO - __main__ - Step 182: {'lr': 4.525e-05, 'samples': 34944, 'steps': 181, 'loss/train': 6.981738567352295} -08/30/2021 13:16:22 - INFO - __main__ - Step 183: {'lr': 4.55e-05, 'samples': 35136, 'steps': 182, 'loss/train': 7.218873500823975} -08/30/2021 13:16:22 - INFO - __main__ - Step 184: {'lr': 4.575e-05, 'samples': 35328, 'steps': 183, 'loss/train': 7.0679473876953125} -08/30/2021 13:16:24 - INFO - __main__ - Step 185: {'lr': 4.6e-05, 'samples': 35520, 'steps': 184, 'loss/train': 6.852197170257568} -08/30/2021 13:16:24 - INFO - __main__ - Step 186: {'lr': 4.625e-05, 'samples': 35712, 'steps': 185, 'loss/train': 6.924624919891357} -08/30/2021 13:16:24 - INFO - __main__ - Step 187: {'lr': 4.65e-05, 'samples': 35904, 'steps': 186, 'loss/train': 7.059135913848877} -08/30/2021 13:16:25 - INFO - __main__ - Step 188: {'lr': 4.675e-05, 'samples': 36096, 'steps': 187, 'loss/train': 8.635014533996582} -08/30/2021 13:16:25 - INFO - __main__ - Step 189: {'lr': 4.7000000000000004e-05, 'samples': 36288, 'steps': 188, 'loss/train': 7.537959575653076} -08/30/2021 13:16:25 - INFO - __main__ - Step 190: {'lr': 4.725e-05, 'samples': 36480, 'steps': 189, 'loss/train': 6.609078884124756} -08/30/2021 13:16:27 - INFO - __main__ - Step 191: {'lr': 4.75e-05, 'samples': 36672, 'steps': 190, 'loss/train': 6.9301300048828125} -08/30/2021 13:16:27 - INFO - __main__ - Step 192: {'lr': 4.775e-05, 'samples': 36864, 'steps': 191, 'loss/train': 7.088875770568848} -08/30/2021 13:16:28 - INFO - __main__ - Step 193: {'lr': 4.8e-05, 'samples': 37056, 'steps': 192, 'loss/train': 6.6858696937561035} -08/30/2021 13:16:28 - INFO - __main__ - Step 194: {'lr': 4.825e-05, 'samples': 37248, 'steps': 193, 'loss/train': 7.036083698272705} -08/30/2021 13:16:28 - INFO - __main__ - Step 195: {'lr': 4.85e-05, 'samples': 37440, 'steps': 194, 'loss/train': 6.408541679382324} -08/30/2021 13:16:30 - INFO - __main__ - Step 196: {'lr': 4.8750000000000006e-05, 'samples': 37632, 'steps': 195, 'loss/train': 7.12893533706665} -08/30/2021 13:16:31 - INFO - __main__ - Step 197: {'lr': 4.9000000000000005e-05, 'samples': 37824, 'steps': 196, 'loss/train': 6.899067401885986} -08/30/2021 13:16:31 - INFO - __main__ - Step 198: {'lr': 4.9250000000000004e-05, 'samples': 38016, 'steps': 197, 'loss/train': 6.713313102722168} -08/30/2021 13:16:32 - INFO - __main__ - Step 199: {'lr': 4.9500000000000004e-05, 'samples': 38208, 'steps': 198, 'loss/train': 6.786980628967285} -08/30/2021 13:16:32 - INFO - __main__ - Step 200: {'lr': 4.975e-05, 'samples': 38400, 'steps': 199, 'loss/train': 7.545706748962402} -08/30/2021 13:16:32 - INFO - __main__ - Step 201: {'lr': 5e-05, 'samples': 38592, 'steps': 200, 'loss/train': 6.757307052612305} -08/30/2021 13:16:34 - INFO - __main__ - Step 202: {'lr': 5.025e-05, 'samples': 38784, 'steps': 201, 'loss/train': 6.9278669357299805} -08/30/2021 13:16:35 - INFO - __main__ - Step 203: {'lr': 5.05e-05, 'samples': 38976, 'steps': 202, 'loss/train': 6.424849987030029} -08/30/2021 13:16:35 - INFO - __main__ - Step 204: {'lr': 5.075000000000001e-05, 'samples': 39168, 'steps': 203, 'loss/train': 6.568314075469971} -08/30/2021 13:16:35 - INFO - __main__ - Step 205: {'lr': 5.1e-05, 'samples': 39360, 'steps': 204, 'loss/train': 6.462455749511719} -08/30/2021 13:16:36 - INFO - __main__ - Step 206: {'lr': 5.125e-05, 'samples': 39552, 'steps': 205, 'loss/train': 6.838433265686035} -08/30/2021 13:16:36 - INFO - __main__ - Step 207: {'lr': 5.15e-05, 'samples': 39744, 'steps': 206, 'loss/train': 6.531557559967041} -08/30/2021 13:16:38 - INFO - __main__ - Step 208: {'lr': 5.175e-05, 'samples': 39936, 'steps': 207, 'loss/train': 6.422881126403809} -08/30/2021 13:16:38 - INFO - __main__ - Step 209: {'lr': 5.2e-05, 'samples': 40128, 'steps': 208, 'loss/train': 5.729274272918701} -08/30/2021 13:16:39 - INFO - __main__ - Step 210: {'lr': 5.2249999999999996e-05, 'samples': 40320, 'steps': 209, 'loss/train': 5.9838175773620605} -08/30/2021 13:16:39 - INFO - __main__ - Step 211: {'lr': 5.25e-05, 'samples': 40512, 'steps': 210, 'loss/train': 6.901343822479248} -08/30/2021 13:16:39 - INFO - __main__ - Step 212: {'lr': 5.275e-05, 'samples': 40704, 'steps': 211, 'loss/train': 7.349523544311523} -08/30/2021 13:16:40 - INFO - __main__ - Step 213: {'lr': 5.3e-05, 'samples': 40896, 'steps': 212, 'loss/train': 6.588607311248779} -08/30/2021 13:16:42 - INFO - __main__ - Step 214: {'lr': 5.325e-05, 'samples': 41088, 'steps': 213, 'loss/train': 6.809523582458496} -08/30/2021 13:16:42 - INFO - __main__ - Step 215: {'lr': 5.35e-05, 'samples': 41280, 'steps': 214, 'loss/train': 6.712080478668213} -08/30/2021 13:16:43 - INFO - __main__ - Step 216: {'lr': 5.375e-05, 'samples': 41472, 'steps': 215, 'loss/train': 7.01638126373291} -08/30/2021 13:16:43 - INFO - __main__ - Step 217: {'lr': 5.4e-05, 'samples': 41664, 'steps': 216, 'loss/train': 6.674835681915283} -08/30/2021 13:16:43 - INFO - __main__ - Step 218: {'lr': 5.4250000000000004e-05, 'samples': 41856, 'steps': 217, 'loss/train': 5.89940881729126} -08/30/2021 13:16:44 - INFO - __main__ - Step 219: {'lr': 5.45e-05, 'samples': 42048, 'steps': 218, 'loss/train': 6.69445276260376} -08/30/2021 13:16:44 - INFO - __main__ - Step 220: {'lr': 5.475e-05, 'samples': 42240, 'steps': 219, 'loss/train': 6.964169025421143} -08/30/2021 13:16:46 - INFO - __main__ - Step 221: {'lr': 5.5e-05, 'samples': 42432, 'steps': 220, 'loss/train': 5.135345935821533} -08/30/2021 13:16:46 - INFO - __main__ - Step 222: {'lr': 5.525e-05, 'samples': 42624, 'steps': 221, 'loss/train': 6.899173259735107} -08/30/2021 13:16:47 - INFO - __main__ - Step 223: {'lr': 5.55e-05, 'samples': 42816, 'steps': 222, 'loss/train': 4.228754043579102} -08/30/2021 13:16:47 - INFO - __main__ - Step 224: {'lr': 5.575e-05, 'samples': 43008, 'steps': 223, 'loss/train': 1.7641043663024902} -08/30/2021 13:16:47 - INFO - __main__ - Step 225: {'lr': 5.6e-05, 'samples': 43200, 'steps': 224, 'loss/train': 6.569450378417969} -08/30/2021 13:16:48 - INFO - __main__ - Step 226: {'lr': 5.6250000000000005e-05, 'samples': 43392, 'steps': 225, 'loss/train': 7.532073974609375} -08/30/2021 13:16:49 - INFO - __main__ - Step 227: {'lr': 5.6500000000000005e-05, 'samples': 43584, 'steps': 226, 'loss/train': 6.195535182952881} -08/30/2021 13:16:49 - INFO - __main__ - Step 228: {'lr': 5.6750000000000004e-05, 'samples': 43776, 'steps': 227, 'loss/train': 6.496519088745117} -08/30/2021 13:16:50 - INFO - __main__ - Step 229: {'lr': 5.7e-05, 'samples': 43968, 'steps': 228, 'loss/train': 6.168381214141846} -08/30/2021 13:16:50 - INFO - __main__ - Step 230: {'lr': 5.725e-05, 'samples': 44160, 'steps': 229, 'loss/train': 7.491093635559082} -08/30/2021 13:16:51 - INFO - __main__ - Step 231: {'lr': 5.75e-05, 'samples': 44352, 'steps': 230, 'loss/train': 7.151771068572998} -08/30/2021 13:16:52 - INFO - __main__ - Step 232: {'lr': 5.775e-05, 'samples': 44544, 'steps': 231, 'loss/train': 6.826668739318848} -08/30/2021 13:16:53 - INFO - __main__ - Step 233: {'lr': 5.800000000000001e-05, 'samples': 44736, 'steps': 232, 'loss/train': 6.619130611419678} -08/30/2021 13:16:53 - INFO - __main__ - Step 234: {'lr': 5.8250000000000006e-05, 'samples': 44928, 'steps': 233, 'loss/train': 6.137080192565918} -08/30/2021 13:16:53 - INFO - __main__ - Step 235: {'lr': 5.8500000000000006e-05, 'samples': 45120, 'steps': 234, 'loss/train': 6.702738285064697} -08/30/2021 13:16:54 - INFO - __main__ - Step 236: {'lr': 5.875e-05, 'samples': 45312, 'steps': 235, 'loss/train': 6.450294494628906} -08/30/2021 13:16:55 - INFO - __main__ - Step 237: {'lr': 5.9e-05, 'samples': 45504, 'steps': 236, 'loss/train': 6.517692565917969} -08/30/2021 13:16:55 - INFO - __main__ - Step 238: {'lr': 5.925e-05, 'samples': 45696, 'steps': 237, 'loss/train': 6.6421098709106445} -08/30/2021 13:16:56 - INFO - __main__ - Step 239: {'lr': 5.9499999999999996e-05, 'samples': 45888, 'steps': 238, 'loss/train': 6.984536647796631} -08/30/2021 13:16:56 - INFO - __main__ - Step 240: {'lr': 5.9749999999999995e-05, 'samples': 46080, 'steps': 239, 'loss/train': 6.613828659057617} -08/30/2021 13:16:57 - INFO - __main__ - Step 241: {'lr': 6e-05, 'samples': 46272, 'steps': 240, 'loss/train': 6.637491226196289} -08/30/2021 13:16:57 - INFO - __main__ - Step 242: {'lr': 6.025e-05, 'samples': 46464, 'steps': 241, 'loss/train': 6.738170623779297} -08/30/2021 13:16:59 - INFO - __main__ - Step 243: {'lr': 6.05e-05, 'samples': 46656, 'steps': 242, 'loss/train': 6.628913879394531} -08/30/2021 13:16:59 - INFO - __main__ - Step 244: {'lr': 6.075e-05, 'samples': 46848, 'steps': 243, 'loss/train': 6.514838218688965} -08/30/2021 13:17:00 - INFO - __main__ - Step 245: {'lr': 6.1e-05, 'samples': 47040, 'steps': 244, 'loss/train': 6.199484825134277} -08/30/2021 13:17:00 - INFO - __main__ - Step 246: {'lr': 6.125e-05, 'samples': 47232, 'steps': 245, 'loss/train': 7.448530197143555} -08/30/2021 13:17:00 - INFO - __main__ - Step 247: {'lr': 6.15e-05, 'samples': 47424, 'steps': 246, 'loss/train': 6.739471435546875} -08/30/2021 13:17:02 - INFO - __main__ - Step 248: {'lr': 6.175e-05, 'samples': 47616, 'steps': 247, 'loss/train': 6.479034423828125} -08/30/2021 13:17:02 - INFO - __main__ - Step 249: {'lr': 6.2e-05, 'samples': 47808, 'steps': 248, 'loss/train': 6.803154468536377} -08/30/2021 13:17:03 - INFO - __main__ - Step 250: {'lr': 6.225e-05, 'samples': 48000, 'steps': 249, 'loss/train': 6.7155585289001465} -08/30/2021 13:17:03 - INFO - __main__ - Step 251: {'lr': 6.25e-05, 'samples': 48192, 'steps': 250, 'loss/train': 7.329843997955322} -08/30/2021 13:17:03 - INFO - __main__ - Step 252: {'lr': 6.275000000000001e-05, 'samples': 48384, 'steps': 251, 'loss/train': 6.693150520324707} -08/30/2021 13:17:05 - INFO - __main__ - Step 253: {'lr': 6.3e-05, 'samples': 48576, 'steps': 252, 'loss/train': 6.362494468688965} -08/30/2021 13:17:05 - INFO - __main__ - Step 254: {'lr': 6.325e-05, 'samples': 48768, 'steps': 253, 'loss/train': 6.805384159088135} -08/30/2021 13:17:05 - INFO - __main__ - Step 255: {'lr': 6.35e-05, 'samples': 48960, 'steps': 254, 'loss/train': 6.727595806121826} -08/30/2021 13:17:06 - INFO - __main__ - Step 256: {'lr': 6.375e-05, 'samples': 49152, 'steps': 255, 'loss/train': 6.758667945861816} -08/30/2021 13:17:06 - INFO - __main__ - Step 257: {'lr': 6.4e-05, 'samples': 49344, 'steps': 256, 'loss/train': 6.727235794067383} -08/30/2021 13:17:08 - INFO - __main__ - Step 258: {'lr': 6.425e-05, 'samples': 49536, 'steps': 257, 'loss/train': 6.790642261505127} -08/30/2021 13:17:08 - INFO - __main__ - Step 259: {'lr': 6.450000000000001e-05, 'samples': 49728, 'steps': 258, 'loss/train': 6.2721405029296875} -08/30/2021 13:17:09 - INFO - __main__ - Step 260: {'lr': 6.475e-05, 'samples': 49920, 'steps': 259, 'loss/train': 6.076294898986816} -08/30/2021 13:17:09 - INFO - __main__ - Step 261: {'lr': 6.500000000000001e-05, 'samples': 50112, 'steps': 260, 'loss/train': 6.275369167327881} -08/30/2021 13:17:09 - INFO - __main__ - Step 262: {'lr': 6.525e-05, 'samples': 50304, 'steps': 261, 'loss/train': 6.536117076873779} -08/30/2021 13:17:11 - INFO - __main__ - Step 263: {'lr': 6.55e-05, 'samples': 50496, 'steps': 262, 'loss/train': 6.122943878173828} -08/30/2021 13:17:12 - INFO - __main__ - Step 264: {'lr': 6.575e-05, 'samples': 50688, 'steps': 263, 'loss/train': 6.044567584991455} -08/30/2021 13:17:12 - INFO - __main__ - Step 265: {'lr': 6.6e-05, 'samples': 50880, 'steps': 264, 'loss/train': 6.834893703460693} -08/30/2021 13:17:13 - INFO - __main__ - Step 266: {'lr': 6.625000000000001e-05, 'samples': 51072, 'steps': 265, 'loss/train': 6.797702312469482} -08/30/2021 13:17:13 - INFO - __main__ - Step 267: {'lr': 6.65e-05, 'samples': 51264, 'steps': 266, 'loss/train': 6.716531276702881} -08/30/2021 13:17:15 - INFO - __main__ - Step 268: {'lr': 6.675000000000001e-05, 'samples': 51456, 'steps': 267, 'loss/train': 6.557199954986572} -08/30/2021 13:17:15 - INFO - __main__ - Step 269: {'lr': 6.7e-05, 'samples': 51648, 'steps': 268, 'loss/train': 6.293004512786865} -08/30/2021 13:17:16 - INFO - __main__ - Step 270: {'lr': 6.725000000000001e-05, 'samples': 51840, 'steps': 269, 'loss/train': 6.490097999572754} -08/30/2021 13:17:16 - INFO - __main__ - Step 271: {'lr': 6.75e-05, 'samples': 52032, 'steps': 270, 'loss/train': 5.555928707122803} -08/30/2021 13:17:16 - INFO - __main__ - Step 272: {'lr': 6.775000000000001e-05, 'samples': 52224, 'steps': 271, 'loss/train': 6.2016282081604} -08/30/2021 13:17:17 - INFO - __main__ - Step 273: {'lr': 6.800000000000001e-05, 'samples': 52416, 'steps': 272, 'loss/train': 6.706387042999268} -08/30/2021 13:17:17 - INFO - __main__ - Step 274: {'lr': 6.825e-05, 'samples': 52608, 'steps': 273, 'loss/train': 6.345366477966309} -08/30/2021 13:17:18 - INFO - __main__ - Step 275: {'lr': 6.850000000000001e-05, 'samples': 52800, 'steps': 274, 'loss/train': 6.390197277069092} -08/30/2021 13:17:19 - INFO - __main__ - Step 276: {'lr': 6.875e-05, 'samples': 52992, 'steps': 275, 'loss/train': 6.968113422393799} -08/30/2021 13:17:19 - INFO - __main__ - Step 277: {'lr': 6.900000000000001e-05, 'samples': 53184, 'steps': 276, 'loss/train': 6.015243053436279} -08/30/2021 13:17:20 - INFO - __main__ - Step 278: {'lr': 6.925e-05, 'samples': 53376, 'steps': 277, 'loss/train': 6.234228610992432} -08/30/2021 13:17:20 - INFO - __main__ - Step 279: {'lr': 6.950000000000001e-05, 'samples': 53568, 'steps': 278, 'loss/train': 6.04856538772583} -08/30/2021 13:17:21 - INFO - __main__ - Step 280: {'lr': 6.975e-05, 'samples': 53760, 'steps': 279, 'loss/train': 6.198585510253906} -08/30/2021 13:17:22 - INFO - __main__ - Step 281: {'lr': 7.000000000000001e-05, 'samples': 53952, 'steps': 280, 'loss/train': 6.070130348205566} -08/30/2021 13:17:22 - INFO - __main__ - Step 282: {'lr': 7.025000000000001e-05, 'samples': 54144, 'steps': 281, 'loss/train': 6.166639804840088} -08/30/2021 13:17:23 - INFO - __main__ - Step 283: {'lr': 7.049999999999999e-05, 'samples': 54336, 'steps': 282, 'loss/train': 6.3716888427734375} -08/30/2021 13:17:23 - INFO - __main__ - Step 284: {'lr': 7.075e-05, 'samples': 54528, 'steps': 283, 'loss/train': 6.35542106628418} -08/30/2021 13:17:25 - INFO - __main__ - Step 285: {'lr': 7.099999999999999e-05, 'samples': 54720, 'steps': 284, 'loss/train': 6.591944694519043} -08/30/2021 13:17:25 - INFO - __main__ - Step 286: {'lr': 7.125e-05, 'samples': 54912, 'steps': 285, 'loss/train': 6.389350891113281} -08/30/2021 13:17:25 - INFO - __main__ - Step 287: {'lr': 7.149999999999999e-05, 'samples': 55104, 'steps': 286, 'loss/train': 5.966076374053955} -08/30/2021 13:17:26 - INFO - __main__ - Step 288: {'lr': 7.175e-05, 'samples': 55296, 'steps': 287, 'loss/train': 6.342068672180176} -08/30/2021 13:17:26 - INFO - __main__ - Step 289: {'lr': 7.2e-05, 'samples': 55488, 'steps': 288, 'loss/train': 6.697934627532959} -08/30/2021 13:17:27 - INFO - __main__ - Step 290: {'lr': 7.225e-05, 'samples': 55680, 'steps': 289, 'loss/train': 6.229708194732666} -08/30/2021 13:17:28 - INFO - __main__ - Step 291: {'lr': 7.25e-05, 'samples': 55872, 'steps': 290, 'loss/train': 6.215189456939697} -08/30/2021 13:17:28 - INFO - __main__ - Step 292: {'lr': 7.274999999999999e-05, 'samples': 56064, 'steps': 291, 'loss/train': 6.311378479003906} -08/30/2021 13:17:29 - INFO - __main__ - Step 293: {'lr': 7.3e-05, 'samples': 56256, 'steps': 292, 'loss/train': 6.328258037567139} -08/30/2021 13:17:29 - INFO - __main__ - Step 294: {'lr': 7.324999999999999e-05, 'samples': 56448, 'steps': 293, 'loss/train': 5.831396102905273} -08/30/2021 13:17:30 - INFO - __main__ - Step 295: {'lr': 7.35e-05, 'samples': 56640, 'steps': 294, 'loss/train': 6.255168437957764} -08/30/2021 13:17:31 - INFO - __main__ - Step 296: {'lr': 7.375e-05, 'samples': 56832, 'steps': 295, 'loss/train': 5.845766067504883} -08/30/2021 13:17:31 - INFO - __main__ - Step 297: {'lr': 7.4e-05, 'samples': 57024, 'steps': 296, 'loss/train': 6.156411170959473} -08/30/2021 13:17:32 - INFO - __main__ - Step 298: {'lr': 7.425e-05, 'samples': 57216, 'steps': 297, 'loss/train': 6.51584005355835} -08/30/2021 13:17:32 - INFO - __main__ - Step 299: {'lr': 7.45e-05, 'samples': 57408, 'steps': 298, 'loss/train': 6.158653736114502} -08/30/2021 13:17:32 - INFO - __main__ - Step 300: {'lr': 7.475e-05, 'samples': 57600, 'steps': 299, 'loss/train': 6.394083023071289} -08/30/2021 13:17:34 - INFO - __main__ - Step 301: {'lr': 7.5e-05, 'samples': 57792, 'steps': 300, 'loss/train': 6.393588542938232} -08/30/2021 13:17:34 - INFO - __main__ - Step 302: {'lr': 7.525e-05, 'samples': 57984, 'steps': 301, 'loss/train': 6.1207661628723145} -08/30/2021 13:17:35 - INFO - __main__ - Step 303: {'lr': 7.55e-05, 'samples': 58176, 'steps': 302, 'loss/train': 5.8542985916137695} -08/30/2021 13:17:35 - INFO - __main__ - Step 304: {'lr': 7.575e-05, 'samples': 58368, 'steps': 303, 'loss/train': 6.160946846008301} -08/30/2021 13:17:35 - INFO - __main__ - Step 305: {'lr': 7.6e-05, 'samples': 58560, 'steps': 304, 'loss/train': 5.6898274421691895} -08/30/2021 13:17:37 - INFO - __main__ - Step 306: {'lr': 7.625e-05, 'samples': 58752, 'steps': 305, 'loss/train': 8.189115524291992} -08/30/2021 13:17:37 - INFO - __main__ - Step 307: {'lr': 7.65e-05, 'samples': 58944, 'steps': 306, 'loss/train': 6.525139331817627} -08/30/2021 13:17:38 - INFO - __main__ - Step 308: {'lr': 7.675e-05, 'samples': 59136, 'steps': 307, 'loss/train': 5.728509426116943} -08/30/2021 13:17:38 - INFO - __main__ - Step 309: {'lr': 7.7e-05, 'samples': 59328, 'steps': 308, 'loss/train': 6.039815425872803} -08/30/2021 13:17:38 - INFO - __main__ - Step 310: {'lr': 7.725000000000001e-05, 'samples': 59520, 'steps': 309, 'loss/train': 6.44235372543335} -08/30/2021 13:17:39 - INFO - __main__ - Step 311: {'lr': 7.75e-05, 'samples': 59712, 'steps': 310, 'loss/train': 6.429628849029541} -08/30/2021 13:17:40 - INFO - __main__ - Step 312: {'lr': 7.775e-05, 'samples': 59904, 'steps': 311, 'loss/train': 5.878021717071533} -08/30/2021 13:17:41 - INFO - __main__ - Step 313: {'lr': 7.8e-05, 'samples': 60096, 'steps': 312, 'loss/train': 6.173260688781738} -08/30/2021 13:17:41 - INFO - __main__ - Step 314: {'lr': 7.825e-05, 'samples': 60288, 'steps': 313, 'loss/train': 6.34955358505249} -08/30/2021 13:17:41 - INFO - __main__ - Step 315: {'lr': 7.85e-05, 'samples': 60480, 'steps': 314, 'loss/train': 5.728211402893066} -08/30/2021 13:17:42 - INFO - __main__ - Step 316: {'lr': 7.875e-05, 'samples': 60672, 'steps': 315, 'loss/train': 6.1544294357299805} -08/30/2021 13:17:44 - INFO - __main__ - Step 317: {'lr': 7.9e-05, 'samples': 60864, 'steps': 316, 'loss/train': 6.2256975173950195} -08/30/2021 13:17:45 - INFO - __main__ - Step 318: {'lr': 7.925e-05, 'samples': 61056, 'steps': 317, 'loss/train': 6.413060665130615} -08/30/2021 13:17:45 - INFO - __main__ - Step 319: {'lr': 7.950000000000001e-05, 'samples': 61248, 'steps': 318, 'loss/train': 5.53223180770874} -08/30/2021 13:17:45 - INFO - __main__ - Step 320: {'lr': 7.975e-05, 'samples': 61440, 'steps': 319, 'loss/train': 6.0107951164245605} -08/30/2021 13:17:46 - INFO - __main__ - Step 321: {'lr': 8e-05, 'samples': 61632, 'steps': 320, 'loss/train': 6.844748497009277} -08/30/2021 13:17:48 - INFO - __main__ - Step 322: {'lr': 8.025e-05, 'samples': 61824, 'steps': 321, 'loss/train': 5.647246360778809} -08/30/2021 13:17:48 - INFO - __main__ - Step 323: {'lr': 8.05e-05, 'samples': 62016, 'steps': 322, 'loss/train': 6.0663909912109375} -08/30/2021 13:17:48 - INFO - __main__ - Step 324: {'lr': 8.075e-05, 'samples': 62208, 'steps': 323, 'loss/train': 6.454882621765137} -08/30/2021 13:17:49 - INFO - __main__ - Step 325: {'lr': 8.1e-05, 'samples': 62400, 'steps': 324, 'loss/train': 6.121888160705566} -08/30/2021 13:17:49 - INFO - __main__ - Step 326: {'lr': 8.125000000000001e-05, 'samples': 62592, 'steps': 325, 'loss/train': 6.522874355316162} -08/30/2021 13:17:51 - INFO - __main__ - Step 327: {'lr': 8.15e-05, 'samples': 62784, 'steps': 326, 'loss/train': 6.217108249664307} -08/30/2021 13:17:51 - INFO - __main__ - Step 328: {'lr': 8.175000000000001e-05, 'samples': 62976, 'steps': 327, 'loss/train': 6.257899761199951} -08/30/2021 13:17:52 - INFO - __main__ - Step 329: {'lr': 8.2e-05, 'samples': 63168, 'steps': 328, 'loss/train': 6.448293209075928} -08/30/2021 13:17:52 - INFO - __main__ - Step 330: {'lr': 8.225000000000001e-05, 'samples': 63360, 'steps': 329, 'loss/train': 6.304119110107422} -08/30/2021 13:17:52 - INFO - __main__ - Step 331: {'lr': 8.25e-05, 'samples': 63552, 'steps': 330, 'loss/train': 6.791227340698242} -08/30/2021 13:17:53 - INFO - __main__ - Step 332: {'lr': 8.275e-05, 'samples': 63744, 'steps': 331, 'loss/train': 4.826516628265381} -08/30/2021 13:17:53 - INFO - __main__ - Step 333: {'lr': 8.300000000000001e-05, 'samples': 63936, 'steps': 332, 'loss/train': 6.303062915802002} -08/30/2021 13:17:55 - INFO - __main__ - Step 334: {'lr': 8.325e-05, 'samples': 64128, 'steps': 333, 'loss/train': 5.697182655334473} -08/30/2021 13:17:55 - INFO - __main__ - Step 335: {'lr': 8.350000000000001e-05, 'samples': 64320, 'steps': 334, 'loss/train': 5.643592357635498} -08/30/2021 13:17:55 - INFO - __main__ - Step 336: {'lr': 8.375e-05, 'samples': 64512, 'steps': 335, 'loss/train': 6.222052097320557} -08/30/2021 13:17:56 - INFO - __main__ - Step 337: {'lr': 8.400000000000001e-05, 'samples': 64704, 'steps': 336, 'loss/train': 5.895704746246338} -08/30/2021 13:17:56 - INFO - __main__ - Step 338: {'lr': 8.425e-05, 'samples': 64896, 'steps': 337, 'loss/train': 5.852711200714111} -08/30/2021 13:17:58 - INFO - __main__ - Step 339: {'lr': 8.450000000000001e-05, 'samples': 65088, 'steps': 338, 'loss/train': 6.112983226776123} -08/30/2021 13:17:58 - INFO - __main__ - Step 340: {'lr': 8.475000000000001e-05, 'samples': 65280, 'steps': 339, 'loss/train': 6.1996235847473145} -08/30/2021 13:17:58 - INFO - __main__ - Step 341: {'lr': 8.5e-05, 'samples': 65472, 'steps': 340, 'loss/train': 6.592947006225586} -08/30/2021 13:17:59 - INFO - __main__ - Step 342: {'lr': 8.525000000000001e-05, 'samples': 65664, 'steps': 341, 'loss/train': 5.923532962799072} -08/30/2021 13:17:59 - INFO - __main__ - Step 343: {'lr': 8.55e-05, 'samples': 65856, 'steps': 342, 'loss/train': 5.868164539337158} -08/30/2021 13:18:01 - INFO - __main__ - Step 344: {'lr': 8.575000000000001e-05, 'samples': 66048, 'steps': 343, 'loss/train': 6.542609214782715} -08/30/2021 13:18:01 - INFO - __main__ - Step 345: {'lr': 8.599999999999999e-05, 'samples': 66240, 'steps': 344, 'loss/train': 5.413185119628906} -08/30/2021 13:18:02 - INFO - __main__ - Step 346: {'lr': 8.625e-05, 'samples': 66432, 'steps': 345, 'loss/train': 5.551840305328369} -08/30/2021 13:18:02 - INFO - __main__ - Step 347: {'lr': 8.65e-05, 'samples': 66624, 'steps': 346, 'loss/train': 5.807283878326416} -08/30/2021 13:18:02 - INFO - __main__ - Step 348: {'lr': 8.675e-05, 'samples': 66816, 'steps': 347, 'loss/train': 6.04257869720459} -08/30/2021 13:18:04 - INFO - __main__ - Step 349: {'lr': 8.7e-05, 'samples': 67008, 'steps': 348, 'loss/train': 6.191489219665527} -08/30/2021 13:18:04 - INFO - __main__ - Step 350: {'lr': 8.724999999999999e-05, 'samples': 67200, 'steps': 349, 'loss/train': 6.023970603942871} -08/30/2021 13:18:05 - INFO - __main__ - Step 351: {'lr': 8.75e-05, 'samples': 67392, 'steps': 350, 'loss/train': 6.3830976486206055} -08/30/2021 13:18:05 - INFO - __main__ - Step 352: {'lr': 8.774999999999999e-05, 'samples': 67584, 'steps': 351, 'loss/train': 5.905723571777344} -08/30/2021 13:18:05 - INFO - __main__ - Step 353: {'lr': 8.8e-05, 'samples': 67776, 'steps': 352, 'loss/train': 6.28004264831543} -08/30/2021 13:18:07 - INFO - __main__ - Step 354: {'lr': 8.824999999999999e-05, 'samples': 67968, 'steps': 353, 'loss/train': 5.97433614730835} -08/30/2021 13:18:08 - INFO - __main__ - Step 355: {'lr': 8.85e-05, 'samples': 68160, 'steps': 354, 'loss/train': 6.19740104675293} -08/30/2021 13:18:08 - INFO - __main__ - Step 356: {'lr': 8.875e-05, 'samples': 68352, 'steps': 355, 'loss/train': 6.187588691711426} -08/30/2021 13:18:08 - INFO - __main__ - Step 357: {'lr': 8.9e-05, 'samples': 68544, 'steps': 356, 'loss/train': 5.520158767700195} -08/30/2021 13:18:09 - INFO - __main__ - Step 358: {'lr': 8.925e-05, 'samples': 68736, 'steps': 357, 'loss/train': 5.60365104675293} -08/30/2021 13:18:10 - INFO - __main__ - Step 359: {'lr': 8.95e-05, 'samples': 68928, 'steps': 358, 'loss/train': 5.0504889488220215} -08/30/2021 13:18:11 - INFO - __main__ - Step 360: {'lr': 8.975e-05, 'samples': 69120, 'steps': 359, 'loss/train': 6.02947998046875} -08/30/2021 13:18:11 - INFO - __main__ - Step 361: {'lr': 8.999999999999999e-05, 'samples': 69312, 'steps': 360, 'loss/train': 5.876142501831055} -08/30/2021 13:18:11 - INFO - __main__ - Step 362: {'lr': 9.025e-05, 'samples': 69504, 'steps': 361, 'loss/train': 6.375011444091797} -08/30/2021 13:18:12 - INFO - __main__ - Step 363: {'lr': 9.05e-05, 'samples': 69696, 'steps': 362, 'loss/train': 6.455024242401123} -08/30/2021 13:18:13 - INFO - __main__ - Step 364: {'lr': 9.075e-05, 'samples': 69888, 'steps': 363, 'loss/train': 4.663980484008789} -08/30/2021 13:18:14 - INFO - __main__ - Step 365: {'lr': 9.1e-05, 'samples': 70080, 'steps': 364, 'loss/train': 6.091887950897217} -08/30/2021 13:18:14 - INFO - __main__ - Step 366: {'lr': 9.125e-05, 'samples': 70272, 'steps': 365, 'loss/train': 6.282298564910889} -08/30/2021 13:18:14 - INFO - __main__ - Step 367: {'lr': 9.15e-05, 'samples': 70464, 'steps': 366, 'loss/train': 6.375043869018555} -08/30/2021 13:18:15 - INFO - __main__ - Step 368: {'lr': 9.175e-05, 'samples': 70656, 'steps': 367, 'loss/train': 5.624589920043945} -08/30/2021 13:18:15 - INFO - __main__ - Step 369: {'lr': 9.2e-05, 'samples': 70848, 'steps': 368, 'loss/train': 7.198649883270264} -08/30/2021 13:18:18 - INFO - __main__ - Step 370: {'lr': 9.225e-05, 'samples': 71040, 'steps': 369, 'loss/train': 5.610406398773193} -08/30/2021 13:18:18 - INFO - __main__ - Step 371: {'lr': 9.25e-05, 'samples': 71232, 'steps': 370, 'loss/train': 6.06537389755249} -08/30/2021 13:18:18 - INFO - __main__ - Step 372: {'lr': 9.275e-05, 'samples': 71424, 'steps': 371, 'loss/train': 4.313782215118408} -08/30/2021 13:18:19 - INFO - __main__ - Step 373: {'lr': 9.3e-05, 'samples': 71616, 'steps': 372, 'loss/train': 6.235553741455078} -08/30/2021 13:18:19 - INFO - __main__ - Step 374: {'lr': 9.325e-05, 'samples': 71808, 'steps': 373, 'loss/train': 5.99864387512207} -08/30/2021 13:18:19 - INFO - __main__ - Step 375: {'lr': 9.35e-05, 'samples': 72000, 'steps': 374, 'loss/train': 5.66547155380249} -08/30/2021 13:18:21 - INFO - __main__ - Step 376: {'lr': 9.375e-05, 'samples': 72192, 'steps': 375, 'loss/train': 5.540463447570801} -08/30/2021 13:18:21 - INFO - __main__ - Step 377: {'lr': 9.400000000000001e-05, 'samples': 72384, 'steps': 376, 'loss/train': 4.755856990814209} -08/30/2021 13:18:22 - INFO - __main__ - Step 378: {'lr': 9.425e-05, 'samples': 72576, 'steps': 377, 'loss/train': 5.674274444580078} -08/30/2021 13:18:22 - INFO - __main__ - Step 379: {'lr': 9.45e-05, 'samples': 72768, 'steps': 378, 'loss/train': 6.150738716125488} -08/30/2021 13:18:23 - INFO - __main__ - Step 380: {'lr': 9.475e-05, 'samples': 72960, 'steps': 379, 'loss/train': 6.264613628387451} -08/30/2021 13:18:24 - INFO - __main__ - Step 381: {'lr': 9.5e-05, 'samples': 73152, 'steps': 380, 'loss/train': 6.115423202514648} -08/30/2021 13:18:25 - INFO - __main__ - Step 382: {'lr': 9.525e-05, 'samples': 73344, 'steps': 381, 'loss/train': 5.927343845367432} -08/30/2021 13:18:25 - INFO - __main__ - Step 383: {'lr': 9.55e-05, 'samples': 73536, 'steps': 382, 'loss/train': 5.794401168823242} -08/30/2021 13:18:25 - INFO - __main__ - Step 384: {'lr': 9.575000000000001e-05, 'samples': 73728, 'steps': 383, 'loss/train': 3.3423562049865723} -08/30/2021 13:18:26 - INFO - __main__ - Step 385: {'lr': 9.6e-05, 'samples': 73920, 'steps': 384, 'loss/train': 5.551865100860596} -08/30/2021 13:18:28 - INFO - __main__ - Step 386: {'lr': 9.625000000000001e-05, 'samples': 74112, 'steps': 385, 'loss/train': 5.7878241539001465} -08/30/2021 13:18:28 - INFO - __main__ - Step 387: {'lr': 9.65e-05, 'samples': 74304, 'steps': 386, 'loss/train': 5.973217487335205} -08/30/2021 13:18:28 - INFO - __main__ - Step 388: {'lr': 9.675000000000001e-05, 'samples': 74496, 'steps': 387, 'loss/train': 5.955297470092773} -08/30/2021 13:18:29 - INFO - __main__ - Step 389: {'lr': 9.7e-05, 'samples': 74688, 'steps': 388, 'loss/train': 5.313389778137207} -08/30/2021 13:18:29 - INFO - __main__ - Step 390: {'lr': 9.725e-05, 'samples': 74880, 'steps': 389, 'loss/train': 5.470920562744141} -08/30/2021 13:18:30 - INFO - __main__ - Step 391: {'lr': 9.750000000000001e-05, 'samples': 75072, 'steps': 390, 'loss/train': 5.316433906555176} -08/30/2021 13:18:30 - INFO - __main__ - Step 392: {'lr': 9.775e-05, 'samples': 75264, 'steps': 391, 'loss/train': 8.51474380493164} -08/30/2021 13:18:31 - INFO - __main__ - Step 393: {'lr': 9.800000000000001e-05, 'samples': 75456, 'steps': 392, 'loss/train': 5.866165637969971} -08/30/2021 13:18:32 - INFO - __main__ - Step 394: {'lr': 9.825e-05, 'samples': 75648, 'steps': 393, 'loss/train': 5.825680732727051} -08/30/2021 13:18:32 - INFO - __main__ - Step 395: {'lr': 9.850000000000001e-05, 'samples': 75840, 'steps': 394, 'loss/train': 5.5515899658203125} -08/30/2021 13:18:33 - INFO - __main__ - Step 396: {'lr': 9.875e-05, 'samples': 76032, 'steps': 395, 'loss/train': 5.187445163726807} -08/30/2021 13:18:33 - INFO - __main__ - Step 397: {'lr': 9.900000000000001e-05, 'samples': 76224, 'steps': 396, 'loss/train': 5.892002582550049} -08/30/2021 13:18:35 - INFO - __main__ - Step 398: {'lr': 9.925000000000001e-05, 'samples': 76416, 'steps': 397, 'loss/train': 6.205374717712402} -08/30/2021 13:18:35 - INFO - __main__ - Step 399: {'lr': 9.95e-05, 'samples': 76608, 'steps': 398, 'loss/train': 5.7176055908203125} -08/30/2021 13:18:35 - INFO - __main__ - Step 400: {'lr': 9.975000000000001e-05, 'samples': 76800, 'steps': 399, 'loss/train': 5.981853485107422} -08/30/2021 13:18:36 - INFO - __main__ - Step 401: {'lr': 0.0001, 'samples': 76992, 'steps': 400, 'loss/train': 5.49164342880249} -08/30/2021 13:18:36 - INFO - __main__ - Step 402: {'lr': 0.00010025000000000001, 'samples': 77184, 'steps': 401, 'loss/train': 4.759962558746338} -08/30/2021 13:18:38 - INFO - __main__ - Step 403: {'lr': 0.0001005, 'samples': 77376, 'steps': 402, 'loss/train': 6.679123878479004} -08/30/2021 13:18:39 - INFO - __main__ - Step 404: {'lr': 0.00010075000000000001, 'samples': 77568, 'steps': 403, 'loss/train': 5.9271674156188965} -08/30/2021 13:18:39 - INFO - __main__ - Step 405: {'lr': 0.000101, 'samples': 77760, 'steps': 404, 'loss/train': 5.913862705230713} -08/30/2021 13:18:40 - INFO - __main__ - Step 406: {'lr': 0.00010125000000000001, 'samples': 77952, 'steps': 405, 'loss/train': 4.9790849685668945} -08/30/2021 13:18:40 - INFO - __main__ - Step 407: {'lr': 0.00010150000000000001, 'samples': 78144, 'steps': 406, 'loss/train': 5.997152328491211} -08/30/2021 13:18:40 - INFO - __main__ - Step 408: {'lr': 0.00010174999999999999, 'samples': 78336, 'steps': 407, 'loss/train': 5.821843147277832} -08/30/2021 13:18:41 - INFO - __main__ - Step 409: {'lr': 0.000102, 'samples': 78528, 'steps': 408, 'loss/train': 6.093254089355469} -08/30/2021 13:18:42 - INFO - __main__ - Step 410: {'lr': 0.00010224999999999999, 'samples': 78720, 'steps': 409, 'loss/train': 7.17864465713501} -08/30/2021 13:18:43 - INFO - __main__ - Step 411: {'lr': 0.0001025, 'samples': 78912, 'steps': 410, 'loss/train': 5.948477745056152} -08/30/2021 13:18:43 - INFO - __main__ - Step 412: {'lr': 0.00010274999999999999, 'samples': 79104, 'steps': 411, 'loss/train': 5.505001544952393} -08/30/2021 13:18:43 - INFO - __main__ - Step 413: {'lr': 0.000103, 'samples': 79296, 'steps': 412, 'loss/train': 5.888233184814453} -08/30/2021 13:18:44 - INFO - __main__ - Step 414: {'lr': 0.00010325, 'samples': 79488, 'steps': 413, 'loss/train': 5.7912116050720215} -08/30/2021 13:18:45 - INFO - __main__ - Step 415: {'lr': 0.0001035, 'samples': 79680, 'steps': 414, 'loss/train': 5.851842403411865} -08/30/2021 13:18:46 - INFO - __main__ - Step 416: {'lr': 0.00010375, 'samples': 79872, 'steps': 415, 'loss/train': 5.67678689956665} -08/30/2021 13:18:46 - INFO - __main__ - Step 417: {'lr': 0.000104, 'samples': 80064, 'steps': 416, 'loss/train': 6.132983684539795} -08/30/2021 13:18:46 - INFO - __main__ - Step 418: {'lr': 0.00010425, 'samples': 80256, 'steps': 417, 'loss/train': 5.8515496253967285} -08/30/2021 13:18:47 - INFO - __main__ - Step 419: {'lr': 0.00010449999999999999, 'samples': 80448, 'steps': 418, 'loss/train': 6.48202657699585} -08/30/2021 13:18:48 - INFO - __main__ - Step 420: {'lr': 0.00010475, 'samples': 80640, 'steps': 419, 'loss/train': 6.2916741371154785} -08/30/2021 13:18:48 - INFO - __main__ - Step 421: {'lr': 0.000105, 'samples': 80832, 'steps': 420, 'loss/train': 5.926718711853027} -08/30/2021 13:18:49 - INFO - __main__ - Step 422: {'lr': 0.00010525, 'samples': 81024, 'steps': 421, 'loss/train': 5.585618019104004} -08/30/2021 13:18:49 - INFO - __main__ - Step 423: {'lr': 0.0001055, 'samples': 81216, 'steps': 422, 'loss/train': 5.546139717102051} -08/30/2021 13:18:49 - INFO - __main__ - Step 424: {'lr': 0.00010575, 'samples': 81408, 'steps': 423, 'loss/train': 6.199115753173828} -08/30/2021 13:18:51 - INFO - __main__ - Step 425: {'lr': 0.000106, 'samples': 81600, 'steps': 424, 'loss/train': 5.3427348136901855} -08/30/2021 13:18:51 - INFO - __main__ - Step 426: {'lr': 0.00010625, 'samples': 81792, 'steps': 425, 'loss/train': 5.438610553741455} -08/30/2021 13:18:52 - INFO - __main__ - Step 427: {'lr': 0.0001065, 'samples': 81984, 'steps': 426, 'loss/train': 6.038686275482178} -08/30/2021 13:18:52 - INFO - __main__ - Step 428: {'lr': 0.00010675, 'samples': 82176, 'steps': 427, 'loss/train': 5.396204471588135} -08/30/2021 13:18:52 - INFO - __main__ - Step 429: {'lr': 0.000107, 'samples': 82368, 'steps': 428, 'loss/train': 5.535378456115723} -08/30/2021 13:18:53 - INFO - __main__ - Step 430: {'lr': 0.00010725, 'samples': 82560, 'steps': 429, 'loss/train': 6.227622985839844} -08/30/2021 13:18:55 - INFO - __main__ - Step 431: {'lr': 0.0001075, 'samples': 82752, 'steps': 430, 'loss/train': 6.117164611816406} -08/30/2021 13:18:55 - INFO - __main__ - Step 432: {'lr': 0.00010775, 'samples': 82944, 'steps': 431, 'loss/train': 6.0254058837890625} -08/30/2021 13:18:56 - INFO - __main__ - Step 433: {'lr': 0.000108, 'samples': 83136, 'steps': 432, 'loss/train': 5.1386590003967285} -08/30/2021 13:18:56 - INFO - __main__ - Step 434: {'lr': 0.00010825, 'samples': 83328, 'steps': 433, 'loss/train': 4.882626056671143} -08/30/2021 13:18:56 - INFO - __main__ - Step 435: {'lr': 0.00010850000000000001, 'samples': 83520, 'steps': 434, 'loss/train': 5.809022903442383} -08/30/2021 13:18:58 - INFO - __main__ - Step 436: {'lr': 0.00010875, 'samples': 83712, 'steps': 435, 'loss/train': 5.087780952453613} -08/30/2021 13:18:59 - INFO - __main__ - Step 437: {'lr': 0.000109, 'samples': 83904, 'steps': 436, 'loss/train': 5.409515380859375} -08/30/2021 13:18:59 - INFO - __main__ - Step 438: {'lr': 0.00010925, 'samples': 84096, 'steps': 437, 'loss/train': 4.946671485900879} -08/30/2021 13:18:59 - INFO - __main__ - Step 439: {'lr': 0.0001095, 'samples': 84288, 'steps': 438, 'loss/train': 4.746728420257568} -08/30/2021 13:19:00 - INFO - __main__ - Step 440: {'lr': 0.00010975, 'samples': 84480, 'steps': 439, 'loss/train': 5.767526626586914} -08/30/2021 13:19:01 - INFO - __main__ - Step 441: {'lr': 0.00011, 'samples': 84672, 'steps': 440, 'loss/train': 6.015324115753174} -08/30/2021 13:19:01 - INFO - __main__ - Step 442: {'lr': 0.00011025, 'samples': 84864, 'steps': 441, 'loss/train': 5.7094011306762695} -08/30/2021 13:19:02 - INFO - __main__ - Step 443: {'lr': 0.0001105, 'samples': 85056, 'steps': 442, 'loss/train': 5.760134696960449} -08/30/2021 13:19:02 - INFO - __main__ - Step 444: {'lr': 0.00011075000000000001, 'samples': 85248, 'steps': 443, 'loss/train': 5.706537246704102} -08/30/2021 13:19:02 - INFO - __main__ - Step 445: {'lr': 0.000111, 'samples': 85440, 'steps': 444, 'loss/train': 4.999929428100586} -08/30/2021 13:19:04 - INFO - __main__ - Step 446: {'lr': 0.00011125000000000001, 'samples': 85632, 'steps': 445, 'loss/train': 4.658752918243408} -08/30/2021 13:19:05 - INFO - __main__ - Step 447: {'lr': 0.0001115, 'samples': 85824, 'steps': 446, 'loss/train': 5.415980815887451} -08/30/2021 13:19:05 - INFO - __main__ - Step 448: {'lr': 0.00011175, 'samples': 86016, 'steps': 447, 'loss/train': 5.274680137634277} -08/30/2021 13:19:05 - INFO - __main__ - Step 449: {'lr': 0.000112, 'samples': 86208, 'steps': 448, 'loss/train': 4.624673366546631} -08/30/2021 13:19:06 - INFO - __main__ - Step 450: {'lr': 0.00011225, 'samples': 86400, 'steps': 449, 'loss/train': 5.0226640701293945} -08/30/2021 13:19:07 - INFO - __main__ - Step 451: {'lr': 0.00011250000000000001, 'samples': 86592, 'steps': 450, 'loss/train': 5.516931533813477} -08/30/2021 13:19:07 - INFO - __main__ - Step 452: {'lr': 0.00011275, 'samples': 86784, 'steps': 451, 'loss/train': 5.60693359375} -08/30/2021 13:19:08 - INFO - __main__ - Step 453: {'lr': 0.00011300000000000001, 'samples': 86976, 'steps': 452, 'loss/train': 5.57399845123291} -08/30/2021 13:19:08 - INFO - __main__ - Step 454: {'lr': 0.00011325, 'samples': 87168, 'steps': 453, 'loss/train': 5.57354211807251} -08/30/2021 13:19:08 - INFO - __main__ - Step 455: {'lr': 0.00011350000000000001, 'samples': 87360, 'steps': 454, 'loss/train': 5.579854965209961} -08/30/2021 13:19:10 - INFO - __main__ - Step 456: {'lr': 0.00011375, 'samples': 87552, 'steps': 455, 'loss/train': 5.586076259613037} -08/30/2021 13:19:10 - INFO - __main__ - Step 457: {'lr': 0.000114, 'samples': 87744, 'steps': 456, 'loss/train': 5.7872233390808105} -08/30/2021 13:19:11 - INFO - __main__ - Step 458: {'lr': 0.00011425000000000001, 'samples': 87936, 'steps': 457, 'loss/train': 5.377703666687012} -08/30/2021 13:19:11 - INFO - __main__ - Step 459: {'lr': 0.0001145, 'samples': 88128, 'steps': 458, 'loss/train': 5.658486366271973} -08/30/2021 13:19:11 - INFO - __main__ - Step 460: {'lr': 0.00011475000000000001, 'samples': 88320, 'steps': 459, 'loss/train': 5.546477794647217} -08/30/2021 13:19:13 - INFO - __main__ - Step 461: {'lr': 0.000115, 'samples': 88512, 'steps': 460, 'loss/train': 6.00485897064209} -08/30/2021 13:19:13 - INFO - __main__ - Step 462: {'lr': 0.00011525000000000001, 'samples': 88704, 'steps': 461, 'loss/train': 5.189422130584717} -08/30/2021 13:19:14 - INFO - __main__ - Step 463: {'lr': 0.0001155, 'samples': 88896, 'steps': 462, 'loss/train': 5.5748162269592285} -08/30/2021 13:19:14 - INFO - __main__ - Step 464: {'lr': 0.00011575000000000001, 'samples': 89088, 'steps': 463, 'loss/train': 6.147246360778809} -08/30/2021 13:19:14 - INFO - __main__ - Step 465: {'lr': 0.00011600000000000001, 'samples': 89280, 'steps': 464, 'loss/train': 5.877396583557129} -08/30/2021 13:19:16 - INFO - __main__ - Step 466: {'lr': 0.00011625, 'samples': 89472, 'steps': 465, 'loss/train': 5.3202362060546875} -08/30/2021 13:19:16 - INFO - __main__ - Step 467: {'lr': 0.00011650000000000001, 'samples': 89664, 'steps': 466, 'loss/train': 5.167083263397217} -08/30/2021 13:19:17 - INFO - __main__ - Step 468: {'lr': 0.00011675, 'samples': 89856, 'steps': 467, 'loss/train': 6.410694122314453} -08/30/2021 13:19:17 - INFO - __main__ - Step 469: {'lr': 0.00011700000000000001, 'samples': 90048, 'steps': 468, 'loss/train': 6.226719856262207} -08/30/2021 13:19:17 - INFO - __main__ - Step 470: {'lr': 0.00011724999999999999, 'samples': 90240, 'steps': 469, 'loss/train': 5.951915264129639} -08/30/2021 13:19:19 - INFO - __main__ - Step 471: {'lr': 0.0001175, 'samples': 90432, 'steps': 470, 'loss/train': 5.894048690795898} -08/30/2021 13:19:20 - INFO - __main__ - Step 472: {'lr': 0.00011775, 'samples': 90624, 'steps': 471, 'loss/train': 5.099086761474609} -08/30/2021 13:19:20 - INFO - __main__ - Step 473: {'lr': 0.000118, 'samples': 90816, 'steps': 472, 'loss/train': 5.429386615753174} -08/30/2021 13:19:20 - INFO - __main__ - Step 474: {'lr': 0.00011825, 'samples': 91008, 'steps': 473, 'loss/train': 5.523043155670166} -08/30/2021 13:19:21 - INFO - __main__ - Step 475: {'lr': 0.0001185, 'samples': 91200, 'steps': 474, 'loss/train': 5.883626461029053} -08/30/2021 13:19:22 - INFO - __main__ - Step 476: {'lr': 0.00011875, 'samples': 91392, 'steps': 475, 'loss/train': 5.555183410644531} -08/30/2021 13:19:23 - INFO - __main__ - Step 477: {'lr': 0.00011899999999999999, 'samples': 91584, 'steps': 476, 'loss/train': 5.388443470001221} -08/30/2021 13:19:23 - INFO - __main__ - Step 478: {'lr': 0.00011925, 'samples': 91776, 'steps': 477, 'loss/train': 9.009052276611328} -08/30/2021 13:19:24 - INFO - __main__ - Step 479: {'lr': 0.00011949999999999999, 'samples': 91968, 'steps': 478, 'loss/train': 7.975252151489258} -08/30/2021 13:19:24 - INFO - __main__ - Step 480: {'lr': 0.00011975, 'samples': 92160, 'steps': 479, 'loss/train': 6.8069963455200195} -08/30/2021 13:19:24 - INFO - __main__ - Step 481: {'lr': 0.00012, 'samples': 92352, 'steps': 480, 'loss/train': 5.477241516113281} -08/30/2021 13:19:27 - INFO - __main__ - Step 482: {'lr': 0.00012025, 'samples': 92544, 'steps': 481, 'loss/train': 4.654419898986816} -08/30/2021 13:19:27 - INFO - __main__ - Step 483: {'lr': 0.0001205, 'samples': 92736, 'steps': 482, 'loss/train': 5.462592124938965} -08/30/2021 13:19:28 - INFO - __main__ - Step 484: {'lr': 0.00012075, 'samples': 92928, 'steps': 483, 'loss/train': 6.125245571136475} -08/30/2021 13:19:28 - INFO - __main__ - Step 485: {'lr': 0.000121, 'samples': 93120, 'steps': 484, 'loss/train': 5.8257293701171875} -08/30/2021 13:19:28 - INFO - __main__ - Step 486: {'lr': 0.00012124999999999999, 'samples': 93312, 'steps': 485, 'loss/train': 6.578179836273193} -08/30/2021 13:19:29 - INFO - __main__ - Step 487: {'lr': 0.0001215, 'samples': 93504, 'steps': 486, 'loss/train': 5.597835063934326} -08/30/2021 13:19:30 - INFO - __main__ - Step 488: {'lr': 0.00012175, 'samples': 93696, 'steps': 487, 'loss/train': 5.9039740562438965} -08/30/2021 13:19:31 - INFO - __main__ - Step 489: {'lr': 0.000122, 'samples': 93888, 'steps': 488, 'loss/train': 5.389415264129639} -08/30/2021 13:19:31 - INFO - __main__ - Step 490: {'lr': 0.00012225, 'samples': 94080, 'steps': 489, 'loss/train': 6.134588241577148} -08/30/2021 13:19:31 - INFO - __main__ - Step 491: {'lr': 0.0001225, 'samples': 94272, 'steps': 490, 'loss/train': 5.465774059295654} -08/30/2021 13:19:32 - INFO - __main__ - Step 492: {'lr': 0.00012275, 'samples': 94464, 'steps': 491, 'loss/train': 5.640119552612305} -08/30/2021 13:19:32 - INFO - __main__ - Step 493: {'lr': 0.000123, 'samples': 94656, 'steps': 492, 'loss/train': 4.687599182128906} -08/30/2021 13:19:33 - INFO - __main__ - Step 494: {'lr': 0.00012325000000000001, 'samples': 94848, 'steps': 493, 'loss/train': 5.525679588317871} -08/30/2021 13:19:34 - INFO - __main__ - Step 495: {'lr': 0.0001235, 'samples': 95040, 'steps': 494, 'loss/train': 5.946816921234131} -08/30/2021 13:19:34 - INFO - __main__ - Step 496: {'lr': 0.00012375, 'samples': 95232, 'steps': 495, 'loss/train': 5.446334362030029} -08/30/2021 13:19:35 - INFO - __main__ - Step 497: {'lr': 0.000124, 'samples': 95424, 'steps': 496, 'loss/train': 5.384819507598877} -08/30/2021 13:19:35 - INFO - __main__ - Step 498: {'lr': 0.00012425, 'samples': 95616, 'steps': 497, 'loss/train': 5.5549845695495605} -08/30/2021 13:19:36 - INFO - __main__ - Step 499: {'lr': 0.0001245, 'samples': 95808, 'steps': 498, 'loss/train': 5.564133644104004} -08/30/2021 13:19:37 - INFO - __main__ - Step 500: {'lr': 0.00012475, 'samples': 96000, 'steps': 499, 'loss/train': 5.740269184112549} -08/30/2021 13:19:37 - INFO - __main__ - Step 501: {'lr': 0.000125, 'samples': 96192, 'steps': 500, 'loss/train': 5.81393575668335} -08/30/2021 13:19:38 - INFO - __main__ - Step 502: {'lr': 0.00012525, 'samples': 96384, 'steps': 501, 'loss/train': 6.138937473297119} -08/30/2021 13:19:38 - INFO - __main__ - Step 503: {'lr': 0.00012550000000000001, 'samples': 96576, 'steps': 502, 'loss/train': 5.4254631996154785} -08/30/2021 13:19:39 - INFO - __main__ - Step 504: {'lr': 0.00012575, 'samples': 96768, 'steps': 503, 'loss/train': 6.424824237823486} -08/30/2021 13:19:40 - INFO - __main__ - Step 505: {'lr': 0.000126, 'samples': 96960, 'steps': 504, 'loss/train': 5.346781253814697} -08/30/2021 13:19:40 - INFO - __main__ - Step 506: {'lr': 0.00012625, 'samples': 97152, 'steps': 505, 'loss/train': 5.492609024047852} -08/30/2021 13:19:41 - INFO - __main__ - Step 507: {'lr': 0.0001265, 'samples': 97344, 'steps': 506, 'loss/train': 5.778714656829834} -08/30/2021 13:19:41 - INFO - __main__ - Step 508: {'lr': 0.00012675, 'samples': 97536, 'steps': 507, 'loss/train': 5.443634510040283} -08/30/2021 13:19:43 - INFO - __main__ - Step 509: {'lr': 0.000127, 'samples': 97728, 'steps': 508, 'loss/train': 3.9383697509765625} -08/30/2021 13:19:43 - INFO - __main__ - Step 510: {'lr': 0.00012725, 'samples': 97920, 'steps': 509, 'loss/train': 5.67879056930542} -08/30/2021 13:19:43 - INFO - __main__ - Step 511: {'lr': 0.0001275, 'samples': 98112, 'steps': 510, 'loss/train': 5.304076671600342} -08/30/2021 13:19:44 - INFO - __main__ - Step 512: {'lr': 0.00012775000000000002, 'samples': 98304, 'steps': 511, 'loss/train': 5.341429233551025} -08/30/2021 13:19:44 - INFO - __main__ - Step 513: {'lr': 0.000128, 'samples': 98496, 'steps': 512, 'loss/train': 5.897983074188232} -08/30/2021 13:19:44 - INFO - __main__ - Step 514: {'lr': 0.00012825, 'samples': 98688, 'steps': 513, 'loss/train': 5.628521919250488} -08/30/2021 13:19:46 - INFO - __main__ - Step 515: {'lr': 0.0001285, 'samples': 98880, 'steps': 514, 'loss/train': 5.3900322914123535} -08/30/2021 13:19:46 - INFO - __main__ - Step 516: {'lr': 0.00012875, 'samples': 99072, 'steps': 515, 'loss/train': 5.59366512298584} -08/30/2021 13:19:47 - INFO - __main__ - Step 517: {'lr': 0.00012900000000000002, 'samples': 99264, 'steps': 516, 'loss/train': 5.774766445159912} -08/30/2021 13:19:47 - INFO - __main__ - Step 518: {'lr': 0.00012925, 'samples': 99456, 'steps': 517, 'loss/train': 5.637266635894775} -08/30/2021 13:19:47 - INFO - __main__ - Step 519: {'lr': 0.0001295, 'samples': 99648, 'steps': 518, 'loss/train': 5.623018264770508} -08/30/2021 13:19:49 - INFO - __main__ - Step 520: {'lr': 0.00012975, 'samples': 99840, 'steps': 519, 'loss/train': 5.417008876800537} -08/30/2021 13:19:49 - INFO - __main__ - Step 521: {'lr': 0.00013000000000000002, 'samples': 100032, 'steps': 520, 'loss/train': 7.079473972320557} -08/30/2021 13:19:50 - INFO - __main__ - Step 522: {'lr': 0.00013025, 'samples': 100224, 'steps': 521, 'loss/train': 5.893174648284912} -08/30/2021 13:19:50 - INFO - __main__ - Step 523: {'lr': 0.0001305, 'samples': 100416, 'steps': 522, 'loss/train': 5.409637451171875} -08/30/2021 13:19:50 - INFO - __main__ - Step 524: {'lr': 0.00013075, 'samples': 100608, 'steps': 523, 'loss/train': 5.7304463386535645} -08/30/2021 13:19:52 - INFO - __main__ - Step 525: {'lr': 0.000131, 'samples': 100800, 'steps': 524, 'loss/train': 5.777679920196533} -08/30/2021 13:19:53 - INFO - __main__ - Step 526: {'lr': 0.00013125000000000002, 'samples': 100992, 'steps': 525, 'loss/train': 5.652060508728027} -08/30/2021 13:19:53 - INFO - __main__ - Step 527: {'lr': 0.0001315, 'samples': 101184, 'steps': 526, 'loss/train': 5.265826225280762} -08/30/2021 13:19:53 - INFO - __main__ - Step 528: {'lr': 0.00013175, 'samples': 101376, 'steps': 527, 'loss/train': 5.488304615020752} -08/30/2021 13:19:54 - INFO - __main__ - Step 529: {'lr': 0.000132, 'samples': 101568, 'steps': 528, 'loss/train': 5.802730560302734} -08/30/2021 13:19:55 - INFO - __main__ - Step 530: {'lr': 0.00013225000000000002, 'samples': 101760, 'steps': 529, 'loss/train': 4.198696136474609} -08/30/2021 13:19:56 - INFO - __main__ - Step 531: {'lr': 0.00013250000000000002, 'samples': 101952, 'steps': 530, 'loss/train': 5.73695707321167} -08/30/2021 13:19:56 - INFO - __main__ - Step 532: {'lr': 0.00013275, 'samples': 102144, 'steps': 531, 'loss/train': 6.057995319366455} -08/30/2021 13:19:56 - INFO - __main__ - Step 533: {'lr': 0.000133, 'samples': 102336, 'steps': 532, 'loss/train': 5.944148063659668} -08/30/2021 13:19:57 - INFO - __main__ - Step 534: {'lr': 0.00013325, 'samples': 102528, 'steps': 533, 'loss/train': 5.650229454040527} -08/30/2021 13:19:57 - INFO - __main__ - Step 535: {'lr': 0.00013350000000000002, 'samples': 102720, 'steps': 534, 'loss/train': 5.595287322998047} -08/30/2021 13:19:59 - INFO - __main__ - Step 536: {'lr': 0.00013375, 'samples': 102912, 'steps': 535, 'loss/train': 5.86622953414917} -08/30/2021 13:19:59 - INFO - __main__ - Step 537: {'lr': 0.000134, 'samples': 103104, 'steps': 536, 'loss/train': 5.728094100952148} -08/30/2021 13:20:00 - INFO - __main__ - Step 538: {'lr': 0.00013425, 'samples': 103296, 'steps': 537, 'loss/train': 5.270711421966553} -08/30/2021 13:20:00 - INFO - __main__ - Step 539: {'lr': 0.00013450000000000002, 'samples': 103488, 'steps': 538, 'loss/train': 5.468379497528076} -08/30/2021 13:20:00 - INFO - __main__ - Step 540: {'lr': 0.00013475000000000002, 'samples': 103680, 'steps': 539, 'loss/train': 5.228604316711426} -08/30/2021 13:20:02 - INFO - __main__ - Step 541: {'lr': 0.000135, 'samples': 103872, 'steps': 540, 'loss/train': 5.395594120025635} -08/30/2021 13:20:02 - INFO - __main__ - Step 542: {'lr': 0.00013525, 'samples': 104064, 'steps': 541, 'loss/train': 5.566400051116943} -08/30/2021 13:20:03 - INFO - __main__ - Step 543: {'lr': 0.00013550000000000001, 'samples': 104256, 'steps': 542, 'loss/train': 5.838968276977539} -08/30/2021 13:20:03 - INFO - __main__ - Step 544: {'lr': 0.00013575000000000002, 'samples': 104448, 'steps': 543, 'loss/train': 5.202871322631836} -08/30/2021 13:20:03 - INFO - __main__ - Step 545: {'lr': 0.00013600000000000003, 'samples': 104640, 'steps': 544, 'loss/train': 5.848567485809326} -08/30/2021 13:20:05 - INFO - __main__ - Step 546: {'lr': 0.00013625, 'samples': 104832, 'steps': 545, 'loss/train': 6.2512526512146} -08/30/2021 13:20:06 - INFO - __main__ - Step 547: {'lr': 0.0001365, 'samples': 105024, 'steps': 546, 'loss/train': 5.530820846557617} -08/30/2021 13:20:06 - INFO - __main__ - Step 548: {'lr': 0.00013675000000000002, 'samples': 105216, 'steps': 547, 'loss/train': 3.847254753112793} -08/30/2021 13:20:06 - INFO - __main__ - Step 549: {'lr': 0.00013700000000000002, 'samples': 105408, 'steps': 548, 'loss/train': 4.007019519805908} -08/30/2021 13:20:07 - INFO - __main__ - Step 550: {'lr': 0.00013725, 'samples': 105600, 'steps': 549, 'loss/train': 3.8318333625793457} -08/30/2021 13:20:07 - INFO - __main__ - Step 551: {'lr': 0.0001375, 'samples': 105792, 'steps': 550, 'loss/train': 5.498006820678711} -08/30/2021 13:20:09 - INFO - __main__ - Step 552: {'lr': 0.00013775000000000001, 'samples': 105984, 'steps': 551, 'loss/train': 4.983112812042236} -08/30/2021 13:20:09 - INFO - __main__ - Step 553: {'lr': 0.00013800000000000002, 'samples': 106176, 'steps': 552, 'loss/train': 5.6042704582214355} -08/30/2021 13:20:09 - INFO - __main__ - Step 554: {'lr': 0.00013825000000000003, 'samples': 106368, 'steps': 553, 'loss/train': 5.392212390899658} -08/30/2021 13:20:10 - INFO - __main__ - Step 555: {'lr': 0.0001385, 'samples': 106560, 'steps': 554, 'loss/train': 5.752504348754883} -08/30/2021 13:20:10 - INFO - __main__ - Step 556: {'lr': 0.00013875, 'samples': 106752, 'steps': 555, 'loss/train': 4.8399810791015625} -08/30/2021 13:20:12 - INFO - __main__ - Step 557: {'lr': 0.00013900000000000002, 'samples': 106944, 'steps': 556, 'loss/train': 5.256772041320801} -08/30/2021 13:20:12 - INFO - __main__ - Step 558: {'lr': 0.00013925000000000002, 'samples': 107136, 'steps': 557, 'loss/train': 5.493489742279053} -08/30/2021 13:20:12 - INFO - __main__ - Step 559: {'lr': 0.0001395, 'samples': 107328, 'steps': 558, 'loss/train': 5.2617669105529785} -08/30/2021 13:20:13 - INFO - __main__ - Step 560: {'lr': 0.00013975, 'samples': 107520, 'steps': 559, 'loss/train': 5.1201863288879395} -08/30/2021 13:20:13 - INFO - __main__ - Step 561: {'lr': 0.00014000000000000001, 'samples': 107712, 'steps': 560, 'loss/train': 5.30458927154541} -08/30/2021 13:20:15 - INFO - __main__ - Step 562: {'lr': 0.00014025000000000002, 'samples': 107904, 'steps': 561, 'loss/train': 5.496264457702637} -08/30/2021 13:20:15 - INFO - __main__ - Step 563: {'lr': 0.00014050000000000003, 'samples': 108096, 'steps': 562, 'loss/train': 5.537848949432373} -08/30/2021 13:20:15 - INFO - __main__ - Step 564: {'lr': 0.00014074999999999998, 'samples': 108288, 'steps': 563, 'loss/train': 5.250120162963867} -08/30/2021 13:20:16 - INFO - __main__ - Step 565: {'lr': 0.00014099999999999998, 'samples': 108480, 'steps': 564, 'loss/train': 5.629787445068359} -08/30/2021 13:20:16 - INFO - __main__ - Step 566: {'lr': 0.00014125, 'samples': 108672, 'steps': 565, 'loss/train': 5.242862224578857} -08/30/2021 13:20:18 - INFO - __main__ - Step 567: {'lr': 0.0001415, 'samples': 108864, 'steps': 566, 'loss/train': 5.9160332679748535} -08/30/2021 13:20:18 - INFO - __main__ - Step 568: {'lr': 0.00014175, 'samples': 109056, 'steps': 567, 'loss/train': 6.136992454528809} -08/30/2021 13:20:18 - INFO - __main__ - Step 569: {'lr': 0.00014199999999999998, 'samples': 109248, 'steps': 568, 'loss/train': 4.711137771606445} -08/30/2021 13:20:19 - INFO - __main__ - Step 570: {'lr': 0.00014225, 'samples': 109440, 'steps': 569, 'loss/train': 5.519400596618652} -08/30/2021 13:20:19 - INFO - __main__ - Step 571: {'lr': 0.0001425, 'samples': 109632, 'steps': 570, 'loss/train': 5.262238502502441} -08/30/2021 13:20:20 - INFO - __main__ - Step 572: {'lr': 0.00014275, 'samples': 109824, 'steps': 571, 'loss/train': 4.25198221206665} -08/30/2021 13:20:21 - INFO - __main__ - Step 573: {'lr': 0.00014299999999999998, 'samples': 110016, 'steps': 572, 'loss/train': 5.467993259429932} -08/30/2021 13:20:21 - INFO - __main__ - Step 574: {'lr': 0.00014324999999999999, 'samples': 110208, 'steps': 573, 'loss/train': 6.125296592712402} -08/30/2021 13:20:22 - INFO - __main__ - Step 575: {'lr': 0.0001435, 'samples': 110400, 'steps': 574, 'loss/train': 5.636240005493164} -08/30/2021 13:20:22 - INFO - __main__ - Step 576: {'lr': 0.00014375, 'samples': 110592, 'steps': 575, 'loss/train': 5.511364459991455} -08/30/2021 13:20:24 - INFO - __main__ - Step 577: {'lr': 0.000144, 'samples': 110784, 'steps': 576, 'loss/train': 5.202625751495361} -08/30/2021 13:20:24 - INFO - __main__ - Step 578: {'lr': 0.00014424999999999998, 'samples': 110976, 'steps': 577, 'loss/train': 5.799747943878174} -08/30/2021 13:20:24 - INFO - __main__ - Step 579: {'lr': 0.0001445, 'samples': 111168, 'steps': 578, 'loss/train': 5.501727104187012} -08/30/2021 13:20:25 - INFO - __main__ - Step 580: {'lr': 0.00014475, 'samples': 111360, 'steps': 579, 'loss/train': 6.1024370193481445} -08/30/2021 13:20:25 - INFO - __main__ - Step 581: {'lr': 0.000145, 'samples': 111552, 'steps': 580, 'loss/train': 5.24338436126709} -08/30/2021 13:20:25 - INFO - __main__ - Step 582: {'lr': 0.00014524999999999998, 'samples': 111744, 'steps': 581, 'loss/train': 5.631160259246826} -08/30/2021 13:20:27 - INFO - __main__ - Step 583: {'lr': 0.00014549999999999999, 'samples': 111936, 'steps': 582, 'loss/train': 5.755254745483398} -08/30/2021 13:20:27 - INFO - __main__ - Step 584: {'lr': 0.00014575, 'samples': 112128, 'steps': 583, 'loss/train': 5.443774223327637} -08/30/2021 13:20:28 - INFO - __main__ - Step 585: {'lr': 0.000146, 'samples': 112320, 'steps': 584, 'loss/train': 5.5379638671875} -08/30/2021 13:20:28 - INFO - __main__ - Step 586: {'lr': 0.00014625, 'samples': 112512, 'steps': 585, 'loss/train': 3.491403818130493} -08/30/2021 13:20:28 - INFO - __main__ - Step 587: {'lr': 0.00014649999999999998, 'samples': 112704, 'steps': 586, 'loss/train': 5.373976230621338} -08/30/2021 13:20:30 - INFO - __main__ - Step 588: {'lr': 0.00014675, 'samples': 112896, 'steps': 587, 'loss/train': 5.232706546783447} -08/30/2021 13:20:30 - INFO - __main__ - Step 589: {'lr': 0.000147, 'samples': 113088, 'steps': 588, 'loss/train': 5.442381858825684} -08/30/2021 13:20:31 - INFO - __main__ - Step 590: {'lr': 0.00014725, 'samples': 113280, 'steps': 589, 'loss/train': 5.538836479187012} -08/30/2021 13:20:31 - INFO - __main__ - Step 591: {'lr': 0.0001475, 'samples': 113472, 'steps': 590, 'loss/train': 5.548551082611084} -08/30/2021 13:20:31 - INFO - __main__ - Step 592: {'lr': 0.00014774999999999999, 'samples': 113664, 'steps': 591, 'loss/train': 4.918911933898926} -08/30/2021 13:20:33 - INFO - __main__ - Step 593: {'lr': 0.000148, 'samples': 113856, 'steps': 592, 'loss/train': 5.318609237670898} -08/30/2021 13:20:34 - INFO - __main__ - Step 594: {'lr': 0.00014825, 'samples': 114048, 'steps': 593, 'loss/train': 4.92004919052124} -08/30/2021 13:20:34 - INFO - __main__ - Step 595: {'lr': 0.0001485, 'samples': 114240, 'steps': 594, 'loss/train': 4.587899684906006} -08/30/2021 13:20:35 - INFO - __main__ - Step 596: {'lr': 0.00014874999999999998, 'samples': 114432, 'steps': 595, 'loss/train': 5.18981409072876} -08/30/2021 13:20:35 - INFO - __main__ - Step 597: {'lr': 0.000149, 'samples': 114624, 'steps': 596, 'loss/train': 5.675904273986816} -08/30/2021 13:20:36 - INFO - __main__ - Step 598: {'lr': 0.00014925, 'samples': 114816, 'steps': 597, 'loss/train': 4.244988441467285} -08/30/2021 13:20:37 - INFO - __main__ - Step 599: {'lr': 0.0001495, 'samples': 115008, 'steps': 598, 'loss/train': 5.155581474304199} -08/30/2021 13:20:37 - INFO - __main__ - Step 600: {'lr': 0.00014975, 'samples': 115200, 'steps': 599, 'loss/train': 5.592281818389893} -08/30/2021 13:20:38 - INFO - __main__ - Step 601: {'lr': 0.00015, 'samples': 115392, 'steps': 600, 'loss/train': 5.556156158447266} -08/30/2021 13:20:38 - INFO - __main__ - Step 602: {'lr': 0.00015025, 'samples': 115584, 'steps': 601, 'loss/train': 5.371763706207275} -08/30/2021 13:20:38 - INFO - __main__ - Step 603: {'lr': 0.0001505, 'samples': 115776, 'steps': 602, 'loss/train': 5.190732002258301} -08/30/2021 13:20:40 - INFO - __main__ - Step 604: {'lr': 0.00015075, 'samples': 115968, 'steps': 603, 'loss/train': 5.801718235015869} -08/30/2021 13:20:40 - INFO - __main__ - Step 605: {'lr': 0.000151, 'samples': 116160, 'steps': 604, 'loss/train': 4.600075721740723} -08/30/2021 13:20:41 - INFO - __main__ - Step 606: {'lr': 0.00015125, 'samples': 116352, 'steps': 605, 'loss/train': 5.391104698181152} -08/30/2021 13:20:41 - INFO - __main__ - Step 607: {'lr': 0.0001515, 'samples': 116544, 'steps': 606, 'loss/train': 5.737253665924072} -08/30/2021 13:20:41 - INFO - __main__ - Step 608: {'lr': 0.00015175, 'samples': 116736, 'steps': 607, 'loss/train': 6.661869525909424} -08/30/2021 13:20:43 - INFO - __main__ - Step 609: {'lr': 0.000152, 'samples': 116928, 'steps': 608, 'loss/train': 5.0190935134887695} -08/30/2021 13:20:43 - INFO - __main__ - Step 610: {'lr': 0.00015225, 'samples': 117120, 'steps': 609, 'loss/train': 5.521247863769531} -08/30/2021 13:20:43 - INFO - __main__ - Step 611: {'lr': 0.0001525, 'samples': 117312, 'steps': 610, 'loss/train': 5.56842041015625} -08/30/2021 13:20:44 - INFO - __main__ - Step 612: {'lr': 0.00015275, 'samples': 117504, 'steps': 611, 'loss/train': 5.202230453491211} -08/30/2021 13:20:44 - INFO - __main__ - Step 613: {'lr': 0.000153, 'samples': 117696, 'steps': 612, 'loss/train': 5.65955114364624} -08/30/2021 13:20:46 - INFO - __main__ - Step 614: {'lr': 0.00015325, 'samples': 117888, 'steps': 613, 'loss/train': 5.5583577156066895} -08/30/2021 13:20:46 - INFO - __main__ - Step 615: {'lr': 0.0001535, 'samples': 118080, 'steps': 614, 'loss/train': 5.10887336730957} -08/30/2021 13:20:46 - INFO - __main__ - Step 616: {'lr': 0.00015375, 'samples': 118272, 'steps': 615, 'loss/train': 5.222726345062256} -08/30/2021 13:20:47 - INFO - __main__ - Step 617: {'lr': 0.000154, 'samples': 118464, 'steps': 616, 'loss/train': 5.619663715362549} -08/30/2021 13:20:47 - INFO - __main__ - Step 618: {'lr': 0.00015425, 'samples': 118656, 'steps': 617, 'loss/train': 5.197406768798828} -08/30/2021 13:20:49 - INFO - __main__ - Step 619: {'lr': 0.00015450000000000001, 'samples': 118848, 'steps': 618, 'loss/train': 5.745248794555664} -08/30/2021 13:20:49 - INFO - __main__ - Step 620: {'lr': 0.00015475, 'samples': 119040, 'steps': 619, 'loss/train': 5.443110466003418} -08/30/2021 13:20:49 - INFO - __main__ - Step 621: {'lr': 0.000155, 'samples': 119232, 'steps': 620, 'loss/train': 5.6602911949157715} -08/30/2021 13:20:50 - INFO - __main__ - Step 622: {'lr': 0.00015525, 'samples': 119424, 'steps': 621, 'loss/train': 5.558720588684082} -08/30/2021 13:20:50 - INFO - __main__ - Step 623: {'lr': 0.0001555, 'samples': 119616, 'steps': 622, 'loss/train': 5.768640995025635} -08/30/2021 13:20:52 - INFO - __main__ - Step 624: {'lr': 0.00015575, 'samples': 119808, 'steps': 623, 'loss/train': 5.520753860473633} -08/30/2021 13:20:52 - INFO - __main__ - Step 625: {'lr': 0.000156, 'samples': 120000, 'steps': 624, 'loss/train': 4.979221820831299} -08/30/2021 13:20:53 - INFO - __main__ - Step 626: {'lr': 0.00015625, 'samples': 120192, 'steps': 625, 'loss/train': 4.893407821655273} -08/30/2021 13:20:53 - INFO - __main__ - Step 627: {'lr': 0.0001565, 'samples': 120384, 'steps': 626, 'loss/train': 3.3585562705993652} -08/30/2021 13:20:53 - INFO - __main__ - Step 628: {'lr': 0.00015675000000000002, 'samples': 120576, 'steps': 627, 'loss/train': 4.998554229736328} -08/30/2021 13:20:54 - INFO - __main__ - Step 629: {'lr': 0.000157, 'samples': 120768, 'steps': 628, 'loss/train': 7.1863813400268555} -08/30/2021 13:20:55 - INFO - __main__ - Step 630: {'lr': 0.00015725, 'samples': 120960, 'steps': 629, 'loss/train': 5.3697638511657715} -08/30/2021 13:20:56 - INFO - __main__ - Step 631: {'lr': 0.0001575, 'samples': 121152, 'steps': 630, 'loss/train': 5.502453804016113} -08/30/2021 13:20:56 - INFO - __main__ - Step 632: {'lr': 0.00015775, 'samples': 121344, 'steps': 631, 'loss/train': 5.311975002288818} -08/30/2021 13:20:56 - INFO - __main__ - Step 633: {'lr': 0.000158, 'samples': 121536, 'steps': 632, 'loss/train': 2.156040668487549} -08/30/2021 13:20:57 - INFO - __main__ - Step 634: {'lr': 0.00015825, 'samples': 121728, 'steps': 633, 'loss/train': 5.429723739624023} -08/30/2021 13:20:58 - INFO - __main__ - Step 635: {'lr': 0.0001585, 'samples': 121920, 'steps': 634, 'loss/train': 5.562890529632568} -08/30/2021 13:20:59 - INFO - __main__ - Step 636: {'lr': 0.00015875, 'samples': 122112, 'steps': 635, 'loss/train': 6.574239253997803} -08/30/2021 13:20:59 - INFO - __main__ - Step 637: {'lr': 0.00015900000000000002, 'samples': 122304, 'steps': 636, 'loss/train': 5.023447513580322} -08/30/2021 13:20:59 - INFO - __main__ - Step 638: {'lr': 0.00015925, 'samples': 122496, 'steps': 637, 'loss/train': 5.247769832611084} -08/30/2021 13:21:00 - INFO - __main__ - Step 639: {'lr': 0.0001595, 'samples': 122688, 'steps': 638, 'loss/train': 5.273298263549805} -08/30/2021 13:21:01 - INFO - __main__ - Step 640: {'lr': 0.00015975, 'samples': 122880, 'steps': 639, 'loss/train': 5.828912258148193} -08/30/2021 13:21:02 - INFO - __main__ - Step 641: {'lr': 0.00016, 'samples': 123072, 'steps': 640, 'loss/train': 5.328188419342041} -08/30/2021 13:21:02 - INFO - __main__ - Step 642: {'lr': 0.00016025000000000002, 'samples': 123264, 'steps': 641, 'loss/train': 5.148167133331299} -08/30/2021 13:21:03 - INFO - __main__ - Step 643: {'lr': 0.0001605, 'samples': 123456, 'steps': 642, 'loss/train': 5.197710037231445} -08/30/2021 13:21:03 - INFO - __main__ - Step 644: {'lr': 0.00016075, 'samples': 123648, 'steps': 643, 'loss/train': 6.053573131561279} -08/30/2021 13:21:03 - INFO - __main__ - Step 645: {'lr': 0.000161, 'samples': 123840, 'steps': 644, 'loss/train': 5.226877689361572} -08/30/2021 13:21:05 - INFO - __main__ - Step 646: {'lr': 0.00016125000000000002, 'samples': 124032, 'steps': 645, 'loss/train': 5.793482780456543} -08/30/2021 13:21:06 - INFO - __main__ - Step 647: {'lr': 0.0001615, 'samples': 124224, 'steps': 646, 'loss/train': 5.376224517822266} -08/30/2021 13:21:06 - INFO - __main__ - Step 648: {'lr': 0.00016175, 'samples': 124416, 'steps': 647, 'loss/train': 4.9352521896362305} -08/30/2021 13:21:06 - INFO - __main__ - Step 649: {'lr': 0.000162, 'samples': 124608, 'steps': 648, 'loss/train': 5.265020370483398} -08/30/2021 13:21:07 - INFO - __main__ - Step 650: {'lr': 0.00016225000000000001, 'samples': 124800, 'steps': 649, 'loss/train': 4.683105945587158} -08/30/2021 13:21:09 - INFO - __main__ - Step 651: {'lr': 0.00016250000000000002, 'samples': 124992, 'steps': 650, 'loss/train': 5.088352203369141} -08/30/2021 13:21:09 - INFO - __main__ - Step 652: {'lr': 0.00016275, 'samples': 125184, 'steps': 651, 'loss/train': 5.291248798370361} -08/30/2021 13:21:09 - INFO - __main__ - Step 653: {'lr': 0.000163, 'samples': 125376, 'steps': 652, 'loss/train': 5.060006141662598} -08/30/2021 13:21:10 - INFO - __main__ - Step 654: {'lr': 0.00016325, 'samples': 125568, 'steps': 653, 'loss/train': 5.836855411529541} -08/30/2021 13:21:10 - INFO - __main__ - Step 655: {'lr': 0.00016350000000000002, 'samples': 125760, 'steps': 654, 'loss/train': 5.828429222106934} -08/30/2021 13:21:10 - INFO - __main__ - Step 656: {'lr': 0.00016375000000000002, 'samples': 125952, 'steps': 655, 'loss/train': 4.9753737449646} -08/30/2021 13:21:12 - INFO - __main__ - Step 657: {'lr': 0.000164, 'samples': 126144, 'steps': 656, 'loss/train': 4.924708843231201} -08/30/2021 13:21:12 - INFO - __main__ - Step 658: {'lr': 0.00016425, 'samples': 126336, 'steps': 657, 'loss/train': 5.880825519561768} -08/30/2021 13:21:13 - INFO - __main__ - Step 659: {'lr': 0.00016450000000000001, 'samples': 126528, 'steps': 658, 'loss/train': 4.768339157104492} -08/30/2021 13:21:13 - INFO - __main__ - Step 660: {'lr': 0.00016475000000000002, 'samples': 126720, 'steps': 659, 'loss/train': 5.182678699493408} -08/30/2021 13:21:13 - INFO - __main__ - Step 661: {'lr': 0.000165, 'samples': 126912, 'steps': 660, 'loss/train': 4.780258655548096} -08/30/2021 13:21:15 - INFO - __main__ - Step 662: {'lr': 0.00016525, 'samples': 127104, 'steps': 661, 'loss/train': 5.283553123474121} -08/30/2021 13:21:16 - INFO - __main__ - Step 663: {'lr': 0.0001655, 'samples': 127296, 'steps': 662, 'loss/train': 5.456881046295166} -08/30/2021 13:21:16 - INFO - __main__ - Step 664: {'lr': 0.00016575000000000002, 'samples': 127488, 'steps': 663, 'loss/train': 5.081045627593994} -08/30/2021 13:21:16 - INFO - __main__ - Step 665: {'lr': 0.00016600000000000002, 'samples': 127680, 'steps': 664, 'loss/train': 4.800060749053955} -08/30/2021 13:21:17 - INFO - __main__ - Step 666: {'lr': 0.00016625, 'samples': 127872, 'steps': 665, 'loss/train': 5.490692615509033} -08/30/2021 13:21:17 - INFO - __main__ - Step 667: {'lr': 0.0001665, 'samples': 128064, 'steps': 666, 'loss/train': 4.857069492340088} -08/30/2021 13:21:18 - INFO - __main__ - Step 668: {'lr': 0.00016675000000000001, 'samples': 128256, 'steps': 667, 'loss/train': 5.199826717376709} -08/30/2021 13:21:19 - INFO - __main__ - Step 669: {'lr': 0.00016700000000000002, 'samples': 128448, 'steps': 668, 'loss/train': 5.700835227966309} -08/30/2021 13:21:19 - INFO - __main__ - Step 670: {'lr': 0.00016725000000000003, 'samples': 128640, 'steps': 669, 'loss/train': 5.933552265167236} -08/30/2021 13:21:20 - INFO - __main__ - Step 671: {'lr': 0.0001675, 'samples': 128832, 'steps': 670, 'loss/train': 5.337162971496582} -08/30/2021 13:21:20 - INFO - __main__ - Step 672: {'lr': 0.00016775, 'samples': 129024, 'steps': 671, 'loss/train': 4.543347358703613} -08/30/2021 13:21:21 - INFO - __main__ - Step 673: {'lr': 0.00016800000000000002, 'samples': 129216, 'steps': 672, 'loss/train': 6.116588115692139} -08/30/2021 13:21:22 - INFO - __main__ - Step 674: {'lr': 0.00016825000000000002, 'samples': 129408, 'steps': 673, 'loss/train': 5.417694568634033} -08/30/2021 13:21:22 - INFO - __main__ - Step 675: {'lr': 0.0001685, 'samples': 129600, 'steps': 674, 'loss/train': 5.213335037231445} -08/30/2021 13:21:22 - INFO - __main__ - Step 676: {'lr': 0.00016875, 'samples': 129792, 'steps': 675, 'loss/train': 5.951706409454346} -08/30/2021 13:21:23 - INFO - __main__ - Step 677: {'lr': 0.00016900000000000002, 'samples': 129984, 'steps': 676, 'loss/train': 5.452194690704346} -08/30/2021 13:21:24 - INFO - __main__ - Step 678: {'lr': 0.00016925000000000002, 'samples': 130176, 'steps': 677, 'loss/train': 5.46601676940918} -08/30/2021 13:21:25 - INFO - __main__ - Step 679: {'lr': 0.00016950000000000003, 'samples': 130368, 'steps': 678, 'loss/train': 5.440823078155518} -08/30/2021 13:21:25 - INFO - __main__ - Step 680: {'lr': 0.00016975, 'samples': 130560, 'steps': 679, 'loss/train': 4.783233165740967} -08/30/2021 13:21:25 - INFO - __main__ - Step 681: {'lr': 0.00017, 'samples': 130752, 'steps': 680, 'loss/train': 6.0311150550842285} -08/30/2021 13:21:26 - INFO - __main__ - Step 682: {'lr': 0.00017025000000000002, 'samples': 130944, 'steps': 681, 'loss/train': 5.060884475708008} -08/30/2021 13:21:27 - INFO - __main__ - Step 683: {'lr': 0.00017050000000000002, 'samples': 131136, 'steps': 682, 'loss/train': 3.212306499481201} -08/30/2021 13:21:28 - INFO - __main__ - Step 684: {'lr': 0.00017075, 'samples': 131328, 'steps': 683, 'loss/train': 5.141605377197266} -08/30/2021 13:21:28 - INFO - __main__ - Step 685: {'lr': 0.000171, 'samples': 131520, 'steps': 684, 'loss/train': 5.018991470336914} -08/30/2021 13:21:29 - INFO - __main__ - Step 686: {'lr': 0.00017125000000000002, 'samples': 131712, 'steps': 685, 'loss/train': 4.840954780578613} -08/30/2021 13:21:29 - INFO - __main__ - Step 687: {'lr': 0.00017150000000000002, 'samples': 131904, 'steps': 686, 'loss/train': 6.280068397521973} -08/30/2021 13:21:29 - INFO - __main__ - Step 688: {'lr': 0.00017175000000000003, 'samples': 132096, 'steps': 687, 'loss/train': 5.397987365722656} -08/30/2021 13:21:31 - INFO - __main__ - Step 689: {'lr': 0.00017199999999999998, 'samples': 132288, 'steps': 688, 'loss/train': 4.996814250946045} -08/30/2021 13:21:31 - INFO - __main__ - Step 690: {'lr': 0.00017224999999999999, 'samples': 132480, 'steps': 689, 'loss/train': 4.932107925415039} -08/30/2021 13:21:32 - INFO - __main__ - Step 691: {'lr': 0.0001725, 'samples': 132672, 'steps': 690, 'loss/train': 5.188143253326416} -08/30/2021 13:21:32 - INFO - __main__ - Step 692: {'lr': 0.00017275, 'samples': 132864, 'steps': 691, 'loss/train': 5.35989236831665} -08/30/2021 13:21:32 - INFO - __main__ - Step 693: {'lr': 0.000173, 'samples': 133056, 'steps': 692, 'loss/train': 5.086303234100342} -08/30/2021 13:21:34 - INFO - __main__ - Step 694: {'lr': 0.00017324999999999998, 'samples': 133248, 'steps': 693, 'loss/train': 4.893771171569824} -08/30/2021 13:21:34 - INFO - __main__ - Step 695: {'lr': 0.0001735, 'samples': 133440, 'steps': 694, 'loss/train': 5.735641956329346} -08/30/2021 13:21:35 - INFO - __main__ - Step 696: {'lr': 0.00017375, 'samples': 133632, 'steps': 695, 'loss/train': 5.167459487915039} -08/30/2021 13:21:35 - INFO - __main__ - Step 697: {'lr': 0.000174, 'samples': 133824, 'steps': 696, 'loss/train': 4.828813076019287} -08/30/2021 13:21:35 - INFO - __main__ - Step 698: {'lr': 0.00017424999999999998, 'samples': 134016, 'steps': 697, 'loss/train': 4.851093292236328} -08/30/2021 13:21:37 - INFO - __main__ - Step 699: {'lr': 0.00017449999999999999, 'samples': 134208, 'steps': 698, 'loss/train': 4.942488193511963} -08/30/2021 13:21:37 - INFO - __main__ - Step 700: {'lr': 0.00017475, 'samples': 134400, 'steps': 699, 'loss/train': 5.506532669067383} -08/30/2021 13:21:38 - INFO - __main__ - Step 701: {'lr': 0.000175, 'samples': 134592, 'steps': 700, 'loss/train': 5.4863715171813965} -08/30/2021 13:21:38 - INFO - __main__ - Step 702: {'lr': 0.00017525, 'samples': 134784, 'steps': 701, 'loss/train': 5.2799553871154785} -08/30/2021 13:21:38 - INFO - __main__ - Step 703: {'lr': 0.00017549999999999998, 'samples': 134976, 'steps': 702, 'loss/train': 5.637045860290527} -08/30/2021 13:21:40 - INFO - __main__ - Step 704: {'lr': 0.00017575, 'samples': 135168, 'steps': 703, 'loss/train': 5.424383640289307} -08/30/2021 13:21:41 - INFO - __main__ - Step 705: {'lr': 0.000176, 'samples': 135360, 'steps': 704, 'loss/train': 5.126307487487793} -08/30/2021 13:21:41 - INFO - __main__ - Step 706: {'lr': 0.00017625, 'samples': 135552, 'steps': 705, 'loss/train': 5.253078460693359} -08/30/2021 13:21:42 - INFO - __main__ - Step 707: {'lr': 0.00017649999999999998, 'samples': 135744, 'steps': 706, 'loss/train': 5.362359046936035} -08/30/2021 13:21:42 - INFO - __main__ - Step 708: {'lr': 0.00017675, 'samples': 135936, 'steps': 707, 'loss/train': 5.219271659851074} -08/30/2021 13:21:43 - INFO - __main__ - Step 709: {'lr': 0.000177, 'samples': 136128, 'steps': 708, 'loss/train': 5.232418537139893} -08/30/2021 13:21:44 - INFO - __main__ - Step 710: {'lr': 0.00017725, 'samples': 136320, 'steps': 709, 'loss/train': 5.332751750946045} -08/30/2021 13:21:44 - INFO - __main__ - Step 711: {'lr': 0.0001775, 'samples': 136512, 'steps': 710, 'loss/train': 5.502506256103516} -08/30/2021 13:21:45 - INFO - __main__ - Step 712: {'lr': 0.00017774999999999998, 'samples': 136704, 'steps': 711, 'loss/train': 5.203675270080566} -08/30/2021 13:21:45 - INFO - __main__ - Step 713: {'lr': 0.000178, 'samples': 136896, 'steps': 712, 'loss/train': 5.390910625457764} -08/30/2021 13:21:46 - INFO - __main__ - Step 714: {'lr': 0.00017825, 'samples': 137088, 'steps': 713, 'loss/train': 5.454862594604492} -08/30/2021 13:21:47 - INFO - __main__ - Step 715: {'lr': 0.0001785, 'samples': 137280, 'steps': 714, 'loss/train': 5.786046981811523} -08/30/2021 13:21:47 - INFO - __main__ - Step 716: {'lr': 0.00017875, 'samples': 137472, 'steps': 715, 'loss/train': 5.449164867401123} -08/30/2021 13:21:48 - INFO - __main__ - Step 717: {'lr': 0.000179, 'samples': 137664, 'steps': 716, 'loss/train': 5.285722732543945} -08/30/2021 13:21:48 - INFO - __main__ - Step 718: {'lr': 0.00017925, 'samples': 137856, 'steps': 717, 'loss/train': 4.428260803222656} -08/30/2021 13:21:50 - INFO - __main__ - Step 719: {'lr': 0.0001795, 'samples': 138048, 'steps': 718, 'loss/train': 4.634762287139893} -08/30/2021 13:21:50 - INFO - __main__ - Step 720: {'lr': 0.00017975, 'samples': 138240, 'steps': 719, 'loss/train': 5.215118885040283} -08/30/2021 13:21:50 - INFO - __main__ - Step 721: {'lr': 0.00017999999999999998, 'samples': 138432, 'steps': 720, 'loss/train': 4.848156929016113} -08/30/2021 13:21:51 - INFO - __main__ - Step 722: {'lr': 0.00018025, 'samples': 138624, 'steps': 721, 'loss/train': 5.2248969078063965} -08/30/2021 13:21:51 - INFO - __main__ - Step 723: {'lr': 0.0001805, 'samples': 138816, 'steps': 722, 'loss/train': 5.293713569641113} -08/30/2021 13:21:51 - INFO - __main__ - Step 724: {'lr': 0.00018075, 'samples': 139008, 'steps': 723, 'loss/train': 2.9500813484191895} -08/30/2021 13:21:53 - INFO - __main__ - Step 725: {'lr': 0.000181, 'samples': 139200, 'steps': 724, 'loss/train': 5.430168151855469} -08/30/2021 13:21:53 - INFO - __main__ - Step 726: {'lr': 0.00018125, 'samples': 139392, 'steps': 725, 'loss/train': 4.909379005432129} -08/30/2021 13:21:53 - INFO - __main__ - Step 727: {'lr': 0.0001815, 'samples': 139584, 'steps': 726, 'loss/train': 4.975824356079102} -08/30/2021 13:21:54 - INFO - __main__ - Step 728: {'lr': 0.00018175, 'samples': 139776, 'steps': 727, 'loss/train': 5.0482683181762695} -08/30/2021 13:21:54 - INFO - __main__ - Step 729: {'lr': 0.000182, 'samples': 139968, 'steps': 728, 'loss/train': 4.883768558502197} -08/30/2021 13:21:56 - INFO - __main__ - Step 730: {'lr': 0.00018225, 'samples': 140160, 'steps': 729, 'loss/train': 5.080338954925537} -08/30/2021 13:21:56 - INFO - __main__ - Step 731: {'lr': 0.0001825, 'samples': 140352, 'steps': 730, 'loss/train': 6.052454948425293} -08/30/2021 13:21:56 - INFO - __main__ - Step 732: {'lr': 0.00018275, 'samples': 140544, 'steps': 731, 'loss/train': 5.398553848266602} -08/30/2021 13:21:57 - INFO - __main__ - Step 733: {'lr': 0.000183, 'samples': 140736, 'steps': 732, 'loss/train': 5.351493835449219} -08/30/2021 13:21:57 - INFO - __main__ - Step 734: {'lr': 0.00018325, 'samples': 140928, 'steps': 733, 'loss/train': 5.326423645019531} -08/30/2021 13:21:59 - INFO - __main__ - Step 735: {'lr': 0.0001835, 'samples': 141120, 'steps': 734, 'loss/train': 5.069309711456299} -08/30/2021 13:21:59 - INFO - __main__ - Step 736: {'lr': 0.00018375, 'samples': 141312, 'steps': 735, 'loss/train': 5.322574138641357} -08/30/2021 13:21:59 - INFO - __main__ - Step 737: {'lr': 0.000184, 'samples': 141504, 'steps': 736, 'loss/train': 5.334287166595459} -08/30/2021 13:22:00 - INFO - __main__ - Step 738: {'lr': 0.00018425, 'samples': 141696, 'steps': 737, 'loss/train': 5.26049280166626} -08/30/2021 13:22:00 - INFO - __main__ - Step 739: {'lr': 0.0001845, 'samples': 141888, 'steps': 738, 'loss/train': 5.1639323234558105} -08/30/2021 13:22:02 - INFO - __main__ - Step 740: {'lr': 0.00018475, 'samples': 142080, 'steps': 739, 'loss/train': 5.386720657348633} -08/30/2021 13:22:02 - INFO - __main__ - Step 741: {'lr': 0.000185, 'samples': 142272, 'steps': 740, 'loss/train': 4.5195183753967285} -08/30/2021 13:22:03 - INFO - __main__ - Step 742: {'lr': 0.00018525, 'samples': 142464, 'steps': 741, 'loss/train': 4.867159843444824} -08/30/2021 13:22:03 - INFO - __main__ - Step 743: {'lr': 0.0001855, 'samples': 142656, 'steps': 742, 'loss/train': 5.191786289215088} -08/30/2021 13:22:03 - INFO - __main__ - Step 744: {'lr': 0.00018575000000000002, 'samples': 142848, 'steps': 743, 'loss/train': 4.717995643615723} -08/30/2021 13:22:05 - INFO - __main__ - Step 745: {'lr': 0.000186, 'samples': 143040, 'steps': 744, 'loss/train': 6.0065155029296875} -08/30/2021 13:22:05 - INFO - __main__ - Step 746: {'lr': 0.00018625, 'samples': 143232, 'steps': 745, 'loss/train': 5.013382434844971} -08/30/2021 13:22:06 - INFO - __main__ - Step 747: {'lr': 0.0001865, 'samples': 143424, 'steps': 746, 'loss/train': 4.988122940063477} -08/30/2021 13:22:06 - INFO - __main__ - Step 748: {'lr': 0.00018675, 'samples': 143616, 'steps': 747, 'loss/train': 4.544159412384033} -08/30/2021 13:22:06 - INFO - __main__ - Step 749: {'lr': 0.000187, 'samples': 143808, 'steps': 748, 'loss/train': 4.364598274230957} -08/30/2021 13:22:08 - INFO - __main__ - Step 750: {'lr': 0.00018725, 'samples': 144000, 'steps': 749, 'loss/train': 4.41270112991333} -08/30/2021 13:22:08 - INFO - __main__ - Step 751: {'lr': 0.0001875, 'samples': 144192, 'steps': 750, 'loss/train': 5.2335357666015625} -08/30/2021 13:22:09 - INFO - __main__ - Step 752: {'lr': 0.00018775, 'samples': 144384, 'steps': 751, 'loss/train': 2.75010085105896} -08/30/2021 13:22:09 - INFO - __main__ - Step 753: {'lr': 0.00018800000000000002, 'samples': 144576, 'steps': 752, 'loss/train': 5.661611080169678} -08/30/2021 13:22:09 - INFO - __main__ - Step 754: {'lr': 0.00018825, 'samples': 144768, 'steps': 753, 'loss/train': 5.012766361236572} -08/30/2021 13:22:10 - INFO - __main__ - Step 755: {'lr': 0.0001885, 'samples': 144960, 'steps': 754, 'loss/train': 4.824182033538818} -08/30/2021 13:22:12 - INFO - __main__ - Step 756: {'lr': 0.00018875, 'samples': 145152, 'steps': 755, 'loss/train': 4.862341403961182} -08/30/2021 13:22:12 - INFO - __main__ - Step 757: {'lr': 0.000189, 'samples': 145344, 'steps': 756, 'loss/train': 4.939844131469727} -08/30/2021 13:22:13 - INFO - __main__ - Step 758: {'lr': 0.00018925, 'samples': 145536, 'steps': 757, 'loss/train': 3.1442975997924805} -08/30/2021 13:22:13 - INFO - __main__ - Step 759: {'lr': 0.0001895, 'samples': 145728, 'steps': 758, 'loss/train': 5.516304016113281} -08/30/2021 13:22:13 - INFO - __main__ - Step 760: {'lr': 0.00018975, 'samples': 145920, 'steps': 759, 'loss/train': 4.981257915496826} -08/30/2021 13:22:15 - INFO - __main__ - Step 761: {'lr': 0.00019, 'samples': 146112, 'steps': 760, 'loss/train': 4.415140628814697} -08/30/2021 13:22:15 - INFO - __main__ - Step 762: {'lr': 0.00019025000000000002, 'samples': 146304, 'steps': 761, 'loss/train': 4.696414470672607} -08/30/2021 13:22:15 - INFO - __main__ - Step 763: {'lr': 0.0001905, 'samples': 146496, 'steps': 762, 'loss/train': 4.768802165985107} -08/30/2021 13:22:16 - INFO - __main__ - Step 764: {'lr': 0.00019075, 'samples': 146688, 'steps': 763, 'loss/train': 2.537238836288452} -08/30/2021 13:22:16 - INFO - __main__ - Step 765: {'lr': 0.000191, 'samples': 146880, 'steps': 764, 'loss/train': 4.994415760040283} -08/30/2021 13:22:18 - INFO - __main__ - Step 766: {'lr': 0.00019125000000000001, 'samples': 147072, 'steps': 765, 'loss/train': 4.782634735107422} -08/30/2021 13:22:18 - INFO - __main__ - Step 767: {'lr': 0.00019150000000000002, 'samples': 147264, 'steps': 766, 'loss/train': 4.660978317260742} -08/30/2021 13:22:19 - INFO - __main__ - Step 768: {'lr': 0.00019175, 'samples': 147456, 'steps': 767, 'loss/train': 5.131323337554932} -08/30/2021 13:22:19 - INFO - __main__ - Step 769: {'lr': 0.000192, 'samples': 147648, 'steps': 768, 'loss/train': 5.445662021636963} -08/30/2021 13:22:19 - INFO - __main__ - Step 770: {'lr': 0.00019225, 'samples': 147840, 'steps': 769, 'loss/train': 6.240190029144287} -08/30/2021 13:22:21 - INFO - __main__ - Step 771: {'lr': 0.00019250000000000002, 'samples': 148032, 'steps': 770, 'loss/train': 2.3361003398895264} -08/30/2021 13:22:21 - INFO - __main__ - Step 772: {'lr': 0.00019275, 'samples': 148224, 'steps': 771, 'loss/train': 5.761361122131348} -08/30/2021 13:22:21 - INFO - __main__ - Step 773: {'lr': 0.000193, 'samples': 148416, 'steps': 772, 'loss/train': 4.719097137451172} -08/30/2021 13:22:22 - INFO - __main__ - Step 774: {'lr': 0.00019325, 'samples': 148608, 'steps': 773, 'loss/train': 4.363806247711182} -08/30/2021 13:22:22 - INFO - __main__ - Step 775: {'lr': 0.00019350000000000001, 'samples': 148800, 'steps': 774, 'loss/train': 5.564626216888428} -08/30/2021 13:22:24 - INFO - __main__ - Step 776: {'lr': 0.00019375000000000002, 'samples': 148992, 'steps': 775, 'loss/train': 5.3247761726379395} -08/30/2021 13:22:24 - INFO - __main__ - Step 777: {'lr': 0.000194, 'samples': 149184, 'steps': 776, 'loss/train': 5.080868721008301} -08/30/2021 13:22:25 - INFO - __main__ - Step 778: {'lr': 0.00019425, 'samples': 149376, 'steps': 777, 'loss/train': 4.219135761260986} -08/30/2021 13:22:25 - INFO - __main__ - Step 779: {'lr': 0.0001945, 'samples': 149568, 'steps': 778, 'loss/train': 4.896482944488525} -08/30/2021 13:22:25 - INFO - __main__ - Step 780: {'lr': 0.00019475000000000002, 'samples': 149760, 'steps': 779, 'loss/train': 5.075745105743408} -08/30/2021 13:22:27 - INFO - __main__ - Step 781: {'lr': 0.00019500000000000002, 'samples': 149952, 'steps': 780, 'loss/train': 5.609300136566162} -08/30/2021 13:22:27 - INFO - __main__ - Step 782: {'lr': 0.00019525, 'samples': 150144, 'steps': 781, 'loss/train': 4.639266490936279} -08/30/2021 13:22:28 - INFO - __main__ - Step 783: {'lr': 0.0001955, 'samples': 150336, 'steps': 782, 'loss/train': 4.969395637512207} -08/30/2021 13:22:28 - INFO - __main__ - Step 784: {'lr': 0.00019575000000000001, 'samples': 150528, 'steps': 783, 'loss/train': 4.845355987548828} -08/30/2021 13:22:28 - INFO - __main__ - Step 785: {'lr': 0.00019600000000000002, 'samples': 150720, 'steps': 784, 'loss/train': 4.61663818359375} -08/30/2021 13:22:30 - INFO - __main__ - Step 786: {'lr': 0.00019625, 'samples': 150912, 'steps': 785, 'loss/train': 5.339992046356201} -08/30/2021 13:22:30 - INFO - __main__ - Step 787: {'lr': 0.0001965, 'samples': 151104, 'steps': 786, 'loss/train': 5.528865814208984} -08/30/2021 13:22:31 - INFO - __main__ - Step 788: {'lr': 0.00019675, 'samples': 151296, 'steps': 787, 'loss/train': 4.822768211364746} -08/30/2021 13:22:31 - INFO - __main__ - Step 789: {'lr': 0.00019700000000000002, 'samples': 151488, 'steps': 788, 'loss/train': 5.273317337036133} -08/30/2021 13:22:31 - INFO - __main__ - Step 790: {'lr': 0.00019725000000000002, 'samples': 151680, 'steps': 789, 'loss/train': 5.14328145980835} -08/30/2021 13:22:32 - INFO - __main__ - Step 791: {'lr': 0.0001975, 'samples': 151872, 'steps': 790, 'loss/train': 3.8901455402374268} -08/30/2021 13:22:33 - INFO - __main__ - Step 792: {'lr': 0.00019775, 'samples': 152064, 'steps': 791, 'loss/train': 4.757646560668945} -08/30/2021 13:22:33 - INFO - __main__ - Step 793: {'lr': 0.00019800000000000002, 'samples': 152256, 'steps': 792, 'loss/train': 4.969261169433594} -08/30/2021 13:22:34 - INFO - __main__ - Step 794: {'lr': 0.00019825000000000002, 'samples': 152448, 'steps': 793, 'loss/train': 5.182010173797607} -08/30/2021 13:22:34 - INFO - __main__ - Step 795: {'lr': 0.00019850000000000003, 'samples': 152640, 'steps': 794, 'loss/train': 5.210019111633301} -08/30/2021 13:22:34 - INFO - __main__ - Step 796: {'lr': 0.00019875, 'samples': 152832, 'steps': 795, 'loss/train': 5.464728355407715} -08/30/2021 13:22:36 - INFO - __main__ - Step 797: {'lr': 0.000199, 'samples': 153024, 'steps': 796, 'loss/train': 4.786752223968506} -08/30/2021 13:22:36 - INFO - __main__ - Step 798: {'lr': 0.00019925000000000002, 'samples': 153216, 'steps': 797, 'loss/train': 4.941608428955078} -08/30/2021 13:22:37 - INFO - __main__ - Step 799: {'lr': 0.00019950000000000002, 'samples': 153408, 'steps': 798, 'loss/train': 5.074517726898193} -08/30/2021 13:22:37 - INFO - __main__ - Step 800: {'lr': 0.00019975, 'samples': 153600, 'steps': 799, 'loss/train': 4.99080753326416} -08/30/2021 13:22:37 - INFO - __main__ - Step 801: {'lr': 0.0002, 'samples': 153792, 'steps': 800, 'loss/train': 5.171445369720459} -08/30/2021 13:22:39 - INFO - __main__ - Step 802: {'lr': 0.00020025000000000002, 'samples': 153984, 'steps': 801, 'loss/train': 4.744009971618652} -08/30/2021 13:22:40 - INFO - __main__ - Step 803: {'lr': 0.00020050000000000002, 'samples': 154176, 'steps': 802, 'loss/train': 4.89526891708374} -08/30/2021 13:22:40 - INFO - __main__ - Step 804: {'lr': 0.00020075000000000003, 'samples': 154368, 'steps': 803, 'loss/train': 5.267028331756592} -08/30/2021 13:22:41 - INFO - __main__ - Step 805: {'lr': 0.000201, 'samples': 154560, 'steps': 804, 'loss/train': 3.488680839538574} -08/30/2021 13:22:41 - INFO - __main__ - Step 806: {'lr': 0.00020125, 'samples': 154752, 'steps': 805, 'loss/train': 5.09182071685791} -08/30/2021 13:22:41 - INFO - __main__ - Step 807: {'lr': 0.00020150000000000002, 'samples': 154944, 'steps': 806, 'loss/train': 7.005643844604492} -08/30/2021 13:22:43 - INFO - __main__ - Step 808: {'lr': 0.00020175000000000003, 'samples': 155136, 'steps': 807, 'loss/train': 5.229349136352539} -08/30/2021 13:22:44 - INFO - __main__ - Step 809: {'lr': 0.000202, 'samples': 155328, 'steps': 808, 'loss/train': 6.564152240753174} -08/30/2021 13:22:44 - INFO - __main__ - Step 810: {'lr': 0.00020225, 'samples': 155520, 'steps': 809, 'loss/train': 5.298187732696533} -08/30/2021 13:22:44 - INFO - __main__ - Step 811: {'lr': 0.00020250000000000002, 'samples': 155712, 'steps': 810, 'loss/train': 5.483476161956787} -08/30/2021 13:22:45 - INFO - __main__ - Step 812: {'lr': 0.00020275000000000002, 'samples': 155904, 'steps': 811, 'loss/train': 5.093533039093018} -08/30/2021 13:22:46 - INFO - __main__ - Step 813: {'lr': 0.00020300000000000003, 'samples': 156096, 'steps': 812, 'loss/train': 5.095035076141357} -08/30/2021 13:22:47 - INFO - __main__ - Step 814: {'lr': 0.00020324999999999998, 'samples': 156288, 'steps': 813, 'loss/train': 5.363131523132324} -08/30/2021 13:22:47 - INFO - __main__ - Step 815: {'lr': 0.00020349999999999999, 'samples': 156480, 'steps': 814, 'loss/train': 4.598577499389648} -08/30/2021 13:22:47 - INFO - __main__ - Step 816: {'lr': 0.00020375, 'samples': 156672, 'steps': 815, 'loss/train': 5.136349678039551} -08/30/2021 13:22:48 - INFO - __main__ - Step 817: {'lr': 0.000204, 'samples': 156864, 'steps': 816, 'loss/train': 5.176651954650879} -08/30/2021 13:22:49 - INFO - __main__ - Step 818: {'lr': 0.00020425, 'samples': 157056, 'steps': 817, 'loss/train': 5.160329818725586} -08/30/2021 13:22:49 - INFO - __main__ - Step 819: {'lr': 0.00020449999999999998, 'samples': 157248, 'steps': 818, 'loss/train': 5.5419111251831055} -08/30/2021 13:22:50 - INFO - __main__ - Step 820: {'lr': 0.00020475, 'samples': 157440, 'steps': 819, 'loss/train': 4.841118812561035} -08/30/2021 13:22:50 - INFO - __main__ - Step 821: {'lr': 0.000205, 'samples': 157632, 'steps': 820, 'loss/train': 5.133449077606201} -08/30/2021 13:22:51 - INFO - __main__ - Step 822: {'lr': 0.00020525, 'samples': 157824, 'steps': 821, 'loss/train': 5.230595588684082} -08/30/2021 13:22:52 - INFO - __main__ - Step 823: {'lr': 0.00020549999999999998, 'samples': 158016, 'steps': 822, 'loss/train': 4.926100254058838} -08/30/2021 13:22:53 - INFO - __main__ - Step 824: {'lr': 0.00020575, 'samples': 158208, 'steps': 823, 'loss/train': 4.861969947814941} -08/30/2021 13:22:53 - INFO - __main__ - Step 825: {'lr': 0.000206, 'samples': 158400, 'steps': 824, 'loss/train': 5.224119663238525} -08/30/2021 13:22:53 - INFO - __main__ - Step 826: {'lr': 0.00020625, 'samples': 158592, 'steps': 825, 'loss/train': 4.030957221984863} -08/30/2021 13:22:54 - INFO - __main__ - Step 827: {'lr': 0.0002065, 'samples': 158784, 'steps': 826, 'loss/train': 5.341745376586914} -08/30/2021 13:22:54 - INFO - __main__ - Step 828: {'lr': 0.00020674999999999998, 'samples': 158976, 'steps': 827, 'loss/train': 5.493295669555664} -08/30/2021 13:22:56 - INFO - __main__ - Step 829: {'lr': 0.000207, 'samples': 159168, 'steps': 828, 'loss/train': 5.471200942993164} -08/30/2021 13:22:57 - INFO - __main__ - Step 830: {'lr': 0.00020725, 'samples': 159360, 'steps': 829, 'loss/train': 5.901124000549316} -08/30/2021 13:22:57 - INFO - __main__ - Step 831: {'lr': 0.0002075, 'samples': 159552, 'steps': 830, 'loss/train': 5.5267744064331055} -08/30/2021 13:22:57 - INFO - __main__ - Step 832: {'lr': 0.00020774999999999998, 'samples': 159744, 'steps': 831, 'loss/train': 5.741833686828613} -08/30/2021 13:22:58 - INFO - __main__ - Step 833: {'lr': 0.000208, 'samples': 159936, 'steps': 832, 'loss/train': 4.6413984298706055} -08/30/2021 13:22:59 - INFO - __main__ - Step 834: {'lr': 0.00020825, 'samples': 160128, 'steps': 833, 'loss/train': 5.036070346832275} -08/30/2021 13:23:00 - INFO - __main__ - Step 835: {'lr': 0.0002085, 'samples': 160320, 'steps': 834, 'loss/train': 5.281602382659912} -08/30/2021 13:23:00 - INFO - __main__ - Step 836: {'lr': 0.00020875, 'samples': 160512, 'steps': 835, 'loss/train': 5.298867702484131} -08/30/2021 13:23:00 - INFO - __main__ - Step 837: {'lr': 0.00020899999999999998, 'samples': 160704, 'steps': 836, 'loss/train': 5.015073299407959} -08/30/2021 13:23:01 - INFO - __main__ - Step 838: {'lr': 0.00020925, 'samples': 160896, 'steps': 837, 'loss/train': 4.940237998962402} -08/30/2021 13:23:02 - INFO - __main__ - Step 839: {'lr': 0.0002095, 'samples': 161088, 'steps': 838, 'loss/train': 5.205511093139648} -08/30/2021 13:23:03 - INFO - __main__ - Step 840: {'lr': 0.00020975, 'samples': 161280, 'steps': 839, 'loss/train': 4.30275821685791} -08/30/2021 13:23:03 - INFO - __main__ - Step 841: {'lr': 0.00021, 'samples': 161472, 'steps': 840, 'loss/train': 4.556493759155273} -08/30/2021 13:23:03 - INFO - __main__ - Step 842: {'lr': 0.00021025, 'samples': 161664, 'steps': 841, 'loss/train': 5.241671562194824} -08/30/2021 13:23:04 - INFO - __main__ - Step 843: {'lr': 0.0002105, 'samples': 161856, 'steps': 842, 'loss/train': 5.299282073974609} -08/30/2021 13:23:04 - INFO - __main__ - Step 844: {'lr': 0.00021075, 'samples': 162048, 'steps': 843, 'loss/train': 5.412060260772705} -08/30/2021 13:23:05 - INFO - __main__ - Step 845: {'lr': 0.000211, 'samples': 162240, 'steps': 844, 'loss/train': 4.72500467300415} -08/30/2021 13:23:06 - INFO - __main__ - Step 846: {'lr': 0.00021124999999999998, 'samples': 162432, 'steps': 845, 'loss/train': 5.450290679931641} -08/30/2021 13:23:06 - INFO - __main__ - Step 847: {'lr': 0.0002115, 'samples': 162624, 'steps': 846, 'loss/train': 5.327075481414795} -08/30/2021 13:23:06 - INFO - __main__ - Step 848: {'lr': 0.00021175, 'samples': 162816, 'steps': 847, 'loss/train': 5.164058685302734} -08/30/2021 13:23:07 - INFO - __main__ - Step 849: {'lr': 0.000212, 'samples': 163008, 'steps': 848, 'loss/train': 2.9785478115081787} -08/30/2021 13:23:08 - INFO - __main__ - Step 850: {'lr': 0.00021225, 'samples': 163200, 'steps': 849, 'loss/train': 4.942882061004639} -08/30/2021 13:23:09 - INFO - __main__ - Step 851: {'lr': 0.0002125, 'samples': 163392, 'steps': 850, 'loss/train': 4.294112205505371} -08/30/2021 13:23:09 - INFO - __main__ - Step 852: {'lr': 0.00021275, 'samples': 163584, 'steps': 851, 'loss/train': 4.876553058624268} -08/30/2021 13:23:09 - INFO - __main__ - Step 853: {'lr': 0.000213, 'samples': 163776, 'steps': 852, 'loss/train': 5.452459335327148} -08/30/2021 13:23:10 - INFO - __main__ - Step 854: {'lr': 0.00021325, 'samples': 163968, 'steps': 853, 'loss/train': 3.861050605773926} -08/30/2021 13:23:11 - INFO - __main__ - Step 855: {'lr': 0.0002135, 'samples': 164160, 'steps': 854, 'loss/train': 5.315682888031006} -08/30/2021 13:23:12 - INFO - __main__ - Step 856: {'lr': 0.00021375, 'samples': 164352, 'steps': 855, 'loss/train': 4.639874458312988} -08/30/2021 13:23:12 - INFO - __main__ - Step 857: {'lr': 0.000214, 'samples': 164544, 'steps': 856, 'loss/train': 4.612071990966797} -08/30/2021 13:23:12 - INFO - __main__ - Step 858: {'lr': 0.00021425, 'samples': 164736, 'steps': 857, 'loss/train': 5.122485637664795} -08/30/2021 13:23:13 - INFO - __main__ - Step 859: {'lr': 0.0002145, 'samples': 164928, 'steps': 858, 'loss/train': 5.199220180511475} -08/30/2021 13:23:14 - INFO - __main__ - Step 860: {'lr': 0.00021475, 'samples': 165120, 'steps': 859, 'loss/train': 5.492043495178223} -08/30/2021 13:23:15 - INFO - __main__ - Step 861: {'lr': 0.000215, 'samples': 165312, 'steps': 860, 'loss/train': 4.861348628997803} -08/30/2021 13:23:15 - INFO - __main__ - Step 862: {'lr': 0.00021525, 'samples': 165504, 'steps': 861, 'loss/train': 5.139138698577881} -08/30/2021 13:23:15 - INFO - __main__ - Step 863: {'lr': 0.0002155, 'samples': 165696, 'steps': 862, 'loss/train': 5.403965473175049} -08/30/2021 13:23:16 - INFO - __main__ - Step 864: {'lr': 0.00021575, 'samples': 165888, 'steps': 863, 'loss/train': 5.412846565246582} -08/30/2021 13:23:16 - INFO - __main__ - Step 865: {'lr': 0.000216, 'samples': 166080, 'steps': 864, 'loss/train': 5.67106294631958} -08/30/2021 13:23:18 - INFO - __main__ - Step 866: {'lr': 0.00021625, 'samples': 166272, 'steps': 865, 'loss/train': 5.427254676818848} -08/30/2021 13:23:18 - INFO - __main__ - Step 867: {'lr': 0.0002165, 'samples': 166464, 'steps': 866, 'loss/train': 5.4803643226623535} -08/30/2021 13:23:19 - INFO - __main__ - Step 868: {'lr': 0.00021675, 'samples': 166656, 'steps': 867, 'loss/train': 4.972472667694092} -08/30/2021 13:23:19 - INFO - __main__ - Step 869: {'lr': 0.00021700000000000002, 'samples': 166848, 'steps': 868, 'loss/train': 5.120309829711914} -08/30/2021 13:23:19 - INFO - __main__ - Step 870: {'lr': 0.00021725, 'samples': 167040, 'steps': 869, 'loss/train': 4.365508556365967} -08/30/2021 13:23:21 - INFO - __main__ - Step 871: {'lr': 0.0002175, 'samples': 167232, 'steps': 870, 'loss/train': 4.659406661987305} -08/30/2021 13:23:21 - INFO - __main__ - Step 872: {'lr': 0.00021775, 'samples': 167424, 'steps': 871, 'loss/train': 3.791257381439209} -08/30/2021 13:23:22 - INFO - __main__ - Step 873: {'lr': 0.000218, 'samples': 167616, 'steps': 872, 'loss/train': 5.003664493560791} -08/30/2021 13:23:22 - INFO - __main__ - Step 874: {'lr': 0.00021825, 'samples': 167808, 'steps': 873, 'loss/train': 5.018499851226807} -08/30/2021 13:23:22 - INFO - __main__ - Step 875: {'lr': 0.0002185, 'samples': 168000, 'steps': 874, 'loss/train': 4.5537919998168945} -08/30/2021 13:23:24 - INFO - __main__ - Step 876: {'lr': 0.00021875, 'samples': 168192, 'steps': 875, 'loss/train': 5.3264007568359375} -08/30/2021 13:23:24 - INFO - __main__ - Step 877: {'lr': 0.000219, 'samples': 168384, 'steps': 876, 'loss/train': 5.37451696395874} -08/30/2021 13:23:25 - INFO - __main__ - Step 878: {'lr': 0.00021925000000000002, 'samples': 168576, 'steps': 877, 'loss/train': 5.83143424987793} -08/30/2021 13:23:25 - INFO - __main__ - Step 879: {'lr': 0.0002195, 'samples': 168768, 'steps': 878, 'loss/train': 5.012094974517822} -08/30/2021 13:23:25 - INFO - __main__ - Step 880: {'lr': 0.00021975, 'samples': 168960, 'steps': 879, 'loss/train': 5.125668048858643} -08/30/2021 13:23:27 - INFO - __main__ - Step 881: {'lr': 0.00022, 'samples': 169152, 'steps': 880, 'loss/train': 4.766420841217041} -08/30/2021 13:23:27 - INFO - __main__ - Step 882: {'lr': 0.00022025000000000001, 'samples': 169344, 'steps': 881, 'loss/train': 4.905979156494141} -08/30/2021 13:23:28 - INFO - __main__ - Step 883: {'lr': 0.0002205, 'samples': 169536, 'steps': 882, 'loss/train': 4.748187065124512} -08/30/2021 13:23:28 - INFO - __main__ - Step 884: {'lr': 0.00022075, 'samples': 169728, 'steps': 883, 'loss/train': 4.937015533447266} -08/30/2021 13:23:29 - INFO - __main__ - Step 885: {'lr': 0.000221, 'samples': 169920, 'steps': 884, 'loss/train': 5.347287654876709} -08/30/2021 13:23:29 - INFO - __main__ - Step 886: {'lr': 0.00022125, 'samples': 170112, 'steps': 885, 'loss/train': 5.439239978790283} -08/30/2021 13:23:30 - INFO - __main__ - Step 887: {'lr': 0.00022150000000000002, 'samples': 170304, 'steps': 886, 'loss/train': 3.6341307163238525} -08/30/2021 13:23:31 - INFO - __main__ - Step 888: {'lr': 0.00022175, 'samples': 170496, 'steps': 887, 'loss/train': 5.345653057098389} -08/30/2021 13:23:31 - INFO - __main__ - Step 889: {'lr': 0.000222, 'samples': 170688, 'steps': 888, 'loss/train': 4.535131931304932} -08/30/2021 13:23:31 - INFO - __main__ - Step 890: {'lr': 0.00022225, 'samples': 170880, 'steps': 889, 'loss/train': 4.764547348022461} -08/30/2021 13:23:32 - INFO - __main__ - Step 891: {'lr': 0.00022250000000000001, 'samples': 171072, 'steps': 890, 'loss/train': 5.351622104644775} -08/30/2021 13:23:34 - INFO - __main__ - Step 892: {'lr': 0.00022275000000000002, 'samples': 171264, 'steps': 891, 'loss/train': 5.136674880981445} -08/30/2021 13:23:34 - INFO - __main__ - Step 893: {'lr': 0.000223, 'samples': 171456, 'steps': 892, 'loss/train': 5.209806442260742} -08/30/2021 13:23:35 - INFO - __main__ - Step 894: {'lr': 0.00022325, 'samples': 171648, 'steps': 893, 'loss/train': 4.967884063720703} -08/30/2021 13:23:35 - INFO - __main__ - Step 895: {'lr': 0.0002235, 'samples': 171840, 'steps': 894, 'loss/train': 5.144252300262451} -08/30/2021 13:23:35 - INFO - __main__ - Step 896: {'lr': 0.00022375000000000002, 'samples': 172032, 'steps': 895, 'loss/train': 4.881674766540527} -08/30/2021 13:23:37 - INFO - __main__ - Step 897: {'lr': 0.000224, 'samples': 172224, 'steps': 896, 'loss/train': 3.2832298278808594} -08/30/2021 13:23:38 - INFO - __main__ - Step 898: {'lr': 0.00022425, 'samples': 172416, 'steps': 897, 'loss/train': 3.2080790996551514} -08/30/2021 13:23:38 - INFO - __main__ - Step 899: {'lr': 0.0002245, 'samples': 172608, 'steps': 898, 'loss/train': 4.1041364669799805} -08/30/2021 13:23:38 - INFO - __main__ - Step 900: {'lr': 0.00022475000000000001, 'samples': 172800, 'steps': 899, 'loss/train': 3.7498514652252197} -08/30/2021 13:23:39 - INFO - __main__ - Step 901: {'lr': 0.00022500000000000002, 'samples': 172992, 'steps': 900, 'loss/train': 4.493736743927002} -08/30/2021 13:23:39 - INFO - __main__ - Step 902: {'lr': 0.00022525, 'samples': 173184, 'steps': 901, 'loss/train': 4.7351813316345215} -08/30/2021 13:23:40 - INFO - __main__ - Step 903: {'lr': 0.0002255, 'samples': 173376, 'steps': 902, 'loss/train': 5.0882344245910645} -08/30/2021 13:23:41 - INFO - __main__ - Step 904: {'lr': 0.00022575, 'samples': 173568, 'steps': 903, 'loss/train': 5.257927894592285} -08/30/2021 13:23:41 - INFO - __main__ - Step 905: {'lr': 0.00022600000000000002, 'samples': 173760, 'steps': 904, 'loss/train': 5.417869567871094} -08/30/2021 13:23:42 - INFO - __main__ - Step 906: {'lr': 0.00022625000000000002, 'samples': 173952, 'steps': 905, 'loss/train': 4.744801044464111} -08/30/2021 13:23:42 - INFO - __main__ - Step 907: {'lr': 0.0002265, 'samples': 174144, 'steps': 906, 'loss/train': 5.283426761627197} -08/30/2021 13:23:44 - INFO - __main__ - Step 908: {'lr': 0.00022675, 'samples': 174336, 'steps': 907, 'loss/train': 4.119637489318848} -08/30/2021 13:23:44 - INFO - __main__ - Step 909: {'lr': 0.00022700000000000002, 'samples': 174528, 'steps': 908, 'loss/train': 4.175868034362793} -08/30/2021 13:23:45 - INFO - __main__ - Step 910: {'lr': 0.00022725000000000002, 'samples': 174720, 'steps': 909, 'loss/train': 5.934485912322998} -08/30/2021 13:23:45 - INFO - __main__ - Step 911: {'lr': 0.0002275, 'samples': 174912, 'steps': 910, 'loss/train': 2.738405704498291} -08/30/2021 13:23:45 - INFO - __main__ - Step 912: {'lr': 0.00022775, 'samples': 175104, 'steps': 911, 'loss/train': 3.277622699737549} -08/30/2021 13:23:46 - INFO - __main__ - Step 913: {'lr': 0.000228, 'samples': 175296, 'steps': 912, 'loss/train': 3.008151054382324} -08/30/2021 13:23:47 - INFO - __main__ - Step 914: {'lr': 0.00022825000000000002, 'samples': 175488, 'steps': 913, 'loss/train': 5.002523899078369} -08/30/2021 13:23:48 - INFO - __main__ - Step 915: {'lr': 0.00022850000000000002, 'samples': 175680, 'steps': 914, 'loss/train': 5.076720237731934} -08/30/2021 13:23:48 - INFO - __main__ - Step 916: {'lr': 0.00022875, 'samples': 175872, 'steps': 915, 'loss/train': 5.253383636474609} -08/30/2021 13:23:48 - INFO - __main__ - Step 917: {'lr': 0.000229, 'samples': 176064, 'steps': 916, 'loss/train': 5.0943284034729} -08/30/2021 13:23:49 - INFO - __main__ - Step 918: {'lr': 0.00022925000000000002, 'samples': 176256, 'steps': 917, 'loss/train': 4.55018949508667} -08/30/2021 13:23:51 - INFO - __main__ - Step 919: {'lr': 0.00022950000000000002, 'samples': 176448, 'steps': 918, 'loss/train': 4.921761512756348} -08/30/2021 13:23:52 - INFO - __main__ - Step 920: {'lr': 0.00022975000000000003, 'samples': 176640, 'steps': 919, 'loss/train': 5.253277778625488} -08/30/2021 13:23:52 - INFO - __main__ - Step 921: {'lr': 0.00023, 'samples': 176832, 'steps': 920, 'loss/train': 5.203185081481934} -08/30/2021 13:23:53 - INFO - __main__ - Step 922: {'lr': 0.00023025, 'samples': 177024, 'steps': 921, 'loss/train': 4.610296726226807} -08/30/2021 13:23:53 - INFO - __main__ - Step 923: {'lr': 0.00023050000000000002, 'samples': 177216, 'steps': 922, 'loss/train': 5.244607925415039} -08/30/2021 13:23:53 - INFO - __main__ - Step 924: {'lr': 0.00023075000000000003, 'samples': 177408, 'steps': 923, 'loss/train': 3.095468282699585} -08/30/2021 13:23:55 - INFO - __main__ - Step 925: {'lr': 0.000231, 'samples': 177600, 'steps': 924, 'loss/train': 5.682310104370117} -08/30/2021 13:23:55 - INFO - __main__ - Step 926: {'lr': 0.00023125, 'samples': 177792, 'steps': 925, 'loss/train': 5.327188491821289} -08/30/2021 13:23:56 - INFO - __main__ - Step 927: {'lr': 0.00023150000000000002, 'samples': 177984, 'steps': 926, 'loss/train': 4.54959774017334} -08/30/2021 13:23:56 - INFO - __main__ - Step 928: {'lr': 0.00023175000000000002, 'samples': 178176, 'steps': 927, 'loss/train': 4.926276206970215} -08/30/2021 13:23:57 - INFO - __main__ - Step 929: {'lr': 0.00023200000000000003, 'samples': 178368, 'steps': 928, 'loss/train': 5.122226238250732} -08/30/2021 13:23:57 - INFO - __main__ - Step 930: {'lr': 0.00023225, 'samples': 178560, 'steps': 929, 'loss/train': 4.549820423126221} -08/30/2021 13:23:58 - INFO - __main__ - Step 931: {'lr': 0.0002325, 'samples': 178752, 'steps': 930, 'loss/train': 4.424227237701416} -08/30/2021 13:23:59 - INFO - __main__ - Step 932: {'lr': 0.00023275000000000002, 'samples': 178944, 'steps': 931, 'loss/train': 5.274239540100098} -08/30/2021 13:23:59 - INFO - __main__ - Step 933: {'lr': 0.00023300000000000003, 'samples': 179136, 'steps': 932, 'loss/train': 4.753902912139893} -08/30/2021 13:24:00 - INFO - __main__ - Step 934: {'lr': 0.00023325, 'samples': 179328, 'steps': 933, 'loss/train': 5.339258193969727} -08/30/2021 13:24:00 - INFO - __main__ - Step 935: {'lr': 0.0002335, 'samples': 179520, 'steps': 934, 'loss/train': 5.210813045501709} -08/30/2021 13:24:00 - INFO - __main__ - Step 936: {'lr': 0.00023375000000000002, 'samples': 179712, 'steps': 935, 'loss/train': 6.598178863525391} -08/30/2021 13:24:02 - INFO - __main__ - Step 937: {'lr': 0.00023400000000000002, 'samples': 179904, 'steps': 936, 'loss/train': 5.520947456359863} -08/30/2021 13:24:02 - INFO - __main__ - Step 938: {'lr': 0.00023425000000000003, 'samples': 180096, 'steps': 937, 'loss/train': 4.812737941741943} -08/30/2021 13:24:03 - INFO - __main__ - Step 939: {'lr': 0.00023449999999999998, 'samples': 180288, 'steps': 938, 'loss/train': 5.629942893981934} -08/30/2021 13:24:03 - INFO - __main__ - Step 940: {'lr': 0.00023475, 'samples': 180480, 'steps': 939, 'loss/train': 5.933011531829834} -08/30/2021 13:24:03 - INFO - __main__ - Step 941: {'lr': 0.000235, 'samples': 180672, 'steps': 940, 'loss/train': 5.207772254943848} -08/30/2021 13:24:05 - INFO - __main__ - Step 942: {'lr': 0.00023525, 'samples': 180864, 'steps': 941, 'loss/train': 4.708285331726074} -08/30/2021 13:24:06 - INFO - __main__ - Step 943: {'lr': 0.0002355, 'samples': 181056, 'steps': 942, 'loss/train': 5.191772937774658} -08/30/2021 13:24:06 - INFO - __main__ - Step 944: {'lr': 0.00023574999999999998, 'samples': 181248, 'steps': 943, 'loss/train': 5.858270645141602} -08/30/2021 13:24:06 - INFO - __main__ - Step 945: {'lr': 0.000236, 'samples': 181440, 'steps': 944, 'loss/train': 4.297399520874023} -08/30/2021 13:24:07 - INFO - __main__ - Step 946: {'lr': 0.00023625, 'samples': 181632, 'steps': 945, 'loss/train': 4.04622745513916} -08/30/2021 13:24:07 - INFO - __main__ - Step 947: {'lr': 0.0002365, 'samples': 181824, 'steps': 946, 'loss/train': 4.916435718536377} -08/30/2021 13:24:09 - INFO - __main__ - Step 948: {'lr': 0.00023674999999999998, 'samples': 182016, 'steps': 947, 'loss/train': 4.6477370262146} -08/30/2021 13:24:09 - INFO - __main__ - Step 949: {'lr': 0.000237, 'samples': 182208, 'steps': 948, 'loss/train': 5.313317775726318} -08/30/2021 13:24:10 - INFO - __main__ - Step 950: {'lr': 0.00023725, 'samples': 182400, 'steps': 949, 'loss/train': 5.334430694580078} -08/30/2021 13:24:10 - INFO - __main__ - Step 951: {'lr': 0.0002375, 'samples': 182592, 'steps': 950, 'loss/train': 2.398557424545288} -08/30/2021 13:24:10 - INFO - __main__ - Step 952: {'lr': 0.00023775, 'samples': 182784, 'steps': 951, 'loss/train': 5.0697431564331055} -08/30/2021 13:24:12 - INFO - __main__ - Step 953: {'lr': 0.00023799999999999998, 'samples': 182976, 'steps': 952, 'loss/train': 5.132518291473389} -08/30/2021 13:24:12 - INFO - __main__ - Step 954: {'lr': 0.00023825, 'samples': 183168, 'steps': 953, 'loss/train': 4.551535606384277} -08/30/2021 13:24:12 - INFO - __main__ - Step 955: {'lr': 0.0002385, 'samples': 183360, 'steps': 954, 'loss/train': 4.82934045791626} -08/30/2021 13:24:13 - INFO - __main__ - Step 956: {'lr': 0.00023875, 'samples': 183552, 'steps': 955, 'loss/train': 5.0286688804626465} -08/30/2021 13:24:13 - INFO - __main__ - Step 957: {'lr': 0.00023899999999999998, 'samples': 183744, 'steps': 956, 'loss/train': 5.761747360229492} -08/30/2021 13:24:15 - INFO - __main__ - Step 958: {'lr': 0.00023925, 'samples': 183936, 'steps': 957, 'loss/train': 4.5377516746521} -08/30/2021 13:24:15 - INFO - __main__ - Step 959: {'lr': 0.0002395, 'samples': 184128, 'steps': 958, 'loss/train': 4.695328235626221} -08/30/2021 13:24:15 - INFO - __main__ - Step 960: {'lr': 0.00023975, 'samples': 184320, 'steps': 959, 'loss/train': 4.9971842765808105} -08/30/2021 13:24:16 - INFO - __main__ - Step 961: {'lr': 0.00024, 'samples': 184512, 'steps': 960, 'loss/train': 5.350215911865234} -08/30/2021 13:24:16 - INFO - __main__ - Step 962: {'lr': 0.00024024999999999999, 'samples': 184704, 'steps': 961, 'loss/train': 4.973150730133057} -08/30/2021 13:24:18 - INFO - __main__ - Step 963: {'lr': 0.0002405, 'samples': 184896, 'steps': 962, 'loss/train': 4.839539527893066} -08/30/2021 13:24:18 - INFO - __main__ - Step 964: {'lr': 0.00024075, 'samples': 185088, 'steps': 963, 'loss/train': 5.313961982727051} -08/30/2021 13:24:19 - INFO - __main__ - Step 965: {'lr': 0.000241, 'samples': 185280, 'steps': 964, 'loss/train': 5.329487323760986} -08/30/2021 13:24:19 - INFO - __main__ - Step 966: {'lr': 0.00024125, 'samples': 185472, 'steps': 965, 'loss/train': 4.904882907867432} -08/30/2021 13:24:19 - INFO - __main__ - Step 967: {'lr': 0.0002415, 'samples': 185664, 'steps': 966, 'loss/train': 4.989374160766602} -08/30/2021 13:24:21 - INFO - __main__ - Step 968: {'lr': 0.00024175, 'samples': 185856, 'steps': 967, 'loss/train': 4.942816734313965} -08/30/2021 13:24:21 - INFO - __main__ - Step 969: {'lr': 0.000242, 'samples': 186048, 'steps': 968, 'loss/train': 4.176417827606201} -08/30/2021 13:24:22 - INFO - __main__ - Step 970: {'lr': 0.00024225, 'samples': 186240, 'steps': 969, 'loss/train': 2.1338582038879395} -08/30/2021 13:24:22 - INFO - __main__ - Step 971: {'lr': 0.00024249999999999999, 'samples': 186432, 'steps': 970, 'loss/train': 3.527592182159424} -08/30/2021 13:24:22 - INFO - __main__ - Step 972: {'lr': 0.00024275, 'samples': 186624, 'steps': 971, 'loss/train': 7.0105485916137695} -08/30/2021 13:24:23 - INFO - __main__ - Step 973: {'lr': 0.000243, 'samples': 186816, 'steps': 972, 'loss/train': 5.990324020385742} -08/30/2021 13:24:24 - INFO - __main__ - Step 974: {'lr': 0.00024325, 'samples': 187008, 'steps': 973, 'loss/train': 4.93520975112915} -08/30/2021 13:24:25 - INFO - __main__ - Step 975: {'lr': 0.0002435, 'samples': 187200, 'steps': 974, 'loss/train': 4.439929485321045} -08/30/2021 13:24:25 - INFO - __main__ - Step 976: {'lr': 0.00024375, 'samples': 187392, 'steps': 975, 'loss/train': 5.595407962799072} -08/30/2021 13:24:25 - INFO - __main__ - Step 977: {'lr': 0.000244, 'samples': 187584, 'steps': 976, 'loss/train': 5.29143762588501} -08/30/2021 13:24:26 - INFO - __main__ - Step 978: {'lr': 0.00024425, 'samples': 187776, 'steps': 977, 'loss/train': 4.921665191650391} -08/30/2021 13:24:28 - INFO - __main__ - Step 979: {'lr': 0.0002445, 'samples': 187968, 'steps': 978, 'loss/train': 4.97409200668335} -08/30/2021 13:24:28 - INFO - __main__ - Step 980: {'lr': 0.00024475, 'samples': 188160, 'steps': 979, 'loss/train': 4.857159614562988} -08/30/2021 13:24:29 - INFO - __main__ - Step 981: {'lr': 0.000245, 'samples': 188352, 'steps': 980, 'loss/train': 5.116833209991455} -08/30/2021 13:24:29 - INFO - __main__ - Step 982: {'lr': 0.00024525, 'samples': 188544, 'steps': 981, 'loss/train': 5.800650119781494} -08/30/2021 13:24:29 - INFO - __main__ - Step 983: {'lr': 0.0002455, 'samples': 188736, 'steps': 982, 'loss/train': 4.4499077796936035} -08/30/2021 13:24:31 - INFO - __main__ - Step 984: {'lr': 0.00024575, 'samples': 188928, 'steps': 983, 'loss/train': 5.1292243003845215} -08/30/2021 13:24:32 - INFO - __main__ - Step 985: {'lr': 0.000246, 'samples': 189120, 'steps': 984, 'loss/train': 5.253803253173828} -08/30/2021 13:24:32 - INFO - __main__ - Step 986: {'lr': 0.00024625, 'samples': 189312, 'steps': 985, 'loss/train': 4.8171305656433105} -08/30/2021 13:24:32 - INFO - __main__ - Step 987: {'lr': 0.00024650000000000003, 'samples': 189504, 'steps': 986, 'loss/train': 4.849854469299316} -08/30/2021 13:24:33 - INFO - __main__ - Step 988: {'lr': 0.00024675, 'samples': 189696, 'steps': 987, 'loss/train': 4.776261806488037} -08/30/2021 13:24:34 - INFO - __main__ - Step 989: {'lr': 0.000247, 'samples': 189888, 'steps': 988, 'loss/train': 4.666213512420654} -08/30/2021 13:24:35 - INFO - __main__ - Step 990: {'lr': 0.00024725, 'samples': 190080, 'steps': 989, 'loss/train': 5.387469291687012} -08/30/2021 13:24:35 - INFO - __main__ - Step 991: {'lr': 0.0002475, 'samples': 190272, 'steps': 990, 'loss/train': 4.036428928375244} -08/30/2021 13:24:36 - INFO - __main__ - Step 992: {'lr': 0.00024775, 'samples': 190464, 'steps': 991, 'loss/train': 6.747364044189453} -08/30/2021 13:24:36 - INFO - __main__ - Step 993: {'lr': 0.000248, 'samples': 190656, 'steps': 992, 'loss/train': 6.409087181091309} -08/30/2021 13:24:36 - INFO - __main__ - Step 994: {'lr': 0.00024825, 'samples': 190848, 'steps': 993, 'loss/train': 4.653579235076904} -08/30/2021 13:24:37 - INFO - __main__ - Step 995: {'lr': 0.0002485, 'samples': 191040, 'steps': 994, 'loss/train': 5.695528984069824} -08/30/2021 13:24:38 - INFO - __main__ - Step 996: {'lr': 0.00024875, 'samples': 191232, 'steps': 995, 'loss/train': 4.943525314331055} -08/30/2021 13:24:39 - INFO - __main__ - Step 997: {'lr': 0.000249, 'samples': 191424, 'steps': 996, 'loss/train': 5.276374340057373} -08/30/2021 13:24:39 - INFO - __main__ - Step 998: {'lr': 0.00024925, 'samples': 191616, 'steps': 997, 'loss/train': 4.639342784881592} -08/30/2021 13:24:39 - INFO - __main__ - Step 999: {'lr': 0.0002495, 'samples': 191808, 'steps': 998, 'loss/train': 4.728384971618652} -08/30/2021 13:24:40 - INFO - __main__ - Step 1000: {'lr': 0.00024975, 'samples': 192000, 'steps': 999, 'loss/train': 4.859615325927734} -08/30/2021 13:24:41 - INFO - __main__ - Step 1001: {'lr': 0.00025, 'samples': 192192, 'steps': 1000, 'loss/train': 5.420141220092773} -08/30/2021 13:24:42 - INFO - __main__ - Step 1002: {'lr': 0.00025025, 'samples': 192384, 'steps': 1001, 'loss/train': 4.719789505004883} -08/30/2021 13:24:42 - INFO - __main__ - Step 1003: {'lr': 0.0002505, 'samples': 192576, 'steps': 1002, 'loss/train': 4.400145053863525} -08/30/2021 13:24:42 - INFO - __main__ - Step 1004: {'lr': 0.00025075, 'samples': 192768, 'steps': 1003, 'loss/train': 4.5933685302734375} -08/30/2021 13:24:43 - INFO - __main__ - Step 1005: {'lr': 0.00025100000000000003, 'samples': 192960, 'steps': 1004, 'loss/train': 4.682366847991943} -08/30/2021 13:24:44 - INFO - __main__ - Step 1006: {'lr': 0.00025124999999999995, 'samples': 193152, 'steps': 1005, 'loss/train': 4.802097797393799} -08/30/2021 13:24:45 - INFO - __main__ - Step 1007: {'lr': 0.0002515, 'samples': 193344, 'steps': 1006, 'loss/train': 4.660820007324219} -08/30/2021 13:24:45 - INFO - __main__ - Step 1008: {'lr': 0.00025174999999999997, 'samples': 193536, 'steps': 1007, 'loss/train': 4.959339618682861} -08/30/2021 13:24:46 - INFO - __main__ - Step 1009: {'lr': 0.000252, 'samples': 193728, 'steps': 1008, 'loss/train': 4.599143028259277} -08/30/2021 13:24:46 - INFO - __main__ - Step 1010: {'lr': 0.00025225, 'samples': 193920, 'steps': 1009, 'loss/train': 2.5530784130096436} -08/30/2021 13:24:46 - INFO - __main__ - Step 1011: {'lr': 0.0002525, 'samples': 194112, 'steps': 1010, 'loss/train': 4.39011812210083} -08/30/2021 13:24:48 - INFO - __main__ - Step 1012: {'lr': 0.00025275, 'samples': 194304, 'steps': 1011, 'loss/train': 5.429310321807861} -08/30/2021 13:24:48 - INFO - __main__ - Step 1013: {'lr': 0.000253, 'samples': 194496, 'steps': 1012, 'loss/train': 3.1441714763641357} -08/30/2021 13:24:49 - INFO - __main__ - Step 1014: {'lr': 0.00025325, 'samples': 194688, 'steps': 1013, 'loss/train': 4.4851179122924805} -08/30/2021 13:24:49 - INFO - __main__ - Step 1015: {'lr': 0.0002535, 'samples': 194880, 'steps': 1014, 'loss/train': 6.730905532836914} -08/30/2021 13:24:50 - INFO - __main__ - Step 1016: {'lr': 0.00025374999999999996, 'samples': 195072, 'steps': 1015, 'loss/train': 4.265136241912842} -08/30/2021 13:24:51 - INFO - __main__ - Step 1017: {'lr': 0.000254, 'samples': 195264, 'steps': 1016, 'loss/train': 5.068685531616211} -08/30/2021 13:24:52 - INFO - __main__ - Step 1018: {'lr': 0.00025425, 'samples': 195456, 'steps': 1017, 'loss/train': 5.1631855964660645} -08/30/2021 13:24:52 - INFO - __main__ - Step 1019: {'lr': 0.0002545, 'samples': 195648, 'steps': 1018, 'loss/train': 5.227428436279297} -08/30/2021 13:24:52 - INFO - __main__ - Step 1020: {'lr': 0.00025475, 'samples': 195840, 'steps': 1019, 'loss/train': 5.787811756134033} -08/30/2021 13:24:53 - INFO - __main__ - Step 1021: {'lr': 0.000255, 'samples': 196032, 'steps': 1020, 'loss/train': 4.167182922363281} -08/30/2021 13:24:54 - INFO - __main__ - Step 1022: {'lr': 0.00025525, 'samples': 196224, 'steps': 1021, 'loss/train': 4.919136047363281} -08/30/2021 13:24:55 - INFO - __main__ - Step 1023: {'lr': 0.00025550000000000003, 'samples': 196416, 'steps': 1022, 'loss/train': 5.054874420166016} -08/30/2021 13:24:55 - INFO - __main__ - Step 1024: {'lr': 0.00025575, 'samples': 196608, 'steps': 1023, 'loss/train': 5.161455154418945} -08/30/2021 13:24:55 - INFO - __main__ - Step 1025: {'lr': 0.000256, 'samples': 196800, 'steps': 1024, 'loss/train': 6.443774223327637} -08/30/2021 13:24:56 - INFO - __main__ - Step 1026: {'lr': 0.00025624999999999997, 'samples': 196992, 'steps': 1025, 'loss/train': 4.580659866333008} -08/30/2021 13:24:57 - INFO - __main__ - Step 1027: {'lr': 0.0002565, 'samples': 197184, 'steps': 1026, 'loss/train': 4.926455974578857} -08/30/2021 13:24:58 - INFO - __main__ - Step 1028: {'lr': 0.00025675, 'samples': 197376, 'steps': 1027, 'loss/train': 4.851318359375} -08/30/2021 13:24:58 - INFO - __main__ - Step 1029: {'lr': 0.000257, 'samples': 197568, 'steps': 1028, 'loss/train': 4.88503885269165} -08/30/2021 13:24:59 - INFO - __main__ - Step 1030: {'lr': 0.00025725, 'samples': 197760, 'steps': 1029, 'loss/train': 3.5910897254943848} -08/30/2021 13:24:59 - INFO - __main__ - Step 1031: {'lr': 0.0002575, 'samples': 197952, 'steps': 1030, 'loss/train': 5.1407999992370605} -08/30/2021 13:25:01 - INFO - __main__ - Step 1032: {'lr': 0.00025775, 'samples': 198144, 'steps': 1031, 'loss/train': 4.925992965698242} -08/30/2021 13:25:02 - INFO - __main__ - Step 1033: {'lr': 0.00025800000000000004, 'samples': 198336, 'steps': 1032, 'loss/train': 4.9896464347839355} -08/30/2021 13:25:02 - INFO - __main__ - Step 1034: {'lr': 0.00025824999999999996, 'samples': 198528, 'steps': 1033, 'loss/train': 5.108402729034424} -08/30/2021 13:25:02 - INFO - __main__ - Step 1035: {'lr': 0.0002585, 'samples': 198720, 'steps': 1034, 'loss/train': 4.846958637237549} -08/30/2021 13:25:03 - INFO - __main__ - Step 1036: {'lr': 0.00025875, 'samples': 198912, 'steps': 1035, 'loss/train': 5.197140216827393} -08/30/2021 13:25:03 - INFO - __main__ - Step 1037: {'lr': 0.000259, 'samples': 199104, 'steps': 1036, 'loss/train': 4.693840026855469} -08/30/2021 13:25:04 - INFO - __main__ - Step 1038: {'lr': 0.00025925, 'samples': 199296, 'steps': 1037, 'loss/train': 5.01608943939209} -08/30/2021 13:25:05 - INFO - __main__ - Step 1039: {'lr': 0.0002595, 'samples': 199488, 'steps': 1038, 'loss/train': 4.83984375} -08/30/2021 13:25:05 - INFO - __main__ - Step 1040: {'lr': 0.00025975, 'samples': 199680, 'steps': 1039, 'loss/train': 4.813290596008301} -08/30/2021 13:25:06 - INFO - __main__ - Step 1041: {'lr': 0.00026000000000000003, 'samples': 199872, 'steps': 1040, 'loss/train': 4.417173385620117} -08/30/2021 13:25:06 - INFO - __main__ - Step 1042: {'lr': 0.00026025, 'samples': 200064, 'steps': 1041, 'loss/train': 4.47005558013916} -08/30/2021 13:25:07 - INFO - __main__ - Step 1043: {'lr': 0.0002605, 'samples': 200256, 'steps': 1042, 'loss/train': 4.648036956787109} -08/30/2021 13:25:08 - INFO - __main__ - Step 1044: {'lr': 0.00026074999999999997, 'samples': 200448, 'steps': 1043, 'loss/train': 4.901439189910889} -08/30/2021 13:25:08 - INFO - __main__ - Step 1045: {'lr': 0.000261, 'samples': 200640, 'steps': 1044, 'loss/train': 4.551402568817139} -08/30/2021 13:25:09 - INFO - __main__ - Step 1046: {'lr': 0.00026125, 'samples': 200832, 'steps': 1045, 'loss/train': 5.28316593170166} -08/30/2021 13:25:09 - INFO - __main__ - Step 1047: {'lr': 0.0002615, 'samples': 201024, 'steps': 1046, 'loss/train': 4.648711681365967} -08/30/2021 13:25:11 - INFO - __main__ - Step 1048: {'lr': 0.00026175, 'samples': 201216, 'steps': 1047, 'loss/train': 5.267274379730225} -08/30/2021 13:25:11 - INFO - __main__ - Step 1049: {'lr': 0.000262, 'samples': 201408, 'steps': 1048, 'loss/train': 4.830605983734131} -08/30/2021 13:25:11 - INFO - __main__ - Step 1050: {'lr': 0.00026225, 'samples': 201600, 'steps': 1049, 'loss/train': 4.501389503479004} -08/30/2021 13:25:12 - INFO - __main__ - Step 1051: {'lr': 0.00026250000000000004, 'samples': 201792, 'steps': 1050, 'loss/train': 3.8279778957366943} -08/30/2021 13:25:12 - INFO - __main__ - Step 1052: {'lr': 0.00026274999999999996, 'samples': 201984, 'steps': 1051, 'loss/train': 4.429965019226074} -08/30/2021 13:25:14 - INFO - __main__ - Step 1053: {'lr': 0.000263, 'samples': 202176, 'steps': 1052, 'loss/train': 4.966457366943359} -08/30/2021 13:25:14 - INFO - __main__ - Step 1054: {'lr': 0.00026325, 'samples': 202368, 'steps': 1053, 'loss/train': 4.288132190704346} -08/30/2021 13:25:14 - INFO - __main__ - Step 1055: {'lr': 0.0002635, 'samples': 202560, 'steps': 1054, 'loss/train': 4.567619800567627} -08/30/2021 13:25:15 - INFO - __main__ - Step 1056: {'lr': 0.00026375, 'samples': 202752, 'steps': 1055, 'loss/train': 4.083355903625488} -08/30/2021 13:25:15 - INFO - __main__ - Step 1057: {'lr': 0.000264, 'samples': 202944, 'steps': 1056, 'loss/train': 4.958721160888672} -08/30/2021 13:25:16 - INFO - __main__ - Step 1058: {'lr': 0.00026425, 'samples': 203136, 'steps': 1057, 'loss/train': 5.07416296005249} -08/30/2021 13:25:17 - INFO - __main__ - Step 1059: {'lr': 0.00026450000000000003, 'samples': 203328, 'steps': 1058, 'loss/train': 4.9287543296813965} -08/30/2021 13:25:17 - INFO - __main__ - Step 1060: {'lr': 0.00026475, 'samples': 203520, 'steps': 1059, 'loss/train': 4.357052326202393} -08/30/2021 13:25:18 - INFO - __main__ - Step 1061: {'lr': 0.00026500000000000004, 'samples': 203712, 'steps': 1060, 'loss/train': 4.9349365234375} -08/30/2021 13:25:18 - INFO - __main__ - Step 1062: {'lr': 0.00026524999999999997, 'samples': 203904, 'steps': 1061, 'loss/train': 4.818123817443848} -08/30/2021 13:25:19 - INFO - __main__ - Step 1063: {'lr': 0.0002655, 'samples': 204096, 'steps': 1062, 'loss/train': 4.870808124542236} -08/30/2021 13:25:20 - INFO - __main__ - Step 1064: {'lr': 0.00026575, 'samples': 204288, 'steps': 1063, 'loss/train': 4.647601127624512} -08/30/2021 13:25:20 - INFO - __main__ - Step 1065: {'lr': 0.000266, 'samples': 204480, 'steps': 1064, 'loss/train': 3.552048444747925} -08/30/2021 13:25:21 - INFO - __main__ - Step 1066: {'lr': 0.00026625, 'samples': 204672, 'steps': 1065, 'loss/train': 4.389318943023682} -08/30/2021 13:25:21 - INFO - __main__ - Step 1067: {'lr': 0.0002665, 'samples': 204864, 'steps': 1066, 'loss/train': 4.931048393249512} -08/30/2021 13:25:23 - INFO - __main__ - Step 1068: {'lr': 0.00026675, 'samples': 205056, 'steps': 1067, 'loss/train': 3.999504327774048} -08/30/2021 13:25:23 - INFO - __main__ - Step 1069: {'lr': 0.00026700000000000004, 'samples': 205248, 'steps': 1068, 'loss/train': 5.582645893096924} -08/30/2021 13:25:23 - INFO - __main__ - Step 1070: {'lr': 0.00026725, 'samples': 205440, 'steps': 1069, 'loss/train': 5.052674770355225} -08/30/2021 13:25:24 - INFO - __main__ - Step 1071: {'lr': 0.0002675, 'samples': 205632, 'steps': 1070, 'loss/train': 5.009417533874512} -08/30/2021 13:25:24 - INFO - __main__ - Step 1072: {'lr': 0.00026775, 'samples': 205824, 'steps': 1071, 'loss/train': 4.371978282928467} -08/30/2021 13:25:26 - INFO - __main__ - Step 1073: {'lr': 0.000268, 'samples': 206016, 'steps': 1072, 'loss/train': 4.760138034820557} -08/30/2021 13:25:26 - INFO - __main__ - Step 1074: {'lr': 0.00026825, 'samples': 206208, 'steps': 1073, 'loss/train': 4.837433338165283} -08/30/2021 13:25:26 - INFO - __main__ - Step 1075: {'lr': 0.0002685, 'samples': 206400, 'steps': 1074, 'loss/train': 4.604000091552734} -08/30/2021 13:25:27 - INFO - __main__ - Step 1076: {'lr': 0.00026875, 'samples': 206592, 'steps': 1075, 'loss/train': 4.446019649505615} -08/30/2021 13:25:27 - INFO - __main__ - Step 1077: {'lr': 0.00026900000000000003, 'samples': 206784, 'steps': 1076, 'loss/train': 4.247913360595703} -08/30/2021 13:25:27 - INFO - __main__ - Step 1078: {'lr': 0.00026925, 'samples': 206976, 'steps': 1077, 'loss/train': 4.347595691680908} -08/30/2021 13:25:29 - INFO - __main__ - Step 1079: {'lr': 0.00026950000000000005, 'samples': 207168, 'steps': 1078, 'loss/train': 4.9044389724731445} -08/30/2021 13:25:29 - INFO - __main__ - Step 1080: {'lr': 0.00026974999999999997, 'samples': 207360, 'steps': 1079, 'loss/train': 4.687417507171631} -08/30/2021 13:25:30 - INFO - __main__ - Step 1081: {'lr': 0.00027, 'samples': 207552, 'steps': 1080, 'loss/train': 4.920577049255371} -08/30/2021 13:25:30 - INFO - __main__ - Step 1082: {'lr': 0.00027025, 'samples': 207744, 'steps': 1081, 'loss/train': 4.4795026779174805} -08/30/2021 13:25:30 - INFO - __main__ - Step 1083: {'lr': 0.0002705, 'samples': 207936, 'steps': 1082, 'loss/train': 4.78497314453125} -08/30/2021 13:25:32 - INFO - __main__ - Step 1084: {'lr': 0.00027075, 'samples': 208128, 'steps': 1083, 'loss/train': 4.856836318969727} -08/30/2021 13:25:32 - INFO - __main__ - Step 1085: {'lr': 0.00027100000000000003, 'samples': 208320, 'steps': 1084, 'loss/train': 2.3175480365753174} -08/30/2021 13:25:33 - INFO - __main__ - Step 1086: {'lr': 0.00027125, 'samples': 208512, 'steps': 1085, 'loss/train': 4.838772773742676} -08/30/2021 13:25:33 - INFO - __main__ - Step 1087: {'lr': 0.00027150000000000004, 'samples': 208704, 'steps': 1086, 'loss/train': 4.821920871734619} -08/30/2021 13:25:33 - INFO - __main__ - Step 1088: {'lr': 0.00027175, 'samples': 208896, 'steps': 1087, 'loss/train': 4.47393274307251} -08/30/2021 13:25:36 - INFO - __main__ - Step 1089: {'lr': 0.00027200000000000005, 'samples': 209088, 'steps': 1088, 'loss/train': 5.056207656860352} -08/30/2021 13:25:36 - INFO - __main__ - Step 1090: {'lr': 0.00027225, 'samples': 209280, 'steps': 1089, 'loss/train': 4.7649970054626465} -08/30/2021 13:25:36 - INFO - __main__ - Step 1091: {'lr': 0.0002725, 'samples': 209472, 'steps': 1090, 'loss/train': 4.859498977661133} -08/30/2021 13:25:37 - INFO - __main__ - Step 1092: {'lr': 0.00027275, 'samples': 209664, 'steps': 1091, 'loss/train': 4.725033760070801} -08/30/2021 13:25:37 - INFO - __main__ - Step 1093: {'lr': 0.000273, 'samples': 209856, 'steps': 1092, 'loss/train': 4.648543357849121} -08/30/2021 13:25:38 - INFO - __main__ - Step 1094: {'lr': 0.00027325, 'samples': 210048, 'steps': 1093, 'loss/train': 4.039570331573486} -08/30/2021 13:25:39 - INFO - __main__ - Step 1095: {'lr': 0.00027350000000000003, 'samples': 210240, 'steps': 1094, 'loss/train': 4.392956256866455} -08/30/2021 13:25:39 - INFO - __main__ - Step 1096: {'lr': 0.00027375, 'samples': 210432, 'steps': 1095, 'loss/train': 4.70611047744751} -08/30/2021 13:25:40 - INFO - __main__ - Step 1097: {'lr': 0.00027400000000000005, 'samples': 210624, 'steps': 1096, 'loss/train': 5.329628944396973} -08/30/2021 13:25:40 - INFO - __main__ - Step 1098: {'lr': 0.00027425, 'samples': 210816, 'steps': 1097, 'loss/train': 4.339066505432129} -08/30/2021 13:25:42 - INFO - __main__ - Step 1099: {'lr': 0.0002745, 'samples': 211008, 'steps': 1098, 'loss/train': 4.041830539703369} -08/30/2021 13:25:42 - INFO - __main__ - Step 1100: {'lr': 0.00027475, 'samples': 211200, 'steps': 1099, 'loss/train': 4.83737850189209} -08/30/2021 13:25:43 - INFO - __main__ - Step 1101: {'lr': 0.000275, 'samples': 211392, 'steps': 1100, 'loss/train': 4.446187496185303} -08/30/2021 13:25:43 - INFO - __main__ - Step 1102: {'lr': 0.00027525, 'samples': 211584, 'steps': 1101, 'loss/train': 4.877076148986816} -08/30/2021 13:25:43 - INFO - __main__ - Step 1103: {'lr': 0.00027550000000000003, 'samples': 211776, 'steps': 1102, 'loss/train': 4.218622207641602} -08/30/2021 13:25:45 - INFO - __main__ - Step 1104: {'lr': 0.00027575, 'samples': 211968, 'steps': 1103, 'loss/train': 5.401310443878174} -08/30/2021 13:25:45 - INFO - __main__ - Step 1105: {'lr': 0.00027600000000000004, 'samples': 212160, 'steps': 1104, 'loss/train': 4.578069686889648} -08/30/2021 13:25:46 - INFO - __main__ - Step 1106: {'lr': 0.00027625, 'samples': 212352, 'steps': 1105, 'loss/train': 4.28236198425293} -08/30/2021 13:25:46 - INFO - __main__ - Step 1107: {'lr': 0.00027650000000000005, 'samples': 212544, 'steps': 1106, 'loss/train': 1.6180003881454468} -08/30/2021 13:25:46 - INFO - __main__ - Step 1108: {'lr': 0.00027675, 'samples': 212736, 'steps': 1107, 'loss/train': 4.664124011993408} -08/30/2021 13:25:48 - INFO - __main__ - Step 1109: {'lr': 0.000277, 'samples': 212928, 'steps': 1108, 'loss/train': 4.81748104095459} -08/30/2021 13:25:48 - INFO - __main__ - Step 1110: {'lr': 0.00027725, 'samples': 213120, 'steps': 1109, 'loss/train': 4.777357578277588} -08/30/2021 13:25:49 - INFO - __main__ - Step 1111: {'lr': 0.0002775, 'samples': 213312, 'steps': 1110, 'loss/train': 5.144052982330322} -08/30/2021 13:25:49 - INFO - __main__ - Step 1112: {'lr': 0.00027775, 'samples': 213504, 'steps': 1111, 'loss/train': 5.010110378265381} -08/30/2021 13:25:49 - INFO - __main__ - Step 1113: {'lr': 0.00027800000000000004, 'samples': 213696, 'steps': 1112, 'loss/train': 4.681898593902588} -08/30/2021 13:25:51 - INFO - __main__ - Step 1114: {'lr': 0.00027825, 'samples': 213888, 'steps': 1113, 'loss/train': 4.8639960289001465} -08/30/2021 13:25:51 - INFO - __main__ - Step 1115: {'lr': 0.00027850000000000005, 'samples': 214080, 'steps': 1114, 'loss/train': 4.909400939941406} -08/30/2021 13:25:52 - INFO - __main__ - Step 1116: {'lr': 0.00027875, 'samples': 214272, 'steps': 1115, 'loss/train': 4.448228359222412} -08/30/2021 13:25:52 - INFO - __main__ - Step 1117: {'lr': 0.000279, 'samples': 214464, 'steps': 1116, 'loss/train': 4.7131147384643555} -08/30/2021 13:25:52 - INFO - __main__ - Step 1118: {'lr': 0.00027925, 'samples': 214656, 'steps': 1117, 'loss/train': 4.465978622436523} -08/30/2021 13:25:53 - INFO - __main__ - Step 1119: {'lr': 0.0002795, 'samples': 214848, 'steps': 1118, 'loss/train': 4.741469860076904} -08/30/2021 13:25:54 - INFO - __main__ - Step 1120: {'lr': 0.00027975, 'samples': 215040, 'steps': 1119, 'loss/train': 3.005525827407837} -08/30/2021 13:25:55 - INFO - __main__ - Step 1121: {'lr': 0.00028000000000000003, 'samples': 215232, 'steps': 1120, 'loss/train': 4.87128210067749} -08/30/2021 13:25:55 - INFO - __main__ - Step 1122: {'lr': 0.00028025, 'samples': 215424, 'steps': 1121, 'loss/train': 4.876620292663574} -08/30/2021 13:25:55 - INFO - __main__ - Step 1123: {'lr': 0.00028050000000000004, 'samples': 215616, 'steps': 1122, 'loss/train': 4.7476487159729} -08/30/2021 13:25:56 - INFO - __main__ - Step 1124: {'lr': 0.00028075, 'samples': 215808, 'steps': 1123, 'loss/train': 4.4817633628845215} -08/30/2021 13:25:57 - INFO - __main__ - Step 1125: {'lr': 0.00028100000000000005, 'samples': 216000, 'steps': 1124, 'loss/train': 4.958332061767578} -08/30/2021 13:25:58 - INFO - __main__ - Step 1126: {'lr': 0.00028125000000000003, 'samples': 216192, 'steps': 1125, 'loss/train': 5.6920390129089355} -08/30/2021 13:25:58 - INFO - __main__ - Step 1127: {'lr': 0.00028149999999999996, 'samples': 216384, 'steps': 1126, 'loss/train': 4.852529048919678} -08/30/2021 13:25:58 - INFO - __main__ - Step 1128: {'lr': 0.00028175, 'samples': 216576, 'steps': 1127, 'loss/train': 5.391927242279053} -08/30/2021 13:25:59 - INFO - __main__ - Step 1129: {'lr': 0.00028199999999999997, 'samples': 216768, 'steps': 1128, 'loss/train': 4.675811767578125} -08/30/2021 13:26:00 - INFO - __main__ - Step 1130: {'lr': 0.00028225, 'samples': 216960, 'steps': 1129, 'loss/train': 4.625685214996338} -08/30/2021 13:26:01 - INFO - __main__ - Step 1131: {'lr': 0.0002825, 'samples': 217152, 'steps': 1130, 'loss/train': 4.073273181915283} -08/30/2021 13:26:01 - INFO - __main__ - Step 1132: {'lr': 0.00028275, 'samples': 217344, 'steps': 1131, 'loss/train': 4.4050397872924805} -08/30/2021 13:26:01 - INFO - __main__ - Step 1133: {'lr': 0.000283, 'samples': 217536, 'steps': 1132, 'loss/train': 4.553639888763428} -08/30/2021 13:26:02 - INFO - __main__ - Step 1134: {'lr': 0.00028325000000000003, 'samples': 217728, 'steps': 1133, 'loss/train': 3.735881805419922} -08/30/2021 13:26:03 - INFO - __main__ - Step 1135: {'lr': 0.0002835, 'samples': 217920, 'steps': 1134, 'loss/train': 5.083900451660156} -08/30/2021 13:26:04 - INFO - __main__ - Step 1136: {'lr': 0.00028375, 'samples': 218112, 'steps': 1135, 'loss/train': 4.858189105987549} -08/30/2021 13:26:04 - INFO - __main__ - Step 1137: {'lr': 0.00028399999999999996, 'samples': 218304, 'steps': 1136, 'loss/train': 4.526271820068359} -08/30/2021 13:26:04 - INFO - __main__ - Step 1138: {'lr': 0.00028425, 'samples': 218496, 'steps': 1137, 'loss/train': 4.845973968505859} -08/30/2021 13:26:05 - INFO - __main__ - Step 1139: {'lr': 0.0002845, 'samples': 218688, 'steps': 1138, 'loss/train': 4.050032615661621} -08/30/2021 13:26:05 - INFO - __main__ - Step 1140: {'lr': 0.00028475, 'samples': 218880, 'steps': 1139, 'loss/train': 5.131923198699951} -08/30/2021 13:26:07 - INFO - __main__ - Step 1141: {'lr': 0.000285, 'samples': 219072, 'steps': 1140, 'loss/train': 4.84916877746582} -08/30/2021 13:26:08 - INFO - __main__ - Step 1142: {'lr': 0.00028525, 'samples': 219264, 'steps': 1141, 'loss/train': 4.465821743011475} -08/30/2021 13:26:08 - INFO - __main__ - Step 1143: {'lr': 0.0002855, 'samples': 219456, 'steps': 1142, 'loss/train': 4.294210910797119} -08/30/2021 13:26:08 - INFO - __main__ - Step 1144: {'lr': 0.00028575000000000003, 'samples': 219648, 'steps': 1143, 'loss/train': 4.31614875793457} -08/30/2021 13:26:09 - INFO - __main__ - Step 1145: {'lr': 0.00028599999999999996, 'samples': 219840, 'steps': 1144, 'loss/train': 4.901950359344482} -08/30/2021 13:26:10 - INFO - __main__ - Step 1146: {'lr': 0.00028625, 'samples': 220032, 'steps': 1145, 'loss/train': 4.419631004333496} -08/30/2021 13:26:11 - INFO - __main__ - Step 1147: {'lr': 0.00028649999999999997, 'samples': 220224, 'steps': 1146, 'loss/train': 5.121374607086182} -08/30/2021 13:26:11 - INFO - __main__ - Step 1148: {'lr': 0.00028675, 'samples': 220416, 'steps': 1147, 'loss/train': 4.64249324798584} -08/30/2021 13:26:11 - INFO - __main__ - Step 1149: {'lr': 0.000287, 'samples': 220608, 'steps': 1148, 'loss/train': 4.029555320739746} -08/30/2021 13:26:12 - INFO - __main__ - Step 1150: {'lr': 0.00028725, 'samples': 220800, 'steps': 1149, 'loss/train': 3.603362798690796} -08/30/2021 13:26:13 - INFO - __main__ - Step 1151: {'lr': 0.0002875, 'samples': 220992, 'steps': 1150, 'loss/train': 4.238906383514404} -08/30/2021 13:26:14 - INFO - __main__ - Step 1152: {'lr': 0.00028775000000000003, 'samples': 221184, 'steps': 1151, 'loss/train': 4.948597431182861} -08/30/2021 13:26:14 - INFO - __main__ - Step 1153: {'lr': 0.000288, 'samples': 221376, 'steps': 1152, 'loss/train': 4.241683006286621} -08/30/2021 13:26:15 - INFO - __main__ - Step 1154: {'lr': 0.00028825, 'samples': 221568, 'steps': 1153, 'loss/train': 4.642980098724365} -08/30/2021 13:26:15 - INFO - __main__ - Step 1155: {'lr': 0.00028849999999999997, 'samples': 221760, 'steps': 1154, 'loss/train': 4.6034393310546875} -08/30/2021 13:26:15 - INFO - __main__ - Step 1156: {'lr': 0.00028875, 'samples': 221952, 'steps': 1155, 'loss/train': 4.561765670776367} -08/30/2021 13:26:17 - INFO - __main__ - Step 1157: {'lr': 0.000289, 'samples': 222144, 'steps': 1156, 'loss/train': 5.744253158569336} -08/30/2021 13:26:17 - INFO - __main__ - Step 1158: {'lr': 0.00028925, 'samples': 222336, 'steps': 1157, 'loss/train': 5.428072929382324} -08/30/2021 13:26:18 - INFO - __main__ - Step 1159: {'lr': 0.0002895, 'samples': 222528, 'steps': 1158, 'loss/train': 4.342047691345215} -08/30/2021 13:26:18 - INFO - __main__ - Step 1160: {'lr': 0.00028975, 'samples': 222720, 'steps': 1159, 'loss/train': 4.6265668869018555} -08/30/2021 13:26:18 - INFO - __main__ - Step 1161: {'lr': 0.00029, 'samples': 222912, 'steps': 1160, 'loss/train': 4.878502368927002} -08/30/2021 13:26:20 - INFO - __main__ - Step 1162: {'lr': 0.00029025000000000003, 'samples': 223104, 'steps': 1161, 'loss/train': 3.7984821796417236} -08/30/2021 13:26:20 - INFO - __main__ - Step 1163: {'lr': 0.00029049999999999996, 'samples': 223296, 'steps': 1162, 'loss/train': 1.8246033191680908} -08/30/2021 13:26:21 - INFO - __main__ - Step 1164: {'lr': 0.00029075, 'samples': 223488, 'steps': 1163, 'loss/train': 4.839077949523926} -08/30/2021 13:26:21 - INFO - __main__ - Step 1165: {'lr': 0.00029099999999999997, 'samples': 223680, 'steps': 1164, 'loss/train': 2.739114284515381} -08/30/2021 13:26:21 - INFO - __main__ - Step 1166: {'lr': 0.00029125, 'samples': 223872, 'steps': 1165, 'loss/train': 4.731240749359131} -08/30/2021 13:26:23 - INFO - __main__ - Step 1167: {'lr': 0.0002915, 'samples': 224064, 'steps': 1166, 'loss/train': 4.460262298583984} -08/30/2021 13:26:23 - INFO - __main__ - Step 1168: {'lr': 0.00029175, 'samples': 224256, 'steps': 1167, 'loss/train': 6.072906494140625} -08/30/2021 13:26:24 - INFO - __main__ - Step 1169: {'lr': 0.000292, 'samples': 224448, 'steps': 1168, 'loss/train': 4.812139987945557} -08/30/2021 13:26:24 - INFO - __main__ - Step 1170: {'lr': 0.00029225000000000003, 'samples': 224640, 'steps': 1169, 'loss/train': 4.564539909362793} -08/30/2021 13:26:24 - INFO - __main__ - Step 1171: {'lr': 0.0002925, 'samples': 224832, 'steps': 1170, 'loss/train': 5.155861854553223} -08/30/2021 13:26:26 - INFO - __main__ - Step 1172: {'lr': 0.00029275000000000004, 'samples': 225024, 'steps': 1171, 'loss/train': 4.882957458496094} -08/30/2021 13:26:27 - INFO - __main__ - Step 1173: {'lr': 0.00029299999999999997, 'samples': 225216, 'steps': 1172, 'loss/train': 3.6840343475341797} -08/30/2021 13:26:27 - INFO - __main__ - Step 1174: {'lr': 0.00029325, 'samples': 225408, 'steps': 1173, 'loss/train': 4.6220383644104} -08/30/2021 13:26:27 - INFO - __main__ - Step 1175: {'lr': 0.0002935, 'samples': 225600, 'steps': 1174, 'loss/train': 4.422476291656494} -08/30/2021 13:26:28 - INFO - __main__ - Step 1176: {'lr': 0.00029375, 'samples': 225792, 'steps': 1175, 'loss/train': 4.572627544403076} -08/30/2021 13:26:29 - INFO - __main__ - Step 1177: {'lr': 0.000294, 'samples': 225984, 'steps': 1176, 'loss/train': 4.542801856994629} -08/30/2021 13:26:30 - INFO - __main__ - Step 1178: {'lr': 0.00029425, 'samples': 226176, 'steps': 1177, 'loss/train': 5.249860763549805} -08/30/2021 13:26:30 - INFO - __main__ - Step 1179: {'lr': 0.0002945, 'samples': 226368, 'steps': 1178, 'loss/train': 5.008918762207031} -08/30/2021 13:26:30 - INFO - __main__ - Step 1180: {'lr': 0.00029475000000000004, 'samples': 226560, 'steps': 1179, 'loss/train': 4.455695629119873} -08/30/2021 13:26:31 - INFO - __main__ - Step 1181: {'lr': 0.000295, 'samples': 226752, 'steps': 1180, 'loss/train': 2.9186155796051025} -08/30/2021 13:26:33 - INFO - __main__ - Step 1182: {'lr': 0.00029525, 'samples': 226944, 'steps': 1181, 'loss/train': 4.856095790863037} -08/30/2021 13:26:33 - INFO - __main__ - Step 1183: {'lr': 0.00029549999999999997, 'samples': 227136, 'steps': 1182, 'loss/train': 4.697263240814209} -08/30/2021 13:26:33 - INFO - __main__ - Step 1184: {'lr': 0.00029575, 'samples': 227328, 'steps': 1183, 'loss/train': 4.650768280029297} -08/30/2021 13:26:34 - INFO - __main__ - Step 1185: {'lr': 0.000296, 'samples': 227520, 'steps': 1184, 'loss/train': 3.7115986347198486} -08/30/2021 13:26:34 - INFO - __main__ - Step 1186: {'lr': 0.00029625, 'samples': 227712, 'steps': 1185, 'loss/train': 2.548330545425415} -08/30/2021 13:26:34 - INFO - __main__ - Step 1187: {'lr': 0.0002965, 'samples': 227904, 'steps': 1186, 'loss/train': 2.445172071456909} -08/30/2021 13:26:36 - INFO - __main__ - Step 1188: {'lr': 0.00029675000000000003, 'samples': 228096, 'steps': 1187, 'loss/train': 5.328794956207275} -08/30/2021 13:26:36 - INFO - __main__ - Step 1189: {'lr': 0.000297, 'samples': 228288, 'steps': 1188, 'loss/train': 4.762747287750244} -08/30/2021 13:26:37 - INFO - __main__ - Step 1190: {'lr': 0.00029725000000000004, 'samples': 228480, 'steps': 1189, 'loss/train': 4.807939052581787} -08/30/2021 13:26:37 - INFO - __main__ - Step 1191: {'lr': 0.00029749999999999997, 'samples': 228672, 'steps': 1190, 'loss/train': 4.6072187423706055} -08/30/2021 13:26:37 - INFO - __main__ - Step 1192: {'lr': 0.00029775, 'samples': 228864, 'steps': 1191, 'loss/train': 4.544644832611084} -08/30/2021 13:26:40 - INFO - __main__ - Step 1193: {'lr': 0.000298, 'samples': 229056, 'steps': 1192, 'loss/train': 4.550241470336914} -08/30/2021 13:26:40 - INFO - __main__ - Step 1194: {'lr': 0.00029825, 'samples': 229248, 'steps': 1193, 'loss/train': 6.383086204528809} -08/30/2021 13:26:41 - INFO - __main__ - Step 1195: {'lr': 0.0002985, 'samples': 229440, 'steps': 1194, 'loss/train': 3.5256423950195312} -08/30/2021 13:26:41 - INFO - __main__ - Step 1196: {'lr': 0.00029875, 'samples': 229632, 'steps': 1195, 'loss/train': 4.381834506988525} -08/30/2021 13:26:41 - INFO - __main__ - Step 1197: {'lr': 0.000299, 'samples': 229824, 'steps': 1196, 'loss/train': 4.199514865875244} -08/30/2021 13:26:42 - INFO - __main__ - Step 1198: {'lr': 0.00029925000000000004, 'samples': 230016, 'steps': 1197, 'loss/train': 4.502466201782227} -08/30/2021 13:26:43 - INFO - __main__ - Step 1199: {'lr': 0.0002995, 'samples': 230208, 'steps': 1198, 'loss/train': 4.6133036613464355} -08/30/2021 13:26:44 - INFO - __main__ - Step 1200: {'lr': 0.00029975000000000005, 'samples': 230400, 'steps': 1199, 'loss/train': 5.174978256225586} -08/30/2021 13:26:44 - INFO - __main__ - Step 1201: {'lr': 0.0003, 'samples': 230592, 'steps': 1200, 'loss/train': 4.766360282897949} -08/30/2021 13:26:44 - INFO - __main__ - Step 1202: {'lr': 0.00030025, 'samples': 230784, 'steps': 1201, 'loss/train': 4.671626091003418} -08/30/2021 13:26:45 - INFO - __main__ - Step 1203: {'lr': 0.0003005, 'samples': 230976, 'steps': 1202, 'loss/train': 4.615602970123291} -08/30/2021 13:26:46 - INFO - __main__ - Step 1204: {'lr': 0.00030075, 'samples': 231168, 'steps': 1203, 'loss/train': 4.681416988372803} -08/30/2021 13:26:47 - INFO - __main__ - Step 1205: {'lr': 0.000301, 'samples': 231360, 'steps': 1204, 'loss/train': 4.479160785675049} -08/30/2021 13:26:47 - INFO - __main__ - Step 1206: {'lr': 0.00030125000000000003, 'samples': 231552, 'steps': 1205, 'loss/train': 4.991608142852783} -08/30/2021 13:26:47 - INFO - __main__ - Step 1207: {'lr': 0.0003015, 'samples': 231744, 'steps': 1206, 'loss/train': 4.851442813873291} -08/30/2021 13:26:48 - INFO - __main__ - Step 1208: {'lr': 0.00030175000000000004, 'samples': 231936, 'steps': 1207, 'loss/train': 4.640334606170654} -08/30/2021 13:26:49 - INFO - __main__ - Step 1209: {'lr': 0.000302, 'samples': 232128, 'steps': 1208, 'loss/train': 5.395857334136963} -08/30/2021 13:26:49 - INFO - __main__ - Step 1210: {'lr': 0.00030225, 'samples': 232320, 'steps': 1209, 'loss/train': 4.886153221130371} -08/30/2021 13:26:50 - INFO - __main__ - Step 1211: {'lr': 0.0003025, 'samples': 232512, 'steps': 1210, 'loss/train': 5.126450538635254} -08/30/2021 13:26:50 - INFO - __main__ - Step 1212: {'lr': 0.00030275, 'samples': 232704, 'steps': 1211, 'loss/train': 4.263417720794678} -08/30/2021 13:26:51 - INFO - __main__ - Step 1213: {'lr': 0.000303, 'samples': 232896, 'steps': 1212, 'loss/train': 4.8280348777771} -08/30/2021 13:26:52 - INFO - __main__ - Step 1214: {'lr': 0.00030325, 'samples': 233088, 'steps': 1213, 'loss/train': 3.6417994499206543} -08/30/2021 13:26:53 - INFO - __main__ - Step 1215: {'lr': 0.0003035, 'samples': 233280, 'steps': 1214, 'loss/train': 4.839969635009766} -08/30/2021 13:26:53 - INFO - __main__ - Step 1216: {'lr': 0.00030375000000000004, 'samples': 233472, 'steps': 1215, 'loss/train': 4.414170265197754} -08/30/2021 13:26:53 - INFO - __main__ - Step 1217: {'lr': 0.000304, 'samples': 233664, 'steps': 1216, 'loss/train': 5.36515474319458} -08/30/2021 13:26:54 - INFO - __main__ - Step 1218: {'lr': 0.00030425000000000005, 'samples': 233856, 'steps': 1217, 'loss/train': 4.983379364013672} -08/30/2021 13:26:55 - INFO - __main__ - Step 1219: {'lr': 0.0003045, 'samples': 234048, 'steps': 1218, 'loss/train': 4.838827133178711} -08/30/2021 13:26:56 - INFO - __main__ - Step 1220: {'lr': 0.00030475, 'samples': 234240, 'steps': 1219, 'loss/train': 4.412363052368164} -08/30/2021 13:26:56 - INFO - __main__ - Step 1221: {'lr': 0.000305, 'samples': 234432, 'steps': 1220, 'loss/train': 4.714923858642578} -08/30/2021 13:26:56 - INFO - __main__ - Step 1222: {'lr': 0.00030525, 'samples': 234624, 'steps': 1221, 'loss/train': 3.9077796936035156} -08/30/2021 13:26:57 - INFO - __main__ - Step 1223: {'lr': 0.0003055, 'samples': 234816, 'steps': 1222, 'loss/train': 4.756908416748047} -08/30/2021 13:26:58 - INFO - __main__ - Step 1224: {'lr': 0.00030575000000000003, 'samples': 235008, 'steps': 1223, 'loss/train': 4.987254619598389} -08/30/2021 13:26:59 - INFO - __main__ - Step 1225: {'lr': 0.000306, 'samples': 235200, 'steps': 1224, 'loss/train': 4.241818428039551} -08/30/2021 13:26:59 - INFO - __main__ - Step 1226: {'lr': 0.00030625000000000004, 'samples': 235392, 'steps': 1225, 'loss/train': 4.861268043518066} -08/30/2021 13:26:59 - INFO - __main__ - Step 1227: {'lr': 0.0003065, 'samples': 235584, 'steps': 1226, 'loss/train': 4.192913055419922} -08/30/2021 13:27:00 - INFO - __main__ - Step 1228: {'lr': 0.00030675, 'samples': 235776, 'steps': 1227, 'loss/train': 4.0988993644714355} -08/30/2021 13:27:00 - INFO - __main__ - Step 1229: {'lr': 0.000307, 'samples': 235968, 'steps': 1228, 'loss/train': 4.682774543762207} -08/30/2021 13:27:01 - INFO - __main__ - Step 1230: {'lr': 0.00030725, 'samples': 236160, 'steps': 1229, 'loss/train': 5.342475414276123} -08/30/2021 13:27:02 - INFO - __main__ - Step 1231: {'lr': 0.0003075, 'samples': 236352, 'steps': 1230, 'loss/train': 4.609219551086426} -08/30/2021 13:27:02 - INFO - __main__ - Step 1232: {'lr': 0.00030775, 'samples': 236544, 'steps': 1231, 'loss/train': 4.775742530822754} -08/30/2021 13:27:03 - INFO - __main__ - Step 1233: {'lr': 0.000308, 'samples': 236736, 'steps': 1232, 'loss/train': 4.936896324157715} -08/30/2021 13:27:03 - INFO - __main__ - Step 1234: {'lr': 0.00030825000000000004, 'samples': 236928, 'steps': 1233, 'loss/train': 4.298108100891113} -08/30/2021 13:27:04 - INFO - __main__ - Step 1235: {'lr': 0.0003085, 'samples': 237120, 'steps': 1234, 'loss/train': 4.250104904174805} -08/30/2021 13:27:05 - INFO - __main__ - Step 1236: {'lr': 0.00030875000000000005, 'samples': 237312, 'steps': 1235, 'loss/train': 1.9314104318618774} -08/30/2021 13:27:05 - INFO - __main__ - Step 1237: {'lr': 0.00030900000000000003, 'samples': 237504, 'steps': 1236, 'loss/train': 4.494245529174805} -08/30/2021 13:27:06 - INFO - __main__ - Step 1238: {'lr': 0.00030925, 'samples': 237696, 'steps': 1237, 'loss/train': 4.776963233947754} -08/30/2021 13:27:06 - INFO - __main__ - Step 1239: {'lr': 0.0003095, 'samples': 237888, 'steps': 1238, 'loss/train': 4.345894813537598} -08/30/2021 13:27:07 - INFO - __main__ - Step 1240: {'lr': 0.00030975, 'samples': 238080, 'steps': 1239, 'loss/train': 5.152431488037109} -08/30/2021 13:27:08 - INFO - __main__ - Step 1241: {'lr': 0.00031, 'samples': 238272, 'steps': 1240, 'loss/train': 4.401095867156982} -08/30/2021 13:27:08 - INFO - __main__ - Step 1242: {'lr': 0.00031025000000000003, 'samples': 238464, 'steps': 1241, 'loss/train': 4.679511070251465} -08/30/2021 13:27:09 - INFO - __main__ - Step 1243: {'lr': 0.0003105, 'samples': 238656, 'steps': 1242, 'loss/train': 4.977512359619141} -08/30/2021 13:27:09 - INFO - __main__ - Step 1244: {'lr': 0.00031075000000000005, 'samples': 238848, 'steps': 1243, 'loss/train': 4.606505870819092} -08/30/2021 13:27:10 - INFO - __main__ - Step 1245: {'lr': 0.000311, 'samples': 239040, 'steps': 1244, 'loss/train': 4.016382694244385} -08/30/2021 13:27:11 - INFO - __main__ - Step 1246: {'lr': 0.00031125000000000006, 'samples': 239232, 'steps': 1245, 'loss/train': 4.495089054107666} -08/30/2021 13:27:11 - INFO - __main__ - Step 1247: {'lr': 0.0003115, 'samples': 239424, 'steps': 1246, 'loss/train': 4.898197174072266} -08/30/2021 13:27:12 - INFO - __main__ - Step 1248: {'lr': 0.00031175, 'samples': 239616, 'steps': 1247, 'loss/train': 4.841574668884277} -08/30/2021 13:27:12 - INFO - __main__ - Step 1249: {'lr': 0.000312, 'samples': 239808, 'steps': 1248, 'loss/train': 4.659887790679932} -08/30/2021 13:27:14 - INFO - __main__ - Step 1250: {'lr': 0.00031225000000000003, 'samples': 240000, 'steps': 1249, 'loss/train': 4.44929313659668} -08/30/2021 13:27:14 - INFO - __main__ - Step 1251: {'lr': 0.0003125, 'samples': 240192, 'steps': 1250, 'loss/train': 3.747215747833252} -08/30/2021 13:27:15 - INFO - __main__ - Step 1252: {'lr': 0.00031275, 'samples': 240384, 'steps': 1251, 'loss/train': 4.292858600616455} -08/30/2021 13:27:15 - INFO - __main__ - Step 1253: {'lr': 0.000313, 'samples': 240576, 'steps': 1252, 'loss/train': 4.516558647155762} -08/30/2021 13:27:15 - INFO - __main__ - Step 1254: {'lr': 0.00031325, 'samples': 240768, 'steps': 1253, 'loss/train': 4.808173179626465} -08/30/2021 13:27:17 - INFO - __main__ - Step 1255: {'lr': 0.00031350000000000003, 'samples': 240960, 'steps': 1254, 'loss/train': 4.414249420166016} -08/30/2021 13:27:17 - INFO - __main__ - Step 1256: {'lr': 0.00031374999999999996, 'samples': 241152, 'steps': 1255, 'loss/train': 4.453027725219727} -08/30/2021 13:27:18 - INFO - __main__ - Step 1257: {'lr': 0.000314, 'samples': 241344, 'steps': 1256, 'loss/train': 5.009148597717285} -08/30/2021 13:27:18 - INFO - __main__ - Step 1258: {'lr': 0.00031424999999999997, 'samples': 241536, 'steps': 1257, 'loss/train': 3.922722339630127} -08/30/2021 13:27:18 - INFO - __main__ - Step 1259: {'lr': 0.0003145, 'samples': 241728, 'steps': 1258, 'loss/train': 4.6702423095703125} -08/30/2021 13:27:19 - INFO - __main__ - Step 1260: {'lr': 0.00031475, 'samples': 241920, 'steps': 1259, 'loss/train': 4.826611518859863} -08/30/2021 13:27:20 - INFO - __main__ - Step 1261: {'lr': 0.000315, 'samples': 242112, 'steps': 1260, 'loss/train': 5.18397331237793} -08/30/2021 13:27:21 - INFO - __main__ - Step 1262: {'lr': 0.00031525, 'samples': 242304, 'steps': 1261, 'loss/train': 4.696173191070557} -08/30/2021 13:27:21 - INFO - __main__ - Step 1263: {'lr': 0.0003155, 'samples': 242496, 'steps': 1262, 'loss/train': 4.818138122558594} -08/30/2021 13:27:21 - INFO - __main__ - Step 1264: {'lr': 0.00031575, 'samples': 242688, 'steps': 1263, 'loss/train': 5.506348133087158} -08/30/2021 13:27:22 - INFO - __main__ - Step 1265: {'lr': 0.000316, 'samples': 242880, 'steps': 1264, 'loss/train': 4.260590553283691} -08/30/2021 13:27:23 - INFO - __main__ - Step 1266: {'lr': 0.00031624999999999996, 'samples': 243072, 'steps': 1265, 'loss/train': 4.641239643096924} -08/30/2021 13:27:24 - INFO - __main__ - Step 1267: {'lr': 0.0003165, 'samples': 243264, 'steps': 1266, 'loss/train': 4.229900360107422} -08/30/2021 13:27:24 - INFO - __main__ - Step 1268: {'lr': 0.00031675, 'samples': 243456, 'steps': 1267, 'loss/train': 4.410894393920898} -08/30/2021 13:27:24 - INFO - __main__ - Step 1269: {'lr': 0.000317, 'samples': 243648, 'steps': 1268, 'loss/train': 4.6991496086120605} -08/30/2021 13:27:25 - INFO - __main__ - Step 1270: {'lr': 0.00031725, 'samples': 243840, 'steps': 1269, 'loss/train': 4.288592338562012} -08/30/2021 13:27:26 - INFO - __main__ - Step 1271: {'lr': 0.0003175, 'samples': 244032, 'steps': 1270, 'loss/train': 4.804139137268066} -08/30/2021 13:27:27 - INFO - __main__ - Step 1272: {'lr': 0.00031775, 'samples': 244224, 'steps': 1271, 'loss/train': 4.242639064788818} -08/30/2021 13:27:27 - INFO - __main__ - Step 1273: {'lr': 0.00031800000000000003, 'samples': 244416, 'steps': 1272, 'loss/train': 4.992812156677246} -08/30/2021 13:27:27 - INFO - __main__ - Step 1274: {'lr': 0.00031825, 'samples': 244608, 'steps': 1273, 'loss/train': 4.1714277267456055} -08/30/2021 13:27:28 - INFO - __main__ - Step 1275: {'lr': 0.0003185, 'samples': 244800, 'steps': 1274, 'loss/train': 1.792271375656128} -08/30/2021 13:27:29 - INFO - __main__ - Step 1276: {'lr': 0.00031874999999999997, 'samples': 244992, 'steps': 1275, 'loss/train': 4.166008472442627} -08/30/2021 13:27:30 - INFO - __main__ - Step 1277: {'lr': 0.000319, 'samples': 245184, 'steps': 1276, 'loss/train': 4.203356742858887} -08/30/2021 13:27:30 - INFO - __main__ - Step 1278: {'lr': 0.00031925, 'samples': 245376, 'steps': 1277, 'loss/train': 4.392521858215332} -08/30/2021 13:27:30 - INFO - __main__ - Step 1279: {'lr': 0.0003195, 'samples': 245568, 'steps': 1278, 'loss/train': 5.123244285583496} -08/30/2021 13:27:31 - INFO - __main__ - Step 1280: {'lr': 0.00031975, 'samples': 245760, 'steps': 1279, 'loss/train': 4.326639175415039} -08/30/2021 13:27:31 - INFO - __main__ - Step 1281: {'lr': 0.00032, 'samples': 245952, 'steps': 1280, 'loss/train': 4.643868923187256} -08/30/2021 13:27:33 - INFO - __main__ - Step 1282: {'lr': 0.00032025, 'samples': 246144, 'steps': 1281, 'loss/train': 4.453815937042236} -08/30/2021 13:27:33 - INFO - __main__ - Step 1283: {'lr': 0.00032050000000000004, 'samples': 246336, 'steps': 1282, 'loss/train': 4.541042804718018} -08/30/2021 13:27:34 - INFO - __main__ - Step 1284: {'lr': 0.00032074999999999996, 'samples': 246528, 'steps': 1283, 'loss/train': 4.184276103973389} -08/30/2021 13:27:34 - INFO - __main__ - Step 1285: {'lr': 0.000321, 'samples': 246720, 'steps': 1284, 'loss/train': 4.502721786499023} -08/30/2021 13:27:34 - INFO - __main__ - Step 1286: {'lr': 0.00032125, 'samples': 246912, 'steps': 1285, 'loss/train': 4.524459362030029} -08/30/2021 13:27:36 - INFO - __main__ - Step 1287: {'lr': 0.0003215, 'samples': 247104, 'steps': 1286, 'loss/train': 4.998214244842529} -08/30/2021 13:27:36 - INFO - __main__ - Step 1288: {'lr': 0.00032175, 'samples': 247296, 'steps': 1287, 'loss/train': 4.486813068389893} -08/30/2021 13:27:36 - INFO - __main__ - Step 1289: {'lr': 0.000322, 'samples': 247488, 'steps': 1288, 'loss/train': 3.9918529987335205} -08/30/2021 13:27:37 - INFO - __main__ - Step 1290: {'lr': 0.00032225, 'samples': 247680, 'steps': 1289, 'loss/train': 4.199202537536621} -08/30/2021 13:27:37 - INFO - __main__ - Step 1291: {'lr': 0.00032250000000000003, 'samples': 247872, 'steps': 1290, 'loss/train': 4.5257134437561035} -08/30/2021 13:27:39 - INFO - __main__ - Step 1292: {'lr': 0.00032275, 'samples': 248064, 'steps': 1291, 'loss/train': 3.9086365699768066} -08/30/2021 13:27:39 - INFO - __main__ - Step 1293: {'lr': 0.000323, 'samples': 248256, 'steps': 1292, 'loss/train': 4.684390068054199} -08/30/2021 13:27:40 - INFO - __main__ - Step 1294: {'lr': 0.00032324999999999997, 'samples': 248448, 'steps': 1293, 'loss/train': 4.8196120262146} -08/30/2021 13:27:40 - INFO - __main__ - Step 1295: {'lr': 0.0003235, 'samples': 248640, 'steps': 1294, 'loss/train': 4.693305492401123} -08/30/2021 13:27:40 - INFO - __main__ - Step 1296: {'lr': 0.00032375, 'samples': 248832, 'steps': 1295, 'loss/train': 4.538880825042725} -08/30/2021 13:27:42 - INFO - __main__ - Step 1297: {'lr': 0.000324, 'samples': 249024, 'steps': 1296, 'loss/train': 3.790248155593872} -08/30/2021 13:27:42 - INFO - __main__ - Step 1298: {'lr': 0.00032425, 'samples': 249216, 'steps': 1297, 'loss/train': 4.5623779296875} -08/30/2021 13:27:43 - INFO - __main__ - Step 1299: {'lr': 0.00032450000000000003, 'samples': 249408, 'steps': 1298, 'loss/train': 4.117589950561523} -08/30/2021 13:27:43 - INFO - __main__ - Step 1300: {'lr': 0.00032475, 'samples': 249600, 'steps': 1299, 'loss/train': 4.715627670288086} -08/30/2021 13:27:43 - INFO - __main__ - Step 1301: {'lr': 0.00032500000000000004, 'samples': 249792, 'steps': 1300, 'loss/train': 4.385561943054199} -08/30/2021 13:27:45 - INFO - __main__ - Step 1302: {'lr': 0.00032524999999999996, 'samples': 249984, 'steps': 1301, 'loss/train': 4.569333076477051} -08/30/2021 13:27:46 - INFO - __main__ - Step 1303: {'lr': 0.0003255, 'samples': 250176, 'steps': 1302, 'loss/train': 4.422083377838135} -08/30/2021 13:27:46 - INFO - __main__ - Step 1304: {'lr': 0.00032575, 'samples': 250368, 'steps': 1303, 'loss/train': 4.419223308563232} -08/30/2021 13:27:47 - INFO - __main__ - Step 1305: {'lr': 0.000326, 'samples': 250560, 'steps': 1304, 'loss/train': 4.673562049865723} -08/30/2021 13:27:47 - INFO - __main__ - Step 1306: {'lr': 0.00032625, 'samples': 250752, 'steps': 1305, 'loss/train': 4.185782432556152} -08/30/2021 13:27:48 - INFO - __main__ - Step 1307: {'lr': 0.0003265, 'samples': 250944, 'steps': 1306, 'loss/train': 4.824061393737793} -08/30/2021 13:27:49 - INFO - __main__ - Step 1308: {'lr': 0.00032675, 'samples': 251136, 'steps': 1307, 'loss/train': 4.664660930633545} -08/30/2021 13:27:49 - INFO - __main__ - Step 1309: {'lr': 0.00032700000000000003, 'samples': 251328, 'steps': 1308, 'loss/train': 4.350864887237549} -08/30/2021 13:27:50 - INFO - __main__ - Step 1310: {'lr': 0.00032725, 'samples': 251520, 'steps': 1309, 'loss/train': 3.9895272254943848} -08/30/2021 13:27:50 - INFO - __main__ - Step 1311: {'lr': 0.00032750000000000005, 'samples': 251712, 'steps': 1310, 'loss/train': 5.069451332092285} -08/30/2021 13:27:51 - INFO - __main__ - Step 1312: {'lr': 0.00032774999999999997, 'samples': 251904, 'steps': 1311, 'loss/train': 4.556570529937744} -08/30/2021 13:27:52 - INFO - __main__ - Step 1313: {'lr': 0.000328, 'samples': 252096, 'steps': 1312, 'loss/train': 4.382578372955322} -08/30/2021 13:27:52 - INFO - __main__ - Step 1314: {'lr': 0.00032825, 'samples': 252288, 'steps': 1313, 'loss/train': 2.4415385723114014} -08/30/2021 13:27:53 - INFO - __main__ - Step 1315: {'lr': 0.0003285, 'samples': 252480, 'steps': 1314, 'loss/train': 4.276082515716553} -08/30/2021 13:27:53 - INFO - __main__ - Step 1316: {'lr': 0.00032875, 'samples': 252672, 'steps': 1315, 'loss/train': 4.509583473205566} -08/30/2021 13:27:54 - INFO - __main__ - Step 1317: {'lr': 0.00032900000000000003, 'samples': 252864, 'steps': 1316, 'loss/train': 4.153806686401367} -08/30/2021 13:27:55 - INFO - __main__ - Step 1318: {'lr': 0.00032925, 'samples': 253056, 'steps': 1317, 'loss/train': 4.242760181427002} -08/30/2021 13:27:55 - INFO - __main__ - Step 1319: {'lr': 0.00032950000000000004, 'samples': 253248, 'steps': 1318, 'loss/train': 3.9864144325256348} -08/30/2021 13:27:56 - INFO - __main__ - Step 1320: {'lr': 0.00032975, 'samples': 253440, 'steps': 1319, 'loss/train': 4.75071382522583} -08/30/2021 13:27:56 - INFO - __main__ - Step 1321: {'lr': 0.00033, 'samples': 253632, 'steps': 1320, 'loss/train': 3.9804000854492188} -08/30/2021 13:27:57 - INFO - __main__ - Step 1322: {'lr': 0.00033025, 'samples': 253824, 'steps': 1321, 'loss/train': 3.368206024169922} -08/30/2021 13:27:58 - INFO - __main__ - Step 1323: {'lr': 0.0003305, 'samples': 254016, 'steps': 1322, 'loss/train': 4.578549385070801} -08/30/2021 13:27:58 - INFO - __main__ - Step 1324: {'lr': 0.00033075, 'samples': 254208, 'steps': 1323, 'loss/train': 4.7281036376953125} -08/30/2021 13:27:58 - INFO - __main__ - Step 1325: {'lr': 0.000331, 'samples': 254400, 'steps': 1324, 'loss/train': 3.5485174655914307} -08/30/2021 13:27:59 - INFO - __main__ - Step 1326: {'lr': 0.00033125, 'samples': 254592, 'steps': 1325, 'loss/train': 6.437094211578369} -08/30/2021 13:27:59 - INFO - __main__ - Step 1327: {'lr': 0.00033150000000000003, 'samples': 254784, 'steps': 1326, 'loss/train': 4.145354270935059} -08/30/2021 13:28:01 - INFO - __main__ - Step 1328: {'lr': 0.00033175, 'samples': 254976, 'steps': 1327, 'loss/train': 5.2326860427856445} -08/30/2021 13:28:01 - INFO - __main__ - Step 1329: {'lr': 0.00033200000000000005, 'samples': 255168, 'steps': 1328, 'loss/train': 4.132408618927002} -08/30/2021 13:28:01 - INFO - __main__ - Step 1330: {'lr': 0.00033224999999999997, 'samples': 255360, 'steps': 1329, 'loss/train': 5.378190994262695} -08/30/2021 13:28:02 - INFO - __main__ - Step 1331: {'lr': 0.0003325, 'samples': 255552, 'steps': 1330, 'loss/train': 7.080970287322998} -08/30/2021 13:28:02 - INFO - __main__ - Step 1332: {'lr': 0.00033275, 'samples': 255744, 'steps': 1331, 'loss/train': 4.624168872833252} -08/30/2021 13:28:04 - INFO - __main__ - Step 1333: {'lr': 0.000333, 'samples': 255936, 'steps': 1332, 'loss/train': 4.436684608459473} -08/30/2021 13:28:04 - INFO - __main__ - Step 1334: {'lr': 0.00033325, 'samples': 256128, 'steps': 1333, 'loss/train': 4.374962329864502} -08/30/2021 13:28:05 - INFO - __main__ - Step 1335: {'lr': 0.00033350000000000003, 'samples': 256320, 'steps': 1334, 'loss/train': 4.5060529708862305} -08/30/2021 13:28:05 - INFO - __main__ - Step 1336: {'lr': 0.00033375, 'samples': 256512, 'steps': 1335, 'loss/train': 4.0865559577941895} -08/30/2021 13:28:05 - INFO - __main__ - Step 1337: {'lr': 0.00033400000000000004, 'samples': 256704, 'steps': 1336, 'loss/train': 4.452343463897705} -08/30/2021 13:28:07 - INFO - __main__ - Step 1338: {'lr': 0.00033425, 'samples': 256896, 'steps': 1337, 'loss/train': 4.250465393066406} -08/30/2021 13:28:07 - INFO - __main__ - Step 1339: {'lr': 0.00033450000000000005, 'samples': 257088, 'steps': 1338, 'loss/train': 4.740878582000732} -08/30/2021 13:28:07 - INFO - __main__ - Step 1340: {'lr': 0.00033475, 'samples': 257280, 'steps': 1339, 'loss/train': 3.674431085586548} -08/30/2021 13:28:08 - INFO - __main__ - Step 1341: {'lr': 0.000335, 'samples': 257472, 'steps': 1340, 'loss/train': 4.267061710357666} -08/30/2021 13:28:08 - INFO - __main__ - Step 1342: {'lr': 0.00033525, 'samples': 257664, 'steps': 1341, 'loss/train': 3.882347345352173} -08/30/2021 13:28:10 - INFO - __main__ - Step 1343: {'lr': 0.0003355, 'samples': 257856, 'steps': 1342, 'loss/train': 4.04584264755249} -08/30/2021 13:28:10 - INFO - __main__ - Step 1344: {'lr': 0.00033575, 'samples': 258048, 'steps': 1343, 'loss/train': 5.775942325592041} -08/30/2021 13:28:10 - INFO - __main__ - Step 1345: {'lr': 0.00033600000000000004, 'samples': 258240, 'steps': 1344, 'loss/train': 4.075455188751221} -08/30/2021 13:28:11 - INFO - __main__ - Step 1346: {'lr': 0.00033625, 'samples': 258432, 'steps': 1345, 'loss/train': 5.206962585449219} -08/30/2021 13:28:11 - INFO - __main__ - Step 1347: {'lr': 0.00033650000000000005, 'samples': 258624, 'steps': 1346, 'loss/train': 4.038782596588135} -08/30/2021 13:28:13 - INFO - __main__ - Step 1348: {'lr': 0.00033675, 'samples': 258816, 'steps': 1347, 'loss/train': 5.3180060386657715} -08/30/2021 13:28:13 - INFO - __main__ - Step 1349: {'lr': 0.000337, 'samples': 259008, 'steps': 1348, 'loss/train': 3.534853219985962} -08/30/2021 13:28:13 - INFO - __main__ - Step 1350: {'lr': 0.00033725, 'samples': 259200, 'steps': 1349, 'loss/train': 4.311325550079346} -08/30/2021 13:28:14 - INFO - __main__ - Step 1351: {'lr': 0.0003375, 'samples': 259392, 'steps': 1350, 'loss/train': 4.755340576171875} -08/30/2021 13:28:14 - INFO - __main__ - Step 1352: {'lr': 0.00033775, 'samples': 259584, 'steps': 1351, 'loss/train': 2.4528939723968506} -08/30/2021 13:28:16 - INFO - __main__ - Step 1353: {'lr': 0.00033800000000000003, 'samples': 259776, 'steps': 1352, 'loss/train': 4.556753635406494} -08/30/2021 13:28:16 - INFO - __main__ - Step 1354: {'lr': 0.00033825, 'samples': 259968, 'steps': 1353, 'loss/train': 4.163471698760986} -08/30/2021 13:28:16 - INFO - __main__ - Step 1355: {'lr': 0.00033850000000000004, 'samples': 260160, 'steps': 1354, 'loss/train': 4.440191745758057} -08/30/2021 13:28:17 - INFO - __main__ - Step 1356: {'lr': 0.00033875, 'samples': 260352, 'steps': 1355, 'loss/train': 4.314537525177002} -08/30/2021 13:28:17 - INFO - __main__ - Step 1357: {'lr': 0.00033900000000000005, 'samples': 260544, 'steps': 1356, 'loss/train': 4.676640033721924} -08/30/2021 13:28:19 - INFO - __main__ - Step 1358: {'lr': 0.00033925, 'samples': 260736, 'steps': 1357, 'loss/train': 3.737349033355713} -08/30/2021 13:28:19 - INFO - __main__ - Step 1359: {'lr': 0.0003395, 'samples': 260928, 'steps': 1358, 'loss/train': 4.140536308288574} -08/30/2021 13:28:20 - INFO - __main__ - Step 1360: {'lr': 0.00033975, 'samples': 261120, 'steps': 1359, 'loss/train': 4.576985836029053} -08/30/2021 13:28:20 - INFO - __main__ - Step 1361: {'lr': 0.00034, 'samples': 261312, 'steps': 1360, 'loss/train': 4.539398193359375} -08/30/2021 13:28:21 - INFO - __main__ - Step 1362: {'lr': 0.00034025, 'samples': 261504, 'steps': 1361, 'loss/train': 5.453786373138428} -08/30/2021 13:28:22 - INFO - __main__ - Step 1363: {'lr': 0.00034050000000000004, 'samples': 261696, 'steps': 1362, 'loss/train': 4.280670642852783} -08/30/2021 13:28:23 - INFO - __main__ - Step 1364: {'lr': 0.00034075, 'samples': 261888, 'steps': 1363, 'loss/train': 3.8596203327178955} -08/30/2021 13:28:23 - INFO - __main__ - Step 1365: {'lr': 0.00034100000000000005, 'samples': 262080, 'steps': 1364, 'loss/train': 3.9746007919311523} -08/30/2021 13:28:23 - INFO - __main__ - Step 1366: {'lr': 0.00034125000000000003, 'samples': 262272, 'steps': 1365, 'loss/train': 4.350702285766602} -08/30/2021 13:28:24 - INFO - __main__ - Step 1367: {'lr': 0.0003415, 'samples': 262464, 'steps': 1366, 'loss/train': 4.536733150482178} -08/30/2021 13:28:24 - INFO - __main__ - Step 1368: {'lr': 0.00034175, 'samples': 262656, 'steps': 1367, 'loss/train': 4.735171318054199} -08/30/2021 13:28:25 - INFO - __main__ - Step 1369: {'lr': 0.000342, 'samples': 262848, 'steps': 1368, 'loss/train': 4.363914966583252} -08/30/2021 13:28:26 - INFO - __main__ - Step 1370: {'lr': 0.00034225, 'samples': 263040, 'steps': 1369, 'loss/train': 4.070268630981445} -08/30/2021 13:28:26 - INFO - __main__ - Step 1371: {'lr': 0.00034250000000000003, 'samples': 263232, 'steps': 1370, 'loss/train': 4.607729911804199} -08/30/2021 13:28:27 - INFO - __main__ - Step 1372: {'lr': 0.00034275, 'samples': 263424, 'steps': 1371, 'loss/train': 4.5332465171813965} -08/30/2021 13:28:27 - INFO - __main__ - Step 1373: {'lr': 0.00034300000000000004, 'samples': 263616, 'steps': 1372, 'loss/train': 4.54966402053833} -08/30/2021 13:28:28 - INFO - __main__ - Step 1374: {'lr': 0.00034325, 'samples': 263808, 'steps': 1373, 'loss/train': 4.341580390930176} -08/30/2021 13:28:29 - INFO - __main__ - Step 1375: {'lr': 0.00034350000000000006, 'samples': 264000, 'steps': 1374, 'loss/train': 3.9261229038238525} -08/30/2021 13:28:29 - INFO - __main__ - Step 1376: {'lr': 0.00034375, 'samples': 264192, 'steps': 1375, 'loss/train': 4.626092433929443} -08/30/2021 13:28:30 - INFO - __main__ - Step 1377: {'lr': 0.00034399999999999996, 'samples': 264384, 'steps': 1376, 'loss/train': 4.53762149810791} -08/30/2021 13:28:30 - INFO - __main__ - Step 1378: {'lr': 0.00034425, 'samples': 264576, 'steps': 1377, 'loss/train': 4.843814373016357} -08/30/2021 13:28:31 - INFO - __main__ - Step 1379: {'lr': 0.00034449999999999997, 'samples': 264768, 'steps': 1378, 'loss/train': 4.533663749694824} -08/30/2021 13:28:32 - INFO - __main__ - Step 1380: {'lr': 0.00034475, 'samples': 264960, 'steps': 1379, 'loss/train': 4.268194675445557} -08/30/2021 13:28:32 - INFO - __main__ - Step 1381: {'lr': 0.000345, 'samples': 265152, 'steps': 1380, 'loss/train': 4.627920150756836} -08/30/2021 13:28:33 - INFO - __main__ - Step 1382: {'lr': 0.00034525, 'samples': 265344, 'steps': 1381, 'loss/train': 4.625608921051025} -08/30/2021 13:28:33 - INFO - __main__ - Step 1383: {'lr': 0.0003455, 'samples': 265536, 'steps': 1382, 'loss/train': 4.480739116668701} -08/30/2021 13:28:34 - INFO - __main__ - Step 1384: {'lr': 0.00034575000000000003, 'samples': 265728, 'steps': 1383, 'loss/train': 4.329967975616455} -08/30/2021 13:28:35 - INFO - __main__ - Step 1385: {'lr': 0.000346, 'samples': 265920, 'steps': 1384, 'loss/train': 4.387570858001709} -08/30/2021 13:28:35 - INFO - __main__ - Step 1386: {'lr': 0.00034625, 'samples': 266112, 'steps': 1385, 'loss/train': 4.490174770355225} -08/30/2021 13:28:36 - INFO - __main__ - Step 1387: {'lr': 0.00034649999999999997, 'samples': 266304, 'steps': 1386, 'loss/train': 4.425543785095215} -08/30/2021 13:28:36 - INFO - __main__ - Step 1388: {'lr': 0.00034675, 'samples': 266496, 'steps': 1387, 'loss/train': 3.9120686054229736} -08/30/2021 13:28:37 - INFO - __main__ - Step 1389: {'lr': 0.000347, 'samples': 266688, 'steps': 1388, 'loss/train': 4.659025192260742} -08/30/2021 13:28:38 - INFO - __main__ - Step 1390: {'lr': 0.00034725, 'samples': 266880, 'steps': 1389, 'loss/train': 4.53112268447876} -08/30/2021 13:28:38 - INFO - __main__ - Step 1391: {'lr': 0.0003475, 'samples': 267072, 'steps': 1390, 'loss/train': 4.275741100311279} -08/30/2021 13:28:38 - INFO - __main__ - Step 1392: {'lr': 0.00034775, 'samples': 267264, 'steps': 1391, 'loss/train': 4.180943965911865} -08/30/2021 13:28:39 - INFO - __main__ - Step 1393: {'lr': 0.000348, 'samples': 267456, 'steps': 1392, 'loss/train': 4.7057576179504395} -08/30/2021 13:28:40 - INFO - __main__ - Step 1394: {'lr': 0.00034825000000000004, 'samples': 267648, 'steps': 1393, 'loss/train': 4.166080951690674} -08/30/2021 13:28:41 - INFO - __main__ - Step 1395: {'lr': 0.00034849999999999996, 'samples': 267840, 'steps': 1394, 'loss/train': 4.255853652954102} -08/30/2021 13:28:41 - INFO - __main__ - Step 1396: {'lr': 0.00034875, 'samples': 268032, 'steps': 1395, 'loss/train': 4.1657938957214355} -08/30/2021 13:28:41 - INFO - __main__ - Step 1397: {'lr': 0.00034899999999999997, 'samples': 268224, 'steps': 1396, 'loss/train': 4.592858791351318} -08/30/2021 13:28:42 - INFO - __main__ - Step 1398: {'lr': 0.00034925, 'samples': 268416, 'steps': 1397, 'loss/train': 4.626420974731445} -08/30/2021 13:28:42 - INFO - __main__ - Step 1399: {'lr': 0.0003495, 'samples': 268608, 'steps': 1398, 'loss/train': 4.299635887145996} -08/30/2021 13:28:44 - INFO - __main__ - Step 1400: {'lr': 0.00034975, 'samples': 268800, 'steps': 1399, 'loss/train': 4.366077423095703} -08/30/2021 13:28:44 - INFO - __main__ - Step 1401: {'lr': 0.00035, 'samples': 268992, 'steps': 1400, 'loss/train': 5.40753698348999} -08/30/2021 13:28:45 - INFO - __main__ - Step 1402: {'lr': 0.00035025000000000003, 'samples': 269184, 'steps': 1401, 'loss/train': 4.4894537925720215} -08/30/2021 13:28:45 - INFO - __main__ - Step 1403: {'lr': 0.0003505, 'samples': 269376, 'steps': 1402, 'loss/train': 4.545291423797607} -08/30/2021 13:28:45 - INFO - __main__ - Step 1404: {'lr': 0.00035075, 'samples': 269568, 'steps': 1403, 'loss/train': 4.797220706939697} -08/30/2021 13:28:47 - INFO - __main__ - Step 1405: {'lr': 0.00035099999999999997, 'samples': 269760, 'steps': 1404, 'loss/train': 4.782083034515381} -08/30/2021 13:28:48 - INFO - __main__ - Step 1406: {'lr': 0.00035125, 'samples': 269952, 'steps': 1405, 'loss/train': 4.428123950958252} -08/30/2021 13:28:48 - INFO - __main__ - Step 1407: {'lr': 0.0003515, 'samples': 270144, 'steps': 1406, 'loss/train': 4.661625862121582} -08/30/2021 13:28:48 - INFO - __main__ - Step 1408: {'lr': 0.00035175, 'samples': 270336, 'steps': 1407, 'loss/train': 3.7704012393951416} -08/30/2021 13:28:49 - INFO - __main__ - Step 1409: {'lr': 0.000352, 'samples': 270528, 'steps': 1408, 'loss/train': 4.755863189697266} -08/30/2021 13:28:50 - INFO - __main__ - Step 1410: {'lr': 0.00035225, 'samples': 270720, 'steps': 1409, 'loss/train': 4.273111820220947} -08/30/2021 13:28:51 - INFO - __main__ - Step 1411: {'lr': 0.0003525, 'samples': 270912, 'steps': 1410, 'loss/train': 4.178704738616943} -08/30/2021 13:28:51 - INFO - __main__ - Step 1412: {'lr': 0.00035275000000000004, 'samples': 271104, 'steps': 1411, 'loss/train': 4.520911693572998} -08/30/2021 13:28:52 - INFO - __main__ - Step 1413: {'lr': 0.00035299999999999996, 'samples': 271296, 'steps': 1412, 'loss/train': 4.139966011047363} -08/30/2021 13:28:52 - INFO - __main__ - Step 1414: {'lr': 0.00035325, 'samples': 271488, 'steps': 1413, 'loss/train': 4.225654125213623} -08/30/2021 13:28:53 - INFO - __main__ - Step 1415: {'lr': 0.0003535, 'samples': 271680, 'steps': 1414, 'loss/train': 4.571483612060547} -08/30/2021 13:28:54 - INFO - __main__ - Step 1416: {'lr': 0.00035375, 'samples': 271872, 'steps': 1415, 'loss/train': 4.365446090698242} -08/30/2021 13:28:54 - INFO - __main__ - Step 1417: {'lr': 0.000354, 'samples': 272064, 'steps': 1416, 'loss/train': 4.675602912902832} -08/30/2021 13:28:55 - INFO - __main__ - Step 1418: {'lr': 0.00035425, 'samples': 272256, 'steps': 1417, 'loss/train': 4.224637508392334} -08/30/2021 13:28:55 - INFO - __main__ - Step 1419: {'lr': 0.0003545, 'samples': 272448, 'steps': 1418, 'loss/train': 4.211911678314209} -08/30/2021 13:28:55 - INFO - __main__ - Step 1420: {'lr': 0.00035475000000000003, 'samples': 272640, 'steps': 1419, 'loss/train': 5.085281848907471} -08/30/2021 13:28:57 - INFO - __main__ - Step 1421: {'lr': 0.000355, 'samples': 272832, 'steps': 1420, 'loss/train': 4.593563079833984} -08/30/2021 13:28:57 - INFO - __main__ - Step 1422: {'lr': 0.00035525000000000004, 'samples': 273024, 'steps': 1421, 'loss/train': 4.751321315765381} -08/30/2021 13:28:58 - INFO - __main__ - Step 1423: {'lr': 0.00035549999999999997, 'samples': 273216, 'steps': 1422, 'loss/train': 4.472665309906006} -08/30/2021 13:28:58 - INFO - __main__ - Step 1424: {'lr': 0.00035575, 'samples': 273408, 'steps': 1423, 'loss/train': 4.202507972717285} -08/30/2021 13:28:58 - INFO - __main__ - Step 1425: {'lr': 0.000356, 'samples': 273600, 'steps': 1424, 'loss/train': 4.3050994873046875} -08/30/2021 13:29:00 - INFO - __main__ - Step 1426: {'lr': 0.00035625, 'samples': 273792, 'steps': 1425, 'loss/train': 4.268754005432129} -08/30/2021 13:29:00 - INFO - __main__ - Step 1427: {'lr': 0.0003565, 'samples': 273984, 'steps': 1426, 'loss/train': 4.267064094543457} -08/30/2021 13:29:00 - INFO - __main__ - Step 1428: {'lr': 0.00035675, 'samples': 274176, 'steps': 1427, 'loss/train': 4.332093238830566} -08/30/2021 13:29:01 - INFO - __main__ - Step 1429: {'lr': 0.000357, 'samples': 274368, 'steps': 1428, 'loss/train': 4.247141361236572} -08/30/2021 13:29:01 - INFO - __main__ - Step 1430: {'lr': 0.00035725000000000004, 'samples': 274560, 'steps': 1429, 'loss/train': 3.9781038761138916} -08/30/2021 13:29:03 - INFO - __main__ - Step 1431: {'lr': 0.0003575, 'samples': 274752, 'steps': 1430, 'loss/train': 4.520853519439697} -08/30/2021 13:29:03 - INFO - __main__ - Step 1432: {'lr': 0.00035775, 'samples': 274944, 'steps': 1431, 'loss/train': 4.8411736488342285} -08/30/2021 13:29:03 - INFO - __main__ - Step 1433: {'lr': 0.000358, 'samples': 275136, 'steps': 1432, 'loss/train': 4.100142002105713} -08/30/2021 13:29:04 - INFO - __main__ - Step 1434: {'lr': 0.00035825, 'samples': 275328, 'steps': 1433, 'loss/train': 4.149476528167725} -08/30/2021 13:29:04 - INFO - __main__ - Step 1435: {'lr': 0.0003585, 'samples': 275520, 'steps': 1434, 'loss/train': 4.42181396484375} -08/30/2021 13:29:06 - INFO - __main__ - Step 1436: {'lr': 0.00035875, 'samples': 275712, 'steps': 1435, 'loss/train': 4.3713226318359375} -08/30/2021 13:29:06 - INFO - __main__ - Step 1437: {'lr': 0.000359, 'samples': 275904, 'steps': 1436, 'loss/train': 4.0421648025512695} -08/30/2021 13:29:06 - INFO - __main__ - Step 1438: {'lr': 0.00035925000000000003, 'samples': 276096, 'steps': 1437, 'loss/train': 4.149511337280273} -08/30/2021 13:29:07 - INFO - __main__ - Step 1439: {'lr': 0.0003595, 'samples': 276288, 'steps': 1438, 'loss/train': 4.122163772583008} -08/30/2021 13:29:07 - INFO - __main__ - Step 1440: {'lr': 0.00035975000000000004, 'samples': 276480, 'steps': 1439, 'loss/train': 4.252772808074951} -08/30/2021 13:29:09 - INFO - __main__ - Step 1441: {'lr': 0.00035999999999999997, 'samples': 276672, 'steps': 1440, 'loss/train': 4.3171210289001465} -08/30/2021 13:29:09 - INFO - __main__ - Step 1442: {'lr': 0.00036025, 'samples': 276864, 'steps': 1441, 'loss/train': 4.632924556732178} -08/30/2021 13:29:10 - INFO - __main__ - Step 1443: {'lr': 0.0003605, 'samples': 277056, 'steps': 1442, 'loss/train': 4.305054664611816} -08/30/2021 13:29:10 - INFO - __main__ - Step 1444: {'lr': 0.00036075, 'samples': 277248, 'steps': 1443, 'loss/train': 4.408972263336182} -08/30/2021 13:29:11 - INFO - __main__ - Step 1445: {'lr': 0.000361, 'samples': 277440, 'steps': 1444, 'loss/train': 4.228984832763672} -08/30/2021 13:29:12 - INFO - __main__ - Step 1446: {'lr': 0.00036125, 'samples': 277632, 'steps': 1445, 'loss/train': 4.329809665679932} -08/30/2021 13:29:12 - INFO - __main__ - Step 1447: {'lr': 0.0003615, 'samples': 277824, 'steps': 1446, 'loss/train': 4.439213752746582} -08/30/2021 13:29:13 - INFO - __main__ - Step 1448: {'lr': 0.00036175000000000004, 'samples': 278016, 'steps': 1447, 'loss/train': 4.233701705932617} -08/30/2021 13:29:13 - INFO - __main__ - Step 1449: {'lr': 0.000362, 'samples': 278208, 'steps': 1448, 'loss/train': 3.235466718673706} -08/30/2021 13:29:13 - INFO - __main__ - Step 1450: {'lr': 0.00036225000000000005, 'samples': 278400, 'steps': 1449, 'loss/train': 3.3804967403411865} -08/30/2021 13:29:15 - INFO - __main__ - Step 1451: {'lr': 0.0003625, 'samples': 278592, 'steps': 1450, 'loss/train': 4.406125068664551} -08/30/2021 13:29:15 - INFO - __main__ - Step 1452: {'lr': 0.00036275, 'samples': 278784, 'steps': 1451, 'loss/train': 1.672944188117981} -08/30/2021 13:29:16 - INFO - __main__ - Step 1453: {'lr': 0.000363, 'samples': 278976, 'steps': 1452, 'loss/train': 4.2426862716674805} -08/30/2021 13:29:16 - INFO - __main__ - Step 1454: {'lr': 0.00036325, 'samples': 279168, 'steps': 1453, 'loss/train': 4.787095546722412} -08/30/2021 13:29:16 - INFO - __main__ - Step 1455: {'lr': 0.0003635, 'samples': 279360, 'steps': 1454, 'loss/train': 4.5315728187561035} -08/30/2021 13:29:18 - INFO - __main__ - Step 1456: {'lr': 0.00036375000000000003, 'samples': 279552, 'steps': 1455, 'loss/train': 3.1854286193847656} -08/30/2021 13:29:19 - INFO - __main__ - Step 1457: {'lr': 0.000364, 'samples': 279744, 'steps': 1456, 'loss/train': 3.866952896118164} -08/30/2021 13:29:19 - INFO - __main__ - Step 1458: {'lr': 0.00036425000000000004, 'samples': 279936, 'steps': 1457, 'loss/train': 4.139428615570068} -08/30/2021 13:29:19 - INFO - __main__ - Step 1459: {'lr': 0.0003645, 'samples': 280128, 'steps': 1458, 'loss/train': 4.534155368804932} -08/30/2021 13:29:20 - INFO - __main__ - Step 1460: {'lr': 0.00036475, 'samples': 280320, 'steps': 1459, 'loss/train': 2.945066452026367} -08/30/2021 13:29:20 - INFO - __main__ - Step 1461: {'lr': 0.000365, 'samples': 280512, 'steps': 1460, 'loss/train': 2.2096877098083496} -08/30/2021 13:29:22 - INFO - __main__ - Step 1462: {'lr': 0.00036525, 'samples': 280704, 'steps': 1461, 'loss/train': 4.244150638580322} -08/30/2021 13:29:22 - INFO - __main__ - Step 1463: {'lr': 0.0003655, 'samples': 280896, 'steps': 1462, 'loss/train': 4.8449788093566895} -08/30/2021 13:29:22 - INFO - __main__ - Step 1464: {'lr': 0.00036575, 'samples': 281088, 'steps': 1463, 'loss/train': 3.7697691917419434} -08/30/2021 13:29:23 - INFO - __main__ - Step 1465: {'lr': 0.000366, 'samples': 281280, 'steps': 1464, 'loss/train': 4.358305931091309} -08/30/2021 13:29:23 - INFO - __main__ - Step 1466: {'lr': 0.00036625000000000004, 'samples': 281472, 'steps': 1465, 'loss/train': 6.622794151306152} -08/30/2021 13:29:25 - INFO - __main__ - Step 1467: {'lr': 0.0003665, 'samples': 281664, 'steps': 1466, 'loss/train': 4.413908958435059} -08/30/2021 13:29:26 - INFO - __main__ - Step 1468: {'lr': 0.00036675000000000005, 'samples': 281856, 'steps': 1467, 'loss/train': 4.058522701263428} -08/30/2021 13:29:26 - INFO - __main__ - Step 1469: {'lr': 0.000367, 'samples': 282048, 'steps': 1468, 'loss/train': 3.260404348373413} -08/30/2021 13:29:26 - INFO - __main__ - Step 1470: {'lr': 0.00036725, 'samples': 282240, 'steps': 1469, 'loss/train': 3.354424476623535} -08/30/2021 13:29:27 - INFO - __main__ - Step 1471: {'lr': 0.0003675, 'samples': 282432, 'steps': 1470, 'loss/train': 4.304652214050293} -08/30/2021 13:29:27 - INFO - __main__ - Step 1472: {'lr': 0.00036775, 'samples': 282624, 'steps': 1471, 'loss/train': 4.494898796081543} -08/30/2021 13:29:28 - INFO - __main__ - Step 1473: {'lr': 0.000368, 'samples': 282816, 'steps': 1472, 'loss/train': 5.061712265014648} -08/30/2021 13:29:29 - INFO - __main__ - Step 1474: {'lr': 0.00036825000000000003, 'samples': 283008, 'steps': 1473, 'loss/train': 4.55220890045166} -08/30/2021 13:29:29 - INFO - __main__ - Step 1475: {'lr': 0.0003685, 'samples': 283200, 'steps': 1474, 'loss/train': 4.2048845291137695} -08/30/2021 13:29:30 - INFO - __main__ - Step 1476: {'lr': 0.00036875000000000005, 'samples': 283392, 'steps': 1475, 'loss/train': 4.37580680847168} -08/30/2021 13:29:30 - INFO - __main__ - Step 1477: {'lr': 0.000369, 'samples': 283584, 'steps': 1476, 'loss/train': 4.393023490905762} -08/30/2021 13:29:32 - INFO - __main__ - Step 1478: {'lr': 0.00036925, 'samples': 283776, 'steps': 1477, 'loss/train': 4.154752254486084} -08/30/2021 13:29:32 - INFO - __main__ - Step 1479: {'lr': 0.0003695, 'samples': 283968, 'steps': 1478, 'loss/train': 4.85263729095459} -08/30/2021 13:29:33 - INFO - __main__ - Step 1480: {'lr': 0.00036975, 'samples': 284160, 'steps': 1479, 'loss/train': 4.904667854309082} -08/30/2021 13:29:33 - INFO - __main__ - Step 1481: {'lr': 0.00037, 'samples': 284352, 'steps': 1480, 'loss/train': 4.509653091430664} -08/30/2021 13:29:33 - INFO - __main__ - Step 1482: {'lr': 0.00037025000000000003, 'samples': 284544, 'steps': 1481, 'loss/train': 2.2799997329711914} -08/30/2021 13:29:35 - INFO - __main__ - Step 1483: {'lr': 0.0003705, 'samples': 284736, 'steps': 1482, 'loss/train': 4.844964027404785} -08/30/2021 13:29:36 - INFO - __main__ - Step 1484: {'lr': 0.00037075000000000004, 'samples': 284928, 'steps': 1483, 'loss/train': 4.235947132110596} -08/30/2021 13:29:36 - INFO - __main__ - Step 1485: {'lr': 0.000371, 'samples': 285120, 'steps': 1484, 'loss/train': 1.4060440063476562} -08/30/2021 13:29:36 - INFO - __main__ - Step 1486: {'lr': 0.00037125000000000005, 'samples': 285312, 'steps': 1485, 'loss/train': 4.211449146270752} -08/30/2021 13:29:37 - INFO - __main__ - Step 1487: {'lr': 0.00037150000000000003, 'samples': 285504, 'steps': 1486, 'loss/train': 4.709524631500244} -08/30/2021 13:29:37 - INFO - __main__ - Step 1488: {'lr': 0.00037175, 'samples': 285696, 'steps': 1487, 'loss/train': 3.5683043003082275} -08/30/2021 13:29:39 - INFO - __main__ - Step 1489: {'lr': 0.000372, 'samples': 285888, 'steps': 1488, 'loss/train': 5.118578910827637} -08/30/2021 13:29:39 - INFO - __main__ - Step 1490: {'lr': 0.00037225, 'samples': 286080, 'steps': 1489, 'loss/train': 4.15762186050415} -08/30/2021 13:29:39 - INFO - __main__ - Step 1491: {'lr': 0.0003725, 'samples': 286272, 'steps': 1490, 'loss/train': 3.8408548831939697} -08/30/2021 13:29:40 - INFO - __main__ - Step 1492: {'lr': 0.00037275000000000003, 'samples': 286464, 'steps': 1491, 'loss/train': 4.238423824310303} -08/30/2021 13:29:40 - INFO - __main__ - Step 1493: {'lr': 0.000373, 'samples': 286656, 'steps': 1492, 'loss/train': 6.055631160736084} -08/30/2021 13:29:42 - INFO - __main__ - Step 1494: {'lr': 0.00037325000000000005, 'samples': 286848, 'steps': 1493, 'loss/train': 4.529669761657715} -08/30/2021 13:29:42 - INFO - __main__ - Step 1495: {'lr': 0.0003735, 'samples': 287040, 'steps': 1494, 'loss/train': 4.583528995513916} -08/30/2021 13:29:42 - INFO - __main__ - Step 1496: {'lr': 0.00037375000000000006, 'samples': 287232, 'steps': 1495, 'loss/train': 4.353099346160889} -08/30/2021 13:29:43 - INFO - __main__ - Step 1497: {'lr': 0.000374, 'samples': 287424, 'steps': 1496, 'loss/train': 4.231982707977295} -08/30/2021 13:29:43 - INFO - __main__ - Step 1498: {'lr': 0.00037425, 'samples': 287616, 'steps': 1497, 'loss/train': 4.441566467285156} -08/30/2021 13:29:45 - INFO - __main__ - Step 1499: {'lr': 0.0003745, 'samples': 287808, 'steps': 1498, 'loss/train': 4.646770000457764} -08/30/2021 13:29:46 - INFO - __main__ - Step 1500: {'lr': 0.00037475000000000003, 'samples': 288000, 'steps': 1499, 'loss/train': 3.9177045822143555} -08/30/2021 13:29:46 - INFO - __main__ - Step 1501: {'lr': 0.000375, 'samples': 288192, 'steps': 1500, 'loss/train': 4.252547740936279} -08/30/2021 13:29:47 - INFO - __main__ - Step 1502: {'lr': 0.00037525, 'samples': 288384, 'steps': 1501, 'loss/train': 4.6158366203308105} -08/30/2021 13:29:47 - INFO - __main__ - Step 1503: {'lr': 0.0003755, 'samples': 288576, 'steps': 1502, 'loss/train': 4.698845386505127} -08/30/2021 13:29:47 - INFO - __main__ - Step 1504: {'lr': 0.00037575, 'samples': 288768, 'steps': 1503, 'loss/train': 4.231035232543945} -08/30/2021 13:29:49 - INFO - __main__ - Step 1505: {'lr': 0.00037600000000000003, 'samples': 288960, 'steps': 1504, 'loss/train': 4.305008411407471} -08/30/2021 13:29:49 - INFO - __main__ - Step 1506: {'lr': 0.00037624999999999996, 'samples': 289152, 'steps': 1505, 'loss/train': 3.5773348808288574} -08/30/2021 13:29:49 - INFO - __main__ - Step 1507: {'lr': 0.0003765, 'samples': 289344, 'steps': 1506, 'loss/train': 4.525704383850098} -08/30/2021 13:29:50 - INFO - __main__ - Step 1508: {'lr': 0.00037674999999999997, 'samples': 289536, 'steps': 1507, 'loss/train': 4.645226001739502} -08/30/2021 13:29:50 - INFO - __main__ - Step 1509: {'lr': 0.000377, 'samples': 289728, 'steps': 1508, 'loss/train': 4.71548318862915} -08/30/2021 13:29:52 - INFO - __main__ - Step 1510: {'lr': 0.00037725, 'samples': 289920, 'steps': 1509, 'loss/train': 4.2164106369018555} -08/30/2021 13:29:52 - INFO - __main__ - Step 1511: {'lr': 0.0003775, 'samples': 290112, 'steps': 1510, 'loss/train': 4.314056396484375} -08/30/2021 13:29:53 - INFO - __main__ - Step 1512: {'lr': 0.00037775, 'samples': 290304, 'steps': 1511, 'loss/train': 4.566384792327881} -08/30/2021 13:29:53 - INFO - __main__ - Step 1513: {'lr': 0.000378, 'samples': 290496, 'steps': 1512, 'loss/train': 2.8232011795043945} -08/30/2021 13:29:53 - INFO - __main__ - Step 1514: {'lr': 0.00037825, 'samples': 290688, 'steps': 1513, 'loss/train': 4.194929599761963} -08/30/2021 13:29:55 - INFO - __main__ - Step 1515: {'lr': 0.0003785, 'samples': 290880, 'steps': 1514, 'loss/train': 3.6204090118408203} -08/30/2021 13:29:55 - INFO - __main__ - Step 1516: {'lr': 0.00037874999999999996, 'samples': 291072, 'steps': 1515, 'loss/train': 2.259321928024292} -08/30/2021 13:29:56 - INFO - __main__ - Step 1517: {'lr': 0.000379, 'samples': 291264, 'steps': 1516, 'loss/train': 4.508073329925537} -08/30/2021 13:29:56 - INFO - __main__ - Step 1518: {'lr': 0.00037925, 'samples': 291456, 'steps': 1517, 'loss/train': 4.136277198791504} -08/30/2021 13:29:56 - INFO - __main__ - Step 1519: {'lr': 0.0003795, 'samples': 291648, 'steps': 1518, 'loss/train': 4.656012535095215} -08/30/2021 13:29:58 - INFO - __main__ - Step 1520: {'lr': 0.00037975, 'samples': 291840, 'steps': 1519, 'loss/train': 3.939546585083008} -08/30/2021 13:29:59 - INFO - __main__ - Step 1521: {'lr': 0.00038, 'samples': 292032, 'steps': 1520, 'loss/train': 4.163784980773926} -08/30/2021 13:29:59 - INFO - __main__ - Step 1522: {'lr': 0.00038025, 'samples': 292224, 'steps': 1521, 'loss/train': 3.413626194000244} -08/30/2021 13:29:59 - INFO - __main__ - Step 1523: {'lr': 0.00038050000000000003, 'samples': 292416, 'steps': 1522, 'loss/train': 4.128015041351318} -08/30/2021 13:30:00 - INFO - __main__ - Step 1524: {'lr': 0.00038075, 'samples': 292608, 'steps': 1523, 'loss/train': 4.029847145080566} -08/30/2021 13:30:01 - INFO - __main__ - Step 1525: {'lr': 0.000381, 'samples': 292800, 'steps': 1524, 'loss/train': 4.129461765289307} -08/30/2021 13:30:02 - INFO - __main__ - Step 1526: {'lr': 0.00038124999999999997, 'samples': 292992, 'steps': 1525, 'loss/train': 4.3723835945129395} -08/30/2021 13:30:02 - INFO - __main__ - Step 1527: {'lr': 0.0003815, 'samples': 293184, 'steps': 1526, 'loss/train': 4.338167190551758} -08/30/2021 13:30:02 - INFO - __main__ - Step 1528: {'lr': 0.00038175, 'samples': 293376, 'steps': 1527, 'loss/train': 3.519054651260376} -08/30/2021 13:30:03 - INFO - __main__ - Step 1529: {'lr': 0.000382, 'samples': 293568, 'steps': 1528, 'loss/train': 4.21800422668457} -08/30/2021 13:30:03 - INFO - __main__ - Step 1530: {'lr': 0.00038225, 'samples': 293760, 'steps': 1529, 'loss/train': 3.9521214962005615} -08/30/2021 13:30:05 - INFO - __main__ - Step 1531: {'lr': 0.00038250000000000003, 'samples': 293952, 'steps': 1530, 'loss/train': 6.254088878631592} -08/30/2021 13:30:05 - INFO - __main__ - Step 1532: {'lr': 0.00038275, 'samples': 294144, 'steps': 1531, 'loss/train': 4.113962650299072} -08/30/2021 13:30:06 - INFO - __main__ - Step 1533: {'lr': 0.00038300000000000004, 'samples': 294336, 'steps': 1532, 'loss/train': 4.775832176208496} -08/30/2021 13:30:06 - INFO - __main__ - Step 1534: {'lr': 0.00038324999999999996, 'samples': 294528, 'steps': 1533, 'loss/train': 4.4971537590026855} -08/30/2021 13:30:06 - INFO - __main__ - Step 1535: {'lr': 0.0003835, 'samples': 294720, 'steps': 1534, 'loss/train': 5.525181293487549} -08/30/2021 13:30:08 - INFO - __main__ - Step 1536: {'lr': 0.00038375, 'samples': 294912, 'steps': 1535, 'loss/train': 4.181306838989258} -08/30/2021 13:30:08 - INFO - __main__ - Step 1537: {'lr': 0.000384, 'samples': 295104, 'steps': 1536, 'loss/train': 3.903292417526245} -08/30/2021 13:30:09 - INFO - __main__ - Step 1538: {'lr': 0.00038425, 'samples': 295296, 'steps': 1537, 'loss/train': 5.626465797424316} -08/30/2021 13:30:09 - INFO - __main__ - Step 1539: {'lr': 0.0003845, 'samples': 295488, 'steps': 1538, 'loss/train': 4.052511692047119} -08/30/2021 13:30:09 - INFO - __main__ - Step 1540: {'lr': 0.00038475, 'samples': 295680, 'steps': 1539, 'loss/train': 3.402632713317871} -08/30/2021 13:30:10 - INFO - __main__ - Step 1541: {'lr': 0.00038500000000000003, 'samples': 295872, 'steps': 1540, 'loss/train': 4.247229099273682} -08/30/2021 13:30:11 - INFO - __main__ - Step 1542: {'lr': 0.00038525, 'samples': 296064, 'steps': 1541, 'loss/train': 4.7946672439575195} -08/30/2021 13:30:12 - INFO - __main__ - Step 1543: {'lr': 0.0003855, 'samples': 296256, 'steps': 1542, 'loss/train': 4.134920120239258} -08/30/2021 13:30:12 - INFO - __main__ - Step 1544: {'lr': 0.00038574999999999997, 'samples': 296448, 'steps': 1543, 'loss/train': 4.3115363121032715} -08/30/2021 13:30:12 - INFO - __main__ - Step 1545: {'lr': 0.000386, 'samples': 296640, 'steps': 1544, 'loss/train': 4.576611042022705} -08/30/2021 13:30:13 - INFO - __main__ - Step 1546: {'lr': 0.00038625, 'samples': 296832, 'steps': 1545, 'loss/train': 4.4993696212768555} -08/30/2021 13:30:14 - INFO - __main__ - Step 1547: {'lr': 0.0003865, 'samples': 297024, 'steps': 1546, 'loss/train': 3.7387473583221436} -08/30/2021 13:30:15 - INFO - __main__ - Step 1548: {'lr': 0.00038675, 'samples': 297216, 'steps': 1547, 'loss/train': 4.228835582733154} -08/30/2021 13:30:15 - INFO - __main__ - Step 1549: {'lr': 0.00038700000000000003, 'samples': 297408, 'steps': 1548, 'loss/train': 4.637598514556885} -08/30/2021 13:30:15 - INFO - __main__ - Step 1550: {'lr': 0.00038725, 'samples': 297600, 'steps': 1549, 'loss/train': 4.239960193634033} -08/30/2021 13:30:16 - INFO - __main__ - Step 1551: {'lr': 0.00038750000000000004, 'samples': 297792, 'steps': 1550, 'loss/train': 4.193304538726807} -08/30/2021 13:30:18 - INFO - __main__ - Step 1552: {'lr': 0.00038774999999999997, 'samples': 297984, 'steps': 1551, 'loss/train': 4.810821533203125} -08/30/2021 13:30:18 - INFO - __main__ - Step 1553: {'lr': 0.000388, 'samples': 298176, 'steps': 1552, 'loss/train': 4.437920570373535} -08/30/2021 13:30:18 - INFO - __main__ - Step 1554: {'lr': 0.00038825, 'samples': 298368, 'steps': 1553, 'loss/train': 4.394014835357666} -08/30/2021 13:30:19 - INFO - __main__ - Step 1555: {'lr': 0.0003885, 'samples': 298560, 'steps': 1554, 'loss/train': 4.478893756866455} -08/30/2021 13:30:19 - INFO - __main__ - Step 1556: {'lr': 0.00038875, 'samples': 298752, 'steps': 1555, 'loss/train': 3.117422103881836} -08/30/2021 13:30:19 - INFO - __main__ - Step 1557: {'lr': 0.000389, 'samples': 298944, 'steps': 1556, 'loss/train': 2.5692341327667236} -08/30/2021 13:30:21 - INFO - __main__ - Step 1558: {'lr': 0.00038925, 'samples': 299136, 'steps': 1557, 'loss/train': 5.1680521965026855} -08/30/2021 13:30:22 - INFO - __main__ - Step 1559: {'lr': 0.00038950000000000003, 'samples': 299328, 'steps': 1558, 'loss/train': 4.88592529296875} -08/30/2021 13:30:22 - INFO - __main__ - Step 1560: {'lr': 0.00038975, 'samples': 299520, 'steps': 1559, 'loss/train': 4.256154537200928} -08/30/2021 13:30:23 - INFO - __main__ - Step 1561: {'lr': 0.00039000000000000005, 'samples': 299712, 'steps': 1560, 'loss/train': 4.822085380554199} -08/30/2021 13:30:23 - INFO - __main__ - Step 1562: {'lr': 0.00039024999999999997, 'samples': 299904, 'steps': 1561, 'loss/train': 3.565521717071533} -08/30/2021 13:30:24 - INFO - __main__ - Step 1563: {'lr': 0.0003905, 'samples': 300096, 'steps': 1562, 'loss/train': 4.09617805480957} -08/30/2021 13:30:25 - INFO - __main__ - Step 1564: {'lr': 0.00039075, 'samples': 300288, 'steps': 1563, 'loss/train': 3.3210463523864746} -08/30/2021 13:30:25 - INFO - __main__ - Step 1565: {'lr': 0.000391, 'samples': 300480, 'steps': 1564, 'loss/train': 4.729197978973389} -08/30/2021 13:30:26 - INFO - __main__ - Step 1566: {'lr': 0.00039125, 'samples': 300672, 'steps': 1565, 'loss/train': 4.8554768562316895} -08/30/2021 13:30:26 - INFO - __main__ - Step 1567: {'lr': 0.00039150000000000003, 'samples': 300864, 'steps': 1566, 'loss/train': 3.703321695327759} -08/30/2021 13:30:28 - INFO - __main__ - Step 1568: {'lr': 0.00039175, 'samples': 301056, 'steps': 1567, 'loss/train': 3.9964680671691895} -08/30/2021 13:30:28 - INFO - __main__ - Step 1569: {'lr': 0.00039200000000000004, 'samples': 301248, 'steps': 1568, 'loss/train': 4.367398738861084} -08/30/2021 13:30:29 - INFO - __main__ - Step 1570: {'lr': 0.00039225, 'samples': 301440, 'steps': 1569, 'loss/train': 4.335350513458252} -08/30/2021 13:30:29 - INFO - __main__ - Step 1571: {'lr': 0.0003925, 'samples': 301632, 'steps': 1570, 'loss/train': 4.462733268737793} -08/30/2021 13:30:29 - INFO - __main__ - Step 1572: {'lr': 0.00039275, 'samples': 301824, 'steps': 1571, 'loss/train': 4.362184524536133} -08/30/2021 13:30:30 - INFO - __main__ - Step 1573: {'lr': 0.000393, 'samples': 302016, 'steps': 1572, 'loss/train': 3.751896381378174} -08/30/2021 13:30:31 - INFO - __main__ - Step 1574: {'lr': 0.00039325, 'samples': 302208, 'steps': 1573, 'loss/train': 2.203317642211914} -08/30/2021 13:30:32 - INFO - __main__ - Step 1575: {'lr': 0.0003935, 'samples': 302400, 'steps': 1574, 'loss/train': 4.502272129058838} -08/30/2021 13:30:32 - INFO - __main__ - Step 1576: {'lr': 0.00039375, 'samples': 302592, 'steps': 1575, 'loss/train': 4.511845111846924} -08/30/2021 13:30:33 - INFO - __main__ - Step 1577: {'lr': 0.00039400000000000004, 'samples': 302784, 'steps': 1576, 'loss/train': 3.4592127799987793} -08/30/2021 13:30:33 - INFO - __main__ - Step 1578: {'lr': 0.00039425, 'samples': 302976, 'steps': 1577, 'loss/train': 5.708824634552002} -08/30/2021 13:30:34 - INFO - __main__ - Step 1579: {'lr': 0.00039450000000000005, 'samples': 303168, 'steps': 1578, 'loss/train': 4.112600803375244} -08/30/2021 13:30:35 - INFO - __main__ - Step 1580: {'lr': 0.00039474999999999997, 'samples': 303360, 'steps': 1579, 'loss/train': 4.602146625518799} -08/30/2021 13:30:35 - INFO - __main__ - Step 1581: {'lr': 0.000395, 'samples': 303552, 'steps': 1580, 'loss/train': 3.5878899097442627} -08/30/2021 13:30:36 - INFO - __main__ - Step 1582: {'lr': 0.00039525, 'samples': 303744, 'steps': 1581, 'loss/train': 4.978146076202393} -08/30/2021 13:30:36 - INFO - __main__ - Step 1583: {'lr': 0.0003955, 'samples': 303936, 'steps': 1582, 'loss/train': 4.191125869750977} -08/30/2021 13:30:36 - INFO - __main__ - Step 1584: {'lr': 0.00039575, 'samples': 304128, 'steps': 1583, 'loss/train': 4.308163166046143} -08/30/2021 13:30:38 - INFO - __main__ - Step 1585: {'lr': 0.00039600000000000003, 'samples': 304320, 'steps': 1584, 'loss/train': 3.522921085357666} -08/30/2021 13:30:38 - INFO - __main__ - Step 1586: {'lr': 0.00039625, 'samples': 304512, 'steps': 1585, 'loss/train': 4.331756591796875} -08/30/2021 13:30:39 - INFO - __main__ - Step 1587: {'lr': 0.00039650000000000004, 'samples': 304704, 'steps': 1586, 'loss/train': 4.016501426696777} -08/30/2021 13:30:39 - INFO - __main__ - Step 1588: {'lr': 0.00039675, 'samples': 304896, 'steps': 1587, 'loss/train': 3.9630494117736816} -08/30/2021 13:30:39 - INFO - __main__ - Step 1589: {'lr': 0.00039700000000000005, 'samples': 305088, 'steps': 1588, 'loss/train': 3.8252696990966797} -08/30/2021 13:30:41 - INFO - __main__ - Step 1590: {'lr': 0.00039725, 'samples': 305280, 'steps': 1589, 'loss/train': 4.543032169342041} -08/30/2021 13:30:41 - INFO - __main__ - Step 1591: {'lr': 0.0003975, 'samples': 305472, 'steps': 1590, 'loss/train': 3.9182825088500977} -08/30/2021 13:30:42 - INFO - __main__ - Step 1592: {'lr': 0.00039775, 'samples': 305664, 'steps': 1591, 'loss/train': 3.944086790084839} -08/30/2021 13:30:42 - INFO - __main__ - Step 1593: {'lr': 0.000398, 'samples': 305856, 'steps': 1592, 'loss/train': 4.1202239990234375} -08/30/2021 13:30:42 - INFO - __main__ - Step 1594: {'lr': 0.00039825, 'samples': 306048, 'steps': 1593, 'loss/train': 4.118268013000488} -08/30/2021 13:30:44 - INFO - __main__ - Step 1595: {'lr': 0.00039850000000000004, 'samples': 306240, 'steps': 1594, 'loss/train': 4.110257625579834} -08/30/2021 13:30:44 - INFO - __main__ - Step 1596: {'lr': 0.00039875, 'samples': 306432, 'steps': 1595, 'loss/train': 4.602290153503418} -08/30/2021 13:30:45 - INFO - __main__ - Step 1597: {'lr': 0.00039900000000000005, 'samples': 306624, 'steps': 1596, 'loss/train': 4.3493332862854} -08/30/2021 13:30:45 - INFO - __main__ - Step 1598: {'lr': 0.00039925000000000003, 'samples': 306816, 'steps': 1597, 'loss/train': 4.359951496124268} -08/30/2021 13:30:45 - INFO - __main__ - Step 1599: {'lr': 0.0003995, 'samples': 307008, 'steps': 1598, 'loss/train': 4.226939678192139} -08/30/2021 13:30:47 - INFO - __main__ - Step 1600: {'lr': 0.00039975, 'samples': 307200, 'steps': 1599, 'loss/train': 3.979285717010498} -08/30/2021 13:30:47 - INFO - __main__ - Step 1601: {'lr': 0.0004, 'samples': 307392, 'steps': 1600, 'loss/train': 3.927377700805664} -08/30/2021 13:30:48 - INFO - __main__ - Step 1602: {'lr': 0.00040025, 'samples': 307584, 'steps': 1601, 'loss/train': 3.437540292739868} -08/30/2021 13:30:48 - INFO - __main__ - Step 1603: {'lr': 0.00040050000000000003, 'samples': 307776, 'steps': 1602, 'loss/train': 4.3806962966918945} -08/30/2021 13:30:48 - INFO - __main__ - Step 1604: {'lr': 0.00040075, 'samples': 307968, 'steps': 1603, 'loss/train': 4.12437629699707} -08/30/2021 13:30:50 - INFO - __main__ - Step 1605: {'lr': 0.00040100000000000004, 'samples': 308160, 'steps': 1604, 'loss/train': 3.897045373916626} -08/30/2021 13:30:50 - INFO - __main__ - Step 1606: {'lr': 0.00040125, 'samples': 308352, 'steps': 1605, 'loss/train': 3.835270643234253} -08/30/2021 13:30:51 - INFO - __main__ - Step 1607: {'lr': 0.00040150000000000006, 'samples': 308544, 'steps': 1606, 'loss/train': 4.323556900024414} -08/30/2021 13:30:51 - INFO - __main__ - Step 1608: {'lr': 0.00040175, 'samples': 308736, 'steps': 1607, 'loss/train': 3.6603899002075195} -08/30/2021 13:30:52 - INFO - __main__ - Step 1609: {'lr': 0.000402, 'samples': 308928, 'steps': 1608, 'loss/train': 4.13911247253418} -08/30/2021 13:30:54 - INFO - __main__ - Step 1610: {'lr': 0.00040225, 'samples': 309120, 'steps': 1609, 'loss/train': 3.910623788833618} -08/30/2021 13:30:54 - INFO - __main__ - Step 1611: {'lr': 0.0004025, 'samples': 309312, 'steps': 1610, 'loss/train': 4.918487548828125} -08/30/2021 13:30:55 - INFO - __main__ - Step 1612: {'lr': 0.00040275, 'samples': 309504, 'steps': 1611, 'loss/train': 4.247921943664551} -08/30/2021 13:30:55 - INFO - __main__ - Step 1613: {'lr': 0.00040300000000000004, 'samples': 309696, 'steps': 1612, 'loss/train': 4.120118618011475} -08/30/2021 13:30:55 - INFO - __main__ - Step 1614: {'lr': 0.00040325, 'samples': 309888, 'steps': 1613, 'loss/train': 4.075702667236328} -08/30/2021 13:30:57 - INFO - __main__ - Step 1615: {'lr': 0.00040350000000000005, 'samples': 310080, 'steps': 1614, 'loss/train': 4.307497978210449} -08/30/2021 13:30:57 - INFO - __main__ - Step 1616: {'lr': 0.00040375000000000003, 'samples': 310272, 'steps': 1615, 'loss/train': 4.062084197998047} -08/30/2021 13:30:58 - INFO - __main__ - Step 1617: {'lr': 0.000404, 'samples': 310464, 'steps': 1616, 'loss/train': 1.957079291343689} -08/30/2021 13:30:58 - INFO - __main__ - Step 1618: {'lr': 0.00040425, 'samples': 310656, 'steps': 1617, 'loss/train': 3.859267473220825} -08/30/2021 13:30:58 - INFO - __main__ - Step 1619: {'lr': 0.0004045, 'samples': 310848, 'steps': 1618, 'loss/train': 3.921182155609131} -08/30/2021 13:30:59 - INFO - __main__ - Step 1620: {'lr': 0.00040475, 'samples': 311040, 'steps': 1619, 'loss/train': 3.962010145187378} -08/30/2021 13:31:00 - INFO - __main__ - Step 1621: {'lr': 0.00040500000000000003, 'samples': 311232, 'steps': 1620, 'loss/train': 3.9373505115509033} -08/30/2021 13:31:01 - INFO - __main__ - Step 1622: {'lr': 0.00040525, 'samples': 311424, 'steps': 1621, 'loss/train': 1.5724457502365112} -08/30/2021 13:31:01 - INFO - __main__ - Step 1623: {'lr': 0.00040550000000000004, 'samples': 311616, 'steps': 1622, 'loss/train': 3.370074510574341} -08/30/2021 13:31:01 - INFO - __main__ - Step 1624: {'lr': 0.00040575, 'samples': 311808, 'steps': 1623, 'loss/train': 4.119229316711426} -08/30/2021 13:31:02 - INFO - __main__ - Step 1625: {'lr': 0.00040600000000000006, 'samples': 312000, 'steps': 1624, 'loss/train': 4.099151611328125} -08/30/2021 13:31:03 - INFO - __main__ - Step 1626: {'lr': 0.00040625000000000004, 'samples': 312192, 'steps': 1625, 'loss/train': 4.612451553344727} -08/30/2021 13:31:04 - INFO - __main__ - Step 1627: {'lr': 0.00040649999999999996, 'samples': 312384, 'steps': 1626, 'loss/train': 5.194092750549316} -08/30/2021 13:31:04 - INFO - __main__ - Step 1628: {'lr': 0.00040675, 'samples': 312576, 'steps': 1627, 'loss/train': 3.668224334716797} -08/30/2021 13:31:04 - INFO - __main__ - Step 1629: {'lr': 0.00040699999999999997, 'samples': 312768, 'steps': 1628, 'loss/train': 5.2241363525390625} -08/30/2021 13:31:05 - INFO - __main__ - Step 1630: {'lr': 0.00040725, 'samples': 312960, 'steps': 1629, 'loss/train': 3.1308257579803467} -08/30/2021 13:31:06 - INFO - __main__ - Step 1631: {'lr': 0.0004075, 'samples': 313152, 'steps': 1630, 'loss/train': 4.357464790344238} -08/30/2021 13:31:07 - INFO - __main__ - Step 1632: {'lr': 0.00040775, 'samples': 313344, 'steps': 1631, 'loss/train': 3.7567591667175293} -08/30/2021 13:31:07 - INFO - __main__ - Step 1633: {'lr': 0.000408, 'samples': 313536, 'steps': 1632, 'loss/train': 2.5121212005615234} -08/30/2021 13:31:08 - INFO - __main__ - Step 1634: {'lr': 0.00040825000000000003, 'samples': 313728, 'steps': 1633, 'loss/train': 3.9205658435821533} -08/30/2021 13:31:08 - INFO - __main__ - Step 1635: {'lr': 0.0004085, 'samples': 313920, 'steps': 1634, 'loss/train': 3.962059259414673} -08/30/2021 13:31:08 - INFO - __main__ - Step 1636: {'lr': 0.00040875, 'samples': 314112, 'steps': 1635, 'loss/train': 1.6473331451416016} -08/30/2021 13:31:10 - INFO - __main__ - Step 1637: {'lr': 0.00040899999999999997, 'samples': 314304, 'steps': 1636, 'loss/train': 4.067282676696777} -08/30/2021 13:31:10 - INFO - __main__ - Step 1638: {'lr': 0.00040925, 'samples': 314496, 'steps': 1637, 'loss/train': 4.295927047729492} -08/30/2021 13:31:11 - INFO - __main__ - Step 1639: {'lr': 0.0004095, 'samples': 314688, 'steps': 1638, 'loss/train': 6.340890407562256} -08/30/2021 13:31:11 - INFO - __main__ - Step 1640: {'lr': 0.00040975, 'samples': 314880, 'steps': 1639, 'loss/train': 4.031452178955078} -08/30/2021 13:31:11 - INFO - __main__ - Step 1641: {'lr': 0.00041, 'samples': 315072, 'steps': 1640, 'loss/train': 4.079275131225586} -08/30/2021 13:31:13 - INFO - __main__ - Step 1642: {'lr': 0.00041025, 'samples': 315264, 'steps': 1641, 'loss/train': 4.769386291503906} -08/30/2021 13:31:13 - INFO - __main__ - Step 1643: {'lr': 0.0004105, 'samples': 315456, 'steps': 1642, 'loss/train': 3.8678455352783203} -08/30/2021 13:31:14 - INFO - __main__ - Step 1644: {'lr': 0.00041075000000000004, 'samples': 315648, 'steps': 1643, 'loss/train': 4.219468593597412} -08/30/2021 13:31:14 - INFO - __main__ - Step 1645: {'lr': 0.00041099999999999996, 'samples': 315840, 'steps': 1644, 'loss/train': 3.7112865447998047} -08/30/2021 13:31:14 - INFO - __main__ - Step 1646: {'lr': 0.00041125, 'samples': 316032, 'steps': 1645, 'loss/train': 3.841484308242798} -08/30/2021 13:31:16 - INFO - __main__ - Step 1647: {'lr': 0.0004115, 'samples': 316224, 'steps': 1646, 'loss/train': 4.261174201965332} -08/30/2021 13:31:16 - INFO - __main__ - Step 1648: {'lr': 0.00041175, 'samples': 316416, 'steps': 1647, 'loss/train': 3.7539446353912354} -08/30/2021 13:31:17 - INFO - __main__ - Step 1649: {'lr': 0.000412, 'samples': 316608, 'steps': 1648, 'loss/train': 3.9607656002044678} -08/30/2021 13:31:17 - INFO - __main__ - Step 1650: {'lr': 0.00041225, 'samples': 316800, 'steps': 1649, 'loss/train': 4.425975322723389} -08/30/2021 13:31:17 - INFO - __main__ - Step 1651: {'lr': 0.0004125, 'samples': 316992, 'steps': 1650, 'loss/train': 4.258786201477051} -08/30/2021 13:31:18 - INFO - __main__ - Step 1652: {'lr': 0.00041275000000000003, 'samples': 317184, 'steps': 1651, 'loss/train': 4.03767204284668} -08/30/2021 13:31:19 - INFO - __main__ - Step 1653: {'lr': 0.000413, 'samples': 317376, 'steps': 1652, 'loss/train': 4.375797748565674} -08/30/2021 13:31:20 - INFO - __main__ - Step 1654: {'lr': 0.00041325, 'samples': 317568, 'steps': 1653, 'loss/train': 5.396332263946533} -08/30/2021 13:31:20 - INFO - __main__ - Step 1655: {'lr': 0.00041349999999999997, 'samples': 317760, 'steps': 1654, 'loss/train': 4.422496318817139} -08/30/2021 13:31:20 - INFO - __main__ - Step 1656: {'lr': 0.00041375, 'samples': 317952, 'steps': 1655, 'loss/train': 3.649282217025757} -08/30/2021 13:31:21 - INFO - __main__ - Step 1657: {'lr': 0.000414, 'samples': 318144, 'steps': 1656, 'loss/train': 3.2264163494110107} -08/30/2021 13:31:22 - INFO - __main__ - Step 1658: {'lr': 0.00041425, 'samples': 318336, 'steps': 1657, 'loss/train': 3.597780704498291} -08/30/2021 13:31:23 - INFO - __main__ - Step 1659: {'lr': 0.0004145, 'samples': 318528, 'steps': 1658, 'loss/train': 4.033586025238037} -08/30/2021 13:31:23 - INFO - __main__ - Step 1660: {'lr': 0.00041475, 'samples': 318720, 'steps': 1659, 'loss/train': 4.188148498535156} -08/30/2021 13:31:24 - INFO - __main__ - Step 1661: {'lr': 0.000415, 'samples': 318912, 'steps': 1660, 'loss/train': 3.688339948654175} -08/30/2021 13:31:24 - INFO - __main__ - Step 1662: {'lr': 0.00041525000000000004, 'samples': 319104, 'steps': 1661, 'loss/train': 1.469415307044983} -08/30/2021 13:31:26 - INFO - __main__ - Step 1663: {'lr': 0.00041549999999999996, 'samples': 319296, 'steps': 1662, 'loss/train': 3.908815383911133} -08/30/2021 13:31:27 - INFO - __main__ - Step 1664: {'lr': 0.00041575, 'samples': 319488, 'steps': 1663, 'loss/train': 3.91666316986084} -08/30/2021 13:31:27 - INFO - __main__ - Step 1665: {'lr': 0.000416, 'samples': 319680, 'steps': 1664, 'loss/train': 4.200262069702148} -08/30/2021 13:31:27 - INFO - __main__ - Step 1666: {'lr': 0.00041625, 'samples': 319872, 'steps': 1665, 'loss/train': 4.345694065093994} -08/30/2021 13:31:28 - INFO - __main__ - Step 1667: {'lr': 0.0004165, 'samples': 320064, 'steps': 1666, 'loss/train': 3.4992318153381348} -08/30/2021 13:31:29 - INFO - __main__ - Step 1668: {'lr': 0.00041675, 'samples': 320256, 'steps': 1667, 'loss/train': 3.7306833267211914} -08/30/2021 13:31:30 - INFO - __main__ - Step 1669: {'lr': 0.000417, 'samples': 320448, 'steps': 1668, 'loss/train': 4.227388381958008} -08/30/2021 13:31:30 - INFO - __main__ - Step 1670: {'lr': 0.00041725000000000003, 'samples': 320640, 'steps': 1669, 'loss/train': 4.318609714508057} -08/30/2021 13:31:30 - INFO - __main__ - Step 1671: {'lr': 0.0004175, 'samples': 320832, 'steps': 1670, 'loss/train': 4.057160377502441} -08/30/2021 13:31:31 - INFO - __main__ - Step 1672: {'lr': 0.00041775000000000004, 'samples': 321024, 'steps': 1671, 'loss/train': 4.666829586029053} -08/30/2021 13:31:32 - INFO - __main__ - Step 1673: {'lr': 0.00041799999999999997, 'samples': 321216, 'steps': 1672, 'loss/train': 4.118185997009277} -08/30/2021 13:31:33 - INFO - __main__ - Step 1674: {'lr': 0.00041825, 'samples': 321408, 'steps': 1673, 'loss/train': 3.671118974685669} -08/30/2021 13:31:33 - INFO - __main__ - Step 1675: {'lr': 0.0004185, 'samples': 321600, 'steps': 1674, 'loss/train': 3.7217016220092773} -08/30/2021 13:31:33 - INFO - __main__ - Step 1676: {'lr': 0.00041875, 'samples': 321792, 'steps': 1675, 'loss/train': 4.462160587310791} -08/30/2021 13:31:34 - INFO - __main__ - Step 1677: {'lr': 0.000419, 'samples': 321984, 'steps': 1676, 'loss/train': 4.042119026184082} -08/30/2021 13:31:35 - INFO - __main__ - Step 1678: {'lr': 0.00041925, 'samples': 322176, 'steps': 1677, 'loss/train': 4.16783332824707} -08/30/2021 13:31:36 - INFO - __main__ - Step 1679: {'lr': 0.0004195, 'samples': 322368, 'steps': 1678, 'loss/train': 3.4674606323242188} -08/30/2021 13:31:36 - INFO - __main__ - Step 1680: {'lr': 0.00041975000000000004, 'samples': 322560, 'steps': 1679, 'loss/train': 4.066051483154297} -08/30/2021 13:31:36 - INFO - __main__ - Step 1681: {'lr': 0.00042, 'samples': 322752, 'steps': 1680, 'loss/train': 4.4997663497924805} -08/30/2021 13:31:37 - INFO - __main__ - Step 1682: {'lr': 0.00042025, 'samples': 322944, 'steps': 1681, 'loss/train': 4.407072067260742} -08/30/2021 13:31:37 - INFO - __main__ - Step 1683: {'lr': 0.0004205, 'samples': 323136, 'steps': 1682, 'loss/train': 4.428121089935303} -08/30/2021 13:31:39 - INFO - __main__ - Step 1684: {'lr': 0.00042075, 'samples': 323328, 'steps': 1683, 'loss/train': 4.961803913116455} -08/30/2021 13:31:39 - INFO - __main__ - Step 1685: {'lr': 0.000421, 'samples': 323520, 'steps': 1684, 'loss/train': 3.9315521717071533} -08/30/2021 13:31:39 - INFO - __main__ - Step 1686: {'lr': 0.00042125, 'samples': 323712, 'steps': 1685, 'loss/train': 4.466744422912598} -08/30/2021 13:31:40 - INFO - __main__ - Step 1687: {'lr': 0.0004215, 'samples': 323904, 'steps': 1686, 'loss/train': 4.479499340057373} -08/30/2021 13:31:40 - INFO - __main__ - Step 1688: {'lr': 0.00042175000000000003, 'samples': 324096, 'steps': 1687, 'loss/train': 4.021457195281982} -08/30/2021 13:31:42 - INFO - __main__ - Step 1689: {'lr': 0.000422, 'samples': 324288, 'steps': 1688, 'loss/train': 3.9127321243286133} -08/30/2021 13:31:42 - INFO - __main__ - Step 1690: {'lr': 0.00042225000000000005, 'samples': 324480, 'steps': 1689, 'loss/train': 3.905916213989258} -08/30/2021 13:31:42 - INFO - __main__ - Step 1691: {'lr': 0.00042249999999999997, 'samples': 324672, 'steps': 1690, 'loss/train': 4.201033592224121} -08/30/2021 13:31:43 - INFO - __main__ - Step 1692: {'lr': 0.00042275, 'samples': 324864, 'steps': 1691, 'loss/train': 4.329977035522461} -08/30/2021 13:31:43 - INFO - __main__ - Step 1693: {'lr': 0.000423, 'samples': 325056, 'steps': 1692, 'loss/train': 3.6381800174713135} -08/30/2021 13:31:44 - INFO - __main__ - Step 1694: {'lr': 0.00042325, 'samples': 325248, 'steps': 1693, 'loss/train': 3.683461904525757} -08/30/2021 13:31:45 - INFO - __main__ - Step 1695: {'lr': 0.0004235, 'samples': 325440, 'steps': 1694, 'loss/train': 3.852285146713257} -08/30/2021 13:31:45 - INFO - __main__ - Step 1696: {'lr': 0.00042375000000000003, 'samples': 325632, 'steps': 1695, 'loss/train': 3.511688470840454} -08/30/2021 13:31:46 - INFO - __main__ - Step 1697: {'lr': 0.000424, 'samples': 325824, 'steps': 1696, 'loss/train': 3.8069117069244385} -08/30/2021 13:31:46 - INFO - __main__ - Step 1698: {'lr': 0.00042425000000000004, 'samples': 326016, 'steps': 1697, 'loss/train': 4.340700149536133} -08/30/2021 13:31:47 - INFO - __main__ - Step 1699: {'lr': 0.0004245, 'samples': 326208, 'steps': 1698, 'loss/train': 3.7010538578033447} -08/30/2021 13:31:48 - INFO - __main__ - Step 1700: {'lr': 0.00042475000000000005, 'samples': 326400, 'steps': 1699, 'loss/train': 3.855823516845703} -08/30/2021 13:31:48 - INFO - __main__ - Step 1701: {'lr': 0.000425, 'samples': 326592, 'steps': 1700, 'loss/train': 3.2315449714660645} -08/30/2021 13:31:48 - INFO - __main__ - Step 1702: {'lr': 0.00042525, 'samples': 326784, 'steps': 1701, 'loss/train': 4.2792887687683105} -08/30/2021 13:31:49 - INFO - __main__ - Step 1703: {'lr': 0.0004255, 'samples': 326976, 'steps': 1702, 'loss/train': 3.77683424949646} -08/30/2021 13:31:50 - INFO - __main__ - Step 1704: {'lr': 0.00042575, 'samples': 327168, 'steps': 1703, 'loss/train': 4.382048606872559} -08/30/2021 13:31:51 - INFO - __main__ - Step 1705: {'lr': 0.000426, 'samples': 327360, 'steps': 1704, 'loss/train': 4.271405220031738} -08/30/2021 13:31:51 - INFO - __main__ - Step 1706: {'lr': 0.00042625000000000003, 'samples': 327552, 'steps': 1705, 'loss/train': 3.9530229568481445} -08/30/2021 13:31:51 - INFO - __main__ - Step 1707: {'lr': 0.0004265, 'samples': 327744, 'steps': 1706, 'loss/train': 3.769348382949829} -08/30/2021 13:31:52 - INFO - __main__ - Step 1708: {'lr': 0.00042675000000000005, 'samples': 327936, 'steps': 1707, 'loss/train': 3.80161452293396} -08/30/2021 13:31:53 - INFO - __main__ - Step 1709: {'lr': 0.000427, 'samples': 328128, 'steps': 1708, 'loss/train': 4.133491516113281} -08/30/2021 13:31:54 - INFO - __main__ - Step 1710: {'lr': 0.00042725, 'samples': 328320, 'steps': 1709, 'loss/train': 3.7779102325439453} -08/30/2021 13:31:54 - INFO - __main__ - Step 1711: {'lr': 0.0004275, 'samples': 328512, 'steps': 1710, 'loss/train': 3.779893159866333} -08/30/2021 13:31:54 - INFO - __main__ - Step 1712: {'lr': 0.00042775, 'samples': 328704, 'steps': 1711, 'loss/train': 4.150379180908203} -08/30/2021 13:31:55 - INFO - __main__ - Step 1713: {'lr': 0.000428, 'samples': 328896, 'steps': 1712, 'loss/train': 3.41762375831604} -08/30/2021 13:31:56 - INFO - __main__ - Step 1714: {'lr': 0.00042825000000000003, 'samples': 329088, 'steps': 1713, 'loss/train': 4.138961315155029} -08/30/2021 13:31:57 - INFO - __main__ - Step 1715: {'lr': 0.0004285, 'samples': 329280, 'steps': 1714, 'loss/train': 3.648662805557251} -08/30/2021 13:31:57 - INFO - __main__ - Step 1716: {'lr': 0.00042875000000000004, 'samples': 329472, 'steps': 1715, 'loss/train': 1.621708869934082} -08/30/2021 13:31:58 - INFO - __main__ - Step 1717: {'lr': 0.000429, 'samples': 329664, 'steps': 1716, 'loss/train': 3.648488998413086} -08/30/2021 13:31:58 - INFO - __main__ - Step 1718: {'lr': 0.00042925000000000005, 'samples': 329856, 'steps': 1717, 'loss/train': 3.774393320083618} -08/30/2021 13:32:00 - INFO - __main__ - Step 1719: {'lr': 0.0004295, 'samples': 330048, 'steps': 1718, 'loss/train': 4.18839693069458} -08/30/2021 13:32:01 - INFO - __main__ - Step 1720: {'lr': 0.00042975, 'samples': 330240, 'steps': 1719, 'loss/train': 3.8447341918945312} -08/30/2021 13:32:01 - INFO - __main__ - Step 1721: {'lr': 0.00043, 'samples': 330432, 'steps': 1720, 'loss/train': 3.534740447998047} -08/30/2021 13:32:02 - INFO - __main__ - Step 1722: {'lr': 0.00043025, 'samples': 330624, 'steps': 1721, 'loss/train': 4.641766548156738} -08/30/2021 13:32:02 - INFO - __main__ - Step 1723: {'lr': 0.0004305, 'samples': 330816, 'steps': 1722, 'loss/train': 2.236652135848999} -08/30/2021 13:32:02 - INFO - __main__ - Step 1724: {'lr': 0.00043075000000000003, 'samples': 331008, 'steps': 1723, 'loss/train': 3.677239179611206} -08/30/2021 13:32:04 - INFO - __main__ - Step 1725: {'lr': 0.000431, 'samples': 331200, 'steps': 1724, 'loss/train': 3.2222580909729004} -08/30/2021 13:32:04 - INFO - __main__ - Step 1726: {'lr': 0.00043125000000000005, 'samples': 331392, 'steps': 1725, 'loss/train': 3.922532081604004} -08/30/2021 13:32:05 - INFO - __main__ - Step 1727: {'lr': 0.0004315, 'samples': 331584, 'steps': 1726, 'loss/train': 3.244903326034546} -08/30/2021 13:32:05 - INFO - __main__ - Step 1728: {'lr': 0.00043175, 'samples': 331776, 'steps': 1727, 'loss/train': 4.074255466461182} -08/30/2021 13:32:05 - INFO - __main__ - Step 1729: {'lr': 0.000432, 'samples': 331968, 'steps': 1728, 'loss/train': 4.264842987060547} -08/30/2021 13:32:07 - INFO - __main__ - Step 1730: {'lr': 0.00043225, 'samples': 332160, 'steps': 1729, 'loss/train': 1.3039348125457764} -08/30/2021 13:32:07 - INFO - __main__ - Step 1731: {'lr': 0.0004325, 'samples': 332352, 'steps': 1730, 'loss/train': 3.8235883712768555} -08/30/2021 13:32:08 - INFO - __main__ - Step 1732: {'lr': 0.00043275000000000003, 'samples': 332544, 'steps': 1731, 'loss/train': 3.861481189727783} -08/30/2021 13:32:08 - INFO - __main__ - Step 1733: {'lr': 0.000433, 'samples': 332736, 'steps': 1732, 'loss/train': 3.660234212875366} -08/30/2021 13:32:08 - INFO - __main__ - Step 1734: {'lr': 0.00043325000000000004, 'samples': 332928, 'steps': 1733, 'loss/train': 3.09748911857605} -08/30/2021 13:32:10 - INFO - __main__ - Step 1735: {'lr': 0.0004335, 'samples': 333120, 'steps': 1734, 'loss/train': 4.138425827026367} -08/30/2021 13:32:11 - INFO - __main__ - Step 1736: {'lr': 0.00043375000000000005, 'samples': 333312, 'steps': 1735, 'loss/train': 2.873290538787842} -08/30/2021 13:32:11 - INFO - __main__ - Step 1737: {'lr': 0.00043400000000000003, 'samples': 333504, 'steps': 1736, 'loss/train': 4.770103454589844} -08/30/2021 13:32:11 - INFO - __main__ - Step 1738: {'lr': 0.00043425, 'samples': 333696, 'steps': 1737, 'loss/train': 3.8146097660064697} -08/30/2021 13:32:12 - INFO - __main__ - Step 1739: {'lr': 0.0004345, 'samples': 333888, 'steps': 1738, 'loss/train': 2.9071238040924072} -08/30/2021 13:32:12 - INFO - __main__ - Step 1740: {'lr': 0.00043475, 'samples': 334080, 'steps': 1739, 'loss/train': 2.6069204807281494} -08/30/2021 13:32:14 - INFO - __main__ - Step 1741: {'lr': 0.000435, 'samples': 334272, 'steps': 1740, 'loss/train': 3.395693302154541} -08/30/2021 13:32:14 - INFO - __main__ - Step 1742: {'lr': 0.00043525000000000004, 'samples': 334464, 'steps': 1741, 'loss/train': 3.2589519023895264} -08/30/2021 13:32:15 - INFO - __main__ - Step 1743: {'lr': 0.0004355, 'samples': 334656, 'steps': 1742, 'loss/train': 3.994988203048706} -08/30/2021 13:32:15 - INFO - __main__ - Step 1744: {'lr': 0.00043575000000000005, 'samples': 334848, 'steps': 1743, 'loss/train': 3.7896499633789062} -08/30/2021 13:32:15 - INFO - __main__ - Step 1745: {'lr': 0.000436, 'samples': 335040, 'steps': 1744, 'loss/train': 4.0110015869140625} -08/30/2021 13:32:16 - INFO - __main__ - Step 1746: {'lr': 0.00043625000000000006, 'samples': 335232, 'steps': 1745, 'loss/train': 3.9087882041931152} -08/30/2021 13:32:17 - INFO - __main__ - Step 1747: {'lr': 0.0004365, 'samples': 335424, 'steps': 1746, 'loss/train': 3.7993640899658203} -08/30/2021 13:32:18 - INFO - __main__ - Step 1748: {'lr': 0.00043675, 'samples': 335616, 'steps': 1747, 'loss/train': 4.368635177612305} -08/30/2021 13:32:18 - INFO - __main__ - Step 1749: {'lr': 0.000437, 'samples': 335808, 'steps': 1748, 'loss/train': 4.0576958656311035} -08/30/2021 13:32:19 - INFO - __main__ - Step 1750: {'lr': 0.00043725000000000003, 'samples': 336000, 'steps': 1749, 'loss/train': 3.779649019241333} -08/30/2021 13:32:19 - INFO - __main__ - Step 1751: {'lr': 0.0004375, 'samples': 336192, 'steps': 1750, 'loss/train': 3.8256595134735107} -08/30/2021 13:32:20 - INFO - __main__ - Step 1752: {'lr': 0.00043775, 'samples': 336384, 'steps': 1751, 'loss/train': 3.8933751583099365} -08/30/2021 13:32:21 - INFO - __main__ - Step 1753: {'lr': 0.000438, 'samples': 336576, 'steps': 1752, 'loss/train': 3.610065221786499} -08/30/2021 13:32:21 - INFO - __main__ - Step 1754: {'lr': 0.00043825, 'samples': 336768, 'steps': 1753, 'loss/train': 3.787497043609619} -08/30/2021 13:32:22 - INFO - __main__ - Step 1755: {'lr': 0.00043850000000000003, 'samples': 336960, 'steps': 1754, 'loss/train': 3.547999858856201} -08/30/2021 13:32:22 - INFO - __main__ - Step 1756: {'lr': 0.00043874999999999996, 'samples': 337152, 'steps': 1755, 'loss/train': 3.187812089920044} -08/30/2021 13:32:23 - INFO - __main__ - Step 1757: {'lr': 0.000439, 'samples': 337344, 'steps': 1756, 'loss/train': 3.791693925857544} -08/30/2021 13:32:24 - INFO - __main__ - Step 1758: {'lr': 0.00043924999999999997, 'samples': 337536, 'steps': 1757, 'loss/train': 3.908297300338745} -08/30/2021 13:32:24 - INFO - __main__ - Step 1759: {'lr': 0.0004395, 'samples': 337728, 'steps': 1758, 'loss/train': 4.370672702789307} -08/30/2021 13:32:25 - INFO - __main__ - Step 1760: {'lr': 0.00043975, 'samples': 337920, 'steps': 1759, 'loss/train': 2.3841192722320557} -08/30/2021 13:32:25 - INFO - __main__ - Step 1761: {'lr': 0.00044, 'samples': 338112, 'steps': 1760, 'loss/train': 2.305006742477417} -08/30/2021 13:32:25 - INFO - __main__ - Step 1762: {'lr': 0.00044025, 'samples': 338304, 'steps': 1761, 'loss/train': 4.077214241027832} -08/30/2021 13:32:27 - INFO - __main__ - Step 1763: {'lr': 0.00044050000000000003, 'samples': 338496, 'steps': 1762, 'loss/train': 3.9649477005004883} -08/30/2021 13:32:28 - INFO - __main__ - Step 1764: {'lr': 0.00044075, 'samples': 338688, 'steps': 1763, 'loss/train': 4.029394149780273} -08/30/2021 13:32:28 - INFO - __main__ - Step 1765: {'lr': 0.000441, 'samples': 338880, 'steps': 1764, 'loss/train': 3.631580352783203} -08/30/2021 13:32:28 - INFO - __main__ - Step 1766: {'lr': 0.00044124999999999996, 'samples': 339072, 'steps': 1765, 'loss/train': 3.723358154296875} -08/30/2021 13:32:29 - INFO - __main__ - Step 1767: {'lr': 0.0004415, 'samples': 339264, 'steps': 1766, 'loss/train': 2.810429573059082} -08/30/2021 13:32:29 - INFO - __main__ - Step 1768: {'lr': 0.00044175, 'samples': 339456, 'steps': 1767, 'loss/train': 2.503378391265869} -08/30/2021 13:32:31 - INFO - __main__ - Step 1769: {'lr': 0.000442, 'samples': 339648, 'steps': 1768, 'loss/train': 5.0331950187683105} -08/30/2021 13:32:32 - INFO - __main__ - Step 1770: {'lr': 0.00044225, 'samples': 339840, 'steps': 1769, 'loss/train': 4.137406349182129} -08/30/2021 13:32:32 - INFO - __main__ - Step 1771: {'lr': 0.0004425, 'samples': 340032, 'steps': 1770, 'loss/train': 3.5637762546539307} -08/30/2021 13:32:32 - INFO - __main__ - Step 1772: {'lr': 0.00044275, 'samples': 340224, 'steps': 1771, 'loss/train': 4.73265266418457} -08/30/2021 13:32:33 - INFO - __main__ - Step 1773: {'lr': 0.00044300000000000003, 'samples': 340416, 'steps': 1772, 'loss/train': 4.167478084564209} -08/30/2021 13:32:35 - INFO - __main__ - Step 1774: {'lr': 0.00044325, 'samples': 340608, 'steps': 1773, 'loss/train': 4.121479511260986} -08/30/2021 13:32:35 - INFO - __main__ - Step 1775: {'lr': 0.0004435, 'samples': 340800, 'steps': 1774, 'loss/train': 2.0559253692626953} -08/30/2021 13:32:35 - INFO - __main__ - Step 1776: {'lr': 0.00044374999999999997, 'samples': 340992, 'steps': 1775, 'loss/train': 3.804485559463501} -08/30/2021 13:32:36 - INFO - __main__ - Step 1777: {'lr': 0.000444, 'samples': 341184, 'steps': 1776, 'loss/train': 3.524785041809082} -08/30/2021 13:32:36 - INFO - __main__ - Step 1778: {'lr': 0.00044425, 'samples': 341376, 'steps': 1777, 'loss/train': 4.243947982788086} -08/30/2021 13:32:38 - INFO - __main__ - Step 1779: {'lr': 0.0004445, 'samples': 341568, 'steps': 1778, 'loss/train': 3.671976089477539} -08/30/2021 13:32:38 - INFO - __main__ - Step 1780: {'lr': 0.00044475, 'samples': 341760, 'steps': 1779, 'loss/train': 3.7523791790008545} -08/30/2021 13:32:38 - INFO - __main__ - Step 1781: {'lr': 0.00044500000000000003, 'samples': 341952, 'steps': 1780, 'loss/train': 3.83473539352417} -08/30/2021 13:32:39 - INFO - __main__ - Step 1782: {'lr': 0.00044525, 'samples': 342144, 'steps': 1781, 'loss/train': 4.172183513641357} -08/30/2021 13:32:39 - INFO - __main__ - Step 1783: {'lr': 0.00044550000000000004, 'samples': 342336, 'steps': 1782, 'loss/train': 4.258868217468262} -08/30/2021 13:32:41 - INFO - __main__ - Step 1784: {'lr': 0.00044574999999999997, 'samples': 342528, 'steps': 1783, 'loss/train': 6.953623294830322} -08/30/2021 13:32:41 - INFO - __main__ - Step 1785: {'lr': 0.000446, 'samples': 342720, 'steps': 1784, 'loss/train': 3.3653876781463623} -08/30/2021 13:32:41 - INFO - __main__ - Step 1786: {'lr': 0.00044625, 'samples': 342912, 'steps': 1785, 'loss/train': 5.904109001159668} -08/30/2021 13:32:42 - INFO - __main__ - Step 1787: {'lr': 0.0004465, 'samples': 343104, 'steps': 1786, 'loss/train': 4.541056156158447} -08/30/2021 13:32:42 - INFO - __main__ - Step 1788: {'lr': 0.00044675, 'samples': 343296, 'steps': 1787, 'loss/train': 3.6556994915008545} -08/30/2021 13:32:44 - INFO - __main__ - Step 1789: {'lr': 0.000447, 'samples': 343488, 'steps': 1788, 'loss/train': 3.887575387954712} -08/30/2021 13:32:44 - INFO - __main__ - Step 1790: {'lr': 0.00044725, 'samples': 343680, 'steps': 1789, 'loss/train': 4.294520378112793} -08/30/2021 13:32:44 - INFO - __main__ - Step 1791: {'lr': 0.00044750000000000004, 'samples': 343872, 'steps': 1790, 'loss/train': 3.997781753540039} -08/30/2021 13:32:45 - INFO - __main__ - Step 1792: {'lr': 0.00044775, 'samples': 344064, 'steps': 1791, 'loss/train': 4.512619495391846} -08/30/2021 13:32:45 - INFO - __main__ - Step 1793: {'lr': 0.000448, 'samples': 344256, 'steps': 1792, 'loss/train': 4.260393142700195} -08/30/2021 13:32:47 - INFO - __main__ - Step 1794: {'lr': 0.00044824999999999997, 'samples': 344448, 'steps': 1793, 'loss/train': 3.5534934997558594} -08/30/2021 13:32:47 - INFO - __main__ - Step 1795: {'lr': 0.0004485, 'samples': 344640, 'steps': 1794, 'loss/train': 4.273794174194336} -08/30/2021 13:32:48 - INFO - __main__ - Step 1796: {'lr': 0.00044875, 'samples': 344832, 'steps': 1795, 'loss/train': 4.101879596710205} -08/30/2021 13:32:48 - INFO - __main__ - Step 1797: {'lr': 0.000449, 'samples': 345024, 'steps': 1796, 'loss/train': 3.60370135307312} -08/30/2021 13:32:48 - INFO - __main__ - Step 1798: {'lr': 0.00044925, 'samples': 345216, 'steps': 1797, 'loss/train': 2.5743050575256348} -08/30/2021 13:32:49 - INFO - __main__ - Step 1799: {'lr': 0.00044950000000000003, 'samples': 345408, 'steps': 1798, 'loss/train': 3.873318672180176} -08/30/2021 13:32:50 - INFO - __main__ - Step 1800: {'lr': 0.00044975, 'samples': 345600, 'steps': 1799, 'loss/train': 3.587174892425537} -08/30/2021 13:32:50 - INFO - __main__ - Step 1801: {'lr': 0.00045000000000000004, 'samples': 345792, 'steps': 1800, 'loss/train': 3.988168716430664} -08/30/2021 13:32:51 - INFO - __main__ - Step 1802: {'lr': 0.00045024999999999997, 'samples': 345984, 'steps': 1801, 'loss/train': 4.558698654174805} -08/30/2021 13:32:51 - INFO - __main__ - Step 1803: {'lr': 0.0004505, 'samples': 346176, 'steps': 1802, 'loss/train': 2.978074073791504} -08/30/2021 13:32:51 - INFO - __main__ - Step 1804: {'lr': 0.00045075, 'samples': 346368, 'steps': 1803, 'loss/train': 4.602495193481445} -08/30/2021 13:32:53 - INFO - __main__ - Step 1805: {'lr': 0.000451, 'samples': 346560, 'steps': 1804, 'loss/train': 3.7294809818267822} -08/30/2021 13:32:54 - INFO - __main__ - Step 1806: {'lr': 0.00045125, 'samples': 346752, 'steps': 1805, 'loss/train': 2.315081834793091} -08/30/2021 13:32:54 - INFO - __main__ - Step 1807: {'lr': 0.0004515, 'samples': 346944, 'steps': 1806, 'loss/train': 3.4423391819000244} -08/30/2021 13:32:54 - INFO - __main__ - Step 1808: {'lr': 0.00045175, 'samples': 347136, 'steps': 1807, 'loss/train': 4.13805627822876} -08/30/2021 13:32:55 - INFO - __main__ - Step 1809: {'lr': 0.00045200000000000004, 'samples': 347328, 'steps': 1808, 'loss/train': 3.755753993988037} -08/30/2021 13:32:56 - INFO - __main__ - Step 1810: {'lr': 0.00045225, 'samples': 347520, 'steps': 1809, 'loss/train': 3.993638277053833} -08/30/2021 13:32:57 - INFO - __main__ - Step 1811: {'lr': 0.00045250000000000005, 'samples': 347712, 'steps': 1810, 'loss/train': 4.206995964050293} -08/30/2021 13:32:57 - INFO - __main__ - Step 1812: {'lr': 0.00045275, 'samples': 347904, 'steps': 1811, 'loss/train': 4.250825881958008} -08/30/2021 13:32:57 - INFO - __main__ - Step 1813: {'lr': 0.000453, 'samples': 348096, 'steps': 1812, 'loss/train': 4.152008533477783} -08/30/2021 13:32:58 - INFO - __main__ - Step 1814: {'lr': 0.00045325, 'samples': 348288, 'steps': 1813, 'loss/train': 2.5532729625701904} -08/30/2021 13:32:59 - INFO - __main__ - Step 1815: {'lr': 0.0004535, 'samples': 348480, 'steps': 1814, 'loss/train': 3.8477673530578613} -08/30/2021 13:33:00 - INFO - __main__ - Step 1816: {'lr': 0.00045375, 'samples': 348672, 'steps': 1815, 'loss/train': 4.381932735443115} -08/30/2021 13:33:00 - INFO - __main__ - Step 1817: {'lr': 0.00045400000000000003, 'samples': 348864, 'steps': 1816, 'loss/train': 3.4737496376037598} -08/30/2021 13:33:01 - INFO - __main__ - Step 1818: {'lr': 0.00045425, 'samples': 349056, 'steps': 1817, 'loss/train': 4.0976972579956055} -08/30/2021 13:33:01 - INFO - __main__ - Step 1819: {'lr': 0.00045450000000000004, 'samples': 349248, 'steps': 1818, 'loss/train': 4.001212120056152} -08/30/2021 13:33:02 - INFO - __main__ - Step 1820: {'lr': 0.00045475, 'samples': 349440, 'steps': 1819, 'loss/train': 3.7729732990264893} -08/30/2021 13:33:03 - INFO - __main__ - Step 1821: {'lr': 0.000455, 'samples': 349632, 'steps': 1820, 'loss/train': 4.435334205627441} -08/30/2021 13:33:03 - INFO - __main__ - Step 1822: {'lr': 0.00045525, 'samples': 349824, 'steps': 1821, 'loss/train': 5.007040023803711} -08/30/2021 13:33:04 - INFO - __main__ - Step 1823: {'lr': 0.0004555, 'samples': 350016, 'steps': 1822, 'loss/train': 4.017209053039551} -08/30/2021 13:33:04 - INFO - __main__ - Step 1824: {'lr': 0.00045575, 'samples': 350208, 'steps': 1823, 'loss/train': 3.8874261379241943} -08/30/2021 13:33:06 - INFO - __main__ - Step 1825: {'lr': 0.000456, 'samples': 350400, 'steps': 1824, 'loss/train': 4.341891765594482} -08/30/2021 13:33:06 - INFO - __main__ - Step 1826: {'lr': 0.00045625, 'samples': 350592, 'steps': 1825, 'loss/train': 3.9138295650482178} -08/30/2021 13:33:06 - INFO - __main__ - Step 1827: {'lr': 0.00045650000000000004, 'samples': 350784, 'steps': 1826, 'loss/train': 4.223025798797607} -08/30/2021 13:33:07 - INFO - __main__ - Step 1828: {'lr': 0.00045675, 'samples': 350976, 'steps': 1827, 'loss/train': 4.082917213439941} -08/30/2021 13:33:07 - INFO - __main__ - Step 1829: {'lr': 0.00045700000000000005, 'samples': 351168, 'steps': 1828, 'loss/train': 3.6689260005950928} -08/30/2021 13:33:09 - INFO - __main__ - Step 1830: {'lr': 0.00045725, 'samples': 351360, 'steps': 1829, 'loss/train': 4.08038854598999} -08/30/2021 13:33:09 - INFO - __main__ - Step 1831: {'lr': 0.0004575, 'samples': 351552, 'steps': 1830, 'loss/train': 3.8469529151916504} -08/30/2021 13:33:10 - INFO - __main__ - Step 1832: {'lr': 0.00045775, 'samples': 351744, 'steps': 1831, 'loss/train': 3.804262161254883} -08/30/2021 13:33:10 - INFO - __main__ - Step 1833: {'lr': 0.000458, 'samples': 351936, 'steps': 1832, 'loss/train': 3.862908363342285} -08/30/2021 13:33:10 - INFO - __main__ - Step 1834: {'lr': 0.00045825, 'samples': 352128, 'steps': 1833, 'loss/train': 4.24948787689209} -08/30/2021 13:33:11 - INFO - __main__ - Step 1835: {'lr': 0.00045850000000000003, 'samples': 352320, 'steps': 1834, 'loss/train': 3.7653462886810303} -08/30/2021 13:33:13 - INFO - __main__ - Step 1836: {'lr': 0.00045875, 'samples': 352512, 'steps': 1835, 'loss/train': 3.9597079753875732} -08/30/2021 13:33:13 - INFO - __main__ - Step 1837: {'lr': 0.00045900000000000004, 'samples': 352704, 'steps': 1836, 'loss/train': 3.816056251525879} -08/30/2021 13:33:13 - INFO - __main__ - Step 1838: {'lr': 0.00045925, 'samples': 352896, 'steps': 1837, 'loss/train': 1.7432626485824585} -08/30/2021 13:33:14 - INFO - __main__ - Step 1839: {'lr': 0.00045950000000000006, 'samples': 353088, 'steps': 1838, 'loss/train': 3.7407479286193848} -08/30/2021 13:33:14 - INFO - __main__ - Step 1840: {'lr': 0.00045975, 'samples': 353280, 'steps': 1839, 'loss/train': 4.176888942718506} -08/30/2021 13:33:15 - INFO - __main__ - Step 1841: {'lr': 0.00046, 'samples': 353472, 'steps': 1840, 'loss/train': 3.407545328140259} -08/30/2021 13:33:16 - INFO - __main__ - Step 1842: {'lr': 0.00046025, 'samples': 353664, 'steps': 1841, 'loss/train': 4.078118324279785} -08/30/2021 13:33:16 - INFO - __main__ - Step 1843: {'lr': 0.0004605, 'samples': 353856, 'steps': 1842, 'loss/train': 3.4387409687042236} -08/30/2021 13:33:17 - INFO - __main__ - Step 1844: {'lr': 0.00046075, 'samples': 354048, 'steps': 1843, 'loss/train': 4.269843101501465} -08/30/2021 13:33:17 - INFO - __main__ - Step 1845: {'lr': 0.00046100000000000004, 'samples': 354240, 'steps': 1844, 'loss/train': 3.4776978492736816} -08/30/2021 13:33:19 - INFO - __main__ - Step 1846: {'lr': 0.00046125, 'samples': 354432, 'steps': 1845, 'loss/train': 3.323798418045044} -08/30/2021 13:33:19 - INFO - __main__ - Step 1847: {'lr': 0.00046150000000000005, 'samples': 354624, 'steps': 1846, 'loss/train': 3.570096015930176} -08/30/2021 13:33:19 - INFO - __main__ - Step 1848: {'lr': 0.00046175000000000003, 'samples': 354816, 'steps': 1847, 'loss/train': 4.458643436431885} -08/30/2021 13:33:20 - INFO - __main__ - Step 1849: {'lr': 0.000462, 'samples': 355008, 'steps': 1848, 'loss/train': 3.6618752479553223} -08/30/2021 13:33:20 - INFO - __main__ - Step 1850: {'lr': 0.00046225, 'samples': 355200, 'steps': 1849, 'loss/train': 4.308147430419922} -08/30/2021 13:33:22 - INFO - __main__ - Step 1851: {'lr': 0.0004625, 'samples': 355392, 'steps': 1850, 'loss/train': 4.221744060516357} -08/30/2021 13:33:22 - INFO - __main__ - Step 1852: {'lr': 0.00046275, 'samples': 355584, 'steps': 1851, 'loss/train': 4.10622501373291} -08/30/2021 13:33:23 - INFO - __main__ - Step 1853: {'lr': 0.00046300000000000003, 'samples': 355776, 'steps': 1852, 'loss/train': 3.997800588607788} -08/30/2021 13:33:23 - INFO - __main__ - Step 1854: {'lr': 0.00046325, 'samples': 355968, 'steps': 1853, 'loss/train': 3.75465726852417} -08/30/2021 13:33:23 - INFO - __main__ - Step 1855: {'lr': 0.00046350000000000004, 'samples': 356160, 'steps': 1854, 'loss/train': 6.074405193328857} -08/30/2021 13:33:24 - INFO - __main__ - Step 1856: {'lr': 0.00046375, 'samples': 356352, 'steps': 1855, 'loss/train': 4.297353744506836} -08/30/2021 13:33:25 - INFO - __main__ - Step 1857: {'lr': 0.00046400000000000006, 'samples': 356544, 'steps': 1856, 'loss/train': 3.6608734130859375} -08/30/2021 13:33:26 - INFO - __main__ - Step 1858: {'lr': 0.00046425, 'samples': 356736, 'steps': 1857, 'loss/train': 4.111756324768066} -08/30/2021 13:33:26 - INFO - __main__ - Step 1859: {'lr': 0.0004645, 'samples': 356928, 'steps': 1858, 'loss/train': 3.2915756702423096} -08/30/2021 13:33:26 - INFO - __main__ - Step 1860: {'lr': 0.00046475, 'samples': 357120, 'steps': 1859, 'loss/train': 4.302042007446289} -08/30/2021 13:33:27 - INFO - __main__ - Step 1861: {'lr': 0.000465, 'samples': 357312, 'steps': 1860, 'loss/train': 3.8228554725646973} -08/30/2021 13:33:28 - INFO - __main__ - Step 1862: {'lr': 0.00046525, 'samples': 357504, 'steps': 1861, 'loss/train': 3.304464817047119} -08/30/2021 13:33:29 - INFO - __main__ - Step 1863: {'lr': 0.00046550000000000004, 'samples': 357696, 'steps': 1862, 'loss/train': 4.269545078277588} -08/30/2021 13:33:29 - INFO - __main__ - Step 1864: {'lr': 0.00046575, 'samples': 357888, 'steps': 1863, 'loss/train': 3.2907872200012207} -08/30/2021 13:33:29 - INFO - __main__ - Step 1865: {'lr': 0.00046600000000000005, 'samples': 358080, 'steps': 1864, 'loss/train': 4.103222370147705} -08/30/2021 13:33:30 - INFO - __main__ - Step 1866: {'lr': 0.00046625000000000003, 'samples': 358272, 'steps': 1865, 'loss/train': 4.721673488616943} -08/30/2021 13:33:31 - INFO - __main__ - Step 1867: {'lr': 0.0004665, 'samples': 358464, 'steps': 1866, 'loss/train': 4.846536636352539} -08/30/2021 13:33:32 - INFO - __main__ - Step 1868: {'lr': 0.00046675, 'samples': 358656, 'steps': 1867, 'loss/train': 4.437201976776123} -08/30/2021 13:33:32 - INFO - __main__ - Step 1869: {'lr': 0.000467, 'samples': 358848, 'steps': 1868, 'loss/train': 3.9709482192993164} -08/30/2021 13:33:32 - INFO - __main__ - Step 1870: {'lr': 0.00046725, 'samples': 359040, 'steps': 1869, 'loss/train': 3.8383877277374268} -08/30/2021 13:33:33 - INFO - __main__ - Step 1871: {'lr': 0.00046750000000000003, 'samples': 359232, 'steps': 1870, 'loss/train': 3.8616721630096436} -08/30/2021 13:33:34 - INFO - __main__ - Step 1872: {'lr': 0.00046775, 'samples': 359424, 'steps': 1871, 'loss/train': 4.496031284332275} -08/30/2021 13:33:35 - INFO - __main__ - Step 1873: {'lr': 0.00046800000000000005, 'samples': 359616, 'steps': 1872, 'loss/train': 3.8477094173431396} -08/30/2021 13:33:35 - INFO - __main__ - Step 1874: {'lr': 0.00046825, 'samples': 359808, 'steps': 1873, 'loss/train': 3.4782001972198486} -08/30/2021 13:33:36 - INFO - __main__ - Step 1875: {'lr': 0.00046850000000000006, 'samples': 360000, 'steps': 1874, 'loss/train': 3.167875289916992} -08/30/2021 13:33:36 - INFO - __main__ - Step 1876: {'lr': 0.00046875, 'samples': 360192, 'steps': 1875, 'loss/train': 3.74480938911438} -08/30/2021 13:33:37 - INFO - __main__ - Step 1877: {'lr': 0.00046899999999999996, 'samples': 360384, 'steps': 1876, 'loss/train': 3.590226650238037} -08/30/2021 13:33:38 - INFO - __main__ - Step 1878: {'lr': 0.00046925, 'samples': 360576, 'steps': 1877, 'loss/train': 3.8205149173736572} -08/30/2021 13:33:38 - INFO - __main__ - Step 1879: {'lr': 0.0004695, 'samples': 360768, 'steps': 1878, 'loss/train': 4.053231716156006} -08/30/2021 13:33:38 - INFO - __main__ - Step 1880: {'lr': 0.00046975, 'samples': 360960, 'steps': 1879, 'loss/train': 4.020791530609131} -08/30/2021 13:33:39 - INFO - __main__ - Step 1881: {'lr': 0.00047, 'samples': 361152, 'steps': 1880, 'loss/train': 3.427460193634033} -08/30/2021 13:33:41 - INFO - __main__ - Step 1882: {'lr': 0.00047025, 'samples': 361344, 'steps': 1881, 'loss/train': 2.1546480655670166} -08/30/2021 13:33:41 - INFO - __main__ - Step 1883: {'lr': 0.0004705, 'samples': 361536, 'steps': 1882, 'loss/train': 4.243077278137207} -08/30/2021 13:33:42 - INFO - __main__ - Step 1884: {'lr': 0.00047075000000000003, 'samples': 361728, 'steps': 1883, 'loss/train': 4.100534915924072} -08/30/2021 13:33:42 - INFO - __main__ - Step 1885: {'lr': 0.000471, 'samples': 361920, 'steps': 1884, 'loss/train': 3.798335313796997} -08/30/2021 13:33:42 - INFO - __main__ - Step 1886: {'lr': 0.00047125, 'samples': 362112, 'steps': 1885, 'loss/train': 4.3711466789245605} -08/30/2021 13:33:43 - INFO - __main__ - Step 1887: {'lr': 0.00047149999999999997, 'samples': 362304, 'steps': 1886, 'loss/train': 3.492220640182495} -08/30/2021 13:33:44 - INFO - __main__ - Step 1888: {'lr': 0.00047175, 'samples': 362496, 'steps': 1887, 'loss/train': 4.2310662269592285} -08/30/2021 13:33:45 - INFO - __main__ - Step 1889: {'lr': 0.000472, 'samples': 362688, 'steps': 1888, 'loss/train': 3.697628974914551} -08/30/2021 13:33:45 - INFO - __main__ - Step 1890: {'lr': 0.00047225, 'samples': 362880, 'steps': 1889, 'loss/train': 4.416256904602051} -08/30/2021 13:33:46 - INFO - __main__ - Step 1891: {'lr': 0.0004725, 'samples': 363072, 'steps': 1890, 'loss/train': 5.274457931518555} -08/30/2021 13:33:46 - INFO - __main__ - Step 1892: {'lr': 0.00047275, 'samples': 363264, 'steps': 1891, 'loss/train': 4.132111549377441} -08/30/2021 13:33:48 - INFO - __main__ - Step 1893: {'lr': 0.000473, 'samples': 363456, 'steps': 1892, 'loss/train': 4.002604007720947} -08/30/2021 13:33:48 - INFO - __main__ - Step 1894: {'lr': 0.00047325000000000004, 'samples': 363648, 'steps': 1893, 'loss/train': 4.229362964630127} -08/30/2021 13:33:48 - INFO - __main__ - Step 1895: {'lr': 0.00047349999999999996, 'samples': 363840, 'steps': 1894, 'loss/train': 4.218633651733398} -08/30/2021 13:33:49 - INFO - __main__ - Step 1896: {'lr': 0.00047375, 'samples': 364032, 'steps': 1895, 'loss/train': 5.024405479431152} -08/30/2021 13:33:49 - INFO - __main__ - Step 1897: {'lr': 0.000474, 'samples': 364224, 'steps': 1896, 'loss/train': 4.995138645172119} -08/30/2021 13:33:49 - INFO - __main__ - Step 1898: {'lr': 0.00047425, 'samples': 364416, 'steps': 1897, 'loss/train': 4.169946193695068} -08/30/2021 13:33:51 - INFO - __main__ - Step 1899: {'lr': 0.0004745, 'samples': 364608, 'steps': 1898, 'loss/train': 4.533463001251221} -08/30/2021 13:33:51 - INFO - __main__ - Step 1900: {'lr': 0.00047475, 'samples': 364800, 'steps': 1899, 'loss/train': 3.4824893474578857} -08/30/2021 13:33:52 - INFO - __main__ - Step 1901: {'lr': 0.000475, 'samples': 364992, 'steps': 1900, 'loss/train': 4.135907173156738} -08/30/2021 13:33:52 - INFO - __main__ - Step 1902: {'lr': 0.00047525000000000003, 'samples': 365184, 'steps': 1901, 'loss/train': 2.825798988342285} -08/30/2021 13:33:52 - INFO - __main__ - Step 1903: {'lr': 0.0004755, 'samples': 365376, 'steps': 1902, 'loss/train': 3.729189872741699} -08/30/2021 13:33:54 - INFO - __main__ - Step 1904: {'lr': 0.00047575, 'samples': 365568, 'steps': 1903, 'loss/train': 4.196805477142334} -08/30/2021 13:33:54 - INFO - __main__ - Step 1905: {'lr': 0.00047599999999999997, 'samples': 365760, 'steps': 1904, 'loss/train': 4.139028549194336} -08/30/2021 13:33:55 - INFO - __main__ - Step 1906: {'lr': 0.00047625, 'samples': 365952, 'steps': 1905, 'loss/train': 4.455804824829102} -08/30/2021 13:33:55 - INFO - __main__ - Step 1907: {'lr': 0.0004765, 'samples': 366144, 'steps': 1906, 'loss/train': 3.751356840133667} -08/30/2021 13:33:55 - INFO - __main__ - Step 1908: {'lr': 0.00047675, 'samples': 366336, 'steps': 1907, 'loss/train': 3.362111806869507} -08/30/2021 13:33:57 - INFO - __main__ - Step 1909: {'lr': 0.000477, 'samples': 366528, 'steps': 1908, 'loss/train': 3.608022928237915} -08/30/2021 13:33:57 - INFO - __main__ - Step 1910: {'lr': 0.00047725, 'samples': 366720, 'steps': 1909, 'loss/train': 2.9700682163238525} -08/30/2021 13:33:58 - INFO - __main__ - Step 1911: {'lr': 0.0004775, 'samples': 366912, 'steps': 1910, 'loss/train': 4.289870738983154} -08/30/2021 13:33:58 - INFO - __main__ - Step 1912: {'lr': 0.00047775000000000004, 'samples': 367104, 'steps': 1911, 'loss/train': 4.144138336181641} -08/30/2021 13:33:58 - INFO - __main__ - Step 1913: {'lr': 0.00047799999999999996, 'samples': 367296, 'steps': 1912, 'loss/train': 4.10355281829834} -08/30/2021 13:34:00 - INFO - __main__ - Step 1914: {'lr': 0.00047825, 'samples': 367488, 'steps': 1913, 'loss/train': 2.017336368560791} -08/30/2021 13:34:00 - INFO - __main__ - Step 1915: {'lr': 0.0004785, 'samples': 367680, 'steps': 1914, 'loss/train': 3.983057975769043} -08/30/2021 13:34:01 - INFO - __main__ - Step 1916: {'lr': 0.00047875, 'samples': 367872, 'steps': 1915, 'loss/train': 3.5344715118408203} -08/30/2021 13:34:01 - INFO - __main__ - Step 1917: {'lr': 0.000479, 'samples': 368064, 'steps': 1916, 'loss/train': 3.5695202350616455} -08/30/2021 13:34:01 - INFO - __main__ - Step 1918: {'lr': 0.00047925, 'samples': 368256, 'steps': 1917, 'loss/train': 3.8029837608337402} -08/30/2021 13:34:02 - INFO - __main__ - Step 1919: {'lr': 0.0004795, 'samples': 368448, 'steps': 1918, 'loss/train': 4.074838638305664} -08/30/2021 13:34:03 - INFO - __main__ - Step 1920: {'lr': 0.00047975000000000003, 'samples': 368640, 'steps': 1919, 'loss/train': 3.663607120513916} -08/30/2021 13:34:04 - INFO - __main__ - Step 1921: {'lr': 0.00048, 'samples': 368832, 'steps': 1920, 'loss/train': 3.7792277336120605} -08/30/2021 13:34:04 - INFO - __main__ - Step 1922: {'lr': 0.00048025000000000005, 'samples': 369024, 'steps': 1921, 'loss/train': 3.6022844314575195} -08/30/2021 13:34:04 - INFO - __main__ - Step 1923: {'lr': 0.00048049999999999997, 'samples': 369216, 'steps': 1922, 'loss/train': 4.036792278289795} -08/30/2021 13:34:05 - INFO - __main__ - Step 1924: {'lr': 0.00048075, 'samples': 369408, 'steps': 1923, 'loss/train': 4.241264820098877} -08/30/2021 13:34:07 - INFO - __main__ - Step 1925: {'lr': 0.000481, 'samples': 369600, 'steps': 1924, 'loss/train': 3.9819133281707764} -08/30/2021 13:34:07 - INFO - __main__ - Step 1926: {'lr': 0.00048125, 'samples': 369792, 'steps': 1925, 'loss/train': 3.559974431991577} -08/30/2021 13:34:07 - INFO - __main__ - Step 1927: {'lr': 0.0004815, 'samples': 369984, 'steps': 1926, 'loss/train': 3.747083902359009} -08/30/2021 13:34:08 - INFO - __main__ - Step 1928: {'lr': 0.00048175000000000003, 'samples': 370176, 'steps': 1927, 'loss/train': 1.3425077199935913} -08/30/2021 13:34:08 - INFO - __main__ - Step 1929: {'lr': 0.000482, 'samples': 370368, 'steps': 1928, 'loss/train': 4.593088150024414} -08/30/2021 13:34:10 - INFO - __main__ - Step 1930: {'lr': 0.00048225000000000004, 'samples': 370560, 'steps': 1929, 'loss/train': 4.031519889831543} -08/30/2021 13:34:10 - INFO - __main__ - Step 1931: {'lr': 0.0004825, 'samples': 370752, 'steps': 1930, 'loss/train': 3.6667327880859375} -08/30/2021 13:34:10 - INFO - __main__ - Step 1932: {'lr': 0.00048275, 'samples': 370944, 'steps': 1931, 'loss/train': 3.720813512802124} -08/30/2021 13:34:11 - INFO - __main__ - Step 1933: {'lr': 0.000483, 'samples': 371136, 'steps': 1932, 'loss/train': 3.514467716217041} -08/30/2021 13:34:11 - INFO - __main__ - Step 1934: {'lr': 0.00048325, 'samples': 371328, 'steps': 1933, 'loss/train': 3.9238007068634033} -08/30/2021 13:34:13 - INFO - __main__ - Step 1935: {'lr': 0.0004835, 'samples': 371520, 'steps': 1934, 'loss/train': 4.041956424713135} -08/30/2021 13:34:14 - INFO - __main__ - Step 1936: {'lr': 0.00048375, 'samples': 371712, 'steps': 1935, 'loss/train': 3.0714752674102783} -08/30/2021 13:34:14 - INFO - __main__ - Step 1937: {'lr': 0.000484, 'samples': 371904, 'steps': 1936, 'loss/train': 3.7970077991485596} -08/30/2021 13:34:15 - INFO - __main__ - Step 1938: {'lr': 0.00048425000000000003, 'samples': 372096, 'steps': 1937, 'loss/train': 1.7311993837356567} -08/30/2021 13:34:15 - INFO - __main__ - Step 1939: {'lr': 0.0004845, 'samples': 372288, 'steps': 1938, 'loss/train': 5.09821891784668} -08/30/2021 13:34:16 - INFO - __main__ - Step 1940: {'lr': 0.00048475000000000005, 'samples': 372480, 'steps': 1939, 'loss/train': 4.333300590515137} -08/30/2021 13:34:17 - INFO - __main__ - Step 1941: {'lr': 0.00048499999999999997, 'samples': 372672, 'steps': 1940, 'loss/train': 4.0591020584106445} -08/30/2021 13:34:17 - INFO - __main__ - Step 1942: {'lr': 0.00048525, 'samples': 372864, 'steps': 1941, 'loss/train': 3.329667329788208} -08/30/2021 13:34:18 - INFO - __main__ - Step 1943: {'lr': 0.0004855, 'samples': 373056, 'steps': 1942, 'loss/train': 3.636807441711426} -08/30/2021 13:34:18 - INFO - __main__ - Step 1944: {'lr': 0.00048575, 'samples': 373248, 'steps': 1943, 'loss/train': 4.212170124053955} -08/30/2021 13:34:18 - INFO - __main__ - Step 1945: {'lr': 0.000486, 'samples': 373440, 'steps': 1944, 'loss/train': 3.7817118167877197} -08/30/2021 13:34:20 - INFO - __main__ - Step 1946: {'lr': 0.00048625000000000003, 'samples': 373632, 'steps': 1945, 'loss/train': 3.895685911178589} -08/30/2021 13:34:20 - INFO - __main__ - Step 1947: {'lr': 0.0004865, 'samples': 373824, 'steps': 1946, 'loss/train': 4.491222381591797} -08/30/2021 13:34:21 - INFO - __main__ - Step 1948: {'lr': 0.00048675000000000004, 'samples': 374016, 'steps': 1947, 'loss/train': 4.426873207092285} -08/30/2021 13:34:21 - INFO - __main__ - Step 1949: {'lr': 0.000487, 'samples': 374208, 'steps': 1948, 'loss/train': 3.7109720706939697} -08/30/2021 13:34:22 - INFO - __main__ - Step 1950: {'lr': 0.00048725000000000005, 'samples': 374400, 'steps': 1949, 'loss/train': 4.7153778076171875} -08/30/2021 13:34:23 - INFO - __main__ - Step 1951: {'lr': 0.0004875, 'samples': 374592, 'steps': 1950, 'loss/train': 4.433164119720459} -08/30/2021 13:34:23 - INFO - __main__ - Step 1952: {'lr': 0.00048775, 'samples': 374784, 'steps': 1951, 'loss/train': 4.409071445465088} -08/30/2021 13:34:24 - INFO - __main__ - Step 1953: {'lr': 0.000488, 'samples': 374976, 'steps': 1952, 'loss/train': 3.639925003051758} -08/30/2021 13:34:24 - INFO - __main__ - Step 1954: {'lr': 0.00048825, 'samples': 375168, 'steps': 1953, 'loss/train': 3.6265134811401367} -08/30/2021 13:34:24 - INFO - __main__ - Step 1955: {'lr': 0.0004885, 'samples': 375360, 'steps': 1954, 'loss/train': 4.043466091156006} -08/30/2021 13:34:26 - INFO - __main__ - Step 1956: {'lr': 0.00048875, 'samples': 375552, 'steps': 1955, 'loss/train': 3.6802093982696533} -08/30/2021 13:34:26 - INFO - __main__ - Step 1957: {'lr': 0.000489, 'samples': 375744, 'steps': 1956, 'loss/train': 3.76971173286438} -08/30/2021 13:34:27 - INFO - __main__ - Step 1958: {'lr': 0.00048925, 'samples': 375936, 'steps': 1957, 'loss/train': 4.56354284286499} -08/30/2021 13:34:27 - INFO - __main__ - Step 1959: {'lr': 0.0004895, 'samples': 376128, 'steps': 1958, 'loss/train': 4.015387535095215} -08/30/2021 13:34:27 - INFO - __main__ - Step 1960: {'lr': 0.0004897500000000001, 'samples': 376320, 'steps': 1959, 'loss/train': 3.3302128314971924} -08/30/2021 13:34:29 - INFO - __main__ - Step 1961: {'lr': 0.00049, 'samples': 376512, 'steps': 1960, 'loss/train': 3.9128339290618896} -08/30/2021 13:34:30 - INFO - __main__ - Step 1962: {'lr': 0.00049025, 'samples': 376704, 'steps': 1961, 'loss/train': 3.8968732357025146} -08/30/2021 13:34:30 - INFO - __main__ - Step 1963: {'lr': 0.0004905, 'samples': 376896, 'steps': 1962, 'loss/train': 3.8942291736602783} -08/30/2021 13:34:31 - INFO - __main__ - Step 1964: {'lr': 0.0004907500000000001, 'samples': 377088, 'steps': 1963, 'loss/train': 3.332982301712036} -08/30/2021 13:34:31 - INFO - __main__ - Step 1965: {'lr': 0.000491, 'samples': 377280, 'steps': 1964, 'loss/train': 2.7537074089050293} -08/30/2021 13:34:31 - INFO - __main__ - Step 1966: {'lr': 0.00049125, 'samples': 377472, 'steps': 1965, 'loss/train': 3.9287052154541016} -08/30/2021 13:34:32 - INFO - __main__ - Step 1967: {'lr': 0.0004915, 'samples': 377664, 'steps': 1966, 'loss/train': 4.603787899017334} -08/30/2021 13:34:33 - INFO - __main__ - Step 1968: {'lr': 0.00049175, 'samples': 377856, 'steps': 1967, 'loss/train': 4.50520658493042} -08/30/2021 13:34:34 - INFO - __main__ - Step 1969: {'lr': 0.000492, 'samples': 378048, 'steps': 1968, 'loss/train': 4.162574768066406} -08/30/2021 13:34:34 - INFO - __main__ - Step 1970: {'lr': 0.0004922500000000001, 'samples': 378240, 'steps': 1969, 'loss/train': 3.282855987548828} -08/30/2021 13:34:35 - INFO - __main__ - Step 1971: {'lr': 0.0004925, 'samples': 378432, 'steps': 1970, 'loss/train': 4.245908737182617} -08/30/2021 13:34:35 - INFO - __main__ - Step 1972: {'lr': 0.00049275, 'samples': 378624, 'steps': 1971, 'loss/train': 4.855228424072266} -08/30/2021 13:34:37 - INFO - __main__ - Step 1973: {'lr': 0.0004930000000000001, 'samples': 378816, 'steps': 1972, 'loss/train': 2.7747647762298584} -08/30/2021 13:34:37 - INFO - __main__ - Step 1974: {'lr': 0.00049325, 'samples': 379008, 'steps': 1973, 'loss/train': 1.6275231838226318} -08/30/2021 13:34:38 - INFO - __main__ - Step 1975: {'lr': 0.0004935, 'samples': 379200, 'steps': 1974, 'loss/train': 3.992391586303711} -08/30/2021 13:34:38 - INFO - __main__ - Step 1976: {'lr': 0.00049375, 'samples': 379392, 'steps': 1975, 'loss/train': 3.8086373805999756} -08/30/2021 13:34:38 - INFO - __main__ - Step 1977: {'lr': 0.000494, 'samples': 379584, 'steps': 1976, 'loss/train': 3.5776429176330566} -08/30/2021 13:34:40 - INFO - __main__ - Step 1978: {'lr': 0.00049425, 'samples': 379776, 'steps': 1977, 'loss/train': 3.87422776222229} -08/30/2021 13:34:40 - INFO - __main__ - Step 1979: {'lr': 0.0004945, 'samples': 379968, 'steps': 1978, 'loss/train': 3.7341365814208984} -08/30/2021 13:34:41 - INFO - __main__ - Step 1980: {'lr': 0.0004947500000000001, 'samples': 380160, 'steps': 1979, 'loss/train': 4.149728298187256} -08/30/2021 13:34:41 - INFO - __main__ - Step 1981: {'lr': 0.000495, 'samples': 380352, 'steps': 1980, 'loss/train': 4.304142951965332} -08/30/2021 13:34:41 - INFO - __main__ - Step 1982: {'lr': 0.00049525, 'samples': 380544, 'steps': 1981, 'loss/train': 2.1806108951568604} -08/30/2021 13:34:42 - INFO - __main__ - Step 1983: {'lr': 0.0004955, 'samples': 380736, 'steps': 1982, 'loss/train': 4.651204586029053} -08/30/2021 13:34:43 - INFO - __main__ - Step 1984: {'lr': 0.00049575, 'samples': 380928, 'steps': 1983, 'loss/train': 4.128410816192627} -08/30/2021 13:34:44 - INFO - __main__ - Step 1985: {'lr': 0.000496, 'samples': 381120, 'steps': 1984, 'loss/train': 4.110437393188477} -08/30/2021 13:34:44 - INFO - __main__ - Step 1986: {'lr': 0.0004962500000000001, 'samples': 381312, 'steps': 1985, 'loss/train': 3.878854990005493} -08/30/2021 13:34:44 - INFO - __main__ - Step 1987: {'lr': 0.0004965, 'samples': 381504, 'steps': 1986, 'loss/train': 3.836554765701294} -08/30/2021 13:34:45 - INFO - __main__ - Step 1988: {'lr': 0.00049675, 'samples': 381696, 'steps': 1987, 'loss/train': 3.9784555435180664} -08/30/2021 13:34:47 - INFO - __main__ - Step 1989: {'lr': 0.000497, 'samples': 381888, 'steps': 1988, 'loss/train': 4.467948913574219} -08/30/2021 13:34:47 - INFO - __main__ - Step 1990: {'lr': 0.0004972500000000001, 'samples': 382080, 'steps': 1989, 'loss/train': 3.5761940479278564} -08/30/2021 13:34:48 - INFO - __main__ - Step 1991: {'lr': 0.0004975, 'samples': 382272, 'steps': 1990, 'loss/train': 3.889935255050659} -08/30/2021 13:34:48 - INFO - __main__ - Step 1992: {'lr': 0.00049775, 'samples': 382464, 'steps': 1991, 'loss/train': 3.6736230850219727} -08/30/2021 13:34:48 - INFO - __main__ - Step 1993: {'lr': 0.000498, 'samples': 382656, 'steps': 1992, 'loss/train': 3.549931049346924} -08/30/2021 13:34:50 - INFO - __main__ - Step 1994: {'lr': 0.00049825, 'samples': 382848, 'steps': 1993, 'loss/train': 2.8372669219970703} -08/30/2021 13:34:50 - INFO - __main__ - Step 1995: {'lr': 0.0004985, 'samples': 383040, 'steps': 1994, 'loss/train': 4.642188549041748} -08/30/2021 13:34:51 - INFO - __main__ - Step 1996: {'lr': 0.0004987500000000001, 'samples': 383232, 'steps': 1995, 'loss/train': 4.633870601654053} -08/30/2021 13:34:51 - INFO - __main__ - Step 1997: {'lr': 0.000499, 'samples': 383424, 'steps': 1996, 'loss/train': 4.201652526855469} -08/30/2021 13:34:51 - INFO - __main__ - Step 1998: {'lr': 0.00049925, 'samples': 383616, 'steps': 1997, 'loss/train': 3.846168041229248} -08/30/2021 13:34:53 - INFO - __main__ - Step 1999: {'lr': 0.0004995, 'samples': 383808, 'steps': 1998, 'loss/train': 3.3808515071868896} -08/30/2021 13:34:53 - INFO - __main__ - Step 2000: {'lr': 0.0004997500000000001, 'samples': 384000, 'steps': 1999, 'loss/train': 4.1292548179626465} -08/30/2021 13:34:54 - INFO - __main__ - Step 2001: {'lr': 0.0005, 'samples': 384192, 'steps': 2000, 'loss/train': 2.4327993392944336} -08/30/2021 13:34:54 - INFO - __main__ - Step 2002: {'lr': 0.0004999999999436769, 'samples': 384384, 'steps': 2001, 'loss/train': 4.1023712158203125} -08/30/2021 13:34:54 - INFO - __main__ - Step 2003: {'lr': 0.0004999999997747077, 'samples': 384576, 'steps': 2002, 'loss/train': 3.875941276550293} -08/30/2021 13:34:55 - INFO - __main__ - Step 2004: {'lr': 0.0004999999994930923, 'samples': 384768, 'steps': 2003, 'loss/train': 4.333718776702881} -08/30/2021 13:34:56 - INFO - __main__ - Step 2005: {'lr': 0.0004999999990988309, 'samples': 384960, 'steps': 2004, 'loss/train': 4.039220333099365} -08/30/2021 13:34:57 - INFO - __main__ - Step 2006: {'lr': 0.0004999999985919232, 'samples': 385152, 'steps': 2005, 'loss/train': 2.0358545780181885} -08/30/2021 13:34:57 - INFO - __main__ - Step 2007: {'lr': 0.0004999999979723695, 'samples': 385344, 'steps': 2006, 'loss/train': 3.6348371505737305} -08/30/2021 13:34:57 - INFO - __main__ - Step 2008: {'lr': 0.0004999999972401696, 'samples': 385536, 'steps': 2007, 'loss/train': 3.984771490097046} -08/30/2021 13:34:58 - INFO - __main__ - Step 2009: {'lr': 0.0004999999963953234, 'samples': 385728, 'steps': 2008, 'loss/train': 3.0698065757751465} -08/30/2021 13:34:59 - INFO - __main__ - Step 2010: {'lr': 0.0004999999954378312, 'samples': 385920, 'steps': 2009, 'loss/train': 2.84944486618042} -08/30/2021 13:35:00 - INFO - __main__ - Step 2011: {'lr': 0.000499999994367693, 'samples': 386112, 'steps': 2010, 'loss/train': 3.788355827331543} -08/30/2021 13:35:00 - INFO - __main__ - Step 2012: {'lr': 0.0004999999931849084, 'samples': 386304, 'steps': 2011, 'loss/train': 3.836803674697876} -08/30/2021 13:35:01 - INFO - __main__ - Step 2013: {'lr': 0.0004999999918894778, 'samples': 386496, 'steps': 2012, 'loss/train': 4.112085342407227} -08/30/2021 13:35:01 - INFO - __main__ - Step 2014: {'lr': 0.000499999990481401, 'samples': 386688, 'steps': 2013, 'loss/train': 3.578673839569092} -08/30/2021 13:35:02 - INFO - __main__ - Step 2015: {'lr': 0.0004999999889606781, 'samples': 386880, 'steps': 2014, 'loss/train': 2.6813108921051025} -08/30/2021 13:35:03 - INFO - __main__ - Step 2016: {'lr': 0.0004999999873273091, 'samples': 387072, 'steps': 2015, 'loss/train': 3.8371644020080566} -08/30/2021 13:35:03 - INFO - __main__ - Step 2017: {'lr': 0.000499999985581294, 'samples': 387264, 'steps': 2016, 'loss/train': 3.4323573112487793} -08/30/2021 13:35:04 - INFO - __main__ - Step 2018: {'lr': 0.0004999999837226326, 'samples': 387456, 'steps': 2017, 'loss/train': 3.466071128845215} -08/30/2021 13:35:04 - INFO - __main__ - Step 2019: {'lr': 0.0004999999817513252, 'samples': 387648, 'steps': 2018, 'loss/train': 3.250668525695801} -08/30/2021 13:35:06 - INFO - __main__ - Step 2020: {'lr': 0.0004999999796673716, 'samples': 387840, 'steps': 2019, 'loss/train': 3.8105993270874023} -08/30/2021 13:35:06 - INFO - __main__ - Step 2021: {'lr': 0.0004999999774707719, 'samples': 388032, 'steps': 2020, 'loss/train': 3.876354217529297} -08/30/2021 13:35:06 - INFO - __main__ - Step 2022: {'lr': 0.0004999999751615261, 'samples': 388224, 'steps': 2021, 'loss/train': 3.8295605182647705} -08/30/2021 13:35:07 - INFO - __main__ - Step 2023: {'lr': 0.0004999999727396341, 'samples': 388416, 'steps': 2022, 'loss/train': 1.8050475120544434} -08/30/2021 13:35:07 - INFO - __main__ - Step 2024: {'lr': 0.0004999999702050959, 'samples': 388608, 'steps': 2023, 'loss/train': 4.379288196563721} -08/30/2021 13:35:09 - INFO - __main__ - Step 2025: {'lr': 0.0004999999675579118, 'samples': 388800, 'steps': 2024, 'loss/train': 1.515298843383789} -08/30/2021 13:35:09 - INFO - __main__ - Step 2026: {'lr': 0.0004999999647980814, 'samples': 388992, 'steps': 2025, 'loss/train': 4.223230361938477} -08/30/2021 13:35:10 - INFO - __main__ - Step 2027: {'lr': 0.0004999999619256049, 'samples': 389184, 'steps': 2026, 'loss/train': 3.5991108417510986} -08/30/2021 13:35:10 - INFO - __main__ - Step 2028: {'lr': 0.0004999999589404822, 'samples': 389376, 'steps': 2027, 'loss/train': 4.679903984069824} -08/30/2021 13:35:10 - INFO - __main__ - Step 2029: {'lr': 0.0004999999558427136, 'samples': 389568, 'steps': 2028, 'loss/train': 3.4045114517211914} -08/30/2021 13:35:11 - INFO - __main__ - Step 2030: {'lr': 0.0004999999526322987, 'samples': 389760, 'steps': 2029, 'loss/train': 4.606021404266357} -08/30/2021 13:35:12 - INFO - __main__ - Step 2031: {'lr': 0.0004999999493092377, 'samples': 389952, 'steps': 2030, 'loss/train': 3.9545929431915283} -08/30/2021 13:35:13 - INFO - __main__ - Step 2032: {'lr': 0.0004999999458735306, 'samples': 390144, 'steps': 2031, 'loss/train': 4.512197971343994} -08/30/2021 13:35:13 - INFO - __main__ - Step 2033: {'lr': 0.0004999999423251774, 'samples': 390336, 'steps': 2032, 'loss/train': 4.206327438354492} -08/30/2021 13:35:13 - INFO - __main__ - Step 2034: {'lr': 0.0004999999386641781, 'samples': 390528, 'steps': 2033, 'loss/train': 3.3928580284118652} -08/30/2021 13:35:14 - INFO - __main__ - Step 2035: {'lr': 0.0004999999348905326, 'samples': 390720, 'steps': 2034, 'loss/train': 3.4217634201049805} -08/30/2021 13:35:16 - INFO - __main__ - Step 2036: {'lr': 0.000499999931004241, 'samples': 390912, 'steps': 2035, 'loss/train': 3.896252393722534} -08/30/2021 13:35:16 - INFO - __main__ - Step 2037: {'lr': 0.0004999999270053034, 'samples': 391104, 'steps': 2036, 'loss/train': 4.458357334136963} -08/30/2021 13:35:16 - INFO - __main__ - Step 2038: {'lr': 0.0004999999228937196, 'samples': 391296, 'steps': 2037, 'loss/train': 1.3921507596969604} -08/30/2021 13:35:17 - INFO - __main__ - Step 2039: {'lr': 0.0004999999186694897, 'samples': 391488, 'steps': 2038, 'loss/train': 3.886890172958374} -08/30/2021 13:35:17 - INFO - __main__ - Step 2040: {'lr': 0.0004999999143326137, 'samples': 391680, 'steps': 2039, 'loss/train': 3.7923433780670166} -08/30/2021 13:35:18 - INFO - __main__ - Step 2041: {'lr': 0.0004999999098830916, 'samples': 391872, 'steps': 2040, 'loss/train': 3.740668773651123} -08/30/2021 13:35:19 - INFO - __main__ - Step 2042: {'lr': 0.0004999999053209235, 'samples': 392064, 'steps': 2041, 'loss/train': 2.651597499847412} -08/30/2021 13:35:20 - INFO - __main__ - Step 2043: {'lr': 0.0004999999006461091, 'samples': 392256, 'steps': 2042, 'loss/train': 3.898331642150879} -08/30/2021 13:35:20 - INFO - __main__ - Step 2044: {'lr': 0.0004999998958586487, 'samples': 392448, 'steps': 2043, 'loss/train': 3.453770399093628} -08/30/2021 13:35:20 - INFO - __main__ - Step 2045: {'lr': 0.0004999998909585423, 'samples': 392640, 'steps': 2044, 'loss/train': 3.8533713817596436} -08/30/2021 13:35:21 - INFO - __main__ - Step 2046: {'lr': 0.0004999998859457896, 'samples': 392832, 'steps': 2045, 'loss/train': 3.980863571166992} -08/30/2021 13:35:23 - INFO - __main__ - Step 2047: {'lr': 0.0004999998808203909, 'samples': 393024, 'steps': 2046, 'loss/train': 4.354173183441162} -08/30/2021 13:35:23 - INFO - __main__ - Step 2048: {'lr': 0.0004999998755823462, 'samples': 393216, 'steps': 2047, 'loss/train': 4.712317943572998} -08/30/2021 13:35:24 - INFO - __main__ - Step 2049: {'lr': 0.0004999998702316553, 'samples': 393408, 'steps': 2048, 'loss/train': 3.9165966510772705} -08/30/2021 13:35:24 - INFO - __main__ - Step 2050: {'lr': 0.0004999998647683184, 'samples': 393600, 'steps': 2049, 'loss/train': 4.144590854644775} -08/30/2021 13:35:24 - INFO - __main__ - Step 2051: {'lr': 0.0004999998591923353, 'samples': 393792, 'steps': 2050, 'loss/train': 4.262177467346191} -08/30/2021 13:35:25 - INFO - __main__ - Step 2052: {'lr': 0.0004999998535037063, 'samples': 393984, 'steps': 2051, 'loss/train': 3.439192295074463} -08/30/2021 13:35:26 - INFO - __main__ - Step 2053: {'lr': 0.0004999998477024311, 'samples': 394176, 'steps': 2052, 'loss/train': 4.031076908111572} -08/30/2021 13:35:27 - INFO - __main__ - Step 2054: {'lr': 0.0004999998417885099, 'samples': 394368, 'steps': 2053, 'loss/train': 4.544736385345459} -08/30/2021 13:35:27 - INFO - __main__ - Step 2055: {'lr': 0.0004999998357619425, 'samples': 394560, 'steps': 2054, 'loss/train': 4.259439468383789} -08/30/2021 13:35:27 - INFO - __main__ - Step 2056: {'lr': 0.0004999998296227291, 'samples': 394752, 'steps': 2055, 'loss/train': 3.7828798294067383} -08/30/2021 13:35:28 - INFO - __main__ - Step 2057: {'lr': 0.0004999998233708697, 'samples': 394944, 'steps': 2056, 'loss/train': 3.885012626647949} -08/30/2021 13:35:29 - INFO - __main__ - Step 2058: {'lr': 0.0004999998170063642, 'samples': 395136, 'steps': 2057, 'loss/train': 4.150326251983643} -08/30/2021 13:35:30 - INFO - __main__ - Step 2059: {'lr': 0.0004999998105292126, 'samples': 395328, 'steps': 2058, 'loss/train': 3.841209888458252} -08/30/2021 13:35:30 - INFO - __main__ - Step 2060: {'lr': 0.000499999803939415, 'samples': 395520, 'steps': 2059, 'loss/train': 4.630417346954346} -08/30/2021 13:35:30 - INFO - __main__ - Step 2061: {'lr': 0.0004999997972369713, 'samples': 395712, 'steps': 2060, 'loss/train': 3.6309611797332764} -08/30/2021 13:35:31 - INFO - __main__ - Step 2062: {'lr': 0.0004999997904218816, 'samples': 395904, 'steps': 2061, 'loss/train': 4.3275017738342285} -08/30/2021 13:35:33 - INFO - __main__ - Step 2063: {'lr': 0.0004999997834941459, 'samples': 396096, 'steps': 2062, 'loss/train': 3.459217071533203} -08/30/2021 13:35:33 - INFO - __main__ - Step 2064: {'lr': 0.000499999776453764, 'samples': 396288, 'steps': 2063, 'loss/train': 3.7469112873077393} -08/30/2021 13:35:34 - INFO - __main__ - Step 2065: {'lr': 0.0004999997693007361, 'samples': 396480, 'steps': 2064, 'loss/train': 1.6411480903625488} -08/30/2021 13:35:34 - INFO - __main__ - Step 2066: {'lr': 0.0004999997620350622, 'samples': 396672, 'steps': 2065, 'loss/train': 4.02923583984375} -08/30/2021 13:35:34 - INFO - __main__ - Step 2067: {'lr': 0.0004999997546567423, 'samples': 396864, 'steps': 2066, 'loss/train': 4.513978481292725} -08/30/2021 13:35:35 - INFO - __main__ - Step 2068: {'lr': 0.0004999997471657763, 'samples': 397056, 'steps': 2067, 'loss/train': 4.028714656829834} -08/30/2021 13:35:36 - INFO - __main__ - Step 2069: {'lr': 0.0004999997395621642, 'samples': 397248, 'steps': 2068, 'loss/train': 5.7790045738220215} -08/30/2021 13:35:37 - INFO - __main__ - Step 2070: {'lr': 0.0004999997318459064, 'samples': 397440, 'steps': 2069, 'loss/train': 3.2854936122894287} -08/30/2021 13:35:37 - INFO - __main__ - Step 2071: {'lr': 0.0004999997240170023, 'samples': 397632, 'steps': 2070, 'loss/train': 4.750792503356934} -08/30/2021 13:35:38 - INFO - __main__ - Step 2072: {'lr': 0.0004999997160754522, 'samples': 397824, 'steps': 2071, 'loss/train': 3.8799290657043457} -08/30/2021 13:35:38 - INFO - __main__ - Step 2073: {'lr': 0.0004999997080212561, 'samples': 398016, 'steps': 2072, 'loss/train': 3.8270981311798096} -08/30/2021 13:35:39 - INFO - __main__ - Step 2074: {'lr': 0.000499999699854414, 'samples': 398208, 'steps': 2073, 'loss/train': 3.9468932151794434} -08/30/2021 13:35:40 - INFO - __main__ - Step 2075: {'lr': 0.0004999996915749259, 'samples': 398400, 'steps': 2074, 'loss/train': 4.303092956542969} -08/30/2021 13:35:40 - INFO - __main__ - Step 2076: {'lr': 0.0004999996831827918, 'samples': 398592, 'steps': 2075, 'loss/train': 4.116118431091309} -08/30/2021 13:35:40 - INFO - __main__ - Step 2077: {'lr': 0.0004999996746780117, 'samples': 398784, 'steps': 2076, 'loss/train': 3.8554420471191406} -08/30/2021 13:35:41 - INFO - __main__ - Step 2078: {'lr': 0.0004999996660605856, 'samples': 398976, 'steps': 2077, 'loss/train': 4.0006585121154785} -08/30/2021 13:35:42 - INFO - __main__ - Step 2079: {'lr': 0.0004999996573305135, 'samples': 399168, 'steps': 2078, 'loss/train': 4.150618076324463} -08/30/2021 13:35:43 - INFO - __main__ - Step 2080: {'lr': 0.0004999996484877955, 'samples': 399360, 'steps': 2079, 'loss/train': 3.6302833557128906} -08/30/2021 13:35:43 - INFO - __main__ - Step 2081: {'lr': 0.0004999996395324313, 'samples': 399552, 'steps': 2080, 'loss/train': 3.340209722518921} -08/30/2021 13:35:44 - INFO - __main__ - Step 2082: {'lr': 0.0004999996304644213, 'samples': 399744, 'steps': 2081, 'loss/train': 1.185246467590332} -08/30/2021 13:35:44 - INFO - __main__ - Step 2083: {'lr': 0.0004999996212837653, 'samples': 399936, 'steps': 2082, 'loss/train': 3.8154983520507812} -08/30/2021 13:35:44 - INFO - __main__ - Step 2084: {'lr': 0.0004999996119904633, 'samples': 400128, 'steps': 2083, 'loss/train': 3.679164409637451} -08/30/2021 13:35:46 - INFO - __main__ - Step 2085: {'lr': 0.0004999996025845154, 'samples': 400320, 'steps': 2084, 'loss/train': 3.6279003620147705} -08/30/2021 13:35:46 - INFO - __main__ - Step 2086: {'lr': 0.0004999995930659215, 'samples': 400512, 'steps': 2085, 'loss/train': 3.875730037689209} -08/30/2021 13:35:47 - INFO - __main__ - Step 2087: {'lr': 0.0004999995834346815, 'samples': 400704, 'steps': 2086, 'loss/train': 3.8178493976593018} -08/30/2021 13:35:47 - INFO - __main__ - Step 2088: {'lr': 0.0004999995736907957, 'samples': 400896, 'steps': 2087, 'loss/train': 2.4050605297088623} -08/30/2021 13:35:48 - INFO - __main__ - Step 2089: {'lr': 0.000499999563834264, 'samples': 401088, 'steps': 2088, 'loss/train': 4.120197772979736} -08/30/2021 13:35:49 - INFO - __main__ - Step 2090: {'lr': 0.0004999995538650862, 'samples': 401280, 'steps': 2089, 'loss/train': 3.6348252296447754} -08/30/2021 13:35:50 - INFO - __main__ - Step 2091: {'lr': 0.0004999995437832626, 'samples': 401472, 'steps': 2090, 'loss/train': 3.6068522930145264} -08/30/2021 13:35:50 - INFO - __main__ - Step 2092: {'lr': 0.0004999995335887929, 'samples': 401664, 'steps': 2091, 'loss/train': 3.4813265800476074} -08/30/2021 13:35:50 - INFO - __main__ - Step 2093: {'lr': 0.0004999995232816774, 'samples': 401856, 'steps': 2092, 'loss/train': 3.892913579940796} -08/30/2021 13:35:51 - INFO - __main__ - Step 2094: {'lr': 0.000499999512861916, 'samples': 402048, 'steps': 2093, 'loss/train': 6.413071632385254} -08/30/2021 13:35:51 - INFO - __main__ - Step 2095: {'lr': 0.0004999995023295086, 'samples': 402240, 'steps': 2094, 'loss/train': 3.990013599395752} -08/30/2021 13:35:52 - INFO - __main__ - Step 2096: {'lr': 0.0004999994916844552, 'samples': 402432, 'steps': 2095, 'loss/train': 4.004929065704346} -08/30/2021 13:35:53 - INFO - __main__ - Step 2097: {'lr': 0.0004999994809267561, 'samples': 402624, 'steps': 2096, 'loss/train': 3.6314752101898193} -08/30/2021 13:35:53 - INFO - __main__ - Step 2098: {'lr': 0.0004999994700564109, 'samples': 402816, 'steps': 2097, 'loss/train': 4.178173065185547} -08/30/2021 13:35:54 - INFO - __main__ - Step 2099: {'lr': 0.0004999994590734199, 'samples': 403008, 'steps': 2098, 'loss/train': 3.6031713485717773} -08/30/2021 13:35:54 - INFO - __main__ - Step 2100: {'lr': 0.000499999447977783, 'samples': 403200, 'steps': 2099, 'loss/train': 4.067807197570801} -08/30/2021 13:35:56 - INFO - __main__ - Step 2101: {'lr': 0.0004999994367695001, 'samples': 403392, 'steps': 2100, 'loss/train': 5.255605220794678} -08/30/2021 13:35:57 - INFO - __main__ - Step 2102: {'lr': 0.0004999994254485714, 'samples': 403584, 'steps': 2101, 'loss/train': 3.9827678203582764} -08/30/2021 13:35:57 - INFO - __main__ - Step 2103: {'lr': 0.0004999994140149969, 'samples': 403776, 'steps': 2102, 'loss/train': 3.6580848693847656} -08/30/2021 13:35:57 - INFO - __main__ - Step 2104: {'lr': 0.0004999994024687764, 'samples': 403968, 'steps': 2103, 'loss/train': 3.2820913791656494} -08/30/2021 13:35:58 - INFO - __main__ - Step 2105: {'lr': 0.00049999939080991, 'samples': 404160, 'steps': 2104, 'loss/train': 3.5947940349578857} -08/30/2021 13:36:00 - INFO - __main__ - Step 2106: {'lr': 0.0004999993790383978, 'samples': 404352, 'steps': 2105, 'loss/train': 3.8313283920288086} -08/30/2021 13:36:00 - INFO - __main__ - Step 2107: {'lr': 0.0004999993671542397, 'samples': 404544, 'steps': 2106, 'loss/train': 3.4209165573120117} -08/30/2021 13:36:00 - INFO - __main__ - Step 2108: {'lr': 0.0004999993551574358, 'samples': 404736, 'steps': 2107, 'loss/train': 2.9385299682617188} -08/30/2021 13:36:01 - INFO - __main__ - Step 2109: {'lr': 0.000499999343047986, 'samples': 404928, 'steps': 2108, 'loss/train': 3.8535799980163574} -08/30/2021 13:36:01 - INFO - __main__ - Step 2110: {'lr': 0.0004999993308258904, 'samples': 405120, 'steps': 2109, 'loss/train': 4.167038440704346} -08/30/2021 13:36:03 - INFO - __main__ - Step 2111: {'lr': 0.0004999993184911489, 'samples': 405312, 'steps': 2110, 'loss/train': 1.7652651071548462} -08/30/2021 13:36:03 - INFO - __main__ - Step 2112: {'lr': 0.0004999993060437616, 'samples': 405504, 'steps': 2111, 'loss/train': 4.371798992156982} -08/30/2021 13:36:03 - INFO - __main__ - Step 2113: {'lr': 0.0004999992934837284, 'samples': 405696, 'steps': 2112, 'loss/train': 3.9404070377349854} -08/30/2021 13:36:04 - INFO - __main__ - Step 2114: {'lr': 0.0004999992808110495, 'samples': 405888, 'steps': 2113, 'loss/train': 3.7768027782440186} -08/30/2021 13:36:04 - INFO - __main__ - Step 2115: {'lr': 0.0004999992680257247, 'samples': 406080, 'steps': 2114, 'loss/train': 3.13139271736145} -08/30/2021 13:36:06 - INFO - __main__ - Step 2116: {'lr': 0.0004999992551277541, 'samples': 406272, 'steps': 2115, 'loss/train': 3.9997286796569824} -08/30/2021 13:36:06 - INFO - __main__ - Step 2117: {'lr': 0.0004999992421171377, 'samples': 406464, 'steps': 2116, 'loss/train': 4.288055896759033} -08/30/2021 13:36:07 - INFO - __main__ - Step 2118: {'lr': 0.0004999992289938755, 'samples': 406656, 'steps': 2117, 'loss/train': 2.2618613243103027} -08/30/2021 13:36:07 - INFO - __main__ - Step 2119: {'lr': 0.0004999992157579676, 'samples': 406848, 'steps': 2118, 'loss/train': 3.53808331489563} -08/30/2021 13:36:07 - INFO - __main__ - Step 2120: {'lr': 0.0004999992024094138, 'samples': 407040, 'steps': 2119, 'loss/train': 1.2991235256195068} -08/30/2021 13:36:08 - INFO - __main__ - Step 2121: {'lr': 0.0004999991889482142, 'samples': 407232, 'steps': 2120, 'loss/train': 3.9068098068237305} -08/30/2021 13:36:08 - INFO - __main__ - Step 2122: {'lr': 0.0004999991753743689, 'samples': 407424, 'steps': 2121, 'loss/train': 4.309406757354736} -08/30/2021 13:36:10 - INFO - __main__ - Step 2123: {'lr': 0.0004999991616878777, 'samples': 407616, 'steps': 2122, 'loss/train': 5.465785503387451} -08/30/2021 13:36:10 - INFO - __main__ - Step 2124: {'lr': 0.0004999991478887409, 'samples': 407808, 'steps': 2123, 'loss/train': 3.558007001876831} -08/30/2021 13:36:11 - INFO - __main__ - Step 2125: {'lr': 0.0004999991339769582, 'samples': 408000, 'steps': 2124, 'loss/train': 3.6818957328796387} -08/30/2021 13:36:11 - INFO - __main__ - Step 2126: {'lr': 0.0004999991199525299, 'samples': 408192, 'steps': 2125, 'loss/train': 2.7842469215393066} -08/30/2021 13:36:11 - INFO - __main__ - Step 2127: {'lr': 0.0004999991058154557, 'samples': 408384, 'steps': 2126, 'loss/train': 3.7680232524871826} -08/30/2021 13:36:13 - INFO - __main__ - Step 2128: {'lr': 0.0004999990915657359, 'samples': 408576, 'steps': 2127, 'loss/train': 3.632894515991211} -08/30/2021 13:36:13 - INFO - __main__ - Step 2129: {'lr': 0.0004999990772033702, 'samples': 408768, 'steps': 2128, 'loss/train': 3.518711805343628} -08/30/2021 13:36:14 - INFO - __main__ - Step 2130: {'lr': 0.000499999062728359, 'samples': 408960, 'steps': 2129, 'loss/train': 3.6407299041748047} -08/30/2021 13:36:14 - INFO - __main__ - Step 2131: {'lr': 0.0004999990481407018, 'samples': 409152, 'steps': 2130, 'loss/train': 4.092563629150391} -08/30/2021 13:36:14 - INFO - __main__ - Step 2132: {'lr': 0.0004999990334403991, 'samples': 409344, 'steps': 2131, 'loss/train': 3.513838052749634} -08/30/2021 13:36:16 - INFO - __main__ - Step 2133: {'lr': 0.0004999990186274506, 'samples': 409536, 'steps': 2132, 'loss/train': 3.990471124649048} -08/30/2021 13:36:17 - INFO - __main__ - Step 2134: {'lr': 0.0004999990037018564, 'samples': 409728, 'steps': 2133, 'loss/train': 4.022684574127197} -08/30/2021 13:36:17 - INFO - __main__ - Step 2135: {'lr': 0.0004999989886636166, 'samples': 409920, 'steps': 2134, 'loss/train': 3.972376823425293} -08/30/2021 13:36:17 - INFO - __main__ - Step 2136: {'lr': 0.000499998973512731, 'samples': 410112, 'steps': 2135, 'loss/train': 4.383425235748291} -08/30/2021 13:36:18 - INFO - __main__ - Step 2137: {'lr': 0.0004999989582491998, 'samples': 410304, 'steps': 2136, 'loss/train': 0.9991979002952576} -08/30/2021 13:36:19 - INFO - __main__ - Step 2138: {'lr': 0.0004999989428730229, 'samples': 410496, 'steps': 2137, 'loss/train': 3.6455819606781006} -08/30/2021 13:36:19 - INFO - __main__ - Step 2139: {'lr': 0.0004999989273842003, 'samples': 410688, 'steps': 2138, 'loss/train': 3.622770071029663} -08/30/2021 13:36:20 - INFO - __main__ - Step 2140: {'lr': 0.0004999989117827321, 'samples': 410880, 'steps': 2139, 'loss/train': 4.197285175323486} -08/30/2021 13:36:20 - INFO - __main__ - Step 2141: {'lr': 0.0004999988960686182, 'samples': 411072, 'steps': 2140, 'loss/train': 3.6964786052703857} -08/30/2021 13:36:21 - INFO - __main__ - Step 2142: {'lr': 0.0004999988802418587, 'samples': 411264, 'steps': 2141, 'loss/train': 3.747947931289673} -08/30/2021 13:36:22 - INFO - __main__ - Step 2143: {'lr': 0.0004999988643024536, 'samples': 411456, 'steps': 2142, 'loss/train': 4.155553340911865} -08/30/2021 13:36:22 - INFO - __main__ - Step 2144: {'lr': 0.0004999988482504027, 'samples': 411648, 'steps': 2143, 'loss/train': 3.367722988128662} -08/30/2021 13:36:23 - INFO - __main__ - Step 2145: {'lr': 0.0004999988320857063, 'samples': 411840, 'steps': 2144, 'loss/train': 3.669928550720215} -08/30/2021 13:36:23 - INFO - __main__ - Step 2146: {'lr': 0.0004999988158083643, 'samples': 412032, 'steps': 2145, 'loss/train': 4.159835338592529} -08/30/2021 13:36:24 - INFO - __main__ - Step 2147: {'lr': 0.0004999987994183766, 'samples': 412224, 'steps': 2146, 'loss/train': 3.7286808490753174} -08/30/2021 13:36:25 - INFO - __main__ - Step 2148: {'lr': 0.0004999987829157434, 'samples': 412416, 'steps': 2147, 'loss/train': 3.789923906326294} -08/30/2021 13:36:26 - INFO - __main__ - Step 2149: {'lr': 0.0004999987663004646, 'samples': 412608, 'steps': 2148, 'loss/train': 3.821627616882324} -08/30/2021 13:36:26 - INFO - __main__ - Step 2150: {'lr': 0.0004999987495725401, 'samples': 412800, 'steps': 2149, 'loss/train': 4.026470184326172} -08/30/2021 13:36:27 - INFO - __main__ - Step 2151: {'lr': 0.0004999987327319701, 'samples': 412992, 'steps': 2150, 'loss/train': 3.941927433013916} -08/30/2021 13:36:27 - INFO - __main__ - Step 2152: {'lr': 0.0004999987157787546, 'samples': 413184, 'steps': 2151, 'loss/train': 3.9863195419311523} -08/30/2021 13:36:27 - INFO - __main__ - Step 2153: {'lr': 0.0004999986987128934, 'samples': 413376, 'steps': 2152, 'loss/train': 2.8138444423675537} -08/30/2021 13:36:28 - INFO - __main__ - Step 2154: {'lr': 0.0004999986815343867, 'samples': 413568, 'steps': 2153, 'loss/train': 2.8728902339935303} -08/30/2021 13:36:29 - INFO - __main__ - Step 2155: {'lr': 0.0004999986642432345, 'samples': 413760, 'steps': 2154, 'loss/train': 4.75545072555542} -08/30/2021 13:36:30 - INFO - __main__ - Step 2156: {'lr': 0.0004999986468394367, 'samples': 413952, 'steps': 2155, 'loss/train': 3.888580560684204} -08/30/2021 13:36:30 - INFO - __main__ - Step 2157: {'lr': 0.0004999986293229934, 'samples': 414144, 'steps': 2156, 'loss/train': 3.8104896545410156} -08/30/2021 13:36:30 - INFO - __main__ - Step 2158: {'lr': 0.0004999986116939045, 'samples': 414336, 'steps': 2157, 'loss/train': 3.6036465167999268} -08/30/2021 13:36:31 - INFO - __main__ - Step 2159: {'lr': 0.0004999985939521702, 'samples': 414528, 'steps': 2158, 'loss/train': 4.06483268737793} -08/30/2021 13:36:33 - INFO - __main__ - Step 2160: {'lr': 0.0004999985760977903, 'samples': 414720, 'steps': 2159, 'loss/train': 3.406566858291626} -08/30/2021 13:36:33 - INFO - __main__ - Step 2161: {'lr': 0.000499998558130765, 'samples': 414912, 'steps': 2160, 'loss/train': 3.4594547748565674} -08/30/2021 13:36:34 - INFO - __main__ - Step 2162: {'lr': 0.0004999985400510941, 'samples': 415104, 'steps': 2161, 'loss/train': 4.1263933181762695} -08/30/2021 13:36:34 - INFO - __main__ - Step 2163: {'lr': 0.0004999985218587777, 'samples': 415296, 'steps': 2162, 'loss/train': 3.4256396293640137} -08/30/2021 13:36:34 - INFO - __main__ - Step 2164: {'lr': 0.0004999985035538159, 'samples': 415488, 'steps': 2163, 'loss/train': 3.1839096546173096} -08/30/2021 13:36:36 - INFO - __main__ - Step 2165: {'lr': 0.0004999984851362086, 'samples': 415680, 'steps': 2164, 'loss/train': 3.763256311416626} -08/30/2021 13:36:36 - INFO - __main__ - Step 2166: {'lr': 0.0004999984666059559, 'samples': 415872, 'steps': 2165, 'loss/train': 4.361536979675293} -08/30/2021 13:36:37 - INFO - __main__ - Step 2167: {'lr': 0.0004999984479630577, 'samples': 416064, 'steps': 2166, 'loss/train': 3.8201444149017334} -08/30/2021 13:36:37 - INFO - __main__ - Step 2168: {'lr': 0.000499998429207514, 'samples': 416256, 'steps': 2167, 'loss/train': 4.29213809967041} -08/30/2021 13:36:37 - INFO - __main__ - Step 2169: {'lr': 0.000499998410339325, 'samples': 416448, 'steps': 2168, 'loss/train': 3.7384464740753174} -08/30/2021 13:36:38 - INFO - __main__ - Step 2170: {'lr': 0.0004999983913584904, 'samples': 416640, 'steps': 2169, 'loss/train': 3.6140146255493164} -08/30/2021 13:36:39 - INFO - __main__ - Step 2171: {'lr': 0.0004999983722650106, 'samples': 416832, 'steps': 2170, 'loss/train': 3.2986245155334473} -08/30/2021 13:36:40 - INFO - __main__ - Step 2172: {'lr': 0.0004999983530588853, 'samples': 417024, 'steps': 2171, 'loss/train': 3.7747888565063477} -08/30/2021 13:36:40 - INFO - __main__ - Step 2173: {'lr': 0.0004999983337401145, 'samples': 417216, 'steps': 2172, 'loss/train': 4.175738334655762} -08/30/2021 13:36:40 - INFO - __main__ - Step 2174: {'lr': 0.0004999983143086984, 'samples': 417408, 'steps': 2173, 'loss/train': 3.6769347190856934} -08/30/2021 13:36:41 - INFO - __main__ - Step 2175: {'lr': 0.0004999982947646368, 'samples': 417600, 'steps': 2174, 'loss/train': 3.5578510761260986} -08/30/2021 13:36:42 - INFO - __main__ - Step 2176: {'lr': 0.00049999827510793, 'samples': 417792, 'steps': 2175, 'loss/train': 3.85313081741333} -08/30/2021 13:36:43 - INFO - __main__ - Step 2177: {'lr': 0.0004999982553385778, 'samples': 417984, 'steps': 2176, 'loss/train': 4.286514759063721} -08/30/2021 13:36:43 - INFO - __main__ - Step 2178: {'lr': 0.0004999982354565802, 'samples': 418176, 'steps': 2177, 'loss/train': 3.313585042953491} -08/30/2021 13:36:43 - INFO - __main__ - Step 2179: {'lr': 0.0004999982154619372, 'samples': 418368, 'steps': 2178, 'loss/train': 3.698235273361206} -08/30/2021 13:36:44 - INFO - __main__ - Step 2180: {'lr': 0.000499998195354649, 'samples': 418560, 'steps': 2179, 'loss/train': 4.317075729370117} -08/30/2021 13:36:45 - INFO - __main__ - Step 2181: {'lr': 0.0004999981751347153, 'samples': 418752, 'steps': 2180, 'loss/train': 3.5049121379852295} -08/30/2021 13:36:46 - INFO - __main__ - Step 2182: {'lr': 0.0004999981548021364, 'samples': 418944, 'steps': 2181, 'loss/train': 4.226571559906006} -08/30/2021 13:36:46 - INFO - __main__ - Step 2183: {'lr': 0.0004999981343569122, 'samples': 419136, 'steps': 2182, 'loss/train': 3.4870505332946777} -08/30/2021 13:36:46 - INFO - __main__ - Step 2184: {'lr': 0.0004999981137990425, 'samples': 419328, 'steps': 2183, 'loss/train': 4.201118469238281} -08/30/2021 13:36:47 - INFO - __main__ - Step 2185: {'lr': 0.0004999980931285278, 'samples': 419520, 'steps': 2184, 'loss/train': 3.011713743209839} -08/30/2021 13:36:48 - INFO - __main__ - Step 2186: {'lr': 0.0004999980723453676, 'samples': 419712, 'steps': 2185, 'loss/train': 4.225376605987549} -08/30/2021 13:36:49 - INFO - __main__ - Step 2187: {'lr': 0.0004999980514495623, 'samples': 419904, 'steps': 2186, 'loss/train': 3.735133647918701} -08/30/2021 13:36:49 - INFO - __main__ - Step 2188: {'lr': 0.0004999980304411116, 'samples': 420096, 'steps': 2187, 'loss/train': 4.268670082092285} -08/30/2021 13:36:49 - INFO - __main__ - Step 2189: {'lr': 0.0004999980093200157, 'samples': 420288, 'steps': 2188, 'loss/train': 4.963278293609619} -08/30/2021 13:36:50 - INFO - __main__ - Step 2190: {'lr': 0.0004999979880862745, 'samples': 420480, 'steps': 2189, 'loss/train': 3.5750648975372314} -08/30/2021 13:36:51 - INFO - __main__ - Step 2191: {'lr': 0.0004999979667398882, 'samples': 420672, 'steps': 2190, 'loss/train': 2.8247759342193604} -08/30/2021 13:36:51 - INFO - __main__ - Step 2192: {'lr': 0.0004999979452808565, 'samples': 420864, 'steps': 2191, 'loss/train': 4.099137783050537} -08/30/2021 13:36:52 - INFO - __main__ - Step 2193: {'lr': 0.0004999979237091796, 'samples': 421056, 'steps': 2192, 'loss/train': 3.661343812942505} -08/30/2021 13:36:52 - INFO - __main__ - Step 2194: {'lr': 0.0004999979020248577, 'samples': 421248, 'steps': 2193, 'loss/train': 4.581142902374268} -08/30/2021 13:36:53 - INFO - __main__ - Step 2195: {'lr': 0.0004999978802278904, 'samples': 421440, 'steps': 2194, 'loss/train': 4.2670440673828125} -08/30/2021 13:36:53 - INFO - __main__ - Step 2196: {'lr': 0.000499997858318278, 'samples': 421632, 'steps': 2195, 'loss/train': 4.95889949798584} -08/30/2021 13:36:54 - INFO - __main__ - Step 2197: {'lr': 0.0004999978362960204, 'samples': 421824, 'steps': 2196, 'loss/train': 4.856159687042236} -08/30/2021 13:36:55 - INFO - __main__ - Step 2198: {'lr': 0.0004999978141611176, 'samples': 422016, 'steps': 2197, 'loss/train': 3.22304630279541} -08/30/2021 13:36:55 - INFO - __main__ - Step 2199: {'lr': 0.0004999977919135696, 'samples': 422208, 'steps': 2198, 'loss/train': 3.554565668106079} -08/30/2021 13:36:56 - INFO - __main__ - Step 2200: {'lr': 0.0004999977695533766, 'samples': 422400, 'steps': 2199, 'loss/train': 3.392871618270874} -08/30/2021 13:36:56 - INFO - __main__ - Step 2201: {'lr': 0.0004999977470805383, 'samples': 422592, 'steps': 2200, 'loss/train': 4.376364231109619} -08/30/2021 13:36:57 - INFO - __main__ - Step 2202: {'lr': 0.0004999977244950551, 'samples': 422784, 'steps': 2201, 'loss/train': 3.8810112476348877} -08/30/2021 13:36:58 - INFO - __main__ - Step 2203: {'lr': 0.0004999977017969266, 'samples': 422976, 'steps': 2202, 'loss/train': 3.221945285797119} -08/30/2021 13:36:58 - INFO - __main__ - Step 2204: {'lr': 0.000499997678986153, 'samples': 423168, 'steps': 2203, 'loss/train': 4.205539703369141} -08/30/2021 13:36:59 - INFO - __main__ - Step 2205: {'lr': 0.0004999976560627344, 'samples': 423360, 'steps': 2204, 'loss/train': 3.4441351890563965} -08/30/2021 13:36:59 - INFO - __main__ - Step 2206: {'lr': 0.0004999976330266707, 'samples': 423552, 'steps': 2205, 'loss/train': 3.697157144546509} -08/30/2021 13:37:00 - INFO - __main__ - Step 2207: {'lr': 0.0004999976098779618, 'samples': 423744, 'steps': 2206, 'loss/train': 3.6632027626037598} -08/30/2021 13:37:01 - INFO - __main__ - Step 2208: {'lr': 0.0004999975866166079, 'samples': 423936, 'steps': 2207, 'loss/train': 5.021728038787842} -08/30/2021 13:37:01 - INFO - __main__ - Step 2209: {'lr': 0.000499997563242609, 'samples': 424128, 'steps': 2208, 'loss/train': 3.6572656631469727} -08/30/2021 13:37:02 - INFO - __main__ - Step 2210: {'lr': 0.0004999975397559649, 'samples': 424320, 'steps': 2209, 'loss/train': 3.658616781234741} -08/30/2021 13:37:02 - INFO - __main__ - Step 2211: {'lr': 0.000499997516156676, 'samples': 424512, 'steps': 2210, 'loss/train': 2.9364333152770996} -08/30/2021 13:37:04 - INFO - __main__ - Step 2212: {'lr': 0.000499997492444742, 'samples': 424704, 'steps': 2211, 'loss/train': 3.404667377471924} -08/30/2021 13:37:04 - INFO - __main__ - Step 2213: {'lr': 0.0004999974686201629, 'samples': 424896, 'steps': 2212, 'loss/train': 3.665926933288574} -08/30/2021 13:37:05 - INFO - __main__ - Step 2214: {'lr': 0.0004999974446829389, 'samples': 425088, 'steps': 2213, 'loss/train': 2.8251471519470215} -08/30/2021 13:37:05 - INFO - __main__ - Step 2215: {'lr': 0.0004999974206330698, 'samples': 425280, 'steps': 2214, 'loss/train': 3.0024397373199463} -08/30/2021 13:37:05 - INFO - __main__ - Step 2216: {'lr': 0.0004999973964705558, 'samples': 425472, 'steps': 2215, 'loss/train': 3.3037800788879395} -08/30/2021 13:37:07 - INFO - __main__ - Step 2217: {'lr': 0.0004999973721953968, 'samples': 425664, 'steps': 2216, 'loss/train': 3.28297758102417} -08/30/2021 13:37:08 - INFO - __main__ - Step 2218: {'lr': 0.0004999973478075928, 'samples': 425856, 'steps': 2217, 'loss/train': 3.300427198410034} -08/30/2021 13:37:08 - INFO - __main__ - Step 2219: {'lr': 0.0004999973233071438, 'samples': 426048, 'steps': 2218, 'loss/train': 4.051426887512207} -08/30/2021 13:37:08 - INFO - __main__ - Step 2220: {'lr': 0.00049999729869405, 'samples': 426240, 'steps': 2219, 'loss/train': 5.035614490509033} -08/30/2021 13:37:09 - INFO - __main__ - Step 2221: {'lr': 0.0004999972739683113, 'samples': 426432, 'steps': 2220, 'loss/train': 3.5028154850006104} -08/30/2021 13:37:09 - INFO - __main__ - Step 2222: {'lr': 0.0004999972491299276, 'samples': 426624, 'steps': 2221, 'loss/train': 4.06950569152832} -08/30/2021 13:37:11 - INFO - __main__ - Step 2223: {'lr': 0.000499997224178899, 'samples': 426816, 'steps': 2222, 'loss/train': 4.2269134521484375} -08/30/2021 13:37:11 - INFO - __main__ - Step 2224: {'lr': 0.0004999971991152256, 'samples': 427008, 'steps': 2223, 'loss/train': 3.994997024536133} -08/30/2021 13:37:11 - INFO - __main__ - Step 2225: {'lr': 0.0004999971739389072, 'samples': 427200, 'steps': 2224, 'loss/train': 3.972487211227417} -08/30/2021 13:37:12 - INFO - __main__ - Step 2226: {'lr': 0.000499997148649944, 'samples': 427392, 'steps': 2225, 'loss/train': 2.8659262657165527} -08/30/2021 13:37:12 - INFO - __main__ - Step 2227: {'lr': 0.0004999971232483359, 'samples': 427584, 'steps': 2226, 'loss/train': 3.4539358615875244} -08/30/2021 13:37:14 - INFO - __main__ - Step 2228: {'lr': 0.0004999970977340829, 'samples': 427776, 'steps': 2227, 'loss/train': 3.7257273197174072} -08/30/2021 13:37:14 - INFO - __main__ - Step 2229: {'lr': 0.0004999970721071852, 'samples': 427968, 'steps': 2228, 'loss/train': 3.375279426574707} -08/30/2021 13:37:14 - INFO - __main__ - Step 2230: {'lr': 0.0004999970463676427, 'samples': 428160, 'steps': 2229, 'loss/train': 3.407538652420044} -08/30/2021 13:37:15 - INFO - __main__ - Step 2231: {'lr': 0.0004999970205154553, 'samples': 428352, 'steps': 2230, 'loss/train': 1.6758882999420166} -08/30/2021 13:37:15 - INFO - __main__ - Step 2232: {'lr': 0.000499996994550623, 'samples': 428544, 'steps': 2231, 'loss/train': 3.425678253173828} -08/30/2021 13:37:17 - INFO - __main__ - Step 2233: {'lr': 0.000499996968473146, 'samples': 428736, 'steps': 2232, 'loss/train': 3.820082187652588} -08/30/2021 13:37:17 - INFO - __main__ - Step 2234: {'lr': 0.0004999969422830242, 'samples': 428928, 'steps': 2233, 'loss/train': 3.4000606536865234} -08/30/2021 13:37:17 - INFO - __main__ - Step 2235: {'lr': 0.0004999969159802577, 'samples': 429120, 'steps': 2234, 'loss/train': 4.048572540283203} -08/30/2021 13:37:18 - INFO - __main__ - Step 2236: {'lr': 0.0004999968895648464, 'samples': 429312, 'steps': 2235, 'loss/train': 3.476292133331299} -08/30/2021 13:37:18 - INFO - __main__ - Step 2237: {'lr': 0.0004999968630367905, 'samples': 429504, 'steps': 2236, 'loss/train': 1.0507943630218506} -08/30/2021 13:37:20 - INFO - __main__ - Step 2238: {'lr': 0.0004999968363960897, 'samples': 429696, 'steps': 2237, 'loss/train': 3.1623053550720215} -08/30/2021 13:37:20 - INFO - __main__ - Step 2239: {'lr': 0.0004999968096427443, 'samples': 429888, 'steps': 2238, 'loss/train': 1.3669394254684448} -08/30/2021 13:37:21 - INFO - __main__ - Step 2240: {'lr': 0.0004999967827767541, 'samples': 430080, 'steps': 2239, 'loss/train': 3.8772776126861572} -08/30/2021 13:37:21 - INFO - __main__ - Step 2241: {'lr': 0.0004999967557981192, 'samples': 430272, 'steps': 2240, 'loss/train': 3.595731019973755} -08/30/2021 13:37:21 - INFO - __main__ - Step 2242: {'lr': 0.0004999967287068396, 'samples': 430464, 'steps': 2241, 'loss/train': 3.1968882083892822} -08/30/2021 13:37:23 - INFO - __main__ - Step 2243: {'lr': 0.0004999967015029155, 'samples': 430656, 'steps': 2242, 'loss/train': 3.886357069015503} -08/30/2021 13:37:23 - INFO - __main__ - Step 2244: {'lr': 0.0004999966741863467, 'samples': 430848, 'steps': 2243, 'loss/train': 3.6338374614715576} -08/30/2021 13:37:24 - INFO - __main__ - Step 2245: {'lr': 0.000499996646757133, 'samples': 431040, 'steps': 2244, 'loss/train': 0.8551651835441589} -08/30/2021 13:37:24 - INFO - __main__ - Step 2246: {'lr': 0.0004999966192152749, 'samples': 431232, 'steps': 2245, 'loss/train': 3.852029323577881} -08/30/2021 13:37:24 - INFO - __main__ - Step 2247: {'lr': 0.0004999965915607722, 'samples': 431424, 'steps': 2246, 'loss/train': 3.4796693325042725} -08/30/2021 13:37:25 - INFO - __main__ - Step 2248: {'lr': 0.0004999965637936248, 'samples': 431616, 'steps': 2247, 'loss/train': 3.049506425857544} -08/30/2021 13:37:26 - INFO - __main__ - Step 2249: {'lr': 0.0004999965359138329, 'samples': 431808, 'steps': 2248, 'loss/train': 3.1012051105499268} -08/30/2021 13:37:27 - INFO - __main__ - Step 2250: {'lr': 0.0004999965079213964, 'samples': 432000, 'steps': 2249, 'loss/train': 3.93786358833313} -08/30/2021 13:37:27 - INFO - __main__ - Step 2251: {'lr': 0.0004999964798163152, 'samples': 432192, 'steps': 2250, 'loss/train': 3.234760284423828} -08/30/2021 13:37:28 - INFO - __main__ - Step 2252: {'lr': 0.0004999964515985896, 'samples': 432384, 'steps': 2251, 'loss/train': 2.9302399158477783} -08/30/2021 13:37:28 - INFO - __main__ - Step 2253: {'lr': 0.0004999964232682194, 'samples': 432576, 'steps': 2252, 'loss/train': 4.453218460083008} -08/30/2021 13:37:29 - INFO - __main__ - Step 2254: {'lr': 0.0004999963948252046, 'samples': 432768, 'steps': 2253, 'loss/train': 3.4095213413238525} -08/30/2021 13:37:30 - INFO - __main__ - Step 2255: {'lr': 0.0004999963662695453, 'samples': 432960, 'steps': 2254, 'loss/train': 3.3248941898345947} -08/30/2021 13:37:30 - INFO - __main__ - Step 2256: {'lr': 0.0004999963376012416, 'samples': 433152, 'steps': 2255, 'loss/train': 4.129458427429199} -08/30/2021 13:37:31 - INFO - __main__ - Step 2257: {'lr': 0.0004999963088202934, 'samples': 433344, 'steps': 2256, 'loss/train': 4.100364685058594} -08/30/2021 13:37:31 - INFO - __main__ - Step 2258: {'lr': 0.0004999962799267006, 'samples': 433536, 'steps': 2257, 'loss/train': 3.511345148086548} -08/30/2021 13:37:32 - INFO - __main__ - Step 2259: {'lr': 0.0004999962509204634, 'samples': 433728, 'steps': 2258, 'loss/train': 3.9459218978881836} -08/30/2021 13:37:33 - INFO - __main__ - Step 2260: {'lr': 0.0004999962218015818, 'samples': 433920, 'steps': 2259, 'loss/train': 3.9202263355255127} -08/30/2021 13:37:33 - INFO - __main__ - Step 2261: {'lr': 0.0004999961925700557, 'samples': 434112, 'steps': 2260, 'loss/train': 3.4376957416534424} -08/30/2021 13:37:34 - INFO - __main__ - Step 2262: {'lr': 0.0004999961632258851, 'samples': 434304, 'steps': 2261, 'loss/train': 3.3409574031829834} -08/30/2021 13:37:34 - INFO - __main__ - Step 2263: {'lr': 0.0004999961337690703, 'samples': 434496, 'steps': 2262, 'loss/train': 2.983520269393921} -08/30/2021 13:37:36 - INFO - __main__ - Step 2264: {'lr': 0.0004999961041996109, 'samples': 434688, 'steps': 2263, 'loss/train': 3.066105842590332} -08/30/2021 13:37:36 - INFO - __main__ - Step 2265: {'lr': 0.0004999960745175071, 'samples': 434880, 'steps': 2264, 'loss/train': 1.4745205640792847} -08/30/2021 13:37:37 - INFO - __main__ - Step 2266: {'lr': 0.0004999960447227591, 'samples': 435072, 'steps': 2265, 'loss/train': 4.289106845855713} -08/30/2021 13:37:37 - INFO - __main__ - Step 2267: {'lr': 0.0004999960148153667, 'samples': 435264, 'steps': 2266, 'loss/train': 3.591769218444824} -08/30/2021 13:37:37 - INFO - __main__ - Step 2268: {'lr': 0.0004999959847953299, 'samples': 435456, 'steps': 2267, 'loss/train': 3.655301094055176} -08/30/2021 13:37:39 - INFO - __main__ - Step 2269: {'lr': 0.0004999959546626487, 'samples': 435648, 'steps': 2268, 'loss/train': 4.203343391418457} -08/30/2021 13:37:39 - INFO - __main__ - Step 2270: {'lr': 0.0004999959244173232, 'samples': 435840, 'steps': 2269, 'loss/train': 3.0128376483917236} -08/30/2021 13:37:40 - INFO - __main__ - Step 2271: {'lr': 0.0004999958940593535, 'samples': 436032, 'steps': 2270, 'loss/train': 3.4220640659332275} -08/30/2021 13:37:40 - INFO - __main__ - Step 2272: {'lr': 0.0004999958635887394, 'samples': 436224, 'steps': 2271, 'loss/train': 3.169811725616455} -08/30/2021 13:37:40 - INFO - __main__ - Step 2273: {'lr': 0.0004999958330054811, 'samples': 436416, 'steps': 2272, 'loss/train': 3.8526008129119873} -08/30/2021 13:37:42 - INFO - __main__ - Step 2274: {'lr': 0.0004999958023095785, 'samples': 436608, 'steps': 2273, 'loss/train': 3.528167486190796} -08/30/2021 13:37:42 - INFO - __main__ - Step 2275: {'lr': 0.0004999957715010317, 'samples': 436800, 'steps': 2274, 'loss/train': 3.7438666820526123} -08/30/2021 13:37:43 - INFO - __main__ - Step 2276: {'lr': 0.0004999957405798405, 'samples': 436992, 'steps': 2275, 'loss/train': 3.869717836380005} -08/30/2021 13:37:43 - INFO - __main__ - Step 2277: {'lr': 0.0004999957095460052, 'samples': 437184, 'steps': 2276, 'loss/train': 3.9356942176818848} -08/30/2021 13:37:44 - INFO - __main__ - Step 2278: {'lr': 0.0004999956783995257, 'samples': 437376, 'steps': 2277, 'loss/train': 3.73154878616333} -08/30/2021 13:37:44 - INFO - __main__ - Step 2279: {'lr': 0.0004999956471404021, 'samples': 437568, 'steps': 2278, 'loss/train': 1.3698467016220093} -08/30/2021 13:37:45 - INFO - __main__ - Step 2280: {'lr': 0.0004999956157686341, 'samples': 437760, 'steps': 2279, 'loss/train': 4.439995765686035} -08/30/2021 13:37:46 - INFO - __main__ - Step 2281: {'lr': 0.0004999955842842222, 'samples': 437952, 'steps': 2280, 'loss/train': 2.8386447429656982} -08/30/2021 13:37:46 - INFO - __main__ - Step 2282: {'lr': 0.0004999955526871659, 'samples': 438144, 'steps': 2281, 'loss/train': 3.9862217903137207} -08/30/2021 13:37:46 - INFO - __main__ - Step 2283: {'lr': 0.0004999955209774656, 'samples': 438336, 'steps': 2282, 'loss/train': 3.8530850410461426} -08/30/2021 13:37:47 - INFO - __main__ - Step 2284: {'lr': 0.0004999954891551211, 'samples': 438528, 'steps': 2283, 'loss/train': 3.8454504013061523} -08/30/2021 13:37:48 - INFO - __main__ - Step 2285: {'lr': 0.0004999954572201326, 'samples': 438720, 'steps': 2284, 'loss/train': 3.486356019973755} -08/30/2021 13:37:49 - INFO - __main__ - Step 2286: {'lr': 0.0004999954251724999, 'samples': 438912, 'steps': 2285, 'loss/train': 3.396296262741089} -08/30/2021 13:37:49 - INFO - __main__ - Step 2287: {'lr': 0.0004999953930122231, 'samples': 439104, 'steps': 2286, 'loss/train': 4.753914833068848} -08/30/2021 13:37:50 - INFO - __main__ - Step 2288: {'lr': 0.0004999953607393023, 'samples': 439296, 'steps': 2287, 'loss/train': 3.2592363357543945} -08/30/2021 13:37:50 - INFO - __main__ - Step 2289: {'lr': 0.0004999953283537374, 'samples': 439488, 'steps': 2288, 'loss/train': 3.8208231925964355} -08/30/2021 13:37:51 - INFO - __main__ - Step 2290: {'lr': 0.0004999952958555285, 'samples': 439680, 'steps': 2289, 'loss/train': 0.9816742539405823} -08/30/2021 13:37:52 - INFO - __main__ - Step 2291: {'lr': 0.0004999952632446756, 'samples': 439872, 'steps': 2290, 'loss/train': 3.3279073238372803} -08/30/2021 13:37:52 - INFO - __main__ - Step 2292: {'lr': 0.0004999952305211786, 'samples': 440064, 'steps': 2291, 'loss/train': 4.148941993713379} -08/30/2021 13:37:53 - INFO - __main__ - Step 2293: {'lr': 0.0004999951976850377, 'samples': 440256, 'steps': 2292, 'loss/train': 3.7233402729034424} -08/30/2021 13:37:53 - INFO - __main__ - Step 2294: {'lr': 0.0004999951647362527, 'samples': 440448, 'steps': 2293, 'loss/train': 4.325737953186035} -08/30/2021 13:37:54 - INFO - __main__ - Step 2295: {'lr': 0.0004999951316748239, 'samples': 440640, 'steps': 2294, 'loss/train': 3.879056215286255} -08/30/2021 13:37:55 - INFO - __main__ - Step 2296: {'lr': 0.0004999950985007511, 'samples': 440832, 'steps': 2295, 'loss/train': 2.587010145187378} -08/30/2021 13:37:55 - INFO - __main__ - Step 2297: {'lr': 0.0004999950652140343, 'samples': 441024, 'steps': 2296, 'loss/train': 2.7230381965637207} -08/30/2021 13:37:56 - INFO - __main__ - Step 2298: {'lr': 0.0004999950318146737, 'samples': 441216, 'steps': 2297, 'loss/train': 3.217952013015747} -08/30/2021 13:37:56 - INFO - __main__ - Step 2299: {'lr': 0.0004999949983026691, 'samples': 441408, 'steps': 2298, 'loss/train': 3.466270685195923} -08/30/2021 13:37:57 - INFO - __main__ - Step 2300: {'lr': 0.0004999949646780205, 'samples': 441600, 'steps': 2299, 'loss/train': 3.3902628421783447} -08/30/2021 13:37:58 - INFO - __main__ - Step 2301: {'lr': 0.0004999949309407283, 'samples': 441792, 'steps': 2300, 'loss/train': 3.007880926132202} -08/30/2021 13:37:58 - INFO - __main__ - Step 2302: {'lr': 0.0004999948970907921, 'samples': 441984, 'steps': 2301, 'loss/train': 3.3225274085998535} -08/30/2021 13:37:59 - INFO - __main__ - Step 2303: {'lr': 0.0004999948631282119, 'samples': 442176, 'steps': 2302, 'loss/train': 3.5667121410369873} -08/30/2021 13:37:59 - INFO - __main__ - Step 2304: {'lr': 0.0004999948290529881, 'samples': 442368, 'steps': 2303, 'loss/train': 3.3896703720092773} -08/30/2021 13:38:01 - INFO - __main__ - Step 2305: {'lr': 0.0004999947948651204, 'samples': 442560, 'steps': 2304, 'loss/train': 3.468219757080078} -08/30/2021 13:38:01 - INFO - __main__ - Step 2306: {'lr': 0.0004999947605646089, 'samples': 442752, 'steps': 2305, 'loss/train': 3.3806169033050537} -08/30/2021 13:38:01 - INFO - __main__ - Step 2307: {'lr': 0.0004999947261514537, 'samples': 442944, 'steps': 2306, 'loss/train': 3.494899272918701} -08/30/2021 13:38:02 - INFO - __main__ - Step 2308: {'lr': 0.0004999946916256547, 'samples': 443136, 'steps': 2307, 'loss/train': 3.22977352142334} -08/30/2021 13:38:02 - INFO - __main__ - Step 2309: {'lr': 0.0004999946569872118, 'samples': 443328, 'steps': 2308, 'loss/train': 3.777221918106079} -08/30/2021 13:38:04 - INFO - __main__ - Step 2310: {'lr': 0.0004999946222361254, 'samples': 443520, 'steps': 2309, 'loss/train': 3.133528232574463} -08/30/2021 13:38:04 - INFO - __main__ - Step 2311: {'lr': 0.0004999945873723951, 'samples': 443712, 'steps': 2310, 'loss/train': 3.964779853820801} -08/30/2021 13:38:04 - INFO - __main__ - Step 2312: {'lr': 0.0004999945523960212, 'samples': 443904, 'steps': 2311, 'loss/train': 3.5267961025238037} -08/30/2021 13:38:05 - INFO - __main__ - Step 2313: {'lr': 0.0004999945173070035, 'samples': 444096, 'steps': 2312, 'loss/train': 4.563134670257568} -08/30/2021 13:38:05 - INFO - __main__ - Step 2314: {'lr': 0.0004999944821053422, 'samples': 444288, 'steps': 2313, 'loss/train': 3.2205557823181152} -08/30/2021 13:38:06 - INFO - __main__ - Step 2315: {'lr': 0.0004999944467910372, 'samples': 444480, 'steps': 2314, 'loss/train': 3.1991894245147705} -08/30/2021 13:38:07 - INFO - __main__ - Step 2316: {'lr': 0.0004999944113640887, 'samples': 444672, 'steps': 2315, 'loss/train': 2.371495246887207} -08/30/2021 13:38:07 - INFO - __main__ - Step 2317: {'lr': 0.0004999943758244964, 'samples': 444864, 'steps': 2316, 'loss/train': 3.4393770694732666} -08/30/2021 13:38:08 - INFO - __main__ - Step 2318: {'lr': 0.0004999943401722606, 'samples': 445056, 'steps': 2317, 'loss/train': 3.3501834869384766} -08/30/2021 13:38:08 - INFO - __main__ - Step 2319: {'lr': 0.0004999943044073813, 'samples': 445248, 'steps': 2318, 'loss/train': 3.7185914516448975} -08/30/2021 13:38:08 - INFO - __main__ - Step 2320: {'lr': 0.0004999942685298582, 'samples': 445440, 'steps': 2319, 'loss/train': 3.5161125659942627} -08/30/2021 13:38:10 - INFO - __main__ - Step 2321: {'lr': 0.0004999942325396916, 'samples': 445632, 'steps': 2320, 'loss/train': 4.182732582092285} -08/30/2021 13:38:11 - INFO - __main__ - Step 2322: {'lr': 0.0004999941964368817, 'samples': 445824, 'steps': 2321, 'loss/train': 3.3947317600250244} -08/30/2021 13:38:11 - INFO - __main__ - Step 2323: {'lr': 0.000499994160221428, 'samples': 446016, 'steps': 2322, 'loss/train': 0.7257397174835205} -08/30/2021 13:38:12 - INFO - __main__ - Step 2324: {'lr': 0.0004999941238933308, 'samples': 446208, 'steps': 2323, 'loss/train': 3.284926414489746} -08/30/2021 13:38:12 - INFO - __main__ - Step 2325: {'lr': 0.0004999940874525902, 'samples': 446400, 'steps': 2324, 'loss/train': 3.6126582622528076} -08/30/2021 13:38:14 - INFO - __main__ - Step 2326: {'lr': 0.0004999940508992061, 'samples': 446592, 'steps': 2325, 'loss/train': 3.614366054534912} -08/30/2021 13:38:14 - INFO - __main__ - Step 2327: {'lr': 0.0004999940142331785, 'samples': 446784, 'steps': 2326, 'loss/train': 4.015449047088623} -08/30/2021 13:38:14 - INFO - __main__ - Step 2328: {'lr': 0.0004999939774545074, 'samples': 446976, 'steps': 2327, 'loss/train': 3.174699306488037} -08/30/2021 13:38:15 - INFO - __main__ - Step 2329: {'lr': 0.000499993940563193, 'samples': 447168, 'steps': 2328, 'loss/train': 3.121023416519165} -08/30/2021 13:38:15 - INFO - __main__ - Step 2330: {'lr': 0.0004999939035592351, 'samples': 447360, 'steps': 2329, 'loss/train': 3.8974084854125977} -08/30/2021 13:38:17 - INFO - __main__ - Step 2331: {'lr': 0.0004999938664426339, 'samples': 447552, 'steps': 2330, 'loss/train': 2.9231114387512207} -08/30/2021 13:38:17 - INFO - __main__ - Step 2332: {'lr': 0.0004999938292133894, 'samples': 447744, 'steps': 2331, 'loss/train': 3.9305601119995117} -08/30/2021 13:38:17 - INFO - __main__ - Step 2333: {'lr': 0.0004999937918715013, 'samples': 447936, 'steps': 2332, 'loss/train': 3.7885520458221436} -08/30/2021 13:38:18 - INFO - __main__ - Step 2334: {'lr': 0.00049999375441697, 'samples': 448128, 'steps': 2333, 'loss/train': 2.291560173034668} -08/30/2021 13:38:18 - INFO - __main__ - Step 2335: {'lr': 0.0004999937168497954, 'samples': 448320, 'steps': 2334, 'loss/train': 3.144144296646118} -08/30/2021 13:38:19 - INFO - __main__ - Step 2336: {'lr': 0.0004999936791699773, 'samples': 448512, 'steps': 2335, 'loss/train': 2.7708489894866943} -08/30/2021 13:38:20 - INFO - __main__ - Step 2337: {'lr': 0.0004999936413775161, 'samples': 448704, 'steps': 2336, 'loss/train': 3.8705344200134277} -08/30/2021 13:38:20 - INFO - __main__ - Step 2338: {'lr': 0.0004999936034724115, 'samples': 448896, 'steps': 2337, 'loss/train': 3.3609654903411865} -08/30/2021 13:38:21 - INFO - __main__ - Step 2339: {'lr': 0.0004999935654546638, 'samples': 449088, 'steps': 2338, 'loss/train': 4.000263690948486} -08/30/2021 13:38:21 - INFO - __main__ - Step 2340: {'lr': 0.0004999935273242727, 'samples': 449280, 'steps': 2339, 'loss/train': 3.526043176651001} -08/30/2021 13:38:23 - INFO - __main__ - Step 2341: {'lr': 0.0004999934890812384, 'samples': 449472, 'steps': 2340, 'loss/train': 3.6454505920410156} -08/30/2021 13:38:23 - INFO - __main__ - Step 2342: {'lr': 0.0004999934507255609, 'samples': 449664, 'steps': 2341, 'loss/train': 3.716323137283325} -08/30/2021 13:38:24 - INFO - __main__ - Step 2343: {'lr': 0.0004999934122572403, 'samples': 449856, 'steps': 2342, 'loss/train': 3.456183910369873} -08/30/2021 13:38:24 - INFO - __main__ - Step 2344: {'lr': 0.0004999933736762763, 'samples': 450048, 'steps': 2343, 'loss/train': 1.1015268564224243} -08/30/2021 13:38:24 - INFO - __main__ - Step 2345: {'lr': 0.0004999933349826694, 'samples': 450240, 'steps': 2344, 'loss/train': 4.178706645965576} -08/30/2021 13:38:26 - INFO - __main__ - Step 2346: {'lr': 0.0004999932961764192, 'samples': 450432, 'steps': 2345, 'loss/train': 3.6283633708953857} -08/30/2021 13:38:26 - INFO - __main__ - Step 2347: {'lr': 0.000499993257257526, 'samples': 450624, 'steps': 2346, 'loss/train': 3.44881534576416} -08/30/2021 13:38:27 - INFO - __main__ - Step 2348: {'lr': 0.0004999932182259897, 'samples': 450816, 'steps': 2347, 'loss/train': 3.6039113998413086} -08/30/2021 13:38:27 - INFO - __main__ - Step 2349: {'lr': 0.0004999931790818102, 'samples': 451008, 'steps': 2348, 'loss/train': 3.0283703804016113} -08/30/2021 13:38:27 - INFO - __main__ - Step 2350: {'lr': 0.0004999931398249876, 'samples': 451200, 'steps': 2349, 'loss/train': 3.891494035720825} -08/30/2021 13:38:29 - INFO - __main__ - Step 2351: {'lr': 0.0004999931004555221, 'samples': 451392, 'steps': 2350, 'loss/train': 2.625880002975464} -08/30/2021 13:38:29 - INFO - __main__ - Step 2352: {'lr': 0.0004999930609734135, 'samples': 451584, 'steps': 2351, 'loss/train': 4.154180526733398} -08/30/2021 13:38:29 - INFO - __main__ - Step 2353: {'lr': 0.0004999930213786619, 'samples': 451776, 'steps': 2352, 'loss/train': 3.700856924057007} -08/30/2021 13:38:30 - INFO - __main__ - Step 2354: {'lr': 0.0004999929816712672, 'samples': 451968, 'steps': 2353, 'loss/train': 3.392261505126953} -08/30/2021 13:38:30 - INFO - __main__ - Step 2355: {'lr': 0.0004999929418512296, 'samples': 452160, 'steps': 2354, 'loss/train': 3.879117250442505} -08/30/2021 13:38:31 - INFO - __main__ - Step 2356: {'lr': 0.0004999929019185491, 'samples': 452352, 'steps': 2355, 'loss/train': 3.42183780670166} -08/30/2021 13:38:32 - INFO - __main__ - Step 2357: {'lr': 0.0004999928618732256, 'samples': 452544, 'steps': 2356, 'loss/train': 3.023010492324829} -08/30/2021 13:38:33 - INFO - __main__ - Step 2358: {'lr': 0.0004999928217152591, 'samples': 452736, 'steps': 2357, 'loss/train': 2.951460123062134} -08/30/2021 13:38:33 - INFO - __main__ - Step 2359: {'lr': 0.0004999927814446498, 'samples': 452928, 'steps': 2358, 'loss/train': 3.4824776649475098} -08/30/2021 13:38:33 - INFO - __main__ - Step 2360: {'lr': 0.0004999927410613975, 'samples': 453120, 'steps': 2359, 'loss/train': 3.272944927215576} -08/30/2021 13:38:34 - INFO - __main__ - Step 2361: {'lr': 0.0004999927005655024, 'samples': 453312, 'steps': 2360, 'loss/train': 4.292819976806641} -08/30/2021 13:38:35 - INFO - __main__ - Step 2362: {'lr': 0.0004999926599569644, 'samples': 453504, 'steps': 2361, 'loss/train': 3.606462240219116} -08/30/2021 13:38:36 - INFO - __main__ - Step 2363: {'lr': 0.0004999926192357836, 'samples': 453696, 'steps': 2362, 'loss/train': 3.055013656616211} -08/30/2021 13:38:36 - INFO - __main__ - Step 2364: {'lr': 0.00049999257840196, 'samples': 453888, 'steps': 2363, 'loss/train': 3.5679545402526855} -08/30/2021 13:38:37 - INFO - __main__ - Step 2365: {'lr': 0.0004999925374554936, 'samples': 454080, 'steps': 2364, 'loss/train': 3.2827484607696533} -08/30/2021 13:38:37 - INFO - __main__ - Step 2366: {'lr': 0.0004999924963963845, 'samples': 454272, 'steps': 2365, 'loss/train': 3.22670578956604} -08/30/2021 13:38:37 - INFO - __main__ - Step 2367: {'lr': 0.0004999924552246324, 'samples': 454464, 'steps': 2366, 'loss/train': 3.738640546798706} -08/30/2021 13:38:39 - INFO - __main__ - Step 2368: {'lr': 0.0004999924139402378, 'samples': 454656, 'steps': 2367, 'loss/train': 3.8646726608276367} -08/30/2021 13:38:39 - INFO - __main__ - Step 2369: {'lr': 0.0004999923725432004, 'samples': 454848, 'steps': 2368, 'loss/train': 3.3699100017547607} -08/30/2021 13:38:39 - INFO - __main__ - Step 2370: {'lr': 0.0004999923310335202, 'samples': 455040, 'steps': 2369, 'loss/train': 2.9062230587005615} -08/30/2021 13:38:40 - INFO - __main__ - Step 2371: {'lr': 0.0004999922894111975, 'samples': 455232, 'steps': 2370, 'loss/train': 2.65940523147583} -08/30/2021 13:38:40 - INFO - __main__ - Step 2372: {'lr': 0.000499992247676232, 'samples': 455424, 'steps': 2371, 'loss/train': 3.379642963409424} -08/30/2021 13:38:42 - INFO - __main__ - Step 2373: {'lr': 0.0004999922058286238, 'samples': 455616, 'steps': 2372, 'loss/train': 2.7595129013061523} -08/30/2021 13:38:43 - INFO - __main__ - Step 2374: {'lr': 0.0004999921638683731, 'samples': 455808, 'steps': 2373, 'loss/train': 3.4127492904663086} -08/30/2021 13:38:43 - INFO - __main__ - Step 2375: {'lr': 0.0004999921217954797, 'samples': 456000, 'steps': 2374, 'loss/train': 3.960245370864868} -08/30/2021 13:38:43 - INFO - __main__ - Step 2376: {'lr': 0.0004999920796099437, 'samples': 456192, 'steps': 2375, 'loss/train': 4.573826313018799} -08/30/2021 13:38:44 - INFO - __main__ - Step 2377: {'lr': 0.0004999920373117652, 'samples': 456384, 'steps': 2376, 'loss/train': 3.424320697784424} -08/30/2021 13:38:45 - INFO - __main__ - Step 2378: {'lr': 0.0004999919949009442, 'samples': 456576, 'steps': 2377, 'loss/train': 3.022109031677246} -08/30/2021 13:38:46 - INFO - __main__ - Step 2379: {'lr': 0.0004999919523774806, 'samples': 456768, 'steps': 2378, 'loss/train': 3.9209976196289062} -08/30/2021 13:38:46 - INFO - __main__ - Step 2380: {'lr': 0.0004999919097413743, 'samples': 456960, 'steps': 2379, 'loss/train': 3.20947527885437} -08/30/2021 13:38:46 - INFO - __main__ - Step 2381: {'lr': 0.0004999918669926258, 'samples': 457152, 'steps': 2380, 'loss/train': 3.571824312210083} -08/30/2021 13:38:47 - INFO - __main__ - Step 2382: {'lr': 0.0004999918241312346, 'samples': 457344, 'steps': 2381, 'loss/train': 4.165573596954346} -08/30/2021 13:38:48 - INFO - __main__ - Step 2383: {'lr': 0.0004999917811572011, 'samples': 457536, 'steps': 2382, 'loss/train': 3.543983221054077} -08/30/2021 13:38:49 - INFO - __main__ - Step 2384: {'lr': 0.000499991738070525, 'samples': 457728, 'steps': 2383, 'loss/train': 3.2464683055877686} -08/30/2021 13:38:49 - INFO - __main__ - Step 2385: {'lr': 0.0004999916948712066, 'samples': 457920, 'steps': 2384, 'loss/train': 4.028754711151123} -08/30/2021 13:38:50 - INFO - __main__ - Step 2386: {'lr': 0.0004999916515592458, 'samples': 458112, 'steps': 2385, 'loss/train': 2.846074104309082} -08/30/2021 13:38:50 - INFO - __main__ - Step 2387: {'lr': 0.0004999916081346426, 'samples': 458304, 'steps': 2386, 'loss/train': 3.153379201889038} -08/30/2021 13:38:52 - INFO - __main__ - Step 2388: {'lr': 0.000499991564597397, 'samples': 458496, 'steps': 2387, 'loss/train': 3.519200086593628} -08/30/2021 13:38:52 - INFO - __main__ - Step 2389: {'lr': 0.0004999915209475091, 'samples': 458688, 'steps': 2388, 'loss/train': 3.616925001144409} -08/30/2021 13:38:52 - INFO - __main__ - Step 2390: {'lr': 0.0004999914771849788, 'samples': 458880, 'steps': 2389, 'loss/train': 2.9786550998687744} -08/30/2021 13:38:53 - INFO - __main__ - Step 2391: {'lr': 0.0004999914333098063, 'samples': 459072, 'steps': 2390, 'loss/train': 3.6126270294189453} -08/30/2021 13:38:53 - INFO - __main__ - Step 2392: {'lr': 0.0004999913893219915, 'samples': 459264, 'steps': 2391, 'loss/train': 3.707750082015991} -08/30/2021 13:38:54 - INFO - __main__ - Step 2393: {'lr': 0.0004999913452215345, 'samples': 459456, 'steps': 2392, 'loss/train': 3.7249889373779297} -08/30/2021 13:38:55 - INFO - __main__ - Step 2394: {'lr': 0.0004999913010084351, 'samples': 459648, 'steps': 2393, 'loss/train': 3.313490867614746} -08/30/2021 13:38:55 - INFO - __main__ - Step 2395: {'lr': 0.0004999912566826935, 'samples': 459840, 'steps': 2394, 'loss/train': 2.9527111053466797} -08/30/2021 13:38:56 - INFO - __main__ - Step 2396: {'lr': 0.0004999912122443098, 'samples': 460032, 'steps': 2395, 'loss/train': 3.189500570297241} -08/30/2021 13:38:56 - INFO - __main__ - Step 2397: {'lr': 0.0004999911676932838, 'samples': 460224, 'steps': 2396, 'loss/train': 4.016993045806885} -08/30/2021 13:38:56 - INFO - __main__ - Step 2398: {'lr': 0.0004999911230296158, 'samples': 460416, 'steps': 2397, 'loss/train': 5.025796413421631} -08/30/2021 13:38:58 - INFO - __main__ - Step 2399: {'lr': 0.0004999910782533055, 'samples': 460608, 'steps': 2398, 'loss/train': 2.0938472747802734} -08/30/2021 13:38:58 - INFO - __main__ - Step 2400: {'lr': 0.0004999910333643531, 'samples': 460800, 'steps': 2399, 'loss/train': 2.946650505065918} -08/30/2021 13:38:59 - INFO - __main__ - Step 2401: {'lr': 0.0004999909883627587, 'samples': 460992, 'steps': 2400, 'loss/train': 3.4790730476379395} -08/30/2021 13:38:59 - INFO - __main__ - Step 2402: {'lr': 0.0004999909432485221, 'samples': 461184, 'steps': 2401, 'loss/train': 1.8312193155288696} -08/30/2021 13:38:59 - INFO - __main__ - Step 2403: {'lr': 0.0004999908980216436, 'samples': 461376, 'steps': 2402, 'loss/train': 2.963334083557129} -08/30/2021 13:39:01 - INFO - __main__ - Step 2404: {'lr': 0.0004999908526821229, 'samples': 461568, 'steps': 2403, 'loss/train': 3.677765130996704} -08/30/2021 13:39:01 - INFO - __main__ - Step 2405: {'lr': 0.0004999908072299602, 'samples': 461760, 'steps': 2404, 'loss/train': 3.313152551651001} -08/30/2021 13:39:01 - INFO - __main__ - Step 2406: {'lr': 0.0004999907616651556, 'samples': 461952, 'steps': 2405, 'loss/train': 3.7477095127105713} -08/30/2021 13:39:02 - INFO - __main__ - Step 2407: {'lr': 0.000499990715987709, 'samples': 462144, 'steps': 2406, 'loss/train': 3.4406871795654297} -08/30/2021 13:39:02 - INFO - __main__ - Step 2408: {'lr': 0.0004999906701976203, 'samples': 462336, 'steps': 2407, 'loss/train': 3.336057186126709} -08/30/2021 13:39:04 - INFO - __main__ - Step 2409: {'lr': 0.0004999906242948898, 'samples': 462528, 'steps': 2408, 'loss/train': 2.045273542404175} -08/30/2021 13:39:04 - INFO - __main__ - Step 2410: {'lr': 0.0004999905782795173, 'samples': 462720, 'steps': 2409, 'loss/train': 3.7166590690612793} -08/30/2021 13:39:04 - INFO - __main__ - Step 2411: {'lr': 0.000499990532151503, 'samples': 462912, 'steps': 2410, 'loss/train': 3.179212808609009} -08/30/2021 13:39:05 - INFO - __main__ - Step 2412: {'lr': 0.0004999904859108467, 'samples': 463104, 'steps': 2411, 'loss/train': 3.3981876373291016} -08/30/2021 13:39:05 - INFO - __main__ - Step 2413: {'lr': 0.0004999904395575486, 'samples': 463296, 'steps': 2412, 'loss/train': 3.156912088394165} -08/30/2021 13:39:07 - INFO - __main__ - Step 2414: {'lr': 0.0004999903930916087, 'samples': 463488, 'steps': 2413, 'loss/train': 3.3669259548187256} -08/30/2021 13:39:07 - INFO - __main__ - Step 2415: {'lr': 0.000499990346513027, 'samples': 463680, 'steps': 2414, 'loss/train': 3.3963608741760254} -08/30/2021 13:39:08 - INFO - __main__ - Step 2416: {'lr': 0.0004999902998218034, 'samples': 463872, 'steps': 2415, 'loss/train': 3.2971057891845703} -08/30/2021 13:39:08 - INFO - __main__ - Step 2417: {'lr': 0.000499990253017938, 'samples': 464064, 'steps': 2416, 'loss/train': 3.180245876312256} -08/30/2021 13:39:08 - INFO - __main__ - Step 2418: {'lr': 0.0004999902061014311, 'samples': 464256, 'steps': 2417, 'loss/train': 2.1976773738861084} -08/30/2021 13:39:09 - INFO - __main__ - Step 2419: {'lr': 0.0004999901590722823, 'samples': 464448, 'steps': 2418, 'loss/train': 3.4911413192749023} -08/30/2021 13:39:10 - INFO - __main__ - Step 2420: {'lr': 0.0004999901119304919, 'samples': 464640, 'steps': 2419, 'loss/train': 3.558926582336426} -08/30/2021 13:39:11 - INFO - __main__ - Step 2421: {'lr': 0.0004999900646760597, 'samples': 464832, 'steps': 2420, 'loss/train': 3.358968734741211} -08/30/2021 13:39:11 - INFO - __main__ - Step 2422: {'lr': 0.0004999900173089858, 'samples': 465024, 'steps': 2421, 'loss/train': 3.1792385578155518} -08/30/2021 13:39:11 - INFO - __main__ - Step 2423: {'lr': 0.0004999899698292703, 'samples': 465216, 'steps': 2422, 'loss/train': 4.46215295791626} -08/30/2021 13:39:12 - INFO - __main__ - Step 2424: {'lr': 0.0004999899222369132, 'samples': 465408, 'steps': 2423, 'loss/train': 2.913651704788208} -08/30/2021 13:39:13 - INFO - __main__ - Step 2425: {'lr': 0.0004999898745319145, 'samples': 465600, 'steps': 2424, 'loss/train': 3.9791011810302734} -08/30/2021 13:39:14 - INFO - __main__ - Step 2426: {'lr': 0.0004999898267142741, 'samples': 465792, 'steps': 2425, 'loss/train': 3.211440324783325} -08/30/2021 13:39:14 - INFO - __main__ - Step 2427: {'lr': 0.0004999897787839923, 'samples': 465984, 'steps': 2426, 'loss/train': 4.253355979919434} -08/30/2021 13:39:14 - INFO - __main__ - Step 2428: {'lr': 0.000499989730741069, 'samples': 466176, 'steps': 2427, 'loss/train': 3.0943493843078613} -08/30/2021 13:39:15 - INFO - __main__ - Step 2429: {'lr': 0.000499989682585504, 'samples': 466368, 'steps': 2428, 'loss/train': 3.28936767578125} -08/30/2021 13:39:17 - INFO - __main__ - Step 2430: {'lr': 0.0004999896343172976, 'samples': 466560, 'steps': 2429, 'loss/train': 4.029385089874268} -08/30/2021 13:39:17 - INFO - __main__ - Step 2431: {'lr': 0.0004999895859364498, 'samples': 466752, 'steps': 2430, 'loss/train': 3.9884324073791504} -08/30/2021 13:39:18 - INFO - __main__ - Step 2432: {'lr': 0.0004999895374429605, 'samples': 466944, 'steps': 2431, 'loss/train': 3.7134838104248047} -08/30/2021 13:39:18 - INFO - __main__ - Step 2433: {'lr': 0.0004999894888368297, 'samples': 467136, 'steps': 2432, 'loss/train': 3.9085521697998047} -08/30/2021 13:39:18 - INFO - __main__ - Step 2434: {'lr': 0.0004999894401180576, 'samples': 467328, 'steps': 2433, 'loss/train': 2.209113121032715} -08/30/2021 13:39:20 - INFO - __main__ - Step 2435: {'lr': 0.0004999893912866441, 'samples': 467520, 'steps': 2434, 'loss/train': 3.9369819164276123} -08/30/2021 13:39:20 - INFO - __main__ - Step 2436: {'lr': 0.0004999893423425892, 'samples': 467712, 'steps': 2435, 'loss/train': 4.0529890060424805} -08/30/2021 13:39:21 - INFO - __main__ - Step 2437: {'lr': 0.0004999892932858929, 'samples': 467904, 'steps': 2436, 'loss/train': 3.331840753555298} -08/30/2021 13:39:21 - INFO - __main__ - Step 2438: {'lr': 0.0004999892441165554, 'samples': 468096, 'steps': 2437, 'loss/train': 3.2444252967834473} -08/30/2021 13:39:21 - INFO - __main__ - Step 2439: {'lr': 0.0004999891948345765, 'samples': 468288, 'steps': 2438, 'loss/train': 3.1652252674102783} -08/30/2021 13:39:23 - INFO - __main__ - Step 2440: {'lr': 0.0004999891454399565, 'samples': 468480, 'steps': 2439, 'loss/train': 3.267704725265503} -08/30/2021 13:39:23 - INFO - __main__ - Step 2441: {'lr': 0.000499989095932695, 'samples': 468672, 'steps': 2440, 'loss/train': 4.30018949508667} -08/30/2021 13:39:24 - INFO - __main__ - Step 2442: {'lr': 0.0004999890463127924, 'samples': 468864, 'steps': 2441, 'loss/train': 4.094340801239014} -08/30/2021 13:39:24 - INFO - __main__ - Step 2443: {'lr': 0.0004999889965802486, 'samples': 469056, 'steps': 2442, 'loss/train': 4.673208236694336} -08/30/2021 13:39:24 - INFO - __main__ - Step 2444: {'lr': 0.0004999889467350636, 'samples': 469248, 'steps': 2443, 'loss/train': 3.901282548904419} -08/30/2021 13:39:25 - INFO - __main__ - Step 2445: {'lr': 0.0004999888967772375, 'samples': 469440, 'steps': 2444, 'loss/train': 4.057990550994873} -08/30/2021 13:39:26 - INFO - __main__ - Step 2446: {'lr': 0.0004999888467067702, 'samples': 469632, 'steps': 2445, 'loss/train': 4.6610589027404785} -08/30/2021 13:39:27 - INFO - __main__ - Step 2447: {'lr': 0.0004999887965236617, 'samples': 469824, 'steps': 2446, 'loss/train': 3.1241021156311035} -08/30/2021 13:39:27 - INFO - __main__ - Step 2448: {'lr': 0.0004999887462279123, 'samples': 470016, 'steps': 2447, 'loss/train': 3.665513515472412} -08/30/2021 13:39:27 - INFO - __main__ - Step 2449: {'lr': 0.0004999886958195216, 'samples': 470208, 'steps': 2448, 'loss/train': 3.249267816543579} -08/30/2021 13:39:28 - INFO - __main__ - Step 2450: {'lr': 0.00049998864529849, 'samples': 470400, 'steps': 2449, 'loss/train': 3.2747325897216797} -08/30/2021 13:39:29 - INFO - __main__ - Step 2451: {'lr': 0.0004999885946648174, 'samples': 470592, 'steps': 2450, 'loss/train': 3.5657455921173096} -08/30/2021 13:39:30 - INFO - __main__ - Step 2452: {'lr': 0.0004999885439185037, 'samples': 470784, 'steps': 2451, 'loss/train': 2.537431478500366} -08/30/2021 13:39:30 - INFO - __main__ - Step 2453: {'lr': 0.0004999884930595491, 'samples': 470976, 'steps': 2452, 'loss/train': 2.845932960510254} -08/30/2021 13:39:30 - INFO - __main__ - Step 2454: {'lr': 0.0004999884420879534, 'samples': 471168, 'steps': 2453, 'loss/train': 3.258159875869751} -08/30/2021 13:39:31 - INFO - __main__ - Step 2455: {'lr': 0.000499988391003717, 'samples': 471360, 'steps': 2454, 'loss/train': 2.972184419631958} -08/30/2021 13:39:32 - INFO - __main__ - Step 2456: {'lr': 0.0004999883398068396, 'samples': 471552, 'steps': 2455, 'loss/train': 3.4724526405334473} -08/30/2021 13:39:33 - INFO - __main__ - Step 2457: {'lr': 0.0004999882884973212, 'samples': 471744, 'steps': 2456, 'loss/train': 5.70952844619751} -08/30/2021 13:39:33 - INFO - __main__ - Step 2458: {'lr': 0.000499988237075162, 'samples': 471936, 'steps': 2457, 'loss/train': 2.890782594680786} -08/30/2021 13:39:34 - INFO - __main__ - Step 2459: {'lr': 0.000499988185540362, 'samples': 472128, 'steps': 2458, 'loss/train': 3.2589898109436035} -08/30/2021 13:39:34 - INFO - __main__ - Step 2460: {'lr': 0.0004999881338929211, 'samples': 472320, 'steps': 2459, 'loss/train': 3.168170213699341} -08/30/2021 13:39:35 - INFO - __main__ - Step 2461: {'lr': 0.0004999880821328395, 'samples': 472512, 'steps': 2460, 'loss/train': 3.469691276550293} -08/30/2021 13:39:36 - INFO - __main__ - Step 2462: {'lr': 0.000499988030260117, 'samples': 472704, 'steps': 2461, 'loss/train': 4.25238037109375} -08/30/2021 13:39:36 - INFO - __main__ - Step 2463: {'lr': 0.0004999879782747539, 'samples': 472896, 'steps': 2462, 'loss/train': 3.698615074157715} -08/30/2021 13:39:36 - INFO - __main__ - Step 2464: {'lr': 0.00049998792617675, 'samples': 473088, 'steps': 2463, 'loss/train': 3.922322988510132} -08/30/2021 13:39:37 - INFO - __main__ - Step 2465: {'lr': 0.0004999878739661053, 'samples': 473280, 'steps': 2464, 'loss/train': 3.4149012565612793} -08/30/2021 13:39:38 - INFO - __main__ - Step 2466: {'lr': 0.0004999878216428201, 'samples': 473472, 'steps': 2465, 'loss/train': 3.7355833053588867} -08/30/2021 13:39:39 - INFO - __main__ - Step 2467: {'lr': 0.0004999877692068942, 'samples': 473664, 'steps': 2466, 'loss/train': 3.661376953125} -08/30/2021 13:39:39 - INFO - __main__ - Step 2468: {'lr': 0.0004999877166583276, 'samples': 473856, 'steps': 2467, 'loss/train': 3.195875406265259} -08/30/2021 13:39:40 - INFO - __main__ - Step 2469: {'lr': 0.0004999876639971204, 'samples': 474048, 'steps': 2468, 'loss/train': 3.488727569580078} -08/30/2021 13:39:40 - INFO - __main__ - Step 2470: {'lr': 0.0004999876112232726, 'samples': 474240, 'steps': 2469, 'loss/train': 3.3036279678344727} -08/30/2021 13:39:41 - INFO - __main__ - Step 2471: {'lr': 0.0004999875583367844, 'samples': 474432, 'steps': 2470, 'loss/train': 3.79384183883667} -08/30/2021 13:39:42 - INFO - __main__ - Step 2472: {'lr': 0.0004999875053376555, 'samples': 474624, 'steps': 2471, 'loss/train': 2.880828857421875} -08/30/2021 13:39:42 - INFO - __main__ - Step 2473: {'lr': 0.0004999874522258861, 'samples': 474816, 'steps': 2472, 'loss/train': 3.9294240474700928} -08/30/2021 13:39:43 - INFO - __main__ - Step 2474: {'lr': 0.0004999873990014763, 'samples': 475008, 'steps': 2473, 'loss/train': 3.158289909362793} -08/30/2021 13:39:43 - INFO - __main__ - Step 2475: {'lr': 0.0004999873456644259, 'samples': 475200, 'steps': 2474, 'loss/train': 2.3990821838378906} -08/30/2021 13:39:44 - INFO - __main__ - Step 2476: {'lr': 0.0004999872922147352, 'samples': 475392, 'steps': 2475, 'loss/train': 3.361088275909424} -08/30/2021 13:39:45 - INFO - __main__ - Step 2477: {'lr': 0.0004999872386524041, 'samples': 475584, 'steps': 2476, 'loss/train': 3.6757729053497314} -08/30/2021 13:39:45 - INFO - __main__ - Step 2478: {'lr': 0.0004999871849774325, 'samples': 475776, 'steps': 2477, 'loss/train': 3.659137725830078} -08/30/2021 13:39:46 - INFO - __main__ - Step 2479: {'lr': 0.0004999871311898205, 'samples': 475968, 'steps': 2478, 'loss/train': 3.3369903564453125} -08/30/2021 13:39:46 - INFO - __main__ - Step 2480: {'lr': 0.0004999870772895683, 'samples': 476160, 'steps': 2479, 'loss/train': 3.4437551498413086} -08/30/2021 13:39:48 - INFO - __main__ - Step 2481: {'lr': 0.0004999870232766756, 'samples': 476352, 'steps': 2480, 'loss/train': 3.702115297317505} -08/30/2021 13:39:49 - INFO - __main__ - Step 2482: {'lr': 0.0004999869691511428, 'samples': 476544, 'steps': 2481, 'loss/train': 4.077302932739258} -08/30/2021 13:39:49 - INFO - __main__ - Step 2483: {'lr': 0.0004999869149129696, 'samples': 476736, 'steps': 2482, 'loss/train': 3.502058506011963} -08/30/2021 13:39:49 - INFO - __main__ - Step 2484: {'lr': 0.0004999868605621563, 'samples': 476928, 'steps': 2483, 'loss/train': 3.562957525253296} -08/30/2021 13:39:50 - INFO - __main__ - Step 2485: {'lr': 0.0004999868060987027, 'samples': 477120, 'steps': 2484, 'loss/train': 2.818432569503784} -08/30/2021 13:39:50 - INFO - __main__ - Step 2486: {'lr': 0.0004999867515226088, 'samples': 477312, 'steps': 2485, 'loss/train': 3.346011161804199} -08/30/2021 13:39:51 - INFO - __main__ - Step 2487: {'lr': 0.0004999866968338748, 'samples': 477504, 'steps': 2486, 'loss/train': 1.1037997007369995} -08/30/2021 13:39:52 - INFO - __main__ - Step 2488: {'lr': 0.0004999866420325006, 'samples': 477696, 'steps': 2487, 'loss/train': 3.7922840118408203} -08/30/2021 13:39:52 - INFO - __main__ - Step 2489: {'lr': 0.0004999865871184863, 'samples': 477888, 'steps': 2488, 'loss/train': 3.2803664207458496} -08/30/2021 13:39:53 - INFO - __main__ - Step 2490: {'lr': 0.000499986532091832, 'samples': 478080, 'steps': 2489, 'loss/train': 3.34903883934021} -08/30/2021 13:39:53 - INFO - __main__ - Step 2491: {'lr': 0.0004999864769525375, 'samples': 478272, 'steps': 2490, 'loss/train': 3.25426983833313} -08/30/2021 13:39:54 - INFO - __main__ - Step 2492: {'lr': 0.000499986421700603, 'samples': 478464, 'steps': 2491, 'loss/train': 3.161381959915161} -08/30/2021 13:39:55 - INFO - __main__ - Step 2493: {'lr': 0.0004999863663360285, 'samples': 478656, 'steps': 2492, 'loss/train': 3.2575273513793945} -08/30/2021 13:39:55 - INFO - __main__ - Step 2494: {'lr': 0.000499986310858814, 'samples': 478848, 'steps': 2493, 'loss/train': 2.6650431156158447} -08/30/2021 13:39:56 - INFO - __main__ - Step 2495: {'lr': 0.0004999862552689595, 'samples': 479040, 'steps': 2494, 'loss/train': 3.0776734352111816} -08/30/2021 13:39:56 - INFO - __main__ - Step 2496: {'lr': 0.000499986199566465, 'samples': 479232, 'steps': 2495, 'loss/train': 3.138657808303833} -08/30/2021 13:39:57 - INFO - __main__ - Step 2497: {'lr': 0.0004999861437513306, 'samples': 479424, 'steps': 2496, 'loss/train': 1.8879177570343018} -08/30/2021 13:39:58 - INFO - __main__ - Step 2498: {'lr': 0.0004999860878235564, 'samples': 479616, 'steps': 2497, 'loss/train': 3.305360794067383} -08/30/2021 13:39:58 - INFO - __main__ - Step 2499: {'lr': 0.0004999860317831423, 'samples': 479808, 'steps': 2498, 'loss/train': 3.1247971057891846} -08/30/2021 13:39:59 - INFO - __main__ - Step 2500: {'lr': 0.0004999859756300883, 'samples': 480000, 'steps': 2499, 'loss/train': 3.1875553131103516} -08/30/2021 13:39:59 - INFO - __main__ - Step 2501: {'lr': 0.0004999859193643945, 'samples': 480192, 'steps': 2500, 'loss/train': 3.408926010131836} -08/30/2021 13:40:01 - INFO - __main__ - Step 2502: {'lr': 0.0004999858629860609, 'samples': 480384, 'steps': 2501, 'loss/train': 3.225663900375366} -08/30/2021 13:40:01 - INFO - __main__ - Step 2503: {'lr': 0.0004999858064950875, 'samples': 480576, 'steps': 2502, 'loss/train': 2.3713886737823486} -08/30/2021 13:40:01 - INFO - __main__ - Step 2504: {'lr': 0.0004999857498914744, 'samples': 480768, 'steps': 2503, 'loss/train': 2.82582688331604} -08/30/2021 13:40:02 - INFO - __main__ - Step 2505: {'lr': 0.0004999856931752215, 'samples': 480960, 'steps': 2504, 'loss/train': 3.6427695751190186} -08/30/2021 13:40:02 - INFO - __main__ - Step 2506: {'lr': 0.000499985636346329, 'samples': 481152, 'steps': 2505, 'loss/train': 2.7283215522766113} -08/30/2021 13:40:04 - INFO - __main__ - Step 2507: {'lr': 0.0004999855794047968, 'samples': 481344, 'steps': 2506, 'loss/train': 3.2982444763183594} -08/30/2021 13:40:04 - INFO - __main__ - Step 2508: {'lr': 0.000499985522350625, 'samples': 481536, 'steps': 2507, 'loss/train': 3.2410199642181396} -08/30/2021 13:40:05 - INFO - __main__ - Step 2509: {'lr': 0.0004999854651838134, 'samples': 481728, 'steps': 2508, 'loss/train': 3.3344876766204834} -08/30/2021 13:40:05 - INFO - __main__ - Step 2510: {'lr': 0.0004999854079043624, 'samples': 481920, 'steps': 2509, 'loss/train': 1.1394327878952026} -08/30/2021 13:40:05 - INFO - __main__ - Step 2511: {'lr': 0.0004999853505122718, 'samples': 482112, 'steps': 2510, 'loss/train': 0.7066466212272644} -08/30/2021 13:40:07 - INFO - __main__ - Step 2512: {'lr': 0.0004999852930075416, 'samples': 482304, 'steps': 2511, 'loss/train': 3.296462059020996} -08/30/2021 13:40:07 - INFO - __main__ - Step 2513: {'lr': 0.0004999852353901719, 'samples': 482496, 'steps': 2512, 'loss/train': 2.5775790214538574} -08/30/2021 13:40:07 - INFO - __main__ - Step 2514: {'lr': 0.0004999851776601627, 'samples': 482688, 'steps': 2513, 'loss/train': 3.0068328380584717} -08/30/2021 13:40:08 - INFO - __main__ - Step 2515: {'lr': 0.0004999851198175141, 'samples': 482880, 'steps': 2514, 'loss/train': 3.845776319503784} -08/30/2021 13:40:08 - INFO - __main__ - Step 2516: {'lr': 0.0004999850618622259, 'samples': 483072, 'steps': 2515, 'loss/train': 3.6843724250793457} -08/30/2021 13:40:08 - INFO - __main__ - Step 2517: {'lr': 0.0004999850037942984, 'samples': 483264, 'steps': 2516, 'loss/train': 3.3851566314697266} -08/30/2021 13:40:10 - INFO - __main__ - Step 2518: {'lr': 0.0004999849456137316, 'samples': 483456, 'steps': 2517, 'loss/train': 2.5815160274505615} -08/30/2021 13:40:11 - INFO - __main__ - Step 2519: {'lr': 0.0004999848873205254, 'samples': 483648, 'steps': 2518, 'loss/train': 3.131572723388672} -08/30/2021 13:40:11 - INFO - __main__ - Step 2520: {'lr': 0.0004999848289146798, 'samples': 483840, 'steps': 2519, 'loss/train': 3.4908299446105957} -08/30/2021 13:40:11 - INFO - __main__ - Step 2521: {'lr': 0.0004999847703961948, 'samples': 484032, 'steps': 2520, 'loss/train': 3.4235336780548096} -08/30/2021 13:40:12 - INFO - __main__ - Step 2522: {'lr': 0.0004999847117650708, 'samples': 484224, 'steps': 2521, 'loss/train': 2.7699456214904785} -08/30/2021 13:40:13 - INFO - __main__ - Step 2523: {'lr': 0.0004999846530213074, 'samples': 484416, 'steps': 2522, 'loss/train': 3.3291280269622803} -08/30/2021 13:40:14 - INFO - __main__ - Step 2524: {'lr': 0.0004999845941649048, 'samples': 484608, 'steps': 2523, 'loss/train': 3.7320284843444824} -08/30/2021 13:40:14 - INFO - __main__ - Step 2525: {'lr': 0.0004999845351958629, 'samples': 484800, 'steps': 2524, 'loss/train': 0.8700743913650513} -08/30/2021 13:40:15 - INFO - __main__ - Step 2526: {'lr': 0.0004999844761141818, 'samples': 484992, 'steps': 2525, 'loss/train': 2.396313428878784} -08/30/2021 13:40:15 - INFO - __main__ - Step 2527: {'lr': 0.0004999844169198617, 'samples': 485184, 'steps': 2526, 'loss/train': 3.6103646755218506} -08/30/2021 13:40:16 - INFO - __main__ - Step 2528: {'lr': 0.0004999843576129024, 'samples': 485376, 'steps': 2527, 'loss/train': 3.05768084526062} -08/30/2021 13:40:17 - INFO - __main__ - Step 2529: {'lr': 0.000499984298193304, 'samples': 485568, 'steps': 2528, 'loss/train': 4.48790979385376} -08/30/2021 13:40:17 - INFO - __main__ - Step 2530: {'lr': 0.0004999842386610666, 'samples': 485760, 'steps': 2529, 'loss/train': 3.349534273147583} -08/30/2021 13:40:18 - INFO - __main__ - Step 2531: {'lr': 0.0004999841790161901, 'samples': 485952, 'steps': 2530, 'loss/train': 3.3274784088134766} -08/30/2021 13:40:18 - INFO - __main__ - Step 2532: {'lr': 0.0004999841192586746, 'samples': 486144, 'steps': 2531, 'loss/train': 3.838348865509033} -08/30/2021 13:40:20 - INFO - __main__ - Step 2533: {'lr': 0.0004999840593885201, 'samples': 486336, 'steps': 2532, 'loss/train': 3.1673481464385986} -08/30/2021 13:40:20 - INFO - __main__ - Step 2534: {'lr': 0.0004999839994057266, 'samples': 486528, 'steps': 2533, 'loss/train': 3.536339282989502} -08/30/2021 13:40:21 - INFO - __main__ - Step 2535: {'lr': 0.0004999839393102943, 'samples': 486720, 'steps': 2534, 'loss/train': 2.235766887664795} -08/30/2021 13:40:21 - INFO - __main__ - Step 2536: {'lr': 0.0004999838791022229, 'samples': 486912, 'steps': 2535, 'loss/train': 1.8790549039840698} -08/30/2021 13:40:21 - INFO - __main__ - Step 2537: {'lr': 0.0004999838187815128, 'samples': 487104, 'steps': 2536, 'loss/train': 3.3130922317504883} -08/30/2021 13:40:23 - INFO - __main__ - Step 2538: {'lr': 0.0004999837583481638, 'samples': 487296, 'steps': 2537, 'loss/train': 2.9206509590148926} -08/30/2021 13:40:24 - INFO - __main__ - Step 2539: {'lr': 0.000499983697802176, 'samples': 487488, 'steps': 2538, 'loss/train': 2.7371299266815186} -08/30/2021 13:40:24 - INFO - __main__ - Step 2540: {'lr': 0.0004999836371435494, 'samples': 487680, 'steps': 2539, 'loss/train': 3.4457602500915527} -08/30/2021 13:40:24 - INFO - __main__ - Step 2541: {'lr': 0.000499983576372284, 'samples': 487872, 'steps': 2540, 'loss/train': 3.235722303390503} -08/30/2021 13:40:25 - INFO - __main__ - Step 2542: {'lr': 0.0004999835154883798, 'samples': 488064, 'steps': 2541, 'loss/train': 3.3214685916900635} -08/30/2021 13:40:25 - INFO - __main__ - Step 2543: {'lr': 0.0004999834544918369, 'samples': 488256, 'steps': 2542, 'loss/train': 2.9445972442626953} -08/30/2021 13:40:27 - INFO - __main__ - Step 2544: {'lr': 0.0004999833933826554, 'samples': 488448, 'steps': 2543, 'loss/train': 3.240677833557129} -08/30/2021 13:40:27 - INFO - __main__ - Step 2545: {'lr': 0.0004999833321608351, 'samples': 488640, 'steps': 2544, 'loss/train': 2.8306660652160645} -08/30/2021 13:40:27 - INFO - __main__ - Step 2546: {'lr': 0.0004999832708263764, 'samples': 488832, 'steps': 2545, 'loss/train': 3.1749751567840576} -08/30/2021 13:40:28 - INFO - __main__ - Step 2547: {'lr': 0.000499983209379279, 'samples': 489024, 'steps': 2546, 'loss/train': 3.7916362285614014} -08/30/2021 13:40:28 - INFO - __main__ - Step 2548: {'lr': 0.0004999831478195429, 'samples': 489216, 'steps': 2547, 'loss/train': 3.540221691131592} -08/30/2021 13:40:29 - INFO - __main__ - Step 2549: {'lr': 0.0004999830861471684, 'samples': 489408, 'steps': 2548, 'loss/train': 0.5375320315361023} -08/30/2021 13:40:30 - INFO - __main__ - Step 2550: {'lr': 0.0004999830243621553, 'samples': 489600, 'steps': 2549, 'loss/train': 3.567222833633423} -08/30/2021 13:40:30 - INFO - __main__ - Step 2551: {'lr': 0.0004999829624645037, 'samples': 489792, 'steps': 2550, 'loss/train': 3.402311086654663} -08/30/2021 13:40:31 - INFO - __main__ - Step 2552: {'lr': 0.0004999829004542136, 'samples': 489984, 'steps': 2551, 'loss/train': 3.234229803085327} -08/30/2021 13:40:31 - INFO - __main__ - Step 2553: {'lr': 0.0004999828383312851, 'samples': 490176, 'steps': 2552, 'loss/train': 2.6774160861968994} -08/30/2021 13:40:32 - INFO - __main__ - Step 2554: {'lr': 0.0004999827760957182, 'samples': 490368, 'steps': 2553, 'loss/train': 2.777254581451416} -08/30/2021 13:40:33 - INFO - __main__ - Step 2555: {'lr': 0.000499982713747513, 'samples': 490560, 'steps': 2554, 'loss/train': 3.821315050125122} -08/30/2021 13:40:33 - INFO - __main__ - Step 2556: {'lr': 0.0004999826512866693, 'samples': 490752, 'steps': 2555, 'loss/train': 3.441488265991211} -08/30/2021 13:40:34 - INFO - __main__ - Step 2557: {'lr': 0.0004999825887131874, 'samples': 490944, 'steps': 2556, 'loss/train': 3.2371251583099365} -08/30/2021 13:40:34 - INFO - __main__ - Step 2558: {'lr': 0.0004999825260270671, 'samples': 491136, 'steps': 2557, 'loss/train': 3.3055927753448486} -08/30/2021 13:40:35 - INFO - __main__ - Step 2559: {'lr': 0.0004999824632283086, 'samples': 491328, 'steps': 2558, 'loss/train': 2.9721972942352295} -08/30/2021 13:40:36 - INFO - __main__ - Step 2560: {'lr': 0.0004999824003169119, 'samples': 491520, 'steps': 2559, 'loss/train': 3.119234085083008} -08/30/2021 13:40:36 - INFO - __main__ - Step 2561: {'lr': 0.000499982337292877, 'samples': 491712, 'steps': 2560, 'loss/train': 3.087674617767334} -08/30/2021 13:40:37 - INFO - __main__ - Step 2562: {'lr': 0.0004999822741562038, 'samples': 491904, 'steps': 2561, 'loss/train': 3.089181661605835} -08/30/2021 13:40:37 - INFO - __main__ - Step 2563: {'lr': 0.0004999822109068925, 'samples': 492096, 'steps': 2562, 'loss/train': 3.475480079650879} -08/30/2021 13:40:38 - INFO - __main__ - Step 2564: {'lr': 0.000499982147544943, 'samples': 492288, 'steps': 2563, 'loss/train': 3.0615687370300293} -08/30/2021 13:40:39 - INFO - __main__ - Step 2565: {'lr': 0.0004999820840703554, 'samples': 492480, 'steps': 2564, 'loss/train': 3.29472279548645} -08/30/2021 13:40:39 - INFO - __main__ - Step 2566: {'lr': 0.0004999820204831298, 'samples': 492672, 'steps': 2565, 'loss/train': 3.4640440940856934} -08/30/2021 13:40:40 - INFO - __main__ - Step 2567: {'lr': 0.0004999819567832661, 'samples': 492864, 'steps': 2566, 'loss/train': 2.8388006687164307} -08/30/2021 13:40:40 - INFO - __main__ - Step 2568: {'lr': 0.0004999818929707645, 'samples': 493056, 'steps': 2567, 'loss/train': 2.959890365600586} -08/30/2021 13:40:41 - INFO - __main__ - Step 2569: {'lr': 0.0004999818290456249, 'samples': 493248, 'steps': 2568, 'loss/train': 2.944700241088867} -08/30/2021 13:40:42 - INFO - __main__ - Step 2570: {'lr': 0.0004999817650078474, 'samples': 493440, 'steps': 2569, 'loss/train': 3.516746997833252} -08/30/2021 13:40:42 - INFO - __main__ - Step 2571: {'lr': 0.0004999817008574318, 'samples': 493632, 'steps': 2570, 'loss/train': 3.095552921295166} -08/30/2021 13:40:43 - INFO - __main__ - Step 2572: {'lr': 0.0004999816365943784, 'samples': 493824, 'steps': 2571, 'loss/train': 2.8601486682891846} -08/30/2021 13:40:43 - INFO - __main__ - Step 2573: {'lr': 0.000499981572218687, 'samples': 494016, 'steps': 2572, 'loss/train': 4.528290271759033} -08/30/2021 13:40:43 - INFO - __main__ - Step 2574: {'lr': 0.0004999815077303579, 'samples': 494208, 'steps': 2573, 'loss/train': 2.300426721572876} -08/30/2021 13:40:45 - INFO - __main__ - Step 2575: {'lr': 0.000499981443129391, 'samples': 494400, 'steps': 2574, 'loss/train': 3.0739119052886963} -08/30/2021 13:40:45 - INFO - __main__ - Step 2576: {'lr': 0.0004999813784157863, 'samples': 494592, 'steps': 2575, 'loss/train': 3.223848581314087} -08/30/2021 13:40:46 - INFO - __main__ - Step 2577: {'lr': 0.0004999813135895438, 'samples': 494784, 'steps': 2576, 'loss/train': 2.8425159454345703} -08/30/2021 13:40:46 - INFO - __main__ - Step 2578: {'lr': 0.0004999812486506637, 'samples': 494976, 'steps': 2577, 'loss/train': 2.773549795150757} -08/30/2021 13:40:46 - INFO - __main__ - Step 2579: {'lr': 0.0004999811835991457, 'samples': 495168, 'steps': 2578, 'loss/train': 2.3618130683898926} -08/30/2021 13:40:48 - INFO - __main__ - Step 2580: {'lr': 0.0004999811184349902, 'samples': 495360, 'steps': 2579, 'loss/train': 3.067438840866089} -08/30/2021 13:40:48 - INFO - __main__ - Step 2581: {'lr': 0.000499981053158197, 'samples': 495552, 'steps': 2580, 'loss/train': 3.2529942989349365} -08/30/2021 13:40:49 - INFO - __main__ - Step 2582: {'lr': 0.0004999809877687662, 'samples': 495744, 'steps': 2581, 'loss/train': 3.515986204147339} -08/30/2021 13:40:49 - INFO - __main__ - Step 2583: {'lr': 0.0004999809222666978, 'samples': 495936, 'steps': 2582, 'loss/train': 2.9327030181884766} -08/30/2021 13:40:49 - INFO - __main__ - Step 2584: {'lr': 0.0004999808566519919, 'samples': 496128, 'steps': 2583, 'loss/train': 3.3252201080322266} -08/30/2021 13:40:51 - INFO - __main__ - Step 2585: {'lr': 0.0004999807909246485, 'samples': 496320, 'steps': 2584, 'loss/train': 1.8364979028701782} -08/30/2021 13:40:51 - INFO - __main__ - Step 2586: {'lr': 0.0004999807250846676, 'samples': 496512, 'steps': 2585, 'loss/train': 3.141077756881714} -08/30/2021 13:40:52 - INFO - __main__ - Step 2587: {'lr': 0.0004999806591320492, 'samples': 496704, 'steps': 2586, 'loss/train': 3.338092088699341} -08/30/2021 13:40:52 - INFO - __main__ - Step 2588: {'lr': 0.0004999805930667934, 'samples': 496896, 'steps': 2587, 'loss/train': 3.1431477069854736} -08/30/2021 13:40:52 - INFO - __main__ - Step 2589: {'lr': 0.0004999805268889003, 'samples': 497088, 'steps': 2588, 'loss/train': 2.8831489086151123} -08/30/2021 13:40:54 - INFO - __main__ - Step 2590: {'lr': 0.0004999804605983697, 'samples': 497280, 'steps': 2589, 'loss/train': 2.7750606536865234} -08/30/2021 13:40:55 - INFO - __main__ - Step 2591: {'lr': 0.0004999803941952018, 'samples': 497472, 'steps': 2590, 'loss/train': 3.2433807849884033} -08/30/2021 13:40:55 - INFO - __main__ - Step 2592: {'lr': 0.0004999803276793965, 'samples': 497664, 'steps': 2591, 'loss/train': 3.106518268585205} -08/30/2021 13:40:56 - INFO - __main__ - Step 2593: {'lr': 0.0004999802610509541, 'samples': 497856, 'steps': 2592, 'loss/train': 2.863128900527954} -08/30/2021 13:40:56 - INFO - __main__ - Step 2594: {'lr': 0.0004999801943098743, 'samples': 498048, 'steps': 2593, 'loss/train': 3.7802350521087646} -08/30/2021 13:40:58 - INFO - __main__ - Step 2595: {'lr': 0.0004999801274561573, 'samples': 498240, 'steps': 2594, 'loss/train': 3.056262254714966} -08/30/2021 13:40:58 - INFO - __main__ - Step 2596: {'lr': 0.0004999800604898032, 'samples': 498432, 'steps': 2595, 'loss/train': 3.5432939529418945} -08/30/2021 13:40:58 - INFO - __main__ - Step 2597: {'lr': 0.000499979993410812, 'samples': 498624, 'steps': 2596, 'loss/train': 3.2634787559509277} -08/30/2021 13:40:59 - INFO - __main__ - Step 2598: {'lr': 0.0004999799262191835, 'samples': 498816, 'steps': 2597, 'loss/train': 0.46490105986595154} -08/30/2021 13:40:59 - INFO - __main__ - Step 2599: {'lr': 0.0004999798589149179, 'samples': 499008, 'steps': 2598, 'loss/train': 0.9940352439880371} -08/30/2021 13:41:01 - INFO - __main__ - Step 2600: {'lr': 0.0004999797914980154, 'samples': 499200, 'steps': 2599, 'loss/train': 3.4254579544067383} -08/30/2021 13:41:01 - INFO - __main__ - Step 2601: {'lr': 0.0004999797239684757, 'samples': 499392, 'steps': 2600, 'loss/train': 3.204349994659424} -08/30/2021 13:41:01 - INFO - __main__ - Step 2602: {'lr': 0.0004999796563262991, 'samples': 499584, 'steps': 2601, 'loss/train': 3.2098374366760254} -08/30/2021 13:41:02 - INFO - __main__ - Step 2603: {'lr': 0.0004999795885714855, 'samples': 499776, 'steps': 2602, 'loss/train': 3.2374396324157715} -08/30/2021 13:41:02 - INFO - __main__ - Step 2604: {'lr': 0.0004999795207040349, 'samples': 499968, 'steps': 2603, 'loss/train': 2.9048542976379395} -08/30/2021 13:41:02 - INFO - __main__ - Step 2605: {'lr': 0.0004999794527239474, 'samples': 500160, 'steps': 2604, 'loss/train': 1.4519882202148438} -08/30/2021 13:41:04 - INFO - __main__ - Step 2606: {'lr': 0.000499979384631223, 'samples': 500352, 'steps': 2605, 'loss/train': 3.092986583709717} -08/30/2021 13:41:05 - INFO - __main__ - Step 2607: {'lr': 0.000499979316425862, 'samples': 500544, 'steps': 2606, 'loss/train': 3.087824821472168} -08/30/2021 13:41:05 - INFO - __main__ - Step 2608: {'lr': 0.0004999792481078639, 'samples': 500736, 'steps': 2607, 'loss/train': 0.5084215998649597} -08/30/2021 13:41:05 - INFO - __main__ - Step 2609: {'lr': 0.000499979179677229, 'samples': 500928, 'steps': 2608, 'loss/train': 2.7436444759368896} -08/30/2021 13:41:06 - INFO - __main__ - Step 2610: {'lr': 0.0004999791111339574, 'samples': 501120, 'steps': 2609, 'loss/train': 2.876444101333618} -08/30/2021 13:41:07 - INFO - __main__ - Step 2611: {'lr': 0.0004999790424780492, 'samples': 501312, 'steps': 2610, 'loss/train': 3.3328187465667725} -08/30/2021 13:41:08 - INFO - __main__ - Step 2612: {'lr': 0.0004999789737095041, 'samples': 501504, 'steps': 2611, 'loss/train': 3.361556053161621} -08/30/2021 13:41:08 - INFO - __main__ - Step 2613: {'lr': 0.0004999789048283224, 'samples': 501696, 'steps': 2612, 'loss/train': 2.887472152709961} -08/30/2021 13:41:08 - INFO - __main__ - Step 2614: {'lr': 0.0004999788358345041, 'samples': 501888, 'steps': 2613, 'loss/train': 3.410672903060913} -08/30/2021 13:41:09 - INFO - __main__ - Step 2615: {'lr': 0.0004999787667280492, 'samples': 502080, 'steps': 2614, 'loss/train': 3.250086784362793} -08/30/2021 13:41:10 - INFO - __main__ - Step 2616: {'lr': 0.0004999786975089577, 'samples': 502272, 'steps': 2615, 'loss/train': 3.8277294635772705} -08/30/2021 13:41:11 - INFO - __main__ - Step 2617: {'lr': 0.0004999786281772296, 'samples': 502464, 'steps': 2616, 'loss/train': 2.623059034347534} -08/30/2021 13:41:11 - INFO - __main__ - Step 2618: {'lr': 0.0004999785587328651, 'samples': 502656, 'steps': 2617, 'loss/train': 2.9890518188476562} -08/30/2021 13:41:11 - INFO - __main__ - Step 2619: {'lr': 0.0004999784891758641, 'samples': 502848, 'steps': 2618, 'loss/train': 3.5353376865386963} -08/30/2021 13:41:12 - INFO - __main__ - Step 2620: {'lr': 0.0004999784195062266, 'samples': 503040, 'steps': 2619, 'loss/train': 3.4909520149230957} -08/30/2021 13:41:13 - INFO - __main__ - Step 2621: {'lr': 0.0004999783497239526, 'samples': 503232, 'steps': 2620, 'loss/train': 3.193816661834717} -08/30/2021 13:41:13 - INFO - __main__ - Step 2622: {'lr': 0.0004999782798290424, 'samples': 503424, 'steps': 2621, 'loss/train': 3.023629903793335} -08/30/2021 13:41:14 - INFO - __main__ - Step 2623: {'lr': 0.0004999782098214957, 'samples': 503616, 'steps': 2622, 'loss/train': 2.9927542209625244} -08/30/2021 13:41:14 - INFO - __main__ - Step 2624: {'lr': 0.0004999781397013127, 'samples': 503808, 'steps': 2623, 'loss/train': 3.0726561546325684} -08/30/2021 13:41:14 - INFO - __main__ - Step 2625: {'lr': 0.0004999780694684934, 'samples': 504000, 'steps': 2624, 'loss/train': 3.3661868572235107} -08/30/2021 13:41:16 - INFO - __main__ - Step 2626: {'lr': 0.000499977999123038, 'samples': 504192, 'steps': 2625, 'loss/train': 3.088892698287964} -08/30/2021 13:41:16 - INFO - __main__ - Step 2627: {'lr': 0.0004999779286649461, 'samples': 504384, 'steps': 2626, 'loss/train': 2.8224613666534424} -08/30/2021 13:41:17 - INFO - __main__ - Step 2628: {'lr': 0.0004999778580942183, 'samples': 504576, 'steps': 2627, 'loss/train': 3.0479722023010254} -08/30/2021 13:41:17 - INFO - __main__ - Step 2629: {'lr': 0.000499977787410854, 'samples': 504768, 'steps': 2628, 'loss/train': 2.738128900527954} -08/30/2021 13:41:17 - INFO - __main__ - Step 2630: {'lr': 0.0004999777166148539, 'samples': 504960, 'steps': 2629, 'loss/train': 3.167553186416626} -08/30/2021 13:41:19 - INFO - __main__ - Step 2631: {'lr': 0.0004999776457062175, 'samples': 505152, 'steps': 2630, 'loss/train': 3.0850493907928467} -08/30/2021 13:41:19 - INFO - __main__ - Step 2632: {'lr': 0.0004999775746849451, 'samples': 505344, 'steps': 2631, 'loss/train': 2.834916353225708} -08/30/2021 13:41:20 - INFO - __main__ - Step 2633: {'lr': 0.0004999775035510367, 'samples': 505536, 'steps': 2632, 'loss/train': 3.749802827835083} -08/30/2021 13:41:20 - INFO - __main__ - Step 2634: {'lr': 0.0004999774323044922, 'samples': 505728, 'steps': 2633, 'loss/train': 0.6642865538597107} -08/30/2021 13:41:21 - INFO - __main__ - Step 2635: {'lr': 0.0004999773609453118, 'samples': 505920, 'steps': 2634, 'loss/train': 3.4033918380737305} -08/30/2021 13:41:22 - INFO - __main__ - Step 2636: {'lr': 0.0004999772894734954, 'samples': 506112, 'steps': 2635, 'loss/train': 2.8993465900421143} -08/30/2021 13:41:22 - INFO - __main__ - Step 2637: {'lr': 0.000499977217889043, 'samples': 506304, 'steps': 2636, 'loss/train': 2.7557549476623535} -08/30/2021 13:41:23 - INFO - __main__ - Step 2638: {'lr': 0.0004999771461919549, 'samples': 506496, 'steps': 2637, 'loss/train': 2.9272453784942627} -08/30/2021 13:41:23 - INFO - __main__ - Step 2639: {'lr': 0.0004999770743822309, 'samples': 506688, 'steps': 2638, 'loss/train': 3.2562336921691895} -08/30/2021 13:41:24 - INFO - __main__ - Step 2640: {'lr': 0.0004999770024598711, 'samples': 506880, 'steps': 2639, 'loss/train': 0.7742186784744263} -08/30/2021 13:41:26 - INFO - __main__ - Step 2641: {'lr': 0.0004999769304248754, 'samples': 507072, 'steps': 2640, 'loss/train': 3.7892870903015137} -08/30/2021 13:41:26 - INFO - __main__ - Step 2642: {'lr': 0.0004999768582772442, 'samples': 507264, 'steps': 2641, 'loss/train': 2.8323965072631836} -08/30/2021 13:41:27 - INFO - __main__ - Step 2643: {'lr': 0.000499976786016977, 'samples': 507456, 'steps': 2642, 'loss/train': 3.3806533813476562} -08/30/2021 13:41:27 - INFO - __main__ - Step 2644: {'lr': 0.0004999767136440742, 'samples': 507648, 'steps': 2643, 'loss/train': 0.9227195978164673} -08/30/2021 13:41:27 - INFO - __main__ - Step 2645: {'lr': 0.0004999766411585359, 'samples': 507840, 'steps': 2644, 'loss/train': 2.237401008605957} -08/30/2021 13:41:29 - INFO - __main__ - Step 2646: {'lr': 0.0004999765685603618, 'samples': 508032, 'steps': 2645, 'loss/train': 3.269773483276367} -08/30/2021 13:41:29 - INFO - __main__ - Step 2647: {'lr': 0.0004999764958495522, 'samples': 508224, 'steps': 2646, 'loss/train': 2.6229805946350098} -08/30/2021 13:41:30 - INFO - __main__ - Step 2648: {'lr': 0.0004999764230261072, 'samples': 508416, 'steps': 2647, 'loss/train': 2.917896270751953} -08/30/2021 13:41:30 - INFO - __main__ - Step 2649: {'lr': 0.0004999763500900265, 'samples': 508608, 'steps': 2648, 'loss/train': 3.118557929992676} -08/30/2021 13:41:30 - INFO - __main__ - Step 2650: {'lr': 0.0004999762770413103, 'samples': 508800, 'steps': 2649, 'loss/train': 3.798842191696167} -08/30/2021 13:41:32 - INFO - __main__ - Step 2651: {'lr': 0.0004999762038799587, 'samples': 508992, 'steps': 2650, 'loss/train': 3.517812967300415} -08/30/2021 13:41:32 - INFO - __main__ - Step 2652: {'lr': 0.0004999761306059717, 'samples': 509184, 'steps': 2651, 'loss/train': 3.0383710861206055} -08/30/2021 13:41:33 - INFO - __main__ - Step 2653: {'lr': 0.0004999760572193492, 'samples': 509376, 'steps': 2652, 'loss/train': 3.0678305625915527} -08/30/2021 13:41:33 - INFO - __main__ - Step 2654: {'lr': 0.0004999759837200914, 'samples': 509568, 'steps': 2653, 'loss/train': 2.7814712524414062} -08/30/2021 13:41:33 - INFO - __main__ - Step 2655: {'lr': 0.0004999759101081984, 'samples': 509760, 'steps': 2654, 'loss/train': 1.8292951583862305} -08/30/2021 13:41:34 - INFO - __main__ - Step 2656: {'lr': 0.0004999758363836701, 'samples': 509952, 'steps': 2655, 'loss/train': 3.360480546951294} -08/30/2021 13:41:35 - INFO - __main__ - Step 2657: {'lr': 0.0004999757625465063, 'samples': 510144, 'steps': 2656, 'loss/train': 3.593045234680176} -08/30/2021 13:41:36 - INFO - __main__ - Step 2658: {'lr': 0.0004999756885967075, 'samples': 510336, 'steps': 2657, 'loss/train': 3.1107137203216553} -08/30/2021 13:41:36 - INFO - __main__ - Step 2659: {'lr': 0.0004999756145342735, 'samples': 510528, 'steps': 2658, 'loss/train': 3.030609130859375} -08/30/2021 13:41:36 - INFO - __main__ - Step 2660: {'lr': 0.0004999755403592043, 'samples': 510720, 'steps': 2659, 'loss/train': 2.3007168769836426} -08/30/2021 13:41:37 - INFO - __main__ - Step 2661: {'lr': 0.0004999754660714999, 'samples': 510912, 'steps': 2660, 'loss/train': 2.849210262298584} -08/30/2021 13:41:38 - INFO - __main__ - Step 2662: {'lr': 0.0004999753916711606, 'samples': 511104, 'steps': 2661, 'loss/train': 3.5313100814819336} -08/30/2021 13:41:39 - INFO - __main__ - Step 2663: {'lr': 0.0004999753171581862, 'samples': 511296, 'steps': 2662, 'loss/train': 2.643601417541504} -08/30/2021 13:41:39 - INFO - __main__ - Step 2664: {'lr': 0.0004999752425325766, 'samples': 511488, 'steps': 2663, 'loss/train': 2.52886962890625} -08/30/2021 13:41:40 - INFO - __main__ - Step 2665: {'lr': 0.0004999751677943322, 'samples': 511680, 'steps': 2664, 'loss/train': 2.724182605743408} -08/30/2021 13:41:40 - INFO - __main__ - Step 2666: {'lr': 0.0004999750929434527, 'samples': 511872, 'steps': 2665, 'loss/train': 2.8596858978271484} -08/30/2021 13:41:42 - INFO - __main__ - Step 2667: {'lr': 0.0004999750179799383, 'samples': 512064, 'steps': 2666, 'loss/train': 2.4448113441467285} -08/30/2021 13:41:42 - INFO - __main__ - Step 2668: {'lr': 0.0004999749429037892, 'samples': 512256, 'steps': 2667, 'loss/train': 3.639150381088257} -08/30/2021 13:41:43 - INFO - __main__ - Step 2669: {'lr': 0.0004999748677150051, 'samples': 512448, 'steps': 2668, 'loss/train': 3.338671922683716} -08/30/2021 13:41:43 - INFO - __main__ - Step 2670: {'lr': 0.0004999747924135862, 'samples': 512640, 'steps': 2669, 'loss/train': 3.118865728378296} -08/30/2021 13:41:43 - INFO - __main__ - Step 2671: {'lr': 0.0004999747169995325, 'samples': 512832, 'steps': 2670, 'loss/train': 3.4766738414764404} -08/30/2021 13:41:44 - INFO - __main__ - Step 2672: {'lr': 0.0004999746414728441, 'samples': 513024, 'steps': 2671, 'loss/train': 1.7491579055786133} -08/30/2021 13:41:45 - INFO - __main__ - Step 2673: {'lr': 0.0004999745658335209, 'samples': 513216, 'steps': 2672, 'loss/train': 3.3436026573181152} -08/30/2021 13:41:46 - INFO - __main__ - Step 2674: {'lr': 0.000499974490081563, 'samples': 513408, 'steps': 2673, 'loss/train': 2.8469934463500977} -08/30/2021 13:41:46 - INFO - __main__ - Step 2675: {'lr': 0.0004999744142169707, 'samples': 513600, 'steps': 2674, 'loss/train': 2.5629703998565674} -08/30/2021 13:41:46 - INFO - __main__ - Step 2676: {'lr': 0.0004999743382397435, 'samples': 513792, 'steps': 2675, 'loss/train': 2.840324640274048} -08/30/2021 13:41:47 - INFO - __main__ - Step 2677: {'lr': 0.0004999742621498818, 'samples': 513984, 'steps': 2676, 'loss/train': 3.09045147895813} -08/30/2021 13:41:48 - INFO - __main__ - Step 2678: {'lr': 0.0004999741859473857, 'samples': 514176, 'steps': 2677, 'loss/train': 2.6620028018951416} -08/30/2021 13:41:49 - INFO - __main__ - Step 2679: {'lr': 0.0004999741096322549, 'samples': 514368, 'steps': 2678, 'loss/train': 2.8295633792877197} -08/30/2021 13:41:49 - INFO - __main__ - Step 2680: {'lr': 0.0004999740332044898, 'samples': 514560, 'steps': 2679, 'loss/train': 3.2034780979156494} -08/30/2021 13:41:49 - INFO - __main__ - Step 2681: {'lr': 0.0004999739566640901, 'samples': 514752, 'steps': 2680, 'loss/train': 3.100248336791992} -08/30/2021 13:41:50 - INFO - __main__ - Step 2682: {'lr': 0.000499973880011056, 'samples': 514944, 'steps': 2681, 'loss/train': 2.816262722015381} -08/30/2021 13:41:50 - INFO - __main__ - Step 2683: {'lr': 0.0004999738032453876, 'samples': 515136, 'steps': 2682, 'loss/train': 2.5822339057922363} -08/30/2021 13:41:51 - INFO - __main__ - Step 2684: {'lr': 0.0004999737263670848, 'samples': 515328, 'steps': 2683, 'loss/train': 3.399911642074585} -08/30/2021 13:41:52 - INFO - __main__ - Step 2685: {'lr': 0.0004999736493761477, 'samples': 515520, 'steps': 2684, 'loss/train': 3.240802764892578} -08/30/2021 13:41:52 - INFO - __main__ - Step 2686: {'lr': 0.0004999735722725765, 'samples': 515712, 'steps': 2685, 'loss/train': 1.476607322692871} -08/30/2021 13:41:53 - INFO - __main__ - Step 2687: {'lr': 0.0004999734950563709, 'samples': 515904, 'steps': 2686, 'loss/train': 3.037910223007202} -08/30/2021 13:41:53 - INFO - __main__ - Step 2688: {'lr': 0.0004999734177275311, 'samples': 516096, 'steps': 2687, 'loss/train': 1.8880975246429443} -08/30/2021 13:41:54 - INFO - __main__ - Step 2689: {'lr': 0.0004999733402860572, 'samples': 516288, 'steps': 2688, 'loss/train': 3.124321699142456} -08/30/2021 13:41:55 - INFO - __main__ - Step 2690: {'lr': 0.0004999732627319491, 'samples': 516480, 'steps': 2689, 'loss/train': 3.036329984664917} -08/30/2021 13:41:55 - INFO - __main__ - Step 2691: {'lr': 0.000499973185065207, 'samples': 516672, 'steps': 2690, 'loss/train': 3.331474781036377} -08/30/2021 13:41:56 - INFO - __main__ - Step 2692: {'lr': 0.0004999731072858307, 'samples': 516864, 'steps': 2691, 'loss/train': 2.3075766563415527} -08/30/2021 13:41:56 - INFO - __main__ - Step 2693: {'lr': 0.0004999730293938205, 'samples': 517056, 'steps': 2692, 'loss/train': 3.0612525939941406} -08/30/2021 13:41:58 - INFO - __main__ - Step 2694: {'lr': 0.0004999729513891762, 'samples': 517248, 'steps': 2693, 'loss/train': 3.400170087814331} -08/30/2021 13:41:59 - INFO - __main__ - Step 2695: {'lr': 0.000499972873271898, 'samples': 517440, 'steps': 2694, 'loss/train': 3.0846455097198486} -08/30/2021 13:41:59 - INFO - __main__ - Step 2696: {'lr': 0.0004999727950419859, 'samples': 517632, 'steps': 2695, 'loss/train': 0.9213229417800903} -08/30/2021 13:41:59 - INFO - __main__ - Step 2697: {'lr': 0.0004999727166994399, 'samples': 517824, 'steps': 2696, 'loss/train': 3.088224172592163} -08/30/2021 13:42:00 - INFO - __main__ - Step 2698: {'lr': 0.0004999726382442601, 'samples': 518016, 'steps': 2697, 'loss/train': 3.2991228103637695} -08/30/2021 13:42:01 - INFO - __main__ - Step 2699: {'lr': 0.0004999725596764465, 'samples': 518208, 'steps': 2698, 'loss/train': 2.712589979171753} -08/30/2021 13:42:02 - INFO - __main__ - Step 2700: {'lr': 0.000499972480995999, 'samples': 518400, 'steps': 2699, 'loss/train': 2.3636298179626465} -08/30/2021 13:42:02 - INFO - __main__ - Step 2701: {'lr': 0.0004999724022029179, 'samples': 518592, 'steps': 2700, 'loss/train': 2.9854085445404053} -08/30/2021 13:42:02 - INFO - __main__ - Step 2702: {'lr': 0.000499972323297203, 'samples': 518784, 'steps': 2701, 'loss/train': 2.5155811309814453} -08/30/2021 13:42:03 - INFO - __main__ - Step 2703: {'lr': 0.0004999722442788544, 'samples': 518976, 'steps': 2702, 'loss/train': 2.944446563720703} -08/30/2021 13:42:04 - INFO - __main__ - Step 2704: {'lr': 0.0004999721651478723, 'samples': 519168, 'steps': 2703, 'loss/train': 2.7215254306793213} -08/30/2021 13:42:05 - INFO - __main__ - Step 2705: {'lr': 0.0004999720859042565, 'samples': 519360, 'steps': 2704, 'loss/train': 3.0727028846740723} -08/30/2021 13:42:05 - INFO - __main__ - Step 2706: {'lr': 0.0004999720065480071, 'samples': 519552, 'steps': 2705, 'loss/train': 2.5038321018218994} -08/30/2021 13:42:06 - INFO - __main__ - Step 2707: {'lr': 0.0004999719270791242, 'samples': 519744, 'steps': 2706, 'loss/train': 2.4575345516204834} -08/30/2021 13:42:06 - INFO - __main__ - Step 2708: {'lr': 0.0004999718474976078, 'samples': 519936, 'steps': 2707, 'loss/train': 2.6038658618927} -08/30/2021 13:42:08 - INFO - __main__ - Step 2709: {'lr': 0.000499971767803458, 'samples': 520128, 'steps': 2708, 'loss/train': 2.9975969791412354} -08/30/2021 13:42:08 - INFO - __main__ - Step 2710: {'lr': 0.0004999716879966747, 'samples': 520320, 'steps': 2709, 'loss/train': 2.7358040809631348} -08/30/2021 13:42:08 - INFO - __main__ - Step 2711: {'lr': 0.000499971608077258, 'samples': 520512, 'steps': 2710, 'loss/train': 1.7337361574172974} -08/30/2021 13:42:09 - INFO - __main__ - Step 2712: {'lr': 0.000499971528045208, 'samples': 520704, 'steps': 2711, 'loss/train': 2.743546962738037} -08/30/2021 13:42:09 - INFO - __main__ - Step 2713: {'lr': 0.0004999714479005248, 'samples': 520896, 'steps': 2712, 'loss/train': 2.940654754638672} -08/30/2021 13:42:11 - INFO - __main__ - Step 2714: {'lr': 0.0004999713676432082, 'samples': 521088, 'steps': 2713, 'loss/train': 2.064807176589966} -08/30/2021 13:42:11 - INFO - __main__ - Step 2715: {'lr': 0.0004999712872732584, 'samples': 521280, 'steps': 2714, 'loss/train': 3.6759839057922363} -08/30/2021 13:42:12 - INFO - __main__ - Step 2716: {'lr': 0.0004999712067906754, 'samples': 521472, 'steps': 2715, 'loss/train': 2.991039514541626} -08/30/2021 13:42:12 - INFO - __main__ - Step 2717: {'lr': 0.0004999711261954591, 'samples': 521664, 'steps': 2716, 'loss/train': 2.042520046234131} -08/30/2021 13:42:12 - INFO - __main__ - Step 2718: {'lr': 0.0004999710454876099, 'samples': 521856, 'steps': 2717, 'loss/train': 2.5179977416992188} -08/30/2021 13:42:13 - INFO - __main__ - Step 2719: {'lr': 0.0004999709646671274, 'samples': 522048, 'steps': 2718, 'loss/train': 3.064622640609741} -08/30/2021 13:42:14 - INFO - __main__ - Step 2720: {'lr': 0.0004999708837340119, 'samples': 522240, 'steps': 2719, 'loss/train': 2.5993306636810303} -08/30/2021 13:42:15 - INFO - __main__ - Step 2721: {'lr': 0.0004999708026882635, 'samples': 522432, 'steps': 2720, 'loss/train': 2.747556209564209} -08/30/2021 13:42:15 - INFO - __main__ - Step 2722: {'lr': 0.000499970721529882, 'samples': 522624, 'steps': 2721, 'loss/train': 2.8838469982147217} -08/30/2021 13:42:15 - INFO - __main__ - Step 2723: {'lr': 0.0004999706402588675, 'samples': 522816, 'steps': 2722, 'loss/train': 3.420832633972168} -08/30/2021 13:42:16 - INFO - __main__ - Step 2724: {'lr': 0.0004999705588752202, 'samples': 523008, 'steps': 2723, 'loss/train': 1.2347540855407715} -08/30/2021 13:42:17 - INFO - __main__ - Step 2725: {'lr': 0.00049997047737894, 'samples': 523200, 'steps': 2724, 'loss/train': 3.2386176586151123} -08/30/2021 13:42:18 - INFO - __main__ - Step 2726: {'lr': 0.0004999703957700269, 'samples': 523392, 'steps': 2725, 'loss/train': 2.972571849822998} -08/30/2021 13:42:18 - INFO - __main__ - Step 2727: {'lr': 0.000499970314048481, 'samples': 523584, 'steps': 2726, 'loss/train': 2.3461365699768066} -08/30/2021 13:42:18 - INFO - __main__ - Step 2728: {'lr': 0.0004999702322143023, 'samples': 523776, 'steps': 2727, 'loss/train': 2.939415216445923} -08/30/2021 13:42:19 - INFO - __main__ - Step 2729: {'lr': 0.000499970150267491, 'samples': 523968, 'steps': 2728, 'loss/train': 2.949035406112671} -08/30/2021 13:42:21 - INFO - __main__ - Step 2730: {'lr': 0.0004999700682080469, 'samples': 524160, 'steps': 2729, 'loss/train': 2.9603052139282227} -08/30/2021 13:42:21 - INFO - __main__ - Step 2731: {'lr': 0.0004999699860359702, 'samples': 524352, 'steps': 2730, 'loss/train': 2.4228169918060303} -08/30/2021 13:42:21 - INFO - __main__ - Step 2732: {'lr': 0.0004999699037512608, 'samples': 524544, 'steps': 2731, 'loss/train': 3.20652174949646} -08/30/2021 13:42:22 - INFO - __main__ - Step 2733: {'lr': 0.000499969821353919, 'samples': 524736, 'steps': 2732, 'loss/train': 2.2140450477600098} -08/30/2021 13:42:22 - INFO - __main__ - Step 2734: {'lr': 0.0004999697388439444, 'samples': 524928, 'steps': 2733, 'loss/train': 3.1131787300109863} -08/30/2021 13:42:22 - INFO - __main__ - Step 2735: {'lr': 0.0004999696562213375, 'samples': 525120, 'steps': 2734, 'loss/train': 2.2171590328216553} -08/30/2021 13:42:24 - INFO - __main__ - Step 2736: {'lr': 0.0004999695734860981, 'samples': 525312, 'steps': 2735, 'loss/train': 3.1607298851013184} -08/30/2021 13:42:25 - INFO - __main__ - Step 2737: {'lr': 0.0004999694906382262, 'samples': 525504, 'steps': 2736, 'loss/train': 2.0003676414489746} -08/30/2021 13:42:25 - INFO - __main__ - Step 2738: {'lr': 0.0004999694076777219, 'samples': 525696, 'steps': 2737, 'loss/train': 2.778306722640991} -08/30/2021 13:42:25 - INFO - __main__ - Step 2739: {'lr': 0.0004999693246045854, 'samples': 525888, 'steps': 2738, 'loss/train': 2.8651514053344727} -08/30/2021 13:42:26 - INFO - __main__ - Step 2740: {'lr': 0.0004999692414188164, 'samples': 526080, 'steps': 2739, 'loss/train': 2.8148608207702637} -08/30/2021 13:42:27 - INFO - __main__ - Step 2741: {'lr': 0.0004999691581204152, 'samples': 526272, 'steps': 2740, 'loss/train': 2.772371292114258} -08/30/2021 13:42:28 - INFO - __main__ - Step 2742: {'lr': 0.0004999690747093816, 'samples': 526464, 'steps': 2741, 'loss/train': 2.3568027019500732} -08/30/2021 13:42:28 - INFO - __main__ - Step 2743: {'lr': 0.000499968991185716, 'samples': 526656, 'steps': 2742, 'loss/train': 2.353330373764038} -08/30/2021 13:42:28 - INFO - __main__ - Step 2744: {'lr': 0.0004999689075494182, 'samples': 526848, 'steps': 2743, 'loss/train': 3.9103636741638184} -08/30/2021 13:42:29 - INFO - __main__ - Step 2745: {'lr': 0.0004999688238004882, 'samples': 527040, 'steps': 2744, 'loss/train': 2.5432333946228027} -08/30/2021 13:42:30 - INFO - __main__ - Step 2746: {'lr': 0.0004999687399389262, 'samples': 527232, 'steps': 2745, 'loss/train': 3.0544979572296143} -08/30/2021 13:42:31 - INFO - __main__ - Step 2747: {'lr': 0.0004999686559647319, 'samples': 527424, 'steps': 2746, 'loss/train': 1.6781655550003052} -08/30/2021 13:42:31 - INFO - __main__ - Step 2748: {'lr': 0.0004999685718779058, 'samples': 527616, 'steps': 2747, 'loss/train': 2.2461705207824707} -08/30/2021 13:42:31 - INFO - __main__ - Step 2749: {'lr': 0.0004999684876784477, 'samples': 527808, 'steps': 2748, 'loss/train': 2.9054646492004395} -08/30/2021 13:42:32 - INFO - __main__ - Step 2750: {'lr': 0.0004999684033663576, 'samples': 528000, 'steps': 2749, 'loss/train': 2.8186492919921875} -08/30/2021 13:42:32 - INFO - __main__ - Step 2751: {'lr': 0.0004999683189416356, 'samples': 528192, 'steps': 2750, 'loss/train': 3.3227179050445557} -08/30/2021 13:42:35 - INFO - __main__ - Step 2752: {'lr': 0.0004999682344042817, 'samples': 528384, 'steps': 2751, 'loss/train': 1.0305490493774414} -08/30/2021 13:42:35 - INFO - __main__ - Step 2753: {'lr': 0.000499968149754296, 'samples': 528576, 'steps': 2752, 'loss/train': 2.0445303916931152} -08/30/2021 13:42:35 - INFO - __main__ - Step 2754: {'lr': 0.0004999680649916786, 'samples': 528768, 'steps': 2753, 'loss/train': 2.7636899948120117} -08/30/2021 13:42:36 - INFO - __main__ - Step 2755: {'lr': 0.0004999679801164295, 'samples': 528960, 'steps': 2754, 'loss/train': 0.5936917066574097} -08/30/2021 13:42:36 - INFO - __main__ - Step 2756: {'lr': 0.0004999678951285485, 'samples': 529152, 'steps': 2755, 'loss/train': 2.809025764465332} -08/30/2021 13:42:37 - INFO - __main__ - Step 2757: {'lr': 0.0004999678100280358, 'samples': 529344, 'steps': 2756, 'loss/train': 2.439009189605713} -08/30/2021 13:42:38 - INFO - __main__ - Step 2758: {'lr': 0.0004999677248148916, 'samples': 529536, 'steps': 2757, 'loss/train': 2.985081672668457} -08/30/2021 13:42:38 - INFO - __main__ - Step 2759: {'lr': 0.0004999676394891158, 'samples': 529728, 'steps': 2758, 'loss/train': 2.110480546951294} -08/30/2021 13:42:39 - INFO - __main__ - Step 2760: {'lr': 0.0004999675540507083, 'samples': 529920, 'steps': 2759, 'loss/train': 3.4083094596862793} -08/30/2021 13:42:39 - INFO - __main__ - Step 2761: {'lr': 0.0004999674684996694, 'samples': 530112, 'steps': 2760, 'loss/train': 3.2949750423431396} -08/30/2021 13:42:41 - INFO - __main__ - Step 2762: {'lr': 0.0004999673828359989, 'samples': 530304, 'steps': 2761, 'loss/train': 2.825989246368408} -08/30/2021 13:42:41 - INFO - __main__ - Step 2763: {'lr': 0.0004999672970596971, 'samples': 530496, 'steps': 2762, 'loss/train': 2.7158119678497314} -08/30/2021 13:42:41 - INFO - __main__ - Step 2764: {'lr': 0.0004999672111707639, 'samples': 530688, 'steps': 2763, 'loss/train': 2.3397819995880127} -08/30/2021 13:42:42 - INFO - __main__ - Step 2765: {'lr': 0.0004999671251691991, 'samples': 530880, 'steps': 2764, 'loss/train': 3.135607957839966} -08/30/2021 13:42:42 - INFO - __main__ - Step 2766: {'lr': 0.0004999670390550032, 'samples': 531072, 'steps': 2765, 'loss/train': 3.184204339981079} -08/30/2021 13:42:44 - INFO - __main__ - Step 2767: {'lr': 0.000499966952828176, 'samples': 531264, 'steps': 2766, 'loss/train': 1.9256181716918945} -08/30/2021 13:42:44 - INFO - __main__ - Step 2768: {'lr': 0.0004999668664887175, 'samples': 531456, 'steps': 2767, 'loss/train': 2.995103597640991} -08/30/2021 13:42:44 - INFO - __main__ - Step 2769: {'lr': 0.0004999667800366278, 'samples': 531648, 'steps': 2768, 'loss/train': 3.041548252105713} -08/30/2021 13:42:45 - INFO - __main__ - Step 2770: {'lr': 0.0004999666934719069, 'samples': 531840, 'steps': 2769, 'loss/train': 0.5235479474067688} -08/30/2021 13:42:45 - INFO - __main__ - Step 2771: {'lr': 0.0004999666067945548, 'samples': 532032, 'steps': 2770, 'loss/train': 2.7310903072357178} -08/30/2021 13:42:47 - INFO - __main__ - Step 2772: {'lr': 0.0004999665200045716, 'samples': 532224, 'steps': 2771, 'loss/train': 3.507369041442871} -08/30/2021 13:42:47 - INFO - __main__ - Step 2773: {'lr': 0.0004999664331019574, 'samples': 532416, 'steps': 2772, 'loss/train': 3.7877254486083984} -08/30/2021 13:42:47 - INFO - __main__ - Step 2774: {'lr': 0.0004999663460867123, 'samples': 532608, 'steps': 2773, 'loss/train': 3.072702169418335} -08/30/2021 13:42:48 - INFO - __main__ - Step 2775: {'lr': 0.000499966258958836, 'samples': 532800, 'steps': 2774, 'loss/train': 2.467533826828003} -08/30/2021 13:42:48 - INFO - __main__ - Step 2776: {'lr': 0.000499966171718329, 'samples': 532992, 'steps': 2775, 'loss/train': 2.8478052616119385} -08/30/2021 13:42:50 - INFO - __main__ - Step 2777: {'lr': 0.000499966084365191, 'samples': 533184, 'steps': 2776, 'loss/train': 2.8935816287994385} -08/30/2021 13:42:50 - INFO - __main__ - Step 2778: {'lr': 0.0004999659968994221, 'samples': 533376, 'steps': 2777, 'loss/train': 2.1907730102539062} -08/30/2021 13:42:51 - INFO - __main__ - Step 2779: {'lr': 0.0004999659093210223, 'samples': 533568, 'steps': 2778, 'loss/train': 2.685602903366089} -08/30/2021 13:42:51 - INFO - __main__ - Step 2780: {'lr': 0.0004999658216299919, 'samples': 533760, 'steps': 2779, 'loss/train': 2.8193023204803467} -08/30/2021 13:42:51 - INFO - __main__ - Step 2781: {'lr': 0.0004999657338263308, 'samples': 533952, 'steps': 2780, 'loss/train': 3.0136878490448} -08/30/2021 13:42:52 - INFO - __main__ - Step 2782: {'lr': 0.0004999656459100388, 'samples': 534144, 'steps': 2781, 'loss/train': 2.5547780990600586} -08/30/2021 13:42:53 - INFO - __main__ - Step 2783: {'lr': 0.0004999655578811161, 'samples': 534336, 'steps': 2782, 'loss/train': 2.158917188644409} -08/30/2021 13:42:54 - INFO - __main__ - Step 2784: {'lr': 0.0004999654697395629, 'samples': 534528, 'steps': 2783, 'loss/train': 3.0252928733825684} -08/30/2021 13:42:54 - INFO - __main__ - Step 2785: {'lr': 0.0004999653814853791, 'samples': 534720, 'steps': 2784, 'loss/train': 3.049435615539551} -08/30/2021 13:42:54 - INFO - __main__ - Step 2786: {'lr': 0.0004999652931185648, 'samples': 534912, 'steps': 2785, 'loss/train': 2.6159462928771973} -08/30/2021 13:42:55 - INFO - __main__ - Step 2787: {'lr': 0.00049996520463912, 'samples': 535104, 'steps': 2786, 'loss/train': 2.8965871334075928} -08/30/2021 13:42:56 - INFO - __main__ - Step 2788: {'lr': 0.0004999651160470447, 'samples': 535296, 'steps': 2787, 'loss/train': 2.8150036334991455} -08/30/2021 13:42:57 - INFO - __main__ - Step 2789: {'lr': 0.0004999650273423389, 'samples': 535488, 'steps': 2788, 'loss/train': 2.938845157623291} -08/30/2021 13:42:57 - INFO - __main__ - Step 2790: {'lr': 0.0004999649385250028, 'samples': 535680, 'steps': 2789, 'loss/train': 2.8934452533721924} -08/30/2021 13:42:57 - INFO - __main__ - Step 2791: {'lr': 0.0004999648495950363, 'samples': 535872, 'steps': 2790, 'loss/train': 2.1574251651763916} -08/30/2021 13:42:58 - INFO - __main__ - Step 2792: {'lr': 0.0004999647605524396, 'samples': 536064, 'steps': 2791, 'loss/train': 3.3665034770965576} -08/30/2021 13:42:59 - INFO - __main__ - Step 2793: {'lr': 0.0004999646713972126, 'samples': 536256, 'steps': 2792, 'loss/train': 2.7290778160095215} -08/30/2021 13:43:00 - INFO - __main__ - Step 2794: {'lr': 0.0004999645821293552, 'samples': 536448, 'steps': 2793, 'loss/train': 2.9117014408111572} -08/30/2021 13:43:00 - INFO - __main__ - Step 2795: {'lr': 0.0004999644927488678, 'samples': 536640, 'steps': 2794, 'loss/train': 2.8242461681365967} -08/30/2021 13:43:00 - INFO - __main__ - Step 2796: {'lr': 0.0004999644032557503, 'samples': 536832, 'steps': 2795, 'loss/train': 3.074611186981201} -08/30/2021 13:43:01 - INFO - __main__ - Step 2797: {'lr': 0.0004999643136500027, 'samples': 537024, 'steps': 2796, 'loss/train': 2.4186532497406006} -08/30/2021 13:43:02 - INFO - __main__ - Step 2798: {'lr': 0.0004999642239316249, 'samples': 537216, 'steps': 2797, 'loss/train': 3.6229336261749268} -08/30/2021 13:43:02 - INFO - __main__ - Step 2799: {'lr': 0.000499964134100617, 'samples': 537408, 'steps': 2798, 'loss/train': 3.04872465133667} -08/30/2021 13:43:03 - INFO - __main__ - Step 2800: {'lr': 0.0004999640441569793, 'samples': 537600, 'steps': 2799, 'loss/train': 2.990837574005127} -08/30/2021 13:43:03 - INFO - __main__ - Step 2801: {'lr': 0.0004999639541007116, 'samples': 537792, 'steps': 2800, 'loss/train': 2.8396661281585693} -08/30/2021 13:43:03 - INFO - __main__ - Step 2802: {'lr': 0.0004999638639318141, 'samples': 537984, 'steps': 2801, 'loss/train': 2.4867308139801025} -08/30/2021 13:43:05 - INFO - __main__ - Step 2803: {'lr': 0.0004999637736502866, 'samples': 538176, 'steps': 2802, 'loss/train': 3.2507901191711426} -08/30/2021 13:43:06 - INFO - __main__ - Step 2804: {'lr': 0.0004999636832561293, 'samples': 538368, 'steps': 2803, 'loss/train': 2.402642011642456} -08/30/2021 13:43:06 - INFO - __main__ - Step 2805: {'lr': 0.0004999635927493423, 'samples': 538560, 'steps': 2804, 'loss/train': 3.6187822818756104} -08/30/2021 13:43:07 - INFO - __main__ - Step 2806: {'lr': 0.0004999635021299255, 'samples': 538752, 'steps': 2805, 'loss/train': 2.5364692211151123} -08/30/2021 13:43:07 - INFO - __main__ - Step 2807: {'lr': 0.0004999634113978791, 'samples': 538944, 'steps': 2806, 'loss/train': 2.9410221576690674} -08/30/2021 13:43:09 - INFO - __main__ - Step 2808: {'lr': 0.0004999633205532029, 'samples': 539136, 'steps': 2807, 'loss/train': 3.006633996963501} -08/30/2021 13:43:09 - INFO - __main__ - Step 2809: {'lr': 0.0004999632295958972, 'samples': 539328, 'steps': 2808, 'loss/train': 2.751953363418579} -08/30/2021 13:43:09 - INFO - __main__ - Step 2810: {'lr': 0.0004999631385259617, 'samples': 539520, 'steps': 2809, 'loss/train': 1.81827712059021} -08/30/2021 13:43:10 - INFO - __main__ - Step 2811: {'lr': 0.000499963047343397, 'samples': 539712, 'steps': 2810, 'loss/train': 2.962376356124878} -08/30/2021 13:43:10 - INFO - __main__ - Step 2812: {'lr': 0.0004999629560482026, 'samples': 539904, 'steps': 2811, 'loss/train': 3.367459297180176} -08/30/2021 13:43:12 - INFO - __main__ - Step 2813: {'lr': 0.0004999628646403788, 'samples': 540096, 'steps': 2812, 'loss/train': 3.043518543243408} -08/30/2021 13:43:12 - INFO - __main__ - Step 2814: {'lr': 0.0004999627731199256, 'samples': 540288, 'steps': 2813, 'loss/train': 2.4826416969299316} -08/30/2021 13:43:12 - INFO - __main__ - Step 2815: {'lr': 0.0004999626814868429, 'samples': 540480, 'steps': 2814, 'loss/train': 2.8994929790496826} -08/30/2021 13:43:13 - INFO - __main__ - Step 2816: {'lr': 0.0004999625897411311, 'samples': 540672, 'steps': 2815, 'loss/train': 2.9685115814208984} -08/30/2021 13:43:13 - INFO - __main__ - Step 2817: {'lr': 0.0004999624978827899, 'samples': 540864, 'steps': 2816, 'loss/train': 3.080095052719116} -08/30/2021 13:43:13 - INFO - __main__ - Step 2818: {'lr': 0.0004999624059118194, 'samples': 541056, 'steps': 2817, 'loss/train': 2.7055742740631104} -08/30/2021 13:43:15 - INFO - __main__ - Step 2819: {'lr': 0.0004999623138282198, 'samples': 541248, 'steps': 2818, 'loss/train': 2.3578941822052} -08/30/2021 13:43:15 - INFO - __main__ - Step 2820: {'lr': 0.000499962221631991, 'samples': 541440, 'steps': 2819, 'loss/train': 2.7520699501037598} -08/30/2021 13:43:16 - INFO - __main__ - Step 2821: {'lr': 0.0004999621293231331, 'samples': 541632, 'steps': 2820, 'loss/train': 3.0708067417144775} -08/30/2021 13:43:16 - INFO - __main__ - Step 2822: {'lr': 0.0004999620369016461, 'samples': 541824, 'steps': 2821, 'loss/train': 2.742736339569092} -08/30/2021 13:43:16 - INFO - __main__ - Step 2823: {'lr': 0.00049996194436753, 'samples': 542016, 'steps': 2822, 'loss/train': 3.262277126312256} -08/30/2021 13:43:18 - INFO - __main__ - Step 2824: {'lr': 0.000499961851720785, 'samples': 542208, 'steps': 2823, 'loss/train': 2.1122236251831055} -08/30/2021 13:43:18 - INFO - __main__ - Step 2825: {'lr': 0.000499961758961411, 'samples': 542400, 'steps': 2824, 'loss/train': 3.081420660018921} -08/30/2021 13:43:19 - INFO - __main__ - Step 2826: {'lr': 0.0004999616660894081, 'samples': 542592, 'steps': 2825, 'loss/train': 2.7934391498565674} -08/30/2021 13:43:19 - INFO - __main__ - Step 2827: {'lr': 0.0004999615731047762, 'samples': 542784, 'steps': 2826, 'loss/train': 2.1765007972717285} -08/30/2021 13:43:19 - INFO - __main__ - Step 2828: {'lr': 0.0004999614800075158, 'samples': 542976, 'steps': 2827, 'loss/train': 2.8672866821289062} -08/30/2021 13:43:21 - INFO - __main__ - Step 2829: {'lr': 0.0004999613867976264, 'samples': 543168, 'steps': 2828, 'loss/train': 2.6867456436157227} -08/30/2021 13:43:21 - INFO - __main__ - Step 2830: {'lr': 0.0004999612934751082, 'samples': 543360, 'steps': 2829, 'loss/train': 1.432883381843567} -08/30/2021 13:43:22 - INFO - __main__ - Step 2831: {'lr': 0.0004999612000399614, 'samples': 543552, 'steps': 2830, 'loss/train': 2.7495994567871094} -08/30/2021 13:43:22 - INFO - __main__ - Step 2832: {'lr': 0.0004999611064921859, 'samples': 543744, 'steps': 2831, 'loss/train': 2.7531652450561523} -08/30/2021 13:43:22 - INFO - __main__ - Step 2833: {'lr': 0.0004999610128317818, 'samples': 543936, 'steps': 2832, 'loss/train': 2.5705811977386475} -08/30/2021 13:43:24 - INFO - __main__ - Step 2834: {'lr': 0.0004999609190587492, 'samples': 544128, 'steps': 2833, 'loss/train': 2.111081123352051} -08/30/2021 13:43:24 - INFO - __main__ - Step 2835: {'lr': 0.000499960825173088, 'samples': 544320, 'steps': 2834, 'loss/train': 2.756847620010376} -08/30/2021 13:43:25 - INFO - __main__ - Step 2836: {'lr': 0.0004999607311747983, 'samples': 544512, 'steps': 2835, 'loss/train': 2.611893653869629} -08/30/2021 13:43:25 - INFO - __main__ - Step 2837: {'lr': 0.0004999606370638801, 'samples': 544704, 'steps': 2836, 'loss/train': 1.6375468969345093} -08/30/2021 13:43:25 - INFO - __main__ - Step 2838: {'lr': 0.0004999605428403336, 'samples': 544896, 'steps': 2837, 'loss/train': 2.838456153869629} -08/30/2021 13:43:27 - INFO - __main__ - Step 2839: {'lr': 0.0004999604485041585, 'samples': 545088, 'steps': 2838, 'loss/train': 3.248014211654663} -08/30/2021 13:43:27 - INFO - __main__ - Step 2840: {'lr': 0.0004999603540553554, 'samples': 545280, 'steps': 2839, 'loss/train': 3.247673511505127} -08/30/2021 13:43:28 - INFO - __main__ - Step 2841: {'lr': 0.0004999602594939238, 'samples': 545472, 'steps': 2840, 'loss/train': 2.9345333576202393} -08/30/2021 13:43:28 - INFO - __main__ - Step 2842: {'lr': 0.0004999601648198641, 'samples': 545664, 'steps': 2841, 'loss/train': 2.6978485584259033} -08/30/2021 13:43:28 - INFO - __main__ - Step 2843: {'lr': 0.0004999600700331761, 'samples': 545856, 'steps': 2842, 'loss/train': 0.5655578374862671} -08/30/2021 13:43:30 - INFO - __main__ - Step 2844: {'lr': 0.0004999599751338601, 'samples': 546048, 'steps': 2843, 'loss/train': 2.8231377601623535} -08/30/2021 13:43:30 - INFO - __main__ - Step 2845: {'lr': 0.0004999598801219158, 'samples': 546240, 'steps': 2844, 'loss/train': 2.881303548812866} -08/30/2021 13:43:31 - INFO - __main__ - Step 2846: {'lr': 0.0004999597849973435, 'samples': 546432, 'steps': 2845, 'loss/train': 3.178879499435425} -08/30/2021 13:43:31 - INFO - __main__ - Step 2847: {'lr': 0.0004999596897601432, 'samples': 546624, 'steps': 2846, 'loss/train': 1.8442654609680176} -08/30/2021 13:43:31 - INFO - __main__ - Step 2848: {'lr': 0.0004999595944103149, 'samples': 546816, 'steps': 2847, 'loss/train': 2.8082611560821533} -08/30/2021 13:43:33 - INFO - __main__ - Step 2849: {'lr': 0.0004999594989478587, 'samples': 547008, 'steps': 2848, 'loss/train': 2.5219624042510986} -08/30/2021 13:43:33 - INFO - __main__ - Step 2850: {'lr': 0.0004999594033727747, 'samples': 547200, 'steps': 2849, 'loss/train': 2.0088613033294678} -08/30/2021 13:43:34 - INFO - __main__ - Step 2851: {'lr': 0.0004999593076850627, 'samples': 547392, 'steps': 2850, 'loss/train': 2.6474480628967285} -08/30/2021 13:43:34 - INFO - __main__ - Step 2852: {'lr': 0.0004999592118847229, 'samples': 547584, 'steps': 2851, 'loss/train': 2.7833218574523926} -08/30/2021 13:43:34 - INFO - __main__ - Step 2853: {'lr': 0.0004999591159717554, 'samples': 547776, 'steps': 2852, 'loss/train': 2.896838426589966} -08/30/2021 13:43:35 - INFO - __main__ - Step 2854: {'lr': 0.0004999590199461602, 'samples': 547968, 'steps': 2853, 'loss/train': 1.6673650741577148} -08/30/2021 13:43:36 - INFO - __main__ - Step 2855: {'lr': 0.0004999589238079373, 'samples': 548160, 'steps': 2854, 'loss/train': 2.6013550758361816} -08/30/2021 13:43:37 - INFO - __main__ - Step 2856: {'lr': 0.0004999588275570868, 'samples': 548352, 'steps': 2855, 'loss/train': 3.1163270473480225} -08/30/2021 13:43:37 - INFO - __main__ - Step 2857: {'lr': 0.0004999587311936086, 'samples': 548544, 'steps': 2856, 'loss/train': 2.775830030441284} -08/30/2021 13:43:38 - INFO - __main__ - Step 2858: {'lr': 0.000499958634717503, 'samples': 548736, 'steps': 2857, 'loss/train': 2.844712018966675} -08/30/2021 13:43:38 - INFO - __main__ - Step 2859: {'lr': 0.0004999585381287696, 'samples': 548928, 'steps': 2858, 'loss/train': 2.9458110332489014} -08/30/2021 13:43:40 - INFO - __main__ - Step 2860: {'lr': 0.000499958441427409, 'samples': 549120, 'steps': 2859, 'loss/train': 4.294079303741455} -08/30/2021 13:43:40 - INFO - __main__ - Step 2861: {'lr': 0.0004999583446134209, 'samples': 549312, 'steps': 2860, 'loss/train': 2.7137980461120605} -08/30/2021 13:43:41 - INFO - __main__ - Step 2862: {'lr': 0.0004999582476868055, 'samples': 549504, 'steps': 2861, 'loss/train': 2.79823637008667} -08/30/2021 13:43:41 - INFO - __main__ - Step 2863: {'lr': 0.0004999581506475627, 'samples': 549696, 'steps': 2862, 'loss/train': 1.2336348295211792} -08/30/2021 13:43:41 - INFO - __main__ - Step 2864: {'lr': 0.0004999580534956927, 'samples': 549888, 'steps': 2863, 'loss/train': 3.2243707180023193} -08/30/2021 13:43:43 - INFO - __main__ - Step 2865: {'lr': 0.0004999579562311953, 'samples': 550080, 'steps': 2864, 'loss/train': 3.012106418609619} -08/30/2021 13:43:43 - INFO - __main__ - Step 2866: {'lr': 0.0004999578588540709, 'samples': 550272, 'steps': 2865, 'loss/train': 3.1267731189727783} -08/30/2021 13:43:44 - INFO - __main__ - Step 2867: {'lr': 0.0004999577613643192, 'samples': 550464, 'steps': 2866, 'loss/train': 2.831829786300659} -08/30/2021 13:43:44 - INFO - __main__ - Step 2868: {'lr': 0.0004999576637619404, 'samples': 550656, 'steps': 2867, 'loss/train': 3.1577987670898438} -08/30/2021 13:43:44 - INFO - __main__ - Step 2869: {'lr': 0.0004999575660469347, 'samples': 550848, 'steps': 2868, 'loss/train': 2.829087018966675} -08/30/2021 13:43:45 - INFO - __main__ - Step 2870: {'lr': 0.0004999574682193017, 'samples': 551040, 'steps': 2869, 'loss/train': 3.1651971340179443} -08/30/2021 13:43:46 - INFO - __main__ - Step 2871: {'lr': 0.0004999573702790419, 'samples': 551232, 'steps': 2870, 'loss/train': 2.851490020751953} -08/30/2021 13:43:47 - INFO - __main__ - Step 2872: {'lr': 0.0004999572722261551, 'samples': 551424, 'steps': 2871, 'loss/train': 2.3922886848449707} -08/30/2021 13:43:47 - INFO - __main__ - Step 2873: {'lr': 0.0004999571740606415, 'samples': 551616, 'steps': 2872, 'loss/train': 3.3531363010406494} -08/30/2021 13:43:47 - INFO - __main__ - Step 2874: {'lr': 0.000499957075782501, 'samples': 551808, 'steps': 2873, 'loss/train': 2.9856975078582764} -08/30/2021 13:43:48 - INFO - __main__ - Step 2875: {'lr': 0.0004999569773917337, 'samples': 552000, 'steps': 2874, 'loss/train': 2.7506093978881836} -08/30/2021 13:43:49 - INFO - __main__ - Step 2876: {'lr': 0.0004999568788883397, 'samples': 552192, 'steps': 2875, 'loss/train': 2.358212947845459} -08/30/2021 13:43:50 - INFO - __main__ - Step 2877: {'lr': 0.0004999567802723188, 'samples': 552384, 'steps': 2876, 'loss/train': 1.463113784790039} -08/30/2021 13:43:50 - INFO - __main__ - Step 2878: {'lr': 0.0004999566815436715, 'samples': 552576, 'steps': 2877, 'loss/train': 2.735790729522705} -08/30/2021 13:43:50 - INFO - __main__ - Step 2879: {'lr': 0.0004999565827023974, 'samples': 552768, 'steps': 2878, 'loss/train': 2.3349661827087402} -08/30/2021 13:43:51 - INFO - __main__ - Step 2880: {'lr': 0.0004999564837484967, 'samples': 552960, 'steps': 2879, 'loss/train': 2.679495334625244} -08/30/2021 13:43:52 - INFO - __main__ - Step 2881: {'lr': 0.0004999563846819696, 'samples': 553152, 'steps': 2880, 'loss/train': 1.8391742706298828} -08/30/2021 13:43:53 - INFO - __main__ - Step 2882: {'lr': 0.0004999562855028159, 'samples': 553344, 'steps': 2881, 'loss/train': 2.791215181350708} -08/30/2021 13:43:53 - INFO - __main__ - Step 2883: {'lr': 0.0004999561862110358, 'samples': 553536, 'steps': 2882, 'loss/train': 2.320603847503662} -08/30/2021 13:43:53 - INFO - __main__ - Step 2884: {'lr': 0.0004999560868066293, 'samples': 553728, 'steps': 2883, 'loss/train': 3.279000997543335} -08/30/2021 13:43:54 - INFO - __main__ - Step 2885: {'lr': 0.0004999559872895964, 'samples': 553920, 'steps': 2884, 'loss/train': 2.206374168395996} -08/30/2021 13:43:54 - INFO - __main__ - Step 2886: {'lr': 0.0004999558876599373, 'samples': 554112, 'steps': 2885, 'loss/train': 2.559929132461548} -08/30/2021 13:43:56 - INFO - __main__ - Step 2887: {'lr': 0.0004999557879176518, 'samples': 554304, 'steps': 2886, 'loss/train': 7.318087577819824} -08/30/2021 13:43:56 - INFO - __main__ - Step 2888: {'lr': 0.0004999556880627401, 'samples': 554496, 'steps': 2887, 'loss/train': 3.7238998413085938} -08/30/2021 13:43:56 - INFO - __main__ - Step 2889: {'lr': 0.0004999555880952023, 'samples': 554688, 'steps': 2888, 'loss/train': 3.3081536293029785} -08/30/2021 13:43:57 - INFO - __main__ - Step 2890: {'lr': 0.0004999554880150383, 'samples': 554880, 'steps': 2889, 'loss/train': 3.2428319454193115} -08/30/2021 13:43:57 - INFO - __main__ - Step 2891: {'lr': 0.0004999553878222482, 'samples': 555072, 'steps': 2890, 'loss/train': 2.8276455402374268} -08/30/2021 13:43:59 - INFO - __main__ - Step 2892: {'lr': 0.0004999552875168321, 'samples': 555264, 'steps': 2891, 'loss/train': 3.1300160884857178} -08/30/2021 13:43:59 - INFO - __main__ - Step 2893: {'lr': 0.0004999551870987901, 'samples': 555456, 'steps': 2892, 'loss/train': 3.016570806503296} -08/30/2021 13:43:59 - INFO - __main__ - Step 2894: {'lr': 0.000499955086568122, 'samples': 555648, 'steps': 2893, 'loss/train': 3.561170816421509} -08/30/2021 13:44:00 - INFO - __main__ - Step 2895: {'lr': 0.000499954985924828, 'samples': 555840, 'steps': 2894, 'loss/train': 1.5887417793273926} -08/30/2021 13:44:00 - INFO - __main__ - Step 2896: {'lr': 0.0004999548851689082, 'samples': 556032, 'steps': 2895, 'loss/train': 0.6360597014427185} -08/30/2021 13:44:01 - INFO - __main__ - Step 2897: {'lr': 0.0004999547843003627, 'samples': 556224, 'steps': 2896, 'loss/train': 2.940615177154541} -08/30/2021 13:44:02 - INFO - __main__ - Step 2898: {'lr': 0.0004999546833191912, 'samples': 556416, 'steps': 2897, 'loss/train': 2.7789878845214844} -08/30/2021 13:44:02 - INFO - __main__ - Step 2899: {'lr': 0.0004999545822253941, 'samples': 556608, 'steps': 2898, 'loss/train': 3.103320837020874} -08/30/2021 13:44:03 - INFO - __main__ - Step 2900: {'lr': 0.0004999544810189713, 'samples': 556800, 'steps': 2899, 'loss/train': 2.287760019302368} -08/30/2021 13:44:03 - INFO - __main__ - Step 2901: {'lr': 0.0004999543796999228, 'samples': 556992, 'steps': 2900, 'loss/train': 3.5957651138305664} -08/30/2021 13:44:05 - INFO - __main__ - Step 2902: {'lr': 0.0004999542782682489, 'samples': 557184, 'steps': 2901, 'loss/train': 2.924877166748047} -08/30/2021 13:44:06 - INFO - __main__ - Step 2903: {'lr': 0.0004999541767239493, 'samples': 557376, 'steps': 2902, 'loss/train': 2.783628225326538} -08/30/2021 13:44:06 - INFO - __main__ - Step 2904: {'lr': 0.0004999540750670243, 'samples': 557568, 'steps': 2903, 'loss/train': 3.0987961292266846} -08/30/2021 13:44:06 - INFO - __main__ - Step 2905: {'lr': 0.0004999539732974738, 'samples': 557760, 'steps': 2904, 'loss/train': 2.848283052444458} -08/30/2021 13:44:07 - INFO - __main__ - Step 2906: {'lr': 0.0004999538714152978, 'samples': 557952, 'steps': 2905, 'loss/train': 2.8918533325195312} -08/30/2021 13:44:07 - INFO - __main__ - Step 2907: {'lr': 0.0004999537694204966, 'samples': 558144, 'steps': 2906, 'loss/train': 2.272188663482666} -08/30/2021 13:44:09 - INFO - __main__ - Step 2908: {'lr': 0.0004999536673130701, 'samples': 558336, 'steps': 2907, 'loss/train': 3.046729326248169} -08/30/2021 13:44:09 - INFO - __main__ - Step 2909: {'lr': 0.0004999535650930182, 'samples': 558528, 'steps': 2908, 'loss/train': 2.816863775253296} -08/30/2021 13:44:10 - INFO - __main__ - Step 2910: {'lr': 0.0004999534627603411, 'samples': 558720, 'steps': 2909, 'loss/train': 2.118304967880249} -08/30/2021 13:44:10 - INFO - __main__ - Step 2911: {'lr': 0.0004999533603150389, 'samples': 558912, 'steps': 2910, 'loss/train': 2.6835672855377197} -08/30/2021 13:44:10 - INFO - __main__ - Step 2912: {'lr': 0.0004999532577571116, 'samples': 559104, 'steps': 2911, 'loss/train': 3.151839017868042} -08/30/2021 13:44:12 - INFO - __main__ - Step 2913: {'lr': 0.0004999531550865592, 'samples': 559296, 'steps': 2912, 'loss/train': 2.8047454357147217} -08/30/2021 13:44:12 - INFO - __main__ - Step 2914: {'lr': 0.0004999530523033817, 'samples': 559488, 'steps': 2913, 'loss/train': 2.8529162406921387} -08/30/2021 13:44:13 - INFO - __main__ - Step 2915: {'lr': 0.0004999529494075792, 'samples': 559680, 'steps': 2914, 'loss/train': 2.7388527393341064} -08/30/2021 13:44:13 - INFO - __main__ - Step 2916: {'lr': 0.0004999528463991518, 'samples': 559872, 'steps': 2915, 'loss/train': 2.8058598041534424} -08/30/2021 13:44:13 - INFO - __main__ - Step 2917: {'lr': 0.0004999527432780995, 'samples': 560064, 'steps': 2916, 'loss/train': 3.0856664180755615} -08/30/2021 13:44:15 - INFO - __main__ - Step 2918: {'lr': 0.0004999526400444223, 'samples': 560256, 'steps': 2917, 'loss/train': 1.9239698648452759} -08/30/2021 13:44:15 - INFO - __main__ - Step 2919: {'lr': 0.0004999525366981204, 'samples': 560448, 'steps': 2918, 'loss/train': 3.4998552799224854} -08/30/2021 13:44:16 - INFO - __main__ - Step 2920: {'lr': 0.0004999524332391937, 'samples': 560640, 'steps': 2919, 'loss/train': 2.9600071907043457} -08/30/2021 13:44:16 - INFO - __main__ - Step 2921: {'lr': 0.0004999523296676423, 'samples': 560832, 'steps': 2920, 'loss/train': 2.7623751163482666} -08/30/2021 13:44:16 - INFO - __main__ - Step 2922: {'lr': 0.0004999522259834662, 'samples': 561024, 'steps': 2921, 'loss/train': 2.79846453666687} -08/30/2021 13:44:18 - INFO - __main__ - Step 2923: {'lr': 0.0004999521221866655, 'samples': 561216, 'steps': 2922, 'loss/train': 2.631439447402954} -08/30/2021 13:44:18 - INFO - __main__ - Step 2924: {'lr': 0.0004999520182772402, 'samples': 561408, 'steps': 2923, 'loss/train': 2.282538414001465} -08/30/2021 13:44:19 - INFO - __main__ - Step 2925: {'lr': 0.0004999519142551905, 'samples': 561600, 'steps': 2924, 'loss/train': 2.5863075256347656} -08/30/2021 13:44:19 - INFO - __main__ - Step 2926: {'lr': 0.0004999518101205162, 'samples': 561792, 'steps': 2925, 'loss/train': 1.9376370906829834} -08/30/2021 13:44:19 - INFO - __main__ - Step 2927: {'lr': 0.0004999517058732175, 'samples': 561984, 'steps': 2926, 'loss/train': 2.1587612628936768} -08/30/2021 13:44:20 - INFO - __main__ - Step 2928: {'lr': 0.0004999516015132945, 'samples': 562176, 'steps': 2927, 'loss/train': 3.034369945526123} -08/30/2021 13:44:21 - INFO - __main__ - Step 2929: {'lr': 0.0004999514970407471, 'samples': 562368, 'steps': 2928, 'loss/train': 2.461535930633545} -08/30/2021 13:44:22 - INFO - __main__ - Step 2930: {'lr': 0.0004999513924555754, 'samples': 562560, 'steps': 2929, 'loss/train': 2.53454327583313} -08/30/2021 13:44:22 - INFO - __main__ - Step 2931: {'lr': 0.0004999512877577794, 'samples': 562752, 'steps': 2930, 'loss/train': 2.8248937129974365} -08/30/2021 13:44:22 - INFO - __main__ - Step 2932: {'lr': 0.0004999511829473593, 'samples': 562944, 'steps': 2931, 'loss/train': 0.7965051531791687} -08/30/2021 13:44:23 - INFO - __main__ - Step 2933: {'lr': 0.0004999510780243151, 'samples': 563136, 'steps': 2932, 'loss/train': 2.673820734024048} -08/30/2021 13:44:24 - INFO - __main__ - Step 2934: {'lr': 0.0004999509729886467, 'samples': 563328, 'steps': 2933, 'loss/train': 2.241774082183838} -08/30/2021 13:44:25 - INFO - __main__ - Step 2935: {'lr': 0.0004999508678403542, 'samples': 563520, 'steps': 2934, 'loss/train': 2.892744541168213} -08/30/2021 13:44:25 - INFO - __main__ - Step 2936: {'lr': 0.0004999507625794378, 'samples': 563712, 'steps': 2935, 'loss/train': 3.223254680633545} -08/30/2021 13:44:25 - INFO - __main__ - Step 2937: {'lr': 0.0004999506572058974, 'samples': 563904, 'steps': 2936, 'loss/train': 1.714627981185913} -08/30/2021 13:44:26 - INFO - __main__ - Step 2938: {'lr': 0.0004999505517197331, 'samples': 564096, 'steps': 2937, 'loss/train': 2.4244155883789062} -08/30/2021 13:44:27 - INFO - __main__ - Step 2939: {'lr': 0.000499950446120945, 'samples': 564288, 'steps': 2938, 'loss/train': 1.4697874784469604} -08/30/2021 13:44:28 - INFO - __main__ - Step 2940: {'lr': 0.000499950340409533, 'samples': 564480, 'steps': 2939, 'loss/train': 0.44932907819747925} -08/30/2021 13:44:28 - INFO - __main__ - Step 2941: {'lr': 0.0004999502345854973, 'samples': 564672, 'steps': 2940, 'loss/train': 2.921510934829712} -08/30/2021 13:44:28 - INFO - __main__ - Step 2942: {'lr': 0.0004999501286488378, 'samples': 564864, 'steps': 2941, 'loss/train': 2.3862104415893555} -08/30/2021 13:44:29 - INFO - __main__ - Step 2943: {'lr': 0.0004999500225995547, 'samples': 565056, 'steps': 2942, 'loss/train': 2.6102335453033447} -08/30/2021 13:44:30 - INFO - __main__ - Step 2944: {'lr': 0.000499949916437648, 'samples': 565248, 'steps': 2943, 'loss/train': 2.867708683013916} -08/30/2021 13:44:31 - INFO - __main__ - Step 2945: {'lr': 0.0004999498101631177, 'samples': 565440, 'steps': 2944, 'loss/train': 3.421034336090088} -08/30/2021 13:44:31 - INFO - __main__ - Step 2946: {'lr': 0.0004999497037759638, 'samples': 565632, 'steps': 2945, 'loss/train': 2.4923837184906006} -08/30/2021 13:44:31 - INFO - __main__ - Step 2947: {'lr': 0.0004999495972761865, 'samples': 565824, 'steps': 2946, 'loss/train': 2.0850162506103516} -08/30/2021 13:44:32 - INFO - __main__ - Step 2948: {'lr': 0.0004999494906637857, 'samples': 566016, 'steps': 2947, 'loss/train': 2.3148810863494873} -08/30/2021 13:44:33 - INFO - __main__ - Step 2949: {'lr': 0.0004999493839387615, 'samples': 566208, 'steps': 2948, 'loss/train': 2.917724370956421} -08/30/2021 13:44:34 - INFO - __main__ - Step 2950: {'lr': 0.000499949277101114, 'samples': 566400, 'steps': 2949, 'loss/train': 2.8091204166412354} -08/30/2021 13:44:34 - INFO - __main__ - Step 2951: {'lr': 0.0004999491701508433, 'samples': 566592, 'steps': 2950, 'loss/train': 2.2364890575408936} -08/30/2021 13:44:34 - INFO - __main__ - Step 2952: {'lr': 0.0004999490630879493, 'samples': 566784, 'steps': 2951, 'loss/train': 2.2985527515411377} -08/30/2021 13:44:35 - INFO - __main__ - Step 2953: {'lr': 0.0004999489559124321, 'samples': 566976, 'steps': 2952, 'loss/train': 3.4640183448791504} -08/30/2021 13:44:37 - INFO - __main__ - Step 2954: {'lr': 0.0004999488486242918, 'samples': 567168, 'steps': 2953, 'loss/train': 2.5138840675354004} -08/30/2021 13:44:38 - INFO - __main__ - Step 2955: {'lr': 0.0004999487412235284, 'samples': 567360, 'steps': 2954, 'loss/train': 2.7582364082336426} -08/30/2021 13:44:38 - INFO - __main__ - Step 2956: {'lr': 0.0004999486337101419, 'samples': 567552, 'steps': 2955, 'loss/train': 1.8475825786590576} -08/30/2021 13:44:38 - INFO - __main__ - Step 2957: {'lr': 0.0004999485260841324, 'samples': 567744, 'steps': 2956, 'loss/train': 3.014390468597412} -08/30/2021 13:44:39 - INFO - __main__ - Step 2958: {'lr': 0.0004999484183455, 'samples': 567936, 'steps': 2957, 'loss/train': 2.3483035564422607} -08/30/2021 13:44:39 - INFO - __main__ - Step 2959: {'lr': 0.0004999483104942446, 'samples': 568128, 'steps': 2958, 'loss/train': 2.8362791538238525} -08/30/2021 13:44:41 - INFO - __main__ - Step 2960: {'lr': 0.0004999482025303665, 'samples': 568320, 'steps': 2959, 'loss/train': 2.887427806854248} -08/30/2021 13:44:42 - INFO - __main__ - Step 2961: {'lr': 0.0004999480944538655, 'samples': 568512, 'steps': 2960, 'loss/train': 3.5132014751434326} -08/30/2021 13:44:42 - INFO - __main__ - Step 2962: {'lr': 0.0004999479862647417, 'samples': 568704, 'steps': 2961, 'loss/train': 3.08158540725708} -08/30/2021 13:44:42 - INFO - __main__ - Step 2963: {'lr': 0.0004999478779629953, 'samples': 568896, 'steps': 2962, 'loss/train': 2.0255677700042725} -08/30/2021 13:44:43 - INFO - __main__ - Step 2964: {'lr': 0.0004999477695486261, 'samples': 569088, 'steps': 2963, 'loss/train': 0.8236057162284851} -08/30/2021 13:44:44 - INFO - __main__ - Step 2965: {'lr': 0.0004999476610216345, 'samples': 569280, 'steps': 2964, 'loss/train': 0.859920084476471} -08/30/2021 13:44:45 - INFO - __main__ - Step 2966: {'lr': 0.0004999475523820203, 'samples': 569472, 'steps': 2965, 'loss/train': 2.7543699741363525} -08/30/2021 13:44:45 - INFO - __main__ - Step 2967: {'lr': 0.0004999474436297835, 'samples': 569664, 'steps': 2966, 'loss/train': 2.5906596183776855} -08/30/2021 13:44:45 - INFO - __main__ - Step 2968: {'lr': 0.0004999473347649242, 'samples': 569856, 'steps': 2967, 'loss/train': 1.0227876901626587} -08/30/2021 13:44:46 - INFO - __main__ - Step 2969: {'lr': 0.0004999472257874426, 'samples': 570048, 'steps': 2968, 'loss/train': 2.6242566108703613} -08/30/2021 13:44:48 - INFO - __main__ - Step 2970: {'lr': 0.0004999471166973385, 'samples': 570240, 'steps': 2969, 'loss/train': 2.424834728240967} -08/30/2021 13:44:48 - INFO - __main__ - Step 2971: {'lr': 0.0004999470074946122, 'samples': 570432, 'steps': 2970, 'loss/train': 2.5786919593811035} -08/30/2021 13:44:48 - INFO - __main__ - Step 2972: {'lr': 0.0004999468981792636, 'samples': 570624, 'steps': 2971, 'loss/train': 2.902613878250122} -08/30/2021 13:44:49 - INFO - __main__ - Step 2973: {'lr': 0.0004999467887512928, 'samples': 570816, 'steps': 2972, 'loss/train': 2.933173418045044} -08/30/2021 13:44:49 - INFO - __main__ - Step 2974: {'lr': 0.0004999466792106998, 'samples': 571008, 'steps': 2973, 'loss/train': 2.886467695236206} -08/30/2021 13:44:50 - INFO - __main__ - Step 2975: {'lr': 0.0004999465695574848, 'samples': 571200, 'steps': 2974, 'loss/train': 2.3601338863372803} -08/30/2021 13:44:51 - INFO - __main__ - Step 2976: {'lr': 0.0004999464597916476, 'samples': 571392, 'steps': 2975, 'loss/train': 2.9770824909210205} -08/30/2021 13:44:51 - INFO - __main__ - Step 2977: {'lr': 0.0004999463499131884, 'samples': 571584, 'steps': 2976, 'loss/train': 2.3549747467041016} -08/30/2021 13:44:51 - INFO - __main__ - Step 2978: {'lr': 0.0004999462399221073, 'samples': 571776, 'steps': 2977, 'loss/train': 2.3175888061523438} -08/30/2021 13:44:52 - INFO - __main__ - Step 2979: {'lr': 0.0004999461298184042, 'samples': 571968, 'steps': 2978, 'loss/train': 2.9362945556640625} -08/30/2021 13:44:52 - INFO - __main__ - Step 2980: {'lr': 0.0004999460196020793, 'samples': 572160, 'steps': 2979, 'loss/train': 2.3794565200805664} -08/30/2021 13:44:54 - INFO - __main__ - Step 2981: {'lr': 0.0004999459092731326, 'samples': 572352, 'steps': 2980, 'loss/train': 2.9920153617858887} -08/30/2021 13:44:54 - INFO - __main__ - Step 2982: {'lr': 0.000499945798831564, 'samples': 572544, 'steps': 2981, 'loss/train': 1.9340310096740723} -08/30/2021 13:44:55 - INFO - __main__ - Step 2983: {'lr': 0.0004999456882773737, 'samples': 572736, 'steps': 2982, 'loss/train': 2.715445041656494} -08/30/2021 13:44:55 - INFO - __main__ - Step 2984: {'lr': 0.0004999455776105618, 'samples': 572928, 'steps': 2983, 'loss/train': 2.7663369178771973} -08/30/2021 13:44:55 - INFO - __main__ - Step 2985: {'lr': 0.0004999454668311283, 'samples': 573120, 'steps': 2984, 'loss/train': 2.597182273864746} -08/30/2021 13:44:57 - INFO - __main__ - Step 2986: {'lr': 0.0004999453559390731, 'samples': 573312, 'steps': 2985, 'loss/train': 0.6528981328010559} -08/30/2021 13:44:57 - INFO - __main__ - Step 2987: {'lr': 0.0004999452449343967, 'samples': 573504, 'steps': 2986, 'loss/train': 2.6354496479034424} -08/30/2021 13:44:58 - INFO - __main__ - Step 2988: {'lr': 0.0004999451338170985, 'samples': 573696, 'steps': 2987, 'loss/train': 2.6551873683929443} -08/30/2021 13:44:58 - INFO - __main__ - Step 2989: {'lr': 0.000499945022587179, 'samples': 573888, 'steps': 2988, 'loss/train': 2.0231504440307617} -08/30/2021 13:44:58 - INFO - __main__ - Step 2990: {'lr': 0.0004999449112446381, 'samples': 574080, 'steps': 2989, 'loss/train': 2.8025505542755127} -08/30/2021 13:45:00 - INFO - __main__ - Step 2991: {'lr': 0.000499944799789476, 'samples': 574272, 'steps': 2990, 'loss/train': 2.741412401199341} -08/30/2021 13:45:01 - INFO - __main__ - Step 2992: {'lr': 0.0004999446882216925, 'samples': 574464, 'steps': 2991, 'loss/train': 2.3821704387664795} -08/30/2021 13:45:01 - INFO - __main__ - Step 2993: {'lr': 0.0004999445765412878, 'samples': 574656, 'steps': 2992, 'loss/train': 2.259613037109375} -08/30/2021 13:45:01 - INFO - __main__ - Step 2994: {'lr': 0.0004999444647482619, 'samples': 574848, 'steps': 2993, 'loss/train': 0.6169657707214355} -08/30/2021 13:45:02 - INFO - __main__ - Step 2995: {'lr': 0.0004999443528426149, 'samples': 575040, 'steps': 2994, 'loss/train': 2.9905946254730225} -08/30/2021 13:45:03 - INFO - __main__ - Step 2996: {'lr': 0.0004999442408243469, 'samples': 575232, 'steps': 2995, 'loss/train': 2.6902949810028076} -08/30/2021 13:45:04 - INFO - __main__ - Step 2997: {'lr': 0.0004999441286934578, 'samples': 575424, 'steps': 2996, 'loss/train': 3.835057258605957} -08/30/2021 13:45:04 - INFO - __main__ - Step 2998: {'lr': 0.0004999440164499478, 'samples': 575616, 'steps': 2997, 'loss/train': 3.012542963027954} -08/30/2021 13:45:04 - INFO - __main__ - Step 2999: {'lr': 0.0004999439040938168, 'samples': 575808, 'steps': 2998, 'loss/train': 2.139873504638672} -08/30/2021 13:45:05 - INFO - __main__ - Step 3000: {'lr': 0.000499943791625065, 'samples': 576000, 'steps': 2999, 'loss/train': 2.54128360748291} -08/30/2021 13:45:06 - INFO - __main__ - Step 3001: {'lr': 0.0004999436790436923, 'samples': 576192, 'steps': 3000, 'loss/train': 1.8351815938949585} -08/30/2021 13:45:07 - INFO - __main__ - Step 3002: {'lr': 0.000499943566349699, 'samples': 576384, 'steps': 3001, 'loss/train': 2.538656234741211} -08/30/2021 13:45:07 - INFO - __main__ - Step 3003: {'lr': 0.0004999434535430848, 'samples': 576576, 'steps': 3002, 'loss/train': 2.350154399871826} -08/30/2021 13:45:07 - INFO - __main__ - Step 3004: {'lr': 0.0004999433406238501, 'samples': 576768, 'steps': 3003, 'loss/train': 2.707881212234497} -08/30/2021 13:45:08 - INFO - __main__ - Step 3005: {'lr': 0.0004999432275919947, 'samples': 576960, 'steps': 3004, 'loss/train': 2.6003835201263428} -08/30/2021 13:45:08 - INFO - __main__ - Step 3006: {'lr': 0.0004999431144475187, 'samples': 577152, 'steps': 3005, 'loss/train': 2.8380956649780273} -08/30/2021 13:45:10 - INFO - __main__ - Step 3007: {'lr': 0.0004999430011904222, 'samples': 577344, 'steps': 3006, 'loss/train': 2.5522007942199707} -08/30/2021 13:45:10 - INFO - __main__ - Step 3008: {'lr': 0.0004999428878207054, 'samples': 577536, 'steps': 3007, 'loss/train': 2.474048137664795} -08/30/2021 13:45:11 - INFO - __main__ - Step 3009: {'lr': 0.000499942774338368, 'samples': 577728, 'steps': 3008, 'loss/train': 2.4502363204956055} -08/30/2021 13:45:11 - INFO - __main__ - Step 3010: {'lr': 0.0004999426607434104, 'samples': 577920, 'steps': 3009, 'loss/train': 2.775979518890381} -08/30/2021 13:45:11 - INFO - __main__ - Step 3011: {'lr': 0.0004999425470358324, 'samples': 578112, 'steps': 3010, 'loss/train': 3.078824043273926} -08/30/2021 13:45:13 - INFO - __main__ - Step 3012: {'lr': 0.0004999424332156341, 'samples': 578304, 'steps': 3011, 'loss/train': 2.953322172164917} -08/30/2021 13:45:14 - INFO - __main__ - Step 3013: {'lr': 0.0004999423192828156, 'samples': 578496, 'steps': 3012, 'loss/train': 2.948363780975342} -08/30/2021 13:45:14 - INFO - __main__ - Step 3014: {'lr': 0.0004999422052373771, 'samples': 578688, 'steps': 3013, 'loss/train': 3.5237135887145996} -08/30/2021 13:45:14 - INFO - __main__ - Step 3015: {'lr': 0.0004999420910793183, 'samples': 578880, 'steps': 3014, 'loss/train': 2.7692630290985107} -08/30/2021 13:45:15 - INFO - __main__ - Step 3016: {'lr': 0.0004999419768086397, 'samples': 579072, 'steps': 3015, 'loss/train': 2.4753150939941406} -08/30/2021 13:45:16 - INFO - __main__ - Step 3017: {'lr': 0.0004999418624253408, 'samples': 579264, 'steps': 3016, 'loss/train': 1.1601556539535522} -08/30/2021 13:45:17 - INFO - __main__ - Step 3018: {'lr': 0.0004999417479294221, 'samples': 579456, 'steps': 3017, 'loss/train': 2.7365775108337402} -08/30/2021 13:45:17 - INFO - __main__ - Step 3019: {'lr': 0.0004999416333208835, 'samples': 579648, 'steps': 3018, 'loss/train': 2.1109657287597656} -08/30/2021 13:45:17 - INFO - __main__ - Step 3020: {'lr': 0.0004999415185997252, 'samples': 579840, 'steps': 3019, 'loss/train': 3.3136794567108154} -08/30/2021 13:45:18 - INFO - __main__ - Step 3021: {'lr': 0.0004999414037659468, 'samples': 580032, 'steps': 3020, 'loss/train': 4.073999881744385} -08/30/2021 13:45:18 - INFO - __main__ - Step 3022: {'lr': 0.000499941288819549, 'samples': 580224, 'steps': 3021, 'loss/train': 2.3366594314575195} -08/30/2021 13:45:19 - INFO - __main__ - Step 3023: {'lr': 0.0004999411737605313, 'samples': 580416, 'steps': 3022, 'loss/train': 2.9019672870635986} -08/30/2021 13:45:20 - INFO - __main__ - Step 3024: {'lr': 0.000499941058588894, 'samples': 580608, 'steps': 3023, 'loss/train': 1.7941155433654785} -08/30/2021 13:45:20 - INFO - __main__ - Step 3025: {'lr': 0.0004999409433046371, 'samples': 580800, 'steps': 3024, 'loss/train': 2.956582546234131} -08/30/2021 13:45:21 - INFO - __main__ - Step 3026: {'lr': 0.0004999408279077607, 'samples': 580992, 'steps': 3025, 'loss/train': 2.451669454574585} -08/30/2021 13:45:21 - INFO - __main__ - Step 3027: {'lr': 0.0004999407123982649, 'samples': 581184, 'steps': 3026, 'loss/train': 2.8706061840057373} -08/30/2021 13:45:23 - INFO - __main__ - Step 3028: {'lr': 0.0004999405967761495, 'samples': 581376, 'steps': 3027, 'loss/train': 2.580427885055542} -08/30/2021 13:45:23 - INFO - __main__ - Step 3029: {'lr': 0.0004999404810414149, 'samples': 581568, 'steps': 3028, 'loss/train': 2.147118330001831} -08/30/2021 13:45:24 - INFO - __main__ - Step 3030: {'lr': 0.0004999403651940608, 'samples': 581760, 'steps': 3029, 'loss/train': 2.019071340560913} -08/30/2021 13:45:24 - INFO - __main__ - Step 3031: {'lr': 0.0004999402492340875, 'samples': 581952, 'steps': 3030, 'loss/train': 0.7779306173324585} -08/30/2021 13:45:24 - INFO - __main__ - Step 3032: {'lr': 0.000499940133161495, 'samples': 582144, 'steps': 3031, 'loss/train': 2.4335618019104004} -08/30/2021 13:45:26 - INFO - __main__ - Step 3033: {'lr': 0.0004999400169762834, 'samples': 582336, 'steps': 3032, 'loss/train': 2.718484401702881} -08/30/2021 13:45:27 - INFO - __main__ - Step 3034: {'lr': 0.0004999399006784525, 'samples': 582528, 'steps': 3033, 'loss/train': 2.593709945678711} -08/30/2021 13:45:27 - INFO - __main__ - Step 3035: {'lr': 0.0004999397842680027, 'samples': 582720, 'steps': 3034, 'loss/train': 2.043519973754883} -08/30/2021 13:45:27 - INFO - __main__ - Step 3036: {'lr': 0.0004999396677449338, 'samples': 582912, 'steps': 3035, 'loss/train': 2.6912176609039307} -08/30/2021 13:45:28 - INFO - __main__ - Step 3037: {'lr': 0.000499939551109246, 'samples': 583104, 'steps': 3036, 'loss/train': 2.847600221633911} -08/30/2021 13:45:29 - INFO - __main__ - Step 3038: {'lr': 0.0004999394343609393, 'samples': 583296, 'steps': 3037, 'loss/train': 0.6094777584075928} -08/30/2021 13:45:30 - INFO - __main__ - Step 3039: {'lr': 0.0004999393175000137, 'samples': 583488, 'steps': 3038, 'loss/train': 2.4259679317474365} -08/30/2021 13:45:30 - INFO - __main__ - Step 3040: {'lr': 0.0004999392005264694, 'samples': 583680, 'steps': 3039, 'loss/train': 3.0082595348358154} -08/30/2021 13:45:30 - INFO - __main__ - Step 3041: {'lr': 0.0004999390834403062, 'samples': 583872, 'steps': 3040, 'loss/train': 2.5855770111083984} -08/30/2021 13:45:31 - INFO - __main__ - Step 3042: {'lr': 0.0004999389662415244, 'samples': 584064, 'steps': 3041, 'loss/train': 3.4849119186401367} -08/30/2021 13:45:32 - INFO - __main__ - Step 3043: {'lr': 0.000499938848930124, 'samples': 584256, 'steps': 3042, 'loss/train': 3.171412706375122} -08/30/2021 13:45:33 - INFO - __main__ - Step 3044: {'lr': 0.0004999387315061049, 'samples': 584448, 'steps': 3043, 'loss/train': 3.1442337036132812} -08/30/2021 13:45:33 - INFO - __main__ - Step 3045: {'lr': 0.0004999386139694673, 'samples': 584640, 'steps': 3044, 'loss/train': 2.964331865310669} -08/30/2021 13:45:33 - INFO - __main__ - Step 3046: {'lr': 0.0004999384963202113, 'samples': 584832, 'steps': 3045, 'loss/train': 2.6739697456359863} -08/30/2021 13:45:34 - INFO - __main__ - Step 3047: {'lr': 0.0004999383785583368, 'samples': 585024, 'steps': 3046, 'loss/train': 2.660141944885254} -08/30/2021 13:45:34 - INFO - __main__ - Step 3048: {'lr': 0.0004999382606838439, 'samples': 585216, 'steps': 3047, 'loss/train': 2.9862749576568604} -08/30/2021 13:45:36 - INFO - __main__ - Step 3049: {'lr': 0.0004999381426967327, 'samples': 585408, 'steps': 3048, 'loss/train': 1.8866349458694458} -08/30/2021 13:45:36 - INFO - __main__ - Step 3050: {'lr': 0.0004999380245970033, 'samples': 585600, 'steps': 3049, 'loss/train': 2.671400785446167} -08/30/2021 13:45:37 - INFO - __main__ - Step 3051: {'lr': 0.0004999379063846555, 'samples': 585792, 'steps': 3050, 'loss/train': 2.8302955627441406} -08/30/2021 13:45:37 - INFO - __main__ - Step 3052: {'lr': 0.0004999377880596897, 'samples': 585984, 'steps': 3051, 'loss/train': 2.9001340866088867} -08/30/2021 13:45:37 - INFO - __main__ - Step 3053: {'lr': 0.0004999376696221057, 'samples': 586176, 'steps': 3052, 'loss/train': 2.967221260070801} -08/30/2021 13:45:39 - INFO - __main__ - Step 3054: {'lr': 0.0004999375510719037, 'samples': 586368, 'steps': 3053, 'loss/train': 2.405060291290283} -08/30/2021 13:45:39 - INFO - __main__ - Step 3055: {'lr': 0.0004999374324090837, 'samples': 586560, 'steps': 3054, 'loss/train': 2.759819984436035} -08/30/2021 13:45:40 - INFO - __main__ - Step 3056: {'lr': 0.0004999373136336457, 'samples': 586752, 'steps': 3055, 'loss/train': 2.729295015335083} -08/30/2021 13:45:40 - INFO - __main__ - Step 3057: {'lr': 0.0004999371947455899, 'samples': 586944, 'steps': 3056, 'loss/train': 2.9442522525787354} -08/30/2021 13:45:40 - INFO - __main__ - Step 3058: {'lr': 0.0004999370757449162, 'samples': 587136, 'steps': 3057, 'loss/train': 2.8332059383392334} -08/30/2021 13:45:42 - INFO - __main__ - Step 3059: {'lr': 0.0004999369566316247, 'samples': 587328, 'steps': 3058, 'loss/train': 3.4595844745635986} -08/30/2021 13:45:42 - INFO - __main__ - Step 3060: {'lr': 0.0004999368374057155, 'samples': 587520, 'steps': 3059, 'loss/train': 3.0762219429016113} -08/30/2021 13:45:43 - INFO - __main__ - Step 3061: {'lr': 0.0004999367180671886, 'samples': 587712, 'steps': 3060, 'loss/train': 2.538363218307495} -08/30/2021 13:45:43 - INFO - __main__ - Step 3062: {'lr': 0.000499936598616044, 'samples': 587904, 'steps': 3061, 'loss/train': 2.421142101287842} -08/30/2021 13:45:43 - INFO - __main__ - Step 3063: {'lr': 0.0004999364790522819, 'samples': 588096, 'steps': 3062, 'loss/train': 3.322051763534546} -08/30/2021 13:45:44 - INFO - __main__ - Step 3064: {'lr': 0.0004999363593759022, 'samples': 588288, 'steps': 3063, 'loss/train': 2.883498191833496} -08/30/2021 13:45:46 - INFO - __main__ - Step 3065: {'lr': 0.0004999362395869052, 'samples': 588480, 'steps': 3064, 'loss/train': 2.4707047939300537} -08/30/2021 13:45:46 - INFO - __main__ - Step 3066: {'lr': 0.0004999361196852906, 'samples': 588672, 'steps': 3065, 'loss/train': 3.842144012451172} -08/30/2021 13:45:47 - INFO - __main__ - Step 3067: {'lr': 0.0004999359996710588, 'samples': 588864, 'steps': 3066, 'loss/train': 1.566475749015808} -08/30/2021 13:45:47 - INFO - __main__ - Step 3068: {'lr': 0.0004999358795442096, 'samples': 589056, 'steps': 3067, 'loss/train': 2.8776683807373047} -08/30/2021 13:45:47 - INFO - __main__ - Step 3069: {'lr': 0.0004999357593047431, 'samples': 589248, 'steps': 3068, 'loss/train': 1.8093340396881104} -08/30/2021 13:45:49 - INFO - __main__ - Step 3070: {'lr': 0.0004999356389526595, 'samples': 589440, 'steps': 3069, 'loss/train': 2.1377689838409424} -08/30/2021 13:45:49 - INFO - __main__ - Step 3071: {'lr': 0.0004999355184879587, 'samples': 589632, 'steps': 3070, 'loss/train': 2.0826215744018555} -08/30/2021 13:45:50 - INFO - __main__ - Step 3072: {'lr': 0.0004999353979106409, 'samples': 589824, 'steps': 3071, 'loss/train': 2.913546085357666} -08/30/2021 13:45:50 - INFO - __main__ - Step 3073: {'lr': 0.000499935277220706, 'samples': 590016, 'steps': 3072, 'loss/train': 2.7634084224700928} -08/30/2021 13:45:50 - INFO - __main__ - Step 3074: {'lr': 0.0004999351564181541, 'samples': 590208, 'steps': 3073, 'loss/train': 2.988072156906128} -08/30/2021 13:45:52 - INFO - __main__ - Step 3075: {'lr': 0.0004999350355029854, 'samples': 590400, 'steps': 3074, 'loss/train': 3.424922466278076} -08/30/2021 13:45:53 - INFO - __main__ - Step 3076: {'lr': 0.0004999349144751997, 'samples': 590592, 'steps': 3075, 'loss/train': 2.2299084663391113} -08/30/2021 13:45:53 - INFO - __main__ - Step 3077: {'lr': 0.0004999347933347972, 'samples': 590784, 'steps': 3076, 'loss/train': 2.887336015701294} -08/30/2021 13:45:53 - INFO - __main__ - Step 3078: {'lr': 0.0004999346720817779, 'samples': 590976, 'steps': 3077, 'loss/train': 2.785231590270996} -08/30/2021 13:45:54 - INFO - __main__ - Step 3079: {'lr': 0.000499934550716142, 'samples': 591168, 'steps': 3078, 'loss/train': 2.7666194438934326} -08/30/2021 13:45:54 - INFO - __main__ - Step 3080: {'lr': 0.0004999344292378893, 'samples': 591360, 'steps': 3079, 'loss/train': 1.5362716913223267} -08/30/2021 13:45:55 - INFO - __main__ - Step 3081: {'lr': 0.0004999343076470202, 'samples': 591552, 'steps': 3080, 'loss/train': 3.3281936645507812} -08/30/2021 13:45:56 - INFO - __main__ - Step 3082: {'lr': 0.0004999341859435345, 'samples': 591744, 'steps': 3081, 'loss/train': 3.255598783493042} -08/30/2021 13:45:56 - INFO - __main__ - Step 3083: {'lr': 0.0004999340641274322, 'samples': 591936, 'steps': 3082, 'loss/train': 2.720642566680908} -08/30/2021 13:45:57 - INFO - __main__ - Step 3084: {'lr': 0.0004999339421987136, 'samples': 592128, 'steps': 3083, 'loss/train': 2.823425769805908} -08/30/2021 13:45:57 - INFO - __main__ - Step 3085: {'lr': 0.0004999338201573786, 'samples': 592320, 'steps': 3084, 'loss/train': 2.087015151977539} -08/30/2021 13:45:59 - INFO - __main__ - Step 3086: {'lr': 0.0004999336980034271, 'samples': 592512, 'steps': 3085, 'loss/train': 2.859093189239502} -08/30/2021 13:45:59 - INFO - __main__ - Step 3087: {'lr': 0.0004999335757368595, 'samples': 592704, 'steps': 3086, 'loss/train': 2.915008306503296} -08/30/2021 13:45:59 - INFO - __main__ - Step 3088: {'lr': 0.0004999334533576757, 'samples': 592896, 'steps': 3087, 'loss/train': 3.409656286239624} -08/30/2021 13:46:00 - INFO - __main__ - Step 3089: {'lr': 0.0004999333308658756, 'samples': 593088, 'steps': 3088, 'loss/train': 2.9248416423797607} -08/30/2021 13:46:00 - INFO - __main__ - Step 3090: {'lr': 0.0004999332082614597, 'samples': 593280, 'steps': 3089, 'loss/train': 2.986475706100464} -08/30/2021 13:46:01 - INFO - __main__ - Step 3091: {'lr': 0.0004999330855444274, 'samples': 593472, 'steps': 3090, 'loss/train': 2.7550384998321533} -08/30/2021 13:46:02 - INFO - __main__ - Step 3092: {'lr': 0.0004999329627147792, 'samples': 593664, 'steps': 3091, 'loss/train': 2.990790367126465} -08/30/2021 13:46:02 - INFO - __main__ - Step 3093: {'lr': 0.0004999328397725152, 'samples': 593856, 'steps': 3092, 'loss/train': 3.0946664810180664} -08/30/2021 13:46:03 - INFO - __main__ - Step 3094: {'lr': 0.0004999327167176352, 'samples': 594048, 'steps': 3093, 'loss/train': 2.7758359909057617} -08/30/2021 13:46:03 - INFO - __main__ - Step 3095: {'lr': 0.0004999325935501395, 'samples': 594240, 'steps': 3094, 'loss/train': 2.7876522541046143} -08/30/2021 13:46:05 - INFO - __main__ - Step 3096: {'lr': 0.0004999324702700279, 'samples': 594432, 'steps': 3095, 'loss/train': 2.8208346366882324} -08/30/2021 13:46:05 - INFO - __main__ - Step 3097: {'lr': 0.0004999323468773007, 'samples': 594624, 'steps': 3096, 'loss/train': 2.5343258380889893} -08/30/2021 13:46:05 - INFO - __main__ - Step 3098: {'lr': 0.0004999322233719578, 'samples': 594816, 'steps': 3097, 'loss/train': 2.228133201599121} -08/30/2021 13:46:06 - INFO - __main__ - Step 3099: {'lr': 0.0004999320997539992, 'samples': 595008, 'steps': 3098, 'loss/train': 2.6890482902526855} -08/30/2021 13:46:06 - INFO - __main__ - Step 3100: {'lr': 0.0004999319760234251, 'samples': 595200, 'steps': 3099, 'loss/train': 2.4737637042999268} -08/30/2021 13:46:08 - INFO - __main__ - Step 3101: {'lr': 0.0004999318521802356, 'samples': 595392, 'steps': 3100, 'loss/train': 2.4688541889190674} -08/30/2021 13:46:08 - INFO - __main__ - Step 3102: {'lr': 0.0004999317282244305, 'samples': 595584, 'steps': 3101, 'loss/train': 3.134523391723633} -08/30/2021 13:46:08 - INFO - __main__ - Step 3103: {'lr': 0.0004999316041560102, 'samples': 595776, 'steps': 3102, 'loss/train': 3.150975465774536} -08/30/2021 13:46:09 - INFO - __main__ - Step 3104: {'lr': 0.0004999314799749745, 'samples': 595968, 'steps': 3103, 'loss/train': 3.054753303527832} -08/30/2021 13:46:09 - INFO - __main__ - Step 3105: {'lr': 0.0004999313556813235, 'samples': 596160, 'steps': 3104, 'loss/train': 2.088566541671753} -08/30/2021 13:46:11 - INFO - __main__ - Step 3106: {'lr': 0.0004999312312750573, 'samples': 596352, 'steps': 3105, 'loss/train': 2.5453414916992188} -08/30/2021 13:46:11 - INFO - __main__ - Step 3107: {'lr': 0.000499931106756176, 'samples': 596544, 'steps': 3106, 'loss/train': 2.4794046878814697} -08/30/2021 13:46:11 - INFO - __main__ - Step 3108: {'lr': 0.0004999309821246795, 'samples': 596736, 'steps': 3107, 'loss/train': 1.930832862854004} -08/30/2021 13:46:12 - INFO - __main__ - Step 3109: {'lr': 0.000499930857380568, 'samples': 596928, 'steps': 3108, 'loss/train': 2.0653395652770996} -08/30/2021 13:46:12 - INFO - __main__ - Step 3110: {'lr': 0.0004999307325238416, 'samples': 597120, 'steps': 3109, 'loss/train': 3.090510129928589} -08/30/2021 13:46:12 - INFO - __main__ - Step 3111: {'lr': 0.0004999306075545002, 'samples': 597312, 'steps': 3110, 'loss/train': 2.944995880126953} -08/30/2021 13:46:14 - INFO - __main__ - Step 3112: {'lr': 0.0004999304824725439, 'samples': 597504, 'steps': 3111, 'loss/train': 2.595315933227539} -08/30/2021 13:46:14 - INFO - __main__ - Step 3113: {'lr': 0.0004999303572779727, 'samples': 597696, 'steps': 3112, 'loss/train': 2.949462413787842} -08/30/2021 13:46:15 - INFO - __main__ - Step 3114: {'lr': 0.0004999302319707869, 'samples': 597888, 'steps': 3113, 'loss/train': 2.5815327167510986} -08/30/2021 13:46:15 - INFO - __main__ - Step 3115: {'lr': 0.0004999301065509863, 'samples': 598080, 'steps': 3114, 'loss/train': 3.0499043464660645} -08/30/2021 13:46:15 - INFO - __main__ - Step 3116: {'lr': 0.0004999299810185712, 'samples': 598272, 'steps': 3115, 'loss/train': 2.263648748397827} -08/30/2021 13:46:17 - INFO - __main__ - Step 3117: {'lr': 0.0004999298553735413, 'samples': 598464, 'steps': 3116, 'loss/train': 2.9172823429107666} -08/30/2021 13:46:17 - INFO - __main__ - Step 3118: {'lr': 0.000499929729615897, 'samples': 598656, 'steps': 3117, 'loss/train': 2.170206308364868} -08/30/2021 13:46:18 - INFO - __main__ - Step 3119: {'lr': 0.0004999296037456381, 'samples': 598848, 'steps': 3118, 'loss/train': 2.7277300357818604} -08/30/2021 13:46:18 - INFO - __main__ - Step 3120: {'lr': 0.0004999294777627649, 'samples': 599040, 'steps': 3119, 'loss/train': 2.7261152267456055} -08/30/2021 13:46:19 - INFO - __main__ - Step 3121: {'lr': 0.0004999293516672773, 'samples': 599232, 'steps': 3120, 'loss/train': 2.6429615020751953} -08/30/2021 13:46:21 - INFO - __main__ - Step 3122: {'lr': 0.0004999292254591754, 'samples': 599424, 'steps': 3121, 'loss/train': 0.48724889755249023} -08/30/2021 13:46:21 - INFO - __main__ - Step 3123: {'lr': 0.0004999290991384591, 'samples': 599616, 'steps': 3122, 'loss/train': 2.0068628787994385} -08/30/2021 13:46:22 - INFO - __main__ - Step 3124: {'lr': 0.0004999289727051289, 'samples': 599808, 'steps': 3123, 'loss/train': 2.296069860458374} -08/30/2021 13:46:22 - INFO - __main__ - Step 3125: {'lr': 0.0004999288461591842, 'samples': 600000, 'steps': 3124, 'loss/train': 3.5134057998657227} -08/30/2021 13:46:23 - INFO - __main__ - Step 3126: {'lr': 0.0004999287195006257, 'samples': 600192, 'steps': 3125, 'loss/train': 2.448402166366577} -08/30/2021 13:46:24 - INFO - __main__ - Step 3127: {'lr': 0.000499928592729453, 'samples': 600384, 'steps': 3126, 'loss/train': 2.403609037399292} -08/30/2021 13:46:24 - INFO - __main__ - Step 3128: {'lr': 0.0004999284658456665, 'samples': 600576, 'steps': 3127, 'loss/train': 2.4453182220458984} -08/30/2021 13:46:25 - INFO - __main__ - Step 3129: {'lr': 0.000499928338849266, 'samples': 600768, 'steps': 3128, 'loss/train': 2.8014326095581055} -08/30/2021 13:46:25 - INFO - __main__ - Step 3130: {'lr': 0.0004999282117402516, 'samples': 600960, 'steps': 3129, 'loss/train': 2.376030445098877} -08/30/2021 13:46:26 - INFO - __main__ - Step 3131: {'lr': 0.0004999280845186235, 'samples': 601152, 'steps': 3130, 'loss/train': 2.396571159362793} -08/30/2021 13:46:26 - INFO - __main__ - Step 3132: {'lr': 0.0004999279571843816, 'samples': 601344, 'steps': 3131, 'loss/train': 2.4883921146392822} -08/30/2021 13:46:28 - INFO - __main__ - Step 3133: {'lr': 0.000499927829737526, 'samples': 601536, 'steps': 3132, 'loss/train': 2.477632999420166} -08/30/2021 13:46:28 - INFO - __main__ - Step 3134: {'lr': 0.0004999277021780569, 'samples': 601728, 'steps': 3133, 'loss/train': 2.8598475456237793} -08/30/2021 13:46:29 - INFO - __main__ - Step 3135: {'lr': 0.0004999275745059741, 'samples': 601920, 'steps': 3134, 'loss/train': 3.3187780380249023} -08/30/2021 13:46:29 - INFO - __main__ - Step 3136: {'lr': 0.0004999274467212779, 'samples': 602112, 'steps': 3135, 'loss/train': 2.6064679622650146} -08/30/2021 13:46:29 - INFO - __main__ - Step 3137: {'lr': 0.0004999273188239681, 'samples': 602304, 'steps': 3136, 'loss/train': 3.262578248977661} -08/30/2021 13:46:31 - INFO - __main__ - Step 3138: {'lr': 0.0004999271908140451, 'samples': 602496, 'steps': 3137, 'loss/train': 4.358016490936279} -08/30/2021 13:46:31 - INFO - __main__ - Step 3139: {'lr': 0.0004999270626915086, 'samples': 602688, 'steps': 3138, 'loss/train': 2.5021872520446777} -08/30/2021 13:46:32 - INFO - __main__ - Step 3140: {'lr': 0.0004999269344563589, 'samples': 602880, 'steps': 3139, 'loss/train': 2.635646343231201} -08/30/2021 13:46:32 - INFO - __main__ - Step 3141: {'lr': 0.0004999268061085959, 'samples': 603072, 'steps': 3140, 'loss/train': 2.6724436283111572} -08/30/2021 13:46:32 - INFO - __main__ - Step 3142: {'lr': 0.0004999266776482199, 'samples': 603264, 'steps': 3141, 'loss/train': 2.859872579574585} -08/30/2021 13:46:34 - INFO - __main__ - Step 3143: {'lr': 0.0004999265490752306, 'samples': 603456, 'steps': 3142, 'loss/train': 1.779443383216858} -08/30/2021 13:46:34 - INFO - __main__ - Step 3144: {'lr': 0.0004999264203896284, 'samples': 603648, 'steps': 3143, 'loss/train': 2.3480141162872314} -08/30/2021 13:46:34 - INFO - __main__ - Step 3145: {'lr': 0.0004999262915914132, 'samples': 603840, 'steps': 3144, 'loss/train': 2.638678550720215} -08/30/2021 13:46:35 - INFO - __main__ - Step 3146: {'lr': 0.000499926162680585, 'samples': 604032, 'steps': 3145, 'loss/train': 1.5302430391311646} -08/30/2021 13:46:35 - INFO - __main__ - Step 3147: {'lr': 0.000499926033657144, 'samples': 604224, 'steps': 3146, 'loss/train': 2.6154024600982666} -08/30/2021 13:46:37 - INFO - __main__ - Step 3148: {'lr': 0.0004999259045210901, 'samples': 604416, 'steps': 3147, 'loss/train': 2.933009147644043} -08/30/2021 13:46:37 - INFO - __main__ - Step 3149: {'lr': 0.0004999257752724234, 'samples': 604608, 'steps': 3148, 'loss/train': 2.689781427383423} -08/30/2021 13:46:38 - INFO - __main__ - Step 3150: {'lr': 0.0004999256459111443, 'samples': 604800, 'steps': 3149, 'loss/train': 3.92864727973938} -08/30/2021 13:46:38 - INFO - __main__ - Step 3151: {'lr': 0.0004999255164372523, 'samples': 604992, 'steps': 3150, 'loss/train': 2.9216690063476562} -08/30/2021 13:46:38 - INFO - __main__ - Step 3152: {'lr': 0.0004999253868507476, 'samples': 605184, 'steps': 3151, 'loss/train': 1.0915896892547607} -08/30/2021 13:46:40 - INFO - __main__ - Step 3153: {'lr': 0.0004999252571516306, 'samples': 605376, 'steps': 3152, 'loss/train': 3.0541324615478516} -08/30/2021 13:46:40 - INFO - __main__ - Step 3154: {'lr': 0.0004999251273399011, 'samples': 605568, 'steps': 3153, 'loss/train': 2.8533623218536377} -08/30/2021 13:46:40 - INFO - __main__ - Step 3155: {'lr': 0.0004999249974155592, 'samples': 605760, 'steps': 3154, 'loss/train': 1.9612441062927246} -08/30/2021 13:46:41 - INFO - __main__ - Step 3156: {'lr': 0.0004999248673786049, 'samples': 605952, 'steps': 3155, 'loss/train': 2.6098594665527344} -08/30/2021 13:46:41 - INFO - __main__ - Step 3157: {'lr': 0.0004999247372290383, 'samples': 606144, 'steps': 3156, 'loss/train': 2.979992389678955} -08/30/2021 13:46:42 - INFO - __main__ - Step 3158: {'lr': 0.0004999246069668596, 'samples': 606336, 'steps': 3157, 'loss/train': 3.557257890701294} -08/30/2021 13:46:43 - INFO - __main__ - Step 3159: {'lr': 0.0004999244765920687, 'samples': 606528, 'steps': 3158, 'loss/train': 2.915217638015747} -08/30/2021 13:46:43 - INFO - __main__ - Step 3160: {'lr': 0.0004999243461046656, 'samples': 606720, 'steps': 3159, 'loss/train': 3.2726290225982666} -08/30/2021 13:46:44 - INFO - __main__ - Step 3161: {'lr': 0.0004999242155046504, 'samples': 606912, 'steps': 3160, 'loss/train': 2.917583465576172} -08/30/2021 13:46:44 - INFO - __main__ - Step 3162: {'lr': 0.0004999240847920233, 'samples': 607104, 'steps': 3161, 'loss/train': 2.02170467376709} -08/30/2021 13:46:44 - INFO - __main__ - Step 3163: {'lr': 0.0004999239539667842, 'samples': 607296, 'steps': 3162, 'loss/train': 2.193922519683838} -08/30/2021 13:46:46 - INFO - __main__ - Step 3164: {'lr': 0.0004999238230289333, 'samples': 607488, 'steps': 3163, 'loss/train': 3.0787715911865234} -08/30/2021 13:46:47 - INFO - __main__ - Step 3165: {'lr': 0.0004999236919784705, 'samples': 607680, 'steps': 3164, 'loss/train': 2.407846212387085} -08/30/2021 13:46:47 - INFO - __main__ - Step 3166: {'lr': 0.0004999235608153961, 'samples': 607872, 'steps': 3165, 'loss/train': 6.306263446807861} -08/30/2021 13:46:47 - INFO - __main__ - Step 3167: {'lr': 0.0004999234295397098, 'samples': 608064, 'steps': 3166, 'loss/train': 2.6810712814331055} -08/30/2021 13:46:48 - INFO - __main__ - Step 3168: {'lr': 0.000499923298151412, 'samples': 608256, 'steps': 3167, 'loss/train': 2.5126678943634033} -08/30/2021 13:46:48 - INFO - __main__ - Step 3169: {'lr': 0.0004999231666505025, 'samples': 608448, 'steps': 3168, 'loss/train': 2.035252332687378} -08/30/2021 13:46:50 - INFO - __main__ - Step 3170: {'lr': 0.0004999230350369816, 'samples': 608640, 'steps': 3169, 'loss/train': 2.936342716217041} -08/30/2021 13:46:51 - INFO - __main__ - Step 3171: {'lr': 0.0004999229033108492, 'samples': 608832, 'steps': 3170, 'loss/train': 2.796079397201538} -08/30/2021 13:46:51 - INFO - __main__ - Step 3172: {'lr': 0.0004999227714721054, 'samples': 609024, 'steps': 3171, 'loss/train': 2.489570379257202} -08/30/2021 13:46:52 - INFO - __main__ - Step 3173: {'lr': 0.0004999226395207501, 'samples': 609216, 'steps': 3172, 'loss/train': 2.50984525680542} -08/30/2021 13:46:52 - INFO - __main__ - Step 3174: {'lr': 0.0004999225074567837, 'samples': 609408, 'steps': 3173, 'loss/train': 2.986717939376831} -08/30/2021 13:46:52 - INFO - __main__ - Step 3175: {'lr': 0.000499922375280206, 'samples': 609600, 'steps': 3174, 'loss/train': 3.0193252563476562} -08/30/2021 13:46:55 - INFO - __main__ - Step 3176: {'lr': 0.0004999222429910171, 'samples': 609792, 'steps': 3175, 'loss/train': 3.845912218093872} -08/30/2021 13:46:55 - INFO - __main__ - Step 3177: {'lr': 0.0004999221105892172, 'samples': 609984, 'steps': 3176, 'loss/train': 3.3472275733947754} -08/30/2021 13:46:56 - INFO - __main__ - Step 3178: {'lr': 0.0004999219780748062, 'samples': 610176, 'steps': 3177, 'loss/train': 2.7961440086364746} -08/30/2021 13:46:56 - INFO - __main__ - Step 3179: {'lr': 0.0004999218454477843, 'samples': 610368, 'steps': 3178, 'loss/train': 3.055490732192993} -08/30/2021 13:46:56 - INFO - __main__ - Step 3180: {'lr': 0.0004999217127081514, 'samples': 610560, 'steps': 3179, 'loss/train': 4.990219593048096} -08/30/2021 13:46:57 - INFO - __main__ - Step 3181: {'lr': 0.0004999215798559076, 'samples': 610752, 'steps': 3180, 'loss/train': 3.0262258052825928} -08/30/2021 13:46:58 - INFO - __main__ - Step 3182: {'lr': 0.000499921446891053, 'samples': 610944, 'steps': 3181, 'loss/train': 3.575921058654785} -08/30/2021 13:46:59 - INFO - __main__ - Step 3183: {'lr': 0.0004999213138135877, 'samples': 611136, 'steps': 3182, 'loss/train': 2.4072868824005127} -08/30/2021 13:46:59 - INFO - __main__ - Step 3184: {'lr': 0.0004999211806235117, 'samples': 611328, 'steps': 3183, 'loss/train': 3.0549840927124023} -08/30/2021 13:46:59 - INFO - __main__ - Step 3185: {'lr': 0.000499921047320825, 'samples': 611520, 'steps': 3184, 'loss/train': 3.205899715423584} -08/30/2021 13:47:00 - INFO - __main__ - Step 3186: {'lr': 0.0004999209139055278, 'samples': 611712, 'steps': 3185, 'loss/train': 3.4004037380218506} -08/30/2021 13:47:01 - INFO - __main__ - Step 3187: {'lr': 0.0004999207803776201, 'samples': 611904, 'steps': 3186, 'loss/train': 3.189333438873291} -08/30/2021 13:47:02 - INFO - __main__ - Step 3188: {'lr': 0.000499920646737102, 'samples': 612096, 'steps': 3187, 'loss/train': 1.065770149230957} -08/30/2021 13:47:02 - INFO - __main__ - Step 3189: {'lr': 0.0004999205129839734, 'samples': 612288, 'steps': 3188, 'loss/train': 3.436750888824463} -08/30/2021 13:47:03 - INFO - __main__ - Step 3190: {'lr': 0.0004999203791182345, 'samples': 612480, 'steps': 3189, 'loss/train': 4.105352878570557} -08/30/2021 13:47:03 - INFO - __main__ - Step 3191: {'lr': 0.0004999202451398853, 'samples': 612672, 'steps': 3190, 'loss/train': 3.031970739364624} -08/30/2021 13:47:03 - INFO - __main__ - Step 3192: {'lr': 0.000499920111048926, 'samples': 612864, 'steps': 3191, 'loss/train': 2.3613171577453613} -08/30/2021 13:47:05 - INFO - __main__ - Step 3193: {'lr': 0.0004999199768453565, 'samples': 613056, 'steps': 3192, 'loss/train': 2.7101738452911377} -08/30/2021 13:47:05 - INFO - __main__ - Step 3194: {'lr': 0.0004999198425291769, 'samples': 613248, 'steps': 3193, 'loss/train': 3.037245035171509} -08/30/2021 13:47:06 - INFO - __main__ - Step 3195: {'lr': 0.0004999197081003873, 'samples': 613440, 'steps': 3194, 'loss/train': 3.037924289703369} -08/30/2021 13:47:06 - INFO - __main__ - Step 3196: {'lr': 0.0004999195735589877, 'samples': 613632, 'steps': 3195, 'loss/train': 3.242856025695801} -08/30/2021 13:47:06 - INFO - __main__ - Step 3197: {'lr': 0.0004999194389049783, 'samples': 613824, 'steps': 3196, 'loss/train': 3.041048765182495} -08/30/2021 13:47:08 - INFO - __main__ - Step 3198: {'lr': 0.0004999193041383588, 'samples': 614016, 'steps': 3197, 'loss/train': 3.4910566806793213} -08/30/2021 13:47:08 - INFO - __main__ - Step 3199: {'lr': 0.0004999191692591299, 'samples': 614208, 'steps': 3198, 'loss/train': 4.287659645080566} -08/30/2021 13:47:09 - INFO - __main__ - Step 3200: {'lr': 0.000499919034267291, 'samples': 614400, 'steps': 3199, 'loss/train': 2.7867040634155273} -08/30/2021 13:47:09 - INFO - __main__ - Step 3201: {'lr': 0.0004999188991628425, 'samples': 614592, 'steps': 3200, 'loss/train': 2.268404483795166} -08/30/2021 13:47:09 - INFO - __main__ - Step 3202: {'lr': 0.0004999187639457844, 'samples': 614784, 'steps': 3201, 'loss/train': 2.992171049118042} -08/30/2021 13:47:11 - INFO - __main__ - Step 3203: {'lr': 0.0004999186286161169, 'samples': 614976, 'steps': 3202, 'loss/train': 2.7562453746795654} -08/30/2021 13:47:12 - INFO - __main__ - Step 3204: {'lr': 0.0004999184931738397, 'samples': 615168, 'steps': 3203, 'loss/train': 1.3342421054840088} -08/30/2021 13:47:12 - INFO - __main__ - Step 3205: {'lr': 0.0004999183576189532, 'samples': 615360, 'steps': 3204, 'loss/train': 2.7941534519195557} -08/30/2021 13:47:12 - INFO - __main__ - Step 3206: {'lr': 0.0004999182219514573, 'samples': 615552, 'steps': 3205, 'loss/train': 2.1377646923065186} -08/30/2021 13:47:13 - INFO - __main__ - Step 3207: {'lr': 0.0004999180861713522, 'samples': 615744, 'steps': 3206, 'loss/train': 3.188704013824463} -08/30/2021 13:47:15 - INFO - __main__ - Step 3208: {'lr': 0.0004999179502786377, 'samples': 615936, 'steps': 3207, 'loss/train': 2.582209587097168} -08/30/2021 13:47:15 - INFO - __main__ - Step 3209: {'lr': 0.0004999178142733141, 'samples': 616128, 'steps': 3208, 'loss/train': 2.6052796840667725} -08/30/2021 13:47:15 - INFO - __main__ - Step 3210: {'lr': 0.0004999176781553815, 'samples': 616320, 'steps': 3209, 'loss/train': 3.0828773975372314} -08/30/2021 13:47:16 - INFO - __main__ - Step 3211: {'lr': 0.0004999175419248398, 'samples': 616512, 'steps': 3210, 'loss/train': 2.756396770477295} -08/30/2021 13:47:16 - INFO - __main__ - Step 3212: {'lr': 0.0004999174055816891, 'samples': 616704, 'steps': 3211, 'loss/train': 2.909679651260376} -08/30/2021 13:47:16 - INFO - __main__ - Step 3213: {'lr': 0.0004999172691259293, 'samples': 616896, 'steps': 3212, 'loss/train': 3.3466978073120117} -08/30/2021 13:47:18 - INFO - __main__ - Step 3214: {'lr': 0.0004999171325575609, 'samples': 617088, 'steps': 3213, 'loss/train': 0.6976868510246277} -08/30/2021 13:47:18 - INFO - __main__ - Step 3215: {'lr': 0.0004999169958765836, 'samples': 617280, 'steps': 3214, 'loss/train': 2.3229188919067383} -08/30/2021 13:47:19 - INFO - __main__ - Step 3216: {'lr': 0.0004999168590829975, 'samples': 617472, 'steps': 3215, 'loss/train': 2.50573468208313} -08/30/2021 13:47:19 - INFO - __main__ - Step 3217: {'lr': 0.0004999167221768028, 'samples': 617664, 'steps': 3216, 'loss/train': 2.442990303039551} -08/30/2021 13:47:19 - INFO - __main__ - Step 3218: {'lr': 0.0004999165851579994, 'samples': 617856, 'steps': 3217, 'loss/train': 3.084824800491333} -08/30/2021 13:47:21 - INFO - __main__ - Step 3219: {'lr': 0.0004999164480265875, 'samples': 618048, 'steps': 3218, 'loss/train': 2.7596936225891113} -08/30/2021 13:47:22 - INFO - __main__ - Step 3220: {'lr': 0.0004999163107825671, 'samples': 618240, 'steps': 3219, 'loss/train': 2.5256688594818115} -08/30/2021 13:47:22 - INFO - __main__ - Step 3221: {'lr': 0.0004999161734259383, 'samples': 618432, 'steps': 3220, 'loss/train': 3.144214630126953} -08/30/2021 13:47:22 - INFO - __main__ - Step 3222: {'lr': 0.0004999160359567011, 'samples': 618624, 'steps': 3221, 'loss/train': 2.37947940826416} -08/30/2021 13:47:23 - INFO - __main__ - Step 3223: {'lr': 0.0004999158983748555, 'samples': 618816, 'steps': 3222, 'loss/train': 2.7375147342681885} -08/30/2021 13:47:24 - INFO - __main__ - Step 3224: {'lr': 0.0004999157606804018, 'samples': 619008, 'steps': 3223, 'loss/train': 1.6062546968460083} -08/30/2021 13:47:25 - INFO - __main__ - Step 3225: {'lr': 0.0004999156228733398, 'samples': 619200, 'steps': 3224, 'loss/train': 2.4721710681915283} -08/30/2021 13:47:25 - INFO - __main__ - Step 3226: {'lr': 0.0004999154849536698, 'samples': 619392, 'steps': 3225, 'loss/train': 2.4993298053741455} -08/30/2021 13:47:25 - INFO - __main__ - Step 3227: {'lr': 0.0004999153469213917, 'samples': 619584, 'steps': 3226, 'loss/train': 2.770925283432007} -08/30/2021 13:47:26 - INFO - __main__ - Step 3228: {'lr': 0.0004999152087765055, 'samples': 619776, 'steps': 3227, 'loss/train': 2.7168385982513428} -08/30/2021 13:47:26 - INFO - __main__ - Step 3229: {'lr': 0.0004999150705190114, 'samples': 619968, 'steps': 3228, 'loss/train': 3.37111496925354} -08/30/2021 13:47:28 - INFO - __main__ - Step 3230: {'lr': 0.0004999149321489095, 'samples': 620160, 'steps': 3229, 'loss/train': 3.021174430847168} -08/30/2021 13:47:29 - INFO - __main__ - Step 3231: {'lr': 0.0004999147936661997, 'samples': 620352, 'steps': 3230, 'loss/train': 2.9290390014648438} -08/30/2021 13:47:29 - INFO - __main__ - Step 3232: {'lr': 0.0004999146550708822, 'samples': 620544, 'steps': 3231, 'loss/train': 2.412423849105835} -08/30/2021 13:47:29 - INFO - __main__ - Step 3233: {'lr': 0.000499914516362957, 'samples': 620736, 'steps': 3232, 'loss/train': 3.0570268630981445} -08/30/2021 13:47:30 - INFO - __main__ - Step 3234: {'lr': 0.0004999143775424241, 'samples': 620928, 'steps': 3233, 'loss/train': 1.90534245967865} -08/30/2021 13:47:31 - INFO - __main__ - Step 3235: {'lr': 0.0004999142386092838, 'samples': 621120, 'steps': 3234, 'loss/train': 2.9524097442626953} -08/30/2021 13:47:32 - INFO - __main__ - Step 3236: {'lr': 0.000499914099563536, 'samples': 621312, 'steps': 3235, 'loss/train': 4.571676731109619} -08/30/2021 13:47:32 - INFO - __main__ - Step 3237: {'lr': 0.0004999139604051806, 'samples': 621504, 'steps': 3236, 'loss/train': 3.1490585803985596} -08/30/2021 13:47:33 - INFO - __main__ - Step 3238: {'lr': 0.0004999138211342179, 'samples': 621696, 'steps': 3237, 'loss/train': 3.0514590740203857} -08/30/2021 13:47:33 - INFO - __main__ - Step 3239: {'lr': 0.0004999136817506478, 'samples': 621888, 'steps': 3238, 'loss/train': 0.9605992436408997} -08/30/2021 13:47:34 - INFO - __main__ - Step 3240: {'lr': 0.0004999135422544707, 'samples': 622080, 'steps': 3239, 'loss/train': 2.3694913387298584} -08/30/2021 13:47:35 - INFO - __main__ - Step 3241: {'lr': 0.0004999134026456862, 'samples': 622272, 'steps': 3240, 'loss/train': 2.468559980392456} -08/30/2021 13:47:35 - INFO - __main__ - Step 3242: {'lr': 0.0004999132629242946, 'samples': 622464, 'steps': 3241, 'loss/train': 3.220627784729004} -08/30/2021 13:47:36 - INFO - __main__ - Step 3243: {'lr': 0.000499913123090296, 'samples': 622656, 'steps': 3242, 'loss/train': 2.988105535507202} -08/30/2021 13:47:36 - INFO - __main__ - Step 3244: {'lr': 0.0004999129831436904, 'samples': 622848, 'steps': 3243, 'loss/train': 2.8485569953918457} -08/30/2021 13:47:37 - INFO - __main__ - Step 3245: {'lr': 0.0004999128430844778, 'samples': 623040, 'steps': 3244, 'loss/train': 1.7911012172698975} -08/30/2021 13:47:38 - INFO - __main__ - Step 3246: {'lr': 0.0004999127029126585, 'samples': 623232, 'steps': 3245, 'loss/train': 2.9321649074554443} -08/30/2021 13:47:38 - INFO - __main__ - Step 3247: {'lr': 0.0004999125626282322, 'samples': 623424, 'steps': 3246, 'loss/train': 2.5870540142059326} -08/30/2021 13:47:38 - INFO - __main__ - Step 3248: {'lr': 0.0004999124222311993, 'samples': 623616, 'steps': 3247, 'loss/train': 2.862294912338257} -08/30/2021 13:47:39 - INFO - __main__ - Step 3249: {'lr': 0.0004999122817215595, 'samples': 623808, 'steps': 3248, 'loss/train': 2.49239444732666} -08/30/2021 13:47:40 - INFO - __main__ - Step 3250: {'lr': 0.0004999121410993133, 'samples': 624000, 'steps': 3249, 'loss/train': 2.8708701133728027} -08/30/2021 13:47:41 - INFO - __main__ - Step 3251: {'lr': 0.0004999120003644604, 'samples': 624192, 'steps': 3250, 'loss/train': 2.5049490928649902} -08/30/2021 13:47:41 - INFO - __main__ - Step 3252: {'lr': 0.0004999118595170011, 'samples': 624384, 'steps': 3251, 'loss/train': 3.0734362602233887} -08/30/2021 13:47:41 - INFO - __main__ - Step 3253: {'lr': 0.0004999117185569354, 'samples': 624576, 'steps': 3252, 'loss/train': 2.3230626583099365} -08/30/2021 13:47:42 - INFO - __main__ - Step 3254: {'lr': 0.0004999115774842633, 'samples': 624768, 'steps': 3253, 'loss/train': 3.3489320278167725} -08/30/2021 13:47:44 - INFO - __main__ - Step 3255: {'lr': 0.0004999114362989849, 'samples': 624960, 'steps': 3254, 'loss/train': 2.6042723655700684} -08/30/2021 13:47:44 - INFO - __main__ - Step 3256: {'lr': 0.0004999112950011002, 'samples': 625152, 'steps': 3255, 'loss/train': 3.1600685119628906} -08/30/2021 13:47:44 - INFO - __main__ - Step 3257: {'lr': 0.0004999111535906094, 'samples': 625344, 'steps': 3256, 'loss/train': 3.0841994285583496} -08/30/2021 13:47:45 - INFO - __main__ - Step 3258: {'lr': 0.0004999110120675125, 'samples': 625536, 'steps': 3257, 'loss/train': 2.4904887676239014} -08/30/2021 13:47:45 - INFO - __main__ - Step 3259: {'lr': 0.0004999108704318095, 'samples': 625728, 'steps': 3258, 'loss/train': 0.7025074362754822} -08/30/2021 13:47:47 - INFO - __main__ - Step 3260: {'lr': 0.0004999107286835006, 'samples': 625920, 'steps': 3259, 'loss/train': 2.1461243629455566} -08/30/2021 13:47:47 - INFO - __main__ - Step 3261: {'lr': 0.0004999105868225858, 'samples': 626112, 'steps': 3260, 'loss/train': 2.9746410846710205} -08/30/2021 13:47:47 - INFO - __main__ - Step 3262: {'lr': 0.0004999104448490649, 'samples': 626304, 'steps': 3261, 'loss/train': 1.9697314500808716} -08/30/2021 13:47:48 - INFO - __main__ - Step 3263: {'lr': 0.0004999103027629384, 'samples': 626496, 'steps': 3262, 'loss/train': 2.3351855278015137} -08/30/2021 13:47:48 - INFO - __main__ - Step 3264: {'lr': 0.0004999101605642061, 'samples': 626688, 'steps': 3263, 'loss/train': 2.5148749351501465} -08/30/2021 13:47:49 - INFO - __main__ - Step 3265: {'lr': 0.0004999100182528683, 'samples': 626880, 'steps': 3264, 'loss/train': 2.81813383102417} -08/30/2021 13:47:50 - INFO - __main__ - Step 3266: {'lr': 0.0004999098758289248, 'samples': 627072, 'steps': 3265, 'loss/train': 2.612733840942383} -08/30/2021 13:47:50 - INFO - __main__ - Step 3267: {'lr': 0.0004999097332923758, 'samples': 627264, 'steps': 3266, 'loss/train': 2.461395740509033} -08/30/2021 13:47:51 - INFO - __main__ - Step 3268: {'lr': 0.0004999095906432213, 'samples': 627456, 'steps': 3267, 'loss/train': 2.8094491958618164} -08/30/2021 13:47:51 - INFO - __main__ - Step 3269: {'lr': 0.0004999094478814613, 'samples': 627648, 'steps': 3268, 'loss/train': 2.8189516067504883} -08/30/2021 13:47:51 - INFO - __main__ - Step 3270: {'lr': 0.0004999093050070961, 'samples': 627840, 'steps': 3269, 'loss/train': 2.4825503826141357} -08/30/2021 13:47:53 - INFO - __main__ - Step 3271: {'lr': 0.0004999091620201255, 'samples': 628032, 'steps': 3270, 'loss/train': 2.7980663776397705} -08/30/2021 13:47:53 - INFO - __main__ - Step 3272: {'lr': 0.0004999090189205498, 'samples': 628224, 'steps': 3271, 'loss/train': 2.6761281490325928} -08/30/2021 13:47:54 - INFO - __main__ - Step 3273: {'lr': 0.0004999088757083689, 'samples': 628416, 'steps': 3272, 'loss/train': 1.788774847984314} -08/30/2021 13:47:54 - INFO - __main__ - Step 3274: {'lr': 0.0004999087323835829, 'samples': 628608, 'steps': 3273, 'loss/train': 2.6867196559906006} -08/30/2021 13:47:54 - INFO - __main__ - Step 3275: {'lr': 0.0004999085889461919, 'samples': 628800, 'steps': 3274, 'loss/train': 2.401261806488037} -08/30/2021 13:47:56 - INFO - __main__ - Step 3276: {'lr': 0.0004999084453961959, 'samples': 628992, 'steps': 3275, 'loss/train': 2.571923017501831} -08/30/2021 13:47:57 - INFO - __main__ - Step 3277: {'lr': 0.0004999083017335951, 'samples': 629184, 'steps': 3276, 'loss/train': 2.670154094696045} -08/30/2021 13:47:57 - INFO - __main__ - Step 3278: {'lr': 0.0004999081579583895, 'samples': 629376, 'steps': 3277, 'loss/train': 1.959620475769043} -08/30/2021 13:47:57 - INFO - __main__ - Step 3279: {'lr': 0.0004999080140705791, 'samples': 629568, 'steps': 3278, 'loss/train': 2.1653659343719482} -08/30/2021 13:47:58 - INFO - __main__ - Step 3280: {'lr': 0.0004999078700701639, 'samples': 629760, 'steps': 3279, 'loss/train': 1.4701002836227417} -08/30/2021 13:47:58 - INFO - __main__ - Step 3281: {'lr': 0.0004999077259571442, 'samples': 629952, 'steps': 3280, 'loss/train': 1.766237497329712} -08/30/2021 13:47:59 - INFO - __main__ - Step 3282: {'lr': 0.0004999075817315199, 'samples': 630144, 'steps': 3281, 'loss/train': 2.268458843231201} -08/30/2021 13:48:00 - INFO - __main__ - Step 3283: {'lr': 0.0004999074373932911, 'samples': 630336, 'steps': 3282, 'loss/train': 2.3677804470062256} -08/30/2021 13:48:00 - INFO - __main__ - Step 3284: {'lr': 0.0004999072929424579, 'samples': 630528, 'steps': 3283, 'loss/train': 2.5171844959259033} -08/30/2021 13:48:01 - INFO - __main__ - Step 3285: {'lr': 0.0004999071483790203, 'samples': 630720, 'steps': 3284, 'loss/train': 3.5679070949554443} -08/30/2021 13:48:01 - INFO - __main__ - Step 3286: {'lr': 0.0004999070037029783, 'samples': 630912, 'steps': 3285, 'loss/train': 2.1660118103027344} -08/30/2021 13:48:03 - INFO - __main__ - Step 3287: {'lr': 0.0004999068589143322, 'samples': 631104, 'steps': 3286, 'loss/train': 2.397390365600586} -08/30/2021 13:48:04 - INFO - __main__ - Step 3288: {'lr': 0.0004999067140130819, 'samples': 631296, 'steps': 3287, 'loss/train': 2.073444128036499} -08/30/2021 13:48:04 - INFO - __main__ - Step 3289: {'lr': 0.0004999065689992273, 'samples': 631488, 'steps': 3288, 'loss/train': 0.5190285444259644} -08/30/2021 13:48:05 - INFO - __main__ - Step 3290: {'lr': 0.0004999064238727689, 'samples': 631680, 'steps': 3289, 'loss/train': 2.7662148475646973} -08/30/2021 13:48:05 - INFO - __main__ - Step 3291: {'lr': 0.0004999062786337064, 'samples': 631872, 'steps': 3290, 'loss/train': 2.8064463138580322} -08/30/2021 13:48:06 - INFO - __main__ - Step 3292: {'lr': 0.0004999061332820401, 'samples': 632064, 'steps': 3291, 'loss/train': 2.773684501647949} -08/30/2021 13:48:07 - INFO - __main__ - Step 3293: {'lr': 0.0004999059878177699, 'samples': 632256, 'steps': 3292, 'loss/train': 2.9490532875061035} -08/30/2021 13:48:07 - INFO - __main__ - Step 3294: {'lr': 0.0004999058422408959, 'samples': 632448, 'steps': 3293, 'loss/train': 2.387587785720825} -08/30/2021 13:48:08 - INFO - __main__ - Step 3295: {'lr': 0.0004999056965514181, 'samples': 632640, 'steps': 3294, 'loss/train': 2.536912679672241} -08/30/2021 13:48:08 - INFO - __main__ - Step 3296: {'lr': 0.0004999055507493368, 'samples': 632832, 'steps': 3295, 'loss/train': 2.3596861362457275} -08/30/2021 13:48:09 - INFO - __main__ - Step 3297: {'lr': 0.0004999054048346517, 'samples': 633024, 'steps': 3296, 'loss/train': 2.387342929840088} -08/30/2021 13:48:10 - INFO - __main__ - Step 3298: {'lr': 0.0004999052588073633, 'samples': 633216, 'steps': 3297, 'loss/train': 2.5546672344207764} -08/30/2021 13:48:10 - INFO - __main__ - Step 3299: {'lr': 0.0004999051126674714, 'samples': 633408, 'steps': 3298, 'loss/train': 2.604255437850952} -08/30/2021 13:48:11 - INFO - __main__ - Step 3300: {'lr': 0.0004999049664149761, 'samples': 633600, 'steps': 3299, 'loss/train': 2.6365129947662354} -08/30/2021 13:48:11 - INFO - __main__ - Step 3301: {'lr': 0.0004999048200498774, 'samples': 633792, 'steps': 3300, 'loss/train': 2.722532033920288} -08/30/2021 13:48:12 - INFO - __main__ - Step 3302: {'lr': 0.0004999046735721755, 'samples': 633984, 'steps': 3301, 'loss/train': 2.8905324935913086} -08/30/2021 13:48:13 - INFO - __main__ - Step 3303: {'lr': 0.0004999045269818704, 'samples': 634176, 'steps': 3302, 'loss/train': 2.822232961654663} -08/30/2021 13:48:13 - INFO - __main__ - Step 3304: {'lr': 0.0004999043802789622, 'samples': 634368, 'steps': 3303, 'loss/train': 2.6634597778320312} -08/30/2021 13:48:13 - INFO - __main__ - Step 3305: {'lr': 0.000499904233463451, 'samples': 634560, 'steps': 3304, 'loss/train': 2.9877405166625977} -08/30/2021 13:48:14 - INFO - __main__ - Step 3306: {'lr': 0.0004999040865353367, 'samples': 634752, 'steps': 3305, 'loss/train': 2.688408374786377} -08/30/2021 13:48:14 - INFO - __main__ - Step 3307: {'lr': 0.0004999039394946196, 'samples': 634944, 'steps': 3306, 'loss/train': 2.555669069290161} -08/30/2021 13:48:16 - INFO - __main__ - Step 3308: {'lr': 0.0004999037923412995, 'samples': 635136, 'steps': 3307, 'loss/train': 2.469919443130493} -08/30/2021 13:48:16 - INFO - __main__ - Step 3309: {'lr': 0.0004999036450753767, 'samples': 635328, 'steps': 3308, 'loss/train': 2.422785520553589} -08/30/2021 13:48:17 - INFO - __main__ - Step 3310: {'lr': 0.0004999034976968511, 'samples': 635520, 'steps': 3309, 'loss/train': 2.396209955215454} -08/30/2021 13:48:17 - INFO - __main__ - Step 3311: {'lr': 0.0004999033502057228, 'samples': 635712, 'steps': 3310, 'loss/train': 0.4965997040271759} -08/30/2021 13:48:17 - INFO - __main__ - Step 3312: {'lr': 0.000499903202601992, 'samples': 635904, 'steps': 3311, 'loss/train': 2.49814772605896} -08/30/2021 13:48:19 - INFO - __main__ - Step 3313: {'lr': 0.0004999030548856586, 'samples': 636096, 'steps': 3312, 'loss/train': 2.534740686416626} -08/30/2021 13:48:19 - INFO - __main__ - Step 3314: {'lr': 0.0004999029070567229, 'samples': 636288, 'steps': 3313, 'loss/train': 2.4719066619873047} -08/30/2021 13:48:20 - INFO - __main__ - Step 3315: {'lr': 0.0004999027591151847, 'samples': 636480, 'steps': 3314, 'loss/train': 2.980236768722534} -08/30/2021 13:48:20 - INFO - __main__ - Step 3316: {'lr': 0.0004999026110610442, 'samples': 636672, 'steps': 3315, 'loss/train': 3.3525431156158447} -08/30/2021 13:48:20 - INFO - __main__ - Step 3317: {'lr': 0.0004999024628943014, 'samples': 636864, 'steps': 3316, 'loss/train': 3.0579843521118164} -08/30/2021 13:48:22 - INFO - __main__ - Step 3318: {'lr': 0.0004999023146149565, 'samples': 637056, 'steps': 3317, 'loss/train': 3.0031614303588867} -08/30/2021 13:48:22 - INFO - __main__ - Step 3319: {'lr': 0.0004999021662230093, 'samples': 637248, 'steps': 3318, 'loss/train': 3.110140323638916} -08/30/2021 13:48:23 - INFO - __main__ - Step 3320: {'lr': 0.0004999020177184601, 'samples': 637440, 'steps': 3319, 'loss/train': 2.562987804412842} -08/30/2021 13:48:23 - INFO - __main__ - Step 3321: {'lr': 0.000499901869101309, 'samples': 637632, 'steps': 3320, 'loss/train': 2.5110275745391846} -08/30/2021 13:48:23 - INFO - __main__ - Step 3322: {'lr': 0.0004999017203715559, 'samples': 637824, 'steps': 3321, 'loss/train': 3.200589656829834} -08/30/2021 13:48:25 - INFO - __main__ - Step 3323: {'lr': 0.000499901571529201, 'samples': 638016, 'steps': 3322, 'loss/train': 2.8086395263671875} -08/30/2021 13:48:25 - INFO - __main__ - Step 3324: {'lr': 0.0004999014225742442, 'samples': 638208, 'steps': 3323, 'loss/train': 2.0978477001190186} -08/30/2021 13:48:25 - INFO - __main__ - Step 3325: {'lr': 0.0004999012735066858, 'samples': 638400, 'steps': 3324, 'loss/train': 2.442878484725952} -08/30/2021 13:48:26 - INFO - __main__ - Step 3326: {'lr': 0.0004999011243265257, 'samples': 638592, 'steps': 3325, 'loss/train': 3.172194242477417} -08/30/2021 13:48:26 - INFO - __main__ - Step 3327: {'lr': 0.000499900975033764, 'samples': 638784, 'steps': 3326, 'loss/train': 3.3617234230041504} -08/30/2021 13:48:28 - INFO - __main__ - Step 3328: {'lr': 0.0004999008256284008, 'samples': 638976, 'steps': 3327, 'loss/train': 2.6678080558776855} -08/30/2021 13:48:28 - INFO - __main__ - Step 3329: {'lr': 0.0004999006761104361, 'samples': 639168, 'steps': 3328, 'loss/train': 2.5414741039276123} -08/30/2021 13:48:28 - INFO - __main__ - Step 3330: {'lr': 0.0004999005264798701, 'samples': 639360, 'steps': 3329, 'loss/train': 2.473289728164673} -08/30/2021 13:48:29 - INFO - __main__ - Step 3331: {'lr': 0.0004999003767367027, 'samples': 639552, 'steps': 3330, 'loss/train': 2.6687510013580322} -08/30/2021 13:48:29 - INFO - __main__ - Step 3332: {'lr': 0.0004999002268809339, 'samples': 639744, 'steps': 3331, 'loss/train': 1.7362552881240845} -08/30/2021 13:48:31 - INFO - __main__ - Step 3333: {'lr': 0.0004999000769125642, 'samples': 639936, 'steps': 3332, 'loss/train': 2.652609348297119} -08/30/2021 13:48:31 - INFO - __main__ - Step 3334: {'lr': 0.0004998999268315932, 'samples': 640128, 'steps': 3333, 'loss/train': 2.4559290409088135} -08/30/2021 13:48:31 - INFO - __main__ - Step 3335: {'lr': 0.0004998997766380212, 'samples': 640320, 'steps': 3334, 'loss/train': 2.385721445083618} -08/30/2021 13:48:32 - INFO - __main__ - Step 3336: {'lr': 0.0004998996263318482, 'samples': 640512, 'steps': 3335, 'loss/train': 2.356045961380005} -08/30/2021 13:48:32 - INFO - __main__ - Step 3337: {'lr': 0.0004998994759130743, 'samples': 640704, 'steps': 3336, 'loss/train': 2.7879414558410645} -08/30/2021 13:48:34 - INFO - __main__ - Step 3338: {'lr': 0.0004998993253816996, 'samples': 640896, 'steps': 3337, 'loss/train': 2.1548779010772705} -08/30/2021 13:48:34 - INFO - __main__ - Step 3339: {'lr': 0.000499899174737724, 'samples': 641088, 'steps': 3338, 'loss/train': 2.10243821144104} -08/30/2021 13:48:35 - INFO - __main__ - Step 3340: {'lr': 0.0004998990239811477, 'samples': 641280, 'steps': 3339, 'loss/train': 2.5220203399658203} -08/30/2021 13:48:35 - INFO - __main__ - Step 3341: {'lr': 0.0004998988731119709, 'samples': 641472, 'steps': 3340, 'loss/train': 2.620222568511963} -08/30/2021 13:48:36 - INFO - __main__ - Step 3342: {'lr': 0.0004998987221301935, 'samples': 641664, 'steps': 3341, 'loss/train': 2.443495035171509} -08/30/2021 13:48:36 - INFO - __main__ - Step 3343: {'lr': 0.0004998985710358155, 'samples': 641856, 'steps': 3342, 'loss/train': 2.132190465927124} -08/30/2021 13:48:38 - INFO - __main__ - Step 3344: {'lr': 0.0004998984198288371, 'samples': 642048, 'steps': 3343, 'loss/train': 2.160667896270752} -08/30/2021 13:48:38 - INFO - __main__ - Step 3345: {'lr': 0.0004998982685092583, 'samples': 642240, 'steps': 3344, 'loss/train': 2.8251593112945557} -08/30/2021 13:48:38 - INFO - __main__ - Step 3346: {'lr': 0.0004998981170770792, 'samples': 642432, 'steps': 3345, 'loss/train': 2.4152023792266846} -08/30/2021 13:48:39 - INFO - __main__ - Step 3347: {'lr': 0.0004998979655323, 'samples': 642624, 'steps': 3346, 'loss/train': 2.6465532779693604} -08/30/2021 13:48:39 - INFO - __main__ - Step 3348: {'lr': 0.0004998978138749204, 'samples': 642816, 'steps': 3347, 'loss/train': 2.9894039630889893} -08/30/2021 13:48:41 - INFO - __main__ - Step 3349: {'lr': 0.0004998976621049408, 'samples': 643008, 'steps': 3348, 'loss/train': 2.57108998298645} -08/30/2021 13:48:41 - INFO - __main__ - Step 3350: {'lr': 0.0004998975102223612, 'samples': 643200, 'steps': 3349, 'loss/train': 2.692763328552246} -08/30/2021 13:48:41 - INFO - __main__ - Step 3351: {'lr': 0.0004998973582271817, 'samples': 643392, 'steps': 3350, 'loss/train': 1.823738694190979} -08/30/2021 13:48:42 - INFO - __main__ - Step 3352: {'lr': 0.0004998972061194022, 'samples': 643584, 'steps': 3351, 'loss/train': 2.8077547550201416} -08/30/2021 13:48:42 - INFO - __main__ - Step 3353: {'lr': 0.0004998970538990228, 'samples': 643776, 'steps': 3352, 'loss/train': 2.885777473449707} -08/30/2021 13:48:44 - INFO - __main__ - Step 3354: {'lr': 0.0004998969015660438, 'samples': 643968, 'steps': 3353, 'loss/train': 2.5239927768707275} -08/30/2021 13:48:45 - INFO - __main__ - Step 3355: {'lr': 0.0004998967491204651, 'samples': 644160, 'steps': 3354, 'loss/train': 2.5806667804718018} -08/30/2021 13:48:45 - INFO - __main__ - Step 3356: {'lr': 0.0004998965965622867, 'samples': 644352, 'steps': 3355, 'loss/train': 2.547076940536499} -08/30/2021 13:48:45 - INFO - __main__ - Step 3357: {'lr': 0.0004998964438915088, 'samples': 644544, 'steps': 3356, 'loss/train': 2.1983394622802734} -08/30/2021 13:48:46 - INFO - __main__ - Step 3358: {'lr': 0.0004998962911081314, 'samples': 644736, 'steps': 3357, 'loss/train': 1.7727375030517578} -08/30/2021 13:48:46 - INFO - __main__ - Step 3359: {'lr': 0.0004998961382121546, 'samples': 644928, 'steps': 3358, 'loss/train': 2.59871768951416} -08/30/2021 13:48:48 - INFO - __main__ - Step 3360: {'lr': 0.0004998959852035785, 'samples': 645120, 'steps': 3359, 'loss/train': 2.518486976623535} -08/30/2021 13:48:48 - INFO - __main__ - Step 3361: {'lr': 0.0004998958320824031, 'samples': 645312, 'steps': 3360, 'loss/train': 2.533982992172241} -08/30/2021 13:48:49 - INFO - __main__ - Step 3362: {'lr': 0.0004998956788486284, 'samples': 645504, 'steps': 3361, 'loss/train': 2.8132495880126953} -08/30/2021 13:48:49 - INFO - __main__ - Step 3363: {'lr': 0.0004998955255022547, 'samples': 645696, 'steps': 3362, 'loss/train': 1.9254417419433594} -08/30/2021 13:48:49 - INFO - __main__ - Step 3364: {'lr': 0.0004998953720432818, 'samples': 645888, 'steps': 3363, 'loss/train': 2.747995376586914} -08/30/2021 13:48:50 - INFO - __main__ - Step 3365: {'lr': 0.00049989521847171, 'samples': 646080, 'steps': 3364, 'loss/train': 2.550886631011963} -08/30/2021 13:48:51 - INFO - __main__ - Step 3366: {'lr': 0.0004998950647875392, 'samples': 646272, 'steps': 3365, 'loss/train': 3.939955472946167} -08/30/2021 13:48:52 - INFO - __main__ - Step 3367: {'lr': 0.0004998949109907697, 'samples': 646464, 'steps': 3366, 'loss/train': 2.9285311698913574} -08/30/2021 13:48:52 - INFO - __main__ - Step 3368: {'lr': 0.0004998947570814012, 'samples': 646656, 'steps': 3367, 'loss/train': 2.6467556953430176} -08/30/2021 13:48:52 - INFO - __main__ - Step 3369: {'lr': 0.0004998946030594341, 'samples': 646848, 'steps': 3368, 'loss/train': 2.517835855484009} -08/30/2021 13:48:53 - INFO - __main__ - Step 3370: {'lr': 0.0004998944489248683, 'samples': 647040, 'steps': 3369, 'loss/train': 2.932713270187378} -08/30/2021 13:48:54 - INFO - __main__ - Step 3371: {'lr': 0.000499894294677704, 'samples': 647232, 'steps': 3370, 'loss/train': 2.707963228225708} -08/30/2021 13:48:55 - INFO - __main__ - Step 3372: {'lr': 0.000499894140317941, 'samples': 647424, 'steps': 3371, 'loss/train': 2.471409320831299} -08/30/2021 13:48:55 - INFO - __main__ - Step 3373: {'lr': 0.0004998939858455798, 'samples': 647616, 'steps': 3372, 'loss/train': 2.475250482559204} -08/30/2021 13:48:55 - INFO - __main__ - Step 3374: {'lr': 0.0004998938312606201, 'samples': 647808, 'steps': 3373, 'loss/train': 1.9769246578216553} -08/30/2021 13:48:56 - INFO - __main__ - Step 3375: {'lr': 0.000499893676563062, 'samples': 648000, 'steps': 3374, 'loss/train': 3.2632381916046143} -08/30/2021 13:48:57 - INFO - __main__ - Step 3376: {'lr': 0.0004998935217529058, 'samples': 648192, 'steps': 3375, 'loss/train': 2.835620880126953} -08/30/2021 13:48:58 - INFO - __main__ - Step 3377: {'lr': 0.0004998933668301514, 'samples': 648384, 'steps': 3376, 'loss/train': 3.0379831790924072} -08/30/2021 13:48:58 - INFO - __main__ - Step 3378: {'lr': 0.0004998932117947989, 'samples': 648576, 'steps': 3377, 'loss/train': 2.353278875350952} -08/30/2021 13:48:58 - INFO - __main__ - Step 3379: {'lr': 0.0004998930566468484, 'samples': 648768, 'steps': 3378, 'loss/train': 2.9702203273773193} -08/30/2021 13:48:59 - INFO - __main__ - Step 3380: {'lr': 0.0004998929013863, 'samples': 648960, 'steps': 3379, 'loss/train': 2.017845630645752} -08/30/2021 13:49:00 - INFO - __main__ - Step 3381: {'lr': 0.0004998927460131535, 'samples': 649152, 'steps': 3380, 'loss/train': 2.112061023712158} -08/30/2021 13:49:01 - INFO - __main__ - Step 3382: {'lr': 0.0004998925905274094, 'samples': 649344, 'steps': 3381, 'loss/train': 1.5845096111297607} -08/30/2021 13:49:01 - INFO - __main__ - Step 3383: {'lr': 0.0004998924349290674, 'samples': 649536, 'steps': 3382, 'loss/train': 2.748828411102295} -08/30/2021 13:49:01 - INFO - __main__ - Step 3384: {'lr': 0.0004998922792181278, 'samples': 649728, 'steps': 3383, 'loss/train': 2.293346643447876} -08/30/2021 13:49:02 - INFO - __main__ - Step 3385: {'lr': 0.0004998921233945907, 'samples': 649920, 'steps': 3384, 'loss/train': 1.8696900606155396} -08/30/2021 13:49:02 - INFO - __main__ - Step 3386: {'lr': 0.0004998919674584559, 'samples': 650112, 'steps': 3385, 'loss/train': 2.5926995277404785} -08/30/2021 13:49:04 - INFO - __main__ - Step 3387: {'lr': 0.0004998918114097237, 'samples': 650304, 'steps': 3386, 'loss/train': 2.7840747833251953} -08/30/2021 13:49:05 - INFO - __main__ - Step 3388: {'lr': 0.0004998916552483941, 'samples': 650496, 'steps': 3387, 'loss/train': 2.191200017929077} -08/30/2021 13:49:05 - INFO - __main__ - Step 3389: {'lr': 0.0004998914989744671, 'samples': 650688, 'steps': 3388, 'loss/train': 2.1903586387634277} -08/30/2021 13:49:05 - INFO - __main__ - Step 3390: {'lr': 0.000499891342587943, 'samples': 650880, 'steps': 3389, 'loss/train': 2.354968309402466} -08/30/2021 13:49:06 - INFO - __main__ - Step 3391: {'lr': 0.0004998911860888217, 'samples': 651072, 'steps': 3390, 'loss/train': 1.799631118774414} -08/30/2021 13:49:06 - INFO - __main__ - Step 3392: {'lr': 0.0004998910294771032, 'samples': 651264, 'steps': 3391, 'loss/train': 1.7778704166412354} -08/30/2021 13:49:07 - INFO - __main__ - Step 3393: {'lr': 0.0004998908727527877, 'samples': 651456, 'steps': 3392, 'loss/train': 4.1373090744018555} -08/30/2021 13:49:09 - INFO - __main__ - Step 3394: {'lr': 0.0004998907159158752, 'samples': 651648, 'steps': 3393, 'loss/train': 2.655801296234131} -08/30/2021 13:49:10 - INFO - __main__ - Step 3395: {'lr': 0.0004998905589663658, 'samples': 651840, 'steps': 3394, 'loss/train': 2.715543270111084} -08/30/2021 13:49:10 - INFO - __main__ - Step 3396: {'lr': 0.0004998904019042596, 'samples': 652032, 'steps': 3395, 'loss/train': 3.3126304149627686} -08/30/2021 13:49:11 - INFO - __main__ - Step 3397: {'lr': 0.0004998902447295567, 'samples': 652224, 'steps': 3396, 'loss/train': 3.198720693588257} -08/30/2021 13:49:11 - INFO - __main__ - Step 3398: {'lr': 0.000499890087442257, 'samples': 652416, 'steps': 3397, 'loss/train': 2.64034104347229} -08/30/2021 13:49:13 - INFO - __main__ - Step 3399: {'lr': 0.0004998899300423607, 'samples': 652608, 'steps': 3398, 'loss/train': 0.8199313879013062} -08/30/2021 13:49:13 - INFO - __main__ - Step 3400: {'lr': 0.0004998897725298679, 'samples': 652800, 'steps': 3399, 'loss/train': 2.494413375854492} -08/30/2021 13:49:13 - INFO - __main__ - Step 3401: {'lr': 0.0004998896149047786, 'samples': 652992, 'steps': 3400, 'loss/train': 2.441323757171631} -08/30/2021 13:49:14 - INFO - __main__ - Step 3402: {'lr': 0.0004998894571670929, 'samples': 653184, 'steps': 3401, 'loss/train': 3.2445061206817627} -08/30/2021 13:49:14 - INFO - __main__ - Step 3403: {'lr': 0.0004998892993168109, 'samples': 653376, 'steps': 3402, 'loss/train': 2.917768955230713} -08/30/2021 13:49:16 - INFO - __main__ - Step 3404: {'lr': 0.0004998891413539326, 'samples': 653568, 'steps': 3403, 'loss/train': 3.06826114654541} -08/30/2021 13:49:16 - INFO - __main__ - Step 3405: {'lr': 0.0004998889832784581, 'samples': 653760, 'steps': 3404, 'loss/train': 3.037091016769409} -08/30/2021 13:49:17 - INFO - __main__ - Step 3406: {'lr': 0.0004998888250903875, 'samples': 653952, 'steps': 3405, 'loss/train': 2.4964957237243652} -08/30/2021 13:49:17 - INFO - __main__ - Step 3407: {'lr': 0.0004998886667897209, 'samples': 654144, 'steps': 3406, 'loss/train': 1.899567723274231} -08/30/2021 13:49:17 - INFO - __main__ - Step 3408: {'lr': 0.0004998885083764582, 'samples': 654336, 'steps': 3407, 'loss/train': 2.579331874847412} -08/30/2021 13:49:18 - INFO - __main__ - Step 3409: {'lr': 0.0004998883498505996, 'samples': 654528, 'steps': 3408, 'loss/train': 2.5077710151672363} -08/30/2021 13:49:19 - INFO - __main__ - Step 3410: {'lr': 0.0004998881912121453, 'samples': 654720, 'steps': 3409, 'loss/train': 2.3359644412994385} -08/30/2021 13:49:20 - INFO - __main__ - Step 3411: {'lr': 0.0004998880324610952, 'samples': 654912, 'steps': 3410, 'loss/train': 2.951115608215332} -08/30/2021 13:49:20 - INFO - __main__ - Step 3412: {'lr': 0.0004998878735974493, 'samples': 655104, 'steps': 3411, 'loss/train': 2.7862660884857178} -08/30/2021 13:49:20 - INFO - __main__ - Step 3413: {'lr': 0.0004998877146212079, 'samples': 655296, 'steps': 3412, 'loss/train': 2.9797847270965576} -08/30/2021 13:49:21 - INFO - __main__ - Step 3414: {'lr': 0.0004998875555323708, 'samples': 655488, 'steps': 3413, 'loss/train': 2.2499947547912598} -08/30/2021 13:49:22 - INFO - __main__ - Step 3415: {'lr': 0.0004998873963309384, 'samples': 655680, 'steps': 3414, 'loss/train': 2.724332332611084} -08/30/2021 13:49:23 - INFO - __main__ - Step 3416: {'lr': 0.0004998872370169105, 'samples': 655872, 'steps': 3415, 'loss/train': 2.579256772994995} -08/30/2021 13:49:23 - INFO - __main__ - Step 3417: {'lr': 0.0004998870775902872, 'samples': 656064, 'steps': 3416, 'loss/train': 2.531017303466797} -08/30/2021 13:49:23 - INFO - __main__ - Step 3418: {'lr': 0.0004998869180510688, 'samples': 656256, 'steps': 3417, 'loss/train': 2.8577194213867188} -08/30/2021 13:49:24 - INFO - __main__ - Step 3419: {'lr': 0.0004998867583992551, 'samples': 656448, 'steps': 3418, 'loss/train': 3.2128517627716064} -08/30/2021 13:49:25 - INFO - __main__ - Step 3420: {'lr': 0.0004998865986348464, 'samples': 656640, 'steps': 3419, 'loss/train': 4.497913360595703} -08/30/2021 13:49:26 - INFO - __main__ - Step 3421: {'lr': 0.0004998864387578426, 'samples': 656832, 'steps': 3420, 'loss/train': 2.314352512359619} -08/30/2021 13:49:26 - INFO - __main__ - Step 3422: {'lr': 0.0004998862787682438, 'samples': 657024, 'steps': 3421, 'loss/train': 3.1587514877319336} -08/30/2021 13:49:27 - INFO - __main__ - Step 3423: {'lr': 0.00049988611866605, 'samples': 657216, 'steps': 3422, 'loss/train': 2.787001609802246} -08/30/2021 13:49:27 - INFO - __main__ - Step 3424: {'lr': 0.0004998859584512615, 'samples': 657408, 'steps': 3423, 'loss/train': 3.9919040203094482} -08/30/2021 13:49:28 - INFO - __main__ - Step 3425: {'lr': 0.0004998857981238782, 'samples': 657600, 'steps': 3424, 'loss/train': 2.7004263401031494} -08/30/2021 13:49:29 - INFO - __main__ - Step 3426: {'lr': 0.0004998856376839003, 'samples': 657792, 'steps': 3425, 'loss/train': 3.263404369354248} -08/30/2021 13:49:29 - INFO - __main__ - Step 3427: {'lr': 0.0004998854771313277, 'samples': 657984, 'steps': 3426, 'loss/train': 2.738943338394165} -08/30/2021 13:49:30 - INFO - __main__ - Step 3428: {'lr': 0.0004998853164661606, 'samples': 658176, 'steps': 3427, 'loss/train': 2.4689908027648926} -08/30/2021 13:49:30 - INFO - __main__ - Step 3429: {'lr': 0.000499885155688399, 'samples': 658368, 'steps': 3428, 'loss/train': 2.7306323051452637} -08/30/2021 13:49:32 - INFO - __main__ - Step 3430: {'lr': 0.000499884994798043, 'samples': 658560, 'steps': 3429, 'loss/train': 2.639641523361206} -08/30/2021 13:49:32 - INFO - __main__ - Step 3431: {'lr': 0.0004998848337950927, 'samples': 658752, 'steps': 3430, 'loss/train': 2.4209651947021484} -08/30/2021 13:49:33 - INFO - __main__ - Step 3432: {'lr': 0.0004998846726795482, 'samples': 658944, 'steps': 3431, 'loss/train': 3.1134023666381836} -08/30/2021 13:49:33 - INFO - __main__ - Step 3433: {'lr': 0.0004998845114514095, 'samples': 659136, 'steps': 3432, 'loss/train': 2.6262388229370117} -08/30/2021 13:49:33 - INFO - __main__ - Step 3434: {'lr': 0.0004998843501106766, 'samples': 659328, 'steps': 3433, 'loss/train': 2.3508970737457275} -08/30/2021 13:49:34 - INFO - __main__ - Step 3435: {'lr': 0.0004998841886573496, 'samples': 659520, 'steps': 3434, 'loss/train': 2.84313702583313} -08/30/2021 13:49:35 - INFO - __main__ - Step 3436: {'lr': 0.0004998840270914288, 'samples': 659712, 'steps': 3435, 'loss/train': 2.950655460357666} -08/30/2021 13:49:36 - INFO - __main__ - Step 3437: {'lr': 0.0004998838654129142, 'samples': 659904, 'steps': 3436, 'loss/train': 3.063199043273926} -08/30/2021 13:49:36 - INFO - __main__ - Step 3438: {'lr': 0.0004998837036218056, 'samples': 660096, 'steps': 3437, 'loss/train': 0.5293973684310913} -08/30/2021 13:49:36 - INFO - __main__ - Step 3439: {'lr': 0.0004998835417181033, 'samples': 660288, 'steps': 3438, 'loss/train': 2.5547447204589844} -08/30/2021 13:49:37 - INFO - __main__ - Step 3440: {'lr': 0.0004998833797018074, 'samples': 660480, 'steps': 3439, 'loss/train': 2.619832992553711} -08/30/2021 13:49:37 - INFO - __main__ - Step 3441: {'lr': 0.0004998832175729179, 'samples': 660672, 'steps': 3440, 'loss/train': 2.998067855834961} -08/30/2021 13:49:39 - INFO - __main__ - Step 3442: {'lr': 0.0004998830553314349, 'samples': 660864, 'steps': 3441, 'loss/train': 2.967714786529541} -08/30/2021 13:49:39 - INFO - __main__ - Step 3443: {'lr': 0.0004998828929773583, 'samples': 661056, 'steps': 3442, 'loss/train': 2.2500030994415283} -08/30/2021 13:49:39 - INFO - __main__ - Step 3444: {'lr': 0.0004998827305106884, 'samples': 661248, 'steps': 3443, 'loss/train': 2.594834327697754} -08/30/2021 13:49:40 - INFO - __main__ - Step 3445: {'lr': 0.0004998825679314253, 'samples': 661440, 'steps': 3444, 'loss/train': 2.74992036819458} -08/30/2021 13:49:40 - INFO - __main__ - Step 3446: {'lr': 0.0004998824052395689, 'samples': 661632, 'steps': 3445, 'loss/train': 2.596956491470337} -08/30/2021 13:49:42 - INFO - __main__ - Step 3447: {'lr': 0.0004998822424351193, 'samples': 661824, 'steps': 3446, 'loss/train': 2.3737950325012207} -08/30/2021 13:49:42 - INFO - __main__ - Step 3448: {'lr': 0.0004998820795180766, 'samples': 662016, 'steps': 3447, 'loss/train': 2.3730239868164062} -08/30/2021 13:49:42 - INFO - __main__ - Step 3449: {'lr': 0.000499881916488441, 'samples': 662208, 'steps': 3448, 'loss/train': 3.0651445388793945} -08/30/2021 13:49:43 - INFO - __main__ - Step 3450: {'lr': 0.0004998817533462123, 'samples': 662400, 'steps': 3449, 'loss/train': 1.9123895168304443} -08/30/2021 13:49:43 - INFO - __main__ - Step 3451: {'lr': 0.0004998815900913909, 'samples': 662592, 'steps': 3450, 'loss/train': 2.172102212905884} -08/30/2021 13:49:45 - INFO - __main__ - Step 3452: {'lr': 0.0004998814267239767, 'samples': 662784, 'steps': 3451, 'loss/train': 2.280928134918213} -08/30/2021 13:49:46 - INFO - __main__ - Step 3453: {'lr': 0.0004998812632439697, 'samples': 662976, 'steps': 3452, 'loss/train': 1.0883467197418213} -08/30/2021 13:49:46 - INFO - __main__ - Step 3454: {'lr': 0.00049988109965137, 'samples': 663168, 'steps': 3453, 'loss/train': 2.310020685195923} -08/30/2021 13:49:46 - INFO - __main__ - Step 3455: {'lr': 0.000499880935946178, 'samples': 663360, 'steps': 3454, 'loss/train': 2.583714485168457} -08/30/2021 13:49:47 - INFO - __main__ - Step 3456: {'lr': 0.0004998807721283932, 'samples': 663552, 'steps': 3455, 'loss/train': 2.3489978313446045} -08/30/2021 13:49:48 - INFO - __main__ - Step 3457: {'lr': 0.0004998806081980162, 'samples': 663744, 'steps': 3456, 'loss/train': 2.2940306663513184} -08/30/2021 13:49:49 - INFO - __main__ - Step 3458: {'lr': 0.0004998804441550467, 'samples': 663936, 'steps': 3457, 'loss/train': 2.3305861949920654} -08/30/2021 13:49:49 - INFO - __main__ - Step 3459: {'lr': 0.000499880279999485, 'samples': 664128, 'steps': 3458, 'loss/train': 2.65053391456604} -08/30/2021 13:49:49 - INFO - __main__ - Step 3460: {'lr': 0.0004998801157313311, 'samples': 664320, 'steps': 3459, 'loss/train': 2.539475440979004} -08/30/2021 13:49:50 - INFO - __main__ - Step 3461: {'lr': 0.0004998799513505851, 'samples': 664512, 'steps': 3460, 'loss/train': 2.5797791481018066} -08/30/2021 13:49:51 - INFO - __main__ - Step 3462: {'lr': 0.000499879786857247, 'samples': 664704, 'steps': 3461, 'loss/train': 2.5145087242126465} -08/30/2021 13:49:52 - INFO - __main__ - Step 3463: {'lr': 0.0004998796222513169, 'samples': 664896, 'steps': 3462, 'loss/train': 2.658740282058716} -08/30/2021 13:49:52 - INFO - __main__ - Step 3464: {'lr': 0.000499879457532795, 'samples': 665088, 'steps': 3463, 'loss/train': 2.358705759048462} -08/30/2021 13:49:52 - INFO - __main__ - Step 3465: {'lr': 0.0004998792927016812, 'samples': 665280, 'steps': 3464, 'loss/train': 2.325634717941284} -08/30/2021 13:49:53 - INFO - __main__ - Step 3466: {'lr': 0.0004998791277579757, 'samples': 665472, 'steps': 3465, 'loss/train': 4.067972660064697} -08/30/2021 13:49:54 - INFO - __main__ - Step 3467: {'lr': 0.0004998789627016784, 'samples': 665664, 'steps': 3466, 'loss/train': 2.500408887863159} -08/30/2021 13:49:55 - INFO - __main__ - Step 3468: {'lr': 0.0004998787975327896, 'samples': 665856, 'steps': 3467, 'loss/train': 2.69610333442688} -08/30/2021 13:49:55 - INFO - __main__ - Step 3469: {'lr': 0.0004998786322513093, 'samples': 666048, 'steps': 3468, 'loss/train': 2.477757215499878} -08/30/2021 13:49:55 - INFO - __main__ - Step 3470: {'lr': 0.0004998784668572375, 'samples': 666240, 'steps': 3469, 'loss/train': 2.623246431350708} -08/30/2021 13:49:56 - INFO - __main__ - Step 3471: {'lr': 0.0004998783013505743, 'samples': 666432, 'steps': 3470, 'loss/train': 2.584547758102417} -08/30/2021 13:49:57 - INFO - __main__ - Step 3472: {'lr': 0.0004998781357313198, 'samples': 666624, 'steps': 3471, 'loss/train': 2.7669098377227783} -08/30/2021 13:49:58 - INFO - __main__ - Step 3473: {'lr': 0.0004998779699994741, 'samples': 666816, 'steps': 3472, 'loss/train': 2.470353364944458} -08/30/2021 13:49:58 - INFO - __main__ - Step 3474: {'lr': 0.0004998778041550372, 'samples': 667008, 'steps': 3473, 'loss/train': 2.6031546592712402} -08/30/2021 13:49:58 - INFO - __main__ - Step 3475: {'lr': 0.0004998776381980092, 'samples': 667200, 'steps': 3474, 'loss/train': 2.885899305343628} -08/30/2021 13:49:59 - INFO - __main__ - Step 3476: {'lr': 0.0004998774721283903, 'samples': 667392, 'steps': 3475, 'loss/train': 2.8214433193206787} -08/30/2021 13:49:59 - INFO - __main__ - Step 3477: {'lr': 0.0004998773059461803, 'samples': 667584, 'steps': 3476, 'loss/train': 2.6902358531951904} -08/30/2021 13:50:01 - INFO - __main__ - Step 3478: {'lr': 0.0004998771396513796, 'samples': 667776, 'steps': 3477, 'loss/train': 2.731186866760254} -08/30/2021 13:50:01 - INFO - __main__ - Step 3479: {'lr': 0.000499876973243988, 'samples': 667968, 'steps': 3478, 'loss/train': 1.5921486616134644} -08/30/2021 13:50:01 - INFO - __main__ - Step 3480: {'lr': 0.0004998768067240059, 'samples': 668160, 'steps': 3479, 'loss/train': 2.509577512741089} -08/30/2021 13:50:02 - INFO - __main__ - Step 3481: {'lr': 0.0004998766400914329, 'samples': 668352, 'steps': 3480, 'loss/train': 1.6335997581481934} -08/30/2021 13:50:02 - INFO - __main__ - Step 3482: {'lr': 0.0004998764733462694, 'samples': 668544, 'steps': 3481, 'loss/train': 2.6024105548858643} -08/30/2021 13:50:04 - INFO - __main__ - Step 3483: {'lr': 0.0004998763064885155, 'samples': 668736, 'steps': 3482, 'loss/train': 1.5272482633590698} -08/30/2021 13:50:04 - INFO - __main__ - Step 3484: {'lr': 0.0004998761395181712, 'samples': 668928, 'steps': 3483, 'loss/train': 2.190028667449951} -08/30/2021 13:50:05 - INFO - __main__ - Step 3485: {'lr': 0.0004998759724352365, 'samples': 669120, 'steps': 3484, 'loss/train': 2.1334502696990967} -08/30/2021 13:50:05 - INFO - __main__ - Step 3486: {'lr': 0.0004998758052397115, 'samples': 669312, 'steps': 3485, 'loss/train': 2.725038528442383} -08/30/2021 13:50:05 - INFO - __main__ - Step 3487: {'lr': 0.0004998756379315964, 'samples': 669504, 'steps': 3486, 'loss/train': 1.879176139831543} -08/30/2021 13:50:07 - INFO - __main__ - Step 3488: {'lr': 0.0004998754705108912, 'samples': 669696, 'steps': 3487, 'loss/train': 2.227513313293457} -08/30/2021 13:50:07 - INFO - __main__ - Step 3489: {'lr': 0.000499875302977596, 'samples': 669888, 'steps': 3488, 'loss/train': 2.055891513824463} -08/30/2021 13:50:07 - INFO - __main__ - Step 3490: {'lr': 0.0004998751353317108, 'samples': 670080, 'steps': 3489, 'loss/train': 2.2259504795074463} -08/30/2021 13:50:08 - INFO - __main__ - Step 3491: {'lr': 0.0004998749675732357, 'samples': 670272, 'steps': 3490, 'loss/train': 2.086120367050171} -08/30/2021 13:50:08 - INFO - __main__ - Step 3492: {'lr': 0.0004998747997021708, 'samples': 670464, 'steps': 3491, 'loss/train': 2.984645366668701} -08/30/2021 13:50:10 - INFO - __main__ - Step 3493: {'lr': 0.0004998746317185162, 'samples': 670656, 'steps': 3492, 'loss/train': 2.691204309463501} -08/30/2021 13:50:10 - INFO - __main__ - Step 3494: {'lr': 0.000499874463622272, 'samples': 670848, 'steps': 3493, 'loss/train': 3.7327635288238525} -08/30/2021 13:50:10 - INFO - __main__ - Step 3495: {'lr': 0.000499874295413438, 'samples': 671040, 'steps': 3494, 'loss/train': 1.8792227506637573} -08/30/2021 13:50:11 - INFO - __main__ - Step 3496: {'lr': 0.0004998741270920147, 'samples': 671232, 'steps': 3495, 'loss/train': 2.2878055572509766} -08/30/2021 13:50:11 - INFO - __main__ - Step 3497: {'lr': 0.0004998739586580019, 'samples': 671424, 'steps': 3496, 'loss/train': 2.5358221530914307} -08/30/2021 13:50:13 - INFO - __main__ - Step 3498: {'lr': 0.0004998737901113999, 'samples': 671616, 'steps': 3497, 'loss/train': 2.7810819149017334} -08/30/2021 13:50:13 - INFO - __main__ - Step 3499: {'lr': 0.0004998736214522084, 'samples': 671808, 'steps': 3498, 'loss/train': 2.445444107055664} -08/30/2021 13:50:13 - INFO - __main__ - Step 3500: {'lr': 0.0004998734526804278, 'samples': 672000, 'steps': 3499, 'loss/train': 2.588060140609741} -08/30/2021 13:50:14 - INFO - __main__ - Step 3501: {'lr': 0.0004998732837960581, 'samples': 672192, 'steps': 3500, 'loss/train': 2.519333600997925} -08/30/2021 13:50:14 - INFO - __main__ - Step 3502: {'lr': 0.0004998731147990993, 'samples': 672384, 'steps': 3501, 'loss/train': 2.5726373195648193} -08/30/2021 13:50:16 - INFO - __main__ - Step 3503: {'lr': 0.0004998729456895516, 'samples': 672576, 'steps': 3502, 'loss/train': 3.3219263553619385} -08/30/2021 13:50:17 - INFO - __main__ - Step 3504: {'lr': 0.0004998727764674149, 'samples': 672768, 'steps': 3503, 'loss/train': 2.2654037475585938} -08/30/2021 13:50:17 - INFO - __main__ - Step 3505: {'lr': 0.0004998726071326896, 'samples': 672960, 'steps': 3504, 'loss/train': 2.958322763442993} -08/30/2021 13:50:17 - INFO - __main__ - Step 3506: {'lr': 0.0004998724376853754, 'samples': 673152, 'steps': 3505, 'loss/train': 1.9985573291778564} -08/30/2021 13:50:18 - INFO - __main__ - Step 3507: {'lr': 0.0004998722681254725, 'samples': 673344, 'steps': 3506, 'loss/train': 2.4221041202545166} -08/30/2021 13:50:18 - INFO - __main__ - Step 3508: {'lr': 0.0004998720984529811, 'samples': 673536, 'steps': 3507, 'loss/train': 2.9456748962402344} -08/30/2021 13:50:20 - INFO - __main__ - Step 3509: {'lr': 0.0004998719286679011, 'samples': 673728, 'steps': 3508, 'loss/train': 2.9266512393951416} -08/30/2021 13:50:20 - INFO - __main__ - Step 3510: {'lr': 0.0004998717587702328, 'samples': 673920, 'steps': 3509, 'loss/train': 2.8354921340942383} -08/30/2021 13:50:20 - INFO - __main__ - Step 3511: {'lr': 0.0004998715887599759, 'samples': 674112, 'steps': 3510, 'loss/train': 2.195363998413086} -08/30/2021 13:50:21 - INFO - __main__ - Step 3512: {'lr': 0.000499871418637131, 'samples': 674304, 'steps': 3511, 'loss/train': 2.662369966506958} -08/30/2021 13:50:21 - INFO - __main__ - Step 3513: {'lr': 0.0004998712484016977, 'samples': 674496, 'steps': 3512, 'loss/train': 2.7905404567718506} -08/30/2021 13:50:23 - INFO - __main__ - Step 3514: {'lr': 0.0004998710780536763, 'samples': 674688, 'steps': 3513, 'loss/train': 2.845914363861084} -08/30/2021 13:50:23 - INFO - __main__ - Step 3515: {'lr': 0.0004998709075930669, 'samples': 674880, 'steps': 3514, 'loss/train': 2.370758056640625} -08/30/2021 13:50:23 - INFO - __main__ - Step 3516: {'lr': 0.0004998707370198695, 'samples': 675072, 'steps': 3515, 'loss/train': 2.654289484024048} -08/30/2021 13:50:24 - INFO - __main__ - Step 3517: {'lr': 0.0004998705663340843, 'samples': 675264, 'steps': 3516, 'loss/train': 0.9861878752708435} -08/30/2021 13:50:24 - INFO - __main__ - Step 3518: {'lr': 0.0004998703955357111, 'samples': 675456, 'steps': 3517, 'loss/train': 2.767317771911621} -08/30/2021 13:50:26 - INFO - __main__ - Step 3519: {'lr': 0.0004998702246247502, 'samples': 675648, 'steps': 3518, 'loss/train': 2.1342272758483887} -08/30/2021 13:50:26 - INFO - __main__ - Step 3520: {'lr': 0.0004998700536012017, 'samples': 675840, 'steps': 3519, 'loss/train': 2.54465651512146} -08/30/2021 13:50:26 - INFO - __main__ - Step 3521: {'lr': 0.0004998698824650655, 'samples': 676032, 'steps': 3520, 'loss/train': 2.619464635848999} -08/30/2021 13:50:27 - INFO - __main__ - Step 3522: {'lr': 0.000499869711216342, 'samples': 676224, 'steps': 3521, 'loss/train': 2.869643449783325} -08/30/2021 13:50:27 - INFO - __main__ - Step 3523: {'lr': 0.0004998695398550309, 'samples': 676416, 'steps': 3522, 'loss/train': 2.5181527137756348} -08/30/2021 13:50:29 - INFO - __main__ - Step 3524: {'lr': 0.0004998693683811325, 'samples': 676608, 'steps': 3523, 'loss/train': 1.9194591045379639} -08/30/2021 13:50:29 - INFO - __main__ - Step 3525: {'lr': 0.0004998691967946468, 'samples': 676800, 'steps': 3524, 'loss/train': 0.4229249954223633} -08/30/2021 13:50:30 - INFO - __main__ - Step 3526: {'lr': 0.000499869025095574, 'samples': 676992, 'steps': 3525, 'loss/train': 2.827298879623413} -08/30/2021 13:50:30 - INFO - __main__ - Step 3527: {'lr': 0.0004998688532839139, 'samples': 677184, 'steps': 3526, 'loss/train': 2.630917549133301} -08/30/2021 13:50:30 - INFO - __main__ - Step 3528: {'lr': 0.0004998686813596668, 'samples': 677376, 'steps': 3527, 'loss/train': 2.33671498298645} -08/30/2021 13:50:31 - INFO - __main__ - Step 3529: {'lr': 0.0004998685093228327, 'samples': 677568, 'steps': 3528, 'loss/train': 3.2041265964508057} -08/30/2021 13:50:32 - INFO - __main__ - Step 3530: {'lr': 0.0004998683371734118, 'samples': 677760, 'steps': 3529, 'loss/train': 3.201237440109253} -08/30/2021 13:50:33 - INFO - __main__ - Step 3531: {'lr': 0.000499868164911404, 'samples': 677952, 'steps': 3530, 'loss/train': 2.359074354171753} -08/30/2021 13:50:33 - INFO - __main__ - Step 3532: {'lr': 0.0004998679925368094, 'samples': 678144, 'steps': 3531, 'loss/train': 2.1300902366638184} -08/30/2021 13:50:33 - INFO - __main__ - Step 3533: {'lr': 0.0004998678200496283, 'samples': 678336, 'steps': 3532, 'loss/train': 3.163862705230713} -08/30/2021 13:50:34 - INFO - __main__ - Step 3534: {'lr': 0.0004998676474498606, 'samples': 678528, 'steps': 3533, 'loss/train': 2.352466583251953} -08/30/2021 13:50:35 - INFO - __main__ - Step 3535: {'lr': 0.0004998674747375063, 'samples': 678720, 'steps': 3534, 'loss/train': 2.574796199798584} -08/30/2021 13:50:36 - INFO - __main__ - Step 3536: {'lr': 0.0004998673019125657, 'samples': 678912, 'steps': 3535, 'loss/train': 2.926755666732788} -08/30/2021 13:50:36 - INFO - __main__ - Step 3537: {'lr': 0.0004998671289750386, 'samples': 679104, 'steps': 3536, 'loss/train': 2.254777669906616} -08/30/2021 13:50:36 - INFO - __main__ - Step 3538: {'lr': 0.0004998669559249252, 'samples': 679296, 'steps': 3537, 'loss/train': 2.3179006576538086} -08/30/2021 13:50:37 - INFO - __main__ - Step 3539: {'lr': 0.0004998667827622258, 'samples': 679488, 'steps': 3538, 'loss/train': 3.5752573013305664} -08/30/2021 13:50:38 - INFO - __main__ - Step 3540: {'lr': 0.0004998666094869402, 'samples': 679680, 'steps': 3539, 'loss/train': 2.8265016078948975} -08/30/2021 13:50:39 - INFO - __main__ - Step 3541: {'lr': 0.0004998664360990685, 'samples': 679872, 'steps': 3540, 'loss/train': 2.433196783065796} -08/30/2021 13:50:39 - INFO - __main__ - Step 3542: {'lr': 0.0004998662625986109, 'samples': 680064, 'steps': 3541, 'loss/train': 2.2378532886505127} -08/30/2021 13:50:39 - INFO - __main__ - Step 3543: {'lr': 0.0004998660889855674, 'samples': 680256, 'steps': 3542, 'loss/train': 2.2512288093566895} -08/30/2021 13:50:40 - INFO - __main__ - Step 3544: {'lr': 0.0004998659152599381, 'samples': 680448, 'steps': 3543, 'loss/train': 1.9482016563415527} -08/30/2021 13:50:41 - INFO - __main__ - Step 3545: {'lr': 0.000499865741421723, 'samples': 680640, 'steps': 3544, 'loss/train': 2.8362069129943848} -08/30/2021 13:50:42 - INFO - __main__ - Step 3546: {'lr': 0.0004998655674709224, 'samples': 680832, 'steps': 3545, 'loss/train': 2.060626983642578} -08/30/2021 13:50:42 - INFO - __main__ - Step 3547: {'lr': 0.0004998653934075361, 'samples': 681024, 'steps': 3546, 'loss/train': 2.338832378387451} -08/30/2021 13:50:42 - INFO - __main__ - Step 3548: {'lr': 0.0004998652192315644, 'samples': 681216, 'steps': 3547, 'loss/train': 2.950679063796997} -08/30/2021 13:50:43 - INFO - __main__ - Step 3549: {'lr': 0.0004998650449430073, 'samples': 681408, 'steps': 3548, 'loss/train': 2.219944715499878} -08/30/2021 13:50:44 - INFO - __main__ - Step 3550: {'lr': 0.0004998648705418648, 'samples': 681600, 'steps': 3549, 'loss/train': 3.002030372619629} -08/30/2021 13:50:45 - INFO - __main__ - Step 3551: {'lr': 0.000499864696028137, 'samples': 681792, 'steps': 3550, 'loss/train': 4.705066680908203} -08/30/2021 13:50:45 - INFO - __main__ - Step 3552: {'lr': 0.000499864521401824, 'samples': 681984, 'steps': 3551, 'loss/train': 2.4122514724731445} -08/30/2021 13:50:45 - INFO - __main__ - Step 3553: {'lr': 0.000499864346662926, 'samples': 682176, 'steps': 3552, 'loss/train': 2.5135066509246826} -08/30/2021 13:50:46 - INFO - __main__ - Step 3554: {'lr': 0.000499864171811443, 'samples': 682368, 'steps': 3553, 'loss/train': 2.106393337249756} -08/30/2021 13:50:46 - INFO - __main__ - Step 3555: {'lr': 0.0004998639968473751, 'samples': 682560, 'steps': 3554, 'loss/train': 2.6872506141662598} -08/30/2021 13:50:48 - INFO - __main__ - Step 3556: {'lr': 0.0004998638217707222, 'samples': 682752, 'steps': 3555, 'loss/train': 3.0624098777770996} -08/30/2021 13:50:49 - INFO - __main__ - Step 3557: {'lr': 0.0004998636465814846, 'samples': 682944, 'steps': 3556, 'loss/train': 2.931065320968628} -08/30/2021 13:50:49 - INFO - __main__ - Step 3558: {'lr': 0.0004998634712796622, 'samples': 683136, 'steps': 3557, 'loss/train': 1.2333321571350098} -08/30/2021 13:50:50 - INFO - __main__ - Step 3559: {'lr': 0.0004998632958652554, 'samples': 683328, 'steps': 3558, 'loss/train': 2.1315107345581055} -08/30/2021 13:50:50 - INFO - __main__ - Step 3560: {'lr': 0.0004998631203382639, 'samples': 683520, 'steps': 3559, 'loss/train': 2.8830904960632324} -08/30/2021 13:50:50 - INFO - __main__ - Step 3561: {'lr': 0.0004998629446986879, 'samples': 683712, 'steps': 3560, 'loss/train': 2.5116159915924072} -08/30/2021 13:50:52 - INFO - __main__ - Step 3562: {'lr': 0.0004998627689465276, 'samples': 683904, 'steps': 3561, 'loss/train': 2.426597833633423} -08/30/2021 13:50:52 - INFO - __main__ - Step 3563: {'lr': 0.0004998625930817829, 'samples': 684096, 'steps': 3562, 'loss/train': 1.8819105625152588} -08/30/2021 13:50:53 - INFO - __main__ - Step 3564: {'lr': 0.0004998624171044541, 'samples': 684288, 'steps': 3563, 'loss/train': 2.7323007583618164} -08/30/2021 13:50:53 - INFO - __main__ - Step 3565: {'lr': 0.000499862241014541, 'samples': 684480, 'steps': 3564, 'loss/train': 2.2394044399261475} -08/30/2021 13:50:53 - INFO - __main__ - Step 3566: {'lr': 0.0004998620648120439, 'samples': 684672, 'steps': 3565, 'loss/train': 2.694523572921753} -08/30/2021 13:50:55 - INFO - __main__ - Step 3567: {'lr': 0.0004998618884969628, 'samples': 684864, 'steps': 3566, 'loss/train': 2.997663974761963} -08/30/2021 13:50:55 - INFO - __main__ - Step 3568: {'lr': 0.0004998617120692977, 'samples': 685056, 'steps': 3567, 'loss/train': 2.824540853500366} -08/30/2021 13:50:56 - INFO - __main__ - Step 3569: {'lr': 0.0004998615355290489, 'samples': 685248, 'steps': 3568, 'loss/train': 2.7600889205932617} -08/30/2021 13:50:56 - INFO - __main__ - Step 3570: {'lr': 0.0004998613588762163, 'samples': 685440, 'steps': 3569, 'loss/train': 1.759244680404663} -08/30/2021 13:50:56 - INFO - __main__ - Step 3571: {'lr': 0.0004998611821108001, 'samples': 685632, 'steps': 3570, 'loss/train': 2.763533115386963} -08/30/2021 13:50:58 - INFO - __main__ - Step 3572: {'lr': 0.0004998610052328002, 'samples': 685824, 'steps': 3571, 'loss/train': 1.9221290349960327} -08/30/2021 13:50:58 - INFO - __main__ - Step 3573: {'lr': 0.0004998608282422169, 'samples': 686016, 'steps': 3572, 'loss/train': 2.7596094608306885} -08/30/2021 13:50:59 - INFO - __main__ - Step 3574: {'lr': 0.0004998606511390501, 'samples': 686208, 'steps': 3573, 'loss/train': 2.6264867782592773} -08/30/2021 13:50:59 - INFO - __main__ - Step 3575: {'lr': 0.0004998604739232999, 'samples': 686400, 'steps': 3574, 'loss/train': 2.5383200645446777} -08/30/2021 13:50:59 - INFO - __main__ - Step 3576: {'lr': 0.0004998602965949664, 'samples': 686592, 'steps': 3575, 'loss/train': 1.304887056350708} -08/30/2021 13:51:01 - INFO - __main__ - Step 3577: {'lr': 0.0004998601191540499, 'samples': 686784, 'steps': 3576, 'loss/train': 2.421765089035034} -08/30/2021 13:51:01 - INFO - __main__ - Step 3578: {'lr': 0.0004998599416005502, 'samples': 686976, 'steps': 3577, 'loss/train': 0.7924010753631592} -08/30/2021 13:51:02 - INFO - __main__ - Step 3579: {'lr': 0.0004998597639344674, 'samples': 687168, 'steps': 3578, 'loss/train': 2.5419864654541016} -08/30/2021 13:51:02 - INFO - __main__ - Step 3580: {'lr': 0.0004998595861558016, 'samples': 687360, 'steps': 3579, 'loss/train': 2.757249593734741} -08/30/2021 13:51:02 - INFO - __main__ - Step 3581: {'lr': 0.000499859408264553, 'samples': 687552, 'steps': 3580, 'loss/train': 2.6921191215515137} -08/30/2021 13:51:04 - INFO - __main__ - Step 3582: {'lr': 0.0004998592302607217, 'samples': 687744, 'steps': 3581, 'loss/train': 2.715059280395508} -08/30/2021 13:51:04 - INFO - __main__ - Step 3583: {'lr': 0.0004998590521443075, 'samples': 687936, 'steps': 3582, 'loss/train': 2.8533082008361816} -08/30/2021 13:51:05 - INFO - __main__ - Step 3584: {'lr': 0.0004998588739153108, 'samples': 688128, 'steps': 3583, 'loss/train': 1.9397984743118286} -08/30/2021 13:51:05 - INFO - __main__ - Step 3585: {'lr': 0.0004998586955737316, 'samples': 688320, 'steps': 3584, 'loss/train': 2.611144781112671} -08/30/2021 13:51:05 - INFO - __main__ - Step 3586: {'lr': 0.0004998585171195698, 'samples': 688512, 'steps': 3585, 'loss/train': 2.3520359992980957} -08/30/2021 13:51:06 - INFO - __main__ - Step 3587: {'lr': 0.0004998583385528256, 'samples': 688704, 'steps': 3586, 'loss/train': 2.5994157791137695} -08/30/2021 13:51:07 - INFO - __main__ - Step 3588: {'lr': 0.0004998581598734991, 'samples': 688896, 'steps': 3587, 'loss/train': 2.06207275390625} -08/30/2021 13:51:08 - INFO - __main__ - Step 3589: {'lr': 0.0004998579810815905, 'samples': 689088, 'steps': 3588, 'loss/train': 2.2917850017547607} -08/30/2021 13:51:08 - INFO - __main__ - Step 3590: {'lr': 0.0004998578021770995, 'samples': 689280, 'steps': 3589, 'loss/train': 2.545503616333008} -08/30/2021 13:51:08 - INFO - __main__ - Step 3591: {'lr': 0.0004998576231600267, 'samples': 689472, 'steps': 3590, 'loss/train': 2.7478041648864746} -08/30/2021 13:51:09 - INFO - __main__ - Step 3592: {'lr': 0.0004998574440303718, 'samples': 689664, 'steps': 3591, 'loss/train': 2.556713581085205} -08/30/2021 13:51:10 - INFO - __main__ - Step 3593: {'lr': 0.0004998572647881349, 'samples': 689856, 'steps': 3592, 'loss/train': 1.7167731523513794} -08/30/2021 13:51:11 - INFO - __main__ - Step 3594: {'lr': 0.0004998570854333163, 'samples': 690048, 'steps': 3593, 'loss/train': 2.6185929775238037} -08/30/2021 13:51:11 - INFO - __main__ - Step 3595: {'lr': 0.0004998569059659158, 'samples': 690240, 'steps': 3594, 'loss/train': 2.525623083114624} -08/30/2021 13:51:11 - INFO - __main__ - Step 3596: {'lr': 0.0004998567263859338, 'samples': 690432, 'steps': 3595, 'loss/train': 2.6915581226348877} -08/30/2021 13:51:12 - INFO - __main__ - Step 3597: {'lr': 0.0004998565466933702, 'samples': 690624, 'steps': 3596, 'loss/train': 2.9205996990203857} -08/30/2021 13:51:13 - INFO - __main__ - Step 3598: {'lr': 0.000499856366888225, 'samples': 690816, 'steps': 3597, 'loss/train': 2.7925093173980713} -08/30/2021 13:51:14 - INFO - __main__ - Step 3599: {'lr': 0.0004998561869704983, 'samples': 691008, 'steps': 3598, 'loss/train': 2.9762027263641357} -08/30/2021 13:51:14 - INFO - __main__ - Step 3600: {'lr': 0.0004998560069401905, 'samples': 691200, 'steps': 3599, 'loss/train': 2.4280307292938232} -08/30/2021 13:51:14 - INFO - __main__ - Step 3601: {'lr': 0.0004998558267973013, 'samples': 691392, 'steps': 3600, 'loss/train': 2.488234043121338} -08/30/2021 13:51:15 - INFO - __main__ - Step 3602: {'lr': 0.0004998556465418309, 'samples': 691584, 'steps': 3601, 'loss/train': 2.2893667221069336} -08/30/2021 13:51:16 - INFO - __main__ - Step 3603: {'lr': 0.0004998554661737795, 'samples': 691776, 'steps': 3602, 'loss/train': 1.9183200597763062} -08/30/2021 13:51:17 - INFO - __main__ - Step 3604: {'lr': 0.000499855285693147, 'samples': 691968, 'steps': 3603, 'loss/train': 1.7201327085494995} -08/30/2021 13:51:17 - INFO - __main__ - Step 3605: {'lr': 0.0004998551050999336, 'samples': 692160, 'steps': 3604, 'loss/train': 2.437591314315796} -08/30/2021 13:51:17 - INFO - __main__ - Step 3606: {'lr': 0.0004998549243941393, 'samples': 692352, 'steps': 3605, 'loss/train': 2.7183268070220947} -08/30/2021 13:51:18 - INFO - __main__ - Step 3607: {'lr': 0.0004998547435757643, 'samples': 692544, 'steps': 3606, 'loss/train': 2.594651460647583} -08/30/2021 13:51:19 - INFO - __main__ - Step 3608: {'lr': 0.0004998545626448087, 'samples': 692736, 'steps': 3607, 'loss/train': 2.3702476024627686} -08/30/2021 13:51:20 - INFO - __main__ - Step 3609: {'lr': 0.0004998543816012723, 'samples': 692928, 'steps': 3608, 'loss/train': 2.772251844406128} -08/30/2021 13:51:20 - INFO - __main__ - Step 3610: {'lr': 0.0004998542004451554, 'samples': 693120, 'steps': 3609, 'loss/train': 2.511382818222046} -08/30/2021 13:51:20 - INFO - __main__ - Step 3611: {'lr': 0.000499854019176458, 'samples': 693312, 'steps': 3610, 'loss/train': 2.1627109050750732} -08/30/2021 13:51:21 - INFO - __main__ - Step 3612: {'lr': 0.0004998538377951803, 'samples': 693504, 'steps': 3611, 'loss/train': 2.2356529235839844} -08/30/2021 13:51:23 - INFO - __main__ - Step 3613: {'lr': 0.0004998536563013224, 'samples': 693696, 'steps': 3612, 'loss/train': 2.6171715259552} -08/30/2021 13:51:23 - INFO - __main__ - Step 3614: {'lr': 0.0004998534746948843, 'samples': 693888, 'steps': 3613, 'loss/train': 2.421427011489868} -08/30/2021 13:51:24 - INFO - __main__ - Step 3615: {'lr': 0.000499853292975866, 'samples': 694080, 'steps': 3614, 'loss/train': 2.3610634803771973} -08/30/2021 13:51:24 - INFO - __main__ - Step 3616: {'lr': 0.0004998531111442676, 'samples': 694272, 'steps': 3615, 'loss/train': 2.3349177837371826} -08/30/2021 13:51:24 - INFO - __main__ - Step 3617: {'lr': 0.0004998529292000893, 'samples': 694464, 'steps': 3616, 'loss/train': 3.0114173889160156} -08/30/2021 13:51:25 - INFO - __main__ - Step 3618: {'lr': 0.0004998527471433312, 'samples': 694656, 'steps': 3617, 'loss/train': 1.8882458209991455} -08/30/2021 13:51:26 - INFO - __main__ - Step 3619: {'lr': 0.0004998525649739932, 'samples': 694848, 'steps': 3618, 'loss/train': 2.433881998062134} -08/30/2021 13:51:27 - INFO - __main__ - Step 3620: {'lr': 0.0004998523826920756, 'samples': 695040, 'steps': 3619, 'loss/train': 1.7084941864013672} -08/30/2021 13:51:27 - INFO - __main__ - Step 3621: {'lr': 0.0004998522002975783, 'samples': 695232, 'steps': 3620, 'loss/train': 2.808939218521118} -08/30/2021 13:51:28 - INFO - __main__ - Step 3622: {'lr': 0.0004998520177905015, 'samples': 695424, 'steps': 3621, 'loss/train': 0.35889846086502075} -08/30/2021 13:51:28 - INFO - __main__ - Step 3623: {'lr': 0.0004998518351708452, 'samples': 695616, 'steps': 3622, 'loss/train': 2.5196497440338135} -08/30/2021 13:51:29 - INFO - __main__ - Step 3624: {'lr': 0.0004998516524386095, 'samples': 695808, 'steps': 3623, 'loss/train': 2.8409476280212402} -08/30/2021 13:51:30 - INFO - __main__ - Step 3625: {'lr': 0.0004998514695937945, 'samples': 696000, 'steps': 3624, 'loss/train': 2.145430088043213} -08/30/2021 13:51:30 - INFO - __main__ - Step 3626: {'lr': 0.0004998512866364003, 'samples': 696192, 'steps': 3625, 'loss/train': 2.6442580223083496} -08/30/2021 13:51:31 - INFO - __main__ - Step 3627: {'lr': 0.000499851103566427, 'samples': 696384, 'steps': 3626, 'loss/train': 2.2818148136138916} -08/30/2021 13:51:31 - INFO - __main__ - Step 3628: {'lr': 0.0004998509203838746, 'samples': 696576, 'steps': 3627, 'loss/train': 2.495744466781616} -08/30/2021 13:51:32 - INFO - __main__ - Step 3629: {'lr': 0.0004998507370887433, 'samples': 696768, 'steps': 3628, 'loss/train': 1.8277839422225952} -08/30/2021 13:51:33 - INFO - __main__ - Step 3630: {'lr': 0.000499850553681033, 'samples': 696960, 'steps': 3629, 'loss/train': 2.233485221862793} -08/30/2021 13:51:33 - INFO - __main__ - Step 3631: {'lr': 0.000499850370160744, 'samples': 697152, 'steps': 3630, 'loss/train': 2.5942776203155518} -08/30/2021 13:51:34 - INFO - __main__ - Step 3632: {'lr': 0.0004998501865278762, 'samples': 697344, 'steps': 3631, 'loss/train': 3.531891107559204} -08/30/2021 13:51:34 - INFO - __main__ - Step 3633: {'lr': 0.0004998500027824298, 'samples': 697536, 'steps': 3632, 'loss/train': 1.5935769081115723} -08/30/2021 13:51:35 - INFO - __main__ - Step 3634: {'lr': 0.0004998498189244049, 'samples': 697728, 'steps': 3633, 'loss/train': 2.510176658630371} -08/30/2021 13:51:36 - INFO - __main__ - Step 3635: {'lr': 0.0004998496349538015, 'samples': 697920, 'steps': 3634, 'loss/train': 3.216143846511841} -08/30/2021 13:51:36 - INFO - __main__ - Step 3636: {'lr': 0.0004998494508706196, 'samples': 698112, 'steps': 3635, 'loss/train': 3.237640619277954} -08/30/2021 13:51:37 - INFO - __main__ - Step 3637: {'lr': 0.0004998492666748594, 'samples': 698304, 'steps': 3636, 'loss/train': 2.424060583114624} -08/30/2021 13:51:37 - INFO - __main__ - Step 3638: {'lr': 0.0004998490823665211, 'samples': 698496, 'steps': 3637, 'loss/train': 2.499631404876709} -08/30/2021 13:51:38 - INFO - __main__ - Step 3639: {'lr': 0.0004998488979456046, 'samples': 698688, 'steps': 3638, 'loss/train': 2.908761978149414} -08/30/2021 13:51:39 - INFO - __main__ - Step 3640: {'lr': 0.00049984871341211, 'samples': 698880, 'steps': 3639, 'loss/train': 2.353151798248291} -08/30/2021 13:51:39 - INFO - __main__ - Step 3641: {'lr': 0.0004998485287660375, 'samples': 699072, 'steps': 3640, 'loss/train': 2.165651559829712} -08/30/2021 13:51:40 - INFO - __main__ - Step 3642: {'lr': 0.0004998483440073871, 'samples': 699264, 'steps': 3641, 'loss/train': 2.507444381713867} -08/30/2021 13:51:40 - INFO - __main__ - Step 3643: {'lr': 0.0004998481591361589, 'samples': 699456, 'steps': 3642, 'loss/train': 2.355511426925659} -08/30/2021 13:51:40 - INFO - __main__ - Step 3644: {'lr': 0.000499847974152353, 'samples': 699648, 'steps': 3643, 'loss/train': 2.609344482421875} -08/30/2021 13:51:42 - INFO - __main__ - Step 3645: {'lr': 0.0004998477890559693, 'samples': 699840, 'steps': 3644, 'loss/train': 3.222691535949707} -08/30/2021 13:51:42 - INFO - __main__ - Step 3646: {'lr': 0.0004998476038470082, 'samples': 700032, 'steps': 3645, 'loss/train': 2.2444677352905273} -08/30/2021 13:51:43 - INFO - __main__ - Step 3647: {'lr': 0.0004998474185254696, 'samples': 700224, 'steps': 3646, 'loss/train': 2.7029998302459717} -08/30/2021 13:51:43 - INFO - __main__ - Step 3648: {'lr': 0.0004998472330913535, 'samples': 700416, 'steps': 3647, 'loss/train': 2.3544774055480957} -08/30/2021 13:51:43 - INFO - __main__ - Step 3649: {'lr': 0.0004998470475446603, 'samples': 700608, 'steps': 3648, 'loss/train': 2.172724723815918} -08/30/2021 13:51:45 - INFO - __main__ - Step 3650: {'lr': 0.0004998468618853896, 'samples': 700800, 'steps': 3649, 'loss/train': 4.969457149505615} -08/30/2021 13:51:46 - INFO - __main__ - Step 3651: {'lr': 0.000499846676113542, 'samples': 700992, 'steps': 3650, 'loss/train': 2.372426986694336} -08/30/2021 13:51:46 - INFO - __main__ - Step 3652: {'lr': 0.0004998464902291173, 'samples': 701184, 'steps': 3651, 'loss/train': 2.1848011016845703} -08/30/2021 13:51:46 - INFO - __main__ - Step 3653: {'lr': 0.0004998463042321155, 'samples': 701376, 'steps': 3652, 'loss/train': 2.1326675415039062} -08/30/2021 13:51:47 - INFO - __main__ - Step 3654: {'lr': 0.0004998461181225369, 'samples': 701568, 'steps': 3653, 'loss/train': 2.654838800430298} -08/30/2021 13:51:47 - INFO - __main__ - Step 3655: {'lr': 0.0004998459319003815, 'samples': 701760, 'steps': 3654, 'loss/train': 2.791910409927368} -08/30/2021 13:51:48 - INFO - __main__ - Step 3656: {'lr': 0.0004998457455656493, 'samples': 701952, 'steps': 3655, 'loss/train': 2.6973209381103516} -08/30/2021 13:51:49 - INFO - __main__ - Step 3657: {'lr': 0.0004998455591183406, 'samples': 702144, 'steps': 3656, 'loss/train': 2.4102044105529785} -08/30/2021 13:51:49 - INFO - __main__ - Step 3658: {'lr': 0.0004998453725584552, 'samples': 702336, 'steps': 3657, 'loss/train': 2.5161054134368896} -08/30/2021 13:51:50 - INFO - __main__ - Step 3659: {'lr': 0.0004998451858859934, 'samples': 702528, 'steps': 3658, 'loss/train': 0.9827682375907898} -08/30/2021 13:51:50 - INFO - __main__ - Step 3660: {'lr': 0.0004998449991009552, 'samples': 702720, 'steps': 3659, 'loss/train': 3.261535882949829} -08/30/2021 13:51:52 - INFO - __main__ - Step 3661: {'lr': 0.0004998448122033408, 'samples': 702912, 'steps': 3660, 'loss/train': 2.6678919792175293} -08/30/2021 13:51:52 - INFO - __main__ - Step 3662: {'lr': 0.00049984462519315, 'samples': 703104, 'steps': 3661, 'loss/train': 2.772693157196045} -08/30/2021 13:51:52 - INFO - __main__ - Step 3663: {'lr': 0.0004998444380703832, 'samples': 703296, 'steps': 3662, 'loss/train': 2.325258255004883} -08/30/2021 13:51:53 - INFO - __main__ - Step 3664: {'lr': 0.0004998442508350404, 'samples': 703488, 'steps': 3663, 'loss/train': 3.08449387550354} -08/30/2021 13:51:53 - INFO - __main__ - Step 3665: {'lr': 0.0004998440634871215, 'samples': 703680, 'steps': 3664, 'loss/train': 2.883807897567749} -08/30/2021 13:51:53 - INFO - __main__ - Step 3666: {'lr': 0.0004998438760266267, 'samples': 703872, 'steps': 3665, 'loss/train': 2.993598461151123} -08/30/2021 13:51:55 - INFO - __main__ - Step 3667: {'lr': 0.0004998436884535562, 'samples': 704064, 'steps': 3666, 'loss/train': 3.1137425899505615} -08/30/2021 13:51:56 - INFO - __main__ - Step 3668: {'lr': 0.00049984350076791, 'samples': 704256, 'steps': 3667, 'loss/train': 2.7652134895324707} -08/30/2021 13:51:56 - INFO - __main__ - Step 3669: {'lr': 0.0004998433129696882, 'samples': 704448, 'steps': 3668, 'loss/train': 4.125020503997803} -08/30/2021 13:51:57 - INFO - __main__ - Step 3670: {'lr': 0.0004998431250588907, 'samples': 704640, 'steps': 3669, 'loss/train': 2.8697245121002197} -08/30/2021 13:51:57 - INFO - __main__ - Step 3671: {'lr': 0.0004998429370355179, 'samples': 704832, 'steps': 3670, 'loss/train': 2.544102430343628} -08/30/2021 13:51:59 - INFO - __main__ - Step 3672: {'lr': 0.0004998427488995697, 'samples': 705024, 'steps': 3671, 'loss/train': 2.3762354850769043} -08/30/2021 13:51:59 - INFO - __main__ - Step 3673: {'lr': 0.0004998425606510461, 'samples': 705216, 'steps': 3672, 'loss/train': 2.556892156600952} -08/30/2021 13:51:59 - INFO - __main__ - Step 3674: {'lr': 0.0004998423722899475, 'samples': 705408, 'steps': 3673, 'loss/train': 2.7123448848724365} -08/30/2021 13:52:00 - INFO - __main__ - Step 3675: {'lr': 0.0004998421838162735, 'samples': 705600, 'steps': 3674, 'loss/train': 2.2789807319641113} -08/30/2021 13:52:00 - INFO - __main__ - Step 3676: {'lr': 0.0004998419952300247, 'samples': 705792, 'steps': 3675, 'loss/train': 2.485870838165283} -08/30/2021 13:52:02 - INFO - __main__ - Step 3677: {'lr': 0.0004998418065312009, 'samples': 705984, 'steps': 3676, 'loss/train': 2.365833282470703} -08/30/2021 13:52:02 - INFO - __main__ - Step 3678: {'lr': 0.0004998416177198022, 'samples': 706176, 'steps': 3677, 'loss/train': 2.5473415851593018} -08/30/2021 13:52:02 - INFO - __main__ - Step 3679: {'lr': 0.0004998414287958288, 'samples': 706368, 'steps': 3678, 'loss/train': 3.116532564163208} -08/30/2021 13:52:03 - INFO - __main__ - Step 3680: {'lr': 0.0004998412397592807, 'samples': 706560, 'steps': 3679, 'loss/train': 2.694526433944702} -08/30/2021 13:52:03 - INFO - __main__ - Step 3681: {'lr': 0.0004998410506101579, 'samples': 706752, 'steps': 3680, 'loss/train': 1.8455294370651245} -08/30/2021 13:52:05 - INFO - __main__ - Step 3682: {'lr': 0.0004998408613484605, 'samples': 706944, 'steps': 3681, 'loss/train': 2.552056312561035} -08/30/2021 13:52:05 - INFO - __main__ - Step 3683: {'lr': 0.0004998406719741888, 'samples': 707136, 'steps': 3682, 'loss/train': 2.147366523742676} -08/30/2021 13:52:06 - INFO - __main__ - Step 3684: {'lr': 0.0004998404824873428, 'samples': 707328, 'steps': 3683, 'loss/train': 2.796283721923828} -08/30/2021 13:52:06 - INFO - __main__ - Step 3685: {'lr': 0.0004998402928879225, 'samples': 707520, 'steps': 3684, 'loss/train': 4.553436756134033} -08/30/2021 13:52:07 - INFO - __main__ - Step 3686: {'lr': 0.000499840103175928, 'samples': 707712, 'steps': 3685, 'loss/train': 4.194932460784912} -08/30/2021 13:52:07 - INFO - __main__ - Step 3687: {'lr': 0.0004998399133513594, 'samples': 707904, 'steps': 3686, 'loss/train': 2.6775131225585938} -08/30/2021 13:52:08 - INFO - __main__ - Step 3688: {'lr': 0.0004998397234142167, 'samples': 708096, 'steps': 3687, 'loss/train': 2.5451133251190186} -08/30/2021 13:52:09 - INFO - __main__ - Step 3689: {'lr': 0.0004998395333645002, 'samples': 708288, 'steps': 3688, 'loss/train': 2.450786828994751} -08/30/2021 13:52:09 - INFO - __main__ - Step 3690: {'lr': 0.0004998393432022098, 'samples': 708480, 'steps': 3689, 'loss/train': 2.843982219696045} -08/30/2021 13:52:09 - INFO - __main__ - Step 3691: {'lr': 0.0004998391529273457, 'samples': 708672, 'steps': 3690, 'loss/train': 3.115355968475342} -08/30/2021 13:52:10 - INFO - __main__ - Step 3692: {'lr': 0.0004998389625399079, 'samples': 708864, 'steps': 3691, 'loss/train': 2.4430673122406006} -08/30/2021 13:52:11 - INFO - __main__ - Step 3693: {'lr': 0.0004998387720398965, 'samples': 709056, 'steps': 3692, 'loss/train': 2.5386247634887695} -08/30/2021 13:52:12 - INFO - __main__ - Step 3694: {'lr': 0.0004998385814273116, 'samples': 709248, 'steps': 3693, 'loss/train': 2.9216532707214355} -08/30/2021 13:52:12 - INFO - __main__ - Step 3695: {'lr': 0.0004998383907021533, 'samples': 709440, 'steps': 3694, 'loss/train': 2.920185089111328} -08/30/2021 13:52:12 - INFO - __main__ - Step 3696: {'lr': 0.0004998381998644217, 'samples': 709632, 'steps': 3695, 'loss/train': 2.953571081161499} -08/30/2021 13:52:13 - INFO - __main__ - Step 3697: {'lr': 0.0004998380089141169, 'samples': 709824, 'steps': 3696, 'loss/train': 2.786409616470337} -08/30/2021 13:52:13 - INFO - __main__ - Step 3698: {'lr': 0.0004998378178512388, 'samples': 710016, 'steps': 3697, 'loss/train': 2.8580715656280518} -08/30/2021 13:52:15 - INFO - __main__ - Step 3699: {'lr': 0.0004998376266757878, 'samples': 710208, 'steps': 3698, 'loss/train': 2.263169527053833} -08/30/2021 13:52:15 - INFO - __main__ - Step 3700: {'lr': 0.0004998374353877638, 'samples': 710400, 'steps': 3699, 'loss/train': 2.262291193008423} -08/30/2021 13:52:16 - INFO - __main__ - Step 3701: {'lr': 0.0004998372439871668, 'samples': 710592, 'steps': 3700, 'loss/train': 2.199047088623047} -08/30/2021 13:52:16 - INFO - __main__ - Step 3702: {'lr': 0.000499837052473997, 'samples': 710784, 'steps': 3701, 'loss/train': 2.673276901245117} -08/30/2021 13:52:16 - INFO - __main__ - Step 3703: {'lr': 0.0004998368608482546, 'samples': 710976, 'steps': 3702, 'loss/train': 1.017385721206665} -08/30/2021 13:52:18 - INFO - __main__ - Step 3704: {'lr': 0.0004998366691099395, 'samples': 711168, 'steps': 3703, 'loss/train': 2.869640827178955} -08/30/2021 13:52:18 - INFO - __main__ - Step 3705: {'lr': 0.0004998364772590518, 'samples': 711360, 'steps': 3704, 'loss/train': 2.46382999420166} -08/30/2021 13:52:19 - INFO - __main__ - Step 3706: {'lr': 0.0004998362852955918, 'samples': 711552, 'steps': 3705, 'loss/train': 2.588064670562744} -08/30/2021 13:52:19 - INFO - __main__ - Step 3707: {'lr': 0.0004998360932195593, 'samples': 711744, 'steps': 3706, 'loss/train': 2.1821370124816895} -08/30/2021 13:52:19 - INFO - __main__ - Step 3708: {'lr': 0.0004998359010309544, 'samples': 711936, 'steps': 3707, 'loss/train': 2.8211324214935303} -08/30/2021 13:52:21 - INFO - __main__ - Step 3709: {'lr': 0.0004998357087297775, 'samples': 712128, 'steps': 3708, 'loss/train': 2.548093795776367} -08/30/2021 13:52:21 - INFO - __main__ - Step 3710: {'lr': 0.0004998355163160285, 'samples': 712320, 'steps': 3709, 'loss/train': 2.2347397804260254} -08/30/2021 13:52:22 - INFO - __main__ - Step 3711: {'lr': 0.0004998353237897073, 'samples': 712512, 'steps': 3710, 'loss/train': 2.639876365661621} -08/30/2021 13:52:22 - INFO - __main__ - Step 3712: {'lr': 0.0004998351311508143, 'samples': 712704, 'steps': 3711, 'loss/train': 2.1529603004455566} -08/30/2021 13:52:22 - INFO - __main__ - Step 3713: {'lr': 0.0004998349383993493, 'samples': 712896, 'steps': 3712, 'loss/train': 2.668527603149414} -08/30/2021 13:52:23 - INFO - __main__ - Step 3714: {'lr': 0.0004998347455353126, 'samples': 713088, 'steps': 3713, 'loss/train': 0.8968461751937866} -08/30/2021 13:52:24 - INFO - __main__ - Step 3715: {'lr': 0.0004998345525587042, 'samples': 713280, 'steps': 3714, 'loss/train': 2.333482027053833} -08/30/2021 13:52:25 - INFO - __main__ - Step 3716: {'lr': 0.0004998343594695242, 'samples': 713472, 'steps': 3715, 'loss/train': 2.33561635017395} -08/30/2021 13:52:25 - INFO - __main__ - Step 3717: {'lr': 0.0004998341662677728, 'samples': 713664, 'steps': 3716, 'loss/train': 2.167950391769409} -08/30/2021 13:52:25 - INFO - __main__ - Step 3718: {'lr': 0.0004998339729534499, 'samples': 713856, 'steps': 3717, 'loss/train': 2.8927276134490967} -08/30/2021 13:52:26 - INFO - __main__ - Step 3719: {'lr': 0.0004998337795265557, 'samples': 714048, 'steps': 3718, 'loss/train': 2.127739667892456} -08/30/2021 13:52:28 - INFO - __main__ - Step 3720: {'lr': 0.0004998335859870903, 'samples': 714240, 'steps': 3719, 'loss/train': 2.9572927951812744} -08/30/2021 13:52:28 - INFO - __main__ - Step 3721: {'lr': 0.0004998333923350536, 'samples': 714432, 'steps': 3720, 'loss/train': 2.553959846496582} -08/30/2021 13:52:29 - INFO - __main__ - Step 3722: {'lr': 0.000499833198570446, 'samples': 714624, 'steps': 3721, 'loss/train': 2.5492050647735596} -08/30/2021 13:52:29 - INFO - __main__ - Step 3723: {'lr': 0.0004998330046932672, 'samples': 714816, 'steps': 3722, 'loss/train': 2.729675769805908} -08/30/2021 13:52:29 - INFO - __main__ - Step 3724: {'lr': 0.0004998328107035176, 'samples': 715008, 'steps': 3723, 'loss/train': 0.5745132565498352} -08/30/2021 13:52:31 - INFO - __main__ - Step 3725: {'lr': 0.0004998326166011973, 'samples': 715200, 'steps': 3724, 'loss/train': 2.6041486263275146} -08/30/2021 13:52:31 - INFO - __main__ - Step 3726: {'lr': 0.0004998324223863061, 'samples': 715392, 'steps': 3725, 'loss/train': 2.502439260482788} -08/30/2021 13:52:32 - INFO - __main__ - Step 3727: {'lr': 0.0004998322280588445, 'samples': 715584, 'steps': 3726, 'loss/train': 2.617800712585449} -08/30/2021 13:52:32 - INFO - __main__ - Step 3728: {'lr': 0.0004998320336188121, 'samples': 715776, 'steps': 3727, 'loss/train': 1.7495018243789673} -08/30/2021 13:52:32 - INFO - __main__ - Step 3729: {'lr': 0.0004998318390662095, 'samples': 715968, 'steps': 3728, 'loss/train': 2.223163366317749} -08/30/2021 13:52:34 - INFO - __main__ - Step 3730: {'lr': 0.0004998316444010363, 'samples': 716160, 'steps': 3729, 'loss/train': 2.0308051109313965} -08/30/2021 13:52:35 - INFO - __main__ - Step 3731: {'lr': 0.0004998314496232929, 'samples': 716352, 'steps': 3730, 'loss/train': 2.0826940536499023} -08/30/2021 13:52:35 - INFO - __main__ - Step 3732: {'lr': 0.0004998312547329793, 'samples': 716544, 'steps': 3731, 'loss/train': 2.4998042583465576} -08/30/2021 13:52:35 - INFO - __main__ - Step 3733: {'lr': 0.0004998310597300956, 'samples': 716736, 'steps': 3732, 'loss/train': 2.7541556358337402} -08/30/2021 13:52:36 - INFO - __main__ - Step 3734: {'lr': 0.0004998308646146419, 'samples': 716928, 'steps': 3733, 'loss/train': 1.8123992681503296} -08/30/2021 13:52:36 - INFO - __main__ - Step 3735: {'lr': 0.0004998306693866181, 'samples': 717120, 'steps': 3734, 'loss/train': 2.1201188564300537} -08/30/2021 13:52:38 - INFO - __main__ - Step 3736: {'lr': 0.0004998304740460247, 'samples': 717312, 'steps': 3735, 'loss/train': 0.5890623331069946} -08/30/2021 13:52:38 - INFO - __main__ - Step 3737: {'lr': 0.0004998302785928614, 'samples': 717504, 'steps': 3736, 'loss/train': 2.6408166885375977} -08/30/2021 13:52:39 - INFO - __main__ - Step 3738: {'lr': 0.0004998300830271285, 'samples': 717696, 'steps': 3737, 'loss/train': 2.593217134475708} -08/30/2021 13:52:39 - INFO - __main__ - Step 3739: {'lr': 0.000499829887348826, 'samples': 717888, 'steps': 3738, 'loss/train': 2.4458932876586914} -08/30/2021 13:52:40 - INFO - __main__ - Step 3740: {'lr': 0.0004998296915579539, 'samples': 718080, 'steps': 3739, 'loss/train': 2.755025625228882} -08/30/2021 13:52:40 - INFO - __main__ - Step 3741: {'lr': 0.0004998294956545125, 'samples': 718272, 'steps': 3740, 'loss/train': 0.9906896352767944} -08/30/2021 13:52:41 - INFO - __main__ - Step 3742: {'lr': 0.0004998292996385019, 'samples': 718464, 'steps': 3741, 'loss/train': 1.7878564596176147} -08/30/2021 13:52:42 - INFO - __main__ - Step 3743: {'lr': 0.0004998291035099219, 'samples': 718656, 'steps': 3742, 'loss/train': 2.2241365909576416} -08/30/2021 13:52:42 - INFO - __main__ - Step 3744: {'lr': 0.0004998289072687728, 'samples': 718848, 'steps': 3743, 'loss/train': 2.798021078109741} -08/30/2021 13:52:43 - INFO - __main__ - Step 3745: {'lr': 0.0004998287109150547, 'samples': 719040, 'steps': 3744, 'loss/train': 1.918013572692871} -08/30/2021 13:52:43 - INFO - __main__ - Step 3746: {'lr': 0.0004998285144487676, 'samples': 719232, 'steps': 3745, 'loss/train': 2.5508880615234375} -08/30/2021 13:52:44 - INFO - __main__ - Step 3747: {'lr': 0.0004998283178699116, 'samples': 719424, 'steps': 3746, 'loss/train': 2.0125818252563477} -08/30/2021 13:52:45 - INFO - __main__ - Step 3748: {'lr': 0.0004998281211784869, 'samples': 719616, 'steps': 3747, 'loss/train': 2.6958279609680176} -08/30/2021 13:52:45 - INFO - __main__ - Step 3749: {'lr': 0.0004998279243744934, 'samples': 719808, 'steps': 3748, 'loss/train': 2.651625394821167} -08/30/2021 13:52:46 - INFO - __main__ - Step 3750: {'lr': 0.0004998277274579313, 'samples': 720000, 'steps': 3749, 'loss/train': 1.690513014793396} -08/30/2021 13:52:46 - INFO - __main__ - Step 3751: {'lr': 0.0004998275304288007, 'samples': 720192, 'steps': 3750, 'loss/train': 2.3952298164367676} -08/30/2021 13:52:47 - INFO - __main__ - Step 3752: {'lr': 0.0004998273332871017, 'samples': 720384, 'steps': 3751, 'loss/train': 2.3898682594299316} -08/30/2021 13:52:48 - INFO - __main__ - Step 3753: {'lr': 0.0004998271360328344, 'samples': 720576, 'steps': 3752, 'loss/train': 2.195742607116699} -08/30/2021 13:52:48 - INFO - __main__ - Step 3754: {'lr': 0.0004998269386659988, 'samples': 720768, 'steps': 3753, 'loss/train': 2.1724729537963867} -08/30/2021 13:52:49 - INFO - __main__ - Step 3755: {'lr': 0.000499826741186595, 'samples': 720960, 'steps': 3754, 'loss/train': 1.760980248451233} -08/30/2021 13:52:49 - INFO - __main__ - Step 3756: {'lr': 0.0004998265435946232, 'samples': 721152, 'steps': 3755, 'loss/train': 2.3340656757354736} -08/30/2021 13:52:50 - INFO - __main__ - Step 3757: {'lr': 0.0004998263458900833, 'samples': 721344, 'steps': 3756, 'loss/train': 2.6274890899658203} -08/30/2021 13:52:51 - INFO - __main__ - Step 3758: {'lr': 0.0004998261480729755, 'samples': 721536, 'steps': 3757, 'loss/train': 2.353910446166992} -08/30/2021 13:52:51 - INFO - __main__ - Step 3759: {'lr': 0.0004998259501433, 'samples': 721728, 'steps': 3758, 'loss/train': 2.0382802486419678} -08/30/2021 13:52:52 - INFO - __main__ - Step 3760: {'lr': 0.0004998257521010567, 'samples': 721920, 'steps': 3759, 'loss/train': 2.4699389934539795} -08/30/2021 13:52:52 - INFO - __main__ - Step 3761: {'lr': 0.0004998255539462459, 'samples': 722112, 'steps': 3760, 'loss/train': 2.4543662071228027} -08/30/2021 13:52:52 - INFO - __main__ - Step 3762: {'lr': 0.0004998253556788675, 'samples': 722304, 'steps': 3761, 'loss/train': 2.363558292388916} -08/30/2021 13:52:54 - INFO - __main__ - Step 3763: {'lr': 0.0004998251572989217, 'samples': 722496, 'steps': 3762, 'loss/train': 2.9797966480255127} -08/30/2021 13:52:54 - INFO - __main__ - Step 3764: {'lr': 0.0004998249588064085, 'samples': 722688, 'steps': 3763, 'loss/train': 2.7801966667175293} -08/30/2021 13:52:54 - INFO - __main__ - Step 3765: {'lr': 0.0004998247602013278, 'samples': 722880, 'steps': 3764, 'loss/train': 1.3150078058242798} -08/30/2021 13:52:55 - INFO - __main__ - Step 3766: {'lr': 0.0004998245614836802, 'samples': 723072, 'steps': 3765, 'loss/train': 2.424520492553711} -08/30/2021 13:52:55 - INFO - __main__ - Step 3767: {'lr': 0.0004998243626534655, 'samples': 723264, 'steps': 3766, 'loss/train': 2.5986714363098145} -08/30/2021 13:52:57 - INFO - __main__ - Step 3768: {'lr': 0.0004998241637106836, 'samples': 723456, 'steps': 3767, 'loss/train': 2.1446802616119385} -08/30/2021 13:52:58 - INFO - __main__ - Step 3769: {'lr': 0.0004998239646553349, 'samples': 723648, 'steps': 3768, 'loss/train': 1.9051599502563477} -08/30/2021 13:52:58 - INFO - __main__ - Step 3770: {'lr': 0.0004998237654874195, 'samples': 723840, 'steps': 3769, 'loss/train': 2.1859586238861084} -08/30/2021 13:52:58 - INFO - __main__ - Step 3771: {'lr': 0.0004998235662069372, 'samples': 724032, 'steps': 3770, 'loss/train': 2.496194839477539} -08/30/2021 13:52:59 - INFO - __main__ - Step 3772: {'lr': 0.0004998233668138883, 'samples': 724224, 'steps': 3771, 'loss/train': 2.494786024093628} -08/30/2021 13:52:59 - INFO - __main__ - Step 3773: {'lr': 0.0004998231673082729, 'samples': 724416, 'steps': 3772, 'loss/train': 0.910167396068573} -08/30/2021 13:53:00 - INFO - __main__ - Step 3774: {'lr': 0.000499822967690091, 'samples': 724608, 'steps': 3773, 'loss/train': 1.0037932395935059} -08/30/2021 13:53:01 - INFO - __main__ - Step 3775: {'lr': 0.0004998227679593426, 'samples': 724800, 'steps': 3774, 'loss/train': 2.0974268913269043} -08/30/2021 13:53:01 - INFO - __main__ - Step 3776: {'lr': 0.0004998225681160281, 'samples': 724992, 'steps': 3775, 'loss/train': 2.4184041023254395} -08/30/2021 13:53:02 - INFO - __main__ - Step 3777: {'lr': 0.0004998223681601474, 'samples': 725184, 'steps': 3776, 'loss/train': 1.980934739112854} -08/30/2021 13:53:02 - INFO - __main__ - Step 3778: {'lr': 0.0004998221680917004, 'samples': 725376, 'steps': 3777, 'loss/train': 2.4494545459747314} -08/30/2021 13:53:04 - INFO - __main__ - Step 3779: {'lr': 0.0004998219679106876, 'samples': 725568, 'steps': 3778, 'loss/train': 3.0036258697509766} -08/30/2021 13:53:05 - INFO - __main__ - Step 3780: {'lr': 0.0004998217676171088, 'samples': 725760, 'steps': 3779, 'loss/train': 2.1836447715759277} -08/30/2021 13:53:05 - INFO - __main__ - Step 3781: {'lr': 0.0004998215672109641, 'samples': 725952, 'steps': 3780, 'loss/train': 2.39762544631958} -08/30/2021 13:53:05 - INFO - __main__ - Step 3782: {'lr': 0.0004998213666922537, 'samples': 726144, 'steps': 3781, 'loss/train': 6.193061351776123} -08/30/2021 13:53:06 - INFO - __main__ - Step 3783: {'lr': 0.0004998211660609777, 'samples': 726336, 'steps': 3782, 'loss/train': 2.981644868850708} -08/30/2021 13:53:06 - INFO - __main__ - Step 3784: {'lr': 0.0004998209653171361, 'samples': 726528, 'steps': 3783, 'loss/train': 4.001317977905273} -08/30/2021 13:53:08 - INFO - __main__ - Step 3785: {'lr': 0.0004998207644607291, 'samples': 726720, 'steps': 3784, 'loss/train': 3.830148458480835} -08/30/2021 13:53:09 - INFO - __main__ - Step 3786: {'lr': 0.0004998205634917566, 'samples': 726912, 'steps': 3785, 'loss/train': 3.1851704120635986} -08/30/2021 13:53:09 - INFO - __main__ - Step 3787: {'lr': 0.0004998203624102188, 'samples': 727104, 'steps': 3786, 'loss/train': 3.435906171798706} -08/30/2021 13:53:09 - INFO - __main__ - Step 3788: {'lr': 0.0004998201612161159, 'samples': 727296, 'steps': 3787, 'loss/train': 2.6408236026763916} -08/30/2021 13:53:10 - INFO - __main__ - Step 3789: {'lr': 0.0004998199599094478, 'samples': 727488, 'steps': 3788, 'loss/train': 2.8391733169555664} -08/30/2021 13:53:10 - INFO - __main__ - Step 3790: {'lr': 0.0004998197584902147, 'samples': 727680, 'steps': 3789, 'loss/train': 3.1133480072021484} -08/30/2021 13:53:11 - INFO - __main__ - Step 3791: {'lr': 0.0004998195569584168, 'samples': 727872, 'steps': 3790, 'loss/train': 1.9843635559082031} -08/30/2021 13:53:12 - INFO - __main__ - Step 3792: {'lr': 0.0004998193553140539, 'samples': 728064, 'steps': 3791, 'loss/train': 2.3932769298553467} -08/30/2021 13:53:12 - INFO - __main__ - Step 3793: {'lr': 0.0004998191535571264, 'samples': 728256, 'steps': 3792, 'loss/train': 2.2312867641448975} -08/30/2021 13:53:13 - INFO - __main__ - Step 3794: {'lr': 0.0004998189516876342, 'samples': 728448, 'steps': 3793, 'loss/train': 1.3847050666809082} -08/30/2021 13:53:13 - INFO - __main__ - Step 3795: {'lr': 0.0004998187497055773, 'samples': 728640, 'steps': 3794, 'loss/train': 5.628871440887451} -08/30/2021 13:53:14 - INFO - __main__ - Step 3796: {'lr': 0.000499818547610956, 'samples': 728832, 'steps': 3795, 'loss/train': 3.263817071914673} -08/30/2021 13:53:15 - INFO - __main__ - Step 3797: {'lr': 0.0004998183454037703, 'samples': 729024, 'steps': 3796, 'loss/train': 2.5504064559936523} -08/30/2021 13:53:15 - INFO - __main__ - Step 3798: {'lr': 0.0004998181430840204, 'samples': 729216, 'steps': 3797, 'loss/train': 3.251636266708374} -08/30/2021 13:53:16 - INFO - __main__ - Step 3799: {'lr': 0.0004998179406517063, 'samples': 729408, 'steps': 3798, 'loss/train': 2.312483787536621} -08/30/2021 13:53:16 - INFO - __main__ - Step 3800: {'lr': 0.000499817738106828, 'samples': 729600, 'steps': 3799, 'loss/train': 2.8077876567840576} -08/30/2021 13:53:18 - INFO - __main__ - Step 3801: {'lr': 0.0004998175354493857, 'samples': 729792, 'steps': 3800, 'loss/train': 2.6324970722198486} -08/30/2021 13:53:19 - INFO - __main__ - Step 3802: {'lr': 0.0004998173326793795, 'samples': 729984, 'steps': 3801, 'loss/train': 2.687063217163086} -08/30/2021 13:53:19 - INFO - __main__ - Step 3803: {'lr': 0.0004998171297968095, 'samples': 730176, 'steps': 3802, 'loss/train': 2.632704257965088} -08/30/2021 13:53:19 - INFO - __main__ - Step 3804: {'lr': 0.0004998169268016757, 'samples': 730368, 'steps': 3803, 'loss/train': 2.495011329650879} -08/30/2021 13:53:20 - INFO - __main__ - Step 3805: {'lr': 0.0004998167236939783, 'samples': 730560, 'steps': 3804, 'loss/train': 2.9213318824768066} -08/30/2021 13:53:20 - INFO - __main__ - Step 3806: {'lr': 0.0004998165204737173, 'samples': 730752, 'steps': 3805, 'loss/train': 2.8817858695983887} -08/30/2021 13:53:21 - INFO - __main__ - Step 3807: {'lr': 0.0004998163171408928, 'samples': 730944, 'steps': 3806, 'loss/train': 0.49705567955970764} -08/30/2021 13:53:22 - INFO - __main__ - Step 3808: {'lr': 0.000499816113695505, 'samples': 731136, 'steps': 3807, 'loss/train': 2.760344982147217} -08/30/2021 13:53:22 - INFO - __main__ - Step 3809: {'lr': 0.0004998159101375538, 'samples': 731328, 'steps': 3808, 'loss/train': 3.4015262126922607} -08/30/2021 13:53:23 - INFO - __main__ - Step 3810: {'lr': 0.0004998157064670395, 'samples': 731520, 'steps': 3809, 'loss/train': 2.6240994930267334} -08/30/2021 13:53:23 - INFO - __main__ - Step 3811: {'lr': 0.0004998155026839621, 'samples': 731712, 'steps': 3810, 'loss/train': 3.15437650680542} -08/30/2021 13:53:24 - INFO - __main__ - Step 3812: {'lr': 0.0004998152987883217, 'samples': 731904, 'steps': 3811, 'loss/train': 2.288787364959717} -08/30/2021 13:53:25 - INFO - __main__ - Step 3813: {'lr': 0.0004998150947801182, 'samples': 732096, 'steps': 3812, 'loss/train': 2.1823601722717285} -08/30/2021 13:53:25 - INFO - __main__ - Step 3814: {'lr': 0.000499814890659352, 'samples': 732288, 'steps': 3813, 'loss/train': 2.1743075847625732} -08/30/2021 13:53:26 - INFO - __main__ - Step 3815: {'lr': 0.0004998146864260231, 'samples': 732480, 'steps': 3814, 'loss/train': 2.6787259578704834} -08/30/2021 13:53:26 - INFO - __main__ - Step 3816: {'lr': 0.0004998144820801316, 'samples': 732672, 'steps': 3815, 'loss/train': 2.8744006156921387} -08/30/2021 13:53:26 - INFO - __main__ - Step 3817: {'lr': 0.0004998142776216775, 'samples': 732864, 'steps': 3816, 'loss/train': 3.1672487258911133} -08/30/2021 13:53:28 - INFO - __main__ - Step 3818: {'lr': 0.0004998140730506609, 'samples': 733056, 'steps': 3817, 'loss/train': 2.4270360469818115} -08/30/2021 13:53:28 - INFO - __main__ - Step 3819: {'lr': 0.000499813868367082, 'samples': 733248, 'steps': 3818, 'loss/train': 3.1737098693847656} -08/30/2021 13:53:29 - INFO - __main__ - Step 3820: {'lr': 0.0004998136635709408, 'samples': 733440, 'steps': 3819, 'loss/train': 2.706602096557617} -08/30/2021 13:53:29 - INFO - __main__ - Step 3821: {'lr': 0.0004998134586622374, 'samples': 733632, 'steps': 3820, 'loss/train': 2.02411150932312} -08/30/2021 13:53:29 - INFO - __main__ - Step 3822: {'lr': 0.0004998132536409718, 'samples': 733824, 'steps': 3821, 'loss/train': 2.643583297729492} -08/30/2021 13:53:31 - INFO - __main__ - Step 3823: {'lr': 0.0004998130485071444, 'samples': 734016, 'steps': 3822, 'loss/train': 2.867642641067505} -08/30/2021 13:53:31 - INFO - __main__ - Step 3824: {'lr': 0.000499812843260755, 'samples': 734208, 'steps': 3823, 'loss/train': 1.7342548370361328} -08/30/2021 13:53:32 - INFO - __main__ - Step 3825: {'lr': 0.0004998126379018038, 'samples': 734400, 'steps': 3824, 'loss/train': 2.3599774837493896} -08/30/2021 13:53:32 - INFO - __main__ - Step 3826: {'lr': 0.000499812432430291, 'samples': 734592, 'steps': 3825, 'loss/train': 2.6682610511779785} -08/30/2021 13:53:33 - INFO - __main__ - Step 3827: {'lr': 0.0004998122268462164, 'samples': 734784, 'steps': 3826, 'loss/train': 1.2385571002960205} -08/30/2021 13:53:34 - INFO - __main__ - Step 3828: {'lr': 0.0004998120211495803, 'samples': 734976, 'steps': 3827, 'loss/train': 2.736721992492676} -08/30/2021 13:53:35 - INFO - __main__ - Step 3829: {'lr': 0.0004998118153403827, 'samples': 735168, 'steps': 3828, 'loss/train': 2.391437292098999} -08/30/2021 13:53:35 - INFO - __main__ - Step 3830: {'lr': 0.0004998116094186239, 'samples': 735360, 'steps': 3829, 'loss/train': 1.730520248413086} -08/30/2021 13:53:35 - INFO - __main__ - Step 3831: {'lr': 0.0004998114033843038, 'samples': 735552, 'steps': 3830, 'loss/train': 2.593935966491699} -08/30/2021 13:53:36 - INFO - __main__ - Step 3832: {'lr': 0.0004998111972374225, 'samples': 735744, 'steps': 3831, 'loss/train': 1.7919846773147583} -08/30/2021 13:53:38 - INFO - __main__ - Step 3833: {'lr': 0.0004998109909779801, 'samples': 735936, 'steps': 3832, 'loss/train': 2.8192121982574463} -08/30/2021 13:53:38 - INFO - __main__ - Step 3834: {'lr': 0.0004998107846059768, 'samples': 736128, 'steps': 3833, 'loss/train': 2.320220947265625} -08/30/2021 13:53:39 - INFO - __main__ - Step 3835: {'lr': 0.0004998105781214126, 'samples': 736320, 'steps': 3834, 'loss/train': 2.549633741378784} -08/30/2021 13:53:39 - INFO - __main__ - Step 3836: {'lr': 0.0004998103715242875, 'samples': 736512, 'steps': 3835, 'loss/train': 2.1557517051696777} -08/30/2021 13:53:39 - INFO - __main__ - Step 3837: {'lr': 0.0004998101648146018, 'samples': 736704, 'steps': 3836, 'loss/train': 2.4664957523345947} -08/30/2021 13:53:41 - INFO - __main__ - Step 3838: {'lr': 0.0004998099579923555, 'samples': 736896, 'steps': 3837, 'loss/train': 2.3150134086608887} -08/30/2021 13:53:41 - INFO - __main__ - Step 3839: {'lr': 0.0004998097510575487, 'samples': 737088, 'steps': 3838, 'loss/train': 2.5504868030548096} -08/30/2021 13:53:42 - INFO - __main__ - Step 3840: {'lr': 0.0004998095440101815, 'samples': 737280, 'steps': 3839, 'loss/train': 2.8693466186523438} -08/30/2021 13:53:42 - INFO - __main__ - Step 3841: {'lr': 0.0004998093368502539, 'samples': 737472, 'steps': 3840, 'loss/train': 2.893502712249756} -08/30/2021 13:53:42 - INFO - __main__ - Step 3842: {'lr': 0.000499809129577766, 'samples': 737664, 'steps': 3841, 'loss/train': 2.001295328140259} -08/30/2021 13:53:44 - INFO - __main__ - Step 3843: {'lr': 0.0004998089221927182, 'samples': 737856, 'steps': 3842, 'loss/train': 2.1130106449127197} -08/30/2021 13:53:44 - INFO - __main__ - Step 3844: {'lr': 0.0004998087146951101, 'samples': 738048, 'steps': 3843, 'loss/train': 2.247541666030884} -08/30/2021 13:53:45 - INFO - __main__ - Step 3845: {'lr': 0.0004998085070849422, 'samples': 738240, 'steps': 3844, 'loss/train': 2.3881845474243164} -08/30/2021 13:53:45 - INFO - __main__ - Step 3846: {'lr': 0.0004998082993622144, 'samples': 738432, 'steps': 3845, 'loss/train': 2.4177701473236084} -08/30/2021 13:53:45 - INFO - __main__ - Step 3847: {'lr': 0.0004998080915269268, 'samples': 738624, 'steps': 3846, 'loss/train': 2.283220052719116} -08/30/2021 13:53:47 - INFO - __main__ - Step 3848: {'lr': 0.0004998078835790796, 'samples': 738816, 'steps': 3847, 'loss/train': 2.7085118293762207} -08/30/2021 13:53:48 - INFO - __main__ - Step 3849: {'lr': 0.0004998076755186727, 'samples': 739008, 'steps': 3848, 'loss/train': 2.1108334064483643} -08/30/2021 13:53:48 - INFO - __main__ - Step 3850: {'lr': 0.0004998074673457064, 'samples': 739200, 'steps': 3849, 'loss/train': 0.5631784796714783} -08/30/2021 13:53:48 - INFO - __main__ - Step 3851: {'lr': 0.0004998072590601808, 'samples': 739392, 'steps': 3850, 'loss/train': 0.9390645027160645} -08/30/2021 13:53:49 - INFO - __main__ - Step 3852: {'lr': 0.0004998070506620957, 'samples': 739584, 'steps': 3851, 'loss/train': 2.112011671066284} -08/30/2021 13:53:49 - INFO - __main__ - Step 3853: {'lr': 0.0004998068421514515, 'samples': 739776, 'steps': 3852, 'loss/train': 1.1400758028030396} -08/30/2021 13:53:50 - INFO - __main__ - Step 3854: {'lr': 0.0004998066335282483, 'samples': 739968, 'steps': 3853, 'loss/train': 1.3761924505233765} -08/30/2021 13:53:51 - INFO - __main__ - Step 3855: {'lr': 0.0004998064247924859, 'samples': 740160, 'steps': 3854, 'loss/train': 1.2922638654708862} -08/30/2021 13:53:51 - INFO - __main__ - Step 3856: {'lr': 0.0004998062159441648, 'samples': 740352, 'steps': 3855, 'loss/train': 2.1958119869232178} -08/30/2021 13:53:52 - INFO - __main__ - Step 3857: {'lr': 0.0004998060069832846, 'samples': 740544, 'steps': 3856, 'loss/train': 1.2535297870635986} -08/30/2021 13:53:52 - INFO - __main__ - Step 3858: {'lr': 0.0004998057979098459, 'samples': 740736, 'steps': 3857, 'loss/train': 2.8661746978759766} -08/30/2021 13:53:52 - INFO - __main__ - Step 3859: {'lr': 0.0004998055887238485, 'samples': 740928, 'steps': 3858, 'loss/train': 2.3009345531463623} -08/30/2021 13:53:54 - INFO - __main__ - Step 3860: {'lr': 0.0004998053794252925, 'samples': 741120, 'steps': 3859, 'loss/train': 2.258052110671997} -08/30/2021 13:53:54 - INFO - __main__ - Step 3861: {'lr': 0.0004998051700141781, 'samples': 741312, 'steps': 3860, 'loss/train': 2.3379745483398438} -08/30/2021 13:53:55 - INFO - __main__ - Step 3862: {'lr': 0.0004998049604905052, 'samples': 741504, 'steps': 3861, 'loss/train': 2.379669189453125} -08/30/2021 13:53:55 - INFO - __main__ - Step 3863: {'lr': 0.0004998047508542742, 'samples': 741696, 'steps': 3862, 'loss/train': 3.0659537315368652} -08/30/2021 13:53:55 - INFO - __main__ - Step 3864: {'lr': 0.000499804541105485, 'samples': 741888, 'steps': 3863, 'loss/train': 0.3776046335697174} -08/30/2021 13:53:57 - INFO - __main__ - Step 3865: {'lr': 0.0004998043312441378, 'samples': 742080, 'steps': 3864, 'loss/train': 2.317028045654297} -08/30/2021 13:53:58 - INFO - __main__ - Step 3866: {'lr': 0.0004998041212702325, 'samples': 742272, 'steps': 3865, 'loss/train': 2.523540735244751} -08/30/2021 13:53:58 - INFO - __main__ - Step 3867: {'lr': 0.0004998039111837694, 'samples': 742464, 'steps': 3866, 'loss/train': 2.123126983642578} -08/30/2021 13:53:59 - INFO - __main__ - Step 3868: {'lr': 0.0004998037009847485, 'samples': 742656, 'steps': 3867, 'loss/train': 1.5907723903656006} -08/30/2021 13:53:59 - INFO - __main__ - Step 3869: {'lr': 0.0004998034906731699, 'samples': 742848, 'steps': 3868, 'loss/train': 2.4419124126434326} -08/30/2021 13:54:00 - INFO - __main__ - Step 3870: {'lr': 0.0004998032802490337, 'samples': 743040, 'steps': 3869, 'loss/train': 2.297422409057617} -08/30/2021 13:54:01 - INFO - __main__ - Step 3871: {'lr': 0.0004998030697123399, 'samples': 743232, 'steps': 3870, 'loss/train': 2.200152635574341} -08/30/2021 13:54:01 - INFO - __main__ - Step 3872: {'lr': 0.0004998028590630887, 'samples': 743424, 'steps': 3871, 'loss/train': 2.712414264678955} -08/30/2021 13:54:01 - INFO - __main__ - Step 3873: {'lr': 0.0004998026483012803, 'samples': 743616, 'steps': 3872, 'loss/train': 2.7476024627685547} -08/30/2021 13:54:02 - INFO - __main__ - Step 3874: {'lr': 0.0004998024374269147, 'samples': 743808, 'steps': 3873, 'loss/train': 3.092353343963623} -08/30/2021 13:54:03 - INFO - __main__ - Step 3875: {'lr': 0.000499802226439992, 'samples': 744000, 'steps': 3874, 'loss/train': 1.501655101776123} -08/30/2021 13:54:04 - INFO - __main__ - Step 3876: {'lr': 0.0004998020153405121, 'samples': 744192, 'steps': 3875, 'loss/train': 2.7606687545776367} -08/30/2021 13:54:04 - INFO - __main__ - Step 3877: {'lr': 0.0004998018041284754, 'samples': 744384, 'steps': 3876, 'loss/train': 2.262582302093506} -08/30/2021 13:54:04 - INFO - __main__ - Step 3878: {'lr': 0.0004998015928038819, 'samples': 744576, 'steps': 3877, 'loss/train': 2.9484941959381104} -08/30/2021 13:54:05 - INFO - __main__ - Step 3879: {'lr': 0.0004998013813667315, 'samples': 744768, 'steps': 3878, 'loss/train': 1.1047451496124268} -08/30/2021 13:54:06 - INFO - __main__ - Step 3880: {'lr': 0.0004998011698170245, 'samples': 744960, 'steps': 3879, 'loss/train': 2.8314123153686523} -08/30/2021 13:54:07 - INFO - __main__ - Step 3881: {'lr': 0.000499800958154761, 'samples': 745152, 'steps': 3880, 'loss/train': 1.696224331855774} -08/30/2021 13:54:07 - INFO - __main__ - Step 3882: {'lr': 0.000499800746379941, 'samples': 745344, 'steps': 3881, 'loss/train': 2.514443874359131} -08/30/2021 13:54:07 - INFO - __main__ - Step 3883: {'lr': 0.0004998005344925647, 'samples': 745536, 'steps': 3882, 'loss/train': 2.567884683609009} -08/30/2021 13:54:08 - INFO - __main__ - Step 3884: {'lr': 0.0004998003224926321, 'samples': 745728, 'steps': 3883, 'loss/train': 2.229339599609375} -08/30/2021 13:54:08 - INFO - __main__ - Step 3885: {'lr': 0.0004998001103801433, 'samples': 745920, 'steps': 3884, 'loss/train': 2.397631883621216} -08/30/2021 13:54:10 - INFO - __main__ - Step 3886: {'lr': 0.0004997998981550985, 'samples': 746112, 'steps': 3885, 'loss/train': 2.341691255569458} -08/30/2021 13:54:11 - INFO - __main__ - Step 3887: {'lr': 0.0004997996858174976, 'samples': 746304, 'steps': 3886, 'loss/train': 2.5074775218963623} -08/30/2021 13:54:11 - INFO - __main__ - Step 3888: {'lr': 0.0004997994733673409, 'samples': 746496, 'steps': 3887, 'loss/train': 2.737993001937866} -08/30/2021 13:54:12 - INFO - __main__ - Step 3889: {'lr': 0.0004997992608046283, 'samples': 746688, 'steps': 3888, 'loss/train': 2.759039878845215} -08/30/2021 13:54:12 - INFO - __main__ - Step 3890: {'lr': 0.0004997990481293602, 'samples': 746880, 'steps': 3889, 'loss/train': 2.3761377334594727} -08/30/2021 13:54:13 - INFO - __main__ - Step 3891: {'lr': 0.0004997988353415364, 'samples': 747072, 'steps': 3890, 'loss/train': 2.5499308109283447} -08/30/2021 13:54:14 - INFO - __main__ - Step 3892: {'lr': 0.0004997986224411571, 'samples': 747264, 'steps': 3891, 'loss/train': 2.0588948726654053} -08/30/2021 13:54:14 - INFO - __main__ - Step 3893: {'lr': 0.0004997984094282224, 'samples': 747456, 'steps': 3892, 'loss/train': 2.512882709503174} -08/30/2021 13:54:15 - INFO - __main__ - Step 3894: {'lr': 0.0004997981963027324, 'samples': 747648, 'steps': 3893, 'loss/train': 2.513519525527954} -08/30/2021 13:54:15 - INFO - __main__ - Step 3895: {'lr': 0.0004997979830646871, 'samples': 747840, 'steps': 3894, 'loss/train': 5.267651081085205} -08/30/2021 13:54:17 - INFO - __main__ - Step 3896: {'lr': 0.0004997977697140868, 'samples': 748032, 'steps': 3895, 'loss/train': 2.0256643295288086} -08/30/2021 13:54:17 - INFO - __main__ - Step 3897: {'lr': 0.0004997975562509315, 'samples': 748224, 'steps': 3896, 'loss/train': 1.8952407836914062} -08/30/2021 13:54:18 - INFO - __main__ - Step 3898: {'lr': 0.0004997973426752212, 'samples': 748416, 'steps': 3897, 'loss/train': 3.1216516494750977} -08/30/2021 13:54:18 - INFO - __main__ - Step 3899: {'lr': 0.0004997971289869561, 'samples': 748608, 'steps': 3898, 'loss/train': 2.1845452785491943} -08/30/2021 13:54:18 - INFO - __main__ - Step 3900: {'lr': 0.0004997969151861362, 'samples': 748800, 'steps': 3899, 'loss/train': 4.411011695861816} -08/30/2021 13:54:20 - INFO - __main__ - Step 3901: {'lr': 0.0004997967012727618, 'samples': 748992, 'steps': 3900, 'loss/train': 2.7186288833618164} -08/30/2021 13:54:20 - INFO - __main__ - Step 3902: {'lr': 0.0004997964872468327, 'samples': 749184, 'steps': 3901, 'loss/train': 2.432096242904663} -08/30/2021 13:54:20 - INFO - __main__ - Step 3903: {'lr': 0.0004997962731083492, 'samples': 749376, 'steps': 3902, 'loss/train': 2.4708166122436523} -08/30/2021 13:54:21 - INFO - __main__ - Step 3904: {'lr': 0.0004997960588573115, 'samples': 749568, 'steps': 3903, 'loss/train': 0.9756361246109009} -08/30/2021 13:54:21 - INFO - __main__ - Step 3905: {'lr': 0.0004997958444937193, 'samples': 749760, 'steps': 3904, 'loss/train': 2.6296472549438477} -08/30/2021 13:54:23 - INFO - __main__ - Step 3906: {'lr': 0.0004997956300175732, 'samples': 749952, 'steps': 3905, 'loss/train': 2.711909055709839} -08/30/2021 13:54:23 - INFO - __main__ - Step 3907: {'lr': 0.000499795415428873, 'samples': 750144, 'steps': 3906, 'loss/train': 2.2133710384368896} -08/30/2021 13:54:24 - INFO - __main__ - Step 3908: {'lr': 0.0004997952007276187, 'samples': 750336, 'steps': 3907, 'loss/train': 2.634544610977173} -08/30/2021 13:54:24 - INFO - __main__ - Step 3909: {'lr': 0.0004997949859138106, 'samples': 750528, 'steps': 3908, 'loss/train': 2.506596088409424} -08/30/2021 13:54:24 - INFO - __main__ - Step 3910: {'lr': 0.0004997947709874487, 'samples': 750720, 'steps': 3909, 'loss/train': 2.404820203781128} -08/30/2021 13:54:26 - INFO - __main__ - Step 3911: {'lr': 0.0004997945559485333, 'samples': 750912, 'steps': 3910, 'loss/train': 1.8868598937988281} -08/30/2021 13:54:27 - INFO - __main__ - Step 3912: {'lr': 0.0004997943407970642, 'samples': 751104, 'steps': 3911, 'loss/train': 2.0609493255615234} -08/30/2021 13:54:27 - INFO - __main__ - Step 3913: {'lr': 0.0004997941255330416, 'samples': 751296, 'steps': 3912, 'loss/train': 2.681518316268921} -08/30/2021 13:54:27 - INFO - __main__ - Step 3914: {'lr': 0.0004997939101564656, 'samples': 751488, 'steps': 3913, 'loss/train': 0.8284855484962463} -08/30/2021 13:54:28 - INFO - __main__ - Step 3915: {'lr': 0.0004997936946673365, 'samples': 751680, 'steps': 3914, 'loss/train': 2.8293895721435547} -08/30/2021 13:54:28 - INFO - __main__ - Step 3916: {'lr': 0.000499793479065654, 'samples': 751872, 'steps': 3915, 'loss/train': 2.407503128051758} -08/30/2021 13:54:29 - INFO - __main__ - Step 3917: {'lr': 0.0004997932633514185, 'samples': 752064, 'steps': 3916, 'loss/train': 2.8127501010894775} -08/30/2021 13:54:30 - INFO - __main__ - Step 3918: {'lr': 0.00049979304752463, 'samples': 752256, 'steps': 3917, 'loss/train': 2.591407060623169} -08/30/2021 13:54:30 - INFO - __main__ - Step 3919: {'lr': 0.0004997928315852887, 'samples': 752448, 'steps': 3918, 'loss/train': 2.1050326824188232} -08/30/2021 13:54:31 - INFO - __main__ - Step 3920: {'lr': 0.0004997926155333944, 'samples': 752640, 'steps': 3919, 'loss/train': 2.3848304748535156} -08/30/2021 13:54:31 - INFO - __main__ - Step 3921: {'lr': 0.0004997923993689476, 'samples': 752832, 'steps': 3920, 'loss/train': 2.403304100036621} -08/30/2021 13:54:32 - INFO - __main__ - Step 3922: {'lr': 0.0004997921830919481, 'samples': 753024, 'steps': 3921, 'loss/train': 1.0415692329406738} -08/30/2021 13:54:33 - INFO - __main__ - Step 3923: {'lr': 0.0004997919667023962, 'samples': 753216, 'steps': 3922, 'loss/train': 1.9141919612884521} -08/30/2021 13:54:33 - INFO - __main__ - Step 3924: {'lr': 0.0004997917502002917, 'samples': 753408, 'steps': 3923, 'loss/train': 3.112239122390747} -08/30/2021 13:54:34 - INFO - __main__ - Step 3925: {'lr': 0.000499791533585635, 'samples': 753600, 'steps': 3924, 'loss/train': 2.3157529830932617} -08/30/2021 13:54:34 - INFO - __main__ - Step 3926: {'lr': 0.0004997913168584262, 'samples': 753792, 'steps': 3925, 'loss/train': 2.479858636856079} -08/30/2021 13:54:35 - INFO - __main__ - Step 3927: {'lr': 0.0004997911000186651, 'samples': 753984, 'steps': 3926, 'loss/train': 2.8407881259918213} -08/30/2021 13:54:36 - INFO - __main__ - Step 3928: {'lr': 0.0004997908830663521, 'samples': 754176, 'steps': 3927, 'loss/train': 2.1204097270965576} -08/30/2021 13:54:36 - INFO - __main__ - Step 3929: {'lr': 0.0004997906660014871, 'samples': 754368, 'steps': 3928, 'loss/train': 3.7338621616363525} -08/30/2021 13:54:37 - INFO - __main__ - Step 3930: {'lr': 0.0004997904488240704, 'samples': 754560, 'steps': 3929, 'loss/train': 2.3179407119750977} -08/30/2021 13:54:37 - INFO - __main__ - Step 3931: {'lr': 0.0004997902315341019, 'samples': 754752, 'steps': 3930, 'loss/train': 2.3511340618133545} -08/30/2021 13:54:37 - INFO - __main__ - Step 3932: {'lr': 0.0004997900141315817, 'samples': 754944, 'steps': 3931, 'loss/train': 2.584240674972534} -08/30/2021 13:54:39 - INFO - __main__ - Step 3933: {'lr': 0.0004997897966165101, 'samples': 755136, 'steps': 3932, 'loss/train': 2.6032466888427734} -08/30/2021 13:54:39 - INFO - __main__ - Step 3934: {'lr': 0.000499789578988887, 'samples': 755328, 'steps': 3933, 'loss/train': 2.606760263442993} -08/30/2021 13:54:40 - INFO - __main__ - Step 3935: {'lr': 0.0004997893612487126, 'samples': 755520, 'steps': 3934, 'loss/train': 2.5362014770507812} -08/30/2021 13:54:40 - INFO - __main__ - Step 3936: {'lr': 0.000499789143395987, 'samples': 755712, 'steps': 3935, 'loss/train': 2.227644920349121} -08/30/2021 13:54:40 - INFO - __main__ - Step 3937: {'lr': 0.0004997889254307103, 'samples': 755904, 'steps': 3936, 'loss/train': 1.789372444152832} -08/30/2021 13:54:42 - INFO - __main__ - Step 3938: {'lr': 0.0004997887073528825, 'samples': 756096, 'steps': 3937, 'loss/train': 2.282470464706421} -08/30/2021 13:54:42 - INFO - __main__ - Step 3939: {'lr': 0.0004997884891625037, 'samples': 756288, 'steps': 3938, 'loss/train': 2.672386884689331} -08/30/2021 13:54:43 - INFO - __main__ - Step 3940: {'lr': 0.0004997882708595742, 'samples': 756480, 'steps': 3939, 'loss/train': 2.443068027496338} -08/30/2021 13:54:43 - INFO - __main__ - Step 3941: {'lr': 0.0004997880524440939, 'samples': 756672, 'steps': 3940, 'loss/train': 2.0535221099853516} -08/30/2021 13:54:43 - INFO - __main__ - Step 3942: {'lr': 0.0004997878339160628, 'samples': 756864, 'steps': 3941, 'loss/train': 2.733731269836426} -08/30/2021 13:54:46 - INFO - __main__ - Step 3943: {'lr': 0.0004997876152754814, 'samples': 757056, 'steps': 3942, 'loss/train': 2.707033395767212} -08/30/2021 13:54:46 - INFO - __main__ - Step 3944: {'lr': 0.0004997873965223495, 'samples': 757248, 'steps': 3943, 'loss/train': 2.4181621074676514} -08/30/2021 13:54:46 - INFO - __main__ - Step 3945: {'lr': 0.0004997871776566672, 'samples': 757440, 'steps': 3944, 'loss/train': 0.3946099281311035} -08/30/2021 13:54:47 - INFO - __main__ - Step 3946: {'lr': 0.0004997869586784346, 'samples': 757632, 'steps': 3945, 'loss/train': 2.1933298110961914} -08/30/2021 13:54:47 - INFO - __main__ - Step 3947: {'lr': 0.0004997867395876519, 'samples': 757824, 'steps': 3946, 'loss/train': 2.572780132293701} -08/30/2021 13:54:49 - INFO - __main__ - Step 3948: {'lr': 0.0004997865203843192, 'samples': 758016, 'steps': 3947, 'loss/train': 2.0253100395202637} -08/30/2021 13:54:49 - INFO - __main__ - Step 3949: {'lr': 0.0004997863010684365, 'samples': 758208, 'steps': 3948, 'loss/train': 2.4088943004608154} -08/30/2021 13:54:49 - INFO - __main__ - Step 3950: {'lr': 0.0004997860816400039, 'samples': 758400, 'steps': 3949, 'loss/train': 2.1114790439605713} -08/30/2021 13:54:50 - INFO - __main__ - Step 3951: {'lr': 0.0004997858620990217, 'samples': 758592, 'steps': 3950, 'loss/train': 2.383887767791748} -08/30/2021 13:54:50 - INFO - __main__ - Step 3952: {'lr': 0.0004997856424454897, 'samples': 758784, 'steps': 3951, 'loss/train': 2.504924774169922} -08/30/2021 13:54:50 - INFO - __main__ - Step 3953: {'lr': 0.0004997854226794082, 'samples': 758976, 'steps': 3952, 'loss/train': 2.293032169342041} -08/30/2021 13:54:52 - INFO - __main__ - Step 3954: {'lr': 0.0004997852028007772, 'samples': 759168, 'steps': 3953, 'loss/train': 2.7769062519073486} -08/30/2021 13:54:53 - INFO - __main__ - Step 3955: {'lr': 0.0004997849828095969, 'samples': 759360, 'steps': 3954, 'loss/train': 2.057321786880493} -08/30/2021 13:54:53 - INFO - __main__ - Step 3956: {'lr': 0.0004997847627058673, 'samples': 759552, 'steps': 3955, 'loss/train': 2.4487359523773193} -08/30/2021 13:54:53 - INFO - __main__ - Step 3957: {'lr': 0.0004997845424895886, 'samples': 759744, 'steps': 3956, 'loss/train': 0.5445548892021179} -08/30/2021 13:54:54 - INFO - __main__ - Step 3958: {'lr': 0.0004997843221607607, 'samples': 759936, 'steps': 3957, 'loss/train': 2.319689989089966} -08/30/2021 13:54:55 - INFO - __main__ - Step 3959: {'lr': 0.0004997841017193841, 'samples': 760128, 'steps': 3958, 'loss/train': 2.6205952167510986} -08/30/2021 13:54:56 - INFO - __main__ - Step 3960: {'lr': 0.0004997838811654584, 'samples': 760320, 'steps': 3959, 'loss/train': 2.4733848571777344} -08/30/2021 13:54:56 - INFO - __main__ - Step 3961: {'lr': 0.000499783660498984, 'samples': 760512, 'steps': 3960, 'loss/train': 2.2484936714172363} -08/30/2021 13:54:57 - INFO - __main__ - Step 3962: {'lr': 0.0004997834397199609, 'samples': 760704, 'steps': 3961, 'loss/train': 1.6888166666030884} -08/30/2021 13:54:57 - INFO - __main__ - Step 3963: {'lr': 0.0004997832188283893, 'samples': 760896, 'steps': 3962, 'loss/train': 3.3111376762390137} -08/30/2021 13:54:59 - INFO - __main__ - Step 3964: {'lr': 0.0004997829978242693, 'samples': 761088, 'steps': 3963, 'loss/train': 2.5132648944854736} -08/30/2021 13:54:59 - INFO - __main__ - Step 3965: {'lr': 0.0004997827767076008, 'samples': 761280, 'steps': 3964, 'loss/train': 2.3481621742248535} -08/30/2021 13:54:59 - INFO - __main__ - Step 3966: {'lr': 0.0004997825554783841, 'samples': 761472, 'steps': 3965, 'loss/train': 2.779114007949829} -08/30/2021 13:55:00 - INFO - __main__ - Step 3967: {'lr': 0.0004997823341366192, 'samples': 761664, 'steps': 3966, 'loss/train': 2.357691764831543} -08/30/2021 13:55:00 - INFO - __main__ - Step 3968: {'lr': 0.0004997821126823062, 'samples': 761856, 'steps': 3967, 'loss/train': 2.790999174118042} -08/30/2021 13:55:02 - INFO - __main__ - Step 3969: {'lr': 0.0004997818911154454, 'samples': 762048, 'steps': 3968, 'loss/train': 1.1109250783920288} -08/30/2021 13:55:03 - INFO - __main__ - Step 3970: {'lr': 0.0004997816694360367, 'samples': 762240, 'steps': 3969, 'loss/train': 2.903752088546753} -08/30/2021 13:55:03 - INFO - __main__ - Step 3971: {'lr': 0.00049978144764408, 'samples': 762432, 'steps': 3970, 'loss/train': 0.630244255065918} -08/30/2021 13:55:03 - INFO - __main__ - Step 3972: {'lr': 0.0004997812257395758, 'samples': 762624, 'steps': 3971, 'loss/train': 2.2875099182128906} -08/30/2021 13:55:04 - INFO - __main__ - Step 3973: {'lr': 0.0004997810037225241, 'samples': 762816, 'steps': 3972, 'loss/train': 2.5137999057769775} -08/30/2021 13:55:05 - INFO - __main__ - Step 3974: {'lr': 0.0004997807815929248, 'samples': 763008, 'steps': 3973, 'loss/train': 2.0932538509368896} -08/30/2021 13:55:06 - INFO - __main__ - Step 3975: {'lr': 0.0004997805593507783, 'samples': 763200, 'steps': 3974, 'loss/train': 2.383582353591919} -08/30/2021 13:55:06 - INFO - __main__ - Step 3976: {'lr': 0.0004997803369960844, 'samples': 763392, 'steps': 3975, 'loss/train': 4.0104146003723145} -08/30/2021 13:55:06 - INFO - __main__ - Step 3977: {'lr': 0.0004997801145288433, 'samples': 763584, 'steps': 3976, 'loss/train': 2.166151762008667} -08/30/2021 13:55:07 - INFO - __main__ - Step 3978: {'lr': 0.0004997798919490553, 'samples': 763776, 'steps': 3977, 'loss/train': 2.4855029582977295} -08/30/2021 13:55:07 - INFO - __main__ - Step 3979: {'lr': 0.0004997796692567202, 'samples': 763968, 'steps': 3978, 'loss/train': 2.364853858947754} -08/30/2021 13:55:09 - INFO - __main__ - Step 3980: {'lr': 0.0004997794464518383, 'samples': 764160, 'steps': 3979, 'loss/train': 2.0544681549072266} -08/30/2021 13:55:09 - INFO - __main__ - Step 3981: {'lr': 0.0004997792235344096, 'samples': 764352, 'steps': 3980, 'loss/train': 2.1070480346679688} -08/30/2021 13:55:09 - INFO - __main__ - Step 3982: {'lr': 0.0004997790005044343, 'samples': 764544, 'steps': 3981, 'loss/train': 1.9082952737808228} -08/30/2021 13:55:10 - INFO - __main__ - Step 3983: {'lr': 0.0004997787773619123, 'samples': 764736, 'steps': 3982, 'loss/train': 2.3124704360961914} -08/30/2021 13:55:10 - INFO - __main__ - Step 3984: {'lr': 0.0004997785541068439, 'samples': 764928, 'steps': 3983, 'loss/train': 2.160449266433716} -08/30/2021 13:55:12 - INFO - __main__ - Step 3985: {'lr': 0.0004997783307392292, 'samples': 765120, 'steps': 3984, 'loss/train': 1.9370083808898926} -08/30/2021 13:55:12 - INFO - __main__ - Step 3986: {'lr': 0.0004997781072590683, 'samples': 765312, 'steps': 3985, 'loss/train': 2.1351189613342285} -08/30/2021 13:55:12 - INFO - __main__ - Step 3987: {'lr': 0.000499777883666361, 'samples': 765504, 'steps': 3986, 'loss/train': 3.3185460567474365} -08/30/2021 13:55:13 - INFO - __main__ - Step 3988: {'lr': 0.0004997776599611078, 'samples': 765696, 'steps': 3987, 'loss/train': 2.0844638347625732} -08/30/2021 13:55:13 - INFO - __main__ - Step 3989: {'lr': 0.0004997774361433086, 'samples': 765888, 'steps': 3988, 'loss/train': 2.7253451347351074} -08/30/2021 13:55:15 - INFO - __main__ - Step 3990: {'lr': 0.0004997772122129635, 'samples': 766080, 'steps': 3989, 'loss/train': 1.918208360671997} -08/30/2021 13:55:15 - INFO - __main__ - Step 3991: {'lr': 0.0004997769881700727, 'samples': 766272, 'steps': 3990, 'loss/train': 2.1654398441314697} -08/30/2021 13:55:16 - INFO - __main__ - Step 3992: {'lr': 0.0004997767640146363, 'samples': 766464, 'steps': 3991, 'loss/train': 2.137949228286743} -08/30/2021 13:55:16 - INFO - __main__ - Step 3993: {'lr': 0.0004997765397466543, 'samples': 766656, 'steps': 3992, 'loss/train': 2.8130013942718506} -08/30/2021 13:55:16 - INFO - __main__ - Step 3994: {'lr': 0.0004997763153661269, 'samples': 766848, 'steps': 3993, 'loss/train': 2.2077252864837646} -08/30/2021 13:55:17 - INFO - __main__ - Step 3995: {'lr': 0.000499776090873054, 'samples': 767040, 'steps': 3994, 'loss/train': 1.7503622770309448} -08/30/2021 13:55:19 - INFO - __main__ - Step 3996: {'lr': 0.000499775866267436, 'samples': 767232, 'steps': 3995, 'loss/train': 2.386577844619751} -08/30/2021 13:55:19 - INFO - __main__ - Step 3997: {'lr': 0.0004997756415492727, 'samples': 767424, 'steps': 3996, 'loss/train': 2.0418219566345215} -08/30/2021 13:55:20 - INFO - __main__ - Step 3998: {'lr': 0.0004997754167185644, 'samples': 767616, 'steps': 3997, 'loss/train': 2.39665150642395} -08/30/2021 13:55:20 - INFO - __main__ - Step 3999: {'lr': 0.0004997751917753113, 'samples': 767808, 'steps': 3998, 'loss/train': 2.5384645462036133} -08/30/2021 13:55:20 - INFO - __main__ - Step 4000: {'lr': 0.0004997749667195132, 'samples': 768000, 'steps': 3999, 'loss/train': 2.4927403926849365} -08/30/2021 13:55:22 - INFO - __main__ - Step 4001: {'lr': 0.0004997747415511704, 'samples': 768192, 'steps': 4000, 'loss/train': 2.607116460800171} -08/30/2021 13:55:22 - INFO - __main__ - Step 4002: {'lr': 0.000499774516270283, 'samples': 768384, 'steps': 4001, 'loss/train': 2.0028114318847656} -08/30/2021 13:55:23 - INFO - __main__ - Step 4003: {'lr': 0.0004997742908768508, 'samples': 768576, 'steps': 4002, 'loss/train': 1.9878151416778564} -08/30/2021 13:55:23 - INFO - __main__ - Step 4004: {'lr': 0.0004997740653708744, 'samples': 768768, 'steps': 4003, 'loss/train': 2.348004102706909} -08/30/2021 13:55:23 - INFO - __main__ - Step 4005: {'lr': 0.0004997738397523537, 'samples': 768960, 'steps': 4004, 'loss/train': 1.797458291053772} -08/30/2021 13:55:25 - INFO - __main__ - Step 4006: {'lr': 0.0004997736140212887, 'samples': 769152, 'steps': 4005, 'loss/train': 2.4697611331939697} -08/30/2021 13:55:25 - INFO - __main__ - Step 4007: {'lr': 0.0004997733881776796, 'samples': 769344, 'steps': 4006, 'loss/train': 3.012784004211426} -08/30/2021 13:55:26 - INFO - __main__ - Step 4008: {'lr': 0.0004997731622215264, 'samples': 769536, 'steps': 4007, 'loss/train': 2.257763147354126} -08/30/2021 13:55:26 - INFO - __main__ - Step 4009: {'lr': 0.0004997729361528292, 'samples': 769728, 'steps': 4008, 'loss/train': 3.1401171684265137} -08/30/2021 13:55:26 - INFO - __main__ - Step 4010: {'lr': 0.0004997727099715882, 'samples': 769920, 'steps': 4009, 'loss/train': 2.2928898334503174} -08/30/2021 13:55:28 - INFO - __main__ - Step 4011: {'lr': 0.0004997724836778036, 'samples': 770112, 'steps': 4010, 'loss/train': 1.6429706811904907} -08/30/2021 13:55:28 - INFO - __main__ - Step 4012: {'lr': 0.0004997722572714753, 'samples': 770304, 'steps': 4011, 'loss/train': 2.2672104835510254} -08/30/2021 13:55:29 - INFO - __main__ - Step 4013: {'lr': 0.0004997720307526034, 'samples': 770496, 'steps': 4012, 'loss/train': 1.7388495206832886} -08/30/2021 13:55:29 - INFO - __main__ - Step 4014: {'lr': 0.0004997718041211881, 'samples': 770688, 'steps': 4013, 'loss/train': 2.3739945888519287} -08/30/2021 13:55:29 - INFO - __main__ - Step 4015: {'lr': 0.0004997715773772296, 'samples': 770880, 'steps': 4014, 'loss/train': 2.8052685260772705} -08/30/2021 13:55:31 - INFO - __main__ - Step 4016: {'lr': 0.0004997713505207278, 'samples': 771072, 'steps': 4015, 'loss/train': 1.839080810546875} -08/30/2021 13:55:32 - INFO - __main__ - Step 4017: {'lr': 0.0004997711235516829, 'samples': 771264, 'steps': 4016, 'loss/train': 1.589301347732544} -08/30/2021 13:55:32 - INFO - __main__ - Step 4018: {'lr': 0.000499770896470095, 'samples': 771456, 'steps': 4017, 'loss/train': 1.8437907695770264} -08/30/2021 13:55:32 - INFO - __main__ - Step 4019: {'lr': 0.0004997706692759642, 'samples': 771648, 'steps': 4018, 'loss/train': 2.4364233016967773} -08/30/2021 13:55:33 - INFO - __main__ - Step 4020: {'lr': 0.0004997704419692905, 'samples': 771840, 'steps': 4019, 'loss/train': 2.4826018810272217} -08/30/2021 13:55:35 - INFO - __main__ - Step 4021: {'lr': 0.0004997702145500741, 'samples': 772032, 'steps': 4020, 'loss/train': 1.9058207273483276} -08/30/2021 13:55:35 - INFO - __main__ - Step 4022: {'lr': 0.0004997699870183151, 'samples': 772224, 'steps': 4021, 'loss/train': 2.5359270572662354} -08/30/2021 13:55:35 - INFO - __main__ - Step 4023: {'lr': 0.0004997697593740137, 'samples': 772416, 'steps': 4022, 'loss/train': 2.793123722076416} -08/30/2021 13:55:36 - INFO - __main__ - Step 4024: {'lr': 0.0004997695316171698, 'samples': 772608, 'steps': 4023, 'loss/train': 2.240602731704712} -08/30/2021 13:55:36 - INFO - __main__ - Step 4025: {'lr': 0.0004997693037477837, 'samples': 772800, 'steps': 4024, 'loss/train': 2.421320676803589} -08/30/2021 13:55:36 - INFO - __main__ - Step 4026: {'lr': 0.0004997690757658552, 'samples': 772992, 'steps': 4025, 'loss/train': 4.291104793548584} -08/30/2021 13:55:38 - INFO - __main__ - Step 4027: {'lr': 0.0004997688476713848, 'samples': 773184, 'steps': 4026, 'loss/train': 2.386380434036255} -08/30/2021 13:55:38 - INFO - __main__ - Step 4028: {'lr': 0.0004997686194643724, 'samples': 773376, 'steps': 4027, 'loss/train': 2.6655831336975098} -08/30/2021 13:55:39 - INFO - __main__ - Step 4029: {'lr': 0.0004997683911448181, 'samples': 773568, 'steps': 4028, 'loss/train': 2.5628130435943604} -08/30/2021 13:55:39 - INFO - __main__ - Step 4030: {'lr': 0.000499768162712722, 'samples': 773760, 'steps': 4029, 'loss/train': 2.468876600265503} -08/30/2021 13:55:39 - INFO - __main__ - Step 4031: {'lr': 0.0004997679341680843, 'samples': 773952, 'steps': 4030, 'loss/train': 2.633169651031494} -08/30/2021 13:55:41 - INFO - __main__ - Step 4032: {'lr': 0.0004997677055109049, 'samples': 774144, 'steps': 4031, 'loss/train': 2.7020351886749268} -08/30/2021 13:55:41 - INFO - __main__ - Step 4033: {'lr': 0.0004997674767411841, 'samples': 774336, 'steps': 4032, 'loss/train': 2.3281779289245605} -08/30/2021 13:55:42 - INFO - __main__ - Step 4034: {'lr': 0.0004997672478589219, 'samples': 774528, 'steps': 4033, 'loss/train': 2.290341377258301} -08/30/2021 13:55:42 - INFO - __main__ - Step 4035: {'lr': 0.0004997670188641183, 'samples': 774720, 'steps': 4034, 'loss/train': 2.7043285369873047} -08/30/2021 13:55:42 - INFO - __main__ - Step 4036: {'lr': 0.0004997667897567738, 'samples': 774912, 'steps': 4035, 'loss/train': 1.0439705848693848} -08/30/2021 13:55:44 - INFO - __main__ - Step 4037: {'lr': 0.0004997665605368881, 'samples': 775104, 'steps': 4036, 'loss/train': 2.1322202682495117} -08/30/2021 13:55:44 - INFO - __main__ - Step 4038: {'lr': 0.0004997663312044614, 'samples': 775296, 'steps': 4037, 'loss/train': 2.4699625968933105} -08/30/2021 13:55:45 - INFO - __main__ - Step 4039: {'lr': 0.0004997661017594939, 'samples': 775488, 'steps': 4038, 'loss/train': 3.9698586463928223} -08/30/2021 13:55:45 - INFO - __main__ - Step 4040: {'lr': 0.0004997658722019857, 'samples': 775680, 'steps': 4039, 'loss/train': 2.4469292163848877} -08/30/2021 13:55:46 - INFO - __main__ - Step 4041: {'lr': 0.0004997656425319367, 'samples': 775872, 'steps': 4040, 'loss/train': 2.307356834411621} -08/30/2021 13:55:46 - INFO - __main__ - Step 4042: {'lr': 0.0004997654127493473, 'samples': 776064, 'steps': 4041, 'loss/train': 2.4846560955047607} -08/30/2021 13:55:47 - INFO - __main__ - Step 4043: {'lr': 0.0004997651828542173, 'samples': 776256, 'steps': 4042, 'loss/train': 0.5503510236740112} -08/30/2021 13:55:48 - INFO - __main__ - Step 4044: {'lr': 0.0004997649528465471, 'samples': 776448, 'steps': 4043, 'loss/train': 2.0111496448516846} -08/30/2021 13:55:48 - INFO - __main__ - Step 4045: {'lr': 0.0004997647227263367, 'samples': 776640, 'steps': 4044, 'loss/train': 2.676067352294922} -08/30/2021 13:55:48 - INFO - __main__ - Step 4046: {'lr': 0.000499764492493586, 'samples': 776832, 'steps': 4045, 'loss/train': 2.448500633239746} -08/30/2021 13:55:49 - INFO - __main__ - Step 4047: {'lr': 0.0004997642621482955, 'samples': 777024, 'steps': 4046, 'loss/train': 2.5388779640197754} -08/30/2021 13:55:50 - INFO - __main__ - Step 4048: {'lr': 0.0004997640316904649, 'samples': 777216, 'steps': 4047, 'loss/train': 3.0572433471679688} -08/30/2021 13:55:51 - INFO - __main__ - Step 4049: {'lr': 0.0004997638011200946, 'samples': 777408, 'steps': 4048, 'loss/train': 2.5447680950164795} -08/30/2021 13:55:51 - INFO - __main__ - Step 4050: {'lr': 0.0004997635704371844, 'samples': 777600, 'steps': 4049, 'loss/train': 2.6373209953308105} -08/30/2021 13:55:51 - INFO - __main__ - Step 4051: {'lr': 0.0004997633396417348, 'samples': 777792, 'steps': 4050, 'loss/train': 2.7491040229797363} -08/30/2021 13:55:52 - INFO - __main__ - Step 4052: {'lr': 0.0004997631087337456, 'samples': 777984, 'steps': 4051, 'loss/train': 2.096184015274048} -08/30/2021 13:55:54 - INFO - __main__ - Step 4053: {'lr': 0.000499762877713217, 'samples': 778176, 'steps': 4052, 'loss/train': 2.2926199436187744} -08/30/2021 13:55:54 - INFO - __main__ - Step 4054: {'lr': 0.0004997626465801492, 'samples': 778368, 'steps': 4053, 'loss/train': 2.4043421745300293} -08/30/2021 13:55:55 - INFO - __main__ - Step 4055: {'lr': 0.000499762415334542, 'samples': 778560, 'steps': 4054, 'loss/train': 2.2378180027008057} -08/30/2021 13:55:55 - INFO - __main__ - Step 4056: {'lr': 0.0004997621839763958, 'samples': 778752, 'steps': 4055, 'loss/train': 2.306154727935791} -08/30/2021 13:55:55 - INFO - __main__ - Step 4057: {'lr': 0.0004997619525057106, 'samples': 778944, 'steps': 4056, 'loss/train': 2.423851728439331} -08/30/2021 13:55:57 - INFO - __main__ - Step 4058: {'lr': 0.0004997617209224866, 'samples': 779136, 'steps': 4057, 'loss/train': 2.433486223220825} -08/30/2021 13:55:58 - INFO - __main__ - Step 4059: {'lr': 0.0004997614892267238, 'samples': 779328, 'steps': 4058, 'loss/train': 2.9628419876098633} -08/30/2021 13:55:58 - INFO - __main__ - Step 4060: {'lr': 0.0004997612574184223, 'samples': 779520, 'steps': 4059, 'loss/train': 1.662583351135254} -08/30/2021 13:55:58 - INFO - __main__ - Step 4061: {'lr': 0.0004997610254975823, 'samples': 779712, 'steps': 4060, 'loss/train': 1.755662441253662} -08/30/2021 13:55:59 - INFO - __main__ - Step 4062: {'lr': 0.0004997607934642038, 'samples': 779904, 'steps': 4061, 'loss/train': 2.7849385738372803} -08/30/2021 13:56:00 - INFO - __main__ - Step 4063: {'lr': 0.0004997605613182868, 'samples': 780096, 'steps': 4062, 'loss/train': 2.0621323585510254} -08/30/2021 13:56:01 - INFO - __main__ - Step 4064: {'lr': 0.0004997603290598317, 'samples': 780288, 'steps': 4063, 'loss/train': 3.1318585872650146} -08/30/2021 13:56:01 - INFO - __main__ - Step 4065: {'lr': 0.0004997600966888384, 'samples': 780480, 'steps': 4064, 'loss/train': 2.4551327228546143} -08/30/2021 13:56:01 - INFO - __main__ - Step 4066: {'lr': 0.000499759864205307, 'samples': 780672, 'steps': 4065, 'loss/train': 2.489694595336914} -08/30/2021 13:56:02 - INFO - __main__ - Step 4067: {'lr': 0.0004997596316092378, 'samples': 780864, 'steps': 4066, 'loss/train': 2.8750481605529785} -08/30/2021 13:56:03 - INFO - __main__ - Step 4068: {'lr': 0.0004997593989006306, 'samples': 781056, 'steps': 4067, 'loss/train': 2.234858274459839} -08/30/2021 13:56:04 - INFO - __main__ - Step 4069: {'lr': 0.0004997591660794858, 'samples': 781248, 'steps': 4068, 'loss/train': 2.5201728343963623} -08/30/2021 13:56:04 - INFO - __main__ - Step 4070: {'lr': 0.0004997589331458034, 'samples': 781440, 'steps': 4069, 'loss/train': 1.053739309310913} -08/30/2021 13:56:05 - INFO - __main__ - Step 4071: {'lr': 0.0004997587000995833, 'samples': 781632, 'steps': 4070, 'loss/train': 3.0745999813079834} -08/30/2021 13:56:05 - INFO - __main__ - Step 4072: {'lr': 0.000499758466940826, 'samples': 781824, 'steps': 4071, 'loss/train': 2.7624387741088867} -08/30/2021 13:56:05 - INFO - __main__ - Step 4073: {'lr': 0.0004997582336695312, 'samples': 782016, 'steps': 4072, 'loss/train': 2.297905206680298} -08/30/2021 13:56:07 - INFO - __main__ - Step 4074: {'lr': 0.0004997580002856993, 'samples': 782208, 'steps': 4073, 'loss/train': 0.4014703333377838} -08/30/2021 13:56:07 - INFO - __main__ - Step 4075: {'lr': 0.0004997577667893303, 'samples': 782400, 'steps': 4074, 'loss/train': 2.3574111461639404} -08/30/2021 13:56:08 - INFO - __main__ - Step 4076: {'lr': 0.0004997575331804243, 'samples': 782592, 'steps': 4075, 'loss/train': 2.161566734313965} -08/30/2021 13:56:08 - INFO - __main__ - Step 4077: {'lr': 0.0004997572994589812, 'samples': 782784, 'steps': 4076, 'loss/train': 3.3062691688537598} -08/30/2021 13:56:08 - INFO - __main__ - Step 4078: {'lr': 0.0004997570656250016, 'samples': 782976, 'steps': 4077, 'loss/train': 2.472597599029541} -08/30/2021 13:56:10 - INFO - __main__ - Step 4079: {'lr': 0.0004997568316784852, 'samples': 783168, 'steps': 4078, 'loss/train': 2.9864468574523926} -08/30/2021 13:56:10 - INFO - __main__ - Step 4080: {'lr': 0.0004997565976194323, 'samples': 783360, 'steps': 4079, 'loss/train': 2.3666961193084717} -08/30/2021 13:56:11 - INFO - __main__ - Step 4081: {'lr': 0.0004997563634478429, 'samples': 783552, 'steps': 4080, 'loss/train': 2.6453051567077637} -08/30/2021 13:56:11 - INFO - __main__ - Step 4082: {'lr': 0.000499756129163717, 'samples': 783744, 'steps': 4081, 'loss/train': 2.544973611831665} -08/30/2021 13:56:11 - INFO - __main__ - Step 4083: {'lr': 0.000499755894767055, 'samples': 783936, 'steps': 4082, 'loss/train': 2.2215025424957275} -08/30/2021 13:56:13 - INFO - __main__ - Step 4084: {'lr': 0.0004997556602578568, 'samples': 784128, 'steps': 4083, 'loss/train': 2.718143939971924} -08/30/2021 13:56:13 - INFO - __main__ - Step 4085: {'lr': 0.0004997554256361225, 'samples': 784320, 'steps': 4084, 'loss/train': 2.04015851020813} -08/30/2021 13:56:14 - INFO - __main__ - Step 4086: {'lr': 0.0004997551909018524, 'samples': 784512, 'steps': 4085, 'loss/train': 2.7680890560150146} -08/30/2021 13:56:14 - INFO - __main__ - Step 4087: {'lr': 0.0004997549560550464, 'samples': 784704, 'steps': 4086, 'loss/train': 2.689427137374878} -08/30/2021 13:56:14 - INFO - __main__ - Step 4088: {'lr': 0.0004997547210957047, 'samples': 784896, 'steps': 4087, 'loss/train': 3.028334617614746} -08/30/2021 13:56:16 - INFO - __main__ - Step 4089: {'lr': 0.0004997544860238272, 'samples': 785088, 'steps': 4088, 'loss/train': 2.0451505184173584} -08/30/2021 13:56:16 - INFO - __main__ - Step 4090: {'lr': 0.0004997542508394144, 'samples': 785280, 'steps': 4089, 'loss/train': 2.1984105110168457} -08/30/2021 13:56:17 - INFO - __main__ - Step 4091: {'lr': 0.000499754015542466, 'samples': 785472, 'steps': 4090, 'loss/train': 3.425971269607544} -08/30/2021 13:56:17 - INFO - __main__ - Step 4092: {'lr': 0.0004997537801329824, 'samples': 785664, 'steps': 4091, 'loss/train': 2.6176960468292236} -08/30/2021 13:56:17 - INFO - __main__ - Step 4093: {'lr': 0.0004997535446109637, 'samples': 785856, 'steps': 4092, 'loss/train': 2.0059561729431152} -08/30/2021 13:56:19 - INFO - __main__ - Step 4094: {'lr': 0.0004997533089764097, 'samples': 786048, 'steps': 4093, 'loss/train': 2.5740933418273926} -08/30/2021 13:56:20 - INFO - __main__ - Step 4095: {'lr': 0.0004997530732293209, 'samples': 786240, 'steps': 4094, 'loss/train': 2.12330961227417} -08/30/2021 13:56:20 - INFO - __main__ - Step 4096: {'lr': 0.000499752837369697, 'samples': 786432, 'steps': 4095, 'loss/train': 3.3240857124328613} -08/30/2021 13:56:20 - INFO - __main__ - Step 4097: {'lr': 0.0004997526013975385, 'samples': 786624, 'steps': 4096, 'loss/train': 2.6515917778015137} -08/30/2021 13:56:21 - INFO - __main__ - Step 4098: {'lr': 0.0004997523653128453, 'samples': 786816, 'steps': 4097, 'loss/train': 3.079754590988159} -08/30/2021 13:56:21 - INFO - __main__ - Step 4099: {'lr': 0.0004997521291156175, 'samples': 787008, 'steps': 4098, 'loss/train': 2.460397481918335} -08/30/2021 13:56:22 - INFO - __main__ - Step 4100: {'lr': 0.0004997518928058553, 'samples': 787200, 'steps': 4099, 'loss/train': 2.6524083614349365} -08/30/2021 13:56:23 - INFO - __main__ - Step 4101: {'lr': 0.0004997516563835587, 'samples': 787392, 'steps': 4100, 'loss/train': 2.4772443771362305} -08/30/2021 13:56:23 - INFO - __main__ - Step 4102: {'lr': 0.0004997514198487279, 'samples': 787584, 'steps': 4101, 'loss/train': 2.363936185836792} -08/30/2021 13:56:24 - INFO - __main__ - Step 4103: {'lr': 0.0004997511832013629, 'samples': 787776, 'steps': 4102, 'loss/train': 2.742016553878784} -08/30/2021 13:56:24 - INFO - __main__ - Step 4104: {'lr': 0.0004997509464414639, 'samples': 787968, 'steps': 4103, 'loss/train': 2.8800699710845947} -08/30/2021 13:56:26 - INFO - __main__ - Step 4105: {'lr': 0.000499750709569031, 'samples': 788160, 'steps': 4104, 'loss/train': 2.4009082317352295} -08/30/2021 13:56:27 - INFO - __main__ - Step 4106: {'lr': 0.0004997504725840644, 'samples': 788352, 'steps': 4105, 'loss/train': 1.4848320484161377} -08/30/2021 13:56:27 - INFO - __main__ - Step 4107: {'lr': 0.0004997502354865639, 'samples': 788544, 'steps': 4106, 'loss/train': 2.3617055416107178} -08/30/2021 13:56:27 - INFO - __main__ - Step 4108: {'lr': 0.0004997499982765299, 'samples': 788736, 'steps': 4107, 'loss/train': 2.733996629714966} -08/30/2021 13:56:28 - INFO - __main__ - Step 4109: {'lr': 0.0004997497609539623, 'samples': 788928, 'steps': 4108, 'loss/train': 2.7251229286193848} -08/30/2021 13:56:29 - INFO - __main__ - Step 4110: {'lr': 0.0004997495235188614, 'samples': 789120, 'steps': 4109, 'loss/train': 2.193601369857788} -08/30/2021 13:56:30 - INFO - __main__ - Step 4111: {'lr': 0.0004997492859712272, 'samples': 789312, 'steps': 4110, 'loss/train': 2.574625015258789} -08/30/2021 13:56:30 - INFO - __main__ - Step 4112: {'lr': 0.0004997490483110599, 'samples': 789504, 'steps': 4111, 'loss/train': 2.4444687366485596} -08/30/2021 13:56:30 - INFO - __main__ - Step 4113: {'lr': 0.0004997488105383594, 'samples': 789696, 'steps': 4112, 'loss/train': 1.5127551555633545} -08/30/2021 13:56:31 - INFO - __main__ - Step 4114: {'lr': 0.000499748572653126, 'samples': 789888, 'steps': 4113, 'loss/train': 2.4461772441864014} -08/30/2021 13:56:32 - INFO - __main__ - Step 4115: {'lr': 0.0004997483346553597, 'samples': 790080, 'steps': 4114, 'loss/train': 2.314634323120117} -08/30/2021 13:56:33 - INFO - __main__ - Step 4116: {'lr': 0.0004997480965450607, 'samples': 790272, 'steps': 4115, 'loss/train': 2.4725961685180664} -08/30/2021 13:56:33 - INFO - __main__ - Step 4117: {'lr': 0.0004997478583222291, 'samples': 790464, 'steps': 4116, 'loss/train': 2.412627935409546} -08/30/2021 13:56:33 - INFO - __main__ - Step 4118: {'lr': 0.0004997476199868649, 'samples': 790656, 'steps': 4117, 'loss/train': 2.497490882873535} -08/30/2021 13:56:34 - INFO - __main__ - Step 4119: {'lr': 0.0004997473815389683, 'samples': 790848, 'steps': 4118, 'loss/train': 2.241377115249634} -08/30/2021 13:56:35 - INFO - __main__ - Step 4120: {'lr': 0.0004997471429785394, 'samples': 791040, 'steps': 4119, 'loss/train': 2.279694080352783} -08/30/2021 13:56:36 - INFO - __main__ - Step 4121: {'lr': 0.0004997469043055784, 'samples': 791232, 'steps': 4120, 'loss/train': 3.4058709144592285} -08/30/2021 13:56:36 - INFO - __main__ - Step 4122: {'lr': 0.000499746665520085, 'samples': 791424, 'steps': 4121, 'loss/train': 2.493852376937866} -08/30/2021 13:56:36 - INFO - __main__ - Step 4123: {'lr': 0.0004997464266220599, 'samples': 791616, 'steps': 4122, 'loss/train': 1.5343027114868164} -08/30/2021 13:56:37 - INFO - __main__ - Step 4124: {'lr': 0.0004997461876115029, 'samples': 791808, 'steps': 4123, 'loss/train': 1.5703154802322388} -08/30/2021 13:56:38 - INFO - __main__ - Step 4125: {'lr': 0.0004997459484884139, 'samples': 792000, 'steps': 4124, 'loss/train': 2.1772875785827637} -08/30/2021 13:56:39 - INFO - __main__ - Step 4126: {'lr': 0.0004997457092527934, 'samples': 792192, 'steps': 4125, 'loss/train': 2.3461971282958984} -08/30/2021 13:56:39 - INFO - __main__ - Step 4127: {'lr': 0.0004997454699046412, 'samples': 792384, 'steps': 4126, 'loss/train': 2.3878214359283447} -08/30/2021 13:56:39 - INFO - __main__ - Step 4128: {'lr': 0.0004997452304439577, 'samples': 792576, 'steps': 4127, 'loss/train': 1.971865177154541} -08/30/2021 13:56:40 - INFO - __main__ - Step 4129: {'lr': 0.0004997449908707428, 'samples': 792768, 'steps': 4128, 'loss/train': 2.165173053741455} -08/30/2021 13:56:40 - INFO - __main__ - Step 4130: {'lr': 0.0004997447511849966, 'samples': 792960, 'steps': 4129, 'loss/train': 2.409449338912964} -08/30/2021 13:56:41 - INFO - __main__ - Step 4131: {'lr': 0.0004997445113867193, 'samples': 793152, 'steps': 4130, 'loss/train': 1.8672187328338623} -08/30/2021 13:56:42 - INFO - __main__ - Step 4132: {'lr': 0.000499744271475911, 'samples': 793344, 'steps': 4131, 'loss/train': 2.3295915126800537} -08/30/2021 13:56:42 - INFO - __main__ - Step 4133: {'lr': 0.0004997440314525718, 'samples': 793536, 'steps': 4132, 'loss/train': 2.5744876861572266} -08/30/2021 13:56:43 - INFO - __main__ - Step 4134: {'lr': 0.0004997437913167018, 'samples': 793728, 'steps': 4133, 'loss/train': 2.637343645095825} -08/30/2021 13:56:43 - INFO - __main__ - Step 4135: {'lr': 0.0004997435510683011, 'samples': 793920, 'steps': 4134, 'loss/train': 2.3382296562194824} -08/30/2021 13:56:44 - INFO - __main__ - Step 4136: {'lr': 0.0004997433107073697, 'samples': 794112, 'steps': 4135, 'loss/train': 2.1141772270202637} -08/30/2021 13:56:45 - INFO - __main__ - Step 4137: {'lr': 0.000499743070233908, 'samples': 794304, 'steps': 4136, 'loss/train': 2.3558902740478516} -08/30/2021 13:56:45 - INFO - __main__ - Step 4138: {'lr': 0.0004997428296479158, 'samples': 794496, 'steps': 4137, 'loss/train': 2.1789145469665527} -08/30/2021 13:56:46 - INFO - __main__ - Step 4139: {'lr': 0.0004997425889493933, 'samples': 794688, 'steps': 4138, 'loss/train': 2.6657779216766357} -08/30/2021 13:56:46 - INFO - __main__ - Step 4140: {'lr': 0.0004997423481383407, 'samples': 794880, 'steps': 4139, 'loss/train': 2.8600826263427734} -08/30/2021 13:56:48 - INFO - __main__ - Step 4141: {'lr': 0.0004997421072147581, 'samples': 795072, 'steps': 4140, 'loss/train': 2.526305675506592} -08/30/2021 13:56:48 - INFO - __main__ - Step 4142: {'lr': 0.0004997418661786455, 'samples': 795264, 'steps': 4141, 'loss/train': 2.5764617919921875} -08/30/2021 13:56:49 - INFO - __main__ - Step 4143: {'lr': 0.0004997416250300031, 'samples': 795456, 'steps': 4142, 'loss/train': 0.9663740396499634} -08/30/2021 13:56:49 - INFO - __main__ - Step 4144: {'lr': 0.0004997413837688309, 'samples': 795648, 'steps': 4143, 'loss/train': 2.2550570964813232} -08/30/2021 13:56:49 - INFO - __main__ - Step 4145: {'lr': 0.0004997411423951292, 'samples': 795840, 'steps': 4144, 'loss/train': 2.074369192123413} -08/30/2021 13:56:50 - INFO - __main__ - Step 4146: {'lr': 0.0004997409009088979, 'samples': 796032, 'steps': 4145, 'loss/train': 1.7636322975158691} -08/30/2021 13:56:52 - INFO - __main__ - Step 4147: {'lr': 0.0004997406593101373, 'samples': 796224, 'steps': 4146, 'loss/train': 1.8120797872543335} -08/30/2021 13:56:53 - INFO - __main__ - Step 4148: {'lr': 0.0004997404175988474, 'samples': 796416, 'steps': 4147, 'loss/train': 0.9852719306945801} -08/30/2021 13:56:53 - INFO - __main__ - Step 4149: {'lr': 0.0004997401757750282, 'samples': 796608, 'steps': 4148, 'loss/train': 1.135817289352417} -08/30/2021 13:56:53 - INFO - __main__ - Step 4150: {'lr': 0.00049973993383868, 'samples': 796800, 'steps': 4149, 'loss/train': 2.8767166137695312} -08/30/2021 13:56:54 - INFO - __main__ - Step 4151: {'lr': 0.0004997396917898029, 'samples': 796992, 'steps': 4150, 'loss/train': 2.903456449508667} -08/30/2021 13:56:54 - INFO - __main__ - Step 4152: {'lr': 0.0004997394496283969, 'samples': 797184, 'steps': 4151, 'loss/train': 2.2797820568084717} -08/30/2021 13:56:56 - INFO - __main__ - Step 4153: {'lr': 0.0004997392073544622, 'samples': 797376, 'steps': 4152, 'loss/train': 2.748669385910034} -08/30/2021 13:56:56 - INFO - __main__ - Step 4154: {'lr': 0.0004997389649679987, 'samples': 797568, 'steps': 4153, 'loss/train': 3.0491771697998047} -08/30/2021 13:56:56 - INFO - __main__ - Step 4155: {'lr': 0.0004997387224690068, 'samples': 797760, 'steps': 4154, 'loss/train': 2.677032947540283} -08/30/2021 13:56:57 - INFO - __main__ - Step 4156: {'lr': 0.0004997384798574865, 'samples': 797952, 'steps': 4155, 'loss/train': 2.6187453269958496} -08/30/2021 13:56:57 - INFO - __main__ - Step 4157: {'lr': 0.0004997382371334379, 'samples': 798144, 'steps': 4156, 'loss/train': 2.9816508293151855} -08/30/2021 13:56:59 - INFO - __main__ - Step 4158: {'lr': 0.0004997379942968611, 'samples': 798336, 'steps': 4157, 'loss/train': 2.465806722640991} -08/30/2021 13:57:00 - INFO - __main__ - Step 4159: {'lr': 0.0004997377513477562, 'samples': 798528, 'steps': 4158, 'loss/train': 2.595107316970825} -08/30/2021 13:57:00 - INFO - __main__ - Step 4160: {'lr': 0.0004997375082861234, 'samples': 798720, 'steps': 4159, 'loss/train': 2.850452184677124} -08/30/2021 13:57:00 - INFO - __main__ - Step 4161: {'lr': 0.0004997372651119626, 'samples': 798912, 'steps': 4160, 'loss/train': 1.9784674644470215} -08/30/2021 13:57:01 - INFO - __main__ - Step 4162: {'lr': 0.0004997370218252741, 'samples': 799104, 'steps': 4161, 'loss/train': 3.3903627395629883} -08/30/2021 13:57:03 - INFO - __main__ - Step 4163: {'lr': 0.000499736778426058, 'samples': 799296, 'steps': 4162, 'loss/train': 1.924661636352539} -08/30/2021 13:57:03 - INFO - __main__ - Step 4164: {'lr': 0.0004997365349143142, 'samples': 799488, 'steps': 4163, 'loss/train': 4.557950496673584} -08/30/2021 13:57:03 - INFO - __main__ - Step 4165: {'lr': 0.0004997362912900432, 'samples': 799680, 'steps': 4164, 'loss/train': 2.1999592781066895} -08/30/2021 13:57:04 - INFO - __main__ - Step 4166: {'lr': 0.0004997360475532447, 'samples': 799872, 'steps': 4165, 'loss/train': 1.7625823020935059} -08/30/2021 13:57:04 - INFO - __main__ - Step 4167: {'lr': 0.000499735803703919, 'samples': 800064, 'steps': 4166, 'loss/train': 1.29753839969635} -08/30/2021 13:57:05 - INFO - __main__ - Step 4168: {'lr': 0.0004997355597420663, 'samples': 800256, 'steps': 4167, 'loss/train': 2.5071189403533936} -08/30/2021 13:57:06 - INFO - __main__ - Step 4169: {'lr': 0.0004997353156676866, 'samples': 800448, 'steps': 4168, 'loss/train': 2.628887176513672} -08/30/2021 13:57:07 - INFO - __main__ - Step 4170: {'lr': 0.0004997350714807799, 'samples': 800640, 'steps': 4169, 'loss/train': 2.701754570007324} -08/30/2021 13:57:07 - INFO - __main__ - Step 4171: {'lr': 0.0004997348271813466, 'samples': 800832, 'steps': 4170, 'loss/train': 2.419128179550171} -08/30/2021 13:57:07 - INFO - __main__ - Step 4172: {'lr': 0.0004997345827693865, 'samples': 801024, 'steps': 4171, 'loss/train': 1.9172649383544922} -08/30/2021 13:57:08 - INFO - __main__ - Step 4173: {'lr': 0.0004997343382448999, 'samples': 801216, 'steps': 4172, 'loss/train': 2.6126654148101807} -08/30/2021 13:57:08 - INFO - __main__ - Step 4174: {'lr': 0.0004997340936078869, 'samples': 801408, 'steps': 4173, 'loss/train': 2.3526010513305664} -08/30/2021 13:57:10 - INFO - __main__ - Step 4175: {'lr': 0.0004997338488583475, 'samples': 801600, 'steps': 4174, 'loss/train': 2.316492795944214} -08/30/2021 13:57:10 - INFO - __main__ - Step 4176: {'lr': 0.000499733603996282, 'samples': 801792, 'steps': 4175, 'loss/train': 2.7608721256256104} -08/30/2021 13:57:11 - INFO - __main__ - Step 4177: {'lr': 0.0004997333590216902, 'samples': 801984, 'steps': 4176, 'loss/train': 1.7769652605056763} -08/30/2021 13:57:11 - INFO - __main__ - Step 4178: {'lr': 0.0004997331139345725, 'samples': 802176, 'steps': 4177, 'loss/train': 2.848891258239746} -08/30/2021 13:57:11 - INFO - __main__ - Step 4179: {'lr': 0.000499732868734929, 'samples': 802368, 'steps': 4178, 'loss/train': 5.5596184730529785} -08/30/2021 13:57:13 - INFO - __main__ - Step 4180: {'lr': 0.0004997326234227596, 'samples': 802560, 'steps': 4179, 'loss/train': 2.2745630741119385} -08/30/2021 13:57:13 - INFO - __main__ - Step 4181: {'lr': 0.0004997323779980646, 'samples': 802752, 'steps': 4180, 'loss/train': 2.6148009300231934} -08/30/2021 13:57:14 - INFO - __main__ - Step 4182: {'lr': 0.0004997321324608441, 'samples': 802944, 'steps': 4181, 'loss/train': 2.24898624420166} -08/30/2021 13:57:14 - INFO - __main__ - Step 4183: {'lr': 0.0004997318868110981, 'samples': 803136, 'steps': 4182, 'loss/train': 2.8404312133789062} -08/30/2021 13:57:14 - INFO - __main__ - Step 4184: {'lr': 0.0004997316410488267, 'samples': 803328, 'steps': 4183, 'loss/train': 2.5526809692382812} -08/30/2021 13:57:16 - INFO - __main__ - Step 4185: {'lr': 0.0004997313951740301, 'samples': 803520, 'steps': 4184, 'loss/train': 2.9416213035583496} -08/30/2021 13:57:17 - INFO - __main__ - Step 4186: {'lr': 0.0004997311491867083, 'samples': 803712, 'steps': 4185, 'loss/train': 2.0505666732788086} -08/30/2021 13:57:17 - INFO - __main__ - Step 4187: {'lr': 0.0004997309030868617, 'samples': 803904, 'steps': 4186, 'loss/train': 1.945277214050293} -08/30/2021 13:57:17 - INFO - __main__ - Step 4188: {'lr': 0.0004997306568744901, 'samples': 804096, 'steps': 4187, 'loss/train': 3.2816596031188965} -08/30/2021 13:57:18 - INFO - __main__ - Step 4189: {'lr': 0.0004997304105495938, 'samples': 804288, 'steps': 4188, 'loss/train': 2.8236606121063232} -08/30/2021 13:57:18 - INFO - __main__ - Step 4190: {'lr': 0.0004997301641121727, 'samples': 804480, 'steps': 4189, 'loss/train': 1.0542320013046265} -08/30/2021 13:57:19 - INFO - __main__ - Step 4191: {'lr': 0.0004997299175622271, 'samples': 804672, 'steps': 4190, 'loss/train': 2.4775097370147705} -08/30/2021 13:57:20 - INFO - __main__ - Step 4192: {'lr': 0.000499729670899757, 'samples': 804864, 'steps': 4191, 'loss/train': 2.530005931854248} -08/30/2021 13:57:20 - INFO - __main__ - Step 4193: {'lr': 0.0004997294241247627, 'samples': 805056, 'steps': 4192, 'loss/train': 2.8062233924865723} -08/30/2021 13:57:21 - INFO - __main__ - Step 4194: {'lr': 0.0004997291772372441, 'samples': 805248, 'steps': 4193, 'loss/train': 1.4623937606811523} -08/30/2021 13:57:21 - INFO - __main__ - Step 4195: {'lr': 0.0004997289302372014, 'samples': 805440, 'steps': 4194, 'loss/train': 2.715535879135132} -08/30/2021 13:57:22 - INFO - __main__ - Step 4196: {'lr': 0.0004997286831246347, 'samples': 805632, 'steps': 4195, 'loss/train': 2.6134181022644043} -08/30/2021 13:57:23 - INFO - __main__ - Step 4197: {'lr': 0.0004997284358995441, 'samples': 805824, 'steps': 4196, 'loss/train': 2.440012216567993} -08/30/2021 13:57:23 - INFO - __main__ - Step 4198: {'lr': 0.0004997281885619297, 'samples': 806016, 'steps': 4197, 'loss/train': 2.4690046310424805} -08/30/2021 13:57:24 - INFO - __main__ - Step 4199: {'lr': 0.0004997279411117916, 'samples': 806208, 'steps': 4198, 'loss/train': 2.0587642192840576} -08/30/2021 13:57:24 - INFO - __main__ - Step 4200: {'lr': 0.00049972769354913, 'samples': 806400, 'steps': 4199, 'loss/train': 2.0000696182250977} -08/30/2021 13:57:26 - INFO - __main__ - Step 4201: {'lr': 0.0004997274458739449, 'samples': 806592, 'steps': 4200, 'loss/train': 2.9006898403167725} -08/30/2021 13:57:26 - INFO - __main__ - Step 4202: {'lr': 0.0004997271980862366, 'samples': 806784, 'steps': 4201, 'loss/train': 2.264946699142456} -08/30/2021 13:57:27 - INFO - __main__ - Step 4203: {'lr': 0.000499726950186005, 'samples': 806976, 'steps': 4202, 'loss/train': 2.459864616394043} -08/30/2021 13:57:27 - INFO - __main__ - Step 4204: {'lr': 0.0004997267021732502, 'samples': 807168, 'steps': 4203, 'loss/train': 0.8687018156051636} -08/30/2021 13:57:27 - INFO - __main__ - Step 4205: {'lr': 0.0004997264540479724, 'samples': 807360, 'steps': 4204, 'loss/train': 0.7052633166313171} -08/30/2021 13:57:28 - INFO - __main__ - Step 4206: {'lr': 0.0004997262058101719, 'samples': 807552, 'steps': 4205, 'loss/train': 2.1795976161956787} -08/30/2021 13:57:29 - INFO - __main__ - Step 4207: {'lr': 0.0004997259574598485, 'samples': 807744, 'steps': 4206, 'loss/train': 2.8340301513671875} -08/30/2021 13:57:30 - INFO - __main__ - Step 4208: {'lr': 0.0004997257089970024, 'samples': 807936, 'steps': 4207, 'loss/train': 2.3500144481658936} -08/30/2021 13:57:30 - INFO - __main__ - Step 4209: {'lr': 0.0004997254604216338, 'samples': 808128, 'steps': 4208, 'loss/train': 2.3471860885620117} -08/30/2021 13:57:30 - INFO - __main__ - Step 4210: {'lr': 0.0004997252117337428, 'samples': 808320, 'steps': 4209, 'loss/train': 1.684325933456421} -08/30/2021 13:57:31 - INFO - __main__ - Step 4211: {'lr': 0.0004997249629333294, 'samples': 808512, 'steps': 4210, 'loss/train': 2.3704142570495605} -08/30/2021 13:57:32 - INFO - __main__ - Step 4212: {'lr': 0.0004997247140203939, 'samples': 808704, 'steps': 4211, 'loss/train': 2.325749397277832} -08/30/2021 13:57:33 - INFO - __main__ - Step 4213: {'lr': 0.0004997244649949362, 'samples': 808896, 'steps': 4212, 'loss/train': 2.1269288063049316} -08/30/2021 13:57:33 - INFO - __main__ - Step 4214: {'lr': 0.0004997242158569564, 'samples': 809088, 'steps': 4213, 'loss/train': 2.6444509029388428} -08/30/2021 13:57:33 - INFO - __main__ - Step 4215: {'lr': 0.0004997239666064549, 'samples': 809280, 'steps': 4214, 'loss/train': 3.029888391494751} -08/30/2021 13:57:34 - INFO - __main__ - Step 4216: {'lr': 0.0004997237172434316, 'samples': 809472, 'steps': 4215, 'loss/train': 2.305338144302368} -08/30/2021 13:57:36 - INFO - __main__ - Step 4217: {'lr': 0.0004997234677678867, 'samples': 809664, 'steps': 4216, 'loss/train': 1.9964935779571533} -08/30/2021 13:57:37 - INFO - __main__ - Step 4218: {'lr': 0.0004997232181798201, 'samples': 809856, 'steps': 4217, 'loss/train': 2.813920021057129} -08/30/2021 13:57:37 - INFO - __main__ - Step 4219: {'lr': 0.0004997229684792322, 'samples': 810048, 'steps': 4218, 'loss/train': 0.4271639585494995} -08/30/2021 13:57:37 - INFO - __main__ - Step 4220: {'lr': 0.000499722718666123, 'samples': 810240, 'steps': 4219, 'loss/train': 2.1813101768493652} -08/30/2021 13:57:38 - INFO - __main__ - Step 4221: {'lr': 0.0004997224687404926, 'samples': 810432, 'steps': 4220, 'loss/train': 2.128692865371704} -08/30/2021 13:57:40 - INFO - __main__ - Step 4222: {'lr': 0.0004997222187023409, 'samples': 810624, 'steps': 4221, 'loss/train': 2.451427698135376} -08/30/2021 13:57:40 - INFO - __main__ - Step 4223: {'lr': 0.0004997219685516684, 'samples': 810816, 'steps': 4222, 'loss/train': 2.2508769035339355} -08/30/2021 13:57:41 - INFO - __main__ - Step 4224: {'lr': 0.000499721718288475, 'samples': 811008, 'steps': 4223, 'loss/train': 2.1557271480560303} -08/30/2021 13:57:41 - INFO - __main__ - Step 4225: {'lr': 0.0004997214679127609, 'samples': 811200, 'steps': 4224, 'loss/train': 1.5057705640792847} -08/30/2021 13:57:41 - INFO - __main__ - Step 4226: {'lr': 0.000499721217424526, 'samples': 811392, 'steps': 4225, 'loss/train': 4.9801859855651855} -08/30/2021 13:57:42 - INFO - __main__ - Step 4227: {'lr': 0.0004997209668237707, 'samples': 811584, 'steps': 4226, 'loss/train': 2.1657800674438477} -08/30/2021 13:57:44 - INFO - __main__ - Step 4228: {'lr': 0.0004997207161104951, 'samples': 811776, 'steps': 4227, 'loss/train': 2.620006561279297} -08/30/2021 13:57:44 - INFO - __main__ - Step 4229: {'lr': 0.0004997204652846991, 'samples': 811968, 'steps': 4228, 'loss/train': 2.7723963260650635} -08/30/2021 13:57:45 - INFO - __main__ - Step 4230: {'lr': 0.0004997202143463828, 'samples': 812160, 'steps': 4229, 'loss/train': 2.4335696697235107} -08/30/2021 13:57:45 - INFO - __main__ - Step 4231: {'lr': 0.0004997199632955464, 'samples': 812352, 'steps': 4230, 'loss/train': 2.617645025253296} -08/30/2021 13:57:45 - INFO - __main__ - Step 4232: {'lr': 0.0004997197121321903, 'samples': 812544, 'steps': 4231, 'loss/train': 1.4652386903762817} -08/30/2021 13:57:46 - INFO - __main__ - Step 4233: {'lr': 0.0004997194608563142, 'samples': 812736, 'steps': 4232, 'loss/train': 2.947063684463501} -08/30/2021 13:57:47 - INFO - __main__ - Step 4234: {'lr': 0.0004997192094679183, 'samples': 812928, 'steps': 4233, 'loss/train': 3.2186663150787354} -08/30/2021 13:57:48 - INFO - __main__ - Step 4235: {'lr': 0.0004997189579670028, 'samples': 813120, 'steps': 4234, 'loss/train': 2.9579813480377197} -08/30/2021 13:57:48 - INFO - __main__ - Step 4236: {'lr': 0.0004997187063535679, 'samples': 813312, 'steps': 4235, 'loss/train': 2.842017412185669} -08/30/2021 13:57:49 - INFO - __main__ - Step 4237: {'lr': 0.0004997184546276135, 'samples': 813504, 'steps': 4236, 'loss/train': 2.817560911178589} -08/30/2021 13:57:49 - INFO - __main__ - Step 4238: {'lr': 0.0004997182027891399, 'samples': 813696, 'steps': 4237, 'loss/train': 3.4652514457702637} -08/30/2021 13:57:50 - INFO - __main__ - Step 4239: {'lr': 0.000499717950838147, 'samples': 813888, 'steps': 4238, 'loss/train': 1.995408058166504} -08/30/2021 13:57:51 - INFO - __main__ - Step 4240: {'lr': 0.0004997176987746352, 'samples': 814080, 'steps': 4239, 'loss/train': 2.921905517578125} -08/30/2021 13:57:51 - INFO - __main__ - Step 4241: {'lr': 0.0004997174465986043, 'samples': 814272, 'steps': 4240, 'loss/train': 3.066000461578369} -08/30/2021 13:57:52 - INFO - __main__ - Step 4242: {'lr': 0.0004997171943100547, 'samples': 814464, 'steps': 4241, 'loss/train': 3.705711603164673} -08/30/2021 13:57:52 - INFO - __main__ - Step 4243: {'lr': 0.0004997169419089863, 'samples': 814656, 'steps': 4242, 'loss/train': 1.898451328277588} -08/30/2021 13:57:52 - INFO - __main__ - Step 4244: {'lr': 0.0004997166893953994, 'samples': 814848, 'steps': 4243, 'loss/train': 2.2891695499420166} -08/30/2021 13:57:54 - INFO - __main__ - Step 4245: {'lr': 0.000499716436769294, 'samples': 815040, 'steps': 4244, 'loss/train': 2.541060447692871} -08/30/2021 13:57:54 - INFO - __main__ - Step 4246: {'lr': 0.0004997161840306701, 'samples': 815232, 'steps': 4245, 'loss/train': 2.1411869525909424} -08/30/2021 13:57:55 - INFO - __main__ - Step 4247: {'lr': 0.0004997159311795281, 'samples': 815424, 'steps': 4246, 'loss/train': 2.947779417037964} -08/30/2021 13:57:55 - INFO - __main__ - Step 4248: {'lr': 0.0004997156782158679, 'samples': 815616, 'steps': 4247, 'loss/train': 2.754335880279541} -08/30/2021 13:57:55 - INFO - __main__ - Step 4249: {'lr': 0.0004997154251396896, 'samples': 815808, 'steps': 4248, 'loss/train': 2.0951056480407715} -08/30/2021 13:57:57 - INFO - __main__ - Step 4250: {'lr': 0.0004997151719509935, 'samples': 816000, 'steps': 4249, 'loss/train': 2.4612369537353516} -08/30/2021 13:57:57 - INFO - __main__ - Step 4251: {'lr': 0.0004997149186497795, 'samples': 816192, 'steps': 4250, 'loss/train': 2.6147375106811523} -08/30/2021 13:57:58 - INFO - __main__ - Step 4252: {'lr': 0.0004997146652360478, 'samples': 816384, 'steps': 4251, 'loss/train': 2.062556743621826} -08/30/2021 13:57:58 - INFO - __main__ - Step 4253: {'lr': 0.0004997144117097986, 'samples': 816576, 'steps': 4252, 'loss/train': 2.607947587966919} -08/30/2021 13:57:58 - INFO - __main__ - Step 4254: {'lr': 0.0004997141580710318, 'samples': 816768, 'steps': 4253, 'loss/train': 2.2088544368743896} -08/30/2021 13:58:00 - INFO - __main__ - Step 4255: {'lr': 0.0004997139043197478, 'samples': 816960, 'steps': 4254, 'loss/train': 2.6336066722869873} -08/30/2021 13:58:00 - INFO - __main__ - Step 4256: {'lr': 0.0004997136504559465, 'samples': 817152, 'steps': 4255, 'loss/train': 2.7068982124328613} -08/30/2021 13:58:01 - INFO - __main__ - Step 4257: {'lr': 0.0004997133964796281, 'samples': 817344, 'steps': 4256, 'loss/train': 1.9383596181869507} -08/30/2021 13:58:01 - INFO - __main__ - Step 4258: {'lr': 0.0004997131423907927, 'samples': 817536, 'steps': 4257, 'loss/train': 1.8818825483322144} -08/30/2021 13:58:01 - INFO - __main__ - Step 4259: {'lr': 0.0004997128881894404, 'samples': 817728, 'steps': 4258, 'loss/train': 2.592486619949341} -08/30/2021 13:58:03 - INFO - __main__ - Step 4260: {'lr': 0.0004997126338755714, 'samples': 817920, 'steps': 4259, 'loss/train': 0.5001815557479858} -08/30/2021 13:58:04 - INFO - __main__ - Step 4261: {'lr': 0.0004997123794491856, 'samples': 818112, 'steps': 4260, 'loss/train': 2.1100869178771973} -08/30/2021 13:58:04 - INFO - __main__ - Step 4262: {'lr': 0.0004997121249102834, 'samples': 818304, 'steps': 4261, 'loss/train': 0.4378907084465027} -08/30/2021 13:58:04 - INFO - __main__ - Step 4263: {'lr': 0.0004997118702588647, 'samples': 818496, 'steps': 4262, 'loss/train': 1.0724092721939087} -08/30/2021 13:58:05 - INFO - __main__ - Step 4264: {'lr': 0.0004997116154949297, 'samples': 818688, 'steps': 4263, 'loss/train': 2.519207715988159} -08/30/2021 13:58:05 - INFO - __main__ - Step 4265: {'lr': 0.0004997113606184785, 'samples': 818880, 'steps': 4264, 'loss/train': 2.746309280395508} -08/30/2021 13:58:07 - INFO - __main__ - Step 4266: {'lr': 0.0004997111056295111, 'samples': 819072, 'steps': 4265, 'loss/train': 2.795696496963501} -08/30/2021 13:58:07 - INFO - __main__ - Step 4267: {'lr': 0.0004997108505280279, 'samples': 819264, 'steps': 4266, 'loss/train': 3.4674010276794434} -08/30/2021 13:58:07 - INFO - __main__ - Step 4268: {'lr': 0.0004997105953140288, 'samples': 819456, 'steps': 4267, 'loss/train': 0.369831919670105} -08/30/2021 13:58:08 - INFO - __main__ - Step 4269: {'lr': 0.0004997103399875139, 'samples': 819648, 'steps': 4268, 'loss/train': 2.382072925567627} -08/30/2021 13:58:08 - INFO - __main__ - Step 4270: {'lr': 0.0004997100845484834, 'samples': 819840, 'steps': 4269, 'loss/train': 2.774012804031372} -08/30/2021 13:58:10 - INFO - __main__ - Step 4271: {'lr': 0.0004997098289969374, 'samples': 820032, 'steps': 4270, 'loss/train': 2.4658544063568115} -08/30/2021 13:58:11 - INFO - __main__ - Step 4272: {'lr': 0.0004997095733328761, 'samples': 820224, 'steps': 4271, 'loss/train': 2.229326009750366} -08/30/2021 13:58:11 - INFO - __main__ - Step 4273: {'lr': 0.0004997093175562994, 'samples': 820416, 'steps': 4272, 'loss/train': 3.0871241092681885} -08/30/2021 13:58:12 - INFO - __main__ - Step 4274: {'lr': 0.0004997090616672076, 'samples': 820608, 'steps': 4273, 'loss/train': 2.0945723056793213} -08/30/2021 13:58:12 - INFO - __main__ - Step 4275: {'lr': 0.0004997088056656006, 'samples': 820800, 'steps': 4274, 'loss/train': 2.119072437286377} -08/30/2021 13:58:13 - INFO - __main__ - Step 4276: {'lr': 0.0004997085495514788, 'samples': 820992, 'steps': 4275, 'loss/train': 2.942012310028076} -08/30/2021 13:58:14 - INFO - __main__ - Step 4277: {'lr': 0.0004997082933248421, 'samples': 821184, 'steps': 4276, 'loss/train': 1.1856452226638794} -08/30/2021 13:58:14 - INFO - __main__ - Step 4278: {'lr': 0.0004997080369856907, 'samples': 821376, 'steps': 4277, 'loss/train': 2.270286798477173} -08/30/2021 13:58:15 - INFO - __main__ - Step 4279: {'lr': 0.0004997077805340248, 'samples': 821568, 'steps': 4278, 'loss/train': 2.501870632171631} -08/30/2021 13:58:15 - INFO - __main__ - Step 4280: {'lr': 0.0004997075239698445, 'samples': 821760, 'steps': 4279, 'loss/train': 2.7107431888580322} -08/30/2021 13:58:16 - INFO - __main__ - Step 4281: {'lr': 0.0004997072672931497, 'samples': 821952, 'steps': 4280, 'loss/train': 2.063675880432129} -08/30/2021 13:58:17 - INFO - __main__ - Step 4282: {'lr': 0.0004997070105039407, 'samples': 822144, 'steps': 4281, 'loss/train': 2.674036979675293} -08/30/2021 13:58:17 - INFO - __main__ - Step 4283: {'lr': 0.0004997067536022176, 'samples': 822336, 'steps': 4282, 'loss/train': 1.758373498916626} -08/30/2021 13:58:18 - INFO - __main__ - Step 4284: {'lr': 0.0004997064965879804, 'samples': 822528, 'steps': 4283, 'loss/train': 2.2967076301574707} -08/30/2021 13:58:18 - INFO - __main__ - Step 4285: {'lr': 0.0004997062394612293, 'samples': 822720, 'steps': 4284, 'loss/train': 2.3500163555145264} -08/30/2021 13:58:18 - INFO - __main__ - Step 4286: {'lr': 0.0004997059822219645, 'samples': 822912, 'steps': 4285, 'loss/train': 2.7859182357788086} -08/30/2021 13:58:20 - INFO - __main__ - Step 4287: {'lr': 0.000499705724870186, 'samples': 823104, 'steps': 4286, 'loss/train': 2.0944437980651855} -08/30/2021 13:58:20 - INFO - __main__ - Step 4288: {'lr': 0.0004997054674058941, 'samples': 823296, 'steps': 4287, 'loss/train': 2.4240219593048096} -08/30/2021 13:58:21 - INFO - __main__ - Step 4289: {'lr': 0.0004997052098290886, 'samples': 823488, 'steps': 4288, 'loss/train': 1.5310779809951782} -08/30/2021 13:58:21 - INFO - __main__ - Step 4290: {'lr': 0.0004997049521397698, 'samples': 823680, 'steps': 4289, 'loss/train': 1.909066081047058} -08/30/2021 13:58:21 - INFO - __main__ - Step 4291: {'lr': 0.0004997046943379379, 'samples': 823872, 'steps': 4290, 'loss/train': 1.9988086223602295} -08/30/2021 13:58:23 - INFO - __main__ - Step 4292: {'lr': 0.0004997044364235928, 'samples': 824064, 'steps': 4291, 'loss/train': 2.4219062328338623} -08/30/2021 13:58:23 - INFO - __main__ - Step 4293: {'lr': 0.0004997041783967348, 'samples': 824256, 'steps': 4292, 'loss/train': 2.3637895584106445} -08/30/2021 13:58:24 - INFO - __main__ - Step 4294: {'lr': 0.0004997039202573639, 'samples': 824448, 'steps': 4293, 'loss/train': 2.4218428134918213} -08/30/2021 13:58:24 - INFO - __main__ - Step 4295: {'lr': 0.0004997036620054803, 'samples': 824640, 'steps': 4294, 'loss/train': 2.5160958766937256} -08/30/2021 13:58:24 - INFO - __main__ - Step 4296: {'lr': 0.0004997034036410841, 'samples': 824832, 'steps': 4295, 'loss/train': 2.5857794284820557} -08/30/2021 13:58:26 - INFO - __main__ - Step 4297: {'lr': 0.0004997031451641754, 'samples': 825024, 'steps': 4296, 'loss/train': 2.141510486602783} -08/30/2021 13:58:26 - INFO - __main__ - Step 4298: {'lr': 0.0004997028865747542, 'samples': 825216, 'steps': 4297, 'loss/train': 2.3709964752197266} -08/30/2021 13:58:27 - INFO - __main__ - Step 4299: {'lr': 0.0004997026278728209, 'samples': 825408, 'steps': 4298, 'loss/train': 1.2953389883041382} -08/30/2021 13:58:27 - INFO - __main__ - Step 4300: {'lr': 0.0004997023690583753, 'samples': 825600, 'steps': 4299, 'loss/train': 1.8751654624938965} -08/30/2021 13:58:27 - INFO - __main__ - Step 4301: {'lr': 0.0004997021101314179, 'samples': 825792, 'steps': 4300, 'loss/train': 2.8405394554138184} -08/30/2021 13:58:29 - INFO - __main__ - Step 4302: {'lr': 0.0004997018510919483, 'samples': 825984, 'steps': 4301, 'loss/train': 2.485252857208252} -08/30/2021 13:58:30 - INFO - __main__ - Step 4303: {'lr': 0.0004997015919399671, 'samples': 826176, 'steps': 4302, 'loss/train': 1.3849883079528809} -08/30/2021 13:58:30 - INFO - __main__ - Step 4304: {'lr': 0.0004997013326754742, 'samples': 826368, 'steps': 4303, 'loss/train': 2.836071729660034} -08/30/2021 13:58:30 - INFO - __main__ - Step 4305: {'lr': 0.0004997010732984696, 'samples': 826560, 'steps': 4304, 'loss/train': 0.530387818813324} -08/30/2021 13:58:31 - INFO - __main__ - Step 4306: {'lr': 0.0004997008138089536, 'samples': 826752, 'steps': 4305, 'loss/train': 2.038630485534668} -08/30/2021 13:58:33 - INFO - __main__ - Step 4307: {'lr': 0.0004997005542069263, 'samples': 826944, 'steps': 4306, 'loss/train': 2.2373640537261963} -08/30/2021 13:58:33 - INFO - __main__ - Step 4308: {'lr': 0.0004997002944923878, 'samples': 827136, 'steps': 4307, 'loss/train': 2.712813377380371} -08/30/2021 13:58:33 - INFO - __main__ - Step 4309: {'lr': 0.0004997000346653381, 'samples': 827328, 'steps': 4308, 'loss/train': 0.8218368291854858} -08/30/2021 13:58:34 - INFO - __main__ - Step 4310: {'lr': 0.0004996997747257775, 'samples': 827520, 'steps': 4309, 'loss/train': 0.7425898909568787} -08/30/2021 13:58:34 - INFO - __main__ - Step 4311: {'lr': 0.000499699514673706, 'samples': 827712, 'steps': 4310, 'loss/train': 2.148676633834839} -08/30/2021 13:58:36 - INFO - __main__ - Step 4312: {'lr': 0.0004996992545091239, 'samples': 827904, 'steps': 4311, 'loss/train': 1.9591997861862183} -08/30/2021 13:58:36 - INFO - __main__ - Step 4313: {'lr': 0.000499698994232031, 'samples': 828096, 'steps': 4312, 'loss/train': 2.2927918434143066} -08/30/2021 13:58:36 - INFO - __main__ - Step 4314: {'lr': 0.0004996987338424276, 'samples': 828288, 'steps': 4313, 'loss/train': 2.691950798034668} -08/30/2021 13:58:37 - INFO - __main__ - Step 4315: {'lr': 0.0004996984733403138, 'samples': 828480, 'steps': 4314, 'loss/train': 2.2400591373443604} -08/30/2021 13:58:37 - INFO - __main__ - Step 4316: {'lr': 0.0004996982127256898, 'samples': 828672, 'steps': 4315, 'loss/train': 1.3791862726211548} -08/30/2021 13:58:39 - INFO - __main__ - Step 4317: {'lr': 0.0004996979519985556, 'samples': 828864, 'steps': 4316, 'loss/train': 2.515639543533325} -08/30/2021 13:58:40 - INFO - __main__ - Step 4318: {'lr': 0.0004996976911589114, 'samples': 829056, 'steps': 4317, 'loss/train': 2.303879976272583} -08/30/2021 13:58:40 - INFO - __main__ - Step 4319: {'lr': 0.0004996974302067572, 'samples': 829248, 'steps': 4318, 'loss/train': 2.3199965953826904} -08/30/2021 13:58:40 - INFO - __main__ - Step 4320: {'lr': 0.0004996971691420931, 'samples': 829440, 'steps': 4319, 'loss/train': 2.417445421218872} -08/30/2021 13:58:41 - INFO - __main__ - Step 4321: {'lr': 0.0004996969079649195, 'samples': 829632, 'steps': 4320, 'loss/train': 1.4854261875152588} -08/30/2021 13:58:41 - INFO - __main__ - Step 4322: {'lr': 0.0004996966466752362, 'samples': 829824, 'steps': 4321, 'loss/train': 1.9340102672576904} -08/30/2021 13:58:41 - INFO - __main__ - Step 4323: {'lr': 0.0004996963852730436, 'samples': 830016, 'steps': 4322, 'loss/train': 0.8232200741767883} -08/30/2021 13:58:43 - INFO - __main__ - Step 4324: {'lr': 0.0004996961237583415, 'samples': 830208, 'steps': 4323, 'loss/train': 2.788846015930176} -08/30/2021 13:58:43 - INFO - __main__ - Step 4325: {'lr': 0.0004996958621311302, 'samples': 830400, 'steps': 4324, 'loss/train': 1.918544054031372} -08/30/2021 13:58:44 - INFO - __main__ - Step 4326: {'lr': 0.00049969560039141, 'samples': 830592, 'steps': 4325, 'loss/train': 2.509490966796875} -08/30/2021 13:58:44 - INFO - __main__ - Step 4327: {'lr': 0.0004996953385391806, 'samples': 830784, 'steps': 4326, 'loss/train': 1.5261305570602417} -08/30/2021 13:58:45 - INFO - __main__ - Step 4328: {'lr': 0.0004996950765744424, 'samples': 830976, 'steps': 4327, 'loss/train': 4.768551349639893} -08/30/2021 13:58:47 - INFO - __main__ - Step 4329: {'lr': 0.0004996948144971953, 'samples': 831168, 'steps': 4328, 'loss/train': 2.8698997497558594} -08/30/2021 13:58:47 - INFO - __main__ - Step 4330: {'lr': 0.0004996945523074398, 'samples': 831360, 'steps': 4329, 'loss/train': 2.0760560035705566} -08/30/2021 13:58:48 - INFO - __main__ - Step 4331: {'lr': 0.0004996942900051757, 'samples': 831552, 'steps': 4330, 'loss/train': 2.6386237144470215} -08/30/2021 13:58:48 - INFO - __main__ - Step 4332: {'lr': 0.0004996940275904031, 'samples': 831744, 'steps': 4331, 'loss/train': 2.426943302154541} -08/30/2021 13:58:48 - INFO - __main__ - Step 4333: {'lr': 0.0004996937650631224, 'samples': 831936, 'steps': 4332, 'loss/train': 2.3700973987579346} -08/30/2021 13:58:49 - INFO - __main__ - Step 4334: {'lr': 0.0004996935024233335, 'samples': 832128, 'steps': 4333, 'loss/train': 2.332881212234497} -08/30/2021 13:58:50 - INFO - __main__ - Step 4335: {'lr': 0.0004996932396710365, 'samples': 832320, 'steps': 4334, 'loss/train': 2.653916358947754} -08/30/2021 13:58:51 - INFO - __main__ - Step 4336: {'lr': 0.0004996929768062316, 'samples': 832512, 'steps': 4335, 'loss/train': 0.45033589005470276} -08/30/2021 13:58:51 - INFO - __main__ - Step 4337: {'lr': 0.0004996927138289189, 'samples': 832704, 'steps': 4336, 'loss/train': 2.5595593452453613} -08/30/2021 13:58:52 - INFO - __main__ - Step 4338: {'lr': 0.0004996924507390985, 'samples': 832896, 'steps': 4337, 'loss/train': 2.6162071228027344} -08/30/2021 13:58:52 - INFO - __main__ - Step 4339: {'lr': 0.0004996921875367705, 'samples': 833088, 'steps': 4338, 'loss/train': 2.4030649662017822} -08/30/2021 13:58:53 - INFO - __main__ - Step 4340: {'lr': 0.0004996919242219352, 'samples': 833280, 'steps': 4339, 'loss/train': 2.39670467376709} -08/30/2021 13:58:54 - INFO - __main__ - Step 4341: {'lr': 0.0004996916607945925, 'samples': 833472, 'steps': 4340, 'loss/train': 2.164501667022705} -08/30/2021 13:58:54 - INFO - __main__ - Step 4342: {'lr': 0.0004996913972547426, 'samples': 833664, 'steps': 4341, 'loss/train': 2.9331772327423096} -08/30/2021 13:58:55 - INFO - __main__ - Step 4343: {'lr': 0.0004996911336023855, 'samples': 833856, 'steps': 4342, 'loss/train': 2.5203447341918945} -08/30/2021 13:58:55 - INFO - __main__ - Step 4344: {'lr': 0.0004996908698375216, 'samples': 834048, 'steps': 4343, 'loss/train': 0.7685109972953796} -08/30/2021 13:58:57 - INFO - __main__ - Step 4345: {'lr': 0.0004996906059601507, 'samples': 834240, 'steps': 4344, 'loss/train': 2.147205352783203} -08/30/2021 13:58:57 - INFO - __main__ - Step 4346: {'lr': 0.0004996903419702731, 'samples': 834432, 'steps': 4345, 'loss/train': 2.3634419441223145} -08/30/2021 13:58:58 - INFO - __main__ - Step 4347: {'lr': 0.0004996900778678889, 'samples': 834624, 'steps': 4346, 'loss/train': 2.214385509490967} -08/30/2021 13:58:58 - INFO - __main__ - Step 4348: {'lr': 0.0004996898136529982, 'samples': 834816, 'steps': 4347, 'loss/train': 2.25006365776062} -08/30/2021 13:58:58 - INFO - __main__ - Step 4349: {'lr': 0.0004996895493256012, 'samples': 835008, 'steps': 4348, 'loss/train': 0.9130091667175293} -08/30/2021 13:58:59 - INFO - __main__ - Step 4350: {'lr': 0.0004996892848856978, 'samples': 835200, 'steps': 4349, 'loss/train': 2.3988945484161377} -08/30/2021 13:59:00 - INFO - __main__ - Step 4351: {'lr': 0.0004996890203332883, 'samples': 835392, 'steps': 4350, 'loss/train': 2.3409547805786133} -08/30/2021 13:59:01 - INFO - __main__ - Step 4352: {'lr': 0.0004996887556683729, 'samples': 835584, 'steps': 4351, 'loss/train': 2.735775947570801} -08/30/2021 13:59:01 - INFO - __main__ - Step 4353: {'lr': 0.0004996884908909515, 'samples': 835776, 'steps': 4352, 'loss/train': 3.0763423442840576} -08/30/2021 13:59:01 - INFO - __main__ - Step 4354: {'lr': 0.0004996882260010243, 'samples': 835968, 'steps': 4353, 'loss/train': 2.391918897628784} -08/30/2021 13:59:02 - INFO - __main__ - Step 4355: {'lr': 0.0004996879609985915, 'samples': 836160, 'steps': 4354, 'loss/train': 2.481785774230957} -08/30/2021 13:59:04 - INFO - __main__ - Step 4356: {'lr': 0.0004996876958836532, 'samples': 836352, 'steps': 4355, 'loss/train': 2.397257089614868} -08/30/2021 13:59:04 - INFO - __main__ - Step 4357: {'lr': 0.0004996874306562093, 'samples': 836544, 'steps': 4356, 'loss/train': 2.421093702316284} -08/30/2021 13:59:05 - INFO - __main__ - Step 4358: {'lr': 0.0004996871653162602, 'samples': 836736, 'steps': 4357, 'loss/train': 2.3213443756103516} -08/30/2021 13:59:05 - INFO - __main__ - Step 4359: {'lr': 0.0004996868998638059, 'samples': 836928, 'steps': 4358, 'loss/train': 3.1187126636505127} -08/30/2021 13:59:05 - INFO - __main__ - Step 4360: {'lr': 0.0004996866342988467, 'samples': 837120, 'steps': 4359, 'loss/train': 3.13950514793396} -08/30/2021 13:59:06 - INFO - __main__ - Step 4361: {'lr': 0.0004996863686213823, 'samples': 837312, 'steps': 4360, 'loss/train': 3.030313491821289} -08/30/2021 13:59:07 - INFO - __main__ - Step 4362: {'lr': 0.0004996861028314133, 'samples': 837504, 'steps': 4361, 'loss/train': 2.4247844219207764} -08/30/2021 13:59:08 - INFO - __main__ - Step 4363: {'lr': 0.0004996858369289394, 'samples': 837696, 'steps': 4362, 'loss/train': 2.6634891033172607} -08/30/2021 13:59:08 - INFO - __main__ - Step 4364: {'lr': 0.000499685570913961, 'samples': 837888, 'steps': 4363, 'loss/train': 2.71620512008667} -08/30/2021 13:59:08 - INFO - __main__ - Step 4365: {'lr': 0.0004996853047864781, 'samples': 838080, 'steps': 4364, 'loss/train': 2.6044857501983643} -08/30/2021 13:59:09 - INFO - __main__ - Step 4366: {'lr': 0.0004996850385464909, 'samples': 838272, 'steps': 4365, 'loss/train': 2.048746347427368} -08/30/2021 13:59:10 - INFO - __main__ - Step 4367: {'lr': 0.0004996847721939994, 'samples': 838464, 'steps': 4366, 'loss/train': 2.580474615097046} -08/30/2021 13:59:11 - INFO - __main__ - Step 4368: {'lr': 0.0004996845057290039, 'samples': 838656, 'steps': 4367, 'loss/train': 2.8319928646087646} -08/30/2021 13:59:11 - INFO - __main__ - Step 4369: {'lr': 0.0004996842391515044, 'samples': 838848, 'steps': 4368, 'loss/train': 2.554839611053467} -08/30/2021 13:59:11 - INFO - __main__ - Step 4370: {'lr': 0.000499683972461501, 'samples': 839040, 'steps': 4369, 'loss/train': 2.2035911083221436} -08/30/2021 13:59:12 - INFO - __main__ - Step 4371: {'lr': 0.0004996837056589938, 'samples': 839232, 'steps': 4370, 'loss/train': 2.651333808898926} -08/30/2021 13:59:12 - INFO - __main__ - Step 4372: {'lr': 0.0004996834387439831, 'samples': 839424, 'steps': 4371, 'loss/train': 1.8789271116256714} -08/30/2021 13:59:13 - INFO - __main__ - Step 4373: {'lr': 0.0004996831717164689, 'samples': 839616, 'steps': 4372, 'loss/train': 2.723007917404175} -08/30/2021 13:59:14 - INFO - __main__ - Step 4374: {'lr': 0.0004996829045764512, 'samples': 839808, 'steps': 4373, 'loss/train': 2.5256690979003906} -08/30/2021 13:59:14 - INFO - __main__ - Step 4375: {'lr': 0.0004996826373239303, 'samples': 840000, 'steps': 4374, 'loss/train': 2.008065700531006} -08/30/2021 13:59:15 - INFO - __main__ - Step 4376: {'lr': 0.0004996823699589062, 'samples': 840192, 'steps': 4375, 'loss/train': 3.023691177368164} -08/30/2021 13:59:15 - INFO - __main__ - Step 4377: {'lr': 0.0004996821024813791, 'samples': 840384, 'steps': 4376, 'loss/train': 2.7508814334869385} -08/30/2021 13:59:16 - INFO - __main__ - Step 4378: {'lr': 0.0004996818348913491, 'samples': 840576, 'steps': 4377, 'loss/train': 2.824896812438965} -08/30/2021 13:59:17 - INFO - __main__ - Step 4379: {'lr': 0.0004996815671888163, 'samples': 840768, 'steps': 4378, 'loss/train': 2.251624345779419} -08/30/2021 13:59:17 - INFO - __main__ - Step 4380: {'lr': 0.000499681299373781, 'samples': 840960, 'steps': 4379, 'loss/train': 1.3489680290222168} -08/30/2021 13:59:18 - INFO - __main__ - Step 4381: {'lr': 0.0004996810314462429, 'samples': 841152, 'steps': 4380, 'loss/train': 3.206294298171997} -08/30/2021 13:59:18 - INFO - __main__ - Step 4382: {'lr': 0.0004996807634062025, 'samples': 841344, 'steps': 4381, 'loss/train': 2.6561877727508545} -08/30/2021 13:59:20 - INFO - __main__ - Step 4383: {'lr': 0.0004996804952536599, 'samples': 841536, 'steps': 4382, 'loss/train': 2.2637486457824707} -08/30/2021 13:59:20 - INFO - __main__ - Step 4384: {'lr': 0.0004996802269886149, 'samples': 841728, 'steps': 4383, 'loss/train': 2.256096124649048} -08/30/2021 13:59:20 - INFO - __main__ - Step 4385: {'lr': 0.0004996799586110681, 'samples': 841920, 'steps': 4384, 'loss/train': 2.0771517753601074} -08/30/2021 13:59:21 - INFO - __main__ - Step 4386: {'lr': 0.0004996796901210192, 'samples': 842112, 'steps': 4385, 'loss/train': 2.951462507247925} -08/30/2021 13:59:21 - INFO - __main__ - Step 4387: {'lr': 0.0004996794215184685, 'samples': 842304, 'steps': 4386, 'loss/train': 2.0754663944244385} -08/30/2021 13:59:24 - INFO - __main__ - Step 4388: {'lr': 0.0004996791528034161, 'samples': 842496, 'steps': 4387, 'loss/train': 2.625568389892578} -08/30/2021 13:59:24 - INFO - __main__ - Step 4389: {'lr': 0.0004996788839758622, 'samples': 842688, 'steps': 4388, 'loss/train': 2.0868711471557617} -08/30/2021 13:59:24 - INFO - __main__ - Step 4390: {'lr': 0.0004996786150358068, 'samples': 842880, 'steps': 4389, 'loss/train': 1.0992119312286377} -08/30/2021 13:59:25 - INFO - __main__ - Step 4391: {'lr': 0.00049967834598325, 'samples': 843072, 'steps': 4390, 'loss/train': 2.903900146484375} -08/30/2021 13:59:25 - INFO - __main__ - Step 4392: {'lr': 0.0004996780768181921, 'samples': 843264, 'steps': 4391, 'loss/train': 2.5160937309265137} -08/30/2021 13:59:27 - INFO - __main__ - Step 4393: {'lr': 0.0004996778075406331, 'samples': 843456, 'steps': 4392, 'loss/train': 2.3703763484954834} -08/30/2021 13:59:27 - INFO - __main__ - Step 4394: {'lr': 0.0004996775381505731, 'samples': 843648, 'steps': 4393, 'loss/train': 2.8998920917510986} -08/30/2021 13:59:28 - INFO - __main__ - Step 4395: {'lr': 0.0004996772686480122, 'samples': 843840, 'steps': 4394, 'loss/train': 2.3615400791168213} -08/30/2021 13:59:28 - INFO - __main__ - Step 4396: {'lr': 0.0004996769990329507, 'samples': 844032, 'steps': 4395, 'loss/train': 2.7064578533172607} -08/30/2021 13:59:28 - INFO - __main__ - Step 4397: {'lr': 0.0004996767293053885, 'samples': 844224, 'steps': 4396, 'loss/train': 0.9128702878952026} -08/30/2021 13:59:30 - INFO - __main__ - Step 4398: {'lr': 0.0004996764594653258, 'samples': 844416, 'steps': 4397, 'loss/train': 2.0633468627929688} -08/30/2021 13:59:30 - INFO - __main__ - Step 4399: {'lr': 0.0004996761895127628, 'samples': 844608, 'steps': 4398, 'loss/train': 3.204718828201294} -08/30/2021 13:59:31 - INFO - __main__ - Step 4400: {'lr': 0.0004996759194476996, 'samples': 844800, 'steps': 4399, 'loss/train': 2.81738018989563} -08/30/2021 13:59:31 - INFO - __main__ - Step 4401: {'lr': 0.0004996756492701362, 'samples': 844992, 'steps': 4400, 'loss/train': 2.7315587997436523} -08/30/2021 13:59:31 - INFO - __main__ - Step 4402: {'lr': 0.0004996753789800729, 'samples': 845184, 'steps': 4401, 'loss/train': 2.656501293182373} -08/30/2021 13:59:32 - INFO - __main__ - Step 4403: {'lr': 0.0004996751085775096, 'samples': 845376, 'steps': 4402, 'loss/train': 3.0188190937042236} -08/30/2021 13:59:33 - INFO - __main__ - Step 4404: {'lr': 0.0004996748380624467, 'samples': 845568, 'steps': 4403, 'loss/train': 2.4543826580047607} -08/30/2021 13:59:34 - INFO - __main__ - Step 4405: {'lr': 0.000499674567434884, 'samples': 845760, 'steps': 4404, 'loss/train': 3.0986216068267822} -08/30/2021 13:59:34 - INFO - __main__ - Step 4406: {'lr': 0.0004996742966948219, 'samples': 845952, 'steps': 4405, 'loss/train': 2.609631061553955} -08/30/2021 13:59:34 - INFO - __main__ - Step 4407: {'lr': 0.0004996740258422604, 'samples': 846144, 'steps': 4406, 'loss/train': 2.6129021644592285} -08/30/2021 13:59:35 - INFO - __main__ - Step 4408: {'lr': 0.0004996737548771997, 'samples': 846336, 'steps': 4407, 'loss/train': 1.8508158922195435} -08/30/2021 13:59:36 - INFO - __main__ - Step 4409: {'lr': 0.0004996734837996397, 'samples': 846528, 'steps': 4408, 'loss/train': 2.298949956893921} -08/30/2021 13:59:37 - INFO - __main__ - Step 4410: {'lr': 0.0004996732126095807, 'samples': 846720, 'steps': 4409, 'loss/train': 2.9131104946136475} -08/30/2021 13:59:37 - INFO - __main__ - Step 4411: {'lr': 0.0004996729413070229, 'samples': 846912, 'steps': 4410, 'loss/train': 2.257246732711792} -08/30/2021 13:59:37 - INFO - __main__ - Step 4412: {'lr': 0.0004996726698919664, 'samples': 847104, 'steps': 4411, 'loss/train': 2.803863048553467} -08/30/2021 13:59:38 - INFO - __main__ - Step 4413: {'lr': 0.0004996723983644112, 'samples': 847296, 'steps': 4412, 'loss/train': 2.301168918609619} -08/30/2021 13:59:40 - INFO - __main__ - Step 4414: {'lr': 0.0004996721267243573, 'samples': 847488, 'steps': 4413, 'loss/train': 1.7177538871765137} -08/30/2021 13:59:40 - INFO - __main__ - Step 4415: {'lr': 0.0004996718549718051, 'samples': 847680, 'steps': 4414, 'loss/train': 2.3217835426330566} -08/30/2021 13:59:40 - INFO - __main__ - Step 4416: {'lr': 0.0004996715831067546, 'samples': 847872, 'steps': 4415, 'loss/train': 1.7899372577667236} -08/30/2021 13:59:41 - INFO - __main__ - Step 4417: {'lr': 0.000499671311129206, 'samples': 848064, 'steps': 4416, 'loss/train': 2.663358211517334} -08/30/2021 13:59:41 - INFO - __main__ - Step 4418: {'lr': 0.0004996710390391593, 'samples': 848256, 'steps': 4417, 'loss/train': 2.5235495567321777} -08/30/2021 13:59:43 - INFO - __main__ - Step 4419: {'lr': 0.0004996707668366147, 'samples': 848448, 'steps': 4418, 'loss/train': 0.48375609517097473} -08/30/2021 13:59:43 - INFO - __main__ - Step 4420: {'lr': 0.0004996704945215724, 'samples': 848640, 'steps': 4419, 'loss/train': 3.206803798675537} -08/30/2021 13:59:43 - INFO - __main__ - Step 4421: {'lr': 0.0004996702220940322, 'samples': 848832, 'steps': 4420, 'loss/train': 2.434300184249878} -08/30/2021 13:59:44 - INFO - __main__ - Step 4422: {'lr': 0.0004996699495539947, 'samples': 849024, 'steps': 4421, 'loss/train': 2.0685155391693115} -08/30/2021 13:59:44 - INFO - __main__ - Step 4423: {'lr': 0.0004996696769014596, 'samples': 849216, 'steps': 4422, 'loss/train': 2.4212698936462402} -08/30/2021 13:59:46 - INFO - __main__ - Step 4424: {'lr': 0.0004996694041364272, 'samples': 849408, 'steps': 4423, 'loss/train': 2.027961492538452} -08/30/2021 13:59:46 - INFO - __main__ - Step 4425: {'lr': 0.0004996691312588977, 'samples': 849600, 'steps': 4424, 'loss/train': 2.265188694000244} -08/30/2021 13:59:46 - INFO - __main__ - Step 4426: {'lr': 0.0004996688582688711, 'samples': 849792, 'steps': 4425, 'loss/train': 2.822570562362671} -08/30/2021 13:59:47 - INFO - __main__ - Step 4427: {'lr': 0.0004996685851663477, 'samples': 849984, 'steps': 4426, 'loss/train': 2.7943873405456543} -08/30/2021 13:59:47 - INFO - __main__ - Step 4428: {'lr': 0.0004996683119513274, 'samples': 850176, 'steps': 4427, 'loss/train': 2.2864913940429688} -08/30/2021 13:59:49 - INFO - __main__ - Step 4429: {'lr': 0.0004996680386238103, 'samples': 850368, 'steps': 4428, 'loss/train': 1.8238520622253418} -08/30/2021 13:59:49 - INFO - __main__ - Step 4430: {'lr': 0.0004996677651837967, 'samples': 850560, 'steps': 4429, 'loss/train': 2.325866222381592} -08/30/2021 13:59:49 - INFO - __main__ - Step 4431: {'lr': 0.0004996674916312867, 'samples': 850752, 'steps': 4430, 'loss/train': 2.2738285064697266} -08/30/2021 13:59:50 - INFO - __main__ - Step 4432: {'lr': 0.0004996672179662803, 'samples': 850944, 'steps': 4431, 'loss/train': 2.172910213470459} -08/30/2021 13:59:50 - INFO - __main__ - Step 4433: {'lr': 0.0004996669441887778, 'samples': 851136, 'steps': 4432, 'loss/train': 2.6636414527893066} -08/30/2021 13:59:51 - INFO - __main__ - Step 4434: {'lr': 0.0004996666702987791, 'samples': 851328, 'steps': 4433, 'loss/train': 2.2548768520355225} -08/30/2021 13:59:52 - INFO - __main__ - Step 4435: {'lr': 0.0004996663962962846, 'samples': 851520, 'steps': 4434, 'loss/train': 2.0982847213745117} -08/30/2021 13:59:53 - INFO - __main__ - Step 4436: {'lr': 0.0004996661221812942, 'samples': 851712, 'steps': 4435, 'loss/train': 3.23982834815979} -08/30/2021 13:59:53 - INFO - __main__ - Step 4437: {'lr': 0.0004996658479538081, 'samples': 851904, 'steps': 4436, 'loss/train': 3.0859453678131104} -08/30/2021 13:59:53 - INFO - __main__ - Step 4438: {'lr': 0.0004996655736138265, 'samples': 852096, 'steps': 4437, 'loss/train': 0.9713526368141174} -08/30/2021 13:59:54 - INFO - __main__ - Step 4439: {'lr': 0.0004996652991613494, 'samples': 852288, 'steps': 4438, 'loss/train': 2.5843000411987305} -08/30/2021 13:59:56 - INFO - __main__ - Step 4440: {'lr': 0.0004996650245963768, 'samples': 852480, 'steps': 4439, 'loss/train': 2.302584171295166} -08/30/2021 13:59:56 - INFO - __main__ - Step 4441: {'lr': 0.0004996647499189092, 'samples': 852672, 'steps': 4440, 'loss/train': 3.055056095123291} -08/30/2021 13:59:57 - INFO - __main__ - Step 4442: {'lr': 0.0004996644751289464, 'samples': 852864, 'steps': 4441, 'loss/train': 2.611168622970581} -08/30/2021 13:59:57 - INFO - __main__ - Step 4443: {'lr': 0.0004996642002264887, 'samples': 853056, 'steps': 4442, 'loss/train': 2.2941527366638184} -08/30/2021 13:59:57 - INFO - __main__ - Step 4444: {'lr': 0.0004996639252115362, 'samples': 853248, 'steps': 4443, 'loss/train': 2.7221500873565674} -08/30/2021 13:59:59 - INFO - __main__ - Step 4445: {'lr': 0.000499663650084089, 'samples': 853440, 'steps': 4444, 'loss/train': 3.0388267040252686} -08/30/2021 14:00:00 - INFO - __main__ - Step 4446: {'lr': 0.0004996633748441472, 'samples': 853632, 'steps': 4445, 'loss/train': 2.3005685806274414} -08/30/2021 14:00:00 - INFO - __main__ - Step 4447: {'lr': 0.0004996630994917108, 'samples': 853824, 'steps': 4446, 'loss/train': 0.48164039850234985} -08/30/2021 14:00:00 - INFO - __main__ - Step 4448: {'lr': 0.0004996628240267802, 'samples': 854016, 'steps': 4447, 'loss/train': 2.155078649520874} -08/30/2021 14:00:01 - INFO - __main__ - Step 4449: {'lr': 0.0004996625484493554, 'samples': 854208, 'steps': 4448, 'loss/train': 1.9735839366912842} -08/30/2021 14:00:01 - INFO - __main__ - Step 4450: {'lr': 0.0004996622727594363, 'samples': 854400, 'steps': 4449, 'loss/train': 3.0032947063446045} -08/30/2021 14:00:03 - INFO - __main__ - Step 4451: {'lr': 0.0004996619969570234, 'samples': 854592, 'steps': 4450, 'loss/train': 2.0180344581604004} -08/30/2021 14:00:04 - INFO - __main__ - Step 4452: {'lr': 0.0004996617210421166, 'samples': 854784, 'steps': 4451, 'loss/train': 1.3236488103866577} -08/30/2021 14:00:04 - INFO - __main__ - Step 4453: {'lr': 0.0004996614450147161, 'samples': 854976, 'steps': 4452, 'loss/train': 0.774139940738678} -08/30/2021 14:00:04 - INFO - __main__ - Step 4454: {'lr': 0.0004996611688748221, 'samples': 855168, 'steps': 4453, 'loss/train': 2.6716136932373047} -08/30/2021 14:00:05 - INFO - __main__ - Step 4455: {'lr': 0.0004996608926224345, 'samples': 855360, 'steps': 4454, 'loss/train': 2.286705493927002} -08/30/2021 14:00:05 - INFO - __main__ - Step 4456: {'lr': 0.0004996606162575536, 'samples': 855552, 'steps': 4455, 'loss/train': 0.7882221937179565} -08/30/2021 14:00:06 - INFO - __main__ - Step 4457: {'lr': 0.0004996603397801795, 'samples': 855744, 'steps': 4456, 'loss/train': 3.2340660095214844} -08/30/2021 14:00:07 - INFO - __main__ - Step 4458: {'lr': 0.0004996600631903123, 'samples': 855936, 'steps': 4457, 'loss/train': 3.1454315185546875} -08/30/2021 14:00:07 - INFO - __main__ - Step 4459: {'lr': 0.0004996597864879521, 'samples': 856128, 'steps': 4458, 'loss/train': 2.2844502925872803} -08/30/2021 14:00:08 - INFO - __main__ - Step 4460: {'lr': 0.000499659509673099, 'samples': 856320, 'steps': 4459, 'loss/train': 2.2326767444610596} -08/30/2021 14:00:08 - INFO - __main__ - Step 4461: {'lr': 0.0004996592327457533, 'samples': 856512, 'steps': 4460, 'loss/train': 2.3373653888702393} -08/30/2021 14:00:09 - INFO - __main__ - Step 4462: {'lr': 0.000499658955705915, 'samples': 856704, 'steps': 4461, 'loss/train': 2.4097986221313477} -08/30/2021 14:00:10 - INFO - __main__ - Step 4463: {'lr': 0.0004996586785535841, 'samples': 856896, 'steps': 4462, 'loss/train': 2.207939624786377} -08/30/2021 14:00:10 - INFO - __main__ - Step 4464: {'lr': 0.000499658401288761, 'samples': 857088, 'steps': 4463, 'loss/train': 1.9724675416946411} -08/30/2021 14:00:11 - INFO - __main__ - Step 4465: {'lr': 0.0004996581239114456, 'samples': 857280, 'steps': 4464, 'loss/train': 2.0959792137145996} -08/30/2021 14:00:11 - INFO - __main__ - Step 4466: {'lr': 0.0004996578464216381, 'samples': 857472, 'steps': 4465, 'loss/train': 2.3610620498657227} -08/30/2021 14:00:12 - INFO - __main__ - Step 4467: {'lr': 0.0004996575688193386, 'samples': 857664, 'steps': 4466, 'loss/train': 1.904547095298767} -08/30/2021 14:00:13 - INFO - __main__ - Step 4468: {'lr': 0.0004996572911045473, 'samples': 857856, 'steps': 4467, 'loss/train': 0.7102074027061462} -08/30/2021 14:00:13 - INFO - __main__ - Step 4469: {'lr': 0.0004996570132772642, 'samples': 858048, 'steps': 4468, 'loss/train': 2.963158130645752} -08/30/2021 14:00:13 - INFO - __main__ - Step 4470: {'lr': 0.0004996567353374896, 'samples': 858240, 'steps': 4469, 'loss/train': 2.5914316177368164} -08/30/2021 14:00:14 - INFO - __main__ - Step 4471: {'lr': 0.0004996564572852235, 'samples': 858432, 'steps': 4470, 'loss/train': 3.332909107208252} -08/30/2021 14:00:16 - INFO - __main__ - Step 4472: {'lr': 0.000499656179120466, 'samples': 858624, 'steps': 4471, 'loss/train': 2.154690980911255} -08/30/2021 14:00:16 - INFO - __main__ - Step 4473: {'lr': 0.0004996559008432173, 'samples': 858816, 'steps': 4472, 'loss/train': 2.439270257949829} -08/30/2021 14:00:17 - INFO - __main__ - Step 4474: {'lr': 0.0004996556224534776, 'samples': 859008, 'steps': 4473, 'loss/train': 0.8880488276481628} -08/30/2021 14:00:17 - INFO - __main__ - Step 4475: {'lr': 0.0004996553439512468, 'samples': 859200, 'steps': 4474, 'loss/train': 0.8130812644958496} -08/30/2021 14:00:17 - INFO - __main__ - Step 4476: {'lr': 0.0004996550653365253, 'samples': 859392, 'steps': 4475, 'loss/train': 2.4375765323638916} -08/30/2021 14:00:18 - INFO - __main__ - Step 4477: {'lr': 0.0004996547866093129, 'samples': 859584, 'steps': 4476, 'loss/train': 3.0253424644470215} -08/30/2021 14:00:19 - INFO - __main__ - Step 4478: {'lr': 0.00049965450776961, 'samples': 859776, 'steps': 4477, 'loss/train': 0.6013203263282776} -08/30/2021 14:00:20 - INFO - __main__ - Step 4479: {'lr': 0.0004996542288174166, 'samples': 859968, 'steps': 4478, 'loss/train': 2.0361762046813965} -08/30/2021 14:00:20 - INFO - __main__ - Step 4480: {'lr': 0.0004996539497527329, 'samples': 860160, 'steps': 4479, 'loss/train': 0.5610140562057495} -08/30/2021 14:00:21 - INFO - __main__ - Step 4481: {'lr': 0.000499653670575559, 'samples': 860352, 'steps': 4480, 'loss/train': 2.0953292846679688} -08/30/2021 14:00:21 - INFO - __main__ - Step 4482: {'lr': 0.0004996533912858949, 'samples': 860544, 'steps': 4481, 'loss/train': 1.6098066568374634} -08/30/2021 14:00:22 - INFO - __main__ - Step 4483: {'lr': 0.000499653111883741, 'samples': 860736, 'steps': 4482, 'loss/train': 2.3210976123809814} -08/30/2021 14:00:23 - INFO - __main__ - Step 4484: {'lr': 0.0004996528323690971, 'samples': 860928, 'steps': 4483, 'loss/train': 2.522338628768921} -08/30/2021 14:00:23 - INFO - __main__ - Step 4485: {'lr': 0.0004996525527419636, 'samples': 861120, 'steps': 4484, 'loss/train': 2.73907208442688} -08/30/2021 14:00:24 - INFO - __main__ - Step 4486: {'lr': 0.0004996522730023404, 'samples': 861312, 'steps': 4485, 'loss/train': 2.050724506378174} -08/30/2021 14:00:24 - INFO - __main__ - Step 4487: {'lr': 0.0004996519931502279, 'samples': 861504, 'steps': 4486, 'loss/train': 2.388427257537842} -08/30/2021 14:00:24 - INFO - __main__ - Step 4488: {'lr': 0.0004996517131856259, 'samples': 861696, 'steps': 4487, 'loss/train': 2.3693833351135254} -08/30/2021 14:00:26 - INFO - __main__ - Step 4489: {'lr': 0.0004996514331085348, 'samples': 861888, 'steps': 4488, 'loss/train': 2.3274548053741455} -08/30/2021 14:00:26 - INFO - __main__ - Step 4490: {'lr': 0.0004996511529189546, 'samples': 862080, 'steps': 4489, 'loss/train': 0.9971614480018616} -08/30/2021 14:00:27 - INFO - __main__ - Step 4491: {'lr': 0.0004996508726168854, 'samples': 862272, 'steps': 4490, 'loss/train': 2.128624439239502} -08/30/2021 14:00:27 - INFO - __main__ - Step 4492: {'lr': 0.0004996505922023274, 'samples': 862464, 'steps': 4491, 'loss/train': 5.315568923950195} -08/30/2021 14:00:27 - INFO - __main__ - Step 4493: {'lr': 0.0004996503116752807, 'samples': 862656, 'steps': 4492, 'loss/train': 0.5561769008636475} -08/30/2021 14:00:29 - INFO - __main__ - Step 4494: {'lr': 0.0004996500310357454, 'samples': 862848, 'steps': 4493, 'loss/train': 2.6158716678619385} -08/30/2021 14:00:30 - INFO - __main__ - Step 4495: {'lr': 0.0004996497502837217, 'samples': 863040, 'steps': 4494, 'loss/train': 2.018419027328491} -08/30/2021 14:00:30 - INFO - __main__ - Step 4496: {'lr': 0.0004996494694192096, 'samples': 863232, 'steps': 4495, 'loss/train': 2.135006904602051} -08/30/2021 14:00:31 - INFO - __main__ - Step 4497: {'lr': 0.0004996491884422092, 'samples': 863424, 'steps': 4496, 'loss/train': 2.594553232192993} -08/30/2021 14:00:31 - INFO - __main__ - Step 4498: {'lr': 0.0004996489073527208, 'samples': 863616, 'steps': 4497, 'loss/train': 3.1940338611602783} -08/30/2021 14:00:31 - INFO - __main__ - Step 4499: {'lr': 0.0004996486261507445, 'samples': 863808, 'steps': 4498, 'loss/train': 0.7680402398109436} -08/30/2021 14:00:32 - INFO - __main__ - Step 4500: {'lr': 0.0004996483448362805, 'samples': 864000, 'steps': 4499, 'loss/train': 0.6784037947654724} -08/30/2021 14:00:34 - INFO - __main__ - Step 4501: {'lr': 0.0004996480634093287, 'samples': 864192, 'steps': 4500, 'loss/train': 2.0224390029907227} -08/30/2021 14:00:34 - INFO - __main__ - Step 4502: {'lr': 0.0004996477818698893, 'samples': 864384, 'steps': 4501, 'loss/train': 2.3429672718048096} -08/30/2021 14:00:34 - INFO - __main__ - Step 4503: {'lr': 0.0004996475002179625, 'samples': 864576, 'steps': 4502, 'loss/train': 2.2044742107391357} -08/30/2021 14:00:35 - INFO - __main__ - Step 4504: {'lr': 0.0004996472184535484, 'samples': 864768, 'steps': 4503, 'loss/train': 2.7269012928009033} -08/30/2021 14:00:35 - INFO - __main__ - Step 4505: {'lr': 0.0004996469365766471, 'samples': 864960, 'steps': 4504, 'loss/train': 2.5406477451324463} -08/30/2021 14:00:37 - INFO - __main__ - Step 4506: {'lr': 0.0004996466545872588, 'samples': 865152, 'steps': 4505, 'loss/train': 2.55234956741333} -08/30/2021 14:00:37 - INFO - __main__ - Step 4507: {'lr': 0.0004996463724853834, 'samples': 865344, 'steps': 4506, 'loss/train': 1.5074973106384277} -08/30/2021 14:00:37 - INFO - __main__ - Step 4508: {'lr': 0.0004996460902710214, 'samples': 865536, 'steps': 4507, 'loss/train': 2.267874002456665} -08/30/2021 14:00:38 - INFO - __main__ - Step 4509: {'lr': 0.0004996458079441727, 'samples': 865728, 'steps': 4508, 'loss/train': 2.308412790298462} -08/30/2021 14:00:38 - INFO - __main__ - Step 4510: {'lr': 0.0004996455255048373, 'samples': 865920, 'steps': 4509, 'loss/train': 2.0908989906311035} -08/30/2021 14:00:40 - INFO - __main__ - Step 4511: {'lr': 0.0004996452429530156, 'samples': 866112, 'steps': 4510, 'loss/train': 2.758845329284668} -08/30/2021 14:00:40 - INFO - __main__ - Step 4512: {'lr': 0.0004996449602887075, 'samples': 866304, 'steps': 4511, 'loss/train': 2.616922616958618} -08/30/2021 14:00:41 - INFO - __main__ - Step 4513: {'lr': 0.0004996446775119134, 'samples': 866496, 'steps': 4512, 'loss/train': 2.135817289352417} -08/30/2021 14:00:41 - INFO - __main__ - Step 4514: {'lr': 0.0004996443946226331, 'samples': 866688, 'steps': 4513, 'loss/train': 2.0573575496673584} -08/30/2021 14:00:41 - INFO - __main__ - Step 4515: {'lr': 0.000499644111620867, 'samples': 866880, 'steps': 4514, 'loss/train': 2.2674593925476074} -08/30/2021 14:00:42 - INFO - __main__ - Step 4516: {'lr': 0.000499643828506615, 'samples': 867072, 'steps': 4515, 'loss/train': 2.3302407264709473} -08/30/2021 14:00:43 - INFO - __main__ - Step 4517: {'lr': 0.0004996435452798775, 'samples': 867264, 'steps': 4516, 'loss/train': 2.6249778270721436} -08/30/2021 14:00:44 - INFO - __main__ - Step 4518: {'lr': 0.0004996432619406543, 'samples': 867456, 'steps': 4517, 'loss/train': 1.8309979438781738} -08/30/2021 14:00:44 - INFO - __main__ - Step 4519: {'lr': 0.0004996429784889458, 'samples': 867648, 'steps': 4518, 'loss/train': 3.550863742828369} -08/30/2021 14:00:44 - INFO - __main__ - Step 4520: {'lr': 0.000499642694924752, 'samples': 867840, 'steps': 4519, 'loss/train': 2.6422226428985596} -08/30/2021 14:00:45 - INFO - __main__ - Step 4521: {'lr': 0.000499642411248073, 'samples': 868032, 'steps': 4520, 'loss/train': 1.8086737394332886} -08/30/2021 14:00:46 - INFO - __main__ - Step 4522: {'lr': 0.0004996421274589091, 'samples': 868224, 'steps': 4521, 'loss/train': 2.4225997924804688} -08/30/2021 14:00:47 - INFO - __main__ - Step 4523: {'lr': 0.0004996418435572603, 'samples': 868416, 'steps': 4522, 'loss/train': 4.092549800872803} -08/30/2021 14:00:47 - INFO - __main__ - Step 4524: {'lr': 0.0004996415595431267, 'samples': 868608, 'steps': 4523, 'loss/train': 2.29569149017334} -08/30/2021 14:00:48 - INFO - __main__ - Step 4525: {'lr': 0.0004996412754165084, 'samples': 868800, 'steps': 4524, 'loss/train': 3.1504571437835693} -08/30/2021 14:00:48 - INFO - __main__ - Step 4526: {'lr': 0.0004996409911774056, 'samples': 868992, 'steps': 4525, 'loss/train': 1.3656212091445923} -08/30/2021 14:00:48 - INFO - __main__ - Step 4527: {'lr': 0.0004996407068258186, 'samples': 869184, 'steps': 4526, 'loss/train': 2.564074993133545} -08/30/2021 14:00:50 - INFO - __main__ - Step 4528: {'lr': 0.0004996404223617471, 'samples': 869376, 'steps': 4527, 'loss/train': 2.1748273372650146} -08/30/2021 14:00:50 - INFO - __main__ - Step 4529: {'lr': 0.0004996401377851917, 'samples': 869568, 'steps': 4528, 'loss/train': 3.069153308868408} -08/30/2021 14:00:51 - INFO - __main__ - Step 4530: {'lr': 0.0004996398530961522, 'samples': 869760, 'steps': 4529, 'loss/train': 2.4911487102508545} -08/30/2021 14:00:51 - INFO - __main__ - Step 4531: {'lr': 0.0004996395682946288, 'samples': 869952, 'steps': 4530, 'loss/train': 2.353128433227539} -08/30/2021 14:00:51 - INFO - __main__ - Step 4532: {'lr': 0.0004996392833806217, 'samples': 870144, 'steps': 4531, 'loss/train': 2.1468746662139893} -08/30/2021 14:00:53 - INFO - __main__ - Step 4533: {'lr': 0.000499638998354131, 'samples': 870336, 'steps': 4532, 'loss/train': 2.4447340965270996} -08/30/2021 14:00:53 - INFO - __main__ - Step 4534: {'lr': 0.0004996387132151567, 'samples': 870528, 'steps': 4533, 'loss/train': 2.0875327587127686} -08/30/2021 14:00:54 - INFO - __main__ - Step 4535: {'lr': 0.0004996384279636993, 'samples': 870720, 'steps': 4534, 'loss/train': 2.412013053894043} -08/30/2021 14:00:54 - INFO - __main__ - Step 4536: {'lr': 0.0004996381425997584, 'samples': 870912, 'steps': 4535, 'loss/train': 2.2420294284820557} -08/30/2021 14:00:55 - INFO - __main__ - Step 4537: {'lr': 0.0004996378571233347, 'samples': 871104, 'steps': 4536, 'loss/train': 2.9002840518951416} -08/30/2021 14:00:55 - INFO - __main__ - Step 4538: {'lr': 0.0004996375715344278, 'samples': 871296, 'steps': 4537, 'loss/train': 2.5866057872772217} -08/30/2021 14:00:56 - INFO - __main__ - Step 4539: {'lr': 0.0004996372858330382, 'samples': 871488, 'steps': 4538, 'loss/train': 2.988987922668457} -08/30/2021 14:00:57 - INFO - __main__ - Step 4540: {'lr': 0.0004996370000191657, 'samples': 871680, 'steps': 4539, 'loss/train': 1.8763577938079834} -08/30/2021 14:00:57 - INFO - __main__ - Step 4541: {'lr': 0.0004996367140928107, 'samples': 871872, 'steps': 4540, 'loss/train': 2.400172710418701} -08/30/2021 14:00:58 - INFO - __main__ - Step 4542: {'lr': 0.0004996364280539734, 'samples': 872064, 'steps': 4541, 'loss/train': 2.4988865852355957} -08/30/2021 14:00:58 - INFO - __main__ - Step 4543: {'lr': 0.0004996361419026537, 'samples': 872256, 'steps': 4542, 'loss/train': 2.4307539463043213} -08/30/2021 14:01:00 - INFO - __main__ - Step 4544: {'lr': 0.0004996358556388518, 'samples': 872448, 'steps': 4543, 'loss/train': 2.4443089962005615} -08/30/2021 14:01:00 - INFO - __main__ - Step 4545: {'lr': 0.0004996355692625678, 'samples': 872640, 'steps': 4544, 'loss/train': 1.9704921245574951} -08/30/2021 14:01:01 - INFO - __main__ - Step 4546: {'lr': 0.0004996352827738018, 'samples': 872832, 'steps': 4545, 'loss/train': 2.219630718231201} -08/30/2021 14:01:01 - INFO - __main__ - Step 4547: {'lr': 0.0004996349961725542, 'samples': 873024, 'steps': 4546, 'loss/train': 2.1464083194732666} -08/30/2021 14:01:01 - INFO - __main__ - Step 4548: {'lr': 0.0004996347094588247, 'samples': 873216, 'steps': 4547, 'loss/train': 1.0339703559875488} -08/30/2021 14:01:02 - INFO - __main__ - Step 4549: {'lr': 0.0004996344226326137, 'samples': 873408, 'steps': 4548, 'loss/train': 0.8882812857627869} -08/30/2021 14:01:03 - INFO - __main__ - Step 4550: {'lr': 0.0004996341356939214, 'samples': 873600, 'steps': 4549, 'loss/train': 2.229863166809082} -08/30/2021 14:01:04 - INFO - __main__ - Step 4551: {'lr': 0.0004996338486427477, 'samples': 873792, 'steps': 4550, 'loss/train': 2.621331214904785} -08/30/2021 14:01:04 - INFO - __main__ - Step 4552: {'lr': 0.0004996335614790929, 'samples': 873984, 'steps': 4551, 'loss/train': 2.852511167526245} -08/30/2021 14:01:04 - INFO - __main__ - Step 4553: {'lr': 0.0004996332742029571, 'samples': 874176, 'steps': 4552, 'loss/train': 2.0260066986083984} -08/30/2021 14:01:05 - INFO - __main__ - Step 4554: {'lr': 0.0004996329868143404, 'samples': 874368, 'steps': 4553, 'loss/train': 2.789266586303711} -08/30/2021 14:01:06 - INFO - __main__ - Step 4555: {'lr': 0.0004996326993132428, 'samples': 874560, 'steps': 4554, 'loss/train': 2.3618829250335693} -08/30/2021 14:01:07 - INFO - __main__ - Step 4556: {'lr': 0.0004996324116996647, 'samples': 874752, 'steps': 4555, 'loss/train': 2.7693419456481934} -08/30/2021 14:01:07 - INFO - __main__ - Step 4557: {'lr': 0.0004996321239736059, 'samples': 874944, 'steps': 4556, 'loss/train': 2.4524588584899902} -08/30/2021 14:01:07 - INFO - __main__ - Step 4558: {'lr': 0.000499631836135067, 'samples': 875136, 'steps': 4557, 'loss/train': 2.46193265914917} -08/30/2021 14:01:08 - INFO - __main__ - Step 4559: {'lr': 0.0004996315481840476, 'samples': 875328, 'steps': 4558, 'loss/train': 2.47141432762146} -08/30/2021 14:01:10 - INFO - __main__ - Step 4560: {'lr': 0.0004996312601205482, 'samples': 875520, 'steps': 4559, 'loss/train': 2.2694461345672607} -08/30/2021 14:01:10 - INFO - __main__ - Step 4561: {'lr': 0.0004996309719445687, 'samples': 875712, 'steps': 4560, 'loss/train': 1.6245360374450684} -08/30/2021 14:01:11 - INFO - __main__ - Step 4562: {'lr': 0.0004996306836561094, 'samples': 875904, 'steps': 4561, 'loss/train': 2.070373058319092} -08/30/2021 14:01:11 - INFO - __main__ - Step 4563: {'lr': 0.0004996303952551704, 'samples': 876096, 'steps': 4562, 'loss/train': 2.3879058361053467} -08/30/2021 14:01:11 - INFO - __main__ - Step 4564: {'lr': 0.0004996301067417517, 'samples': 876288, 'steps': 4563, 'loss/train': 2.5300660133361816} -08/30/2021 14:01:13 - INFO - __main__ - Step 4565: {'lr': 0.0004996298181158536, 'samples': 876480, 'steps': 4564, 'loss/train': 2.0309441089630127} -08/30/2021 14:01:13 - INFO - __main__ - Step 4566: {'lr': 0.0004996295293774762, 'samples': 876672, 'steps': 4565, 'loss/train': 2.1152758598327637} -08/30/2021 14:01:13 - INFO - __main__ - Step 4567: {'lr': 0.0004996292405266195, 'samples': 876864, 'steps': 4566, 'loss/train': 2.372183322906494} -08/30/2021 14:01:14 - INFO - __main__ - Step 4568: {'lr': 0.0004996289515632838, 'samples': 877056, 'steps': 4567, 'loss/train': 2.0528564453125} -08/30/2021 14:01:14 - INFO - __main__ - Step 4569: {'lr': 0.0004996286624874691, 'samples': 877248, 'steps': 4568, 'loss/train': 2.6889450550079346} -08/30/2021 14:01:16 - INFO - __main__ - Step 4570: {'lr': 0.0004996283732991755, 'samples': 877440, 'steps': 4569, 'loss/train': 2.3121769428253174} -08/30/2021 14:01:16 - INFO - __main__ - Step 4571: {'lr': 0.0004996280839984033, 'samples': 877632, 'steps': 4570, 'loss/train': 2.4112284183502197} -08/30/2021 14:01:17 - INFO - __main__ - Step 4572: {'lr': 0.0004996277945851525, 'samples': 877824, 'steps': 4571, 'loss/train': 2.571039915084839} -08/30/2021 14:01:17 - INFO - __main__ - Step 4573: {'lr': 0.0004996275050594233, 'samples': 878016, 'steps': 4572, 'loss/train': 2.2443714141845703} -08/30/2021 14:01:17 - INFO - __main__ - Step 4574: {'lr': 0.0004996272154212158, 'samples': 878208, 'steps': 4573, 'loss/train': 2.3098435401916504} -08/30/2021 14:01:19 - INFO - __main__ - Step 4575: {'lr': 0.0004996269256705301, 'samples': 878400, 'steps': 4574, 'loss/train': 1.4533641338348389} -08/30/2021 14:01:19 - INFO - __main__ - Step 4576: {'lr': 0.0004996266358073664, 'samples': 878592, 'steps': 4575, 'loss/train': 1.7222477197647095} -08/30/2021 14:01:20 - INFO - __main__ - Step 4577: {'lr': 0.0004996263458317248, 'samples': 878784, 'steps': 4576, 'loss/train': 2.734583854675293} -08/30/2021 14:01:20 - INFO - __main__ - Step 4578: {'lr': 0.0004996260557436053, 'samples': 878976, 'steps': 4577, 'loss/train': 2.314223289489746} -08/30/2021 14:01:20 - INFO - __main__ - Step 4579: {'lr': 0.0004996257655430083, 'samples': 879168, 'steps': 4578, 'loss/train': 2.07610821723938} -08/30/2021 14:01:22 - INFO - __main__ - Step 4580: {'lr': 0.0004996254752299337, 'samples': 879360, 'steps': 4579, 'loss/train': 2.4870107173919678} -08/30/2021 14:01:22 - INFO - __main__ - Step 4581: {'lr': 0.0004996251848043817, 'samples': 879552, 'steps': 4580, 'loss/train': 2.2557332515716553} -08/30/2021 14:01:23 - INFO - __main__ - Step 4582: {'lr': 0.0004996248942663525, 'samples': 879744, 'steps': 4581, 'loss/train': 3.572296380996704} -08/30/2021 14:01:23 - INFO - __main__ - Step 4583: {'lr': 0.000499624603615846, 'samples': 879936, 'steps': 4582, 'loss/train': 2.7815513610839844} -08/30/2021 14:01:23 - INFO - __main__ - Step 4584: {'lr': 0.0004996243128528628, 'samples': 880128, 'steps': 4583, 'loss/train': 2.4769766330718994} -08/30/2021 14:01:24 - INFO - __main__ - Step 4585: {'lr': 0.0004996240219774025, 'samples': 880320, 'steps': 4584, 'loss/train': 1.7290468215942383} -08/30/2021 14:01:25 - INFO - __main__ - Step 4586: {'lr': 0.0004996237309894656, 'samples': 880512, 'steps': 4585, 'loss/train': 2.123121500015259} -08/30/2021 14:01:26 - INFO - __main__ - Step 4587: {'lr': 0.0004996234398890521, 'samples': 880704, 'steps': 4586, 'loss/train': 1.958060622215271} -08/30/2021 14:01:26 - INFO - __main__ - Step 4588: {'lr': 0.000499623148676162, 'samples': 880896, 'steps': 4587, 'loss/train': 2.0216751098632812} -08/30/2021 14:01:26 - INFO - __main__ - Step 4589: {'lr': 0.0004996228573507957, 'samples': 881088, 'steps': 4588, 'loss/train': 1.9924323558807373} -08/30/2021 14:01:27 - INFO - __main__ - Step 4590: {'lr': 0.0004996225659129531, 'samples': 881280, 'steps': 4589, 'loss/train': 1.249950885772705} -08/30/2021 14:01:28 - INFO - __main__ - Step 4591: {'lr': 0.0004996222743626345, 'samples': 881472, 'steps': 4590, 'loss/train': 0.6270982027053833} -08/30/2021 14:01:29 - INFO - __main__ - Step 4592: {'lr': 0.0004996219826998399, 'samples': 881664, 'steps': 4591, 'loss/train': 2.2480950355529785} -08/30/2021 14:01:29 - INFO - __main__ - Step 4593: {'lr': 0.0004996216909245695, 'samples': 881856, 'steps': 4592, 'loss/train': 2.091141700744629} -08/30/2021 14:01:30 - INFO - __main__ - Step 4594: {'lr': 0.0004996213990368234, 'samples': 882048, 'steps': 4593, 'loss/train': 1.9925917387008667} -08/30/2021 14:01:30 - INFO - __main__ - Step 4595: {'lr': 0.0004996211070366018, 'samples': 882240, 'steps': 4594, 'loss/train': 2.223419427871704} -08/30/2021 14:01:31 - INFO - __main__ - Step 4596: {'lr': 0.0004996208149239047, 'samples': 882432, 'steps': 4595, 'loss/train': 2.09906005859375} -08/30/2021 14:01:32 - INFO - __main__ - Step 4597: {'lr': 0.0004996205226987324, 'samples': 882624, 'steps': 4596, 'loss/train': 2.025024652481079} -08/30/2021 14:01:32 - INFO - __main__ - Step 4598: {'lr': 0.0004996202303610849, 'samples': 882816, 'steps': 4597, 'loss/train': 2.3278818130493164} -08/30/2021 14:01:32 - INFO - __main__ - Step 4599: {'lr': 0.0004996199379109624, 'samples': 883008, 'steps': 4598, 'loss/train': 2.1262285709381104} -08/30/2021 14:01:33 - INFO - __main__ - Step 4600: {'lr': 0.000499619645348365, 'samples': 883200, 'steps': 4599, 'loss/train': 1.6696217060089111} -08/30/2021 14:01:35 - INFO - __main__ - Step 4601: {'lr': 0.0004996193526732929, 'samples': 883392, 'steps': 4600, 'loss/train': 1.9249932765960693} -08/30/2021 14:01:36 - INFO - __main__ - Step 4602: {'lr': 0.0004996190598857461, 'samples': 883584, 'steps': 4601, 'loss/train': 2.2383718490600586} -08/30/2021 14:01:36 - INFO - __main__ - Step 4603: {'lr': 0.0004996187669857247, 'samples': 883776, 'steps': 4602, 'loss/train': 2.4671871662139893} -08/30/2021 14:01:36 - INFO - __main__ - Step 4604: {'lr': 0.0004996184739732291, 'samples': 883968, 'steps': 4603, 'loss/train': 3.1720287799835205} -08/30/2021 14:01:37 - INFO - __main__ - Step 4605: {'lr': 0.0004996181808482592, 'samples': 884160, 'steps': 4604, 'loss/train': 4.191840171813965} -08/30/2021 14:01:37 - INFO - __main__ - Step 4606: {'lr': 0.0004996178876108152, 'samples': 884352, 'steps': 4605, 'loss/train': 2.343764543533325} -08/30/2021 14:01:37 - INFO - __main__ - Step 4607: {'lr': 0.0004996175942608973, 'samples': 884544, 'steps': 4606, 'loss/train': 1.724738597869873} -08/30/2021 14:01:39 - INFO - __main__ - Step 4608: {'lr': 0.0004996173007985055, 'samples': 884736, 'steps': 4607, 'loss/train': 2.340036630630493} -08/30/2021 14:01:40 - INFO - __main__ - Step 4609: {'lr': 0.00049961700722364, 'samples': 884928, 'steps': 4608, 'loss/train': 2.5888867378234863} -08/30/2021 14:01:40 - INFO - __main__ - Step 4610: {'lr': 0.0004996167135363009, 'samples': 885120, 'steps': 4609, 'loss/train': 2.327427864074707} -08/30/2021 14:01:41 - INFO - __main__ - Step 4611: {'lr': 0.0004996164197364884, 'samples': 885312, 'steps': 4610, 'loss/train': 2.3598992824554443} -08/30/2021 14:01:41 - INFO - __main__ - Step 4612: {'lr': 0.0004996161258242025, 'samples': 885504, 'steps': 4611, 'loss/train': 2.2096822261810303} -08/30/2021 14:01:43 - INFO - __main__ - Step 4613: {'lr': 0.0004996158317994436, 'samples': 885696, 'steps': 4612, 'loss/train': 2.1788270473480225} -08/30/2021 14:01:43 - INFO - __main__ - Step 4614: {'lr': 0.0004996155376622115, 'samples': 885888, 'steps': 4613, 'loss/train': 3.035369873046875} -08/30/2021 14:01:43 - INFO - __main__ - Step 4615: {'lr': 0.0004996152434125066, 'samples': 886080, 'steps': 4614, 'loss/train': 2.6611716747283936} -08/30/2021 14:01:44 - INFO - __main__ - Step 4616: {'lr': 0.0004996149490503289, 'samples': 886272, 'steps': 4615, 'loss/train': 2.558361291885376} -08/30/2021 14:01:44 - INFO - __main__ - Step 4617: {'lr': 0.0004996146545756786, 'samples': 886464, 'steps': 4616, 'loss/train': 1.5009498596191406} -08/30/2021 14:01:45 - INFO - __main__ - Step 4618: {'lr': 0.0004996143599885557, 'samples': 886656, 'steps': 4617, 'loss/train': 2.051567554473877} -08/30/2021 14:01:46 - INFO - __main__ - Step 4619: {'lr': 0.0004996140652889603, 'samples': 886848, 'steps': 4618, 'loss/train': 2.0170814990997314} -08/30/2021 14:01:46 - INFO - __main__ - Step 4620: {'lr': 0.0004996137704768929, 'samples': 887040, 'steps': 4619, 'loss/train': 2.647442579269409} -08/30/2021 14:01:47 - INFO - __main__ - Step 4621: {'lr': 0.0004996134755523532, 'samples': 887232, 'steps': 4620, 'loss/train': 2.3504109382629395} -08/30/2021 14:01:47 - INFO - __main__ - Step 4622: {'lr': 0.0004996131805153417, 'samples': 887424, 'steps': 4621, 'loss/train': 2.1917972564697266} -08/30/2021 14:01:49 - INFO - __main__ - Step 4623: {'lr': 0.0004996128853658583, 'samples': 887616, 'steps': 4622, 'loss/train': 2.2604334354400635} -08/30/2021 14:01:49 - INFO - __main__ - Step 4624: {'lr': 0.0004996125901039031, 'samples': 887808, 'steps': 4623, 'loss/train': 2.1874806880950928} -08/30/2021 14:01:50 - INFO - __main__ - Step 4625: {'lr': 0.0004996122947294764, 'samples': 888000, 'steps': 4624, 'loss/train': 1.9336739778518677} -08/30/2021 14:01:50 - INFO - __main__ - Step 4626: {'lr': 0.0004996119992425782, 'samples': 888192, 'steps': 4625, 'loss/train': 2.149197578430176} -08/30/2021 14:01:50 - INFO - __main__ - Step 4627: {'lr': 0.0004996117036432087, 'samples': 888384, 'steps': 4626, 'loss/train': 0.39136800169944763} -08/30/2021 14:01:52 - INFO - __main__ - Step 4628: {'lr': 0.000499611407931368, 'samples': 888576, 'steps': 4627, 'loss/train': 2.2546849250793457} -08/30/2021 14:01:52 - INFO - __main__ - Step 4629: {'lr': 0.0004996111121070562, 'samples': 888768, 'steps': 4628, 'loss/train': 2.2915778160095215} -08/30/2021 14:01:53 - INFO - __main__ - Step 4630: {'lr': 0.0004996108161702736, 'samples': 888960, 'steps': 4629, 'loss/train': 1.5151708126068115} -08/30/2021 14:01:53 - INFO - __main__ - Step 4631: {'lr': 0.0004996105201210202, 'samples': 889152, 'steps': 4630, 'loss/train': 2.403064727783203} -08/30/2021 14:01:53 - INFO - __main__ - Step 4632: {'lr': 0.0004996102239592961, 'samples': 889344, 'steps': 4631, 'loss/train': 2.241124153137207} -08/30/2021 14:01:54 - INFO - __main__ - Step 4633: {'lr': 0.0004996099276851015, 'samples': 889536, 'steps': 4632, 'loss/train': 2.1955511569976807} -08/30/2021 14:01:55 - INFO - __main__ - Step 4634: {'lr': 0.0004996096312984365, 'samples': 889728, 'steps': 4633, 'loss/train': 2.775601387023926} -08/30/2021 14:01:56 - INFO - __main__ - Step 4635: {'lr': 0.0004996093347993013, 'samples': 889920, 'steps': 4634, 'loss/train': 2.951205253601074} -08/30/2021 14:01:56 - INFO - __main__ - Step 4636: {'lr': 0.000499609038187696, 'samples': 890112, 'steps': 4635, 'loss/train': 2.262634515762329} -08/30/2021 14:01:56 - INFO - __main__ - Step 4637: {'lr': 0.0004996087414636207, 'samples': 890304, 'steps': 4636, 'loss/train': 2.2803754806518555} -08/30/2021 14:01:57 - INFO - __main__ - Step 4638: {'lr': 0.0004996084446270755, 'samples': 890496, 'steps': 4637, 'loss/train': 1.7295838594436646} -08/30/2021 14:01:58 - INFO - __main__ - Step 4639: {'lr': 0.0004996081476780607, 'samples': 890688, 'steps': 4638, 'loss/train': 2.653325319290161} -08/30/2021 14:01:59 - INFO - __main__ - Step 4640: {'lr': 0.0004996078506165762, 'samples': 890880, 'steps': 4639, 'loss/train': 2.3338510990142822} -08/30/2021 14:01:59 - INFO - __main__ - Step 4641: {'lr': 0.0004996075534426222, 'samples': 891072, 'steps': 4640, 'loss/train': 2.238651990890503} -08/30/2021 14:01:59 - INFO - __main__ - Step 4642: {'lr': 0.000499607256156199, 'samples': 891264, 'steps': 4641, 'loss/train': 2.66705584526062} -08/30/2021 14:02:00 - INFO - __main__ - Step 4643: {'lr': 0.0004996069587573067, 'samples': 891456, 'steps': 4642, 'loss/train': 2.448281764984131} -08/30/2021 14:02:01 - INFO - __main__ - Step 4644: {'lr': 0.0004996066612459452, 'samples': 891648, 'steps': 4643, 'loss/train': 2.4534547328948975} -08/30/2021 14:02:02 - INFO - __main__ - Step 4645: {'lr': 0.0004996063636221148, 'samples': 891840, 'steps': 4644, 'loss/train': 2.2594292163848877} -08/30/2021 14:02:02 - INFO - __main__ - Step 4646: {'lr': 0.0004996060658858158, 'samples': 892032, 'steps': 4645, 'loss/train': 2.293121814727783} -08/30/2021 14:02:02 - INFO - __main__ - Step 4647: {'lr': 0.000499605768037048, 'samples': 892224, 'steps': 4646, 'loss/train': 2.6149797439575195} -08/30/2021 14:02:03 - INFO - __main__ - Step 4648: {'lr': 0.0004996054700758117, 'samples': 892416, 'steps': 4647, 'loss/train': 2.524472236633301} -08/30/2021 14:02:04 - INFO - __main__ - Step 4649: {'lr': 0.0004996051720021071, 'samples': 892608, 'steps': 4648, 'loss/train': 1.813582420349121} -08/30/2021 14:02:05 - INFO - __main__ - Step 4650: {'lr': 0.0004996048738159342, 'samples': 892800, 'steps': 4649, 'loss/train': 3.308600664138794} -08/30/2021 14:02:05 - INFO - __main__ - Step 4651: {'lr': 0.0004996045755172932, 'samples': 892992, 'steps': 4650, 'loss/train': 1.810467004776001} -08/30/2021 14:02:05 - INFO - __main__ - Step 4652: {'lr': 0.0004996042771061843, 'samples': 893184, 'steps': 4651, 'loss/train': 2.401333808898926} -08/30/2021 14:02:06 - INFO - __main__ - Step 4653: {'lr': 0.0004996039785826075, 'samples': 893376, 'steps': 4652, 'loss/train': 2.4568803310394287} -08/30/2021 14:02:07 - INFO - __main__ - Step 4654: {'lr': 0.000499603679946563, 'samples': 893568, 'steps': 4653, 'loss/train': 2.008197784423828} -08/30/2021 14:02:08 - INFO - __main__ - Step 4655: {'lr': 0.0004996033811980509, 'samples': 893760, 'steps': 4654, 'loss/train': 2.252939462661743} -08/30/2021 14:02:08 - INFO - __main__ - Step 4656: {'lr': 0.0004996030823370715, 'samples': 893952, 'steps': 4655, 'loss/train': 2.41216778755188} -08/30/2021 14:02:08 - INFO - __main__ - Step 4657: {'lr': 0.0004996027833636247, 'samples': 894144, 'steps': 4656, 'loss/train': 2.4887020587921143} -08/30/2021 14:02:09 - INFO - __main__ - Step 4658: {'lr': 0.0004996024842777106, 'samples': 894336, 'steps': 4657, 'loss/train': 1.7159894704818726} -08/30/2021 14:02:10 - INFO - __main__ - Step 4659: {'lr': 0.0004996021850793297, 'samples': 894528, 'steps': 4658, 'loss/train': 2.5552608966827393} -08/30/2021 14:02:11 - INFO - __main__ - Step 4660: {'lr': 0.0004996018857684818, 'samples': 894720, 'steps': 4659, 'loss/train': 2.448089838027954} -08/30/2021 14:02:11 - INFO - __main__ - Step 4661: {'lr': 0.0004996015863451672, 'samples': 894912, 'steps': 4660, 'loss/train': 2.5309102535247803} -08/30/2021 14:02:11 - INFO - __main__ - Step 4662: {'lr': 0.0004996012868093859, 'samples': 895104, 'steps': 4661, 'loss/train': 2.3204269409179688} -08/30/2021 14:02:12 - INFO - __main__ - Step 4663: {'lr': 0.0004996009871611382, 'samples': 895296, 'steps': 4662, 'loss/train': 1.337915301322937} -08/30/2021 14:02:14 - INFO - __main__ - Step 4664: {'lr': 0.0004996006874004241, 'samples': 895488, 'steps': 4663, 'loss/train': 2.4208292961120605} -08/30/2021 14:02:14 - INFO - __main__ - Step 4665: {'lr': 0.0004996003875272438, 'samples': 895680, 'steps': 4664, 'loss/train': 1.433829665184021} -08/30/2021 14:02:15 - INFO - __main__ - Step 4666: {'lr': 0.0004996000875415973, 'samples': 895872, 'steps': 4665, 'loss/train': 1.977731466293335} -08/30/2021 14:02:15 - INFO - __main__ - Step 4667: {'lr': 0.000499599787443485, 'samples': 896064, 'steps': 4666, 'loss/train': 2.47998309135437} -08/30/2021 14:02:16 - INFO - __main__ - Step 4668: {'lr': 0.0004995994872329069, 'samples': 896256, 'steps': 4667, 'loss/train': 1.9149500131607056} -08/30/2021 14:02:16 - INFO - __main__ - Step 4669: {'lr': 0.000499599186909863, 'samples': 896448, 'steps': 4668, 'loss/train': 1.824616551399231} -08/30/2021 14:02:17 - INFO - __main__ - Step 4670: {'lr': 0.0004995988864743536, 'samples': 896640, 'steps': 4669, 'loss/train': 3.030540943145752} -08/30/2021 14:02:18 - INFO - __main__ - Step 4671: {'lr': 0.0004995985859263789, 'samples': 896832, 'steps': 4670, 'loss/train': 2.6624813079833984} -08/30/2021 14:02:18 - INFO - __main__ - Step 4672: {'lr': 0.0004995982852659388, 'samples': 897024, 'steps': 4671, 'loss/train': 2.7112202644348145} -08/30/2021 14:02:18 - INFO - __main__ - Step 4673: {'lr': 0.0004995979844930336, 'samples': 897216, 'steps': 4672, 'loss/train': 2.2876665592193604} -08/30/2021 14:02:19 - INFO - __main__ - Step 4674: {'lr': 0.0004995976836076635, 'samples': 897408, 'steps': 4673, 'loss/train': 2.294339895248413} -08/30/2021 14:02:21 - INFO - __main__ - Step 4675: {'lr': 0.0004995973826098283, 'samples': 897600, 'steps': 4674, 'loss/train': 2.1953768730163574} -08/30/2021 14:02:22 - INFO - __main__ - Step 4676: {'lr': 0.0004995970814995285, 'samples': 897792, 'steps': 4675, 'loss/train': 1.3137171268463135} -08/30/2021 14:02:22 - INFO - __main__ - Step 4677: {'lr': 0.0004995967802767641, 'samples': 897984, 'steps': 4676, 'loss/train': 3.6875035762786865} -08/30/2021 14:02:22 - INFO - __main__ - Step 4678: {'lr': 0.0004995964789415353, 'samples': 898176, 'steps': 4677, 'loss/train': 1.8820013999938965} -08/30/2021 14:02:23 - INFO - __main__ - Step 4679: {'lr': 0.0004995961774938423, 'samples': 898368, 'steps': 4678, 'loss/train': 2.1136579513549805} -08/30/2021 14:02:23 - INFO - __main__ - Step 4680: {'lr': 0.0004995958759336849, 'samples': 898560, 'steps': 4679, 'loss/train': 1.7372349500656128} -08/30/2021 14:02:25 - INFO - __main__ - Step 4681: {'lr': 0.0004995955742610635, 'samples': 898752, 'steps': 4680, 'loss/train': 0.45423734188079834} -08/30/2021 14:02:25 - INFO - __main__ - Step 4682: {'lr': 0.0004995952724759781, 'samples': 898944, 'steps': 4681, 'loss/train': 2.112457036972046} -08/30/2021 14:02:25 - INFO - __main__ - Step 4683: {'lr': 0.0004995949705784291, 'samples': 899136, 'steps': 4682, 'loss/train': 1.9973746538162231} -08/30/2021 14:02:26 - INFO - __main__ - Step 4684: {'lr': 0.0004995946685684164, 'samples': 899328, 'steps': 4683, 'loss/train': 3.928039789199829} -08/30/2021 14:02:26 - INFO - __main__ - Step 4685: {'lr': 0.0004995943664459401, 'samples': 899520, 'steps': 4684, 'loss/train': 2.448692560195923} -08/30/2021 14:02:28 - INFO - __main__ - Step 4686: {'lr': 0.0004995940642110005, 'samples': 899712, 'steps': 4685, 'loss/train': 2.1602401733398438} -08/30/2021 14:02:28 - INFO - __main__ - Step 4687: {'lr': 0.0004995937618635977, 'samples': 899904, 'steps': 4686, 'loss/train': 2.453596830368042} -08/30/2021 14:02:28 - INFO - __main__ - Step 4688: {'lr': 0.0004995934594037316, 'samples': 900096, 'steps': 4687, 'loss/train': 2.4329769611358643} -08/30/2021 14:02:29 - INFO - __main__ - Step 4689: {'lr': 0.0004995931568314028, 'samples': 900288, 'steps': 4688, 'loss/train': 2.3658831119537354} -08/30/2021 14:02:29 - INFO - __main__ - Step 4690: {'lr': 0.0004995928541466111, 'samples': 900480, 'steps': 4689, 'loss/train': 2.3486440181732178} -08/30/2021 14:02:31 - INFO - __main__ - Step 4691: {'lr': 0.0004995925513493567, 'samples': 900672, 'steps': 4690, 'loss/train': 5.228073596954346} -08/30/2021 14:02:31 - INFO - __main__ - Step 4692: {'lr': 0.0004995922484396397, 'samples': 900864, 'steps': 4691, 'loss/train': 2.1782376766204834} -08/30/2021 14:02:32 - INFO - __main__ - Step 4693: {'lr': 0.0004995919454174603, 'samples': 901056, 'steps': 4692, 'loss/train': 2.515242099761963} -08/30/2021 14:02:32 - INFO - __main__ - Step 4694: {'lr': 0.0004995916422828187, 'samples': 901248, 'steps': 4693, 'loss/train': 2.117107391357422} -08/30/2021 14:02:33 - INFO - __main__ - Step 4695: {'lr': 0.0004995913390357148, 'samples': 901440, 'steps': 4694, 'loss/train': 2.398838520050049} -08/30/2021 14:02:33 - INFO - __main__ - Step 4696: {'lr': 0.0004995910356761491, 'samples': 901632, 'steps': 4695, 'loss/train': 0.874934196472168} -08/30/2021 14:02:35 - INFO - __main__ - Step 4697: {'lr': 0.0004995907322041214, 'samples': 901824, 'steps': 4696, 'loss/train': 1.6412839889526367} -08/30/2021 14:02:35 - INFO - __main__ - Step 4698: {'lr': 0.000499590428619632, 'samples': 902016, 'steps': 4697, 'loss/train': 2.336991786956787} -08/30/2021 14:02:35 - INFO - __main__ - Step 4699: {'lr': 0.000499590124922681, 'samples': 902208, 'steps': 4698, 'loss/train': 1.6142579317092896} -08/30/2021 14:02:36 - INFO - __main__ - Step 4700: {'lr': 0.0004995898211132685, 'samples': 902400, 'steps': 4699, 'loss/train': 2.539201259613037} -08/30/2021 14:02:36 - INFO - __main__ - Step 4701: {'lr': 0.0004995895171913947, 'samples': 902592, 'steps': 4700, 'loss/train': 2.6473097801208496} -08/30/2021 14:02:38 - INFO - __main__ - Step 4702: {'lr': 0.0004995892131570598, 'samples': 902784, 'steps': 4701, 'loss/train': 2.2009053230285645} -08/30/2021 14:02:38 - INFO - __main__ - Step 4703: {'lr': 0.0004995889090102638, 'samples': 902976, 'steps': 4702, 'loss/train': 2.374619960784912} -08/30/2021 14:02:39 - INFO - __main__ - Step 4704: {'lr': 0.0004995886047510068, 'samples': 903168, 'steps': 4703, 'loss/train': 2.033463954925537} -08/30/2021 14:02:39 - INFO - __main__ - Step 4705: {'lr': 0.0004995883003792891, 'samples': 903360, 'steps': 4704, 'loss/train': 2.393458127975464} -08/30/2021 14:02:39 - INFO - __main__ - Step 4706: {'lr': 0.0004995879958951107, 'samples': 903552, 'steps': 4705, 'loss/train': 1.2720915079116821} -08/30/2021 14:02:41 - INFO - __main__ - Step 4707: {'lr': 0.0004995876912984719, 'samples': 903744, 'steps': 4706, 'loss/train': 1.4228672981262207} -08/30/2021 14:02:41 - INFO - __main__ - Step 4708: {'lr': 0.0004995873865893727, 'samples': 903936, 'steps': 4707, 'loss/train': 2.5425636768341064} -08/30/2021 14:02:42 - INFO - __main__ - Step 4709: {'lr': 0.0004995870817678133, 'samples': 904128, 'steps': 4708, 'loss/train': 2.343172550201416} -08/30/2021 14:02:42 - INFO - __main__ - Step 4710: {'lr': 0.0004995867768337938, 'samples': 904320, 'steps': 4709, 'loss/train': 1.9796204566955566} -08/30/2021 14:02:42 - INFO - __main__ - Step 4711: {'lr': 0.0004995864717873143, 'samples': 904512, 'steps': 4710, 'loss/train': 2.5738954544067383} -08/30/2021 14:02:44 - INFO - __main__ - Step 4712: {'lr': 0.000499586166628375, 'samples': 904704, 'steps': 4711, 'loss/train': 2.315624952316284} -08/30/2021 14:02:44 - INFO - __main__ - Step 4713: {'lr': 0.0004995858613569761, 'samples': 904896, 'steps': 4712, 'loss/train': 1.6377177238464355} -08/30/2021 14:02:45 - INFO - __main__ - Step 4714: {'lr': 0.0004995855559731176, 'samples': 905088, 'steps': 4713, 'loss/train': 2.1084823608398438} -08/30/2021 14:02:45 - INFO - __main__ - Step 4715: {'lr': 0.0004995852504767997, 'samples': 905280, 'steps': 4714, 'loss/train': 1.9919739961624146} -08/30/2021 14:02:45 - INFO - __main__ - Step 4716: {'lr': 0.0004995849448680225, 'samples': 905472, 'steps': 4715, 'loss/train': 2.2004289627075195} -08/30/2021 14:02:46 - INFO - __main__ - Step 4717: {'lr': 0.0004995846391467862, 'samples': 905664, 'steps': 4716, 'loss/train': 2.0319464206695557} -08/30/2021 14:02:48 - INFO - __main__ - Step 4718: {'lr': 0.000499584333313091, 'samples': 905856, 'steps': 4717, 'loss/train': 8.657270431518555} -08/30/2021 14:02:49 - INFO - __main__ - Step 4719: {'lr': 0.0004995840273669369, 'samples': 906048, 'steps': 4718, 'loss/train': 2.548557996749878} -08/30/2021 14:02:49 - INFO - __main__ - Step 4720: {'lr': 0.0004995837213083241, 'samples': 906240, 'steps': 4719, 'loss/train': 1.679852843284607} -08/30/2021 14:02:49 - INFO - __main__ - Step 4721: {'lr': 0.0004995834151372526, 'samples': 906432, 'steps': 4720, 'loss/train': 2.3638381958007812} -08/30/2021 14:02:50 - INFO - __main__ - Step 4722: {'lr': 0.0004995831088537229, 'samples': 906624, 'steps': 4721, 'loss/train': 3.4459497928619385} -08/30/2021 14:02:51 - INFO - __main__ - Step 4723: {'lr': 0.0004995828024577346, 'samples': 906816, 'steps': 4722, 'loss/train': 2.5729405879974365} -08/30/2021 14:02:52 - INFO - __main__ - Step 4724: {'lr': 0.0004995824959492884, 'samples': 907008, 'steps': 4723, 'loss/train': 2.4301981925964355} -08/30/2021 14:02:52 - INFO - __main__ - Step 4725: {'lr': 0.0004995821893283841, 'samples': 907200, 'steps': 4724, 'loss/train': 1.806684970855713} -08/30/2021 14:02:52 - INFO - __main__ - Step 4726: {'lr': 0.0004995818825950218, 'samples': 907392, 'steps': 4725, 'loss/train': 2.7768712043762207} -08/30/2021 14:02:53 - INFO - __main__ - Step 4727: {'lr': 0.0004995815757492019, 'samples': 907584, 'steps': 4726, 'loss/train': 2.3350353240966797} -08/30/2021 14:02:54 - INFO - __main__ - Step 4728: {'lr': 0.0004995812687909243, 'samples': 907776, 'steps': 4727, 'loss/train': 2.3573389053344727} -08/30/2021 14:02:55 - INFO - __main__ - Step 4729: {'lr': 0.0004995809617201894, 'samples': 907968, 'steps': 4728, 'loss/train': 2.105909585952759} -08/30/2021 14:02:55 - INFO - __main__ - Step 4730: {'lr': 0.000499580654536997, 'samples': 908160, 'steps': 4729, 'loss/train': 2.9305338859558105} -08/30/2021 14:02:56 - INFO - __main__ - Step 4731: {'lr': 0.0004995803472413474, 'samples': 908352, 'steps': 4730, 'loss/train': 1.8371176719665527} -08/30/2021 14:02:56 - INFO - __main__ - Step 4732: {'lr': 0.0004995800398332409, 'samples': 908544, 'steps': 4731, 'loss/train': 0.559933602809906} -08/30/2021 14:02:56 - INFO - __main__ - Step 4733: {'lr': 0.0004995797323126774, 'samples': 908736, 'steps': 4732, 'loss/train': 2.37628173828125} -08/30/2021 14:02:58 - INFO - __main__ - Step 4734: {'lr': 0.0004995794246796571, 'samples': 908928, 'steps': 4733, 'loss/train': 1.8568031787872314} -08/30/2021 14:02:58 - INFO - __main__ - Step 4735: {'lr': 0.0004995791169341801, 'samples': 909120, 'steps': 4734, 'loss/train': 2.468707799911499} -08/30/2021 14:02:59 - INFO - __main__ - Step 4736: {'lr': 0.0004995788090762467, 'samples': 909312, 'steps': 4735, 'loss/train': 2.731025218963623} -08/30/2021 14:02:59 - INFO - __main__ - Step 4737: {'lr': 0.000499578501105857, 'samples': 909504, 'steps': 4736, 'loss/train': 2.408590793609619} -08/30/2021 14:02:59 - INFO - __main__ - Step 4738: {'lr': 0.000499578193023011, 'samples': 909696, 'steps': 4737, 'loss/train': 2.308793067932129} -08/30/2021 14:03:01 - INFO - __main__ - Step 4739: {'lr': 0.0004995778848277088, 'samples': 909888, 'steps': 4738, 'loss/train': 2.059112548828125} -08/30/2021 14:03:01 - INFO - __main__ - Step 4740: {'lr': 0.0004995775765199509, 'samples': 910080, 'steps': 4739, 'loss/train': 2.3376755714416504} -08/30/2021 14:03:02 - INFO - __main__ - Step 4741: {'lr': 0.000499577268099737, 'samples': 910272, 'steps': 4740, 'loss/train': 2.1304550170898438} -08/30/2021 14:03:02 - INFO - __main__ - Step 4742: {'lr': 0.0004995769595670675, 'samples': 910464, 'steps': 4741, 'loss/train': 2.383237361907959} -08/30/2021 14:03:02 - INFO - __main__ - Step 4743: {'lr': 0.0004995766509219425, 'samples': 910656, 'steps': 4742, 'loss/train': 2.4115703105926514} -08/30/2021 14:03:04 - INFO - __main__ - Step 4744: {'lr': 0.0004995763421643621, 'samples': 910848, 'steps': 4743, 'loss/train': 2.3305840492248535} -08/30/2021 14:03:04 - INFO - __main__ - Step 4745: {'lr': 0.0004995760332943264, 'samples': 911040, 'steps': 4744, 'loss/train': 2.6110363006591797} -08/30/2021 14:03:05 - INFO - __main__ - Step 4746: {'lr': 0.0004995757243118356, 'samples': 911232, 'steps': 4745, 'loss/train': 2.169848918914795} -08/30/2021 14:03:05 - INFO - __main__ - Step 4747: {'lr': 0.0004995754152168899, 'samples': 911424, 'steps': 4746, 'loss/train': 1.4700475931167603} -08/30/2021 14:03:05 - INFO - __main__ - Step 4748: {'lr': 0.0004995751060094893, 'samples': 911616, 'steps': 4747, 'loss/train': 0.852035403251648} -08/30/2021 14:03:07 - INFO - __main__ - Step 4749: {'lr': 0.000499574796689634, 'samples': 911808, 'steps': 4748, 'loss/train': 1.8782111406326294} -08/30/2021 14:03:07 - INFO - __main__ - Step 4750: {'lr': 0.0004995744872573242, 'samples': 912000, 'steps': 4749, 'loss/train': 1.7904566526412964} -08/30/2021 14:03:08 - INFO - __main__ - Step 4751: {'lr': 0.00049957417771256, 'samples': 912192, 'steps': 4750, 'loss/train': 1.7794671058654785} -08/30/2021 14:03:08 - INFO - __main__ - Step 4752: {'lr': 0.0004995738680553415, 'samples': 912384, 'steps': 4751, 'loss/train': 1.608269214630127} -08/30/2021 14:03:08 - INFO - __main__ - Step 4753: {'lr': 0.0004995735582856689, 'samples': 912576, 'steps': 4752, 'loss/train': 2.1375675201416016} -08/30/2021 14:03:10 - INFO - __main__ - Step 4754: {'lr': 0.0004995732484035422, 'samples': 912768, 'steps': 4753, 'loss/train': 2.6623668670654297} -08/30/2021 14:03:10 - INFO - __main__ - Step 4755: {'lr': 0.0004995729384089618, 'samples': 912960, 'steps': 4754, 'loss/train': 2.3186020851135254} -08/30/2021 14:03:11 - INFO - __main__ - Step 4756: {'lr': 0.0004995726283019275, 'samples': 913152, 'steps': 4755, 'loss/train': 2.0165352821350098} -08/30/2021 14:03:11 - INFO - __main__ - Step 4757: {'lr': 0.0004995723180824397, 'samples': 913344, 'steps': 4756, 'loss/train': 1.5398626327514648} -08/30/2021 14:03:11 - INFO - __main__ - Step 4758: {'lr': 0.0004995720077504986, 'samples': 913536, 'steps': 4757, 'loss/train': 2.2841081619262695} -08/30/2021 14:03:12 - INFO - __main__ - Step 4759: {'lr': 0.0004995716973061041, 'samples': 913728, 'steps': 4758, 'loss/train': 2.377220869064331} -08/30/2021 14:03:13 - INFO - __main__ - Step 4760: {'lr': 0.0004995713867492564, 'samples': 913920, 'steps': 4759, 'loss/train': 2.4824860095977783} -08/30/2021 14:03:14 - INFO - __main__ - Step 4761: {'lr': 0.0004995710760799557, 'samples': 914112, 'steps': 4760, 'loss/train': 1.7118556499481201} -08/30/2021 14:03:14 - INFO - __main__ - Step 4762: {'lr': 0.0004995707652982022, 'samples': 914304, 'steps': 4761, 'loss/train': 2.071098804473877} -08/30/2021 14:03:15 - INFO - __main__ - Step 4763: {'lr': 0.0004995704544039958, 'samples': 914496, 'steps': 4762, 'loss/train': 3.8153786659240723} -08/30/2021 14:03:15 - INFO - __main__ - Step 4764: {'lr': 0.0004995701433973369, 'samples': 914688, 'steps': 4763, 'loss/train': 2.1583616733551025} -08/30/2021 14:03:16 - INFO - __main__ - Step 4765: {'lr': 0.0004995698322782257, 'samples': 914880, 'steps': 4764, 'loss/train': 2.505201578140259} -08/30/2021 14:03:17 - INFO - __main__ - Step 4766: {'lr': 0.0004995695210466619, 'samples': 915072, 'steps': 4765, 'loss/train': 2.2153713703155518} -08/30/2021 14:03:17 - INFO - __main__ - Step 4767: {'lr': 0.0004995692097026461, 'samples': 915264, 'steps': 4766, 'loss/train': 2.196841239929199} -08/30/2021 14:03:18 - INFO - __main__ - Step 4768: {'lr': 0.0004995688982461783, 'samples': 915456, 'steps': 4767, 'loss/train': 2.1606943607330322} -08/30/2021 14:03:18 - INFO - __main__ - Step 4769: {'lr': 0.0004995685866772586, 'samples': 915648, 'steps': 4768, 'loss/train': 1.0300918817520142} -08/30/2021 14:03:20 - INFO - __main__ - Step 4770: {'lr': 0.000499568274995887, 'samples': 915840, 'steps': 4769, 'loss/train': 2.6956491470336914} -08/30/2021 14:03:20 - INFO - __main__ - Step 4771: {'lr': 0.0004995679632020639, 'samples': 916032, 'steps': 4770, 'loss/train': 1.5897364616394043} -08/30/2021 14:03:20 - INFO - __main__ - Step 4772: {'lr': 0.0004995676512957892, 'samples': 916224, 'steps': 4771, 'loss/train': 2.4463539123535156} -08/30/2021 14:03:21 - INFO - __main__ - Step 4773: {'lr': 0.0004995673392770634, 'samples': 916416, 'steps': 4772, 'loss/train': 1.6611323356628418} -08/30/2021 14:03:21 - INFO - __main__ - Step 4774: {'lr': 0.0004995670271458863, 'samples': 916608, 'steps': 4773, 'loss/train': 2.0660533905029297} -08/30/2021 14:03:23 - INFO - __main__ - Step 4775: {'lr': 0.0004995667149022581, 'samples': 916800, 'steps': 4774, 'loss/train': 2.0716781616210938} -08/30/2021 14:03:24 - INFO - __main__ - Step 4776: {'lr': 0.000499566402546179, 'samples': 916992, 'steps': 4775, 'loss/train': 2.422713041305542} -08/30/2021 14:03:24 - INFO - __main__ - Step 4777: {'lr': 0.0004995660900776491, 'samples': 917184, 'steps': 4776, 'loss/train': 2.204787492752075} -08/30/2021 14:03:24 - INFO - __main__ - Step 4778: {'lr': 0.0004995657774966686, 'samples': 917376, 'steps': 4777, 'loss/train': 2.6138124465942383} -08/30/2021 14:03:25 - INFO - __main__ - Step 4779: {'lr': 0.0004995654648032377, 'samples': 917568, 'steps': 4778, 'loss/train': 2.557595729827881} -08/30/2021 14:03:26 - INFO - __main__ - Step 4780: {'lr': 0.0004995651519973563, 'samples': 917760, 'steps': 4779, 'loss/train': 1.4790884256362915} -08/30/2021 14:03:27 - INFO - __main__ - Step 4781: {'lr': 0.0004995648390790249, 'samples': 917952, 'steps': 4780, 'loss/train': 1.851643443107605} -08/30/2021 14:03:27 - INFO - __main__ - Step 4782: {'lr': 0.0004995645260482432, 'samples': 918144, 'steps': 4781, 'loss/train': 2.3874449729919434} -08/30/2021 14:03:27 - INFO - __main__ - Step 4783: {'lr': 0.0004995642129050117, 'samples': 918336, 'steps': 4782, 'loss/train': 2.0189919471740723} -08/30/2021 14:03:28 - INFO - __main__ - Step 4784: {'lr': 0.0004995638996493304, 'samples': 918528, 'steps': 4783, 'loss/train': 2.4560396671295166} -08/30/2021 14:03:28 - INFO - __main__ - Step 4785: {'lr': 0.0004995635862811994, 'samples': 918720, 'steps': 4784, 'loss/train': 1.907179355621338} -08/30/2021 14:03:30 - INFO - __main__ - Step 4786: {'lr': 0.000499563272800619, 'samples': 918912, 'steps': 4785, 'loss/train': 2.069049596786499} -08/30/2021 14:03:30 - INFO - __main__ - Step 4787: {'lr': 0.0004995629592075892, 'samples': 919104, 'steps': 4786, 'loss/train': 1.8719192743301392} -08/30/2021 14:03:30 - INFO - __main__ - Step 4788: {'lr': 0.0004995626455021101, 'samples': 919296, 'steps': 4787, 'loss/train': 2.1309146881103516} -08/30/2021 14:03:31 - INFO - __main__ - Step 4789: {'lr': 0.0004995623316841821, 'samples': 919488, 'steps': 4788, 'loss/train': 2.4332520961761475} -08/30/2021 14:03:31 - INFO - __main__ - Step 4790: {'lr': 0.0004995620177538051, 'samples': 919680, 'steps': 4789, 'loss/train': 2.584012746810913} -08/30/2021 14:03:33 - INFO - __main__ - Step 4791: {'lr': 0.0004995617037109792, 'samples': 919872, 'steps': 4790, 'loss/train': 2.0938055515289307} -08/30/2021 14:03:33 - INFO - __main__ - Step 4792: {'lr': 0.0004995613895557048, 'samples': 920064, 'steps': 4791, 'loss/train': 2.628089666366577} -08/30/2021 14:03:34 - INFO - __main__ - Step 4793: {'lr': 0.0004995610752879818, 'samples': 920256, 'steps': 4792, 'loss/train': 2.253495693206787} -08/30/2021 14:03:34 - INFO - __main__ - Step 4794: {'lr': 0.0004995607609078104, 'samples': 920448, 'steps': 4793, 'loss/train': 2.293809413909912} -08/30/2021 14:03:34 - INFO - __main__ - Step 4795: {'lr': 0.0004995604464151908, 'samples': 920640, 'steps': 4794, 'loss/train': 1.1303257942199707} -08/30/2021 14:03:36 - INFO - __main__ - Step 4796: {'lr': 0.0004995601318101231, 'samples': 920832, 'steps': 4795, 'loss/train': 1.8195961713790894} -08/30/2021 14:03:37 - INFO - __main__ - Step 4797: {'lr': 0.0004995598170926074, 'samples': 921024, 'steps': 4796, 'loss/train': 1.7572760581970215} -08/30/2021 14:03:37 - INFO - __main__ - Step 4798: {'lr': 0.000499559502262644, 'samples': 921216, 'steps': 4797, 'loss/train': 2.152740716934204} -08/30/2021 14:03:37 - INFO - __main__ - Step 4799: {'lr': 0.000499559187320233, 'samples': 921408, 'steps': 4798, 'loss/train': 2.2296159267425537} -08/30/2021 14:03:38 - INFO - __main__ - Step 4800: {'lr': 0.0004995588722653743, 'samples': 921600, 'steps': 4799, 'loss/train': 0.6443192362785339} -08/30/2021 14:03:38 - INFO - __main__ - Step 4801: {'lr': 0.0004995585570980684, 'samples': 921792, 'steps': 4800, 'loss/train': 2.578104257583618} -08/30/2021 14:03:40 - INFO - __main__ - Step 4802: {'lr': 0.0004995582418183151, 'samples': 921984, 'steps': 4801, 'loss/train': 2.2058041095733643} -08/30/2021 14:03:40 - INFO - __main__ - Step 4803: {'lr': 0.0004995579264261148, 'samples': 922176, 'steps': 4802, 'loss/train': 1.4003407955169678} -08/30/2021 14:03:40 - INFO - __main__ - Step 4804: {'lr': 0.0004995576109214676, 'samples': 922368, 'steps': 4803, 'loss/train': 2.4224884510040283} -08/30/2021 14:03:41 - INFO - __main__ - Step 4805: {'lr': 0.0004995572953043736, 'samples': 922560, 'steps': 4804, 'loss/train': 2.1731059551239014} -08/30/2021 14:03:41 - INFO - __main__ - Step 4806: {'lr': 0.0004995569795748328, 'samples': 922752, 'steps': 4805, 'loss/train': 2.401675224304199} -08/30/2021 14:03:43 - INFO - __main__ - Step 4807: {'lr': 0.0004995566637328456, 'samples': 922944, 'steps': 4806, 'loss/train': 2.5750410556793213} -08/30/2021 14:03:43 - INFO - __main__ - Step 4808: {'lr': 0.0004995563477784119, 'samples': 923136, 'steps': 4807, 'loss/train': 1.8233083486557007} -08/30/2021 14:03:44 - INFO - __main__ - Step 4809: {'lr': 0.000499556031711532, 'samples': 923328, 'steps': 4808, 'loss/train': 2.4176502227783203} -08/30/2021 14:03:44 - INFO - __main__ - Step 4810: {'lr': 0.000499555715532206, 'samples': 923520, 'steps': 4809, 'loss/train': 2.2716965675354004} -08/30/2021 14:03:44 - INFO - __main__ - Step 4811: {'lr': 0.0004995553992404342, 'samples': 923712, 'steps': 4810, 'loss/train': 2.182950973510742} -08/30/2021 14:03:45 - INFO - __main__ - Step 4812: {'lr': 0.0004995550828362163, 'samples': 923904, 'steps': 4811, 'loss/train': 1.1444370746612549} -08/30/2021 14:03:46 - INFO - __main__ - Step 4813: {'lr': 0.000499554766319553, 'samples': 924096, 'steps': 4812, 'loss/train': 3.355135202407837} -08/30/2021 14:03:47 - INFO - __main__ - Step 4814: {'lr': 0.0004995544496904441, 'samples': 924288, 'steps': 4813, 'loss/train': 1.8554887771606445} -08/30/2021 14:03:47 - INFO - __main__ - Step 4815: {'lr': 0.0004995541329488897, 'samples': 924480, 'steps': 4814, 'loss/train': 1.8497685194015503} -08/30/2021 14:03:48 - INFO - __main__ - Step 4816: {'lr': 0.0004995538160948901, 'samples': 924672, 'steps': 4815, 'loss/train': 2.6320436000823975} -08/30/2021 14:03:48 - INFO - __main__ - Step 4817: {'lr': 0.0004995534991284455, 'samples': 924864, 'steps': 4816, 'loss/train': 1.436744213104248} -08/30/2021 14:03:50 - INFO - __main__ - Step 4818: {'lr': 0.0004995531820495559, 'samples': 925056, 'steps': 4817, 'loss/train': 1.9512062072753906} -08/30/2021 14:03:50 - INFO - __main__ - Step 4819: {'lr': 0.0004995528648582214, 'samples': 925248, 'steps': 4818, 'loss/train': 2.3656439781188965} -08/30/2021 14:03:51 - INFO - __main__ - Step 4820: {'lr': 0.0004995525475544423, 'samples': 925440, 'steps': 4819, 'loss/train': 1.9629491567611694} -08/30/2021 14:03:51 - INFO - __main__ - Step 4821: {'lr': 0.0004995522301382187, 'samples': 925632, 'steps': 4820, 'loss/train': 2.170275926589966} -08/30/2021 14:03:51 - INFO - __main__ - Step 4822: {'lr': 0.0004995519126095506, 'samples': 925824, 'steps': 4821, 'loss/train': 2.4914565086364746} -08/30/2021 14:03:52 - INFO - __main__ - Step 4823: {'lr': 0.0004995515949684384, 'samples': 926016, 'steps': 4822, 'loss/train': 1.9531784057617188} -08/30/2021 14:03:53 - INFO - __main__ - Step 4824: {'lr': 0.000499551277214882, 'samples': 926208, 'steps': 4823, 'loss/train': 2.2391319274902344} -08/30/2021 14:03:54 - INFO - __main__ - Step 4825: {'lr': 0.0004995509593488818, 'samples': 926400, 'steps': 4824, 'loss/train': 1.967274785041809} -08/30/2021 14:03:54 - INFO - __main__ - Step 4826: {'lr': 0.0004995506413704376, 'samples': 926592, 'steps': 4825, 'loss/train': 2.2904481887817383} -08/30/2021 14:03:54 - INFO - __main__ - Step 4827: {'lr': 0.0004995503232795498, 'samples': 926784, 'steps': 4826, 'loss/train': 1.8858319520950317} -08/30/2021 14:03:55 - INFO - __main__ - Step 4828: {'lr': 0.0004995500050762185, 'samples': 926976, 'steps': 4827, 'loss/train': 2.434027671813965} -08/30/2021 14:03:57 - INFO - __main__ - Step 4829: {'lr': 0.0004995496867604438, 'samples': 927168, 'steps': 4828, 'loss/train': 2.4201512336730957} -08/30/2021 14:03:57 - INFO - __main__ - Step 4830: {'lr': 0.0004995493683322259, 'samples': 927360, 'steps': 4829, 'loss/train': 3.496950149536133} -08/30/2021 14:03:58 - INFO - __main__ - Step 4831: {'lr': 0.0004995490497915649, 'samples': 927552, 'steps': 4830, 'loss/train': 3.0072968006134033} -08/30/2021 14:03:58 - INFO - __main__ - Step 4832: {'lr': 0.0004995487311384609, 'samples': 927744, 'steps': 4831, 'loss/train': 2.3867318630218506} -08/30/2021 14:03:59 - INFO - __main__ - Step 4833: {'lr': 0.0004995484123729141, 'samples': 927936, 'steps': 4832, 'loss/train': 1.9825752973556519} -08/30/2021 14:04:00 - INFO - __main__ - Step 4834: {'lr': 0.0004995480934949247, 'samples': 928128, 'steps': 4833, 'loss/train': 1.8303334712982178} -08/30/2021 14:04:01 - INFO - __main__ - Step 4835: {'lr': 0.0004995477745044927, 'samples': 928320, 'steps': 4834, 'loss/train': 2.512631893157959} -08/30/2021 14:04:01 - INFO - __main__ - Step 4836: {'lr': 0.0004995474554016184, 'samples': 928512, 'steps': 4835, 'loss/train': 1.1743768453598022} -08/30/2021 14:04:01 - INFO - __main__ - Step 4837: {'lr': 0.0004995471361863017, 'samples': 928704, 'steps': 4836, 'loss/train': 2.0064592361450195} -08/30/2021 14:04:02 - INFO - __main__ - Step 4838: {'lr': 0.0004995468168585431, 'samples': 928896, 'steps': 4837, 'loss/train': 2.3148019313812256} -08/30/2021 14:04:03 - INFO - __main__ - Step 4839: {'lr': 0.0004995464974183424, 'samples': 929088, 'steps': 4838, 'loss/train': 1.4140267372131348} -08/30/2021 14:04:04 - INFO - __main__ - Step 4840: {'lr': 0.0004995461778657002, 'samples': 929280, 'steps': 4839, 'loss/train': 2.034234046936035} -08/30/2021 14:04:04 - INFO - __main__ - Step 4841: {'lr': 0.000499545858200616, 'samples': 929472, 'steps': 4840, 'loss/train': 2.642103433609009} -08/30/2021 14:04:04 - INFO - __main__ - Step 4842: {'lr': 0.0004995455384230904, 'samples': 929664, 'steps': 4841, 'loss/train': 2.2454304695129395} -08/30/2021 14:04:05 - INFO - __main__ - Step 4843: {'lr': 0.0004995452185331235, 'samples': 929856, 'steps': 4842, 'loss/train': 1.9844597578048706} -08/30/2021 14:04:05 - INFO - __main__ - Step 4844: {'lr': 0.0004995448985307153, 'samples': 930048, 'steps': 4843, 'loss/train': 2.42919921875} -08/30/2021 14:04:07 - INFO - __main__ - Step 4845: {'lr': 0.0004995445784158661, 'samples': 930240, 'steps': 4844, 'loss/train': 2.58362078666687} -08/30/2021 14:04:07 - INFO - __main__ - Step 4846: {'lr': 0.0004995442581885759, 'samples': 930432, 'steps': 4845, 'loss/train': 2.5964014530181885} -08/30/2021 14:04:07 - INFO - __main__ - Step 4847: {'lr': 0.0004995439378488449, 'samples': 930624, 'steps': 4846, 'loss/train': 2.1342966556549072} -08/30/2021 14:04:08 - INFO - __main__ - Step 4848: {'lr': 0.0004995436173966733, 'samples': 930816, 'steps': 4847, 'loss/train': 2.743109941482544} -08/30/2021 14:04:08 - INFO - __main__ - Step 4849: {'lr': 0.0004995432968320611, 'samples': 931008, 'steps': 4848, 'loss/train': 2.200352668762207} -08/30/2021 14:04:10 - INFO - __main__ - Step 4850: {'lr': 0.0004995429761550086, 'samples': 931200, 'steps': 4849, 'loss/train': 2.59735369682312} -08/30/2021 14:04:10 - INFO - __main__ - Step 4851: {'lr': 0.0004995426553655159, 'samples': 931392, 'steps': 4850, 'loss/train': 2.017277956008911} -08/30/2021 14:04:10 - INFO - __main__ - Step 4852: {'lr': 0.0004995423344635831, 'samples': 931584, 'steps': 4851, 'loss/train': 2.207967519760132} -08/30/2021 14:04:11 - INFO - __main__ - Step 4853: {'lr': 0.0004995420134492105, 'samples': 931776, 'steps': 4852, 'loss/train': 2.088369369506836} -08/30/2021 14:04:11 - INFO - __main__ - Step 4854: {'lr': 0.0004995416923223979, 'samples': 931968, 'steps': 4853, 'loss/train': 2.138617992401123} -08/30/2021 14:04:13 - INFO - __main__ - Step 4855: {'lr': 0.0004995413710831458, 'samples': 932160, 'steps': 4854, 'loss/train': 2.071810007095337} -08/30/2021 14:04:13 - INFO - __main__ - Step 4856: {'lr': 0.0004995410497314542, 'samples': 932352, 'steps': 4855, 'loss/train': 2.2474253177642822} -08/30/2021 14:04:13 - INFO - __main__ - Step 4857: {'lr': 0.0004995407282673232, 'samples': 932544, 'steps': 4856, 'loss/train': 1.3294479846954346} -08/30/2021 14:04:14 - INFO - __main__ - Step 4858: {'lr': 0.000499540406690753, 'samples': 932736, 'steps': 4857, 'loss/train': 2.495647430419922} -08/30/2021 14:04:14 - INFO - __main__ - Step 4859: {'lr': 0.0004995400850017438, 'samples': 932928, 'steps': 4858, 'loss/train': 1.8881466388702393} -08/30/2021 14:04:16 - INFO - __main__ - Step 4860: {'lr': 0.0004995397632002957, 'samples': 933120, 'steps': 4859, 'loss/train': 2.295034646987915} -08/30/2021 14:04:16 - INFO - __main__ - Step 4861: {'lr': 0.0004995394412864088, 'samples': 933312, 'steps': 4860, 'loss/train': 2.3709468841552734} -08/30/2021 14:04:16 - INFO - __main__ - Step 4862: {'lr': 0.0004995391192600834, 'samples': 933504, 'steps': 4861, 'loss/train': 2.604323148727417} -08/30/2021 14:04:17 - INFO - __main__ - Step 4863: {'lr': 0.0004995387971213194, 'samples': 933696, 'steps': 4862, 'loss/train': 1.930928111076355} -08/30/2021 14:04:17 - INFO - __main__ - Step 4864: {'lr': 0.000499538474870117, 'samples': 933888, 'steps': 4863, 'loss/train': 1.811528205871582} -08/30/2021 14:04:19 - INFO - __main__ - Step 4865: {'lr': 0.0004995381525064765, 'samples': 934080, 'steps': 4864, 'loss/train': 2.3152430057525635} -08/30/2021 14:04:19 - INFO - __main__ - Step 4866: {'lr': 0.0004995378300303979, 'samples': 934272, 'steps': 4865, 'loss/train': 0.3185814321041107} -08/30/2021 14:04:20 - INFO - __main__ - Step 4867: {'lr': 0.0004995375074418815, 'samples': 934464, 'steps': 4866, 'loss/train': 1.6159205436706543} -08/30/2021 14:04:20 - INFO - __main__ - Step 4868: {'lr': 0.0004995371847409273, 'samples': 934656, 'steps': 4867, 'loss/train': 2.578643560409546} -08/30/2021 14:04:20 - INFO - __main__ - Step 4869: {'lr': 0.0004995368619275355, 'samples': 934848, 'steps': 4868, 'loss/train': 2.7576565742492676} -08/30/2021 14:04:22 - INFO - __main__ - Step 4870: {'lr': 0.0004995365390017062, 'samples': 935040, 'steps': 4869, 'loss/train': 3.0795624256134033} -08/30/2021 14:04:23 - INFO - __main__ - Step 4871: {'lr': 0.0004995362159634396, 'samples': 935232, 'steps': 4870, 'loss/train': 2.240497350692749} -08/30/2021 14:04:23 - INFO - __main__ - Step 4872: {'lr': 0.0004995358928127359, 'samples': 935424, 'steps': 4871, 'loss/train': 0.6288450956344604} -08/30/2021 14:04:23 - INFO - __main__ - Step 4873: {'lr': 0.0004995355695495952, 'samples': 935616, 'steps': 4872, 'loss/train': 0.7128564715385437} -08/30/2021 14:04:24 - INFO - __main__ - Step 4874: {'lr': 0.0004995352461740174, 'samples': 935808, 'steps': 4873, 'loss/train': 2.3273799419403076} -08/30/2021 14:04:24 - INFO - __main__ - Step 4875: {'lr': 0.0004995349226860031, 'samples': 936000, 'steps': 4874, 'loss/train': 2.4876091480255127} -08/30/2021 14:04:25 - INFO - __main__ - Step 4876: {'lr': 0.0004995345990855522, 'samples': 936192, 'steps': 4875, 'loss/train': 0.3857323229312897} -08/30/2021 14:04:26 - INFO - __main__ - Step 4877: {'lr': 0.0004995342753726647, 'samples': 936384, 'steps': 4876, 'loss/train': 2.2492923736572266} -08/30/2021 14:04:26 - INFO - __main__ - Step 4878: {'lr': 0.0004995339515473411, 'samples': 936576, 'steps': 4877, 'loss/train': 2.3254709243774414} -08/30/2021 14:04:27 - INFO - __main__ - Step 4879: {'lr': 0.0004995336276095812, 'samples': 936768, 'steps': 4878, 'loss/train': 0.2982950210571289} -08/30/2021 14:04:27 - INFO - __main__ - Step 4880: {'lr': 0.0004995333035593853, 'samples': 936960, 'steps': 4879, 'loss/train': 3.4135165214538574} -08/30/2021 14:04:27 - INFO - __main__ - Step 4881: {'lr': 0.0004995329793967537, 'samples': 937152, 'steps': 4880, 'loss/train': 2.241283893585205} -08/30/2021 14:04:30 - INFO - __main__ - Step 4882: {'lr': 0.0004995326551216862, 'samples': 937344, 'steps': 4881, 'loss/train': 2.0210165977478027} -08/30/2021 14:04:30 - INFO - __main__ - Step 4883: {'lr': 0.0004995323307341832, 'samples': 937536, 'steps': 4882, 'loss/train': 2.4769980907440186} -08/30/2021 14:04:30 - INFO - __main__ - Step 4884: {'lr': 0.0004995320062342449, 'samples': 937728, 'steps': 4883, 'loss/train': 1.26012122631073} -08/30/2021 14:04:31 - INFO - __main__ - Step 4885: {'lr': 0.0004995316816218712, 'samples': 937920, 'steps': 4884, 'loss/train': 2.107384443283081} -08/30/2021 14:04:31 - INFO - __main__ - Step 4886: {'lr': 0.0004995313568970625, 'samples': 938112, 'steps': 4885, 'loss/train': 2.4081616401672363} -08/30/2021 14:04:33 - INFO - __main__ - Step 4887: {'lr': 0.0004995310320598187, 'samples': 938304, 'steps': 4886, 'loss/train': 2.2661356925964355} -08/30/2021 14:04:33 - INFO - __main__ - Step 4888: {'lr': 0.0004995307071101401, 'samples': 938496, 'steps': 4887, 'loss/train': 2.039107084274292} -08/30/2021 14:04:33 - INFO - __main__ - Step 4889: {'lr': 0.0004995303820480268, 'samples': 938688, 'steps': 4888, 'loss/train': 2.11918044090271} -08/30/2021 14:04:34 - INFO - __main__ - Step 4890: {'lr': 0.000499530056873479, 'samples': 938880, 'steps': 4889, 'loss/train': 2.0490710735321045} -08/30/2021 14:04:34 - INFO - __main__ - Step 4891: {'lr': 0.0004995297315864968, 'samples': 939072, 'steps': 4890, 'loss/train': 1.924241304397583} -08/30/2021 14:04:36 - INFO - __main__ - Step 4892: {'lr': 0.0004995294061870802, 'samples': 939264, 'steps': 4891, 'loss/train': 2.2429251670837402} -08/30/2021 14:04:36 - INFO - __main__ - Step 4893: {'lr': 0.0004995290806752297, 'samples': 939456, 'steps': 4892, 'loss/train': 1.9073786735534668} -08/30/2021 14:04:36 - INFO - __main__ - Step 4894: {'lr': 0.0004995287550509452, 'samples': 939648, 'steps': 4893, 'loss/train': 2.1097092628479004} -08/30/2021 14:04:37 - INFO - __main__ - Step 4895: {'lr': 0.0004995284293142268, 'samples': 939840, 'steps': 4894, 'loss/train': 1.4850573539733887} -08/30/2021 14:04:37 - INFO - __main__ - Step 4896: {'lr': 0.0004995281034650748, 'samples': 940032, 'steps': 4895, 'loss/train': 2.265522003173828} -08/30/2021 14:04:39 - INFO - __main__ - Step 4897: {'lr': 0.0004995277775034894, 'samples': 940224, 'steps': 4896, 'loss/train': 2.796849250793457} -08/30/2021 14:04:39 - INFO - __main__ - Step 4898: {'lr': 0.0004995274514294706, 'samples': 940416, 'steps': 4897, 'loss/train': 2.3835463523864746} -08/30/2021 14:04:39 - INFO - __main__ - Step 4899: {'lr': 0.0004995271252430184, 'samples': 940608, 'steps': 4898, 'loss/train': 2.095919132232666} -08/30/2021 14:04:40 - INFO - __main__ - Step 4900: {'lr': 0.0004995267989441332, 'samples': 940800, 'steps': 4899, 'loss/train': 2.317500114440918} -08/30/2021 14:04:40 - INFO - __main__ - Step 4901: {'lr': 0.0004995264725328151, 'samples': 940992, 'steps': 4900, 'loss/train': 2.312500476837158} -08/30/2021 14:04:42 - INFO - __main__ - Step 4902: {'lr': 0.0004995261460090644, 'samples': 941184, 'steps': 4901, 'loss/train': 2.338080644607544} -08/30/2021 14:04:42 - INFO - __main__ - Step 4903: {'lr': 0.0004995258193728809, 'samples': 941376, 'steps': 4902, 'loss/train': 2.4022438526153564} -08/30/2021 14:04:43 - INFO - __main__ - Step 4904: {'lr': 0.0004995254926242649, 'samples': 941568, 'steps': 4903, 'loss/train': 1.979127049446106} -08/30/2021 14:04:43 - INFO - __main__ - Step 4905: {'lr': 0.0004995251657632165, 'samples': 941760, 'steps': 4904, 'loss/train': 1.7903000116348267} -08/30/2021 14:04:43 - INFO - __main__ - Step 4906: {'lr': 0.000499524838789736, 'samples': 941952, 'steps': 4905, 'loss/train': 2.0132312774658203} -08/30/2021 14:04:44 - INFO - __main__ - Step 4907: {'lr': 0.0004995245117038235, 'samples': 942144, 'steps': 4906, 'loss/train': 2.653233051300049} -08/30/2021 14:04:45 - INFO - __main__ - Step 4908: {'lr': 0.0004995241845054791, 'samples': 942336, 'steps': 4907, 'loss/train': 6.56795072555542} -08/30/2021 14:04:46 - INFO - __main__ - Step 4909: {'lr': 0.0004995238571947029, 'samples': 942528, 'steps': 4908, 'loss/train': 0.31409645080566406} -08/30/2021 14:04:46 - INFO - __main__ - Step 4910: {'lr': 0.0004995235297714951, 'samples': 942720, 'steps': 4909, 'loss/train': 3.070596694946289} -08/30/2021 14:04:46 - INFO - __main__ - Step 4911: {'lr': 0.0004995232022358559, 'samples': 942912, 'steps': 4910, 'loss/train': 2.411649703979492} -08/30/2021 14:04:47 - INFO - __main__ - Step 4912: {'lr': 0.0004995228745877853, 'samples': 943104, 'steps': 4911, 'loss/train': 2.4639906883239746} -08/30/2021 14:04:48 - INFO - __main__ - Step 4913: {'lr': 0.0004995225468272836, 'samples': 943296, 'steps': 4912, 'loss/train': 2.8082973957061768} -08/30/2021 14:04:49 - INFO - __main__ - Step 4914: {'lr': 0.0004995222189543509, 'samples': 943488, 'steps': 4913, 'loss/train': 2.173126697540283} -08/30/2021 14:04:49 - INFO - __main__ - Step 4915: {'lr': 0.0004995218909689873, 'samples': 943680, 'steps': 4914, 'loss/train': 2.0056076049804688} -08/30/2021 14:04:49 - INFO - __main__ - Step 4916: {'lr': 0.0004995215628711931, 'samples': 943872, 'steps': 4915, 'loss/train': 1.467712640762329} -08/30/2021 14:04:50 - INFO - __main__ - Step 4917: {'lr': 0.0004995212346609682, 'samples': 944064, 'steps': 4916, 'loss/train': 1.1171711683273315} -08/30/2021 14:04:51 - INFO - __main__ - Step 4918: {'lr': 0.0004995209063383129, 'samples': 944256, 'steps': 4917, 'loss/train': 2.1496872901916504} -08/30/2021 14:04:51 - INFO - __main__ - Step 4919: {'lr': 0.0004995205779032274, 'samples': 944448, 'steps': 4918, 'loss/train': 1.7300554513931274} -08/30/2021 14:04:52 - INFO - __main__ - Step 4920: {'lr': 0.0004995202493557118, 'samples': 944640, 'steps': 4919, 'loss/train': 2.637270450592041} -08/30/2021 14:04:52 - INFO - __main__ - Step 4921: {'lr': 0.0004995199206957662, 'samples': 944832, 'steps': 4920, 'loss/train': 2.460200309753418} -08/30/2021 14:04:53 - INFO - __main__ - Step 4922: {'lr': 0.0004995195919233906, 'samples': 945024, 'steps': 4921, 'loss/train': 2.2443785667419434} -08/30/2021 14:04:54 - INFO - __main__ - Step 4923: {'lr': 0.0004995192630385855, 'samples': 945216, 'steps': 4922, 'loss/train': 2.106414556503296} -08/30/2021 14:04:55 - INFO - __main__ - Step 4924: {'lr': 0.0004995189340413509, 'samples': 945408, 'steps': 4923, 'loss/train': 1.873865008354187} -08/30/2021 14:04:55 - INFO - __main__ - Step 4925: {'lr': 0.0004995186049316868, 'samples': 945600, 'steps': 4924, 'loss/train': 1.8414298295974731} -08/30/2021 14:04:55 - INFO - __main__ - Step 4926: {'lr': 0.0004995182757095935, 'samples': 945792, 'steps': 4925, 'loss/train': 2.4885571002960205} -08/30/2021 14:04:56 - INFO - __main__ - Step 4927: {'lr': 0.0004995179463750712, 'samples': 945984, 'steps': 4926, 'loss/train': 2.6049792766571045} -08/30/2021 14:04:57 - INFO - __main__ - Step 4928: {'lr': 0.0004995176169281199, 'samples': 946176, 'steps': 4927, 'loss/train': 2.603942632675171} -08/30/2021 14:04:58 - INFO - __main__ - Step 4929: {'lr': 0.0004995172873687398, 'samples': 946368, 'steps': 4928, 'loss/train': 2.30535626411438} -08/30/2021 14:04:58 - INFO - __main__ - Step 4930: {'lr': 0.0004995169576969311, 'samples': 946560, 'steps': 4929, 'loss/train': 2.0106935501098633} -08/30/2021 14:04:58 - INFO - __main__ - Step 4931: {'lr': 0.0004995166279126938, 'samples': 946752, 'steps': 4930, 'loss/train': 1.7972948551177979} -08/30/2021 14:04:59 - INFO - __main__ - Step 4932: {'lr': 0.0004995162980160283, 'samples': 946944, 'steps': 4931, 'loss/train': 2.1604394912719727} -08/30/2021 14:05:00 - INFO - __main__ - Step 4933: {'lr': 0.0004995159680069346, 'samples': 947136, 'steps': 4932, 'loss/train': 2.5004405975341797} -08/30/2021 14:05:01 - INFO - __main__ - Step 4934: {'lr': 0.0004995156378854127, 'samples': 947328, 'steps': 4933, 'loss/train': 1.1308302879333496} -08/30/2021 14:05:01 - INFO - __main__ - Step 4935: {'lr': 0.000499515307651463, 'samples': 947520, 'steps': 4934, 'loss/train': 2.3879315853118896} -08/30/2021 14:05:01 - INFO - __main__ - Step 4936: {'lr': 0.0004995149773050857, 'samples': 947712, 'steps': 4935, 'loss/train': 2.3608946800231934} -08/30/2021 14:05:02 - INFO - __main__ - Step 4937: {'lr': 0.0004995146468462806, 'samples': 947904, 'steps': 4936, 'loss/train': 2.002999782562256} -08/30/2021 14:05:02 - INFO - __main__ - Step 4938: {'lr': 0.0004995143162750481, 'samples': 948096, 'steps': 4937, 'loss/train': 2.130701780319214} -08/30/2021 14:05:05 - INFO - __main__ - Step 4939: {'lr': 0.0004995139855913883, 'samples': 948288, 'steps': 4938, 'loss/train': 2.4854297637939453} -08/30/2021 14:05:05 - INFO - __main__ - Step 4940: {'lr': 0.0004995136547953014, 'samples': 948480, 'steps': 4939, 'loss/train': 1.814285159111023} -08/30/2021 14:05:05 - INFO - __main__ - Step 4941: {'lr': 0.0004995133238867874, 'samples': 948672, 'steps': 4940, 'loss/train': 2.1046688556671143} -08/30/2021 14:05:06 - INFO - __main__ - Step 4942: {'lr': 0.0004995129928658466, 'samples': 948864, 'steps': 4941, 'loss/train': 2.03877592086792} -08/30/2021 14:05:06 - INFO - __main__ - Step 4943: {'lr': 0.0004995126617324791, 'samples': 949056, 'steps': 4942, 'loss/train': 0.757353663444519} -08/30/2021 14:05:06 - INFO - __main__ - Step 4944: {'lr': 0.000499512330486685, 'samples': 949248, 'steps': 4943, 'loss/train': 0.7588753700256348} -08/30/2021 14:05:08 - INFO - __main__ - Step 4945: {'lr': 0.0004995119991284645, 'samples': 949440, 'steps': 4944, 'loss/train': 2.301693916320801} -08/30/2021 14:05:09 - INFO - __main__ - Step 4946: {'lr': 0.0004995116676578178, 'samples': 949632, 'steps': 4945, 'loss/train': 1.6053683757781982} -08/30/2021 14:05:09 - INFO - __main__ - Step 4947: {'lr': 0.000499511336074745, 'samples': 949824, 'steps': 4946, 'loss/train': 0.3145149052143097} -08/30/2021 14:05:09 - INFO - __main__ - Step 4948: {'lr': 0.0004995110043792462, 'samples': 950016, 'steps': 4947, 'loss/train': 2.001035213470459} -08/30/2021 14:05:10 - INFO - __main__ - Step 4949: {'lr': 0.0004995106725713217, 'samples': 950208, 'steps': 4948, 'loss/train': 2.3597168922424316} -08/30/2021 14:05:11 - INFO - __main__ - Step 4950: {'lr': 0.0004995103406509713, 'samples': 950400, 'steps': 4949, 'loss/train': 2.4153897762298584} -08/30/2021 14:05:12 - INFO - __main__ - Step 4951: {'lr': 0.0004995100086181957, 'samples': 950592, 'steps': 4950, 'loss/train': 2.0533249378204346} -08/30/2021 14:05:12 - INFO - __main__ - Step 4952: {'lr': 0.0004995096764729945, 'samples': 950784, 'steps': 4951, 'loss/train': 2.1157147884368896} -08/30/2021 14:05:13 - INFO - __main__ - Step 4953: {'lr': 0.0004995093442153681, 'samples': 950976, 'steps': 4952, 'loss/train': 2.475590467453003} -08/30/2021 14:05:13 - INFO - __main__ - Step 4954: {'lr': 0.0004995090118453167, 'samples': 951168, 'steps': 4953, 'loss/train': 2.4947054386138916} -08/30/2021 14:05:15 - INFO - __main__ - Step 4955: {'lr': 0.0004995086793628405, 'samples': 951360, 'steps': 4954, 'loss/train': 2.6105780601501465} -08/30/2021 14:05:15 - INFO - __main__ - Step 4956: {'lr': 0.0004995083467679394, 'samples': 951552, 'steps': 4955, 'loss/train': 2.253298282623291} -08/30/2021 14:05:16 - INFO - __main__ - Step 4957: {'lr': 0.0004995080140606137, 'samples': 951744, 'steps': 4956, 'loss/train': 1.762590765953064} -08/30/2021 14:05:16 - INFO - __main__ - Step 4958: {'lr': 0.0004995076812408636, 'samples': 951936, 'steps': 4957, 'loss/train': 1.8989931344985962} -08/30/2021 14:05:16 - INFO - __main__ - Step 4959: {'lr': 0.0004995073483086891, 'samples': 952128, 'steps': 4958, 'loss/train': 2.4466254711151123} -08/30/2021 14:05:17 - INFO - __main__ - Step 4960: {'lr': 0.0004995070152640905, 'samples': 952320, 'steps': 4959, 'loss/train': 1.510615348815918} -08/30/2021 14:05:18 - INFO - __main__ - Step 4961: {'lr': 0.0004995066821070679, 'samples': 952512, 'steps': 4960, 'loss/train': 1.8117167949676514} -08/30/2021 14:05:19 - INFO - __main__ - Step 4962: {'lr': 0.0004995063488376214, 'samples': 952704, 'steps': 4961, 'loss/train': 2.358320713043213} -08/30/2021 14:05:19 - INFO - __main__ - Step 4963: {'lr': 0.0004995060154557513, 'samples': 952896, 'steps': 4962, 'loss/train': 1.8514835834503174} -08/30/2021 14:05:19 - INFO - __main__ - Step 4964: {'lr': 0.0004995056819614575, 'samples': 953088, 'steps': 4963, 'loss/train': 2.4489994049072266} -08/30/2021 14:05:20 - INFO - __main__ - Step 4965: {'lr': 0.0004995053483547404, 'samples': 953280, 'steps': 4964, 'loss/train': 2.4801366329193115} -08/30/2021 14:05:21 - INFO - __main__ - Step 4966: {'lr': 0.0004995050146355999, 'samples': 953472, 'steps': 4965, 'loss/train': 2.4225547313690186} -08/30/2021 14:05:22 - INFO - __main__ - Step 4967: {'lr': 0.0004995046808040363, 'samples': 953664, 'steps': 4966, 'loss/train': 0.32150137424468994} -08/30/2021 14:05:22 - INFO - __main__ - Step 4968: {'lr': 0.0004995043468600499, 'samples': 953856, 'steps': 4967, 'loss/train': 1.9236828088760376} -08/30/2021 14:05:23 - INFO - __main__ - Step 4969: {'lr': 0.0004995040128036405, 'samples': 954048, 'steps': 4968, 'loss/train': 2.0275049209594727} -08/30/2021 14:05:23 - INFO - __main__ - Step 4970: {'lr': 0.0004995036786348086, 'samples': 954240, 'steps': 4969, 'loss/train': 2.2119622230529785} -08/30/2021 14:05:25 - INFO - __main__ - Step 4971: {'lr': 0.0004995033443535541, 'samples': 954432, 'steps': 4970, 'loss/train': 2.1632797718048096} -08/30/2021 14:05:25 - INFO - __main__ - Step 4972: {'lr': 0.0004995030099598773, 'samples': 954624, 'steps': 4971, 'loss/train': 2.516055107116699} -08/30/2021 14:05:25 - INFO - __main__ - Step 4973: {'lr': 0.0004995026754537783, 'samples': 954816, 'steps': 4972, 'loss/train': 3.1148569583892822} -08/30/2021 14:05:26 - INFO - __main__ - Step 4974: {'lr': 0.0004995023408352572, 'samples': 955008, 'steps': 4973, 'loss/train': 2.2369978427886963} -08/30/2021 14:05:26 - INFO - __main__ - Step 4975: {'lr': 0.0004995020061043142, 'samples': 955200, 'steps': 4974, 'loss/train': 2.421145439147949} -08/30/2021 14:05:28 - INFO - __main__ - Step 4976: {'lr': 0.0004995016712609495, 'samples': 955392, 'steps': 4975, 'loss/train': 2.4800565242767334} -08/30/2021 14:05:28 - INFO - __main__ - Step 4977: {'lr': 0.0004995013363051631, 'samples': 955584, 'steps': 4976, 'loss/train': 2.2450156211853027} -08/30/2021 14:05:28 - INFO - __main__ - Step 4978: {'lr': 0.0004995010012369554, 'samples': 955776, 'steps': 4977, 'loss/train': 1.7701746225357056} -08/30/2021 14:05:29 - INFO - __main__ - Step 4979: {'lr': 0.0004995006660563262, 'samples': 955968, 'steps': 4978, 'loss/train': 3.6930694580078125} -08/30/2021 14:05:29 - INFO - __main__ - Step 4980: {'lr': 0.000499500330763276, 'samples': 956160, 'steps': 4979, 'loss/train': 1.9483429193496704} -08/30/2021 14:05:31 - INFO - __main__ - Step 4981: {'lr': 0.0004994999953578048, 'samples': 956352, 'steps': 4980, 'loss/train': 2.2295784950256348} -08/30/2021 14:05:31 - INFO - __main__ - Step 4982: {'lr': 0.0004994996598399127, 'samples': 956544, 'steps': 4981, 'loss/train': 2.3952081203460693} -08/30/2021 14:05:31 - INFO - __main__ - Step 4983: {'lr': 0.0004994993242095999, 'samples': 956736, 'steps': 4982, 'loss/train': 2.151777744293213} -08/30/2021 14:05:32 - INFO - __main__ - Step 4984: {'lr': 0.0004994989884668665, 'samples': 956928, 'steps': 4983, 'loss/train': 1.5608434677124023} -08/30/2021 14:05:32 - INFO - __main__ - Step 4985: {'lr': 0.0004994986526117127, 'samples': 957120, 'steps': 4984, 'loss/train': 3.0511488914489746} -08/30/2021 14:05:34 - INFO - __main__ - Step 4986: {'lr': 0.0004994983166441388, 'samples': 957312, 'steps': 4985, 'loss/train': 1.9915233850479126} -08/30/2021 14:05:34 - INFO - __main__ - Step 4987: {'lr': 0.0004994979805641448, 'samples': 957504, 'steps': 4986, 'loss/train': 2.4051709175109863} -08/30/2021 14:05:35 - INFO - __main__ - Step 4988: {'lr': 0.0004994976443717308, 'samples': 957696, 'steps': 4987, 'loss/train': 2.454705238342285} -08/30/2021 14:05:35 - INFO - __main__ - Step 4989: {'lr': 0.000499497308066897, 'samples': 957888, 'steps': 4988, 'loss/train': 1.88473379611969} -08/30/2021 14:05:36 - INFO - __main__ - Step 4990: {'lr': 0.0004994969716496435, 'samples': 958080, 'steps': 4989, 'loss/train': 1.7168686389923096} -08/30/2021 14:05:36 - INFO - __main__ - Step 4991: {'lr': 0.0004994966351199706, 'samples': 958272, 'steps': 4990, 'loss/train': 2.2099459171295166} -08/30/2021 14:05:38 - INFO - __main__ - Step 4992: {'lr': 0.0004994962984778784, 'samples': 958464, 'steps': 4991, 'loss/train': 1.5991742610931396} -08/30/2021 14:05:38 - INFO - __main__ - Step 4993: {'lr': 0.0004994959617233669, 'samples': 958656, 'steps': 4992, 'loss/train': 2.384688138961792} -08/30/2021 14:05:39 - INFO - __main__ - Step 4994: {'lr': 0.0004994956248564364, 'samples': 958848, 'steps': 4993, 'loss/train': 2.214613914489746} -08/30/2021 14:05:39 - INFO - __main__ - Step 4995: {'lr': 0.000499495287877087, 'samples': 959040, 'steps': 4994, 'loss/train': 1.851972222328186} -08/30/2021 14:05:39 - INFO - __main__ - Step 4996: {'lr': 0.000499494950785319, 'samples': 959232, 'steps': 4995, 'loss/train': 2.390132427215576} -08/30/2021 14:05:41 - INFO - __main__ - Step 4997: {'lr': 0.0004994946135811324, 'samples': 959424, 'steps': 4996, 'loss/train': 2.9583733081817627} -08/30/2021 14:05:41 - INFO - __main__ - Step 4998: {'lr': 0.0004994942762645274, 'samples': 959616, 'steps': 4997, 'loss/train': 2.035806894302368} -08/30/2021 14:05:42 - INFO - __main__ - Step 4999: {'lr': 0.000499493938835504, 'samples': 959808, 'steps': 4998, 'loss/train': 1.8996617794036865} -08/30/2021 14:05:42 - INFO - __main__ - Step 5000: {'lr': 0.0004994936012940626, 'samples': 960000, 'steps': 4999, 'loss/train': 2.6488256454467773} -08/30/2021 14:05:42 - INFO - __main__ - Step 5001: {'lr': 0.0004994932636402031, 'samples': 960192, 'steps': 5000, 'loss/train': 2.4259438514709473} -08/30/2021 14:05:44 - INFO - __main__ - Step 5002: {'lr': 0.000499492925873926, 'samples': 960384, 'steps': 5001, 'loss/train': 2.70697021484375} -08/30/2021 14:05:44 - INFO - __main__ - Step 5003: {'lr': 0.000499492587995231, 'samples': 960576, 'steps': 5002, 'loss/train': 1.759914755821228} -08/30/2021 14:05:45 - INFO - __main__ - Step 5004: {'lr': 0.0004994922500041186, 'samples': 960768, 'steps': 5003, 'loss/train': 2.4683380126953125} -08/30/2021 14:05:45 - INFO - __main__ - Step 5005: {'lr': 0.0004994919119005888, 'samples': 960960, 'steps': 5004, 'loss/train': 3.022188186645508} -08/30/2021 14:05:45 - INFO - __main__ - Step 5006: {'lr': 0.0004994915736846418, 'samples': 961152, 'steps': 5005, 'loss/train': 2.1260223388671875} -08/30/2021 14:05:47 - INFO - __main__ - Step 5007: {'lr': 0.0004994912353562778, 'samples': 961344, 'steps': 5006, 'loss/train': 2.201915740966797} -08/30/2021 14:05:47 - INFO - __main__ - Step 5008: {'lr': 0.0004994908969154968, 'samples': 961536, 'steps': 5007, 'loss/train': 2.3067941665649414} -08/30/2021 14:05:48 - INFO - __main__ - Step 5009: {'lr': 0.0004994905583622992, 'samples': 961728, 'steps': 5008, 'loss/train': 2.307985782623291} -08/30/2021 14:05:48 - INFO - __main__ - Step 5010: {'lr': 0.000499490219696685, 'samples': 961920, 'steps': 5009, 'loss/train': 2.2486019134521484} -08/30/2021 14:05:48 - INFO - __main__ - Step 5011: {'lr': 0.0004994898809186542, 'samples': 962112, 'steps': 5010, 'loss/train': 2.5013742446899414} -08/30/2021 14:05:50 - INFO - __main__ - Step 5012: {'lr': 0.0004994895420282072, 'samples': 962304, 'steps': 5011, 'loss/train': 2.4124350547790527} -08/30/2021 14:05:50 - INFO - __main__ - Step 5013: {'lr': 0.000499489203025344, 'samples': 962496, 'steps': 5012, 'loss/train': 2.271155595779419} -08/30/2021 14:05:51 - INFO - __main__ - Step 5014: {'lr': 0.000499488863910065, 'samples': 962688, 'steps': 5013, 'loss/train': 2.2971246242523193} -08/30/2021 14:05:51 - INFO - __main__ - Step 5015: {'lr': 0.00049948852468237, 'samples': 962880, 'steps': 5014, 'loss/train': 2.2773890495300293} -08/30/2021 14:05:51 - INFO - __main__ - Step 5016: {'lr': 0.0004994881853422594, 'samples': 963072, 'steps': 5015, 'loss/train': 2.1161599159240723} -08/30/2021 14:05:52 - INFO - __main__ - Step 5017: {'lr': 0.0004994878458897332, 'samples': 963264, 'steps': 5016, 'loss/train': 2.326650857925415} -08/30/2021 14:05:53 - INFO - __main__ - Step 5018: {'lr': 0.0004994875063247916, 'samples': 963456, 'steps': 5017, 'loss/train': 2.836604118347168} -08/30/2021 14:05:54 - INFO - __main__ - Step 5019: {'lr': 0.0004994871666474348, 'samples': 963648, 'steps': 5018, 'loss/train': 2.0088050365448} -08/30/2021 14:05:54 - INFO - __main__ - Step 5020: {'lr': 0.000499486826857663, 'samples': 963840, 'steps': 5019, 'loss/train': 1.8153910636901855} -08/30/2021 14:05:54 - INFO - __main__ - Step 5021: {'lr': 0.0004994864869554763, 'samples': 964032, 'steps': 5020, 'loss/train': 2.020601749420166} -08/30/2021 14:05:55 - INFO - __main__ - Step 5022: {'lr': 0.0004994861469408748, 'samples': 964224, 'steps': 5021, 'loss/train': 3.125349998474121} -08/30/2021 14:05:56 - INFO - __main__ - Step 5023: {'lr': 0.0004994858068138587, 'samples': 964416, 'steps': 5022, 'loss/train': 2.310551404953003} -08/30/2021 14:05:57 - INFO - __main__ - Step 5024: {'lr': 0.0004994854665744282, 'samples': 964608, 'steps': 5023, 'loss/train': 2.111747980117798} -08/30/2021 14:05:57 - INFO - __main__ - Step 5025: {'lr': 0.0004994851262225832, 'samples': 964800, 'steps': 5024, 'loss/train': 2.0517771244049072} -08/30/2021 14:05:58 - INFO - __main__ - Step 5026: {'lr': 0.0004994847857583242, 'samples': 964992, 'steps': 5025, 'loss/train': 2.343459367752075} -08/30/2021 14:05:58 - INFO - __main__ - Step 5027: {'lr': 0.0004994844451816512, 'samples': 965184, 'steps': 5026, 'loss/train': 2.186488389968872} -08/30/2021 14:05:58 - INFO - __main__ - Step 5028: {'lr': 0.0004994841044925644, 'samples': 965376, 'steps': 5027, 'loss/train': 2.092644691467285} -08/30/2021 14:06:00 - INFO - __main__ - Step 5029: {'lr': 0.0004994837636910638, 'samples': 965568, 'steps': 5028, 'loss/train': 1.0676257610321045} -08/30/2021 14:06:00 - INFO - __main__ - Step 5030: {'lr': 0.0004994834227771498, 'samples': 965760, 'steps': 5029, 'loss/train': 1.7181196212768555} -08/30/2021 14:06:01 - INFO - __main__ - Step 5031: {'lr': 0.0004994830817508224, 'samples': 965952, 'steps': 5030, 'loss/train': 2.0105507373809814} -08/30/2021 14:06:01 - INFO - __main__ - Step 5032: {'lr': 0.0004994827406120816, 'samples': 966144, 'steps': 5031, 'loss/train': 2.50541615486145} -08/30/2021 14:06:01 - INFO - __main__ - Step 5033: {'lr': 0.0004994823993609279, 'samples': 966336, 'steps': 5032, 'loss/train': 2.1383092403411865} -08/30/2021 14:06:03 - INFO - __main__ - Step 5034: {'lr': 0.0004994820579973612, 'samples': 966528, 'steps': 5033, 'loss/train': 2.203997850418091} -08/30/2021 14:06:03 - INFO - __main__ - Step 5035: {'lr': 0.0004994817165213817, 'samples': 966720, 'steps': 5034, 'loss/train': 1.44949209690094} -08/30/2021 14:06:04 - INFO - __main__ - Step 5036: {'lr': 0.0004994813749329897, 'samples': 966912, 'steps': 5035, 'loss/train': 2.2587904930114746} -08/30/2021 14:06:04 - INFO - __main__ - Step 5037: {'lr': 0.0004994810332321852, 'samples': 967104, 'steps': 5036, 'loss/train': 1.158984661102295} -08/30/2021 14:06:04 - INFO - __main__ - Step 5038: {'lr': 0.0004994806914189684, 'samples': 967296, 'steps': 5037, 'loss/train': 1.4465986490249634} -08/30/2021 14:06:06 - INFO - __main__ - Step 5039: {'lr': 0.0004994803494933394, 'samples': 967488, 'steps': 5038, 'loss/train': 2.1343822479248047} -08/30/2021 14:06:07 - INFO - __main__ - Step 5040: {'lr': 0.0004994800074552985, 'samples': 967680, 'steps': 5039, 'loss/train': 1.92071533203125} -08/30/2021 14:06:07 - INFO - __main__ - Step 5041: {'lr': 0.0004994796653048457, 'samples': 967872, 'steps': 5040, 'loss/train': 1.976090908050537} -08/30/2021 14:06:08 - INFO - __main__ - Step 5042: {'lr': 0.0004994793230419812, 'samples': 968064, 'steps': 5041, 'loss/train': 2.8340530395507812} -08/30/2021 14:06:08 - INFO - __main__ - Step 5043: {'lr': 0.0004994789806667052, 'samples': 968256, 'steps': 5042, 'loss/train': 2.358433246612549} -08/30/2021 14:06:08 - INFO - __main__ - Step 5044: {'lr': 0.0004994786381790178, 'samples': 968448, 'steps': 5043, 'loss/train': 0.569067120552063} -08/30/2021 14:06:09 - INFO - __main__ - Step 5045: {'lr': 0.0004994782955789191, 'samples': 968640, 'steps': 5044, 'loss/train': 2.6374900341033936} -08/30/2021 14:06:10 - INFO - __main__ - Step 5046: {'lr': 0.0004994779528664095, 'samples': 968832, 'steps': 5045, 'loss/train': 1.999448537826538} -08/30/2021 14:06:11 - INFO - __main__ - Step 5047: {'lr': 0.0004994776100414888, 'samples': 969024, 'steps': 5046, 'loss/train': 0.5370808839797974} -08/30/2021 14:06:11 - INFO - __main__ - Step 5048: {'lr': 0.0004994772671041575, 'samples': 969216, 'steps': 5047, 'loss/train': 2.0678257942199707} -08/30/2021 14:06:11 - INFO - __main__ - Step 5049: {'lr': 0.0004994769240544155, 'samples': 969408, 'steps': 5048, 'loss/train': 2.6127657890319824} -08/30/2021 14:06:12 - INFO - __main__ - Step 5050: {'lr': 0.000499476580892263, 'samples': 969600, 'steps': 5049, 'loss/train': 2.5824270248413086} -08/30/2021 14:06:14 - INFO - __main__ - Step 5051: {'lr': 0.0004994762376177004, 'samples': 969792, 'steps': 5050, 'loss/train': 2.197941541671753} -08/30/2021 14:06:14 - INFO - __main__ - Step 5052: {'lr': 0.0004994758942307274, 'samples': 969984, 'steps': 5051, 'loss/train': 1.8828701972961426} -08/30/2021 14:06:14 - INFO - __main__ - Step 5053: {'lr': 0.0004994755507313446, 'samples': 970176, 'steps': 5052, 'loss/train': 2.1294960975646973} -08/30/2021 14:06:15 - INFO - __main__ - Step 5054: {'lr': 0.000499475207119552, 'samples': 970368, 'steps': 5053, 'loss/train': 2.3135781288146973} -08/30/2021 14:06:15 - INFO - __main__ - Step 5055: {'lr': 0.0004994748633953495, 'samples': 970560, 'steps': 5054, 'loss/train': 2.251643180847168} -08/30/2021 14:06:17 - INFO - __main__ - Step 5056: {'lr': 0.0004994745195587376, 'samples': 970752, 'steps': 5055, 'loss/train': 2.17777681350708} -08/30/2021 14:06:17 - INFO - __main__ - Step 5057: {'lr': 0.0004994741756097164, 'samples': 970944, 'steps': 5056, 'loss/train': 2.6799299716949463} -08/30/2021 14:06:18 - INFO - __main__ - Step 5058: {'lr': 0.0004994738315482859, 'samples': 971136, 'steps': 5057, 'loss/train': 2.480123281478882} -08/30/2021 14:06:18 - INFO - __main__ - Step 5059: {'lr': 0.0004994734873744464, 'samples': 971328, 'steps': 5058, 'loss/train': 2.2336738109588623} -08/30/2021 14:06:18 - INFO - __main__ - Step 5060: {'lr': 0.0004994731430881979, 'samples': 971520, 'steps': 5059, 'loss/train': 2.609337091445923} -08/30/2021 14:06:20 - INFO - __main__ - Step 5061: {'lr': 0.0004994727986895408, 'samples': 971712, 'steps': 5060, 'loss/train': 2.3969571590423584} -08/30/2021 14:06:20 - INFO - __main__ - Step 5062: {'lr': 0.0004994724541784749, 'samples': 971904, 'steps': 5061, 'loss/train': 2.1014246940612793} -08/30/2021 14:06:21 - INFO - __main__ - Step 5063: {'lr': 0.0004994721095550008, 'samples': 972096, 'steps': 5062, 'loss/train': 2.0435609817504883} -08/30/2021 14:06:21 - INFO - __main__ - Step 5064: {'lr': 0.0004994717648191182, 'samples': 972288, 'steps': 5063, 'loss/train': 1.364272117614746} -08/30/2021 14:06:21 - INFO - __main__ - Step 5065: {'lr': 0.0004994714199708276, 'samples': 972480, 'steps': 5064, 'loss/train': 3.4123785495758057} -08/30/2021 14:06:23 - INFO - __main__ - Step 5066: {'lr': 0.000499471075010129, 'samples': 972672, 'steps': 5065, 'loss/train': 2.356801986694336} -08/30/2021 14:06:23 - INFO - __main__ - Step 5067: {'lr': 0.0004994707299370226, 'samples': 972864, 'steps': 5066, 'loss/train': 2.198176860809326} -08/30/2021 14:06:23 - INFO - __main__ - Step 5068: {'lr': 0.0004994703847515084, 'samples': 973056, 'steps': 5067, 'loss/train': 1.8925210237503052} -08/30/2021 14:06:24 - INFO - __main__ - Step 5069: {'lr': 0.0004994700394535869, 'samples': 973248, 'steps': 5068, 'loss/train': 2.642307996749878} -08/30/2021 14:06:24 - INFO - __main__ - Step 5070: {'lr': 0.000499469694043258, 'samples': 973440, 'steps': 5069, 'loss/train': 2.5104517936706543} -08/30/2021 14:06:26 - INFO - __main__ - Step 5071: {'lr': 0.0004994693485205218, 'samples': 973632, 'steps': 5070, 'loss/train': 2.400275707244873} -08/30/2021 14:06:26 - INFO - __main__ - Step 5072: {'lr': 0.0004994690028853787, 'samples': 973824, 'steps': 5071, 'loss/train': 2.155043125152588} -08/30/2021 14:06:26 - INFO - __main__ - Step 5073: {'lr': 0.0004994686571378286, 'samples': 974016, 'steps': 5072, 'loss/train': 1.8040902614593506} -08/30/2021 14:06:27 - INFO - __main__ - Step 5074: {'lr': 0.0004994683112778718, 'samples': 974208, 'steps': 5073, 'loss/train': 2.012456178665161} -08/30/2021 14:06:27 - INFO - __main__ - Step 5075: {'lr': 0.0004994679653055085, 'samples': 974400, 'steps': 5074, 'loss/train': 2.6727070808410645} -08/30/2021 14:06:29 - INFO - __main__ - Step 5076: {'lr': 0.0004994676192207387, 'samples': 974592, 'steps': 5075, 'loss/train': 1.9303525686264038} -08/30/2021 14:06:29 - INFO - __main__ - Step 5077: {'lr': 0.0004994672730235626, 'samples': 974784, 'steps': 5076, 'loss/train': 2.28853178024292} -08/30/2021 14:06:30 - INFO - __main__ - Step 5078: {'lr': 0.0004994669267139806, 'samples': 974976, 'steps': 5077, 'loss/train': 1.9448527097702026} -08/30/2021 14:06:30 - INFO - __main__ - Step 5079: {'lr': 0.0004994665802919925, 'samples': 975168, 'steps': 5078, 'loss/train': 1.7412238121032715} -08/30/2021 14:06:30 - INFO - __main__ - Step 5080: {'lr': 0.0004994662337575986, 'samples': 975360, 'steps': 5079, 'loss/train': 1.8150287866592407} -08/30/2021 14:06:31 - INFO - __main__ - Step 5081: {'lr': 0.000499465887110799, 'samples': 975552, 'steps': 5080, 'loss/train': 2.751884698867798} -08/30/2021 14:06:32 - INFO - __main__ - Step 5082: {'lr': 0.0004994655403515941, 'samples': 975744, 'steps': 5081, 'loss/train': 2.125681161880493} -08/30/2021 14:06:33 - INFO - __main__ - Step 5083: {'lr': 0.0004994651934799837, 'samples': 975936, 'steps': 5082, 'loss/train': 2.4222323894500732} -08/30/2021 14:06:33 - INFO - __main__ - Step 5084: {'lr': 0.0004994648464959683, 'samples': 976128, 'steps': 5083, 'loss/train': 2.4969780445098877} -08/30/2021 14:06:33 - INFO - __main__ - Step 5085: {'lr': 0.0004994644993995478, 'samples': 976320, 'steps': 5084, 'loss/train': 2.1790761947631836} -08/30/2021 14:06:34 - INFO - __main__ - Step 5086: {'lr': 0.0004994641521907224, 'samples': 976512, 'steps': 5085, 'loss/train': 2.254190444946289} -08/30/2021 14:06:35 - INFO - __main__ - Step 5087: {'lr': 0.0004994638048694924, 'samples': 976704, 'steps': 5086, 'loss/train': 1.8640891313552856} -08/30/2021 14:06:36 - INFO - __main__ - Step 5088: {'lr': 0.0004994634574358579, 'samples': 976896, 'steps': 5087, 'loss/train': 2.1303329467773438} -08/30/2021 14:06:36 - INFO - __main__ - Step 5089: {'lr': 0.0004994631098898188, 'samples': 977088, 'steps': 5088, 'loss/train': 0.36919113993644714} -08/30/2021 14:06:37 - INFO - __main__ - Step 5090: {'lr': 0.0004994627622313757, 'samples': 977280, 'steps': 5089, 'loss/train': 0.23060260713100433} -08/30/2021 14:06:37 - INFO - __main__ - Step 5091: {'lr': 0.0004994624144605284, 'samples': 977472, 'steps': 5090, 'loss/train': 2.6076836585998535} -08/30/2021 14:06:39 - INFO - __main__ - Step 5092: {'lr': 0.0004994620665772772, 'samples': 977664, 'steps': 5091, 'loss/train': 2.365443468093872} -08/30/2021 14:06:40 - INFO - __main__ - Step 5093: {'lr': 0.0004994617185816222, 'samples': 977856, 'steps': 5092, 'loss/train': 1.8796745538711548} -08/30/2021 14:06:40 - INFO - __main__ - Step 5094: {'lr': 0.0004994613704735638, 'samples': 978048, 'steps': 5093, 'loss/train': 4.509443759918213} -08/30/2021 14:06:40 - INFO - __main__ - Step 5095: {'lr': 0.0004994610222531018, 'samples': 978240, 'steps': 5094, 'loss/train': 1.762518048286438} -08/30/2021 14:06:41 - INFO - __main__ - Step 5096: {'lr': 0.0004994606739202365, 'samples': 978432, 'steps': 5095, 'loss/train': 2.1011953353881836} -08/30/2021 14:06:41 - INFO - __main__ - Step 5097: {'lr': 0.0004994603254749681, 'samples': 978624, 'steps': 5096, 'loss/train': 2.0571515560150146} -08/30/2021 14:06:41 - INFO - __main__ - Step 5098: {'lr': 0.0004994599769172967, 'samples': 978816, 'steps': 5097, 'loss/train': 2.0882222652435303} -08/30/2021 14:06:43 - INFO - __main__ - Step 5099: {'lr': 0.0004994596282472225, 'samples': 979008, 'steps': 5098, 'loss/train': 2.3541228771209717} -08/30/2021 14:06:43 - INFO - __main__ - Step 5100: {'lr': 0.0004994592794647457, 'samples': 979200, 'steps': 5099, 'loss/train': 2.067221164703369} -08/30/2021 14:06:44 - INFO - __main__ - Step 5101: {'lr': 0.0004994589305698663, 'samples': 979392, 'steps': 5100, 'loss/train': 2.012131929397583} -08/30/2021 14:06:44 - INFO - __main__ - Step 5102: {'lr': 0.0004994585815625847, 'samples': 979584, 'steps': 5101, 'loss/train': 2.259871482849121} -08/30/2021 14:06:45 - INFO - __main__ - Step 5103: {'lr': 0.0004994582324429008, 'samples': 979776, 'steps': 5102, 'loss/train': 2.6643753051757812} -08/30/2021 14:06:45 - INFO - __main__ - Step 5104: {'lr': 0.0004994578832108148, 'samples': 979968, 'steps': 5103, 'loss/train': 2.388671636581421} -08/30/2021 14:06:47 - INFO - __main__ - Step 5105: {'lr': 0.000499457533866327, 'samples': 980160, 'steps': 5104, 'loss/train': 1.8212487697601318} -08/30/2021 14:06:48 - INFO - __main__ - Step 5106: {'lr': 0.0004994571844094375, 'samples': 980352, 'steps': 5105, 'loss/train': 1.160867691040039} -08/30/2021 14:06:48 - INFO - __main__ - Step 5107: {'lr': 0.0004994568348401466, 'samples': 980544, 'steps': 5106, 'loss/train': 2.539199113845825} -08/30/2021 14:06:48 - INFO - __main__ - Step 5108: {'lr': 0.0004994564851584541, 'samples': 980736, 'steps': 5107, 'loss/train': 2.3143012523651123} -08/30/2021 14:06:49 - INFO - __main__ - Step 5109: {'lr': 0.0004994561353643604, 'samples': 980928, 'steps': 5108, 'loss/train': 1.984595537185669} -08/30/2021 14:06:50 - INFO - __main__ - Step 5110: {'lr': 0.0004994557854578656, 'samples': 981120, 'steps': 5109, 'loss/train': 2.503065586090088} -08/30/2021 14:06:51 - INFO - __main__ - Step 5111: {'lr': 0.0004994554354389699, 'samples': 981312, 'steps': 5110, 'loss/train': 2.485055685043335} -08/30/2021 14:06:51 - INFO - __main__ - Step 5112: {'lr': 0.0004994550853076734, 'samples': 981504, 'steps': 5111, 'loss/train': 2.0640735626220703} -08/30/2021 14:06:51 - INFO - __main__ - Step 5113: {'lr': 0.0004994547350639764, 'samples': 981696, 'steps': 5112, 'loss/train': 2.373863935470581} -08/30/2021 14:06:52 - INFO - __main__ - Step 5114: {'lr': 0.0004994543847078787, 'samples': 981888, 'steps': 5113, 'loss/train': 2.16861629486084} -08/30/2021 14:06:53 - INFO - __main__ - Step 5115: {'lr': 0.000499454034239381, 'samples': 982080, 'steps': 5114, 'loss/train': 2.0705621242523193} -08/30/2021 14:06:54 - INFO - __main__ - Step 5116: {'lr': 0.000499453683658483, 'samples': 982272, 'steps': 5115, 'loss/train': 2.169928789138794} -08/30/2021 14:06:54 - INFO - __main__ - Step 5117: {'lr': 0.0004994533329651849, 'samples': 982464, 'steps': 5116, 'loss/train': 2.4235708713531494} -08/30/2021 14:06:55 - INFO - __main__ - Step 5118: {'lr': 0.0004994529821594872, 'samples': 982656, 'steps': 5117, 'loss/train': 2.439915180206299} -08/30/2021 14:06:55 - INFO - __main__ - Step 5119: {'lr': 0.0004994526312413897, 'samples': 982848, 'steps': 5118, 'loss/train': 2.178100824356079} -08/30/2021 14:06:56 - INFO - __main__ - Step 5120: {'lr': 0.0004994522802108927, 'samples': 983040, 'steps': 5119, 'loss/train': 2.2076311111450195} -08/30/2021 14:06:57 - INFO - __main__ - Step 5121: {'lr': 0.0004994519290679964, 'samples': 983232, 'steps': 5120, 'loss/train': 2.2335612773895264} -08/30/2021 14:06:57 - INFO - __main__ - Step 5122: {'lr': 0.0004994515778127009, 'samples': 983424, 'steps': 5121, 'loss/train': 2.0980303287506104} -08/30/2021 14:06:58 - INFO - __main__ - Step 5123: {'lr': 0.0004994512264450064, 'samples': 983616, 'steps': 5122, 'loss/train': 2.24619460105896} -08/30/2021 14:06:58 - INFO - __main__ - Step 5124: {'lr': 0.000499450874964913, 'samples': 983808, 'steps': 5123, 'loss/train': 2.405144214630127} -08/30/2021 14:06:58 - INFO - __main__ - Step 5125: {'lr': 0.000499450523372421, 'samples': 984000, 'steps': 5124, 'loss/train': 1.82676362991333} -08/30/2021 14:07:00 - INFO - __main__ - Step 5126: {'lr': 0.0004994501716675303, 'samples': 984192, 'steps': 5125, 'loss/train': 2.571577310562134} -08/30/2021 14:07:00 - INFO - __main__ - Step 5127: {'lr': 0.0004994498198502412, 'samples': 984384, 'steps': 5126, 'loss/train': 2.3094050884246826} -08/30/2021 14:07:01 - INFO - __main__ - Step 5128: {'lr': 0.0004994494679205539, 'samples': 984576, 'steps': 5127, 'loss/train': 2.3609585762023926} -08/30/2021 14:07:01 - INFO - __main__ - Step 5129: {'lr': 0.0004994491158784684, 'samples': 984768, 'steps': 5128, 'loss/train': 2.3722198009490967} -08/30/2021 14:07:02 - INFO - __main__ - Step 5130: {'lr': 0.0004994487637239851, 'samples': 984960, 'steps': 5129, 'loss/train': 2.0476746559143066} -08/30/2021 14:07:03 - INFO - __main__ - Step 5131: {'lr': 0.0004994484114571041, 'samples': 985152, 'steps': 5130, 'loss/train': 2.3820438385009766} -08/30/2021 14:07:03 - INFO - __main__ - Step 5132: {'lr': 0.0004994480590778254, 'samples': 985344, 'steps': 5131, 'loss/train': 1.8114874362945557} -08/30/2021 14:07:04 - INFO - __main__ - Step 5133: {'lr': 0.0004994477065861493, 'samples': 985536, 'steps': 5132, 'loss/train': 2.685075521469116} -08/30/2021 14:07:04 - INFO - __main__ - Step 5134: {'lr': 0.0004994473539820758, 'samples': 985728, 'steps': 5133, 'loss/train': 2.043989419937134} -08/30/2021 14:07:04 - INFO - __main__ - Step 5135: {'lr': 0.0004994470012656052, 'samples': 985920, 'steps': 5134, 'loss/train': 2.3362574577331543} -08/30/2021 14:07:06 - INFO - __main__ - Step 5136: {'lr': 0.0004994466484367378, 'samples': 986112, 'steps': 5135, 'loss/train': 2.7829253673553467} -08/30/2021 14:07:07 - INFO - __main__ - Step 5137: {'lr': 0.0004994462954954734, 'samples': 986304, 'steps': 5136, 'loss/train': 2.145165205001831} -08/30/2021 14:07:07 - INFO - __main__ - Step 5138: {'lr': 0.0004994459424418125, 'samples': 986496, 'steps': 5137, 'loss/train': 1.6925978660583496} -08/30/2021 14:07:07 - INFO - __main__ - Step 5139: {'lr': 0.000499445589275755, 'samples': 986688, 'steps': 5138, 'loss/train': 2.0861947536468506} -08/30/2021 14:07:08 - INFO - __main__ - Step 5140: {'lr': 0.0004994452359973012, 'samples': 986880, 'steps': 5139, 'loss/train': 2.047111749649048} -08/30/2021 14:07:09 - INFO - __main__ - Step 5141: {'lr': 0.0004994448826064512, 'samples': 987072, 'steps': 5140, 'loss/train': 1.8532780408859253} -08/30/2021 14:07:10 - INFO - __main__ - Step 5142: {'lr': 0.0004994445291032053, 'samples': 987264, 'steps': 5141, 'loss/train': 1.6752511262893677} -08/30/2021 14:07:10 - INFO - __main__ - Step 5143: {'lr': 0.0004994441754875634, 'samples': 987456, 'steps': 5142, 'loss/train': 1.545415997505188} -08/30/2021 14:07:11 - INFO - __main__ - Step 5144: {'lr': 0.0004994438217595259, 'samples': 987648, 'steps': 5143, 'loss/train': 2.0602314472198486} -08/30/2021 14:07:11 - INFO - __main__ - Step 5145: {'lr': 0.0004994434679190928, 'samples': 987840, 'steps': 5144, 'loss/train': 2.4933364391326904} -08/30/2021 14:07:11 - INFO - __main__ - Step 5146: {'lr': 0.0004994431139662643, 'samples': 988032, 'steps': 5145, 'loss/train': 0.6041566133499146} -08/30/2021 14:07:12 - INFO - __main__ - Step 5147: {'lr': 0.0004994427599010406, 'samples': 988224, 'steps': 5146, 'loss/train': 2.0003671646118164} -08/30/2021 14:07:13 - INFO - __main__ - Step 5148: {'lr': 0.0004994424057234219, 'samples': 988416, 'steps': 5147, 'loss/train': 2.1199288368225098} -08/30/2021 14:07:14 - INFO - __main__ - Step 5149: {'lr': 0.0004994420514334082, 'samples': 988608, 'steps': 5148, 'loss/train': 2.1466615200042725} -08/30/2021 14:07:14 - INFO - __main__ - Step 5150: {'lr': 0.0004994416970309999, 'samples': 988800, 'steps': 5149, 'loss/train': 2.6275534629821777} -08/30/2021 14:07:15 - INFO - __main__ - Step 5151: {'lr': 0.0004994413425161969, 'samples': 988992, 'steps': 5150, 'loss/train': 1.93808114528656} -08/30/2021 14:07:15 - INFO - __main__ - Step 5152: {'lr': 0.0004994409878889995, 'samples': 989184, 'steps': 5151, 'loss/train': 1.8684135675430298} -08/30/2021 14:07:16 - INFO - __main__ - Step 5153: {'lr': 0.0004994406331494079, 'samples': 989376, 'steps': 5152, 'loss/train': 3.0381879806518555} -08/30/2021 14:07:17 - INFO - __main__ - Step 5154: {'lr': 0.0004994402782974222, 'samples': 989568, 'steps': 5153, 'loss/train': 2.2175939083099365} -08/30/2021 14:07:17 - INFO - __main__ - Step 5155: {'lr': 0.0004994399233330426, 'samples': 989760, 'steps': 5154, 'loss/train': 2.338268280029297} -08/30/2021 14:07:18 - INFO - __main__ - Step 5156: {'lr': 0.000499439568256269, 'samples': 989952, 'steps': 5155, 'loss/train': 2.682722568511963} -08/30/2021 14:07:18 - INFO - __main__ - Step 5157: {'lr': 0.000499439213067102, 'samples': 990144, 'steps': 5156, 'loss/train': 1.8515269756317139} -08/30/2021 14:07:18 - INFO - __main__ - Step 5158: {'lr': 0.0004994388577655415, 'samples': 990336, 'steps': 5157, 'loss/train': 1.8539119958877563} -08/30/2021 14:07:21 - INFO - __main__ - Step 5159: {'lr': 0.0004994385023515876, 'samples': 990528, 'steps': 5158, 'loss/train': 2.0890052318573} -08/30/2021 14:07:21 - INFO - __main__ - Step 5160: {'lr': 0.0004994381468252406, 'samples': 990720, 'steps': 5159, 'loss/train': 0.3400194048881531} -08/30/2021 14:07:21 - INFO - __main__ - Step 5161: {'lr': 0.0004994377911865007, 'samples': 990912, 'steps': 5160, 'loss/train': 2.185608386993408} -08/30/2021 14:07:22 - INFO - __main__ - Step 5162: {'lr': 0.0004994374354353679, 'samples': 991104, 'steps': 5161, 'loss/train': 1.9886928796768188} -08/30/2021 14:07:22 - INFO - __main__ - Step 5163: {'lr': 0.0004994370795718425, 'samples': 991296, 'steps': 5162, 'loss/train': 2.439370632171631} -08/30/2021 14:07:23 - INFO - __main__ - Step 5164: {'lr': 0.0004994367235959245, 'samples': 991488, 'steps': 5163, 'loss/train': 3.3344357013702393} -08/30/2021 14:07:24 - INFO - __main__ - Step 5165: {'lr': 0.0004994363675076143, 'samples': 991680, 'steps': 5164, 'loss/train': 2.0596539974212646} -08/30/2021 14:07:24 - INFO - __main__ - Step 5166: {'lr': 0.0004994360113069118, 'samples': 991872, 'steps': 5165, 'loss/train': 2.35343074798584} -08/30/2021 14:07:25 - INFO - __main__ - Step 5167: {'lr': 0.0004994356549938173, 'samples': 992064, 'steps': 5166, 'loss/train': 1.1098432540893555} -08/30/2021 14:07:25 - INFO - __main__ - Step 5168: {'lr': 0.000499435298568331, 'samples': 992256, 'steps': 5167, 'loss/train': 2.6775572299957275} -08/30/2021 14:07:27 - INFO - __main__ - Step 5169: {'lr': 0.000499434942030453, 'samples': 992448, 'steps': 5168, 'loss/train': 1.8229023218154907} -08/30/2021 14:07:27 - INFO - __main__ - Step 5170: {'lr': 0.0004994345853801834, 'samples': 992640, 'steps': 5169, 'loss/train': 2.324307918548584} -08/30/2021 14:07:27 - INFO - __main__ - Step 5171: {'lr': 0.0004994342286175225, 'samples': 992832, 'steps': 5170, 'loss/train': 1.863842248916626} -08/30/2021 14:07:28 - INFO - __main__ - Step 5172: {'lr': 0.0004994338717424704, 'samples': 993024, 'steps': 5171, 'loss/train': 0.31887251138687134} -08/30/2021 14:07:28 - INFO - __main__ - Step 5173: {'lr': 0.0004994335147550272, 'samples': 993216, 'steps': 5172, 'loss/train': 1.6892577409744263} -08/30/2021 14:07:30 - INFO - __main__ - Step 5174: {'lr': 0.0004994331576551931, 'samples': 993408, 'steps': 5173, 'loss/train': 1.34635591506958} -08/30/2021 14:07:30 - INFO - __main__ - Step 5175: {'lr': 0.0004994328004429683, 'samples': 993600, 'steps': 5174, 'loss/train': 1.6297293901443481} -08/30/2021 14:07:30 - INFO - __main__ - Step 5176: {'lr': 0.000499432443118353, 'samples': 993792, 'steps': 5175, 'loss/train': 2.1387791633605957} -08/30/2021 14:07:31 - INFO - __main__ - Step 5177: {'lr': 0.0004994320856813471, 'samples': 993984, 'steps': 5176, 'loss/train': 2.3840878009796143} -08/30/2021 14:07:31 - INFO - __main__ - Step 5178: {'lr': 0.000499431728131951, 'samples': 994176, 'steps': 5177, 'loss/train': 2.0232748985290527} -08/30/2021 14:07:33 - INFO - __main__ - Step 5179: {'lr': 0.0004994313704701648, 'samples': 994368, 'steps': 5178, 'loss/train': 1.6016216278076172} -08/30/2021 14:07:33 - INFO - __main__ - Step 5180: {'lr': 0.0004994310126959887, 'samples': 994560, 'steps': 5179, 'loss/train': 1.867646336555481} -08/30/2021 14:07:34 - INFO - __main__ - Step 5181: {'lr': 0.000499430654809423, 'samples': 994752, 'steps': 5180, 'loss/train': 2.151320695877075} -08/30/2021 14:07:34 - INFO - __main__ - Step 5182: {'lr': 0.0004994302968104675, 'samples': 994944, 'steps': 5181, 'loss/train': 1.1911743879318237} -08/30/2021 14:07:34 - INFO - __main__ - Step 5183: {'lr': 0.0004994299386991227, 'samples': 995136, 'steps': 5182, 'loss/train': 2.3783390522003174} -08/30/2021 14:07:36 - INFO - __main__ - Step 5184: {'lr': 0.0004994295804753885, 'samples': 995328, 'steps': 5183, 'loss/train': 1.7106528282165527} -08/30/2021 14:07:37 - INFO - __main__ - Step 5185: {'lr': 0.0004994292221392652, 'samples': 995520, 'steps': 5184, 'loss/train': 2.477846145629883} -08/30/2021 14:07:37 - INFO - __main__ - Step 5186: {'lr': 0.000499428863690753, 'samples': 995712, 'steps': 5185, 'loss/train': 1.889315128326416} -08/30/2021 14:07:37 - INFO - __main__ - Step 5187: {'lr': 0.0004994285051298519, 'samples': 995904, 'steps': 5186, 'loss/train': 1.52708899974823} -08/30/2021 14:07:38 - INFO - __main__ - Step 5188: {'lr': 0.0004994281464565623, 'samples': 996096, 'steps': 5187, 'loss/train': 2.420551061630249} -08/30/2021 14:07:39 - INFO - __main__ - Step 5189: {'lr': 0.0004994277876708841, 'samples': 996288, 'steps': 5188, 'loss/train': 2.140460729598999} -08/30/2021 14:07:40 - INFO - __main__ - Step 5190: {'lr': 0.0004994274287728177, 'samples': 996480, 'steps': 5189, 'loss/train': 2.421818733215332} -08/30/2021 14:07:40 - INFO - __main__ - Step 5191: {'lr': 0.0004994270697623631, 'samples': 996672, 'steps': 5190, 'loss/train': 2.2945523262023926} -08/30/2021 14:07:40 - INFO - __main__ - Step 5192: {'lr': 0.0004994267106395205, 'samples': 996864, 'steps': 5191, 'loss/train': 2.2751009464263916} -08/30/2021 14:07:41 - INFO - __main__ - Step 5193: {'lr': 0.0004994263514042901, 'samples': 997056, 'steps': 5192, 'loss/train': 2.1930885314941406} -08/30/2021 14:07:42 - INFO - __main__ - Step 5194: {'lr': 0.0004994259920566719, 'samples': 997248, 'steps': 5193, 'loss/train': 2.067279815673828} -08/30/2021 14:07:42 - INFO - __main__ - Step 5195: {'lr': 0.0004994256325966663, 'samples': 997440, 'steps': 5194, 'loss/train': 2.3864243030548096} -08/30/2021 14:07:43 - INFO - __main__ - Step 5196: {'lr': 0.0004994252730242734, 'samples': 997632, 'steps': 5195, 'loss/train': 1.791703701019287} -08/30/2021 14:07:43 - INFO - __main__ - Step 5197: {'lr': 0.0004994249133394933, 'samples': 997824, 'steps': 5196, 'loss/train': 2.1101086139678955} -08/30/2021 14:07:44 - INFO - __main__ - Step 5198: {'lr': 0.0004994245535423262, 'samples': 998016, 'steps': 5197, 'loss/train': 2.9943315982818604} -08/30/2021 14:07:45 - INFO - __main__ - Step 5199: {'lr': 0.0004994241936327722, 'samples': 998208, 'steps': 5198, 'loss/train': 2.202904224395752} -08/30/2021 14:07:45 - INFO - __main__ - Step 5200: {'lr': 0.0004994238336108315, 'samples': 998400, 'steps': 5199, 'loss/train': 2.7223398685455322} -08/30/2021 14:07:46 - INFO - __main__ - Step 5201: {'lr': 0.0004994234734765043, 'samples': 998592, 'steps': 5200, 'loss/train': 1.8800334930419922} -08/30/2021 14:07:46 - INFO - __main__ - Step 5202: {'lr': 0.0004994231132297907, 'samples': 998784, 'steps': 5201, 'loss/train': 2.0159521102905273} -08/30/2021 14:07:47 - INFO - __main__ - Step 5203: {'lr': 0.0004994227528706909, 'samples': 998976, 'steps': 5202, 'loss/train': 1.6396052837371826} -08/30/2021 14:07:47 - INFO - __main__ - Step 5204: {'lr': 0.0004994223923992052, 'samples': 999168, 'steps': 5203, 'loss/train': 1.8067177534103394} -08/30/2021 14:07:49 - INFO - __main__ - Step 5205: {'lr': 0.0004994220318153334, 'samples': 999360, 'steps': 5204, 'loss/train': 1.9630169868469238} -08/30/2021 14:07:49 - INFO - __main__ - Step 5206: {'lr': 0.000499421671119076, 'samples': 999552, 'steps': 5205, 'loss/train': 2.928579568862915} -08/30/2021 14:07:49 - INFO - __main__ - Step 5207: {'lr': 0.0004994213103104331, 'samples': 999744, 'steps': 5206, 'loss/train': 0.20592327415943146} -08/30/2021 14:07:50 - INFO - __main__ - Step 5208: {'lr': 0.0004994209493894046, 'samples': 999936, 'steps': 5207, 'loss/train': 1.9329336881637573} -08/30/2021 14:07:50 - INFO - __main__ - Step 5209: {'lr': 0.000499420588355991, 'samples': 1000128, 'steps': 5208, 'loss/train': 1.758858323097229} -08/30/2021 14:07:52 - INFO - __main__ - Step 5210: {'lr': 0.0004994202272101923, 'samples': 1000320, 'steps': 5209, 'loss/train': 1.7124828100204468} -08/30/2021 14:07:53 - INFO - __main__ - Step 5211: {'lr': 0.0004994198659520087, 'samples': 1000512, 'steps': 5210, 'loss/train': 1.8692842721939087} -08/30/2021 14:07:53 - INFO - __main__ - Step 5212: {'lr': 0.0004994195045814404, 'samples': 1000704, 'steps': 5211, 'loss/train': 1.556260108947754} -08/30/2021 14:07:54 - INFO - __main__ - Step 5213: {'lr': 0.0004994191430984876, 'samples': 1000896, 'steps': 5212, 'loss/train': 2.590009927749634} -08/30/2021 14:07:54 - INFO - __main__ - Step 5214: {'lr': 0.0004994187815031502, 'samples': 1001088, 'steps': 5213, 'loss/train': 1.8999031782150269} -08/30/2021 14:07:56 - INFO - __main__ - Step 5215: {'lr': 0.0004994184197954286, 'samples': 1001280, 'steps': 5214, 'loss/train': 1.627764105796814} -08/30/2021 14:07:56 - INFO - __main__ - Step 5216: {'lr': 0.000499418057975323, 'samples': 1001472, 'steps': 5215, 'loss/train': 1.9653759002685547} -08/30/2021 14:07:57 - INFO - __main__ - Step 5217: {'lr': 0.0004994176960428333, 'samples': 1001664, 'steps': 5216, 'loss/train': 0.42130613327026367} -08/30/2021 14:07:57 - INFO - __main__ - Step 5218: {'lr': 0.00049941733399796, 'samples': 1001856, 'steps': 5217, 'loss/train': 2.122182607650757} -08/30/2021 14:07:57 - INFO - __main__ - Step 5219: {'lr': 0.000499416971840703, 'samples': 1002048, 'steps': 5218, 'loss/train': 1.9193789958953857} -08/30/2021 14:07:59 - INFO - __main__ - Step 5220: {'lr': 0.0004994166095710626, 'samples': 1002240, 'steps': 5219, 'loss/train': 1.726962924003601} -08/30/2021 14:07:59 - INFO - __main__ - Step 5221: {'lr': 0.000499416247189039, 'samples': 1002432, 'steps': 5220, 'loss/train': 2.058763027191162} -08/30/2021 14:08:00 - INFO - __main__ - Step 5222: {'lr': 0.0004994158846946321, 'samples': 1002624, 'steps': 5221, 'loss/train': 2.678605079650879} -08/30/2021 14:08:00 - INFO - __main__ - Step 5223: {'lr': 0.0004994155220878425, 'samples': 1002816, 'steps': 5222, 'loss/train': 1.7736533880233765} -08/30/2021 14:08:00 - INFO - __main__ - Step 5224: {'lr': 0.0004994151593686699, 'samples': 1003008, 'steps': 5223, 'loss/train': 2.163242816925049} -08/30/2021 14:08:02 - INFO - __main__ - Step 5225: {'lr': 0.0004994147965371147, 'samples': 1003200, 'steps': 5224, 'loss/train': 2.59200119972229} -08/30/2021 14:08:02 - INFO - __main__ - Step 5226: {'lr': 0.0004994144335931772, 'samples': 1003392, 'steps': 5225, 'loss/train': 1.7423933744430542} -08/30/2021 14:08:03 - INFO - __main__ - Step 5227: {'lr': 0.0004994140705368573, 'samples': 1003584, 'steps': 5226, 'loss/train': 2.2525906562805176} -08/30/2021 14:08:03 - INFO - __main__ - Step 5228: {'lr': 0.0004994137073681552, 'samples': 1003776, 'steps': 5227, 'loss/train': 2.3387978076934814} -08/30/2021 14:08:03 - INFO - __main__ - Step 5229: {'lr': 0.0004994133440870712, 'samples': 1003968, 'steps': 5228, 'loss/train': 2.445462942123413} -08/30/2021 14:08:05 - INFO - __main__ - Step 5230: {'lr': 0.0004994129806936054, 'samples': 1004160, 'steps': 5229, 'loss/train': 0.27603963017463684} -08/30/2021 14:08:05 - INFO - __main__ - Step 5231: {'lr': 0.000499412617187758, 'samples': 1004352, 'steps': 5230, 'loss/train': 2.800638437271118} -08/30/2021 14:08:06 - INFO - __main__ - Step 5232: {'lr': 0.0004994122535695291, 'samples': 1004544, 'steps': 5231, 'loss/train': 1.6900337934494019} -08/30/2021 14:08:06 - INFO - __main__ - Step 5233: {'lr': 0.0004994118898389189, 'samples': 1004736, 'steps': 5232, 'loss/train': 2.201263189315796} -08/30/2021 14:08:06 - INFO - __main__ - Step 5234: {'lr': 0.0004994115259959274, 'samples': 1004928, 'steps': 5233, 'loss/train': 2.0528626441955566} -08/30/2021 14:08:08 - INFO - __main__ - Step 5235: {'lr': 0.0004994111620405551, 'samples': 1005120, 'steps': 5234, 'loss/train': 1.8250207901000977} -08/30/2021 14:08:09 - INFO - __main__ - Step 5236: {'lr': 0.0004994107979728019, 'samples': 1005312, 'steps': 5235, 'loss/train': 2.6029181480407715} -08/30/2021 14:08:09 - INFO - __main__ - Step 5237: {'lr': 0.0004994104337926681, 'samples': 1005504, 'steps': 5236, 'loss/train': 0.3338676393032074} -08/30/2021 14:08:09 - INFO - __main__ - Step 5238: {'lr': 0.0004994100695001537, 'samples': 1005696, 'steps': 5237, 'loss/train': 1.8283063173294067} -08/30/2021 14:08:10 - INFO - __main__ - Step 5239: {'lr': 0.0004994097050952591, 'samples': 1005888, 'steps': 5238, 'loss/train': 2.0244762897491455} -08/30/2021 14:08:10 - INFO - __main__ - Step 5240: {'lr': 0.0004994093405779842, 'samples': 1006080, 'steps': 5239, 'loss/train': 1.7621753215789795} -08/30/2021 14:08:11 - INFO - __main__ - Step 5241: {'lr': 0.0004994089759483294, 'samples': 1006272, 'steps': 5240, 'loss/train': 2.115987777709961} -08/30/2021 14:08:12 - INFO - __main__ - Step 5242: {'lr': 0.0004994086112062948, 'samples': 1006464, 'steps': 5241, 'loss/train': 2.5955007076263428} -08/30/2021 14:08:12 - INFO - __main__ - Step 5243: {'lr': 0.0004994082463518804, 'samples': 1006656, 'steps': 5242, 'loss/train': 1.8649080991744995} -08/30/2021 14:08:13 - INFO - __main__ - Step 5244: {'lr': 0.0004994078813850865, 'samples': 1006848, 'steps': 5243, 'loss/train': 2.2834858894348145} -08/30/2021 14:08:13 - INFO - __main__ - Step 5245: {'lr': 0.0004994075163059134, 'samples': 1007040, 'steps': 5244, 'loss/train': 1.4247674942016602} -08/30/2021 14:08:15 - INFO - __main__ - Step 5246: {'lr': 0.0004994071511143609, 'samples': 1007232, 'steps': 5245, 'loss/train': 1.9448771476745605} -08/30/2021 14:08:15 - INFO - __main__ - Step 5247: {'lr': 0.0004994067858104296, 'samples': 1007424, 'steps': 5246, 'loss/train': 2.3362410068511963} -08/30/2021 14:08:15 - INFO - __main__ - Step 5248: {'lr': 0.0004994064203941195, 'samples': 1007616, 'steps': 5247, 'loss/train': 1.9038634300231934} -08/30/2021 14:08:16 - INFO - __main__ - Step 5249: {'lr': 0.0004994060548654304, 'samples': 1007808, 'steps': 5248, 'loss/train': 2.086329460144043} -08/30/2021 14:08:16 - INFO - __main__ - Step 5250: {'lr': 0.000499405689224363, 'samples': 1008000, 'steps': 5249, 'loss/train': 1.9584294557571411} -08/30/2021 14:08:17 - INFO - __main__ - Step 5251: {'lr': 0.0004994053234709172, 'samples': 1008192, 'steps': 5250, 'loss/train': 2.260010242462158} -08/30/2021 14:08:18 - INFO - __main__ - Step 5252: {'lr': 0.0004994049576050933, 'samples': 1008384, 'steps': 5251, 'loss/train': 2.1873691082000732} -08/30/2021 14:08:18 - INFO - __main__ - Step 5253: {'lr': 0.0004994045916268913, 'samples': 1008576, 'steps': 5252, 'loss/train': 1.9193403720855713} -08/30/2021 14:08:19 - INFO - __main__ - Step 5254: {'lr': 0.0004994042255363115, 'samples': 1008768, 'steps': 5253, 'loss/train': 2.6118009090423584} -08/30/2021 14:08:19 - INFO - __main__ - Step 5255: {'lr': 0.0004994038593333539, 'samples': 1008960, 'steps': 5254, 'loss/train': 2.529608726501465} -08/30/2021 14:08:21 - INFO - __main__ - Step 5256: {'lr': 0.0004994034930180188, 'samples': 1009152, 'steps': 5255, 'loss/train': 2.4949984550476074} -08/30/2021 14:08:21 - INFO - __main__ - Step 5257: {'lr': 0.0004994031265903063, 'samples': 1009344, 'steps': 5256, 'loss/train': 2.3542065620422363} -08/30/2021 14:08:21 - INFO - __main__ - Step 5258: {'lr': 0.0004994027600502167, 'samples': 1009536, 'steps': 5257, 'loss/train': 0.22891099750995636} -08/30/2021 14:08:22 - INFO - __main__ - Step 5259: {'lr': 0.00049940239339775, 'samples': 1009728, 'steps': 5258, 'loss/train': 1.789426565170288} -08/30/2021 14:08:22 - INFO - __main__ - Step 5260: {'lr': 0.0004994020266329064, 'samples': 1009920, 'steps': 5259, 'loss/train': 1.8118581771850586} -08/30/2021 14:08:24 - INFO - __main__ - Step 5261: {'lr': 0.0004994016597556862, 'samples': 1010112, 'steps': 5260, 'loss/train': 2.465618371963501} -08/30/2021 14:08:25 - INFO - __main__ - Step 5262: {'lr': 0.0004994012927660894, 'samples': 1010304, 'steps': 5261, 'loss/train': 3.0062427520751953} -08/30/2021 14:08:25 - INFO - __main__ - Step 5263: {'lr': 0.0004994009256641162, 'samples': 1010496, 'steps': 5262, 'loss/train': 2.997375249862671} -08/30/2021 14:08:25 - INFO - __main__ - Step 5264: {'lr': 0.0004994005584497667, 'samples': 1010688, 'steps': 5263, 'loss/train': 1.7763981819152832} -08/30/2021 14:08:26 - INFO - __main__ - Step 5265: {'lr': 0.0004994001911230413, 'samples': 1010880, 'steps': 5264, 'loss/train': 2.640120029449463} -08/30/2021 14:08:26 - INFO - __main__ - Step 5266: {'lr': 0.00049939982368394, 'samples': 1011072, 'steps': 5265, 'loss/train': 2.1227917671203613} -08/30/2021 14:08:28 - INFO - __main__ - Step 5267: {'lr': 0.000499399456132463, 'samples': 1011264, 'steps': 5266, 'loss/train': 2.0941662788391113} -08/30/2021 14:08:29 - INFO - __main__ - Step 5268: {'lr': 0.0004993990884686105, 'samples': 1011456, 'steps': 5267, 'loss/train': 2.4199488162994385} -08/30/2021 14:08:29 - INFO - __main__ - Step 5269: {'lr': 0.0004993987206923825, 'samples': 1011648, 'steps': 5268, 'loss/train': 6.3083415031433105} -08/30/2021 14:08:29 - INFO - __main__ - Step 5270: {'lr': 0.0004993983528037793, 'samples': 1011840, 'steps': 5269, 'loss/train': 1.8794220685958862} -08/30/2021 14:08:30 - INFO - __main__ - Step 5271: {'lr': 0.0004993979848028011, 'samples': 1012032, 'steps': 5270, 'loss/train': 2.3997039794921875} -08/30/2021 14:08:30 - INFO - __main__ - Step 5272: {'lr': 0.000499397616689448, 'samples': 1012224, 'steps': 5271, 'loss/train': 1.3626079559326172} -08/30/2021 14:08:31 - INFO - __main__ - Step 5273: {'lr': 0.0004993972484637202, 'samples': 1012416, 'steps': 5272, 'loss/train': 1.7811495065689087} -08/30/2021 14:08:32 - INFO - __main__ - Step 5274: {'lr': 0.0004993968801256178, 'samples': 1012608, 'steps': 5273, 'loss/train': 2.639021635055542} -08/30/2021 14:08:32 - INFO - __main__ - Step 5275: {'lr': 0.0004993965116751411, 'samples': 1012800, 'steps': 5274, 'loss/train': 1.9918279647827148} -08/30/2021 14:08:33 - INFO - __main__ - Step 5276: {'lr': 0.0004993961431122901, 'samples': 1012992, 'steps': 5275, 'loss/train': 2.6671645641326904} -08/30/2021 14:08:33 - INFO - __main__ - Step 5277: {'lr': 0.0004993957744370651, 'samples': 1013184, 'steps': 5276, 'loss/train': 1.9408828020095825} -08/30/2021 14:08:34 - INFO - __main__ - Step 5278: {'lr': 0.0004993954056494662, 'samples': 1013376, 'steps': 5277, 'loss/train': 1.4799178838729858} -08/30/2021 14:08:35 - INFO - __main__ - Step 5279: {'lr': 0.0004993950367494936, 'samples': 1013568, 'steps': 5278, 'loss/train': 2.6586716175079346} -08/30/2021 14:08:35 - INFO - __main__ - Step 5280: {'lr': 0.0004993946677371474, 'samples': 1013760, 'steps': 5279, 'loss/train': 2.5127079486846924} -08/30/2021 14:08:36 - INFO - __main__ - Step 5281: {'lr': 0.0004993942986124278, 'samples': 1013952, 'steps': 5280, 'loss/train': 2.0884318351745605} -08/30/2021 14:08:36 - INFO - __main__ - Step 5282: {'lr': 0.000499393929375335, 'samples': 1014144, 'steps': 5281, 'loss/train': 2.547905445098877} -08/30/2021 14:08:37 - INFO - __main__ - Step 5283: {'lr': 0.0004993935600258691, 'samples': 1014336, 'steps': 5282, 'loss/train': 2.7553727626800537} -08/30/2021 14:08:38 - INFO - __main__ - Step 5284: {'lr': 0.0004993931905640305, 'samples': 1014528, 'steps': 5283, 'loss/train': 1.4387353658676147} -08/30/2021 14:08:38 - INFO - __main__ - Step 5285: {'lr': 0.000499392820989819, 'samples': 1014720, 'steps': 5284, 'loss/train': 2.5183651447296143} -08/30/2021 14:08:39 - INFO - __main__ - Step 5286: {'lr': 0.0004993924513032349, 'samples': 1014912, 'steps': 5285, 'loss/train': 1.3854247331619263} -08/30/2021 14:08:39 - INFO - __main__ - Step 5287: {'lr': 0.0004993920815042785, 'samples': 1015104, 'steps': 5286, 'loss/train': 2.466095447540283} -08/30/2021 14:08:41 - INFO - __main__ - Step 5288: {'lr': 0.0004993917115929498, 'samples': 1015296, 'steps': 5287, 'loss/train': 1.8673524856567383} -08/30/2021 14:08:41 - INFO - __main__ - Step 5289: {'lr': 0.0004993913415692492, 'samples': 1015488, 'steps': 5288, 'loss/train': 2.0241940021514893} -08/30/2021 14:08:42 - INFO - __main__ - Step 5290: {'lr': 0.0004993909714331766, 'samples': 1015680, 'steps': 5289, 'loss/train': 2.5281755924224854} -08/30/2021 14:08:42 - INFO - __main__ - Step 5291: {'lr': 0.0004993906011847323, 'samples': 1015872, 'steps': 5290, 'loss/train': 2.409820318222046} -08/30/2021 14:08:42 - INFO - __main__ - Step 5292: {'lr': 0.0004993902308239164, 'samples': 1016064, 'steps': 5291, 'loss/train': 2.2571828365325928} -08/30/2021 14:08:43 - INFO - __main__ - Step 5293: {'lr': 0.0004993898603507292, 'samples': 1016256, 'steps': 5292, 'loss/train': 2.139096736907959} -08/30/2021 14:08:44 - INFO - __main__ - Step 5294: {'lr': 0.0004993894897651706, 'samples': 1016448, 'steps': 5293, 'loss/train': 0.3849567174911499} -08/30/2021 14:08:45 - INFO - __main__ - Step 5295: {'lr': 0.0004993891190672411, 'samples': 1016640, 'steps': 5294, 'loss/train': 1.9131169319152832} -08/30/2021 14:08:45 - INFO - __main__ - Step 5296: {'lr': 0.0004993887482569407, 'samples': 1016832, 'steps': 5295, 'loss/train': 2.723391532897949} -08/30/2021 14:08:46 - INFO - __main__ - Step 5297: {'lr': 0.0004993883773342695, 'samples': 1017024, 'steps': 5296, 'loss/train': 1.3873577117919922} -08/30/2021 14:08:46 - INFO - __main__ - Step 5298: {'lr': 0.0004993880062992279, 'samples': 1017216, 'steps': 5297, 'loss/train': 2.1457936763763428} -08/30/2021 14:08:48 - INFO - __main__ - Step 5299: {'lr': 0.0004993876351518157, 'samples': 1017408, 'steps': 5298, 'loss/train': 1.902564287185669} -08/30/2021 14:08:48 - INFO - __main__ - Step 5300: {'lr': 0.0004993872638920335, 'samples': 1017600, 'steps': 5299, 'loss/train': 2.003303050994873} -08/30/2021 14:08:49 - INFO - __main__ - Step 5301: {'lr': 0.0004993868925198811, 'samples': 1017792, 'steps': 5300, 'loss/train': 2.5706300735473633} -08/30/2021 14:08:49 - INFO - __main__ - Step 5302: {'lr': 0.0004993865210353588, 'samples': 1017984, 'steps': 5301, 'loss/train': 0.9811980128288269} -08/30/2021 14:08:49 - INFO - __main__ - Step 5303: {'lr': 0.0004993861494384669, 'samples': 1018176, 'steps': 5302, 'loss/train': 2.2012617588043213} -08/30/2021 14:08:50 - INFO - __main__ - Step 5304: {'lr': 0.0004993857777292053, 'samples': 1018368, 'steps': 5303, 'loss/train': 0.6270977854728699} -08/30/2021 14:08:51 - INFO - __main__ - Step 5305: {'lr': 0.0004993854059075745, 'samples': 1018560, 'steps': 5304, 'loss/train': 0.540199339389801} -08/30/2021 14:08:52 - INFO - __main__ - Step 5306: {'lr': 0.0004993850339735744, 'samples': 1018752, 'steps': 5305, 'loss/train': 2.128061294555664} -08/30/2021 14:08:52 - INFO - __main__ - Step 5307: {'lr': 0.0004993846619272052, 'samples': 1018944, 'steps': 5306, 'loss/train': 2.2702066898345947} -08/30/2021 14:08:52 - INFO - __main__ - Step 5308: {'lr': 0.0004993842897684672, 'samples': 1019136, 'steps': 5307, 'loss/train': 1.5475096702575684} -08/30/2021 14:08:53 - INFO - __main__ - Step 5309: {'lr': 0.0004993839174973604, 'samples': 1019328, 'steps': 5308, 'loss/train': 1.6055527925491333} -08/30/2021 14:08:54 - INFO - __main__ - Step 5310: {'lr': 0.0004993835451138851, 'samples': 1019520, 'steps': 5309, 'loss/train': 2.285568952560425} -08/30/2021 14:08:55 - INFO - __main__ - Step 5311: {'lr': 0.0004993831726180414, 'samples': 1019712, 'steps': 5310, 'loss/train': 2.526824474334717} -08/30/2021 14:08:55 - INFO - __main__ - Step 5312: {'lr': 0.0004993828000098296, 'samples': 1019904, 'steps': 5311, 'loss/train': 2.181748390197754} -08/30/2021 14:08:55 - INFO - __main__ - Step 5313: {'lr': 0.0004993824272892497, 'samples': 1020096, 'steps': 5312, 'loss/train': 2.0193381309509277} -08/30/2021 14:08:56 - INFO - __main__ - Step 5314: {'lr': 0.0004993820544563018, 'samples': 1020288, 'steps': 5313, 'loss/train': 2.558633804321289} -08/30/2021 14:08:56 - INFO - __main__ - Step 5315: {'lr': 0.0004993816815109863, 'samples': 1020480, 'steps': 5314, 'loss/train': 1.2283902168273926} -08/30/2021 14:08:58 - INFO - __main__ - Step 5316: {'lr': 0.0004993813084533033, 'samples': 1020672, 'steps': 5315, 'loss/train': 1.9092395305633545} -08/30/2021 14:08:58 - INFO - __main__ - Step 5317: {'lr': 0.0004993809352832529, 'samples': 1020864, 'steps': 5316, 'loss/train': 2.1001288890838623} -08/30/2021 14:08:58 - INFO - __main__ - Step 5318: {'lr': 0.0004993805620008353, 'samples': 1021056, 'steps': 5317, 'loss/train': 1.6625019311904907} -08/30/2021 14:08:59 - INFO - __main__ - Step 5319: {'lr': 0.0004993801886060506, 'samples': 1021248, 'steps': 5318, 'loss/train': 2.027336597442627} -08/30/2021 14:08:59 - INFO - __main__ - Step 5320: {'lr': 0.0004993798150988991, 'samples': 1021440, 'steps': 5319, 'loss/train': 2.322761058807373} -08/30/2021 14:09:01 - INFO - __main__ - Step 5321: {'lr': 0.0004993794414793808, 'samples': 1021632, 'steps': 5320, 'loss/train': 2.293020725250244} -08/30/2021 14:09:01 - INFO - __main__ - Step 5322: {'lr': 0.0004993790677474962, 'samples': 1021824, 'steps': 5321, 'loss/train': 2.055722951889038} -08/30/2021 14:09:02 - INFO - __main__ - Step 5323: {'lr': 0.0004993786939032451, 'samples': 1022016, 'steps': 5322, 'loss/train': 2.547273635864258} -08/30/2021 14:09:02 - INFO - __main__ - Step 5324: {'lr': 0.0004993783199466278, 'samples': 1022208, 'steps': 5323, 'loss/train': 2.078728675842285} -08/30/2021 14:09:02 - INFO - __main__ - Step 5325: {'lr': 0.0004993779458776444, 'samples': 1022400, 'steps': 5324, 'loss/train': 2.3225064277648926} -08/30/2021 14:09:04 - INFO - __main__ - Step 5326: {'lr': 0.0004993775716962953, 'samples': 1022592, 'steps': 5325, 'loss/train': 2.068955183029175} -08/30/2021 14:09:05 - INFO - __main__ - Step 5327: {'lr': 0.0004993771974025805, 'samples': 1022784, 'steps': 5326, 'loss/train': 2.1536505222320557} -08/30/2021 14:09:05 - INFO - __main__ - Step 5328: {'lr': 0.0004993768229965001, 'samples': 1022976, 'steps': 5327, 'loss/train': 1.8733011484146118} -08/30/2021 14:09:06 - INFO - __main__ - Step 5329: {'lr': 0.0004993764484780543, 'samples': 1023168, 'steps': 5328, 'loss/train': 2.5774080753326416} -08/30/2021 14:09:06 - INFO - __main__ - Step 5330: {'lr': 0.0004993760738472435, 'samples': 1023360, 'steps': 5329, 'loss/train': 1.8517621755599976} -08/30/2021 14:09:07 - INFO - __main__ - Step 5331: {'lr': 0.0004993756991040675, 'samples': 1023552, 'steps': 5330, 'loss/train': 1.9004884958267212} -08/30/2021 14:09:08 - INFO - __main__ - Step 5332: {'lr': 0.0004993753242485268, 'samples': 1023744, 'steps': 5331, 'loss/train': 1.9509395360946655} -08/30/2021 14:09:08 - INFO - __main__ - Step 5333: {'lr': 0.0004993749492806214, 'samples': 1023936, 'steps': 5332, 'loss/train': 2.135444402694702} -08/30/2021 14:09:08 - INFO - __main__ - Step 5334: {'lr': 0.0004993745742003515, 'samples': 1024128, 'steps': 5333, 'loss/train': 1.30648934841156} -08/30/2021 14:09:09 - INFO - __main__ - Step 5335: {'lr': 0.0004993741990077172, 'samples': 1024320, 'steps': 5334, 'loss/train': 1.6830708980560303} -08/30/2021 14:09:10 - INFO - __main__ - Step 5336: {'lr': 0.0004993738237027188, 'samples': 1024512, 'steps': 5335, 'loss/train': 2.0417819023132324} -08/30/2021 14:09:11 - INFO - __main__ - Step 5337: {'lr': 0.0004993734482853563, 'samples': 1024704, 'steps': 5336, 'loss/train': 1.9000158309936523} -08/30/2021 14:09:11 - INFO - __main__ - Step 5338: {'lr': 0.0004993730727556301, 'samples': 1024896, 'steps': 5337, 'loss/train': 2.2786426544189453} -08/30/2021 14:09:11 - INFO - __main__ - Step 5339: {'lr': 0.0004993726971135402, 'samples': 1025088, 'steps': 5338, 'loss/train': 2.10693097114563} -08/30/2021 14:09:12 - INFO - __main__ - Step 5340: {'lr': 0.0004993723213590868, 'samples': 1025280, 'steps': 5339, 'loss/train': 2.400607109069824} -08/30/2021 14:09:13 - INFO - __main__ - Step 5341: {'lr': 0.0004993719454922701, 'samples': 1025472, 'steps': 5340, 'loss/train': 2.1272616386413574} -08/30/2021 14:09:14 - INFO - __main__ - Step 5342: {'lr': 0.0004993715695130902, 'samples': 1025664, 'steps': 5341, 'loss/train': 2.2308144569396973} -08/30/2021 14:09:14 - INFO - __main__ - Step 5343: {'lr': 0.0004993711934215473, 'samples': 1025856, 'steps': 5342, 'loss/train': 2.4320480823516846} -08/30/2021 14:09:15 - INFO - __main__ - Step 5344: {'lr': 0.0004993708172176417, 'samples': 1026048, 'steps': 5343, 'loss/train': 2.435067892074585} -08/30/2021 14:09:15 - INFO - __main__ - Step 5345: {'lr': 0.0004993704409013734, 'samples': 1026240, 'steps': 5344, 'loss/train': 1.9322372674942017} -08/30/2021 14:09:15 - INFO - __main__ - Step 5346: {'lr': 0.0004993700644727425, 'samples': 1026432, 'steps': 5345, 'loss/train': 2.1200332641601562} -08/30/2021 14:09:17 - INFO - __main__ - Step 5347: {'lr': 0.0004993696879317495, 'samples': 1026624, 'steps': 5346, 'loss/train': 2.031440496444702} -08/30/2021 14:09:18 - INFO - __main__ - Step 5348: {'lr': 0.0004993693112783943, 'samples': 1026816, 'steps': 5347, 'loss/train': 1.5683552026748657} -08/30/2021 14:09:18 - INFO - __main__ - Step 5349: {'lr': 0.0004993689345126771, 'samples': 1027008, 'steps': 5348, 'loss/train': 0.2959568202495575} -08/30/2021 14:09:18 - INFO - __main__ - Step 5350: {'lr': 0.0004993685576345981, 'samples': 1027200, 'steps': 5349, 'loss/train': 2.23846173286438} -08/30/2021 14:09:19 - INFO - __main__ - Step 5351: {'lr': 0.0004993681806441575, 'samples': 1027392, 'steps': 5350, 'loss/train': 2.4751954078674316} -08/30/2021 14:09:20 - INFO - __main__ - Step 5352: {'lr': 0.0004993678035413554, 'samples': 1027584, 'steps': 5351, 'loss/train': 2.223661184310913} -08/30/2021 14:09:21 - INFO - __main__ - Step 5353: {'lr': 0.0004993674263261921, 'samples': 1027776, 'steps': 5352, 'loss/train': 1.4263993501663208} -08/30/2021 14:09:21 - INFO - __main__ - Step 5354: {'lr': 0.0004993670489986677, 'samples': 1027968, 'steps': 5353, 'loss/train': 2.0988636016845703} -08/30/2021 14:09:21 - INFO - __main__ - Step 5355: {'lr': 0.0004993666715587823, 'samples': 1028160, 'steps': 5354, 'loss/train': 2.2328529357910156} -08/30/2021 14:09:22 - INFO - __main__ - Step 5356: {'lr': 0.0004993662940065361, 'samples': 1028352, 'steps': 5355, 'loss/train': 1.6497890949249268} -08/30/2021 14:09:23 - INFO - __main__ - Step 5357: {'lr': 0.0004993659163419294, 'samples': 1028544, 'steps': 5356, 'loss/train': 1.1058005094528198} -08/30/2021 14:09:24 - INFO - __main__ - Step 5358: {'lr': 0.0004993655385649621, 'samples': 1028736, 'steps': 5357, 'loss/train': 2.23276686668396} -08/30/2021 14:09:24 - INFO - __main__ - Step 5359: {'lr': 0.0004993651606756347, 'samples': 1028928, 'steps': 5358, 'loss/train': 2.2387802600860596} -08/30/2021 14:09:25 - INFO - __main__ - Step 5360: {'lr': 0.0004993647826739471, 'samples': 1029120, 'steps': 5359, 'loss/train': 1.8057059049606323} -08/30/2021 14:09:25 - INFO - __main__ - Step 5361: {'lr': 0.0004993644045598997, 'samples': 1029312, 'steps': 5360, 'loss/train': 0.4468001425266266} -08/30/2021 14:09:25 - INFO - __main__ - Step 5362: {'lr': 0.0004993640263334924, 'samples': 1029504, 'steps': 5361, 'loss/train': 1.9620311260223389} -08/30/2021 14:09:27 - INFO - __main__ - Step 5363: {'lr': 0.0004993636479947256, 'samples': 1029696, 'steps': 5362, 'loss/train': 2.3470122814178467} -08/30/2021 14:09:28 - INFO - __main__ - Step 5364: {'lr': 0.0004993632695435993, 'samples': 1029888, 'steps': 5363, 'loss/train': 2.2149205207824707} -08/30/2021 14:09:28 - INFO - __main__ - Step 5365: {'lr': 0.0004993628909801138, 'samples': 1030080, 'steps': 5364, 'loss/train': 1.8443580865859985} -08/30/2021 14:09:28 - INFO - __main__ - Step 5366: {'lr': 0.0004993625123042694, 'samples': 1030272, 'steps': 5365, 'loss/train': 0.44625377655029297} -08/30/2021 14:09:29 - INFO - __main__ - Step 5367: {'lr': 0.0004993621335160659, 'samples': 1030464, 'steps': 5366, 'loss/train': 2.3478190898895264} -08/30/2021 14:09:30 - INFO - __main__ - Step 5368: {'lr': 0.0004993617546155037, 'samples': 1030656, 'steps': 5367, 'loss/train': 3.7186803817749023} -08/30/2021 14:09:31 - INFO - __main__ - Step 5369: {'lr': 0.000499361375602583, 'samples': 1030848, 'steps': 5368, 'loss/train': 2.6713244915008545} -08/30/2021 14:09:31 - INFO - __main__ - Step 5370: {'lr': 0.0004993609964773039, 'samples': 1031040, 'steps': 5369, 'loss/train': 1.7321006059646606} -08/30/2021 14:09:31 - INFO - __main__ - Step 5371: {'lr': 0.0004993606172396665, 'samples': 1031232, 'steps': 5370, 'loss/train': 1.4341566562652588} -08/30/2021 14:09:32 - INFO - __main__ - Step 5372: {'lr': 0.0004993602378896712, 'samples': 1031424, 'steps': 5371, 'loss/train': 2.197713613510132} -08/30/2021 14:09:33 - INFO - __main__ - Step 5373: {'lr': 0.0004993598584273179, 'samples': 1031616, 'steps': 5372, 'loss/train': 1.3328524827957153} -08/30/2021 14:09:34 - INFO - __main__ - Step 5374: {'lr': 0.0004993594788526069, 'samples': 1031808, 'steps': 5373, 'loss/train': 2.3513150215148926} -08/30/2021 14:09:34 - INFO - __main__ - Step 5375: {'lr': 0.0004993590991655384, 'samples': 1032000, 'steps': 5374, 'loss/train': 2.0456442832946777} -08/30/2021 14:09:34 - INFO - __main__ - Step 5376: {'lr': 0.0004993587193661126, 'samples': 1032192, 'steps': 5375, 'loss/train': 2.4715588092803955} -08/30/2021 14:09:35 - INFO - __main__ - Step 5377: {'lr': 0.0004993583394543295, 'samples': 1032384, 'steps': 5376, 'loss/train': 2.196958065032959} -08/30/2021 14:09:37 - INFO - __main__ - Step 5378: {'lr': 0.0004993579594301895, 'samples': 1032576, 'steps': 5377, 'loss/train': 2.075531482696533} -08/30/2021 14:09:37 - INFO - __main__ - Step 5379: {'lr': 0.0004993575792936925, 'samples': 1032768, 'steps': 5378, 'loss/train': 2.4638051986694336} -08/30/2021 14:09:37 - INFO - __main__ - Step 5380: {'lr': 0.000499357199044839, 'samples': 1032960, 'steps': 5379, 'loss/train': 1.3880785703659058} -08/30/2021 14:09:38 - INFO - __main__ - Step 5381: {'lr': 0.0004993568186836288, 'samples': 1033152, 'steps': 5380, 'loss/train': 2.3600668907165527} -08/30/2021 14:09:38 - INFO - __main__ - Step 5382: {'lr': 0.0004993564382100624, 'samples': 1033344, 'steps': 5381, 'loss/train': 2.009852409362793} -08/30/2021 14:09:38 - INFO - __main__ - Step 5383: {'lr': 0.0004993560576241398, 'samples': 1033536, 'steps': 5382, 'loss/train': 1.336531400680542} -08/30/2021 14:09:40 - INFO - __main__ - Step 5384: {'lr': 0.0004993556769258612, 'samples': 1033728, 'steps': 5383, 'loss/train': 2.0151145458221436} -08/30/2021 14:09:40 - INFO - __main__ - Step 5385: {'lr': 0.0004993552961152268, 'samples': 1033920, 'steps': 5384, 'loss/train': 2.3672847747802734} -08/30/2021 14:09:41 - INFO - __main__ - Step 5386: {'lr': 0.0004993549151922367, 'samples': 1034112, 'steps': 5385, 'loss/train': 1.5583224296569824} -08/30/2021 14:09:41 - INFO - __main__ - Step 5387: {'lr': 0.0004993545341568912, 'samples': 1034304, 'steps': 5386, 'loss/train': 3.142512321472168} -08/30/2021 14:09:42 - INFO - __main__ - Step 5388: {'lr': 0.0004993541530091903, 'samples': 1034496, 'steps': 5387, 'loss/train': 2.7708797454833984} -08/30/2021 14:09:43 - INFO - __main__ - Step 5389: {'lr': 0.0004993537717491343, 'samples': 1034688, 'steps': 5388, 'loss/train': 2.521812677383423} -08/30/2021 14:09:44 - INFO - __main__ - Step 5390: {'lr': 0.0004993533903767235, 'samples': 1034880, 'steps': 5389, 'loss/train': 1.5467299222946167} -08/30/2021 14:09:44 - INFO - __main__ - Step 5391: {'lr': 0.0004993530088919577, 'samples': 1035072, 'steps': 5390, 'loss/train': 2.070864677429199} -08/30/2021 14:09:44 - INFO - __main__ - Step 5392: {'lr': 0.0004993526272948374, 'samples': 1035264, 'steps': 5391, 'loss/train': 2.1507418155670166} -08/30/2021 14:09:45 - INFO - __main__ - Step 5393: {'lr': 0.0004993522455853626, 'samples': 1035456, 'steps': 5392, 'loss/train': 0.9771274924278259} -08/30/2021 14:09:46 - INFO - __main__ - Step 5394: {'lr': 0.0004993518637635334, 'samples': 1035648, 'steps': 5393, 'loss/train': 2.1481733322143555} -08/30/2021 14:09:46 - INFO - __main__ - Step 5395: {'lr': 0.0004993514818293503, 'samples': 1035840, 'steps': 5394, 'loss/train': 1.9538158178329468} -08/30/2021 14:09:47 - INFO - __main__ - Step 5396: {'lr': 0.0004993510997828132, 'samples': 1036032, 'steps': 5395, 'loss/train': 1.8449543714523315} -08/30/2021 14:09:47 - INFO - __main__ - Step 5397: {'lr': 0.0004993507176239224, 'samples': 1036224, 'steps': 5396, 'loss/train': 2.1521570682525635} -08/30/2021 14:09:48 - INFO - __main__ - Step 5398: {'lr': 0.0004993503353526779, 'samples': 1036416, 'steps': 5397, 'loss/train': 2.1995091438293457} -08/30/2021 14:09:49 - INFO - __main__ - Step 5399: {'lr': 0.0004993499529690801, 'samples': 1036608, 'steps': 5398, 'loss/train': 2.096731185913086} -08/30/2021 14:09:49 - INFO - __main__ - Step 5400: {'lr': 0.000499349570473129, 'samples': 1036800, 'steps': 5399, 'loss/train': 2.673593282699585} -08/30/2021 14:09:50 - INFO - __main__ - Step 5401: {'lr': 0.0004993491878648249, 'samples': 1036992, 'steps': 5400, 'loss/train': 1.6000927686691284} -08/30/2021 14:09:50 - INFO - __main__ - Step 5402: {'lr': 0.0004993488051441677, 'samples': 1037184, 'steps': 5401, 'loss/train': 1.3312642574310303} -08/30/2021 14:09:50 - INFO - __main__ - Step 5403: {'lr': 0.000499348422311158, 'samples': 1037376, 'steps': 5402, 'loss/train': 1.9997714757919312} -08/30/2021 14:09:52 - INFO - __main__ - Step 5404: {'lr': 0.0004993480393657956, 'samples': 1037568, 'steps': 5403, 'loss/train': 2.048255443572998} -08/30/2021 14:09:52 - INFO - __main__ - Step 5405: {'lr': 0.0004993476563080809, 'samples': 1037760, 'steps': 5404, 'loss/train': 1.9504129886627197} -08/30/2021 14:09:53 - INFO - __main__ - Step 5406: {'lr': 0.000499347273138014, 'samples': 1037952, 'steps': 5405, 'loss/train': 2.440894365310669} -08/30/2021 14:09:53 - INFO - __main__ - Step 5407: {'lr': 0.000499346889855595, 'samples': 1038144, 'steps': 5406, 'loss/train': 1.7340859174728394} -08/30/2021 14:09:53 - INFO - __main__ - Step 5408: {'lr': 0.0004993465064608242, 'samples': 1038336, 'steps': 5407, 'loss/train': 2.320876359939575} -08/30/2021 14:09:55 - INFO - __main__ - Step 5409: {'lr': 0.0004993461229537017, 'samples': 1038528, 'steps': 5408, 'loss/train': 2.4220235347747803} -08/30/2021 14:09:55 - INFO - __main__ - Step 5410: {'lr': 0.0004993457393342276, 'samples': 1038720, 'steps': 5409, 'loss/train': 2.2513859272003174} -08/30/2021 14:09:56 - INFO - __main__ - Step 5411: {'lr': 0.0004993453556024023, 'samples': 1038912, 'steps': 5410, 'loss/train': 2.6174113750457764} -08/30/2021 14:09:56 - INFO - __main__ - Step 5412: {'lr': 0.0004993449717582258, 'samples': 1039104, 'steps': 5411, 'loss/train': 2.1662635803222656} -08/30/2021 14:09:56 - INFO - __main__ - Step 5413: {'lr': 0.0004993445878016982, 'samples': 1039296, 'steps': 5412, 'loss/train': 2.164144277572632} -08/30/2021 14:09:58 - INFO - __main__ - Step 5414: {'lr': 0.0004993442037328199, 'samples': 1039488, 'steps': 5413, 'loss/train': 1.9893866777420044} -08/30/2021 14:09:59 - INFO - __main__ - Step 5415: {'lr': 0.0004993438195515909, 'samples': 1039680, 'steps': 5414, 'loss/train': 2.002112865447998} -08/30/2021 14:09:59 - INFO - __main__ - Step 5416: {'lr': 0.0004993434352580115, 'samples': 1039872, 'steps': 5415, 'loss/train': 2.2562832832336426} -08/30/2021 14:09:59 - INFO - __main__ - Step 5417: {'lr': 0.0004993430508520816, 'samples': 1040064, 'steps': 5416, 'loss/train': 2.781446695327759} -08/30/2021 14:10:00 - INFO - __main__ - Step 5418: {'lr': 0.0004993426663338018, 'samples': 1040256, 'steps': 5417, 'loss/train': 3.561868906021118} -08/30/2021 14:10:00 - INFO - __main__ - Step 5419: {'lr': 0.0004993422817031719, 'samples': 1040448, 'steps': 5418, 'loss/train': 2.6206448078155518} -08/30/2021 14:10:02 - INFO - __main__ - Step 5420: {'lr': 0.0004993418969601921, 'samples': 1040640, 'steps': 5419, 'loss/train': 0.2771877646446228} -08/30/2021 14:10:02 - INFO - __main__ - Step 5421: {'lr': 0.0004993415121048629, 'samples': 1040832, 'steps': 5420, 'loss/train': 1.951654076576233} -08/30/2021 14:10:02 - INFO - __main__ - Step 5422: {'lr': 0.0004993411271371842, 'samples': 1041024, 'steps': 5421, 'loss/train': 2.035478353500366} -08/30/2021 14:10:03 - INFO - __main__ - Step 5423: {'lr': 0.0004993407420571563, 'samples': 1041216, 'steps': 5422, 'loss/train': 2.09321665763855} -08/30/2021 14:10:03 - INFO - __main__ - Step 5424: {'lr': 0.0004993403568647792, 'samples': 1041408, 'steps': 5423, 'loss/train': 1.7867854833602905} -08/30/2021 14:10:05 - INFO - __main__ - Step 5425: {'lr': 0.0004993399715600531, 'samples': 1041600, 'steps': 5424, 'loss/train': 2.204225778579712} -08/30/2021 14:10:05 - INFO - __main__ - Step 5426: {'lr': 0.0004993395861429785, 'samples': 1041792, 'steps': 5425, 'loss/train': 2.1877803802490234} -08/30/2021 14:10:06 - INFO - __main__ - Step 5427: {'lr': 0.0004993392006135552, 'samples': 1041984, 'steps': 5426, 'loss/train': 1.9577467441558838} -08/30/2021 14:10:06 - INFO - __main__ - Step 5428: {'lr': 0.0004993388149717834, 'samples': 1042176, 'steps': 5427, 'loss/train': 2.704737901687622} -08/30/2021 14:10:06 - INFO - __main__ - Step 5429: {'lr': 0.0004993384292176636, 'samples': 1042368, 'steps': 5428, 'loss/train': 2.8021090030670166} -08/30/2021 14:10:09 - INFO - __main__ - Step 5430: {'lr': 0.0004993380433511956, 'samples': 1042560, 'steps': 5429, 'loss/train': 1.9252568483352661} -08/30/2021 14:10:09 - INFO - __main__ - Step 5431: {'lr': 0.0004993376573723798, 'samples': 1042752, 'steps': 5430, 'loss/train': 2.233086109161377} -08/30/2021 14:10:09 - INFO - __main__ - Step 5432: {'lr': 0.0004993372712812162, 'samples': 1042944, 'steps': 5431, 'loss/train': 0.5660424828529358} -08/30/2021 14:10:10 - INFO - __main__ - Step 5433: {'lr': 0.0004993368850777052, 'samples': 1043136, 'steps': 5432, 'loss/train': 2.0277514457702637} -08/30/2021 14:10:10 - INFO - __main__ - Step 5434: {'lr': 0.0004993364987618468, 'samples': 1043328, 'steps': 5433, 'loss/train': 2.2109923362731934} -08/30/2021 14:10:10 - INFO - __main__ - Step 5435: {'lr': 0.0004993361123336412, 'samples': 1043520, 'steps': 5434, 'loss/train': 2.028074264526367} -08/30/2021 14:10:12 - INFO - __main__ - Step 5436: {'lr': 0.0004993357257930887, 'samples': 1043712, 'steps': 5435, 'loss/train': 1.8543492555618286} -08/30/2021 14:10:12 - INFO - __main__ - Step 5437: {'lr': 0.0004993353391401892, 'samples': 1043904, 'steps': 5436, 'loss/train': 1.626535177230835} -08/30/2021 14:10:13 - INFO - __main__ - Step 5438: {'lr': 0.0004993349523749431, 'samples': 1044096, 'steps': 5437, 'loss/train': 2.555976152420044} -08/30/2021 14:10:13 - INFO - __main__ - Step 5439: {'lr': 0.0004993345654973505, 'samples': 1044288, 'steps': 5438, 'loss/train': 1.9841675758361816} -08/30/2021 14:10:14 - INFO - __main__ - Step 5440: {'lr': 0.0004993341785074116, 'samples': 1044480, 'steps': 5439, 'loss/train': 0.9596847891807556} -08/30/2021 14:10:15 - INFO - __main__ - Step 5441: {'lr': 0.0004993337914051266, 'samples': 1044672, 'steps': 5440, 'loss/train': 1.9429361820220947} -08/30/2021 14:10:16 - INFO - __main__ - Step 5442: {'lr': 0.0004993334041904957, 'samples': 1044864, 'steps': 5441, 'loss/train': 1.9028719663619995} -08/30/2021 14:10:16 - INFO - __main__ - Step 5443: {'lr': 0.0004993330168635189, 'samples': 1045056, 'steps': 5442, 'loss/train': 1.8421297073364258} -08/30/2021 14:10:16 - INFO - __main__ - Step 5444: {'lr': 0.0004993326294241966, 'samples': 1045248, 'steps': 5443, 'loss/train': 2.274104118347168} -08/30/2021 14:10:17 - INFO - __main__ - Step 5445: {'lr': 0.0004993322418725286, 'samples': 1045440, 'steps': 5444, 'loss/train': 2.2421417236328125} -08/30/2021 14:10:18 - INFO - __main__ - Step 5446: {'lr': 0.0004993318542085157, 'samples': 1045632, 'steps': 5445, 'loss/train': 1.3372082710266113} -08/30/2021 14:10:19 - INFO - __main__ - Step 5447: {'lr': 0.0004993314664321575, 'samples': 1045824, 'steps': 5446, 'loss/train': 1.7467808723449707} -08/30/2021 14:10:19 - INFO - __main__ - Step 5448: {'lr': 0.0004993310785434544, 'samples': 1046016, 'steps': 5447, 'loss/train': 1.7305140495300293} -08/30/2021 14:10:19 - INFO - __main__ - Step 5449: {'lr': 0.0004993306905424067, 'samples': 1046208, 'steps': 5448, 'loss/train': 2.282919406890869} -08/30/2021 14:10:20 - INFO - __main__ - Step 5450: {'lr': 0.0004993303024290143, 'samples': 1046400, 'steps': 5449, 'loss/train': 2.3551671504974365} -08/30/2021 14:10:21 - INFO - __main__ - Step 5451: {'lr': 0.0004993299142032776, 'samples': 1046592, 'steps': 5450, 'loss/train': 2.360137939453125} -08/30/2021 14:10:22 - INFO - __main__ - Step 5452: {'lr': 0.0004993295258651966, 'samples': 1046784, 'steps': 5451, 'loss/train': 1.8643544912338257} -08/30/2021 14:10:22 - INFO - __main__ - Step 5453: {'lr': 0.0004993291374147716, 'samples': 1046976, 'steps': 5452, 'loss/train': 2.229452133178711} -08/30/2021 14:10:22 - INFO - __main__ - Step 5454: {'lr': 0.0004993287488520027, 'samples': 1047168, 'steps': 5453, 'loss/train': 2.066531181335449} -08/30/2021 14:10:23 - INFO - __main__ - Step 5455: {'lr': 0.0004993283601768902, 'samples': 1047360, 'steps': 5454, 'loss/train': 1.7025607824325562} -08/30/2021 14:10:24 - INFO - __main__ - Step 5456: {'lr': 0.0004993279713894342, 'samples': 1047552, 'steps': 5455, 'loss/train': 2.2028450965881348} -08/30/2021 14:10:25 - INFO - __main__ - Step 5457: {'lr': 0.0004993275824896348, 'samples': 1047744, 'steps': 5456, 'loss/train': 2.0696890354156494} -08/30/2021 14:10:25 - INFO - __main__ - Step 5458: {'lr': 0.0004993271934774922, 'samples': 1047936, 'steps': 5457, 'loss/train': 1.9927334785461426} -08/30/2021 14:10:25 - INFO - __main__ - Step 5459: {'lr': 0.0004993268043530067, 'samples': 1048128, 'steps': 5458, 'loss/train': 0.9724563956260681} -08/30/2021 14:10:26 - INFO - __main__ - Step 5460: {'lr': 0.0004993264151161783, 'samples': 1048320, 'steps': 5459, 'loss/train': 2.131405830383301} -08/30/2021 14:10:27 - INFO - __main__ - Step 5461: {'lr': 0.0004993260257670074, 'samples': 1048512, 'steps': 5460, 'loss/train': 2.383780002593994} -08/30/2021 14:10:28 - INFO - __main__ - Step 5462: {'lr': 0.000499325636305494, 'samples': 1048704, 'steps': 5461, 'loss/train': 1.9696367979049683} -08/30/2021 14:10:28 - INFO - __main__ - Step 5463: {'lr': 0.0004993252467316382, 'samples': 1048896, 'steps': 5462, 'loss/train': 0.2647189497947693} -08/30/2021 14:10:29 - INFO - __main__ - Step 5464: {'lr': 0.0004993248570454404, 'samples': 1049088, 'steps': 5463, 'loss/train': 1.9423753023147583} -08/30/2021 14:10:29 - INFO - __main__ - Step 5465: {'lr': 0.0004993244672469007, 'samples': 1049280, 'steps': 5464, 'loss/train': 2.2232024669647217} -08/30/2021 14:10:29 - INFO - __main__ - Step 5466: {'lr': 0.000499324077336019, 'samples': 1049472, 'steps': 5465, 'loss/train': 1.8365471363067627} -08/30/2021 14:10:31 - INFO - __main__ - Step 5467: {'lr': 0.000499323687312796, 'samples': 1049664, 'steps': 5466, 'loss/train': 2.3148319721221924} -08/30/2021 14:10:31 - INFO - __main__ - Step 5468: {'lr': 0.0004993232971772315, 'samples': 1049856, 'steps': 5467, 'loss/train': 1.4730870723724365} -08/30/2021 14:10:32 - INFO - __main__ - Step 5469: {'lr': 0.0004993229069293257, 'samples': 1050048, 'steps': 5468, 'loss/train': 2.107245445251465} -08/30/2021 14:10:32 - INFO - __main__ - Step 5470: {'lr': 0.0004993225165690789, 'samples': 1050240, 'steps': 5469, 'loss/train': 2.0114569664001465} -08/30/2021 14:10:32 - INFO - __main__ - Step 5471: {'lr': 0.0004993221260964912, 'samples': 1050432, 'steps': 5470, 'loss/train': 2.575805425643921} -08/30/2021 14:10:34 - INFO - __main__ - Step 5472: {'lr': 0.0004993217355115628, 'samples': 1050624, 'steps': 5471, 'loss/train': 1.0163025856018066} -08/30/2021 14:10:34 - INFO - __main__ - Step 5473: {'lr': 0.0004993213448142939, 'samples': 1050816, 'steps': 5472, 'loss/train': 2.3085601329803467} -08/30/2021 14:10:35 - INFO - __main__ - Step 5474: {'lr': 0.0004993209540046846, 'samples': 1051008, 'steps': 5473, 'loss/train': 2.156073570251465} -08/30/2021 14:10:35 - INFO - __main__ - Step 5475: {'lr': 0.0004993205630827352, 'samples': 1051200, 'steps': 5474, 'loss/train': 2.266218662261963} -08/30/2021 14:10:35 - INFO - __main__ - Step 5476: {'lr': 0.0004993201720484458, 'samples': 1051392, 'steps': 5475, 'loss/train': 1.6573611497879028} -08/30/2021 14:10:37 - INFO - __main__ - Step 5477: {'lr': 0.0004993197809018165, 'samples': 1051584, 'steps': 5476, 'loss/train': 2.014347791671753} -08/30/2021 14:10:37 - INFO - __main__ - Step 5478: {'lr': 0.0004993193896428476, 'samples': 1051776, 'steps': 5477, 'loss/train': 1.5912764072418213} -08/30/2021 14:10:38 - INFO - __main__ - Step 5479: {'lr': 0.0004993189982715392, 'samples': 1051968, 'steps': 5478, 'loss/train': 1.98436439037323} -08/30/2021 14:10:38 - INFO - __main__ - Step 5480: {'lr': 0.0004993186067878916, 'samples': 1052160, 'steps': 5479, 'loss/train': 1.3397401571273804} -08/30/2021 14:10:38 - INFO - __main__ - Step 5481: {'lr': 0.0004993182151919049, 'samples': 1052352, 'steps': 5480, 'loss/train': 2.5370564460754395} -08/30/2021 14:10:40 - INFO - __main__ - Step 5482: {'lr': 0.0004993178234835792, 'samples': 1052544, 'steps': 5481, 'loss/train': 2.3404853343963623} -08/30/2021 14:10:40 - INFO - __main__ - Step 5483: {'lr': 0.0004993174316629146, 'samples': 1052736, 'steps': 5482, 'loss/train': 1.8672559261322021} -08/30/2021 14:10:41 - INFO - __main__ - Step 5484: {'lr': 0.0004993170397299116, 'samples': 1052928, 'steps': 5483, 'loss/train': 2.132535219192505} -08/30/2021 14:10:41 - INFO - __main__ - Step 5485: {'lr': 0.0004993166476845701, 'samples': 1053120, 'steps': 5484, 'loss/train': 1.8370695114135742} -08/30/2021 14:10:41 - INFO - __main__ - Step 5486: {'lr': 0.0004993162555268903, 'samples': 1053312, 'steps': 5485, 'loss/train': 2.283796787261963} -08/30/2021 14:10:44 - INFO - __main__ - Step 5487: {'lr': 0.0004993158632568726, 'samples': 1053504, 'steps': 5486, 'loss/train': 2.285121202468872} -08/30/2021 14:10:44 - INFO - __main__ - Step 5488: {'lr': 0.000499315470874517, 'samples': 1053696, 'steps': 5487, 'loss/train': 2.177340030670166} -08/30/2021 14:10:44 - INFO - __main__ - Step 5489: {'lr': 0.0004993150783798236, 'samples': 1053888, 'steps': 5488, 'loss/train': 1.9022594690322876} -08/30/2021 14:10:45 - INFO - __main__ - Step 5490: {'lr': 0.0004993146857727927, 'samples': 1054080, 'steps': 5489, 'loss/train': 2.1659700870513916} -08/30/2021 14:10:45 - INFO - __main__ - Step 5491: {'lr': 0.0004993142930534245, 'samples': 1054272, 'steps': 5490, 'loss/train': 2.3744122982025146} -08/30/2021 14:10:45 - INFO - __main__ - Step 5492: {'lr': 0.000499313900221719, 'samples': 1054464, 'steps': 5491, 'loss/train': 1.952682375907898} -08/30/2021 14:10:47 - INFO - __main__ - Step 5493: {'lr': 0.0004993135072776766, 'samples': 1054656, 'steps': 5492, 'loss/train': 2.821582078933716} -08/30/2021 14:10:48 - INFO - __main__ - Step 5494: {'lr': 0.0004993131142212974, 'samples': 1054848, 'steps': 5493, 'loss/train': 2.6464333534240723} -08/30/2021 14:10:48 - INFO - __main__ - Step 5495: {'lr': 0.0004993127210525815, 'samples': 1055040, 'steps': 5494, 'loss/train': 2.1936745643615723} -08/30/2021 14:10:48 - INFO - __main__ - Step 5496: {'lr': 0.0004993123277715292, 'samples': 1055232, 'steps': 5495, 'loss/train': 0.46463823318481445} -08/30/2021 14:10:49 - INFO - __main__ - Step 5497: {'lr': 0.0004993119343781406, 'samples': 1055424, 'steps': 5496, 'loss/train': 1.7416826486587524} -08/30/2021 14:10:50 - INFO - __main__ - Step 5498: {'lr': 0.0004993115408724159, 'samples': 1055616, 'steps': 5497, 'loss/train': 2.226656913757324} -08/30/2021 14:10:51 - INFO - __main__ - Step 5499: {'lr': 0.0004993111472543552, 'samples': 1055808, 'steps': 5498, 'loss/train': 2.048360586166382} -08/30/2021 14:10:51 - INFO - __main__ - Step 5500: {'lr': 0.0004993107535239588, 'samples': 1056000, 'steps': 5499, 'loss/train': 1.7542228698730469} -08/30/2021 14:10:51 - INFO - __main__ - Step 5501: {'lr': 0.0004993103596812267, 'samples': 1056192, 'steps': 5500, 'loss/train': 1.8287094831466675} -08/30/2021 14:10:52 - INFO - __main__ - Step 5502: {'lr': 0.0004993099657261594, 'samples': 1056384, 'steps': 5501, 'loss/train': 2.1925034523010254} -08/30/2021 14:10:53 - INFO - __main__ - Step 5503: {'lr': 0.0004993095716587568, 'samples': 1056576, 'steps': 5502, 'loss/train': 2.2337374687194824} -08/30/2021 14:10:54 - INFO - __main__ - Step 5504: {'lr': 0.0004993091774790191, 'samples': 1056768, 'steps': 5503, 'loss/train': 2.3906707763671875} -08/30/2021 14:10:54 - INFO - __main__ - Step 5505: {'lr': 0.0004993087831869466, 'samples': 1056960, 'steps': 5504, 'loss/train': 2.1719212532043457} -08/30/2021 14:10:55 - INFO - __main__ - Step 5506: {'lr': 0.0004993083887825393, 'samples': 1057152, 'steps': 5505, 'loss/train': 1.03645920753479} -08/30/2021 14:10:55 - INFO - __main__ - Step 5507: {'lr': 0.0004993079942657976, 'samples': 1057344, 'steps': 5506, 'loss/train': 2.3380463123321533} -08/30/2021 14:10:56 - INFO - __main__ - Step 5508: {'lr': 0.0004993075996367215, 'samples': 1057536, 'steps': 5507, 'loss/train': 2.2435622215270996} -08/30/2021 14:10:57 - INFO - __main__ - Step 5509: {'lr': 0.0004993072048953113, 'samples': 1057728, 'steps': 5508, 'loss/train': 2.1776604652404785} -08/30/2021 14:10:57 - INFO - __main__ - Step 5510: {'lr': 0.0004993068100415671, 'samples': 1057920, 'steps': 5509, 'loss/train': 2.653428316116333} -08/30/2021 14:10:57 - INFO - __main__ - Step 5511: {'lr': 0.000499306415075489, 'samples': 1058112, 'steps': 5510, 'loss/train': 2.6361703872680664} -08/30/2021 14:10:58 - INFO - __main__ - Step 5512: {'lr': 0.0004993060199970774, 'samples': 1058304, 'steps': 5511, 'loss/train': 2.427008867263794} -08/30/2021 14:10:59 - INFO - __main__ - Step 5513: {'lr': 0.0004993056248063323, 'samples': 1058496, 'steps': 5512, 'loss/train': 2.2770121097564697} -08/30/2021 14:11:00 - INFO - __main__ - Step 5514: {'lr': 0.000499305229503254, 'samples': 1058688, 'steps': 5513, 'loss/train': 2.106358289718628} -08/30/2021 14:11:00 - INFO - __main__ - Step 5515: {'lr': 0.0004993048340878425, 'samples': 1058880, 'steps': 5514, 'loss/train': 2.5477981567382812} -08/30/2021 14:11:01 - INFO - __main__ - Step 5516: {'lr': 0.0004993044385600982, 'samples': 1059072, 'steps': 5515, 'loss/train': 2.0413224697113037} -08/30/2021 14:11:01 - INFO - __main__ - Step 5517: {'lr': 0.0004993040429200211, 'samples': 1059264, 'steps': 5516, 'loss/train': 1.5816320180892944} -08/30/2021 14:11:02 - INFO - __main__ - Step 5518: {'lr': 0.0004993036471676115, 'samples': 1059456, 'steps': 5517, 'loss/train': 1.999403715133667} -08/30/2021 14:11:03 - INFO - __main__ - Step 5519: {'lr': 0.0004993032513028695, 'samples': 1059648, 'steps': 5518, 'loss/train': 2.0872840881347656} -08/30/2021 14:11:03 - INFO - __main__ - Step 5520: {'lr': 0.0004993028553257952, 'samples': 1059840, 'steps': 5519, 'loss/train': 2.4998018741607666} -08/30/2021 14:11:04 - INFO - __main__ - Step 5521: {'lr': 0.000499302459236389, 'samples': 1060032, 'steps': 5520, 'loss/train': 2.7392771244049072} -08/30/2021 14:11:04 - INFO - __main__ - Step 5522: {'lr': 0.0004993020630346509, 'samples': 1060224, 'steps': 5521, 'loss/train': 2.084122657775879} -08/30/2021 14:11:04 - INFO - __main__ - Step 5523: {'lr': 0.0004993016667205812, 'samples': 1060416, 'steps': 5522, 'loss/train': 2.190417528152466} -08/30/2021 14:11:06 - INFO - __main__ - Step 5524: {'lr': 0.0004993012702941799, 'samples': 1060608, 'steps': 5523, 'loss/train': 2.637319326400757} -08/30/2021 14:11:06 - INFO - __main__ - Step 5525: {'lr': 0.0004993008737554474, 'samples': 1060800, 'steps': 5524, 'loss/train': 1.8042362928390503} -08/30/2021 14:11:07 - INFO - __main__ - Step 5526: {'lr': 0.0004993004771043837, 'samples': 1060992, 'steps': 5525, 'loss/train': 2.6689212322235107} -08/30/2021 14:11:07 - INFO - __main__ - Step 5527: {'lr': 0.0004993000803409891, 'samples': 1061184, 'steps': 5526, 'loss/train': 1.7853155136108398} -08/30/2021 14:11:07 - INFO - __main__ - Step 5528: {'lr': 0.0004992996834652638, 'samples': 1061376, 'steps': 5527, 'loss/train': 2.338870048522949} -08/30/2021 14:11:10 - INFO - __main__ - Step 5529: {'lr': 0.0004992992864772079, 'samples': 1061568, 'steps': 5528, 'loss/train': 1.9785727262496948} -08/30/2021 14:11:10 - INFO - __main__ - Step 5530: {'lr': 0.0004992988893768214, 'samples': 1061760, 'steps': 5529, 'loss/train': 0.20871050655841827} -08/30/2021 14:11:11 - INFO - __main__ - Step 5531: {'lr': 0.0004992984921641048, 'samples': 1061952, 'steps': 5530, 'loss/train': 2.4556217193603516} -08/30/2021 14:11:11 - INFO - __main__ - Step 5532: {'lr': 0.0004992980948390582, 'samples': 1062144, 'steps': 5531, 'loss/train': 2.12160062789917} -08/30/2021 14:11:11 - INFO - __main__ - Step 5533: {'lr': 0.0004992976974016817, 'samples': 1062336, 'steps': 5532, 'loss/train': 1.3040118217468262} -08/30/2021 14:11:12 - INFO - __main__ - Step 5534: {'lr': 0.0004992972998519755, 'samples': 1062528, 'steps': 5533, 'loss/train': 1.4546117782592773} -08/30/2021 14:11:13 - INFO - __main__ - Step 5535: {'lr': 0.0004992969021899397, 'samples': 1062720, 'steps': 5534, 'loss/train': 1.5991532802581787} -08/30/2021 14:11:14 - INFO - __main__ - Step 5536: {'lr': 0.0004992965044155746, 'samples': 1062912, 'steps': 5535, 'loss/train': 3.6720755100250244} -08/30/2021 14:11:14 - INFO - __main__ - Step 5537: {'lr': 0.0004992961065288803, 'samples': 1063104, 'steps': 5536, 'loss/train': 2.046330451965332} -08/30/2021 14:11:14 - INFO - __main__ - Step 5538: {'lr': 0.0004992957085298571, 'samples': 1063296, 'steps': 5537, 'loss/train': 1.8923728466033936} -08/30/2021 14:11:15 - INFO - __main__ - Step 5539: {'lr': 0.0004992953104185052, 'samples': 1063488, 'steps': 5538, 'loss/train': 1.9728093147277832} -08/30/2021 14:11:15 - INFO - __main__ - Step 5540: {'lr': 0.0004992949121948245, 'samples': 1063680, 'steps': 5539, 'loss/train': 2.3191511631011963} -08/30/2021 14:11:17 - INFO - __main__ - Step 5541: {'lr': 0.0004992945138588154, 'samples': 1063872, 'steps': 5540, 'loss/train': 1.7350372076034546} -08/30/2021 14:11:18 - INFO - __main__ - Step 5542: {'lr': 0.0004992941154104781, 'samples': 1064064, 'steps': 5541, 'loss/train': 1.5580090284347534} -08/30/2021 14:11:18 - INFO - __main__ - Step 5543: {'lr': 0.0004992937168498126, 'samples': 1064256, 'steps': 5542, 'loss/train': 2.5731587409973145} -08/30/2021 14:11:18 - INFO - __main__ - Step 5544: {'lr': 0.0004992933181768194, 'samples': 1064448, 'steps': 5543, 'loss/train': 2.2242648601531982} -08/30/2021 14:11:19 - INFO - __main__ - Step 5545: {'lr': 0.0004992929193914983, 'samples': 1064640, 'steps': 5544, 'loss/train': 2.34719181060791} -08/30/2021 14:11:20 - INFO - __main__ - Step 5546: {'lr': 0.0004992925204938498, 'samples': 1064832, 'steps': 5545, 'loss/train': 2.010756254196167} -08/30/2021 14:11:21 - INFO - __main__ - Step 5547: {'lr': 0.0004992921214838738, 'samples': 1065024, 'steps': 5546, 'loss/train': 2.0510904788970947} -08/30/2021 14:11:21 - INFO - __main__ - Step 5548: {'lr': 0.0004992917223615706, 'samples': 1065216, 'steps': 5547, 'loss/train': 1.9226391315460205} -08/30/2021 14:11:21 - INFO - __main__ - Step 5549: {'lr': 0.0004992913231269405, 'samples': 1065408, 'steps': 5548, 'loss/train': 2.1731057167053223} -08/30/2021 14:11:22 - INFO - __main__ - Step 5550: {'lr': 0.0004992909237799835, 'samples': 1065600, 'steps': 5549, 'loss/train': 1.3518481254577637} -08/30/2021 14:11:23 - INFO - __main__ - Step 5551: {'lr': 0.0004992905243206999, 'samples': 1065792, 'steps': 5550, 'loss/train': 2.6396844387054443} -08/30/2021 14:11:23 - INFO - __main__ - Step 5552: {'lr': 0.0004992901247490899, 'samples': 1065984, 'steps': 5551, 'loss/train': 2.384359836578369} -08/30/2021 14:11:24 - INFO - __main__ - Step 5553: {'lr': 0.0004992897250651535, 'samples': 1066176, 'steps': 5552, 'loss/train': 2.3147265911102295} -08/30/2021 14:11:24 - INFO - __main__ - Step 5554: {'lr': 0.000499289325268891, 'samples': 1066368, 'steps': 5553, 'loss/train': 1.9126274585723877} -08/30/2021 14:11:25 - INFO - __main__ - Step 5555: {'lr': 0.0004992889253603027, 'samples': 1066560, 'steps': 5554, 'loss/train': 2.1129536628723145} -08/30/2021 14:11:26 - INFO - __main__ - Step 5556: {'lr': 0.0004992885253393885, 'samples': 1066752, 'steps': 5555, 'loss/train': 2.1831605434417725} -08/30/2021 14:11:26 - INFO - __main__ - Step 5557: {'lr': 0.0004992881252061489, 'samples': 1066944, 'steps': 5556, 'loss/train': 1.7416491508483887} -08/30/2021 14:11:27 - INFO - __main__ - Step 5558: {'lr': 0.0004992877249605838, 'samples': 1067136, 'steps': 5557, 'loss/train': 2.1720869541168213} -08/30/2021 14:11:27 - INFO - __main__ - Step 5559: {'lr': 0.0004992873246026935, 'samples': 1067328, 'steps': 5558, 'loss/train': 1.594710350036621} -08/30/2021 14:11:28 - INFO - __main__ - Step 5560: {'lr': 0.0004992869241324783, 'samples': 1067520, 'steps': 5559, 'loss/train': 2.2681097984313965} -08/30/2021 14:11:29 - INFO - __main__ - Step 5561: {'lr': 0.000499286523549938, 'samples': 1067712, 'steps': 5560, 'loss/train': 1.0781636238098145} -08/30/2021 14:11:30 - INFO - __main__ - Step 5562: {'lr': 0.0004992861228550733, 'samples': 1067904, 'steps': 5561, 'loss/train': 2.140679121017456} -08/30/2021 14:11:30 - INFO - __main__ - Step 5563: {'lr': 0.0004992857220478841, 'samples': 1068096, 'steps': 5562, 'loss/train': 2.354631185531616} -08/30/2021 14:11:31 - INFO - __main__ - Step 5564: {'lr': 0.0004992853211283705, 'samples': 1068288, 'steps': 5563, 'loss/train': 2.1048831939697266} -08/30/2021 14:11:31 - INFO - __main__ - Step 5565: {'lr': 0.0004992849200965327, 'samples': 1068480, 'steps': 5564, 'loss/train': 1.4562908411026} -08/30/2021 14:11:31 - INFO - __main__ - Step 5566: {'lr': 0.0004992845189523711, 'samples': 1068672, 'steps': 5565, 'loss/train': 2.081939458847046} -08/30/2021 14:11:32 - INFO - __main__ - Step 5567: {'lr': 0.0004992841176958858, 'samples': 1068864, 'steps': 5566, 'loss/train': 0.5906223654747009} -08/30/2021 14:11:33 - INFO - __main__ - Step 5568: {'lr': 0.0004992837163270769, 'samples': 1069056, 'steps': 5567, 'loss/train': 0.9060255885124207} -08/30/2021 14:11:34 - INFO - __main__ - Step 5569: {'lr': 0.0004992833148459445, 'samples': 1069248, 'steps': 5568, 'loss/train': 1.7371954917907715} -08/30/2021 14:11:34 - INFO - __main__ - Step 5570: {'lr': 0.0004992829132524889, 'samples': 1069440, 'steps': 5569, 'loss/train': 3.8672800064086914} -08/30/2021 14:11:34 - INFO - __main__ - Step 5571: {'lr': 0.0004992825115467102, 'samples': 1069632, 'steps': 5570, 'loss/train': 2.0577011108398438} -08/30/2021 14:11:35 - INFO - __main__ - Step 5572: {'lr': 0.0004992821097286088, 'samples': 1069824, 'steps': 5571, 'loss/train': 2.1876301765441895} -08/30/2021 14:11:36 - INFO - __main__ - Step 5573: {'lr': 0.0004992817077981846, 'samples': 1070016, 'steps': 5572, 'loss/train': 2.2967967987060547} -08/30/2021 14:11:37 - INFO - __main__ - Step 5574: {'lr': 0.000499281305755438, 'samples': 1070208, 'steps': 5573, 'loss/train': 2.410820960998535} -08/30/2021 14:11:37 - INFO - __main__ - Step 5575: {'lr': 0.0004992809036003691, 'samples': 1070400, 'steps': 5574, 'loss/train': 2.1856136322021484} -08/30/2021 14:11:38 - INFO - __main__ - Step 5576: {'lr': 0.000499280501332978, 'samples': 1070592, 'steps': 5575, 'loss/train': 2.0397074222564697} -08/30/2021 14:11:38 - INFO - __main__ - Step 5577: {'lr': 0.000499280098953265, 'samples': 1070784, 'steps': 5576, 'loss/train': 0.2530321776866913} -08/30/2021 14:11:39 - INFO - __main__ - Step 5578: {'lr': 0.0004992796964612302, 'samples': 1070976, 'steps': 5577, 'loss/train': 2.3651294708251953} -08/30/2021 14:11:40 - INFO - __main__ - Step 5579: {'lr': 0.0004992792938568739, 'samples': 1071168, 'steps': 5578, 'loss/train': 1.9276092052459717} -08/30/2021 14:11:40 - INFO - __main__ - Step 5580: {'lr': 0.0004992788911401961, 'samples': 1071360, 'steps': 5579, 'loss/train': 1.5673604011535645} -08/30/2021 14:11:41 - INFO - __main__ - Step 5581: {'lr': 0.0004992784883111972, 'samples': 1071552, 'steps': 5580, 'loss/train': 1.9843230247497559} -08/30/2021 14:11:41 - INFO - __main__ - Step 5582: {'lr': 0.0004992780853698771, 'samples': 1071744, 'steps': 5581, 'loss/train': 2.4910387992858887} -08/30/2021 14:11:43 - INFO - __main__ - Step 5583: {'lr': 0.0004992776823162362, 'samples': 1071936, 'steps': 5582, 'loss/train': 1.471346378326416} -08/30/2021 14:11:44 - INFO - __main__ - Step 5584: {'lr': 0.0004992772791502746, 'samples': 1072128, 'steps': 5583, 'loss/train': 2.100456714630127} -08/30/2021 14:11:44 - INFO - __main__ - Step 5585: {'lr': 0.0004992768758719926, 'samples': 1072320, 'steps': 5584, 'loss/train': 1.398590087890625} -08/30/2021 14:11:45 - INFO - __main__ - Step 5586: {'lr': 0.0004992764724813902, 'samples': 1072512, 'steps': 5585, 'loss/train': 1.7602514028549194} -08/30/2021 14:11:45 - INFO - __main__ - Step 5587: {'lr': 0.0004992760689784677, 'samples': 1072704, 'steps': 5586, 'loss/train': 2.4041781425476074} -08/30/2021 14:11:45 - INFO - __main__ - Step 5588: {'lr': 0.0004992756653632252, 'samples': 1072896, 'steps': 5587, 'loss/train': 1.75435209274292} -08/30/2021 14:11:46 - INFO - __main__ - Step 5589: {'lr': 0.0004992752616356631, 'samples': 1073088, 'steps': 5588, 'loss/train': 3.5171561241149902} -08/30/2021 14:11:46 - INFO - __main__ - Step 5590: {'lr': 0.0004992748577957812, 'samples': 1073280, 'steps': 5589, 'loss/train': 2.674107551574707} -08/30/2021 14:11:47 - INFO - __main__ - Step 5591: {'lr': 0.00049927445384358, 'samples': 1073472, 'steps': 5590, 'loss/train': 6.3213324546813965} -08/30/2021 14:11:48 - INFO - __main__ - Step 5592: {'lr': 0.0004992740497790595, 'samples': 1073664, 'steps': 5591, 'loss/train': 3.5618104934692383} -08/30/2021 14:11:48 - INFO - __main__ - Step 5593: {'lr': 0.0004992736456022201, 'samples': 1073856, 'steps': 5592, 'loss/train': 3.2196736335754395} -08/30/2021 14:11:49 - INFO - __main__ - Step 5594: {'lr': 0.0004992732413130617, 'samples': 1074048, 'steps': 5593, 'loss/train': 3.2155239582061768} -08/30/2021 14:11:49 - INFO - __main__ - Step 5595: {'lr': 0.0004992728369115848, 'samples': 1074240, 'steps': 5594, 'loss/train': 3.0582523345947266} -08/30/2021 14:11:51 - INFO - __main__ - Step 5596: {'lr': 0.0004992724323977893, 'samples': 1074432, 'steps': 5595, 'loss/train': 2.801431894302368} -08/30/2021 14:11:52 - INFO - __main__ - Step 5597: {'lr': 0.0004992720277716755, 'samples': 1074624, 'steps': 5596, 'loss/train': 2.778695583343506} -08/30/2021 14:11:52 - INFO - __main__ - Step 5598: {'lr': 0.0004992716230332435, 'samples': 1074816, 'steps': 5597, 'loss/train': 3.006305694580078} -08/30/2021 14:11:52 - INFO - __main__ - Step 5599: {'lr': 0.0004992712181824936, 'samples': 1075008, 'steps': 5598, 'loss/train': 2.5861709117889404} -08/30/2021 14:11:53 - INFO - __main__ - Step 5600: {'lr': 0.0004992708132194259, 'samples': 1075200, 'steps': 5599, 'loss/train': 2.4832420349121094} -08/30/2021 14:11:54 - INFO - __main__ - Step 5601: {'lr': 0.0004992704081440407, 'samples': 1075392, 'steps': 5600, 'loss/train': 3.009307384490967} -08/30/2021 14:11:55 - INFO - __main__ - Step 5602: {'lr': 0.0004992700029563381, 'samples': 1075584, 'steps': 5601, 'loss/train': 2.7582900524139404} -08/30/2021 14:11:55 - INFO - __main__ - Step 5603: {'lr': 0.0004992695976563182, 'samples': 1075776, 'steps': 5602, 'loss/train': 2.938291072845459} -08/30/2021 14:11:55 - INFO - __main__ - Step 5604: {'lr': 0.0004992691922439814, 'samples': 1075968, 'steps': 5603, 'loss/train': 4.9404215812683105} -08/30/2021 14:11:56 - INFO - __main__ - Step 5605: {'lr': 0.0004992687867193277, 'samples': 1076160, 'steps': 5604, 'loss/train': 3.016761302947998} -08/30/2021 14:11:57 - INFO - __main__ - Step 5606: {'lr': 0.0004992683810823572, 'samples': 1076352, 'steps': 5605, 'loss/train': 3.258758306503296} -08/30/2021 14:11:58 - INFO - __main__ - Step 5607: {'lr': 0.0004992679753330703, 'samples': 1076544, 'steps': 5606, 'loss/train': 2.7077651023864746} -08/30/2021 14:11:58 - INFO - __main__ - Step 5608: {'lr': 0.0004992675694714671, 'samples': 1076736, 'steps': 5607, 'loss/train': 2.7785913944244385} -08/30/2021 14:11:58 - INFO - __main__ - Step 5609: {'lr': 0.0004992671634975477, 'samples': 1076928, 'steps': 5608, 'loss/train': 1.9022002220153809} -08/30/2021 14:11:59 - INFO - __main__ - Step 5610: {'lr': 0.0004992667574113125, 'samples': 1077120, 'steps': 5609, 'loss/train': 2.3258204460144043} -08/30/2021 14:12:00 - INFO - __main__ - Step 5611: {'lr': 0.0004992663512127615, 'samples': 1077312, 'steps': 5610, 'loss/train': 2.915809154510498} -08/30/2021 14:12:01 - INFO - __main__ - Step 5612: {'lr': 0.0004992659449018949, 'samples': 1077504, 'steps': 5611, 'loss/train': 0.5763670206069946} -08/30/2021 14:12:01 - INFO - __main__ - Step 5613: {'lr': 0.0004992655384787129, 'samples': 1077696, 'steps': 5612, 'loss/train': 2.5807242393493652} -08/30/2021 14:12:01 - INFO - __main__ - Step 5614: {'lr': 0.0004992651319432157, 'samples': 1077888, 'steps': 5613, 'loss/train': 2.2036759853363037} -08/30/2021 14:12:02 - INFO - __main__ - Step 5615: {'lr': 0.0004992647252954035, 'samples': 1078080, 'steps': 5614, 'loss/train': 2.1674485206604004} -08/30/2021 14:12:03 - INFO - __main__ - Step 5616: {'lr': 0.0004992643185352765, 'samples': 1078272, 'steps': 5615, 'loss/train': 2.368358850479126} -08/30/2021 14:12:04 - INFO - __main__ - Step 5617: {'lr': 0.0004992639116628349, 'samples': 1078464, 'steps': 5616, 'loss/train': 2.0436251163482666} -08/30/2021 14:12:04 - INFO - __main__ - Step 5618: {'lr': 0.0004992635046780786, 'samples': 1078656, 'steps': 5617, 'loss/train': 2.672504186630249} -08/30/2021 14:12:04 - INFO - __main__ - Step 5619: {'lr': 0.0004992630975810083, 'samples': 1078848, 'steps': 5618, 'loss/train': 2.3043212890625} -08/30/2021 14:12:05 - INFO - __main__ - Step 5620: {'lr': 0.0004992626903716237, 'samples': 1079040, 'steps': 5619, 'loss/train': 2.338088274002075} -08/30/2021 14:12:06 - INFO - __main__ - Step 5621: {'lr': 0.0004992622830499252, 'samples': 1079232, 'steps': 5620, 'loss/train': 2.329005002975464} -08/30/2021 14:12:07 - INFO - __main__ - Step 5622: {'lr': 0.000499261875615913, 'samples': 1079424, 'steps': 5621, 'loss/train': 2.4516048431396484} -08/30/2021 14:12:07 - INFO - __main__ - Step 5623: {'lr': 0.0004992614680695872, 'samples': 1079616, 'steps': 5622, 'loss/train': 2.6651577949523926} -08/30/2021 14:12:07 - INFO - __main__ - Step 5624: {'lr': 0.0004992610604109481, 'samples': 1079808, 'steps': 5623, 'loss/train': 2.530071258544922} -08/30/2021 14:12:08 - INFO - __main__ - Step 5625: {'lr': 0.0004992606526399957, 'samples': 1080000, 'steps': 5624, 'loss/train': 2.181800603866577} -08/30/2021 14:12:08 - INFO - __main__ - Step 5626: {'lr': 0.0004992602447567304, 'samples': 1080192, 'steps': 5625, 'loss/train': 2.483560562133789} -08/30/2021 14:12:10 - INFO - __main__ - Step 5627: {'lr': 0.0004992598367611523, 'samples': 1080384, 'steps': 5626, 'loss/train': 2.363994598388672} -08/30/2021 14:12:10 - INFO - __main__ - Step 5628: {'lr': 0.0004992594286532615, 'samples': 1080576, 'steps': 5627, 'loss/train': 2.223031759262085} -08/30/2021 14:12:10 - INFO - __main__ - Step 5629: {'lr': 0.0004992590204330583, 'samples': 1080768, 'steps': 5628, 'loss/train': 2.554281711578369} -08/30/2021 14:12:11 - INFO - __main__ - Step 5630: {'lr': 0.0004992586121005427, 'samples': 1080960, 'steps': 5629, 'loss/train': 1.5866557359695435} -08/30/2021 14:12:11 - INFO - __main__ - Step 5631: {'lr': 0.0004992582036557152, 'samples': 1081152, 'steps': 5630, 'loss/train': 1.6307365894317627} -08/30/2021 14:12:13 - INFO - __main__ - Step 5632: {'lr': 0.0004992577950985757, 'samples': 1081344, 'steps': 5631, 'loss/train': 2.209010124206543} -08/30/2021 14:12:13 - INFO - __main__ - Step 5633: {'lr': 0.0004992573864291244, 'samples': 1081536, 'steps': 5632, 'loss/train': 2.5554189682006836} -08/30/2021 14:12:13 - INFO - __main__ - Step 5634: {'lr': 0.0004992569776473616, 'samples': 1081728, 'steps': 5633, 'loss/train': 2.378779411315918} -08/30/2021 14:12:14 - INFO - __main__ - Step 5635: {'lr': 0.0004992565687532875, 'samples': 1081920, 'steps': 5634, 'loss/train': 2.0683438777923584} -08/30/2021 14:12:14 - INFO - __main__ - Step 5636: {'lr': 0.0004992561597469023, 'samples': 1082112, 'steps': 5635, 'loss/train': 2.2773492336273193} -08/30/2021 14:12:16 - INFO - __main__ - Step 5637: {'lr': 0.0004992557506282061, 'samples': 1082304, 'steps': 5636, 'loss/train': 2.407515048980713} -08/30/2021 14:12:16 - INFO - __main__ - Step 5638: {'lr': 0.0004992553413971991, 'samples': 1082496, 'steps': 5637, 'loss/train': 2.873664617538452} -08/30/2021 14:12:16 - INFO - __main__ - Step 5639: {'lr': 0.0004992549320538814, 'samples': 1082688, 'steps': 5638, 'loss/train': 2.7536582946777344} -08/30/2021 14:12:17 - INFO - __main__ - Step 5640: {'lr': 0.0004992545225982533, 'samples': 1082880, 'steps': 5639, 'loss/train': 2.0577661991119385} -08/30/2021 14:12:17 - INFO - __main__ - Step 5641: {'lr': 0.000499254113030315, 'samples': 1083072, 'steps': 5640, 'loss/train': 2.3533098697662354} -08/30/2021 14:12:19 - INFO - __main__ - Step 5642: {'lr': 0.0004992537033500667, 'samples': 1083264, 'steps': 5641, 'loss/train': 1.821448802947998} -08/30/2021 14:12:19 - INFO - __main__ - Step 5643: {'lr': 0.0004992532935575084, 'samples': 1083456, 'steps': 5642, 'loss/train': 1.7020071744918823} -08/30/2021 14:12:19 - INFO - __main__ - Step 5644: {'lr': 0.0004992528836526405, 'samples': 1083648, 'steps': 5643, 'loss/train': 2.7386322021484375} -08/30/2021 14:12:20 - INFO - __main__ - Step 5645: {'lr': 0.0004992524736354631, 'samples': 1083840, 'steps': 5644, 'loss/train': 1.5291237831115723} -08/30/2021 14:12:20 - INFO - __main__ - Step 5646: {'lr': 0.0004992520635059762, 'samples': 1084032, 'steps': 5645, 'loss/train': 2.173515558242798} -08/30/2021 14:12:22 - INFO - __main__ - Step 5647: {'lr': 0.0004992516532641804, 'samples': 1084224, 'steps': 5646, 'loss/train': 2.7405176162719727} -08/30/2021 14:12:22 - INFO - __main__ - Step 5648: {'lr': 0.0004992512429100757, 'samples': 1084416, 'steps': 5647, 'loss/train': 1.0726940631866455} -08/30/2021 14:12:23 - INFO - __main__ - Step 5649: {'lr': 0.000499250832443662, 'samples': 1084608, 'steps': 5648, 'loss/train': 2.2058637142181396} -08/30/2021 14:12:23 - INFO - __main__ - Step 5650: {'lr': 0.0004992504218649398, 'samples': 1084800, 'steps': 5649, 'loss/train': 0.40684834122657776} -08/30/2021 14:12:23 - INFO - __main__ - Step 5651: {'lr': 0.0004992500111739093, 'samples': 1084992, 'steps': 5650, 'loss/train': 2.338634490966797} -08/30/2021 14:12:24 - INFO - __main__ - Step 5652: {'lr': 0.0004992496003705705, 'samples': 1085184, 'steps': 5651, 'loss/train': 2.478384494781494} -08/30/2021 14:12:26 - INFO - __main__ - Step 5653: {'lr': 0.0004992491894549236, 'samples': 1085376, 'steps': 5652, 'loss/train': 2.0849030017852783} -08/30/2021 14:12:26 - INFO - __main__ - Step 5654: {'lr': 0.000499248778426969, 'samples': 1085568, 'steps': 5653, 'loss/train': 2.181152582168579} -08/30/2021 14:12:27 - INFO - __main__ - Step 5655: {'lr': 0.0004992483672867068, 'samples': 1085760, 'steps': 5654, 'loss/train': 2.0722830295562744} -08/30/2021 14:12:27 - INFO - __main__ - Step 5656: {'lr': 0.000499247956034137, 'samples': 1085952, 'steps': 5655, 'loss/train': 1.231980562210083} -08/30/2021 14:12:27 - INFO - __main__ - Step 5657: {'lr': 0.00049924754466926, 'samples': 1086144, 'steps': 5656, 'loss/train': 0.8097274899482727} -08/30/2021 14:12:29 - INFO - __main__ - Step 5658: {'lr': 0.0004992471331920758, 'samples': 1086336, 'steps': 5657, 'loss/train': 2.6777894496917725} -08/30/2021 14:12:29 - INFO - __main__ - Step 5659: {'lr': 0.0004992467216025848, 'samples': 1086528, 'steps': 5658, 'loss/train': 2.5285768508911133} -08/30/2021 14:12:30 - INFO - __main__ - Step 5660: {'lr': 0.0004992463099007871, 'samples': 1086720, 'steps': 5659, 'loss/train': 2.3760643005371094} -08/30/2021 14:12:30 - INFO - __main__ - Step 5661: {'lr': 0.0004992458980866827, 'samples': 1086912, 'steps': 5660, 'loss/train': 2.465883255004883} -08/30/2021 14:12:30 - INFO - __main__ - Step 5662: {'lr': 0.000499245486160272, 'samples': 1087104, 'steps': 5661, 'loss/train': 1.6989326477050781} -08/30/2021 14:12:32 - INFO - __main__ - Step 5663: {'lr': 0.0004992450741215552, 'samples': 1087296, 'steps': 5662, 'loss/train': 2.1420459747314453} -08/30/2021 14:12:33 - INFO - __main__ - Step 5664: {'lr': 0.0004992446619705324, 'samples': 1087488, 'steps': 5663, 'loss/train': 2.51448655128479} -08/30/2021 14:12:33 - INFO - __main__ - Step 5665: {'lr': 0.0004992442497072037, 'samples': 1087680, 'steps': 5664, 'loss/train': 1.8403258323669434} -08/30/2021 14:12:34 - INFO - __main__ - Step 5666: {'lr': 0.0004992438373315694, 'samples': 1087872, 'steps': 5665, 'loss/train': 3.5829086303710938} -08/30/2021 14:12:34 - INFO - __main__ - Step 5667: {'lr': 0.0004992434248436298, 'samples': 1088064, 'steps': 5666, 'loss/train': 1.30825936794281} -08/30/2021 14:12:35 - INFO - __main__ - Step 5668: {'lr': 0.0004992430122433848, 'samples': 1088256, 'steps': 5667, 'loss/train': 2.7855496406555176} -08/30/2021 14:12:36 - INFO - __main__ - Step 5669: {'lr': 0.0004992425995308349, 'samples': 1088448, 'steps': 5668, 'loss/train': 2.707829236984253} -08/30/2021 14:12:36 - INFO - __main__ - Step 5670: {'lr': 0.0004992421867059801, 'samples': 1088640, 'steps': 5669, 'loss/train': 2.8715929985046387} -08/30/2021 14:12:37 - INFO - __main__ - Step 5671: {'lr': 0.0004992417737688206, 'samples': 1088832, 'steps': 5670, 'loss/train': 2.067136287689209} -08/30/2021 14:12:37 - INFO - __main__ - Step 5672: {'lr': 0.0004992413607193566, 'samples': 1089024, 'steps': 5671, 'loss/train': 1.989829182624817} -08/30/2021 14:12:38 - INFO - __main__ - Step 5673: {'lr': 0.0004992409475575882, 'samples': 1089216, 'steps': 5672, 'loss/train': 2.6323845386505127} -08/30/2021 14:12:39 - INFO - __main__ - Step 5674: {'lr': 0.0004992405342835158, 'samples': 1089408, 'steps': 5673, 'loss/train': 2.9494431018829346} -08/30/2021 14:12:39 - INFO - __main__ - Step 5675: {'lr': 0.0004992401208971394, 'samples': 1089600, 'steps': 5674, 'loss/train': 2.3475522994995117} -08/30/2021 14:12:40 - INFO - __main__ - Step 5676: {'lr': 0.0004992397073984592, 'samples': 1089792, 'steps': 5675, 'loss/train': 2.1629555225372314} -08/30/2021 14:12:40 - INFO - __main__ - Step 5677: {'lr': 0.0004992392937874755, 'samples': 1089984, 'steps': 5676, 'loss/train': 2.100853443145752} -08/30/2021 14:12:40 - INFO - __main__ - Step 5678: {'lr': 0.0004992388800641885, 'samples': 1090176, 'steps': 5677, 'loss/train': 2.1264657974243164} -08/30/2021 14:12:42 - INFO - __main__ - Step 5679: {'lr': 0.0004992384662285981, 'samples': 1090368, 'steps': 5678, 'loss/train': 2.2811851501464844} -08/30/2021 14:12:43 - INFO - __main__ - Step 5680: {'lr': 0.0004992380522807049, 'samples': 1090560, 'steps': 5679, 'loss/train': 0.35879984498023987} -08/30/2021 14:12:43 - INFO - __main__ - Step 5681: {'lr': 0.0004992376382205088, 'samples': 1090752, 'steps': 5680, 'loss/train': 2.296266555786133} -08/30/2021 14:12:43 - INFO - __main__ - Step 5682: {'lr': 0.00049923722404801, 'samples': 1090944, 'steps': 5681, 'loss/train': 1.342445969581604} -08/30/2021 14:12:44 - INFO - __main__ - Step 5683: {'lr': 0.0004992368097632089, 'samples': 1091136, 'steps': 5682, 'loss/train': 2.1382083892822266} -08/30/2021 14:12:45 - INFO - __main__ - Step 5684: {'lr': 0.0004992363953661054, 'samples': 1091328, 'steps': 5683, 'loss/train': 2.2334742546081543} -08/30/2021 14:12:45 - INFO - __main__ - Step 5685: {'lr': 0.0004992359808566999, 'samples': 1091520, 'steps': 5684, 'loss/train': 2.283954620361328} -08/30/2021 14:12:46 - INFO - __main__ - Step 5686: {'lr': 0.0004992355662349925, 'samples': 1091712, 'steps': 5685, 'loss/train': 2.114316701889038} -08/30/2021 14:12:46 - INFO - __main__ - Step 5687: {'lr': 0.0004992351515009833, 'samples': 1091904, 'steps': 5686, 'loss/train': 2.6024370193481445} -08/30/2021 14:12:47 - INFO - __main__ - Step 5688: {'lr': 0.0004992347366546727, 'samples': 1092096, 'steps': 5687, 'loss/train': 2.1036834716796875} -08/30/2021 14:12:48 - INFO - __main__ - Step 5689: {'lr': 0.0004992343216960607, 'samples': 1092288, 'steps': 5688, 'loss/train': 2.1468937397003174} -08/30/2021 14:12:49 - INFO - __main__ - Step 5690: {'lr': 0.0004992339066251476, 'samples': 1092480, 'steps': 5689, 'loss/train': 2.0252957344055176} -08/30/2021 14:12:49 - INFO - __main__ - Step 5691: {'lr': 0.0004992334914419337, 'samples': 1092672, 'steps': 5690, 'loss/train': 2.0974056720733643} -08/30/2021 14:12:49 - INFO - __main__ - Step 5692: {'lr': 0.0004992330761464188, 'samples': 1092864, 'steps': 5691, 'loss/train': 1.116600751876831} -08/30/2021 14:12:50 - INFO - __main__ - Step 5693: {'lr': 0.0004992326607386034, 'samples': 1093056, 'steps': 5692, 'loss/train': 2.1761841773986816} -08/30/2021 14:12:51 - INFO - __main__ - Step 5694: {'lr': 0.0004992322452184876, 'samples': 1093248, 'steps': 5693, 'loss/train': 1.6583324670791626} -08/30/2021 14:12:51 - INFO - __main__ - Step 5695: {'lr': 0.0004992318295860718, 'samples': 1093440, 'steps': 5694, 'loss/train': 1.9998258352279663} -08/30/2021 14:12:52 - INFO - __main__ - Step 5696: {'lr': 0.0004992314138413557, 'samples': 1093632, 'steps': 5695, 'loss/train': 1.500299096107483} -08/30/2021 14:12:52 - INFO - __main__ - Step 5697: {'lr': 0.0004992309979843398, 'samples': 1093824, 'steps': 5696, 'loss/train': 1.796570062637329} -08/30/2021 14:12:52 - INFO - __main__ - Step 5698: {'lr': 0.0004992305820150243, 'samples': 1094016, 'steps': 5697, 'loss/train': 2.0542001724243164} -08/30/2021 14:12:54 - INFO - __main__ - Step 5699: {'lr': 0.0004992301659334095, 'samples': 1094208, 'steps': 5698, 'loss/train': 2.145958185195923} -08/30/2021 14:12:54 - INFO - __main__ - Step 5700: {'lr': 0.0004992297497394953, 'samples': 1094400, 'steps': 5699, 'loss/train': 1.3726893663406372} -08/30/2021 14:12:55 - INFO - __main__ - Step 5701: {'lr': 0.000499229333433282, 'samples': 1094592, 'steps': 5700, 'loss/train': 0.8239323496818542} -08/30/2021 14:12:55 - INFO - __main__ - Step 5702: {'lr': 0.0004992289170147699, 'samples': 1094784, 'steps': 5701, 'loss/train': 2.321021556854248} -08/30/2021 14:12:55 - INFO - __main__ - Step 5703: {'lr': 0.000499228500483959, 'samples': 1094976, 'steps': 5702, 'loss/train': 2.34973406791687} -08/30/2021 14:12:58 - INFO - __main__ - Step 5704: {'lr': 0.0004992280838408496, 'samples': 1095168, 'steps': 5703, 'loss/train': 2.7191219329833984} -08/30/2021 14:12:58 - INFO - __main__ - Step 5705: {'lr': 0.0004992276670854419, 'samples': 1095360, 'steps': 5704, 'loss/train': 2.2663156986236572} -08/30/2021 14:12:58 - INFO - __main__ - Step 5706: {'lr': 0.000499227250217736, 'samples': 1095552, 'steps': 5705, 'loss/train': 2.295117139816284} -08/30/2021 14:12:59 - INFO - __main__ - Step 5707: {'lr': 0.0004992268332377323, 'samples': 1095744, 'steps': 5706, 'loss/train': 2.4629361629486084} -08/30/2021 14:12:59 - INFO - __main__ - Step 5708: {'lr': 0.0004992264161454306, 'samples': 1095936, 'steps': 5707, 'loss/train': 1.8976025581359863} -08/30/2021 14:13:01 - INFO - __main__ - Step 5709: {'lr': 0.0004992259989408316, 'samples': 1096128, 'steps': 5708, 'loss/train': 1.6562938690185547} -08/30/2021 14:13:01 - INFO - __main__ - Step 5710: {'lr': 0.000499225581623935, 'samples': 1096320, 'steps': 5709, 'loss/train': 2.2951793670654297} -08/30/2021 14:13:01 - INFO - __main__ - Step 5711: {'lr': 0.0004992251641947412, 'samples': 1096512, 'steps': 5710, 'loss/train': 1.9760348796844482} -08/30/2021 14:13:02 - INFO - __main__ - Step 5712: {'lr': 0.0004992247466532504, 'samples': 1096704, 'steps': 5711, 'loss/train': 2.306309461593628} -08/30/2021 14:13:02 - INFO - __main__ - Step 5713: {'lr': 0.0004992243289994629, 'samples': 1096896, 'steps': 5712, 'loss/train': 2.377441644668579} -08/30/2021 14:13:03 - INFO - __main__ - Step 5714: {'lr': 0.0004992239112333787, 'samples': 1097088, 'steps': 5713, 'loss/train': 1.9280357360839844} -08/30/2021 14:13:04 - INFO - __main__ - Step 5715: {'lr': 0.000499223493354998, 'samples': 1097280, 'steps': 5714, 'loss/train': 2.1363718509674072} -08/30/2021 14:13:04 - INFO - __main__ - Step 5716: {'lr': 0.0004992230753643211, 'samples': 1097472, 'steps': 5715, 'loss/train': 2.1121766567230225} -08/30/2021 14:13:05 - INFO - __main__ - Step 5717: {'lr': 0.0004992226572613481, 'samples': 1097664, 'steps': 5716, 'loss/train': 2.4798450469970703} -08/30/2021 14:13:05 - INFO - __main__ - Step 5718: {'lr': 0.0004992222390460792, 'samples': 1097856, 'steps': 5717, 'loss/train': 1.9710110425949097} -08/30/2021 14:13:05 - INFO - __main__ - Step 5719: {'lr': 0.0004992218207185146, 'samples': 1098048, 'steps': 5718, 'loss/train': 1.659106969833374} -08/30/2021 14:13:07 - INFO - __main__ - Step 5720: {'lr': 0.0004992214022786546, 'samples': 1098240, 'steps': 5719, 'loss/train': 1.6958831548690796} -08/30/2021 14:13:07 - INFO - __main__ - Step 5721: {'lr': 0.0004992209837264991, 'samples': 1098432, 'steps': 5720, 'loss/train': 2.4289145469665527} -08/30/2021 14:13:08 - INFO - __main__ - Step 5722: {'lr': 0.0004992205650620487, 'samples': 1098624, 'steps': 5721, 'loss/train': 1.7528969049453735} -08/30/2021 14:13:08 - INFO - __main__ - Step 5723: {'lr': 0.0004992201462853032, 'samples': 1098816, 'steps': 5722, 'loss/train': 2.3579201698303223} -08/30/2021 14:13:08 - INFO - __main__ - Step 5724: {'lr': 0.000499219727396263, 'samples': 1099008, 'steps': 5723, 'loss/train': 2.2928426265716553} -08/30/2021 14:13:10 - INFO - __main__ - Step 5725: {'lr': 0.0004992193083949282, 'samples': 1099200, 'steps': 5724, 'loss/train': 1.9065685272216797} -08/30/2021 14:13:10 - INFO - __main__ - Step 5726: {'lr': 0.000499218889281299, 'samples': 1099392, 'steps': 5725, 'loss/train': 2.054805278778076} -08/30/2021 14:13:11 - INFO - __main__ - Step 5727: {'lr': 0.0004992184700553756, 'samples': 1099584, 'steps': 5726, 'loss/train': 2.198212146759033} -08/30/2021 14:13:11 - INFO - __main__ - Step 5728: {'lr': 0.0004992180507171583, 'samples': 1099776, 'steps': 5727, 'loss/train': 1.9786972999572754} -08/30/2021 14:13:11 - INFO - __main__ - Step 5729: {'lr': 0.0004992176312666472, 'samples': 1099968, 'steps': 5728, 'loss/train': 1.439853549003601} -08/30/2021 14:13:13 - INFO - __main__ - Step 5730: {'lr': 0.0004992172117038424, 'samples': 1100160, 'steps': 5729, 'loss/train': 3.0891635417938232} -08/30/2021 14:13:13 - INFO - __main__ - Step 5731: {'lr': 0.0004992167920287443, 'samples': 1100352, 'steps': 5730, 'loss/train': 1.9488180875778198} -08/30/2021 14:13:13 - INFO - __main__ - Step 5732: {'lr': 0.0004992163722413528, 'samples': 1100544, 'steps': 5731, 'loss/train': 2.0667245388031006} -08/30/2021 14:13:14 - INFO - __main__ - Step 5733: {'lr': 0.0004992159523416683, 'samples': 1100736, 'steps': 5732, 'loss/train': 2.0932631492614746} -08/30/2021 14:13:14 - INFO - __main__ - Step 5734: {'lr': 0.000499215532329691, 'samples': 1100928, 'steps': 5733, 'loss/train': 0.6742189526557922} -08/30/2021 14:13:16 - INFO - __main__ - Step 5735: {'lr': 0.000499215112205421, 'samples': 1101120, 'steps': 5734, 'loss/train': 1.9801772832870483} -08/30/2021 14:13:16 - INFO - __main__ - Step 5736: {'lr': 0.0004992146919688584, 'samples': 1101312, 'steps': 5735, 'loss/train': 2.2107222080230713} -08/30/2021 14:13:16 - INFO - __main__ - Step 5737: {'lr': 0.0004992142716200036, 'samples': 1101504, 'steps': 5736, 'loss/train': 2.240306854248047} -08/30/2021 14:13:17 - INFO - __main__ - Step 5738: {'lr': 0.0004992138511588567, 'samples': 1101696, 'steps': 5737, 'loss/train': 1.975052833557129} -08/30/2021 14:13:17 - INFO - __main__ - Step 5739: {'lr': 0.0004992134305854179, 'samples': 1101888, 'steps': 5738, 'loss/train': 2.5487613677978516} -08/30/2021 14:13:19 - INFO - __main__ - Step 5740: {'lr': 0.0004992130098996873, 'samples': 1102080, 'steps': 5739, 'loss/train': 2.0061371326446533} -08/30/2021 14:13:19 - INFO - __main__ - Step 5741: {'lr': 0.0004992125891016652, 'samples': 1102272, 'steps': 5740, 'loss/train': 2.1268246173858643} -08/30/2021 14:13:20 - INFO - __main__ - Step 5742: {'lr': 0.0004992121681913518, 'samples': 1102464, 'steps': 5741, 'loss/train': 1.9292787313461304} -08/30/2021 14:13:20 - INFO - __main__ - Step 5743: {'lr': 0.0004992117471687472, 'samples': 1102656, 'steps': 5742, 'loss/train': 2.0467426776885986} -08/30/2021 14:13:20 - INFO - __main__ - Step 5744: {'lr': 0.0004992113260338517, 'samples': 1102848, 'steps': 5743, 'loss/train': 2.078896999359131} -08/30/2021 14:13:21 - INFO - __main__ - Step 5745: {'lr': 0.0004992109047866653, 'samples': 1103040, 'steps': 5744, 'loss/train': 2.2047533988952637} -08/30/2021 14:13:22 - INFO - __main__ - Step 5746: {'lr': 0.0004992104834271884, 'samples': 1103232, 'steps': 5745, 'loss/train': 2.364816665649414} -08/30/2021 14:13:22 - INFO - __main__ - Step 5747: {'lr': 0.0004992100619554211, 'samples': 1103424, 'steps': 5746, 'loss/train': 2.120272159576416} -08/30/2021 14:13:23 - INFO - __main__ - Step 5748: {'lr': 0.0004992096403713635, 'samples': 1103616, 'steps': 5747, 'loss/train': 2.5253005027770996} -08/30/2021 14:13:23 - INFO - __main__ - Step 5749: {'lr': 0.000499209218675016, 'samples': 1103808, 'steps': 5748, 'loss/train': 2.4032397270202637} -08/30/2021 14:13:24 - INFO - __main__ - Step 5750: {'lr': 0.0004992087968663786, 'samples': 1104000, 'steps': 5749, 'loss/train': 2.4137752056121826} -08/30/2021 14:13:25 - INFO - __main__ - Step 5751: {'lr': 0.0004992083749454515, 'samples': 1104192, 'steps': 5750, 'loss/train': 1.768087387084961} -08/30/2021 14:13:25 - INFO - __main__ - Step 5752: {'lr': 0.0004992079529122351, 'samples': 1104384, 'steps': 5751, 'loss/train': 2.147995948791504} -08/30/2021 14:13:26 - INFO - __main__ - Step 5753: {'lr': 0.0004992075307667294, 'samples': 1104576, 'steps': 5752, 'loss/train': 2.203209638595581} -08/30/2021 14:13:26 - INFO - __main__ - Step 5754: {'lr': 0.0004992071085089346, 'samples': 1104768, 'steps': 5753, 'loss/train': 2.765620231628418} -08/30/2021 14:13:27 - INFO - __main__ - Step 5755: {'lr': 0.0004992066861388509, 'samples': 1104960, 'steps': 5754, 'loss/train': 2.8312582969665527} -08/30/2021 14:13:28 - INFO - __main__ - Step 5756: {'lr': 0.0004992062636564786, 'samples': 1105152, 'steps': 5755, 'loss/train': 1.6942883729934692} -08/30/2021 14:13:29 - INFO - __main__ - Step 5757: {'lr': 0.0004992058410618177, 'samples': 1105344, 'steps': 5756, 'loss/train': 2.234927177429199} -08/30/2021 14:13:29 - INFO - __main__ - Step 5758: {'lr': 0.0004992054183548685, 'samples': 1105536, 'steps': 5757, 'loss/train': 1.7898328304290771} -08/30/2021 14:13:30 - INFO - __main__ - Step 5759: {'lr': 0.0004992049955356313, 'samples': 1105728, 'steps': 5758, 'loss/train': 1.5698727369308472} -08/30/2021 14:13:30 - INFO - __main__ - Step 5760: {'lr': 0.0004992045726041061, 'samples': 1105920, 'steps': 5759, 'loss/train': 1.4664987325668335} -08/30/2021 14:13:31 - INFO - __main__ - Step 5761: {'lr': 0.0004992041495602931, 'samples': 1106112, 'steps': 5760, 'loss/train': 2.4140067100524902} -08/30/2021 14:13:32 - INFO - __main__ - Step 5762: {'lr': 0.0004992037264041927, 'samples': 1106304, 'steps': 5761, 'loss/train': 2.1634068489074707} -08/30/2021 14:13:32 - INFO - __main__ - Step 5763: {'lr': 0.0004992033031358048, 'samples': 1106496, 'steps': 5762, 'loss/train': 1.0948678255081177} -08/30/2021 14:13:33 - INFO - __main__ - Step 5764: {'lr': 0.0004992028797551298, 'samples': 1106688, 'steps': 5763, 'loss/train': 1.8745142221450806} -08/30/2021 14:13:33 - INFO - __main__ - Step 5765: {'lr': 0.0004992024562621678, 'samples': 1106880, 'steps': 5764, 'loss/train': 2.4703831672668457} -08/30/2021 14:13:33 - INFO - __main__ - Step 5766: {'lr': 0.0004992020326569191, 'samples': 1107072, 'steps': 5765, 'loss/train': 0.3508596420288086} -08/30/2021 14:13:35 - INFO - __main__ - Step 5767: {'lr': 0.0004992016089393837, 'samples': 1107264, 'steps': 5766, 'loss/train': 2.3133385181427} -08/30/2021 14:13:35 - INFO - __main__ - Step 5768: {'lr': 0.000499201185109562, 'samples': 1107456, 'steps': 5767, 'loss/train': 1.7067315578460693} -08/30/2021 14:13:36 - INFO - __main__ - Step 5769: {'lr': 0.000499200761167454, 'samples': 1107648, 'steps': 5768, 'loss/train': 1.6532922983169556} -08/30/2021 14:13:36 - INFO - __main__ - Step 5770: {'lr': 0.0004992003371130601, 'samples': 1107840, 'steps': 5769, 'loss/train': 2.325556516647339} -08/30/2021 14:13:36 - INFO - __main__ - Step 5771: {'lr': 0.0004991999129463803, 'samples': 1108032, 'steps': 5770, 'loss/train': 2.090094566345215} -08/30/2021 14:13:38 - INFO - __main__ - Step 5772: {'lr': 0.0004991994886674148, 'samples': 1108224, 'steps': 5771, 'loss/train': 2.066429376602173} -08/30/2021 14:13:38 - INFO - __main__ - Step 5773: {'lr': 0.000499199064276164, 'samples': 1108416, 'steps': 5772, 'loss/train': 2.2343039512634277} -08/30/2021 14:13:39 - INFO - __main__ - Step 5774: {'lr': 0.0004991986397726278, 'samples': 1108608, 'steps': 5773, 'loss/train': 2.1294426918029785} -08/30/2021 14:13:39 - INFO - __main__ - Step 5775: {'lr': 0.0004991982151568066, 'samples': 1108800, 'steps': 5774, 'loss/train': 2.2161622047424316} -08/30/2021 14:13:39 - INFO - __main__ - Step 5776: {'lr': 0.0004991977904287006, 'samples': 1108992, 'steps': 5775, 'loss/train': 2.51168155670166} -08/30/2021 14:13:41 - INFO - __main__ - Step 5777: {'lr': 0.0004991973655883099, 'samples': 1109184, 'steps': 5776, 'loss/train': 1.9757490158081055} -08/30/2021 14:13:41 - INFO - __main__ - Step 5778: {'lr': 0.0004991969406356346, 'samples': 1109376, 'steps': 5777, 'loss/train': 2.0249340534210205} -08/30/2021 14:13:42 - INFO - __main__ - Step 5779: {'lr': 0.0004991965155706752, 'samples': 1109568, 'steps': 5778, 'loss/train': 1.403512716293335} -08/30/2021 14:13:42 - INFO - __main__ - Step 5780: {'lr': 0.0004991960903934315, 'samples': 1109760, 'steps': 5779, 'loss/train': 1.8740057945251465} -08/30/2021 14:13:42 - INFO - __main__ - Step 5781: {'lr': 0.0004991956651039039, 'samples': 1109952, 'steps': 5780, 'loss/train': 2.0561277866363525} -08/30/2021 14:13:43 - INFO - __main__ - Step 5782: {'lr': 0.0004991952397020927, 'samples': 1110144, 'steps': 5781, 'loss/train': 0.9645845890045166} -08/30/2021 14:13:44 - INFO - __main__ - Step 5783: {'lr': 0.0004991948141879978, 'samples': 1110336, 'steps': 5782, 'loss/train': 2.164886474609375} -08/30/2021 14:13:45 - INFO - __main__ - Step 5784: {'lr': 0.0004991943885616198, 'samples': 1110528, 'steps': 5783, 'loss/train': 1.8348333835601807} -08/30/2021 14:13:45 - INFO - __main__ - Step 5785: {'lr': 0.0004991939628229585, 'samples': 1110720, 'steps': 5784, 'loss/train': 1.9779103994369507} -08/30/2021 14:13:45 - INFO - __main__ - Step 5786: {'lr': 0.0004991935369720143, 'samples': 1110912, 'steps': 5785, 'loss/train': 1.8907867670059204} -08/30/2021 14:13:46 - INFO - __main__ - Step 5787: {'lr': 0.0004991931110087873, 'samples': 1111104, 'steps': 5786, 'loss/train': 2.2632336616516113} -08/30/2021 14:13:47 - INFO - __main__ - Step 5788: {'lr': 0.0004991926849332777, 'samples': 1111296, 'steps': 5787, 'loss/train': 2.4298908710479736} -08/30/2021 14:13:48 - INFO - __main__ - Step 5789: {'lr': 0.0004991922587454858, 'samples': 1111488, 'steps': 5788, 'loss/train': 1.721315860748291} -08/30/2021 14:13:48 - INFO - __main__ - Step 5790: {'lr': 0.0004991918324454117, 'samples': 1111680, 'steps': 5789, 'loss/train': 1.5899486541748047} -08/30/2021 14:13:48 - INFO - __main__ - Step 5791: {'lr': 0.0004991914060330556, 'samples': 1111872, 'steps': 5790, 'loss/train': 1.92160165309906} -08/30/2021 14:13:49 - INFO - __main__ - Step 5792: {'lr': 0.0004991909795084177, 'samples': 1112064, 'steps': 5791, 'loss/train': 2.054802417755127} -08/30/2021 14:13:50 - INFO - __main__ - Step 5793: {'lr': 0.0004991905528714981, 'samples': 1112256, 'steps': 5792, 'loss/train': 2.0912177562713623} -08/30/2021 14:13:51 - INFO - __main__ - Step 5794: {'lr': 0.0004991901261222971, 'samples': 1112448, 'steps': 5793, 'loss/train': 1.492459774017334} -08/30/2021 14:13:51 - INFO - __main__ - Step 5795: {'lr': 0.000499189699260815, 'samples': 1112640, 'steps': 5794, 'loss/train': 2.2374181747436523} -08/30/2021 14:13:52 - INFO - __main__ - Step 5796: {'lr': 0.0004991892722870517, 'samples': 1112832, 'steps': 5795, 'loss/train': 2.1417839527130127} -08/30/2021 14:13:52 - INFO - __main__ - Step 5797: {'lr': 0.0004991888452010076, 'samples': 1113024, 'steps': 5796, 'loss/train': 2.084658145904541} -08/30/2021 14:13:52 - INFO - __main__ - Step 5798: {'lr': 0.000499188418002683, 'samples': 1113216, 'steps': 5797, 'loss/train': 2.9410722255706787} -08/30/2021 14:13:54 - INFO - __main__ - Step 5799: {'lr': 0.0004991879906920779, 'samples': 1113408, 'steps': 5798, 'loss/train': 2.235234260559082} -08/30/2021 14:13:54 - INFO - __main__ - Step 5800: {'lr': 0.0004991875632691924, 'samples': 1113600, 'steps': 5799, 'loss/train': 2.190568685531616} -08/30/2021 14:13:55 - INFO - __main__ - Step 5801: {'lr': 0.0004991871357340269, 'samples': 1113792, 'steps': 5800, 'loss/train': 2.011568546295166} -08/30/2021 14:13:55 - INFO - __main__ - Step 5802: {'lr': 0.0004991867080865815, 'samples': 1113984, 'steps': 5801, 'loss/train': 2.3917582035064697} -08/30/2021 14:13:55 - INFO - __main__ - Step 5803: {'lr': 0.0004991862803268564, 'samples': 1114176, 'steps': 5802, 'loss/train': 1.774945616722107} -08/30/2021 14:13:57 - INFO - __main__ - Step 5804: {'lr': 0.0004991858524548519, 'samples': 1114368, 'steps': 5803, 'loss/train': 1.6664633750915527} -08/30/2021 14:13:58 - INFO - __main__ - Step 5805: {'lr': 0.000499185424470568, 'samples': 1114560, 'steps': 5804, 'loss/train': 2.505523443222046} -08/30/2021 14:13:58 - INFO - __main__ - Step 5806: {'lr': 0.0004991849963740052, 'samples': 1114752, 'steps': 5805, 'loss/train': 0.5344151258468628} -08/30/2021 14:13:58 - INFO - __main__ - Step 5807: {'lr': 0.0004991845681651632, 'samples': 1114944, 'steps': 5806, 'loss/train': 2.6453616619110107} -08/30/2021 14:13:59 - INFO - __main__ - Step 5808: {'lr': 0.0004991841398440427, 'samples': 1115136, 'steps': 5807, 'loss/train': 1.5687943696975708} -08/30/2021 14:14:00 - INFO - __main__ - Step 5809: {'lr': 0.0004991837114106436, 'samples': 1115328, 'steps': 5808, 'loss/train': 1.5863301753997803} -08/30/2021 14:14:01 - INFO - __main__ - Step 5810: {'lr': 0.0004991832828649661, 'samples': 1115520, 'steps': 5809, 'loss/train': 2.273674488067627} -08/30/2021 14:14:01 - INFO - __main__ - Step 5811: {'lr': 0.0004991828542070105, 'samples': 1115712, 'steps': 5810, 'loss/train': 2.063884735107422} -08/30/2021 14:14:01 - INFO - __main__ - Step 5812: {'lr': 0.000499182425436777, 'samples': 1115904, 'steps': 5811, 'loss/train': 2.101816177368164} -08/30/2021 14:14:02 - INFO - __main__ - Step 5813: {'lr': 0.0004991819965542657, 'samples': 1116096, 'steps': 5812, 'loss/train': 1.9726061820983887} -08/30/2021 14:14:04 - INFO - __main__ - Step 5814: {'lr': 0.0004991815675594768, 'samples': 1116288, 'steps': 5813, 'loss/train': 2.189896583557129} -08/30/2021 14:14:04 - INFO - __main__ - Step 5815: {'lr': 0.0004991811384524106, 'samples': 1116480, 'steps': 5814, 'loss/train': 1.5735437870025635} -08/30/2021 14:14:05 - INFO - __main__ - Step 5816: {'lr': 0.0004991807092330671, 'samples': 1116672, 'steps': 5815, 'loss/train': 1.6591681241989136} -08/30/2021 14:14:05 - INFO - __main__ - Step 5817: {'lr': 0.0004991802799014467, 'samples': 1116864, 'steps': 5816, 'loss/train': 3.386476516723633} -08/30/2021 14:14:05 - INFO - __main__ - Step 5818: {'lr': 0.0004991798504575495, 'samples': 1117056, 'steps': 5817, 'loss/train': 2.6909241676330566} -08/30/2021 14:14:07 - INFO - __main__ - Step 5819: {'lr': 0.0004991794209013758, 'samples': 1117248, 'steps': 5818, 'loss/train': 2.2129266262054443} -08/30/2021 14:14:07 - INFO - __main__ - Step 5820: {'lr': 0.0004991789912329257, 'samples': 1117440, 'steps': 5819, 'loss/train': 2.9793317317962646} -08/30/2021 14:14:08 - INFO - __main__ - Step 5821: {'lr': 0.0004991785614521993, 'samples': 1117632, 'steps': 5820, 'loss/train': 2.5976696014404297} -08/30/2021 14:14:08 - INFO - __main__ - Step 5822: {'lr': 0.0004991781315591969, 'samples': 1117824, 'steps': 5821, 'loss/train': 1.6759430170059204} -08/30/2021 14:14:08 - INFO - __main__ - Step 5823: {'lr': 0.0004991777015539186, 'samples': 1118016, 'steps': 5822, 'loss/train': 2.5088138580322266} -08/30/2021 14:14:11 - INFO - __main__ - Step 5824: {'lr': 0.0004991772714363649, 'samples': 1118208, 'steps': 5823, 'loss/train': 2.419053077697754} -08/30/2021 14:14:11 - INFO - __main__ - Step 5825: {'lr': 0.0004991768412065355, 'samples': 1118400, 'steps': 5824, 'loss/train': 2.1020472049713135} -08/30/2021 14:14:11 - INFO - __main__ - Step 5826: {'lr': 0.000499176410864431, 'samples': 1118592, 'steps': 5825, 'loss/train': 1.631892204284668} -08/30/2021 14:14:12 - INFO - __main__ - Step 5827: {'lr': 0.0004991759804100515, 'samples': 1118784, 'steps': 5826, 'loss/train': 1.3924821615219116} -08/30/2021 14:14:12 - INFO - __main__ - Step 5828: {'lr': 0.000499175549843397, 'samples': 1118976, 'steps': 5827, 'loss/train': 1.8927206993103027} -08/30/2021 14:14:12 - INFO - __main__ - Step 5829: {'lr': 0.0004991751191644679, 'samples': 1119168, 'steps': 5828, 'loss/train': 0.4454633593559265} -08/30/2021 14:14:14 - INFO - __main__ - Step 5830: {'lr': 0.0004991746883732644, 'samples': 1119360, 'steps': 5829, 'loss/train': 0.39374086260795593} -08/30/2021 14:14:14 - INFO - __main__ - Step 5831: {'lr': 0.0004991742574697866, 'samples': 1119552, 'steps': 5830, 'loss/train': 1.9435609579086304} -08/30/2021 14:14:15 - INFO - __main__ - Step 5832: {'lr': 0.0004991738264540347, 'samples': 1119744, 'steps': 5831, 'loss/train': 2.1106748580932617} -08/30/2021 14:14:15 - INFO - __main__ - Step 5833: {'lr': 0.0004991733953260089, 'samples': 1119936, 'steps': 5832, 'loss/train': 2.182868242263794} -08/30/2021 14:14:15 - INFO - __main__ - Step 5834: {'lr': 0.0004991729640857095, 'samples': 1120128, 'steps': 5833, 'loss/train': 1.6570278406143188} -08/30/2021 14:14:17 - INFO - __main__ - Step 5835: {'lr': 0.0004991725327331366, 'samples': 1120320, 'steps': 5834, 'loss/train': 0.9613577127456665} -08/30/2021 14:14:18 - INFO - __main__ - Step 5836: {'lr': 0.0004991721012682903, 'samples': 1120512, 'steps': 5835, 'loss/train': 2.544282913208008} -08/30/2021 14:14:18 - INFO - __main__ - Step 5837: {'lr': 0.0004991716696911709, 'samples': 1120704, 'steps': 5836, 'loss/train': 2.135673999786377} -08/30/2021 14:14:18 - INFO - __main__ - Step 5838: {'lr': 0.0004991712380017786, 'samples': 1120896, 'steps': 5837, 'loss/train': 1.9499467611312866} -08/30/2021 14:14:19 - INFO - __main__ - Step 5839: {'lr': 0.0004991708062001137, 'samples': 1121088, 'steps': 5838, 'loss/train': 1.840232014656067} -08/30/2021 14:14:20 - INFO - __main__ - Step 5840: {'lr': 0.0004991703742861762, 'samples': 1121280, 'steps': 5839, 'loss/train': 2.009258270263672} -08/30/2021 14:14:21 - INFO - __main__ - Step 5841: {'lr': 0.0004991699422599664, 'samples': 1121472, 'steps': 5840, 'loss/train': 1.9192055463790894} -08/30/2021 14:14:21 - INFO - __main__ - Step 5842: {'lr': 0.0004991695101214844, 'samples': 1121664, 'steps': 5841, 'loss/train': 1.596557855606079} -08/30/2021 14:14:21 - INFO - __main__ - Step 5843: {'lr': 0.0004991690778707305, 'samples': 1121856, 'steps': 5842, 'loss/train': 1.9584181308746338} -08/30/2021 14:14:22 - INFO - __main__ - Step 5844: {'lr': 0.0004991686455077049, 'samples': 1122048, 'steps': 5843, 'loss/train': 0.23421703279018402} -08/30/2021 14:14:23 - INFO - __main__ - Step 5845: {'lr': 0.0004991682130324078, 'samples': 1122240, 'steps': 5844, 'loss/train': 2.0000855922698975} -08/30/2021 14:14:24 - INFO - __main__ - Step 5846: {'lr': 0.0004991677804448392, 'samples': 1122432, 'steps': 5845, 'loss/train': 1.8915375471115112} -08/30/2021 14:14:24 - INFO - __main__ - Step 5847: {'lr': 0.0004991673477449995, 'samples': 1122624, 'steps': 5846, 'loss/train': 2.2981455326080322} -08/30/2021 14:14:25 - INFO - __main__ - Step 5848: {'lr': 0.0004991669149328889, 'samples': 1122816, 'steps': 5847, 'loss/train': 2.2572288513183594} -08/30/2021 14:14:25 - INFO - __main__ - Step 5849: {'lr': 0.0004991664820085074, 'samples': 1123008, 'steps': 5848, 'loss/train': 1.9210668802261353} -08/30/2021 14:14:27 - INFO - __main__ - Step 5850: {'lr': 0.0004991660489718554, 'samples': 1123200, 'steps': 5849, 'loss/train': 0.2859579920768738} -08/30/2021 14:14:27 - INFO - __main__ - Step 5851: {'lr': 0.0004991656158229331, 'samples': 1123392, 'steps': 5850, 'loss/train': 2.6969258785247803} -08/30/2021 14:14:28 - INFO - __main__ - Step 5852: {'lr': 0.0004991651825617406, 'samples': 1123584, 'steps': 5851, 'loss/train': 0.5447800755500793} -08/30/2021 14:14:28 - INFO - __main__ - Step 5853: {'lr': 0.000499164749188278, 'samples': 1123776, 'steps': 5852, 'loss/train': 3.3150076866149902} -08/30/2021 14:14:29 - INFO - __main__ - Step 5854: {'lr': 0.0004991643157025458, 'samples': 1123968, 'steps': 5853, 'loss/train': 2.355253219604492} -08/30/2021 14:14:29 - INFO - __main__ - Step 5855: {'lr': 0.0004991638821045439, 'samples': 1124160, 'steps': 5854, 'loss/train': 2.568922996520996} -08/30/2021 14:14:30 - INFO - __main__ - Step 5856: {'lr': 0.0004991634483942725, 'samples': 1124352, 'steps': 5855, 'loss/train': 1.9149999618530273} -08/30/2021 14:14:31 - INFO - __main__ - Step 5857: {'lr': 0.000499163014571732, 'samples': 1124544, 'steps': 5856, 'loss/train': 2.3357861042022705} -08/30/2021 14:14:31 - INFO - __main__ - Step 5858: {'lr': 0.0004991625806369225, 'samples': 1124736, 'steps': 5857, 'loss/train': 1.2552976608276367} -08/30/2021 14:14:31 - INFO - __main__ - Step 5859: {'lr': 0.0004991621465898441, 'samples': 1124928, 'steps': 5858, 'loss/train': 2.1629445552825928} -08/30/2021 14:14:32 - INFO - __main__ - Step 5860: {'lr': 0.0004991617124304971, 'samples': 1125120, 'steps': 5859, 'loss/train': 2.0742111206054688} -08/30/2021 14:14:32 - INFO - __main__ - Step 5861: {'lr': 0.0004991612781588818, 'samples': 1125312, 'steps': 5860, 'loss/train': 1.6806098222732544} -08/30/2021 14:14:34 - INFO - __main__ - Step 5862: {'lr': 0.0004991608437749981, 'samples': 1125504, 'steps': 5861, 'loss/train': 1.7067089080810547} -08/30/2021 14:14:34 - INFO - __main__ - Step 5863: {'lr': 0.0004991604092788465, 'samples': 1125696, 'steps': 5862, 'loss/train': 1.7889811992645264} -08/30/2021 14:14:35 - INFO - __main__ - Step 5864: {'lr': 0.000499159974670427, 'samples': 1125888, 'steps': 5863, 'loss/train': 2.5286667346954346} -08/30/2021 14:14:35 - INFO - __main__ - Step 5865: {'lr': 0.00049915953994974, 'samples': 1126080, 'steps': 5864, 'loss/train': 1.9244738817214966} -08/30/2021 14:14:35 - INFO - __main__ - Step 5866: {'lr': 0.0004991591051167853, 'samples': 1126272, 'steps': 5865, 'loss/train': 1.942263126373291} -08/30/2021 14:14:37 - INFO - __main__ - Step 5867: {'lr': 0.0004991586701715635, 'samples': 1126464, 'steps': 5866, 'loss/train': 2.4721972942352295} -08/30/2021 14:14:37 - INFO - __main__ - Step 5868: {'lr': 0.0004991582351140747, 'samples': 1126656, 'steps': 5867, 'loss/train': 2.113710403442383} -08/30/2021 14:14:38 - INFO - __main__ - Step 5869: {'lr': 0.000499157799944319, 'samples': 1126848, 'steps': 5868, 'loss/train': 2.146578788757324} -08/30/2021 14:14:38 - INFO - __main__ - Step 5870: {'lr': 0.0004991573646622965, 'samples': 1127040, 'steps': 5869, 'loss/train': 2.503370761871338} -08/30/2021 14:14:38 - INFO - __main__ - Step 5871: {'lr': 0.0004991569292680078, 'samples': 1127232, 'steps': 5870, 'loss/train': 2.4791712760925293} -08/30/2021 14:14:40 - INFO - __main__ - Step 5872: {'lr': 0.0004991564937614526, 'samples': 1127424, 'steps': 5871, 'loss/train': 1.91326105594635} -08/30/2021 14:14:41 - INFO - __main__ - Step 5873: {'lr': 0.0004991560581426314, 'samples': 1127616, 'steps': 5872, 'loss/train': 1.3771426677703857} -08/30/2021 14:14:41 - INFO - __main__ - Step 5874: {'lr': 0.0004991556224115444, 'samples': 1127808, 'steps': 5873, 'loss/train': 1.8707513809204102} -08/30/2021 14:14:42 - INFO - __main__ - Step 5875: {'lr': 0.0004991551865681916, 'samples': 1128000, 'steps': 5874, 'loss/train': 1.7729097604751587} -08/30/2021 14:14:42 - INFO - __main__ - Step 5876: {'lr': 0.0004991547506125734, 'samples': 1128192, 'steps': 5875, 'loss/train': 1.8714960813522339} -08/30/2021 14:14:44 - INFO - __main__ - Step 5877: {'lr': 0.0004991543145446899, 'samples': 1128384, 'steps': 5876, 'loss/train': 0.32309070229530334} -08/30/2021 14:14:44 - INFO - __main__ - Step 5878: {'lr': 0.0004991538783645413, 'samples': 1128576, 'steps': 5877, 'loss/train': 2.4618256092071533} -08/30/2021 14:14:44 - INFO - __main__ - Step 5879: {'lr': 0.0004991534420721278, 'samples': 1128768, 'steps': 5878, 'loss/train': 2.109403610229492} -08/30/2021 14:14:45 - INFO - __main__ - Step 5880: {'lr': 0.0004991530056674496, 'samples': 1128960, 'steps': 5879, 'loss/train': 2.2718541622161865} -08/30/2021 14:14:45 - INFO - __main__ - Step 5881: {'lr': 0.000499152569150507, 'samples': 1129152, 'steps': 5880, 'loss/train': 1.8346096277236938} -08/30/2021 14:14:46 - INFO - __main__ - Step 5882: {'lr': 0.0004991521325213, 'samples': 1129344, 'steps': 5881, 'loss/train': 2.1230640411376953} -08/30/2021 14:14:47 - INFO - __main__ - Step 5883: {'lr': 0.0004991516957798289, 'samples': 1129536, 'steps': 5882, 'loss/train': 2.804133415222168} -08/30/2021 14:14:48 - INFO - __main__ - Step 5884: {'lr': 0.0004991512589260939, 'samples': 1129728, 'steps': 5883, 'loss/train': 2.043588638305664} -08/30/2021 14:14:48 - INFO - __main__ - Step 5885: {'lr': 0.0004991508219600952, 'samples': 1129920, 'steps': 5884, 'loss/train': 2.5084891319274902} -08/30/2021 14:14:48 - INFO - __main__ - Step 5886: {'lr': 0.000499150384881833, 'samples': 1130112, 'steps': 5885, 'loss/train': 2.2138478755950928} -08/30/2021 14:14:49 - INFO - __main__ - Step 5887: {'lr': 0.0004991499476913074, 'samples': 1130304, 'steps': 5886, 'loss/train': 0.22717320919036865} -08/30/2021 14:14:50 - INFO - __main__ - Step 5888: {'lr': 0.0004991495103885187, 'samples': 1130496, 'steps': 5887, 'loss/train': 1.546987533569336} -08/30/2021 14:14:51 - INFO - __main__ - Step 5889: {'lr': 0.0004991490729734672, 'samples': 1130688, 'steps': 5888, 'loss/train': 2.1046769618988037} -08/30/2021 14:14:51 - INFO - __main__ - Step 5890: {'lr': 0.0004991486354461528, 'samples': 1130880, 'steps': 5889, 'loss/train': 2.289349317550659} -08/30/2021 14:14:51 - INFO - __main__ - Step 5891: {'lr': 0.000499148197806576, 'samples': 1131072, 'steps': 5890, 'loss/train': 2.2530016899108887} -08/30/2021 14:14:52 - INFO - __main__ - Step 5892: {'lr': 0.0004991477600547367, 'samples': 1131264, 'steps': 5891, 'loss/train': 1.896599531173706} -08/30/2021 14:14:53 - INFO - __main__ - Step 5893: {'lr': 0.0004991473221906354, 'samples': 1131456, 'steps': 5892, 'loss/train': 1.9120417833328247} -08/30/2021 14:14:54 - INFO - __main__ - Step 5894: {'lr': 0.0004991468842142722, 'samples': 1131648, 'steps': 5893, 'loss/train': 2.2635602951049805} -08/30/2021 14:14:54 - INFO - __main__ - Step 5895: {'lr': 0.0004991464461256472, 'samples': 1131840, 'steps': 5894, 'loss/train': 2.137824773788452} -08/30/2021 14:14:54 - INFO - __main__ - Step 5896: {'lr': 0.0004991460079247606, 'samples': 1132032, 'steps': 5895, 'loss/train': 2.6105568408966064} -08/30/2021 14:14:55 - INFO - __main__ - Step 5897: {'lr': 0.0004991455696116128, 'samples': 1132224, 'steps': 5896, 'loss/train': 2.203672409057617} -08/30/2021 14:14:57 - INFO - __main__ - Step 5898: {'lr': 0.0004991451311862037, 'samples': 1132416, 'steps': 5897, 'loss/train': 1.998064637184143} -08/30/2021 14:14:57 - INFO - __main__ - Step 5899: {'lr': 0.0004991446926485337, 'samples': 1132608, 'steps': 5898, 'loss/train': 1.3992269039154053} -08/30/2021 14:14:57 - INFO - __main__ - Step 5900: {'lr': 0.0004991442539986029, 'samples': 1132800, 'steps': 5899, 'loss/train': 2.071692705154419} -08/30/2021 14:14:58 - INFO - __main__ - Step 5901: {'lr': 0.0004991438152364117, 'samples': 1132992, 'steps': 5900, 'loss/train': 1.4441382884979248} -08/30/2021 14:14:58 - INFO - __main__ - Step 5902: {'lr': 0.0004991433763619599, 'samples': 1133184, 'steps': 5901, 'loss/train': 1.860714316368103} -08/30/2021 14:14:58 - INFO - __main__ - Step 5903: {'lr': 0.0004991429373752482, 'samples': 1133376, 'steps': 5902, 'loss/train': 0.9205770492553711} -08/30/2021 14:15:00 - INFO - __main__ - Step 5904: {'lr': 0.0004991424982762763, 'samples': 1133568, 'steps': 5903, 'loss/train': 4.166928291320801} -08/30/2021 14:15:01 - INFO - __main__ - Step 5905: {'lr': 0.0004991420590650448, 'samples': 1133760, 'steps': 5904, 'loss/train': 2.067859411239624} -08/30/2021 14:15:01 - INFO - __main__ - Step 5906: {'lr': 0.0004991416197415537, 'samples': 1133952, 'steps': 5905, 'loss/train': 1.859840989112854} -08/30/2021 14:15:01 - INFO - __main__ - Step 5907: {'lr': 0.0004991411803058032, 'samples': 1134144, 'steps': 5906, 'loss/train': 2.4467766284942627} -08/30/2021 14:15:02 - INFO - __main__ - Step 5908: {'lr': 0.0004991407407577936, 'samples': 1134336, 'steps': 5907, 'loss/train': 1.577459454536438} -08/30/2021 14:15:04 - INFO - __main__ - Step 5909: {'lr': 0.0004991403010975249, 'samples': 1134528, 'steps': 5908, 'loss/train': 2.255033254623413} -08/30/2021 14:15:04 - INFO - __main__ - Step 5910: {'lr': 0.0004991398613249976, 'samples': 1134720, 'steps': 5909, 'loss/train': 2.581190586090088} -08/30/2021 14:15:05 - INFO - __main__ - Step 5911: {'lr': 0.0004991394214402115, 'samples': 1134912, 'steps': 5910, 'loss/train': 1.4275797605514526} -08/30/2021 14:15:05 - INFO - __main__ - Step 5912: {'lr': 0.0004991389814431672, 'samples': 1135104, 'steps': 5911, 'loss/train': 1.2042779922485352} -08/30/2021 14:15:06 - INFO - __main__ - Step 5913: {'lr': 0.0004991385413338646, 'samples': 1135296, 'steps': 5912, 'loss/train': 1.218719720840454} -08/30/2021 14:15:06 - INFO - __main__ - Step 5914: {'lr': 0.0004991381011123041, 'samples': 1135488, 'steps': 5913, 'loss/train': 2.3741183280944824} -08/30/2021 14:15:06 - INFO - __main__ - Step 5915: {'lr': 0.0004991376607784857, 'samples': 1135680, 'steps': 5914, 'loss/train': 2.6086196899414062} -08/30/2021 14:15:08 - INFO - __main__ - Step 5916: {'lr': 0.0004991372203324098, 'samples': 1135872, 'steps': 5915, 'loss/train': 2.26519775390625} -08/30/2021 14:15:08 - INFO - __main__ - Step 5917: {'lr': 0.0004991367797740765, 'samples': 1136064, 'steps': 5916, 'loss/train': 2.4970638751983643} -08/30/2021 14:15:09 - INFO - __main__ - Step 5918: {'lr': 0.0004991363391034861, 'samples': 1136256, 'steps': 5917, 'loss/train': 2.891735553741455} -08/30/2021 14:15:09 - INFO - __main__ - Step 5919: {'lr': 0.0004991358983206386, 'samples': 1136448, 'steps': 5918, 'loss/train': 2.8727993965148926} -08/30/2021 14:15:10 - INFO - __main__ - Step 5920: {'lr': 0.0004991354574255344, 'samples': 1136640, 'steps': 5919, 'loss/train': 1.0362807512283325} -08/30/2021 14:15:11 - INFO - __main__ - Step 5921: {'lr': 0.0004991350164181735, 'samples': 1136832, 'steps': 5920, 'loss/train': 1.6289128065109253} -08/30/2021 14:15:11 - INFO - __main__ - Step 5922: {'lr': 0.0004991345752985563, 'samples': 1137024, 'steps': 5921, 'loss/train': 2.078066349029541} -08/30/2021 14:15:12 - INFO - __main__ - Step 5923: {'lr': 0.0004991341340666828, 'samples': 1137216, 'steps': 5922, 'loss/train': 2.2499353885650635} -08/30/2021 14:15:12 - INFO - __main__ - Step 5924: {'lr': 0.0004991336927225534, 'samples': 1137408, 'steps': 5923, 'loss/train': 2.663357973098755} -08/30/2021 14:15:13 - INFO - __main__ - Step 5925: {'lr': 0.0004991332512661682, 'samples': 1137600, 'steps': 5924, 'loss/train': 2.081972122192383} -08/30/2021 14:15:13 - INFO - __main__ - Step 5926: {'lr': 0.0004991328096975273, 'samples': 1137792, 'steps': 5925, 'loss/train': 1.8515006303787231} -08/30/2021 14:15:15 - INFO - __main__ - Step 5927: {'lr': 0.0004991323680166312, 'samples': 1137984, 'steps': 5926, 'loss/train': 2.6087493896484375} -08/30/2021 14:15:16 - INFO - __main__ - Step 5928: {'lr': 0.0004991319262234797, 'samples': 1138176, 'steps': 5927, 'loss/train': 1.694389820098877} -08/30/2021 14:15:16 - INFO - __main__ - Step 5929: {'lr': 0.0004991314843180733, 'samples': 1138368, 'steps': 5928, 'loss/train': 2.105149984359741} -08/30/2021 14:15:16 - INFO - __main__ - Step 5930: {'lr': 0.0004991310423004121, 'samples': 1138560, 'steps': 5929, 'loss/train': 2.134931802749634} -08/30/2021 14:15:17 - INFO - __main__ - Step 5931: {'lr': 0.0004991306001704962, 'samples': 1138752, 'steps': 5930, 'loss/train': 2.170400619506836} -08/30/2021 14:15:18 - INFO - __main__ - Step 5932: {'lr': 0.000499130157928326, 'samples': 1138944, 'steps': 5931, 'loss/train': 2.15702748298645} -08/30/2021 14:15:19 - INFO - __main__ - Step 5933: {'lr': 0.0004991297155739015, 'samples': 1139136, 'steps': 5932, 'loss/train': 2.4520421028137207} -08/30/2021 14:15:19 - INFO - __main__ - Step 5934: {'lr': 0.0004991292731072231, 'samples': 1139328, 'steps': 5933, 'loss/train': 2.2806475162506104} -08/30/2021 14:15:20 - INFO - __main__ - Step 5935: {'lr': 0.0004991288305282908, 'samples': 1139520, 'steps': 5934, 'loss/train': 2.185220241546631} -08/30/2021 14:15:20 - INFO - __main__ - Step 5936: {'lr': 0.0004991283878371049, 'samples': 1139712, 'steps': 5935, 'loss/train': 2.2513556480407715} -08/30/2021 14:15:22 - INFO - __main__ - Step 5937: {'lr': 0.0004991279450336656, 'samples': 1139904, 'steps': 5936, 'loss/train': 1.4557690620422363} -08/30/2021 14:15:22 - INFO - __main__ - Step 5938: {'lr': 0.0004991275021179732, 'samples': 1140096, 'steps': 5937, 'loss/train': 2.34891939163208} -08/30/2021 14:15:22 - INFO - __main__ - Step 5939: {'lr': 0.0004991270590900277, 'samples': 1140288, 'steps': 5938, 'loss/train': 2.1917247772216797} -08/30/2021 14:15:23 - INFO - __main__ - Step 5940: {'lr': 0.0004991266159498294, 'samples': 1140480, 'steps': 5939, 'loss/train': 2.2043163776397705} -08/30/2021 14:15:23 - INFO - __main__ - Step 5941: {'lr': 0.0004991261726973784, 'samples': 1140672, 'steps': 5940, 'loss/train': 2.1503801345825195} -08/30/2021 14:15:23 - INFO - __main__ - Step 5942: {'lr': 0.0004991257293326752, 'samples': 1140864, 'steps': 5941, 'loss/train': 1.9182548522949219} -08/30/2021 14:15:25 - INFO - __main__ - Step 5943: {'lr': 0.0004991252858557196, 'samples': 1141056, 'steps': 5942, 'loss/train': 2.4979074001312256} -08/30/2021 14:15:25 - INFO - __main__ - Step 5944: {'lr': 0.0004991248422665122, 'samples': 1141248, 'steps': 5943, 'loss/train': 2.358738660812378} -08/30/2021 14:15:26 - INFO - __main__ - Step 5945: {'lr': 0.0004991243985650528, 'samples': 1141440, 'steps': 5944, 'loss/train': 2.2329964637756348} -08/30/2021 14:15:26 - INFO - __main__ - Step 5946: {'lr': 0.0004991239547513419, 'samples': 1141632, 'steps': 5945, 'loss/train': 2.327383041381836} -08/30/2021 14:15:26 - INFO - __main__ - Step 5947: {'lr': 0.0004991235108253795, 'samples': 1141824, 'steps': 5946, 'loss/train': 2.1163156032562256} -08/30/2021 14:15:29 - INFO - __main__ - Step 5948: {'lr': 0.0004991230667871659, 'samples': 1142016, 'steps': 5947, 'loss/train': 2.240360975265503} -08/30/2021 14:15:29 - INFO - __main__ - Step 5949: {'lr': 0.0004991226226367013, 'samples': 1142208, 'steps': 5948, 'loss/train': 2.160229444503784} -08/30/2021 14:15:29 - INFO - __main__ - Step 5950: {'lr': 0.0004991221783739859, 'samples': 1142400, 'steps': 5949, 'loss/train': 0.6622193455696106} -08/30/2021 14:15:30 - INFO - __main__ - Step 5951: {'lr': 0.0004991217339990199, 'samples': 1142592, 'steps': 5950, 'loss/train': 0.7783976197242737} -08/30/2021 14:15:30 - INFO - __main__ - Step 5952: {'lr': 0.0004991212895118035, 'samples': 1142784, 'steps': 5951, 'loss/train': 2.150078058242798} -08/30/2021 14:15:30 - INFO - __main__ - Step 5953: {'lr': 0.0004991208449123369, 'samples': 1142976, 'steps': 5952, 'loss/train': 2.610722303390503} -08/30/2021 14:15:32 - INFO - __main__ - Step 5954: {'lr': 0.0004991204002006203, 'samples': 1143168, 'steps': 5953, 'loss/train': 2.232699394226074} -08/30/2021 14:15:32 - INFO - __main__ - Step 5955: {'lr': 0.0004991199553766538, 'samples': 1143360, 'steps': 5954, 'loss/train': 2.651733160018921} -08/30/2021 14:15:33 - INFO - __main__ - Step 5956: {'lr': 0.0004991195104404378, 'samples': 1143552, 'steps': 5955, 'loss/train': 1.5986006259918213} -08/30/2021 14:15:33 - INFO - __main__ - Step 5957: {'lr': 0.0004991190653919723, 'samples': 1143744, 'steps': 5956, 'loss/train': 2.460905075073242} -08/30/2021 14:15:33 - INFO - __main__ - Step 5958: {'lr': 0.0004991186202312576, 'samples': 1143936, 'steps': 5957, 'loss/train': 2.2222230434417725} -08/30/2021 14:15:35 - INFO - __main__ - Step 5959: {'lr': 0.0004991181749582941, 'samples': 1144128, 'steps': 5958, 'loss/train': 1.6441094875335693} -08/30/2021 14:15:36 - INFO - __main__ - Step 5960: {'lr': 0.0004991177295730815, 'samples': 1144320, 'steps': 5959, 'loss/train': 1.7736626863479614} -08/30/2021 14:15:36 - INFO - __main__ - Step 5961: {'lr': 0.0004991172840756204, 'samples': 1144512, 'steps': 5960, 'loss/train': 0.3163501024246216} -08/30/2021 14:15:36 - INFO - __main__ - Step 5962: {'lr': 0.000499116838465911, 'samples': 1144704, 'steps': 5961, 'loss/train': 2.9587886333465576} -08/30/2021 14:15:37 - INFO - __main__ - Step 5963: {'lr': 0.0004991163927439533, 'samples': 1144896, 'steps': 5962, 'loss/train': 1.9898011684417725} -08/30/2021 14:15:38 - INFO - __main__ - Step 5964: {'lr': 0.0004991159469097476, 'samples': 1145088, 'steps': 5963, 'loss/train': 2.3663594722747803} -08/30/2021 14:15:39 - INFO - __main__ - Step 5965: {'lr': 0.0004991155009632941, 'samples': 1145280, 'steps': 5964, 'loss/train': 2.1029508113861084} -08/30/2021 14:15:39 - INFO - __main__ - Step 5966: {'lr': 0.0004991150549045931, 'samples': 1145472, 'steps': 5965, 'loss/train': 2.3237690925598145} -08/30/2021 14:15:39 - INFO - __main__ - Step 5967: {'lr': 0.0004991146087336446, 'samples': 1145664, 'steps': 5966, 'loss/train': 2.3028342723846436} -08/30/2021 14:15:40 - INFO - __main__ - Step 5968: {'lr': 0.0004991141624504489, 'samples': 1145856, 'steps': 5967, 'loss/train': 2.658325672149658} -08/30/2021 14:15:41 - INFO - __main__ - Step 5969: {'lr': 0.0004991137160550062, 'samples': 1146048, 'steps': 5968, 'loss/train': 2.123077392578125} -08/30/2021 14:15:42 - INFO - __main__ - Step 5970: {'lr': 0.0004991132695473167, 'samples': 1146240, 'steps': 5969, 'loss/train': 2.34393048286438} -08/30/2021 14:15:42 - INFO - __main__ - Step 5971: {'lr': 0.0004991128229273807, 'samples': 1146432, 'steps': 5970, 'loss/train': 2.46962833404541} -08/30/2021 14:15:42 - INFO - __main__ - Step 5972: {'lr': 0.0004991123761951982, 'samples': 1146624, 'steps': 5971, 'loss/train': 2.4148480892181396} -08/30/2021 14:15:43 - INFO - __main__ - Step 5973: {'lr': 0.0004991119293507695, 'samples': 1146816, 'steps': 5972, 'loss/train': 2.748654365539551} -08/30/2021 14:15:44 - INFO - __main__ - Step 5974: {'lr': 0.0004991114823940948, 'samples': 1147008, 'steps': 5973, 'loss/train': 1.6396844387054443} -08/30/2021 14:15:45 - INFO - __main__ - Step 5975: {'lr': 0.0004991110353251744, 'samples': 1147200, 'steps': 5974, 'loss/train': 1.744950294494629} -08/30/2021 14:15:45 - INFO - __main__ - Step 5976: {'lr': 0.0004991105881440084, 'samples': 1147392, 'steps': 5975, 'loss/train': 2.4893743991851807} -08/30/2021 14:15:45 - INFO - __main__ - Step 5977: {'lr': 0.000499110140850597, 'samples': 1147584, 'steps': 5976, 'loss/train': 1.8989903926849365} -08/30/2021 14:15:46 - INFO - __main__ - Step 5978: {'lr': 0.0004991096934449404, 'samples': 1147776, 'steps': 5977, 'loss/train': 1.3881796598434448} -08/30/2021 14:15:46 - INFO - __main__ - Step 5979: {'lr': 0.0004991092459270388, 'samples': 1147968, 'steps': 5978, 'loss/train': 2.414862871170044} -08/30/2021 14:15:48 - INFO - __main__ - Step 5980: {'lr': 0.0004991087982968924, 'samples': 1148160, 'steps': 5979, 'loss/train': 2.1698641777038574} -08/30/2021 14:15:48 - INFO - __main__ - Step 5981: {'lr': 0.0004991083505545014, 'samples': 1148352, 'steps': 5980, 'loss/train': 2.538878917694092} -08/30/2021 14:15:48 - INFO - __main__ - Step 5982: {'lr': 0.0004991079026998662, 'samples': 1148544, 'steps': 5981, 'loss/train': 2.015629768371582} -08/30/2021 14:15:49 - INFO - __main__ - Step 5983: {'lr': 0.0004991074547329867, 'samples': 1148736, 'steps': 5982, 'loss/train': 2.450441360473633} -08/30/2021 14:15:49 - INFO - __main__ - Step 5984: {'lr': 0.0004991070066538632, 'samples': 1148928, 'steps': 5983, 'loss/train': 2.5156095027923584} -08/30/2021 14:15:51 - INFO - __main__ - Step 5985: {'lr': 0.0004991065584624959, 'samples': 1149120, 'steps': 5984, 'loss/train': 2.0208370685577393} -08/30/2021 14:15:52 - INFO - __main__ - Step 5986: {'lr': 0.0004991061101588851, 'samples': 1149312, 'steps': 5985, 'loss/train': 2.035176992416382} -08/30/2021 14:15:52 - INFO - __main__ - Step 5987: {'lr': 0.0004991056617430308, 'samples': 1149504, 'steps': 5986, 'loss/train': 2.074810266494751} -08/30/2021 14:15:53 - INFO - __main__ - Step 5988: {'lr': 0.0004991052132149336, 'samples': 1149696, 'steps': 5987, 'loss/train': 1.5656373500823975} -08/30/2021 14:15:53 - INFO - __main__ - Step 5989: {'lr': 0.0004991047645745932, 'samples': 1149888, 'steps': 5988, 'loss/train': 2.0693013668060303} -08/30/2021 14:15:54 - INFO - __main__ - Step 5990: {'lr': 0.0004991043158220101, 'samples': 1150080, 'steps': 5989, 'loss/train': 2.2472169399261475} -08/30/2021 14:15:55 - INFO - __main__ - Step 5991: {'lr': 0.0004991038669571844, 'samples': 1150272, 'steps': 5990, 'loss/train': 2.137972354888916} -08/30/2021 14:15:55 - INFO - __main__ - Step 5992: {'lr': 0.0004991034179801165, 'samples': 1150464, 'steps': 5991, 'loss/train': 1.8876259326934814} -08/30/2021 14:15:55 - INFO - __main__ - Step 5993: {'lr': 0.0004991029688908063, 'samples': 1150656, 'steps': 5992, 'loss/train': 2.2228870391845703} -08/30/2021 14:15:56 - INFO - __main__ - Step 5994: {'lr': 0.0004991025196892542, 'samples': 1150848, 'steps': 5993, 'loss/train': 2.3093504905700684} -08/30/2021 14:15:57 - INFO - __main__ - Step 5995: {'lr': 0.0004991020703754603, 'samples': 1151040, 'steps': 5994, 'loss/train': 1.75906240940094} -08/30/2021 14:15:58 - INFO - __main__ - Step 5996: {'lr': 0.0004991016209494249, 'samples': 1151232, 'steps': 5995, 'loss/train': 2.2239811420440674} -08/30/2021 14:15:58 - INFO - __main__ - Step 5997: {'lr': 0.000499101171411148, 'samples': 1151424, 'steps': 5996, 'loss/train': 1.656895637512207} -08/30/2021 14:15:58 - INFO - __main__ - Step 5998: {'lr': 0.0004991007217606303, 'samples': 1151616, 'steps': 5997, 'loss/train': 2.5214390754699707} -08/30/2021 14:15:59 - INFO - __main__ - Step 5999: {'lr': 0.0004991002719978713, 'samples': 1151808, 'steps': 5998, 'loss/train': 2.1021344661712646} -08/30/2021 14:16:00 - INFO - __main__ - Step 6000: {'lr': 0.0004990998221228718, 'samples': 1152000, 'steps': 5999, 'loss/train': 2.4656269550323486} -08/30/2021 14:16:01 - INFO - __main__ - Step 6001: {'lr': 0.0004990993721356316, 'samples': 1152192, 'steps': 6000, 'loss/train': 2.3020265102386475} -08/30/2021 14:16:01 - INFO - __main__ - Step 6002: {'lr': 0.0004990989220361511, 'samples': 1152384, 'steps': 6001, 'loss/train': 1.5774675607681274} -08/30/2021 14:16:02 - INFO - __main__ - Step 6003: {'lr': 0.0004990984718244306, 'samples': 1152576, 'steps': 6002, 'loss/train': 2.2705578804016113} -08/30/2021 14:16:02 - INFO - __main__ - Step 6004: {'lr': 0.00049909802150047, 'samples': 1152768, 'steps': 6003, 'loss/train': 1.8598873615264893} -08/30/2021 14:16:04 - INFO - __main__ - Step 6005: {'lr': 0.0004990975710642699, 'samples': 1152960, 'steps': 6004, 'loss/train': 1.7920972108840942} -08/30/2021 14:16:04 - INFO - __main__ - Step 6006: {'lr': 0.0004990971205158301, 'samples': 1153152, 'steps': 6005, 'loss/train': 1.9137616157531738} -08/30/2021 14:16:04 - INFO - __main__ - Step 6007: {'lr': 0.000499096669855151, 'samples': 1153344, 'steps': 6006, 'loss/train': 1.4915194511413574} -08/30/2021 14:16:05 - INFO - __main__ - Step 6008: {'lr': 0.0004990962190822328, 'samples': 1153536, 'steps': 6007, 'loss/train': 2.0501208305358887} -08/30/2021 14:16:05 - INFO - __main__ - Step 6009: {'lr': 0.0004990957681970757, 'samples': 1153728, 'steps': 6008, 'loss/train': 2.3642265796661377} -08/30/2021 14:16:07 - INFO - __main__ - Step 6010: {'lr': 0.0004990953171996798, 'samples': 1153920, 'steps': 6009, 'loss/train': 2.1400179862976074} -08/30/2021 14:16:07 - INFO - __main__ - Step 6011: {'lr': 0.0004990948660900455, 'samples': 1154112, 'steps': 6010, 'loss/train': 1.727049708366394} -08/30/2021 14:16:07 - INFO - __main__ - Step 6012: {'lr': 0.0004990944148681729, 'samples': 1154304, 'steps': 6011, 'loss/train': 1.639033317565918} -08/30/2021 14:16:08 - INFO - __main__ - Step 6013: {'lr': 0.0004990939635340621, 'samples': 1154496, 'steps': 6012, 'loss/train': 2.5471725463867188} -08/30/2021 14:16:08 - INFO - __main__ - Step 6014: {'lr': 0.0004990935120877136, 'samples': 1154688, 'steps': 6013, 'loss/train': 1.7235260009765625} -08/30/2021 14:16:08 - INFO - __main__ - Step 6015: {'lr': 0.0004990930605291272, 'samples': 1154880, 'steps': 6014, 'loss/train': 1.799383282661438} -08/30/2021 14:16:10 - INFO - __main__ - Step 6016: {'lr': 0.0004990926088583034, 'samples': 1155072, 'steps': 6015, 'loss/train': 1.9797793626785278} -08/30/2021 14:16:10 - INFO - __main__ - Step 6017: {'lr': 0.0004990921570752424, 'samples': 1155264, 'steps': 6016, 'loss/train': 1.3015261888504028} -08/30/2021 14:16:11 - INFO - __main__ - Step 6018: {'lr': 0.0004990917051799442, 'samples': 1155456, 'steps': 6017, 'loss/train': 2.3569891452789307} -08/30/2021 14:16:11 - INFO - __main__ - Step 6019: {'lr': 0.0004990912531724092, 'samples': 1155648, 'steps': 6018, 'loss/train': 2.2145638465881348} -08/30/2021 14:16:11 - INFO - __main__ - Step 6020: {'lr': 0.0004990908010526374, 'samples': 1155840, 'steps': 6019, 'loss/train': 2.256147623062134} -08/30/2021 14:16:13 - INFO - __main__ - Step 6021: {'lr': 0.0004990903488206292, 'samples': 1156032, 'steps': 6020, 'loss/train': 2.501497268676758} -08/30/2021 14:16:13 - INFO - __main__ - Step 6022: {'lr': 0.0004990898964763847, 'samples': 1156224, 'steps': 6021, 'loss/train': 0.7916610240936279} -08/30/2021 14:16:14 - INFO - __main__ - Step 6023: {'lr': 0.0004990894440199042, 'samples': 1156416, 'steps': 6022, 'loss/train': 3.1935312747955322} -08/30/2021 14:16:14 - INFO - __main__ - Step 6024: {'lr': 0.0004990889914511878, 'samples': 1156608, 'steps': 6023, 'loss/train': 1.8197205066680908} -08/30/2021 14:16:14 - INFO - __main__ - Step 6025: {'lr': 0.0004990885387702357, 'samples': 1156800, 'steps': 6024, 'loss/train': 1.6443145275115967} -08/30/2021 14:16:16 - INFO - __main__ - Step 6026: {'lr': 0.0004990880859770483, 'samples': 1156992, 'steps': 6025, 'loss/train': 2.036121129989624} -08/30/2021 14:16:16 - INFO - __main__ - Step 6027: {'lr': 0.0004990876330716256, 'samples': 1157184, 'steps': 6026, 'loss/train': 2.313183546066284} -08/30/2021 14:16:17 - INFO - __main__ - Step 6028: {'lr': 0.0004990871800539677, 'samples': 1157376, 'steps': 6027, 'loss/train': 2.0128965377807617} -08/30/2021 14:16:17 - INFO - __main__ - Step 6029: {'lr': 0.0004990867269240751, 'samples': 1157568, 'steps': 6028, 'loss/train': 2.1478962898254395} -08/30/2021 14:16:17 - INFO - __main__ - Step 6030: {'lr': 0.0004990862736819478, 'samples': 1157760, 'steps': 6029, 'loss/train': 1.863461971282959} -08/30/2021 14:16:19 - INFO - __main__ - Step 6031: {'lr': 0.000499085820327586, 'samples': 1157952, 'steps': 6030, 'loss/train': 2.210873603820801} -08/30/2021 14:16:19 - INFO - __main__ - Step 6032: {'lr': 0.0004990853668609902, 'samples': 1158144, 'steps': 6031, 'loss/train': 2.9212305545806885} -08/30/2021 14:16:20 - INFO - __main__ - Step 6033: {'lr': 0.0004990849132821602, 'samples': 1158336, 'steps': 6032, 'loss/train': 2.9135491847991943} -08/30/2021 14:16:20 - INFO - __main__ - Step 6034: {'lr': 0.0004990844595910965, 'samples': 1158528, 'steps': 6033, 'loss/train': 1.8108850717544556} -08/30/2021 14:16:20 - INFO - __main__ - Step 6035: {'lr': 0.0004990840057877991, 'samples': 1158720, 'steps': 6034, 'loss/train': 1.9483637809753418} -08/30/2021 14:16:23 - INFO - __main__ - Step 6036: {'lr': 0.0004990835518722683, 'samples': 1158912, 'steps': 6035, 'loss/train': 0.21011456847190857} -08/30/2021 14:16:23 - INFO - __main__ - Step 6037: {'lr': 0.0004990830978445043, 'samples': 1159104, 'steps': 6036, 'loss/train': 1.8370007276535034} -08/30/2021 14:16:23 - INFO - __main__ - Step 6038: {'lr': 0.0004990826437045073, 'samples': 1159296, 'steps': 6037, 'loss/train': 1.7020741701126099} -08/30/2021 14:16:24 - INFO - __main__ - Step 6039: {'lr': 0.0004990821894522775, 'samples': 1159488, 'steps': 6038, 'loss/train': 2.23870849609375} -08/30/2021 14:16:24 - INFO - __main__ - Step 6040: {'lr': 0.0004990817350878152, 'samples': 1159680, 'steps': 6039, 'loss/train': 2.1977384090423584} -08/30/2021 14:16:26 - INFO - __main__ - Step 6041: {'lr': 0.0004990812806111205, 'samples': 1159872, 'steps': 6040, 'loss/train': 1.9331872463226318} -08/30/2021 14:16:26 - INFO - __main__ - Step 6042: {'lr': 0.0004990808260221934, 'samples': 1160064, 'steps': 6041, 'loss/train': 1.9153445959091187} -08/30/2021 14:16:26 - INFO - __main__ - Step 6043: {'lr': 0.0004990803713210345, 'samples': 1160256, 'steps': 6042, 'loss/train': 1.7708107233047485} -08/30/2021 14:16:27 - INFO - __main__ - Step 6044: {'lr': 0.0004990799165076438, 'samples': 1160448, 'steps': 6043, 'loss/train': 1.813028335571289} -08/30/2021 14:16:27 - INFO - __main__ - Step 6045: {'lr': 0.0004990794615820216, 'samples': 1160640, 'steps': 6044, 'loss/train': 1.7955721616744995} -08/30/2021 14:16:29 - INFO - __main__ - Step 6046: {'lr': 0.0004990790065441679, 'samples': 1160832, 'steps': 6045, 'loss/train': 1.5986727476119995} -08/30/2021 14:16:29 - INFO - __main__ - Step 6047: {'lr': 0.0004990785513940832, 'samples': 1161024, 'steps': 6046, 'loss/train': 1.353219985961914} -08/30/2021 14:16:29 - INFO - __main__ - Step 6048: {'lr': 0.0004990780961317674, 'samples': 1161216, 'steps': 6047, 'loss/train': 1.878985047340393} -08/30/2021 14:16:30 - INFO - __main__ - Step 6049: {'lr': 0.0004990776407572209, 'samples': 1161408, 'steps': 6048, 'loss/train': 1.7939867973327637} -08/30/2021 14:16:30 - INFO - __main__ - Step 6050: {'lr': 0.000499077185270444, 'samples': 1161600, 'steps': 6049, 'loss/train': 1.955993890762329} -08/30/2021 14:16:32 - INFO - __main__ - Step 6051: {'lr': 0.0004990767296714365, 'samples': 1161792, 'steps': 6050, 'loss/train': 1.6843774318695068} -08/30/2021 14:16:32 - INFO - __main__ - Step 6052: {'lr': 0.000499076273960199, 'samples': 1161984, 'steps': 6051, 'loss/train': 2.232264280319214} -08/30/2021 14:16:32 - INFO - __main__ - Step 6053: {'lr': 0.0004990758181367316, 'samples': 1162176, 'steps': 6052, 'loss/train': 2.2386627197265625} -08/30/2021 14:16:33 - INFO - __main__ - Step 6054: {'lr': 0.0004990753622010345, 'samples': 1162368, 'steps': 6053, 'loss/train': 1.7334731817245483} -08/30/2021 14:16:33 - INFO - __main__ - Step 6055: {'lr': 0.0004990749061531079, 'samples': 1162560, 'steps': 6054, 'loss/train': 1.7887282371520996} -08/30/2021 14:16:34 - INFO - __main__ - Step 6056: {'lr': 0.0004990744499929519, 'samples': 1162752, 'steps': 6055, 'loss/train': 1.920432448387146} -08/30/2021 14:16:35 - INFO - __main__ - Step 6057: {'lr': 0.0004990739937205668, 'samples': 1162944, 'steps': 6056, 'loss/train': 1.9344661235809326} -08/30/2021 14:16:35 - INFO - __main__ - Step 6058: {'lr': 0.0004990735373359529, 'samples': 1163136, 'steps': 6057, 'loss/train': 2.140591859817505} -08/30/2021 14:16:36 - INFO - __main__ - Step 6059: {'lr': 0.0004990730808391102, 'samples': 1163328, 'steps': 6058, 'loss/train': 2.165710687637329} -08/30/2021 14:16:36 - INFO - __main__ - Step 6060: {'lr': 0.0004990726242300391, 'samples': 1163520, 'steps': 6059, 'loss/train': 2.912585496902466} -08/30/2021 14:16:37 - INFO - __main__ - Step 6061: {'lr': 0.0004990721675087397, 'samples': 1163712, 'steps': 6060, 'loss/train': 2.143425464630127} -08/30/2021 14:16:38 - INFO - __main__ - Step 6062: {'lr': 0.0004990717106752122, 'samples': 1163904, 'steps': 6061, 'loss/train': 2.2275428771972656} -08/30/2021 14:16:38 - INFO - __main__ - Step 6063: {'lr': 0.0004990712537294568, 'samples': 1164096, 'steps': 6062, 'loss/train': 2.4941608905792236} -08/30/2021 14:16:39 - INFO - __main__ - Step 6064: {'lr': 0.0004990707966714738, 'samples': 1164288, 'steps': 6063, 'loss/train': 1.885541558265686} -08/30/2021 14:16:39 - INFO - __main__ - Step 6065: {'lr': 0.0004990703395012634, 'samples': 1164480, 'steps': 6064, 'loss/train': 2.437563180923462} -08/30/2021 14:16:39 - INFO - __main__ - Step 6066: {'lr': 0.0004990698822188255, 'samples': 1164672, 'steps': 6065, 'loss/train': 2.015489101409912} -08/30/2021 14:16:41 - INFO - __main__ - Step 6067: {'lr': 0.0004990694248241608, 'samples': 1164864, 'steps': 6066, 'loss/train': 1.2778023481369019} -08/30/2021 14:16:41 - INFO - __main__ - Step 6068: {'lr': 0.0004990689673172691, 'samples': 1165056, 'steps': 6067, 'loss/train': 2.142285108566284} -08/30/2021 14:16:42 - INFO - __main__ - Step 6069: {'lr': 0.000499068509698151, 'samples': 1165248, 'steps': 6068, 'loss/train': 2.010939836502075} -08/30/2021 14:16:42 - INFO - __main__ - Step 6070: {'lr': 0.0004990680519668063, 'samples': 1165440, 'steps': 6069, 'loss/train': 2.111518621444702} -08/30/2021 14:16:42 - INFO - __main__ - Step 6071: {'lr': 0.0004990675941232354, 'samples': 1165632, 'steps': 6070, 'loss/train': 2.1520676612854004} -08/30/2021 14:16:44 - INFO - __main__ - Step 6072: {'lr': 0.0004990671361674384, 'samples': 1165824, 'steps': 6071, 'loss/train': 1.8499726057052612} -08/30/2021 14:16:44 - INFO - __main__ - Step 6073: {'lr': 0.0004990666780994156, 'samples': 1166016, 'steps': 6072, 'loss/train': 2.289273977279663} -08/30/2021 14:16:45 - INFO - __main__ - Step 6074: {'lr': 0.0004990662199191673, 'samples': 1166208, 'steps': 6073, 'loss/train': 2.125744342803955} -08/30/2021 14:16:45 - INFO - __main__ - Step 6075: {'lr': 0.0004990657616266936, 'samples': 1166400, 'steps': 6074, 'loss/train': 2.661235809326172} -08/30/2021 14:16:45 - INFO - __main__ - Step 6076: {'lr': 0.0004990653032219947, 'samples': 1166592, 'steps': 6075, 'loss/train': 0.7951482534408569} -08/30/2021 14:16:47 - INFO - __main__ - Step 6077: {'lr': 0.0004990648447050709, 'samples': 1166784, 'steps': 6076, 'loss/train': 2.175867795944214} -08/30/2021 14:16:47 - INFO - __main__ - Step 6078: {'lr': 0.0004990643860759222, 'samples': 1166976, 'steps': 6077, 'loss/train': 1.8009334802627563} -08/30/2021 14:16:48 - INFO - __main__ - Step 6079: {'lr': 0.0004990639273345489, 'samples': 1167168, 'steps': 6078, 'loss/train': 2.1254401206970215} -08/30/2021 14:16:48 - INFO - __main__ - Step 6080: {'lr': 0.0004990634684809513, 'samples': 1167360, 'steps': 6079, 'loss/train': 1.64859139919281} -08/30/2021 14:16:48 - INFO - __main__ - Step 6081: {'lr': 0.0004990630095151296, 'samples': 1167552, 'steps': 6080, 'loss/train': 1.9777277708053589} -08/30/2021 14:16:50 - INFO - __main__ - Step 6082: {'lr': 0.0004990625504370838, 'samples': 1167744, 'steps': 6081, 'loss/train': 2.201955556869507} -08/30/2021 14:16:50 - INFO - __main__ - Step 6083: {'lr': 0.0004990620912468143, 'samples': 1167936, 'steps': 6082, 'loss/train': 2.1902480125427246} -08/30/2021 14:16:51 - INFO - __main__ - Step 6084: {'lr': 0.0004990616319443214, 'samples': 1168128, 'steps': 6083, 'loss/train': 1.993706464767456} -08/30/2021 14:16:51 - INFO - __main__ - Step 6085: {'lr': 0.0004990611725296052, 'samples': 1168320, 'steps': 6084, 'loss/train': 2.217761993408203} -08/30/2021 14:16:51 - INFO - __main__ - Step 6086: {'lr': 0.0004990607130026657, 'samples': 1168512, 'steps': 6085, 'loss/train': 2.5983235836029053} -08/30/2021 14:16:52 - INFO - __main__ - Step 6087: {'lr': 0.0004990602533635033, 'samples': 1168704, 'steps': 6086, 'loss/train': 2.3596651554107666} -08/30/2021 14:16:54 - INFO - __main__ - Step 6088: {'lr': 0.0004990597936121182, 'samples': 1168896, 'steps': 6087, 'loss/train': 2.0918681621551514} -08/30/2021 14:16:55 - INFO - __main__ - Step 6089: {'lr': 0.0004990593337485108, 'samples': 1169088, 'steps': 6088, 'loss/train': 2.3481647968292236} -08/30/2021 14:16:55 - INFO - __main__ - Step 6090: {'lr': 0.0004990588737726809, 'samples': 1169280, 'steps': 6089, 'loss/train': 2.553339958190918} -08/30/2021 14:16:56 - INFO - __main__ - Step 6091: {'lr': 0.0004990584136846289, 'samples': 1169472, 'steps': 6090, 'loss/train': 2.537722587585449} -08/30/2021 14:16:56 - INFO - __main__ - Step 6092: {'lr': 0.0004990579534843551, 'samples': 1169664, 'steps': 6091, 'loss/train': 0.21205846965312958} -08/30/2021 14:16:56 - INFO - __main__ - Step 6093: {'lr': 0.0004990574931718597, 'samples': 1169856, 'steps': 6092, 'loss/train': 1.1033707857131958} -08/30/2021 14:16:57 - INFO - __main__ - Step 6094: {'lr': 0.0004990570327471427, 'samples': 1170048, 'steps': 6093, 'loss/train': 0.9622670412063599} -08/30/2021 14:16:58 - INFO - __main__ - Step 6095: {'lr': 0.0004990565722102045, 'samples': 1170240, 'steps': 6094, 'loss/train': 0.774612545967102} -08/30/2021 14:16:59 - INFO - __main__ - Step 6096: {'lr': 0.0004990561115610452, 'samples': 1170432, 'steps': 6095, 'loss/train': 2.0248193740844727} -08/30/2021 14:16:59 - INFO - __main__ - Step 6097: {'lr': 0.0004990556507996652, 'samples': 1170624, 'steps': 6096, 'loss/train': 1.7581862211227417} -08/30/2021 14:17:00 - INFO - __main__ - Step 6098: {'lr': 0.0004990551899260644, 'samples': 1170816, 'steps': 6097, 'loss/train': 2.1386702060699463} -08/30/2021 14:17:00 - INFO - __main__ - Step 6099: {'lr': 0.0004990547289402433, 'samples': 1171008, 'steps': 6098, 'loss/train': 2.6330530643463135} -08/30/2021 14:17:02 - INFO - __main__ - Step 6100: {'lr': 0.0004990542678422019, 'samples': 1171200, 'steps': 6099, 'loss/train': 1.5033752918243408} -08/30/2021 14:17:02 - INFO - __main__ - Step 6101: {'lr': 0.0004990538066319406, 'samples': 1171392, 'steps': 6100, 'loss/train': 0.4551768898963928} -08/30/2021 14:17:03 - INFO - __main__ - Step 6102: {'lr': 0.0004990533453094594, 'samples': 1171584, 'steps': 6101, 'loss/train': 2.0008089542388916} -08/30/2021 14:17:03 - INFO - __main__ - Step 6103: {'lr': 0.0004990528838747586, 'samples': 1171776, 'steps': 6102, 'loss/train': 2.0956332683563232} -08/30/2021 14:17:03 - INFO - __main__ - Step 6104: {'lr': 0.0004990524223278384, 'samples': 1171968, 'steps': 6103, 'loss/train': 2.2818100452423096} -08/30/2021 14:17:05 - INFO - __main__ - Step 6105: {'lr': 0.0004990519606686991, 'samples': 1172160, 'steps': 6104, 'loss/train': 2.261725664138794} -08/30/2021 14:17:05 - INFO - __main__ - Step 6106: {'lr': 0.0004990514988973408, 'samples': 1172352, 'steps': 6105, 'loss/train': 1.611903429031372} -08/30/2021 14:17:06 - INFO - __main__ - Step 6107: {'lr': 0.0004990510370137637, 'samples': 1172544, 'steps': 6106, 'loss/train': 1.9110937118530273} -08/30/2021 14:17:06 - INFO - __main__ - Step 6108: {'lr': 0.0004990505750179682, 'samples': 1172736, 'steps': 6107, 'loss/train': 1.362024188041687} -08/30/2021 14:17:06 - INFO - __main__ - Step 6109: {'lr': 0.0004990501129099542, 'samples': 1172928, 'steps': 6108, 'loss/train': 1.0821868181228638} -08/30/2021 14:17:08 - INFO - __main__ - Step 6110: {'lr': 0.000499049650689722, 'samples': 1173120, 'steps': 6109, 'loss/train': 1.912007212638855} -08/30/2021 14:17:08 - INFO - __main__ - Step 6111: {'lr': 0.000499049188357272, 'samples': 1173312, 'steps': 6110, 'loss/train': 2.309844970703125} -08/30/2021 14:17:09 - INFO - __main__ - Step 6112: {'lr': 0.0004990487259126043, 'samples': 1173504, 'steps': 6111, 'loss/train': 2.6369924545288086} -08/30/2021 14:17:09 - INFO - __main__ - Step 6113: {'lr': 0.0004990482633557189, 'samples': 1173696, 'steps': 6112, 'loss/train': 1.12046480178833} -08/30/2021 14:17:10 - INFO - __main__ - Step 6114: {'lr': 0.0004990478006866165, 'samples': 1173888, 'steps': 6113, 'loss/train': 2.1313536167144775} -08/30/2021 14:17:10 - INFO - __main__ - Step 6115: {'lr': 0.0004990473379052968, 'samples': 1174080, 'steps': 6114, 'loss/train': 1.6079707145690918} -08/30/2021 14:17:11 - INFO - __main__ - Step 6116: {'lr': 0.0004990468750117602, 'samples': 1174272, 'steps': 6115, 'loss/train': 1.6931512355804443} -08/30/2021 14:17:12 - INFO - __main__ - Step 6117: {'lr': 0.000499046412006007, 'samples': 1174464, 'steps': 6116, 'loss/train': 1.952774167060852} -08/30/2021 14:17:12 - INFO - __main__ - Step 6118: {'lr': 0.0004990459488880372, 'samples': 1174656, 'steps': 6117, 'loss/train': 1.8816965818405151} -08/30/2021 14:17:12 - INFO - __main__ - Step 6119: {'lr': 0.0004990454856578513, 'samples': 1174848, 'steps': 6118, 'loss/train': 2.5326578617095947} -08/30/2021 14:17:13 - INFO - __main__ - Step 6120: {'lr': 0.0004990450223154492, 'samples': 1175040, 'steps': 6119, 'loss/train': 1.5734384059906006} -08/30/2021 14:17:14 - INFO - __main__ - Step 6121: {'lr': 0.0004990445588608313, 'samples': 1175232, 'steps': 6120, 'loss/train': 1.8786181211471558} -08/30/2021 14:17:15 - INFO - __main__ - Step 6122: {'lr': 0.0004990440952939979, 'samples': 1175424, 'steps': 6121, 'loss/train': 1.7350105047225952} -08/30/2021 14:17:15 - INFO - __main__ - Step 6123: {'lr': 0.0004990436316149489, 'samples': 1175616, 'steps': 6122, 'loss/train': 2.220349073410034} -08/30/2021 14:17:15 - INFO - __main__ - Step 6124: {'lr': 0.0004990431678236849, 'samples': 1175808, 'steps': 6123, 'loss/train': 2.1604645252227783} -08/30/2021 14:17:16 - INFO - __main__ - Step 6125: {'lr': 0.0004990427039202057, 'samples': 1176000, 'steps': 6124, 'loss/train': 2.588308811187744} -08/30/2021 14:17:17 - INFO - __main__ - Step 6126: {'lr': 0.0004990422399045117, 'samples': 1176192, 'steps': 6125, 'loss/train': 1.2041592597961426} -08/30/2021 14:17:18 - INFO - __main__ - Step 6127: {'lr': 0.0004990417757766031, 'samples': 1176384, 'steps': 6126, 'loss/train': 1.7451285123825073} -08/30/2021 14:17:18 - INFO - __main__ - Step 6128: {'lr': 0.0004990413115364803, 'samples': 1176576, 'steps': 6127, 'loss/train': 2.5466935634613037} -08/30/2021 14:17:18 - INFO - __main__ - Step 6129: {'lr': 0.0004990408471841431, 'samples': 1176768, 'steps': 6128, 'loss/train': 2.152479887008667} -08/30/2021 14:17:19 - INFO - __main__ - Step 6130: {'lr': 0.0004990403827195921, 'samples': 1176960, 'steps': 6129, 'loss/train': 2.1017420291900635} -08/30/2021 14:17:20 - INFO - __main__ - Step 6131: {'lr': 0.0004990399181428273, 'samples': 1177152, 'steps': 6130, 'loss/train': 1.4404301643371582} -08/30/2021 14:17:21 - INFO - __main__ - Step 6132: {'lr': 0.000499039453453849, 'samples': 1177344, 'steps': 6131, 'loss/train': 2.3782787322998047} -08/30/2021 14:17:21 - INFO - __main__ - Step 6133: {'lr': 0.0004990389886526573, 'samples': 1177536, 'steps': 6132, 'loss/train': 2.0950968265533447} -08/30/2021 14:17:21 - INFO - __main__ - Step 6134: {'lr': 0.0004990385237392524, 'samples': 1177728, 'steps': 6133, 'loss/train': 2.377577543258667} -08/30/2021 14:17:22 - INFO - __main__ - Step 6135: {'lr': 0.0004990380587136347, 'samples': 1177920, 'steps': 6134, 'loss/train': 2.1193230152130127} -08/30/2021 14:17:24 - INFO - __main__ - Step 6136: {'lr': 0.0004990375935758042, 'samples': 1178112, 'steps': 6135, 'loss/train': 1.4899842739105225} -08/30/2021 14:17:24 - INFO - __main__ - Step 6137: {'lr': 0.0004990371283257613, 'samples': 1178304, 'steps': 6136, 'loss/train': 6.589000701904297} -08/30/2021 14:17:24 - INFO - __main__ - Step 6138: {'lr': 0.0004990366629635062, 'samples': 1178496, 'steps': 6137, 'loss/train': 1.8414204120635986} -08/30/2021 14:17:25 - INFO - __main__ - Step 6139: {'lr': 0.0004990361974890388, 'samples': 1178688, 'steps': 6138, 'loss/train': 1.9632432460784912} -08/30/2021 14:17:25 - INFO - __main__ - Step 6140: {'lr': 0.0004990357319023597, 'samples': 1178880, 'steps': 6139, 'loss/train': 1.5291732549667358} -08/30/2021 14:17:26 - INFO - __main__ - Step 6141: {'lr': 0.0004990352662034689, 'samples': 1179072, 'steps': 6140, 'loss/train': 0.552104651927948} -08/30/2021 14:17:28 - INFO - __main__ - Step 6142: {'lr': 0.0004990348003923665, 'samples': 1179264, 'steps': 6141, 'loss/train': 2.363502025604248} -08/30/2021 14:17:28 - INFO - __main__ - Step 6143: {'lr': 0.000499034334469053, 'samples': 1179456, 'steps': 6142, 'loss/train': 2.386108875274658} -08/30/2021 14:17:29 - INFO - __main__ - Step 6144: {'lr': 0.0004990338684335285, 'samples': 1179648, 'steps': 6143, 'loss/train': 2.582843065261841} -08/30/2021 14:17:29 - INFO - __main__ - Step 6145: {'lr': 0.0004990334022857932, 'samples': 1179840, 'steps': 6144, 'loss/train': 0.34102797508239746} -08/30/2021 14:17:29 - INFO - __main__ - Step 6146: {'lr': 0.0004990329360258472, 'samples': 1180032, 'steps': 6145, 'loss/train': 1.8113882541656494} -08/30/2021 14:17:30 - INFO - __main__ - Step 6147: {'lr': 0.0004990324696536908, 'samples': 1180224, 'steps': 6146, 'loss/train': 2.0144941806793213} -08/30/2021 14:17:32 - INFO - __main__ - Step 6148: {'lr': 0.0004990320031693242, 'samples': 1180416, 'steps': 6147, 'loss/train': 1.286054015159607} -08/30/2021 14:17:32 - INFO - __main__ - Step 6149: {'lr': 0.0004990315365727476, 'samples': 1180608, 'steps': 6148, 'loss/train': 1.892910122871399} -08/30/2021 14:17:33 - INFO - __main__ - Step 6150: {'lr': 0.0004990310698639614, 'samples': 1180800, 'steps': 6149, 'loss/train': 1.7210521697998047} -08/30/2021 14:17:33 - INFO - __main__ - Step 6151: {'lr': 0.0004990306030429655, 'samples': 1180992, 'steps': 6150, 'loss/train': 2.0882198810577393} -08/30/2021 14:17:33 - INFO - __main__ - Step 6152: {'lr': 0.0004990301361097603, 'samples': 1181184, 'steps': 6151, 'loss/train': 1.6206170320510864} -08/30/2021 14:17:35 - INFO - __main__ - Step 6153: {'lr': 0.000499029669064346, 'samples': 1181376, 'steps': 6152, 'loss/train': 0.4024379849433899} -08/30/2021 14:17:35 - INFO - __main__ - Step 6154: {'lr': 0.0004990292019067227, 'samples': 1181568, 'steps': 6153, 'loss/train': 2.0156362056732178} -08/30/2021 14:17:36 - INFO - __main__ - Step 6155: {'lr': 0.0004990287346368908, 'samples': 1181760, 'steps': 6154, 'loss/train': 2.4578709602355957} -08/30/2021 14:17:36 - INFO - __main__ - Step 6156: {'lr': 0.0004990282672548503, 'samples': 1181952, 'steps': 6155, 'loss/train': 1.9091486930847168} -08/30/2021 14:17:36 - INFO - __main__ - Step 6157: {'lr': 0.0004990277997606016, 'samples': 1182144, 'steps': 6156, 'loss/train': 1.8755120038986206} -08/30/2021 14:17:38 - INFO - __main__ - Step 6158: {'lr': 0.0004990273321541447, 'samples': 1182336, 'steps': 6157, 'loss/train': 2.099588632583618} -08/30/2021 14:17:38 - INFO - __main__ - Step 6159: {'lr': 0.0004990268644354799, 'samples': 1182528, 'steps': 6158, 'loss/train': 2.256617546081543} -08/30/2021 14:17:39 - INFO - __main__ - Step 6160: {'lr': 0.0004990263966046075, 'samples': 1182720, 'steps': 6159, 'loss/train': 1.7035191059112549} -08/30/2021 14:17:39 - INFO - __main__ - Step 6161: {'lr': 0.0004990259286615276, 'samples': 1182912, 'steps': 6160, 'loss/train': 1.9849936962127686} -08/30/2021 14:17:39 - INFO - __main__ - Step 6162: {'lr': 0.0004990254606062406, 'samples': 1183104, 'steps': 6161, 'loss/train': 2.512209892272949} -08/30/2021 14:17:41 - INFO - __main__ - Step 6163: {'lr': 0.0004990249924387465, 'samples': 1183296, 'steps': 6162, 'loss/train': 2.401766300201416} -08/30/2021 14:17:42 - INFO - __main__ - Step 6164: {'lr': 0.0004990245241590455, 'samples': 1183488, 'steps': 6163, 'loss/train': 1.8561409711837769} -08/30/2021 14:17:42 - INFO - __main__ - Step 6165: {'lr': 0.0004990240557671379, 'samples': 1183680, 'steps': 6164, 'loss/train': 2.1383039951324463} -08/30/2021 14:17:42 - INFO - __main__ - Step 6166: {'lr': 0.000499023587263024, 'samples': 1183872, 'steps': 6165, 'loss/train': 1.8972554206848145} -08/30/2021 14:17:43 - INFO - __main__ - Step 6167: {'lr': 0.0004990231186467039, 'samples': 1184064, 'steps': 6166, 'loss/train': 1.9691927433013916} -08/30/2021 14:17:43 - INFO - __main__ - Step 6168: {'lr': 0.0004990226499181778, 'samples': 1184256, 'steps': 6167, 'loss/train': 0.3678905963897705} -08/30/2021 14:17:45 - INFO - __main__ - Step 6169: {'lr': 0.0004990221810774459, 'samples': 1184448, 'steps': 6168, 'loss/train': 2.058572769165039} -08/30/2021 14:17:45 - INFO - __main__ - Step 6170: {'lr': 0.0004990217121245084, 'samples': 1184640, 'steps': 6169, 'loss/train': 2.1512398719787598} -08/30/2021 14:17:45 - INFO - __main__ - Step 6171: {'lr': 0.0004990212430593657, 'samples': 1184832, 'steps': 6170, 'loss/train': 1.8302189111709595} -08/30/2021 14:17:46 - INFO - __main__ - Step 6172: {'lr': 0.0004990207738820178, 'samples': 1185024, 'steps': 6171, 'loss/train': 1.883941650390625} -08/30/2021 14:17:46 - INFO - __main__ - Step 6173: {'lr': 0.000499020304592465, 'samples': 1185216, 'steps': 6172, 'loss/train': 2.1236584186553955} -08/30/2021 14:17:48 - INFO - __main__ - Step 6174: {'lr': 0.0004990198351907075, 'samples': 1185408, 'steps': 6173, 'loss/train': 2.120842456817627} -08/30/2021 14:17:48 - INFO - __main__ - Step 6175: {'lr': 0.0004990193656767455, 'samples': 1185600, 'steps': 6174, 'loss/train': 1.4066747426986694} -08/30/2021 14:17:49 - INFO - __main__ - Step 6176: {'lr': 0.0004990188960505792, 'samples': 1185792, 'steps': 6175, 'loss/train': 2.0758004188537598} -08/30/2021 14:17:49 - INFO - __main__ - Step 6177: {'lr': 0.0004990184263122088, 'samples': 1185984, 'steps': 6176, 'loss/train': 1.8765077590942383} -08/30/2021 14:17:50 - INFO - __main__ - Step 6178: {'lr': 0.0004990179564616346, 'samples': 1186176, 'steps': 6177, 'loss/train': 0.41296014189720154} -08/30/2021 14:17:51 - INFO - __main__ - Step 6179: {'lr': 0.0004990174864988566, 'samples': 1186368, 'steps': 6178, 'loss/train': 2.0812172889709473} -08/30/2021 14:17:52 - INFO - __main__ - Step 6180: {'lr': 0.0004990170164238754, 'samples': 1186560, 'steps': 6179, 'loss/train': 2.5438144207000732} -08/30/2021 14:17:52 - INFO - __main__ - Step 6181: {'lr': 0.0004990165462366909, 'samples': 1186752, 'steps': 6180, 'loss/train': 0.5283352136611938} -08/30/2021 14:17:53 - INFO - __main__ - Step 6182: {'lr': 0.0004990160759373033, 'samples': 1186944, 'steps': 6181, 'loss/train': 1.8242038488388062} -08/30/2021 14:17:53 - INFO - __main__ - Step 6183: {'lr': 0.0004990156055257129, 'samples': 1187136, 'steps': 6182, 'loss/train': 1.3752305507659912} -08/30/2021 14:17:55 - INFO - __main__ - Step 6184: {'lr': 0.00049901513500192, 'samples': 1187328, 'steps': 6183, 'loss/train': 2.3722639083862305} -08/30/2021 14:17:55 - INFO - __main__ - Step 6185: {'lr': 0.0004990146643659247, 'samples': 1187520, 'steps': 6184, 'loss/train': 2.003141164779663} -08/30/2021 14:17:55 - INFO - __main__ - Step 6186: {'lr': 0.0004990141936177272, 'samples': 1187712, 'steps': 6185, 'loss/train': 1.7587296962738037} -08/30/2021 14:17:56 - INFO - __main__ - Step 6187: {'lr': 0.0004990137227573278, 'samples': 1187904, 'steps': 6186, 'loss/train': 1.947689414024353} -08/30/2021 14:17:56 - INFO - __main__ - Step 6188: {'lr': 0.0004990132517847266, 'samples': 1188096, 'steps': 6187, 'loss/train': 2.373015880584717} -08/30/2021 14:17:56 - INFO - __main__ - Step 6189: {'lr': 0.0004990127806999239, 'samples': 1188288, 'steps': 6188, 'loss/train': 1.674223780632019} -08/30/2021 14:17:58 - INFO - __main__ - Step 6190: {'lr': 0.0004990123095029199, 'samples': 1188480, 'steps': 6189, 'loss/train': 2.42575740814209} -08/30/2021 14:17:59 - INFO - __main__ - Step 6191: {'lr': 0.0004990118381937148, 'samples': 1188672, 'steps': 6190, 'loss/train': 1.8693678379058838} -08/30/2021 14:17:59 - INFO - __main__ - Step 6192: {'lr': 0.0004990113667723088, 'samples': 1188864, 'steps': 6191, 'loss/train': 3.1117334365844727} -08/30/2021 14:17:59 - INFO - __main__ - Step 6193: {'lr': 0.000499010895238702, 'samples': 1189056, 'steps': 6192, 'loss/train': 1.974090814590454} -08/30/2021 14:18:00 - INFO - __main__ - Step 6194: {'lr': 0.0004990104235928948, 'samples': 1189248, 'steps': 6193, 'loss/train': 2.349508762359619} -08/30/2021 14:18:01 - INFO - __main__ - Step 6195: {'lr': 0.0004990099518348874, 'samples': 1189440, 'steps': 6194, 'loss/train': 0.2854999899864197} -08/30/2021 14:18:02 - INFO - __main__ - Step 6196: {'lr': 0.00049900947996468, 'samples': 1189632, 'steps': 6195, 'loss/train': 2.0679450035095215} -08/30/2021 14:18:02 - INFO - __main__ - Step 6197: {'lr': 0.0004990090079822726, 'samples': 1189824, 'steps': 6196, 'loss/train': 2.156909704208374} -08/30/2021 14:18:02 - INFO - __main__ - Step 6198: {'lr': 0.0004990085358876658, 'samples': 1190016, 'steps': 6197, 'loss/train': 1.727145791053772} -08/30/2021 14:18:03 - INFO - __main__ - Step 6199: {'lr': 0.0004990080636808595, 'samples': 1190208, 'steps': 6198, 'loss/train': 1.08854341506958} -08/30/2021 14:18:03 - INFO - __main__ - Step 6200: {'lr': 0.000499007591361854, 'samples': 1190400, 'steps': 6199, 'loss/train': 1.5549006462097168} -08/30/2021 14:18:05 - INFO - __main__ - Step 6201: {'lr': 0.0004990071189306495, 'samples': 1190592, 'steps': 6200, 'loss/train': 2.4462223052978516} -08/30/2021 14:18:06 - INFO - __main__ - Step 6202: {'lr': 0.0004990066463872462, 'samples': 1190784, 'steps': 6201, 'loss/train': 2.5784995555877686} -08/30/2021 14:18:06 - INFO - __main__ - Step 6203: {'lr': 0.0004990061737316445, 'samples': 1190976, 'steps': 6202, 'loss/train': 2.134146213531494} -08/30/2021 14:18:07 - INFO - __main__ - Step 6204: {'lr': 0.0004990057009638443, 'samples': 1191168, 'steps': 6203, 'loss/train': 2.2616889476776123} -08/30/2021 14:18:07 - INFO - __main__ - Step 6205: {'lr': 0.000499005228083846, 'samples': 1191360, 'steps': 6204, 'loss/train': 0.5354210138320923} -08/30/2021 14:18:08 - INFO - __main__ - Step 6206: {'lr': 0.0004990047550916498, 'samples': 1191552, 'steps': 6205, 'loss/train': 2.0784218311309814} -08/30/2021 14:18:09 - INFO - __main__ - Step 6207: {'lr': 0.000499004281987256, 'samples': 1191744, 'steps': 6206, 'loss/train': 2.5894880294799805} -08/30/2021 14:18:09 - INFO - __main__ - Step 6208: {'lr': 0.0004990038087706646, 'samples': 1191936, 'steps': 6207, 'loss/train': 2.2595319747924805} -08/30/2021 14:18:10 - INFO - __main__ - Step 6209: {'lr': 0.000499003335441876, 'samples': 1192128, 'steps': 6208, 'loss/train': 2.4695115089416504} -08/30/2021 14:18:10 - INFO - __main__ - Step 6210: {'lr': 0.0004990028620008903, 'samples': 1192320, 'steps': 6209, 'loss/train': 1.9695442914962769} -08/30/2021 14:18:12 - INFO - __main__ - Step 6211: {'lr': 0.0004990023884477077, 'samples': 1192512, 'steps': 6210, 'loss/train': 1.8410488367080688} -08/30/2021 14:18:12 - INFO - __main__ - Step 6212: {'lr': 0.0004990019147823286, 'samples': 1192704, 'steps': 6211, 'loss/train': 2.443037748336792} -08/30/2021 14:18:12 - INFO - __main__ - Step 6213: {'lr': 0.000499001441004753, 'samples': 1192896, 'steps': 6212, 'loss/train': 1.5597666501998901} -08/30/2021 14:18:13 - INFO - __main__ - Step 6214: {'lr': 0.0004990009671149811, 'samples': 1193088, 'steps': 6213, 'loss/train': 2.178555488586426} -08/30/2021 14:18:13 - INFO - __main__ - Step 6215: {'lr': 0.0004990004931130133, 'samples': 1193280, 'steps': 6214, 'loss/train': 1.4102318286895752} -08/30/2021 14:18:14 - INFO - __main__ - Step 6216: {'lr': 0.0004990000189988497, 'samples': 1193472, 'steps': 6215, 'loss/train': 2.2533822059631348} -08/30/2021 14:18:15 - INFO - __main__ - Step 6217: {'lr': 0.0004989995447724907, 'samples': 1193664, 'steps': 6216, 'loss/train': 2.015746831893921} -08/30/2021 14:18:15 - INFO - __main__ - Step 6218: {'lr': 0.0004989990704339361, 'samples': 1193856, 'steps': 6217, 'loss/train': 2.105013608932495} -08/30/2021 14:18:16 - INFO - __main__ - Step 6219: {'lr': 0.0004989985959831865, 'samples': 1194048, 'steps': 6218, 'loss/train': 2.5074172019958496} -08/30/2021 14:18:16 - INFO - __main__ - Step 6220: {'lr': 0.0004989981214202419, 'samples': 1194240, 'steps': 6219, 'loss/train': 2.59159255027771} -08/30/2021 14:18:16 - INFO - __main__ - Step 6221: {'lr': 0.0004989976467451026, 'samples': 1194432, 'steps': 6220, 'loss/train': 1.5907371044158936} -08/30/2021 14:18:18 - INFO - __main__ - Step 6222: {'lr': 0.0004989971719577688, 'samples': 1194624, 'steps': 6221, 'loss/train': 2.125783681869507} -08/30/2021 14:18:18 - INFO - __main__ - Step 6223: {'lr': 0.0004989966970582408, 'samples': 1194816, 'steps': 6222, 'loss/train': 2.1885910034179688} -08/30/2021 14:18:19 - INFO - __main__ - Step 6224: {'lr': 0.0004989962220465187, 'samples': 1195008, 'steps': 6223, 'loss/train': 2.1810812950134277} -08/30/2021 14:18:19 - INFO - __main__ - Step 6225: {'lr': 0.0004989957469226027, 'samples': 1195200, 'steps': 6224, 'loss/train': 1.6825599670410156} -08/30/2021 14:18:19 - INFO - __main__ - Step 6226: {'lr': 0.0004989952716864931, 'samples': 1195392, 'steps': 6225, 'loss/train': 2.1403675079345703} -08/30/2021 14:18:21 - INFO - __main__ - Step 6227: {'lr': 0.00049899479633819, 'samples': 1195584, 'steps': 6226, 'loss/train': 1.7359288930892944} -08/30/2021 14:18:21 - INFO - __main__ - Step 6228: {'lr': 0.0004989943208776938, 'samples': 1195776, 'steps': 6227, 'loss/train': 1.8733208179473877} -08/30/2021 14:18:22 - INFO - __main__ - Step 6229: {'lr': 0.0004989938453050045, 'samples': 1195968, 'steps': 6228, 'loss/train': 1.642006516456604} -08/30/2021 14:18:22 - INFO - __main__ - Step 6230: {'lr': 0.0004989933696201225, 'samples': 1196160, 'steps': 6229, 'loss/train': 1.9372864961624146} -08/30/2021 14:18:22 - INFO - __main__ - Step 6231: {'lr': 0.0004989928938230478, 'samples': 1196352, 'steps': 6230, 'loss/train': 2.230191707611084} -08/30/2021 14:18:24 - INFO - __main__ - Step 6232: {'lr': 0.0004989924179137808, 'samples': 1196544, 'steps': 6231, 'loss/train': 2.5581588745117188} -08/30/2021 14:18:24 - INFO - __main__ - Step 6233: {'lr': 0.0004989919418923218, 'samples': 1196736, 'steps': 6232, 'loss/train': 2.114278554916382} -08/30/2021 14:18:24 - INFO - __main__ - Step 6234: {'lr': 0.0004989914657586707, 'samples': 1196928, 'steps': 6233, 'loss/train': 2.0605738162994385} -08/30/2021 14:18:25 - INFO - __main__ - Step 6235: {'lr': 0.000498990989512828, 'samples': 1197120, 'steps': 6234, 'loss/train': 1.9753429889678955} -08/30/2021 14:18:25 - INFO - __main__ - Step 6236: {'lr': 0.0004989905131547937, 'samples': 1197312, 'steps': 6235, 'loss/train': 2.2529351711273193} -08/30/2021 14:18:27 - INFO - __main__ - Step 6237: {'lr': 0.0004989900366845682, 'samples': 1197504, 'steps': 6236, 'loss/train': 2.2310385704040527} -08/30/2021 14:18:27 - INFO - __main__ - Step 6238: {'lr': 0.0004989895601021515, 'samples': 1197696, 'steps': 6237, 'loss/train': 1.9800227880477905} -08/30/2021 14:18:27 - INFO - __main__ - Step 6239: {'lr': 0.0004989890834075441, 'samples': 1197888, 'steps': 6238, 'loss/train': 1.9875377416610718} -08/30/2021 14:18:28 - INFO - __main__ - Step 6240: {'lr': 0.000498988606600746, 'samples': 1198080, 'steps': 6239, 'loss/train': 2.0325026512145996} -08/30/2021 14:18:28 - INFO - __main__ - Step 6241: {'lr': 0.0004989881296817575, 'samples': 1198272, 'steps': 6240, 'loss/train': 2.1536710262298584} -08/30/2021 14:18:30 - INFO - __main__ - Step 6242: {'lr': 0.0004989876526505788, 'samples': 1198464, 'steps': 6241, 'loss/train': 2.5535590648651123} -08/30/2021 14:18:30 - INFO - __main__ - Step 6243: {'lr': 0.0004989871755072101, 'samples': 1198656, 'steps': 6242, 'loss/train': 2.3413236141204834} -08/30/2021 14:18:30 - INFO - __main__ - Step 6244: {'lr': 0.0004989866982516516, 'samples': 1198848, 'steps': 6243, 'loss/train': 1.6933993101119995} -08/30/2021 14:18:31 - INFO - __main__ - Step 6245: {'lr': 0.0004989862208839035, 'samples': 1199040, 'steps': 6244, 'loss/train': 2.150791883468628} -08/30/2021 14:18:31 - INFO - __main__ - Step 6246: {'lr': 0.0004989857434039661, 'samples': 1199232, 'steps': 6245, 'loss/train': 2.0392470359802246} -08/30/2021 14:18:33 - INFO - __main__ - Step 6247: {'lr': 0.0004989852658118395, 'samples': 1199424, 'steps': 6246, 'loss/train': 1.798715591430664} -08/30/2021 14:18:33 - INFO - __main__ - Step 6248: {'lr': 0.000498984788107524, 'samples': 1199616, 'steps': 6247, 'loss/train': 2.3154523372650146} -08/30/2021 14:18:33 - INFO - __main__ - Step 6249: {'lr': 0.0004989843102910198, 'samples': 1199808, 'steps': 6248, 'loss/train': 2.6237261295318604} -08/30/2021 14:18:34 - INFO - __main__ - Step 6250: {'lr': 0.0004989838323623272, 'samples': 1200000, 'steps': 6249, 'loss/train': 1.3969299793243408} -08/30/2021 14:18:34 - INFO - __main__ - Step 6251: {'lr': 0.0004989833543214463, 'samples': 1200192, 'steps': 6250, 'loss/train': 1.8402429819107056} -08/30/2021 14:18:36 - INFO - __main__ - Step 6252: {'lr': 0.0004989828761683774, 'samples': 1200384, 'steps': 6251, 'loss/train': 0.9740005135536194} -08/30/2021 14:18:36 - INFO - __main__ - Step 6253: {'lr': 0.0004989823979031205, 'samples': 1200576, 'steps': 6252, 'loss/train': 1.827061414718628} -08/30/2021 14:18:37 - INFO - __main__ - Step 6254: {'lr': 0.000498981919525676, 'samples': 1200768, 'steps': 6253, 'loss/train': 1.2323906421661377} -08/30/2021 14:18:37 - INFO - __main__ - Step 6255: {'lr': 0.0004989814410360442, 'samples': 1200960, 'steps': 6254, 'loss/train': 2.6655220985412598} -08/30/2021 14:18:37 - INFO - __main__ - Step 6256: {'lr': 0.0004989809624342251, 'samples': 1201152, 'steps': 6255, 'loss/train': 2.2425320148468018} -08/30/2021 14:18:39 - INFO - __main__ - Step 6257: {'lr': 0.000498980483720219, 'samples': 1201344, 'steps': 6256, 'loss/train': 2.5152058601379395} -08/30/2021 14:18:40 - INFO - __main__ - Step 6258: {'lr': 0.0004989800048940263, 'samples': 1201536, 'steps': 6257, 'loss/train': 1.9815870523452759} -08/30/2021 14:18:40 - INFO - __main__ - Step 6259: {'lr': 0.0004989795259556469, 'samples': 1201728, 'steps': 6258, 'loss/train': 1.9239863157272339} -08/30/2021 14:18:41 - INFO - __main__ - Step 6260: {'lr': 0.0004989790469050813, 'samples': 1201920, 'steps': 6259, 'loss/train': 1.7363396883010864} -08/30/2021 14:18:41 - INFO - __main__ - Step 6261: {'lr': 0.0004989785677423295, 'samples': 1202112, 'steps': 6260, 'loss/train': 0.8849676251411438} -08/30/2021 14:18:42 - INFO - __main__ - Step 6262: {'lr': 0.0004989780884673917, 'samples': 1202304, 'steps': 6261, 'loss/train': 2.0852367877960205} -08/30/2021 14:18:43 - INFO - __main__ - Step 6263: {'lr': 0.0004989776090802683, 'samples': 1202496, 'steps': 6262, 'loss/train': 2.010713577270508} -08/30/2021 14:18:43 - INFO - __main__ - Step 6264: {'lr': 0.0004989771295809594, 'samples': 1202688, 'steps': 6263, 'loss/train': 1.6176643371582031} -08/30/2021 14:18:44 - INFO - __main__ - Step 6265: {'lr': 0.0004989766499694653, 'samples': 1202880, 'steps': 6264, 'loss/train': 1.9133375883102417} -08/30/2021 14:18:44 - INFO - __main__ - Step 6266: {'lr': 0.0004989761702457862, 'samples': 1203072, 'steps': 6265, 'loss/train': 1.3014731407165527} -08/30/2021 14:18:45 - INFO - __main__ - Step 6267: {'lr': 0.0004989756904099222, 'samples': 1203264, 'steps': 6266, 'loss/train': 2.108015537261963} -08/30/2021 14:18:46 - INFO - __main__ - Step 6268: {'lr': 0.0004989752104618736, 'samples': 1203456, 'steps': 6267, 'loss/train': 2.1357452869415283} -08/30/2021 14:18:46 - INFO - __main__ - Step 6269: {'lr': 0.0004989747304016407, 'samples': 1203648, 'steps': 6268, 'loss/train': 2.0290212631225586} -08/30/2021 14:18:47 - INFO - __main__ - Step 6270: {'lr': 0.0004989742502292235, 'samples': 1203840, 'steps': 6269, 'loss/train': 1.945146918296814} -08/30/2021 14:18:47 - INFO - __main__ - Step 6271: {'lr': 0.0004989737699446225, 'samples': 1204032, 'steps': 6270, 'loss/train': 2.129586935043335} -08/30/2021 14:18:47 - INFO - __main__ - Step 6272: {'lr': 0.0004989732895478376, 'samples': 1204224, 'steps': 6271, 'loss/train': 2.221515655517578} -08/30/2021 14:18:49 - INFO - __main__ - Step 6273: {'lr': 0.0004989728090388693, 'samples': 1204416, 'steps': 6272, 'loss/train': 1.7734287977218628} -08/30/2021 14:18:49 - INFO - __main__ - Step 6274: {'lr': 0.0004989723284177177, 'samples': 1204608, 'steps': 6273, 'loss/train': 2.149461507797241} -08/30/2021 14:18:50 - INFO - __main__ - Step 6275: {'lr': 0.0004989718476843828, 'samples': 1204800, 'steps': 6274, 'loss/train': 1.9583441019058228} -08/30/2021 14:18:50 - INFO - __main__ - Step 6276: {'lr': 0.0004989713668388652, 'samples': 1204992, 'steps': 6275, 'loss/train': 2.027327537536621} -08/30/2021 14:18:50 - INFO - __main__ - Step 6277: {'lr': 0.000498970885881165, 'samples': 1205184, 'steps': 6276, 'loss/train': 2.7661585807800293} -08/30/2021 14:18:52 - INFO - __main__ - Step 6278: {'lr': 0.0004989704048112823, 'samples': 1205376, 'steps': 6277, 'loss/train': 2.363206386566162} -08/30/2021 14:18:52 - INFO - __main__ - Step 6279: {'lr': 0.0004989699236292173, 'samples': 1205568, 'steps': 6278, 'loss/train': 2.557337522506714} -08/30/2021 14:18:53 - INFO - __main__ - Step 6280: {'lr': 0.0004989694423349704, 'samples': 1205760, 'steps': 6279, 'loss/train': 1.611116886138916} -08/30/2021 14:18:53 - INFO - __main__ - Step 6281: {'lr': 0.0004989689609285417, 'samples': 1205952, 'steps': 6280, 'loss/train': 2.5754168033599854} -08/30/2021 14:18:53 - INFO - __main__ - Step 6282: {'lr': 0.0004989684794099314, 'samples': 1206144, 'steps': 6281, 'loss/train': 2.283574104309082} -08/30/2021 14:18:55 - INFO - __main__ - Step 6283: {'lr': 0.0004989679977791397, 'samples': 1206336, 'steps': 6282, 'loss/train': 1.8226563930511475} -08/30/2021 14:18:55 - INFO - __main__ - Step 6284: {'lr': 0.0004989675160361669, 'samples': 1206528, 'steps': 6283, 'loss/train': 1.9837374687194824} -08/30/2021 14:18:56 - INFO - __main__ - Step 6285: {'lr': 0.0004989670341810132, 'samples': 1206720, 'steps': 6284, 'loss/train': 2.731910228729248} -08/30/2021 14:18:56 - INFO - __main__ - Step 6286: {'lr': 0.0004989665522136789, 'samples': 1206912, 'steps': 6285, 'loss/train': 1.9442856311798096} -08/30/2021 14:18:56 - INFO - __main__ - Step 6287: {'lr': 0.0004989660701341639, 'samples': 1207104, 'steps': 6286, 'loss/train': 1.8635879755020142} -08/30/2021 14:18:58 - INFO - __main__ - Step 6288: {'lr': 0.0004989655879424687, 'samples': 1207296, 'steps': 6287, 'loss/train': 1.9705373048782349} -08/30/2021 14:18:58 - INFO - __main__ - Step 6289: {'lr': 0.0004989651056385936, 'samples': 1207488, 'steps': 6288, 'loss/train': 1.9441709518432617} -08/30/2021 14:18:59 - INFO - __main__ - Step 6290: {'lr': 0.0004989646232225384, 'samples': 1207680, 'steps': 6289, 'loss/train': 1.605919361114502} -08/30/2021 14:18:59 - INFO - __main__ - Step 6291: {'lr': 0.0004989641406943037, 'samples': 1207872, 'steps': 6290, 'loss/train': 1.3890336751937866} -08/30/2021 14:18:59 - INFO - __main__ - Step 6292: {'lr': 0.0004989636580538896, 'samples': 1208064, 'steps': 6291, 'loss/train': 1.718228816986084} -08/30/2021 14:19:01 - INFO - __main__ - Step 6293: {'lr': 0.0004989631753012964, 'samples': 1208256, 'steps': 6292, 'loss/train': 2.0688412189483643} -08/30/2021 14:19:01 - INFO - __main__ - Step 6294: {'lr': 0.0004989626924365242, 'samples': 1208448, 'steps': 6293, 'loss/train': 1.2345472574234009} -08/30/2021 14:19:02 - INFO - __main__ - Step 6295: {'lr': 0.0004989622094595733, 'samples': 1208640, 'steps': 6294, 'loss/train': 1.4485729932785034} -08/30/2021 14:19:02 - INFO - __main__ - Step 6296: {'lr': 0.0004989617263704437, 'samples': 1208832, 'steps': 6295, 'loss/train': 2.0158963203430176} -08/30/2021 14:19:02 - INFO - __main__ - Step 6297: {'lr': 0.0004989612431691359, 'samples': 1209024, 'steps': 6296, 'loss/train': 1.9707484245300293} -08/30/2021 14:19:03 - INFO - __main__ - Step 6298: {'lr': 0.0004989607598556501, 'samples': 1209216, 'steps': 6297, 'loss/train': 2.353196144104004} -08/30/2021 14:19:05 - INFO - __main__ - Step 6299: {'lr': 0.0004989602764299862, 'samples': 1209408, 'steps': 6298, 'loss/train': 1.7036041021347046} -08/30/2021 14:19:05 - INFO - __main__ - Step 6300: {'lr': 0.0004989597928921447, 'samples': 1209600, 'steps': 6299, 'loss/train': 0.30971235036849976} -08/30/2021 14:19:05 - INFO - __main__ - Step 6301: {'lr': 0.0004989593092421258, 'samples': 1209792, 'steps': 6300, 'loss/train': 1.692036747932434} -08/30/2021 14:19:06 - INFO - __main__ - Step 6302: {'lr': 0.0004989588254799297, 'samples': 1209984, 'steps': 6301, 'loss/train': 2.0625877380371094} -08/30/2021 14:19:06 - INFO - __main__ - Step 6303: {'lr': 0.0004989583416055566, 'samples': 1210176, 'steps': 6302, 'loss/train': 1.2793693542480469} -08/30/2021 14:19:08 - INFO - __main__ - Step 6304: {'lr': 0.0004989578576190068, 'samples': 1210368, 'steps': 6303, 'loss/train': 2.2753987312316895} -08/30/2021 14:19:08 - INFO - __main__ - Step 6305: {'lr': 0.0004989573735202802, 'samples': 1210560, 'steps': 6304, 'loss/train': 2.163113594055176} -08/30/2021 14:19:08 - INFO - __main__ - Step 6306: {'lr': 0.0004989568893093774, 'samples': 1210752, 'steps': 6305, 'loss/train': 2.0276966094970703} -08/30/2021 14:19:09 - INFO - __main__ - Step 6307: {'lr': 0.0004989564049862986, 'samples': 1210944, 'steps': 6306, 'loss/train': 2.8450539112091064} -08/30/2021 14:19:09 - INFO - __main__ - Step 6308: {'lr': 0.0004989559205510436, 'samples': 1211136, 'steps': 6307, 'loss/train': 2.1560885906219482} -08/30/2021 14:19:09 - INFO - __main__ - Step 6309: {'lr': 0.000498955436003613, 'samples': 1211328, 'steps': 6308, 'loss/train': 2.1145544052124023} -08/30/2021 14:19:12 - INFO - __main__ - Step 6310: {'lr': 0.0004989549513440071, 'samples': 1211520, 'steps': 6309, 'loss/train': 2.2295072078704834} -08/30/2021 14:19:12 - INFO - __main__ - Step 6311: {'lr': 0.0004989544665722258, 'samples': 1211712, 'steps': 6310, 'loss/train': 1.5627377033233643} -08/30/2021 14:19:13 - INFO - __main__ - Step 6312: {'lr': 0.0004989539816882694, 'samples': 1211904, 'steps': 6311, 'loss/train': 2.430529832839966} -08/30/2021 14:19:13 - INFO - __main__ - Step 6313: {'lr': 0.0004989534966921382, 'samples': 1212096, 'steps': 6312, 'loss/train': 1.8771684169769287} -08/30/2021 14:19:14 - INFO - __main__ - Step 6314: {'lr': 0.0004989530115838324, 'samples': 1212288, 'steps': 6313, 'loss/train': 0.33140167593955994} -08/30/2021 14:19:15 - INFO - __main__ - Step 6315: {'lr': 0.0004989525263633523, 'samples': 1212480, 'steps': 6314, 'loss/train': 1.9396084547042847} -08/30/2021 14:19:16 - INFO - __main__ - Step 6316: {'lr': 0.0004989520410306979, 'samples': 1212672, 'steps': 6315, 'loss/train': 1.6873884201049805} -08/30/2021 14:19:16 - INFO - __main__ - Step 6317: {'lr': 0.0004989515555858697, 'samples': 1212864, 'steps': 6316, 'loss/train': 2.732889413833618} -08/30/2021 14:19:16 - INFO - __main__ - Step 6318: {'lr': 0.0004989510700288678, 'samples': 1213056, 'steps': 6317, 'loss/train': 2.062293291091919} -08/30/2021 14:19:17 - INFO - __main__ - Step 6319: {'lr': 0.0004989505843596922, 'samples': 1213248, 'steps': 6318, 'loss/train': 2.04461932182312} -08/30/2021 14:19:18 - INFO - __main__ - Step 6320: {'lr': 0.0004989500985783434, 'samples': 1213440, 'steps': 6319, 'loss/train': 1.9916492700576782} -08/30/2021 14:19:19 - INFO - __main__ - Step 6321: {'lr': 0.0004989496126848215, 'samples': 1213632, 'steps': 6320, 'loss/train': 1.9172712564468384} -08/30/2021 14:19:19 - INFO - __main__ - Step 6322: {'lr': 0.0004989491266791268, 'samples': 1213824, 'steps': 6321, 'loss/train': 1.4685570001602173} -08/30/2021 14:19:19 - INFO - __main__ - Step 6323: {'lr': 0.0004989486405612595, 'samples': 1214016, 'steps': 6322, 'loss/train': 2.379302978515625} -08/30/2021 14:19:20 - INFO - __main__ - Step 6324: {'lr': 0.0004989481543312196, 'samples': 1214208, 'steps': 6323, 'loss/train': 2.27948260307312} -08/30/2021 14:19:21 - INFO - __main__ - Step 6325: {'lr': 0.0004989476679890077, 'samples': 1214400, 'steps': 6324, 'loss/train': 2.2262282371520996} -08/30/2021 14:19:22 - INFO - __main__ - Step 6326: {'lr': 0.0004989471815346237, 'samples': 1214592, 'steps': 6325, 'loss/train': 1.691623568534851} -08/30/2021 14:19:22 - INFO - __main__ - Step 6327: {'lr': 0.000498946694968068, 'samples': 1214784, 'steps': 6326, 'loss/train': 1.5407147407531738} -08/30/2021 14:19:22 - INFO - __main__ - Step 6328: {'lr': 0.0004989462082893407, 'samples': 1214976, 'steps': 6327, 'loss/train': 1.9831125736236572} -08/30/2021 14:19:23 - INFO - __main__ - Step 6329: {'lr': 0.0004989457214984421, 'samples': 1215168, 'steps': 6328, 'loss/train': 2.3993725776672363} -08/30/2021 14:19:24 - INFO - __main__ - Step 6330: {'lr': 0.0004989452345953725, 'samples': 1215360, 'steps': 6329, 'loss/train': 1.287635087966919} -08/30/2021 14:19:25 - INFO - __main__ - Step 6331: {'lr': 0.000498944747580132, 'samples': 1215552, 'steps': 6330, 'loss/train': 1.7396970987319946} -08/30/2021 14:19:25 - INFO - __main__ - Step 6332: {'lr': 0.0004989442604527208, 'samples': 1215744, 'steps': 6331, 'loss/train': 1.8150804042816162} -08/30/2021 14:19:25 - INFO - __main__ - Step 6333: {'lr': 0.0004989437732131391, 'samples': 1215936, 'steps': 6332, 'loss/train': 2.2430362701416016} -08/30/2021 14:19:26 - INFO - __main__ - Step 6334: {'lr': 0.0004989432858613873, 'samples': 1216128, 'steps': 6333, 'loss/train': 1.4362497329711914} -08/30/2021 14:19:27 - INFO - __main__ - Step 6335: {'lr': 0.0004989427983974653, 'samples': 1216320, 'steps': 6334, 'loss/train': 2.403474807739258} -08/30/2021 14:19:28 - INFO - __main__ - Step 6336: {'lr': 0.0004989423108213737, 'samples': 1216512, 'steps': 6335, 'loss/train': 1.6801766157150269} -08/30/2021 14:19:28 - INFO - __main__ - Step 6337: {'lr': 0.0004989418231331124, 'samples': 1216704, 'steps': 6336, 'loss/train': 1.848619818687439} -08/30/2021 14:19:28 - INFO - __main__ - Step 6338: {'lr': 0.0004989413353326818, 'samples': 1216896, 'steps': 6337, 'loss/train': 2.519618034362793} -08/30/2021 14:19:29 - INFO - __main__ - Step 6339: {'lr': 0.0004989408474200821, 'samples': 1217088, 'steps': 6338, 'loss/train': 1.8634679317474365} -08/30/2021 14:19:29 - INFO - __main__ - Step 6340: {'lr': 0.0004989403593953135, 'samples': 1217280, 'steps': 6339, 'loss/train': 1.661281704902649} -08/30/2021 14:19:31 - INFO - __main__ - Step 6341: {'lr': 0.0004989398712583762, 'samples': 1217472, 'steps': 6340, 'loss/train': 0.8902767896652222} -08/30/2021 14:19:31 - INFO - __main__ - Step 6342: {'lr': 0.0004989393830092705, 'samples': 1217664, 'steps': 6341, 'loss/train': 0.21483157575130463} -08/30/2021 14:19:32 - INFO - __main__ - Step 6343: {'lr': 0.0004989388946479965, 'samples': 1217856, 'steps': 6342, 'loss/train': 1.917526125907898} -08/30/2021 14:19:32 - INFO - __main__ - Step 6344: {'lr': 0.0004989384061745545, 'samples': 1218048, 'steps': 6343, 'loss/train': 2.1375091075897217} -08/30/2021 14:19:32 - INFO - __main__ - Step 6345: {'lr': 0.0004989379175889447, 'samples': 1218240, 'steps': 6344, 'loss/train': 1.9298045635223389} -08/30/2021 14:19:34 - INFO - __main__ - Step 6346: {'lr': 0.0004989374288911672, 'samples': 1218432, 'steps': 6345, 'loss/train': 0.2548641264438629} -08/30/2021 14:19:35 - INFO - __main__ - Step 6347: {'lr': 0.0004989369400812225, 'samples': 1218624, 'steps': 6346, 'loss/train': 1.0864231586456299} -08/30/2021 14:19:35 - INFO - __main__ - Step 6348: {'lr': 0.0004989364511591106, 'samples': 1218816, 'steps': 6347, 'loss/train': 2.2659149169921875} -08/30/2021 14:19:35 - INFO - __main__ - Step 6349: {'lr': 0.0004989359621248317, 'samples': 1219008, 'steps': 6348, 'loss/train': 2.0931715965270996} -08/30/2021 14:19:36 - INFO - __main__ - Step 6350: {'lr': 0.0004989354729783861, 'samples': 1219200, 'steps': 6349, 'loss/train': 1.9924660921096802} -08/30/2021 14:19:36 - INFO - __main__ - Step 6351: {'lr': 0.0004989349837197742, 'samples': 1219392, 'steps': 6350, 'loss/train': 0.22452615201473236} -08/30/2021 14:19:37 - INFO - __main__ - Step 6352: {'lr': 0.0004989344943489958, 'samples': 1219584, 'steps': 6351, 'loss/train': 2.3767666816711426} -08/30/2021 14:19:38 - INFO - __main__ - Step 6353: {'lr': 0.0004989340048660515, 'samples': 1219776, 'steps': 6352, 'loss/train': 1.9281697273254395} -08/30/2021 14:19:38 - INFO - __main__ - Step 6354: {'lr': 0.0004989335152709414, 'samples': 1219968, 'steps': 6353, 'loss/train': 2.7251996994018555} -08/30/2021 14:19:39 - INFO - __main__ - Step 6355: {'lr': 0.0004989330255636656, 'samples': 1220160, 'steps': 6354, 'loss/train': 1.8787678480148315} -08/30/2021 14:19:39 - INFO - __main__ - Step 6356: {'lr': 0.0004989325357442245, 'samples': 1220352, 'steps': 6355, 'loss/train': 1.6053874492645264} -08/30/2021 14:19:41 - INFO - __main__ - Step 6357: {'lr': 0.0004989320458126182, 'samples': 1220544, 'steps': 6356, 'loss/train': 2.2343366146087646} -08/30/2021 14:19:42 - INFO - __main__ - Step 6358: {'lr': 0.0004989315557688469, 'samples': 1220736, 'steps': 6357, 'loss/train': 1.4021246433258057} -08/30/2021 14:19:42 - INFO - __main__ - Step 6359: {'lr': 0.000498931065612911, 'samples': 1220928, 'steps': 6358, 'loss/train': 2.5814125537872314} -08/30/2021 14:19:42 - INFO - __main__ - Step 6360: {'lr': 0.0004989305753448106, 'samples': 1221120, 'steps': 6359, 'loss/train': 1.7415645122528076} -08/30/2021 14:19:43 - INFO - __main__ - Step 6361: {'lr': 0.0004989300849645459, 'samples': 1221312, 'steps': 6360, 'loss/train': 2.3653414249420166} -08/30/2021 14:19:43 - INFO - __main__ - Step 6362: {'lr': 0.0004989295944721171, 'samples': 1221504, 'steps': 6361, 'loss/train': 2.4741456508636475} -08/30/2021 14:19:43 - INFO - __main__ - Step 6363: {'lr': 0.0004989291038675245, 'samples': 1221696, 'steps': 6362, 'loss/train': 2.3353641033172607} -08/30/2021 14:19:45 - INFO - __main__ - Step 6364: {'lr': 0.0004989286131507682, 'samples': 1221888, 'steps': 6363, 'loss/train': 0.33484983444213867} -08/30/2021 14:19:46 - INFO - __main__ - Step 6365: {'lr': 0.0004989281223218486, 'samples': 1222080, 'steps': 6364, 'loss/train': 2.1490490436553955} -08/30/2021 14:19:46 - INFO - __main__ - Step 6366: {'lr': 0.0004989276313807658, 'samples': 1222272, 'steps': 6365, 'loss/train': 2.045421838760376} -08/30/2021 14:19:47 - INFO - __main__ - Step 6367: {'lr': 0.00049892714032752, 'samples': 1222464, 'steps': 6366, 'loss/train': 1.8140629529953003} -08/30/2021 14:19:47 - INFO - __main__ - Step 6368: {'lr': 0.0004989266491621117, 'samples': 1222656, 'steps': 6367, 'loss/train': 2.209887981414795} -08/30/2021 14:19:48 - INFO - __main__ - Step 6369: {'lr': 0.0004989261578845406, 'samples': 1222848, 'steps': 6368, 'loss/train': 1.681424856185913} -08/30/2021 14:19:49 - INFO - __main__ - Step 6370: {'lr': 0.0004989256664948073, 'samples': 1223040, 'steps': 6369, 'loss/train': 1.6200883388519287} -08/30/2021 14:19:49 - INFO - __main__ - Step 6371: {'lr': 0.000498925174992912, 'samples': 1223232, 'steps': 6370, 'loss/train': 3.0206379890441895} -08/30/2021 14:19:49 - INFO - __main__ - Step 6372: {'lr': 0.0004989246833788549, 'samples': 1223424, 'steps': 6371, 'loss/train': 2.03474760055542} -08/30/2021 14:19:50 - INFO - __main__ - Step 6373: {'lr': 0.000498924191652636, 'samples': 1223616, 'steps': 6372, 'loss/train': 1.6458381414413452} -08/30/2021 14:19:51 - INFO - __main__ - Step 6374: {'lr': 0.0004989236998142559, 'samples': 1223808, 'steps': 6373, 'loss/train': 2.533975124359131} -08/30/2021 14:19:52 - INFO - __main__ - Step 6375: {'lr': 0.0004989232078637145, 'samples': 1224000, 'steps': 6374, 'loss/train': 2.086960792541504} -08/30/2021 14:19:52 - INFO - __main__ - Step 6376: {'lr': 0.0004989227158010123, 'samples': 1224192, 'steps': 6375, 'loss/train': 1.8674033880233765} -08/30/2021 14:19:53 - INFO - __main__ - Step 6377: {'lr': 0.0004989222236261491, 'samples': 1224384, 'steps': 6376, 'loss/train': 1.910085916519165} -08/30/2021 14:19:53 - INFO - __main__ - Step 6378: {'lr': 0.0004989217313391256, 'samples': 1224576, 'steps': 6377, 'loss/train': 2.0162723064422607} -08/30/2021 14:19:54 - INFO - __main__ - Step 6379: {'lr': 0.0004989212389399417, 'samples': 1224768, 'steps': 6378, 'loss/train': 2.0569067001342773} -08/30/2021 14:19:55 - INFO - __main__ - Step 6380: {'lr': 0.0004989207464285978, 'samples': 1224960, 'steps': 6379, 'loss/train': 1.8085367679595947} -08/30/2021 14:19:55 - INFO - __main__ - Step 6381: {'lr': 0.0004989202538050939, 'samples': 1225152, 'steps': 6380, 'loss/train': 1.903486728668213} -08/30/2021 14:19:56 - INFO - __main__ - Step 6382: {'lr': 0.0004989197610694306, 'samples': 1225344, 'steps': 6381, 'loss/train': 1.8851052522659302} -08/30/2021 14:19:56 - INFO - __main__ - Step 6383: {'lr': 0.0004989192682216078, 'samples': 1225536, 'steps': 6382, 'loss/train': 2.309662342071533} -08/30/2021 14:19:57 - INFO - __main__ - Step 6384: {'lr': 0.0004989187752616258, 'samples': 1225728, 'steps': 6383, 'loss/train': 2.068089008331299} -08/30/2021 14:19:58 - INFO - __main__ - Step 6385: {'lr': 0.0004989182821894849, 'samples': 1225920, 'steps': 6384, 'loss/train': 1.5951160192489624} -08/30/2021 14:19:58 - INFO - __main__ - Step 6386: {'lr': 0.0004989177890051852, 'samples': 1226112, 'steps': 6385, 'loss/train': 2.226026773452759} -08/30/2021 14:19:59 - INFO - __main__ - Step 6387: {'lr': 0.000498917295708727, 'samples': 1226304, 'steps': 6386, 'loss/train': 2.1340386867523193} -08/30/2021 14:19:59 - INFO - __main__ - Step 6388: {'lr': 0.0004989168023001105, 'samples': 1226496, 'steps': 6387, 'loss/train': 1.9530478715896606} -08/30/2021 14:20:00 - INFO - __main__ - Step 6389: {'lr': 0.0004989163087793359, 'samples': 1226688, 'steps': 6388, 'loss/train': 0.7116537690162659} -08/30/2021 14:20:01 - INFO - __main__ - Step 6390: {'lr': 0.0004989158151464036, 'samples': 1226880, 'steps': 6389, 'loss/train': 1.7949714660644531} -08/30/2021 14:20:01 - INFO - __main__ - Step 6391: {'lr': 0.0004989153214013135, 'samples': 1227072, 'steps': 6390, 'loss/train': 2.08050537109375} -08/30/2021 14:20:02 - INFO - __main__ - Step 6392: {'lr': 0.0004989148275440661, 'samples': 1227264, 'steps': 6391, 'loss/train': 1.6071804761886597} -08/30/2021 14:20:02 - INFO - __main__ - Step 6393: {'lr': 0.0004989143335746614, 'samples': 1227456, 'steps': 6392, 'loss/train': 1.5674817562103271} -08/30/2021 14:20:03 - INFO - __main__ - Step 6394: {'lr': 0.0004989138394930998, 'samples': 1227648, 'steps': 6393, 'loss/train': 1.3918814659118652} -08/30/2021 14:20:04 - INFO - __main__ - Step 6395: {'lr': 0.0004989133452993816, 'samples': 1227840, 'steps': 6394, 'loss/train': 2.240018129348755} -08/30/2021 14:20:04 - INFO - __main__ - Step 6396: {'lr': 0.0004989128509935068, 'samples': 1228032, 'steps': 6395, 'loss/train': 2.1449835300445557} -08/30/2021 14:20:05 - INFO - __main__ - Step 6397: {'lr': 0.0004989123565754756, 'samples': 1228224, 'steps': 6396, 'loss/train': 2.164830207824707} -08/30/2021 14:20:05 - INFO - __main__ - Step 6398: {'lr': 0.0004989118620452884, 'samples': 1228416, 'steps': 6397, 'loss/train': 2.341160535812378} -08/30/2021 14:20:06 - INFO - __main__ - Step 6399: {'lr': 0.0004989113674029454, 'samples': 1228608, 'steps': 6398, 'loss/train': 1.8842697143554688} -08/30/2021 14:20:07 - INFO - __main__ - Step 6400: {'lr': 0.0004989108726484469, 'samples': 1228800, 'steps': 6399, 'loss/train': 2.3316967487335205} -08/30/2021 14:20:07 - INFO - __main__ - Step 6401: {'lr': 0.0004989103777817928, 'samples': 1228992, 'steps': 6400, 'loss/train': 1.546118974685669} -08/30/2021 14:20:07 - INFO - __main__ - Step 6402: {'lr': 0.0004989098828029836, 'samples': 1229184, 'steps': 6401, 'loss/train': 2.2582178115844727} -08/30/2021 14:20:08 - INFO - __main__ - Step 6403: {'lr': 0.0004989093877120194, 'samples': 1229376, 'steps': 6402, 'loss/train': 1.7887744903564453} -08/30/2021 14:20:08 - INFO - __main__ - Step 6404: {'lr': 0.0004989088925089005, 'samples': 1229568, 'steps': 6403, 'loss/train': 1.4423006772994995} -08/30/2021 14:20:10 - INFO - __main__ - Step 6405: {'lr': 0.0004989083971936271, 'samples': 1229760, 'steps': 6404, 'loss/train': 2.076840877532959} -08/30/2021 14:20:10 - INFO - __main__ - Step 6406: {'lr': 0.0004989079017661994, 'samples': 1229952, 'steps': 6405, 'loss/train': 2.444427490234375} -08/30/2021 14:20:10 - INFO - __main__ - Step 6407: {'lr': 0.0004989074062266177, 'samples': 1230144, 'steps': 6406, 'loss/train': 2.0568270683288574} -08/30/2021 14:20:11 - INFO - __main__ - Step 6408: {'lr': 0.0004989069105748821, 'samples': 1230336, 'steps': 6407, 'loss/train': 1.5928832292556763} -08/30/2021 14:20:11 - INFO - __main__ - Step 6409: {'lr': 0.0004989064148109929, 'samples': 1230528, 'steps': 6408, 'loss/train': 2.200293779373169} -08/30/2021 14:20:13 - INFO - __main__ - Step 6410: {'lr': 0.0004989059189349503, 'samples': 1230720, 'steps': 6409, 'loss/train': 2.3416473865509033} -08/30/2021 14:20:13 - INFO - __main__ - Step 6411: {'lr': 0.0004989054229467546, 'samples': 1230912, 'steps': 6410, 'loss/train': 2.1792893409729004} -08/30/2021 14:20:13 - INFO - __main__ - Step 6412: {'lr': 0.0004989049268464058, 'samples': 1231104, 'steps': 6411, 'loss/train': 2.018517255783081} -08/30/2021 14:20:14 - INFO - __main__ - Step 6413: {'lr': 0.0004989044306339044, 'samples': 1231296, 'steps': 6412, 'loss/train': 1.3932756185531616} -08/30/2021 14:20:14 - INFO - __main__ - Step 6414: {'lr': 0.0004989039343092505, 'samples': 1231488, 'steps': 6413, 'loss/train': 2.0457987785339355} -08/30/2021 14:20:16 - INFO - __main__ - Step 6415: {'lr': 0.0004989034378724443, 'samples': 1231680, 'steps': 6414, 'loss/train': 1.9669859409332275} -08/30/2021 14:20:17 - INFO - __main__ - Step 6416: {'lr': 0.0004989029413234861, 'samples': 1231872, 'steps': 6415, 'loss/train': 1.5404988527297974} -08/30/2021 14:20:17 - INFO - __main__ - Step 6417: {'lr': 0.000498902444662376, 'samples': 1232064, 'steps': 6416, 'loss/train': 1.5640596151351929} -08/30/2021 14:20:17 - INFO - __main__ - Step 6418: {'lr': 0.0004989019478891144, 'samples': 1232256, 'steps': 6417, 'loss/train': 2.1557815074920654} -08/30/2021 14:20:18 - INFO - __main__ - Step 6419: {'lr': 0.0004989014510037013, 'samples': 1232448, 'steps': 6418, 'loss/train': 2.441948890686035} -08/30/2021 14:20:19 - INFO - __main__ - Step 6420: {'lr': 0.0004989009540061373, 'samples': 1232640, 'steps': 6419, 'loss/train': 2.0749902725219727} -08/30/2021 14:20:20 - INFO - __main__ - Step 6421: {'lr': 0.0004989004568964221, 'samples': 1232832, 'steps': 6420, 'loss/train': 2.3868441581726074} -08/30/2021 14:20:20 - INFO - __main__ - Step 6422: {'lr': 0.0004988999596745562, 'samples': 1233024, 'steps': 6421, 'loss/train': 0.33942484855651855} -08/30/2021 14:20:20 - INFO - __main__ - Step 6423: {'lr': 0.00049889946234054, 'samples': 1233216, 'steps': 6422, 'loss/train': 2.162052631378174} -08/30/2021 14:20:21 - INFO - __main__ - Step 6424: {'lr': 0.0004988989648943734, 'samples': 1233408, 'steps': 6423, 'loss/train': 1.4928768873214722} -08/30/2021 14:20:22 - INFO - __main__ - Step 6425: {'lr': 0.0004988984673360568, 'samples': 1233600, 'steps': 6424, 'loss/train': 2.068682909011841} -08/30/2021 14:20:23 - INFO - __main__ - Step 6426: {'lr': 0.0004988979696655904, 'samples': 1233792, 'steps': 6425, 'loss/train': 1.5039173364639282} -08/30/2021 14:20:23 - INFO - __main__ - Step 6427: {'lr': 0.0004988974718829744, 'samples': 1233984, 'steps': 6426, 'loss/train': 2.104384660720825} -08/30/2021 14:20:23 - INFO - __main__ - Step 6428: {'lr': 0.0004988969739882091, 'samples': 1234176, 'steps': 6427, 'loss/train': 2.0742006301879883} -08/30/2021 14:20:24 - INFO - __main__ - Step 6429: {'lr': 0.0004988964759812946, 'samples': 1234368, 'steps': 6428, 'loss/train': 1.9064100980758667} -08/30/2021 14:20:25 - INFO - __main__ - Step 6430: {'lr': 0.0004988959778622313, 'samples': 1234560, 'steps': 6429, 'loss/train': 2.0313098430633545} -08/30/2021 14:20:26 - INFO - __main__ - Step 6431: {'lr': 0.0004988954796310191, 'samples': 1234752, 'steps': 6430, 'loss/train': 1.8159887790679932} -08/30/2021 14:20:26 - INFO - __main__ - Step 6432: {'lr': 0.0004988949812876586, 'samples': 1234944, 'steps': 6431, 'loss/train': 2.025383472442627} -08/30/2021 14:20:27 - INFO - __main__ - Step 6433: {'lr': 0.0004988944828321499, 'samples': 1235136, 'steps': 6432, 'loss/train': 1.7181217670440674} -08/30/2021 14:20:27 - INFO - __main__ - Step 6434: {'lr': 0.0004988939842644931, 'samples': 1235328, 'steps': 6433, 'loss/train': 2.1547458171844482} -08/30/2021 14:20:29 - INFO - __main__ - Step 6435: {'lr': 0.0004988934855846885, 'samples': 1235520, 'steps': 6434, 'loss/train': 3.3640191555023193} -08/30/2021 14:20:30 - INFO - __main__ - Step 6436: {'lr': 0.0004988929867927363, 'samples': 1235712, 'steps': 6435, 'loss/train': 1.8474713563919067} -08/30/2021 14:20:30 - INFO - __main__ - Step 6437: {'lr': 0.0004988924878886368, 'samples': 1235904, 'steps': 6436, 'loss/train': 0.1729724258184433} -08/30/2021 14:20:31 - INFO - __main__ - Step 6438: {'lr': 0.0004988919888723902, 'samples': 1236096, 'steps': 6437, 'loss/train': 2.002051591873169} -08/30/2021 14:20:31 - INFO - __main__ - Step 6439: {'lr': 0.0004988914897439968, 'samples': 1236288, 'steps': 6438, 'loss/train': 1.6145069599151611} -08/30/2021 14:20:31 - INFO - __main__ - Step 6440: {'lr': 0.0004988909905034566, 'samples': 1236480, 'steps': 6439, 'loss/train': 0.868749737739563} -08/30/2021 14:20:32 - INFO - __main__ - Step 6441: {'lr': 0.00049889049115077, 'samples': 1236672, 'steps': 6440, 'loss/train': 0.8868799209594727} -08/30/2021 14:20:33 - INFO - __main__ - Step 6442: {'lr': 0.0004988899916859372, 'samples': 1236864, 'steps': 6441, 'loss/train': 0.7765102386474609} -08/30/2021 14:20:34 - INFO - __main__ - Step 6443: {'lr': 0.0004988894921089584, 'samples': 1237056, 'steps': 6442, 'loss/train': 2.336009979248047} -08/30/2021 14:20:34 - INFO - __main__ - Step 6444: {'lr': 0.0004988889924198339, 'samples': 1237248, 'steps': 6443, 'loss/train': 1.799240231513977} -08/30/2021 14:20:34 - INFO - __main__ - Step 6445: {'lr': 0.0004988884926185637, 'samples': 1237440, 'steps': 6444, 'loss/train': 1.823669672012329} -08/30/2021 14:20:35 - INFO - __main__ - Step 6446: {'lr': 0.0004988879927051484, 'samples': 1237632, 'steps': 6445, 'loss/train': 2.093698740005493} -08/30/2021 14:20:36 - INFO - __main__ - Step 6447: {'lr': 0.0004988874926795878, 'samples': 1237824, 'steps': 6446, 'loss/train': 1.9283031225204468} -08/30/2021 14:20:37 - INFO - __main__ - Step 6448: {'lr': 0.0004988869925418825, 'samples': 1238016, 'steps': 6447, 'loss/train': 2.1458723545074463} -08/30/2021 14:20:37 - INFO - __main__ - Step 6449: {'lr': 0.0004988864922920325, 'samples': 1238208, 'steps': 6448, 'loss/train': 1.6288421154022217} -08/30/2021 14:20:37 - INFO - __main__ - Step 6450: {'lr': 0.000498885991930038, 'samples': 1238400, 'steps': 6449, 'loss/train': 1.8976569175720215} -08/30/2021 14:20:38 - INFO - __main__ - Step 6451: {'lr': 0.0004988854914558994, 'samples': 1238592, 'steps': 6450, 'loss/train': 2.386488437652588} -08/30/2021 14:20:39 - INFO - __main__ - Step 6452: {'lr': 0.0004988849908696169, 'samples': 1238784, 'steps': 6451, 'loss/train': 2.1098759174346924} -08/30/2021 14:20:40 - INFO - __main__ - Step 6453: {'lr': 0.0004988844901711905, 'samples': 1238976, 'steps': 6452, 'loss/train': 0.5721170902252197} -08/30/2021 14:20:40 - INFO - __main__ - Step 6454: {'lr': 0.0004988839893606208, 'samples': 1239168, 'steps': 6453, 'loss/train': 2.66838002204895} -08/30/2021 14:20:40 - INFO - __main__ - Step 6455: {'lr': 0.0004988834884379076, 'samples': 1239360, 'steps': 6454, 'loss/train': 2.5370492935180664} -08/30/2021 14:20:41 - INFO - __main__ - Step 6456: {'lr': 0.0004988829874030514, 'samples': 1239552, 'steps': 6455, 'loss/train': 2.045966863632202} -08/30/2021 14:20:42 - INFO - __main__ - Step 6457: {'lr': 0.0004988824862560525, 'samples': 1239744, 'steps': 6456, 'loss/train': 1.981670618057251} -08/30/2021 14:20:43 - INFO - __main__ - Step 6458: {'lr': 0.0004988819849969109, 'samples': 1239936, 'steps': 6457, 'loss/train': 2.628972053527832} -08/30/2021 14:20:43 - INFO - __main__ - Step 6459: {'lr': 0.0004988814836256269, 'samples': 1240128, 'steps': 6458, 'loss/train': 1.9126405715942383} -08/30/2021 14:20:43 - INFO - __main__ - Step 6460: {'lr': 0.0004988809821422008, 'samples': 1240320, 'steps': 6459, 'loss/train': 1.4414652585983276} -08/30/2021 14:20:44 - INFO - __main__ - Step 6461: {'lr': 0.0004988804805466327, 'samples': 1240512, 'steps': 6460, 'loss/train': 2.5868492126464844} -08/30/2021 14:20:45 - INFO - __main__ - Step 6462: {'lr': 0.000498879978838923, 'samples': 1240704, 'steps': 6461, 'loss/train': 2.3106813430786133} -08/30/2021 14:20:46 - INFO - __main__ - Step 6463: {'lr': 0.0004988794770190717, 'samples': 1240896, 'steps': 6462, 'loss/train': 1.930501103401184} -08/30/2021 14:20:46 - INFO - __main__ - Step 6464: {'lr': 0.0004988789750870792, 'samples': 1241088, 'steps': 6463, 'loss/train': 2.0551917552948} -08/30/2021 14:20:46 - INFO - __main__ - Step 6465: {'lr': 0.0004988784730429457, 'samples': 1241280, 'steps': 6464, 'loss/train': 1.1791571378707886} -08/30/2021 14:20:47 - INFO - __main__ - Step 6466: {'lr': 0.0004988779708866714, 'samples': 1241472, 'steps': 6465, 'loss/train': 2.0136468410491943} -08/30/2021 14:20:47 - INFO - __main__ - Step 6467: {'lr': 0.0004988774686182564, 'samples': 1241664, 'steps': 6466, 'loss/train': 1.6396267414093018} -08/30/2021 14:20:49 - INFO - __main__ - Step 6468: {'lr': 0.0004988769662377013, 'samples': 1241856, 'steps': 6467, 'loss/train': 1.455800175666809} -08/30/2021 14:20:49 - INFO - __main__ - Step 6469: {'lr': 0.0004988764637450058, 'samples': 1242048, 'steps': 6468, 'loss/train': 2.1185052394866943} -08/30/2021 14:20:50 - INFO - __main__ - Step 6470: {'lr': 0.0004988759611401706, 'samples': 1242240, 'steps': 6469, 'loss/train': 1.7665050029754639} -08/30/2021 14:20:50 - INFO - __main__ - Step 6471: {'lr': 0.0004988754584231957, 'samples': 1242432, 'steps': 6470, 'loss/train': 1.9007976055145264} -08/30/2021 14:20:50 - INFO - __main__ - Step 6472: {'lr': 0.0004988749555940814, 'samples': 1242624, 'steps': 6471, 'loss/train': 2.1194381713867188} -08/30/2021 14:20:53 - INFO - __main__ - Step 6473: {'lr': 0.0004988744526528277, 'samples': 1242816, 'steps': 6472, 'loss/train': 2.066175937652588} -08/30/2021 14:20:53 - INFO - __main__ - Step 6474: {'lr': 0.0004988739495994352, 'samples': 1243008, 'steps': 6473, 'loss/train': 1.561000943183899} -08/30/2021 14:20:54 - INFO - __main__ - Step 6475: {'lr': 0.0004988734464339038, 'samples': 1243200, 'steps': 6474, 'loss/train': 1.8860431909561157} -08/30/2021 14:20:54 - INFO - __main__ - Step 6476: {'lr': 0.0004988729431562339, 'samples': 1243392, 'steps': 6475, 'loss/train': 2.3497374057769775} -08/30/2021 14:20:54 - INFO - __main__ - Step 6477: {'lr': 0.0004988724397664258, 'samples': 1243584, 'steps': 6476, 'loss/train': 1.6888527870178223} -08/30/2021 14:20:55 - INFO - __main__ - Step 6478: {'lr': 0.0004988719362644795, 'samples': 1243776, 'steps': 6477, 'loss/train': 0.6262373924255371} -08/30/2021 14:20:57 - INFO - __main__ - Step 6479: {'lr': 0.0004988714326503953, 'samples': 1243968, 'steps': 6478, 'loss/train': 2.5752835273742676} -08/30/2021 14:20:57 - INFO - __main__ - Step 6480: {'lr': 0.0004988709289241736, 'samples': 1244160, 'steps': 6479, 'loss/train': 0.6004495024681091} -08/30/2021 14:20:57 - INFO - __main__ - Step 6481: {'lr': 0.0004988704250858145, 'samples': 1244352, 'steps': 6480, 'loss/train': 0.6630047559738159} -08/30/2021 14:20:58 - INFO - __main__ - Step 6482: {'lr': 0.0004988699211353182, 'samples': 1244544, 'steps': 6481, 'loss/train': 2.088484764099121} -08/30/2021 14:20:58 - INFO - __main__ - Step 6483: {'lr': 0.000498869417072685, 'samples': 1244736, 'steps': 6482, 'loss/train': 1.8390841484069824} -08/30/2021 14:20:58 - INFO - __main__ - Step 6484: {'lr': 0.000498868912897915, 'samples': 1244928, 'steps': 6483, 'loss/train': 2.163666248321533} -08/30/2021 14:21:00 - INFO - __main__ - Step 6485: {'lr': 0.0004988684086110085, 'samples': 1245120, 'steps': 6484, 'loss/train': 0.8672804832458496} -08/30/2021 14:21:00 - INFO - __main__ - Step 6486: {'lr': 0.0004988679042119658, 'samples': 1245312, 'steps': 6485, 'loss/train': 1.329594373703003} -08/30/2021 14:21:01 - INFO - __main__ - Step 6487: {'lr': 0.000498867399700787, 'samples': 1245504, 'steps': 6486, 'loss/train': 1.6521679162979126} -08/30/2021 14:21:01 - INFO - __main__ - Step 6488: {'lr': 0.0004988668950774724, 'samples': 1245696, 'steps': 6487, 'loss/train': 2.360351800918579} -08/30/2021 14:21:01 - INFO - __main__ - Step 6489: {'lr': 0.0004988663903420222, 'samples': 1245888, 'steps': 6488, 'loss/train': 1.4756020307540894} -08/30/2021 14:21:02 - INFO - __main__ - Step 6490: {'lr': 0.0004988658854944367, 'samples': 1246080, 'steps': 6489, 'loss/train': 2.232346773147583} -08/30/2021 14:21:04 - INFO - __main__ - Step 6491: {'lr': 0.0004988653805347161, 'samples': 1246272, 'steps': 6490, 'loss/train': 2.4621121883392334} -08/30/2021 14:21:04 - INFO - __main__ - Step 6492: {'lr': 0.0004988648754628605, 'samples': 1246464, 'steps': 6491, 'loss/train': 2.4820644855499268} -08/30/2021 14:21:05 - INFO - __main__ - Step 6493: {'lr': 0.0004988643702788703, 'samples': 1246656, 'steps': 6492, 'loss/train': 0.569169282913208} -08/30/2021 14:21:05 - INFO - __main__ - Step 6494: {'lr': 0.0004988638649827456, 'samples': 1246848, 'steps': 6493, 'loss/train': 2.4743144512176514} -08/30/2021 14:21:05 - INFO - __main__ - Step 6495: {'lr': 0.0004988633595744867, 'samples': 1247040, 'steps': 6494, 'loss/train': 2.5574920177459717} -08/30/2021 14:21:07 - INFO - __main__ - Step 6496: {'lr': 0.0004988628540540939, 'samples': 1247232, 'steps': 6495, 'loss/train': 0.23879817128181458} -08/30/2021 14:21:08 - INFO - __main__ - Step 6497: {'lr': 0.0004988623484215673, 'samples': 1247424, 'steps': 6496, 'loss/train': 2.619365692138672} -08/30/2021 14:21:08 - INFO - __main__ - Step 6498: {'lr': 0.0004988618426769071, 'samples': 1247616, 'steps': 6497, 'loss/train': 4.272124767303467} -08/30/2021 14:21:08 - INFO - __main__ - Step 6499: {'lr': 0.0004988613368201135, 'samples': 1247808, 'steps': 6498, 'loss/train': 1.8268860578536987} -08/30/2021 14:21:09 - INFO - __main__ - Step 6500: {'lr': 0.0004988608308511871, 'samples': 1248000, 'steps': 6499, 'loss/train': 1.9207829236984253} -08/30/2021 14:21:09 - INFO - __main__ - Step 6501: {'lr': 0.0004988603247701276, 'samples': 1248192, 'steps': 6500, 'loss/train': 2.391490936279297} -08/30/2021 14:21:10 - INFO - __main__ - Step 6502: {'lr': 0.0004988598185769357, 'samples': 1248384, 'steps': 6501, 'loss/train': 2.5124106407165527} -08/30/2021 14:21:11 - INFO - __main__ - Step 6503: {'lr': 0.0004988593122716112, 'samples': 1248576, 'steps': 6502, 'loss/train': 2.56439208984375} -08/30/2021 14:21:12 - INFO - __main__ - Step 6504: {'lr': 0.0004988588058541547, 'samples': 1248768, 'steps': 6503, 'loss/train': 1.1140613555908203} -08/30/2021 14:21:12 - INFO - __main__ - Step 6505: {'lr': 0.0004988582993245661, 'samples': 1248960, 'steps': 6504, 'loss/train': 2.11283540725708} -08/30/2021 14:21:12 - INFO - __main__ - Step 6506: {'lr': 0.0004988577926828459, 'samples': 1249152, 'steps': 6505, 'loss/train': 2.564568042755127} -08/30/2021 14:21:13 - INFO - __main__ - Step 6507: {'lr': 0.0004988572859289941, 'samples': 1249344, 'steps': 6506, 'loss/train': 2.540116310119629} -08/30/2021 14:21:14 - INFO - __main__ - Step 6508: {'lr': 0.0004988567790630111, 'samples': 1249536, 'steps': 6507, 'loss/train': 1.8360543251037598} -08/30/2021 14:21:15 - INFO - __main__ - Step 6509: {'lr': 0.0004988562720848973, 'samples': 1249728, 'steps': 6508, 'loss/train': 1.8385865688323975} -08/30/2021 14:21:15 - INFO - __main__ - Step 6510: {'lr': 0.0004988557649946525, 'samples': 1249920, 'steps': 6509, 'loss/train': 2.23394513130188} -08/30/2021 14:21:15 - INFO - __main__ - Step 6511: {'lr': 0.000498855257792277, 'samples': 1250112, 'steps': 6510, 'loss/train': 2.1976659297943115} -08/30/2021 14:21:16 - INFO - __main__ - Step 6512: {'lr': 0.0004988547504777714, 'samples': 1250304, 'steps': 6511, 'loss/train': 2.638313055038452} -08/30/2021 14:21:17 - INFO - __main__ - Step 6513: {'lr': 0.0004988542430511356, 'samples': 1250496, 'steps': 6512, 'loss/train': 1.8395999670028687} -08/30/2021 14:21:18 - INFO - __main__ - Step 6514: {'lr': 0.0004988537355123699, 'samples': 1250688, 'steps': 6513, 'loss/train': 1.7342604398727417} -08/30/2021 14:21:18 - INFO - __main__ - Step 6515: {'lr': 0.0004988532278614745, 'samples': 1250880, 'steps': 6514, 'loss/train': 1.4590171575546265} -08/30/2021 14:21:18 - INFO - __main__ - Step 6516: {'lr': 0.0004988527200984498, 'samples': 1251072, 'steps': 6515, 'loss/train': 2.354767084121704} -08/30/2021 14:21:19 - INFO - __main__ - Step 6517: {'lr': 0.0004988522122232958, 'samples': 1251264, 'steps': 6516, 'loss/train': 1.9950506687164307} -08/30/2021 14:21:20 - INFO - __main__ - Step 6518: {'lr': 0.0004988517042360128, 'samples': 1251456, 'steps': 6517, 'loss/train': 2.5752596855163574} -08/30/2021 14:21:21 - INFO - __main__ - Step 6519: {'lr': 0.0004988511961366012, 'samples': 1251648, 'steps': 6518, 'loss/train': 1.9904118776321411} -08/30/2021 14:21:21 - INFO - __main__ - Step 6520: {'lr': 0.000498850687925061, 'samples': 1251840, 'steps': 6519, 'loss/train': 2.0929312705993652} -08/30/2021 14:21:22 - INFO - __main__ - Step 6521: {'lr': 0.0004988501796013926, 'samples': 1252032, 'steps': 6520, 'loss/train': 1.6906882524490356} -08/30/2021 14:21:22 - INFO - __main__ - Step 6522: {'lr': 0.0004988496711655961, 'samples': 1252224, 'steps': 6521, 'loss/train': 2.0665812492370605} -08/30/2021 14:21:23 - INFO - __main__ - Step 6523: {'lr': 0.0004988491626176718, 'samples': 1252416, 'steps': 6522, 'loss/train': 1.7329615354537964} -08/30/2021 14:21:24 - INFO - __main__ - Step 6524: {'lr': 0.0004988486539576198, 'samples': 1252608, 'steps': 6523, 'loss/train': 1.7640632390975952} -08/30/2021 14:21:24 - INFO - __main__ - Step 6525: {'lr': 0.0004988481451854406, 'samples': 1252800, 'steps': 6524, 'loss/train': 1.9644182920455933} -08/30/2021 14:21:24 - INFO - __main__ - Step 6526: {'lr': 0.0004988476363011341, 'samples': 1252992, 'steps': 6525, 'loss/train': 2.612196922302246} -08/30/2021 14:21:25 - INFO - __main__ - Step 6527: {'lr': 0.0004988471273047008, 'samples': 1253184, 'steps': 6526, 'loss/train': 2.3033361434936523} -08/30/2021 14:21:27 - INFO - __main__ - Step 6528: {'lr': 0.0004988466181961408, 'samples': 1253376, 'steps': 6527, 'loss/train': 1.3639360666275024} -08/30/2021 14:21:27 - INFO - __main__ - Step 6529: {'lr': 0.0004988461089754544, 'samples': 1253568, 'steps': 6528, 'loss/train': 0.4032314121723175} -08/30/2021 14:21:28 - INFO - __main__ - Step 6530: {'lr': 0.0004988455996426418, 'samples': 1253760, 'steps': 6529, 'loss/train': 2.104724168777466} -08/30/2021 14:21:28 - INFO - __main__ - Step 6531: {'lr': 0.0004988450901977031, 'samples': 1253952, 'steps': 6530, 'loss/train': 2.3243253231048584} -08/30/2021 14:21:28 - INFO - __main__ - Step 6532: {'lr': 0.0004988445806406387, 'samples': 1254144, 'steps': 6531, 'loss/train': 2.694326639175415} -08/30/2021 14:21:30 - INFO - __main__ - Step 6533: {'lr': 0.0004988440709714487, 'samples': 1254336, 'steps': 6532, 'loss/train': 2.872575521469116} -08/30/2021 14:21:31 - INFO - __main__ - Step 6534: {'lr': 0.0004988435611901335, 'samples': 1254528, 'steps': 6533, 'loss/train': 2.5049407482147217} -08/30/2021 14:21:31 - INFO - __main__ - Step 6535: {'lr': 0.0004988430512966932, 'samples': 1254720, 'steps': 6534, 'loss/train': 2.041015625} -08/30/2021 14:21:32 - INFO - __main__ - Step 6536: {'lr': 0.000498842541291128, 'samples': 1254912, 'steps': 6535, 'loss/train': 1.6580395698547363} -08/30/2021 14:21:32 - INFO - __main__ - Step 6537: {'lr': 0.0004988420311734383, 'samples': 1255104, 'steps': 6536, 'loss/train': 1.8963825702667236} -08/30/2021 14:21:32 - INFO - __main__ - Step 6538: {'lr': 0.0004988415209436243, 'samples': 1255296, 'steps': 6537, 'loss/train': 1.7755156755447388} -08/30/2021 14:21:33 - INFO - __main__ - Step 6539: {'lr': 0.000498841010601686, 'samples': 1255488, 'steps': 6538, 'loss/train': 0.5022989511489868} -08/30/2021 14:21:34 - INFO - __main__ - Step 6540: {'lr': 0.0004988405001476237, 'samples': 1255680, 'steps': 6539, 'loss/train': 0.5564445853233337} -08/30/2021 14:21:35 - INFO - __main__ - Step 6541: {'lr': 0.0004988399895814378, 'samples': 1255872, 'steps': 6540, 'loss/train': 1.9793373346328735} -08/30/2021 14:21:35 - INFO - __main__ - Step 6542: {'lr': 0.0004988394789031286, 'samples': 1256064, 'steps': 6541, 'loss/train': 1.841233491897583} -08/30/2021 14:21:35 - INFO - __main__ - Step 6543: {'lr': 0.000498838968112696, 'samples': 1256256, 'steps': 6542, 'loss/train': 1.683853030204773} -08/30/2021 14:21:36 - INFO - __main__ - Step 6544: {'lr': 0.0004988384572101403, 'samples': 1256448, 'steps': 6543, 'loss/train': 1.94686758518219} -08/30/2021 14:21:37 - INFO - __main__ - Step 6545: {'lr': 0.000498837946195462, 'samples': 1256640, 'steps': 6544, 'loss/train': 1.6687226295471191} -08/30/2021 14:21:38 - INFO - __main__ - Step 6546: {'lr': 0.0004988374350686611, 'samples': 1256832, 'steps': 6545, 'loss/train': 1.9942381381988525} -08/30/2021 14:21:38 - INFO - __main__ - Step 6547: {'lr': 0.000498836923829738, 'samples': 1257024, 'steps': 6546, 'loss/train': 1.8168758153915405} -08/30/2021 14:21:38 - INFO - __main__ - Step 6548: {'lr': 0.0004988364124786927, 'samples': 1257216, 'steps': 6547, 'loss/train': 1.0306893587112427} -08/30/2021 14:21:39 - INFO - __main__ - Step 6549: {'lr': 0.0004988359010155255, 'samples': 1257408, 'steps': 6548, 'loss/train': 1.4069682359695435} -08/30/2021 14:21:40 - INFO - __main__ - Step 6550: {'lr': 0.0004988353894402368, 'samples': 1257600, 'steps': 6549, 'loss/train': 2.189601421356201} -08/30/2021 14:21:41 - INFO - __main__ - Step 6551: {'lr': 0.0004988348777528267, 'samples': 1257792, 'steps': 6550, 'loss/train': 1.8493245840072632} -08/30/2021 14:21:41 - INFO - __main__ - Step 6552: {'lr': 0.0004988343659532954, 'samples': 1257984, 'steps': 6551, 'loss/train': 1.8024691343307495} -08/30/2021 14:21:41 - INFO - __main__ - Step 6553: {'lr': 0.0004988338540416432, 'samples': 1258176, 'steps': 6552, 'loss/train': 1.883184790611267} -08/30/2021 14:21:42 - INFO - __main__ - Step 6554: {'lr': 0.0004988333420178704, 'samples': 1258368, 'steps': 6553, 'loss/train': 2.450090169906616} -08/30/2021 14:21:43 - INFO - __main__ - Step 6555: {'lr': 0.000498832829881977, 'samples': 1258560, 'steps': 6554, 'loss/train': 1.9142794609069824} -08/30/2021 14:21:44 - INFO - __main__ - Step 6556: {'lr': 0.0004988323176339633, 'samples': 1258752, 'steps': 6555, 'loss/train': 2.114475965499878} -08/30/2021 14:21:44 - INFO - __main__ - Step 6557: {'lr': 0.0004988318052738298, 'samples': 1258944, 'steps': 6556, 'loss/train': 1.1729118824005127} -08/30/2021 14:21:44 - INFO - __main__ - Step 6558: {'lr': 0.0004988312928015763, 'samples': 1259136, 'steps': 6557, 'loss/train': 0.6530615091323853} -08/30/2021 14:21:45 - INFO - __main__ - Step 6559: {'lr': 0.0004988307802172035, 'samples': 1259328, 'steps': 6558, 'loss/train': 1.4921109676361084} -08/30/2021 14:21:46 - INFO - __main__ - Step 6560: {'lr': 0.0004988302675207112, 'samples': 1259520, 'steps': 6559, 'loss/train': 2.1001718044281006} -08/30/2021 14:21:47 - INFO - __main__ - Step 6561: {'lr': 0.0004988297547121, 'samples': 1259712, 'steps': 6560, 'loss/train': 1.6432491540908813} -08/30/2021 14:21:47 - INFO - __main__ - Step 6562: {'lr': 0.0004988292417913698, 'samples': 1259904, 'steps': 6561, 'loss/train': 1.8221440315246582} -08/30/2021 14:21:48 - INFO - __main__ - Step 6563: {'lr': 0.0004988287287585211, 'samples': 1260096, 'steps': 6562, 'loss/train': 0.19723446667194366} -08/30/2021 14:21:48 - INFO - __main__ - Step 6564: {'lr': 0.0004988282156135539, 'samples': 1260288, 'steps': 6563, 'loss/train': 2.1554503440856934} -08/30/2021 14:21:50 - INFO - __main__ - Step 6565: {'lr': 0.0004988277023564685, 'samples': 1260480, 'steps': 6564, 'loss/train': 1.8825099468231201} -08/30/2021 14:21:50 - INFO - __main__ - Step 6566: {'lr': 0.0004988271889872654, 'samples': 1260672, 'steps': 6565, 'loss/train': 2.1260039806365967} -08/30/2021 14:21:50 - INFO - __main__ - Step 6567: {'lr': 0.0004988266755059444, 'samples': 1260864, 'steps': 6566, 'loss/train': 0.2590658664703369} -08/30/2021 14:21:51 - INFO - __main__ - Step 6568: {'lr': 0.000498826161912506, 'samples': 1261056, 'steps': 6567, 'loss/train': 1.3511930704116821} -08/30/2021 14:21:51 - INFO - __main__ - Step 6569: {'lr': 0.0004988256482069505, 'samples': 1261248, 'steps': 6568, 'loss/train': 1.351592779159546} -08/30/2021 14:21:51 - INFO - __main__ - Step 6570: {'lr': 0.0004988251343892779, 'samples': 1261440, 'steps': 6569, 'loss/train': 0.2593085467815399} -08/30/2021 14:21:53 - INFO - __main__ - Step 6571: {'lr': 0.0004988246204594885, 'samples': 1261632, 'steps': 6570, 'loss/train': 2.4204938411712646} -08/30/2021 14:21:54 - INFO - __main__ - Step 6572: {'lr': 0.0004988241064175826, 'samples': 1261824, 'steps': 6571, 'loss/train': 2.4856679439544678} -08/30/2021 14:21:54 - INFO - __main__ - Step 6573: {'lr': 0.0004988235922635604, 'samples': 1262016, 'steps': 6572, 'loss/train': 2.4744157791137695} -08/30/2021 14:21:54 - INFO - __main__ - Step 6574: {'lr': 0.0004988230779974221, 'samples': 1262208, 'steps': 6573, 'loss/train': 1.8752230405807495} -08/30/2021 14:21:55 - INFO - __main__ - Step 6575: {'lr': 0.000498822563619168, 'samples': 1262400, 'steps': 6574, 'loss/train': 1.711130976676941} -08/30/2021 14:21:57 - INFO - __main__ - Step 6576: {'lr': 0.0004988220491287983, 'samples': 1262592, 'steps': 6575, 'loss/train': 0.5284066200256348} -08/30/2021 14:21:57 - INFO - __main__ - Step 6577: {'lr': 0.0004988215345263132, 'samples': 1262784, 'steps': 6576, 'loss/train': 1.5665788650512695} -08/30/2021 14:21:57 - INFO - __main__ - Step 6578: {'lr': 0.0004988210198117129, 'samples': 1262976, 'steps': 6577, 'loss/train': 1.9515835046768188} -08/30/2021 14:21:58 - INFO - __main__ - Step 6579: {'lr': 0.0004988205049849978, 'samples': 1263168, 'steps': 6578, 'loss/train': 2.016845703125} -08/30/2021 14:21:58 - INFO - __main__ - Step 6580: {'lr': 0.0004988199900461679, 'samples': 1263360, 'steps': 6579, 'loss/train': 2.2204203605651855} -08/30/2021 14:22:00 - INFO - __main__ - Step 6581: {'lr': 0.0004988194749952237, 'samples': 1263552, 'steps': 6580, 'loss/train': 1.7538809776306152} -08/30/2021 14:22:01 - INFO - __main__ - Step 6582: {'lr': 0.0004988189598321652, 'samples': 1263744, 'steps': 6581, 'loss/train': 2.3705499172210693} -08/30/2021 14:22:01 - INFO - __main__ - Step 6583: {'lr': 0.0004988184445569926, 'samples': 1263936, 'steps': 6582, 'loss/train': 1.9933667182922363} -08/30/2021 14:22:01 - INFO - __main__ - Step 6584: {'lr': 0.0004988179291697064, 'samples': 1264128, 'steps': 6583, 'loss/train': 1.7881734371185303} -08/30/2021 14:22:02 - INFO - __main__ - Step 6585: {'lr': 0.0004988174136703066, 'samples': 1264320, 'steps': 6584, 'loss/train': 2.433642864227295} -08/30/2021 14:22:02 - INFO - __main__ - Step 6586: {'lr': 0.0004988168980587936, 'samples': 1264512, 'steps': 6585, 'loss/train': 1.5064575672149658} -08/30/2021 14:22:04 - INFO - __main__ - Step 6587: {'lr': 0.0004988163823351676, 'samples': 1264704, 'steps': 6586, 'loss/train': 1.5597121715545654} -08/30/2021 14:22:04 - INFO - __main__ - Step 6588: {'lr': 0.0004988158664994286, 'samples': 1264896, 'steps': 6587, 'loss/train': 1.962697982788086} -08/30/2021 14:22:05 - INFO - __main__ - Step 6589: {'lr': 0.0004988153505515771, 'samples': 1265088, 'steps': 6588, 'loss/train': 1.6837493181228638} -08/30/2021 14:22:05 - INFO - __main__ - Step 6590: {'lr': 0.0004988148344916133, 'samples': 1265280, 'steps': 6589, 'loss/train': 2.305677890777588} -08/30/2021 14:22:05 - INFO - __main__ - Step 6591: {'lr': 0.0004988143183195373, 'samples': 1265472, 'steps': 6590, 'loss/train': 1.7598168849945068} -08/30/2021 14:22:07 - INFO - __main__ - Step 6592: {'lr': 0.0004988138020353493, 'samples': 1265664, 'steps': 6591, 'loss/train': 1.722815990447998} -08/30/2021 14:22:07 - INFO - __main__ - Step 6593: {'lr': 0.0004988132856390498, 'samples': 1265856, 'steps': 6592, 'loss/train': 2.120572328567505} -08/30/2021 14:22:07 - INFO - __main__ - Step 6594: {'lr': 0.0004988127691306388, 'samples': 1266048, 'steps': 6593, 'loss/train': 2.207150459289551} -08/30/2021 14:22:08 - INFO - __main__ - Step 6595: {'lr': 0.0004988122525101166, 'samples': 1266240, 'steps': 6594, 'loss/train': 1.9245821237564087} -08/30/2021 14:22:08 - INFO - __main__ - Step 6596: {'lr': 0.0004988117357774835, 'samples': 1266432, 'steps': 6595, 'loss/train': 2.0989673137664795} -08/30/2021 14:22:09 - INFO - __main__ - Step 6597: {'lr': 0.0004988112189327397, 'samples': 1266624, 'steps': 6596, 'loss/train': 2.10762882232666} -08/30/2021 14:22:10 - INFO - __main__ - Step 6598: {'lr': 0.0004988107019758853, 'samples': 1266816, 'steps': 6597, 'loss/train': 2.0031373500823975} -08/30/2021 14:22:10 - INFO - __main__ - Step 6599: {'lr': 0.0004988101849069208, 'samples': 1267008, 'steps': 6598, 'loss/train': 2.4327340126037598} -08/30/2021 14:22:11 - INFO - __main__ - Step 6600: {'lr': 0.0004988096677258461, 'samples': 1267200, 'steps': 6599, 'loss/train': 0.5378065705299377} -08/30/2021 14:22:11 - INFO - __main__ - Step 6601: {'lr': 0.0004988091504326616, 'samples': 1267392, 'steps': 6600, 'loss/train': 2.8171443939208984} -08/30/2021 14:22:12 - INFO - __main__ - Step 6602: {'lr': 0.0004988086330273676, 'samples': 1267584, 'steps': 6601, 'loss/train': 0.8903299570083618} -08/30/2021 14:22:13 - INFO - __main__ - Step 6603: {'lr': 0.0004988081155099643, 'samples': 1267776, 'steps': 6602, 'loss/train': 2.2301132678985596} -08/30/2021 14:22:13 - INFO - __main__ - Step 6604: {'lr': 0.0004988075978804518, 'samples': 1267968, 'steps': 6603, 'loss/train': 2.353480815887451} -08/30/2021 14:22:14 - INFO - __main__ - Step 6605: {'lr': 0.0004988070801388306, 'samples': 1268160, 'steps': 6604, 'loss/train': 2.3417277336120605} -08/30/2021 14:22:14 - INFO - __main__ - Step 6606: {'lr': 0.0004988065622851006, 'samples': 1268352, 'steps': 6605, 'loss/train': 2.152053117752075} -08/30/2021 14:22:14 - INFO - __main__ - Step 6607: {'lr': 0.0004988060443192623, 'samples': 1268544, 'steps': 6606, 'loss/train': 1.458253264427185} -08/30/2021 14:22:16 - INFO - __main__ - Step 6608: {'lr': 0.0004988055262413158, 'samples': 1268736, 'steps': 6607, 'loss/train': 2.4444892406463623} -08/30/2021 14:22:16 - INFO - __main__ - Step 6609: {'lr': 0.0004988050080512614, 'samples': 1268928, 'steps': 6608, 'loss/train': 2.097615957260132} -08/30/2021 14:22:17 - INFO - __main__ - Step 6610: {'lr': 0.0004988044897490993, 'samples': 1269120, 'steps': 6609, 'loss/train': 1.5639092922210693} -08/30/2021 14:22:17 - INFO - __main__ - Step 6611: {'lr': 0.0004988039713348297, 'samples': 1269312, 'steps': 6610, 'loss/train': 1.8592551946640015} -08/30/2021 14:22:17 - INFO - __main__ - Step 6612: {'lr': 0.0004988034528084529, 'samples': 1269504, 'steps': 6611, 'loss/train': 2.4343392848968506} -08/30/2021 14:22:19 - INFO - __main__ - Step 6613: {'lr': 0.000498802934169969, 'samples': 1269696, 'steps': 6612, 'loss/train': 1.7656254768371582} -08/30/2021 14:22:20 - INFO - __main__ - Step 6614: {'lr': 0.0004988024154193785, 'samples': 1269888, 'steps': 6613, 'loss/train': 2.0158333778381348} -08/30/2021 14:22:20 - INFO - __main__ - Step 6615: {'lr': 0.0004988018965566814, 'samples': 1270080, 'steps': 6614, 'loss/train': 2.1076645851135254} -08/30/2021 14:22:20 - INFO - __main__ - Step 6616: {'lr': 0.000498801377581878, 'samples': 1270272, 'steps': 6615, 'loss/train': 2.292289972305298} -08/30/2021 14:22:21 - INFO - __main__ - Step 6617: {'lr': 0.0004988008584949686, 'samples': 1270464, 'steps': 6616, 'loss/train': 2.0487987995147705} -08/30/2021 14:22:21 - INFO - __main__ - Step 6618: {'lr': 0.0004988003392959533, 'samples': 1270656, 'steps': 6617, 'loss/train': 1.718287706375122} -08/30/2021 14:22:23 - INFO - __main__ - Step 6619: {'lr': 0.0004987998199848324, 'samples': 1270848, 'steps': 6618, 'loss/train': 4.278743267059326} -08/30/2021 14:22:23 - INFO - __main__ - Step 6620: {'lr': 0.0004987993005616061, 'samples': 1271040, 'steps': 6619, 'loss/train': 2.775883197784424} -08/30/2021 14:22:23 - INFO - __main__ - Step 6621: {'lr': 0.0004987987810262747, 'samples': 1271232, 'steps': 6620, 'loss/train': 4.488855361938477} -08/30/2021 14:22:24 - INFO - __main__ - Step 6622: {'lr': 0.0004987982613788384, 'samples': 1271424, 'steps': 6621, 'loss/train': 2.5627167224884033} -08/30/2021 14:22:24 - INFO - __main__ - Step 6623: {'lr': 0.0004987977416192976, 'samples': 1271616, 'steps': 6622, 'loss/train': 2.950546979904175} -08/30/2021 14:22:26 - INFO - __main__ - Step 6624: {'lr': 0.0004987972217476523, 'samples': 1271808, 'steps': 6623, 'loss/train': 3.310699701309204} -08/30/2021 14:22:26 - INFO - __main__ - Step 6625: {'lr': 0.0004987967017639027, 'samples': 1272000, 'steps': 6624, 'loss/train': 2.5881409645080566} -08/30/2021 14:22:26 - INFO - __main__ - Step 6626: {'lr': 0.0004987961816680492, 'samples': 1272192, 'steps': 6625, 'loss/train': 1.8328700065612793} -08/30/2021 14:22:27 - INFO - __main__ - Step 6627: {'lr': 0.000498795661460092, 'samples': 1272384, 'steps': 6626, 'loss/train': 2.1922333240509033} -08/30/2021 14:22:27 - INFO - __main__ - Step 6628: {'lr': 0.0004987951411400313, 'samples': 1272576, 'steps': 6627, 'loss/train': 2.490633726119995} -08/30/2021 14:22:29 - INFO - __main__ - Step 6629: {'lr': 0.0004987946207078674, 'samples': 1272768, 'steps': 6628, 'loss/train': 2.7946274280548096} -08/30/2021 14:22:29 - INFO - __main__ - Step 6630: {'lr': 0.0004987941001636004, 'samples': 1272960, 'steps': 6629, 'loss/train': 1.7833830118179321} -08/30/2021 14:22:29 - INFO - __main__ - Step 6631: {'lr': 0.0004987935795072307, 'samples': 1273152, 'steps': 6630, 'loss/train': 2.3059895038604736} -08/30/2021 14:22:30 - INFO - __main__ - Step 6632: {'lr': 0.0004987930587387584, 'samples': 1273344, 'steps': 6631, 'loss/train': 2.5678598880767822} -08/30/2021 14:22:30 - INFO - __main__ - Step 6633: {'lr': 0.0004987925378581838, 'samples': 1273536, 'steps': 6632, 'loss/train': 2.6430764198303223} -08/30/2021 14:22:30 - INFO - __main__ - Step 6634: {'lr': 0.0004987920168655071, 'samples': 1273728, 'steps': 6633, 'loss/train': 2.5122742652893066} -08/30/2021 14:22:32 - INFO - __main__ - Step 6635: {'lr': 0.0004987914957607286, 'samples': 1273920, 'steps': 6634, 'loss/train': 2.150352954864502} -08/30/2021 14:22:33 - INFO - __main__ - Step 6636: {'lr': 0.0004987909745438484, 'samples': 1274112, 'steps': 6635, 'loss/train': 2.924222707748413} -08/30/2021 14:22:33 - INFO - __main__ - Step 6637: {'lr': 0.000498790453214867, 'samples': 1274304, 'steps': 6636, 'loss/train': 2.5753657817840576} -08/30/2021 14:22:33 - INFO - __main__ - Step 6638: {'lr': 0.0004987899317737843, 'samples': 1274496, 'steps': 6637, 'loss/train': 0.3753221929073334} -08/30/2021 14:22:34 - INFO - __main__ - Step 6639: {'lr': 0.0004987894102206008, 'samples': 1274688, 'steps': 6638, 'loss/train': 2.109752655029297} -08/30/2021 14:22:36 - INFO - __main__ - Step 6640: {'lr': 0.0004987888885553166, 'samples': 1274880, 'steps': 6639, 'loss/train': 2.4767367839813232} -08/30/2021 14:22:36 - INFO - __main__ - Step 6641: {'lr': 0.0004987883667779319, 'samples': 1275072, 'steps': 6640, 'loss/train': 1.2963693141937256} -08/30/2021 14:22:37 - INFO - __main__ - Step 6642: {'lr': 0.0004987878448884471, 'samples': 1275264, 'steps': 6641, 'loss/train': 2.4667558670043945} -08/30/2021 14:22:37 - INFO - __main__ - Step 6643: {'lr': 0.0004987873228868622, 'samples': 1275456, 'steps': 6642, 'loss/train': 1.9709516763687134} -08/30/2021 14:22:37 - INFO - __main__ - Step 6644: {'lr': 0.0004987868007731778, 'samples': 1275648, 'steps': 6643, 'loss/train': 2.4716739654541016} -08/30/2021 14:22:39 - INFO - __main__ - Step 6645: {'lr': 0.0004987862785473937, 'samples': 1275840, 'steps': 6644, 'loss/train': 2.1465580463409424} -08/30/2021 14:22:39 - INFO - __main__ - Step 6646: {'lr': 0.0004987857562095103, 'samples': 1276032, 'steps': 6645, 'loss/train': 3.1854329109191895} -08/30/2021 14:22:39 - INFO - __main__ - Step 6647: {'lr': 0.0004987852337595281, 'samples': 1276224, 'steps': 6646, 'loss/train': 2.152782917022705} -08/30/2021 14:22:40 - INFO - __main__ - Step 6648: {'lr': 0.0004987847111974469, 'samples': 1276416, 'steps': 6647, 'loss/train': 2.2000057697296143} -08/30/2021 14:22:40 - INFO - __main__ - Step 6649: {'lr': 0.0004987841885232674, 'samples': 1276608, 'steps': 6648, 'loss/train': 2.0557470321655273} -08/30/2021 14:22:42 - INFO - __main__ - Step 6650: {'lr': 0.0004987836657369893, 'samples': 1276800, 'steps': 6649, 'loss/train': 2.4511828422546387} -08/30/2021 14:22:42 - INFO - __main__ - Step 6651: {'lr': 0.0004987831428386133, 'samples': 1276992, 'steps': 6650, 'loss/train': 2.5166261196136475} -08/30/2021 14:22:43 - INFO - __main__ - Step 6652: {'lr': 0.0004987826198281394, 'samples': 1277184, 'steps': 6651, 'loss/train': 1.671008586883545} -08/30/2021 14:22:43 - INFO - __main__ - Step 6653: {'lr': 0.0004987820967055678, 'samples': 1277376, 'steps': 6652, 'loss/train': 2.2135016918182373} -08/30/2021 14:22:43 - INFO - __main__ - Step 6654: {'lr': 0.000498781573470899, 'samples': 1277568, 'steps': 6653, 'loss/train': 2.2522799968719482} -08/30/2021 14:22:44 - INFO - __main__ - Step 6655: {'lr': 0.000498781050124133, 'samples': 1277760, 'steps': 6654, 'loss/train': 2.269852876663208} -08/30/2021 14:22:45 - INFO - __main__ - Step 6656: {'lr': 0.0004987805266652701, 'samples': 1277952, 'steps': 6655, 'loss/train': 0.5961964726448059} -08/30/2021 14:22:46 - INFO - __main__ - Step 6657: {'lr': 0.0004987800030943105, 'samples': 1278144, 'steps': 6656, 'loss/train': 2.3606173992156982} -08/30/2021 14:22:46 - INFO - __main__ - Step 6658: {'lr': 0.0004987794794112545, 'samples': 1278336, 'steps': 6657, 'loss/train': 1.9812132120132446} -08/30/2021 14:22:46 - INFO - __main__ - Step 6659: {'lr': 0.0004987789556161022, 'samples': 1278528, 'steps': 6658, 'loss/train': 2.4071691036224365} -08/30/2021 14:22:47 - INFO - __main__ - Step 6660: {'lr': 0.0004987784317088541, 'samples': 1278720, 'steps': 6659, 'loss/train': 2.365825653076172} -08/30/2021 14:22:48 - INFO - __main__ - Step 6661: {'lr': 0.0004987779076895102, 'samples': 1278912, 'steps': 6660, 'loss/train': 2.412134885787964} -08/30/2021 14:22:48 - INFO - __main__ - Step 6662: {'lr': 0.0004987773835580708, 'samples': 1279104, 'steps': 6661, 'loss/train': 2.232940912246704} -08/30/2021 14:22:49 - INFO - __main__ - Step 6663: {'lr': 0.0004987768593145362, 'samples': 1279296, 'steps': 6662, 'loss/train': 2.327805757522583} -08/30/2021 14:22:49 - INFO - __main__ - Step 6664: {'lr': 0.0004987763349589065, 'samples': 1279488, 'steps': 6663, 'loss/train': 2.547085762023926} -08/30/2021 14:22:50 - INFO - __main__ - Step 6665: {'lr': 0.0004987758104911821, 'samples': 1279680, 'steps': 6664, 'loss/train': 2.1866228580474854} -08/30/2021 14:22:51 - INFO - __main__ - Step 6666: {'lr': 0.0004987752859113631, 'samples': 1279872, 'steps': 6665, 'loss/train': 2.459322929382324} -08/30/2021 14:22:52 - INFO - __main__ - Step 6667: {'lr': 0.0004987747612194499, 'samples': 1280064, 'steps': 6666, 'loss/train': 2.3056182861328125} -08/30/2021 14:22:52 - INFO - __main__ - Step 6668: {'lr': 0.0004987742364154425, 'samples': 1280256, 'steps': 6667, 'loss/train': 1.7542593479156494} -08/30/2021 14:22:52 - INFO - __main__ - Step 6669: {'lr': 0.0004987737114993413, 'samples': 1280448, 'steps': 6668, 'loss/train': 1.9462021589279175} -08/30/2021 14:22:53 - INFO - __main__ - Step 6670: {'lr': 0.0004987731864711466, 'samples': 1280640, 'steps': 6669, 'loss/train': 2.1933953762054443} -08/30/2021 14:22:54 - INFO - __main__ - Step 6671: {'lr': 0.0004987726613308584, 'samples': 1280832, 'steps': 6670, 'loss/train': 0.7411926984786987} -08/30/2021 14:22:55 - INFO - __main__ - Step 6672: {'lr': 0.0004987721360784772, 'samples': 1281024, 'steps': 6671, 'loss/train': 2.0831236839294434} -08/30/2021 14:22:55 - INFO - __main__ - Step 6673: {'lr': 0.0004987716107140031, 'samples': 1281216, 'steps': 6672, 'loss/train': 2.2045445442199707} -08/30/2021 14:22:55 - INFO - __main__ - Step 6674: {'lr': 0.0004987710852374363, 'samples': 1281408, 'steps': 6673, 'loss/train': 1.5553992986679077} -08/30/2021 14:22:56 - INFO - __main__ - Step 6675: {'lr': 0.0004987705596487771, 'samples': 1281600, 'steps': 6674, 'loss/train': 1.3769099712371826} -08/30/2021 14:22:57 - INFO - __main__ - Step 6676: {'lr': 0.0004987700339480258, 'samples': 1281792, 'steps': 6675, 'loss/train': 2.0253024101257324} -08/30/2021 14:22:58 - INFO - __main__ - Step 6677: {'lr': 0.0004987695081351824, 'samples': 1281984, 'steps': 6676, 'loss/train': 1.4973565340042114} -08/30/2021 14:22:58 - INFO - __main__ - Step 6678: {'lr': 0.0004987689822102474, 'samples': 1282176, 'steps': 6677, 'loss/train': 1.3071269989013672} -08/30/2021 14:22:58 - INFO - __main__ - Step 6679: {'lr': 0.000498768456173221, 'samples': 1282368, 'steps': 6678, 'loss/train': 2.8483200073242188} -08/30/2021 14:22:59 - INFO - __main__ - Step 6680: {'lr': 0.0004987679300241033, 'samples': 1282560, 'steps': 6679, 'loss/train': 2.096766233444214} -08/30/2021 14:22:59 - INFO - __main__ - Step 6681: {'lr': 0.0004987674037628945, 'samples': 1282752, 'steps': 6680, 'loss/train': 1.8682585954666138} -08/30/2021 14:23:01 - INFO - __main__ - Step 6682: {'lr': 0.0004987668773895951, 'samples': 1282944, 'steps': 6681, 'loss/train': 2.0440986156463623} -08/30/2021 14:23:01 - INFO - __main__ - Step 6683: {'lr': 0.0004987663509042052, 'samples': 1283136, 'steps': 6682, 'loss/train': 2.422579526901245} -08/30/2021 14:23:02 - INFO - __main__ - Step 6684: {'lr': 0.000498765824306725, 'samples': 1283328, 'steps': 6683, 'loss/train': 1.7745413780212402} -08/30/2021 14:23:02 - INFO - __main__ - Step 6685: {'lr': 0.0004987652975971546, 'samples': 1283520, 'steps': 6684, 'loss/train': 2.5755810737609863} -08/30/2021 14:23:02 - INFO - __main__ - Step 6686: {'lr': 0.0004987647707754945, 'samples': 1283712, 'steps': 6685, 'loss/train': 1.5059664249420166} -08/30/2021 14:23:04 - INFO - __main__ - Step 6687: {'lr': 0.0004987642438417449, 'samples': 1283904, 'steps': 6686, 'loss/train': 0.24417662620544434} -08/30/2021 14:23:04 - INFO - __main__ - Step 6688: {'lr': 0.0004987637167959059, 'samples': 1284096, 'steps': 6687, 'loss/train': 2.0323636531829834} -08/30/2021 14:23:04 - INFO - __main__ - Step 6689: {'lr': 0.0004987631896379779, 'samples': 1284288, 'steps': 6688, 'loss/train': 2.0033011436462402} -08/30/2021 14:23:05 - INFO - __main__ - Step 6690: {'lr': 0.0004987626623679609, 'samples': 1284480, 'steps': 6689, 'loss/train': 2.01468825340271} -08/30/2021 14:23:05 - INFO - __main__ - Step 6691: {'lr': 0.0004987621349858553, 'samples': 1284672, 'steps': 6690, 'loss/train': 2.1882097721099854} -08/30/2021 14:23:07 - INFO - __main__ - Step 6692: {'lr': 0.0004987616074916615, 'samples': 1284864, 'steps': 6691, 'loss/train': 1.3407942056655884} -08/30/2021 14:23:08 - INFO - __main__ - Step 6693: {'lr': 0.0004987610798853794, 'samples': 1285056, 'steps': 6692, 'loss/train': 2.410564661026001} -08/30/2021 14:23:08 - INFO - __main__ - Step 6694: {'lr': 0.0004987605521670094, 'samples': 1285248, 'steps': 6693, 'loss/train': 1.6637507677078247} -08/30/2021 14:23:08 - INFO - __main__ - Step 6695: {'lr': 0.0004987600243365518, 'samples': 1285440, 'steps': 6694, 'loss/train': 2.1286065578460693} -08/30/2021 14:23:09 - INFO - __main__ - Step 6696: {'lr': 0.0004987594963940066, 'samples': 1285632, 'steps': 6695, 'loss/train': 2.305081367492676} -08/30/2021 14:23:11 - INFO - __main__ - Step 6697: {'lr': 0.0004987589683393744, 'samples': 1285824, 'steps': 6696, 'loss/train': 2.856034755706787} -08/30/2021 14:23:11 - INFO - __main__ - Step 6698: {'lr': 0.0004987584401726552, 'samples': 1286016, 'steps': 6697, 'loss/train': 1.4844515323638916} -08/30/2021 14:23:12 - INFO - __main__ - Step 6699: {'lr': 0.0004987579118938492, 'samples': 1286208, 'steps': 6698, 'loss/train': 0.41757792234420776} -08/30/2021 14:23:12 - INFO - __main__ - Step 6700: {'lr': 0.0004987573835029569, 'samples': 1286400, 'steps': 6699, 'loss/train': 1.9921799898147583} -08/30/2021 14:23:12 - INFO - __main__ - Step 6701: {'lr': 0.0004987568549999782, 'samples': 1286592, 'steps': 6700, 'loss/train': 0.9336510300636292} -08/30/2021 14:23:14 - INFO - __main__ - Step 6702: {'lr': 0.0004987563263849136, 'samples': 1286784, 'steps': 6701, 'loss/train': 1.6154801845550537} -08/30/2021 14:23:14 - INFO - __main__ - Step 6703: {'lr': 0.0004987557976577632, 'samples': 1286976, 'steps': 6702, 'loss/train': 2.2903635501861572} -08/30/2021 14:23:15 - INFO - __main__ - Step 6704: {'lr': 0.0004987552688185273, 'samples': 1287168, 'steps': 6703, 'loss/train': 2.2099227905273438} -08/30/2021 14:23:15 - INFO - __main__ - Step 6705: {'lr': 0.0004987547398672061, 'samples': 1287360, 'steps': 6704, 'loss/train': 2.618635892868042} -08/30/2021 14:23:15 - INFO - __main__ - Step 6706: {'lr': 0.0004987542108037998, 'samples': 1287552, 'steps': 6705, 'loss/train': 2.328796625137329} -08/30/2021 14:23:16 - INFO - __main__ - Step 6707: {'lr': 0.0004987536816283087, 'samples': 1287744, 'steps': 6706, 'loss/train': 2.121213436126709} -08/30/2021 14:23:17 - INFO - __main__ - Step 6708: {'lr': 0.0004987531523407331, 'samples': 1287936, 'steps': 6707, 'loss/train': 2.0505807399749756} -08/30/2021 14:23:18 - INFO - __main__ - Step 6709: {'lr': 0.0004987526229410732, 'samples': 1288128, 'steps': 6708, 'loss/train': 2.2908124923706055} -08/30/2021 14:23:18 - INFO - __main__ - Step 6710: {'lr': 0.000498752093429329, 'samples': 1288320, 'steps': 6709, 'loss/train': 1.6176339387893677} -08/30/2021 14:23:19 - INFO - __main__ - Step 6711: {'lr': 0.0004987515638055012, 'samples': 1288512, 'steps': 6710, 'loss/train': 1.9946929216384888} -08/30/2021 14:23:19 - INFO - __main__ - Step 6712: {'lr': 0.0004987510340695896, 'samples': 1288704, 'steps': 6711, 'loss/train': 1.9904903173446655} -08/30/2021 14:23:19 - INFO - __main__ - Step 6713: {'lr': 0.0004987505042215948, 'samples': 1288896, 'steps': 6712, 'loss/train': 0.5952053070068359} -08/30/2021 14:23:21 - INFO - __main__ - Step 6714: {'lr': 0.0004987499742615167, 'samples': 1289088, 'steps': 6713, 'loss/train': 2.0942940711975098} -08/30/2021 14:23:21 - INFO - __main__ - Step 6715: {'lr': 0.0004987494441893557, 'samples': 1289280, 'steps': 6714, 'loss/train': 1.748814582824707} -08/30/2021 14:23:22 - INFO - __main__ - Step 6716: {'lr': 0.0004987489140051121, 'samples': 1289472, 'steps': 6715, 'loss/train': 1.7371820211410522} -08/30/2021 14:23:22 - INFO - __main__ - Step 6717: {'lr': 0.000498748383708786, 'samples': 1289664, 'steps': 6716, 'loss/train': 1.1997138261795044} -08/30/2021 14:23:22 - INFO - __main__ - Step 6718: {'lr': 0.0004987478533003779, 'samples': 1289856, 'steps': 6717, 'loss/train': 1.6917279958724976} -08/30/2021 14:23:24 - INFO - __main__ - Step 6719: {'lr': 0.0004987473227798877, 'samples': 1290048, 'steps': 6718, 'loss/train': 1.7157011032104492} -08/30/2021 14:23:24 - INFO - __main__ - Step 6720: {'lr': 0.0004987467921473157, 'samples': 1290240, 'steps': 6719, 'loss/train': 1.812124490737915} -08/30/2021 14:23:25 - INFO - __main__ - Step 6721: {'lr': 0.0004987462614026624, 'samples': 1290432, 'steps': 6720, 'loss/train': 1.4346495866775513} -08/30/2021 14:23:25 - INFO - __main__ - Step 6722: {'lr': 0.0004987457305459279, 'samples': 1290624, 'steps': 6721, 'loss/train': 0.9984289407730103} -08/30/2021 14:23:26 - INFO - __main__ - Step 6723: {'lr': 0.0004987451995771124, 'samples': 1290816, 'steps': 6722, 'loss/train': 2.1301305294036865} -08/30/2021 14:23:27 - INFO - __main__ - Step 6724: {'lr': 0.000498744668496216, 'samples': 1291008, 'steps': 6723, 'loss/train': 0.3405721187591553} -08/30/2021 14:23:27 - INFO - __main__ - Step 6725: {'lr': 0.0004987441373032393, 'samples': 1291200, 'steps': 6724, 'loss/train': 2.0260512828826904} -08/30/2021 14:23:28 - INFO - __main__ - Step 6726: {'lr': 0.0004987436059981821, 'samples': 1291392, 'steps': 6725, 'loss/train': 2.4161086082458496} -08/30/2021 14:23:28 - INFO - __main__ - Step 6727: {'lr': 0.0004987430745810451, 'samples': 1291584, 'steps': 6726, 'loss/train': 1.8530292510986328} -08/30/2021 14:23:29 - INFO - __main__ - Step 6728: {'lr': 0.0004987425430518282, 'samples': 1291776, 'steps': 6727, 'loss/train': 2.0817573070526123} -08/30/2021 14:23:30 - INFO - __main__ - Step 6729: {'lr': 0.0004987420114105317, 'samples': 1291968, 'steps': 6728, 'loss/train': 2.337291955947876} -08/30/2021 14:23:31 - INFO - __main__ - Step 6730: {'lr': 0.000498741479657156, 'samples': 1292160, 'steps': 6729, 'loss/train': 1.9573829174041748} -08/30/2021 14:23:31 - INFO - __main__ - Step 6731: {'lr': 0.0004987409477917011, 'samples': 1292352, 'steps': 6730, 'loss/train': 2.6872239112854004} -08/30/2021 14:23:31 - INFO - __main__ - Step 6732: {'lr': 0.0004987404158141675, 'samples': 1292544, 'steps': 6731, 'loss/train': 1.9681702852249146} -08/30/2021 14:23:32 - INFO - __main__ - Step 6733: {'lr': 0.0004987398837245552, 'samples': 1292736, 'steps': 6732, 'loss/train': 2.351219415664673} -08/30/2021 14:23:33 - INFO - __main__ - Step 6734: {'lr': 0.0004987393515228646, 'samples': 1292928, 'steps': 6733, 'loss/train': 2.2109556198120117} -08/30/2021 14:23:33 - INFO - __main__ - Step 6735: {'lr': 0.0004987388192090959, 'samples': 1293120, 'steps': 6734, 'loss/train': 2.4044573307037354} -08/30/2021 14:23:34 - INFO - __main__ - Step 6736: {'lr': 0.0004987382867832493, 'samples': 1293312, 'steps': 6735, 'loss/train': 2.394789457321167} -08/30/2021 14:23:34 - INFO - __main__ - Step 6737: {'lr': 0.0004987377542453251, 'samples': 1293504, 'steps': 6736, 'loss/train': 1.1733660697937012} -08/30/2021 14:23:34 - INFO - __main__ - Step 6738: {'lr': 0.0004987372215953234, 'samples': 1293696, 'steps': 6737, 'loss/train': 1.9348593950271606} -08/30/2021 14:23:36 - INFO - __main__ - Step 6739: {'lr': 0.0004987366888332446, 'samples': 1293888, 'steps': 6738, 'loss/train': 1.234695315361023} -08/30/2021 14:23:36 - INFO - __main__ - Step 6740: {'lr': 0.0004987361559590889, 'samples': 1294080, 'steps': 6739, 'loss/train': 2.0923051834106445} -08/30/2021 14:23:37 - INFO - __main__ - Step 6741: {'lr': 0.0004987356229728566, 'samples': 1294272, 'steps': 6740, 'loss/train': 3.1357924938201904} -08/30/2021 14:23:37 - INFO - __main__ - Step 6742: {'lr': 0.0004987350898745477, 'samples': 1294464, 'steps': 6741, 'loss/train': 1.7173526287078857} -08/30/2021 14:23:37 - INFO - __main__ - Step 6743: {'lr': 0.0004987345566641628, 'samples': 1294656, 'steps': 6742, 'loss/train': 1.8840594291687012} -08/30/2021 14:23:38 - INFO - __main__ - Step 6744: {'lr': 0.0004987340233417019, 'samples': 1294848, 'steps': 6743, 'loss/train': 2.293461799621582} -08/30/2021 14:23:39 - INFO - __main__ - Step 6745: {'lr': 0.0004987334899071652, 'samples': 1295040, 'steps': 6744, 'loss/train': 2.139820098876953} -08/30/2021 14:23:40 - INFO - __main__ - Step 6746: {'lr': 0.000498732956360553, 'samples': 1295232, 'steps': 6745, 'loss/train': 1.7622076272964478} -08/30/2021 14:23:40 - INFO - __main__ - Step 6747: {'lr': 0.0004987324227018657, 'samples': 1295424, 'steps': 6746, 'loss/train': 2.011033535003662} -08/30/2021 14:23:41 - INFO - __main__ - Step 6748: {'lr': 0.0004987318889311033, 'samples': 1295616, 'steps': 6747, 'loss/train': 1.996565818786621} -08/30/2021 14:23:41 - INFO - __main__ - Step 6749: {'lr': 0.0004987313550482663, 'samples': 1295808, 'steps': 6748, 'loss/train': 2.0381922721862793} -08/30/2021 14:23:43 - INFO - __main__ - Step 6750: {'lr': 0.0004987308210533546, 'samples': 1296000, 'steps': 6749, 'loss/train': 2.241203784942627} -08/30/2021 14:23:43 - INFO - __main__ - Step 6751: {'lr': 0.0004987302869463686, 'samples': 1296192, 'steps': 6750, 'loss/train': 1.5493972301483154} -08/30/2021 14:23:44 - INFO - __main__ - Step 6752: {'lr': 0.0004987297527273088, 'samples': 1296384, 'steps': 6751, 'loss/train': 1.926452875137329} -08/30/2021 14:23:44 - INFO - __main__ - Step 6753: {'lr': 0.0004987292183961751, 'samples': 1296576, 'steps': 6752, 'loss/train': 2.1413750648498535} -08/30/2021 14:23:45 - INFO - __main__ - Step 6754: {'lr': 0.0004987286839529679, 'samples': 1296768, 'steps': 6753, 'loss/train': 2.2889134883880615} -08/30/2021 14:23:46 - INFO - __main__ - Step 6755: {'lr': 0.0004987281493976873, 'samples': 1296960, 'steps': 6754, 'loss/train': 1.719522476196289} -08/30/2021 14:23:47 - INFO - __main__ - Step 6756: {'lr': 0.0004987276147303337, 'samples': 1297152, 'steps': 6755, 'loss/train': 1.0310285091400146} -08/30/2021 14:23:47 - INFO - __main__ - Step 6757: {'lr': 0.0004987270799509071, 'samples': 1297344, 'steps': 6756, 'loss/train': 1.7240643501281738} -08/30/2021 14:23:47 - INFO - __main__ - Step 6758: {'lr': 0.0004987265450594082, 'samples': 1297536, 'steps': 6757, 'loss/train': 2.399144411087036} -08/30/2021 14:23:48 - INFO - __main__ - Step 6759: {'lr': 0.0004987260100558368, 'samples': 1297728, 'steps': 6758, 'loss/train': 1.979913592338562} -08/30/2021 14:23:48 - INFO - __main__ - Step 6760: {'lr': 0.0004987254749401933, 'samples': 1297920, 'steps': 6759, 'loss/train': 2.0695018768310547} -08/30/2021 14:23:50 - INFO - __main__ - Step 6761: {'lr': 0.000498724939712478, 'samples': 1298112, 'steps': 6760, 'loss/train': 1.8059402704238892} -08/30/2021 14:23:50 - INFO - __main__ - Step 6762: {'lr': 0.000498724404372691, 'samples': 1298304, 'steps': 6761, 'loss/train': 2.115511894226074} -08/30/2021 14:23:51 - INFO - __main__ - Step 6763: {'lr': 0.0004987238689208327, 'samples': 1298496, 'steps': 6762, 'loss/train': 1.4486254453659058} -08/30/2021 14:23:51 - INFO - __main__ - Step 6764: {'lr': 0.0004987233333569031, 'samples': 1298688, 'steps': 6763, 'loss/train': 1.998164415359497} -08/30/2021 14:23:52 - INFO - __main__ - Step 6765: {'lr': 0.0004987227976809028, 'samples': 1298880, 'steps': 6764, 'loss/train': 1.8888225555419922} -08/30/2021 14:23:53 - INFO - __main__ - Step 6766: {'lr': 0.0004987222618928318, 'samples': 1299072, 'steps': 6765, 'loss/train': 2.2598750591278076} -08/30/2021 14:23:54 - INFO - __main__ - Step 6767: {'lr': 0.0004987217259926904, 'samples': 1299264, 'steps': 6766, 'loss/train': 2.020343542098999} -08/30/2021 14:23:54 - INFO - __main__ - Step 6768: {'lr': 0.0004987211899804788, 'samples': 1299456, 'steps': 6767, 'loss/train': 0.40296754240989685} -08/30/2021 14:23:55 - INFO - __main__ - Step 6769: {'lr': 0.0004987206538561972, 'samples': 1299648, 'steps': 6768, 'loss/train': 1.9753944873809814} -08/30/2021 14:23:55 - INFO - __main__ - Step 6770: {'lr': 0.000498720117619846, 'samples': 1299840, 'steps': 6769, 'loss/train': 2.3677124977111816} -08/30/2021 14:23:55 - INFO - __main__ - Step 6771: {'lr': 0.0004987195812714252, 'samples': 1300032, 'steps': 6770, 'loss/train': 2.1042680740356445} -08/30/2021 14:23:57 - INFO - __main__ - Step 6772: {'lr': 0.0004987190448109354, 'samples': 1300224, 'steps': 6771, 'loss/train': 1.5415616035461426} -08/30/2021 14:23:57 - INFO - __main__ - Step 6773: {'lr': 0.0004987185082383765, 'samples': 1300416, 'steps': 6772, 'loss/train': 2.4632744789123535} -08/30/2021 14:23:58 - INFO - __main__ - Step 6774: {'lr': 0.000498717971553749, 'samples': 1300608, 'steps': 6773, 'loss/train': 2.1802873611450195} -08/30/2021 14:23:58 - INFO - __main__ - Step 6775: {'lr': 0.0004987174347570529, 'samples': 1300800, 'steps': 6774, 'loss/train': 2.395963191986084} -08/30/2021 14:23:58 - INFO - __main__ - Step 6776: {'lr': 0.0004987168978482886, 'samples': 1300992, 'steps': 6775, 'loss/train': 0.7819046974182129} -08/30/2021 14:24:00 - INFO - __main__ - Step 6777: {'lr': 0.0004987163608274564, 'samples': 1301184, 'steps': 6776, 'loss/train': 1.1793291568756104} -08/30/2021 14:24:01 - INFO - __main__ - Step 6778: {'lr': 0.0004987158236945563, 'samples': 1301376, 'steps': 6777, 'loss/train': 1.8890621662139893} -08/30/2021 14:24:01 - INFO - __main__ - Step 6779: {'lr': 0.0004987152864495887, 'samples': 1301568, 'steps': 6778, 'loss/train': 1.978233814239502} -08/30/2021 14:24:01 - INFO - __main__ - Step 6780: {'lr': 0.000498714749092554, 'samples': 1301760, 'steps': 6779, 'loss/train': 1.9923200607299805} -08/30/2021 14:24:02 - INFO - __main__ - Step 6781: {'lr': 0.0004987142116234521, 'samples': 1301952, 'steps': 6780, 'loss/train': 2.3988027572631836} -08/30/2021 14:24:02 - INFO - __main__ - Step 6782: {'lr': 0.0004987136740422835, 'samples': 1302144, 'steps': 6781, 'loss/train': 1.3582043647766113} -08/30/2021 14:24:03 - INFO - __main__ - Step 6783: {'lr': 0.0004987131363490483, 'samples': 1302336, 'steps': 6782, 'loss/train': 1.930040717124939} -08/30/2021 14:24:04 - INFO - __main__ - Step 6784: {'lr': 0.0004987125985437468, 'samples': 1302528, 'steps': 6783, 'loss/train': 1.0334081649780273} -08/30/2021 14:24:04 - INFO - __main__ - Step 6785: {'lr': 0.0004987120606263794, 'samples': 1302720, 'steps': 6784, 'loss/train': 1.7500663995742798} -08/30/2021 14:24:05 - INFO - __main__ - Step 6786: {'lr': 0.000498711522596946, 'samples': 1302912, 'steps': 6785, 'loss/train': 0.2875692546367645} -08/30/2021 14:24:05 - INFO - __main__ - Step 6787: {'lr': 0.000498710984455447, 'samples': 1303104, 'steps': 6786, 'loss/train': 1.5875511169433594} -08/30/2021 14:24:07 - INFO - __main__ - Step 6788: {'lr': 0.0004987104462018828, 'samples': 1303296, 'steps': 6787, 'loss/train': 2.2025222778320312} -08/30/2021 14:24:07 - INFO - __main__ - Step 6789: {'lr': 0.0004987099078362534, 'samples': 1303488, 'steps': 6788, 'loss/train': 2.0818910598754883} -08/30/2021 14:24:07 - INFO - __main__ - Step 6790: {'lr': 0.0004987093693585591, 'samples': 1303680, 'steps': 6789, 'loss/train': 0.3496999740600586} -08/30/2021 14:24:08 - INFO - __main__ - Step 6791: {'lr': 0.0004987088307688004, 'samples': 1303872, 'steps': 6790, 'loss/train': 2.0117506980895996} -08/30/2021 14:24:08 - INFO - __main__ - Step 6792: {'lr': 0.0004987082920669772, 'samples': 1304064, 'steps': 6791, 'loss/train': 1.7049227952957153} -08/30/2021 14:24:10 - INFO - __main__ - Step 6793: {'lr': 0.0004987077532530899, 'samples': 1304256, 'steps': 6792, 'loss/train': 1.7496565580368042} -08/30/2021 14:24:11 - INFO - __main__ - Step 6794: {'lr': 0.0004987072143271388, 'samples': 1304448, 'steps': 6793, 'loss/train': 1.5691767930984497} -08/30/2021 14:24:11 - INFO - __main__ - Step 6795: {'lr': 0.000498706675289124, 'samples': 1304640, 'steps': 6794, 'loss/train': 1.5983797311782837} -08/30/2021 14:24:11 - INFO - __main__ - Step 6796: {'lr': 0.0004987061361390458, 'samples': 1304832, 'steps': 6795, 'loss/train': 2.4334306716918945} -08/30/2021 14:24:12 - INFO - __main__ - Step 6797: {'lr': 0.0004987055968769045, 'samples': 1305024, 'steps': 6796, 'loss/train': 2.1273531913757324} -08/30/2021 14:24:14 - INFO - __main__ - Step 6798: {'lr': 0.0004987050575027002, 'samples': 1305216, 'steps': 6797, 'loss/train': 2.0953638553619385} -08/30/2021 14:24:14 - INFO - __main__ - Step 6799: {'lr': 0.0004987045180164333, 'samples': 1305408, 'steps': 6798, 'loss/train': 2.4452297687530518} -08/30/2021 14:24:14 - INFO - __main__ - Step 6800: {'lr': 0.0004987039784181041, 'samples': 1305600, 'steps': 6799, 'loss/train': 1.2725753784179688} -08/30/2021 14:24:15 - INFO - __main__ - Step 6801: {'lr': 0.0004987034387077126, 'samples': 1305792, 'steps': 6800, 'loss/train': 2.0912978649139404} -08/30/2021 14:24:15 - INFO - __main__ - Step 6802: {'lr': 0.0004987028988852592, 'samples': 1305984, 'steps': 6801, 'loss/train': 2.162841796875} -08/30/2021 14:24:17 - INFO - __main__ - Step 6803: {'lr': 0.0004987023589507441, 'samples': 1306176, 'steps': 6802, 'loss/train': 0.22545507550239563} -08/30/2021 14:24:18 - INFO - __main__ - Step 6804: {'lr': 0.0004987018189041675, 'samples': 1306368, 'steps': 6803, 'loss/train': 1.98037850856781} -08/30/2021 14:24:18 - INFO - __main__ - Step 6805: {'lr': 0.0004987012787455297, 'samples': 1306560, 'steps': 6804, 'loss/train': 2.3976211547851562} -08/30/2021 14:24:19 - INFO - __main__ - Step 6806: {'lr': 0.000498700738474831, 'samples': 1306752, 'steps': 6805, 'loss/train': 1.7677881717681885} -08/30/2021 14:24:19 - INFO - __main__ - Step 6807: {'lr': 0.0004987001980920716, 'samples': 1306944, 'steps': 6806, 'loss/train': 1.782514214515686} -08/30/2021 14:24:19 - INFO - __main__ - Step 6808: {'lr': 0.0004986996575972517, 'samples': 1307136, 'steps': 6807, 'loss/train': 1.991308331489563} -08/30/2021 14:24:21 - INFO - __main__ - Step 6809: {'lr': 0.0004986991169903716, 'samples': 1307328, 'steps': 6808, 'loss/train': 1.7893410921096802} -08/30/2021 14:24:21 - INFO - __main__ - Step 6810: {'lr': 0.0004986985762714314, 'samples': 1307520, 'steps': 6809, 'loss/train': 2.308098077774048} -08/30/2021 14:24:22 - INFO - __main__ - Step 6811: {'lr': 0.0004986980354404316, 'samples': 1307712, 'steps': 6810, 'loss/train': 2.290099859237671} -08/30/2021 14:24:22 - INFO - __main__ - Step 6812: {'lr': 0.0004986974944973723, 'samples': 1307904, 'steps': 6811, 'loss/train': 1.5586804151535034} -08/30/2021 14:24:22 - INFO - __main__ - Step 6813: {'lr': 0.0004986969534422537, 'samples': 1308096, 'steps': 6812, 'loss/train': 1.7913575172424316} -08/30/2021 14:24:24 - INFO - __main__ - Step 6814: {'lr': 0.000498696412275076, 'samples': 1308288, 'steps': 6813, 'loss/train': 2.0737788677215576} -08/30/2021 14:24:24 - INFO - __main__ - Step 6815: {'lr': 0.0004986958709958396, 'samples': 1308480, 'steps': 6814, 'loss/train': 1.83364737033844} -08/30/2021 14:24:25 - INFO - __main__ - Step 6816: {'lr': 0.0004986953296045448, 'samples': 1308672, 'steps': 6815, 'loss/train': 2.073204278945923} -08/30/2021 14:24:25 - INFO - __main__ - Step 6817: {'lr': 0.0004986947881011917, 'samples': 1308864, 'steps': 6816, 'loss/train': 1.7709569931030273} -08/30/2021 14:24:25 - INFO - __main__ - Step 6818: {'lr': 0.0004986942464857804, 'samples': 1309056, 'steps': 6817, 'loss/train': 2.5167927742004395} -08/30/2021 14:24:27 - INFO - __main__ - Step 6819: {'lr': 0.0004986937047583114, 'samples': 1309248, 'steps': 6818, 'loss/train': 2.1112968921661377} -08/30/2021 14:24:27 - INFO - __main__ - Step 6820: {'lr': 0.0004986931629187848, 'samples': 1309440, 'steps': 6819, 'loss/train': 1.6558749675750732} -08/30/2021 14:24:28 - INFO - __main__ - Step 6821: {'lr': 0.0004986926209672011, 'samples': 1309632, 'steps': 6820, 'loss/train': 2.2070367336273193} -08/30/2021 14:24:28 - INFO - __main__ - Step 6822: {'lr': 0.0004986920789035601, 'samples': 1309824, 'steps': 6821, 'loss/train': 2.034654378890991} -08/30/2021 14:24:28 - INFO - __main__ - Step 6823: {'lr': 0.0004986915367278623, 'samples': 1310016, 'steps': 6822, 'loss/train': 2.2571158409118652} -08/30/2021 14:24:30 - INFO - __main__ - Step 6824: {'lr': 0.0004986909944401082, 'samples': 1310208, 'steps': 6823, 'loss/train': 1.7329366207122803} -08/30/2021 14:24:30 - INFO - __main__ - Step 6825: {'lr': 0.0004986904520402975, 'samples': 1310400, 'steps': 6824, 'loss/train': 2.0557992458343506} -08/30/2021 14:24:31 - INFO - __main__ - Step 6826: {'lr': 0.0004986899095284308, 'samples': 1310592, 'steps': 6825, 'loss/train': 2.339568853378296} -08/30/2021 14:24:31 - INFO - __main__ - Step 6827: {'lr': 0.0004986893669045083, 'samples': 1310784, 'steps': 6826, 'loss/train': 2.054544448852539} -08/30/2021 14:24:31 - INFO - __main__ - Step 6828: {'lr': 0.0004986888241685301, 'samples': 1310976, 'steps': 6827, 'loss/train': 2.110914707183838} -08/30/2021 14:24:32 - INFO - __main__ - Step 6829: {'lr': 0.0004986882813204967, 'samples': 1311168, 'steps': 6828, 'loss/train': 1.8011455535888672} -08/30/2021 14:24:33 - INFO - __main__ - Step 6830: {'lr': 0.0004986877383604081, 'samples': 1311360, 'steps': 6829, 'loss/train': 0.4001435339450836} -08/30/2021 14:24:34 - INFO - __main__ - Step 6831: {'lr': 0.0004986871952882647, 'samples': 1311552, 'steps': 6830, 'loss/train': 2.1137337684631348} -08/30/2021 14:24:34 - INFO - __main__ - Step 6832: {'lr': 0.0004986866521040666, 'samples': 1311744, 'steps': 6831, 'loss/train': 1.8895313739776611} -08/30/2021 14:24:34 - INFO - __main__ - Step 6833: {'lr': 0.0004986861088078142, 'samples': 1311936, 'steps': 6832, 'loss/train': 2.1450235843658447} -08/30/2021 14:24:35 - INFO - __main__ - Step 6834: {'lr': 0.0004986855653995077, 'samples': 1312128, 'steps': 6833, 'loss/train': 2.0607025623321533} -08/30/2021 14:24:36 - INFO - __main__ - Step 6835: {'lr': 0.0004986850218791474, 'samples': 1312320, 'steps': 6834, 'loss/train': 1.6316173076629639} -08/30/2021 14:24:37 - INFO - __main__ - Step 6836: {'lr': 0.0004986844782467332, 'samples': 1312512, 'steps': 6835, 'loss/train': 1.3658430576324463} -08/30/2021 14:24:37 - INFO - __main__ - Step 6837: {'lr': 0.0004986839345022658, 'samples': 1312704, 'steps': 6836, 'loss/train': 1.4744865894317627} -08/30/2021 14:24:37 - INFO - __main__ - Step 6838: {'lr': 0.0004986833906457453, 'samples': 1312896, 'steps': 6837, 'loss/train': 1.8350540399551392} -08/30/2021 14:24:38 - INFO - __main__ - Step 6839: {'lr': 0.0004986828466771718, 'samples': 1313088, 'steps': 6838, 'loss/train': 1.6223552227020264} -08/30/2021 14:24:40 - INFO - __main__ - Step 6840: {'lr': 0.0004986823025965457, 'samples': 1313280, 'steps': 6839, 'loss/train': 2.226318120956421} -08/30/2021 14:24:40 - INFO - __main__ - Step 6841: {'lr': 0.0004986817584038671, 'samples': 1313472, 'steps': 6840, 'loss/train': 2.0610363483428955} -08/30/2021 14:24:41 - INFO - __main__ - Step 6842: {'lr': 0.0004986812140991365, 'samples': 1313664, 'steps': 6841, 'loss/train': 2.3503642082214355} -08/30/2021 14:24:41 - INFO - __main__ - Step 6843: {'lr': 0.0004986806696823538, 'samples': 1313856, 'steps': 6842, 'loss/train': 1.8314342498779297} -08/30/2021 14:24:41 - INFO - __main__ - Step 6844: {'lr': 0.0004986801251535195, 'samples': 1314048, 'steps': 6843, 'loss/train': 1.357712745666504} -08/30/2021 14:24:42 - INFO - __main__ - Step 6845: {'lr': 0.0004986795805126339, 'samples': 1314240, 'steps': 6844, 'loss/train': 2.556453227996826} -08/30/2021 14:24:43 - INFO - __main__ - Step 6846: {'lr': 0.000498679035759697, 'samples': 1314432, 'steps': 6845, 'loss/train': 2.0000977516174316} -08/30/2021 14:24:44 - INFO - __main__ - Step 6847: {'lr': 0.0004986784908947091, 'samples': 1314624, 'steps': 6846, 'loss/train': 1.7936652898788452} -08/30/2021 14:24:44 - INFO - __main__ - Step 6848: {'lr': 0.0004986779459176706, 'samples': 1314816, 'steps': 6847, 'loss/train': 2.091332197189331} -08/30/2021 14:24:44 - INFO - __main__ - Step 6849: {'lr': 0.0004986774008285816, 'samples': 1315008, 'steps': 6848, 'loss/train': 1.9367101192474365} -08/30/2021 14:24:45 - INFO - __main__ - Step 6850: {'lr': 0.0004986768556274425, 'samples': 1315200, 'steps': 6849, 'loss/train': 1.8169887065887451} -08/30/2021 14:24:47 - INFO - __main__ - Step 6851: {'lr': 0.0004986763103142533, 'samples': 1315392, 'steps': 6850, 'loss/train': 1.878724217414856} -08/30/2021 14:24:47 - INFO - __main__ - Step 6852: {'lr': 0.0004986757648890145, 'samples': 1315584, 'steps': 6851, 'loss/train': 0.44878795742988586} -08/30/2021 14:24:47 - INFO - __main__ - Step 6853: {'lr': 0.0004986752193517262, 'samples': 1315776, 'steps': 6852, 'loss/train': 0.3569950461387634} -08/30/2021 14:24:48 - INFO - __main__ - Step 6854: {'lr': 0.0004986746737023887, 'samples': 1315968, 'steps': 6853, 'loss/train': 1.8973006010055542} -08/30/2021 14:24:48 - INFO - __main__ - Step 6855: {'lr': 0.0004986741279410023, 'samples': 1316160, 'steps': 6854, 'loss/train': 2.3209033012390137} -08/30/2021 14:24:49 - INFO - __main__ - Step 6856: {'lr': 0.000498673582067567, 'samples': 1316352, 'steps': 6855, 'loss/train': 1.9644896984100342} -08/30/2021 14:24:51 - INFO - __main__ - Step 6857: {'lr': 0.0004986730360820833, 'samples': 1316544, 'steps': 6856, 'loss/train': 0.8535609841346741} -08/30/2021 14:24:51 - INFO - __main__ - Step 6858: {'lr': 0.0004986724899845514, 'samples': 1316736, 'steps': 6857, 'loss/train': 2.2894835472106934} -08/30/2021 14:24:52 - INFO - __main__ - Step 6859: {'lr': 0.0004986719437749716, 'samples': 1316928, 'steps': 6858, 'loss/train': 1.8458828926086426} -08/30/2021 14:24:52 - INFO - __main__ - Step 6860: {'lr': 0.0004986713974533439, 'samples': 1317120, 'steps': 6859, 'loss/train': 1.8802374601364136} -08/30/2021 14:24:52 - INFO - __main__ - Step 6861: {'lr': 0.0004986708510196688, 'samples': 1317312, 'steps': 6860, 'loss/train': 1.9847824573516846} -08/30/2021 14:24:54 - INFO - __main__ - Step 6862: {'lr': 0.0004986703044739464, 'samples': 1317504, 'steps': 6861, 'loss/train': 1.9645650386810303} -08/30/2021 14:24:54 - INFO - __main__ - Step 6863: {'lr': 0.000498669757816177, 'samples': 1317696, 'steps': 6862, 'loss/train': 2.2547049522399902} -08/30/2021 14:24:55 - INFO - __main__ - Step 6864: {'lr': 0.0004986692110463609, 'samples': 1317888, 'steps': 6863, 'loss/train': 1.7505618333816528} -08/30/2021 14:24:55 - INFO - __main__ - Step 6865: {'lr': 0.0004986686641644982, 'samples': 1318080, 'steps': 6864, 'loss/train': 1.7786399126052856} -08/30/2021 14:24:55 - INFO - __main__ - Step 6866: {'lr': 0.0004986681171705893, 'samples': 1318272, 'steps': 6865, 'loss/train': 2.016984462738037} -08/30/2021 14:24:57 - INFO - __main__ - Step 6867: {'lr': 0.0004986675700646343, 'samples': 1318464, 'steps': 6866, 'loss/train': 2.2723960876464844} -08/30/2021 14:24:57 - INFO - __main__ - Step 6868: {'lr': 0.0004986670228466337, 'samples': 1318656, 'steps': 6867, 'loss/train': 1.8527895212173462} -08/30/2021 14:24:58 - INFO - __main__ - Step 6869: {'lr': 0.0004986664755165874, 'samples': 1318848, 'steps': 6868, 'loss/train': 1.8059288263320923} -08/30/2021 14:24:58 - INFO - __main__ - Step 6870: {'lr': 0.000498665928074496, 'samples': 1319040, 'steps': 6869, 'loss/train': 2.1040046215057373} -08/30/2021 14:24:58 - INFO - __main__ - Step 6871: {'lr': 0.0004986653805203594, 'samples': 1319232, 'steps': 6870, 'loss/train': 1.7492882013320923} -08/30/2021 14:25:01 - INFO - __main__ - Step 6872: {'lr': 0.0004986648328541781, 'samples': 1319424, 'steps': 6871, 'loss/train': 2.2070772647857666} -08/30/2021 14:25:01 - INFO - __main__ - Step 6873: {'lr': 0.0004986642850759522, 'samples': 1319616, 'steps': 6872, 'loss/train': 2.392061471939087} -08/30/2021 14:25:02 - INFO - __main__ - Step 6874: {'lr': 0.0004986637371856822, 'samples': 1319808, 'steps': 6873, 'loss/train': 2.4519708156585693} -08/30/2021 14:25:02 - INFO - __main__ - Step 6875: {'lr': 0.000498663189183368, 'samples': 1320000, 'steps': 6874, 'loss/train': 1.9604814052581787} -08/30/2021 14:25:02 - INFO - __main__ - Step 6876: {'lr': 0.0004986626410690099, 'samples': 1320192, 'steps': 6875, 'loss/train': 3.5625247955322266} -08/30/2021 14:25:03 - INFO - __main__ - Step 6877: {'lr': 0.0004986620928426085, 'samples': 1320384, 'steps': 6876, 'loss/train': 3.1079251766204834} -08/30/2021 14:25:03 - INFO - __main__ - Step 6878: {'lr': 0.0004986615445041636, 'samples': 1320576, 'steps': 6877, 'loss/train': 3.7473766803741455} -08/30/2021 14:25:05 - INFO - __main__ - Step 6879: {'lr': 0.0004986609960536757, 'samples': 1320768, 'steps': 6878, 'loss/train': 3.530379295349121} -08/30/2021 14:25:05 - INFO - __main__ - Step 6880: {'lr': 0.000498660447491145, 'samples': 1320960, 'steps': 6879, 'loss/train': 2.179630756378174} -08/30/2021 14:25:05 - INFO - __main__ - Step 6881: {'lr': 0.0004986598988165718, 'samples': 1321152, 'steps': 6880, 'loss/train': 2.343501091003418} -08/30/2021 14:25:06 - INFO - __main__ - Step 6882: {'lr': 0.0004986593500299562, 'samples': 1321344, 'steps': 6881, 'loss/train': 2.252079486846924} -08/30/2021 14:25:06 - INFO - __main__ - Step 6883: {'lr': 0.0004986588011312986, 'samples': 1321536, 'steps': 6882, 'loss/train': 1.9850687980651855} -08/30/2021 14:25:07 - INFO - __main__ - Step 6884: {'lr': 0.0004986582521205992, 'samples': 1321728, 'steps': 6883, 'loss/train': 2.7311408519744873} -08/30/2021 14:25:08 - INFO - __main__ - Step 6885: {'lr': 0.0004986577029978581, 'samples': 1321920, 'steps': 6884, 'loss/train': 2.176633834838867} -08/30/2021 14:25:08 - INFO - __main__ - Step 6886: {'lr': 0.0004986571537630757, 'samples': 1322112, 'steps': 6885, 'loss/train': 2.2490451335906982} -08/30/2021 14:25:09 - INFO - __main__ - Step 6887: {'lr': 0.0004986566044162523, 'samples': 1322304, 'steps': 6886, 'loss/train': 2.356243848800659} -08/30/2021 14:25:09 - INFO - __main__ - Step 6888: {'lr': 0.0004986560549573881, 'samples': 1322496, 'steps': 6887, 'loss/train': 2.1619279384613037} -08/30/2021 14:25:11 - INFO - __main__ - Step 6889: {'lr': 0.0004986555053864833, 'samples': 1322688, 'steps': 6888, 'loss/train': 1.0654551982879639} -08/30/2021 14:25:11 - INFO - __main__ - Step 6890: {'lr': 0.0004986549557035381, 'samples': 1322880, 'steps': 6889, 'loss/train': 2.1010587215423584} -08/30/2021 14:25:11 - INFO - __main__ - Step 6891: {'lr': 0.0004986544059085528, 'samples': 1323072, 'steps': 6890, 'loss/train': 2.5215981006622314} -08/30/2021 14:25:12 - INFO - __main__ - Step 6892: {'lr': 0.0004986538560015277, 'samples': 1323264, 'steps': 6891, 'loss/train': 1.2634923458099365} -08/30/2021 14:25:12 - INFO - __main__ - Step 6893: {'lr': 0.000498653305982463, 'samples': 1323456, 'steps': 6892, 'loss/train': 2.037827968597412} -08/30/2021 14:25:14 - INFO - __main__ - Step 6894: {'lr': 0.0004986527558513591, 'samples': 1323648, 'steps': 6893, 'loss/train': 2.1294493675231934} -08/30/2021 14:25:14 - INFO - __main__ - Step 6895: {'lr': 0.0004986522056082159, 'samples': 1323840, 'steps': 6894, 'loss/train': 2.2286181449890137} -08/30/2021 14:25:14 - INFO - __main__ - Step 6896: {'lr': 0.0004986516552530339, 'samples': 1324032, 'steps': 6895, 'loss/train': 2.290353536605835} -08/30/2021 14:25:15 - INFO - __main__ - Step 6897: {'lr': 0.0004986511047858134, 'samples': 1324224, 'steps': 6896, 'loss/train': 2.7949278354644775} -08/30/2021 14:25:15 - INFO - __main__ - Step 6898: {'lr': 0.0004986505542065545, 'samples': 1324416, 'steps': 6897, 'loss/train': 2.1150217056274414} -08/30/2021 14:25:15 - INFO - __main__ - Step 6899: {'lr': 0.0004986500035152574, 'samples': 1324608, 'steps': 6898, 'loss/train': 6.054328441619873} -08/30/2021 14:25:17 - INFO - __main__ - Step 6900: {'lr': 0.0004986494527119226, 'samples': 1324800, 'steps': 6899, 'loss/train': 1.3928371667861938} -08/30/2021 14:25:17 - INFO - __main__ - Step 6901: {'lr': 0.0004986489017965501, 'samples': 1324992, 'steps': 6900, 'loss/train': 2.4879472255706787} -08/30/2021 14:25:18 - INFO - __main__ - Step 6902: {'lr': 0.0004986483507691403, 'samples': 1325184, 'steps': 6901, 'loss/train': 2.4172821044921875} -08/30/2021 14:25:18 - INFO - __main__ - Step 6903: {'lr': 0.0004986477996296934, 'samples': 1325376, 'steps': 6902, 'loss/train': 2.3754258155822754} -08/30/2021 14:25:18 - INFO - __main__ - Step 6904: {'lr': 0.0004986472483782096, 'samples': 1325568, 'steps': 6903, 'loss/train': 2.2065625190734863} -08/30/2021 14:25:20 - INFO - __main__ - Step 6905: {'lr': 0.0004986466970146891, 'samples': 1325760, 'steps': 6904, 'loss/train': 1.9135076999664307} -08/30/2021 14:25:20 - INFO - __main__ - Step 6906: {'lr': 0.0004986461455391323, 'samples': 1325952, 'steps': 6905, 'loss/train': 2.574843168258667} -08/30/2021 14:25:21 - INFO - __main__ - Step 6907: {'lr': 0.0004986455939515395, 'samples': 1326144, 'steps': 6906, 'loss/train': 2.348473310470581} -08/30/2021 14:25:21 - INFO - __main__ - Step 6908: {'lr': 0.0004986450422519107, 'samples': 1326336, 'steps': 6907, 'loss/train': 1.73892343044281} -08/30/2021 14:25:21 - INFO - __main__ - Step 6909: {'lr': 0.0004986444904402463, 'samples': 1326528, 'steps': 6908, 'loss/train': 2.617375612258911} -08/30/2021 14:25:24 - INFO - __main__ - Step 6910: {'lr': 0.0004986439385165464, 'samples': 1326720, 'steps': 6909, 'loss/train': 1.8800106048583984} -08/30/2021 14:25:24 - INFO - __main__ - Step 6911: {'lr': 0.0004986433864808115, 'samples': 1326912, 'steps': 6910, 'loss/train': 1.7740297317504883} -08/30/2021 14:25:24 - INFO - __main__ - Step 6912: {'lr': 0.0004986428343330418, 'samples': 1327104, 'steps': 6911, 'loss/train': 1.7741312980651855} -08/30/2021 14:25:25 - INFO - __main__ - Step 6913: {'lr': 0.0004986422820732375, 'samples': 1327296, 'steps': 6912, 'loss/train': 2.144261121749878} -08/30/2021 14:25:25 - INFO - __main__ - Step 6914: {'lr': 0.0004986417297013987, 'samples': 1327488, 'steps': 6913, 'loss/train': 1.825107216835022} -08/30/2021 14:25:27 - INFO - __main__ - Step 6915: {'lr': 0.0004986411772175258, 'samples': 1327680, 'steps': 6914, 'loss/train': 1.8923066854476929} -08/30/2021 14:25:27 - INFO - __main__ - Step 6916: {'lr': 0.000498640624621619, 'samples': 1327872, 'steps': 6915, 'loss/train': 2.145782470703125} -08/30/2021 14:25:27 - INFO - __main__ - Step 6917: {'lr': 0.0004986400719136786, 'samples': 1328064, 'steps': 6916, 'loss/train': 1.1515460014343262} -08/30/2021 14:25:28 - INFO - __main__ - Step 6918: {'lr': 0.0004986395190937048, 'samples': 1328256, 'steps': 6917, 'loss/train': 1.7062408924102783} -08/30/2021 14:25:28 - INFO - __main__ - Step 6919: {'lr': 0.000498638966161698, 'samples': 1328448, 'steps': 6918, 'loss/train': 2.4489738941192627} -08/30/2021 14:25:30 - INFO - __main__ - Step 6920: {'lr': 0.0004986384131176583, 'samples': 1328640, 'steps': 6919, 'loss/train': 1.9976365566253662} -08/30/2021 14:25:30 - INFO - __main__ - Step 6921: {'lr': 0.0004986378599615858, 'samples': 1328832, 'steps': 6920, 'loss/train': 1.6281598806381226} -08/30/2021 14:25:31 - INFO - __main__ - Step 6922: {'lr': 0.000498637306693481, 'samples': 1329024, 'steps': 6921, 'loss/train': 0.7272114157676697} -08/30/2021 14:25:31 - INFO - __main__ - Step 6923: {'lr': 0.0004986367533133441, 'samples': 1329216, 'steps': 6922, 'loss/train': 0.37977930903434753} -08/30/2021 14:25:31 - INFO - __main__ - Step 6924: {'lr': 0.0004986361998211752, 'samples': 1329408, 'steps': 6923, 'loss/train': 1.578798532485962} -08/30/2021 14:25:32 - INFO - __main__ - Step 6925: {'lr': 0.0004986356462169748, 'samples': 1329600, 'steps': 6924, 'loss/train': 1.8063700199127197} -08/30/2021 14:25:33 - INFO - __main__ - Step 6926: {'lr': 0.0004986350925007429, 'samples': 1329792, 'steps': 6925, 'loss/train': 1.6588304042816162} -08/30/2021 14:25:34 - INFO - __main__ - Step 6927: {'lr': 0.00049863453867248, 'samples': 1329984, 'steps': 6926, 'loss/train': 1.6391549110412598} -08/30/2021 14:25:34 - INFO - __main__ - Step 6928: {'lr': 0.0004986339847321862, 'samples': 1330176, 'steps': 6927, 'loss/train': 2.2844653129577637} -08/30/2021 14:25:35 - INFO - __main__ - Step 6929: {'lr': 0.0004986334306798616, 'samples': 1330368, 'steps': 6928, 'loss/train': 2.1090357303619385} -08/30/2021 14:25:35 - INFO - __main__ - Step 6930: {'lr': 0.0004986328765155068, 'samples': 1330560, 'steps': 6929, 'loss/train': 2.138875961303711} -08/30/2021 14:25:36 - INFO - __main__ - Step 6931: {'lr': 0.0004986323222391217, 'samples': 1330752, 'steps': 6930, 'loss/train': 1.4466071128845215} -08/30/2021 14:25:37 - INFO - __main__ - Step 6932: {'lr': 0.0004986317678507069, 'samples': 1330944, 'steps': 6931, 'loss/train': 2.406386137008667} -08/30/2021 14:25:37 - INFO - __main__ - Step 6933: {'lr': 0.0004986312133502623, 'samples': 1331136, 'steps': 6932, 'loss/train': 2.288001537322998} -08/30/2021 14:25:38 - INFO - __main__ - Step 6934: {'lr': 0.0004986306587377884, 'samples': 1331328, 'steps': 6933, 'loss/train': 2.0331573486328125} -08/30/2021 14:25:38 - INFO - __main__ - Step 6935: {'lr': 0.0004986301040132853, 'samples': 1331520, 'steps': 6934, 'loss/train': 1.7046838998794556} -08/30/2021 14:25:39 - INFO - __main__ - Step 6936: {'lr': 0.0004986295491767533, 'samples': 1331712, 'steps': 6935, 'loss/train': 2.325742244720459} -08/30/2021 14:25:40 - INFO - __main__ - Step 6937: {'lr': 0.0004986289942281927, 'samples': 1331904, 'steps': 6936, 'loss/train': 2.508173942565918} -08/30/2021 14:25:40 - INFO - __main__ - Step 6938: {'lr': 0.0004986284391676037, 'samples': 1332096, 'steps': 6937, 'loss/train': 0.506510853767395} -08/30/2021 14:25:41 - INFO - __main__ - Step 6939: {'lr': 0.0004986278839949866, 'samples': 1332288, 'steps': 6938, 'loss/train': 2.2064061164855957} -08/30/2021 14:25:41 - INFO - __main__ - Step 6940: {'lr': 0.0004986273287103416, 'samples': 1332480, 'steps': 6939, 'loss/train': 2.2642083168029785} -08/30/2021 14:25:41 - INFO - __main__ - Step 6941: {'lr': 0.0004986267733136689, 'samples': 1332672, 'steps': 6940, 'loss/train': 2.348919153213501} -08/30/2021 14:25:43 - INFO - __main__ - Step 6942: {'lr': 0.0004986262178049689, 'samples': 1332864, 'steps': 6941, 'loss/train': 1.9068524837493896} -08/30/2021 14:25:43 - INFO - __main__ - Step 6943: {'lr': 0.0004986256621842417, 'samples': 1333056, 'steps': 6942, 'loss/train': 2.513831853866577} -08/30/2021 14:25:44 - INFO - __main__ - Step 6944: {'lr': 0.0004986251064514878, 'samples': 1333248, 'steps': 6943, 'loss/train': 2.5233402252197266} -08/30/2021 14:25:44 - INFO - __main__ - Step 6945: {'lr': 0.000498624550606707, 'samples': 1333440, 'steps': 6944, 'loss/train': 2.2280867099761963} -08/30/2021 14:25:44 - INFO - __main__ - Step 6946: {'lr': 0.0004986239946498999, 'samples': 1333632, 'steps': 6945, 'loss/train': 1.7360042333602905} -08/30/2021 14:25:46 - INFO - __main__ - Step 6947: {'lr': 0.0004986234385810668, 'samples': 1333824, 'steps': 6946, 'loss/train': 3.6465749740600586} -08/30/2021 14:25:46 - INFO - __main__ - Step 6948: {'lr': 0.0004986228824002076, 'samples': 1334016, 'steps': 6947, 'loss/train': 2.2492029666900635} -08/30/2021 14:25:47 - INFO - __main__ - Step 6949: {'lr': 0.0004986223261073228, 'samples': 1334208, 'steps': 6948, 'loss/train': 1.952388882637024} -08/30/2021 14:25:47 - INFO - __main__ - Step 6950: {'lr': 0.0004986217697024128, 'samples': 1334400, 'steps': 6949, 'loss/train': 2.0262415409088135} -08/30/2021 14:25:47 - INFO - __main__ - Step 6951: {'lr': 0.0004986212131854775, 'samples': 1334592, 'steps': 6950, 'loss/train': 2.334930896759033} -08/30/2021 14:25:49 - INFO - __main__ - Step 6952: {'lr': 0.0004986206565565173, 'samples': 1334784, 'steps': 6951, 'loss/train': 1.644972801208496} -08/30/2021 14:25:50 - INFO - __main__ - Step 6953: {'lr': 0.0004986200998155325, 'samples': 1334976, 'steps': 6952, 'loss/train': 1.7954020500183105} -08/30/2021 14:25:50 - INFO - __main__ - Step 6954: {'lr': 0.0004986195429625234, 'samples': 1335168, 'steps': 6953, 'loss/train': 0.19723883271217346} -08/30/2021 14:25:50 - INFO - __main__ - Step 6955: {'lr': 0.0004986189859974901, 'samples': 1335360, 'steps': 6954, 'loss/train': 2.0334248542785645} -08/30/2021 14:25:51 - INFO - __main__ - Step 6956: {'lr': 0.000498618428920433, 'samples': 1335552, 'steps': 6955, 'loss/train': 1.721176028251648} -08/30/2021 14:25:51 - INFO - __main__ - Step 6957: {'lr': 0.0004986178717313522, 'samples': 1335744, 'steps': 6956, 'loss/train': 0.44948306679725647} -08/30/2021 14:25:53 - INFO - __main__ - Step 6958: {'lr': 0.000498617314430248, 'samples': 1335936, 'steps': 6957, 'loss/train': 0.3447542190551758} -08/30/2021 14:25:54 - INFO - __main__ - Step 6959: {'lr': 0.0004986167570171208, 'samples': 1336128, 'steps': 6958, 'loss/train': 2.662984609603882} -08/30/2021 14:25:54 - INFO - __main__ - Step 6960: {'lr': 0.0004986161994919706, 'samples': 1336320, 'steps': 6959, 'loss/train': 2.0758748054504395} -08/30/2021 14:25:54 - INFO - __main__ - Step 6961: {'lr': 0.0004986156418547978, 'samples': 1336512, 'steps': 6960, 'loss/train': 1.8414498567581177} -08/30/2021 14:25:55 - INFO - __main__ - Step 6962: {'lr': 0.0004986150841056027, 'samples': 1336704, 'steps': 6961, 'loss/train': 2.1176645755767822} -08/30/2021 14:25:55 - INFO - __main__ - Step 6963: {'lr': 0.0004986145262443854, 'samples': 1336896, 'steps': 6962, 'loss/train': 2.3262994289398193} -08/30/2021 14:25:56 - INFO - __main__ - Step 6964: {'lr': 0.0004986139682711463, 'samples': 1337088, 'steps': 6963, 'loss/train': 2.2248663902282715} -08/30/2021 14:25:57 - INFO - __main__ - Step 6965: {'lr': 0.0004986134101858854, 'samples': 1337280, 'steps': 6964, 'loss/train': 2.1714463233947754} -08/30/2021 14:25:57 - INFO - __main__ - Step 6966: {'lr': 0.0004986128519886033, 'samples': 1337472, 'steps': 6965, 'loss/train': 2.0460751056671143} -08/30/2021 14:25:58 - INFO - __main__ - Step 6967: {'lr': 0.0004986122936793, 'samples': 1337664, 'steps': 6966, 'loss/train': 2.76940655708313} -08/30/2021 14:25:58 - INFO - __main__ - Step 6968: {'lr': 0.000498611735257976, 'samples': 1337856, 'steps': 6967, 'loss/train': 2.16974139213562} -08/30/2021 14:26:00 - INFO - __main__ - Step 6969: {'lr': 0.0004986111767246313, 'samples': 1338048, 'steps': 6968, 'loss/train': 2.816469192504883} -08/30/2021 14:26:01 - INFO - __main__ - Step 6970: {'lr': 0.0004986106180792662, 'samples': 1338240, 'steps': 6969, 'loss/train': 2.0011513233184814} -08/30/2021 14:26:01 - INFO - __main__ - Step 6971: {'lr': 0.000498610059321881, 'samples': 1338432, 'steps': 6970, 'loss/train': 2.0067129135131836} -08/30/2021 14:26:01 - INFO - __main__ - Step 6972: {'lr': 0.000498609500452476, 'samples': 1338624, 'steps': 6971, 'loss/train': 2.03497576713562} -08/30/2021 14:26:02 - INFO - __main__ - Step 6973: {'lr': 0.0004986089414710513, 'samples': 1338816, 'steps': 6972, 'loss/train': 2.0776422023773193} -08/30/2021 14:26:03 - INFO - __main__ - Step 6974: {'lr': 0.0004986083823776073, 'samples': 1339008, 'steps': 6973, 'loss/train': 2.151496171951294} -08/30/2021 14:26:04 - INFO - __main__ - Step 6975: {'lr': 0.0004986078231721443, 'samples': 1339200, 'steps': 6974, 'loss/train': 1.8441307544708252} -08/30/2021 14:26:04 - INFO - __main__ - Step 6976: {'lr': 0.0004986072638546623, 'samples': 1339392, 'steps': 6975, 'loss/train': 1.173264503479004} -08/30/2021 14:26:04 - INFO - __main__ - Step 6977: {'lr': 0.0004986067044251617, 'samples': 1339584, 'steps': 6976, 'loss/train': 1.4295763969421387} -08/30/2021 14:26:05 - INFO - __main__ - Step 6978: {'lr': 0.0004986061448836428, 'samples': 1339776, 'steps': 6977, 'loss/train': 1.6548140048980713} -08/30/2021 14:26:05 - INFO - __main__ - Step 6979: {'lr': 0.0004986055852301058, 'samples': 1339968, 'steps': 6978, 'loss/train': 1.9921854734420776} -08/30/2021 14:26:06 - INFO - __main__ - Step 6980: {'lr': 0.000498605025464551, 'samples': 1340160, 'steps': 6979, 'loss/train': 1.6484514474868774} -08/30/2021 14:26:07 - INFO - __main__ - Step 6981: {'lr': 0.0004986044655869786, 'samples': 1340352, 'steps': 6980, 'loss/train': 2.116065502166748} -08/30/2021 14:26:07 - INFO - __main__ - Step 6982: {'lr': 0.0004986039055973889, 'samples': 1340544, 'steps': 6981, 'loss/train': 2.010517120361328} -08/30/2021 14:26:08 - INFO - __main__ - Step 6983: {'lr': 0.000498603345495782, 'samples': 1340736, 'steps': 6982, 'loss/train': 2.0259077548980713} -08/30/2021 14:26:08 - INFO - __main__ - Step 6984: {'lr': 0.0004986027852821583, 'samples': 1340928, 'steps': 6983, 'loss/train': 2.8793866634368896} -08/30/2021 14:26:09 - INFO - __main__ - Step 6985: {'lr': 0.000498602224956518, 'samples': 1341120, 'steps': 6984, 'loss/train': 2.0337533950805664} -08/30/2021 14:26:10 - INFO - __main__ - Step 6986: {'lr': 0.0004986016645188615, 'samples': 1341312, 'steps': 6985, 'loss/train': 2.2896721363067627} -08/30/2021 14:26:10 - INFO - __main__ - Step 6987: {'lr': 0.0004986011039691889, 'samples': 1341504, 'steps': 6986, 'loss/train': 1.809281826019287} -08/30/2021 14:26:11 - INFO - __main__ - Step 6988: {'lr': 0.0004986005433075004, 'samples': 1341696, 'steps': 6987, 'loss/train': 0.2523254156112671} -08/30/2021 14:26:11 - INFO - __main__ - Step 6989: {'lr': 0.0004985999825337964, 'samples': 1341888, 'steps': 6988, 'loss/train': 2.344238042831421} -08/30/2021 14:26:12 - INFO - __main__ - Step 6990: {'lr': 0.000498599421648077, 'samples': 1342080, 'steps': 6989, 'loss/train': 1.9715166091918945} -08/30/2021 14:26:13 - INFO - __main__ - Step 6991: {'lr': 0.0004985988606503426, 'samples': 1342272, 'steps': 6990, 'loss/train': 1.8085249662399292} -08/30/2021 14:26:13 - INFO - __main__ - Step 6992: {'lr': 0.0004985982995405933, 'samples': 1342464, 'steps': 6991, 'loss/train': 2.09302020072937} -08/30/2021 14:26:14 - INFO - __main__ - Step 6993: {'lr': 0.0004985977383188296, 'samples': 1342656, 'steps': 6992, 'loss/train': 2.913682460784912} -08/30/2021 14:26:14 - INFO - __main__ - Step 6994: {'lr': 0.0004985971769850515, 'samples': 1342848, 'steps': 6993, 'loss/train': 1.6446220874786377} -08/30/2021 14:26:16 - INFO - __main__ - Step 6995: {'lr': 0.0004985966155392593, 'samples': 1343040, 'steps': 6994, 'loss/train': 1.8418692350387573} -08/30/2021 14:26:16 - INFO - __main__ - Step 6996: {'lr': 0.0004985960539814534, 'samples': 1343232, 'steps': 6995, 'loss/train': 2.144650459289551} -08/30/2021 14:26:16 - INFO - __main__ - Step 6997: {'lr': 0.000498595492311634, 'samples': 1343424, 'steps': 6996, 'loss/train': 0.34487003087997437} -08/30/2021 14:26:17 - INFO - __main__ - Step 6998: {'lr': 0.0004985949305298012, 'samples': 1343616, 'steps': 6997, 'loss/train': 1.9332834482192993} -08/30/2021 14:26:17 - INFO - __main__ - Step 6999: {'lr': 0.0004985943686359554, 'samples': 1343808, 'steps': 6998, 'loss/train': 2.3357770442962646} -08/30/2021 14:26:19 - INFO - __main__ - Step 7000: {'lr': 0.0004985938066300968, 'samples': 1344000, 'steps': 6999, 'loss/train': 1.23027765750885} -08/30/2021 14:26:19 - INFO - __main__ - Step 7001: {'lr': 0.0004985932445122257, 'samples': 1344192, 'steps': 7000, 'loss/train': 2.541163444519043} -08/30/2021 14:26:19 - INFO - __main__ - Step 7002: {'lr': 0.0004985926822823422, 'samples': 1344384, 'steps': 7001, 'loss/train': 2.5520241260528564} -08/30/2021 14:26:20 - INFO - __main__ - Step 7003: {'lr': 0.0004985921199404467, 'samples': 1344576, 'steps': 7002, 'loss/train': 2.276765823364258} -08/30/2021 14:26:20 - INFO - __main__ - Step 7004: {'lr': 0.0004985915574865395, 'samples': 1344768, 'steps': 7003, 'loss/train': 2.1749000549316406} -08/30/2021 14:26:20 - INFO - __main__ - Step 7005: {'lr': 0.0004985909949206209, 'samples': 1344960, 'steps': 7004, 'loss/train': 2.2031936645507812} -08/30/2021 14:26:22 - INFO - __main__ - Step 7006: {'lr': 0.0004985904322426909, 'samples': 1345152, 'steps': 7005, 'loss/train': 2.3593475818634033} -08/30/2021 14:26:22 - INFO - __main__ - Step 7007: {'lr': 0.0004985898694527498, 'samples': 1345344, 'steps': 7006, 'loss/train': 2.2181200981140137} -08/30/2021 14:26:23 - INFO - __main__ - Step 7008: {'lr': 0.000498589306550798, 'samples': 1345536, 'steps': 7007, 'loss/train': 0.8213203549385071} -08/30/2021 14:26:23 - INFO - __main__ - Step 7009: {'lr': 0.0004985887435368357, 'samples': 1345728, 'steps': 7008, 'loss/train': 2.2370710372924805} -08/30/2021 14:26:24 - INFO - __main__ - Step 7010: {'lr': 0.0004985881804108632, 'samples': 1345920, 'steps': 7009, 'loss/train': 2.477621555328369} -08/30/2021 14:26:25 - INFO - __main__ - Step 7011: {'lr': 0.0004985876171728807, 'samples': 1346112, 'steps': 7010, 'loss/train': 1.947131633758545} -08/30/2021 14:26:26 - INFO - __main__ - Step 7012: {'lr': 0.0004985870538228884, 'samples': 1346304, 'steps': 7011, 'loss/train': 1.5513256788253784} -08/30/2021 14:26:26 - INFO - __main__ - Step 7013: {'lr': 0.0004985864903608866, 'samples': 1346496, 'steps': 7012, 'loss/train': 2.0416758060455322} -08/30/2021 14:26:26 - INFO - __main__ - Step 7014: {'lr': 0.0004985859267868756, 'samples': 1346688, 'steps': 7013, 'loss/train': 0.25593629479408264} -08/30/2021 14:26:27 - INFO - __main__ - Step 7015: {'lr': 0.0004985853631008557, 'samples': 1346880, 'steps': 7014, 'loss/train': 2.3708863258361816} -08/30/2021 14:26:28 - INFO - __main__ - Step 7016: {'lr': 0.000498584799302827, 'samples': 1347072, 'steps': 7015, 'loss/train': 0.8170610070228577} -08/30/2021 14:26:29 - INFO - __main__ - Step 7017: {'lr': 0.0004985842353927897, 'samples': 1347264, 'steps': 7016, 'loss/train': 2.0751936435699463} -08/30/2021 14:26:29 - INFO - __main__ - Step 7018: {'lr': 0.0004985836713707443, 'samples': 1347456, 'steps': 7017, 'loss/train': 2.1809775829315186} -08/30/2021 14:26:29 - INFO - __main__ - Step 7019: {'lr': 0.000498583107236691, 'samples': 1347648, 'steps': 7018, 'loss/train': 2.044480085372925} -08/30/2021 14:26:30 - INFO - __main__ - Step 7020: {'lr': 0.0004985825429906299, 'samples': 1347840, 'steps': 7019, 'loss/train': 2.1939988136291504} -08/30/2021 14:26:31 - INFO - __main__ - Step 7021: {'lr': 0.0004985819786325614, 'samples': 1348032, 'steps': 7020, 'loss/train': 2.0760951042175293} -08/30/2021 14:26:32 - INFO - __main__ - Step 7022: {'lr': 0.0004985814141624856, 'samples': 1348224, 'steps': 7021, 'loss/train': 1.8965190649032593} -08/30/2021 14:26:32 - INFO - __main__ - Step 7023: {'lr': 0.000498580849580403, 'samples': 1348416, 'steps': 7022, 'loss/train': 1.8502427339553833} -08/30/2021 14:26:32 - INFO - __main__ - Step 7024: {'lr': 0.0004985802848863135, 'samples': 1348608, 'steps': 7023, 'loss/train': 2.7550241947174072} -08/30/2021 14:26:33 - INFO - __main__ - Step 7025: {'lr': 0.0004985797200802176, 'samples': 1348800, 'steps': 7024, 'loss/train': 2.3097569942474365} -08/30/2021 14:26:35 - INFO - __main__ - Step 7026: {'lr': 0.0004985791551621158, 'samples': 1348992, 'steps': 7025, 'loss/train': 1.8013461828231812} -08/30/2021 14:26:35 - INFO - __main__ - Step 7027: {'lr': 0.0004985785901320078, 'samples': 1349184, 'steps': 7026, 'loss/train': 2.9754016399383545} -08/30/2021 14:26:36 - INFO - __main__ - Step 7028: {'lr': 0.0004985780249898941, 'samples': 1349376, 'steps': 7027, 'loss/train': 2.4538865089416504} -08/30/2021 14:26:36 - INFO - __main__ - Step 7029: {'lr': 0.0004985774597357751, 'samples': 1349568, 'steps': 7028, 'loss/train': 2.5522937774658203} -08/30/2021 14:26:36 - INFO - __main__ - Step 7030: {'lr': 0.0004985768943696509, 'samples': 1349760, 'steps': 7029, 'loss/train': 1.8235198259353638} -08/30/2021 14:26:38 - INFO - __main__ - Step 7031: {'lr': 0.0004985763288915217, 'samples': 1349952, 'steps': 7030, 'loss/train': 2.3612794876098633} -08/30/2021 14:26:38 - INFO - __main__ - Step 7032: {'lr': 0.0004985757633013879, 'samples': 1350144, 'steps': 7031, 'loss/train': 2.2243618965148926} -08/30/2021 14:26:39 - INFO - __main__ - Step 7033: {'lr': 0.0004985751975992497, 'samples': 1350336, 'steps': 7032, 'loss/train': 2.0661380290985107} -08/30/2021 14:26:39 - INFO - __main__ - Step 7034: {'lr': 0.0004985746317851074, 'samples': 1350528, 'steps': 7033, 'loss/train': 1.7722347974777222} -08/30/2021 14:26:39 - INFO - __main__ - Step 7035: {'lr': 0.0004985740658589612, 'samples': 1350720, 'steps': 7034, 'loss/train': 2.697772264480591} -08/30/2021 14:26:41 - INFO - __main__ - Step 7036: {'lr': 0.0004985734998208112, 'samples': 1350912, 'steps': 7035, 'loss/train': 2.218561887741089} -08/30/2021 14:26:41 - INFO - __main__ - Step 7037: {'lr': 0.000498572933670658, 'samples': 1351104, 'steps': 7036, 'loss/train': 2.1016488075256348} -08/30/2021 14:26:42 - INFO - __main__ - Step 7038: {'lr': 0.0004985723674085016, 'samples': 1351296, 'steps': 7037, 'loss/train': 1.9448717832565308} -08/30/2021 14:26:42 - INFO - __main__ - Step 7039: {'lr': 0.0004985718010343424, 'samples': 1351488, 'steps': 7038, 'loss/train': 1.8086481094360352} -08/30/2021 14:26:42 - INFO - __main__ - Step 7040: {'lr': 0.0004985712345481805, 'samples': 1351680, 'steps': 7039, 'loss/train': 2.5131611824035645} -08/30/2021 14:26:44 - INFO - __main__ - Step 7041: {'lr': 0.0004985706679500163, 'samples': 1351872, 'steps': 7040, 'loss/train': 1.7539966106414795} -08/30/2021 14:26:44 - INFO - __main__ - Step 7042: {'lr': 0.0004985701012398499, 'samples': 1352064, 'steps': 7041, 'loss/train': 1.6048985719680786} -08/30/2021 14:26:45 - INFO - __main__ - Step 7043: {'lr': 0.0004985695344176817, 'samples': 1352256, 'steps': 7042, 'loss/train': 0.719610869884491} -08/30/2021 14:26:45 - INFO - __main__ - Step 7044: {'lr': 0.0004985689674835119, 'samples': 1352448, 'steps': 7043, 'loss/train': 2.022465229034424} -08/30/2021 14:26:45 - INFO - __main__ - Step 7045: {'lr': 0.0004985684004373409, 'samples': 1352640, 'steps': 7044, 'loss/train': 0.8750408291816711} -08/30/2021 14:26:47 - INFO - __main__ - Step 7046: {'lr': 0.0004985678332791686, 'samples': 1352832, 'steps': 7045, 'loss/train': 2.137831926345825} -08/30/2021 14:26:47 - INFO - __main__ - Step 7047: {'lr': 0.0004985672660089956, 'samples': 1353024, 'steps': 7046, 'loss/train': 1.8576068878173828} -08/30/2021 14:26:48 - INFO - __main__ - Step 7048: {'lr': 0.000498566698626822, 'samples': 1353216, 'steps': 7047, 'loss/train': 2.100839138031006} -08/30/2021 14:26:48 - INFO - __main__ - Step 7049: {'lr': 0.000498566131132648, 'samples': 1353408, 'steps': 7048, 'loss/train': 4.702973365783691} -08/30/2021 14:26:49 - INFO - __main__ - Step 7050: {'lr': 0.0004985655635264739, 'samples': 1353600, 'steps': 7049, 'loss/train': 2.195896625518799} -08/30/2021 14:26:49 - INFO - __main__ - Step 7051: {'lr': 0.0004985649958083001, 'samples': 1353792, 'steps': 7050, 'loss/train': 1.644945740699768} -08/30/2021 14:26:50 - INFO - __main__ - Step 7052: {'lr': 0.0004985644279781268, 'samples': 1353984, 'steps': 7051, 'loss/train': 1.3386199474334717} -08/30/2021 14:26:51 - INFO - __main__ - Step 7053: {'lr': 0.0004985638600359542, 'samples': 1354176, 'steps': 7052, 'loss/train': 1.4313273429870605} -08/30/2021 14:26:51 - INFO - __main__ - Step 7054: {'lr': 0.0004985632919817824, 'samples': 1354368, 'steps': 7053, 'loss/train': 1.8021634817123413} -08/30/2021 14:26:52 - INFO - __main__ - Step 7055: {'lr': 0.000498562723815612, 'samples': 1354560, 'steps': 7054, 'loss/train': 0.2595697045326233} -08/30/2021 14:26:52 - INFO - __main__ - Step 7056: {'lr': 0.000498562155537443, 'samples': 1354752, 'steps': 7055, 'loss/train': 2.2817718982696533} -08/30/2021 14:26:53 - INFO - __main__ - Step 7057: {'lr': 0.0004985615871472757, 'samples': 1354944, 'steps': 7056, 'loss/train': 1.7531142234802246} -08/30/2021 14:26:54 - INFO - __main__ - Step 7058: {'lr': 0.0004985610186451104, 'samples': 1355136, 'steps': 7057, 'loss/train': 2.0245070457458496} -08/30/2021 14:26:54 - INFO - __main__ - Step 7059: {'lr': 0.0004985604500309473, 'samples': 1355328, 'steps': 7058, 'loss/train': 2.275963306427002} -08/30/2021 14:26:55 - INFO - __main__ - Step 7060: {'lr': 0.0004985598813047868, 'samples': 1355520, 'steps': 7059, 'loss/train': 1.4255527257919312} -08/30/2021 14:26:55 - INFO - __main__ - Step 7061: {'lr': 0.000498559312466629, 'samples': 1355712, 'steps': 7060, 'loss/train': 1.9848852157592773} -08/30/2021 14:26:56 - INFO - __main__ - Step 7062: {'lr': 0.0004985587435164742, 'samples': 1355904, 'steps': 7061, 'loss/train': 2.0852506160736084} -08/30/2021 14:26:57 - INFO - __main__ - Step 7063: {'lr': 0.0004985581744543226, 'samples': 1356096, 'steps': 7062, 'loss/train': 1.8649299144744873} -08/30/2021 14:26:57 - INFO - __main__ - Step 7064: {'lr': 0.0004985576052801747, 'samples': 1356288, 'steps': 7063, 'loss/train': 1.4704043865203857} -08/30/2021 14:26:58 - INFO - __main__ - Step 7065: {'lr': 0.0004985570359940304, 'samples': 1356480, 'steps': 7064, 'loss/train': 2.110185146331787} -08/30/2021 14:26:58 - INFO - __main__ - Step 7066: {'lr': 0.0004985564665958901, 'samples': 1356672, 'steps': 7065, 'loss/train': 1.8290075063705444} -08/30/2021 14:27:00 - INFO - __main__ - Step 7067: {'lr': 0.0004985558970857543, 'samples': 1356864, 'steps': 7066, 'loss/train': 1.6149054765701294} -08/30/2021 14:27:00 - INFO - __main__ - Step 7068: {'lr': 0.000498555327463623, 'samples': 1357056, 'steps': 7067, 'loss/train': 2.0574913024902344} -08/30/2021 14:27:00 - INFO - __main__ - Step 7069: {'lr': 0.0004985547577294963, 'samples': 1357248, 'steps': 7068, 'loss/train': 2.1082918643951416} -08/30/2021 14:27:01 - INFO - __main__ - Step 7070: {'lr': 0.0004985541878833749, 'samples': 1357440, 'steps': 7069, 'loss/train': 1.3834682703018188} -08/30/2021 14:27:01 - INFO - __main__ - Step 7071: {'lr': 0.0004985536179252587, 'samples': 1357632, 'steps': 7070, 'loss/train': 1.9284027814865112} -08/30/2021 14:27:01 - INFO - __main__ - Step 7072: {'lr': 0.0004985530478551481, 'samples': 1357824, 'steps': 7071, 'loss/train': 1.990464448928833} -08/30/2021 14:27:03 - INFO - __main__ - Step 7073: {'lr': 0.0004985524776730434, 'samples': 1358016, 'steps': 7072, 'loss/train': 1.6240383386611938} -08/30/2021 14:27:03 - INFO - __main__ - Step 7074: {'lr': 0.0004985519073789447, 'samples': 1358208, 'steps': 7073, 'loss/train': 1.859412670135498} -08/30/2021 14:27:04 - INFO - __main__ - Step 7075: {'lr': 0.0004985513369728524, 'samples': 1358400, 'steps': 7074, 'loss/train': 1.9900660514831543} -08/30/2021 14:27:04 - INFO - __main__ - Step 7076: {'lr': 0.0004985507664547666, 'samples': 1358592, 'steps': 7075, 'loss/train': 2.0464377403259277} -08/30/2021 14:27:04 - INFO - __main__ - Step 7077: {'lr': 0.0004985501958246878, 'samples': 1358784, 'steps': 7076, 'loss/train': 2.6055030822753906} -08/30/2021 14:27:07 - INFO - __main__ - Step 7078: {'lr': 0.000498549625082616, 'samples': 1358976, 'steps': 7077, 'loss/train': 0.6727930307388306} -08/30/2021 14:27:07 - INFO - __main__ - Step 7079: {'lr': 0.0004985490542285516, 'samples': 1359168, 'steps': 7078, 'loss/train': 2.0788557529449463} -08/30/2021 14:27:08 - INFO - __main__ - Step 7080: {'lr': 0.0004985484832624949, 'samples': 1359360, 'steps': 7079, 'loss/train': 2.1179535388946533} -08/30/2021 14:27:08 - INFO - __main__ - Step 7081: {'lr': 0.000498547912184446, 'samples': 1359552, 'steps': 7080, 'loss/train': 1.881097435951233} -08/30/2021 14:27:08 - INFO - __main__ - Step 7082: {'lr': 0.0004985473409944054, 'samples': 1359744, 'steps': 7081, 'loss/train': 1.996102213859558} -08/30/2021 14:27:09 - INFO - __main__ - Step 7083: {'lr': 0.000498546769692373, 'samples': 1359936, 'steps': 7082, 'loss/train': 2.7988317012786865} -08/30/2021 14:27:10 - INFO - __main__ - Step 7084: {'lr': 0.0004985461982783494, 'samples': 1360128, 'steps': 7083, 'loss/train': 1.7322026491165161} -08/30/2021 14:27:11 - INFO - __main__ - Step 7085: {'lr': 0.0004985456267523346, 'samples': 1360320, 'steps': 7084, 'loss/train': 2.3654000759124756} -08/30/2021 14:27:11 - INFO - __main__ - Step 7086: {'lr': 0.0004985450551143291, 'samples': 1360512, 'steps': 7085, 'loss/train': 1.8243162631988525} -08/30/2021 14:27:11 - INFO - __main__ - Step 7087: {'lr': 0.000498544483364333, 'samples': 1360704, 'steps': 7086, 'loss/train': 2.002641439437866} -08/30/2021 14:27:12 - INFO - __main__ - Step 7088: {'lr': 0.0004985439115023465, 'samples': 1360896, 'steps': 7087, 'loss/train': 1.816934585571289} -08/30/2021 14:27:13 - INFO - __main__ - Step 7089: {'lr': 0.0004985433395283701, 'samples': 1361088, 'steps': 7088, 'loss/train': 2.1620287895202637} -08/30/2021 14:27:14 - INFO - __main__ - Step 7090: {'lr': 0.0004985427674424038, 'samples': 1361280, 'steps': 7089, 'loss/train': 2.1201906204223633} -08/30/2021 14:27:14 - INFO - __main__ - Step 7091: {'lr': 0.000498542195244448, 'samples': 1361472, 'steps': 7090, 'loss/train': 1.913047432899475} -08/30/2021 14:27:14 - INFO - __main__ - Step 7092: {'lr': 0.0004985416229345029, 'samples': 1361664, 'steps': 7091, 'loss/train': 1.9856257438659668} -08/30/2021 14:27:15 - INFO - __main__ - Step 7093: {'lr': 0.0004985410505125689, 'samples': 1361856, 'steps': 7092, 'loss/train': 2.2616918087005615} -08/30/2021 14:27:16 - INFO - __main__ - Step 7094: {'lr': 0.0004985404779786459, 'samples': 1362048, 'steps': 7093, 'loss/train': 1.852012276649475} -08/30/2021 14:27:17 - INFO - __main__ - Step 7095: {'lr': 0.0004985399053327346, 'samples': 1362240, 'steps': 7094, 'loss/train': 1.8436076641082764} -08/30/2021 14:27:17 - INFO - __main__ - Step 7096: {'lr': 0.000498539332574835, 'samples': 1362432, 'steps': 7095, 'loss/train': 2.006499767303467} -08/30/2021 14:27:18 - INFO - __main__ - Step 7097: {'lr': 0.0004985387597049474, 'samples': 1362624, 'steps': 7096, 'loss/train': 1.0633573532104492} -08/30/2021 14:27:18 - INFO - __main__ - Step 7098: {'lr': 0.0004985381867230721, 'samples': 1362816, 'steps': 7097, 'loss/train': 1.9722651243209839} -08/30/2021 14:27:18 - INFO - __main__ - Step 7099: {'lr': 0.0004985376136292093, 'samples': 1363008, 'steps': 7098, 'loss/train': 5.240437030792236} -08/30/2021 14:27:20 - INFO - __main__ - Step 7100: {'lr': 0.0004985370404233592, 'samples': 1363200, 'steps': 7099, 'loss/train': 1.9567259550094604} -08/30/2021 14:27:20 - INFO - __main__ - Step 7101: {'lr': 0.0004985364671055223, 'samples': 1363392, 'steps': 7100, 'loss/train': 2.0685393810272217} -08/30/2021 14:27:21 - INFO - __main__ - Step 7102: {'lr': 0.0004985358936756985, 'samples': 1363584, 'steps': 7101, 'loss/train': 1.7404972314834595} -08/30/2021 14:27:21 - INFO - __main__ - Step 7103: {'lr': 0.0004985353201338885, 'samples': 1363776, 'steps': 7102, 'loss/train': 2.0010063648223877} -08/30/2021 14:27:21 - INFO - __main__ - Step 7104: {'lr': 0.0004985347464800921, 'samples': 1363968, 'steps': 7103, 'loss/train': 1.8056018352508545} -08/30/2021 14:27:23 - INFO - __main__ - Step 7105: {'lr': 0.0004985341727143099, 'samples': 1364160, 'steps': 7104, 'loss/train': 2.1832635402679443} -08/30/2021 14:27:24 - INFO - __main__ - Step 7106: {'lr': 0.000498533598836542, 'samples': 1364352, 'steps': 7105, 'loss/train': 2.127995729446411} -08/30/2021 14:27:24 - INFO - __main__ - Step 7107: {'lr': 0.0004985330248467888, 'samples': 1364544, 'steps': 7106, 'loss/train': 3.5202279090881348} -08/30/2021 14:27:24 - INFO - __main__ - Step 7108: {'lr': 0.0004985324507450504, 'samples': 1364736, 'steps': 7107, 'loss/train': 1.5345447063446045} -08/30/2021 14:27:25 - INFO - __main__ - Step 7109: {'lr': 0.000498531876531327, 'samples': 1364928, 'steps': 7108, 'loss/train': 1.7388873100280762} -08/30/2021 14:27:25 - INFO - __main__ - Step 7110: {'lr': 0.0004985313022056191, 'samples': 1365120, 'steps': 7109, 'loss/train': 1.996155858039856} -08/30/2021 14:27:26 - INFO - __main__ - Step 7111: {'lr': 0.0004985307277679267, 'samples': 1365312, 'steps': 7110, 'loss/train': 2.645927667617798} -08/30/2021 14:27:27 - INFO - __main__ - Step 7112: {'lr': 0.0004985301532182503, 'samples': 1365504, 'steps': 7111, 'loss/train': 2.7811317443847656} -08/30/2021 14:27:27 - INFO - __main__ - Step 7113: {'lr': 0.0004985295785565901, 'samples': 1365696, 'steps': 7112, 'loss/train': 2.0135228633880615} -08/30/2021 14:27:28 - INFO - __main__ - Step 7114: {'lr': 0.0004985290037829462, 'samples': 1365888, 'steps': 7113, 'loss/train': 1.8710907697677612} -08/30/2021 14:27:28 - INFO - __main__ - Step 7115: {'lr': 0.000498528428897319, 'samples': 1366080, 'steps': 7114, 'loss/train': 2.2685768604278564} -08/30/2021 14:27:30 - INFO - __main__ - Step 7116: {'lr': 0.0004985278538997088, 'samples': 1366272, 'steps': 7115, 'loss/train': 2.0806174278259277} -08/30/2021 14:27:30 - INFO - __main__ - Step 7117: {'lr': 0.0004985272787901156, 'samples': 1366464, 'steps': 7116, 'loss/train': 2.5690901279449463} -08/30/2021 14:27:31 - INFO - __main__ - Step 7118: {'lr': 0.00049852670356854, 'samples': 1366656, 'steps': 7117, 'loss/train': 2.0994789600372314} -08/30/2021 14:27:31 - INFO - __main__ - Step 7119: {'lr': 0.000498526128234982, 'samples': 1366848, 'steps': 7118, 'loss/train': 2.1290652751922607} -08/30/2021 14:27:31 - INFO - __main__ - Step 7120: {'lr': 0.000498525552789442, 'samples': 1367040, 'steps': 7119, 'loss/train': 0.41349098086357117} -08/30/2021 14:27:33 - INFO - __main__ - Step 7121: {'lr': 0.0004985249772319202, 'samples': 1367232, 'steps': 7120, 'loss/train': 1.3266475200653076} -08/30/2021 14:27:33 - INFO - __main__ - Step 7122: {'lr': 0.000498524401562417, 'samples': 1367424, 'steps': 7121, 'loss/train': 0.3361709713935852} -08/30/2021 14:27:34 - INFO - __main__ - Step 7123: {'lr': 0.0004985238257809325, 'samples': 1367616, 'steps': 7122, 'loss/train': 1.5390362739562988} -08/30/2021 14:27:34 - INFO - __main__ - Step 7124: {'lr': 0.0004985232498874669, 'samples': 1367808, 'steps': 7123, 'loss/train': 1.0099903345108032} -08/30/2021 14:27:34 - INFO - __main__ - Step 7125: {'lr': 0.0004985226738820207, 'samples': 1368000, 'steps': 7124, 'loss/train': 1.572208046913147} -08/30/2021 14:27:35 - INFO - __main__ - Step 7126: {'lr': 0.0004985220977645939, 'samples': 1368192, 'steps': 7125, 'loss/train': 2.1918258666992188} -08/30/2021 14:27:36 - INFO - __main__ - Step 7127: {'lr': 0.0004985215215351869, 'samples': 1368384, 'steps': 7126, 'loss/train': 1.7024544477462769} -08/30/2021 14:27:37 - INFO - __main__ - Step 7128: {'lr': 0.0004985209451937999, 'samples': 1368576, 'steps': 7127, 'loss/train': 0.7918288111686707} -08/30/2021 14:27:37 - INFO - __main__ - Step 7129: {'lr': 0.0004985203687404333, 'samples': 1368768, 'steps': 7128, 'loss/train': 2.8895046710968018} -08/30/2021 14:27:37 - INFO - __main__ - Step 7130: {'lr': 0.0004985197921750871, 'samples': 1368960, 'steps': 7129, 'loss/train': 1.8123682737350464} -08/30/2021 14:27:38 - INFO - __main__ - Step 7131: {'lr': 0.0004985192154977619, 'samples': 1369152, 'steps': 7130, 'loss/train': 1.624388575553894} -08/30/2021 14:27:40 - INFO - __main__ - Step 7132: {'lr': 0.0004985186387084577, 'samples': 1369344, 'steps': 7131, 'loss/train': 2.02010440826416} -08/30/2021 14:27:40 - INFO - __main__ - Step 7133: {'lr': 0.0004985180618071748, 'samples': 1369536, 'steps': 7132, 'loss/train': 2.0973570346832275} -08/30/2021 14:27:40 - INFO - __main__ - Step 7134: {'lr': 0.0004985174847939135, 'samples': 1369728, 'steps': 7133, 'loss/train': 1.9209593534469604} -08/30/2021 14:27:41 - INFO - __main__ - Step 7135: {'lr': 0.0004985169076686741, 'samples': 1369920, 'steps': 7134, 'loss/train': 1.8563427925109863} -08/30/2021 14:27:41 - INFO - __main__ - Step 7136: {'lr': 0.0004985163304314568, 'samples': 1370112, 'steps': 7135, 'loss/train': 2.0697617530822754} -08/30/2021 14:27:43 - INFO - __main__ - Step 7137: {'lr': 0.0004985157530822619, 'samples': 1370304, 'steps': 7136, 'loss/train': 1.9680343866348267} -08/30/2021 14:27:43 - INFO - __main__ - Step 7138: {'lr': 0.0004985151756210897, 'samples': 1370496, 'steps': 7137, 'loss/train': 2.235201120376587} -08/30/2021 14:27:44 - INFO - __main__ - Step 7139: {'lr': 0.0004985145980479402, 'samples': 1370688, 'steps': 7138, 'loss/train': 1.5232306718826294} -08/30/2021 14:27:44 - INFO - __main__ - Step 7140: {'lr': 0.000498514020362814, 'samples': 1370880, 'steps': 7139, 'loss/train': 2.722341299057007} -08/30/2021 14:27:44 - INFO - __main__ - Step 7141: {'lr': 0.0004985134425657111, 'samples': 1371072, 'steps': 7140, 'loss/train': 2.0578699111938477} -08/30/2021 14:27:45 - INFO - __main__ - Step 7142: {'lr': 0.000498512864656632, 'samples': 1371264, 'steps': 7141, 'loss/train': 1.8936917781829834} -08/30/2021 14:27:46 - INFO - __main__ - Step 7143: {'lr': 0.0004985122866355768, 'samples': 1371456, 'steps': 7142, 'loss/train': 1.4562264680862427} -08/30/2021 14:27:47 - INFO - __main__ - Step 7144: {'lr': 0.0004985117085025458, 'samples': 1371648, 'steps': 7143, 'loss/train': 1.9897072315216064} -08/30/2021 14:27:47 - INFO - __main__ - Step 7145: {'lr': 0.0004985111302575392, 'samples': 1371840, 'steps': 7144, 'loss/train': 0.3156071603298187} -08/30/2021 14:27:47 - INFO - __main__ - Step 7146: {'lr': 0.0004985105519005573, 'samples': 1372032, 'steps': 7145, 'loss/train': 2.3269412517547607} -08/30/2021 14:27:48 - INFO - __main__ - Step 7147: {'lr': 0.0004985099734316006, 'samples': 1372224, 'steps': 7146, 'loss/train': 2.2848379611968994} -08/30/2021 14:27:49 - INFO - __main__ - Step 7148: {'lr': 0.0004985093948506689, 'samples': 1372416, 'steps': 7147, 'loss/train': 1.7950539588928223} -08/30/2021 14:27:50 - INFO - __main__ - Step 7149: {'lr': 0.0004985088161577628, 'samples': 1372608, 'steps': 7148, 'loss/train': 2.1088075637817383} -08/30/2021 14:27:50 - INFO - __main__ - Step 7150: {'lr': 0.0004985082373528825, 'samples': 1372800, 'steps': 7149, 'loss/train': 2.343796730041504} -08/30/2021 14:27:51 - INFO - __main__ - Step 7151: {'lr': 0.0004985076584360282, 'samples': 1372992, 'steps': 7150, 'loss/train': 1.1312609910964966} -08/30/2021 14:27:51 - INFO - __main__ - Step 7152: {'lr': 0.0004985070794072002, 'samples': 1373184, 'steps': 7151, 'loss/train': 2.176933765411377} -08/30/2021 14:27:53 - INFO - __main__ - Step 7153: {'lr': 0.0004985065002663986, 'samples': 1373376, 'steps': 7152, 'loss/train': 2.1957783699035645} -08/30/2021 14:27:53 - INFO - __main__ - Step 7154: {'lr': 0.000498505921013624, 'samples': 1373568, 'steps': 7153, 'loss/train': 1.7569538354873657} -08/30/2021 14:27:53 - INFO - __main__ - Step 7155: {'lr': 0.0004985053416488764, 'samples': 1373760, 'steps': 7154, 'loss/train': 2.051624059677124} -08/30/2021 14:27:54 - INFO - __main__ - Step 7156: {'lr': 0.0004985047621721561, 'samples': 1373952, 'steps': 7155, 'loss/train': 2.253840923309326} -08/30/2021 14:27:54 - INFO - __main__ - Step 7157: {'lr': 0.0004985041825834634, 'samples': 1374144, 'steps': 7156, 'loss/train': 2.9600563049316406} -08/30/2021 14:27:55 - INFO - __main__ - Step 7158: {'lr': 0.0004985036028827986, 'samples': 1374336, 'steps': 7157, 'loss/train': 2.6560614109039307} -08/30/2021 14:27:56 - INFO - __main__ - Step 7159: {'lr': 0.0004985030230701619, 'samples': 1374528, 'steps': 7158, 'loss/train': 1.9453258514404297} -08/30/2021 14:27:56 - INFO - __main__ - Step 7160: {'lr': 0.0004985024431455534, 'samples': 1374720, 'steps': 7159, 'loss/train': 2.2521843910217285} -08/30/2021 14:27:57 - INFO - __main__ - Step 7161: {'lr': 0.0004985018631089738, 'samples': 1374912, 'steps': 7160, 'loss/train': 2.00766658782959} -08/30/2021 14:27:57 - INFO - __main__ - Step 7162: {'lr': 0.0004985012829604228, 'samples': 1375104, 'steps': 7161, 'loss/train': 2.114105224609375} -08/30/2021 14:27:58 - INFO - __main__ - Step 7163: {'lr': 0.0004985007026999011, 'samples': 1375296, 'steps': 7162, 'loss/train': 2.3569719791412354} -08/30/2021 14:27:59 - INFO - __main__ - Step 7164: {'lr': 0.0004985001223274089, 'samples': 1375488, 'steps': 7163, 'loss/train': 2.06986927986145} -08/30/2021 14:27:59 - INFO - __main__ - Step 7165: {'lr': 0.0004984995418429463, 'samples': 1375680, 'steps': 7164, 'loss/train': 1.9990451335906982} -08/30/2021 14:28:00 - INFO - __main__ - Step 7166: {'lr': 0.0004984989612465137, 'samples': 1375872, 'steps': 7165, 'loss/train': 2.072549343109131} -08/30/2021 14:28:00 - INFO - __main__ - Step 7167: {'lr': 0.0004984983805381112, 'samples': 1376064, 'steps': 7166, 'loss/train': 1.874739408493042} -08/30/2021 14:28:00 - INFO - __main__ - Step 7168: {'lr': 0.0004984977997177393, 'samples': 1376256, 'steps': 7167, 'loss/train': 2.100863218307495} -08/30/2021 14:28:02 - INFO - __main__ - Step 7169: {'lr': 0.000498497218785398, 'samples': 1376448, 'steps': 7168, 'loss/train': 2.31718373298645} -08/30/2021 14:28:03 - INFO - __main__ - Step 7170: {'lr': 0.0004984966377410878, 'samples': 1376640, 'steps': 7169, 'loss/train': 1.911266565322876} -08/30/2021 14:28:03 - INFO - __main__ - Step 7171: {'lr': 0.0004984960565848086, 'samples': 1376832, 'steps': 7170, 'loss/train': 1.6877858638763428} -08/30/2021 14:28:03 - INFO - __main__ - Step 7172: {'lr': 0.0004984954753165612, 'samples': 1377024, 'steps': 7171, 'loss/train': 1.5156139135360718} -08/30/2021 14:28:04 - INFO - __main__ - Step 7173: {'lr': 0.0004984948939363455, 'samples': 1377216, 'steps': 7172, 'loss/train': 1.1622527837753296} -08/30/2021 14:28:05 - INFO - __main__ - Step 7174: {'lr': 0.0004984943124441617, 'samples': 1377408, 'steps': 7173, 'loss/train': 0.2638666033744812} -08/30/2021 14:28:06 - INFO - __main__ - Step 7175: {'lr': 0.0004984937308400104, 'samples': 1377600, 'steps': 7174, 'loss/train': 2.5236616134643555} -08/30/2021 14:28:06 - INFO - __main__ - Step 7176: {'lr': 0.0004984931491238915, 'samples': 1377792, 'steps': 7175, 'loss/train': 1.7262253761291504} -08/30/2021 14:28:06 - INFO - __main__ - Step 7177: {'lr': 0.0004984925672958055, 'samples': 1377984, 'steps': 7176, 'loss/train': 2.168788194656372} -08/30/2021 14:28:07 - INFO - __main__ - Step 7178: {'lr': 0.0004984919853557526, 'samples': 1378176, 'steps': 7177, 'loss/train': 2.1983604431152344} -08/30/2021 14:28:07 - INFO - __main__ - Step 7179: {'lr': 0.000498491403303733, 'samples': 1378368, 'steps': 7178, 'loss/train': 1.6143860816955566} -08/30/2021 14:28:09 - INFO - __main__ - Step 7180: {'lr': 0.000498490821139747, 'samples': 1378560, 'steps': 7179, 'loss/train': 2.6613736152648926} -08/30/2021 14:28:09 - INFO - __main__ - Step 7181: {'lr': 0.0004984902388637949, 'samples': 1378752, 'steps': 7180, 'loss/train': 1.8948392868041992} -08/30/2021 14:28:10 - INFO - __main__ - Step 7182: {'lr': 0.000498489656475877, 'samples': 1378944, 'steps': 7181, 'loss/train': 2.170236587524414} -08/30/2021 14:28:10 - INFO - __main__ - Step 7183: {'lr': 0.0004984890739759934, 'samples': 1379136, 'steps': 7182, 'loss/train': 2.422713041305542} -08/30/2021 14:28:10 - INFO - __main__ - Step 7184: {'lr': 0.0004984884913641444, 'samples': 1379328, 'steps': 7183, 'loss/train': 3.144796371459961} -08/30/2021 14:28:12 - INFO - __main__ - Step 7185: {'lr': 0.0004984879086403304, 'samples': 1379520, 'steps': 7184, 'loss/train': 2.126748561859131} -08/30/2021 14:28:13 - INFO - __main__ - Step 7186: {'lr': 0.0004984873258045517, 'samples': 1379712, 'steps': 7185, 'loss/train': 1.6775095462799072} -08/30/2021 14:28:13 - INFO - __main__ - Step 7187: {'lr': 0.0004984867428568083, 'samples': 1379904, 'steps': 7186, 'loss/train': 1.8703340291976929} -08/30/2021 14:28:14 - INFO - __main__ - Step 7188: {'lr': 0.0004984861597971006, 'samples': 1380096, 'steps': 7187, 'loss/train': 2.2406716346740723} -08/30/2021 14:28:14 - INFO - __main__ - Step 7189: {'lr': 0.000498485576625429, 'samples': 1380288, 'steps': 7188, 'loss/train': 1.5232924222946167} -08/30/2021 14:28:15 - INFO - __main__ - Step 7190: {'lr': 0.0004984849933417935, 'samples': 1380480, 'steps': 7189, 'loss/train': 1.4126814603805542} -08/30/2021 14:28:16 - INFO - __main__ - Step 7191: {'lr': 0.0004984844099461945, 'samples': 1380672, 'steps': 7190, 'loss/train': 1.9961045980453491} -08/30/2021 14:28:16 - INFO - __main__ - Step 7192: {'lr': 0.0004984838264386322, 'samples': 1380864, 'steps': 7191, 'loss/train': 0.8886036276817322} -08/30/2021 14:28:17 - INFO - __main__ - Step 7193: {'lr': 0.000498483242819107, 'samples': 1381056, 'steps': 7192, 'loss/train': 2.149461030960083} -08/30/2021 14:28:17 - INFO - __main__ - Step 7194: {'lr': 0.0004984826590876192, 'samples': 1381248, 'steps': 7193, 'loss/train': 2.0714566707611084} -08/30/2021 14:28:17 - INFO - __main__ - Step 7195: {'lr': 0.0004984820752441688, 'samples': 1381440, 'steps': 7194, 'loss/train': 2.455793857574463} -08/30/2021 14:28:19 - INFO - __main__ - Step 7196: {'lr': 0.0004984814912887563, 'samples': 1381632, 'steps': 7195, 'loss/train': 1.7198436260223389} -08/30/2021 14:28:19 - INFO - __main__ - Step 7197: {'lr': 0.0004984809072213818, 'samples': 1381824, 'steps': 7196, 'loss/train': 2.2517521381378174} -08/30/2021 14:28:20 - INFO - __main__ - Step 7198: {'lr': 0.0004984803230420457, 'samples': 1382016, 'steps': 7197, 'loss/train': 1.8150054216384888} -08/30/2021 14:28:20 - INFO - __main__ - Step 7199: {'lr': 0.0004984797387507481, 'samples': 1382208, 'steps': 7198, 'loss/train': 1.7893643379211426} -08/30/2021 14:28:20 - INFO - __main__ - Step 7200: {'lr': 0.0004984791543474896, 'samples': 1382400, 'steps': 7199, 'loss/train': 2.0862998962402344} -08/30/2021 14:28:22 - INFO - __main__ - Step 7201: {'lr': 0.0004984785698322699, 'samples': 1382592, 'steps': 7200, 'loss/train': 1.967714786529541} -08/30/2021 14:28:23 - INFO - __main__ - Step 7202: {'lr': 0.0004984779852050898, 'samples': 1382784, 'steps': 7201, 'loss/train': 1.6195945739746094} -08/30/2021 14:28:23 - INFO - __main__ - Step 7203: {'lr': 0.0004984774004659493, 'samples': 1382976, 'steps': 7202, 'loss/train': 1.4425938129425049} -08/30/2021 14:28:23 - INFO - __main__ - Step 7204: {'lr': 0.0004984768156148489, 'samples': 1383168, 'steps': 7203, 'loss/train': 2.1850192546844482} -08/30/2021 14:28:24 - INFO - __main__ - Step 7205: {'lr': 0.0004984762306517883, 'samples': 1383360, 'steps': 7204, 'loss/train': 1.778074860572815} -08/30/2021 14:28:25 - INFO - __main__ - Step 7206: {'lr': 0.0004984756455767684, 'samples': 1383552, 'steps': 7205, 'loss/train': 2.0839364528656006} -08/30/2021 14:28:26 - INFO - __main__ - Step 7207: {'lr': 0.0004984750603897892, 'samples': 1383744, 'steps': 7206, 'loss/train': 1.8351918458938599} -08/30/2021 14:28:26 - INFO - __main__ - Step 7208: {'lr': 0.0004984744750908509, 'samples': 1383936, 'steps': 7207, 'loss/train': 1.970173954963684} -08/30/2021 14:28:26 - INFO - __main__ - Step 7209: {'lr': 0.0004984738896799539, 'samples': 1384128, 'steps': 7208, 'loss/train': 2.300081729888916} -08/30/2021 14:28:27 - INFO - __main__ - Step 7210: {'lr': 0.0004984733041570983, 'samples': 1384320, 'steps': 7209, 'loss/train': 1.91078519821167} -08/30/2021 14:28:27 - INFO - __main__ - Step 7211: {'lr': 0.0004984727185222846, 'samples': 1384512, 'steps': 7210, 'loss/train': 1.4283580780029297} -08/30/2021 14:28:29 - INFO - __main__ - Step 7212: {'lr': 0.0004984721327755128, 'samples': 1384704, 'steps': 7211, 'loss/train': 2.2765932083129883} -08/30/2021 14:28:29 - INFO - __main__ - Step 7213: {'lr': 0.0004984715469167835, 'samples': 1384896, 'steps': 7212, 'loss/train': 5.389716625213623} -08/30/2021 14:28:29 - INFO - __main__ - Step 7214: {'lr': 0.0004984709609460966, 'samples': 1385088, 'steps': 7213, 'loss/train': 1.9275394678115845} -08/30/2021 14:28:30 - INFO - __main__ - Step 7215: {'lr': 0.0004984703748634524, 'samples': 1385280, 'steps': 7214, 'loss/train': 2.6016764640808105} -08/30/2021 14:28:30 - INFO - __main__ - Step 7216: {'lr': 0.0004984697886688514, 'samples': 1385472, 'steps': 7215, 'loss/train': 1.416304111480713} -08/30/2021 14:28:32 - INFO - __main__ - Step 7217: {'lr': 0.0004984692023622938, 'samples': 1385664, 'steps': 7216, 'loss/train': 2.0171456336975098} -08/30/2021 14:28:32 - INFO - __main__ - Step 7218: {'lr': 0.0004984686159437798, 'samples': 1385856, 'steps': 7217, 'loss/train': 2.2392613887786865} -08/30/2021 14:28:32 - INFO - __main__ - Step 7219: {'lr': 0.0004984680294133096, 'samples': 1386048, 'steps': 7218, 'loss/train': 1.8295966386795044} -08/30/2021 14:28:33 - INFO - __main__ - Step 7220: {'lr': 0.0004984674427708836, 'samples': 1386240, 'steps': 7219, 'loss/train': 1.8244532346725464} -08/30/2021 14:28:33 - INFO - __main__ - Step 7221: {'lr': 0.000498466856016502, 'samples': 1386432, 'steps': 7220, 'loss/train': 0.27827927470207214} -08/30/2021 14:28:35 - INFO - __main__ - Step 7222: {'lr': 0.000498466269150165, 'samples': 1386624, 'steps': 7221, 'loss/train': 2.1558480262756348} -08/30/2021 14:28:35 - INFO - __main__ - Step 7223: {'lr': 0.000498465682171873, 'samples': 1386816, 'steps': 7222, 'loss/train': 2.070441484451294} -08/30/2021 14:28:36 - INFO - __main__ - Step 7224: {'lr': 0.0004984650950816262, 'samples': 1387008, 'steps': 7223, 'loss/train': 1.7885586023330688} -08/30/2021 14:28:36 - INFO - __main__ - Step 7225: {'lr': 0.0004984645078794248, 'samples': 1387200, 'steps': 7224, 'loss/train': 1.909603238105774} -08/30/2021 14:28:36 - INFO - __main__ - Step 7226: {'lr': 0.0004984639205652692, 'samples': 1387392, 'steps': 7225, 'loss/train': 2.0837244987487793} -08/30/2021 14:28:39 - INFO - __main__ - Step 7227: {'lr': 0.0004984633331391596, 'samples': 1387584, 'steps': 7226, 'loss/train': 1.5744858980178833} -08/30/2021 14:28:39 - INFO - __main__ - Step 7228: {'lr': 0.0004984627456010962, 'samples': 1387776, 'steps': 7227, 'loss/train': 1.8887664079666138} -08/30/2021 14:28:40 - INFO - __main__ - Step 7229: {'lr': 0.0004984621579510794, 'samples': 1387968, 'steps': 7228, 'loss/train': 2.21808123588562} -08/30/2021 14:28:40 - INFO - __main__ - Step 7230: {'lr': 0.0004984615701891093, 'samples': 1388160, 'steps': 7229, 'loss/train': 2.937943935394287} -08/30/2021 14:28:41 - INFO - __main__ - Step 7231: {'lr': 0.0004984609823151863, 'samples': 1388352, 'steps': 7230, 'loss/train': 1.2554011344909668} -08/30/2021 14:28:41 - INFO - __main__ - Step 7232: {'lr': 0.0004984603943293106, 'samples': 1388544, 'steps': 7231, 'loss/train': 1.3749245405197144} -08/30/2021 14:28:41 - INFO - __main__ - Step 7233: {'lr': 0.0004984598062314824, 'samples': 1388736, 'steps': 7232, 'loss/train': 2.8922464847564697} -08/30/2021 14:28:42 - INFO - __main__ - Step 7234: {'lr': 0.0004984592180217022, 'samples': 1388928, 'steps': 7233, 'loss/train': 2.127946376800537} -08/30/2021 14:28:43 - INFO - __main__ - Step 7235: {'lr': 0.00049845862969997, 'samples': 1389120, 'steps': 7234, 'loss/train': 2.808744192123413} -08/30/2021 14:28:44 - INFO - __main__ - Step 7236: {'lr': 0.0004984580412662862, 'samples': 1389312, 'steps': 7235, 'loss/train': 1.8293496370315552} -08/30/2021 14:28:44 - INFO - __main__ - Step 7237: {'lr': 0.000498457452720651, 'samples': 1389504, 'steps': 7236, 'loss/train': 0.6578748822212219} -08/30/2021 14:28:44 - INFO - __main__ - Step 7238: {'lr': 0.0004984568640630648, 'samples': 1389696, 'steps': 7237, 'loss/train': 2.1225314140319824} -08/30/2021 14:28:45 - INFO - __main__ - Step 7239: {'lr': 0.0004984562752935278, 'samples': 1389888, 'steps': 7238, 'loss/train': 3.227290153503418} -08/30/2021 14:28:46 - INFO - __main__ - Step 7240: {'lr': 0.0004984556864120401, 'samples': 1390080, 'steps': 7239, 'loss/train': 2.11092472076416} -08/30/2021 14:28:47 - INFO - __main__ - Step 7241: {'lr': 0.0004984550974186021, 'samples': 1390272, 'steps': 7240, 'loss/train': 2.6050875186920166} -08/30/2021 14:28:47 - INFO - __main__ - Step 7242: {'lr': 0.0004984545083132142, 'samples': 1390464, 'steps': 7241, 'loss/train': 1.6543530225753784} -08/30/2021 14:28:48 - INFO - __main__ - Step 7243: {'lr': 0.0004984539190958765, 'samples': 1390656, 'steps': 7242, 'loss/train': 7.976821422576904} -08/30/2021 14:28:48 - INFO - __main__ - Step 7244: {'lr': 0.0004984533297665892, 'samples': 1390848, 'steps': 7243, 'loss/train': 7.9502434730529785} -08/30/2021 14:28:48 - INFO - __main__ - Step 7245: {'lr': 0.0004984527403253527, 'samples': 1391040, 'steps': 7244, 'loss/train': 0.6018803715705872} -08/30/2021 14:28:49 - INFO - __main__ - Step 7246: {'lr': 0.0004984521507721672, 'samples': 1391232, 'steps': 7245, 'loss/train': 2.226489782333374} -08/30/2021 14:28:51 - INFO - __main__ - Step 7247: {'lr': 0.0004984515611070331, 'samples': 1391424, 'steps': 7246, 'loss/train': 1.9661298990249634} -08/30/2021 14:28:52 - INFO - __main__ - Step 7248: {'lr': 0.0004984509713299505, 'samples': 1391616, 'steps': 7247, 'loss/train': 3.112241744995117} -08/30/2021 14:28:52 - INFO - __main__ - Step 7249: {'lr': 0.0004984503814409198, 'samples': 1391808, 'steps': 7248, 'loss/train': 3.0227649211883545} -08/30/2021 14:28:52 - INFO - __main__ - Step 7250: {'lr': 0.000498449791439941, 'samples': 1392000, 'steps': 7249, 'loss/train': 0.5346341729164124} -08/30/2021 14:28:53 - INFO - __main__ - Step 7251: {'lr': 0.0004984492013270147, 'samples': 1392192, 'steps': 7250, 'loss/train': 2.410288095474243} -08/30/2021 14:28:53 - INFO - __main__ - Step 7252: {'lr': 0.0004984486111021411, 'samples': 1392384, 'steps': 7251, 'loss/train': 2.261244773864746} -08/30/2021 14:28:53 - INFO - __main__ - Step 7253: {'lr': 0.0004984480207653202, 'samples': 1392576, 'steps': 7252, 'loss/train': 3.137852191925049} -08/30/2021 14:28:55 - INFO - __main__ - Step 7254: {'lr': 0.0004984474303165526, 'samples': 1392768, 'steps': 7253, 'loss/train': 3.3458287715911865} -08/30/2021 14:28:56 - INFO - __main__ - Step 7255: {'lr': 0.0004984468397558384, 'samples': 1392960, 'steps': 7254, 'loss/train': 2.5857832431793213} -08/30/2021 14:28:56 - INFO - __main__ - Step 7256: {'lr': 0.0004984462490831778, 'samples': 1393152, 'steps': 7255, 'loss/train': 2.4637887477874756} -08/30/2021 14:28:56 - INFO - __main__ - Step 7257: {'lr': 0.0004984456582985713, 'samples': 1393344, 'steps': 7256, 'loss/train': 1.8142101764678955} -08/30/2021 14:28:57 - INFO - __main__ - Step 7258: {'lr': 0.0004984450674020189, 'samples': 1393536, 'steps': 7257, 'loss/train': 2.649630546569824} -08/30/2021 14:28:58 - INFO - __main__ - Step 7259: {'lr': 0.000498444476393521, 'samples': 1393728, 'steps': 7258, 'loss/train': 2.293332815170288} -08/30/2021 14:28:59 - INFO - __main__ - Step 7260: {'lr': 0.0004984438852730779, 'samples': 1393920, 'steps': 7259, 'loss/train': 1.4812675714492798} -08/30/2021 14:28:59 - INFO - __main__ - Step 7261: {'lr': 0.0004984432940406898, 'samples': 1394112, 'steps': 7260, 'loss/train': 2.5667483806610107} -08/30/2021 14:28:59 - INFO - __main__ - Step 7262: {'lr': 0.0004984427026963569, 'samples': 1394304, 'steps': 7261, 'loss/train': 2.730210781097412} -08/30/2021 14:29:00 - INFO - __main__ - Step 7263: {'lr': 0.0004984421112400796, 'samples': 1394496, 'steps': 7262, 'loss/train': 2.477018356323242} -08/30/2021 14:29:01 - INFO - __main__ - Step 7264: {'lr': 0.0004984415196718582, 'samples': 1394688, 'steps': 7263, 'loss/train': 2.386280059814453} -08/30/2021 14:29:02 - INFO - __main__ - Step 7265: {'lr': 0.0004984409279916929, 'samples': 1394880, 'steps': 7264, 'loss/train': 2.290518045425415} -08/30/2021 14:29:02 - INFO - __main__ - Step 7266: {'lr': 0.0004984403361995839, 'samples': 1395072, 'steps': 7265, 'loss/train': 2.308997869491577} -08/30/2021 14:29:02 - INFO - __main__ - Step 7267: {'lr': 0.0004984397442955315, 'samples': 1395264, 'steps': 7266, 'loss/train': 2.263298988342285} -08/30/2021 14:29:03 - INFO - __main__ - Step 7268: {'lr': 0.0004984391522795359, 'samples': 1395456, 'steps': 7267, 'loss/train': 2.382741689682007} -08/30/2021 14:29:04 - INFO - __main__ - Step 7269: {'lr': 0.0004984385601515977, 'samples': 1395648, 'steps': 7268, 'loss/train': 2.2990920543670654} -08/30/2021 14:29:05 - INFO - __main__ - Step 7270: {'lr': 0.0004984379679117166, 'samples': 1395840, 'steps': 7269, 'loss/train': 2.7670998573303223} -08/30/2021 14:29:05 - INFO - __main__ - Step 7271: {'lr': 0.0004984373755598934, 'samples': 1396032, 'steps': 7270, 'loss/train': 2.1212124824523926} -08/30/2021 14:29:05 - INFO - __main__ - Step 7272: {'lr': 0.0004984367830961281, 'samples': 1396224, 'steps': 7271, 'loss/train': 2.1122045516967773} -08/30/2021 14:29:06 - INFO - __main__ - Step 7273: {'lr': 0.0004984361905204209, 'samples': 1396416, 'steps': 7272, 'loss/train': 2.5294036865234375} -08/30/2021 14:29:07 - INFO - __main__ - Step 7274: {'lr': 0.0004984355978327724, 'samples': 1396608, 'steps': 7273, 'loss/train': 2.684483528137207} -08/30/2021 14:29:08 - INFO - __main__ - Step 7275: {'lr': 0.0004984350050331826, 'samples': 1396800, 'steps': 7274, 'loss/train': 2.8753700256347656} -08/30/2021 14:29:08 - INFO - __main__ - Step 7276: {'lr': 0.0004984344121216518, 'samples': 1396992, 'steps': 7275, 'loss/train': 2.7209572792053223} -08/30/2021 14:29:08 - INFO - __main__ - Step 7277: {'lr': 0.0004984338190981802, 'samples': 1397184, 'steps': 7276, 'loss/train': 2.787548780441284} -08/30/2021 14:29:09 - INFO - __main__ - Step 7278: {'lr': 0.0004984332259627682, 'samples': 1397376, 'steps': 7277, 'loss/train': 1.2269775867462158} -08/30/2021 14:29:11 - INFO - __main__ - Step 7279: {'lr': 0.000498432632715416, 'samples': 1397568, 'steps': 7278, 'loss/train': 2.464550733566284} -08/30/2021 14:29:11 - INFO - __main__ - Step 7280: {'lr': 0.000498432039356124, 'samples': 1397760, 'steps': 7279, 'loss/train': 2.4765076637268066} -08/30/2021 14:29:12 - INFO - __main__ - Step 7281: {'lr': 0.0004984314458848923, 'samples': 1397952, 'steps': 7280, 'loss/train': 0.7683911919593811} -08/30/2021 14:29:12 - INFO - __main__ - Step 7282: {'lr': 0.0004984308523017212, 'samples': 1398144, 'steps': 7281, 'loss/train': 1.5597885847091675} -08/30/2021 14:29:12 - INFO - __main__ - Step 7283: {'lr': 0.000498430258606611, 'samples': 1398336, 'steps': 7282, 'loss/train': 2.402383804321289} -08/30/2021 14:29:14 - INFO - __main__ - Step 7284: {'lr': 0.000498429664799562, 'samples': 1398528, 'steps': 7283, 'loss/train': 0.47472572326660156} -08/30/2021 14:29:15 - INFO - __main__ - Step 7285: {'lr': 0.0004984290708805743, 'samples': 1398720, 'steps': 7284, 'loss/train': 1.5766929388046265} -08/30/2021 14:29:15 - INFO - __main__ - Step 7286: {'lr': 0.0004984284768496484, 'samples': 1398912, 'steps': 7285, 'loss/train': 2.2995853424072266} -08/30/2021 14:29:15 - INFO - __main__ - Step 7287: {'lr': 0.0004984278827067844, 'samples': 1399104, 'steps': 7286, 'loss/train': 2.6046810150146484} -08/30/2021 14:29:16 - INFO - __main__ - Step 7288: {'lr': 0.0004984272884519827, 'samples': 1399296, 'steps': 7287, 'loss/train': 1.3832066059112549} -08/30/2021 14:29:16 - INFO - __main__ - Step 7289: {'lr': 0.0004984266940852434, 'samples': 1399488, 'steps': 7288, 'loss/train': 2.2288410663604736} -08/30/2021 14:29:17 - INFO - __main__ - Step 7290: {'lr': 0.0004984260996065671, 'samples': 1399680, 'steps': 7289, 'loss/train': 2.1831796169281006} -08/30/2021 14:29:18 - INFO - __main__ - Step 7291: {'lr': 0.0004984255050159536, 'samples': 1399872, 'steps': 7290, 'loss/train': 1.6125967502593994} -08/30/2021 14:29:18 - INFO - __main__ - Step 7292: {'lr': 0.0004984249103134035, 'samples': 1400064, 'steps': 7291, 'loss/train': 2.1078720092773438} -08/30/2021 14:29:18 - INFO - __main__ - Step 7293: {'lr': 0.0004984243154989168, 'samples': 1400256, 'steps': 7292, 'loss/train': 2.4023003578186035} -08/30/2021 14:29:19 - INFO - __main__ - Step 7294: {'lr': 0.0004984237205724942, 'samples': 1400448, 'steps': 7293, 'loss/train': 2.2205755710601807} -08/30/2021 14:29:21 - INFO - __main__ - Step 7295: {'lr': 0.0004984231255341355, 'samples': 1400640, 'steps': 7294, 'loss/train': 1.6430696249008179} -08/30/2021 14:29:21 - INFO - __main__ - Step 7296: {'lr': 0.0004984225303838413, 'samples': 1400832, 'steps': 7295, 'loss/train': 1.9313017129898071} -08/30/2021 14:29:21 - INFO - __main__ - Step 7297: {'lr': 0.0004984219351216116, 'samples': 1401024, 'steps': 7296, 'loss/train': 2.0928707122802734} -08/30/2021 14:29:22 - INFO - __main__ - Step 7298: {'lr': 0.000498421339747447, 'samples': 1401216, 'steps': 7297, 'loss/train': 1.7971556186676025} -08/30/2021 14:29:22 - INFO - __main__ - Step 7299: {'lr': 0.0004984207442613474, 'samples': 1401408, 'steps': 7298, 'loss/train': 2.812422037124634} -08/30/2021 14:29:25 - INFO - __main__ - Step 7300: {'lr': 0.0004984201486633134, 'samples': 1401600, 'steps': 7299, 'loss/train': 2.3023829460144043} -08/30/2021 14:29:25 - INFO - __main__ - Step 7301: {'lr': 0.0004984195529533451, 'samples': 1401792, 'steps': 7300, 'loss/train': 2.187779426574707} -08/30/2021 14:29:26 - INFO - __main__ - Step 7302: {'lr': 0.0004984189571314426, 'samples': 1401984, 'steps': 7301, 'loss/train': 1.8578436374664307} -08/30/2021 14:29:26 - INFO - __main__ - Step 7303: {'lr': 0.0004984183611976065, 'samples': 1402176, 'steps': 7302, 'loss/train': 2.4243733882904053} -08/30/2021 14:29:26 - INFO - __main__ - Step 7304: {'lr': 0.0004984177651518369, 'samples': 1402368, 'steps': 7303, 'loss/train': 2.580448627471924} -08/30/2021 14:29:27 - INFO - __main__ - Step 7305: {'lr': 0.0004984171689941341, 'samples': 1402560, 'steps': 7304, 'loss/train': 1.3540310859680176} -08/30/2021 14:29:28 - INFO - __main__ - Step 7306: {'lr': 0.0004984165727244984, 'samples': 1402752, 'steps': 7305, 'loss/train': 0.48593971133232117} -08/30/2021 14:29:29 - INFO - __main__ - Step 7307: {'lr': 0.0004984159763429299, 'samples': 1402944, 'steps': 7306, 'loss/train': 0.3630259335041046} -08/30/2021 14:29:29 - INFO - __main__ - Step 7308: {'lr': 0.0004984153798494291, 'samples': 1403136, 'steps': 7307, 'loss/train': 2.3465182781219482} -08/30/2021 14:29:30 - INFO - __main__ - Step 7309: {'lr': 0.000498414783243996, 'samples': 1403328, 'steps': 7308, 'loss/train': 2.074223279953003} -08/30/2021 14:29:30 - INFO - __main__ - Step 7310: {'lr': 0.0004984141865266312, 'samples': 1403520, 'steps': 7309, 'loss/train': 2.2703497409820557} -08/30/2021 14:29:31 - INFO - __main__ - Step 7311: {'lr': 0.0004984135896973348, 'samples': 1403712, 'steps': 7310, 'loss/train': 2.1518030166625977} -08/30/2021 14:29:32 - INFO - __main__ - Step 7312: {'lr': 0.000498412992756107, 'samples': 1403904, 'steps': 7311, 'loss/train': 1.5375657081604004} -08/30/2021 14:29:32 - INFO - __main__ - Step 7313: {'lr': 0.0004984123957029482, 'samples': 1404096, 'steps': 7312, 'loss/train': 2.6248369216918945} -08/30/2021 14:29:33 - INFO - __main__ - Step 7314: {'lr': 0.0004984117985378586, 'samples': 1404288, 'steps': 7313, 'loss/train': 2.0702261924743652} -08/30/2021 14:29:33 - INFO - __main__ - Step 7315: {'lr': 0.0004984112012608384, 'samples': 1404480, 'steps': 7314, 'loss/train': 1.9362568855285645} -08/30/2021 14:29:34 - INFO - __main__ - Step 7316: {'lr': 0.000498410603871888, 'samples': 1404672, 'steps': 7315, 'loss/train': 2.604275941848755} -08/30/2021 14:29:35 - INFO - __main__ - Step 7317: {'lr': 0.0004984100063710076, 'samples': 1404864, 'steps': 7316, 'loss/train': 2.0040323734283447} -08/30/2021 14:29:35 - INFO - __main__ - Step 7318: {'lr': 0.0004984094087581975, 'samples': 1405056, 'steps': 7317, 'loss/train': 2.2937192916870117} -08/30/2021 14:29:36 - INFO - __main__ - Step 7319: {'lr': 0.0004984088110334579, 'samples': 1405248, 'steps': 7318, 'loss/train': 2.2699267864227295} -08/30/2021 14:29:36 - INFO - __main__ - Step 7320: {'lr': 0.0004984082131967892, 'samples': 1405440, 'steps': 7319, 'loss/train': 2.281672954559326} -08/30/2021 14:29:38 - INFO - __main__ - Step 7321: {'lr': 0.0004984076152481916, 'samples': 1405632, 'steps': 7320, 'loss/train': 2.3214380741119385} -08/30/2021 14:29:38 - INFO - __main__ - Step 7322: {'lr': 0.0004984070171876653, 'samples': 1405824, 'steps': 7321, 'loss/train': 1.8340390920639038} -08/30/2021 14:29:39 - INFO - __main__ - Step 7323: {'lr': 0.0004984064190152106, 'samples': 1406016, 'steps': 7322, 'loss/train': 2.1536357402801514} -08/30/2021 14:29:39 - INFO - __main__ - Step 7324: {'lr': 0.0004984058207308279, 'samples': 1406208, 'steps': 7323, 'loss/train': 2.2334518432617188} -08/30/2021 14:29:39 - INFO - __main__ - Step 7325: {'lr': 0.0004984052223345174, 'samples': 1406400, 'steps': 7324, 'loss/train': 2.2364373207092285} -08/30/2021 14:29:40 - INFO - __main__ - Step 7326: {'lr': 0.0004984046238262792, 'samples': 1406592, 'steps': 7325, 'loss/train': 2.1886324882507324} -08/30/2021 14:29:41 - INFO - __main__ - Step 7327: {'lr': 0.0004984040252061137, 'samples': 1406784, 'steps': 7326, 'loss/train': 1.6918123960494995} -08/30/2021 14:29:42 - INFO - __main__ - Step 7328: {'lr': 0.0004984034264740213, 'samples': 1406976, 'steps': 7327, 'loss/train': 2.175912618637085} -08/30/2021 14:29:42 - INFO - __main__ - Step 7329: {'lr': 0.0004984028276300021, 'samples': 1407168, 'steps': 7328, 'loss/train': 0.998396098613739} -08/30/2021 14:29:42 - INFO - __main__ - Step 7330: {'lr': 0.0004984022286740565, 'samples': 1407360, 'steps': 7329, 'loss/train': 2.3154714107513428} -08/30/2021 14:29:43 - INFO - __main__ - Step 7331: {'lr': 0.0004984016296061846, 'samples': 1407552, 'steps': 7330, 'loss/train': 2.078317880630493} -08/30/2021 14:29:44 - INFO - __main__ - Step 7332: {'lr': 0.0004984010304263868, 'samples': 1407744, 'steps': 7331, 'loss/train': 2.328183889389038} -08/30/2021 14:29:45 - INFO - __main__ - Step 7333: {'lr': 0.0004984004311346632, 'samples': 1407936, 'steps': 7332, 'loss/train': 2.2446072101593018} -08/30/2021 14:29:45 - INFO - __main__ - Step 7334: {'lr': 0.0004983998317310143, 'samples': 1408128, 'steps': 7333, 'loss/train': 2.094515323638916} -08/30/2021 14:29:45 - INFO - __main__ - Step 7335: {'lr': 0.0004983992322154403, 'samples': 1408320, 'steps': 7334, 'loss/train': 2.0975446701049805} -08/30/2021 14:29:46 - INFO - __main__ - Step 7336: {'lr': 0.0004983986325879414, 'samples': 1408512, 'steps': 7335, 'loss/train': 2.3745675086975098} -08/30/2021 14:29:47 - INFO - __main__ - Step 7337: {'lr': 0.0004983980328485179, 'samples': 1408704, 'steps': 7336, 'loss/train': 2.052238702774048} -08/30/2021 14:29:48 - INFO - __main__ - Step 7338: {'lr': 0.0004983974329971702, 'samples': 1408896, 'steps': 7337, 'loss/train': 2.013025999069214} -08/30/2021 14:29:48 - INFO - __main__ - Step 7339: {'lr': 0.0004983968330338983, 'samples': 1409088, 'steps': 7338, 'loss/train': 2.086759328842163} -08/30/2021 14:29:48 - INFO - __main__ - Step 7340: {'lr': 0.0004983962329587026, 'samples': 1409280, 'steps': 7339, 'loss/train': 2.233823299407959} -08/30/2021 14:29:49 - INFO - __main__ - Step 7341: {'lr': 0.0004983956327715835, 'samples': 1409472, 'steps': 7340, 'loss/train': 1.8948982954025269} -08/30/2021 14:29:50 - INFO - __main__ - Step 7342: {'lr': 0.000498395032472541, 'samples': 1409664, 'steps': 7341, 'loss/train': 2.163719892501831} -08/30/2021 14:29:51 - INFO - __main__ - Step 7343: {'lr': 0.0004983944320615757, 'samples': 1409856, 'steps': 7342, 'loss/train': 2.064788579940796} -08/30/2021 14:29:51 - INFO - __main__ - Step 7344: {'lr': 0.0004983938315386877, 'samples': 1410048, 'steps': 7343, 'loss/train': 2.149324893951416} -08/30/2021 14:29:51 - INFO - __main__ - Step 7345: {'lr': 0.0004983932309038773, 'samples': 1410240, 'steps': 7344, 'loss/train': 1.6421600580215454} -08/30/2021 14:29:52 - INFO - __main__ - Step 7346: {'lr': 0.0004983926301571445, 'samples': 1410432, 'steps': 7345, 'loss/train': 1.915958046913147} -08/30/2021 14:29:52 - INFO - __main__ - Step 7347: {'lr': 0.00049839202929849, 'samples': 1410624, 'steps': 7346, 'loss/train': 2.089918613433838} -08/30/2021 14:29:54 - INFO - __main__ - Step 7348: {'lr': 0.0004983914283279139, 'samples': 1410816, 'steps': 7347, 'loss/train': 2.4067695140838623} -08/30/2021 14:29:54 - INFO - __main__ - Step 7349: {'lr': 0.0004983908272454164, 'samples': 1411008, 'steps': 7348, 'loss/train': 1.8284673690795898} -08/30/2021 14:29:55 - INFO - __main__ - Step 7350: {'lr': 0.0004983902260509978, 'samples': 1411200, 'steps': 7349, 'loss/train': 0.35611075162887573} -08/30/2021 14:29:55 - INFO - __main__ - Step 7351: {'lr': 0.0004983896247446585, 'samples': 1411392, 'steps': 7350, 'loss/train': 2.664098024368286} -08/30/2021 14:29:55 - INFO - __main__ - Step 7352: {'lr': 0.0004983890233263986, 'samples': 1411584, 'steps': 7351, 'loss/train': 2.089432716369629} -08/30/2021 14:29:56 - INFO - __main__ - Step 7353: {'lr': 0.0004983884217962185, 'samples': 1411776, 'steps': 7352, 'loss/train': 0.6431196928024292} -08/30/2021 14:29:57 - INFO - __main__ - Step 7354: {'lr': 0.0004983878201541183, 'samples': 1411968, 'steps': 7353, 'loss/train': 0.7944732308387756} -08/30/2021 14:29:58 - INFO - __main__ - Step 7355: {'lr': 0.0004983872184000984, 'samples': 1412160, 'steps': 7354, 'loss/train': 2.156621217727661} -08/30/2021 14:29:58 - INFO - __main__ - Step 7356: {'lr': 0.0004983866165341592, 'samples': 1412352, 'steps': 7355, 'loss/train': 2.0597763061523438} -08/30/2021 14:29:59 - INFO - __main__ - Step 7357: {'lr': 0.0004983860145563006, 'samples': 1412544, 'steps': 7356, 'loss/train': 1.9994845390319824} -08/30/2021 14:29:59 - INFO - __main__ - Step 7358: {'lr': 0.0004983854124665232, 'samples': 1412736, 'steps': 7357, 'loss/train': 2.909639596939087} -08/30/2021 14:30:00 - INFO - __main__ - Step 7359: {'lr': 0.0004983848102648273, 'samples': 1412928, 'steps': 7358, 'loss/train': 1.9383361339569092} -08/30/2021 14:30:01 - INFO - __main__ - Step 7360: {'lr': 0.0004983842079512128, 'samples': 1413120, 'steps': 7359, 'loss/train': 1.5737757682800293} -08/30/2021 14:30:01 - INFO - __main__ - Step 7361: {'lr': 0.0004983836055256804, 'samples': 1413312, 'steps': 7360, 'loss/train': 2.7860159873962402} -08/30/2021 14:30:02 - INFO - __main__ - Step 7362: {'lr': 0.0004983830029882301, 'samples': 1413504, 'steps': 7361, 'loss/train': 1.4995863437652588} -08/30/2021 14:30:02 - INFO - __main__ - Step 7363: {'lr': 0.0004983824003388622, 'samples': 1413696, 'steps': 7362, 'loss/train': 2.1719024181365967} -08/30/2021 14:30:03 - INFO - __main__ - Step 7364: {'lr': 0.0004983817975775771, 'samples': 1413888, 'steps': 7363, 'loss/train': 1.7462650537490845} -08/30/2021 14:30:04 - INFO - __main__ - Step 7365: {'lr': 0.000498381194704375, 'samples': 1414080, 'steps': 7364, 'loss/train': 2.0631139278411865} -08/30/2021 14:30:04 - INFO - __main__ - Step 7366: {'lr': 0.000498380591719256, 'samples': 1414272, 'steps': 7365, 'loss/train': 1.9877134561538696} -08/30/2021 14:30:04 - INFO - __main__ - Step 7367: {'lr': 0.0004983799886222207, 'samples': 1414464, 'steps': 7366, 'loss/train': 2.4696197509765625} -08/30/2021 14:30:05 - INFO - __main__ - Step 7368: {'lr': 0.0004983793854132693, 'samples': 1414656, 'steps': 7367, 'loss/train': 2.257033586502075} -08/30/2021 14:30:07 - INFO - __main__ - Step 7369: {'lr': 0.0004983787820924019, 'samples': 1414848, 'steps': 7368, 'loss/train': 2.3936657905578613} -08/30/2021 14:30:07 - INFO - __main__ - Step 7370: {'lr': 0.0004983781786596187, 'samples': 1415040, 'steps': 7369, 'loss/train': 2.3956568241119385} -08/30/2021 14:30:08 - INFO - __main__ - Step 7371: {'lr': 0.0004983775751149204, 'samples': 1415232, 'steps': 7370, 'loss/train': 2.376009702682495} -08/30/2021 14:30:08 - INFO - __main__ - Step 7372: {'lr': 0.0004983769714583067, 'samples': 1415424, 'steps': 7371, 'loss/train': 2.920656681060791} -08/30/2021 14:30:08 - INFO - __main__ - Step 7373: {'lr': 0.0004983763676897784, 'samples': 1415616, 'steps': 7372, 'loss/train': 1.9536528587341309} -08/30/2021 14:30:10 - INFO - __main__ - Step 7374: {'lr': 0.0004983757638093355, 'samples': 1415808, 'steps': 7373, 'loss/train': 1.974847435951233} -08/30/2021 14:30:10 - INFO - __main__ - Step 7375: {'lr': 0.0004983751598169781, 'samples': 1416000, 'steps': 7374, 'loss/train': 1.821936011314392} -08/30/2021 14:30:11 - INFO - __main__ - Step 7376: {'lr': 0.000498374555712707, 'samples': 1416192, 'steps': 7375, 'loss/train': 2.4945473670959473} -08/30/2021 14:30:11 - INFO - __main__ - Step 7377: {'lr': 0.000498373951496522, 'samples': 1416384, 'steps': 7376, 'loss/train': 2.7330830097198486} -08/30/2021 14:30:11 - INFO - __main__ - Step 7378: {'lr': 0.0004983733471684234, 'samples': 1416576, 'steps': 7377, 'loss/train': 2.330193519592285} -08/30/2021 14:30:12 - INFO - __main__ - Step 7379: {'lr': 0.0004983727427284118, 'samples': 1416768, 'steps': 7378, 'loss/train': 1.9637912511825562} -08/30/2021 14:30:13 - INFO - __main__ - Step 7380: {'lr': 0.0004983721381764873, 'samples': 1416960, 'steps': 7379, 'loss/train': 1.901741862297058} -08/30/2021 14:30:14 - INFO - __main__ - Step 7381: {'lr': 0.00049837153351265, 'samples': 1417152, 'steps': 7380, 'loss/train': 1.9059598445892334} -08/30/2021 14:30:14 - INFO - __main__ - Step 7382: {'lr': 0.0004983709287369004, 'samples': 1417344, 'steps': 7381, 'loss/train': 2.421776056289673} -08/30/2021 14:30:14 - INFO - __main__ - Step 7383: {'lr': 0.0004983703238492386, 'samples': 1417536, 'steps': 7382, 'loss/train': 2.3350424766540527} -08/30/2021 14:30:15 - INFO - __main__ - Step 7384: {'lr': 0.000498369718849665, 'samples': 1417728, 'steps': 7383, 'loss/train': 2.4568023681640625} -08/30/2021 14:30:16 - INFO - __main__ - Step 7385: {'lr': 0.00049836911373818, 'samples': 1417920, 'steps': 7384, 'loss/train': 1.2539393901824951} -08/30/2021 14:30:16 - INFO - __main__ - Step 7386: {'lr': 0.0004983685085147836, 'samples': 1418112, 'steps': 7385, 'loss/train': 2.3377857208251953} -08/30/2021 14:30:17 - INFO - __main__ - Step 7387: {'lr': 0.0004983679031794762, 'samples': 1418304, 'steps': 7386, 'loss/train': 2.0887928009033203} -08/30/2021 14:30:17 - INFO - __main__ - Step 7388: {'lr': 0.000498367297732258, 'samples': 1418496, 'steps': 7387, 'loss/train': 2.3747024536132812} -08/30/2021 14:30:18 - INFO - __main__ - Step 7389: {'lr': 0.0004983666921731293, 'samples': 1418688, 'steps': 7388, 'loss/train': 1.945997953414917} -08/30/2021 14:30:19 - INFO - __main__ - Step 7390: {'lr': 0.0004983660865020905, 'samples': 1418880, 'steps': 7389, 'loss/train': 2.0669167041778564} -08/30/2021 14:30:20 - INFO - __main__ - Step 7391: {'lr': 0.0004983654807191418, 'samples': 1419072, 'steps': 7390, 'loss/train': 1.9517908096313477} -08/30/2021 14:30:20 - INFO - __main__ - Step 7392: {'lr': 0.0004983648748242833, 'samples': 1419264, 'steps': 7391, 'loss/train': 2.733821392059326} -08/30/2021 14:30:20 - INFO - __main__ - Step 7393: {'lr': 0.0004983642688175155, 'samples': 1419456, 'steps': 7392, 'loss/train': 2.7295315265655518} -08/30/2021 14:30:21 - INFO - __main__ - Step 7394: {'lr': 0.0004983636626988386, 'samples': 1419648, 'steps': 7393, 'loss/train': 1.5603747367858887} -08/30/2021 14:30:22 - INFO - __main__ - Step 7395: {'lr': 0.0004983630564682529, 'samples': 1419840, 'steps': 7394, 'loss/train': 1.9845948219299316} -08/30/2021 14:30:23 - INFO - __main__ - Step 7396: {'lr': 0.0004983624501257585, 'samples': 1420032, 'steps': 7395, 'loss/train': 1.4001693725585938} -08/30/2021 14:30:23 - INFO - __main__ - Step 7397: {'lr': 0.000498361843671356, 'samples': 1420224, 'steps': 7396, 'loss/train': 2.3412017822265625} -08/30/2021 14:30:23 - INFO - __main__ - Step 7398: {'lr': 0.0004983612371050453, 'samples': 1420416, 'steps': 7397, 'loss/train': 1.9006016254425049} -08/30/2021 14:30:24 - INFO - __main__ - Step 7399: {'lr': 0.000498360630426827, 'samples': 1420608, 'steps': 7398, 'loss/train': 2.0284204483032227} -08/30/2021 14:30:25 - INFO - __main__ - Step 7400: {'lr': 0.0004983600236367012, 'samples': 1420800, 'steps': 7399, 'loss/train': 1.6678403615951538} -08/30/2021 14:30:26 - INFO - __main__ - Step 7401: {'lr': 0.0004983594167346681, 'samples': 1420992, 'steps': 7400, 'loss/train': 1.9424364566802979} -08/30/2021 14:30:26 - INFO - __main__ - Step 7402: {'lr': 0.0004983588097207283, 'samples': 1421184, 'steps': 7401, 'loss/train': 1.8753180503845215} -08/30/2021 14:30:26 - INFO - __main__ - Step 7403: {'lr': 0.0004983582025948816, 'samples': 1421376, 'steps': 7402, 'loss/train': 1.6198694705963135} -08/30/2021 14:30:27 - INFO - __main__ - Step 7404: {'lr': 0.0004983575953571287, 'samples': 1421568, 'steps': 7403, 'loss/train': 2.0816402435302734} -08/30/2021 14:30:28 - INFO - __main__ - Step 7405: {'lr': 0.0004983569880074696, 'samples': 1421760, 'steps': 7404, 'loss/train': 2.150106430053711} -08/30/2021 14:30:28 - INFO - __main__ - Step 7406: {'lr': 0.0004983563805459048, 'samples': 1421952, 'steps': 7405, 'loss/train': 1.9102110862731934} -08/30/2021 14:30:29 - INFO - __main__ - Step 7407: {'lr': 0.0004983557729724343, 'samples': 1422144, 'steps': 7406, 'loss/train': 2.9529612064361572} -08/30/2021 14:30:29 - INFO - __main__ - Step 7408: {'lr': 0.0004983551652870586, 'samples': 1422336, 'steps': 7407, 'loss/train': 2.0352892875671387} -08/30/2021 14:30:30 - INFO - __main__ - Step 7409: {'lr': 0.000498354557489778, 'samples': 1422528, 'steps': 7408, 'loss/train': 0.8830174803733826} -08/30/2021 14:30:31 - INFO - __main__ - Step 7410: {'lr': 0.0004983539495805925, 'samples': 1422720, 'steps': 7409, 'loss/train': 1.8262628316879272} -08/30/2021 14:30:31 - INFO - __main__ - Step 7411: {'lr': 0.0004983533415595026, 'samples': 1422912, 'steps': 7410, 'loss/train': 1.6404615640640259} -08/30/2021 14:30:32 - INFO - __main__ - Step 7412: {'lr': 0.0004983527334265085, 'samples': 1423104, 'steps': 7411, 'loss/train': 1.8170119524002075} -08/30/2021 14:30:32 - INFO - __main__ - Step 7413: {'lr': 0.0004983521251816105, 'samples': 1423296, 'steps': 7412, 'loss/train': 2.4166505336761475} -08/30/2021 14:30:32 - INFO - __main__ - Step 7414: {'lr': 0.0004983515168248088, 'samples': 1423488, 'steps': 7413, 'loss/train': 1.8743215799331665} -08/30/2021 14:30:33 - INFO - __main__ - Step 7415: {'lr': 0.0004983509083561038, 'samples': 1423680, 'steps': 7414, 'loss/train': 1.871317744255066} -08/30/2021 14:30:34 - INFO - __main__ - Step 7416: {'lr': 0.0004983502997754958, 'samples': 1423872, 'steps': 7415, 'loss/train': 1.6531336307525635} -08/30/2021 14:30:35 - INFO - __main__ - Step 7417: {'lr': 0.0004983496910829849, 'samples': 1424064, 'steps': 7416, 'loss/train': 2.0444021224975586} -08/30/2021 14:30:35 - INFO - __main__ - Step 7418: {'lr': 0.0004983490822785715, 'samples': 1424256, 'steps': 7417, 'loss/train': 0.7739229202270508} -08/30/2021 14:30:35 - INFO - __main__ - Step 7419: {'lr': 0.0004983484733622558, 'samples': 1424448, 'steps': 7418, 'loss/train': 1.9896584749221802} -08/30/2021 14:30:36 - INFO - __main__ - Step 7420: {'lr': 0.0004983478643340382, 'samples': 1424640, 'steps': 7419, 'loss/train': 1.5574097633361816} -08/30/2021 14:30:38 - INFO - __main__ - Step 7421: {'lr': 0.0004983472551939186, 'samples': 1424832, 'steps': 7420, 'loss/train': 1.8600473403930664} -08/30/2021 14:30:38 - INFO - __main__ - Step 7422: {'lr': 0.0004983466459418978, 'samples': 1425024, 'steps': 7421, 'loss/train': 2.0000452995300293} -08/30/2021 14:30:39 - INFO - __main__ - Step 7423: {'lr': 0.0004983460365779759, 'samples': 1425216, 'steps': 7422, 'loss/train': 1.8882938623428345} -08/30/2021 14:30:39 - INFO - __main__ - Step 7424: {'lr': 0.0004983454271021529, 'samples': 1425408, 'steps': 7423, 'loss/train': 2.1789987087249756} -08/30/2021 14:30:39 - INFO - __main__ - Step 7425: {'lr': 0.0004983448175144294, 'samples': 1425600, 'steps': 7424, 'loss/train': 1.816618800163269} -08/30/2021 14:30:41 - INFO - __main__ - Step 7426: {'lr': 0.0004983442078148056, 'samples': 1425792, 'steps': 7425, 'loss/train': 1.7849947214126587} -08/30/2021 14:30:42 - INFO - __main__ - Step 7427: {'lr': 0.0004983435980032817, 'samples': 1425984, 'steps': 7426, 'loss/train': 0.6277517080307007} -08/30/2021 14:30:42 - INFO - __main__ - Step 7428: {'lr': 0.0004983429880798579, 'samples': 1426176, 'steps': 7427, 'loss/train': 0.7024663090705872} -08/30/2021 14:30:42 - INFO - __main__ - Step 7429: {'lr': 0.0004983423780445346, 'samples': 1426368, 'steps': 7428, 'loss/train': 2.2815916538238525} -08/30/2021 14:30:43 - INFO - __main__ - Step 7430: {'lr': 0.0004983417678973123, 'samples': 1426560, 'steps': 7429, 'loss/train': 1.468602180480957} -08/30/2021 14:30:43 - INFO - __main__ - Step 7431: {'lr': 0.0004983411576381907, 'samples': 1426752, 'steps': 7430, 'loss/train': 1.9443392753601074} -08/30/2021 14:30:45 - INFO - __main__ - Step 7432: {'lr': 0.0004983405472671706, 'samples': 1426944, 'steps': 7431, 'loss/train': 2.1994972229003906} -08/30/2021 14:30:45 - INFO - __main__ - Step 7433: {'lr': 0.000498339936784252, 'samples': 1427136, 'steps': 7432, 'loss/train': 2.496755361557007} -08/30/2021 14:30:45 - INFO - __main__ - Step 7434: {'lr': 0.0004983393261894354, 'samples': 1427328, 'steps': 7433, 'loss/train': 2.039398431777954} -08/30/2021 14:30:46 - INFO - __main__ - Step 7435: {'lr': 0.0004983387154827208, 'samples': 1427520, 'steps': 7434, 'loss/train': 2.1109769344329834} -08/30/2021 14:30:46 - INFO - __main__ - Step 7436: {'lr': 0.0004983381046641085, 'samples': 1427712, 'steps': 7435, 'loss/train': 1.9635385274887085} -08/30/2021 14:30:47 - INFO - __main__ - Step 7437: {'lr': 0.0004983374937335991, 'samples': 1427904, 'steps': 7436, 'loss/train': 1.7011244297027588} -08/30/2021 14:30:48 - INFO - __main__ - Step 7438: {'lr': 0.0004983368826911926, 'samples': 1428096, 'steps': 7437, 'loss/train': 2.3067703247070312} -08/30/2021 14:30:48 - INFO - __main__ - Step 7439: {'lr': 0.0004983362715368893, 'samples': 1428288, 'steps': 7438, 'loss/train': 2.313699960708618} -08/30/2021 14:30:49 - INFO - __main__ - Step 7440: {'lr': 0.0004983356602706895, 'samples': 1428480, 'steps': 7439, 'loss/train': 2.028313398361206} -08/30/2021 14:30:49 - INFO - __main__ - Step 7441: {'lr': 0.0004983350488925936, 'samples': 1428672, 'steps': 7440, 'loss/train': 1.9797123670578003} -08/30/2021 14:30:49 - INFO - __main__ - Step 7442: {'lr': 0.0004983344374026016, 'samples': 1428864, 'steps': 7441, 'loss/train': 1.7195743322372437} -08/30/2021 14:30:51 - INFO - __main__ - Step 7443: {'lr': 0.0004983338258007139, 'samples': 1429056, 'steps': 7442, 'loss/train': 2.02921462059021} -08/30/2021 14:30:51 - INFO - __main__ - Step 7444: {'lr': 0.0004983332140869309, 'samples': 1429248, 'steps': 7443, 'loss/train': 2.007859230041504} -08/30/2021 14:30:52 - INFO - __main__ - Step 7445: {'lr': 0.0004983326022612528, 'samples': 1429440, 'steps': 7444, 'loss/train': 1.9799222946166992} -08/30/2021 14:30:52 - INFO - __main__ - Step 7446: {'lr': 0.0004983319903236799, 'samples': 1429632, 'steps': 7445, 'loss/train': 1.4338672161102295} -08/30/2021 14:30:52 - INFO - __main__ - Step 7447: {'lr': 0.0004983313782742124, 'samples': 1429824, 'steps': 7446, 'loss/train': 1.4499529600143433} -08/30/2021 14:30:54 - INFO - __main__ - Step 7448: {'lr': 0.0004983307661128505, 'samples': 1430016, 'steps': 7447, 'loss/train': 1.8329721689224243} -08/30/2021 14:30:55 - INFO - __main__ - Step 7449: {'lr': 0.0004983301538395948, 'samples': 1430208, 'steps': 7448, 'loss/train': 1.7827765941619873} -08/30/2021 14:30:55 - INFO - __main__ - Step 7450: {'lr': 0.0004983295414544452, 'samples': 1430400, 'steps': 7449, 'loss/train': 2.311680316925049} -08/30/2021 14:30:55 - INFO - __main__ - Step 7451: {'lr': 0.0004983289289574022, 'samples': 1430592, 'steps': 7450, 'loss/train': 2.8694517612457275} -08/30/2021 14:30:56 - INFO - __main__ - Step 7452: {'lr': 0.000498328316348466, 'samples': 1430784, 'steps': 7451, 'loss/train': 1.5860830545425415} -08/30/2021 14:30:56 - INFO - __main__ - Step 7453: {'lr': 0.0004983277036276369, 'samples': 1430976, 'steps': 7452, 'loss/train': 1.9333540201187134} -08/30/2021 14:30:58 - INFO - __main__ - Step 7454: {'lr': 0.0004983270907949152, 'samples': 1431168, 'steps': 7453, 'loss/train': 0.31429755687713623} -08/30/2021 14:30:58 - INFO - __main__ - Step 7455: {'lr': 0.0004983264778503011, 'samples': 1431360, 'steps': 7454, 'loss/train': 1.7631436586380005} -08/30/2021 14:30:58 - INFO - __main__ - Step 7456: {'lr': 0.0004983258647937949, 'samples': 1431552, 'steps': 7455, 'loss/train': 2.311392307281494} -08/30/2021 14:30:59 - INFO - __main__ - Step 7457: {'lr': 0.0004983252516253969, 'samples': 1431744, 'steps': 7456, 'loss/train': 1.570852518081665} -08/30/2021 14:30:59 - INFO - __main__ - Step 7458: {'lr': 0.0004983246383451074, 'samples': 1431936, 'steps': 7457, 'loss/train': 2.570781946182251} -08/30/2021 14:30:59 - INFO - __main__ - Step 7459: {'lr': 0.0004983240249529267, 'samples': 1432128, 'steps': 7458, 'loss/train': 2.4136455059051514} -08/30/2021 14:31:01 - INFO - __main__ - Step 7460: {'lr': 0.000498323411448855, 'samples': 1432320, 'steps': 7459, 'loss/train': 2.0277886390686035} -08/30/2021 14:31:01 - INFO - __main__ - Step 7461: {'lr': 0.0004983227978328926, 'samples': 1432512, 'steps': 7460, 'loss/train': 3.357154369354248} -08/30/2021 14:31:02 - INFO - __main__ - Step 7462: {'lr': 0.0004983221841050397, 'samples': 1432704, 'steps': 7461, 'loss/train': 1.9147751331329346} -08/30/2021 14:31:02 - INFO - __main__ - Step 7463: {'lr': 0.0004983215702652968, 'samples': 1432896, 'steps': 7462, 'loss/train': 2.4763360023498535} -08/30/2021 14:31:02 - INFO - __main__ - Step 7464: {'lr': 0.0004983209563136639, 'samples': 1433088, 'steps': 7463, 'loss/train': 1.8825286626815796} -08/30/2021 14:31:04 - INFO - __main__ - Step 7465: {'lr': 0.0004983203422501414, 'samples': 1433280, 'steps': 7464, 'loss/train': 2.0879411697387695} -08/30/2021 14:31:04 - INFO - __main__ - Step 7466: {'lr': 0.0004983197280747297, 'samples': 1433472, 'steps': 7465, 'loss/train': 1.7000820636749268} -08/30/2021 14:31:05 - INFO - __main__ - Step 7467: {'lr': 0.0004983191137874289, 'samples': 1433664, 'steps': 7466, 'loss/train': 2.187587261199951} -08/30/2021 14:31:05 - INFO - __main__ - Step 7468: {'lr': 0.0004983184993882394, 'samples': 1433856, 'steps': 7467, 'loss/train': 2.4067704677581787} -08/30/2021 14:31:05 - INFO - __main__ - Step 7469: {'lr': 0.0004983178848771613, 'samples': 1434048, 'steps': 7468, 'loss/train': 2.186933994293213} -08/30/2021 14:31:07 - INFO - __main__ - Step 7470: {'lr': 0.0004983172702541951, 'samples': 1434240, 'steps': 7469, 'loss/train': 1.7947266101837158} -08/30/2021 14:31:07 - INFO - __main__ - Step 7471: {'lr': 0.0004983166555193409, 'samples': 1434432, 'steps': 7470, 'loss/train': 1.9566001892089844} -08/30/2021 14:31:08 - INFO - __main__ - Step 7472: {'lr': 0.000498316040672599, 'samples': 1434624, 'steps': 7471, 'loss/train': 2.3320071697235107} -08/30/2021 14:31:08 - INFO - __main__ - Step 7473: {'lr': 0.00049831542571397, 'samples': 1434816, 'steps': 7472, 'loss/train': 2.0690970420837402} -08/30/2021 14:31:08 - INFO - __main__ - Step 7474: {'lr': 0.0004983148106434536, 'samples': 1435008, 'steps': 7473, 'loss/train': 1.548442006111145} -08/30/2021 14:31:10 - INFO - __main__ - Step 7475: {'lr': 0.0004983141954610505, 'samples': 1435200, 'steps': 7474, 'loss/train': 2.0176265239715576} -08/30/2021 14:31:11 - INFO - __main__ - Step 7476: {'lr': 0.0004983135801667608, 'samples': 1435392, 'steps': 7475, 'loss/train': 1.918919324874878} -08/30/2021 14:31:11 - INFO - __main__ - Step 7477: {'lr': 0.0004983129647605849, 'samples': 1435584, 'steps': 7476, 'loss/train': 1.9551241397857666} -08/30/2021 14:31:12 - INFO - __main__ - Step 7478: {'lr': 0.0004983123492425229, 'samples': 1435776, 'steps': 7477, 'loss/train': 2.201251745223999} -08/30/2021 14:31:12 - INFO - __main__ - Step 7479: {'lr': 0.0004983117336125753, 'samples': 1435968, 'steps': 7478, 'loss/train': 2.257244825363159} -08/30/2021 14:31:14 - INFO - __main__ - Step 7480: {'lr': 0.0004983111178707422, 'samples': 1436160, 'steps': 7479, 'loss/train': 2.2179291248321533} -08/30/2021 14:31:14 - INFO - __main__ - Step 7481: {'lr': 0.0004983105020170239, 'samples': 1436352, 'steps': 7480, 'loss/train': 2.157257318496704} -08/30/2021 14:31:14 - INFO - __main__ - Step 7482: {'lr': 0.0004983098860514209, 'samples': 1436544, 'steps': 7481, 'loss/train': 2.0019609928131104} -08/30/2021 14:31:15 - INFO - __main__ - Step 7483: {'lr': 0.0004983092699739331, 'samples': 1436736, 'steps': 7482, 'loss/train': 2.1381466388702393} -08/30/2021 14:31:15 - INFO - __main__ - Step 7484: {'lr': 0.0004983086537845611, 'samples': 1436928, 'steps': 7483, 'loss/train': 1.8621677160263062} -08/30/2021 14:31:17 - INFO - __main__ - Step 7485: {'lr': 0.000498308037483305, 'samples': 1437120, 'steps': 7484, 'loss/train': 1.6330540180206299} -08/30/2021 14:31:17 - INFO - __main__ - Step 7486: {'lr': 0.0004983074210701651, 'samples': 1437312, 'steps': 7485, 'loss/train': 5.841049671173096} -08/30/2021 14:31:18 - INFO - __main__ - Step 7487: {'lr': 0.0004983068045451418, 'samples': 1437504, 'steps': 7486, 'loss/train': 6.140170097351074} -08/30/2021 14:31:18 - INFO - __main__ - Step 7488: {'lr': 0.0004983061879082352, 'samples': 1437696, 'steps': 7487, 'loss/train': 1.758646845817566} -08/30/2021 14:31:18 - INFO - __main__ - Step 7489: {'lr': 0.0004983055711594458, 'samples': 1437888, 'steps': 7488, 'loss/train': 0.30131110548973083} -08/30/2021 14:31:19 - INFO - __main__ - Step 7490: {'lr': 0.0004983049542987736, 'samples': 1438080, 'steps': 7489, 'loss/train': 1.9802919626235962} -08/30/2021 14:31:20 - INFO - __main__ - Step 7491: {'lr': 0.000498304337326219, 'samples': 1438272, 'steps': 7490, 'loss/train': 2.3930904865264893} -08/30/2021 14:31:21 - INFO - __main__ - Step 7492: {'lr': 0.0004983037202417824, 'samples': 1438464, 'steps': 7491, 'loss/train': 2.141775369644165} -08/30/2021 14:31:21 - INFO - __main__ - Step 7493: {'lr': 0.0004983031030454639, 'samples': 1438656, 'steps': 7492, 'loss/train': 2.0787320137023926} -08/30/2021 14:31:21 - INFO - __main__ - Step 7494: {'lr': 0.0004983024857372639, 'samples': 1438848, 'steps': 7493, 'loss/train': 1.6597785949707031} -08/30/2021 14:31:22 - INFO - __main__ - Step 7495: {'lr': 0.0004983018683171826, 'samples': 1439040, 'steps': 7494, 'loss/train': 2.1893529891967773} -08/30/2021 14:31:23 - INFO - __main__ - Step 7496: {'lr': 0.0004983012507852203, 'samples': 1439232, 'steps': 7495, 'loss/train': 1.8672926425933838} -08/30/2021 14:31:24 - INFO - __main__ - Step 7497: {'lr': 0.0004983006331413773, 'samples': 1439424, 'steps': 7496, 'loss/train': 2.1031692028045654} -08/30/2021 14:31:24 - INFO - __main__ - Step 7498: {'lr': 0.0004983000153856539, 'samples': 1439616, 'steps': 7497, 'loss/train': 1.776388168334961} -08/30/2021 14:31:24 - INFO - __main__ - Step 7499: {'lr': 0.0004982993975180504, 'samples': 1439808, 'steps': 7498, 'loss/train': 1.5209027528762817} -08/30/2021 14:31:25 - INFO - __main__ - Step 7500: {'lr': 0.0004982987795385669, 'samples': 1440000, 'steps': 7499, 'loss/train': 2.2507176399230957} -08/30/2021 14:31:25 - INFO - __main__ - Step 7501: {'lr': 0.0004982981614472039, 'samples': 1440192, 'steps': 7500, 'loss/train': 1.0047045946121216} -08/30/2021 14:31:26 - INFO - __main__ - Step 7502: {'lr': 0.0004982975432439615, 'samples': 1440384, 'steps': 7501, 'loss/train': 2.038471221923828} -08/30/2021 14:31:27 - INFO - __main__ - Step 7503: {'lr': 0.0004982969249288401, 'samples': 1440576, 'steps': 7502, 'loss/train': 2.0150177478790283} -08/30/2021 14:31:27 - INFO - __main__ - Step 7504: {'lr': 0.0004982963065018399, 'samples': 1440768, 'steps': 7503, 'loss/train': 2.293520450592041} -08/30/2021 14:31:28 - INFO - __main__ - Step 7505: {'lr': 0.0004982956879629612, 'samples': 1440960, 'steps': 7504, 'loss/train': 1.9492920637130737} -08/30/2021 14:31:28 - INFO - __main__ - Step 7506: {'lr': 0.0004982950693122044, 'samples': 1441152, 'steps': 7505, 'loss/train': 2.2154383659362793} -08/30/2021 14:31:30 - INFO - __main__ - Step 7507: {'lr': 0.0004982944505495696, 'samples': 1441344, 'steps': 7506, 'loss/train': 2.200798749923706} -08/30/2021 14:31:30 - INFO - __main__ - Step 7508: {'lr': 0.0004982938316750572, 'samples': 1441536, 'steps': 7507, 'loss/train': 2.2443289756774902} -08/30/2021 14:31:30 - INFO - __main__ - Step 7509: {'lr': 0.0004982932126886674, 'samples': 1441728, 'steps': 7508, 'loss/train': 1.1262670755386353} -08/30/2021 14:31:31 - INFO - __main__ - Step 7510: {'lr': 0.0004982925935904004, 'samples': 1441920, 'steps': 7509, 'loss/train': 2.0964956283569336} -08/30/2021 14:31:31 - INFO - __main__ - Step 7511: {'lr': 0.0004982919743802567, 'samples': 1442112, 'steps': 7510, 'loss/train': 2.082104444503784} -08/30/2021 14:31:33 - INFO - __main__ - Step 7512: {'lr': 0.0004982913550582364, 'samples': 1442304, 'steps': 7511, 'loss/train': 1.5259950160980225} -08/30/2021 14:31:33 - INFO - __main__ - Step 7513: {'lr': 0.00049829073562434, 'samples': 1442496, 'steps': 7512, 'loss/train': 2.34053897857666} -08/30/2021 14:31:33 - INFO - __main__ - Step 7514: {'lr': 0.0004982901160785675, 'samples': 1442688, 'steps': 7513, 'loss/train': 1.7912914752960205} -08/30/2021 14:31:34 - INFO - __main__ - Step 7515: {'lr': 0.0004982894964209193, 'samples': 1442880, 'steps': 7514, 'loss/train': 1.35605788230896} -08/30/2021 14:31:34 - INFO - __main__ - Step 7516: {'lr': 0.0004982888766513957, 'samples': 1443072, 'steps': 7515, 'loss/train': 2.033628463745117} -08/30/2021 14:31:36 - INFO - __main__ - Step 7517: {'lr': 0.000498288256769997, 'samples': 1443264, 'steps': 7516, 'loss/train': 1.995079755783081} -08/30/2021 14:31:36 - INFO - __main__ - Step 7518: {'lr': 0.0004982876367767234, 'samples': 1443456, 'steps': 7517, 'loss/train': 1.6700373888015747} -08/30/2021 14:31:36 - INFO - __main__ - Step 7519: {'lr': 0.0004982870166715753, 'samples': 1443648, 'steps': 7518, 'loss/train': 1.7990601062774658} -08/30/2021 14:31:37 - INFO - __main__ - Step 7520: {'lr': 0.0004982863964545529, 'samples': 1443840, 'steps': 7519, 'loss/train': 2.0874156951904297} -08/30/2021 14:31:37 - INFO - __main__ - Step 7521: {'lr': 0.0004982857761256564, 'samples': 1444032, 'steps': 7520, 'loss/train': 2.185539960861206} -08/30/2021 14:31:39 - INFO - __main__ - Step 7522: {'lr': 0.0004982851556848861, 'samples': 1444224, 'steps': 7521, 'loss/train': 1.9383097887039185} -08/30/2021 14:31:39 - INFO - __main__ - Step 7523: {'lr': 0.0004982845351322424, 'samples': 1444416, 'steps': 7522, 'loss/train': 2.156398057937622} -08/30/2021 14:31:39 - INFO - __main__ - Step 7524: {'lr': 0.0004982839144677257, 'samples': 1444608, 'steps': 7523, 'loss/train': 2.3161704540252686} -08/30/2021 14:31:40 - INFO - __main__ - Step 7525: {'lr': 0.0004982832936913359, 'samples': 1444800, 'steps': 7524, 'loss/train': 1.7087222337722778} -08/30/2021 14:31:40 - INFO - __main__ - Step 7526: {'lr': 0.0004982826728030735, 'samples': 1444992, 'steps': 7525, 'loss/train': 1.8901242017745972} -08/30/2021 14:31:40 - INFO - __main__ - Step 7527: {'lr': 0.0004982820518029387, 'samples': 1445184, 'steps': 7526, 'loss/train': 1.875933289527893} -08/30/2021 14:31:42 - INFO - __main__ - Step 7528: {'lr': 0.000498281430690932, 'samples': 1445376, 'steps': 7527, 'loss/train': 2.131187677383423} -08/30/2021 14:31:43 - INFO - __main__ - Step 7529: {'lr': 0.0004982808094670534, 'samples': 1445568, 'steps': 7528, 'loss/train': 1.9248706102371216} -08/30/2021 14:31:43 - INFO - __main__ - Step 7530: {'lr': 0.0004982801881313034, 'samples': 1445760, 'steps': 7529, 'loss/train': 2.176140785217285} -08/30/2021 14:31:43 - INFO - __main__ - Step 7531: {'lr': 0.0004982795666836821, 'samples': 1445952, 'steps': 7530, 'loss/train': 2.0840225219726562} -08/30/2021 14:31:44 - INFO - __main__ - Step 7532: {'lr': 0.00049827894512419, 'samples': 1446144, 'steps': 7531, 'loss/train': 2.8085975646972656} -08/30/2021 14:31:46 - INFO - __main__ - Step 7533: {'lr': 0.000498278323452827, 'samples': 1446336, 'steps': 7532, 'loss/train': 0.224198579788208} -08/30/2021 14:31:46 - INFO - __main__ - Step 7534: {'lr': 0.0004982777016695937, 'samples': 1446528, 'steps': 7533, 'loss/train': 2.6613540649414062} -08/30/2021 14:31:46 - INFO - __main__ - Step 7535: {'lr': 0.0004982770797744904, 'samples': 1446720, 'steps': 7534, 'loss/train': 1.0777910947799683} -08/30/2021 14:31:47 - INFO - __main__ - Step 7536: {'lr': 0.0004982764577675172, 'samples': 1446912, 'steps': 7535, 'loss/train': 2.2682013511657715} -08/30/2021 14:31:47 - INFO - __main__ - Step 7537: {'lr': 0.0004982758356486746, 'samples': 1447104, 'steps': 7536, 'loss/train': 2.113523244857788} -08/30/2021 14:31:49 - INFO - __main__ - Step 7538: {'lr': 0.0004982752134179624, 'samples': 1447296, 'steps': 7537, 'loss/train': 2.2558867931365967} -08/30/2021 14:31:49 - INFO - __main__ - Step 7539: {'lr': 0.0004982745910753815, 'samples': 1447488, 'steps': 7538, 'loss/train': 1.9438822269439697} -08/30/2021 14:31:49 - INFO - __main__ - Step 7540: {'lr': 0.0004982739686209319, 'samples': 1447680, 'steps': 7539, 'loss/train': 1.8464691638946533} -08/30/2021 14:31:50 - INFO - __main__ - Step 7541: {'lr': 0.0004982733460546138, 'samples': 1447872, 'steps': 7540, 'loss/train': 1.8391351699829102} -08/30/2021 14:31:50 - INFO - __main__ - Step 7542: {'lr': 0.0004982727233764276, 'samples': 1448064, 'steps': 7541, 'loss/train': 1.9969525337219238} -08/30/2021 14:31:52 - INFO - __main__ - Step 7543: {'lr': 0.0004982721005863734, 'samples': 1448256, 'steps': 7542, 'loss/train': 1.9569755792617798} -08/30/2021 14:31:52 - INFO - __main__ - Step 7544: {'lr': 0.0004982714776844518, 'samples': 1448448, 'steps': 7543, 'loss/train': 2.4319441318511963} -08/30/2021 14:31:52 - INFO - __main__ - Step 7545: {'lr': 0.0004982708546706628, 'samples': 1448640, 'steps': 7544, 'loss/train': 1.3967210054397583} -08/30/2021 14:31:53 - INFO - __main__ - Step 7546: {'lr': 0.0004982702315450068, 'samples': 1448832, 'steps': 7545, 'loss/train': 1.4815490245819092} -08/30/2021 14:31:53 - INFO - __main__ - Step 7547: {'lr': 0.0004982696083074841, 'samples': 1449024, 'steps': 7546, 'loss/train': 2.012848377227783} -08/30/2021 14:31:55 - INFO - __main__ - Step 7548: {'lr': 0.0004982689849580951, 'samples': 1449216, 'steps': 7547, 'loss/train': 0.8206766247749329} -08/30/2021 14:31:55 - INFO - __main__ - Step 7549: {'lr': 0.0004982683614968396, 'samples': 1449408, 'steps': 7548, 'loss/train': 2.089946985244751} -08/30/2021 14:31:55 - INFO - __main__ - Step 7550: {'lr': 0.0004982677379237185, 'samples': 1449600, 'steps': 7549, 'loss/train': 2.0351805686950684} -08/30/2021 14:31:56 - INFO - __main__ - Step 7551: {'lr': 0.0004982671142387316, 'samples': 1449792, 'steps': 7550, 'loss/train': 1.9914253950119019} -08/30/2021 14:31:56 - INFO - __main__ - Step 7552: {'lr': 0.0004982664904418794, 'samples': 1449984, 'steps': 7551, 'loss/train': 2.4036357402801514} -08/30/2021 14:31:56 - INFO - __main__ - Step 7553: {'lr': 0.0004982658665331622, 'samples': 1450176, 'steps': 7552, 'loss/train': 2.1153810024261475} -08/30/2021 14:31:58 - INFO - __main__ - Step 7554: {'lr': 0.0004982652425125802, 'samples': 1450368, 'steps': 7553, 'loss/train': 2.22267746925354} -08/30/2021 14:31:59 - INFO - __main__ - Step 7555: {'lr': 0.0004982646183801337, 'samples': 1450560, 'steps': 7554, 'loss/train': 1.5154162645339966} -08/30/2021 14:31:59 - INFO - __main__ - Step 7556: {'lr': 0.000498263994135823, 'samples': 1450752, 'steps': 7555, 'loss/train': 2.205740213394165} -08/30/2021 14:31:59 - INFO - __main__ - Step 7557: {'lr': 0.0004982633697796484, 'samples': 1450944, 'steps': 7556, 'loss/train': 2.1476902961730957} -08/30/2021 14:32:00 - INFO - __main__ - Step 7558: {'lr': 0.0004982627453116102, 'samples': 1451136, 'steps': 7557, 'loss/train': 2.2479989528656006} -08/30/2021 14:32:01 - INFO - __main__ - Step 7559: {'lr': 0.0004982621207317086, 'samples': 1451328, 'steps': 7558, 'loss/train': 1.9805433750152588} -08/30/2021 14:32:02 - INFO - __main__ - Step 7560: {'lr': 0.0004982614960399439, 'samples': 1451520, 'steps': 7559, 'loss/train': 2.081728219985962} -08/30/2021 14:32:02 - INFO - __main__ - Step 7561: {'lr': 0.0004982608712363163, 'samples': 1451712, 'steps': 7560, 'loss/train': 2.3973753452301025} -08/30/2021 14:32:02 - INFO - __main__ - Step 7562: {'lr': 0.0004982602463208263, 'samples': 1451904, 'steps': 7561, 'loss/train': 1.589126706123352} -08/30/2021 14:32:03 - INFO - __main__ - Step 7563: {'lr': 0.0004982596212934742, 'samples': 1452096, 'steps': 7562, 'loss/train': 2.282374143600464} -08/30/2021 14:32:04 - INFO - __main__ - Step 7564: {'lr': 0.00049825899615426, 'samples': 1452288, 'steps': 7563, 'loss/train': 1.7362415790557861} -08/30/2021 14:32:05 - INFO - __main__ - Step 7565: {'lr': 0.000498258370903184, 'samples': 1452480, 'steps': 7564, 'loss/train': 1.7438775300979614} -08/30/2021 14:32:05 - INFO - __main__ - Step 7566: {'lr': 0.0004982577455402467, 'samples': 1452672, 'steps': 7565, 'loss/train': 2.1081855297088623} -08/30/2021 14:32:05 - INFO - __main__ - Step 7567: {'lr': 0.0004982571200654485, 'samples': 1452864, 'steps': 7566, 'loss/train': 2.0620479583740234} -08/30/2021 14:32:06 - INFO - __main__ - Step 7568: {'lr': 0.0004982564944787892, 'samples': 1453056, 'steps': 7567, 'loss/train': 0.9706790447235107} -08/30/2021 14:32:06 - INFO - __main__ - Step 7569: {'lr': 0.0004982558687802695, 'samples': 1453248, 'steps': 7568, 'loss/train': 2.075424909591675} -08/30/2021 14:32:08 - INFO - __main__ - Step 7570: {'lr': 0.0004982552429698894, 'samples': 1453440, 'steps': 7569, 'loss/train': 2.015124559402466} -08/30/2021 14:32:08 - INFO - __main__ - Step 7571: {'lr': 0.0004982546170476494, 'samples': 1453632, 'steps': 7570, 'loss/train': 2.06308913230896} -08/30/2021 14:32:08 - INFO - __main__ - Step 7572: {'lr': 0.0004982539910135497, 'samples': 1453824, 'steps': 7571, 'loss/train': 2.22385835647583} -08/30/2021 14:32:09 - INFO - __main__ - Step 7573: {'lr': 0.0004982533648675906, 'samples': 1454016, 'steps': 7572, 'loss/train': 1.735123872756958} -08/30/2021 14:32:09 - INFO - __main__ - Step 7574: {'lr': 0.0004982527386097723, 'samples': 1454208, 'steps': 7573, 'loss/train': 1.3776600360870361} -08/30/2021 14:32:10 - INFO - __main__ - Step 7575: {'lr': 0.0004982521122400953, 'samples': 1454400, 'steps': 7574, 'loss/train': 2.298922300338745} -08/30/2021 14:32:11 - INFO - __main__ - Step 7576: {'lr': 0.0004982514857585596, 'samples': 1454592, 'steps': 7575, 'loss/train': 1.628009557723999} -08/30/2021 14:32:11 - INFO - __main__ - Step 7577: {'lr': 0.0004982508591651657, 'samples': 1454784, 'steps': 7576, 'loss/train': 1.6538323163986206} -08/30/2021 14:32:12 - INFO - __main__ - Step 7578: {'lr': 0.0004982502324599137, 'samples': 1454976, 'steps': 7577, 'loss/train': 1.6575632095336914} -08/30/2021 14:32:12 - INFO - __main__ - Step 7579: {'lr': 0.000498249605642804, 'samples': 1455168, 'steps': 7578, 'loss/train': 2.3769774436950684} -08/30/2021 14:32:13 - INFO - __main__ - Step 7580: {'lr': 0.0004982489787138369, 'samples': 1455360, 'steps': 7579, 'loss/train': 1.8219870328903198} -08/30/2021 14:32:14 - INFO - __main__ - Step 7581: {'lr': 0.0004982483516730126, 'samples': 1455552, 'steps': 7580, 'loss/train': 2.2146756649017334} -08/30/2021 14:32:14 - INFO - __main__ - Step 7582: {'lr': 0.0004982477245203314, 'samples': 1455744, 'steps': 7581, 'loss/train': 1.9243416786193848} -08/30/2021 14:32:15 - INFO - __main__ - Step 7583: {'lr': 0.0004982470972557936, 'samples': 1455936, 'steps': 7582, 'loss/train': 1.8740180730819702} -08/30/2021 14:32:15 - INFO - __main__ - Step 7584: {'lr': 0.0004982464698793995, 'samples': 1456128, 'steps': 7583, 'loss/train': 2.0148367881774902} -08/30/2021 14:32:17 - INFO - __main__ - Step 7585: {'lr': 0.0004982458423911495, 'samples': 1456320, 'steps': 7584, 'loss/train': 2.3391404151916504} -08/30/2021 14:32:18 - INFO - __main__ - Step 7586: {'lr': 0.0004982452147910437, 'samples': 1456512, 'steps': 7585, 'loss/train': 0.4455569088459015} -08/30/2021 14:32:18 - INFO - __main__ - Step 7587: {'lr': 0.0004982445870790823, 'samples': 1456704, 'steps': 7586, 'loss/train': 1.9164934158325195} -08/30/2021 14:32:18 - INFO - __main__ - Step 7588: {'lr': 0.0004982439592552658, 'samples': 1456896, 'steps': 7587, 'loss/train': 1.9756067991256714} -08/30/2021 14:32:19 - INFO - __main__ - Step 7589: {'lr': 0.0004982433313195945, 'samples': 1457088, 'steps': 7588, 'loss/train': 2.1519882678985596} -08/30/2021 14:32:21 - INFO - __main__ - Step 7590: {'lr': 0.0004982427032720685, 'samples': 1457280, 'steps': 7589, 'loss/train': 1.8529356718063354} -08/30/2021 14:32:21 - INFO - __main__ - Step 7591: {'lr': 0.0004982420751126882, 'samples': 1457472, 'steps': 7590, 'loss/train': 2.0144546031951904} -08/30/2021 14:32:22 - INFO - __main__ - Step 7592: {'lr': 0.0004982414468414538, 'samples': 1457664, 'steps': 7591, 'loss/train': 2.052746057510376} -08/30/2021 14:32:22 - INFO - __main__ - Step 7593: {'lr': 0.0004982408184583656, 'samples': 1457856, 'steps': 7592, 'loss/train': 1.869333267211914} -08/30/2021 14:32:22 - INFO - __main__ - Step 7594: {'lr': 0.000498240189963424, 'samples': 1458048, 'steps': 7593, 'loss/train': 0.4741004407405853} -08/30/2021 14:32:23 - INFO - __main__ - Step 7595: {'lr': 0.0004982395613566291, 'samples': 1458240, 'steps': 7594, 'loss/train': 0.48749151825904846} -08/30/2021 14:32:23 - INFO - __main__ - Step 7596: {'lr': 0.0004982389326379814, 'samples': 1458432, 'steps': 7595, 'loss/train': 1.4670989513397217} -08/30/2021 14:32:24 - INFO - __main__ - Step 7597: {'lr': 0.000498238303807481, 'samples': 1458624, 'steps': 7596, 'loss/train': 1.3657543659210205} -08/30/2021 14:32:25 - INFO - __main__ - Step 7598: {'lr': 0.0004982376748651283, 'samples': 1458816, 'steps': 7597, 'loss/train': 1.751383662223816} -08/30/2021 14:32:25 - INFO - __main__ - Step 7599: {'lr': 0.0004982370458109235, 'samples': 1459008, 'steps': 7598, 'loss/train': 2.3496954441070557} -08/30/2021 14:32:26 - INFO - __main__ - Step 7600: {'lr': 0.0004982364166448669, 'samples': 1459200, 'steps': 7599, 'loss/train': 1.9759198427200317} -08/30/2021 14:32:26 - INFO - __main__ - Step 7601: {'lr': 0.0004982357873669588, 'samples': 1459392, 'steps': 7600, 'loss/train': 2.449190378189087} -08/30/2021 14:32:28 - INFO - __main__ - Step 7602: {'lr': 0.0004982351579771995, 'samples': 1459584, 'steps': 7601, 'loss/train': 2.4566941261291504} -08/30/2021 14:32:29 - INFO - __main__ - Step 7603: {'lr': 0.0004982345284755893, 'samples': 1459776, 'steps': 7602, 'loss/train': 1.5778398513793945} -08/30/2021 14:32:29 - INFO - __main__ - Step 7604: {'lr': 0.0004982338988621284, 'samples': 1459968, 'steps': 7603, 'loss/train': 0.2906356453895569} -08/30/2021 14:32:29 - INFO - __main__ - Step 7605: {'lr': 0.0004982332691368172, 'samples': 1460160, 'steps': 7604, 'loss/train': 1.720291018486023} -08/30/2021 14:32:30 - INFO - __main__ - Step 7606: {'lr': 0.0004982326392996559, 'samples': 1460352, 'steps': 7605, 'loss/train': 1.7239372730255127} -08/30/2021 14:32:31 - INFO - __main__ - Step 7607: {'lr': 0.0004982320093506449, 'samples': 1460544, 'steps': 7606, 'loss/train': 1.5500638484954834} -08/30/2021 14:32:32 - INFO - __main__ - Step 7608: {'lr': 0.0004982313792897843, 'samples': 1460736, 'steps': 7607, 'loss/train': 2.3881630897521973} -08/30/2021 14:32:32 - INFO - __main__ - Step 7609: {'lr': 0.0004982307491170744, 'samples': 1460928, 'steps': 7608, 'loss/train': 1.9098057746887207} -08/30/2021 14:32:32 - INFO - __main__ - Step 7610: {'lr': 0.0004982301188325156, 'samples': 1461120, 'steps': 7609, 'loss/train': 2.543076515197754} -08/30/2021 14:32:33 - INFO - __main__ - Step 7611: {'lr': 0.0004982294884361081, 'samples': 1461312, 'steps': 7610, 'loss/train': 1.7057809829711914} -08/30/2021 14:32:34 - INFO - __main__ - Step 7612: {'lr': 0.0004982288579278522, 'samples': 1461504, 'steps': 7611, 'loss/train': 1.8376268148422241} -08/30/2021 14:32:35 - INFO - __main__ - Step 7613: {'lr': 0.0004982282273077483, 'samples': 1461696, 'steps': 7612, 'loss/train': 1.9261051416397095} -08/30/2021 14:32:35 - INFO - __main__ - Step 7614: {'lr': 0.0004982275965757965, 'samples': 1461888, 'steps': 7613, 'loss/train': 1.7783925533294678} -08/30/2021 14:32:35 - INFO - __main__ - Step 7615: {'lr': 0.0004982269657319974, 'samples': 1462080, 'steps': 7614, 'loss/train': 2.282299757003784} -08/30/2021 14:32:36 - INFO - __main__ - Step 7616: {'lr': 0.0004982263347763508, 'samples': 1462272, 'steps': 7615, 'loss/train': 1.796460509300232} -08/30/2021 14:32:36 - INFO - __main__ - Step 7617: {'lr': 0.0004982257037088574, 'samples': 1462464, 'steps': 7616, 'loss/train': 1.541679859161377} -08/30/2021 14:32:37 - INFO - __main__ - Step 7618: {'lr': 0.0004982250725295173, 'samples': 1462656, 'steps': 7617, 'loss/train': 1.7694965600967407} -08/30/2021 14:32:38 - INFO - __main__ - Step 7619: {'lr': 0.0004982244412383307, 'samples': 1462848, 'steps': 7618, 'loss/train': 1.8106591701507568} -08/30/2021 14:32:38 - INFO - __main__ - Step 7620: {'lr': 0.0004982238098352981, 'samples': 1463040, 'steps': 7619, 'loss/train': 2.0153603553771973} -08/30/2021 14:32:39 - INFO - __main__ - Step 7621: {'lr': 0.0004982231783204196, 'samples': 1463232, 'steps': 7620, 'loss/train': 2.341870069503784} -08/30/2021 14:32:39 - INFO - __main__ - Step 7622: {'lr': 0.0004982225466936957, 'samples': 1463424, 'steps': 7621, 'loss/train': 1.6655136346817017} -08/30/2021 14:32:40 - INFO - __main__ - Step 7623: {'lr': 0.0004982219149551265, 'samples': 1463616, 'steps': 7622, 'loss/train': 1.1686482429504395} -08/30/2021 14:32:41 - INFO - __main__ - Step 7624: {'lr': 0.0004982212831047123, 'samples': 1463808, 'steps': 7623, 'loss/train': 1.8940069675445557} -08/30/2021 14:32:41 - INFO - __main__ - Step 7625: {'lr': 0.0004982206511424534, 'samples': 1464000, 'steps': 7624, 'loss/train': 2.999492883682251} -08/30/2021 14:32:42 - INFO - __main__ - Step 7626: {'lr': 0.0004982200190683502, 'samples': 1464192, 'steps': 7625, 'loss/train': 1.9776214361190796} -08/30/2021 14:32:42 - INFO - __main__ - Step 7627: {'lr': 0.0004982193868824028, 'samples': 1464384, 'steps': 7626, 'loss/train': 2.043475389480591} -08/30/2021 14:32:44 - INFO - __main__ - Step 7628: {'lr': 0.0004982187545846116, 'samples': 1464576, 'steps': 7627, 'loss/train': 1.5122380256652832} -08/30/2021 14:32:44 - INFO - __main__ - Step 7629: {'lr': 0.0004982181221749769, 'samples': 1464768, 'steps': 7628, 'loss/train': 2.130232810974121} -08/30/2021 14:32:44 - INFO - __main__ - Step 7630: {'lr': 0.0004982174896534989, 'samples': 1464960, 'steps': 7629, 'loss/train': 2.17044734954834} -08/30/2021 14:32:45 - INFO - __main__ - Step 7631: {'lr': 0.0004982168570201779, 'samples': 1465152, 'steps': 7630, 'loss/train': 2.147237539291382} -08/30/2021 14:32:45 - INFO - __main__ - Step 7632: {'lr': 0.0004982162242750143, 'samples': 1465344, 'steps': 7631, 'loss/train': 1.9035475254058838} -08/30/2021 14:32:47 - INFO - __main__ - Step 7633: {'lr': 0.0004982155914180082, 'samples': 1465536, 'steps': 7632, 'loss/train': 2.0401601791381836} -08/30/2021 14:32:47 - INFO - __main__ - Step 7634: {'lr': 0.0004982149584491601, 'samples': 1465728, 'steps': 7633, 'loss/train': 2.2002885341644287} -08/30/2021 14:32:48 - INFO - __main__ - Step 7635: {'lr': 0.0004982143253684701, 'samples': 1465920, 'steps': 7634, 'loss/train': 2.4061896800994873} -08/30/2021 14:32:48 - INFO - __main__ - Step 7636: {'lr': 0.0004982136921759385, 'samples': 1466112, 'steps': 7635, 'loss/train': 2.3751139640808105} -08/30/2021 14:32:48 - INFO - __main__ - Step 7637: {'lr': 0.0004982130588715657, 'samples': 1466304, 'steps': 7636, 'loss/train': 1.6981489658355713} -08/30/2021 14:32:49 - INFO - __main__ - Step 7638: {'lr': 0.000498212425455352, 'samples': 1466496, 'steps': 7637, 'loss/train': 0.2940669059753418} -08/30/2021 14:32:50 - INFO - __main__ - Step 7639: {'lr': 0.0004982117919272975, 'samples': 1466688, 'steps': 7638, 'loss/train': 1.4565587043762207} -08/30/2021 14:32:51 - INFO - __main__ - Step 7640: {'lr': 0.0004982111582874026, 'samples': 1466880, 'steps': 7639, 'loss/train': 2.233288049697876} -08/30/2021 14:32:51 - INFO - __main__ - Step 7641: {'lr': 0.0004982105245356676, 'samples': 1467072, 'steps': 7640, 'loss/train': 2.2874677181243896} -08/30/2021 14:32:51 - INFO - __main__ - Step 7642: {'lr': 0.0004982098906720928, 'samples': 1467264, 'steps': 7641, 'loss/train': 2.661987781524658} -08/30/2021 14:32:52 - INFO - __main__ - Step 7643: {'lr': 0.0004982092566966785, 'samples': 1467456, 'steps': 7642, 'loss/train': 1.7330474853515625} -08/30/2021 14:32:54 - INFO - __main__ - Step 7644: {'lr': 0.0004982086226094248, 'samples': 1467648, 'steps': 7643, 'loss/train': 1.758739709854126} -08/30/2021 14:32:54 - INFO - __main__ - Step 7645: {'lr': 0.0004982079884103322, 'samples': 1467840, 'steps': 7644, 'loss/train': 1.550981044769287} -08/30/2021 14:32:55 - INFO - __main__ - Step 7646: {'lr': 0.0004982073540994009, 'samples': 1468032, 'steps': 7645, 'loss/train': 1.6437125205993652} -08/30/2021 14:32:55 - INFO - __main__ - Step 7647: {'lr': 0.0004982067196766312, 'samples': 1468224, 'steps': 7646, 'loss/train': 1.827168583869934} -08/30/2021 14:32:55 - INFO - __main__ - Step 7648: {'lr': 0.0004982060851420235, 'samples': 1468416, 'steps': 7647, 'loss/train': 1.9852111339569092} -08/30/2021 14:32:57 - INFO - __main__ - Step 7649: {'lr': 0.0004982054504955778, 'samples': 1468608, 'steps': 7648, 'loss/train': 1.8847118616104126} -08/30/2021 14:32:57 - INFO - __main__ - Step 7650: {'lr': 0.0004982048157372946, 'samples': 1468800, 'steps': 7649, 'loss/train': 1.9492592811584473} -08/30/2021 14:32:58 - INFO - __main__ - Step 7651: {'lr': 0.0004982041808671741, 'samples': 1468992, 'steps': 7650, 'loss/train': 1.8398195505142212} -08/30/2021 14:32:58 - INFO - __main__ - Step 7652: {'lr': 0.0004982035458852168, 'samples': 1469184, 'steps': 7651, 'loss/train': 1.9448692798614502} -08/30/2021 14:32:58 - INFO - __main__ - Step 7653: {'lr': 0.0004982029107914226, 'samples': 1469376, 'steps': 7652, 'loss/train': 1.842936396598816} -08/30/2021 14:32:59 - INFO - __main__ - Step 7654: {'lr': 0.0004982022755857921, 'samples': 1469568, 'steps': 7653, 'loss/train': 2.1686980724334717} -08/30/2021 14:33:00 - INFO - __main__ - Step 7655: {'lr': 0.0004982016402683255, 'samples': 1469760, 'steps': 7654, 'loss/train': 3.0476479530334473} -08/30/2021 14:33:01 - INFO - __main__ - Step 7656: {'lr': 0.000498201004839023, 'samples': 1469952, 'steps': 7655, 'loss/train': 1.9071561098098755} -08/30/2021 14:33:01 - INFO - __main__ - Step 7657: {'lr': 0.000498200369297885, 'samples': 1470144, 'steps': 7656, 'loss/train': 1.9576544761657715} -08/30/2021 14:33:02 - INFO - __main__ - Step 7658: {'lr': 0.0004981997336449118, 'samples': 1470336, 'steps': 7657, 'loss/train': 2.221675157546997} -08/30/2021 14:33:02 - INFO - __main__ - Step 7659: {'lr': 0.0004981990978801035, 'samples': 1470528, 'steps': 7658, 'loss/train': 0.7236251831054688} -08/30/2021 14:33:04 - INFO - __main__ - Step 7660: {'lr': 0.0004981984620034606, 'samples': 1470720, 'steps': 7659, 'loss/train': 1.8968356847763062} -08/30/2021 14:33:04 - INFO - __main__ - Step 7661: {'lr': 0.0004981978260149833, 'samples': 1470912, 'steps': 7660, 'loss/train': 2.056927442550659} -08/30/2021 14:33:04 - INFO - __main__ - Step 7662: {'lr': 0.0004981971899146719, 'samples': 1471104, 'steps': 7661, 'loss/train': 1.60395348072052} -08/30/2021 14:33:05 - INFO - __main__ - Step 7663: {'lr': 0.0004981965537025267, 'samples': 1471296, 'steps': 7662, 'loss/train': 2.0221469402313232} -08/30/2021 14:33:05 - INFO - __main__ - Step 7664: {'lr': 0.000498195917378548, 'samples': 1471488, 'steps': 7663, 'loss/train': 1.7255994081497192} -08/30/2021 14:33:07 - INFO - __main__ - Step 7665: {'lr': 0.0004981952809427359, 'samples': 1471680, 'steps': 7664, 'loss/train': 2.2085747718811035} -08/30/2021 14:33:07 - INFO - __main__ - Step 7666: {'lr': 0.0004981946443950909, 'samples': 1471872, 'steps': 7665, 'loss/train': 1.760868787765503} -08/30/2021 14:33:08 - INFO - __main__ - Step 7667: {'lr': 0.0004981940077356132, 'samples': 1472064, 'steps': 7666, 'loss/train': 1.9882076978683472} -08/30/2021 14:33:08 - INFO - __main__ - Step 7668: {'lr': 0.0004981933709643032, 'samples': 1472256, 'steps': 7667, 'loss/train': 2.031376361846924} -08/30/2021 14:33:08 - INFO - __main__ - Step 7669: {'lr': 0.000498192734081161, 'samples': 1472448, 'steps': 7668, 'loss/train': 1.1171282529830933} -08/30/2021 14:33:10 - INFO - __main__ - Step 7670: {'lr': 0.000498192097086187, 'samples': 1472640, 'steps': 7669, 'loss/train': 0.3261836767196655} -08/30/2021 14:33:10 - INFO - __main__ - Step 7671: {'lr': 0.0004981914599793816, 'samples': 1472832, 'steps': 7670, 'loss/train': 2.1289432048797607} -08/30/2021 14:33:11 - INFO - __main__ - Step 7672: {'lr': 0.0004981908227607448, 'samples': 1473024, 'steps': 7671, 'loss/train': 1.897096872329712} -08/30/2021 14:33:11 - INFO - __main__ - Step 7673: {'lr': 0.0004981901854302771, 'samples': 1473216, 'steps': 7672, 'loss/train': 2.2631258964538574} -08/30/2021 14:33:11 - INFO - __main__ - Step 7674: {'lr': 0.0004981895479879787, 'samples': 1473408, 'steps': 7673, 'loss/train': 0.18086963891983032} -08/30/2021 14:33:13 - INFO - __main__ - Step 7675: {'lr': 0.0004981889104338499, 'samples': 1473600, 'steps': 7674, 'loss/train': 1.6707899570465088} -08/30/2021 14:33:13 - INFO - __main__ - Step 7676: {'lr': 0.0004981882727678912, 'samples': 1473792, 'steps': 7675, 'loss/train': 1.721340537071228} -08/30/2021 14:33:14 - INFO - __main__ - Step 7677: {'lr': 0.0004981876349901025, 'samples': 1473984, 'steps': 7676, 'loss/train': 2.6755495071411133} -08/30/2021 14:33:14 - INFO - __main__ - Step 7678: {'lr': 0.0004981869971004843, 'samples': 1474176, 'steps': 7677, 'loss/train': 2.2184014320373535} -08/30/2021 14:33:14 - INFO - __main__ - Step 7679: {'lr': 0.0004981863590990369, 'samples': 1474368, 'steps': 7678, 'loss/train': 2.0429258346557617} -08/30/2021 14:33:16 - INFO - __main__ - Step 7680: {'lr': 0.0004981857209857605, 'samples': 1474560, 'steps': 7679, 'loss/train': 2.1642518043518066} -08/30/2021 14:33:16 - INFO - __main__ - Step 7681: {'lr': 0.0004981850827606556, 'samples': 1474752, 'steps': 7680, 'loss/train': 2.048515558242798} -08/30/2021 14:33:17 - INFO - __main__ - Step 7682: {'lr': 0.0004981844444237223, 'samples': 1474944, 'steps': 7681, 'loss/train': 1.869009256362915} -08/30/2021 14:33:17 - INFO - __main__ - Step 7683: {'lr': 0.0004981838059749607, 'samples': 1475136, 'steps': 7682, 'loss/train': 1.895453929901123} -08/30/2021 14:33:17 - INFO - __main__ - Step 7684: {'lr': 0.0004981831674143716, 'samples': 1475328, 'steps': 7683, 'loss/train': 5.6247382164001465} -08/30/2021 14:33:19 - INFO - __main__ - Step 7685: {'lr': 0.0004981825287419549, 'samples': 1475520, 'steps': 7684, 'loss/train': 2.1324689388275146} -08/30/2021 14:33:20 - INFO - __main__ - Step 7686: {'lr': 0.0004981818899577108, 'samples': 1475712, 'steps': 7685, 'loss/train': 0.21272243559360504} -08/30/2021 14:33:20 - INFO - __main__ - Step 7687: {'lr': 0.0004981812510616399, 'samples': 1475904, 'steps': 7686, 'loss/train': 1.6858524084091187} -08/30/2021 14:33:20 - INFO - __main__ - Step 7688: {'lr': 0.0004981806120537424, 'samples': 1476096, 'steps': 7687, 'loss/train': 1.5783642530441284} -08/30/2021 14:33:21 - INFO - __main__ - Step 7689: {'lr': 0.0004981799729340185, 'samples': 1476288, 'steps': 7688, 'loss/train': 1.5531423091888428} -08/30/2021 14:33:22 - INFO - __main__ - Step 7690: {'lr': 0.0004981793337024685, 'samples': 1476480, 'steps': 7689, 'loss/train': 2.4547955989837646} -08/30/2021 14:33:23 - INFO - __main__ - Step 7691: {'lr': 0.0004981786943590928, 'samples': 1476672, 'steps': 7690, 'loss/train': 1.785744547843933} -08/30/2021 14:33:23 - INFO - __main__ - Step 7692: {'lr': 0.0004981780549038916, 'samples': 1476864, 'steps': 7691, 'loss/train': 1.6092928647994995} -08/30/2021 14:33:23 - INFO - __main__ - Step 7693: {'lr': 0.0004981774153368651, 'samples': 1477056, 'steps': 7692, 'loss/train': 1.8361210823059082} -08/30/2021 14:33:24 - INFO - __main__ - Step 7694: {'lr': 0.0004981767756580138, 'samples': 1477248, 'steps': 7693, 'loss/train': 2.2799594402313232} -08/30/2021 14:33:24 - INFO - __main__ - Step 7695: {'lr': 0.0004981761358673378, 'samples': 1477440, 'steps': 7694, 'loss/train': 4.373284339904785} -08/30/2021 14:33:27 - INFO - __main__ - Step 7696: {'lr': 0.0004981754959648376, 'samples': 1477632, 'steps': 7695, 'loss/train': 1.950577735900879} -08/30/2021 14:33:27 - INFO - __main__ - Step 7697: {'lr': 0.0004981748559505131, 'samples': 1477824, 'steps': 7696, 'loss/train': 2.0849568843841553} -08/30/2021 14:33:27 - INFO - __main__ - Step 7698: {'lr': 0.0004981742158243651, 'samples': 1478016, 'steps': 7697, 'loss/train': 1.7016234397888184} -08/30/2021 14:33:28 - INFO - __main__ - Step 7699: {'lr': 0.0004981735755863934, 'samples': 1478208, 'steps': 7698, 'loss/train': 3.159191846847534} -08/30/2021 14:33:28 - INFO - __main__ - Step 7700: {'lr': 0.0004981729352365986, 'samples': 1478400, 'steps': 7699, 'loss/train': 3.891718626022339} -08/30/2021 14:33:29 - INFO - __main__ - Step 7701: {'lr': 0.0004981722947749811, 'samples': 1478592, 'steps': 7700, 'loss/train': 2.0479910373687744} -08/30/2021 14:33:30 - INFO - __main__ - Step 7702: {'lr': 0.0004981716542015408, 'samples': 1478784, 'steps': 7701, 'loss/train': 1.7043089866638184} -08/30/2021 14:33:30 - INFO - __main__ - Step 7703: {'lr': 0.0004981710135162781, 'samples': 1478976, 'steps': 7702, 'loss/train': 2.0409011840820312} -08/30/2021 14:33:31 - INFO - __main__ - Step 7704: {'lr': 0.0004981703727191935, 'samples': 1479168, 'steps': 7703, 'loss/train': 1.478135585784912} -08/30/2021 14:33:31 - INFO - __main__ - Step 7705: {'lr': 0.0004981697318102872, 'samples': 1479360, 'steps': 7704, 'loss/train': 1.5815083980560303} -08/30/2021 14:33:31 - INFO - __main__ - Step 7706: {'lr': 0.0004981690907895594, 'samples': 1479552, 'steps': 7705, 'loss/train': 1.8284897804260254} -08/30/2021 14:33:33 - INFO - __main__ - Step 7707: {'lr': 0.0004981684496570104, 'samples': 1479744, 'steps': 7706, 'loss/train': 1.9333336353302002} -08/30/2021 14:33:34 - INFO - __main__ - Step 7708: {'lr': 0.0004981678084126405, 'samples': 1479936, 'steps': 7707, 'loss/train': 2.1768548488616943} -08/30/2021 14:33:34 - INFO - __main__ - Step 7709: {'lr': 0.0004981671670564502, 'samples': 1480128, 'steps': 7708, 'loss/train': 2.0018832683563232} -08/30/2021 14:33:34 - INFO - __main__ - Step 7710: {'lr': 0.0004981665255884394, 'samples': 1480320, 'steps': 7709, 'loss/train': 1.8176385164260864} -08/30/2021 14:33:35 - INFO - __main__ - Step 7711: {'lr': 0.0004981658840086087, 'samples': 1480512, 'steps': 7710, 'loss/train': 2.4641194343566895} -08/30/2021 14:33:37 - INFO - __main__ - Step 7712: {'lr': 0.0004981652423169582, 'samples': 1480704, 'steps': 7711, 'loss/train': 2.517939805984497} -08/30/2021 14:33:37 - INFO - __main__ - Step 7713: {'lr': 0.0004981646005134884, 'samples': 1480896, 'steps': 7712, 'loss/train': 1.9476361274719238} -08/30/2021 14:33:38 - INFO - __main__ - Step 7714: {'lr': 0.0004981639585981993, 'samples': 1481088, 'steps': 7713, 'loss/train': 1.4016057252883911} -08/30/2021 14:33:38 - INFO - __main__ - Step 7715: {'lr': 0.0004981633165710914, 'samples': 1481280, 'steps': 7714, 'loss/train': 2.2590274810791016} -08/30/2021 14:33:38 - INFO - __main__ - Step 7716: {'lr': 0.000498162674432165, 'samples': 1481472, 'steps': 7715, 'loss/train': 1.2550439834594727} -08/30/2021 14:33:39 - INFO - __main__ - Step 7717: {'lr': 0.0004981620321814203, 'samples': 1481664, 'steps': 7716, 'loss/train': 1.630491852760315} -08/30/2021 14:33:40 - INFO - __main__ - Step 7718: {'lr': 0.0004981613898188576, 'samples': 1481856, 'steps': 7717, 'loss/train': 0.3752845227718353} -08/30/2021 14:33:41 - INFO - __main__ - Step 7719: {'lr': 0.0004981607473444772, 'samples': 1482048, 'steps': 7718, 'loss/train': 2.00740385055542} -08/30/2021 14:33:41 - INFO - __main__ - Step 7720: {'lr': 0.0004981601047582794, 'samples': 1482240, 'steps': 7719, 'loss/train': 1.7867883443832397} -08/30/2021 14:33:41 - INFO - __main__ - Step 7721: {'lr': 0.0004981594620602645, 'samples': 1482432, 'steps': 7720, 'loss/train': 1.9333055019378662} -08/30/2021 14:33:42 - INFO - __main__ - Step 7722: {'lr': 0.0004981588192504329, 'samples': 1482624, 'steps': 7721, 'loss/train': 2.3572096824645996} -08/30/2021 14:33:42 - INFO - __main__ - Step 7723: {'lr': 0.0004981581763287845, 'samples': 1482816, 'steps': 7722, 'loss/train': 2.277782440185547} -08/30/2021 14:33:44 - INFO - __main__ - Step 7724: {'lr': 0.0004981575332953201, 'samples': 1483008, 'steps': 7723, 'loss/train': 2.4683494567871094} -08/30/2021 14:33:44 - INFO - __main__ - Step 7725: {'lr': 0.0004981568901500396, 'samples': 1483200, 'steps': 7724, 'loss/train': 1.2349966764450073} -08/30/2021 14:33:44 - INFO - __main__ - Step 7726: {'lr': 0.0004981562468929435, 'samples': 1483392, 'steps': 7725, 'loss/train': 2.003632068634033} -08/30/2021 14:33:45 - INFO - __main__ - Step 7727: {'lr': 0.000498155603524032, 'samples': 1483584, 'steps': 7726, 'loss/train': 2.1388509273529053} -08/30/2021 14:33:45 - INFO - __main__ - Step 7728: {'lr': 0.0004981549600433054, 'samples': 1483776, 'steps': 7727, 'loss/train': 2.016356945037842} -08/30/2021 14:33:46 - INFO - __main__ - Step 7729: {'lr': 0.000498154316450764, 'samples': 1483968, 'steps': 7728, 'loss/train': 1.7072561979293823} -08/30/2021 14:33:47 - INFO - __main__ - Step 7730: {'lr': 0.0004981536727464082, 'samples': 1484160, 'steps': 7729, 'loss/train': 2.40846586227417} -08/30/2021 14:33:47 - INFO - __main__ - Step 7731: {'lr': 0.0004981530289302381, 'samples': 1484352, 'steps': 7730, 'loss/train': 2.1133437156677246} -08/30/2021 14:33:48 - INFO - __main__ - Step 7732: {'lr': 0.000498152385002254, 'samples': 1484544, 'steps': 7731, 'loss/train': 2.262312889099121} -08/30/2021 14:33:48 - INFO - __main__ - Step 7733: {'lr': 0.0004981517409624564, 'samples': 1484736, 'steps': 7732, 'loss/train': 2.06803822517395} -08/30/2021 14:33:49 - INFO - __main__ - Step 7734: {'lr': 0.0004981510968108453, 'samples': 1484928, 'steps': 7733, 'loss/train': 1.520646572113037} -08/30/2021 14:33:50 - INFO - __main__ - Step 7735: {'lr': 0.0004981504525474214, 'samples': 1485120, 'steps': 7734, 'loss/train': 2.074373245239258} -08/30/2021 14:33:50 - INFO - __main__ - Step 7736: {'lr': 0.0004981498081721845, 'samples': 1485312, 'steps': 7735, 'loss/train': 1.8635661602020264} -08/30/2021 14:33:51 - INFO - __main__ - Step 7737: {'lr': 0.0004981491636851351, 'samples': 1485504, 'steps': 7736, 'loss/train': 1.557376742362976} -08/30/2021 14:33:51 - INFO - __main__ - Step 7738: {'lr': 0.0004981485190862737, 'samples': 1485696, 'steps': 7737, 'loss/train': 1.9101672172546387} -08/30/2021 14:33:52 - INFO - __main__ - Step 7739: {'lr': 0.0004981478743756004, 'samples': 1485888, 'steps': 7738, 'loss/train': 2.0683064460754395} -08/30/2021 14:33:53 - INFO - __main__ - Step 7740: {'lr': 0.0004981472295531153, 'samples': 1486080, 'steps': 7739, 'loss/train': 2.0462048053741455} -08/30/2021 14:33:53 - INFO - __main__ - Step 7741: {'lr': 0.000498146584618819, 'samples': 1486272, 'steps': 7740, 'loss/train': 2.059128999710083} -08/30/2021 14:33:53 - INFO - __main__ - Step 7742: {'lr': 0.0004981459395727117, 'samples': 1486464, 'steps': 7741, 'loss/train': 1.4216228723526} -08/30/2021 14:33:54 - INFO - __main__ - Step 7743: {'lr': 0.0004981452944147937, 'samples': 1486656, 'steps': 7742, 'loss/train': 1.7106612920761108} -08/30/2021 14:33:55 - INFO - __main__ - Step 7744: {'lr': 0.0004981446491450652, 'samples': 1486848, 'steps': 7743, 'loss/train': 2.3453712463378906} -08/30/2021 14:33:56 - INFO - __main__ - Step 7745: {'lr': 0.0004981440037635266, 'samples': 1487040, 'steps': 7744, 'loss/train': 1.805321216583252} -08/30/2021 14:33:56 - INFO - __main__ - Step 7746: {'lr': 0.0004981433582701781, 'samples': 1487232, 'steps': 7745, 'loss/train': 1.8666877746582031} -08/30/2021 14:33:57 - INFO - __main__ - Step 7747: {'lr': 0.00049814271266502, 'samples': 1487424, 'steps': 7746, 'loss/train': 1.5551704168319702} -08/30/2021 14:33:57 - INFO - __main__ - Step 7748: {'lr': 0.0004981420669480526, 'samples': 1487616, 'steps': 7747, 'loss/train': 1.9459718465805054} -08/30/2021 14:33:58 - INFO - __main__ - Step 7749: {'lr': 0.0004981414211192763, 'samples': 1487808, 'steps': 7748, 'loss/train': 1.812592625617981} -08/30/2021 14:33:59 - INFO - __main__ - Step 7750: {'lr': 0.0004981407751786913, 'samples': 1488000, 'steps': 7749, 'loss/train': 2.0698540210723877} -08/30/2021 14:33:59 - INFO - __main__ - Step 7751: {'lr': 0.0004981401291262979, 'samples': 1488192, 'steps': 7750, 'loss/train': 2.1763041019439697} -08/30/2021 14:34:00 - INFO - __main__ - Step 7752: {'lr': 0.0004981394829620963, 'samples': 1488384, 'steps': 7751, 'loss/train': 1.6592662334442139} -08/30/2021 14:34:00 - INFO - __main__ - Step 7753: {'lr': 0.0004981388366860869, 'samples': 1488576, 'steps': 7752, 'loss/train': 2.004002571105957} -08/30/2021 14:34:02 - INFO - __main__ - Step 7754: {'lr': 0.0004981381902982702, 'samples': 1488768, 'steps': 7753, 'loss/train': 1.9877376556396484} -08/30/2021 14:34:02 - INFO - __main__ - Step 7755: {'lr': 0.0004981375437986459, 'samples': 1488960, 'steps': 7754, 'loss/train': 1.8999247550964355} -08/30/2021 14:34:03 - INFO - __main__ - Step 7756: {'lr': 0.0004981368971872149, 'samples': 1489152, 'steps': 7755, 'loss/train': 1.6776868104934692} -08/30/2021 14:34:03 - INFO - __main__ - Step 7757: {'lr': 0.0004981362504639772, 'samples': 1489344, 'steps': 7756, 'loss/train': 1.939148187637329} -08/30/2021 14:34:04 - INFO - __main__ - Step 7758: {'lr': 0.0004981356036289331, 'samples': 1489536, 'steps': 7757, 'loss/train': 2.2283542156219482} -08/30/2021 14:34:05 - INFO - __main__ - Step 7759: {'lr': 0.0004981349566820828, 'samples': 1489728, 'steps': 7758, 'loss/train': 2.072937250137329} -08/30/2021 14:34:05 - INFO - __main__ - Step 7760: {'lr': 0.0004981343096234268, 'samples': 1489920, 'steps': 7759, 'loss/train': 1.9974037408828735} -08/30/2021 14:34:06 - INFO - __main__ - Step 7761: {'lr': 0.0004981336624529654, 'samples': 1490112, 'steps': 7760, 'loss/train': 1.4315470457077026} -08/30/2021 14:34:06 - INFO - __main__ - Step 7762: {'lr': 0.0004981330151706988, 'samples': 1490304, 'steps': 7761, 'loss/train': 2.379178762435913} -08/30/2021 14:34:07 - INFO - __main__ - Step 7763: {'lr': 0.0004981323677766273, 'samples': 1490496, 'steps': 7762, 'loss/train': 2.22389554977417} -08/30/2021 14:34:08 - INFO - __main__ - Step 7764: {'lr': 0.000498131720270751, 'samples': 1490688, 'steps': 7763, 'loss/train': 2.1621785163879395} -08/30/2021 14:34:08 - INFO - __main__ - Step 7765: {'lr': 0.0004981310726530706, 'samples': 1490880, 'steps': 7764, 'loss/train': 1.9238741397857666} -08/30/2021 14:34:09 - INFO - __main__ - Step 7766: {'lr': 0.0004981304249235861, 'samples': 1491072, 'steps': 7765, 'loss/train': 2.118007183074951} -08/30/2021 14:34:09 - INFO - __main__ - Step 7767: {'lr': 0.0004981297770822977, 'samples': 1491264, 'steps': 7766, 'loss/train': 1.4278289079666138} -08/30/2021 14:34:09 - INFO - __main__ - Step 7768: {'lr': 0.0004981291291292061, 'samples': 1491456, 'steps': 7767, 'loss/train': 2.1991090774536133} -08/30/2021 14:34:10 - INFO - __main__ - Step 7769: {'lr': 0.0004981284810643112, 'samples': 1491648, 'steps': 7768, 'loss/train': 1.9503018856048584} -08/30/2021 14:34:11 - INFO - __main__ - Step 7770: {'lr': 0.0004981278328876134, 'samples': 1491840, 'steps': 7769, 'loss/train': 1.9926166534423828} -08/30/2021 14:34:12 - INFO - __main__ - Step 7771: {'lr': 0.0004981271845991131, 'samples': 1492032, 'steps': 7770, 'loss/train': 2.072086811065674} -08/30/2021 14:34:12 - INFO - __main__ - Step 7772: {'lr': 0.0004981265361988105, 'samples': 1492224, 'steps': 7771, 'loss/train': 1.7195425033569336} -08/30/2021 14:34:13 - INFO - __main__ - Step 7773: {'lr': 0.000498125887686706, 'samples': 1492416, 'steps': 7772, 'loss/train': 2.0277905464172363} -08/30/2021 14:34:13 - INFO - __main__ - Step 7774: {'lr': 0.0004981252390627997, 'samples': 1492608, 'steps': 7773, 'loss/train': 1.9627342224121094} -08/30/2021 14:34:14 - INFO - __main__ - Step 7775: {'lr': 0.000498124590327092, 'samples': 1492800, 'steps': 7774, 'loss/train': 1.5249673128128052} -08/30/2021 14:34:15 - INFO - __main__ - Step 7776: {'lr': 0.0004981239414795832, 'samples': 1492992, 'steps': 7775, 'loss/train': 2.2362020015716553} -08/30/2021 14:34:15 - INFO - __main__ - Step 7777: {'lr': 0.0004981232925202736, 'samples': 1493184, 'steps': 7776, 'loss/train': 2.6314713954925537} -08/30/2021 14:34:15 - INFO - __main__ - Step 7778: {'lr': 0.0004981226434491635, 'samples': 1493376, 'steps': 7777, 'loss/train': 2.2494640350341797} -08/30/2021 14:34:16 - INFO - __main__ - Step 7779: {'lr': 0.000498121994266253, 'samples': 1493568, 'steps': 7778, 'loss/train': 2.3969132900238037} -08/30/2021 14:34:17 - INFO - __main__ - Step 7780: {'lr': 0.0004981213449715427, 'samples': 1493760, 'steps': 7779, 'loss/train': 1.8594331741333008} -08/30/2021 14:34:18 - INFO - __main__ - Step 7781: {'lr': 0.0004981206955650328, 'samples': 1493952, 'steps': 7780, 'loss/train': 2.656524658203125} -08/30/2021 14:34:18 - INFO - __main__ - Step 7782: {'lr': 0.0004981200460467234, 'samples': 1494144, 'steps': 7781, 'loss/train': 2.2213633060455322} -08/30/2021 14:34:19 - INFO - __main__ - Step 7783: {'lr': 0.0004981193964166151, 'samples': 1494336, 'steps': 7782, 'loss/train': 1.5977270603179932} -08/30/2021 14:34:19 - INFO - __main__ - Step 7784: {'lr': 0.0004981187466747079, 'samples': 1494528, 'steps': 7783, 'loss/train': 2.01069974899292} -08/30/2021 14:34:20 - INFO - __main__ - Step 7785: {'lr': 0.0004981180968210023, 'samples': 1494720, 'steps': 7784, 'loss/train': 1.7394118309020996} -08/30/2021 14:34:21 - INFO - __main__ - Step 7786: {'lr': 0.0004981174468554984, 'samples': 1494912, 'steps': 7785, 'loss/train': 6.545466423034668} -08/30/2021 14:34:21 - INFO - __main__ - Step 7787: {'lr': 0.0004981167967781968, 'samples': 1495104, 'steps': 7786, 'loss/train': 1.223050594329834} -08/30/2021 14:34:22 - INFO - __main__ - Step 7788: {'lr': 0.0004981161465890975, 'samples': 1495296, 'steps': 7787, 'loss/train': 1.7190486192703247} -08/30/2021 14:34:22 - INFO - __main__ - Step 7789: {'lr': 0.0004981154962882008, 'samples': 1495488, 'steps': 7788, 'loss/train': 1.9940739870071411} -08/30/2021 14:34:22 - INFO - __main__ - Step 7790: {'lr': 0.0004981148458755071, 'samples': 1495680, 'steps': 7789, 'loss/train': 2.0188848972320557} -08/30/2021 14:34:24 - INFO - __main__ - Step 7791: {'lr': 0.0004981141953510169, 'samples': 1495872, 'steps': 7790, 'loss/train': 1.7441670894622803} -08/30/2021 14:34:24 - INFO - __main__ - Step 7792: {'lr': 0.00049811354471473, 'samples': 1496064, 'steps': 7791, 'loss/train': 1.5147539377212524} -08/30/2021 14:34:25 - INFO - __main__ - Step 7793: {'lr': 0.0004981128939666471, 'samples': 1496256, 'steps': 7792, 'loss/train': 1.9101200103759766} -08/30/2021 14:34:25 - INFO - __main__ - Step 7794: {'lr': 0.0004981122431067683, 'samples': 1496448, 'steps': 7793, 'loss/train': 1.965456485748291} -08/30/2021 14:34:25 - INFO - __main__ - Step 7795: {'lr': 0.0004981115921350941, 'samples': 1496640, 'steps': 7794, 'loss/train': 2.0283596515655518} -08/30/2021 14:34:27 - INFO - __main__ - Step 7796: {'lr': 0.0004981109410516245, 'samples': 1496832, 'steps': 7795, 'loss/train': 1.6873531341552734} -08/30/2021 14:34:27 - INFO - __main__ - Step 7797: {'lr': 0.00049811028985636, 'samples': 1497024, 'steps': 7796, 'loss/train': 1.7942057847976685} -08/30/2021 14:34:28 - INFO - __main__ - Step 7798: {'lr': 0.0004981096385493007, 'samples': 1497216, 'steps': 7797, 'loss/train': 1.788494348526001} -08/30/2021 14:34:28 - INFO - __main__ - Step 7799: {'lr': 0.0004981089871304472, 'samples': 1497408, 'steps': 7798, 'loss/train': 2.047255754470825} -08/30/2021 14:34:28 - INFO - __main__ - Step 7800: {'lr': 0.0004981083355997995, 'samples': 1497600, 'steps': 7799, 'loss/train': 2.0315942764282227} -08/30/2021 14:34:30 - INFO - __main__ - Step 7801: {'lr': 0.0004981076839573581, 'samples': 1497792, 'steps': 7800, 'loss/train': 1.8836919069290161} -08/30/2021 14:34:30 - INFO - __main__ - Step 7802: {'lr': 0.0004981070322031231, 'samples': 1497984, 'steps': 7801, 'loss/train': 1.91158926486969} -08/30/2021 14:34:31 - INFO - __main__ - Step 7803: {'lr': 0.000498106380337095, 'samples': 1498176, 'steps': 7802, 'loss/train': 2.595004081726074} -08/30/2021 14:34:31 - INFO - __main__ - Step 7804: {'lr': 0.000498105728359274, 'samples': 1498368, 'steps': 7803, 'loss/train': 2.024995803833008} -08/30/2021 14:34:31 - INFO - __main__ - Step 7805: {'lr': 0.0004981050762696604, 'samples': 1498560, 'steps': 7804, 'loss/train': 1.6393280029296875} -08/30/2021 14:34:33 - INFO - __main__ - Step 7806: {'lr': 0.0004981044240682544, 'samples': 1498752, 'steps': 7805, 'loss/train': 1.9961345195770264} -08/30/2021 14:34:34 - INFO - __main__ - Step 7807: {'lr': 0.0004981037717550564, 'samples': 1498944, 'steps': 7806, 'loss/train': 1.8909987211227417} -08/30/2021 14:34:34 - INFO - __main__ - Step 7808: {'lr': 0.0004981031193300667, 'samples': 1499136, 'steps': 7807, 'loss/train': 1.900766134262085} -08/30/2021 14:34:35 - INFO - __main__ - Step 7809: {'lr': 0.0004981024667932855, 'samples': 1499328, 'steps': 7808, 'loss/train': 1.8486652374267578} -08/30/2021 14:34:35 - INFO - __main__ - Step 7810: {'lr': 0.0004981018141447133, 'samples': 1499520, 'steps': 7809, 'loss/train': 1.9063693284988403} -08/30/2021 14:34:36 - INFO - __main__ - Step 7811: {'lr': 0.00049810116138435, 'samples': 1499712, 'steps': 7810, 'loss/train': 1.9456430673599243} -08/30/2021 14:34:37 - INFO - __main__ - Step 7812: {'lr': 0.0004981005085121963, 'samples': 1499904, 'steps': 7811, 'loss/train': 1.6784391403198242} -08/30/2021 14:34:37 - INFO - __main__ - Step 7813: {'lr': 0.0004980998555282524, 'samples': 1500096, 'steps': 7812, 'loss/train': 2.22102952003479} -08/30/2021 14:34:38 - INFO - __main__ - Step 7814: {'lr': 0.0004980992024325185, 'samples': 1500288, 'steps': 7813, 'loss/train': 0.6577968001365662} -08/30/2021 14:34:38 - INFO - __main__ - Step 7815: {'lr': 0.0004980985492249949, 'samples': 1500480, 'steps': 7814, 'loss/train': 1.84895658493042} -08/30/2021 14:34:39 - INFO - __main__ - Step 7816: {'lr': 0.0004980978959056819, 'samples': 1500672, 'steps': 7815, 'loss/train': 1.110809564590454} -08/30/2021 14:34:40 - INFO - __main__ - Step 7817: {'lr': 0.0004980972424745798, 'samples': 1500864, 'steps': 7816, 'loss/train': 1.6254597902297974} -08/30/2021 14:34:40 - INFO - __main__ - Step 7818: {'lr': 0.000498096588931689, 'samples': 1501056, 'steps': 7817, 'loss/train': 1.8533543348312378} -08/30/2021 14:34:41 - INFO - __main__ - Step 7819: {'lr': 0.0004980959352770095, 'samples': 1501248, 'steps': 7818, 'loss/train': 2.1147758960723877} -08/30/2021 14:34:41 - INFO - __main__ - Step 7820: {'lr': 0.000498095281510542, 'samples': 1501440, 'steps': 7819, 'loss/train': 2.053044080734253} -08/30/2021 14:34:42 - INFO - __main__ - Step 7821: {'lr': 0.0004980946276322866, 'samples': 1501632, 'steps': 7820, 'loss/train': 1.740517258644104} -08/30/2021 14:34:43 - INFO - __main__ - Step 7822: {'lr': 0.0004980939736422436, 'samples': 1501824, 'steps': 7821, 'loss/train': 1.7762596607208252} -08/30/2021 14:34:43 - INFO - __main__ - Step 7823: {'lr': 0.0004980933195404131, 'samples': 1502016, 'steps': 7822, 'loss/train': 1.9814330339431763} -08/30/2021 14:34:44 - INFO - __main__ - Step 7824: {'lr': 0.0004980926653267957, 'samples': 1502208, 'steps': 7823, 'loss/train': 1.6790393590927124} -08/30/2021 14:34:44 - INFO - __main__ - Step 7825: {'lr': 0.0004980920110013915, 'samples': 1502400, 'steps': 7824, 'loss/train': 2.0899534225463867} -08/30/2021 14:34:45 - INFO - __main__ - Step 7826: {'lr': 0.000498091356564201, 'samples': 1502592, 'steps': 7825, 'loss/train': 1.817801833152771} -08/30/2021 14:34:46 - INFO - __main__ - Step 7827: {'lr': 0.0004980907020152242, 'samples': 1502784, 'steps': 7826, 'loss/train': 1.7425017356872559} -08/30/2021 14:34:46 - INFO - __main__ - Step 7828: {'lr': 0.0004980900473544617, 'samples': 1502976, 'steps': 7827, 'loss/train': 2.0283257961273193} -08/30/2021 14:34:47 - INFO - __main__ - Step 7829: {'lr': 0.0004980893925819137, 'samples': 1503168, 'steps': 7828, 'loss/train': 1.756772756576538} -08/30/2021 14:34:47 - INFO - __main__ - Step 7830: {'lr': 0.0004980887376975804, 'samples': 1503360, 'steps': 7829, 'loss/train': 1.8477866649627686} -08/30/2021 14:34:49 - INFO - __main__ - Step 7831: {'lr': 0.000498088082701462, 'samples': 1503552, 'steps': 7830, 'loss/train': 1.9399091005325317} -08/30/2021 14:34:49 - INFO - __main__ - Step 7832: {'lr': 0.0004980874275935591, 'samples': 1503744, 'steps': 7831, 'loss/train': 1.925467848777771} -08/30/2021 14:34:49 - INFO - __main__ - Step 7833: {'lr': 0.0004980867723738717, 'samples': 1503936, 'steps': 7832, 'loss/train': 2.454023599624634} -08/30/2021 14:34:50 - INFO - __main__ - Step 7834: {'lr': 0.0004980861170424003, 'samples': 1504128, 'steps': 7833, 'loss/train': 2.172863245010376} -08/30/2021 14:34:50 - INFO - __main__ - Step 7835: {'lr': 0.0004980854615991452, 'samples': 1504320, 'steps': 7834, 'loss/train': 5.90132999420166} -08/30/2021 14:34:51 - INFO - __main__ - Step 7836: {'lr': 0.0004980848060441064, 'samples': 1504512, 'steps': 7835, 'loss/train': 8.035666465759277} -08/30/2021 14:34:52 - INFO - __main__ - Step 7837: {'lr': 0.0004980841503772846, 'samples': 1504704, 'steps': 7836, 'loss/train': 2.5694777965545654} -08/30/2021 14:34:53 - INFO - __main__ - Step 7838: {'lr': 0.0004980834945986799, 'samples': 1504896, 'steps': 7837, 'loss/train': 2.299912691116333} -08/30/2021 14:34:53 - INFO - __main__ - Step 7839: {'lr': 0.0004980828387082925, 'samples': 1505088, 'steps': 7838, 'loss/train': 2.200338840484619} -08/30/2021 14:34:53 - INFO - __main__ - Step 7840: {'lr': 0.000498082182706123, 'samples': 1505280, 'steps': 7839, 'loss/train': 1.0367792844772339} -08/30/2021 14:34:54 - INFO - __main__ - Step 7841: {'lr': 0.0004980815265921713, 'samples': 1505472, 'steps': 7840, 'loss/train': 1.7248426675796509} -08/30/2021 14:34:54 - INFO - __main__ - Step 7842: {'lr': 0.000498080870366438, 'samples': 1505664, 'steps': 7841, 'loss/train': 3.7187607288360596} -08/30/2021 14:34:56 - INFO - __main__ - Step 7843: {'lr': 0.0004980802140289232, 'samples': 1505856, 'steps': 7842, 'loss/train': 1.994019865989685} -08/30/2021 14:34:56 - INFO - __main__ - Step 7844: {'lr': 0.0004980795575796273, 'samples': 1506048, 'steps': 7843, 'loss/train': 2.1058144569396973} -08/30/2021 14:34:56 - INFO - __main__ - Step 7845: {'lr': 0.0004980789010185507, 'samples': 1506240, 'steps': 7844, 'loss/train': 2.454730749130249} -08/30/2021 14:34:57 - INFO - __main__ - Step 7846: {'lr': 0.0004980782443456935, 'samples': 1506432, 'steps': 7845, 'loss/train': 2.023253917694092} -08/30/2021 14:34:57 - INFO - __main__ - Step 7847: {'lr': 0.000498077587561056, 'samples': 1506624, 'steps': 7846, 'loss/train': 2.3231048583984375} -08/30/2021 14:34:59 - INFO - __main__ - Step 7848: {'lr': 0.0004980769306646386, 'samples': 1506816, 'steps': 7847, 'loss/train': 2.014291286468506} -08/30/2021 14:34:59 - INFO - __main__ - Step 7849: {'lr': 0.0004980762736564417, 'samples': 1507008, 'steps': 7848, 'loss/train': 2.087556838989258} -08/30/2021 14:35:00 - INFO - __main__ - Step 7850: {'lr': 0.0004980756165364653, 'samples': 1507200, 'steps': 7849, 'loss/train': 2.1835293769836426} -08/30/2021 14:35:00 - INFO - __main__ - Step 7851: {'lr': 0.0004980749593047099, 'samples': 1507392, 'steps': 7850, 'loss/train': 1.7254502773284912} -08/30/2021 14:35:00 - INFO - __main__ - Step 7852: {'lr': 0.0004980743019611757, 'samples': 1507584, 'steps': 7851, 'loss/train': 0.8205849528312683} -08/30/2021 14:35:02 - INFO - __main__ - Step 7853: {'lr': 0.0004980736445058631, 'samples': 1507776, 'steps': 7852, 'loss/train': 0.36747708916664124} -08/30/2021 14:35:02 - INFO - __main__ - Step 7854: {'lr': 0.0004980729869387724, 'samples': 1507968, 'steps': 7853, 'loss/train': 1.8287383317947388} -08/30/2021 14:35:03 - INFO - __main__ - Step 7855: {'lr': 0.0004980723292599037, 'samples': 1508160, 'steps': 7854, 'loss/train': 2.253176689147949} -08/30/2021 14:35:03 - INFO - __main__ - Step 7856: {'lr': 0.0004980716714692576, 'samples': 1508352, 'steps': 7855, 'loss/train': 1.9407721757888794} -08/30/2021 14:35:03 - INFO - __main__ - Step 7857: {'lr': 0.0004980710135668342, 'samples': 1508544, 'steps': 7856, 'loss/train': 1.7226452827453613} -08/30/2021 14:35:06 - INFO - __main__ - Step 7858: {'lr': 0.0004980703555526338, 'samples': 1508736, 'steps': 7857, 'loss/train': 1.948722004890442} -08/30/2021 14:35:06 - INFO - __main__ - Step 7859: {'lr': 0.0004980696974266566, 'samples': 1508928, 'steps': 7858, 'loss/train': 2.246548891067505} -08/30/2021 14:35:07 - INFO - __main__ - Step 7860: {'lr': 0.0004980690391889033, 'samples': 1509120, 'steps': 7859, 'loss/train': 2.173987627029419} -08/30/2021 14:35:07 - INFO - __main__ - Step 7861: {'lr': 0.0004980683808393737, 'samples': 1509312, 'steps': 7860, 'loss/train': 1.4272888898849487} -08/30/2021 14:35:07 - INFO - __main__ - Step 7862: {'lr': 0.0004980677223780683, 'samples': 1509504, 'steps': 7861, 'loss/train': 0.162075012922287} -08/30/2021 14:35:08 - INFO - __main__ - Step 7863: {'lr': 0.0004980670638049875, 'samples': 1509696, 'steps': 7862, 'loss/train': 1.9510797262191772} -08/30/2021 14:35:09 - INFO - __main__ - Step 7864: {'lr': 0.0004980664051201315, 'samples': 1509888, 'steps': 7863, 'loss/train': 2.119154214859009} -08/30/2021 14:35:10 - INFO - __main__ - Step 7865: {'lr': 0.0004980657463235006, 'samples': 1510080, 'steps': 7864, 'loss/train': 1.5261328220367432} -08/30/2021 14:35:10 - INFO - __main__ - Step 7866: {'lr': 0.0004980650874150951, 'samples': 1510272, 'steps': 7865, 'loss/train': 1.7908101081848145} -08/30/2021 14:35:10 - INFO - __main__ - Step 7867: {'lr': 0.0004980644283949152, 'samples': 1510464, 'steps': 7866, 'loss/train': 1.9720752239227295} -08/30/2021 14:35:11 - INFO - __main__ - Step 7868: {'lr': 0.0004980637692629615, 'samples': 1510656, 'steps': 7867, 'loss/train': 1.6608741283416748} -08/30/2021 14:35:12 - INFO - __main__ - Step 7869: {'lr': 0.0004980631100192339, 'samples': 1510848, 'steps': 7868, 'loss/train': 2.1481995582580566} -08/30/2021 14:35:13 - INFO - __main__ - Step 7870: {'lr': 0.000498062450663733, 'samples': 1511040, 'steps': 7869, 'loss/train': 2.110429286956787} -08/30/2021 14:35:13 - INFO - __main__ - Step 7871: {'lr': 0.000498061791196459, 'samples': 1511232, 'steps': 7870, 'loss/train': 1.9926373958587646} -08/30/2021 14:35:14 - INFO - __main__ - Step 7872: {'lr': 0.0004980611316174122, 'samples': 1511424, 'steps': 7871, 'loss/train': 2.056915760040283} -08/30/2021 14:35:14 - INFO - __main__ - Step 7873: {'lr': 0.0004980604719265928, 'samples': 1511616, 'steps': 7872, 'loss/train': 1.4854575395584106} -08/30/2021 14:35:15 - INFO - __main__ - Step 7874: {'lr': 0.0004980598121240012, 'samples': 1511808, 'steps': 7873, 'loss/train': 2.2308859825134277} -08/30/2021 14:35:16 - INFO - __main__ - Step 7875: {'lr': 0.0004980591522096377, 'samples': 1512000, 'steps': 7874, 'loss/train': 2.1588919162750244} -08/30/2021 14:35:16 - INFO - __main__ - Step 7876: {'lr': 0.0004980584921835025, 'samples': 1512192, 'steps': 7875, 'loss/train': 2.146693706512451} -08/30/2021 14:35:17 - INFO - __main__ - Step 7877: {'lr': 0.000498057832045596, 'samples': 1512384, 'steps': 7876, 'loss/train': 2.067829132080078} -08/30/2021 14:35:17 - INFO - __main__ - Step 7878: {'lr': 0.0004980571717959186, 'samples': 1512576, 'steps': 7877, 'loss/train': 2.116293430328369} -08/30/2021 14:35:19 - INFO - __main__ - Step 7879: {'lr': 0.0004980565114344704, 'samples': 1512768, 'steps': 7878, 'loss/train': 1.7423810958862305} -08/30/2021 14:35:19 - INFO - __main__ - Step 7880: {'lr': 0.0004980558509612516, 'samples': 1512960, 'steps': 7879, 'loss/train': 1.727136492729187} -08/30/2021 14:35:19 - INFO - __main__ - Step 7881: {'lr': 0.0004980551903762629, 'samples': 1513152, 'steps': 7880, 'loss/train': 2.0340633392333984} -08/30/2021 14:35:20 - INFO - __main__ - Step 7882: {'lr': 0.0004980545296795043, 'samples': 1513344, 'steps': 7881, 'loss/train': 1.2240817546844482} -08/30/2021 14:35:20 - INFO - __main__ - Step 7883: {'lr': 0.0004980538688709761, 'samples': 1513536, 'steps': 7882, 'loss/train': 1.252685546875} -08/30/2021 14:35:22 - INFO - __main__ - Step 7884: {'lr': 0.0004980532079506786, 'samples': 1513728, 'steps': 7883, 'loss/train': 1.0615259408950806} -08/30/2021 14:35:22 - INFO - __main__ - Step 7885: {'lr': 0.0004980525469186122, 'samples': 1513920, 'steps': 7884, 'loss/train': 1.0931607484817505} -08/30/2021 14:35:23 - INFO - __main__ - Step 7886: {'lr': 0.0004980518857747772, 'samples': 1514112, 'steps': 7885, 'loss/train': 1.81352698802948} -08/30/2021 14:35:23 - INFO - __main__ - Step 7887: {'lr': 0.0004980512245191738, 'samples': 1514304, 'steps': 7886, 'loss/train': 1.7306314706802368} -08/30/2021 14:35:23 - INFO - __main__ - Step 7888: {'lr': 0.0004980505631518023, 'samples': 1514496, 'steps': 7887, 'loss/train': 2.4788763523101807} -08/30/2021 14:35:25 - INFO - __main__ - Step 7889: {'lr': 0.0004980499016726632, 'samples': 1514688, 'steps': 7888, 'loss/train': 1.7479809522628784} -08/30/2021 14:35:25 - INFO - __main__ - Step 7890: {'lr': 0.0004980492400817564, 'samples': 1514880, 'steps': 7889, 'loss/train': 2.2409465312957764} -08/30/2021 14:35:26 - INFO - __main__ - Step 7891: {'lr': 0.0004980485783790827, 'samples': 1515072, 'steps': 7890, 'loss/train': 2.0339908599853516} -08/30/2021 14:35:26 - INFO - __main__ - Step 7892: {'lr': 0.0004980479165646419, 'samples': 1515264, 'steps': 7891, 'loss/train': 2.3462719917297363} -08/30/2021 14:35:26 - INFO - __main__ - Step 7893: {'lr': 0.0004980472546384347, 'samples': 1515456, 'steps': 7892, 'loss/train': 2.127397298812866} -08/30/2021 14:35:28 - INFO - __main__ - Step 7894: {'lr': 0.0004980465926004613, 'samples': 1515648, 'steps': 7893, 'loss/train': 1.0002518892288208} -08/30/2021 14:35:28 - INFO - __main__ - Step 7895: {'lr': 0.0004980459304507218, 'samples': 1515840, 'steps': 7894, 'loss/train': 1.8891297578811646} -08/30/2021 14:35:29 - INFO - __main__ - Step 7896: {'lr': 0.0004980452681892166, 'samples': 1516032, 'steps': 7895, 'loss/train': 1.329634428024292} -08/30/2021 14:35:29 - INFO - __main__ - Step 7897: {'lr': 0.0004980446058159461, 'samples': 1516224, 'steps': 7896, 'loss/train': 1.7612277269363403} -08/30/2021 14:35:29 - INFO - __main__ - Step 7898: {'lr': 0.0004980439433309106, 'samples': 1516416, 'steps': 7897, 'loss/train': 1.8305355310440063} -08/30/2021 14:35:30 - INFO - __main__ - Step 7899: {'lr': 0.0004980432807341102, 'samples': 1516608, 'steps': 7898, 'loss/train': 1.9770076274871826} -08/30/2021 14:35:31 - INFO - __main__ - Step 7900: {'lr': 0.0004980426180255453, 'samples': 1516800, 'steps': 7899, 'loss/train': 2.2382895946502686} -08/30/2021 14:35:32 - INFO - __main__ - Step 7901: {'lr': 0.0004980419552052163, 'samples': 1516992, 'steps': 7900, 'loss/train': 1.5814892053604126} -08/30/2021 14:35:32 - INFO - __main__ - Step 7902: {'lr': 0.0004980412922731234, 'samples': 1517184, 'steps': 7901, 'loss/train': 1.792866587638855} -08/30/2021 14:35:32 - INFO - __main__ - Step 7903: {'lr': 0.0004980406292292669, 'samples': 1517376, 'steps': 7902, 'loss/train': 2.3232505321502686} -08/30/2021 14:35:33 - INFO - __main__ - Step 7904: {'lr': 0.0004980399660736472, 'samples': 1517568, 'steps': 7903, 'loss/train': 1.5798043012619019} -08/30/2021 14:35:34 - INFO - __main__ - Step 7905: {'lr': 0.0004980393028062646, 'samples': 1517760, 'steps': 7904, 'loss/train': 2.43125057220459} -08/30/2021 14:35:35 - INFO - __main__ - Step 7906: {'lr': 0.0004980386394271191, 'samples': 1517952, 'steps': 7905, 'loss/train': 2.2891671657562256} -08/30/2021 14:35:35 - INFO - __main__ - Step 7907: {'lr': 0.0004980379759362113, 'samples': 1518144, 'steps': 7906, 'loss/train': 2.1696372032165527} -08/30/2021 14:35:35 - INFO - __main__ - Step 7908: {'lr': 0.0004980373123335414, 'samples': 1518336, 'steps': 7907, 'loss/train': 2.017667770385742} -08/30/2021 14:35:36 - INFO - __main__ - Step 7909: {'lr': 0.0004980366486191098, 'samples': 1518528, 'steps': 7908, 'loss/train': 1.5882924795150757} -08/30/2021 14:35:38 - INFO - __main__ - Step 7910: {'lr': 0.0004980359847929167, 'samples': 1518720, 'steps': 7909, 'loss/train': 2.1881558895111084} -08/30/2021 14:35:38 - INFO - __main__ - Step 7911: {'lr': 0.0004980353208549623, 'samples': 1518912, 'steps': 7910, 'loss/train': 1.9824440479278564} -08/30/2021 14:35:38 - INFO - __main__ - Step 7912: {'lr': 0.0004980346568052471, 'samples': 1519104, 'steps': 7911, 'loss/train': 1.9016330242156982} -08/30/2021 14:35:39 - INFO - __main__ - Step 7913: {'lr': 0.0004980339926437713, 'samples': 1519296, 'steps': 7912, 'loss/train': 1.8732227087020874} -08/30/2021 14:35:39 - INFO - __main__ - Step 7914: {'lr': 0.0004980333283705351, 'samples': 1519488, 'steps': 7913, 'loss/train': 2.991459846496582} -08/30/2021 14:35:39 - INFO - __main__ - Step 7915: {'lr': 0.000498032663985539, 'samples': 1519680, 'steps': 7914, 'loss/train': 3.000925064086914} -08/30/2021 14:35:42 - INFO - __main__ - Step 7916: {'lr': 0.0004980319994887833, 'samples': 1519872, 'steps': 7915, 'loss/train': 2.2439892292022705} -08/30/2021 14:35:43 - INFO - __main__ - Step 7917: {'lr': 0.0004980313348802681, 'samples': 1520064, 'steps': 7916, 'loss/train': 1.8466578722000122} -08/30/2021 14:35:43 - INFO - __main__ - Step 7918: {'lr': 0.0004980306701599938, 'samples': 1520256, 'steps': 7917, 'loss/train': 2.148094654083252} -08/30/2021 14:35:43 - INFO - __main__ - Step 7919: {'lr': 0.0004980300053279607, 'samples': 1520448, 'steps': 7918, 'loss/train': 2.8910977840423584} -08/30/2021 14:35:44 - INFO - __main__ - Step 7920: {'lr': 0.0004980293403841693, 'samples': 1520640, 'steps': 7919, 'loss/train': 1.7436580657958984} -08/30/2021 14:35:44 - INFO - __main__ - Step 7921: {'lr': 0.0004980286753286195, 'samples': 1520832, 'steps': 7920, 'loss/train': 0.4521118700504303} -08/30/2021 14:35:44 - INFO - __main__ - Step 7922: {'lr': 0.0004980280101613119, 'samples': 1521024, 'steps': 7921, 'loss/train': 0.3283317983150482} -08/30/2021 14:35:45 - INFO - __main__ - Step 7923: {'lr': 0.0004980273448822466, 'samples': 1521216, 'steps': 7922, 'loss/train': 0.28704833984375} -08/30/2021 14:35:46 - INFO - __main__ - Step 7924: {'lr': 0.000498026679491424, 'samples': 1521408, 'steps': 7923, 'loss/train': 1.5692418813705444} -08/30/2021 14:35:47 - INFO - __main__ - Step 7925: {'lr': 0.0004980260139888445, 'samples': 1521600, 'steps': 7924, 'loss/train': 0.6815661787986755} -08/30/2021 14:35:47 - INFO - __main__ - Step 7926: {'lr': 0.0004980253483745083, 'samples': 1521792, 'steps': 7925, 'loss/train': 1.844468355178833} -08/30/2021 14:35:47 - INFO - __main__ - Step 7927: {'lr': 0.0004980246826484157, 'samples': 1521984, 'steps': 7926, 'loss/train': 1.6807992458343506} -08/30/2021 14:35:48 - INFO - __main__ - Step 7928: {'lr': 0.000498024016810567, 'samples': 1522176, 'steps': 7927, 'loss/train': 1.8619461059570312} -08/30/2021 14:35:49 - INFO - __main__ - Step 7929: {'lr': 0.0004980233508609625, 'samples': 1522368, 'steps': 7928, 'loss/train': 1.9839160442352295} -08/30/2021 14:35:50 - INFO - __main__ - Step 7930: {'lr': 0.0004980226847996025, 'samples': 1522560, 'steps': 7929, 'loss/train': 1.683982014656067} -08/30/2021 14:35:50 - INFO - __main__ - Step 7931: {'lr': 0.0004980220186264874, 'samples': 1522752, 'steps': 7930, 'loss/train': 1.829045057296753} -08/30/2021 14:35:50 - INFO - __main__ - Step 7932: {'lr': 0.0004980213523416172, 'samples': 1522944, 'steps': 7931, 'loss/train': 2.1909728050231934} -08/30/2021 14:35:51 - INFO - __main__ - Step 7933: {'lr': 0.0004980206859449926, 'samples': 1523136, 'steps': 7932, 'loss/train': 1.7288392782211304} -08/30/2021 14:35:52 - INFO - __main__ - Step 7934: {'lr': 0.0004980200194366136, 'samples': 1523328, 'steps': 7933, 'loss/train': 2.5279312133789062} -08/30/2021 14:35:53 - INFO - __main__ - Step 7935: {'lr': 0.0004980193528164806, 'samples': 1523520, 'steps': 7934, 'loss/train': 1.7118288278579712} -08/30/2021 14:35:53 - INFO - __main__ - Step 7936: {'lr': 0.0004980186860845939, 'samples': 1523712, 'steps': 7935, 'loss/train': 1.9207849502563477} -08/30/2021 14:35:53 - INFO - __main__ - Step 7937: {'lr': 0.0004980180192409539, 'samples': 1523904, 'steps': 7936, 'loss/train': 1.6872050762176514} -08/30/2021 14:35:54 - INFO - __main__ - Step 7938: {'lr': 0.0004980173522855608, 'samples': 1524096, 'steps': 7937, 'loss/train': 2.444744825363159} -08/30/2021 14:35:55 - INFO - __main__ - Step 7939: {'lr': 0.0004980166852184148, 'samples': 1524288, 'steps': 7938, 'loss/train': 1.7128517627716064} -08/30/2021 14:35:56 - INFO - __main__ - Step 7940: {'lr': 0.0004980160180395164, 'samples': 1524480, 'steps': 7939, 'loss/train': 1.9546692371368408} -08/30/2021 14:35:56 - INFO - __main__ - Step 7941: {'lr': 0.0004980153507488657, 'samples': 1524672, 'steps': 7940, 'loss/train': 2.101292133331299} -08/30/2021 14:35:56 - INFO - __main__ - Step 7942: {'lr': 0.0004980146833464633, 'samples': 1524864, 'steps': 7941, 'loss/train': 2.1375372409820557} -08/30/2021 14:35:57 - INFO - __main__ - Step 7943: {'lr': 0.0004980140158323092, 'samples': 1525056, 'steps': 7942, 'loss/train': 2.116997003555298} -08/30/2021 14:35:58 - INFO - __main__ - Step 7944: {'lr': 0.0004980133482064038, 'samples': 1525248, 'steps': 7943, 'loss/train': 2.504096508026123} -08/30/2021 14:35:59 - INFO - __main__ - Step 7945: {'lr': 0.0004980126804687474, 'samples': 1525440, 'steps': 7944, 'loss/train': 1.845743179321289} -08/30/2021 14:35:59 - INFO - __main__ - Step 7946: {'lr': 0.0004980120126193403, 'samples': 1525632, 'steps': 7945, 'loss/train': 0.4973115622997284} -08/30/2021 14:35:59 - INFO - __main__ - Step 7947: {'lr': 0.0004980113446581829, 'samples': 1525824, 'steps': 7946, 'loss/train': 1.9411251544952393} -08/30/2021 14:36:00 - INFO - __main__ - Step 7948: {'lr': 0.0004980106765852753, 'samples': 1526016, 'steps': 7947, 'loss/train': 2.3189473152160645} -08/30/2021 14:36:01 - INFO - __main__ - Step 7949: {'lr': 0.0004980100084006181, 'samples': 1526208, 'steps': 7948, 'loss/train': 1.9953863620758057} -08/30/2021 14:36:02 - INFO - __main__ - Step 7950: {'lr': 0.0004980093401042113, 'samples': 1526400, 'steps': 7949, 'loss/train': 2.287334442138672} -08/30/2021 14:36:02 - INFO - __main__ - Step 7951: {'lr': 0.0004980086716960552, 'samples': 1526592, 'steps': 7950, 'loss/train': 0.17116063833236694} -08/30/2021 14:36:02 - INFO - __main__ - Step 7952: {'lr': 0.0004980080031761504, 'samples': 1526784, 'steps': 7951, 'loss/train': 1.6895288228988647} -08/30/2021 14:36:03 - INFO - __main__ - Step 7953: {'lr': 0.000498007334544497, 'samples': 1526976, 'steps': 7952, 'loss/train': 1.9028524160385132} -08/30/2021 14:36:04 - INFO - __main__ - Step 7954: {'lr': 0.0004980066658010952, 'samples': 1527168, 'steps': 7953, 'loss/train': 2.0068423748016357} -08/30/2021 14:36:05 - INFO - __main__ - Step 7955: {'lr': 0.0004980059969459455, 'samples': 1527360, 'steps': 7954, 'loss/train': 2.3404934406280518} -08/30/2021 14:36:05 - INFO - __main__ - Step 7956: {'lr': 0.0004980053279790481, 'samples': 1527552, 'steps': 7955, 'loss/train': 1.9536232948303223} -08/30/2021 14:36:05 - INFO - __main__ - Step 7957: {'lr': 0.0004980046589004034, 'samples': 1527744, 'steps': 7956, 'loss/train': 0.4819597005844116} -08/30/2021 14:36:06 - INFO - __main__ - Step 7958: {'lr': 0.0004980039897100115, 'samples': 1527936, 'steps': 7957, 'loss/train': 2.34667706489563} -08/30/2021 14:36:06 - INFO - __main__ - Step 7959: {'lr': 0.000498003320407873, 'samples': 1528128, 'steps': 7958, 'loss/train': 1.59219491481781} -08/30/2021 14:36:08 - INFO - __main__ - Step 7960: {'lr': 0.000498002650993988, 'samples': 1528320, 'steps': 7959, 'loss/train': 1.3361490964889526} -08/30/2021 14:36:08 - INFO - __main__ - Step 7961: {'lr': 0.0004980019814683568, 'samples': 1528512, 'steps': 7960, 'loss/train': 1.800642967224121} -08/30/2021 14:36:09 - INFO - __main__ - Step 7962: {'lr': 0.0004980013118309796, 'samples': 1528704, 'steps': 7961, 'loss/train': 1.2711882591247559} -08/30/2021 14:36:09 - INFO - __main__ - Step 7963: {'lr': 0.000498000642081857, 'samples': 1528896, 'steps': 7962, 'loss/train': 2.0844485759735107} -08/30/2021 14:36:10 - INFO - __main__ - Step 7964: {'lr': 0.0004979999722209891, 'samples': 1529088, 'steps': 7963, 'loss/train': 3.0170657634735107} -08/30/2021 14:36:11 - INFO - __main__ - Step 7965: {'lr': 0.0004979993022483762, 'samples': 1529280, 'steps': 7964, 'loss/train': 2.1732215881347656} -08/30/2021 14:36:11 - INFO - __main__ - Step 7966: {'lr': 0.0004979986321640187, 'samples': 1529472, 'steps': 7965, 'loss/train': 1.7630354166030884} -08/30/2021 14:36:12 - INFO - __main__ - Step 7967: {'lr': 0.0004979979619679168, 'samples': 1529664, 'steps': 7966, 'loss/train': 2.0841562747955322} -08/30/2021 14:36:12 - INFO - __main__ - Step 7968: {'lr': 0.0004979972916600708, 'samples': 1529856, 'steps': 7967, 'loss/train': 1.6400091648101807} -08/30/2021 14:36:12 - INFO - __main__ - Step 7969: {'lr': 0.0004979966212404812, 'samples': 1530048, 'steps': 7968, 'loss/train': 1.864302158355713} -08/30/2021 14:36:14 - INFO - __main__ - Step 7970: {'lr': 0.0004979959507091479, 'samples': 1530240, 'steps': 7969, 'loss/train': 1.8296929597854614} -08/30/2021 14:36:15 - INFO - __main__ - Step 7971: {'lr': 0.0004979952800660717, 'samples': 1530432, 'steps': 7970, 'loss/train': 2.113858461380005} -08/30/2021 14:36:15 - INFO - __main__ - Step 7972: {'lr': 0.0004979946093112525, 'samples': 1530624, 'steps': 7971, 'loss/train': 1.1817271709442139} -08/30/2021 14:36:16 - INFO - __main__ - Step 7973: {'lr': 0.0004979939384446908, 'samples': 1530816, 'steps': 7972, 'loss/train': 1.7022167444229126} -08/30/2021 14:36:16 - INFO - __main__ - Step 7974: {'lr': 0.0004979932674663869, 'samples': 1531008, 'steps': 7973, 'loss/train': 2.165408134460449} -08/30/2021 14:36:18 - INFO - __main__ - Step 7975: {'lr': 0.000497992596376341, 'samples': 1531200, 'steps': 7974, 'loss/train': 2.0156679153442383} -08/30/2021 14:36:18 - INFO - __main__ - Step 7976: {'lr': 0.0004979919251745535, 'samples': 1531392, 'steps': 7975, 'loss/train': 2.6220502853393555} -08/30/2021 14:36:18 - INFO - __main__ - Step 7977: {'lr': 0.0004979912538610247, 'samples': 1531584, 'steps': 7976, 'loss/train': 1.8627681732177734} -08/30/2021 14:36:19 - INFO - __main__ - Step 7978: {'lr': 0.0004979905824357548, 'samples': 1531776, 'steps': 7977, 'loss/train': 1.6736421585083008} -08/30/2021 14:36:19 - INFO - __main__ - Step 7979: {'lr': 0.0004979899108987442, 'samples': 1531968, 'steps': 7978, 'loss/train': 2.027559995651245} -08/30/2021 14:36:21 - INFO - __main__ - Step 7980: {'lr': 0.0004979892392499932, 'samples': 1532160, 'steps': 7979, 'loss/train': 2.053459644317627} -08/30/2021 14:36:21 - INFO - __main__ - Step 7981: {'lr': 0.0004979885674895021, 'samples': 1532352, 'steps': 7980, 'loss/train': 2.142665386199951} -08/30/2021 14:36:22 - INFO - __main__ - Step 7982: {'lr': 0.0004979878956172711, 'samples': 1532544, 'steps': 7981, 'loss/train': 2.910045623779297} -08/30/2021 14:36:22 - INFO - __main__ - Step 7983: {'lr': 0.0004979872236333005, 'samples': 1532736, 'steps': 7982, 'loss/train': 2.21919846534729} -08/30/2021 14:36:22 - INFO - __main__ - Step 7984: {'lr': 0.0004979865515375908, 'samples': 1532928, 'steps': 7983, 'loss/train': 0.5169633030891418} -08/30/2021 14:36:23 - INFO - __main__ - Step 7985: {'lr': 0.0004979858793301422, 'samples': 1533120, 'steps': 7984, 'loss/train': 1.3447307348251343} -08/30/2021 14:36:24 - INFO - __main__ - Step 7986: {'lr': 0.000497985207010955, 'samples': 1533312, 'steps': 7985, 'loss/train': 1.9778574705123901} -08/30/2021 14:36:25 - INFO - __main__ - Step 7987: {'lr': 0.0004979845345800294, 'samples': 1533504, 'steps': 7986, 'loss/train': 3.0037994384765625} -08/30/2021 14:36:25 - INFO - __main__ - Step 7988: {'lr': 0.0004979838620373659, 'samples': 1533696, 'steps': 7987, 'loss/train': 0.644941508769989} -08/30/2021 14:36:25 - INFO - __main__ - Step 7989: {'lr': 0.0004979831893829646, 'samples': 1533888, 'steps': 7988, 'loss/train': 1.3515015840530396} -08/30/2021 14:36:26 - INFO - __main__ - Step 7990: {'lr': 0.0004979825166168259, 'samples': 1534080, 'steps': 7989, 'loss/train': 1.641153335571289} -08/30/2021 14:36:27 - INFO - __main__ - Step 7991: {'lr': 0.0004979818437389502, 'samples': 1534272, 'steps': 7990, 'loss/train': 1.7243032455444336} -08/30/2021 14:36:28 - INFO - __main__ - Step 7992: {'lr': 0.0004979811707493377, 'samples': 1534464, 'steps': 7991, 'loss/train': 2.0713040828704834} -08/30/2021 14:36:28 - INFO - __main__ - Step 7993: {'lr': 0.0004979804976479887, 'samples': 1534656, 'steps': 7992, 'loss/train': 1.9589450359344482} -08/30/2021 14:36:28 - INFO - __main__ - Step 7994: {'lr': 0.0004979798244349034, 'samples': 1534848, 'steps': 7993, 'loss/train': 2.1670055389404297} -08/30/2021 14:36:29 - INFO - __main__ - Step 7995: {'lr': 0.0004979791511100823, 'samples': 1535040, 'steps': 7994, 'loss/train': 2.0286285877227783} -08/30/2021 14:36:31 - INFO - __main__ - Step 7996: {'lr': 0.0004979784776735257, 'samples': 1535232, 'steps': 7995, 'loss/train': 1.703765869140625} -08/30/2021 14:36:31 - INFO - __main__ - Step 7997: {'lr': 0.0004979778041252338, 'samples': 1535424, 'steps': 7996, 'loss/train': 1.8905060291290283} -08/30/2021 14:36:31 - INFO - __main__ - Step 7998: {'lr': 0.0004979771304652068, 'samples': 1535616, 'steps': 7997, 'loss/train': 0.36253124475479126} -08/30/2021 14:36:32 - INFO - __main__ - Step 7999: {'lr': 0.0004979764566934452, 'samples': 1535808, 'steps': 7998, 'loss/train': 1.8920336961746216} -08/30/2021 14:36:32 - INFO - __main__ - Step 8000: {'lr': 0.0004979757828099492, 'samples': 1536000, 'steps': 7999, 'loss/train': 4.387569427490234} -08/30/2021 14:36:32 - INFO - __main__ - Step 8001: {'lr': 0.0004979751088147192, 'samples': 1536192, 'steps': 8000, 'loss/train': 1.4285427331924438} -08/30/2021 14:36:34 - INFO - __main__ - Step 8002: {'lr': 0.0004979744347077555, 'samples': 1536384, 'steps': 8001, 'loss/train': 2.4966976642608643} -08/30/2021 14:36:34 - INFO - __main__ - Step 8003: {'lr': 0.0004979737604890582, 'samples': 1536576, 'steps': 8002, 'loss/train': 1.9589344263076782} -08/30/2021 14:36:35 - INFO - __main__ - Step 8004: {'lr': 0.0004979730861586278, 'samples': 1536768, 'steps': 8003, 'loss/train': 1.8467297554016113} -08/30/2021 14:36:35 - INFO - __main__ - Step 8005: {'lr': 0.0004979724117164646, 'samples': 1536960, 'steps': 8004, 'loss/train': 2.14319109916687} -08/30/2021 14:36:35 - INFO - __main__ - Step 8006: {'lr': 0.0004979717371625689, 'samples': 1537152, 'steps': 8005, 'loss/train': 2.146137237548828} -08/30/2021 14:36:37 - INFO - __main__ - Step 8007: {'lr': 0.0004979710624969408, 'samples': 1537344, 'steps': 8006, 'loss/train': 2.2626583576202393} -08/30/2021 14:36:37 - INFO - __main__ - Step 8008: {'lr': 0.000497970387719581, 'samples': 1537536, 'steps': 8007, 'loss/train': 1.4100250005722046} -08/30/2021 14:36:38 - INFO - __main__ - Step 8009: {'lr': 0.0004979697128304893, 'samples': 1537728, 'steps': 8008, 'loss/train': 1.6080433130264282} -08/30/2021 14:36:38 - INFO - __main__ - Step 8010: {'lr': 0.0004979690378296665, 'samples': 1537920, 'steps': 8009, 'loss/train': 1.759553074836731} -08/30/2021 14:36:38 - INFO - __main__ - Step 8011: {'lr': 0.0004979683627171125, 'samples': 1538112, 'steps': 8010, 'loss/train': 2.5464515686035156} -08/30/2021 14:36:40 - INFO - __main__ - Step 8012: {'lr': 0.0004979676874928278, 'samples': 1538304, 'steps': 8011, 'loss/train': 1.9359408617019653} -08/30/2021 14:36:41 - INFO - __main__ - Step 8013: {'lr': 0.0004979670121568129, 'samples': 1538496, 'steps': 8012, 'loss/train': 1.395814061164856} -08/30/2021 14:36:41 - INFO - __main__ - Step 8014: {'lr': 0.0004979663367090676, 'samples': 1538688, 'steps': 8013, 'loss/train': 1.2997294664382935} -08/30/2021 14:36:41 - INFO - __main__ - Step 8015: {'lr': 0.0004979656611495927, 'samples': 1538880, 'steps': 8014, 'loss/train': 1.9417048692703247} -08/30/2021 14:36:42 - INFO - __main__ - Step 8016: {'lr': 0.0004979649854783883, 'samples': 1539072, 'steps': 8015, 'loss/train': 3.8958165645599365} -08/30/2021 14:36:43 - INFO - __main__ - Step 8017: {'lr': 0.0004979643096954545, 'samples': 1539264, 'steps': 8016, 'loss/train': 2.0222980976104736} -08/30/2021 14:36:44 - INFO - __main__ - Step 8018: {'lr': 0.000497963633800792, 'samples': 1539456, 'steps': 8017, 'loss/train': 0.9974882006645203} -08/30/2021 14:36:44 - INFO - __main__ - Step 8019: {'lr': 0.0004979629577944009, 'samples': 1539648, 'steps': 8018, 'loss/train': 1.9589250087738037} -08/30/2021 14:36:44 - INFO - __main__ - Step 8020: {'lr': 0.0004979622816762815, 'samples': 1539840, 'steps': 8019, 'loss/train': 1.955483317375183} -08/30/2021 14:36:45 - INFO - __main__ - Step 8021: {'lr': 0.0004979616054464341, 'samples': 1540032, 'steps': 8020, 'loss/train': 1.9251713752746582} -08/30/2021 14:36:47 - INFO - __main__ - Step 8022: {'lr': 0.000497960929104859, 'samples': 1540224, 'steps': 8021, 'loss/train': 0.7427318096160889} -08/30/2021 14:36:47 - INFO - __main__ - Step 8023: {'lr': 0.0004979602526515566, 'samples': 1540416, 'steps': 8022, 'loss/train': 1.4187557697296143} -08/30/2021 14:36:48 - INFO - __main__ - Step 8024: {'lr': 0.0004979595760865271, 'samples': 1540608, 'steps': 8023, 'loss/train': 2.1171064376831055} -08/30/2021 14:36:48 - INFO - __main__ - Step 8025: {'lr': 0.0004979588994097708, 'samples': 1540800, 'steps': 8024, 'loss/train': 3.3683278560638428} -08/30/2021 14:36:48 - INFO - __main__ - Step 8026: {'lr': 0.0004979582226212881, 'samples': 1540992, 'steps': 8025, 'loss/train': 2.1514739990234375} -08/30/2021 14:36:50 - INFO - __main__ - Step 8027: {'lr': 0.0004979575457210792, 'samples': 1541184, 'steps': 8026, 'loss/train': 1.720782995223999} -08/30/2021 14:36:50 - INFO - __main__ - Step 8028: {'lr': 0.0004979568687091446, 'samples': 1541376, 'steps': 8027, 'loss/train': 2.471392869949341} -08/30/2021 14:36:51 - INFO - __main__ - Step 8029: {'lr': 0.0004979561915854843, 'samples': 1541568, 'steps': 8028, 'loss/train': 1.839748740196228} -08/30/2021 14:36:51 - INFO - __main__ - Step 8030: {'lr': 0.0004979555143500988, 'samples': 1541760, 'steps': 8029, 'loss/train': 1.1976137161254883} -08/30/2021 14:36:51 - INFO - __main__ - Step 8031: {'lr': 0.0004979548370029884, 'samples': 1541952, 'steps': 8030, 'loss/train': 2.1068124771118164} -08/30/2021 14:36:53 - INFO - __main__ - Step 8032: {'lr': 0.0004979541595441534, 'samples': 1542144, 'steps': 8031, 'loss/train': 1.758437156677246} -08/30/2021 14:36:53 - INFO - __main__ - Step 8033: {'lr': 0.000497953481973594, 'samples': 1542336, 'steps': 8032, 'loss/train': 1.7716573476791382} -08/30/2021 14:36:54 - INFO - __main__ - Step 8034: {'lr': 0.0004979528042913106, 'samples': 1542528, 'steps': 8033, 'loss/train': 2.0524511337280273} -08/30/2021 14:36:54 - INFO - __main__ - Step 8035: {'lr': 0.0004979521264973036, 'samples': 1542720, 'steps': 8034, 'loss/train': 1.1920688152313232} -08/30/2021 14:36:54 - INFO - __main__ - Step 8036: {'lr': 0.0004979514485915731, 'samples': 1542912, 'steps': 8035, 'loss/train': 2.018043041229248} -08/30/2021 14:36:55 - INFO - __main__ - Step 8037: {'lr': 0.0004979507705741195, 'samples': 1543104, 'steps': 8036, 'loss/train': 2.270192861557007} -08/30/2021 14:36:56 - INFO - __main__ - Step 8038: {'lr': 0.0004979500924449431, 'samples': 1543296, 'steps': 8037, 'loss/train': 1.5486962795257568} -08/30/2021 14:36:57 - INFO - __main__ - Step 8039: {'lr': 0.0004979494142040444, 'samples': 1543488, 'steps': 8038, 'loss/train': 1.6932404041290283} -08/30/2021 14:36:57 - INFO - __main__ - Step 8040: {'lr': 0.0004979487358514233, 'samples': 1543680, 'steps': 8039, 'loss/train': 1.8105981349945068} -08/30/2021 14:36:57 - INFO - __main__ - Step 8041: {'lr': 0.0004979480573870803, 'samples': 1543872, 'steps': 8040, 'loss/train': 2.0685484409332275} -08/30/2021 14:36:58 - INFO - __main__ - Step 8042: {'lr': 0.000497947378811016, 'samples': 1544064, 'steps': 8041, 'loss/train': 1.8281188011169434} -08/30/2021 14:36:59 - INFO - __main__ - Step 8043: {'lr': 0.0004979467001232302, 'samples': 1544256, 'steps': 8042, 'loss/train': 1.946904182434082} -08/30/2021 14:37:00 - INFO - __main__ - Step 8044: {'lr': 0.0004979460213237235, 'samples': 1544448, 'steps': 8043, 'loss/train': 2.2791924476623535} -08/30/2021 14:37:00 - INFO - __main__ - Step 8045: {'lr': 0.0004979453424124961, 'samples': 1544640, 'steps': 8044, 'loss/train': 2.8117494583129883} -08/30/2021 14:37:00 - INFO - __main__ - Step 8046: {'lr': 0.0004979446633895484, 'samples': 1544832, 'steps': 8045, 'loss/train': 1.5231140851974487} -08/30/2021 14:37:01 - INFO - __main__ - Step 8047: {'lr': 0.0004979439842548808, 'samples': 1545024, 'steps': 8046, 'loss/train': 2.0871026515960693} -08/30/2021 14:37:03 - INFO - __main__ - Step 8048: {'lr': 0.0004979433050084933, 'samples': 1545216, 'steps': 8047, 'loss/train': 1.9119102954864502} -08/30/2021 14:37:03 - INFO - __main__ - Step 8049: {'lr': 0.0004979426256503863, 'samples': 1545408, 'steps': 8048, 'loss/train': 2.0319998264312744} -08/30/2021 14:37:03 - INFO - __main__ - Step 8050: {'lr': 0.0004979419461805603, 'samples': 1545600, 'steps': 8049, 'loss/train': 2.023425817489624} -08/30/2021 14:37:04 - INFO - __main__ - Step 8051: {'lr': 0.0004979412665990156, 'samples': 1545792, 'steps': 8050, 'loss/train': 0.29502061009407043} -08/30/2021 14:37:04 - INFO - __main__ - Step 8052: {'lr': 0.0004979405869057522, 'samples': 1545984, 'steps': 8051, 'loss/train': 1.7866392135620117} -08/30/2021 14:37:06 - INFO - __main__ - Step 8053: {'lr': 0.0004979399071007707, 'samples': 1546176, 'steps': 8052, 'loss/train': 2.1674277782440186} -08/30/2021 14:37:06 - INFO - __main__ - Step 8054: {'lr': 0.0004979392271840712, 'samples': 1546368, 'steps': 8053, 'loss/train': 2.000279664993286} -08/30/2021 14:37:06 - INFO - __main__ - Step 8055: {'lr': 0.0004979385471556542, 'samples': 1546560, 'steps': 8054, 'loss/train': 1.5608389377593994} -08/30/2021 14:37:07 - INFO - __main__ - Step 8056: {'lr': 0.00049793786701552, 'samples': 1546752, 'steps': 8055, 'loss/train': 1.789946436882019} -08/30/2021 14:37:07 - INFO - __main__ - Step 8057: {'lr': 0.0004979371867636687, 'samples': 1546944, 'steps': 8056, 'loss/train': 1.7204139232635498} -08/30/2021 14:37:07 - INFO - __main__ - Step 8058: {'lr': 0.0004979365064001007, 'samples': 1547136, 'steps': 8057, 'loss/train': 1.940467357635498} -08/30/2021 14:37:09 - INFO - __main__ - Step 8059: {'lr': 0.0004979358259248164, 'samples': 1547328, 'steps': 8058, 'loss/train': 1.6927646398544312} -08/30/2021 14:37:09 - INFO - __main__ - Step 8060: {'lr': 0.000497935145337816, 'samples': 1547520, 'steps': 8059, 'loss/train': 2.008763313293457} -08/30/2021 14:37:10 - INFO - __main__ - Step 8061: {'lr': 0.0004979344646390999, 'samples': 1547712, 'steps': 8060, 'loss/train': 1.753297209739685} -08/30/2021 14:37:10 - INFO - __main__ - Step 8062: {'lr': 0.0004979337838286684, 'samples': 1547904, 'steps': 8061, 'loss/train': 2.1832754611968994} -08/30/2021 14:37:10 - INFO - __main__ - Step 8063: {'lr': 0.0004979331029065216, 'samples': 1548096, 'steps': 8062, 'loss/train': 1.679816484451294} -08/30/2021 14:37:12 - INFO - __main__ - Step 8064: {'lr': 0.00049793242187266, 'samples': 1548288, 'steps': 8063, 'loss/train': 2.2498199939727783} -08/30/2021 14:37:12 - INFO - __main__ - Step 8065: {'lr': 0.000497931740727084, 'samples': 1548480, 'steps': 8064, 'loss/train': 1.5963996648788452} -08/30/2021 14:37:13 - INFO - __main__ - Step 8066: {'lr': 0.0004979310594697937, 'samples': 1548672, 'steps': 8065, 'loss/train': 1.532086730003357} -08/30/2021 14:37:13 - INFO - __main__ - Step 8067: {'lr': 0.0004979303781007896, 'samples': 1548864, 'steps': 8066, 'loss/train': 1.1951234340667725} -08/30/2021 14:37:13 - INFO - __main__ - Step 8068: {'lr': 0.0004979296966200718, 'samples': 1549056, 'steps': 8067, 'loss/train': 1.3954778909683228} -08/30/2021 14:37:15 - INFO - __main__ - Step 8069: {'lr': 0.0004979290150276407, 'samples': 1549248, 'steps': 8068, 'loss/train': 2.2659614086151123} -08/30/2021 14:37:15 - INFO - __main__ - Step 8070: {'lr': 0.0004979283333234966, 'samples': 1549440, 'steps': 8069, 'loss/train': 1.849366307258606} -08/30/2021 14:37:16 - INFO - __main__ - Step 8071: {'lr': 0.0004979276515076399, 'samples': 1549632, 'steps': 8070, 'loss/train': 2.1270198822021484} -08/30/2021 14:37:16 - INFO - __main__ - Step 8072: {'lr': 0.0004979269695800707, 'samples': 1549824, 'steps': 8071, 'loss/train': 0.9996500611305237} -08/30/2021 14:37:16 - INFO - __main__ - Step 8073: {'lr': 0.0004979262875407896, 'samples': 1550016, 'steps': 8072, 'loss/train': 1.990217685699463} -08/30/2021 14:37:18 - INFO - __main__ - Step 8074: {'lr': 0.0004979256053897966, 'samples': 1550208, 'steps': 8073, 'loss/train': 2.1046195030212402} -08/30/2021 14:37:19 - INFO - __main__ - Step 8075: {'lr': 0.0004979249231270923, 'samples': 1550400, 'steps': 8074, 'loss/train': 2.477461338043213} -08/30/2021 14:37:19 - INFO - __main__ - Step 8076: {'lr': 0.0004979242407526766, 'samples': 1550592, 'steps': 8075, 'loss/train': 1.9458473920822144} -08/30/2021 14:37:19 - INFO - __main__ - Step 8077: {'lr': 0.0004979235582665503, 'samples': 1550784, 'steps': 8076, 'loss/train': 0.31497299671173096} -08/30/2021 14:37:20 - INFO - __main__ - Step 8078: {'lr': 0.0004979228756687135, 'samples': 1550976, 'steps': 8077, 'loss/train': 1.9776636362075806} -08/30/2021 14:37:20 - INFO - __main__ - Step 8079: {'lr': 0.0004979221929591663, 'samples': 1551168, 'steps': 8078, 'loss/train': 1.7904404401779175} -08/30/2021 14:37:22 - INFO - __main__ - Step 8080: {'lr': 0.0004979215101379093, 'samples': 1551360, 'steps': 8079, 'loss/train': 1.9985524415969849} -08/30/2021 14:37:23 - INFO - __main__ - Step 8081: {'lr': 0.0004979208272049426, 'samples': 1551552, 'steps': 8080, 'loss/train': 1.1416809558868408} -08/30/2021 14:37:23 - INFO - __main__ - Step 8082: {'lr': 0.0004979201441602665, 'samples': 1551744, 'steps': 8081, 'loss/train': 1.9365806579589844} -08/30/2021 14:37:23 - INFO - __main__ - Step 8083: {'lr': 0.0004979194610038816, 'samples': 1551936, 'steps': 8082, 'loss/train': 2.0888302326202393} -08/30/2021 14:37:24 - INFO - __main__ - Step 8084: {'lr': 0.000497918777735788, 'samples': 1552128, 'steps': 8083, 'loss/train': 1.875905156135559} -08/30/2021 14:37:25 - INFO - __main__ - Step 8085: {'lr': 0.000497918094355986, 'samples': 1552320, 'steps': 8084, 'loss/train': 1.9774138927459717} -08/30/2021 14:37:26 - INFO - __main__ - Step 8086: {'lr': 0.000497917410864476, 'samples': 1552512, 'steps': 8085, 'loss/train': 1.722417950630188} -08/30/2021 14:37:26 - INFO - __main__ - Step 8087: {'lr': 0.0004979167272612581, 'samples': 1552704, 'steps': 8086, 'loss/train': 1.8413053750991821} -08/30/2021 14:37:26 - INFO - __main__ - Step 8088: {'lr': 0.0004979160435463328, 'samples': 1552896, 'steps': 8087, 'loss/train': 1.4524587392807007} -08/30/2021 14:37:27 - INFO - __main__ - Step 8089: {'lr': 0.0004979153597197003, 'samples': 1553088, 'steps': 8088, 'loss/train': 2.0809855461120605} -08/30/2021 14:37:28 - INFO - __main__ - Step 8090: {'lr': 0.0004979146757813611, 'samples': 1553280, 'steps': 8089, 'loss/train': 1.5562987327575684} -08/30/2021 14:37:29 - INFO - __main__ - Step 8091: {'lr': 0.0004979139917313153, 'samples': 1553472, 'steps': 8090, 'loss/train': 2.171715497970581} -08/30/2021 14:37:29 - INFO - __main__ - Step 8092: {'lr': 0.0004979133075695634, 'samples': 1553664, 'steps': 8091, 'loss/train': 1.915298342704773} -08/30/2021 14:37:29 - INFO - __main__ - Step 8093: {'lr': 0.0004979126232961054, 'samples': 1553856, 'steps': 8092, 'loss/train': 1.7592092752456665} -08/30/2021 14:37:30 - INFO - __main__ - Step 8094: {'lr': 0.0004979119389109419, 'samples': 1554048, 'steps': 8093, 'loss/train': 1.0209548473358154} -08/30/2021 14:37:32 - INFO - __main__ - Step 8095: {'lr': 0.000497911254414073, 'samples': 1554240, 'steps': 8094, 'loss/train': 1.552551031112671} -08/30/2021 14:37:32 - INFO - __main__ - Step 8096: {'lr': 0.0004979105698054992, 'samples': 1554432, 'steps': 8095, 'loss/train': 2.2468039989471436} -08/30/2021 14:37:32 - INFO - __main__ - Step 8097: {'lr': 0.0004979098850852208, 'samples': 1554624, 'steps': 8096, 'loss/train': 1.9784367084503174} -08/30/2021 14:37:33 - INFO - __main__ - Step 8098: {'lr': 0.0004979092002532379, 'samples': 1554816, 'steps': 8097, 'loss/train': 2.148533821105957} -08/30/2021 14:37:33 - INFO - __main__ - Step 8099: {'lr': 0.0004979085153095509, 'samples': 1555008, 'steps': 8098, 'loss/train': 1.7559521198272705} -08/30/2021 14:37:34 - INFO - __main__ - Step 8100: {'lr': 0.0004979078302541604, 'samples': 1555200, 'steps': 8099, 'loss/train': 2.5532238483428955} -08/30/2021 14:37:35 - INFO - __main__ - Step 8101: {'lr': 0.0004979071450870662, 'samples': 1555392, 'steps': 8100, 'loss/train': 1.8217830657958984} -08/30/2021 14:37:35 - INFO - __main__ - Step 8102: {'lr': 0.0004979064598082689, 'samples': 1555584, 'steps': 8101, 'loss/train': 1.4963428974151611} -08/30/2021 14:37:36 - INFO - __main__ - Step 8103: {'lr': 0.0004979057744177689, 'samples': 1555776, 'steps': 8102, 'loss/train': 1.7607156038284302} -08/30/2021 14:37:36 - INFO - __main__ - Step 8104: {'lr': 0.0004979050889155663, 'samples': 1555968, 'steps': 8103, 'loss/train': 2.1021783351898193} -08/30/2021 14:37:37 - INFO - __main__ - Step 8105: {'lr': 0.0004979044033016616, 'samples': 1556160, 'steps': 8104, 'loss/train': 2.1359758377075195} -08/30/2021 14:37:38 - INFO - __main__ - Step 8106: {'lr': 0.0004979037175760548, 'samples': 1556352, 'steps': 8105, 'loss/train': 1.453436017036438} -08/30/2021 14:37:38 - INFO - __main__ - Step 8107: {'lr': 0.0004979030317387466, 'samples': 1556544, 'steps': 8106, 'loss/train': 2.0098989009857178} -08/30/2021 14:37:39 - INFO - __main__ - Step 8108: {'lr': 0.0004979023457897371, 'samples': 1556736, 'steps': 8107, 'loss/train': 2.1559696197509766} -08/30/2021 14:37:39 - INFO - __main__ - Step 8109: {'lr': 0.0004979016597290264, 'samples': 1556928, 'steps': 8108, 'loss/train': 6.67866849899292} -08/30/2021 14:37:40 - INFO - __main__ - Step 8110: {'lr': 0.0004979009735566152, 'samples': 1557120, 'steps': 8109, 'loss/train': 1.5541415214538574} -08/30/2021 14:37:40 - INFO - __main__ - Step 8111: {'lr': 0.0004979002872725037, 'samples': 1557312, 'steps': 8110, 'loss/train': 1.5444889068603516} -08/30/2021 14:37:41 - INFO - __main__ - Step 8112: {'lr': 0.0004978996008766922, 'samples': 1557504, 'steps': 8111, 'loss/train': 1.3902102708816528} -08/30/2021 14:37:42 - INFO - __main__ - Step 8113: {'lr': 0.0004978989143691808, 'samples': 1557696, 'steps': 8112, 'loss/train': 1.7067283391952515} -08/30/2021 14:37:42 - INFO - __main__ - Step 8114: {'lr': 0.00049789822774997, 'samples': 1557888, 'steps': 8113, 'loss/train': 2.329395055770874} -08/30/2021 14:37:43 - INFO - __main__ - Step 8115: {'lr': 0.0004978975410190601, 'samples': 1558080, 'steps': 8114, 'loss/train': 1.9429705142974854} -08/30/2021 14:37:43 - INFO - __main__ - Step 8116: {'lr': 0.0004978968541764515, 'samples': 1558272, 'steps': 8115, 'loss/train': 2.8889026641845703} -08/30/2021 14:37:44 - INFO - __main__ - Step 8117: {'lr': 0.0004978961672221444, 'samples': 1558464, 'steps': 8116, 'loss/train': 2.5362284183502197} -08/30/2021 14:37:45 - INFO - __main__ - Step 8118: {'lr': 0.000497895480156139, 'samples': 1558656, 'steps': 8117, 'loss/train': 2.1038477420806885} -08/30/2021 14:37:45 - INFO - __main__ - Step 8119: {'lr': 0.0004978947929784358, 'samples': 1558848, 'steps': 8118, 'loss/train': 2.1302146911621094} -08/30/2021 14:37:46 - INFO - __main__ - Step 8120: {'lr': 0.0004978941056890349, 'samples': 1559040, 'steps': 8119, 'loss/train': 1.6071606874465942} -08/30/2021 14:37:46 - INFO - __main__ - Step 8121: {'lr': 0.0004978934182879369, 'samples': 1559232, 'steps': 8120, 'loss/train': 1.5273759365081787} -08/30/2021 14:37:48 - INFO - __main__ - Step 8122: {'lr': 0.0004978927307751419, 'samples': 1559424, 'steps': 8121, 'loss/train': 2.2686712741851807} -08/30/2021 14:37:48 - INFO - __main__ - Step 8123: {'lr': 0.0004978920431506501, 'samples': 1559616, 'steps': 8122, 'loss/train': 2.2746353149414062} -08/30/2021 14:37:48 - INFO - __main__ - Step 8124: {'lr': 0.0004978913554144623, 'samples': 1559808, 'steps': 8123, 'loss/train': 1.6839054822921753} -08/30/2021 14:37:49 - INFO - __main__ - Step 8125: {'lr': 0.0004978906675665782, 'samples': 1560000, 'steps': 8124, 'loss/train': 2.4230728149414062} -08/30/2021 14:37:49 - INFO - __main__ - Step 8126: {'lr': 0.0004978899796069985, 'samples': 1560192, 'steps': 8125, 'loss/train': 0.9257344007492065} -08/30/2021 14:37:51 - INFO - __main__ - Step 8127: {'lr': 0.0004978892915357234, 'samples': 1560384, 'steps': 8126, 'loss/train': 1.9891599416732788} -08/30/2021 14:37:51 - INFO - __main__ - Step 8128: {'lr': 0.0004978886033527532, 'samples': 1560576, 'steps': 8127, 'loss/train': 1.9861290454864502} -08/30/2021 14:37:51 - INFO - __main__ - Step 8129: {'lr': 0.0004978879150580882, 'samples': 1560768, 'steps': 8128, 'loss/train': 1.973615288734436} -08/30/2021 14:37:52 - INFO - __main__ - Step 8130: {'lr': 0.0004978872266517288, 'samples': 1560960, 'steps': 8129, 'loss/train': 1.6166166067123413} -08/30/2021 14:37:52 - INFO - __main__ - Step 8131: {'lr': 0.0004978865381336752, 'samples': 1561152, 'steps': 8130, 'loss/train': 2.2141826152801514} -08/30/2021 14:37:54 - INFO - __main__ - Step 8132: {'lr': 0.0004978858495039277, 'samples': 1561344, 'steps': 8131, 'loss/train': 1.6094841957092285} -08/30/2021 14:37:55 - INFO - __main__ - Step 8133: {'lr': 0.0004978851607624867, 'samples': 1561536, 'steps': 8132, 'loss/train': 1.0781852006912231} -08/30/2021 14:37:55 - INFO - __main__ - Step 8134: {'lr': 0.0004978844719093525, 'samples': 1561728, 'steps': 8133, 'loss/train': 2.2774407863616943} -08/30/2021 14:37:55 - INFO - __main__ - Step 8135: {'lr': 0.0004978837829445254, 'samples': 1561920, 'steps': 8134, 'loss/train': 1.151728630065918} -08/30/2021 14:37:56 - INFO - __main__ - Step 8136: {'lr': 0.0004978830938680056, 'samples': 1562112, 'steps': 8135, 'loss/train': 1.9238930940628052} -08/30/2021 14:37:56 - INFO - __main__ - Step 8137: {'lr': 0.0004978824046797935, 'samples': 1562304, 'steps': 8136, 'loss/train': 1.9096646308898926} -08/30/2021 14:37:57 - INFO - __main__ - Step 8138: {'lr': 0.0004978817153798895, 'samples': 1562496, 'steps': 8137, 'loss/train': 1.603022575378418} -08/30/2021 14:37:58 - INFO - __main__ - Step 8139: {'lr': 0.0004978810259682939, 'samples': 1562688, 'steps': 8138, 'loss/train': 2.0701990127563477} -08/30/2021 14:37:58 - INFO - __main__ - Step 8140: {'lr': 0.0004978803364450068, 'samples': 1562880, 'steps': 8139, 'loss/train': 2.0248944759368896} -08/30/2021 14:37:59 - INFO - __main__ - Step 8141: {'lr': 0.0004978796468100286, 'samples': 1563072, 'steps': 8140, 'loss/train': 1.6021981239318848} -08/30/2021 14:37:59 - INFO - __main__ - Step 8142: {'lr': 0.0004978789570633598, 'samples': 1563264, 'steps': 8141, 'loss/train': 2.0543816089630127} -08/30/2021 14:38:00 - INFO - __main__ - Step 8143: {'lr': 0.0004978782672050004, 'samples': 1563456, 'steps': 8142, 'loss/train': 1.8658058643341064} -08/30/2021 14:38:01 - INFO - __main__ - Step 8144: {'lr': 0.000497877577234951, 'samples': 1563648, 'steps': 8143, 'loss/train': 1.800978660583496} -08/30/2021 14:38:01 - INFO - __main__ - Step 8145: {'lr': 0.0004978768871532117, 'samples': 1563840, 'steps': 8144, 'loss/train': 3.682251214981079} -08/30/2021 14:38:02 - INFO - __main__ - Step 8146: {'lr': 0.0004978761969597831, 'samples': 1564032, 'steps': 8145, 'loss/train': 1.07888925075531} -08/30/2021 14:38:02 - INFO - __main__ - Step 8147: {'lr': 0.0004978755066546651, 'samples': 1564224, 'steps': 8146, 'loss/train': 2.555426597595215} -08/30/2021 14:38:04 - INFO - __main__ - Step 8148: {'lr': 0.0004978748162378583, 'samples': 1564416, 'steps': 8147, 'loss/train': 1.6210819482803345} -08/30/2021 14:38:04 - INFO - __main__ - Step 8149: {'lr': 0.0004978741257093629, 'samples': 1564608, 'steps': 8148, 'loss/train': 2.622602701187134} -08/30/2021 14:38:04 - INFO - __main__ - Step 8150: {'lr': 0.0004978734350691793, 'samples': 1564800, 'steps': 8149, 'loss/train': 1.7691289186477661} -08/30/2021 14:38:05 - INFO - __main__ - Step 8151: {'lr': 0.0004978727443173077, 'samples': 1564992, 'steps': 8150, 'loss/train': 1.8896803855895996} -08/30/2021 14:38:05 - INFO - __main__ - Step 8152: {'lr': 0.0004978720534537485, 'samples': 1565184, 'steps': 8151, 'loss/train': 2.401085376739502} -08/30/2021 14:38:06 - INFO - __main__ - Step 8153: {'lr': 0.000497871362478502, 'samples': 1565376, 'steps': 8152, 'loss/train': 2.000427484512329} -08/30/2021 14:38:07 - INFO - __main__ - Step 8154: {'lr': 0.0004978706713915684, 'samples': 1565568, 'steps': 8153, 'loss/train': 1.5050705671310425} -08/30/2021 14:38:07 - INFO - __main__ - Step 8155: {'lr': 0.0004978699801929481, 'samples': 1565760, 'steps': 8154, 'loss/train': 1.8289058208465576} -08/30/2021 14:38:08 - INFO - __main__ - Step 8156: {'lr': 0.0004978692888826415, 'samples': 1565952, 'steps': 8155, 'loss/train': 1.6264549493789673} -08/30/2021 14:38:08 - INFO - __main__ - Step 8157: {'lr': 0.0004978685974606488, 'samples': 1566144, 'steps': 8156, 'loss/train': 1.897903561592102} -08/30/2021 14:38:10 - INFO - __main__ - Step 8158: {'lr': 0.0004978679059269704, 'samples': 1566336, 'steps': 8157, 'loss/train': 1.8008724451065063} -08/30/2021 14:38:10 - INFO - __main__ - Step 8159: {'lr': 0.0004978672142816064, 'samples': 1566528, 'steps': 8158, 'loss/train': 1.5293163061141968} -08/30/2021 14:38:10 - INFO - __main__ - Step 8160: {'lr': 0.0004978665225245573, 'samples': 1566720, 'steps': 8159, 'loss/train': 0.18761011958122253} -08/30/2021 14:38:11 - INFO - __main__ - Step 8161: {'lr': 0.0004978658306558234, 'samples': 1566912, 'steps': 8160, 'loss/train': 2.037343978881836} -08/30/2021 14:38:11 - INFO - __main__ - Step 8162: {'lr': 0.000497865138675405, 'samples': 1567104, 'steps': 8161, 'loss/train': 1.8936717510223389} -08/30/2021 14:38:14 - INFO - __main__ - Step 8163: {'lr': 0.0004978644465833024, 'samples': 1567296, 'steps': 8162, 'loss/train': 0.6448262929916382} -08/30/2021 14:38:14 - INFO - __main__ - Step 8164: {'lr': 0.000497863754379516, 'samples': 1567488, 'steps': 8163, 'loss/train': 2.2714755535125732} -08/30/2021 14:38:14 - INFO - __main__ - Step 8165: {'lr': 0.0004978630620640458, 'samples': 1567680, 'steps': 8164, 'loss/train': 2.571237087249756} -08/30/2021 14:38:15 - INFO - __main__ - Step 8166: {'lr': 0.0004978623696368924, 'samples': 1567872, 'steps': 8165, 'loss/train': 3.3331093788146973} -08/30/2021 14:38:15 - INFO - __main__ - Step 8167: {'lr': 0.0004978616770980561, 'samples': 1568064, 'steps': 8166, 'loss/train': 1.8288649320602417} -08/30/2021 14:38:16 - INFO - __main__ - Step 8168: {'lr': 0.0004978609844475371, 'samples': 1568256, 'steps': 8167, 'loss/train': 0.547390341758728} -08/30/2021 14:38:16 - INFO - __main__ - Step 8169: {'lr': 0.0004978602916853359, 'samples': 1568448, 'steps': 8168, 'loss/train': 0.4615233540534973} -08/30/2021 14:38:17 - INFO - __main__ - Step 8170: {'lr': 0.0004978595988114525, 'samples': 1568640, 'steps': 8169, 'loss/train': 1.8013758659362793} -08/30/2021 14:38:18 - INFO - __main__ - Step 8171: {'lr': 0.0004978589058258874, 'samples': 1568832, 'steps': 8170, 'loss/train': 1.5720739364624023} -08/30/2021 14:38:18 - INFO - __main__ - Step 8172: {'lr': 0.0004978582127286409, 'samples': 1569024, 'steps': 8171, 'loss/train': 1.885957956314087} -08/30/2021 14:38:19 - INFO - __main__ - Step 8173: {'lr': 0.0004978575195197135, 'samples': 1569216, 'steps': 8172, 'loss/train': 2.101001024246216} -08/30/2021 14:38:19 - INFO - __main__ - Step 8174: {'lr': 0.0004978568261991051, 'samples': 1569408, 'steps': 8173, 'loss/train': 2.2357654571533203} -08/30/2021 14:38:20 - INFO - __main__ - Step 8175: {'lr': 0.0004978561327668164, 'samples': 1569600, 'steps': 8174, 'loss/train': 0.8115916848182678} -08/30/2021 14:38:21 - INFO - __main__ - Step 8176: {'lr': 0.0004978554392228475, 'samples': 1569792, 'steps': 8175, 'loss/train': 1.8347346782684326} -08/30/2021 14:38:21 - INFO - __main__ - Step 8177: {'lr': 0.0004978547455671986, 'samples': 1569984, 'steps': 8176, 'loss/train': 1.6068774461746216} -08/30/2021 14:38:22 - INFO - __main__ - Step 8178: {'lr': 0.0004978540517998704, 'samples': 1570176, 'steps': 8177, 'loss/train': 1.7253652811050415} -08/30/2021 14:38:22 - INFO - __main__ - Step 8179: {'lr': 0.0004978533579208629, 'samples': 1570368, 'steps': 8178, 'loss/train': 2.012005567550659} -08/30/2021 14:38:24 - INFO - __main__ - Step 8180: {'lr': 0.0004978526639301766, 'samples': 1570560, 'steps': 8179, 'loss/train': 1.7065232992172241} -08/30/2021 14:38:24 - INFO - __main__ - Step 8181: {'lr': 0.0004978519698278116, 'samples': 1570752, 'steps': 8180, 'loss/train': 2.276918411254883} -08/30/2021 14:38:24 - INFO - __main__ - Step 8182: {'lr': 0.0004978512756137684, 'samples': 1570944, 'steps': 8181, 'loss/train': 2.1926393508911133} -08/30/2021 14:38:25 - INFO - __main__ - Step 8183: {'lr': 0.0004978505812880472, 'samples': 1571136, 'steps': 8182, 'loss/train': 1.0561655759811401} -08/30/2021 14:38:25 - INFO - __main__ - Step 8184: {'lr': 0.0004978498868506483, 'samples': 1571328, 'steps': 8183, 'loss/train': 1.8270405530929565} -08/30/2021 14:38:27 - INFO - __main__ - Step 8185: {'lr': 0.0004978491923015721, 'samples': 1571520, 'steps': 8184, 'loss/train': 1.9421552419662476} -08/30/2021 14:38:28 - INFO - __main__ - Step 8186: {'lr': 0.0004978484976408189, 'samples': 1571712, 'steps': 8185, 'loss/train': 1.0923749208450317} -08/30/2021 14:38:28 - INFO - __main__ - Step 8187: {'lr': 0.000497847802868389, 'samples': 1571904, 'steps': 8186, 'loss/train': 1.879454493522644} -08/30/2021 14:38:28 - INFO - __main__ - Step 8188: {'lr': 0.0004978471079842827, 'samples': 1572096, 'steps': 8187, 'loss/train': 1.3024580478668213} -08/30/2021 14:38:29 - INFO - __main__ - Step 8189: {'lr': 0.0004978464129885003, 'samples': 1572288, 'steps': 8188, 'loss/train': 1.5856817960739136} -08/30/2021 14:38:29 - INFO - __main__ - Step 8190: {'lr': 0.0004978457178810422, 'samples': 1572480, 'steps': 8189, 'loss/train': 1.9360442161560059} -08/30/2021 14:38:30 - INFO - __main__ - Step 8191: {'lr': 0.0004978450226619085, 'samples': 1572672, 'steps': 8190, 'loss/train': 1.846137285232544} -08/30/2021 14:38:31 - INFO - __main__ - Step 8192: {'lr': 0.0004978443273310997, 'samples': 1572864, 'steps': 8191, 'loss/train': 1.784417986869812} -08/30/2021 14:38:31 - INFO - __main__ - Step 8193: {'lr': 0.0004978436318886162, 'samples': 1573056, 'steps': 8192, 'loss/train': 1.7672758102416992} -08/30/2021 14:38:32 - INFO - __main__ - Step 8194: {'lr': 0.0004978429363344581, 'samples': 1573248, 'steps': 8193, 'loss/train': 2.1513454914093018} -08/30/2021 14:38:32 - INFO - __main__ - Step 8195: {'lr': 0.0004978422406686257, 'samples': 1573440, 'steps': 8194, 'loss/train': 1.3442859649658203} -08/30/2021 14:38:33 - INFO - __main__ - Step 8196: {'lr': 0.0004978415448911196, 'samples': 1573632, 'steps': 8195, 'loss/train': 1.701888918876648} -08/30/2021 14:38:34 - INFO - __main__ - Step 8197: {'lr': 0.0004978408490019398, 'samples': 1573824, 'steps': 8196, 'loss/train': 1.7170556783676147} -08/30/2021 14:38:34 - INFO - __main__ - Step 8198: {'lr': 0.0004978401530010868, 'samples': 1574016, 'steps': 8197, 'loss/train': 1.5774528980255127} -08/30/2021 14:38:35 - INFO - __main__ - Step 8199: {'lr': 0.0004978394568885608, 'samples': 1574208, 'steps': 8198, 'loss/train': 1.5584241151809692} -08/30/2021 14:38:35 - INFO - __main__ - Step 8200: {'lr': 0.0004978387606643621, 'samples': 1574400, 'steps': 8199, 'loss/train': 2.1084234714508057} -08/30/2021 14:38:36 - INFO - __main__ - Step 8201: {'lr': 0.0004978380643284912, 'samples': 1574592, 'steps': 8200, 'loss/train': 1.483100175857544} -08/30/2021 14:38:37 - INFO - __main__ - Step 8202: {'lr': 0.0004978373678809482, 'samples': 1574784, 'steps': 8201, 'loss/train': 2.0869522094726562} -08/30/2021 14:38:37 - INFO - __main__ - Step 8203: {'lr': 0.0004978366713217336, 'samples': 1574976, 'steps': 8202, 'loss/train': 1.4451258182525635} -08/30/2021 14:38:38 - INFO - __main__ - Step 8204: {'lr': 0.0004978359746508476, 'samples': 1575168, 'steps': 8203, 'loss/train': 2.497816801071167} -08/30/2021 14:38:38 - INFO - __main__ - Step 8205: {'lr': 0.0004978352778682905, 'samples': 1575360, 'steps': 8204, 'loss/train': 2.0786960124969482} -08/30/2021 14:38:39 - INFO - __main__ - Step 8206: {'lr': 0.0004978345809740626, 'samples': 1575552, 'steps': 8205, 'loss/train': 2.1304829120635986} -08/30/2021 14:38:40 - INFO - __main__ - Step 8207: {'lr': 0.0004978338839681644, 'samples': 1575744, 'steps': 8206, 'loss/train': 2.44885516166687} -08/30/2021 14:38:40 - INFO - __main__ - Step 8208: {'lr': 0.000497833186850596, 'samples': 1575936, 'steps': 8207, 'loss/train': 1.7707266807556152} -08/30/2021 14:38:41 - INFO - __main__ - Step 8209: {'lr': 0.0004978324896213577, 'samples': 1576128, 'steps': 8208, 'loss/train': 1.025614857673645} -08/30/2021 14:38:41 - INFO - __main__ - Step 8210: {'lr': 0.00049783179228045, 'samples': 1576320, 'steps': 8209, 'loss/train': 2.0632054805755615} -08/30/2021 14:38:43 - INFO - __main__ - Step 8211: {'lr': 0.0004978310948278731, 'samples': 1576512, 'steps': 8210, 'loss/train': 1.8370667695999146} -08/30/2021 14:38:43 - INFO - __main__ - Step 8212: {'lr': 0.0004978303972636275, 'samples': 1576704, 'steps': 8211, 'loss/train': 1.8413089513778687} -08/30/2021 14:38:44 - INFO - __main__ - Step 8213: {'lr': 0.0004978296995877132, 'samples': 1576896, 'steps': 8212, 'loss/train': 2.230380058288574} -08/30/2021 14:38:44 - INFO - __main__ - Step 8214: {'lr': 0.0004978290018001306, 'samples': 1577088, 'steps': 8213, 'loss/train': 1.8136948347091675} -08/30/2021 14:38:44 - INFO - __main__ - Step 8215: {'lr': 0.0004978283039008801, 'samples': 1577280, 'steps': 8214, 'loss/train': 2.0986435413360596} -08/30/2021 14:38:46 - INFO - __main__ - Step 8216: {'lr': 0.000497827605889962, 'samples': 1577472, 'steps': 8215, 'loss/train': 1.3486262559890747} -08/30/2021 14:38:46 - INFO - __main__ - Step 8217: {'lr': 0.0004978269077673766, 'samples': 1577664, 'steps': 8216, 'loss/train': 1.6297059059143066} -08/30/2021 14:38:47 - INFO - __main__ - Step 8218: {'lr': 0.0004978262095331243, 'samples': 1577856, 'steps': 8217, 'loss/train': 1.6320127248764038} -08/30/2021 14:38:47 - INFO - __main__ - Step 8219: {'lr': 0.0004978255111872053, 'samples': 1578048, 'steps': 8218, 'loss/train': 2.2392680644989014} -08/30/2021 14:38:47 - INFO - __main__ - Step 8220: {'lr': 0.0004978248127296198, 'samples': 1578240, 'steps': 8219, 'loss/train': 5.774405002593994} -08/30/2021 14:38:48 - INFO - __main__ - Step 8221: {'lr': 0.0004978241141603685, 'samples': 1578432, 'steps': 8220, 'loss/train': 1.8457382917404175} -08/30/2021 14:38:49 - INFO - __main__ - Step 8222: {'lr': 0.0004978234154794514, 'samples': 1578624, 'steps': 8221, 'loss/train': 0.22618632018566132} -08/30/2021 14:38:50 - INFO - __main__ - Step 8223: {'lr': 0.0004978227166868689, 'samples': 1578816, 'steps': 8222, 'loss/train': 1.9204914569854736} -08/30/2021 14:38:50 - INFO - __main__ - Step 8224: {'lr': 0.0004978220177826212, 'samples': 1579008, 'steps': 8223, 'loss/train': 1.5733602046966553} -08/30/2021 14:38:50 - INFO - __main__ - Step 8225: {'lr': 0.0004978213187667087, 'samples': 1579200, 'steps': 8224, 'loss/train': 2.2170279026031494} -08/30/2021 14:38:51 - INFO - __main__ - Step 8226: {'lr': 0.0004978206196391319, 'samples': 1579392, 'steps': 8225, 'loss/train': 1.963765025138855} -08/30/2021 14:38:52 - INFO - __main__ - Step 8227: {'lr': 0.0004978199203998909, 'samples': 1579584, 'steps': 8226, 'loss/train': 2.0112295150756836} -08/30/2021 14:38:53 - INFO - __main__ - Step 8228: {'lr': 0.0004978192210489861, 'samples': 1579776, 'steps': 8227, 'loss/train': 2.229060649871826} -08/30/2021 14:38:53 - INFO - __main__ - Step 8229: {'lr': 0.0004978185215864177, 'samples': 1579968, 'steps': 8228, 'loss/train': 1.990768313407898} -08/30/2021 14:38:53 - INFO - __main__ - Step 8230: {'lr': 0.0004978178220121862, 'samples': 1580160, 'steps': 8229, 'loss/train': 1.9822341203689575} -08/30/2021 14:38:54 - INFO - __main__ - Step 8231: {'lr': 0.0004978171223262917, 'samples': 1580352, 'steps': 8230, 'loss/train': 2.1127185821533203} -08/30/2021 14:38:55 - INFO - __main__ - Step 8232: {'lr': 0.0004978164225287346, 'samples': 1580544, 'steps': 8231, 'loss/train': 2.167787790298462} -08/30/2021 14:38:56 - INFO - __main__ - Step 8233: {'lr': 0.0004978157226195153, 'samples': 1580736, 'steps': 8232, 'loss/train': 2.097172498703003} -08/30/2021 14:38:56 - INFO - __main__ - Step 8234: {'lr': 0.0004978150225986342, 'samples': 1580928, 'steps': 8233, 'loss/train': 2.1805906295776367} -08/30/2021 14:38:56 - INFO - __main__ - Step 8235: {'lr': 0.0004978143224660913, 'samples': 1581120, 'steps': 8234, 'loss/train': 1.5666084289550781} -08/30/2021 14:38:57 - INFO - __main__ - Step 8236: {'lr': 0.0004978136222218872, 'samples': 1581312, 'steps': 8235, 'loss/train': 2.2275607585906982} -08/30/2021 14:38:58 - INFO - __main__ - Step 8237: {'lr': 0.000497812921866022, 'samples': 1581504, 'steps': 8236, 'loss/train': 3.4134950637817383} -08/30/2021 14:38:59 - INFO - __main__ - Step 8238: {'lr': 0.0004978122213984961, 'samples': 1581696, 'steps': 8237, 'loss/train': 1.6897222995758057} -08/30/2021 14:38:59 - INFO - __main__ - Step 8239: {'lr': 0.00049781152081931, 'samples': 1581888, 'steps': 8238, 'loss/train': 1.742550253868103} -08/30/2021 14:39:00 - INFO - __main__ - Step 8240: {'lr': 0.0004978108201284638, 'samples': 1582080, 'steps': 8239, 'loss/train': 1.5577292442321777} -08/30/2021 14:39:00 - INFO - __main__ - Step 8241: {'lr': 0.0004978101193259578, 'samples': 1582272, 'steps': 8240, 'loss/train': 1.952988862991333} -08/30/2021 14:39:00 - INFO - __main__ - Step 8242: {'lr': 0.0004978094184117924, 'samples': 1582464, 'steps': 8241, 'loss/train': 2.8648812770843506} -08/30/2021 14:39:02 - INFO - __main__ - Step 8243: {'lr': 0.0004978087173859679, 'samples': 1582656, 'steps': 8242, 'loss/train': 1.7859591245651245} -08/30/2021 14:39:03 - INFO - __main__ - Step 8244: {'lr': 0.0004978080162484846, 'samples': 1582848, 'steps': 8243, 'loss/train': 1.9046686887741089} -08/30/2021 14:39:03 - INFO - __main__ - Step 8245: {'lr': 0.000497807314999343, 'samples': 1583040, 'steps': 8244, 'loss/train': 2.035637617111206} -08/30/2021 14:39:03 - INFO - __main__ - Step 8246: {'lr': 0.000497806613638543, 'samples': 1583232, 'steps': 8245, 'loss/train': 1.5470324754714966} -08/30/2021 14:39:04 - INFO - __main__ - Step 8247: {'lr': 0.0004978059121660853, 'samples': 1583424, 'steps': 8246, 'loss/train': 1.7327110767364502} -08/30/2021 14:39:05 - INFO - __main__ - Step 8248: {'lr': 0.0004978052105819701, 'samples': 1583616, 'steps': 8247, 'loss/train': 1.8364574909210205} -08/30/2021 14:39:06 - INFO - __main__ - Step 8249: {'lr': 0.0004978045088861976, 'samples': 1583808, 'steps': 8248, 'loss/train': 1.7338567972183228} -08/30/2021 14:39:06 - INFO - __main__ - Step 8250: {'lr': 0.0004978038070787683, 'samples': 1584000, 'steps': 8249, 'loss/train': 1.8751275539398193} -08/30/2021 14:39:07 - INFO - __main__ - Step 8251: {'lr': 0.0004978031051596824, 'samples': 1584192, 'steps': 8250, 'loss/train': 2.0312037467956543} -08/30/2021 14:39:07 - INFO - __main__ - Step 8252: {'lr': 0.0004978024031289402, 'samples': 1584384, 'steps': 8251, 'loss/train': 0.29449352622032166} -08/30/2021 14:39:09 - INFO - __main__ - Step 8253: {'lr': 0.0004978017009865421, 'samples': 1584576, 'steps': 8252, 'loss/train': 2.181436538696289} -08/30/2021 14:39:09 - INFO - __main__ - Step 8254: {'lr': 0.0004978009987324884, 'samples': 1584768, 'steps': 8253, 'loss/train': 1.90069580078125} -08/30/2021 14:39:09 - INFO - __main__ - Step 8255: {'lr': 0.0004978002963667794, 'samples': 1584960, 'steps': 8254, 'loss/train': 1.7839347124099731} -08/30/2021 14:39:10 - INFO - __main__ - Step 8256: {'lr': 0.0004977995938894153, 'samples': 1585152, 'steps': 8255, 'loss/train': 1.9654022455215454} -08/30/2021 14:39:10 - INFO - __main__ - Step 8257: {'lr': 0.0004977988913003966, 'samples': 1585344, 'steps': 8256, 'loss/train': 2.3844034671783447} -08/30/2021 14:39:11 - INFO - __main__ - Step 8258: {'lr': 0.0004977981885997235, 'samples': 1585536, 'steps': 8257, 'loss/train': 1.7496044635772705} -08/30/2021 14:39:12 - INFO - __main__ - Step 8259: {'lr': 0.0004977974857873964, 'samples': 1585728, 'steps': 8258, 'loss/train': 1.4685555696487427} -08/30/2021 14:39:12 - INFO - __main__ - Step 8260: {'lr': 0.0004977967828634157, 'samples': 1585920, 'steps': 8259, 'loss/train': 2.159745454788208} -08/30/2021 14:39:13 - INFO - __main__ - Step 8261: {'lr': 0.0004977960798277814, 'samples': 1586112, 'steps': 8260, 'loss/train': 1.9144850969314575} -08/30/2021 14:39:13 - INFO - __main__ - Step 8262: {'lr': 0.0004977953766804941, 'samples': 1586304, 'steps': 8261, 'loss/train': 1.647459864616394} -08/30/2021 14:39:15 - INFO - __main__ - Step 8263: {'lr': 0.0004977946734215541, 'samples': 1586496, 'steps': 8262, 'loss/train': 2.100821018218994} -08/30/2021 14:39:15 - INFO - __main__ - Step 8264: {'lr': 0.0004977939700509615, 'samples': 1586688, 'steps': 8263, 'loss/train': 2.0801079273223877} -08/30/2021 14:39:15 - INFO - __main__ - Step 8265: {'lr': 0.0004977932665687168, 'samples': 1586880, 'steps': 8264, 'loss/train': 1.5985188484191895} -08/30/2021 14:39:16 - INFO - __main__ - Step 8266: {'lr': 0.0004977925629748203, 'samples': 1587072, 'steps': 8265, 'loss/train': 1.9863077402114868} -08/30/2021 14:39:16 - INFO - __main__ - Step 8267: {'lr': 0.0004977918592692723, 'samples': 1587264, 'steps': 8266, 'loss/train': 1.772147536277771} -08/30/2021 14:39:17 - INFO - __main__ - Step 8268: {'lr': 0.0004977911554520731, 'samples': 1587456, 'steps': 8267, 'loss/train': 2.3003275394439697} -08/30/2021 14:39:18 - INFO - __main__ - Step 8269: {'lr': 0.000497790451523223, 'samples': 1587648, 'steps': 8268, 'loss/train': 0.24372439086437225} -08/30/2021 14:39:19 - INFO - __main__ - Step 8270: {'lr': 0.0004977897474827224, 'samples': 1587840, 'steps': 8269, 'loss/train': 1.8935787677764893} -08/30/2021 14:39:19 - INFO - __main__ - Step 8271: {'lr': 0.0004977890433305716, 'samples': 1588032, 'steps': 8270, 'loss/train': 2.200939655303955} -08/30/2021 14:39:19 - INFO - __main__ - Step 8272: {'lr': 0.0004977883390667707, 'samples': 1588224, 'steps': 8271, 'loss/train': 1.963395118713379} -08/30/2021 14:39:20 - INFO - __main__ - Step 8273: {'lr': 0.0004977876346913204, 'samples': 1588416, 'steps': 8272, 'loss/train': 2.0750908851623535} -08/30/2021 14:39:21 - INFO - __main__ - Step 8274: {'lr': 0.0004977869302042207, 'samples': 1588608, 'steps': 8273, 'loss/train': 1.9805692434310913} -08/30/2021 14:39:21 - INFO - __main__ - Step 8275: {'lr': 0.0004977862256054721, 'samples': 1588800, 'steps': 8274, 'loss/train': 2.431096076965332} -08/30/2021 14:39:22 - INFO - __main__ - Step 8276: {'lr': 0.0004977855208950748, 'samples': 1588992, 'steps': 8275, 'loss/train': 1.9583996534347534} -08/30/2021 14:39:22 - INFO - __main__ - Step 8277: {'lr': 0.0004977848160730292, 'samples': 1589184, 'steps': 8276, 'loss/train': 1.602217674255371} -08/30/2021 14:39:23 - INFO - __main__ - Step 8278: {'lr': 0.0004977841111393356, 'samples': 1589376, 'steps': 8277, 'loss/train': 2.1538069248199463} -08/30/2021 14:39:24 - INFO - __main__ - Step 8279: {'lr': 0.0004977834060939943, 'samples': 1589568, 'steps': 8278, 'loss/train': 2.474278688430786} -08/30/2021 14:39:24 - INFO - __main__ - Step 8280: {'lr': 0.0004977827009370056, 'samples': 1589760, 'steps': 8279, 'loss/train': 1.5699925422668457} -08/30/2021 14:39:25 - INFO - __main__ - Step 8281: {'lr': 0.0004977819956683698, 'samples': 1589952, 'steps': 8280, 'loss/train': 1.9401789903640747} -08/30/2021 14:39:25 - INFO - __main__ - Step 8282: {'lr': 0.0004977812902880873, 'samples': 1590144, 'steps': 8281, 'loss/train': 1.7837632894515991} -08/30/2021 14:39:25 - INFO - __main__ - Step 8283: {'lr': 0.0004977805847961584, 'samples': 1590336, 'steps': 8282, 'loss/train': 1.7989060878753662} -08/30/2021 14:39:27 - INFO - __main__ - Step 8284: {'lr': 0.0004977798791925834, 'samples': 1590528, 'steps': 8283, 'loss/train': 1.8197380304336548} -08/30/2021 14:39:28 - INFO - __main__ - Step 8285: {'lr': 0.0004977791734773624, 'samples': 1590720, 'steps': 8284, 'loss/train': 1.4514490365982056} -08/30/2021 14:39:28 - INFO - __main__ - Step 8286: {'lr': 0.0004977784676504962, 'samples': 1590912, 'steps': 8285, 'loss/train': 1.4975500106811523} -08/30/2021 14:39:29 - INFO - __main__ - Step 8287: {'lr': 0.0004977777617119847, 'samples': 1591104, 'steps': 8286, 'loss/train': 0.2620598077774048} -08/30/2021 14:39:29 - INFO - __main__ - Step 8288: {'lr': 0.0004977770556618284, 'samples': 1591296, 'steps': 8287, 'loss/train': 0.7323072552680969} -08/30/2021 14:39:30 - INFO - __main__ - Step 8289: {'lr': 0.0004977763495000276, 'samples': 1591488, 'steps': 8288, 'loss/train': 1.7614859342575073} -08/30/2021 14:39:31 - INFO - __main__ - Step 8290: {'lr': 0.0004977756432265827, 'samples': 1591680, 'steps': 8289, 'loss/train': 2.2198972702026367} -08/30/2021 14:39:31 - INFO - __main__ - Step 8291: {'lr': 0.0004977749368414937, 'samples': 1591872, 'steps': 8290, 'loss/train': 2.3375096321105957} -08/30/2021 14:39:32 - INFO - __main__ - Step 8292: {'lr': 0.0004977742303447613, 'samples': 1592064, 'steps': 8291, 'loss/train': 2.0485856533050537} -08/30/2021 14:39:32 - INFO - __main__ - Step 8293: {'lr': 0.0004977735237363855, 'samples': 1592256, 'steps': 8292, 'loss/train': 1.8509224653244019} -08/30/2021 14:39:32 - INFO - __main__ - Step 8294: {'lr': 0.0004977728170163669, 'samples': 1592448, 'steps': 8293, 'loss/train': 1.587689995765686} -08/30/2021 14:39:34 - INFO - __main__ - Step 8295: {'lr': 0.0004977721101847057, 'samples': 1592640, 'steps': 8294, 'loss/train': 3.0057520866394043} -08/30/2021 14:39:35 - INFO - __main__ - Step 8296: {'lr': 0.0004977714032414021, 'samples': 1592832, 'steps': 8295, 'loss/train': 2.1064672470092773} -08/30/2021 14:39:35 - INFO - __main__ - Step 8297: {'lr': 0.0004977706961864566, 'samples': 1593024, 'steps': 8296, 'loss/train': 1.5779653787612915} -08/30/2021 14:39:36 - INFO - __main__ - Step 8298: {'lr': 0.0004977699890198695, 'samples': 1593216, 'steps': 8297, 'loss/train': 2.4405040740966797} -08/30/2021 14:39:36 - INFO - __main__ - Step 8299: {'lr': 0.0004977692817416411, 'samples': 1593408, 'steps': 8298, 'loss/train': 0.7004013657569885} -08/30/2021 14:39:37 - INFO - __main__ - Step 8300: {'lr': 0.0004977685743517715, 'samples': 1593600, 'steps': 8299, 'loss/train': 2.3566508293151855} -08/30/2021 14:39:38 - INFO - __main__ - Step 8301: {'lr': 0.0004977678668502614, 'samples': 1593792, 'steps': 8300, 'loss/train': 1.4274485111236572} -08/30/2021 14:39:38 - INFO - __main__ - Step 8302: {'lr': 0.0004977671592371108, 'samples': 1593984, 'steps': 8301, 'loss/train': 1.6844537258148193} -08/30/2021 14:39:39 - INFO - __main__ - Step 8303: {'lr': 0.0004977664515123201, 'samples': 1594176, 'steps': 8302, 'loss/train': 2.629887104034424} -08/30/2021 14:39:39 - INFO - __main__ - Step 8304: {'lr': 0.0004977657436758898, 'samples': 1594368, 'steps': 8303, 'loss/train': 2.1009836196899414} -08/30/2021 14:39:40 - INFO - __main__ - Step 8305: {'lr': 0.00049776503572782, 'samples': 1594560, 'steps': 8304, 'loss/train': 2.045954942703247} -08/30/2021 14:39:41 - INFO - __main__ - Step 8306: {'lr': 0.0004977643276681111, 'samples': 1594752, 'steps': 8305, 'loss/train': 1.9974339008331299} -08/30/2021 14:39:41 - INFO - __main__ - Step 8307: {'lr': 0.0004977636194967634, 'samples': 1594944, 'steps': 8306, 'loss/train': 1.535595417022705} -08/30/2021 14:39:42 - INFO - __main__ - Step 8308: {'lr': 0.0004977629112137773, 'samples': 1595136, 'steps': 8307, 'loss/train': 2.3111045360565186} -08/30/2021 14:39:42 - INFO - __main__ - Step 8309: {'lr': 0.000497762202819153, 'samples': 1595328, 'steps': 8308, 'loss/train': 1.8173013925552368} -08/30/2021 14:39:43 - INFO - __main__ - Step 8310: {'lr': 0.0004977614943128909, 'samples': 1595520, 'steps': 8309, 'loss/train': 2.3394112586975098} -08/30/2021 14:39:44 - INFO - __main__ - Step 8311: {'lr': 0.0004977607856949913, 'samples': 1595712, 'steps': 8310, 'loss/train': 1.3983229398727417} -08/30/2021 14:39:44 - INFO - __main__ - Step 8312: {'lr': 0.0004977600769654545, 'samples': 1595904, 'steps': 8311, 'loss/train': 2.004567861557007} -08/30/2021 14:39:44 - INFO - __main__ - Step 8313: {'lr': 0.0004977593681242808, 'samples': 1596096, 'steps': 8312, 'loss/train': 2.938127279281616} -08/30/2021 14:39:45 - INFO - __main__ - Step 8314: {'lr': 0.0004977586591714706, 'samples': 1596288, 'steps': 8313, 'loss/train': 1.8273831605911255} -08/30/2021 14:39:46 - INFO - __main__ - Step 8315: {'lr': 0.0004977579501070241, 'samples': 1596480, 'steps': 8314, 'loss/train': 1.5774086713790894} -08/30/2021 14:39:47 - INFO - __main__ - Step 8316: {'lr': 0.0004977572409309418, 'samples': 1596672, 'steps': 8315, 'loss/train': 1.8776001930236816} -08/30/2021 14:39:47 - INFO - __main__ - Step 8317: {'lr': 0.0004977565316432238, 'samples': 1596864, 'steps': 8316, 'loss/train': 2.654694080352783} -08/30/2021 14:39:47 - INFO - __main__ - Step 8318: {'lr': 0.0004977558222438707, 'samples': 1597056, 'steps': 8317, 'loss/train': 2.268955707550049} -08/30/2021 14:39:48 - INFO - __main__ - Step 8319: {'lr': 0.0004977551127328824, 'samples': 1597248, 'steps': 8318, 'loss/train': 2.0821802616119385} -08/30/2021 14:39:49 - INFO - __main__ - Step 8320: {'lr': 0.0004977544031102597, 'samples': 1597440, 'steps': 8319, 'loss/train': 2.3473060131073} -08/30/2021 14:39:50 - INFO - __main__ - Step 8321: {'lr': 0.0004977536933760025, 'samples': 1597632, 'steps': 8320, 'loss/train': 0.9266359210014343} -08/30/2021 14:39:50 - INFO - __main__ - Step 8322: {'lr': 0.0004977529835301115, 'samples': 1597824, 'steps': 8321, 'loss/train': 1.9030746221542358} -08/30/2021 14:39:50 - INFO - __main__ - Step 8323: {'lr': 0.0004977522735725866, 'samples': 1598016, 'steps': 8322, 'loss/train': 2.0451583862304688} -08/30/2021 14:39:51 - INFO - __main__ - Step 8324: {'lr': 0.0004977515635034285, 'samples': 1598208, 'steps': 8323, 'loss/train': 1.973549246788025} -08/30/2021 14:39:53 - INFO - __main__ - Step 8325: {'lr': 0.0004977508533226374, 'samples': 1598400, 'steps': 8324, 'loss/train': 2.45467209815979} -08/30/2021 14:39:54 - INFO - __main__ - Step 8326: {'lr': 0.0004977501430302136, 'samples': 1598592, 'steps': 8325, 'loss/train': 1.719396710395813} -08/30/2021 14:39:54 - INFO - __main__ - Step 8327: {'lr': 0.0004977494326261573, 'samples': 1598784, 'steps': 8326, 'loss/train': 2.267773151397705} -08/30/2021 14:39:54 - INFO - __main__ - Step 8328: {'lr': 0.000497748722110469, 'samples': 1598976, 'steps': 8327, 'loss/train': 1.4115350246429443} -08/30/2021 14:39:55 - INFO - __main__ - Step 8329: {'lr': 0.0004977480114831489, 'samples': 1599168, 'steps': 8328, 'loss/train': 1.7805625200271606} -08/30/2021 14:39:55 - INFO - __main__ - Step 8330: {'lr': 0.0004977473007441973, 'samples': 1599360, 'steps': 8329, 'loss/train': 2.217846155166626} -08/30/2021 14:39:56 - INFO - __main__ - Step 8331: {'lr': 0.0004977465898936147, 'samples': 1599552, 'steps': 8330, 'loss/train': 1.5316822528839111} -08/30/2021 14:39:57 - INFO - __main__ - Step 8332: {'lr': 0.0004977458789314014, 'samples': 1599744, 'steps': 8331, 'loss/train': 2.6083035469055176} -08/30/2021 14:39:57 - INFO - __main__ - Step 8333: {'lr': 0.0004977451678575575, 'samples': 1599936, 'steps': 8332, 'loss/train': 1.696162223815918} -08/30/2021 14:39:58 - INFO - __main__ - Step 8334: {'lr': 0.0004977444566720834, 'samples': 1600128, 'steps': 8333, 'loss/train': 1.7151960134506226} -08/30/2021 14:39:58 - INFO - __main__ - Step 8335: {'lr': 0.0004977437453749795, 'samples': 1600320, 'steps': 8334, 'loss/train': 1.0623595714569092} -08/30/2021 14:39:58 - INFO - __main__ - Step 8336: {'lr': 0.0004977430339662462, 'samples': 1600512, 'steps': 8335, 'loss/train': 2.3184456825256348} -08/30/2021 14:40:00 - INFO - __main__ - Step 8337: {'lr': 0.0004977423224458837, 'samples': 1600704, 'steps': 8336, 'loss/train': 3.447991371154785} -08/30/2021 14:40:01 - INFO - __main__ - Step 8338: {'lr': 0.0004977416108138922, 'samples': 1600896, 'steps': 8337, 'loss/train': 2.3565752506256104} -08/30/2021 14:40:01 - INFO - __main__ - Step 8339: {'lr': 0.0004977408990702722, 'samples': 1601088, 'steps': 8338, 'loss/train': 1.8986552953720093} -08/30/2021 14:40:01 - INFO - __main__ - Step 8340: {'lr': 0.0004977401872150241, 'samples': 1601280, 'steps': 8339, 'loss/train': 1.8980979919433594} -08/30/2021 14:40:02 - INFO - __main__ - Step 8341: {'lr': 0.000497739475248148, 'samples': 1601472, 'steps': 8340, 'loss/train': 1.9785181283950806} -08/30/2021 14:40:03 - INFO - __main__ - Step 8342: {'lr': 0.0004977387631696443, 'samples': 1601664, 'steps': 8341, 'loss/train': 2.0182082653045654} -08/30/2021 14:40:04 - INFO - __main__ - Step 8343: {'lr': 0.0004977380509795133, 'samples': 1601856, 'steps': 8342, 'loss/train': 1.7331864833831787} -08/30/2021 14:40:04 - INFO - __main__ - Step 8344: {'lr': 0.0004977373386777554, 'samples': 1602048, 'steps': 8343, 'loss/train': 1.4820590019226074} -08/30/2021 14:40:04 - INFO - __main__ - Step 8345: {'lr': 0.0004977366262643709, 'samples': 1602240, 'steps': 8344, 'loss/train': 1.9779471158981323} -08/30/2021 14:40:05 - INFO - __main__ - Step 8346: {'lr': 0.0004977359137393601, 'samples': 1602432, 'steps': 8345, 'loss/train': 2.3275482654571533} -08/30/2021 14:40:07 - INFO - __main__ - Step 8347: {'lr': 0.0004977352011027233, 'samples': 1602624, 'steps': 8346, 'loss/train': 1.9353443384170532} -08/30/2021 14:40:07 - INFO - __main__ - Step 8348: {'lr': 0.0004977344883544608, 'samples': 1602816, 'steps': 8347, 'loss/train': 1.8399087190628052} -08/30/2021 14:40:08 - INFO - __main__ - Step 8349: {'lr': 0.0004977337754945731, 'samples': 1603008, 'steps': 8348, 'loss/train': 1.6668757200241089} -08/30/2021 14:40:08 - INFO - __main__ - Step 8350: {'lr': 0.0004977330625230603, 'samples': 1603200, 'steps': 8349, 'loss/train': 1.7841429710388184} -08/30/2021 14:40:08 - INFO - __main__ - Step 8351: {'lr': 0.0004977323494399227, 'samples': 1603392, 'steps': 8350, 'loss/train': 1.3776886463165283} -08/30/2021 14:40:10 - INFO - __main__ - Step 8352: {'lr': 0.0004977316362451608, 'samples': 1603584, 'steps': 8351, 'loss/train': 1.904458999633789} -08/30/2021 14:40:10 - INFO - __main__ - Step 8353: {'lr': 0.0004977309229387749, 'samples': 1603776, 'steps': 8352, 'loss/train': 1.7164230346679688} -08/30/2021 14:40:11 - INFO - __main__ - Step 8354: {'lr': 0.0004977302095207653, 'samples': 1603968, 'steps': 8353, 'loss/train': 2.028139352798462} -08/30/2021 14:40:11 - INFO - __main__ - Step 8355: {'lr': 0.0004977294959911322, 'samples': 1604160, 'steps': 8354, 'loss/train': 1.74051833152771} -08/30/2021 14:40:11 - INFO - __main__ - Step 8356: {'lr': 0.0004977287823498761, 'samples': 1604352, 'steps': 8355, 'loss/train': 2.0430409908294678} -08/30/2021 14:40:13 - INFO - __main__ - Step 8357: {'lr': 0.0004977280685969971, 'samples': 1604544, 'steps': 8356, 'loss/train': 4.812134265899658} -08/30/2021 14:40:13 - INFO - __main__ - Step 8358: {'lr': 0.0004977273547324958, 'samples': 1604736, 'steps': 8357, 'loss/train': 1.7824848890304565} -08/30/2021 14:40:14 - INFO - __main__ - Step 8359: {'lr': 0.0004977266407563722, 'samples': 1604928, 'steps': 8358, 'loss/train': 0.14400193095207214} -08/30/2021 14:40:14 - INFO - __main__ - Step 8360: {'lr': 0.0004977259266686269, 'samples': 1605120, 'steps': 8359, 'loss/train': 2.008903741836548} -08/30/2021 14:40:14 - INFO - __main__ - Step 8361: {'lr': 0.0004977252124692601, 'samples': 1605312, 'steps': 8360, 'loss/train': 2.2109179496765137} -08/30/2021 14:40:16 - INFO - __main__ - Step 8362: {'lr': 0.0004977244981582723, 'samples': 1605504, 'steps': 8361, 'loss/train': 1.3149958848953247} -08/30/2021 14:40:16 - INFO - __main__ - Step 8363: {'lr': 0.0004977237837356634, 'samples': 1605696, 'steps': 8362, 'loss/train': 1.4814249277114868} -08/30/2021 14:40:17 - INFO - __main__ - Step 8364: {'lr': 0.0004977230692014341, 'samples': 1605888, 'steps': 8363, 'loss/train': 1.2680524587631226} -08/30/2021 14:40:17 - INFO - __main__ - Step 8365: {'lr': 0.0004977223545555847, 'samples': 1606080, 'steps': 8364, 'loss/train': 1.889567494392395} -08/30/2021 14:40:18 - INFO - __main__ - Step 8366: {'lr': 0.0004977216397981153, 'samples': 1606272, 'steps': 8365, 'loss/train': 1.7285511493682861} -08/30/2021 14:40:20 - INFO - __main__ - Step 8367: {'lr': 0.0004977209249290264, 'samples': 1606464, 'steps': 8366, 'loss/train': 1.7076337337493896} -08/30/2021 14:40:20 - INFO - __main__ - Step 8368: {'lr': 0.0004977202099483184, 'samples': 1606656, 'steps': 8367, 'loss/train': 0.6797472238540649} -08/30/2021 14:40:20 - INFO - __main__ - Step 8369: {'lr': 0.0004977194948559913, 'samples': 1606848, 'steps': 8368, 'loss/train': 0.28144410252571106} -08/30/2021 14:40:21 - INFO - __main__ - Step 8370: {'lr': 0.0004977187796520457, 'samples': 1607040, 'steps': 8369, 'loss/train': 0.25786641240119934} -08/30/2021 14:40:21 - INFO - __main__ - Step 8371: {'lr': 0.0004977180643364819, 'samples': 1607232, 'steps': 8370, 'loss/train': 1.8771089315414429} -08/30/2021 14:40:21 - INFO - __main__ - Step 8372: {'lr': 0.0004977173489093, 'samples': 1607424, 'steps': 8371, 'loss/train': 1.7017828226089478} -08/30/2021 14:40:22 - INFO - __main__ - Step 8373: {'lr': 0.0004977166333705005, 'samples': 1607616, 'steps': 8372, 'loss/train': 1.0374953746795654} -08/30/2021 14:40:23 - INFO - __main__ - Step 8374: {'lr': 0.0004977159177200839, 'samples': 1607808, 'steps': 8373, 'loss/train': 0.9303935766220093} -08/30/2021 14:40:24 - INFO - __main__ - Step 8375: {'lr': 0.0004977152019580502, 'samples': 1608000, 'steps': 8374, 'loss/train': 2.3022544384002686} -08/30/2021 14:40:24 - INFO - __main__ - Step 8376: {'lr': 0.0004977144860843998, 'samples': 1608192, 'steps': 8375, 'loss/train': 1.7339766025543213} -08/30/2021 14:40:24 - INFO - __main__ - Step 8377: {'lr': 0.0004977137700991332, 'samples': 1608384, 'steps': 8376, 'loss/train': 1.1866298913955688} -08/30/2021 14:40:25 - INFO - __main__ - Step 8378: {'lr': 0.0004977130540022506, 'samples': 1608576, 'steps': 8377, 'loss/train': 2.2286288738250732} -08/30/2021 14:40:26 - INFO - __main__ - Step 8379: {'lr': 0.0004977123377937523, 'samples': 1608768, 'steps': 8378, 'loss/train': 1.5812745094299316} -08/30/2021 14:40:27 - INFO - __main__ - Step 8380: {'lr': 0.0004977116214736385, 'samples': 1608960, 'steps': 8379, 'loss/train': 2.0170328617095947} -08/30/2021 14:40:27 - INFO - __main__ - Step 8381: {'lr': 0.0004977109050419097, 'samples': 1609152, 'steps': 8380, 'loss/train': 1.406911015510559} -08/30/2021 14:40:28 - INFO - __main__ - Step 8382: {'lr': 0.0004977101884985663, 'samples': 1609344, 'steps': 8381, 'loss/train': 1.9083555936813354} -08/30/2021 14:40:28 - INFO - __main__ - Step 8383: {'lr': 0.0004977094718436085, 'samples': 1609536, 'steps': 8382, 'loss/train': 1.6277457475662231} -08/30/2021 14:40:29 - INFO - __main__ - Step 8384: {'lr': 0.0004977087550770366, 'samples': 1609728, 'steps': 8383, 'loss/train': 1.8766511678695679} -08/30/2021 14:40:30 - INFO - __main__ - Step 8385: {'lr': 0.000497708038198851, 'samples': 1609920, 'steps': 8384, 'loss/train': 1.82414972782135} -08/30/2021 14:40:30 - INFO - __main__ - Step 8386: {'lr': 0.0004977073212090519, 'samples': 1610112, 'steps': 8385, 'loss/train': 1.6500340700149536} -08/30/2021 14:40:31 - INFO - __main__ - Step 8387: {'lr': 0.0004977066041076398, 'samples': 1610304, 'steps': 8386, 'loss/train': 1.7735825777053833} -08/30/2021 14:40:31 - INFO - __main__ - Step 8388: {'lr': 0.0004977058868946148, 'samples': 1610496, 'steps': 8387, 'loss/train': 2.3419904708862305} -08/30/2021 14:40:31 - INFO - __main__ - Step 8389: {'lr': 0.0004977051695699775, 'samples': 1610688, 'steps': 8388, 'loss/train': 1.884500503540039} -08/30/2021 14:40:33 - INFO - __main__ - Step 8390: {'lr': 0.000497704452133728, 'samples': 1610880, 'steps': 8389, 'loss/train': 1.5366007089614868} -08/30/2021 14:40:33 - INFO - __main__ - Step 8391: {'lr': 0.0004977037345858667, 'samples': 1611072, 'steps': 8390, 'loss/train': 1.8311564922332764} -08/30/2021 14:40:34 - INFO - __main__ - Step 8392: {'lr': 0.0004977030169263938, 'samples': 1611264, 'steps': 8391, 'loss/train': 1.4765764474868774} -08/30/2021 14:40:34 - INFO - __main__ - Step 8393: {'lr': 0.0004977022991553099, 'samples': 1611456, 'steps': 8392, 'loss/train': 1.2311745882034302} -08/30/2021 14:40:34 - INFO - __main__ - Step 8394: {'lr': 0.0004977015812726151, 'samples': 1611648, 'steps': 8393, 'loss/train': 2.1788699626922607} -08/30/2021 14:40:36 - INFO - __main__ - Step 8395: {'lr': 0.0004977008632783098, 'samples': 1611840, 'steps': 8394, 'loss/train': 2.254236936569214} -08/30/2021 14:40:37 - INFO - __main__ - Step 8396: {'lr': 0.0004977001451723944, 'samples': 1612032, 'steps': 8395, 'loss/train': 1.889039397239685} -08/30/2021 14:40:37 - INFO - __main__ - Step 8397: {'lr': 0.000497699426954869, 'samples': 1612224, 'steps': 8396, 'loss/train': 0.2786397933959961} -08/30/2021 14:40:37 - INFO - __main__ - Step 8398: {'lr': 0.0004976987086257342, 'samples': 1612416, 'steps': 8397, 'loss/train': 2.030327320098877} -08/30/2021 14:40:38 - INFO - __main__ - Step 8399: {'lr': 0.0004976979901849901, 'samples': 1612608, 'steps': 8398, 'loss/train': 1.8387422561645508} -08/30/2021 14:40:39 - INFO - __main__ - Step 8400: {'lr': 0.000497697271632637, 'samples': 1612800, 'steps': 8399, 'loss/train': 0.24667046964168549} -08/30/2021 14:40:40 - INFO - __main__ - Step 8401: {'lr': 0.0004976965529686756, 'samples': 1612992, 'steps': 8400, 'loss/train': 1.3080761432647705} -08/30/2021 14:40:40 - INFO - __main__ - Step 8402: {'lr': 0.0004976958341931057, 'samples': 1613184, 'steps': 8401, 'loss/train': 2.1053905487060547} -08/30/2021 14:40:41 - INFO - __main__ - Step 8403: {'lr': 0.000497695115305928, 'samples': 1613376, 'steps': 8402, 'loss/train': 1.9701963663101196} -08/30/2021 14:40:41 - INFO - __main__ - Step 8404: {'lr': 0.0004976943963071426, 'samples': 1613568, 'steps': 8403, 'loss/train': 1.962083339691162} -08/30/2021 14:40:43 - INFO - __main__ - Step 8405: {'lr': 0.0004976936771967501, 'samples': 1613760, 'steps': 8404, 'loss/train': 1.8074135780334473} -08/30/2021 14:40:44 - INFO - __main__ - Step 8406: {'lr': 0.0004976929579747505, 'samples': 1613952, 'steps': 8405, 'loss/train': 1.9674524068832397} -08/30/2021 14:40:44 - INFO - __main__ - Step 8407: {'lr': 0.0004976922386411444, 'samples': 1614144, 'steps': 8406, 'loss/train': 2.0371336936950684} -08/30/2021 14:40:44 - INFO - __main__ - Step 8408: {'lr': 0.0004976915191959319, 'samples': 1614336, 'steps': 8407, 'loss/train': 3.048996686935425} -08/30/2021 14:40:45 - INFO - __main__ - Step 8409: {'lr': 0.0004976907996391135, 'samples': 1614528, 'steps': 8408, 'loss/train': 1.9434444904327393} -08/30/2021 14:40:46 - INFO - __main__ - Step 8410: {'lr': 0.0004976900799706894, 'samples': 1614720, 'steps': 8409, 'loss/train': 1.6855064630508423} -08/30/2021 14:40:47 - INFO - __main__ - Step 8411: {'lr': 0.00049768936019066, 'samples': 1614912, 'steps': 8410, 'loss/train': 2.3353629112243652} -08/30/2021 14:40:47 - INFO - __main__ - Step 8412: {'lr': 0.0004976886402990255, 'samples': 1615104, 'steps': 8411, 'loss/train': 2.074800968170166} -08/30/2021 14:40:47 - INFO - __main__ - Step 8413: {'lr': 0.0004976879202957864, 'samples': 1615296, 'steps': 8412, 'loss/train': 2.114934206008911} -08/30/2021 14:40:48 - INFO - __main__ - Step 8414: {'lr': 0.000497687200180943, 'samples': 1615488, 'steps': 8413, 'loss/train': 2.45617413520813} -08/30/2021 14:40:48 - INFO - __main__ - Step 8415: {'lr': 0.0004976864799544954, 'samples': 1615680, 'steps': 8414, 'loss/train': 2.501805305480957} -08/30/2021 14:40:50 - INFO - __main__ - Step 8416: {'lr': 0.0004976857596164443, 'samples': 1615872, 'steps': 8415, 'loss/train': 1.850860357284546} -08/30/2021 14:40:50 - INFO - __main__ - Step 8417: {'lr': 0.0004976850391667897, 'samples': 1616064, 'steps': 8416, 'loss/train': 1.9494117498397827} -08/30/2021 14:40:50 - INFO - __main__ - Step 8418: {'lr': 0.0004976843186055321, 'samples': 1616256, 'steps': 8417, 'loss/train': 1.4619063138961792} -08/30/2021 14:40:51 - INFO - __main__ - Step 8419: {'lr': 0.0004976835979326718, 'samples': 1616448, 'steps': 8418, 'loss/train': 2.0630555152893066} -08/30/2021 14:40:51 - INFO - __main__ - Step 8420: {'lr': 0.0004976828771482089, 'samples': 1616640, 'steps': 8419, 'loss/train': 1.6443235874176025} -08/30/2021 14:40:53 - INFO - __main__ - Step 8421: {'lr': 0.0004976821562521441, 'samples': 1616832, 'steps': 8420, 'loss/train': 1.9582713842391968} -08/30/2021 14:40:53 - INFO - __main__ - Step 8422: {'lr': 0.0004976814352444775, 'samples': 1617024, 'steps': 8421, 'loss/train': 2.0009896755218506} -08/30/2021 14:40:53 - INFO - __main__ - Step 8423: {'lr': 0.0004976807141252094, 'samples': 1617216, 'steps': 8422, 'loss/train': 2.197566032409668} -08/30/2021 14:40:54 - INFO - __main__ - Step 8424: {'lr': 0.0004976799928943403, 'samples': 1617408, 'steps': 8423, 'loss/train': 1.372810959815979} -08/30/2021 14:40:54 - INFO - __main__ - Step 8425: {'lr': 0.0004976792715518703, 'samples': 1617600, 'steps': 8424, 'loss/train': 2.1167540550231934} -08/30/2021 14:40:56 - INFO - __main__ - Step 8426: {'lr': 0.0004976785500978, 'samples': 1617792, 'steps': 8425, 'loss/train': 1.62273108959198} -08/30/2021 14:40:56 - INFO - __main__ - Step 8427: {'lr': 0.0004976778285321294, 'samples': 1617984, 'steps': 8426, 'loss/train': 1.919689416885376} -08/30/2021 14:40:57 - INFO - __main__ - Step 8428: {'lr': 0.0004976771068548591, 'samples': 1618176, 'steps': 8427, 'loss/train': 2.0481975078582764} -08/30/2021 14:40:57 - INFO - __main__ - Step 8429: {'lr': 0.0004976763850659893, 'samples': 1618368, 'steps': 8428, 'loss/train': 2.188000202178955} -08/30/2021 14:40:57 - INFO - __main__ - Step 8430: {'lr': 0.0004976756631655203, 'samples': 1618560, 'steps': 8429, 'loss/train': 1.6878498792648315} -08/30/2021 14:40:59 - INFO - __main__ - Step 8431: {'lr': 0.0004976749411534525, 'samples': 1618752, 'steps': 8430, 'loss/train': 2.0530524253845215} -08/30/2021 14:40:59 - INFO - __main__ - Step 8432: {'lr': 0.0004976742190297862, 'samples': 1618944, 'steps': 8431, 'loss/train': 1.426246166229248} -08/30/2021 14:41:00 - INFO - __main__ - Step 8433: {'lr': 0.0004976734967945217, 'samples': 1619136, 'steps': 8432, 'loss/train': 2.087311029434204} -08/30/2021 14:41:00 - INFO - __main__ - Step 8434: {'lr': 0.0004976727744476593, 'samples': 1619328, 'steps': 8433, 'loss/train': 1.9107396602630615} -08/30/2021 14:41:01 - INFO - __main__ - Step 8435: {'lr': 0.0004976720519891994, 'samples': 1619520, 'steps': 8434, 'loss/train': 2.3749823570251465} -08/30/2021 14:41:01 - INFO - __main__ - Step 8436: {'lr': 0.0004976713294191423, 'samples': 1619712, 'steps': 8435, 'loss/train': 1.8813793659210205} -08/30/2021 14:41:02 - INFO - __main__ - Step 8437: {'lr': 0.0004976706067374885, 'samples': 1619904, 'steps': 8436, 'loss/train': 1.721274971961975} -08/30/2021 14:41:03 - INFO - __main__ - Step 8438: {'lr': 0.0004976698839442379, 'samples': 1620096, 'steps': 8437, 'loss/train': 1.6744798421859741} -08/30/2021 14:41:03 - INFO - __main__ - Step 8439: {'lr': 0.0004976691610393911, 'samples': 1620288, 'steps': 8438, 'loss/train': 2.0879571437835693} -08/30/2021 14:41:04 - INFO - __main__ - Step 8440: {'lr': 0.0004976684380229485, 'samples': 1620480, 'steps': 8439, 'loss/train': 0.20244963467121124} -08/30/2021 14:41:04 - INFO - __main__ - Step 8441: {'lr': 0.0004976677148949102, 'samples': 1620672, 'steps': 8440, 'loss/train': 1.9900668859481812} -08/30/2021 14:41:06 - INFO - __main__ - Step 8442: {'lr': 0.0004976669916552768, 'samples': 1620864, 'steps': 8441, 'loss/train': 1.7141551971435547} -08/30/2021 14:41:06 - INFO - __main__ - Step 8443: {'lr': 0.0004976662683040484, 'samples': 1621056, 'steps': 8442, 'loss/train': 1.8672370910644531} -08/30/2021 14:41:06 - INFO - __main__ - Step 8444: {'lr': 0.0004976655448412254, 'samples': 1621248, 'steps': 8443, 'loss/train': 2.3276731967926025} -08/30/2021 14:41:07 - INFO - __main__ - Step 8445: {'lr': 0.0004976648212668081, 'samples': 1621440, 'steps': 8444, 'loss/train': 2.4769723415374756} -08/30/2021 14:41:07 - INFO - __main__ - Step 8446: {'lr': 0.0004976640975807969, 'samples': 1621632, 'steps': 8445, 'loss/train': 2.1962947845458984} -08/30/2021 14:41:09 - INFO - __main__ - Step 8447: {'lr': 0.0004976633737831921, 'samples': 1621824, 'steps': 8446, 'loss/train': 1.7524241209030151} -08/30/2021 14:41:09 - INFO - __main__ - Step 8448: {'lr': 0.000497662649873994, 'samples': 1622016, 'steps': 8447, 'loss/train': 1.8559969663619995} -08/30/2021 14:41:10 - INFO - __main__ - Step 8449: {'lr': 0.0004976619258532029, 'samples': 1622208, 'steps': 8448, 'loss/train': 1.780842900276184} -08/30/2021 14:41:10 - INFO - __main__ - Step 8450: {'lr': 0.0004976612017208191, 'samples': 1622400, 'steps': 8449, 'loss/train': 2.192594528198242} -08/30/2021 14:41:10 - INFO - __main__ - Step 8451: {'lr': 0.000497660477476843, 'samples': 1622592, 'steps': 8450, 'loss/train': 2.020826578140259} -08/30/2021 14:41:12 - INFO - __main__ - Step 8452: {'lr': 0.000497659753121275, 'samples': 1622784, 'steps': 8451, 'loss/train': 2.2761666774749756} -08/30/2021 14:41:12 - INFO - __main__ - Step 8453: {'lr': 0.0004976590286541152, 'samples': 1622976, 'steps': 8452, 'loss/train': 1.6590408086776733} -08/30/2021 14:41:12 - INFO - __main__ - Step 8454: {'lr': 0.0004976583040753643, 'samples': 1623168, 'steps': 8453, 'loss/train': 2.0330984592437744} -08/30/2021 14:41:13 - INFO - __main__ - Step 8455: {'lr': 0.0004976575793850223, 'samples': 1623360, 'steps': 8454, 'loss/train': 1.8798871040344238} -08/30/2021 14:41:13 - INFO - __main__ - Step 8456: {'lr': 0.0004976568545830894, 'samples': 1623552, 'steps': 8455, 'loss/train': 1.8375606536865234} -08/30/2021 14:41:15 - INFO - __main__ - Step 8457: {'lr': 0.0004976561296695663, 'samples': 1623744, 'steps': 8456, 'loss/train': 1.9186795949935913} -08/30/2021 14:41:16 - INFO - __main__ - Step 8458: {'lr': 0.0004976554046444532, 'samples': 1623936, 'steps': 8457, 'loss/train': 1.598724603652954} -08/30/2021 14:41:16 - INFO - __main__ - Step 8459: {'lr': 0.0004976546795077503, 'samples': 1624128, 'steps': 8458, 'loss/train': 2.0605580806732178} -08/30/2021 14:41:17 - INFO - __main__ - Step 8460: {'lr': 0.0004976539542594582, 'samples': 1624320, 'steps': 8459, 'loss/train': 0.7667750120162964} -08/30/2021 14:41:17 - INFO - __main__ - Step 8461: {'lr': 0.0004976532288995768, 'samples': 1624512, 'steps': 8460, 'loss/train': 1.062516689300537} -08/30/2021 14:41:17 - INFO - __main__ - Step 8462: {'lr': 0.0004976525034281069, 'samples': 1624704, 'steps': 8461, 'loss/train': 2.5350990295410156} -08/30/2021 14:41:19 - INFO - __main__ - Step 8463: {'lr': 0.0004976517778450486, 'samples': 1624896, 'steps': 8462, 'loss/train': 1.7621550559997559} -08/30/2021 14:41:20 - INFO - __main__ - Step 8464: {'lr': 0.000497651052150402, 'samples': 1625088, 'steps': 8463, 'loss/train': 1.9986919164657593} -08/30/2021 14:41:20 - INFO - __main__ - Step 8465: {'lr': 0.0004976503263441679, 'samples': 1625280, 'steps': 8464, 'loss/train': 0.3113585412502289} -08/30/2021 14:41:20 - INFO - __main__ - Step 8466: {'lr': 0.0004976496004263463, 'samples': 1625472, 'steps': 8465, 'loss/train': 1.6023749113082886} -08/30/2021 14:41:21 - INFO - __main__ - Step 8467: {'lr': 0.0004976488743969376, 'samples': 1625664, 'steps': 8466, 'loss/train': 2.0465993881225586} -08/30/2021 14:41:21 - INFO - __main__ - Step 8468: {'lr': 0.0004976481482559421, 'samples': 1625856, 'steps': 8467, 'loss/train': 3.549811601638794} -08/30/2021 14:41:23 - INFO - __main__ - Step 8469: {'lr': 0.0004976474220033602, 'samples': 1626048, 'steps': 8468, 'loss/train': 2.1560614109039307} -08/30/2021 14:41:23 - INFO - __main__ - Step 8470: {'lr': 0.0004976466956391922, 'samples': 1626240, 'steps': 8469, 'loss/train': 2.440587282180786} -08/30/2021 14:41:23 - INFO - __main__ - Step 8471: {'lr': 0.0004976459691634384, 'samples': 1626432, 'steps': 8470, 'loss/train': 1.8070740699768066} -08/30/2021 14:41:24 - INFO - __main__ - Step 8472: {'lr': 0.0004976452425760992, 'samples': 1626624, 'steps': 8471, 'loss/train': 2.6197290420532227} -08/30/2021 14:41:24 - INFO - __main__ - Step 8473: {'lr': 0.0004976445158771748, 'samples': 1626816, 'steps': 8472, 'loss/train': 2.0030508041381836} -08/30/2021 14:41:26 - INFO - __main__ - Step 8474: {'lr': 0.0004976437890666657, 'samples': 1627008, 'steps': 8473, 'loss/train': 1.2487941980361938} -08/30/2021 14:41:26 - INFO - __main__ - Step 8475: {'lr': 0.0004976430621445721, 'samples': 1627200, 'steps': 8474, 'loss/train': 1.7159271240234375} -08/30/2021 14:41:27 - INFO - __main__ - Step 8476: {'lr': 0.0004976423351108943, 'samples': 1627392, 'steps': 8475, 'loss/train': 2.32255482673645} -08/30/2021 14:41:27 - INFO - __main__ - Step 8477: {'lr': 0.0004976416079656328, 'samples': 1627584, 'steps': 8476, 'loss/train': 2.0413544178009033} -08/30/2021 14:41:28 - INFO - __main__ - Step 8478: {'lr': 0.0004976408807087876, 'samples': 1627776, 'steps': 8477, 'loss/train': 2.082794666290283} -08/30/2021 14:41:29 - INFO - __main__ - Step 8479: {'lr': 0.0004976401533403594, 'samples': 1627968, 'steps': 8478, 'loss/train': 2.3448400497436523} -08/30/2021 14:41:29 - INFO - __main__ - Step 8480: {'lr': 0.0004976394258603484, 'samples': 1628160, 'steps': 8479, 'loss/train': 1.9288054704666138} -08/30/2021 14:41:30 - INFO - __main__ - Step 8481: {'lr': 0.0004976386982687549, 'samples': 1628352, 'steps': 8480, 'loss/train': 1.887291669845581} -08/30/2021 14:41:30 - INFO - __main__ - Step 8482: {'lr': 0.0004976379705655791, 'samples': 1628544, 'steps': 8481, 'loss/train': 2.1422014236450195} -08/30/2021 14:41:31 - INFO - __main__ - Step 8483: {'lr': 0.0004976372427508215, 'samples': 1628736, 'steps': 8482, 'loss/train': 2.495030164718628} -08/30/2021 14:41:32 - INFO - __main__ - Step 8484: {'lr': 0.0004976365148244824, 'samples': 1628928, 'steps': 8483, 'loss/train': 3.080559015274048} -08/30/2021 14:41:33 - INFO - __main__ - Step 8485: {'lr': 0.0004976357867865621, 'samples': 1629120, 'steps': 8484, 'loss/train': 1.867462158203125} -08/30/2021 14:41:33 - INFO - __main__ - Step 8486: {'lr': 0.0004976350586370609, 'samples': 1629312, 'steps': 8485, 'loss/train': 2.1726021766662598} -08/30/2021 14:41:33 - INFO - __main__ - Step 8487: {'lr': 0.0004976343303759792, 'samples': 1629504, 'steps': 8486, 'loss/train': 1.6485310792922974} -08/30/2021 14:41:34 - INFO - __main__ - Step 8488: {'lr': 0.0004976336020033174, 'samples': 1629696, 'steps': 8487, 'loss/train': 2.2282848358154297} -08/30/2021 14:41:35 - INFO - __main__ - Step 8489: {'lr': 0.0004976328735190755, 'samples': 1629888, 'steps': 8488, 'loss/train': 1.8821983337402344} -08/30/2021 14:41:36 - INFO - __main__ - Step 8490: {'lr': 0.0004976321449232542, 'samples': 1630080, 'steps': 8489, 'loss/train': 0.7413626909255981} -08/30/2021 14:41:36 - INFO - __main__ - Step 8491: {'lr': 0.0004976314162158536, 'samples': 1630272, 'steps': 8490, 'loss/train': 1.9485259056091309} -08/30/2021 14:41:36 - INFO - __main__ - Step 8492: {'lr': 0.0004976306873968741, 'samples': 1630464, 'steps': 8491, 'loss/train': 0.3117968440055847} -08/30/2021 14:41:37 - INFO - __main__ - Step 8493: {'lr': 0.0004976299584663161, 'samples': 1630656, 'steps': 8492, 'loss/train': 2.099956512451172} -08/30/2021 14:41:37 - INFO - __main__ - Step 8494: {'lr': 0.0004976292294241798, 'samples': 1630848, 'steps': 8493, 'loss/train': 2.1442737579345703} -08/30/2021 14:41:39 - INFO - __main__ - Step 8495: {'lr': 0.0004976285002704656, 'samples': 1631040, 'steps': 8494, 'loss/train': 1.9286046028137207} -08/30/2021 14:41:39 - INFO - __main__ - Step 8496: {'lr': 0.0004976277710051739, 'samples': 1631232, 'steps': 8495, 'loss/train': 1.6619433164596558} -08/30/2021 14:41:39 - INFO - __main__ - Step 8497: {'lr': 0.0004976270416283049, 'samples': 1631424, 'steps': 8496, 'loss/train': 2.144641160964966} -08/30/2021 14:41:40 - INFO - __main__ - Step 8498: {'lr': 0.000497626312139859, 'samples': 1631616, 'steps': 8497, 'loss/train': 2.459773302078247} -08/30/2021 14:41:40 - INFO - __main__ - Step 8499: {'lr': 0.0004976255825398365, 'samples': 1631808, 'steps': 8498, 'loss/train': 2.3068463802337646} -08/30/2021 14:41:42 - INFO - __main__ - Step 8500: {'lr': 0.0004976248528282376, 'samples': 1632000, 'steps': 8499, 'loss/train': 2.0007362365722656} -08/30/2021 14:41:42 - INFO - __main__ - Step 8501: {'lr': 0.000497624123005063, 'samples': 1632192, 'steps': 8500, 'loss/train': 1.9711920022964478} -08/30/2021 14:41:42 - INFO - __main__ - Step 8502: {'lr': 0.0004976233930703126, 'samples': 1632384, 'steps': 8501, 'loss/train': 1.1688724756240845} -08/30/2021 14:41:43 - INFO - __main__ - Step 8503: {'lr': 0.000497622663023987, 'samples': 1632576, 'steps': 8502, 'loss/train': 2.0451629161834717} -08/30/2021 14:41:43 - INFO - __main__ - Step 8504: {'lr': 0.0004976219328660864, 'samples': 1632768, 'steps': 8503, 'loss/train': 2.319286346435547} -08/30/2021 14:41:44 - INFO - __main__ - Step 8505: {'lr': 0.0004976212025966112, 'samples': 1632960, 'steps': 8504, 'loss/train': 2.3594236373901367} -08/30/2021 14:41:45 - INFO - __main__ - Step 8506: {'lr': 0.0004976204722155617, 'samples': 1633152, 'steps': 8505, 'loss/train': 2.0503997802734375} -08/30/2021 14:41:45 - INFO - __main__ - Step 8507: {'lr': 0.0004976197417229383, 'samples': 1633344, 'steps': 8506, 'loss/train': 2.303234100341797} -08/30/2021 14:41:46 - INFO - __main__ - Step 8508: {'lr': 0.0004976190111187412, 'samples': 1633536, 'steps': 8507, 'loss/train': 1.8147375583648682} -08/30/2021 14:41:46 - INFO - __main__ - Step 8509: {'lr': 0.0004976182804029708, 'samples': 1633728, 'steps': 8508, 'loss/train': 1.4946863651275635} -08/30/2021 14:41:47 - INFO - __main__ - Step 8510: {'lr': 0.0004976175495756274, 'samples': 1633920, 'steps': 8509, 'loss/train': 2.2374181747436523} -08/30/2021 14:41:48 - INFO - __main__ - Step 8511: {'lr': 0.0004976168186367115, 'samples': 1634112, 'steps': 8510, 'loss/train': 1.914146065711975} -08/30/2021 14:41:48 - INFO - __main__ - Step 8512: {'lr': 0.0004976160875862231, 'samples': 1634304, 'steps': 8511, 'loss/train': 1.9570538997650146} -08/30/2021 14:41:49 - INFO - __main__ - Step 8513: {'lr': 0.0004976153564241628, 'samples': 1634496, 'steps': 8512, 'loss/train': 2.3283867835998535} -08/30/2021 14:41:49 - INFO - __main__ - Step 8514: {'lr': 0.0004976146251505309, 'samples': 1634688, 'steps': 8513, 'loss/train': 1.7819856405258179} -08/30/2021 14:41:49 - INFO - __main__ - Step 8515: {'lr': 0.0004976138937653275, 'samples': 1634880, 'steps': 8514, 'loss/train': 2.3694818019866943} -08/30/2021 14:41:51 - INFO - __main__ - Step 8516: {'lr': 0.0004976131622685532, 'samples': 1635072, 'steps': 8515, 'loss/train': 1.8378411531448364} -08/30/2021 14:41:52 - INFO - __main__ - Step 8517: {'lr': 0.0004976124306602083, 'samples': 1635264, 'steps': 8516, 'loss/train': 2.0556554794311523} -08/30/2021 14:41:52 - INFO - __main__ - Step 8518: {'lr': 0.0004976116989402929, 'samples': 1635456, 'steps': 8517, 'loss/train': 2.6223933696746826} -08/30/2021 14:41:53 - INFO - __main__ - Step 8519: {'lr': 0.0004976109671088076, 'samples': 1635648, 'steps': 8518, 'loss/train': 1.8509653806686401} -08/30/2021 14:41:53 - INFO - __main__ - Step 8520: {'lr': 0.0004976102351657526, 'samples': 1635840, 'steps': 8519, 'loss/train': 2.9559926986694336} -08/30/2021 14:41:53 - INFO - __main__ - Step 8521: {'lr': 0.0004976095031111283, 'samples': 1636032, 'steps': 8520, 'loss/train': 1.9471144676208496} -08/30/2021 14:41:55 - INFO - __main__ - Step 8522: {'lr': 0.0004976087709449348, 'samples': 1636224, 'steps': 8521, 'loss/train': 2.1203227043151855} -08/30/2021 14:41:56 - INFO - __main__ - Step 8523: {'lr': 0.0004976080386671728, 'samples': 1636416, 'steps': 8522, 'loss/train': 0.2881372570991516} -08/30/2021 14:41:56 - INFO - __main__ - Step 8524: {'lr': 0.0004976073062778423, 'samples': 1636608, 'steps': 8523, 'loss/train': 2.4722959995269775} -08/30/2021 14:41:56 - INFO - __main__ - Step 8525: {'lr': 0.0004976065737769439, 'samples': 1636800, 'steps': 8524, 'loss/train': 2.5211868286132812} -08/30/2021 14:41:57 - INFO - __main__ - Step 8526: {'lr': 0.0004976058411644777, 'samples': 1636992, 'steps': 8525, 'loss/train': 2.07977294921875} -08/30/2021 14:41:58 - INFO - __main__ - Step 8527: {'lr': 0.0004976051084404443, 'samples': 1637184, 'steps': 8526, 'loss/train': 1.9101005792617798} -08/30/2021 14:41:59 - INFO - __main__ - Step 8528: {'lr': 0.0004976043756048436, 'samples': 1637376, 'steps': 8527, 'loss/train': 2.264810562133789} -08/30/2021 14:41:59 - INFO - __main__ - Step 8529: {'lr': 0.0004976036426576763, 'samples': 1637568, 'steps': 8528, 'loss/train': 1.7202534675598145} -08/30/2021 14:41:59 - INFO - __main__ - Step 8530: {'lr': 0.0004976029095989427, 'samples': 1637760, 'steps': 8529, 'loss/train': 1.697363257408142} -08/30/2021 14:42:00 - INFO - __main__ - Step 8531: {'lr': 0.000497602176428643, 'samples': 1637952, 'steps': 8530, 'loss/train': 1.708794355392456} -08/30/2021 14:42:01 - INFO - __main__ - Step 8532: {'lr': 0.0004976014431467775, 'samples': 1638144, 'steps': 8531, 'loss/train': 2.5881059169769287} -08/30/2021 14:42:02 - INFO - __main__ - Step 8533: {'lr': 0.0004976007097533467, 'samples': 1638336, 'steps': 8532, 'loss/train': 1.8518662452697754} -08/30/2021 14:42:02 - INFO - __main__ - Step 8534: {'lr': 0.0004975999762483509, 'samples': 1638528, 'steps': 8533, 'loss/train': 0.20579160749912262} -08/30/2021 14:42:03 - INFO - __main__ - Step 8535: {'lr': 0.0004975992426317902, 'samples': 1638720, 'steps': 8534, 'loss/train': 2.5459859371185303} -08/30/2021 14:42:03 - INFO - __main__ - Step 8536: {'lr': 0.0004975985089036652, 'samples': 1638912, 'steps': 8535, 'loss/train': 1.9717767238616943} -08/30/2021 14:42:04 - INFO - __main__ - Step 8537: {'lr': 0.0004975977750639761, 'samples': 1639104, 'steps': 8536, 'loss/train': 3.9437596797943115} -08/30/2021 14:42:05 - INFO - __main__ - Step 8538: {'lr': 0.0004975970411127233, 'samples': 1639296, 'steps': 8537, 'loss/train': 2.1195478439331055} -08/30/2021 14:42:05 - INFO - __main__ - Step 8539: {'lr': 0.0004975963070499071, 'samples': 1639488, 'steps': 8538, 'loss/train': 1.6157540082931519} -08/30/2021 14:42:06 - INFO - __main__ - Step 8540: {'lr': 0.0004975955728755277, 'samples': 1639680, 'steps': 8539, 'loss/train': 2.056792974472046} -08/30/2021 14:42:06 - INFO - __main__ - Step 8541: {'lr': 0.0004975948385895858, 'samples': 1639872, 'steps': 8540, 'loss/train': 1.8156791925430298} -08/30/2021 14:42:08 - INFO - __main__ - Step 8542: {'lr': 0.0004975941041920813, 'samples': 1640064, 'steps': 8541, 'loss/train': 2.3577349185943604} -08/30/2021 14:42:08 - INFO - __main__ - Step 8543: {'lr': 0.0004975933696830147, 'samples': 1640256, 'steps': 8542, 'loss/train': 0.6268185377120972} -08/30/2021 14:42:09 - INFO - __main__ - Step 8544: {'lr': 0.0004975926350623864, 'samples': 1640448, 'steps': 8543, 'loss/train': 0.7368513941764832} -08/30/2021 14:42:09 - INFO - __main__ - Step 8545: {'lr': 0.0004975919003301967, 'samples': 1640640, 'steps': 8544, 'loss/train': 1.5377479791641235} -08/30/2021 14:42:09 - INFO - __main__ - Step 8546: {'lr': 0.0004975911654864459, 'samples': 1640832, 'steps': 8545, 'loss/train': 1.5808402299880981} -08/30/2021 14:42:10 - INFO - __main__ - Step 8547: {'lr': 0.0004975904305311344, 'samples': 1641024, 'steps': 8546, 'loss/train': 2.248965263366699} -08/30/2021 14:42:11 - INFO - __main__ - Step 8548: {'lr': 0.0004975896954642623, 'samples': 1641216, 'steps': 8547, 'loss/train': 2.206531524658203} -08/30/2021 14:42:12 - INFO - __main__ - Step 8549: {'lr': 0.0004975889602858303, 'samples': 1641408, 'steps': 8548, 'loss/train': 2.012965440750122} -08/30/2021 14:42:12 - INFO - __main__ - Step 8550: {'lr': 0.0004975882249958385, 'samples': 1641600, 'steps': 8549, 'loss/train': 1.8193858861923218} -08/30/2021 14:42:12 - INFO - __main__ - Step 8551: {'lr': 0.0004975874895942872, 'samples': 1641792, 'steps': 8550, 'loss/train': 2.252633571624756} -08/30/2021 14:42:13 - INFO - __main__ - Step 8552: {'lr': 0.0004975867540811768, 'samples': 1641984, 'steps': 8551, 'loss/train': 1.5177539587020874} -08/30/2021 14:42:14 - INFO - __main__ - Step 8553: {'lr': 0.0004975860184565076, 'samples': 1642176, 'steps': 8552, 'loss/train': 1.8967360258102417} -08/30/2021 14:42:15 - INFO - __main__ - Step 8554: {'lr': 0.0004975852827202801, 'samples': 1642368, 'steps': 8553, 'loss/train': 1.8044441938400269} -08/30/2021 14:42:15 - INFO - __main__ - Step 8555: {'lr': 0.0004975845468724944, 'samples': 1642560, 'steps': 8554, 'loss/train': 1.6104270219802856} -08/30/2021 14:42:16 - INFO - __main__ - Step 8556: {'lr': 0.0004975838109131509, 'samples': 1642752, 'steps': 8555, 'loss/train': 1.7505496740341187} -08/30/2021 14:42:16 - INFO - __main__ - Step 8557: {'lr': 0.0004975830748422499, 'samples': 1642944, 'steps': 8556, 'loss/train': 1.9093105792999268} -08/30/2021 14:42:16 - INFO - __main__ - Step 8558: {'lr': 0.0004975823386597918, 'samples': 1643136, 'steps': 8557, 'loss/train': 1.6590849161148071} -08/30/2021 14:42:18 - INFO - __main__ - Step 8559: {'lr': 0.000497581602365777, 'samples': 1643328, 'steps': 8558, 'loss/train': 2.215555191040039} -08/30/2021 14:42:18 - INFO - __main__ - Step 8560: {'lr': 0.0004975808659602058, 'samples': 1643520, 'steps': 8559, 'loss/train': 2.3118512630462646} -08/30/2021 14:42:18 - INFO - __main__ - Step 8561: {'lr': 0.0004975801294430784, 'samples': 1643712, 'steps': 8560, 'loss/train': 2.343376398086548} -08/30/2021 14:42:19 - INFO - __main__ - Step 8562: {'lr': 0.0004975793928143952, 'samples': 1643904, 'steps': 8561, 'loss/train': 2.2122883796691895} -08/30/2021 14:42:19 - INFO - __main__ - Step 8563: {'lr': 0.0004975786560741566, 'samples': 1644096, 'steps': 8562, 'loss/train': 3.140326499938965} -08/30/2021 14:42:21 - INFO - __main__ - Step 8564: {'lr': 0.0004975779192223629, 'samples': 1644288, 'steps': 8563, 'loss/train': 2.540897846221924} -08/30/2021 14:42:21 - INFO - __main__ - Step 8565: {'lr': 0.0004975771822590143, 'samples': 1644480, 'steps': 8564, 'loss/train': 1.8659827709197998} -08/30/2021 14:42:21 - INFO - __main__ - Step 8566: {'lr': 0.0004975764451841114, 'samples': 1644672, 'steps': 8565, 'loss/train': 2.5408880710601807} -08/30/2021 14:42:22 - INFO - __main__ - Step 8567: {'lr': 0.0004975757079976542, 'samples': 1644864, 'steps': 8566, 'loss/train': 2.0472939014434814} -08/30/2021 14:42:22 - INFO - __main__ - Step 8568: {'lr': 0.0004975749706996433, 'samples': 1645056, 'steps': 8567, 'loss/train': 2.1713831424713135} -08/30/2021 14:42:25 - INFO - __main__ - Step 8569: {'lr': 0.0004975742332900789, 'samples': 1645248, 'steps': 8568, 'loss/train': 2.100381374359131} -08/30/2021 14:42:25 - INFO - __main__ - Step 8570: {'lr': 0.0004975734957689614, 'samples': 1645440, 'steps': 8569, 'loss/train': 1.6959052085876465} -08/30/2021 14:42:26 - INFO - __main__ - Step 8571: {'lr': 0.0004975727581362911, 'samples': 1645632, 'steps': 8570, 'loss/train': 1.5239940881729126} -08/30/2021 14:42:26 - INFO - __main__ - Step 8572: {'lr': 0.0004975720203920683, 'samples': 1645824, 'steps': 8571, 'loss/train': 1.7015442848205566} -08/30/2021 14:42:26 - INFO - __main__ - Step 8573: {'lr': 0.0004975712825362934, 'samples': 1646016, 'steps': 8572, 'loss/train': 0.6614782214164734} -08/30/2021 14:42:27 - INFO - __main__ - Step 8574: {'lr': 0.0004975705445689668, 'samples': 1646208, 'steps': 8573, 'loss/train': 0.4116190969944} -08/30/2021 14:42:28 - INFO - __main__ - Step 8575: {'lr': 0.0004975698064900886, 'samples': 1646400, 'steps': 8574, 'loss/train': 2.1950554847717285} -08/30/2021 14:42:29 - INFO - __main__ - Step 8576: {'lr': 0.0004975690682996592, 'samples': 1646592, 'steps': 8575, 'loss/train': 2.125760316848755} -08/30/2021 14:42:29 - INFO - __main__ - Step 8577: {'lr': 0.0004975683299976791, 'samples': 1646784, 'steps': 8576, 'loss/train': 2.403451442718506} -08/30/2021 14:42:29 - INFO - __main__ - Step 8578: {'lr': 0.0004975675915841485, 'samples': 1646976, 'steps': 8577, 'loss/train': 1.502326488494873} -08/30/2021 14:42:30 - INFO - __main__ - Step 8579: {'lr': 0.0004975668530590679, 'samples': 1647168, 'steps': 8578, 'loss/train': 1.7058626413345337} -08/30/2021 14:42:31 - INFO - __main__ - Step 8580: {'lr': 0.0004975661144224374, 'samples': 1647360, 'steps': 8579, 'loss/train': 1.582490086555481} -08/30/2021 14:42:32 - INFO - __main__ - Step 8581: {'lr': 0.0004975653756742574, 'samples': 1647552, 'steps': 8580, 'loss/train': 1.988918662071228} -08/30/2021 14:42:32 - INFO - __main__ - Step 8582: {'lr': 0.0004975646368145282, 'samples': 1647744, 'steps': 8581, 'loss/train': 2.1653411388397217} -08/30/2021 14:42:32 - INFO - __main__ - Step 8583: {'lr': 0.0004975638978432503, 'samples': 1647936, 'steps': 8582, 'loss/train': 1.8184610605239868} -08/30/2021 14:42:33 - INFO - __main__ - Step 8584: {'lr': 0.0004975631587604239, 'samples': 1648128, 'steps': 8583, 'loss/train': 1.9685587882995605} -08/30/2021 14:42:34 - INFO - __main__ - Step 8585: {'lr': 0.0004975624195660494, 'samples': 1648320, 'steps': 8584, 'loss/train': 1.4592111110687256} -08/30/2021 14:42:34 - INFO - __main__ - Step 8586: {'lr': 0.0004975616802601271, 'samples': 1648512, 'steps': 8585, 'loss/train': 2.1038765907287598} -08/30/2021 14:42:35 - INFO - __main__ - Step 8587: {'lr': 0.0004975609408426572, 'samples': 1648704, 'steps': 8586, 'loss/train': 2.09875750541687} -08/30/2021 14:42:35 - INFO - __main__ - Step 8588: {'lr': 0.0004975602013136403, 'samples': 1648896, 'steps': 8587, 'loss/train': 2.227600574493408} -08/30/2021 14:42:36 - INFO - __main__ - Step 8589: {'lr': 0.0004975594616730766, 'samples': 1649088, 'steps': 8588, 'loss/train': 2.5306458473205566} -08/30/2021 14:42:37 - INFO - __main__ - Step 8590: {'lr': 0.0004975587219209663, 'samples': 1649280, 'steps': 8589, 'loss/train': 1.9463310241699219} -08/30/2021 14:42:38 - INFO - __main__ - Step 8591: {'lr': 0.0004975579820573099, 'samples': 1649472, 'steps': 8590, 'loss/train': 2.1328811645507812} -08/30/2021 14:42:38 - INFO - __main__ - Step 8592: {'lr': 0.0004975572420821078, 'samples': 1649664, 'steps': 8591, 'loss/train': 1.6399412155151367} -08/30/2021 14:42:38 - INFO - __main__ - Step 8593: {'lr': 0.0004975565019953601, 'samples': 1649856, 'steps': 8592, 'loss/train': 2.179776668548584} -08/30/2021 14:42:39 - INFO - __main__ - Step 8594: {'lr': 0.0004975557617970673, 'samples': 1650048, 'steps': 8593, 'loss/train': 2.4166452884674072} -08/30/2021 14:42:40 - INFO - __main__ - Step 8595: {'lr': 0.0004975550214872296, 'samples': 1650240, 'steps': 8594, 'loss/train': 1.673804759979248} -08/30/2021 14:42:41 - INFO - __main__ - Step 8596: {'lr': 0.0004975542810658476, 'samples': 1650432, 'steps': 8595, 'loss/train': 2.1727705001831055} -08/30/2021 14:42:41 - INFO - __main__ - Step 8597: {'lr': 0.0004975535405329213, 'samples': 1650624, 'steps': 8596, 'loss/train': 1.2749512195587158} -08/30/2021 14:42:41 - INFO - __main__ - Step 8598: {'lr': 0.0004975527998884513, 'samples': 1650816, 'steps': 8597, 'loss/train': 1.899662733078003} -08/30/2021 14:42:42 - INFO - __main__ - Step 8599: {'lr': 0.0004975520591324378, 'samples': 1651008, 'steps': 8598, 'loss/train': 1.7861813306808472} -08/30/2021 14:42:42 - INFO - __main__ - Step 8600: {'lr': 0.0004975513182648812, 'samples': 1651200, 'steps': 8599, 'loss/train': 0.19180971384048462} -08/30/2021 14:42:43 - INFO - __main__ - Step 8601: {'lr': 0.0004975505772857818, 'samples': 1651392, 'steps': 8600, 'loss/train': 1.532994270324707} -08/30/2021 14:42:44 - INFO - __main__ - Step 8602: {'lr': 0.0004975498361951398, 'samples': 1651584, 'steps': 8601, 'loss/train': 1.1918660402297974} -08/30/2021 14:42:44 - INFO - __main__ - Step 8603: {'lr': 0.0004975490949929558, 'samples': 1651776, 'steps': 8602, 'loss/train': 2.378145933151245} -08/30/2021 14:42:45 - INFO - __main__ - Step 8604: {'lr': 0.00049754835367923, 'samples': 1651968, 'steps': 8603, 'loss/train': 2.563058853149414} -08/30/2021 14:42:45 - INFO - __main__ - Step 8605: {'lr': 0.0004975476122539627, 'samples': 1652160, 'steps': 8604, 'loss/train': 1.4181443452835083} -08/30/2021 14:42:46 - INFO - __main__ - Step 8606: {'lr': 0.0004975468707171542, 'samples': 1652352, 'steps': 8605, 'loss/train': 3.0092220306396484} -08/30/2021 14:42:47 - INFO - __main__ - Step 8607: {'lr': 0.000497546129068805, 'samples': 1652544, 'steps': 8606, 'loss/train': 2.0059804916381836} -08/30/2021 14:42:47 - INFO - __main__ - Step 8608: {'lr': 0.0004975453873089153, 'samples': 1652736, 'steps': 8607, 'loss/train': 1.853925108909607} -08/30/2021 14:42:48 - INFO - __main__ - Step 8609: {'lr': 0.0004975446454374854, 'samples': 1652928, 'steps': 8608, 'loss/train': 1.9299236536026} -08/30/2021 14:42:48 - INFO - __main__ - Step 8610: {'lr': 0.0004975439034545158, 'samples': 1653120, 'steps': 8609, 'loss/train': 1.9878500699996948} -08/30/2021 14:42:49 - INFO - __main__ - Step 8611: {'lr': 0.0004975431613600067, 'samples': 1653312, 'steps': 8610, 'loss/train': 1.9883729219436646} -08/30/2021 14:42:50 - INFO - __main__ - Step 8612: {'lr': 0.0004975424191539585, 'samples': 1653504, 'steps': 8611, 'loss/train': 1.722756266593933} -08/30/2021 14:42:50 - INFO - __main__ - Step 8613: {'lr': 0.0004975416768363715, 'samples': 1653696, 'steps': 8612, 'loss/train': 1.7571719884872437} -08/30/2021 14:42:51 - INFO - __main__ - Step 8614: {'lr': 0.0004975409344072459, 'samples': 1653888, 'steps': 8613, 'loss/train': 1.6866161823272705} -08/30/2021 14:42:51 - INFO - __main__ - Step 8615: {'lr': 0.0004975401918665823, 'samples': 1654080, 'steps': 8614, 'loss/train': 2.357454538345337} -08/30/2021 14:42:52 - INFO - __main__ - Step 8616: {'lr': 0.0004975394492143808, 'samples': 1654272, 'steps': 8615, 'loss/train': 2.7173142433166504} -08/30/2021 14:42:53 - INFO - __main__ - Step 8617: {'lr': 0.0004975387064506421, 'samples': 1654464, 'steps': 8616, 'loss/train': 1.6634690761566162} -08/30/2021 14:42:53 - INFO - __main__ - Step 8618: {'lr': 0.000497537963575366, 'samples': 1654656, 'steps': 8617, 'loss/train': 2.087928056716919} -08/30/2021 14:42:54 - INFO - __main__ - Step 8619: {'lr': 0.0004975372205885533, 'samples': 1654848, 'steps': 8618, 'loss/train': 1.3401358127593994} -08/30/2021 14:42:54 - INFO - __main__ - Step 8620: {'lr': 0.0004975364774902041, 'samples': 1655040, 'steps': 8619, 'loss/train': 1.4630038738250732} -08/30/2021 14:42:56 - INFO - __main__ - Step 8621: {'lr': 0.0004975357342803187, 'samples': 1655232, 'steps': 8620, 'loss/train': 1.9419286251068115} -08/30/2021 14:42:57 - INFO - __main__ - Step 8622: {'lr': 0.0004975349909588976, 'samples': 1655424, 'steps': 8621, 'loss/train': 2.0865018367767334} -08/30/2021 14:42:57 - INFO - __main__ - Step 8623: {'lr': 0.000497534247525941, 'samples': 1655616, 'steps': 8622, 'loss/train': 2.239246129989624} -08/30/2021 14:42:57 - INFO - __main__ - Step 8624: {'lr': 0.0004975335039814493, 'samples': 1655808, 'steps': 8623, 'loss/train': 2.177828788757324} -08/30/2021 14:42:58 - INFO - __main__ - Step 8625: {'lr': 0.0004975327603254229, 'samples': 1656000, 'steps': 8624, 'loss/train': 2.105170249938965} -08/30/2021 14:42:58 - INFO - __main__ - Step 8626: {'lr': 0.000497532016557862, 'samples': 1656192, 'steps': 8625, 'loss/train': 2.0102388858795166} -08/30/2021 14:43:00 - INFO - __main__ - Step 8627: {'lr': 0.0004975312726787671, 'samples': 1656384, 'steps': 8626, 'loss/train': 1.3716613054275513} -08/30/2021 14:43:00 - INFO - __main__ - Step 8628: {'lr': 0.0004975305286881383, 'samples': 1656576, 'steps': 8627, 'loss/train': 1.680583119392395} -08/30/2021 14:43:01 - INFO - __main__ - Step 8629: {'lr': 0.0004975297845859761, 'samples': 1656768, 'steps': 8628, 'loss/train': 1.1578835248947144} -08/30/2021 14:43:01 - INFO - __main__ - Step 8630: {'lr': 0.0004975290403722807, 'samples': 1656960, 'steps': 8629, 'loss/train': 4.564239501953125} -08/30/2021 14:43:01 - INFO - __main__ - Step 8631: {'lr': 0.0004975282960470527, 'samples': 1657152, 'steps': 8630, 'loss/train': 2.5652618408203125} -08/30/2021 14:43:03 - INFO - __main__ - Step 8632: {'lr': 0.0004975275516102922, 'samples': 1657344, 'steps': 8631, 'loss/train': 1.707463026046753} -08/30/2021 14:43:03 - INFO - __main__ - Step 8633: {'lr': 0.0004975268070619996, 'samples': 1657536, 'steps': 8632, 'loss/train': 1.591426134109497} -08/30/2021 14:43:04 - INFO - __main__ - Step 8634: {'lr': 0.0004975260624021752, 'samples': 1657728, 'steps': 8633, 'loss/train': 1.105669617652893} -08/30/2021 14:43:04 - INFO - __main__ - Step 8635: {'lr': 0.0004975253176308194, 'samples': 1657920, 'steps': 8634, 'loss/train': 2.1665873527526855} -08/30/2021 14:43:04 - INFO - __main__ - Step 8636: {'lr': 0.0004975245727479325, 'samples': 1658112, 'steps': 8635, 'loss/train': 1.5017696619033813} -08/30/2021 14:43:06 - INFO - __main__ - Step 8637: {'lr': 0.0004975238277535149, 'samples': 1658304, 'steps': 8636, 'loss/train': 2.1164751052856445} -08/30/2021 14:43:06 - INFO - __main__ - Step 8638: {'lr': 0.0004975230826475669, 'samples': 1658496, 'steps': 8637, 'loss/train': 1.8092982769012451} -08/30/2021 14:43:07 - INFO - __main__ - Step 8639: {'lr': 0.0004975223374300887, 'samples': 1658688, 'steps': 8638, 'loss/train': 1.9563103914260864} -08/30/2021 14:43:07 - INFO - __main__ - Step 8640: {'lr': 0.0004975215921010808, 'samples': 1658880, 'steps': 8639, 'loss/train': 2.1875200271606445} -08/30/2021 14:43:07 - INFO - __main__ - Step 8641: {'lr': 0.0004975208466605435, 'samples': 1659072, 'steps': 8640, 'loss/train': 2.4847347736358643} -08/30/2021 14:43:08 - INFO - __main__ - Step 8642: {'lr': 0.0004975201011084773, 'samples': 1659264, 'steps': 8641, 'loss/train': 0.8208606839179993} -08/30/2021 14:43:09 - INFO - __main__ - Step 8643: {'lr': 0.0004975193554448821, 'samples': 1659456, 'steps': 8642, 'loss/train': 2.074352741241455} -08/30/2021 14:43:10 - INFO - __main__ - Step 8644: {'lr': 0.0004975186096697585, 'samples': 1659648, 'steps': 8643, 'loss/train': 1.1441607475280762} -08/30/2021 14:43:10 - INFO - __main__ - Step 8645: {'lr': 0.000497517863783107, 'samples': 1659840, 'steps': 8644, 'loss/train': 2.4295613765716553} -08/30/2021 14:43:10 - INFO - __main__ - Step 8646: {'lr': 0.0004975171177849277, 'samples': 1660032, 'steps': 8645, 'loss/train': 1.7394776344299316} -08/30/2021 14:43:11 - INFO - __main__ - Step 8647: {'lr': 0.000497516371675221, 'samples': 1660224, 'steps': 8646, 'loss/train': 1.3165230751037598} -08/30/2021 14:43:12 - INFO - __main__ - Step 8648: {'lr': 0.0004975156254539873, 'samples': 1660416, 'steps': 8647, 'loss/train': 1.8042141199111938} -08/30/2021 14:43:13 - INFO - __main__ - Step 8649: {'lr': 0.0004975148791212269, 'samples': 1660608, 'steps': 8648, 'loss/train': 1.4219919443130493} -08/30/2021 14:43:13 - INFO - __main__ - Step 8650: {'lr': 0.00049751413267694, 'samples': 1660800, 'steps': 8649, 'loss/train': 1.4245812892913818} -08/30/2021 14:43:14 - INFO - __main__ - Step 8651: {'lr': 0.000497513386121127, 'samples': 1660992, 'steps': 8650, 'loss/train': 1.7138100862503052} -08/30/2021 14:43:14 - INFO - __main__ - Step 8652: {'lr': 0.0004975126394537884, 'samples': 1661184, 'steps': 8651, 'loss/train': 2.302199363708496} -08/30/2021 14:43:16 - INFO - __main__ - Step 8653: {'lr': 0.0004975118926749245, 'samples': 1661376, 'steps': 8652, 'loss/train': 1.9023785591125488} -08/30/2021 14:43:16 - INFO - __main__ - Step 8654: {'lr': 0.0004975111457845354, 'samples': 1661568, 'steps': 8653, 'loss/train': 2.1786036491394043} -08/30/2021 14:43:16 - INFO - __main__ - Step 8655: {'lr': 0.0004975103987826217, 'samples': 1661760, 'steps': 8654, 'loss/train': 1.6991146802902222} -08/30/2021 14:43:17 - INFO - __main__ - Step 8656: {'lr': 0.0004975096516691836, 'samples': 1661952, 'steps': 8655, 'loss/train': 1.50784432888031} -08/30/2021 14:43:17 - INFO - __main__ - Step 8657: {'lr': 0.0004975089044442215, 'samples': 1662144, 'steps': 8656, 'loss/train': 1.257446527481079} -08/30/2021 14:43:19 - INFO - __main__ - Step 8658: {'lr': 0.0004975081571077357, 'samples': 1662336, 'steps': 8657, 'loss/train': 2.638295888900757} -08/30/2021 14:43:19 - INFO - __main__ - Step 8659: {'lr': 0.0004975074096597265, 'samples': 1662528, 'steps': 8658, 'loss/train': 2.5325398445129395} -08/30/2021 14:43:19 - INFO - __main__ - Step 8660: {'lr': 0.0004975066621001943, 'samples': 1662720, 'steps': 8659, 'loss/train': 2.105074167251587} -08/30/2021 14:43:20 - INFO - __main__ - Step 8661: {'lr': 0.0004975059144291394, 'samples': 1662912, 'steps': 8660, 'loss/train': 2.0656898021698} -08/30/2021 14:43:20 - INFO - __main__ - Step 8662: {'lr': 0.0004975051666465622, 'samples': 1663104, 'steps': 8661, 'loss/train': 1.915766954421997} -08/30/2021 14:43:22 - INFO - __main__ - Step 8663: {'lr': 0.0004975044187524629, 'samples': 1663296, 'steps': 8662, 'loss/train': 1.1128897666931152} -08/30/2021 14:43:22 - INFO - __main__ - Step 8664: {'lr': 0.000497503670746842, 'samples': 1663488, 'steps': 8663, 'loss/train': 2.4669487476348877} -08/30/2021 14:43:22 - INFO - __main__ - Step 8665: {'lr': 0.0004975029226296998, 'samples': 1663680, 'steps': 8664, 'loss/train': 1.8786349296569824} -08/30/2021 14:43:23 - INFO - __main__ - Step 8666: {'lr': 0.0004975021744010365, 'samples': 1663872, 'steps': 8665, 'loss/train': 1.954643964767456} -08/30/2021 14:43:23 - INFO - __main__ - Step 8667: {'lr': 0.0004975014260608527, 'samples': 1664064, 'steps': 8666, 'loss/train': 2.062811851501465} -08/30/2021 14:43:24 - INFO - __main__ - Step 8668: {'lr': 0.0004975006776091484, 'samples': 1664256, 'steps': 8667, 'loss/train': 1.7372324466705322} -08/30/2021 14:43:25 - INFO - __main__ - Step 8669: {'lr': 0.0004974999290459243, 'samples': 1664448, 'steps': 8668, 'loss/train': 1.4187322854995728} -08/30/2021 14:43:25 - INFO - __main__ - Step 8670: {'lr': 0.0004974991803711803, 'samples': 1664640, 'steps': 8669, 'loss/train': 2.0661065578460693} -08/30/2021 14:43:26 - INFO - __main__ - Step 8671: {'lr': 0.0004974984315849172, 'samples': 1664832, 'steps': 8670, 'loss/train': 2.532565116882324} -08/30/2021 14:43:26 - INFO - __main__ - Step 8672: {'lr': 0.000497497682687135, 'samples': 1665024, 'steps': 8671, 'loss/train': 2.3772478103637695} -08/30/2021 14:43:27 - INFO - __main__ - Step 8673: {'lr': 0.0004974969336778343, 'samples': 1665216, 'steps': 8672, 'loss/train': 2.5523412227630615} -08/30/2021 14:43:28 - INFO - __main__ - Step 8674: {'lr': 0.0004974961845570152, 'samples': 1665408, 'steps': 8673, 'loss/train': 2.1624512672424316} -08/30/2021 14:43:28 - INFO - __main__ - Step 8675: {'lr': 0.0004974954353246781, 'samples': 1665600, 'steps': 8674, 'loss/train': 1.8108201026916504} -08/30/2021 14:43:29 - INFO - __main__ - Step 8676: {'lr': 0.0004974946859808235, 'samples': 1665792, 'steps': 8675, 'loss/train': 2.1599326133728027} -08/30/2021 14:43:29 - INFO - __main__ - Step 8677: {'lr': 0.0004974939365254515, 'samples': 1665984, 'steps': 8676, 'loss/train': 1.6962110996246338} -08/30/2021 14:43:31 - INFO - __main__ - Step 8678: {'lr': 0.0004974931869585626, 'samples': 1666176, 'steps': 8677, 'loss/train': 2.2996740341186523} -08/30/2021 14:43:31 - INFO - __main__ - Step 8679: {'lr': 0.0004974924372801572, 'samples': 1666368, 'steps': 8678, 'loss/train': 1.165061116218567} -08/30/2021 14:43:32 - INFO - __main__ - Step 8680: {'lr': 0.0004974916874902353, 'samples': 1666560, 'steps': 8679, 'loss/train': 1.9003016948699951} -08/30/2021 14:43:32 - INFO - __main__ - Step 8681: {'lr': 0.0004974909375887976, 'samples': 1666752, 'steps': 8680, 'loss/train': 1.6566135883331299} -08/30/2021 14:43:32 - INFO - __main__ - Step 8682: {'lr': 0.0004974901875758444, 'samples': 1666944, 'steps': 8681, 'loss/train': 1.013210654258728} -08/30/2021 14:43:33 - INFO - __main__ - Step 8683: {'lr': 0.0004974894374513757, 'samples': 1667136, 'steps': 8682, 'loss/train': 1.8741066455841064} -08/30/2021 14:43:34 - INFO - __main__ - Step 8684: {'lr': 0.0004974886872153922, 'samples': 1667328, 'steps': 8683, 'loss/train': 1.609816312789917} -08/30/2021 14:43:35 - INFO - __main__ - Step 8685: {'lr': 0.0004974879368678942, 'samples': 1667520, 'steps': 8684, 'loss/train': 1.2252821922302246} -08/30/2021 14:43:35 - INFO - __main__ - Step 8686: {'lr': 0.0004974871864088818, 'samples': 1667712, 'steps': 8685, 'loss/train': 0.8664953112602234} -08/30/2021 14:43:36 - INFO - __main__ - Step 8687: {'lr': 0.0004974864358383555, 'samples': 1667904, 'steps': 8686, 'loss/train': 1.586924433708191} -08/30/2021 14:43:36 - INFO - __main__ - Step 8688: {'lr': 0.0004974856851563158, 'samples': 1668096, 'steps': 8687, 'loss/train': 2.1468544006347656} -08/30/2021 14:43:36 - INFO - __main__ - Step 8689: {'lr': 0.0004974849343627628, 'samples': 1668288, 'steps': 8688, 'loss/train': 3.491004467010498} -08/30/2021 14:43:38 - INFO - __main__ - Step 8690: {'lr': 0.0004974841834576968, 'samples': 1668480, 'steps': 8689, 'loss/train': 2.16768217086792} -08/30/2021 14:43:38 - INFO - __main__ - Step 8691: {'lr': 0.0004974834324411183, 'samples': 1668672, 'steps': 8690, 'loss/train': 2.1313111782073975} -08/30/2021 14:43:39 - INFO - __main__ - Step 8692: {'lr': 0.0004974826813130276, 'samples': 1668864, 'steps': 8691, 'loss/train': 2.2426517009735107} -08/30/2021 14:43:39 - INFO - __main__ - Step 8693: {'lr': 0.000497481930073425, 'samples': 1669056, 'steps': 8692, 'loss/train': 1.9979678392410278} -08/30/2021 14:43:39 - INFO - __main__ - Step 8694: {'lr': 0.000497481178722311, 'samples': 1669248, 'steps': 8693, 'loss/train': 1.9313017129898071} -08/30/2021 14:43:41 - INFO - __main__ - Step 8695: {'lr': 0.0004974804272596857, 'samples': 1669440, 'steps': 8694, 'loss/train': 1.756946325302124} -08/30/2021 14:43:42 - INFO - __main__ - Step 8696: {'lr': 0.0004974796756855494, 'samples': 1669632, 'steps': 8695, 'loss/train': 1.9956234693527222} -08/30/2021 14:43:42 - INFO - __main__ - Step 8697: {'lr': 0.0004974789239999027, 'samples': 1669824, 'steps': 8696, 'loss/train': 1.2921825647354126} -08/30/2021 14:43:42 - INFO - __main__ - Step 8698: {'lr': 0.0004974781722027459, 'samples': 1670016, 'steps': 8697, 'loss/train': 1.7339524030685425} -08/30/2021 14:43:43 - INFO - __main__ - Step 8699: {'lr': 0.0004974774202940791, 'samples': 1670208, 'steps': 8698, 'loss/train': 2.2512190341949463} -08/30/2021 14:43:43 - INFO - __main__ - Step 8700: {'lr': 0.000497476668273903, 'samples': 1670400, 'steps': 8699, 'loss/train': 1.6991277933120728} -08/30/2021 14:43:44 - INFO - __main__ - Step 8701: {'lr': 0.0004974759161422175, 'samples': 1670592, 'steps': 8700, 'loss/train': 2.36647367477417} -08/30/2021 14:43:45 - INFO - __main__ - Step 8702: {'lr': 0.0004974751638990233, 'samples': 1670784, 'steps': 8701, 'loss/train': 2.3939263820648193} -08/30/2021 14:43:45 - INFO - __main__ - Step 8703: {'lr': 0.0004974744115443206, 'samples': 1670976, 'steps': 8702, 'loss/train': 1.317129373550415} -08/30/2021 14:43:46 - INFO - __main__ - Step 8704: {'lr': 0.0004974736590781097, 'samples': 1671168, 'steps': 8703, 'loss/train': 0.5579120516777039} -08/30/2021 14:43:46 - INFO - __main__ - Step 8705: {'lr': 0.000497472906500391, 'samples': 1671360, 'steps': 8704, 'loss/train': 2.1611592769622803} -08/30/2021 14:43:48 - INFO - __main__ - Step 8706: {'lr': 0.0004974721538111649, 'samples': 1671552, 'steps': 8705, 'loss/train': 2.159956216812134} -08/30/2021 14:43:48 - INFO - __main__ - Step 8707: {'lr': 0.0004974714010104315, 'samples': 1671744, 'steps': 8706, 'loss/train': 1.906781554222107} -08/30/2021 14:43:49 - INFO - __main__ - Step 8708: {'lr': 0.0004974706480981914, 'samples': 1671936, 'steps': 8707, 'loss/train': 2.110795736312866} -08/30/2021 14:43:49 - INFO - __main__ - Step 8709: {'lr': 0.0004974698950744449, 'samples': 1672128, 'steps': 8708, 'loss/train': 2.0629167556762695} -08/30/2021 14:43:49 - INFO - __main__ - Step 8710: {'lr': 0.0004974691419391922, 'samples': 1672320, 'steps': 8709, 'loss/train': 1.7386436462402344} -08/30/2021 14:43:51 - INFO - __main__ - Step 8711: {'lr': 0.0004974683886924339, 'samples': 1672512, 'steps': 8710, 'loss/train': 4.081793308258057} -08/30/2021 14:43:51 - INFO - __main__ - Step 8712: {'lr': 0.00049746763533417, 'samples': 1672704, 'steps': 8711, 'loss/train': 2.1162335872650146} -08/30/2021 14:43:52 - INFO - __main__ - Step 8713: {'lr': 0.000497466881864401, 'samples': 1672896, 'steps': 8712, 'loss/train': 0.8779681324958801} -08/30/2021 14:43:52 - INFO - __main__ - Step 8714: {'lr': 0.0004974661282831272, 'samples': 1673088, 'steps': 8713, 'loss/train': 2.3679370880126953} -08/30/2021 14:43:52 - INFO - __main__ - Step 8715: {'lr': 0.0004974653745903491, 'samples': 1673280, 'steps': 8714, 'loss/train': 1.9404504299163818} -08/30/2021 14:43:54 - INFO - __main__ - Step 8716: {'lr': 0.0004974646207860668, 'samples': 1673472, 'steps': 8715, 'loss/train': 1.8773442506790161} -08/30/2021 14:43:54 - INFO - __main__ - Step 8717: {'lr': 0.0004974638668702809, 'samples': 1673664, 'steps': 8716, 'loss/train': 2.295478343963623} -08/30/2021 14:43:55 - INFO - __main__ - Step 8718: {'lr': 0.0004974631128429915, 'samples': 1673856, 'steps': 8717, 'loss/train': 1.716551423072815} -08/30/2021 14:43:55 - INFO - __main__ - Step 8719: {'lr': 0.0004974623587041991, 'samples': 1674048, 'steps': 8718, 'loss/train': 2.1509275436401367} -08/30/2021 14:43:55 - INFO - __main__ - Step 8720: {'lr': 0.000497461604453904, 'samples': 1674240, 'steps': 8719, 'loss/train': 1.9106303453445435} -08/30/2021 14:43:56 - INFO - __main__ - Step 8721: {'lr': 0.0004974608500921064, 'samples': 1674432, 'steps': 8720, 'loss/train': 2.128234624862671} -08/30/2021 14:43:57 - INFO - __main__ - Step 8722: {'lr': 0.0004974600956188068, 'samples': 1674624, 'steps': 8721, 'loss/train': 2.0519943237304688} -08/30/2021 14:43:58 - INFO - __main__ - Step 8723: {'lr': 0.0004974593410340056, 'samples': 1674816, 'steps': 8722, 'loss/train': 2.685260534286499} -08/30/2021 14:43:58 - INFO - __main__ - Step 8724: {'lr': 0.000497458586337703, 'samples': 1675008, 'steps': 8723, 'loss/train': 1.4179587364196777} -08/30/2021 14:43:59 - INFO - __main__ - Step 8725: {'lr': 0.0004974578315298993, 'samples': 1675200, 'steps': 8724, 'loss/train': 1.850721001625061} -08/30/2021 14:43:59 - INFO - __main__ - Step 8726: {'lr': 0.000497457076610595, 'samples': 1675392, 'steps': 8725, 'loss/train': 1.9255950450897217} -08/30/2021 14:44:00 - INFO - __main__ - Step 8727: {'lr': 0.0004974563215797903, 'samples': 1675584, 'steps': 8726, 'loss/train': 1.7172802686691284} -08/30/2021 14:44:01 - INFO - __main__ - Step 8728: {'lr': 0.0004974555664374857, 'samples': 1675776, 'steps': 8727, 'loss/train': 1.844247817993164} -08/30/2021 14:44:01 - INFO - __main__ - Step 8729: {'lr': 0.0004974548111836812, 'samples': 1675968, 'steps': 8728, 'loss/train': 1.299993634223938} -08/30/2021 14:44:02 - INFO - __main__ - Step 8730: {'lr': 0.0004974540558183776, 'samples': 1676160, 'steps': 8729, 'loss/train': 1.2942192554473877} -08/30/2021 14:44:02 - INFO - __main__ - Step 8731: {'lr': 0.0004974533003415751, 'samples': 1676352, 'steps': 8730, 'loss/train': 2.199471950531006} -08/30/2021 14:44:04 - INFO - __main__ - Step 8732: {'lr': 0.0004974525447532737, 'samples': 1676544, 'steps': 8731, 'loss/train': 1.7526211738586426} -08/30/2021 14:44:04 - INFO - __main__ - Step 8733: {'lr': 0.0004974517890534742, 'samples': 1676736, 'steps': 8732, 'loss/train': 0.8656116127967834} -08/30/2021 14:44:05 - INFO - __main__ - Step 8734: {'lr': 0.0004974510332421767, 'samples': 1676928, 'steps': 8733, 'loss/train': 0.3058996796607971} -08/30/2021 14:44:05 - INFO - __main__ - Step 8735: {'lr': 0.0004974502773193815, 'samples': 1677120, 'steps': 8734, 'loss/train': 1.2710117101669312} -08/30/2021 14:44:05 - INFO - __main__ - Step 8736: {'lr': 0.0004974495212850892, 'samples': 1677312, 'steps': 8735, 'loss/train': 1.5743685960769653} -08/30/2021 14:44:06 - INFO - __main__ - Step 8737: {'lr': 0.0004974487651392998, 'samples': 1677504, 'steps': 8736, 'loss/train': 1.848976492881775} -08/30/2021 14:44:08 - INFO - __main__ - Step 8738: {'lr': 0.0004974480088820139, 'samples': 1677696, 'steps': 8737, 'loss/train': 1.7711901664733887} -08/30/2021 14:44:08 - INFO - __main__ - Step 8739: {'lr': 0.0004974472525132316, 'samples': 1677888, 'steps': 8738, 'loss/train': 2.0195536613464355} -08/30/2021 14:44:09 - INFO - __main__ - Step 8740: {'lr': 0.0004974464960329536, 'samples': 1678080, 'steps': 8739, 'loss/train': 1.9348527193069458} -08/30/2021 14:44:09 - INFO - __main__ - Step 8741: {'lr': 0.0004974457394411798, 'samples': 1678272, 'steps': 8740, 'loss/train': 2.030661106109619} -08/30/2021 14:44:09 - INFO - __main__ - Step 8742: {'lr': 0.0004974449827379109, 'samples': 1678464, 'steps': 8741, 'loss/train': 2.020113468170166} -08/30/2021 14:44:11 - INFO - __main__ - Step 8743: {'lr': 0.000497444225923147, 'samples': 1678656, 'steps': 8742, 'loss/train': 2.2659518718719482} -08/30/2021 14:44:11 - INFO - __main__ - Step 8744: {'lr': 0.0004974434689968887, 'samples': 1678848, 'steps': 8743, 'loss/train': 2.0322535037994385} -08/30/2021 14:44:12 - INFO - __main__ - Step 8745: {'lr': 0.0004974427119591361, 'samples': 1679040, 'steps': 8744, 'loss/train': 2.128535747528076} -08/30/2021 14:44:12 - INFO - __main__ - Step 8746: {'lr': 0.0004974419548098897, 'samples': 1679232, 'steps': 8745, 'loss/train': 0.27330482006073} -08/30/2021 14:44:12 - INFO - __main__ - Step 8747: {'lr': 0.0004974411975491498, 'samples': 1679424, 'steps': 8746, 'loss/train': 1.9819375276565552} -08/30/2021 14:44:14 - INFO - __main__ - Step 8748: {'lr': 0.0004974404401769167, 'samples': 1679616, 'steps': 8747, 'loss/train': 1.8071480989456177} -08/30/2021 14:44:14 - INFO - __main__ - Step 8749: {'lr': 0.0004974396826931906, 'samples': 1679808, 'steps': 8748, 'loss/train': 1.9712427854537964} -08/30/2021 14:44:15 - INFO - __main__ - Step 8750: {'lr': 0.0004974389250979722, 'samples': 1680000, 'steps': 8749, 'loss/train': 2.3223397731781006} -08/30/2021 14:44:15 - INFO - __main__ - Step 8751: {'lr': 0.0004974381673912614, 'samples': 1680192, 'steps': 8750, 'loss/train': 1.570473551750183} -08/30/2021 14:44:15 - INFO - __main__ - Step 8752: {'lr': 0.000497437409573059, 'samples': 1680384, 'steps': 8751, 'loss/train': 1.8036528825759888} -08/30/2021 14:44:17 - INFO - __main__ - Step 8753: {'lr': 0.000497436651643365, 'samples': 1680576, 'steps': 8752, 'loss/train': 1.7375524044036865} -08/30/2021 14:44:17 - INFO - __main__ - Step 8754: {'lr': 0.00049743589360218, 'samples': 1680768, 'steps': 8753, 'loss/train': 1.3110918998718262} -08/30/2021 14:44:18 - INFO - __main__ - Step 8755: {'lr': 0.0004974351354495041, 'samples': 1680960, 'steps': 8754, 'loss/train': 1.7762739658355713} -08/30/2021 14:44:18 - INFO - __main__ - Step 8756: {'lr': 0.0004974343771853377, 'samples': 1681152, 'steps': 8755, 'loss/train': 2.0317671298980713} -08/30/2021 14:44:18 - INFO - __main__ - Step 8757: {'lr': 0.0004974336188096813, 'samples': 1681344, 'steps': 8756, 'loss/train': 1.98769211769104} -08/30/2021 14:44:20 - INFO - __main__ - Step 8758: {'lr': 0.0004974328603225351, 'samples': 1681536, 'steps': 8757, 'loss/train': 2.112428903579712} -08/30/2021 14:44:20 - INFO - __main__ - Step 8759: {'lr': 0.0004974321017238994, 'samples': 1681728, 'steps': 8758, 'loss/train': 2.0258026123046875} -08/30/2021 14:44:20 - INFO - __main__ - Step 8760: {'lr': 0.0004974313430137747, 'samples': 1681920, 'steps': 8759, 'loss/train': 2.1777615547180176} -08/30/2021 14:44:21 - INFO - __main__ - Step 8761: {'lr': 0.0004974305841921612, 'samples': 1682112, 'steps': 8760, 'loss/train': 1.7240231037139893} -08/30/2021 14:44:21 - INFO - __main__ - Step 8762: {'lr': 0.0004974298252590593, 'samples': 1682304, 'steps': 8761, 'loss/train': 2.205961227416992} -08/30/2021 14:44:23 - INFO - __main__ - Step 8763: {'lr': 0.0004974290662144694, 'samples': 1682496, 'steps': 8762, 'loss/train': 2.2492496967315674} -08/30/2021 14:44:23 - INFO - __main__ - Step 8764: {'lr': 0.0004974283070583917, 'samples': 1682688, 'steps': 8763, 'loss/train': 1.6165436506271362} -08/30/2021 14:44:23 - INFO - __main__ - Step 8765: {'lr': 0.0004974275477908266, 'samples': 1682880, 'steps': 8764, 'loss/train': 2.0821170806884766} -08/30/2021 14:44:24 - INFO - __main__ - Step 8766: {'lr': 0.0004974267884117746, 'samples': 1683072, 'steps': 8765, 'loss/train': 1.7335976362228394} -08/30/2021 14:44:24 - INFO - __main__ - Step 8767: {'lr': 0.0004974260289212358, 'samples': 1683264, 'steps': 8766, 'loss/train': 2.383117437362671} -08/30/2021 14:44:26 - INFO - __main__ - Step 8768: {'lr': 0.0004974252693192106, 'samples': 1683456, 'steps': 8767, 'loss/train': 2.205899715423584} -08/30/2021 14:44:26 - INFO - __main__ - Step 8769: {'lr': 0.0004974245096056995, 'samples': 1683648, 'steps': 8768, 'loss/train': 1.9440041780471802} -08/30/2021 14:44:27 - INFO - __main__ - Step 8770: {'lr': 0.0004974237497807027, 'samples': 1683840, 'steps': 8769, 'loss/train': 1.7581126689910889} -08/30/2021 14:44:27 - INFO - __main__ - Step 8771: {'lr': 0.0004974229898442207, 'samples': 1684032, 'steps': 8770, 'loss/train': 1.769744634628296} -08/30/2021 14:44:27 - INFO - __main__ - Step 8772: {'lr': 0.0004974222297962535, 'samples': 1684224, 'steps': 8771, 'loss/train': 1.9801572561264038} -08/30/2021 14:44:29 - INFO - __main__ - Step 8773: {'lr': 0.0004974214696368017, 'samples': 1684416, 'steps': 8772, 'loss/train': 2.896915912628174} -08/30/2021 14:44:29 - INFO - __main__ - Step 8774: {'lr': 0.0004974207093658657, 'samples': 1684608, 'steps': 8773, 'loss/train': 2.1361005306243896} -08/30/2021 14:44:30 - INFO - __main__ - Step 8775: {'lr': 0.0004974199489834457, 'samples': 1684800, 'steps': 8774, 'loss/train': 2.0194149017333984} -08/30/2021 14:44:30 - INFO - __main__ - Step 8776: {'lr': 0.0004974191884895421, 'samples': 1684992, 'steps': 8775, 'loss/train': 1.1998473405838013} -08/30/2021 14:44:30 - INFO - __main__ - Step 8777: {'lr': 0.0004974184278841552, 'samples': 1685184, 'steps': 8776, 'loss/train': 2.1794116497039795} -08/30/2021 14:44:32 - INFO - __main__ - Step 8778: {'lr': 0.0004974176671672854, 'samples': 1685376, 'steps': 8777, 'loss/train': 1.6326193809509277} -08/30/2021 14:44:32 - INFO - __main__ - Step 8779: {'lr': 0.000497416906338933, 'samples': 1685568, 'steps': 8778, 'loss/train': 1.7596262693405151} -08/30/2021 14:44:33 - INFO - __main__ - Step 8780: {'lr': 0.0004974161453990985, 'samples': 1685760, 'steps': 8779, 'loss/train': 1.9646741151809692} -08/30/2021 14:44:33 - INFO - __main__ - Step 8781: {'lr': 0.0004974153843477819, 'samples': 1685952, 'steps': 8780, 'loss/train': 2.227012872695923} -08/30/2021 14:44:33 - INFO - __main__ - Step 8782: {'lr': 0.0004974146231849838, 'samples': 1686144, 'steps': 8781, 'loss/train': 1.4969590902328491} -08/30/2021 14:44:34 - INFO - __main__ - Step 8783: {'lr': 0.0004974138619107046, 'samples': 1686336, 'steps': 8782, 'loss/train': 2.840508460998535} -08/30/2021 14:44:35 - INFO - __main__ - Step 8784: {'lr': 0.0004974131005249444, 'samples': 1686528, 'steps': 8783, 'loss/train': 1.302711009979248} -08/30/2021 14:44:36 - INFO - __main__ - Step 8785: {'lr': 0.0004974123390277037, 'samples': 1686720, 'steps': 8784, 'loss/train': 2.0307395458221436} -08/30/2021 14:44:36 - INFO - __main__ - Step 8786: {'lr': 0.0004974115774189829, 'samples': 1686912, 'steps': 8785, 'loss/train': 1.7665915489196777} -08/30/2021 14:44:36 - INFO - __main__ - Step 8787: {'lr': 0.0004974108156987822, 'samples': 1687104, 'steps': 8786, 'loss/train': 2.0021626949310303} -08/30/2021 14:44:37 - INFO - __main__ - Step 8788: {'lr': 0.000497410053867102, 'samples': 1687296, 'steps': 8787, 'loss/train': 2.2938144207000732} -08/30/2021 14:44:38 - INFO - __main__ - Step 8789: {'lr': 0.0004974092919239427, 'samples': 1687488, 'steps': 8788, 'loss/train': 2.082855224609375} -08/30/2021 14:44:39 - INFO - __main__ - Step 8790: {'lr': 0.0004974085298693045, 'samples': 1687680, 'steps': 8789, 'loss/train': 1.652678370475769} -08/30/2021 14:44:39 - INFO - __main__ - Step 8791: {'lr': 0.0004974077677031879, 'samples': 1687872, 'steps': 8790, 'loss/train': 2.036776065826416} -08/30/2021 14:44:40 - INFO - __main__ - Step 8792: {'lr': 0.0004974070054255932, 'samples': 1688064, 'steps': 8791, 'loss/train': 1.903337001800537} -08/30/2021 14:44:40 - INFO - __main__ - Step 8793: {'lr': 0.0004974062430365206, 'samples': 1688256, 'steps': 8792, 'loss/train': 1.8099795579910278} -08/30/2021 14:44:41 - INFO - __main__ - Step 8794: {'lr': 0.0004974054805359706, 'samples': 1688448, 'steps': 8793, 'loss/train': 1.4995594024658203} -08/30/2021 14:44:42 - INFO - __main__ - Step 8795: {'lr': 0.0004974047179239436, 'samples': 1688640, 'steps': 8794, 'loss/train': 1.7680137157440186} -08/30/2021 14:44:42 - INFO - __main__ - Step 8796: {'lr': 0.0004974039552004398, 'samples': 1688832, 'steps': 8795, 'loss/train': 2.226763963699341} -08/30/2021 14:44:43 - INFO - __main__ - Step 8797: {'lr': 0.0004974031923654596, 'samples': 1689024, 'steps': 8796, 'loss/train': 2.083266019821167} -08/30/2021 14:44:43 - INFO - __main__ - Step 8798: {'lr': 0.0004974024294190034, 'samples': 1689216, 'steps': 8797, 'loss/train': 2.0445456504821777} -08/30/2021 14:44:44 - INFO - __main__ - Step 8799: {'lr': 0.0004974016663610713, 'samples': 1689408, 'steps': 8798, 'loss/train': 1.7572485208511353} -08/30/2021 14:44:45 - INFO - __main__ - Step 8800: {'lr': 0.000497400903191664, 'samples': 1689600, 'steps': 8799, 'loss/train': 2.339501142501831} -08/30/2021 14:44:45 - INFO - __main__ - Step 8801: {'lr': 0.0004974001399107816, 'samples': 1689792, 'steps': 8800, 'loss/train': 1.8961145877838135} -08/30/2021 14:44:46 - INFO - __main__ - Step 8802: {'lr': 0.0004973993765184246, 'samples': 1689984, 'steps': 8801, 'loss/train': 2.1814019680023193} -08/30/2021 14:44:46 - INFO - __main__ - Step 8803: {'lr': 0.0004973986130145931, 'samples': 1690176, 'steps': 8802, 'loss/train': 1.8656163215637207} -08/30/2021 14:44:47 - INFO - __main__ - Step 8804: {'lr': 0.0004973978493992877, 'samples': 1690368, 'steps': 8803, 'loss/train': 2.049767255783081} -08/30/2021 14:44:48 - INFO - __main__ - Step 8805: {'lr': 0.0004973970856725086, 'samples': 1690560, 'steps': 8804, 'loss/train': 1.2457367181777954} -08/30/2021 14:44:48 - INFO - __main__ - Step 8806: {'lr': 0.0004973963218342563, 'samples': 1690752, 'steps': 8805, 'loss/train': 1.601210355758667} -08/30/2021 14:44:49 - INFO - __main__ - Step 8807: {'lr': 0.000497395557884531, 'samples': 1690944, 'steps': 8806, 'loss/train': 2.3677077293395996} -08/30/2021 14:44:49 - INFO - __main__ - Step 8808: {'lr': 0.000497394793823333, 'samples': 1691136, 'steps': 8807, 'loss/train': 1.7051234245300293} -08/30/2021 14:44:51 - INFO - __main__ - Step 8809: {'lr': 0.0004973940296506627, 'samples': 1691328, 'steps': 8808, 'loss/train': 2.554412364959717} -08/30/2021 14:44:51 - INFO - __main__ - Step 8810: {'lr': 0.0004973932653665206, 'samples': 1691520, 'steps': 8809, 'loss/train': 2.2054378986358643} -08/30/2021 14:44:52 - INFO - __main__ - Step 8811: {'lr': 0.0004973925009709068, 'samples': 1691712, 'steps': 8810, 'loss/train': 1.6742802858352661} -08/30/2021 14:44:52 - INFO - __main__ - Step 8812: {'lr': 0.0004973917364638218, 'samples': 1691904, 'steps': 8811, 'loss/train': 1.5483663082122803} -08/30/2021 14:44:52 - INFO - __main__ - Step 8813: {'lr': 0.0004973909718452659, 'samples': 1692096, 'steps': 8812, 'loss/train': 3.061603307723999} -08/30/2021 14:44:53 - INFO - __main__ - Step 8814: {'lr': 0.0004973902071152396, 'samples': 1692288, 'steps': 8813, 'loss/train': 2.0185563564300537} -08/30/2021 14:44:54 - INFO - __main__ - Step 8815: {'lr': 0.0004973894422737428, 'samples': 1692480, 'steps': 8814, 'loss/train': 1.6258715391159058} -08/30/2021 14:44:55 - INFO - __main__ - Step 8816: {'lr': 0.0004973886773207763, 'samples': 1692672, 'steps': 8815, 'loss/train': 2.1002321243286133} -08/30/2021 14:44:55 - INFO - __main__ - Step 8817: {'lr': 0.0004973879122563403, 'samples': 1692864, 'steps': 8816, 'loss/train': 2.069121837615967} -08/30/2021 14:44:55 - INFO - __main__ - Step 8818: {'lr': 0.000497387147080435, 'samples': 1693056, 'steps': 8817, 'loss/train': 1.8075968027114868} -08/30/2021 14:44:56 - INFO - __main__ - Step 8819: {'lr': 0.000497386381793061, 'samples': 1693248, 'steps': 8818, 'loss/train': 2.181338310241699} -08/30/2021 14:44:58 - INFO - __main__ - Step 8820: {'lr': 0.0004973856163942185, 'samples': 1693440, 'steps': 8819, 'loss/train': 1.995102047920227} -08/30/2021 14:44:58 - INFO - __main__ - Step 8821: {'lr': 0.0004973848508839077, 'samples': 1693632, 'steps': 8820, 'loss/train': 1.3736721277236938} -08/30/2021 14:44:59 - INFO - __main__ - Step 8822: {'lr': 0.0004973840852621293, 'samples': 1693824, 'steps': 8821, 'loss/train': 1.822910189628601} -08/30/2021 14:44:59 - INFO - __main__ - Step 8823: {'lr': 0.0004973833195288834, 'samples': 1694016, 'steps': 8822, 'loss/train': 2.0831680297851562} -08/30/2021 14:44:59 - INFO - __main__ - Step 8824: {'lr': 0.0004973825536841703, 'samples': 1694208, 'steps': 8823, 'loss/train': 1.275166392326355} -08/30/2021 14:45:01 - INFO - __main__ - Step 8825: {'lr': 0.0004973817877279906, 'samples': 1694400, 'steps': 8824, 'loss/train': 1.6611217260360718} -08/30/2021 14:45:01 - INFO - __main__ - Step 8826: {'lr': 0.0004973810216603443, 'samples': 1694592, 'steps': 8825, 'loss/train': 2.4509193897247314} -08/30/2021 14:45:01 - INFO - __main__ - Step 8827: {'lr': 0.000497380255481232, 'samples': 1694784, 'steps': 8826, 'loss/train': 2.011107921600342} -08/30/2021 14:45:02 - INFO - __main__ - Step 8828: {'lr': 0.000497379489190654, 'samples': 1694976, 'steps': 8827, 'loss/train': 2.1602694988250732} -08/30/2021 14:45:02 - INFO - __main__ - Step 8829: {'lr': 0.0004973787227886106, 'samples': 1695168, 'steps': 8828, 'loss/train': 2.0835742950439453} -08/30/2021 14:45:04 - INFO - __main__ - Step 8830: {'lr': 0.0004973779562751022, 'samples': 1695360, 'steps': 8829, 'loss/train': 1.5882266759872437} -08/30/2021 14:45:04 - INFO - __main__ - Step 8831: {'lr': 0.0004973771896501292, 'samples': 1695552, 'steps': 8830, 'loss/train': 2.53253436088562} -08/30/2021 14:45:04 - INFO - __main__ - Step 8832: {'lr': 0.0004973764229136917, 'samples': 1695744, 'steps': 8831, 'loss/train': 2.3874685764312744} -08/30/2021 14:45:05 - INFO - __main__ - Step 8833: {'lr': 0.0004973756560657901, 'samples': 1695936, 'steps': 8832, 'loss/train': 2.0688607692718506} -08/30/2021 14:45:05 - INFO - __main__ - Step 8834: {'lr': 0.0004973748891064251, 'samples': 1696128, 'steps': 8833, 'loss/train': 1.7769646644592285} -08/30/2021 14:45:06 - INFO - __main__ - Step 8835: {'lr': 0.0004973741220355967, 'samples': 1696320, 'steps': 8834, 'loss/train': 1.3691630363464355} -08/30/2021 14:45:07 - INFO - __main__ - Step 8836: {'lr': 0.0004973733548533052, 'samples': 1696512, 'steps': 8835, 'loss/train': 1.6993151903152466} -08/30/2021 14:45:07 - INFO - __main__ - Step 8837: {'lr': 0.0004973725875595513, 'samples': 1696704, 'steps': 8836, 'loss/train': 1.8598029613494873} -08/30/2021 14:45:08 - INFO - __main__ - Step 8838: {'lr': 0.000497371820154335, 'samples': 1696896, 'steps': 8837, 'loss/train': 1.9826390743255615} -08/30/2021 14:45:08 - INFO - __main__ - Step 8839: {'lr': 0.0004973710526376569, 'samples': 1697088, 'steps': 8838, 'loss/train': 1.9499104022979736} -08/30/2021 14:45:10 - INFO - __main__ - Step 8840: {'lr': 0.000497370285009517, 'samples': 1697280, 'steps': 8839, 'loss/train': 2.063833475112915} -08/30/2021 14:45:10 - INFO - __main__ - Step 8841: {'lr': 0.000497369517269916, 'samples': 1697472, 'steps': 8840, 'loss/train': 1.849187970161438} -08/30/2021 14:45:10 - INFO - __main__ - Step 8842: {'lr': 0.0004973687494188541, 'samples': 1697664, 'steps': 8841, 'loss/train': 2.716994524002075} -08/30/2021 14:45:11 - INFO - __main__ - Step 8843: {'lr': 0.0004973679814563318, 'samples': 1697856, 'steps': 8842, 'loss/train': 1.7706921100616455} -08/30/2021 14:45:11 - INFO - __main__ - Step 8844: {'lr': 0.0004973672133823491, 'samples': 1698048, 'steps': 8843, 'loss/train': 1.6797070503234863} -08/30/2021 14:45:13 - INFO - __main__ - Step 8845: {'lr': 0.0004973664451969066, 'samples': 1698240, 'steps': 8844, 'loss/train': 1.817637324333191} -08/30/2021 14:45:13 - INFO - __main__ - Step 8846: {'lr': 0.0004973656769000046, 'samples': 1698432, 'steps': 8845, 'loss/train': 1.572250247001648} -08/30/2021 14:45:13 - INFO - __main__ - Step 8847: {'lr': 0.0004973649084916435, 'samples': 1698624, 'steps': 8846, 'loss/train': 1.8365846872329712} -08/30/2021 14:45:14 - INFO - __main__ - Step 8848: {'lr': 0.0004973641399718236, 'samples': 1698816, 'steps': 8847, 'loss/train': 1.6546167135238647} -08/30/2021 14:45:14 - INFO - __main__ - Step 8849: {'lr': 0.0004973633713405451, 'samples': 1699008, 'steps': 8848, 'loss/train': 1.8078968524932861} -08/30/2021 14:45:14 - INFO - __main__ - Step 8850: {'lr': 0.0004973626025978086, 'samples': 1699200, 'steps': 8849, 'loss/train': 1.7147395610809326} -08/30/2021 14:45:16 - INFO - __main__ - Step 8851: {'lr': 0.0004973618337436143, 'samples': 1699392, 'steps': 8850, 'loss/train': 2.0545716285705566} -08/30/2021 14:45:16 - INFO - __main__ - Step 8852: {'lr': 0.0004973610647779626, 'samples': 1699584, 'steps': 8851, 'loss/train': 1.7343103885650635} -08/30/2021 14:45:17 - INFO - __main__ - Step 8853: {'lr': 0.0004973602957008537, 'samples': 1699776, 'steps': 8852, 'loss/train': 1.7753850221633911} -08/30/2021 14:45:17 - INFO - __main__ - Step 8854: {'lr': 0.0004973595265122883, 'samples': 1699968, 'steps': 8853, 'loss/train': 2.30344820022583} -08/30/2021 14:45:18 - INFO - __main__ - Step 8855: {'lr': 0.0004973587572122663, 'samples': 1700160, 'steps': 8854, 'loss/train': 2.225299119949341} -08/30/2021 14:45:19 - INFO - __main__ - Step 8856: {'lr': 0.0004973579878007884, 'samples': 1700352, 'steps': 8855, 'loss/train': 1.4403730630874634} -08/30/2021 14:45:20 - INFO - __main__ - Step 8857: {'lr': 0.0004973572182778546, 'samples': 1700544, 'steps': 8856, 'loss/train': 1.8367085456848145} -08/30/2021 14:45:20 - INFO - __main__ - Step 8858: {'lr': 0.0004973564486434656, 'samples': 1700736, 'steps': 8857, 'loss/train': 1.9998410940170288} -08/30/2021 14:45:20 - INFO - __main__ - Step 8859: {'lr': 0.0004973556788976217, 'samples': 1700928, 'steps': 8858, 'loss/train': 1.8122602701187134} -08/30/2021 14:45:21 - INFO - __main__ - Step 8860: {'lr': 0.000497354909040323, 'samples': 1701120, 'steps': 8859, 'loss/train': 3.0772290229797363} -08/30/2021 14:45:22 - INFO - __main__ - Step 8861: {'lr': 0.00049735413907157, 'samples': 1701312, 'steps': 8860, 'loss/train': 2.1263930797576904} -08/30/2021 14:45:23 - INFO - __main__ - Step 8862: {'lr': 0.0004973533689913631, 'samples': 1701504, 'steps': 8861, 'loss/train': 1.99599027633667} -08/30/2021 14:45:23 - INFO - __main__ - Step 8863: {'lr': 0.0004973525987997026, 'samples': 1701696, 'steps': 8862, 'loss/train': 1.8839139938354492} -08/30/2021 14:45:23 - INFO - __main__ - Step 8864: {'lr': 0.0004973518284965888, 'samples': 1701888, 'steps': 8863, 'loss/train': 2.3447067737579346} -08/30/2021 14:45:24 - INFO - __main__ - Step 8865: {'lr': 0.0004973510580820221, 'samples': 1702080, 'steps': 8864, 'loss/train': 2.4118566513061523} -08/30/2021 14:45:25 - INFO - __main__ - Step 8866: {'lr': 0.0004973502875560028, 'samples': 1702272, 'steps': 8865, 'loss/train': 2.1668953895568848} -08/30/2021 14:45:26 - INFO - __main__ - Step 8867: {'lr': 0.0004973495169185313, 'samples': 1702464, 'steps': 8866, 'loss/train': 1.8227133750915527} -08/30/2021 14:45:26 - INFO - __main__ - Step 8868: {'lr': 0.0004973487461696079, 'samples': 1702656, 'steps': 8867, 'loss/train': 2.0894923210144043} -08/30/2021 14:45:27 - INFO - __main__ - Step 8869: {'lr': 0.000497347975309233, 'samples': 1702848, 'steps': 8868, 'loss/train': 1.4945451021194458} -08/30/2021 14:45:27 - INFO - __main__ - Step 8870: {'lr': 0.0004973472043374069, 'samples': 1703040, 'steps': 8869, 'loss/train': 2.2598202228546143} -08/30/2021 14:45:27 - INFO - __main__ - Step 8871: {'lr': 0.00049734643325413, 'samples': 1703232, 'steps': 8870, 'loss/train': 1.9570155143737793} -08/30/2021 14:45:29 - INFO - __main__ - Step 8872: {'lr': 0.0004973456620594026, 'samples': 1703424, 'steps': 8871, 'loss/train': 1.706239938735962} -08/30/2021 14:45:30 - INFO - __main__ - Step 8873: {'lr': 0.0004973448907532251, 'samples': 1703616, 'steps': 8872, 'loss/train': 0.6889956593513489} -08/30/2021 14:45:30 - INFO - __main__ - Step 8874: {'lr': 0.0004973441193355978, 'samples': 1703808, 'steps': 8873, 'loss/train': 2.18713116645813} -08/30/2021 14:45:31 - INFO - __main__ - Step 8875: {'lr': 0.0004973433478065209, 'samples': 1704000, 'steps': 8874, 'loss/train': 1.3478615283966064} -08/30/2021 14:45:31 - INFO - __main__ - Step 8876: {'lr': 0.0004973425761659951, 'samples': 1704192, 'steps': 8875, 'loss/train': 1.8509184122085571} -08/30/2021 14:45:31 - INFO - __main__ - Step 8877: {'lr': 0.0004973418044140204, 'samples': 1704384, 'steps': 8876, 'loss/train': 2.8088579177856445} -08/30/2021 14:45:33 - INFO - __main__ - Step 8878: {'lr': 0.0004973410325505974, 'samples': 1704576, 'steps': 8877, 'loss/train': 2.0067989826202393} -08/30/2021 14:45:33 - INFO - __main__ - Step 8879: {'lr': 0.0004973402605757263, 'samples': 1704768, 'steps': 8878, 'loss/train': 2.421041250228882} -08/30/2021 14:45:34 - INFO - __main__ - Step 8880: {'lr': 0.0004973394884894075, 'samples': 1704960, 'steps': 8879, 'loss/train': 1.387993574142456} -08/30/2021 14:45:34 - INFO - __main__ - Step 8881: {'lr': 0.0004973387162916415, 'samples': 1705152, 'steps': 8880, 'loss/train': 1.5879567861557007} -08/30/2021 14:45:34 - INFO - __main__ - Step 8882: {'lr': 0.0004973379439824283, 'samples': 1705344, 'steps': 8881, 'loss/train': 1.4843741655349731} -08/30/2021 14:45:36 - INFO - __main__ - Step 8883: {'lr': 0.0004973371715617685, 'samples': 1705536, 'steps': 8882, 'loss/train': 1.8437132835388184} -08/30/2021 14:45:37 - INFO - __main__ - Step 8884: {'lr': 0.0004973363990296624, 'samples': 1705728, 'steps': 8883, 'loss/train': 1.6015136241912842} -08/30/2021 14:45:37 - INFO - __main__ - Step 8885: {'lr': 0.0004973356263861103, 'samples': 1705920, 'steps': 8884, 'loss/train': 1.8598570823669434} -08/30/2021 14:45:37 - INFO - __main__ - Step 8886: {'lr': 0.0004973348536311126, 'samples': 1706112, 'steps': 8885, 'loss/train': 0.8148157000541687} -08/30/2021 14:45:38 - INFO - __main__ - Step 8887: {'lr': 0.0004973340807646696, 'samples': 1706304, 'steps': 8886, 'loss/train': 2.130687713623047} -08/30/2021 14:45:38 - INFO - __main__ - Step 8888: {'lr': 0.0004973333077867817, 'samples': 1706496, 'steps': 8887, 'loss/train': 2.5316741466522217} -08/30/2021 14:45:39 - INFO - __main__ - Step 8889: {'lr': 0.0004973325346974493, 'samples': 1706688, 'steps': 8888, 'loss/train': 1.3335115909576416} -08/30/2021 14:45:40 - INFO - __main__ - Step 8890: {'lr': 0.0004973317614966726, 'samples': 1706880, 'steps': 8889, 'loss/train': 2.006979465484619} -08/30/2021 14:45:40 - INFO - __main__ - Step 8891: {'lr': 0.000497330988184452, 'samples': 1707072, 'steps': 8890, 'loss/train': 1.3788468837738037} -08/30/2021 14:45:41 - INFO - __main__ - Step 8892: {'lr': 0.000497330214760788, 'samples': 1707264, 'steps': 8891, 'loss/train': 2.031247854232788} -08/30/2021 14:45:41 - INFO - __main__ - Step 8893: {'lr': 0.0004973294412256807, 'samples': 1707456, 'steps': 8892, 'loss/train': 2.3019416332244873} -08/30/2021 14:45:42 - INFO - __main__ - Step 8894: {'lr': 0.0004973286675791305, 'samples': 1707648, 'steps': 8893, 'loss/train': 1.702967643737793} -08/30/2021 14:45:43 - INFO - __main__ - Step 8895: {'lr': 0.000497327893821138, 'samples': 1707840, 'steps': 8894, 'loss/train': 1.826103925704956} -08/30/2021 14:45:43 - INFO - __main__ - Step 8896: {'lr': 0.0004973271199517033, 'samples': 1708032, 'steps': 8895, 'loss/train': 1.4104102849960327} -08/30/2021 14:45:44 - INFO - __main__ - Step 8897: {'lr': 0.0004973263459708268, 'samples': 1708224, 'steps': 8896, 'loss/train': 0.6963333487510681} -08/30/2021 14:45:44 - INFO - __main__ - Step 8898: {'lr': 0.0004973255718785088, 'samples': 1708416, 'steps': 8897, 'loss/train': 1.4177162647247314} -08/30/2021 14:45:45 - INFO - __main__ - Step 8899: {'lr': 0.0004973247976747499, 'samples': 1708608, 'steps': 8898, 'loss/train': 2.370511054992676} -08/30/2021 14:45:46 - INFO - __main__ - Step 8900: {'lr': 0.00049732402335955, 'samples': 1708800, 'steps': 8899, 'loss/train': 1.8502165079116821} -08/30/2021 14:45:46 - INFO - __main__ - Step 8901: {'lr': 0.0004973232489329099, 'samples': 1708992, 'steps': 8900, 'loss/train': 2.1080193519592285} -08/30/2021 14:45:47 - INFO - __main__ - Step 8902: {'lr': 0.0004973224743948298, 'samples': 1709184, 'steps': 8901, 'loss/train': 2.1878201961517334} -08/30/2021 14:45:47 - INFO - __main__ - Step 8903: {'lr': 0.00049732169974531, 'samples': 1709376, 'steps': 8902, 'loss/train': 2.459467649459839} -08/30/2021 14:45:48 - INFO - __main__ - Step 8904: {'lr': 0.0004973209249843507, 'samples': 1709568, 'steps': 8903, 'loss/train': 1.4813534021377563} -08/30/2021 14:45:49 - INFO - __main__ - Step 8905: {'lr': 0.0004973201501119525, 'samples': 1709760, 'steps': 8904, 'loss/train': 1.8868945837020874} -08/30/2021 14:45:49 - INFO - __main__ - Step 8906: {'lr': 0.0004973193751281156, 'samples': 1709952, 'steps': 8905, 'loss/train': 2.3907878398895264} -08/30/2021 14:45:50 - INFO - __main__ - Step 8907: {'lr': 0.0004973186000328405, 'samples': 1710144, 'steps': 8906, 'loss/train': 1.8003449440002441} -08/30/2021 14:45:50 - INFO - __main__ - Step 8908: {'lr': 0.0004973178248261274, 'samples': 1710336, 'steps': 8907, 'loss/train': 1.5820327997207642} -08/30/2021 14:45:52 - INFO - __main__ - Step 8909: {'lr': 0.0004973170495079768, 'samples': 1710528, 'steps': 8908, 'loss/train': 1.7473973035812378} -08/30/2021 14:45:52 - INFO - __main__ - Step 8910: {'lr': 0.0004973162740783888, 'samples': 1710720, 'steps': 8909, 'loss/train': 1.7038699388504028} -08/30/2021 14:45:53 - INFO - __main__ - Step 8911: {'lr': 0.000497315498537364, 'samples': 1710912, 'steps': 8910, 'loss/train': 1.7031673192977905} -08/30/2021 14:45:53 - INFO - __main__ - Step 8912: {'lr': 0.0004973147228849027, 'samples': 1711104, 'steps': 8911, 'loss/train': 2.1056363582611084} -08/30/2021 14:45:53 - INFO - __main__ - Step 8913: {'lr': 0.0004973139471210051, 'samples': 1711296, 'steps': 8912, 'loss/train': 0.4294566512107849} -08/30/2021 14:45:54 - INFO - __main__ - Step 8914: {'lr': 0.0004973131712456717, 'samples': 1711488, 'steps': 8913, 'loss/train': 1.8426896333694458} -08/30/2021 14:45:55 - INFO - __main__ - Step 8915: {'lr': 0.0004973123952589027, 'samples': 1711680, 'steps': 8914, 'loss/train': 1.698033332824707} -08/30/2021 14:45:56 - INFO - __main__ - Step 8916: {'lr': 0.0004973116191606987, 'samples': 1711872, 'steps': 8915, 'loss/train': 1.9066834449768066} -08/30/2021 14:45:56 - INFO - __main__ - Step 8917: {'lr': 0.0004973108429510598, 'samples': 1712064, 'steps': 8916, 'loss/train': 1.8417645692825317} -08/30/2021 14:45:56 - INFO - __main__ - Step 8918: {'lr': 0.0004973100666299864, 'samples': 1712256, 'steps': 8917, 'loss/train': 1.8167082071304321} -08/30/2021 14:45:57 - INFO - __main__ - Step 8919: {'lr': 0.000497309290197479, 'samples': 1712448, 'steps': 8918, 'loss/train': 2.034162759780884} -08/30/2021 14:45:58 - INFO - __main__ - Step 8920: {'lr': 0.0004973085136535379, 'samples': 1712640, 'steps': 8919, 'loss/train': 2.1454975605010986} -08/30/2021 14:45:59 - INFO - __main__ - Step 8921: {'lr': 0.0004973077369981633, 'samples': 1712832, 'steps': 8920, 'loss/train': 2.238969326019287} -08/30/2021 14:45:59 - INFO - __main__ - Step 8922: {'lr': 0.0004973069602313557, 'samples': 1713024, 'steps': 8921, 'loss/train': 1.4229657649993896} -08/30/2021 14:46:00 - INFO - __main__ - Step 8923: {'lr': 0.0004973061833531154, 'samples': 1713216, 'steps': 8922, 'loss/train': 1.5363589525222778} -08/30/2021 14:46:00 - INFO - __main__ - Step 8924: {'lr': 0.0004973054063634428, 'samples': 1713408, 'steps': 8923, 'loss/train': 1.8894785642623901} -08/30/2021 14:46:02 - INFO - __main__ - Step 8925: {'lr': 0.0004973046292623382, 'samples': 1713600, 'steps': 8924, 'loss/train': 1.615864872932434} -08/30/2021 14:46:02 - INFO - __main__ - Step 8926: {'lr': 0.0004973038520498017, 'samples': 1713792, 'steps': 8925, 'loss/train': 2.2542076110839844} -08/30/2021 14:46:03 - INFO - __main__ - Step 8927: {'lr': 0.0004973030747258342, 'samples': 1713984, 'steps': 8926, 'loss/train': 1.6344541311264038} -08/30/2021 14:46:03 - INFO - __main__ - Step 8928: {'lr': 0.0004973022972904356, 'samples': 1714176, 'steps': 8927, 'loss/train': 1.416045069694519} -08/30/2021 14:46:03 - INFO - __main__ - Step 8929: {'lr': 0.0004973015197436063, 'samples': 1714368, 'steps': 8928, 'loss/train': 1.836950659751892} -08/30/2021 14:46:04 - INFO - __main__ - Step 8930: {'lr': 0.0004973007420853471, 'samples': 1714560, 'steps': 8929, 'loss/train': 1.8327442407608032} -08/30/2021 14:46:06 - INFO - __main__ - Step 8931: {'lr': 0.0004972999643156577, 'samples': 1714752, 'steps': 8930, 'loss/train': 2.138300895690918} -08/30/2021 14:46:06 - INFO - __main__ - Step 8932: {'lr': 0.0004972991864345389, 'samples': 1714944, 'steps': 8931, 'loss/train': 0.41218137741088867} -08/30/2021 14:46:06 - INFO - __main__ - Step 8933: {'lr': 0.0004972984084419908, 'samples': 1715136, 'steps': 8932, 'loss/train': 0.3619674742221832} -08/30/2021 14:46:07 - INFO - __main__ - Step 8934: {'lr': 0.0004972976303380139, 'samples': 1715328, 'steps': 8933, 'loss/train': 1.6116410493850708} -08/30/2021 14:46:07 - INFO - __main__ - Step 8935: {'lr': 0.0004972968521226085, 'samples': 1715520, 'steps': 8934, 'loss/train': 2.2196226119995117} -08/30/2021 14:46:07 - INFO - __main__ - Step 8936: {'lr': 0.0004972960737957749, 'samples': 1715712, 'steps': 8935, 'loss/train': 2.018220901489258} -08/30/2021 14:46:09 - INFO - __main__ - Step 8937: {'lr': 0.0004972952953575136, 'samples': 1715904, 'steps': 8936, 'loss/train': 1.8370572328567505} -08/30/2021 14:46:10 - INFO - __main__ - Step 8938: {'lr': 0.0004972945168078248, 'samples': 1716096, 'steps': 8937, 'loss/train': 0.41641080379486084} -08/30/2021 14:46:10 - INFO - __main__ - Step 8939: {'lr': 0.000497293738146709, 'samples': 1716288, 'steps': 8938, 'loss/train': 2.1680476665496826} -08/30/2021 14:46:11 - INFO - __main__ - Step 8940: {'lr': 0.0004972929593741662, 'samples': 1716480, 'steps': 8939, 'loss/train': 2.002331256866455} -08/30/2021 14:46:11 - INFO - __main__ - Step 8941: {'lr': 0.0004972921804901973, 'samples': 1716672, 'steps': 8940, 'loss/train': 0.567217230796814} -08/30/2021 14:46:11 - INFO - __main__ - Step 8942: {'lr': 0.0004972914014948023, 'samples': 1716864, 'steps': 8941, 'loss/train': 0.4307175874710083} -08/30/2021 14:46:13 - INFO - __main__ - Step 8943: {'lr': 0.0004972906223879815, 'samples': 1717056, 'steps': 8942, 'loss/train': 1.0863940715789795} -08/30/2021 14:46:14 - INFO - __main__ - Step 8944: {'lr': 0.0004972898431697355, 'samples': 1717248, 'steps': 8943, 'loss/train': 1.9866523742675781} -08/30/2021 14:46:14 - INFO - __main__ - Step 8945: {'lr': 0.0004972890638400644, 'samples': 1717440, 'steps': 8944, 'loss/train': 2.160125970840454} -08/30/2021 14:46:15 - INFO - __main__ - Step 8946: {'lr': 0.0004972882843989687, 'samples': 1717632, 'steps': 8945, 'loss/train': 1.9607785940170288} -08/30/2021 14:46:15 - INFO - __main__ - Step 8947: {'lr': 0.0004972875048464487, 'samples': 1717824, 'steps': 8946, 'loss/train': 0.3123684823513031} -08/30/2021 14:46:15 - INFO - __main__ - Step 8948: {'lr': 0.0004972867251825048, 'samples': 1718016, 'steps': 8947, 'loss/train': 1.7114638090133667} -08/30/2021 14:46:16 - INFO - __main__ - Step 8949: {'lr': 0.0004972859454071373, 'samples': 1718208, 'steps': 8948, 'loss/train': 1.0696732997894287} -08/30/2021 14:46:17 - INFO - __main__ - Step 8950: {'lr': 0.0004972851655203465, 'samples': 1718400, 'steps': 8949, 'loss/train': 2.3935022354125977} -08/30/2021 14:46:18 - INFO - __main__ - Step 8951: {'lr': 0.000497284385522133, 'samples': 1718592, 'steps': 8950, 'loss/train': 1.9937423467636108} -08/30/2021 14:46:18 - INFO - __main__ - Step 8952: {'lr': 0.0004972836054124968, 'samples': 1718784, 'steps': 8951, 'loss/train': 1.2871404886245728} -08/30/2021 14:46:18 - INFO - __main__ - Step 8953: {'lr': 0.0004972828251914384, 'samples': 1718976, 'steps': 8952, 'loss/train': 1.8947973251342773} -08/30/2021 14:46:19 - INFO - __main__ - Step 8954: {'lr': 0.0004972820448589584, 'samples': 1719168, 'steps': 8953, 'loss/train': 2.2932281494140625} -08/30/2021 14:46:21 - INFO - __main__ - Step 8955: {'lr': 0.0004972812644150567, 'samples': 1719360, 'steps': 8954, 'loss/train': 2.2850396633148193} -08/30/2021 14:46:21 - INFO - __main__ - Step 8956: {'lr': 0.000497280483859734, 'samples': 1719552, 'steps': 8955, 'loss/train': 2.493499279022217} -08/30/2021 14:46:21 - INFO - __main__ - Step 8957: {'lr': 0.0004972797031929904, 'samples': 1719744, 'steps': 8956, 'loss/train': 1.801703929901123} -08/30/2021 14:46:22 - INFO - __main__ - Step 8958: {'lr': 0.0004972789224148266, 'samples': 1719936, 'steps': 8957, 'loss/train': 0.33974945545196533} -08/30/2021 14:46:22 - INFO - __main__ - Step 8959: {'lr': 0.0004972781415252426, 'samples': 1720128, 'steps': 8958, 'loss/train': 1.8467414379119873} -08/30/2021 14:46:24 - INFO - __main__ - Step 8960: {'lr': 0.0004972773605242388, 'samples': 1720320, 'steps': 8959, 'loss/train': 1.8445549011230469} -08/30/2021 14:46:24 - INFO - __main__ - Step 8961: {'lr': 0.0004972765794118158, 'samples': 1720512, 'steps': 8960, 'loss/train': 2.001028060913086} -08/30/2021 14:46:24 - INFO - __main__ - Step 8962: {'lr': 0.0004972757981879737, 'samples': 1720704, 'steps': 8961, 'loss/train': 1.944581151008606} -08/30/2021 14:46:25 - INFO - __main__ - Step 8963: {'lr': 0.000497275016852713, 'samples': 1720896, 'steps': 8962, 'loss/train': 0.15324637293815613} -08/30/2021 14:46:25 - INFO - __main__ - Step 8964: {'lr': 0.0004972742354060339, 'samples': 1721088, 'steps': 8963, 'loss/train': 2.0042412281036377} -08/30/2021 14:46:27 - INFO - __main__ - Step 8965: {'lr': 0.0004972734538479369, 'samples': 1721280, 'steps': 8964, 'loss/train': 2.059574604034424} -08/30/2021 14:46:27 - INFO - __main__ - Step 8966: {'lr': 0.0004972726721784223, 'samples': 1721472, 'steps': 8965, 'loss/train': 1.6372652053833008} -08/30/2021 14:46:28 - INFO - __main__ - Step 8967: {'lr': 0.0004972718903974904, 'samples': 1721664, 'steps': 8966, 'loss/train': 1.243790864944458} -08/30/2021 14:46:28 - INFO - __main__ - Step 8968: {'lr': 0.0004972711085051417, 'samples': 1721856, 'steps': 8967, 'loss/train': 1.6012420654296875} -08/30/2021 14:46:28 - INFO - __main__ - Step 8969: {'lr': 0.0004972703265013764, 'samples': 1722048, 'steps': 8968, 'loss/train': 1.6654213666915894} -08/30/2021 14:46:30 - INFO - __main__ - Step 8970: {'lr': 0.0004972695443861949, 'samples': 1722240, 'steps': 8969, 'loss/train': 2.1250109672546387} -08/30/2021 14:46:30 - INFO - __main__ - Step 8971: {'lr': 0.0004972687621595975, 'samples': 1722432, 'steps': 8970, 'loss/train': 1.3418915271759033} -08/30/2021 14:46:31 - INFO - __main__ - Step 8972: {'lr': 0.0004972679798215847, 'samples': 1722624, 'steps': 8971, 'loss/train': 1.7405096292495728} -08/30/2021 14:46:31 - INFO - __main__ - Step 8973: {'lr': 0.0004972671973721567, 'samples': 1722816, 'steps': 8972, 'loss/train': 1.445396065711975} -08/30/2021 14:46:31 - INFO - __main__ - Step 8974: {'lr': 0.000497266414811314, 'samples': 1723008, 'steps': 8973, 'loss/train': 1.874290108680725} -08/30/2021 14:46:32 - INFO - __main__ - Step 8975: {'lr': 0.0004972656321390568, 'samples': 1723200, 'steps': 8974, 'loss/train': 1.9991459846496582} -08/30/2021 14:46:33 - INFO - __main__ - Step 8976: {'lr': 0.0004972648493553856, 'samples': 1723392, 'steps': 8975, 'loss/train': 1.369490385055542} -08/30/2021 14:46:34 - INFO - __main__ - Step 8977: {'lr': 0.0004972640664603006, 'samples': 1723584, 'steps': 8976, 'loss/train': 2.310957670211792} -08/30/2021 14:46:34 - INFO - __main__ - Step 8978: {'lr': 0.0004972632834538023, 'samples': 1723776, 'steps': 8977, 'loss/train': 2.124022960662842} -08/30/2021 14:46:34 - INFO - __main__ - Step 8979: {'lr': 0.0004972625003358908, 'samples': 1723968, 'steps': 8978, 'loss/train': 1.5275260210037231} -08/30/2021 14:46:35 - INFO - __main__ - Step 8980: {'lr': 0.0004972617171065668, 'samples': 1724160, 'steps': 8979, 'loss/train': 1.8284701108932495} -08/30/2021 14:46:37 - INFO - __main__ - Step 8981: {'lr': 0.0004972609337658305, 'samples': 1724352, 'steps': 8980, 'loss/train': 2.2119197845458984} -08/30/2021 14:46:37 - INFO - __main__ - Step 8982: {'lr': 0.0004972601503136822, 'samples': 1724544, 'steps': 8981, 'loss/train': 1.2716857194900513} -08/30/2021 14:46:38 - INFO - __main__ - Step 8983: {'lr': 0.0004972593667501222, 'samples': 1724736, 'steps': 8982, 'loss/train': 1.8443129062652588} -08/30/2021 14:46:38 - INFO - __main__ - Step 8984: {'lr': 0.0004972585830751511, 'samples': 1724928, 'steps': 8983, 'loss/train': 2.1716959476470947} -08/30/2021 14:46:38 - INFO - __main__ - Step 8985: {'lr': 0.0004972577992887689, 'samples': 1725120, 'steps': 8984, 'loss/train': 2.3679816722869873} -08/30/2021 14:46:39 - INFO - __main__ - Step 8986: {'lr': 0.0004972570153909763, 'samples': 1725312, 'steps': 8985, 'loss/train': 1.4090771675109863} -08/30/2021 14:46:40 - INFO - __main__ - Step 8987: {'lr': 0.0004972562313817735, 'samples': 1725504, 'steps': 8986, 'loss/train': 5.555885314941406} -08/30/2021 14:46:41 - INFO - __main__ - Step 8988: {'lr': 0.0004972554472611609, 'samples': 1725696, 'steps': 8987, 'loss/train': 1.9008162021636963} -08/30/2021 14:46:41 - INFO - __main__ - Step 8989: {'lr': 0.0004972546630291387, 'samples': 1725888, 'steps': 8988, 'loss/train': 2.138808012008667} -08/30/2021 14:46:41 - INFO - __main__ - Step 8990: {'lr': 0.0004972538786857073, 'samples': 1726080, 'steps': 8989, 'loss/train': 2.1921675205230713} -08/30/2021 14:46:42 - INFO - __main__ - Step 8991: {'lr': 0.0004972530942308673, 'samples': 1726272, 'steps': 8990, 'loss/train': 1.5733258724212646} -08/30/2021 14:46:43 - INFO - __main__ - Step 8992: {'lr': 0.0004972523096646188, 'samples': 1726464, 'steps': 8991, 'loss/train': 1.8545182943344116} -08/30/2021 14:46:44 - INFO - __main__ - Step 8993: {'lr': 0.0004972515249869622, 'samples': 1726656, 'steps': 8992, 'loss/train': 2.081447124481201} -08/30/2021 14:46:44 - INFO - __main__ - Step 8994: {'lr': 0.000497250740197898, 'samples': 1726848, 'steps': 8993, 'loss/train': 1.9429447650909424} -08/30/2021 14:46:44 - INFO - __main__ - Step 8995: {'lr': 0.0004972499552974263, 'samples': 1727040, 'steps': 8994, 'loss/train': 1.5408134460449219} -08/30/2021 14:46:45 - INFO - __main__ - Step 8996: {'lr': 0.0004972491702855477, 'samples': 1727232, 'steps': 8995, 'loss/train': 2.4530506134033203} -08/30/2021 14:46:46 - INFO - __main__ - Step 8997: {'lr': 0.0004972483851622623, 'samples': 1727424, 'steps': 8996, 'loss/train': 1.8891547918319702} -08/30/2021 14:46:47 - INFO - __main__ - Step 8998: {'lr': 0.0004972475999275707, 'samples': 1727616, 'steps': 8997, 'loss/train': 2.088207721710205} -08/30/2021 14:46:47 - INFO - __main__ - Step 8999: {'lr': 0.0004972468145814729, 'samples': 1727808, 'steps': 8998, 'loss/train': 2.1565043926239014} -08/30/2021 14:46:47 - INFO - __main__ - Step 9000: {'lr': 0.0004972460291239697, 'samples': 1728000, 'steps': 8999, 'loss/train': 1.3041085004806519} -08/30/2021 14:46:48 - INFO - __main__ - Step 9001: {'lr': 0.0004972452435550613, 'samples': 1728192, 'steps': 9000, 'loss/train': 1.81965172290802} -08/30/2021 14:46:49 - INFO - __main__ - Step 9002: {'lr': 0.000497244457874748, 'samples': 1728384, 'steps': 9001, 'loss/train': 2.1079812049865723} -08/30/2021 14:46:50 - INFO - __main__ - Step 9003: {'lr': 0.0004972436720830301, 'samples': 1728576, 'steps': 9002, 'loss/train': 1.979142665863037} -08/30/2021 14:46:50 - INFO - __main__ - Step 9004: {'lr': 0.000497242886179908, 'samples': 1728768, 'steps': 9003, 'loss/train': 2.252262830734253} -08/30/2021 14:46:50 - INFO - __main__ - Step 9005: {'lr': 0.0004972421001653822, 'samples': 1728960, 'steps': 9004, 'loss/train': 1.3209646940231323} -08/30/2021 14:46:51 - INFO - __main__ - Step 9006: {'lr': 0.0004972413140394528, 'samples': 1729152, 'steps': 9005, 'loss/train': 1.8071860074996948} -08/30/2021 14:46:52 - INFO - __main__ - Step 9007: {'lr': 0.0004972405278021203, 'samples': 1729344, 'steps': 9006, 'loss/train': 1.5674419403076172} -08/30/2021 14:46:53 - INFO - __main__ - Step 9008: {'lr': 0.000497239741453385, 'samples': 1729536, 'steps': 9007, 'loss/train': 2.1593832969665527} -08/30/2021 14:46:53 - INFO - __main__ - Step 9009: {'lr': 0.0004972389549932473, 'samples': 1729728, 'steps': 9008, 'loss/train': 1.8619449138641357} -08/30/2021 14:46:53 - INFO - __main__ - Step 9010: {'lr': 0.0004972381684217077, 'samples': 1729920, 'steps': 9009, 'loss/train': 1.7730443477630615} -08/30/2021 14:46:54 - INFO - __main__ - Step 9011: {'lr': 0.0004972373817387662, 'samples': 1730112, 'steps': 9010, 'loss/train': 0.21746385097503662} -08/30/2021 14:46:55 - INFO - __main__ - Step 9012: {'lr': 0.0004972365949444234, 'samples': 1730304, 'steps': 9011, 'loss/train': 1.2569061517715454} -08/30/2021 14:46:56 - INFO - __main__ - Step 9013: {'lr': 0.0004972358080386796, 'samples': 1730496, 'steps': 9012, 'loss/train': 1.710551381111145} -08/30/2021 14:46:56 - INFO - __main__ - Step 9014: {'lr': 0.0004972350210215353, 'samples': 1730688, 'steps': 9013, 'loss/train': 1.9982478618621826} -08/30/2021 14:46:56 - INFO - __main__ - Step 9015: {'lr': 0.0004972342338929906, 'samples': 1730880, 'steps': 9014, 'loss/train': 1.455694317817688} -08/30/2021 14:46:57 - INFO - __main__ - Step 9016: {'lr': 0.000497233446653046, 'samples': 1731072, 'steps': 9015, 'loss/train': 1.478135347366333} -08/30/2021 14:46:58 - INFO - __main__ - Step 9017: {'lr': 0.0004972326593017017, 'samples': 1731264, 'steps': 9016, 'loss/train': 0.3686990439891815} -08/30/2021 14:46:59 - INFO - __main__ - Step 9018: {'lr': 0.0004972318718389583, 'samples': 1731456, 'steps': 9017, 'loss/train': 2.315657138824463} -08/30/2021 14:46:59 - INFO - __main__ - Step 9019: {'lr': 0.000497231084264816, 'samples': 1731648, 'steps': 9018, 'loss/train': 1.9352573156356812} -08/30/2021 14:46:59 - INFO - __main__ - Step 9020: {'lr': 0.0004972302965792752, 'samples': 1731840, 'steps': 9019, 'loss/train': 1.8115142583847046} -08/30/2021 14:47:00 - INFO - __main__ - Step 9021: {'lr': 0.0004972295087823362, 'samples': 1732032, 'steps': 9020, 'loss/train': 2.0826833248138428} -08/30/2021 14:47:00 - INFO - __main__ - Step 9022: {'lr': 0.0004972287208739995, 'samples': 1732224, 'steps': 9021, 'loss/train': 2.076280355453491} -08/30/2021 14:47:02 - INFO - __main__ - Step 9023: {'lr': 0.0004972279328542652, 'samples': 1732416, 'steps': 9022, 'loss/train': 1.655226469039917} -08/30/2021 14:47:02 - INFO - __main__ - Step 9024: {'lr': 0.000497227144723134, 'samples': 1732608, 'steps': 9023, 'loss/train': 1.9644949436187744} -08/30/2021 14:47:02 - INFO - __main__ - Step 9025: {'lr': 0.0004972263564806059, 'samples': 1732800, 'steps': 9024, 'loss/train': 1.738426685333252} -08/30/2021 14:47:03 - INFO - __main__ - Step 9026: {'lr': 0.0004972255681266816, 'samples': 1732992, 'steps': 9025, 'loss/train': 2.129232406616211} -08/30/2021 14:47:03 - INFO - __main__ - Step 9027: {'lr': 0.0004972247796613611, 'samples': 1733184, 'steps': 9026, 'loss/train': 1.6423194408416748} -08/30/2021 14:47:05 - INFO - __main__ - Step 9028: {'lr': 0.000497223991084645, 'samples': 1733376, 'steps': 9027, 'loss/train': 2.716042995452881} -08/30/2021 14:47:05 - INFO - __main__ - Step 9029: {'lr': 0.0004972232023965335, 'samples': 1733568, 'steps': 9028, 'loss/train': 1.9740265607833862} -08/30/2021 14:47:06 - INFO - __main__ - Step 9030: {'lr': 0.0004972224135970271, 'samples': 1733760, 'steps': 9029, 'loss/train': 2.0346691608428955} -08/30/2021 14:47:06 - INFO - __main__ - Step 9031: {'lr': 0.0004972216246861262, 'samples': 1733952, 'steps': 9030, 'loss/train': 1.3250304460525513} -08/30/2021 14:47:06 - INFO - __main__ - Step 9032: {'lr': 0.0004972208356638309, 'samples': 1734144, 'steps': 9031, 'loss/train': 0.7586222290992737} -08/30/2021 14:47:08 - INFO - __main__ - Step 9033: {'lr': 0.0004972200465301418, 'samples': 1734336, 'steps': 9032, 'loss/train': 0.13911418616771698} -08/30/2021 14:47:08 - INFO - __main__ - Step 9034: {'lr': 0.0004972192572850592, 'samples': 1734528, 'steps': 9033, 'loss/train': 2.3646790981292725} -08/30/2021 14:47:09 - INFO - __main__ - Step 9035: {'lr': 0.0004972184679285833, 'samples': 1734720, 'steps': 9034, 'loss/train': 2.102095603942871} -08/30/2021 14:47:09 - INFO - __main__ - Step 9036: {'lr': 0.0004972176784607146, 'samples': 1734912, 'steps': 9035, 'loss/train': 1.5774246454238892} -08/30/2021 14:47:09 - INFO - __main__ - Step 9037: {'lr': 0.0004972168888814533, 'samples': 1735104, 'steps': 9036, 'loss/train': 1.9236433506011963} -08/30/2021 14:47:11 - INFO - __main__ - Step 9038: {'lr': 0.0004972160991908001, 'samples': 1735296, 'steps': 9037, 'loss/train': 2.431725263595581} -08/30/2021 14:47:12 - INFO - __main__ - Step 9039: {'lr': 0.0004972153093887551, 'samples': 1735488, 'steps': 9038, 'loss/train': 2.3673272132873535} -08/30/2021 14:47:12 - INFO - __main__ - Step 9040: {'lr': 0.0004972145194753186, 'samples': 1735680, 'steps': 9039, 'loss/train': 1.0304653644561768} -08/30/2021 14:47:13 - INFO - __main__ - Step 9041: {'lr': 0.0004972137294504912, 'samples': 1735872, 'steps': 9040, 'loss/train': 2.5453944206237793} -08/30/2021 14:47:13 - INFO - __main__ - Step 9042: {'lr': 0.000497212939314273, 'samples': 1736064, 'steps': 9041, 'loss/train': 2.106966257095337} -08/30/2021 14:47:13 - INFO - __main__ - Step 9043: {'lr': 0.0004972121490666644, 'samples': 1736256, 'steps': 9042, 'loss/train': 1.8059356212615967} -08/30/2021 14:47:15 - INFO - __main__ - Step 9044: {'lr': 0.000497211358707666, 'samples': 1736448, 'steps': 9043, 'loss/train': 5.437865257263184} -08/30/2021 14:47:15 - INFO - __main__ - Step 9045: {'lr': 0.0004972105682372779, 'samples': 1736640, 'steps': 9044, 'loss/train': 0.7333853840827942} -08/30/2021 14:47:16 - INFO - __main__ - Step 9046: {'lr': 0.0004972097776555005, 'samples': 1736832, 'steps': 9045, 'loss/train': 4.125444412231445} -08/30/2021 14:47:16 - INFO - __main__ - Step 9047: {'lr': 0.0004972089869623342, 'samples': 1737024, 'steps': 9046, 'loss/train': 2.1651124954223633} -08/30/2021 14:47:16 - INFO - __main__ - Step 9048: {'lr': 0.0004972081961577793, 'samples': 1737216, 'steps': 9047, 'loss/train': 1.1374707221984863} -08/30/2021 14:47:17 - INFO - __main__ - Step 9049: {'lr': 0.0004972074052418363, 'samples': 1737408, 'steps': 9048, 'loss/train': 1.8395694494247437} -08/30/2021 14:47:18 - INFO - __main__ - Step 9050: {'lr': 0.0004972066142145055, 'samples': 1737600, 'steps': 9049, 'loss/train': 2.260136127471924} -08/30/2021 14:47:19 - INFO - __main__ - Step 9051: {'lr': 0.0004972058230757871, 'samples': 1737792, 'steps': 9050, 'loss/train': 1.9717533588409424} -08/30/2021 14:47:19 - INFO - __main__ - Step 9052: {'lr': 0.0004972050318256815, 'samples': 1737984, 'steps': 9051, 'loss/train': 2.301158905029297} -08/30/2021 14:47:19 - INFO - __main__ - Step 9053: {'lr': 0.0004972042404641893, 'samples': 1738176, 'steps': 9052, 'loss/train': 2.252315044403076} -08/30/2021 14:47:20 - INFO - __main__ - Step 9054: {'lr': 0.0004972034489913106, 'samples': 1738368, 'steps': 9053, 'loss/train': 2.236299753189087} -08/30/2021 14:47:21 - INFO - __main__ - Step 9055: {'lr': 0.0004972026574070459, 'samples': 1738560, 'steps': 9054, 'loss/train': 2.087787389755249} -08/30/2021 14:47:22 - INFO - __main__ - Step 9056: {'lr': 0.0004972018657113953, 'samples': 1738752, 'steps': 9055, 'loss/train': 2.945784330368042} -08/30/2021 14:47:22 - INFO - __main__ - Step 9057: {'lr': 0.0004972010739043596, 'samples': 1738944, 'steps': 9056, 'loss/train': 2.9534263610839844} -08/30/2021 14:47:22 - INFO - __main__ - Step 9058: {'lr': 0.0004972002819859388, 'samples': 1739136, 'steps': 9057, 'loss/train': 2.2367610931396484} -08/30/2021 14:47:23 - INFO - __main__ - Step 9059: {'lr': 0.0004971994899561334, 'samples': 1739328, 'steps': 9058, 'loss/train': 2.444326162338257} -08/30/2021 14:47:24 - INFO - __main__ - Step 9060: {'lr': 0.0004971986978149437, 'samples': 1739520, 'steps': 9059, 'loss/train': 1.7260419130325317} -08/30/2021 14:47:25 - INFO - __main__ - Step 9061: {'lr': 0.0004971979055623701, 'samples': 1739712, 'steps': 9060, 'loss/train': 2.3490841388702393} -08/30/2021 14:47:25 - INFO - __main__ - Step 9062: {'lr': 0.0004971971131984129, 'samples': 1739904, 'steps': 9061, 'loss/train': 1.640828013420105} -08/30/2021 14:47:25 - INFO - __main__ - Step 9063: {'lr': 0.0004971963207230725, 'samples': 1740096, 'steps': 9062, 'loss/train': 2.176591634750366} -08/30/2021 14:47:26 - INFO - __main__ - Step 9064: {'lr': 0.0004971955281363493, 'samples': 1740288, 'steps': 9063, 'loss/train': 2.0326313972473145} -08/30/2021 14:47:27 - INFO - __main__ - Step 9065: {'lr': 0.0004971947354382436, 'samples': 1740480, 'steps': 9064, 'loss/train': 1.402564525604248} -08/30/2021 14:47:28 - INFO - __main__ - Step 9066: {'lr': 0.0004971939426287557, 'samples': 1740672, 'steps': 9065, 'loss/train': 2.0635030269622803} -08/30/2021 14:47:28 - INFO - __main__ - Step 9067: {'lr': 0.0004971931497078861, 'samples': 1740864, 'steps': 9066, 'loss/train': 0.9907790422439575} -08/30/2021 14:47:28 - INFO - __main__ - Step 9068: {'lr': 0.000497192356675635, 'samples': 1741056, 'steps': 9067, 'loss/train': 2.3744184970855713} -08/30/2021 14:47:29 - INFO - __main__ - Step 9069: {'lr': 0.0004971915635320029, 'samples': 1741248, 'steps': 9068, 'loss/train': 2.2521064281463623} -08/30/2021 14:47:29 - INFO - __main__ - Step 9070: {'lr': 0.0004971907702769901, 'samples': 1741440, 'steps': 9069, 'loss/train': 1.4979050159454346} -08/30/2021 14:47:31 - INFO - __main__ - Step 9071: {'lr': 0.000497189976910597, 'samples': 1741632, 'steps': 9070, 'loss/train': 2.048565149307251} -08/30/2021 14:47:31 - INFO - __main__ - Step 9072: {'lr': 0.0004971891834328238, 'samples': 1741824, 'steps': 9071, 'loss/train': 1.8345752954483032} -08/30/2021 14:47:31 - INFO - __main__ - Step 9073: {'lr': 0.000497188389843671, 'samples': 1742016, 'steps': 9072, 'loss/train': 1.6389049291610718} -08/30/2021 14:47:32 - INFO - __main__ - Step 9074: {'lr': 0.0004971875961431389, 'samples': 1742208, 'steps': 9073, 'loss/train': 2.1482186317443848} -08/30/2021 14:47:32 - INFO - __main__ - Step 9075: {'lr': 0.000497186802331228, 'samples': 1742400, 'steps': 9074, 'loss/train': 2.09512996673584} -08/30/2021 14:47:34 - INFO - __main__ - Step 9076: {'lr': 0.0004971860084079385, 'samples': 1742592, 'steps': 9075, 'loss/train': 2.276905059814453} -08/30/2021 14:47:34 - INFO - __main__ - Step 9077: {'lr': 0.0004971852143732707, 'samples': 1742784, 'steps': 9076, 'loss/train': 1.8982940912246704} -08/30/2021 14:47:35 - INFO - __main__ - Step 9078: {'lr': 0.0004971844202272251, 'samples': 1742976, 'steps': 9077, 'loss/train': 1.3196507692337036} -08/30/2021 14:47:35 - INFO - __main__ - Step 9079: {'lr': 0.000497183625969802, 'samples': 1743168, 'steps': 9078, 'loss/train': 1.0520685911178589} -08/30/2021 14:47:35 - INFO - __main__ - Step 9080: {'lr': 0.0004971828316010019, 'samples': 1743360, 'steps': 9079, 'loss/train': 2.0894603729248047} -08/30/2021 14:47:36 - INFO - __main__ - Step 9081: {'lr': 0.0004971820371208248, 'samples': 1743552, 'steps': 9080, 'loss/train': 2.3856382369995117} -08/30/2021 14:47:37 - INFO - __main__ - Step 9082: {'lr': 0.0004971812425292716, 'samples': 1743744, 'steps': 9081, 'loss/train': 1.1970280408859253} -08/30/2021 14:47:38 - INFO - __main__ - Step 9083: {'lr': 0.000497180447826342, 'samples': 1743936, 'steps': 9082, 'loss/train': 1.8861169815063477} -08/30/2021 14:47:38 - INFO - __main__ - Step 9084: {'lr': 0.0004971796530120371, 'samples': 1744128, 'steps': 9083, 'loss/train': 1.9659919738769531} -08/30/2021 14:47:38 - INFO - __main__ - Step 9085: {'lr': 0.0004971788580863566, 'samples': 1744320, 'steps': 9084, 'loss/train': 1.5286049842834473} -08/30/2021 14:47:39 - INFO - __main__ - Step 9086: {'lr': 0.0004971780630493012, 'samples': 1744512, 'steps': 9085, 'loss/train': 2.2692182064056396} -08/30/2021 14:47:40 - INFO - __main__ - Step 9087: {'lr': 0.000497177267900871, 'samples': 1744704, 'steps': 9086, 'loss/train': 2.5457873344421387} -08/30/2021 14:47:41 - INFO - __main__ - Step 9088: {'lr': 0.0004971764726410668, 'samples': 1744896, 'steps': 9087, 'loss/train': 1.9081003665924072} -08/30/2021 14:47:41 - INFO - __main__ - Step 9089: {'lr': 0.0004971756772698886, 'samples': 1745088, 'steps': 9088, 'loss/train': 1.959722638130188} -08/30/2021 14:47:41 - INFO - __main__ - Step 9090: {'lr': 0.0004971748817873367, 'samples': 1745280, 'steps': 9089, 'loss/train': 2.1897709369659424} -08/30/2021 14:47:42 - INFO - __main__ - Step 9091: {'lr': 0.0004971740861934117, 'samples': 1745472, 'steps': 9090, 'loss/train': 1.7882908582687378} -08/30/2021 14:47:44 - INFO - __main__ - Step 9092: {'lr': 0.000497173290488114, 'samples': 1745664, 'steps': 9091, 'loss/train': 1.8940757513046265} -08/30/2021 14:47:45 - INFO - __main__ - Step 9093: {'lr': 0.0004971724946714437, 'samples': 1745856, 'steps': 9092, 'loss/train': 1.9856022596359253} -08/30/2021 14:47:45 - INFO - __main__ - Step 9094: {'lr': 0.0004971716987434014, 'samples': 1746048, 'steps': 9093, 'loss/train': 2.1157851219177246} -08/30/2021 14:47:45 - INFO - __main__ - Step 9095: {'lr': 0.0004971709027039872, 'samples': 1746240, 'steps': 9094, 'loss/train': 1.0603735446929932} -08/30/2021 14:47:46 - INFO - __main__ - Step 9096: {'lr': 0.0004971701065532017, 'samples': 1746432, 'steps': 9095, 'loss/train': 1.6940349340438843} -08/30/2021 14:47:46 - INFO - __main__ - Step 9097: {'lr': 0.0004971693102910451, 'samples': 1746624, 'steps': 9096, 'loss/train': 2.09838604927063} -08/30/2021 14:47:47 - INFO - __main__ - Step 9098: {'lr': 0.0004971685139175179, 'samples': 1746816, 'steps': 9097, 'loss/train': 1.5774281024932861} -08/30/2021 14:47:48 - INFO - __main__ - Step 9099: {'lr': 0.0004971677174326204, 'samples': 1747008, 'steps': 9098, 'loss/train': 1.008238673210144} -08/30/2021 14:47:48 - INFO - __main__ - Step 9100: {'lr': 0.0004971669208363529, 'samples': 1747200, 'steps': 9099, 'loss/train': 2.993015766143799} -08/30/2021 14:47:49 - INFO - __main__ - Step 9101: {'lr': 0.0004971661241287157, 'samples': 1747392, 'steps': 9100, 'loss/train': 2.0401124954223633} -08/30/2021 14:47:49 - INFO - __main__ - Step 9102: {'lr': 0.0004971653273097094, 'samples': 1747584, 'steps': 9101, 'loss/train': 1.9922418594360352} -08/30/2021 14:47:51 - INFO - __main__ - Step 9103: {'lr': 0.0004971645303793342, 'samples': 1747776, 'steps': 9102, 'loss/train': 2.352294683456421} -08/30/2021 14:47:51 - INFO - __main__ - Step 9104: {'lr': 0.0004971637333375904, 'samples': 1747968, 'steps': 9103, 'loss/train': 2.1351101398468018} -08/30/2021 14:47:51 - INFO - __main__ - Step 9105: {'lr': 0.0004971629361844785, 'samples': 1748160, 'steps': 9104, 'loss/train': 1.8639625310897827} -08/30/2021 14:47:52 - INFO - __main__ - Step 9106: {'lr': 0.0004971621389199988, 'samples': 1748352, 'steps': 9105, 'loss/train': 1.1813985109329224} -08/30/2021 14:47:52 - INFO - __main__ - Step 9107: {'lr': 0.0004971613415441516, 'samples': 1748544, 'steps': 9106, 'loss/train': 0.2463376671075821} -08/30/2021 14:47:54 - INFO - __main__ - Step 9108: {'lr': 0.0004971605440569374, 'samples': 1748736, 'steps': 9107, 'loss/train': 1.4703516960144043} -08/30/2021 14:47:54 - INFO - __main__ - Step 9109: {'lr': 0.0004971597464583563, 'samples': 1748928, 'steps': 9108, 'loss/train': 2.059968948364258} -08/30/2021 14:47:54 - INFO - __main__ - Step 9110: {'lr': 0.0004971589487484091, 'samples': 1749120, 'steps': 9109, 'loss/train': 1.6971399784088135} -08/30/2021 14:47:55 - INFO - __main__ - Step 9111: {'lr': 0.0004971581509270956, 'samples': 1749312, 'steps': 9110, 'loss/train': 2.133328914642334} -08/30/2021 14:47:55 - INFO - __main__ - Step 9112: {'lr': 0.0004971573529944167, 'samples': 1749504, 'steps': 9111, 'loss/train': 1.024994969367981} -08/30/2021 14:47:57 - INFO - __main__ - Step 9113: {'lr': 0.0004971565549503723, 'samples': 1749696, 'steps': 9112, 'loss/train': 2.169511318206787} -08/30/2021 14:47:57 - INFO - __main__ - Step 9114: {'lr': 0.0004971557567949631, 'samples': 1749888, 'steps': 9113, 'loss/train': 2.1940808296203613} -08/30/2021 14:47:58 - INFO - __main__ - Step 9115: {'lr': 0.0004971549585281893, 'samples': 1750080, 'steps': 9114, 'loss/train': 1.2247960567474365} -08/30/2021 14:47:58 - INFO - __main__ - Step 9116: {'lr': 0.0004971541601500513, 'samples': 1750272, 'steps': 9115, 'loss/train': 1.9117571115493774} -08/30/2021 14:47:58 - INFO - __main__ - Step 9117: {'lr': 0.0004971533616605495, 'samples': 1750464, 'steps': 9116, 'loss/train': 2.526611328125} -08/30/2021 14:48:00 - INFO - __main__ - Step 9118: {'lr': 0.0004971525630596841, 'samples': 1750656, 'steps': 9117, 'loss/train': 2.296067714691162} -08/30/2021 14:48:00 - INFO - __main__ - Step 9119: {'lr': 0.0004971517643474556, 'samples': 1750848, 'steps': 9118, 'loss/train': 1.3903931379318237} -08/30/2021 14:48:01 - INFO - __main__ - Step 9120: {'lr': 0.0004971509655238643, 'samples': 1751040, 'steps': 9119, 'loss/train': 2.030454397201538} -08/30/2021 14:48:01 - INFO - __main__ - Step 9121: {'lr': 0.0004971501665889107, 'samples': 1751232, 'steps': 9120, 'loss/train': 2.2768170833587646} -08/30/2021 14:48:01 - INFO - __main__ - Step 9122: {'lr': 0.000497149367542595, 'samples': 1751424, 'steps': 9121, 'loss/train': 2.0302062034606934} -08/30/2021 14:48:03 - INFO - __main__ - Step 9123: {'lr': 0.0004971485683849176, 'samples': 1751616, 'steps': 9122, 'loss/train': 2.2915782928466797} -08/30/2021 14:48:04 - INFO - __main__ - Step 9124: {'lr': 0.0004971477691158788, 'samples': 1751808, 'steps': 9123, 'loss/train': 2.106600761413574} -08/30/2021 14:48:04 - INFO - __main__ - Step 9125: {'lr': 0.0004971469697354792, 'samples': 1752000, 'steps': 9124, 'loss/train': 2.216188907623291} -08/30/2021 14:48:04 - INFO - __main__ - Step 9126: {'lr': 0.0004971461702437188, 'samples': 1752192, 'steps': 9125, 'loss/train': 2.044036388397217} -08/30/2021 14:48:05 - INFO - __main__ - Step 9127: {'lr': 0.0004971453706405981, 'samples': 1752384, 'steps': 9126, 'loss/train': 2.044644355773926} -08/30/2021 14:48:05 - INFO - __main__ - Step 9128: {'lr': 0.0004971445709261177, 'samples': 1752576, 'steps': 9127, 'loss/train': 1.7316431999206543} -08/30/2021 14:48:06 - INFO - __main__ - Step 9129: {'lr': 0.0004971437711002777, 'samples': 1752768, 'steps': 9128, 'loss/train': 2.2101809978485107} -08/30/2021 14:48:07 - INFO - __main__ - Step 9130: {'lr': 0.0004971429711630786, 'samples': 1752960, 'steps': 9129, 'loss/train': 1.6328277587890625} -08/30/2021 14:48:07 - INFO - __main__ - Step 9131: {'lr': 0.0004971421711145207, 'samples': 1753152, 'steps': 9130, 'loss/train': 1.7874112129211426} -08/30/2021 14:48:08 - INFO - __main__ - Step 9132: {'lr': 0.0004971413709546043, 'samples': 1753344, 'steps': 9131, 'loss/train': 2.4208216667175293} -08/30/2021 14:48:08 - INFO - __main__ - Step 9133: {'lr': 0.0004971405706833297, 'samples': 1753536, 'steps': 9132, 'loss/train': 1.4205937385559082} -08/30/2021 14:48:09 - INFO - __main__ - Step 9134: {'lr': 0.0004971397703006974, 'samples': 1753728, 'steps': 9133, 'loss/train': 1.6057732105255127} -08/30/2021 14:48:10 - INFO - __main__ - Step 9135: {'lr': 0.0004971389698067079, 'samples': 1753920, 'steps': 9134, 'loss/train': 1.9402657747268677} -08/30/2021 14:48:10 - INFO - __main__ - Step 9136: {'lr': 0.0004971381692013612, 'samples': 1754112, 'steps': 9135, 'loss/train': 1.7869319915771484} -08/30/2021 14:48:11 - INFO - __main__ - Step 9137: {'lr': 0.000497137368484658, 'samples': 1754304, 'steps': 9136, 'loss/train': 1.8371540307998657} -08/30/2021 14:48:11 - INFO - __main__ - Step 9138: {'lr': 0.0004971365676565984, 'samples': 1754496, 'steps': 9137, 'loss/train': 1.7519088983535767} -08/30/2021 14:48:13 - INFO - __main__ - Step 9139: {'lr': 0.000497135766717183, 'samples': 1754688, 'steps': 9138, 'loss/train': 1.834581971168518} -08/30/2021 14:48:13 - INFO - __main__ - Step 9140: {'lr': 0.000497134965666412, 'samples': 1754880, 'steps': 9139, 'loss/train': 1.8342030048370361} -08/30/2021 14:48:13 - INFO - __main__ - Step 9141: {'lr': 0.0004971341645042857, 'samples': 1755072, 'steps': 9140, 'loss/train': 2.3751776218414307} -08/30/2021 14:48:14 - INFO - __main__ - Step 9142: {'lr': 0.0004971333632308047, 'samples': 1755264, 'steps': 9141, 'loss/train': 1.7557752132415771} -08/30/2021 14:48:14 - INFO - __main__ - Step 9143: {'lr': 0.0004971325618459691, 'samples': 1755456, 'steps': 9142, 'loss/train': 1.6465389728546143} -08/30/2021 14:48:17 - INFO - __main__ - Step 9144: {'lr': 0.0004971317603497795, 'samples': 1755648, 'steps': 9143, 'loss/train': 1.9172916412353516} -08/30/2021 14:48:17 - INFO - __main__ - Step 9145: {'lr': 0.000497130958742236, 'samples': 1755840, 'steps': 9144, 'loss/train': 1.1707823276519775} -08/30/2021 14:48:17 - INFO - __main__ - Step 9146: {'lr': 0.0004971301570233392, 'samples': 1756032, 'steps': 9145, 'loss/train': 1.9727407693862915} -08/30/2021 14:48:18 - INFO - __main__ - Step 9147: {'lr': 0.0004971293551930894, 'samples': 1756224, 'steps': 9146, 'loss/train': 0.9874273538589478} -08/30/2021 14:48:18 - INFO - __main__ - Step 9148: {'lr': 0.0004971285532514868, 'samples': 1756416, 'steps': 9147, 'loss/train': 1.1770209074020386} -08/30/2021 14:48:20 - INFO - __main__ - Step 9149: {'lr': 0.000497127751198532, 'samples': 1756608, 'steps': 9148, 'loss/train': 2.8048670291900635} -08/30/2021 14:48:20 - INFO - __main__ - Step 9150: {'lr': 0.0004971269490342252, 'samples': 1756800, 'steps': 9149, 'loss/train': 2.3494205474853516} -08/30/2021 14:48:21 - INFO - __main__ - Step 9151: {'lr': 0.0004971261467585669, 'samples': 1756992, 'steps': 9150, 'loss/train': 1.4400689601898193} -08/30/2021 14:48:21 - INFO - __main__ - Step 9152: {'lr': 0.0004971253443715572, 'samples': 1757184, 'steps': 9151, 'loss/train': 2.275338888168335} -08/30/2021 14:48:21 - INFO - __main__ - Step 9153: {'lr': 0.0004971245418731966, 'samples': 1757376, 'steps': 9152, 'loss/train': 0.3372267782688141} -08/30/2021 14:48:23 - INFO - __main__ - Step 9154: {'lr': 0.0004971237392634857, 'samples': 1757568, 'steps': 9153, 'loss/train': 2.4787211418151855} -08/30/2021 14:48:23 - INFO - __main__ - Step 9155: {'lr': 0.0004971229365424246, 'samples': 1757760, 'steps': 9154, 'loss/train': 1.8553352355957031} -08/30/2021 14:48:24 - INFO - __main__ - Step 9156: {'lr': 0.0004971221337100137, 'samples': 1757952, 'steps': 9155, 'loss/train': 1.895383358001709} -08/30/2021 14:48:24 - INFO - __main__ - Step 9157: {'lr': 0.0004971213307662534, 'samples': 1758144, 'steps': 9156, 'loss/train': 1.497563362121582} -08/30/2021 14:48:24 - INFO - __main__ - Step 9158: {'lr': 0.000497120527711144, 'samples': 1758336, 'steps': 9157, 'loss/train': 1.8233681917190552} -08/30/2021 14:48:26 - INFO - __main__ - Step 9159: {'lr': 0.0004971197245446859, 'samples': 1758528, 'steps': 9158, 'loss/train': 1.5231906175613403} -08/30/2021 14:48:26 - INFO - __main__ - Step 9160: {'lr': 0.0004971189212668794, 'samples': 1758720, 'steps': 9159, 'loss/train': 1.780755877494812} -08/30/2021 14:48:27 - INFO - __main__ - Step 9161: {'lr': 0.0004971181178777251, 'samples': 1758912, 'steps': 9160, 'loss/train': 2.956045150756836} -08/30/2021 14:48:27 - INFO - __main__ - Step 9162: {'lr': 0.0004971173143772231, 'samples': 1759104, 'steps': 9161, 'loss/train': 0.981243908405304} -08/30/2021 14:48:27 - INFO - __main__ - Step 9163: {'lr': 0.0004971165107653738, 'samples': 1759296, 'steps': 9162, 'loss/train': 1.437286615371704} -08/30/2021 14:48:28 - INFO - __main__ - Step 9164: {'lr': 0.0004971157070421776, 'samples': 1759488, 'steps': 9163, 'loss/train': 1.465252161026001} -08/30/2021 14:48:29 - INFO - __main__ - Step 9165: {'lr': 0.000497114903207635, 'samples': 1759680, 'steps': 9164, 'loss/train': 2.0578012466430664} -08/30/2021 14:48:30 - INFO - __main__ - Step 9166: {'lr': 0.0004971140992617462, 'samples': 1759872, 'steps': 9165, 'loss/train': 1.0709028244018555} -08/30/2021 14:48:30 - INFO - __main__ - Step 9167: {'lr': 0.0004971132952045115, 'samples': 1760064, 'steps': 9166, 'loss/train': 2.3895819187164307} -08/30/2021 14:48:30 - INFO - __main__ - Step 9168: {'lr': 0.0004971124910359315, 'samples': 1760256, 'steps': 9167, 'loss/train': 2.0490262508392334} -08/30/2021 14:48:32 - INFO - __main__ - Step 9169: {'lr': 0.0004971116867560064, 'samples': 1760448, 'steps': 9168, 'loss/train': 1.772620677947998} -08/30/2021 14:48:32 - INFO - __main__ - Step 9170: {'lr': 0.0004971108823647365, 'samples': 1760640, 'steps': 9169, 'loss/train': 1.069950819015503} -08/30/2021 14:48:33 - INFO - __main__ - Step 9171: {'lr': 0.0004971100778621223, 'samples': 1760832, 'steps': 9170, 'loss/train': 1.874866247177124} -08/30/2021 14:48:33 - INFO - __main__ - Step 9172: {'lr': 0.0004971092732481641, 'samples': 1761024, 'steps': 9171, 'loss/train': 2.2963037490844727} -08/30/2021 14:48:33 - INFO - __main__ - Step 9173: {'lr': 0.0004971084685228623, 'samples': 1761216, 'steps': 9172, 'loss/train': 2.192671298980713} -08/30/2021 14:48:34 - INFO - __main__ - Step 9174: {'lr': 0.0004971076636862172, 'samples': 1761408, 'steps': 9173, 'loss/train': 1.6010810136795044} -08/30/2021 14:48:35 - INFO - __main__ - Step 9175: {'lr': 0.0004971068587382293, 'samples': 1761600, 'steps': 9174, 'loss/train': 1.7634247541427612} -08/30/2021 14:48:36 - INFO - __main__ - Step 9176: {'lr': 0.0004971060536788988, 'samples': 1761792, 'steps': 9175, 'loss/train': 2.308720350265503} -08/30/2021 14:48:36 - INFO - __main__ - Step 9177: {'lr': 0.000497105248508226, 'samples': 1761984, 'steps': 9176, 'loss/train': 1.5760347843170166} -08/30/2021 14:48:36 - INFO - __main__ - Step 9178: {'lr': 0.0004971044432262115, 'samples': 1762176, 'steps': 9177, 'loss/train': 2.1757302284240723} -08/30/2021 14:48:37 - INFO - __main__ - Step 9179: {'lr': 0.0004971036378328556, 'samples': 1762368, 'steps': 9178, 'loss/train': 1.770199179649353} -08/30/2021 14:48:38 - INFO - __main__ - Step 9180: {'lr': 0.0004971028323281586, 'samples': 1762560, 'steps': 9179, 'loss/train': 1.6086231470108032} -08/30/2021 14:48:39 - INFO - __main__ - Step 9181: {'lr': 0.0004971020267121208, 'samples': 1762752, 'steps': 9180, 'loss/train': 1.730339765548706} -08/30/2021 14:48:39 - INFO - __main__ - Step 9182: {'lr': 0.0004971012209847427, 'samples': 1762944, 'steps': 9181, 'loss/train': 2.1406893730163574} -08/30/2021 14:48:40 - INFO - __main__ - Step 9183: {'lr': 0.0004971004151460245, 'samples': 1763136, 'steps': 9182, 'loss/train': 0.3436744213104248} -08/30/2021 14:48:40 - INFO - __main__ - Step 9184: {'lr': 0.0004970996091959668, 'samples': 1763328, 'steps': 9183, 'loss/train': 2.0354251861572266} -08/30/2021 14:48:42 - INFO - __main__ - Step 9185: {'lr': 0.0004970988031345698, 'samples': 1763520, 'steps': 9184, 'loss/train': 1.9346362352371216} -08/30/2021 14:48:43 - INFO - __main__ - Step 9186: {'lr': 0.0004970979969618338, 'samples': 1763712, 'steps': 9185, 'loss/train': 1.3773599863052368} -08/30/2021 14:48:43 - INFO - __main__ - Step 9187: {'lr': 0.0004970971906777593, 'samples': 1763904, 'steps': 9186, 'loss/train': 2.4897844791412354} -08/30/2021 14:48:43 - INFO - __main__ - Step 9188: {'lr': 0.0004970963842823468, 'samples': 1764096, 'steps': 9187, 'loss/train': 1.7319952249526978} -08/30/2021 14:48:44 - INFO - __main__ - Step 9189: {'lr': 0.0004970955777755963, 'samples': 1764288, 'steps': 9188, 'loss/train': 2.0576400756835938} -08/30/2021 14:48:45 - INFO - __main__ - Step 9190: {'lr': 0.0004970947711575083, 'samples': 1764480, 'steps': 9189, 'loss/train': 2.112687349319458} -08/30/2021 14:48:46 - INFO - __main__ - Step 9191: {'lr': 0.0004970939644280833, 'samples': 1764672, 'steps': 9190, 'loss/train': 1.8706601858139038} -08/30/2021 14:48:46 - INFO - __main__ - Step 9192: {'lr': 0.0004970931575873215, 'samples': 1764864, 'steps': 9191, 'loss/train': 2.5577428340911865} -08/30/2021 14:48:46 - INFO - __main__ - Step 9193: {'lr': 0.0004970923506352234, 'samples': 1765056, 'steps': 9192, 'loss/train': 1.8557285070419312} -08/30/2021 14:48:47 - INFO - __main__ - Step 9194: {'lr': 0.0004970915435717893, 'samples': 1765248, 'steps': 9193, 'loss/train': 2.146958589553833} -08/30/2021 14:48:47 - INFO - __main__ - Step 9195: {'lr': 0.0004970907363970196, 'samples': 1765440, 'steps': 9194, 'loss/train': 1.617411732673645} -08/30/2021 14:48:49 - INFO - __main__ - Step 9196: {'lr': 0.0004970899291109145, 'samples': 1765632, 'steps': 9195, 'loss/train': 0.2605523467063904} -08/30/2021 14:48:50 - INFO - __main__ - Step 9197: {'lr': 0.0004970891217134746, 'samples': 1765824, 'steps': 9196, 'loss/train': 1.556320071220398} -08/30/2021 14:48:50 - INFO - __main__ - Step 9198: {'lr': 0.0004970883142047001, 'samples': 1766016, 'steps': 9197, 'loss/train': 1.5277460813522339} -08/30/2021 14:48:51 - INFO - __main__ - Step 9199: {'lr': 0.0004970875065845914, 'samples': 1766208, 'steps': 9198, 'loss/train': 2.1826789379119873} -08/30/2021 14:48:51 - INFO - __main__ - Step 9200: {'lr': 0.000497086698853149, 'samples': 1766400, 'steps': 9199, 'loss/train': 2.515925645828247} -08/30/2021 14:48:53 - INFO - __main__ - Step 9201: {'lr': 0.0004970858910103731, 'samples': 1766592, 'steps': 9200, 'loss/train': 1.4338728189468384} -08/30/2021 14:48:53 - INFO - __main__ - Step 9202: {'lr': 0.0004970850830562641, 'samples': 1766784, 'steps': 9201, 'loss/train': 0.18572726845741272} -08/30/2021 14:48:53 - INFO - __main__ - Step 9203: {'lr': 0.0004970842749908223, 'samples': 1766976, 'steps': 9202, 'loss/train': 2.248081922531128} -08/30/2021 14:48:54 - INFO - __main__ - Step 9204: {'lr': 0.0004970834668140482, 'samples': 1767168, 'steps': 9203, 'loss/train': 2.0930335521698} -08/30/2021 14:48:54 - INFO - __main__ - Step 9205: {'lr': 0.0004970826585259421, 'samples': 1767360, 'steps': 9204, 'loss/train': 2.057454824447632} -08/30/2021 14:48:56 - INFO - __main__ - Step 9206: {'lr': 0.0004970818501265044, 'samples': 1767552, 'steps': 9205, 'loss/train': 1.6054198741912842} -08/30/2021 14:48:57 - INFO - __main__ - Step 9207: {'lr': 0.0004970810416157354, 'samples': 1767744, 'steps': 9206, 'loss/train': 1.9816429615020752} -08/30/2021 14:48:57 - INFO - __main__ - Step 9208: {'lr': 0.0004970802329936355, 'samples': 1767936, 'steps': 9207, 'loss/train': 1.237385630607605} -08/30/2021 14:48:57 - INFO - __main__ - Step 9209: {'lr': 0.000497079424260205, 'samples': 1768128, 'steps': 9208, 'loss/train': 1.6543488502502441} -08/30/2021 14:48:58 - INFO - __main__ - Step 9210: {'lr': 0.0004970786154154444, 'samples': 1768320, 'steps': 9209, 'loss/train': 2.1490519046783447} -08/30/2021 14:48:58 - INFO - __main__ - Step 9211: {'lr': 0.000497077806459354, 'samples': 1768512, 'steps': 9210, 'loss/train': 0.6202272176742554} -08/30/2021 14:49:00 - INFO - __main__ - Step 9212: {'lr': 0.0004970769973919341, 'samples': 1768704, 'steps': 9211, 'loss/train': 0.711371123790741} -08/30/2021 14:49:00 - INFO - __main__ - Step 9213: {'lr': 0.0004970761882131851, 'samples': 1768896, 'steps': 9212, 'loss/train': 2.2477684020996094} -08/30/2021 14:49:01 - INFO - __main__ - Step 9214: {'lr': 0.0004970753789231074, 'samples': 1769088, 'steps': 9213, 'loss/train': 2.07246470451355} -08/30/2021 14:49:01 - INFO - __main__ - Step 9215: {'lr': 0.0004970745695217014, 'samples': 1769280, 'steps': 9214, 'loss/train': 1.9545146226882935} -08/30/2021 14:49:01 - INFO - __main__ - Step 9216: {'lr': 0.0004970737600089673, 'samples': 1769472, 'steps': 9215, 'loss/train': 0.15511734783649445} -08/30/2021 14:49:03 - INFO - __main__ - Step 9217: {'lr': 0.0004970729503849057, 'samples': 1769664, 'steps': 9216, 'loss/train': 2.0614912509918213} -08/30/2021 14:49:03 - INFO - __main__ - Step 9218: {'lr': 0.0004970721406495168, 'samples': 1769856, 'steps': 9217, 'loss/train': 1.8605259656906128} -08/30/2021 14:49:04 - INFO - __main__ - Step 9219: {'lr': 0.000497071330802801, 'samples': 1770048, 'steps': 9218, 'loss/train': 2.124539613723755} -08/30/2021 14:49:04 - INFO - __main__ - Step 9220: {'lr': 0.0004970705208447587, 'samples': 1770240, 'steps': 9219, 'loss/train': 1.8342972993850708} -08/30/2021 14:49:04 - INFO - __main__ - Step 9221: {'lr': 0.0004970697107753902, 'samples': 1770432, 'steps': 9220, 'loss/train': 1.8214855194091797} -08/30/2021 14:49:06 - INFO - __main__ - Step 9222: {'lr': 0.0004970689005946959, 'samples': 1770624, 'steps': 9221, 'loss/train': 1.7121367454528809} -08/30/2021 14:49:06 - INFO - __main__ - Step 9223: {'lr': 0.0004970680903026762, 'samples': 1770816, 'steps': 9222, 'loss/train': 1.2820076942443848} -08/30/2021 14:49:06 - INFO - __main__ - Step 9224: {'lr': 0.0004970672798993313, 'samples': 1771008, 'steps': 9223, 'loss/train': 2.2044875621795654} -08/30/2021 14:49:07 - INFO - __main__ - Step 9225: {'lr': 0.0004970664693846618, 'samples': 1771200, 'steps': 9224, 'loss/train': 2.00738787651062} -08/30/2021 14:49:07 - INFO - __main__ - Step 9226: {'lr': 0.000497065658758668, 'samples': 1771392, 'steps': 9225, 'loss/train': 1.7194164991378784} -08/30/2021 14:49:09 - INFO - __main__ - Step 9227: {'lr': 0.0004970648480213502, 'samples': 1771584, 'steps': 9226, 'loss/train': 2.0624279975891113} -08/30/2021 14:49:09 - INFO - __main__ - Step 9228: {'lr': 0.0004970640371727088, 'samples': 1771776, 'steps': 9227, 'loss/train': 1.580984354019165} -08/30/2021 14:49:10 - INFO - __main__ - Step 9229: {'lr': 0.0004970632262127441, 'samples': 1771968, 'steps': 9228, 'loss/train': 1.6961482763290405} -08/30/2021 14:49:10 - INFO - __main__ - Step 9230: {'lr': 0.0004970624151414565, 'samples': 1772160, 'steps': 9229, 'loss/train': 1.8536534309387207} -08/30/2021 14:49:10 - INFO - __main__ - Step 9231: {'lr': 0.0004970616039588465, 'samples': 1772352, 'steps': 9230, 'loss/train': 1.6463274955749512} -08/30/2021 14:49:12 - INFO - __main__ - Step 9232: {'lr': 0.0004970607926649143, 'samples': 1772544, 'steps': 9231, 'loss/train': 1.9842034578323364} -08/30/2021 14:49:13 - INFO - __main__ - Step 9233: {'lr': 0.0004970599812596603, 'samples': 1772736, 'steps': 9232, 'loss/train': 0.9124844670295715} -08/30/2021 14:49:13 - INFO - __main__ - Step 9234: {'lr': 0.0004970591697430849, 'samples': 1772928, 'steps': 9233, 'loss/train': 2.3479666709899902} -08/30/2021 14:49:13 - INFO - __main__ - Step 9235: {'lr': 0.0004970583581151885, 'samples': 1773120, 'steps': 9234, 'loss/train': 2.9768569469451904} -08/30/2021 14:49:14 - INFO - __main__ - Step 9236: {'lr': 0.0004970575463759713, 'samples': 1773312, 'steps': 9235, 'loss/train': 1.4549553394317627} -08/30/2021 14:49:14 - INFO - __main__ - Step 9237: {'lr': 0.0004970567345254339, 'samples': 1773504, 'steps': 9236, 'loss/train': 1.7700152397155762} -08/30/2021 14:49:15 - INFO - __main__ - Step 9238: {'lr': 0.0004970559225635765, 'samples': 1773696, 'steps': 9237, 'loss/train': 1.04756498336792} -08/30/2021 14:49:16 - INFO - __main__ - Step 9239: {'lr': 0.0004970551104903995, 'samples': 1773888, 'steps': 9238, 'loss/train': 2.0631184577941895} -08/30/2021 14:49:16 - INFO - __main__ - Step 9240: {'lr': 0.0004970542983059033, 'samples': 1774080, 'steps': 9239, 'loss/train': 1.9168970584869385} -08/30/2021 14:49:17 - INFO - __main__ - Step 9241: {'lr': 0.0004970534860100883, 'samples': 1774272, 'steps': 9240, 'loss/train': 1.7760001420974731} -08/30/2021 14:49:17 - INFO - __main__ - Step 9242: {'lr': 0.0004970526736029547, 'samples': 1774464, 'steps': 9241, 'loss/train': 1.739051342010498} -08/30/2021 14:49:19 - INFO - __main__ - Step 9243: {'lr': 0.000497051861084503, 'samples': 1774656, 'steps': 9242, 'loss/train': 2.3888537883758545} -08/30/2021 14:49:19 - INFO - __main__ - Step 9244: {'lr': 0.0004970510484547336, 'samples': 1774848, 'steps': 9243, 'loss/train': 2.1341841220855713} -08/30/2021 14:49:20 - INFO - __main__ - Step 9245: {'lr': 0.0004970502357136468, 'samples': 1775040, 'steps': 9244, 'loss/train': 2.0101072788238525} -08/30/2021 14:49:20 - INFO - __main__ - Step 9246: {'lr': 0.0004970494228612429, 'samples': 1775232, 'steps': 9245, 'loss/train': 0.35101956129074097} -08/30/2021 14:49:20 - INFO - __main__ - Step 9247: {'lr': 0.0004970486098975224, 'samples': 1775424, 'steps': 9246, 'loss/train': 0.26647070050239563} -08/30/2021 14:49:21 - INFO - __main__ - Step 9248: {'lr': 0.0004970477968224856, 'samples': 1775616, 'steps': 9247, 'loss/train': 1.8340070247650146} -08/30/2021 14:49:22 - INFO - __main__ - Step 9249: {'lr': 0.000497046983636133, 'samples': 1775808, 'steps': 9248, 'loss/train': 2.2194974422454834} -08/30/2021 14:49:23 - INFO - __main__ - Step 9250: {'lr': 0.0004970461703384647, 'samples': 1776000, 'steps': 9249, 'loss/train': 2.377347946166992} -08/30/2021 14:49:23 - INFO - __main__ - Step 9251: {'lr': 0.0004970453569294812, 'samples': 1776192, 'steps': 9250, 'loss/train': 1.8733460903167725} -08/30/2021 14:49:23 - INFO - __main__ - Step 9252: {'lr': 0.000497044543409183, 'samples': 1776384, 'steps': 9251, 'loss/train': 1.556471347808838} -08/30/2021 14:49:24 - INFO - __main__ - Step 9253: {'lr': 0.0004970437297775702, 'samples': 1776576, 'steps': 9252, 'loss/train': 2.4468936920166016} -08/30/2021 14:49:26 - INFO - __main__ - Step 9254: {'lr': 0.0004970429160346433, 'samples': 1776768, 'steps': 9253, 'loss/train': 2.3511977195739746} -08/30/2021 14:49:26 - INFO - __main__ - Step 9255: {'lr': 0.0004970421021804027, 'samples': 1776960, 'steps': 9254, 'loss/train': 1.5434702634811401} -08/30/2021 14:49:27 - INFO - __main__ - Step 9256: {'lr': 0.0004970412882148488, 'samples': 1777152, 'steps': 9255, 'loss/train': 1.8306480646133423} -08/30/2021 14:49:27 - INFO - __main__ - Step 9257: {'lr': 0.0004970404741379818, 'samples': 1777344, 'steps': 9256, 'loss/train': 1.9176039695739746} -08/30/2021 14:49:27 - INFO - __main__ - Step 9258: {'lr': 0.0004970396599498023, 'samples': 1777536, 'steps': 9257, 'loss/train': 1.1820268630981445} -08/30/2021 14:49:29 - INFO - __main__ - Step 9259: {'lr': 0.0004970388456503105, 'samples': 1777728, 'steps': 9258, 'loss/train': 1.8463993072509766} -08/30/2021 14:49:29 - INFO - __main__ - Step 9260: {'lr': 0.0004970380312395069, 'samples': 1777920, 'steps': 9259, 'loss/train': 1.7795135974884033} -08/30/2021 14:49:30 - INFO - __main__ - Step 9261: {'lr': 0.0004970372167173915, 'samples': 1778112, 'steps': 9260, 'loss/train': 1.6793103218078613} -08/30/2021 14:49:30 - INFO - __main__ - Step 9262: {'lr': 0.0004970364020839652, 'samples': 1778304, 'steps': 9261, 'loss/train': 2.0650460720062256} -08/30/2021 14:49:30 - INFO - __main__ - Step 9263: {'lr': 0.0004970355873392281, 'samples': 1778496, 'steps': 9262, 'loss/train': 1.8135298490524292} -08/30/2021 14:49:32 - INFO - __main__ - Step 9264: {'lr': 0.0004970347724831804, 'samples': 1778688, 'steps': 9263, 'loss/train': 1.5799111127853394} -08/30/2021 14:49:33 - INFO - __main__ - Step 9265: {'lr': 0.0004970339575158228, 'samples': 1778880, 'steps': 9264, 'loss/train': 3.0635735988616943} -08/30/2021 14:49:33 - INFO - __main__ - Step 9266: {'lr': 0.0004970331424371555, 'samples': 1779072, 'steps': 9265, 'loss/train': 0.1606554388999939} -08/30/2021 14:49:33 - INFO - __main__ - Step 9267: {'lr': 0.0004970323272471788, 'samples': 1779264, 'steps': 9266, 'loss/train': 1.526602864265442} -08/30/2021 14:49:34 - INFO - __main__ - Step 9268: {'lr': 0.0004970315119458931, 'samples': 1779456, 'steps': 9267, 'loss/train': 1.529158353805542} -08/30/2021 14:49:35 - INFO - __main__ - Step 9269: {'lr': 0.000497030696533299, 'samples': 1779648, 'steps': 9268, 'loss/train': 1.557956576347351} -08/30/2021 14:49:35 - INFO - __main__ - Step 9270: {'lr': 0.0004970298810093965, 'samples': 1779840, 'steps': 9269, 'loss/train': 1.7843255996704102} -08/30/2021 14:49:36 - INFO - __main__ - Step 9271: {'lr': 0.0004970290653741863, 'samples': 1780032, 'steps': 9270, 'loss/train': 1.910145878791809} -08/30/2021 14:49:36 - INFO - __main__ - Step 9272: {'lr': 0.0004970282496276684, 'samples': 1780224, 'steps': 9271, 'loss/train': 1.6822428703308105} -08/30/2021 14:49:37 - INFO - __main__ - Step 9273: {'lr': 0.0004970274337698436, 'samples': 1780416, 'steps': 9272, 'loss/train': 2.1968302726745605} -08/30/2021 14:49:37 - INFO - __main__ - Step 9274: {'lr': 0.000497026617800712, 'samples': 1780608, 'steps': 9273, 'loss/train': 1.8006296157836914} -08/30/2021 14:49:38 - INFO - __main__ - Step 9275: {'lr': 0.000497025801720274, 'samples': 1780800, 'steps': 9274, 'loss/train': 1.6218938827514648} -08/30/2021 14:49:39 - INFO - __main__ - Step 9276: {'lr': 0.00049702498552853, 'samples': 1780992, 'steps': 9275, 'loss/train': 1.7838683128356934} -08/30/2021 14:49:39 - INFO - __main__ - Step 9277: {'lr': 0.0004970241692254803, 'samples': 1781184, 'steps': 9276, 'loss/train': 2.7925031185150146} -08/30/2021 14:49:40 - INFO - __main__ - Step 9278: {'lr': 0.0004970233528111253, 'samples': 1781376, 'steps': 9277, 'loss/train': 2.448387384414673} -08/30/2021 14:49:40 - INFO - __main__ - Step 9279: {'lr': 0.0004970225362854654, 'samples': 1781568, 'steps': 9278, 'loss/train': 1.8577622175216675} -08/30/2021 14:49:41 - INFO - __main__ - Step 9280: {'lr': 0.0004970217196485011, 'samples': 1781760, 'steps': 9279, 'loss/train': 1.6791255474090576} -08/30/2021 14:49:42 - INFO - __main__ - Step 9281: {'lr': 0.0004970209029002325, 'samples': 1781952, 'steps': 9280, 'loss/train': 1.815529704093933} -08/30/2021 14:49:42 - INFO - __main__ - Step 9282: {'lr': 0.0004970200860406601, 'samples': 1782144, 'steps': 9281, 'loss/train': 1.7856688499450684} -08/30/2021 14:49:42 - INFO - __main__ - Step 9283: {'lr': 0.0004970192690697843, 'samples': 1782336, 'steps': 9282, 'loss/train': 1.3884061574935913} -08/30/2021 14:49:43 - INFO - __main__ - Step 9284: {'lr': 0.0004970184519876053, 'samples': 1782528, 'steps': 9283, 'loss/train': 1.9603992700576782} -08/30/2021 14:49:44 - INFO - __main__ - Step 9285: {'lr': 0.0004970176347941237, 'samples': 1782720, 'steps': 9284, 'loss/train': 2.057486057281494} -08/30/2021 14:49:45 - INFO - __main__ - Step 9286: {'lr': 0.0004970168174893398, 'samples': 1782912, 'steps': 9285, 'loss/train': 1.7812455892562866} -08/30/2021 14:49:45 - INFO - __main__ - Step 9287: {'lr': 0.0004970160000732539, 'samples': 1783104, 'steps': 9286, 'loss/train': 0.725993812084198} -08/30/2021 14:49:46 - INFO - __main__ - Step 9288: {'lr': 0.0004970151825458664, 'samples': 1783296, 'steps': 9287, 'loss/train': 2.4390835762023926} -08/30/2021 14:49:46 - INFO - __main__ - Step 9289: {'lr': 0.0004970143649071777, 'samples': 1783488, 'steps': 9288, 'loss/train': 2.1218433380126953} -08/30/2021 14:49:47 - INFO - __main__ - Step 9290: {'lr': 0.0004970135471571881, 'samples': 1783680, 'steps': 9289, 'loss/train': 1.61763334274292} -08/30/2021 14:49:48 - INFO - __main__ - Step 9291: {'lr': 0.000497012729295898, 'samples': 1783872, 'steps': 9290, 'loss/train': 2.6236159801483154} -08/30/2021 14:49:48 - INFO - __main__ - Step 9292: {'lr': 0.0004970119113233078, 'samples': 1784064, 'steps': 9291, 'loss/train': 1.4758740663528442} -08/30/2021 14:49:48 - INFO - __main__ - Step 9293: {'lr': 0.0004970110932394178, 'samples': 1784256, 'steps': 9292, 'loss/train': 2.0144641399383545} -08/30/2021 14:49:49 - INFO - __main__ - Step 9294: {'lr': 0.0004970102750442285, 'samples': 1784448, 'steps': 9293, 'loss/train': 0.9846737384796143} -08/30/2021 14:49:51 - INFO - __main__ - Step 9295: {'lr': 0.0004970094567377402, 'samples': 1784640, 'steps': 9294, 'loss/train': 1.7332916259765625} -08/30/2021 14:49:51 - INFO - __main__ - Step 9296: {'lr': 0.0004970086383199532, 'samples': 1784832, 'steps': 9295, 'loss/train': 1.6792523860931396} -08/30/2021 14:49:51 - INFO - __main__ - Step 9297: {'lr': 0.0004970078197908678, 'samples': 1785024, 'steps': 9296, 'loss/train': 2.2584574222564697} -08/30/2021 14:49:52 - INFO - __main__ - Step 9298: {'lr': 0.0004970070011504846, 'samples': 1785216, 'steps': 9297, 'loss/train': 1.9478328227996826} -08/30/2021 14:49:52 - INFO - __main__ - Step 9299: {'lr': 0.0004970061823988038, 'samples': 1785408, 'steps': 9298, 'loss/train': 2.174748659133911} -08/30/2021 14:49:53 - INFO - __main__ - Step 9300: {'lr': 0.0004970053635358259, 'samples': 1785600, 'steps': 9299, 'loss/train': 1.427147626876831} -08/30/2021 14:49:54 - INFO - __main__ - Step 9301: {'lr': 0.0004970045445615512, 'samples': 1785792, 'steps': 9300, 'loss/train': 2.43338680267334} -08/30/2021 14:49:54 - INFO - __main__ - Step 9302: {'lr': 0.00049700372547598, 'samples': 1785984, 'steps': 9301, 'loss/train': 2.0076563358306885} -08/30/2021 14:49:55 - INFO - __main__ - Step 9303: {'lr': 0.0004970029062791128, 'samples': 1786176, 'steps': 9302, 'loss/train': 1.8735857009887695} -08/30/2021 14:49:55 - INFO - __main__ - Step 9304: {'lr': 0.0004970020869709498, 'samples': 1786368, 'steps': 9303, 'loss/train': 1.7932754755020142} -08/30/2021 14:49:55 - INFO - __main__ - Step 9305: {'lr': 0.0004970012675514915, 'samples': 1786560, 'steps': 9304, 'loss/train': 2.0158021450042725} -08/30/2021 14:49:58 - INFO - __main__ - Step 9306: {'lr': 0.0004970004480207384, 'samples': 1786752, 'steps': 9305, 'loss/train': 2.2706642150878906} -08/30/2021 14:49:58 - INFO - __main__ - Step 9307: {'lr': 0.0004969996283786905, 'samples': 1786944, 'steps': 9306, 'loss/train': 1.4431320428848267} -08/30/2021 14:49:58 - INFO - __main__ - Step 9308: {'lr': 0.0004969988086253486, 'samples': 1787136, 'steps': 9307, 'loss/train': 2.0406265258789062} -08/30/2021 14:49:59 - INFO - __main__ - Step 9309: {'lr': 0.0004969979887607125, 'samples': 1787328, 'steps': 9308, 'loss/train': 1.8976439237594604} -08/30/2021 14:49:59 - INFO - __main__ - Step 9310: {'lr': 0.0004969971687847832, 'samples': 1787520, 'steps': 9309, 'loss/train': 1.7175661325454712} -08/30/2021 14:50:01 - INFO - __main__ - Step 9311: {'lr': 0.0004969963486975607, 'samples': 1787712, 'steps': 9310, 'loss/train': 1.9850002527236938} -08/30/2021 14:50:01 - INFO - __main__ - Step 9312: {'lr': 0.0004969955284990455, 'samples': 1787904, 'steps': 9311, 'loss/train': 2.112910747528076} -08/30/2021 14:50:02 - INFO - __main__ - Step 9313: {'lr': 0.0004969947081892379, 'samples': 1788096, 'steps': 9312, 'loss/train': 0.1662347912788391} -08/30/2021 14:50:02 - INFO - __main__ - Step 9314: {'lr': 0.0004969938877681383, 'samples': 1788288, 'steps': 9313, 'loss/train': 0.2272965908050537} -08/30/2021 14:50:02 - INFO - __main__ - Step 9315: {'lr': 0.0004969930672357471, 'samples': 1788480, 'steps': 9314, 'loss/train': 1.179009199142456} -08/30/2021 14:50:04 - INFO - __main__ - Step 9316: {'lr': 0.0004969922465920645, 'samples': 1788672, 'steps': 9315, 'loss/train': 1.317862868309021} -08/30/2021 14:50:05 - INFO - __main__ - Step 9317: {'lr': 0.0004969914258370912, 'samples': 1788864, 'steps': 9316, 'loss/train': 1.5546584129333496} -08/30/2021 14:50:05 - INFO - __main__ - Step 9318: {'lr': 0.0004969906049708272, 'samples': 1789056, 'steps': 9317, 'loss/train': 1.9591002464294434} -08/30/2021 14:50:05 - INFO - __main__ - Step 9319: {'lr': 0.0004969897839932732, 'samples': 1789248, 'steps': 9318, 'loss/train': 0.42939651012420654} -08/30/2021 14:50:06 - INFO - __main__ - Step 9320: {'lr': 0.0004969889629044293, 'samples': 1789440, 'steps': 9319, 'loss/train': 2.0537118911743164} -08/30/2021 14:50:07 - INFO - __main__ - Step 9321: {'lr': 0.000496988141704296, 'samples': 1789632, 'steps': 9320, 'loss/train': 1.2576552629470825} -08/30/2021 14:50:08 - INFO - __main__ - Step 9322: {'lr': 0.0004969873203928737, 'samples': 1789824, 'steps': 9321, 'loss/train': 1.7723240852355957} -08/30/2021 14:50:08 - INFO - __main__ - Step 9323: {'lr': 0.0004969864989701626, 'samples': 1790016, 'steps': 9322, 'loss/train': 2.057669162750244} -08/30/2021 14:50:08 - INFO - __main__ - Step 9324: {'lr': 0.0004969856774361634, 'samples': 1790208, 'steps': 9323, 'loss/train': 1.8261970281600952} -08/30/2021 14:50:09 - INFO - __main__ - Step 9325: {'lr': 0.0004969848557908761, 'samples': 1790400, 'steps': 9324, 'loss/train': 1.5761268138885498} -08/30/2021 14:50:09 - INFO - __main__ - Step 9326: {'lr': 0.0004969840340343013, 'samples': 1790592, 'steps': 9325, 'loss/train': 2.015223264694214} -08/30/2021 14:50:11 - INFO - __main__ - Step 9327: {'lr': 0.0004969832121664394, 'samples': 1790784, 'steps': 9326, 'loss/train': 1.8708689212799072} -08/30/2021 14:50:11 - INFO - __main__ - Step 9328: {'lr': 0.0004969823901872906, 'samples': 1790976, 'steps': 9327, 'loss/train': 2.039632558822632} -08/30/2021 14:50:11 - INFO - __main__ - Step 9329: {'lr': 0.0004969815680968552, 'samples': 1791168, 'steps': 9328, 'loss/train': 2.0620734691619873} -08/30/2021 14:50:12 - INFO - __main__ - Step 9330: {'lr': 0.0004969807458951339, 'samples': 1791360, 'steps': 9329, 'loss/train': 1.9500455856323242} -08/30/2021 14:50:12 - INFO - __main__ - Step 9331: {'lr': 0.0004969799235821268, 'samples': 1791552, 'steps': 9330, 'loss/train': 1.9190891981124878} -08/30/2021 14:50:14 - INFO - __main__ - Step 9332: {'lr': 0.0004969791011578344, 'samples': 1791744, 'steps': 9331, 'loss/train': 1.569718837738037} -08/30/2021 14:50:14 - INFO - __main__ - Step 9333: {'lr': 0.000496978278622257, 'samples': 1791936, 'steps': 9332, 'loss/train': 2.2379322052001953} -08/30/2021 14:50:15 - INFO - __main__ - Step 9334: {'lr': 0.000496977455975395, 'samples': 1792128, 'steps': 9333, 'loss/train': 0.2754552364349365} -08/30/2021 14:50:15 - INFO - __main__ - Step 9335: {'lr': 0.0004969766332172488, 'samples': 1792320, 'steps': 9334, 'loss/train': 2.2136521339416504} -08/30/2021 14:50:15 - INFO - __main__ - Step 9336: {'lr': 0.0004969758103478187, 'samples': 1792512, 'steps': 9335, 'loss/train': 1.8635731935501099} -08/30/2021 14:50:17 - INFO - __main__ - Step 9337: {'lr': 0.0004969749873671051, 'samples': 1792704, 'steps': 9336, 'loss/train': 1.954540729522705} -08/30/2021 14:50:17 - INFO - __main__ - Step 9338: {'lr': 0.0004969741642751085, 'samples': 1792896, 'steps': 9337, 'loss/train': 2.115929126739502} -08/30/2021 14:50:18 - INFO - __main__ - Step 9339: {'lr': 0.000496973341071829, 'samples': 1793088, 'steps': 9338, 'loss/train': 2.2687363624572754} -08/30/2021 14:50:18 - INFO - __main__ - Step 9340: {'lr': 0.0004969725177572672, 'samples': 1793280, 'steps': 9339, 'loss/train': 1.9051958322525024} -08/30/2021 14:50:18 - INFO - __main__ - Step 9341: {'lr': 0.0004969716943314234, 'samples': 1793472, 'steps': 9340, 'loss/train': 1.7493877410888672} -08/30/2021 14:50:20 - INFO - __main__ - Step 9342: {'lr': 0.0004969708707942979, 'samples': 1793664, 'steps': 9341, 'loss/train': 2.1003103256225586} -08/30/2021 14:50:20 - INFO - __main__ - Step 9343: {'lr': 0.0004969700471458913, 'samples': 1793856, 'steps': 9342, 'loss/train': 1.5054258108139038} -08/30/2021 14:50:21 - INFO - __main__ - Step 9344: {'lr': 0.0004969692233862036, 'samples': 1794048, 'steps': 9343, 'loss/train': 2.7108588218688965} -08/30/2021 14:50:21 - INFO - __main__ - Step 9345: {'lr': 0.0004969683995152355, 'samples': 1794240, 'steps': 9344, 'loss/train': 1.6341618299484253} -08/30/2021 14:50:21 - INFO - __main__ - Step 9346: {'lr': 0.0004969675755329872, 'samples': 1794432, 'steps': 9345, 'loss/train': 2.0203230381011963} -08/30/2021 14:50:23 - INFO - __main__ - Step 9347: {'lr': 0.0004969667514394592, 'samples': 1794624, 'steps': 9346, 'loss/train': 2.1350884437561035} -08/30/2021 14:50:23 - INFO - __main__ - Step 9348: {'lr': 0.0004969659272346517, 'samples': 1794816, 'steps': 9347, 'loss/train': 1.983215093612671} -08/30/2021 14:50:24 - INFO - __main__ - Step 9349: {'lr': 0.0004969651029185652, 'samples': 1795008, 'steps': 9348, 'loss/train': 2.0139341354370117} -08/30/2021 14:50:24 - INFO - __main__ - Step 9350: {'lr': 0.0004969642784912001, 'samples': 1795200, 'steps': 9349, 'loss/train': 2.193344831466675} -08/30/2021 14:50:24 - INFO - __main__ - Step 9351: {'lr': 0.0004969634539525566, 'samples': 1795392, 'steps': 9350, 'loss/train': 1.4754719734191895} -08/30/2021 14:50:25 - INFO - __main__ - Step 9352: {'lr': 0.0004969626293026353, 'samples': 1795584, 'steps': 9351, 'loss/train': 2.1202762126922607} -08/30/2021 14:50:26 - INFO - __main__ - Step 9353: {'lr': 0.0004969618045414363, 'samples': 1795776, 'steps': 9352, 'loss/train': 1.3586260080337524} -08/30/2021 14:50:27 - INFO - __main__ - Step 9354: {'lr': 0.0004969609796689602, 'samples': 1795968, 'steps': 9353, 'loss/train': 1.8787740468978882} -08/30/2021 14:50:27 - INFO - __main__ - Step 9355: {'lr': 0.0004969601546852073, 'samples': 1796160, 'steps': 9354, 'loss/train': 1.8635075092315674} -08/30/2021 14:50:27 - INFO - __main__ - Step 9356: {'lr': 0.0004969593295901779, 'samples': 1796352, 'steps': 9355, 'loss/train': 1.9155939817428589} -08/30/2021 14:50:28 - INFO - __main__ - Step 9357: {'lr': 0.0004969585043838725, 'samples': 1796544, 'steps': 9356, 'loss/train': 2.4200963973999023} -08/30/2021 14:50:30 - INFO - __main__ - Step 9358: {'lr': 0.0004969576790662914, 'samples': 1796736, 'steps': 9357, 'loss/train': 1.6718475818634033} -08/30/2021 14:50:30 - INFO - __main__ - Step 9359: {'lr': 0.0004969568536374349, 'samples': 1796928, 'steps': 9358, 'loss/train': 0.1486867070198059} -08/30/2021 14:50:31 - INFO - __main__ - Step 9360: {'lr': 0.0004969560280973036, 'samples': 1797120, 'steps': 9359, 'loss/train': 1.8262906074523926} -08/30/2021 14:50:31 - INFO - __main__ - Step 9361: {'lr': 0.0004969552024458976, 'samples': 1797312, 'steps': 9360, 'loss/train': 2.6798460483551025} -08/30/2021 14:50:31 - INFO - __main__ - Step 9362: {'lr': 0.0004969543766832176, 'samples': 1797504, 'steps': 9361, 'loss/train': 1.361230731010437} -08/30/2021 14:50:32 - INFO - __main__ - Step 9363: {'lr': 0.0004969535508092635, 'samples': 1797696, 'steps': 9362, 'loss/train': 1.794560432434082} -08/30/2021 14:50:33 - INFO - __main__ - Step 9364: {'lr': 0.0004969527248240361, 'samples': 1797888, 'steps': 9363, 'loss/train': 1.8477025032043457} -08/30/2021 14:50:34 - INFO - __main__ - Step 9365: {'lr': 0.0004969518987275356, 'samples': 1798080, 'steps': 9364, 'loss/train': 1.7897114753723145} -08/30/2021 14:50:34 - INFO - __main__ - Step 9366: {'lr': 0.0004969510725197624, 'samples': 1798272, 'steps': 9365, 'loss/train': 2.2025904655456543} -08/30/2021 14:50:34 - INFO - __main__ - Step 9367: {'lr': 0.0004969502462007167, 'samples': 1798464, 'steps': 9366, 'loss/train': 1.8683362007141113} -08/30/2021 14:50:35 - INFO - __main__ - Step 9368: {'lr': 0.0004969494197703992, 'samples': 1798656, 'steps': 9367, 'loss/train': 1.8720678091049194} -08/30/2021 14:50:37 - INFO - __main__ - Step 9369: {'lr': 0.00049694859322881, 'samples': 1798848, 'steps': 9368, 'loss/train': 1.8280768394470215} -08/30/2021 14:50:37 - INFO - __main__ - Step 9370: {'lr': 0.0004969477665759496, 'samples': 1799040, 'steps': 9369, 'loss/train': 1.9363033771514893} -08/30/2021 14:50:38 - INFO - __main__ - Step 9371: {'lr': 0.0004969469398118184, 'samples': 1799232, 'steps': 9370, 'loss/train': 1.9637559652328491} -08/30/2021 14:50:38 - INFO - __main__ - Step 9372: {'lr': 0.0004969461129364167, 'samples': 1799424, 'steps': 9371, 'loss/train': 2.121222972869873} -08/30/2021 14:50:38 - INFO - __main__ - Step 9373: {'lr': 0.0004969452859497449, 'samples': 1799616, 'steps': 9372, 'loss/train': 1.653204321861267} -08/30/2021 14:50:40 - INFO - __main__ - Step 9374: {'lr': 0.0004969444588518034, 'samples': 1799808, 'steps': 9373, 'loss/train': 2.1637487411499023} -08/30/2021 14:50:40 - INFO - __main__ - Step 9375: {'lr': 0.0004969436316425924, 'samples': 1800000, 'steps': 9374, 'loss/train': 2.070594549179077} -08/30/2021 14:50:41 - INFO - __main__ - Step 9376: {'lr': 0.0004969428043221125, 'samples': 1800192, 'steps': 9375, 'loss/train': 2.100050210952759} -08/30/2021 14:50:41 - INFO - __main__ - Step 9377: {'lr': 0.000496941976890364, 'samples': 1800384, 'steps': 9376, 'loss/train': 2.5154988765716553} -08/30/2021 14:50:41 - INFO - __main__ - Step 9378: {'lr': 0.0004969411493473472, 'samples': 1800576, 'steps': 9377, 'loss/train': 1.6724045276641846} -08/30/2021 14:50:42 - INFO - __main__ - Step 9379: {'lr': 0.0004969403216930626, 'samples': 1800768, 'steps': 9378, 'loss/train': 1.6164556741714478} -08/30/2021 14:50:43 - INFO - __main__ - Step 9380: {'lr': 0.0004969394939275105, 'samples': 1800960, 'steps': 9379, 'loss/train': 2.2861320972442627} -08/30/2021 14:50:44 - INFO - __main__ - Step 9381: {'lr': 0.0004969386660506912, 'samples': 1801152, 'steps': 9380, 'loss/train': 1.7749894857406616} -08/30/2021 14:50:44 - INFO - __main__ - Step 9382: {'lr': 0.0004969378380626051, 'samples': 1801344, 'steps': 9381, 'loss/train': 2.0912327766418457} -08/30/2021 14:50:44 - INFO - __main__ - Step 9383: {'lr': 0.0004969370099632528, 'samples': 1801536, 'steps': 9382, 'loss/train': 1.6605771780014038} -08/30/2021 14:50:45 - INFO - __main__ - Step 9384: {'lr': 0.0004969361817526343, 'samples': 1801728, 'steps': 9383, 'loss/train': 2.2192394733428955} -08/30/2021 14:50:46 - INFO - __main__ - Step 9385: {'lr': 0.0004969353534307504, 'samples': 1801920, 'steps': 9384, 'loss/train': 1.7540037631988525} -08/30/2021 14:50:47 - INFO - __main__ - Step 9386: {'lr': 0.000496934524997601, 'samples': 1802112, 'steps': 9385, 'loss/train': 1.8286198377609253} -08/30/2021 14:50:47 - INFO - __main__ - Step 9387: {'lr': 0.0004969336964531869, 'samples': 1802304, 'steps': 9386, 'loss/train': 1.9215701818466187} -08/30/2021 14:50:47 - INFO - __main__ - Step 9388: {'lr': 0.0004969328677975083, 'samples': 1802496, 'steps': 9387, 'loss/train': 1.9116616249084473} -08/30/2021 14:50:48 - INFO - __main__ - Step 9389: {'lr': 0.0004969320390305654, 'samples': 1802688, 'steps': 9388, 'loss/train': 1.8428884744644165} -08/30/2021 14:50:49 - INFO - __main__ - Step 9390: {'lr': 0.0004969312101523588, 'samples': 1802880, 'steps': 9389, 'loss/train': 1.4747421741485596} -08/30/2021 14:50:50 - INFO - __main__ - Step 9391: {'lr': 0.0004969303811628888, 'samples': 1803072, 'steps': 9390, 'loss/train': 1.980588436126709} -08/30/2021 14:50:50 - INFO - __main__ - Step 9392: {'lr': 0.0004969295520621558, 'samples': 1803264, 'steps': 9391, 'loss/train': 0.13408294320106506} -08/30/2021 14:50:50 - INFO - __main__ - Step 9393: {'lr': 0.0004969287228501602, 'samples': 1803456, 'steps': 9392, 'loss/train': 2.0473554134368896} -08/30/2021 14:50:51 - INFO - __main__ - Step 9394: {'lr': 0.0004969278935269022, 'samples': 1803648, 'steps': 9393, 'loss/train': 1.6537960767745972} -08/30/2021 14:50:52 - INFO - __main__ - Step 9395: {'lr': 0.0004969270640923823, 'samples': 1803840, 'steps': 9394, 'loss/train': 1.537422776222229} -08/30/2021 14:50:53 - INFO - __main__ - Step 9396: {'lr': 0.0004969262345466011, 'samples': 1804032, 'steps': 9395, 'loss/train': 1.6788089275360107} -08/30/2021 14:50:53 - INFO - __main__ - Step 9397: {'lr': 0.0004969254048895585, 'samples': 1804224, 'steps': 9396, 'loss/train': 1.6357635259628296} -08/30/2021 14:50:54 - INFO - __main__ - Step 9398: {'lr': 0.0004969245751212552, 'samples': 1804416, 'steps': 9397, 'loss/train': 1.9354521036148071} -08/30/2021 14:50:54 - INFO - __main__ - Step 9399: {'lr': 0.0004969237452416915, 'samples': 1804608, 'steps': 9398, 'loss/train': 1.7608600854873657} -08/30/2021 14:50:55 - INFO - __main__ - Step 9400: {'lr': 0.0004969229152508678, 'samples': 1804800, 'steps': 9399, 'loss/train': 1.6554512977600098} -08/30/2021 14:50:56 - INFO - __main__ - Step 9401: {'lr': 0.0004969220851487844, 'samples': 1804992, 'steps': 9400, 'loss/train': 1.4405708312988281} -08/30/2021 14:50:56 - INFO - __main__ - Step 9402: {'lr': 0.0004969212549354418, 'samples': 1805184, 'steps': 9401, 'loss/train': 1.9279801845550537} -08/30/2021 14:50:57 - INFO - __main__ - Step 9403: {'lr': 0.0004969204246108402, 'samples': 1805376, 'steps': 9402, 'loss/train': 1.7291628122329712} -08/30/2021 14:50:57 - INFO - __main__ - Step 9404: {'lr': 0.0004969195941749801, 'samples': 1805568, 'steps': 9403, 'loss/train': 2.056635618209839} -08/30/2021 14:50:58 - INFO - __main__ - Step 9405: {'lr': 0.000496918763627862, 'samples': 1805760, 'steps': 9404, 'loss/train': 2.1522889137268066} -08/30/2021 14:50:59 - INFO - __main__ - Step 9406: {'lr': 0.0004969179329694859, 'samples': 1805952, 'steps': 9405, 'loss/train': 2.2526438236236572} -08/30/2021 14:50:59 - INFO - __main__ - Step 9407: {'lr': 0.0004969171021998525, 'samples': 1806144, 'steps': 9406, 'loss/train': 1.9701427221298218} -08/30/2021 14:51:00 - INFO - __main__ - Step 9408: {'lr': 0.0004969162713189619, 'samples': 1806336, 'steps': 9407, 'loss/train': 1.499146580696106} -08/30/2021 14:51:00 - INFO - __main__ - Step 9409: {'lr': 0.0004969154403268148, 'samples': 1806528, 'steps': 9408, 'loss/train': 2.4673938751220703} -08/30/2021 14:51:00 - INFO - __main__ - Step 9410: {'lr': 0.0004969146092234114, 'samples': 1806720, 'steps': 9409, 'loss/train': 1.3679702281951904} -08/30/2021 14:51:02 - INFO - __main__ - Step 9411: {'lr': 0.000496913778008752, 'samples': 1806912, 'steps': 9410, 'loss/train': 1.5414880514144897} -08/30/2021 14:51:02 - INFO - __main__ - Step 9412: {'lr': 0.0004969129466828371, 'samples': 1807104, 'steps': 9411, 'loss/train': 1.9186081886291504} -08/30/2021 14:51:03 - INFO - __main__ - Step 9413: {'lr': 0.0004969121152456671, 'samples': 1807296, 'steps': 9412, 'loss/train': 1.4455149173736572} -08/30/2021 14:51:03 - INFO - __main__ - Step 9414: {'lr': 0.0004969112836972423, 'samples': 1807488, 'steps': 9413, 'loss/train': 1.8019697666168213} -08/30/2021 14:51:03 - INFO - __main__ - Step 9415: {'lr': 0.000496910452037563, 'samples': 1807680, 'steps': 9414, 'loss/train': 1.9133750200271606} -08/30/2021 14:51:05 - INFO - __main__ - Step 9416: {'lr': 0.0004969096202666297, 'samples': 1807872, 'steps': 9415, 'loss/train': 1.8285832405090332} -08/30/2021 14:51:05 - INFO - __main__ - Step 9417: {'lr': 0.0004969087883844428, 'samples': 1808064, 'steps': 9416, 'loss/train': 1.9302802085876465} -08/30/2021 14:51:06 - INFO - __main__ - Step 9418: {'lr': 0.0004969079563910025, 'samples': 1808256, 'steps': 9417, 'loss/train': 1.6582567691802979} -08/30/2021 14:51:06 - INFO - __main__ - Step 9419: {'lr': 0.0004969071242863093, 'samples': 1808448, 'steps': 9418, 'loss/train': 0.6336837410926819} -08/30/2021 14:51:06 - INFO - __main__ - Step 9420: {'lr': 0.0004969062920703636, 'samples': 1808640, 'steps': 9419, 'loss/train': 1.6298236846923828} -08/30/2021 14:51:09 - INFO - __main__ - Step 9421: {'lr': 0.0004969054597431658, 'samples': 1808832, 'steps': 9420, 'loss/train': 2.063265800476074} -08/30/2021 14:51:09 - INFO - __main__ - Step 9422: {'lr': 0.0004969046273047161, 'samples': 1809024, 'steps': 9421, 'loss/train': 2.3442225456237793} -08/30/2021 14:51:10 - INFO - __main__ - Step 9423: {'lr': 0.0004969037947550151, 'samples': 1809216, 'steps': 9422, 'loss/train': 1.5826541185379028} -08/30/2021 14:51:10 - INFO - __main__ - Step 9424: {'lr': 0.000496902962094063, 'samples': 1809408, 'steps': 9423, 'loss/train': 2.43269944190979} -08/30/2021 14:51:10 - INFO - __main__ - Step 9425: {'lr': 0.0004969021293218602, 'samples': 1809600, 'steps': 9424, 'loss/train': 1.674534797668457} -08/30/2021 14:51:11 - INFO - __main__ - Step 9426: {'lr': 0.0004969012964384071, 'samples': 1809792, 'steps': 9425, 'loss/train': 2.499333381652832} -08/30/2021 14:51:13 - INFO - __main__ - Step 9427: {'lr': 0.0004969004634437042, 'samples': 1809984, 'steps': 9426, 'loss/train': 1.3876187801361084} -08/30/2021 14:51:13 - INFO - __main__ - Step 9428: {'lr': 0.0004968996303377517, 'samples': 1810176, 'steps': 9427, 'loss/train': 0.2191656529903412} -08/30/2021 14:51:13 - INFO - __main__ - Step 9429: {'lr': 0.00049689879712055, 'samples': 1810368, 'steps': 9428, 'loss/train': 0.17023412883281708} -08/30/2021 14:51:14 - INFO - __main__ - Step 9430: {'lr': 0.0004968979637920995, 'samples': 1810560, 'steps': 9429, 'loss/train': 1.1126787662506104} -08/30/2021 14:51:14 - INFO - __main__ - Step 9431: {'lr': 0.0004968971303524007, 'samples': 1810752, 'steps': 9430, 'loss/train': 1.171593189239502} -08/30/2021 14:51:14 - INFO - __main__ - Step 9432: {'lr': 0.0004968962968014537, 'samples': 1810944, 'steps': 9431, 'loss/train': 1.8794907331466675} -08/30/2021 14:51:16 - INFO - __main__ - Step 9433: {'lr': 0.0004968954631392592, 'samples': 1811136, 'steps': 9432, 'loss/train': 1.5810835361480713} -08/30/2021 14:51:16 - INFO - __main__ - Step 9434: {'lr': 0.0004968946293658173, 'samples': 1811328, 'steps': 9433, 'loss/train': 1.717587947845459} -08/30/2021 14:51:17 - INFO - __main__ - Step 9435: {'lr': 0.0004968937954811284, 'samples': 1811520, 'steps': 9434, 'loss/train': 1.9044227600097656} -08/30/2021 14:51:17 - INFO - __main__ - Step 9436: {'lr': 0.0004968929614851932, 'samples': 1811712, 'steps': 9435, 'loss/train': 2.173994779586792} -08/30/2021 14:51:18 - INFO - __main__ - Step 9437: {'lr': 0.0004968921273780118, 'samples': 1811904, 'steps': 9436, 'loss/train': 1.477209448814392} -08/30/2021 14:51:19 - INFO - __main__ - Step 9438: {'lr': 0.0004968912931595845, 'samples': 1812096, 'steps': 9437, 'loss/train': 1.643391728401184} -08/30/2021 14:51:20 - INFO - __main__ - Step 9439: {'lr': 0.0004968904588299118, 'samples': 1812288, 'steps': 9438, 'loss/train': 2.1049187183380127} -08/30/2021 14:51:20 - INFO - __main__ - Step 9440: {'lr': 0.0004968896243889941, 'samples': 1812480, 'steps': 9439, 'loss/train': 1.4536027908325195} -08/30/2021 14:51:21 - INFO - __main__ - Step 9441: {'lr': 0.0004968887898368318, 'samples': 1812672, 'steps': 9440, 'loss/train': 1.6639186143875122} -08/30/2021 14:51:21 - INFO - __main__ - Step 9442: {'lr': 0.0004968879551734252, 'samples': 1812864, 'steps': 9441, 'loss/train': 0.5168627500534058} -08/30/2021 14:51:21 - INFO - __main__ - Step 9443: {'lr': 0.0004968871203987746, 'samples': 1813056, 'steps': 9442, 'loss/train': 0.1469617784023285} -08/30/2021 14:51:23 - INFO - __main__ - Step 9444: {'lr': 0.0004968862855128806, 'samples': 1813248, 'steps': 9443, 'loss/train': 1.4375885725021362} -08/30/2021 14:51:23 - INFO - __main__ - Step 9445: {'lr': 0.0004968854505157434, 'samples': 1813440, 'steps': 9444, 'loss/train': 1.534547209739685} -08/30/2021 14:51:24 - INFO - __main__ - Step 9446: {'lr': 0.0004968846154073634, 'samples': 1813632, 'steps': 9445, 'loss/train': 1.9740641117095947} -08/30/2021 14:51:24 - INFO - __main__ - Step 9447: {'lr': 0.0004968837801877411, 'samples': 1813824, 'steps': 9446, 'loss/train': 1.5035918951034546} -08/30/2021 14:51:24 - INFO - __main__ - Step 9448: {'lr': 0.0004968829448568766, 'samples': 1814016, 'steps': 9447, 'loss/train': 2.2901721000671387} -08/30/2021 14:51:25 - INFO - __main__ - Step 9449: {'lr': 0.0004968821094147706, 'samples': 1814208, 'steps': 9448, 'loss/train': 1.6791605949401855} -08/30/2021 14:51:26 - INFO - __main__ - Step 9450: {'lr': 0.0004968812738614232, 'samples': 1814400, 'steps': 9449, 'loss/train': 1.6993780136108398} -08/30/2021 14:51:27 - INFO - __main__ - Step 9451: {'lr': 0.000496880438196835, 'samples': 1814592, 'steps': 9450, 'loss/train': 2.3020646572113037} -08/30/2021 14:51:27 - INFO - __main__ - Step 9452: {'lr': 0.0004968796024210064, 'samples': 1814784, 'steps': 9451, 'loss/train': 1.5926811695098877} -08/30/2021 14:51:27 - INFO - __main__ - Step 9453: {'lr': 0.0004968787665339375, 'samples': 1814976, 'steps': 9452, 'loss/train': 0.1305505633354187} -08/30/2021 14:51:28 - INFO - __main__ - Step 9454: {'lr': 0.0004968779305356289, 'samples': 1815168, 'steps': 9453, 'loss/train': 2.2053568363189697} -08/30/2021 14:51:29 - INFO - __main__ - Step 9455: {'lr': 0.0004968770944260808, 'samples': 1815360, 'steps': 9454, 'loss/train': 1.9923434257507324} -08/30/2021 14:51:30 - INFO - __main__ - Step 9456: {'lr': 0.0004968762582052938, 'samples': 1815552, 'steps': 9455, 'loss/train': 2.0484702587127686} -08/30/2021 14:51:30 - INFO - __main__ - Step 9457: {'lr': 0.0004968754218732682, 'samples': 1815744, 'steps': 9456, 'loss/train': 2.0139009952545166} -08/30/2021 14:51:30 - INFO - __main__ - Step 9458: {'lr': 0.0004968745854300043, 'samples': 1815936, 'steps': 9457, 'loss/train': 3.09591007232666} -08/30/2021 14:51:31 - INFO - __main__ - Step 9459: {'lr': 0.0004968737488755025, 'samples': 1816128, 'steps': 9458, 'loss/train': 2.00433611869812} -08/30/2021 14:51:33 - INFO - __main__ - Step 9460: {'lr': 0.0004968729122097632, 'samples': 1816320, 'steps': 9459, 'loss/train': 1.778140902519226} -08/30/2021 14:51:33 - INFO - __main__ - Step 9461: {'lr': 0.0004968720754327867, 'samples': 1816512, 'steps': 9460, 'loss/train': 1.7109475135803223} -08/30/2021 14:51:34 - INFO - __main__ - Step 9462: {'lr': 0.0004968712385445737, 'samples': 1816704, 'steps': 9461, 'loss/train': 0.22620485723018646} -08/30/2021 14:51:34 - INFO - __main__ - Step 9463: {'lr': 0.0004968704015451241, 'samples': 1816896, 'steps': 9462, 'loss/train': 1.6831026077270508} -08/30/2021 14:51:34 - INFO - __main__ - Step 9464: {'lr': 0.0004968695644344387, 'samples': 1817088, 'steps': 9463, 'loss/train': 2.1342976093292236} -08/30/2021 14:51:35 - INFO - __main__ - Step 9465: {'lr': 0.0004968687272125174, 'samples': 1817280, 'steps': 9464, 'loss/train': 1.927371621131897} -08/30/2021 14:51:36 - INFO - __main__ - Step 9466: {'lr': 0.0004968678898793611, 'samples': 1817472, 'steps': 9465, 'loss/train': 1.3137162923812866} -08/30/2021 14:51:37 - INFO - __main__ - Step 9467: {'lr': 0.0004968670524349699, 'samples': 1817664, 'steps': 9466, 'loss/train': 1.5771915912628174} -08/30/2021 14:51:37 - INFO - __main__ - Step 9468: {'lr': 0.0004968662148793441, 'samples': 1817856, 'steps': 9467, 'loss/train': 1.8674590587615967} -08/30/2021 14:51:37 - INFO - __main__ - Step 9469: {'lr': 0.0004968653772124843, 'samples': 1818048, 'steps': 9468, 'loss/train': 1.9872907400131226} -08/30/2021 14:51:38 - INFO - __main__ - Step 9470: {'lr': 0.0004968645394343908, 'samples': 1818240, 'steps': 9469, 'loss/train': 1.0401135683059692} -08/30/2021 14:51:38 - INFO - __main__ - Step 9471: {'lr': 0.0004968637015450639, 'samples': 1818432, 'steps': 9470, 'loss/train': 2.21691632270813} -08/30/2021 14:51:40 - INFO - __main__ - Step 9472: {'lr': 0.000496862863544504, 'samples': 1818624, 'steps': 9471, 'loss/train': 0.1765308529138565} -08/30/2021 14:51:40 - INFO - __main__ - Step 9473: {'lr': 0.0004968620254327114, 'samples': 1818816, 'steps': 9472, 'loss/train': 1.7371716499328613} -08/30/2021 14:51:40 - INFO - __main__ - Step 9474: {'lr': 0.0004968611872096868, 'samples': 1819008, 'steps': 9473, 'loss/train': 1.7049574851989746} -08/30/2021 14:51:41 - INFO - __main__ - Step 9475: {'lr': 0.0004968603488754302, 'samples': 1819200, 'steps': 9474, 'loss/train': 1.7634905576705933} -08/30/2021 14:51:41 - INFO - __main__ - Step 9476: {'lr': 0.0004968595104299422, 'samples': 1819392, 'steps': 9475, 'loss/train': 2.0750572681427} -08/30/2021 14:51:43 - INFO - __main__ - Step 9477: {'lr': 0.000496858671873223, 'samples': 1819584, 'steps': 9476, 'loss/train': 2.400235891342163} -08/30/2021 14:51:44 - INFO - __main__ - Step 9478: {'lr': 0.0004968578332052733, 'samples': 1819776, 'steps': 9477, 'loss/train': 2.051832675933838} -08/30/2021 14:51:44 - INFO - __main__ - Step 9479: {'lr': 0.0004968569944260932, 'samples': 1819968, 'steps': 9478, 'loss/train': 0.609390377998352} -08/30/2021 14:51:44 - INFO - __main__ - Step 9480: {'lr': 0.0004968561555356831, 'samples': 1820160, 'steps': 9479, 'loss/train': 1.7644001245498657} -08/30/2021 14:51:45 - INFO - __main__ - Step 9481: {'lr': 0.0004968553165340435, 'samples': 1820352, 'steps': 9480, 'loss/train': 1.7184343338012695} -08/30/2021 14:51:46 - INFO - __main__ - Step 9482: {'lr': 0.0004968544774211746, 'samples': 1820544, 'steps': 9481, 'loss/train': 1.5007576942443848} -08/30/2021 14:51:47 - INFO - __main__ - Step 9483: {'lr': 0.0004968536381970769, 'samples': 1820736, 'steps': 9482, 'loss/train': 1.4033454656600952} -08/30/2021 14:51:47 - INFO - __main__ - Step 9484: {'lr': 0.0004968527988617508, 'samples': 1820928, 'steps': 9483, 'loss/train': 1.3734347820281982} -08/30/2021 14:51:47 - INFO - __main__ - Step 9485: {'lr': 0.0004968519594151966, 'samples': 1821120, 'steps': 9484, 'loss/train': 1.854420781135559} -08/30/2021 14:51:48 - INFO - __main__ - Step 9486: {'lr': 0.0004968511198574147, 'samples': 1821312, 'steps': 9485, 'loss/train': 1.7000813484191895} -08/30/2021 14:51:49 - INFO - __main__ - Step 9487: {'lr': 0.0004968502801884056, 'samples': 1821504, 'steps': 9486, 'loss/train': 0.19344857335090637} -08/30/2021 14:51:50 - INFO - __main__ - Step 9488: {'lr': 0.0004968494404081695, 'samples': 1821696, 'steps': 9487, 'loss/train': 1.6949357986450195} -08/30/2021 14:51:50 - INFO - __main__ - Step 9489: {'lr': 0.0004968486005167069, 'samples': 1821888, 'steps': 9488, 'loss/train': 1.9569776058197021} -08/30/2021 14:51:51 - INFO - __main__ - Step 9490: {'lr': 0.000496847760514018, 'samples': 1822080, 'steps': 9489, 'loss/train': 1.227189540863037} -08/30/2021 14:51:51 - INFO - __main__ - Step 9491: {'lr': 0.0004968469204001035, 'samples': 1822272, 'steps': 9490, 'loss/train': 1.703311800956726} -08/30/2021 14:51:51 - INFO - __main__ - Step 9492: {'lr': 0.0004968460801749635, 'samples': 1822464, 'steps': 9491, 'loss/train': 1.6264091730117798} -08/30/2021 14:51:53 - INFO - __main__ - Step 9493: {'lr': 0.0004968452398385984, 'samples': 1822656, 'steps': 9492, 'loss/train': 1.5646148920059204} -08/30/2021 14:51:53 - INFO - __main__ - Step 9494: {'lr': 0.0004968443993910086, 'samples': 1822848, 'steps': 9493, 'loss/train': 1.6149001121520996} -08/30/2021 14:51:54 - INFO - __main__ - Step 9495: {'lr': 0.0004968435588321947, 'samples': 1823040, 'steps': 9494, 'loss/train': 3.129379987716675} -08/30/2021 14:51:54 - INFO - __main__ - Step 9496: {'lr': 0.0004968427181621567, 'samples': 1823232, 'steps': 9495, 'loss/train': 1.9704177379608154} -08/30/2021 14:51:54 - INFO - __main__ - Step 9497: {'lr': 0.0004968418773808954, 'samples': 1823424, 'steps': 9496, 'loss/train': 1.985621452331543} -08/30/2021 14:51:56 - INFO - __main__ - Step 9498: {'lr': 0.0004968410364884109, 'samples': 1823616, 'steps': 9497, 'loss/train': 2.15446138381958} -08/30/2021 14:51:56 - INFO - __main__ - Step 9499: {'lr': 0.0004968401954847035, 'samples': 1823808, 'steps': 9498, 'loss/train': 1.961751103401184} -08/30/2021 14:51:57 - INFO - __main__ - Step 9500: {'lr': 0.0004968393543697739, 'samples': 1824000, 'steps': 9499, 'loss/train': 1.8978371620178223} -08/30/2021 14:51:57 - INFO - __main__ - Step 9501: {'lr': 0.0004968385131436222, 'samples': 1824192, 'steps': 9500, 'loss/train': 2.069866895675659} -08/30/2021 14:51:57 - INFO - __main__ - Step 9502: {'lr': 0.0004968376718062488, 'samples': 1824384, 'steps': 9501, 'loss/train': 2.285006284713745} -08/30/2021 14:51:58 - INFO - __main__ - Step 9503: {'lr': 0.0004968368303576542, 'samples': 1824576, 'steps': 9502, 'loss/train': 2.062350034713745} -08/30/2021 14:51:59 - INFO - __main__ - Step 9504: {'lr': 0.0004968359887978389, 'samples': 1824768, 'steps': 9503, 'loss/train': 2.0324878692626953} -08/30/2021 14:52:00 - INFO - __main__ - Step 9505: {'lr': 0.0004968351471268029, 'samples': 1824960, 'steps': 9504, 'loss/train': 1.6162992715835571} -08/30/2021 14:52:00 - INFO - __main__ - Step 9506: {'lr': 0.0004968343053445469, 'samples': 1825152, 'steps': 9505, 'loss/train': 1.7939414978027344} -08/30/2021 14:52:00 - INFO - __main__ - Step 9507: {'lr': 0.0004968334634510712, 'samples': 1825344, 'steps': 9506, 'loss/train': 1.7104524374008179} -08/30/2021 14:52:01 - INFO - __main__ - Step 9508: {'lr': 0.000496832621446376, 'samples': 1825536, 'steps': 9507, 'loss/train': 1.705259919166565} -08/30/2021 14:52:02 - INFO - __main__ - Step 9509: {'lr': 0.000496831779330462, 'samples': 1825728, 'steps': 9508, 'loss/train': 2.0026159286499023} -08/30/2021 14:52:03 - INFO - __main__ - Step 9510: {'lr': 0.0004968309371033293, 'samples': 1825920, 'steps': 9509, 'loss/train': 2.0757880210876465} -08/30/2021 14:52:03 - INFO - __main__ - Step 9511: {'lr': 0.0004968300947649784, 'samples': 1826112, 'steps': 9510, 'loss/train': 0.965133547782898} -08/30/2021 14:52:03 - INFO - __main__ - Step 9512: {'lr': 0.0004968292523154096, 'samples': 1826304, 'steps': 9511, 'loss/train': 1.057422161102295} -08/30/2021 14:52:04 - INFO - __main__ - Step 9513: {'lr': 0.0004968284097546235, 'samples': 1826496, 'steps': 9512, 'loss/train': 2.2127723693847656} -08/30/2021 14:52:05 - INFO - __main__ - Step 9514: {'lr': 0.0004968275670826204, 'samples': 1826688, 'steps': 9513, 'loss/train': 1.9112217426300049} -08/30/2021 14:52:06 - INFO - __main__ - Step 9515: {'lr': 0.0004968267242994003, 'samples': 1826880, 'steps': 9514, 'loss/train': 2.016266345977783} -08/30/2021 14:52:06 - INFO - __main__ - Step 9516: {'lr': 0.0004968258814049641, 'samples': 1827072, 'steps': 9515, 'loss/train': 1.8917293548583984} -08/30/2021 14:52:06 - INFO - __main__ - Step 9517: {'lr': 0.0004968250383993119, 'samples': 1827264, 'steps': 9516, 'loss/train': 1.3322018384933472} -08/30/2021 14:52:07 - INFO - __main__ - Step 9518: {'lr': 0.0004968241952824442, 'samples': 1827456, 'steps': 9517, 'loss/train': 1.6007182598114014} -08/30/2021 14:52:08 - INFO - __main__ - Step 9519: {'lr': 0.0004968233520543613, 'samples': 1827648, 'steps': 9518, 'loss/train': 2.4424338340759277} -08/30/2021 14:52:09 - INFO - __main__ - Step 9520: {'lr': 0.0004968225087150636, 'samples': 1827840, 'steps': 9519, 'loss/train': 1.8217027187347412} -08/30/2021 14:52:09 - INFO - __main__ - Step 9521: {'lr': 0.0004968216652645515, 'samples': 1828032, 'steps': 9520, 'loss/train': 0.14912250638008118} -08/30/2021 14:52:09 - INFO - __main__ - Step 9522: {'lr': 0.0004968208217028254, 'samples': 1828224, 'steps': 9521, 'loss/train': 1.905614972114563} -08/30/2021 14:52:10 - INFO - __main__ - Step 9523: {'lr': 0.0004968199780298855, 'samples': 1828416, 'steps': 9522, 'loss/train': 2.1052048206329346} -08/30/2021 14:52:10 - INFO - __main__ - Step 9524: {'lr': 0.0004968191342457325, 'samples': 1828608, 'steps': 9523, 'loss/train': 1.7192381620407104} -08/30/2021 14:52:12 - INFO - __main__ - Step 9525: {'lr': 0.0004968182903503665, 'samples': 1828800, 'steps': 9524, 'loss/train': 1.6907083988189697} -08/30/2021 14:52:12 - INFO - __main__ - Step 9526: {'lr': 0.0004968174463437881, 'samples': 1828992, 'steps': 9525, 'loss/train': 2.139465570449829} -08/30/2021 14:52:13 - INFO - __main__ - Step 9527: {'lr': 0.0004968166022259974, 'samples': 1829184, 'steps': 9526, 'loss/train': 1.5463396310806274} -08/30/2021 14:52:13 - INFO - __main__ - Step 9528: {'lr': 0.0004968157579969951, 'samples': 1829376, 'steps': 9527, 'loss/train': 1.697893738746643} -08/30/2021 14:52:13 - INFO - __main__ - Step 9529: {'lr': 0.0004968149136567814, 'samples': 1829568, 'steps': 9528, 'loss/train': 1.9812012910842896} -08/30/2021 14:52:15 - INFO - __main__ - Step 9530: {'lr': 0.0004968140692053567, 'samples': 1829760, 'steps': 9529, 'loss/train': 1.7304465770721436} -08/30/2021 14:52:16 - INFO - __main__ - Step 9531: {'lr': 0.0004968132246427212, 'samples': 1829952, 'steps': 9530, 'loss/train': 1.9630389213562012} -08/30/2021 14:52:16 - INFO - __main__ - Step 9532: {'lr': 0.0004968123799688757, 'samples': 1830144, 'steps': 9531, 'loss/train': 1.8219130039215088} -08/30/2021 14:52:17 - INFO - __main__ - Step 9533: {'lr': 0.0004968115351838203, 'samples': 1830336, 'steps': 9532, 'loss/train': 2.0107686519622803} -08/30/2021 14:52:17 - INFO - __main__ - Step 9534: {'lr': 0.0004968106902875554, 'samples': 1830528, 'steps': 9533, 'loss/train': 1.0331999063491821} -08/30/2021 14:52:19 - INFO - __main__ - Step 9535: {'lr': 0.0004968098452800815, 'samples': 1830720, 'steps': 9534, 'loss/train': 2.015059471130371} -08/30/2021 14:52:19 - INFO - __main__ - Step 9536: {'lr': 0.0004968090001613987, 'samples': 1830912, 'steps': 9535, 'loss/train': 1.7272931337356567} -08/30/2021 14:52:20 - INFO - __main__ - Step 9537: {'lr': 0.0004968081549315078, 'samples': 1831104, 'steps': 9536, 'loss/train': 2.008720874786377} -08/30/2021 14:52:20 - INFO - __main__ - Step 9538: {'lr': 0.0004968073095904088, 'samples': 1831296, 'steps': 9537, 'loss/train': 1.7935843467712402} -08/30/2021 14:52:20 - INFO - __main__ - Step 9539: {'lr': 0.0004968064641381022, 'samples': 1831488, 'steps': 9538, 'loss/train': 0.15976040065288544} -08/30/2021 14:52:22 - INFO - __main__ - Step 9540: {'lr': 0.0004968056185745886, 'samples': 1831680, 'steps': 9539, 'loss/train': 1.9459625482559204} -08/30/2021 14:52:22 - INFO - __main__ - Step 9541: {'lr': 0.000496804772899868, 'samples': 1831872, 'steps': 9540, 'loss/train': 1.6825783252716064} -08/30/2021 14:52:23 - INFO - __main__ - Step 9542: {'lr': 0.0004968039271139412, 'samples': 1832064, 'steps': 9541, 'loss/train': 1.8675510883331299} -08/30/2021 14:52:23 - INFO - __main__ - Step 9543: {'lr': 0.0004968030812168082, 'samples': 1832256, 'steps': 9542, 'loss/train': 1.6803189516067505} -08/30/2021 14:52:23 - INFO - __main__ - Step 9544: {'lr': 0.0004968022352084695, 'samples': 1832448, 'steps': 9543, 'loss/train': 2.097487211227417} -08/30/2021 14:52:25 - INFO - __main__ - Step 9545: {'lr': 0.0004968013890889256, 'samples': 1832640, 'steps': 9544, 'loss/train': 1.791940689086914} -08/30/2021 14:52:26 - INFO - __main__ - Step 9546: {'lr': 0.0004968005428581767, 'samples': 1832832, 'steps': 9545, 'loss/train': 2.2272696495056152} -08/30/2021 14:52:26 - INFO - __main__ - Step 9547: {'lr': 0.0004967996965162235, 'samples': 1833024, 'steps': 9546, 'loss/train': 4.577334403991699} -08/30/2021 14:52:27 - INFO - __main__ - Step 9548: {'lr': 0.0004967988500630661, 'samples': 1833216, 'steps': 9547, 'loss/train': 7.04046630859375} -08/30/2021 14:52:27 - INFO - __main__ - Step 9549: {'lr': 0.0004967980034987048, 'samples': 1833408, 'steps': 9548, 'loss/train': 1.5037380456924438} -08/30/2021 14:52:27 - INFO - __main__ - Step 9550: {'lr': 0.0004967971568231402, 'samples': 1833600, 'steps': 9549, 'loss/train': 2.0027918815612793} -08/30/2021 14:52:29 - INFO - __main__ - Step 9551: {'lr': 0.0004967963100363726, 'samples': 1833792, 'steps': 9550, 'loss/train': 1.8694095611572266} -08/30/2021 14:52:29 - INFO - __main__ - Step 9552: {'lr': 0.0004967954631384025, 'samples': 1833984, 'steps': 9551, 'loss/train': 2.3288567066192627} -08/30/2021 14:52:30 - INFO - __main__ - Step 9553: {'lr': 0.00049679461612923, 'samples': 1834176, 'steps': 9552, 'loss/train': 1.8898195028305054} -08/30/2021 14:52:30 - INFO - __main__ - Step 9554: {'lr': 0.0004967937690088558, 'samples': 1834368, 'steps': 9553, 'loss/train': 1.0987898111343384} -08/30/2021 14:52:30 - INFO - __main__ - Step 9555: {'lr': 0.0004967929217772801, 'samples': 1834560, 'steps': 9554, 'loss/train': 1.653060793876648} -08/30/2021 14:52:32 - INFO - __main__ - Step 9556: {'lr': 0.0004967920744345033, 'samples': 1834752, 'steps': 9555, 'loss/train': 1.5633423328399658} -08/30/2021 14:52:32 - INFO - __main__ - Step 9557: {'lr': 0.0004967912269805257, 'samples': 1834944, 'steps': 9556, 'loss/train': 1.1584726572036743} -08/30/2021 14:52:33 - INFO - __main__ - Step 9558: {'lr': 0.000496790379415348, 'samples': 1835136, 'steps': 9557, 'loss/train': 2.092374563217163} -08/30/2021 14:52:33 - INFO - __main__ - Step 9559: {'lr': 0.0004967895317389702, 'samples': 1835328, 'steps': 9558, 'loss/train': 1.9063400030136108} -08/30/2021 14:52:33 - INFO - __main__ - Step 9560: {'lr': 0.0004967886839513929, 'samples': 1835520, 'steps': 9559, 'loss/train': 1.8805854320526123} -08/30/2021 14:52:35 - INFO - __main__ - Step 9561: {'lr': 0.0004967878360526163, 'samples': 1835712, 'steps': 9560, 'loss/train': 0.5825358629226685} -08/30/2021 14:52:35 - INFO - __main__ - Step 9562: {'lr': 0.0004967869880426411, 'samples': 1835904, 'steps': 9561, 'loss/train': 1.65834379196167} -08/30/2021 14:52:36 - INFO - __main__ - Step 9563: {'lr': 0.0004967861399214674, 'samples': 1836096, 'steps': 9562, 'loss/train': 1.0580202341079712} -08/30/2021 14:52:36 - INFO - __main__ - Step 9564: {'lr': 0.0004967852916890958, 'samples': 1836288, 'steps': 9563, 'loss/train': 1.9563688039779663} -08/30/2021 14:52:36 - INFO - __main__ - Step 9565: {'lr': 0.0004967844433455263, 'samples': 1836480, 'steps': 9564, 'loss/train': 1.885180115699768} -08/30/2021 14:52:38 - INFO - __main__ - Step 9566: {'lr': 0.0004967835948907598, 'samples': 1836672, 'steps': 9565, 'loss/train': 2.490196466445923} -08/30/2021 14:52:38 - INFO - __main__ - Step 9567: {'lr': 0.0004967827463247962, 'samples': 1836864, 'steps': 9566, 'loss/train': 1.6596322059631348} -08/30/2021 14:52:39 - INFO - __main__ - Step 9568: {'lr': 0.0004967818976476363, 'samples': 1837056, 'steps': 9567, 'loss/train': 1.840817928314209} -08/30/2021 14:52:39 - INFO - __main__ - Step 9569: {'lr': 0.0004967810488592801, 'samples': 1837248, 'steps': 9568, 'loss/train': 2.142194986343384} -08/30/2021 14:52:39 - INFO - __main__ - Step 9570: {'lr': 0.0004967801999597283, 'samples': 1837440, 'steps': 9569, 'loss/train': 2.2547035217285156} -08/30/2021 14:52:41 - INFO - __main__ - Step 9571: {'lr': 0.0004967793509489811, 'samples': 1837632, 'steps': 9570, 'loss/train': 1.8984874486923218} -08/30/2021 14:52:42 - INFO - __main__ - Step 9572: {'lr': 0.0004967785018270389, 'samples': 1837824, 'steps': 9571, 'loss/train': 1.471620798110962} -08/30/2021 14:52:42 - INFO - __main__ - Step 9573: {'lr': 0.0004967776525939022, 'samples': 1838016, 'steps': 9572, 'loss/train': 2.029245615005493} -08/30/2021 14:52:42 - INFO - __main__ - Step 9574: {'lr': 0.0004967768032495712, 'samples': 1838208, 'steps': 9573, 'loss/train': 1.9916651248931885} -08/30/2021 14:52:43 - INFO - __main__ - Step 9575: {'lr': 0.0004967759537940464, 'samples': 1838400, 'steps': 9574, 'loss/train': 0.35771846771240234} -08/30/2021 14:52:44 - INFO - __main__ - Step 9576: {'lr': 0.0004967751042273282, 'samples': 1838592, 'steps': 9575, 'loss/train': 1.7091983556747437} -08/30/2021 14:52:45 - INFO - __main__ - Step 9577: {'lr': 0.000496774254549417, 'samples': 1838784, 'steps': 9576, 'loss/train': 2.095242738723755} -08/30/2021 14:52:45 - INFO - __main__ - Step 9578: {'lr': 0.0004967734047603131, 'samples': 1838976, 'steps': 9577, 'loss/train': 0.8464174866676331} -08/30/2021 14:52:45 - INFO - __main__ - Step 9579: {'lr': 0.0004967725548600168, 'samples': 1839168, 'steps': 9578, 'loss/train': 1.780236840248108} -08/30/2021 14:52:46 - INFO - __main__ - Step 9580: {'lr': 0.0004967717048485287, 'samples': 1839360, 'steps': 9579, 'loss/train': 1.5458338260650635} -08/30/2021 14:52:46 - INFO - __main__ - Step 9581: {'lr': 0.000496770854725849, 'samples': 1839552, 'steps': 9580, 'loss/train': 1.8168420791625977} -08/30/2021 14:52:48 - INFO - __main__ - Step 9582: {'lr': 0.0004967700044919783, 'samples': 1839744, 'steps': 9581, 'loss/train': 2.481297731399536} -08/30/2021 14:52:48 - INFO - __main__ - Step 9583: {'lr': 0.0004967691541469167, 'samples': 1839936, 'steps': 9582, 'loss/train': 1.9234411716461182} -08/30/2021 14:52:49 - INFO - __main__ - Step 9584: {'lr': 0.0004967683036906648, 'samples': 1840128, 'steps': 9583, 'loss/train': 0.19581331312656403} -08/30/2021 14:52:49 - INFO - __main__ - Step 9585: {'lr': 0.0004967674531232229, 'samples': 1840320, 'steps': 9584, 'loss/train': 2.079195261001587} -08/30/2021 14:52:49 - INFO - __main__ - Step 9586: {'lr': 0.0004967666024445913, 'samples': 1840512, 'steps': 9585, 'loss/train': 1.999889612197876} -08/30/2021 14:52:51 - INFO - __main__ - Step 9587: {'lr': 0.0004967657516547707, 'samples': 1840704, 'steps': 9586, 'loss/train': 2.023404359817505} -08/30/2021 14:52:52 - INFO - __main__ - Step 9588: {'lr': 0.0004967649007537611, 'samples': 1840896, 'steps': 9587, 'loss/train': 2.1839041709899902} -08/30/2021 14:52:52 - INFO - __main__ - Step 9589: {'lr': 0.0004967640497415631, 'samples': 1841088, 'steps': 9588, 'loss/train': 1.8167579174041748} -08/30/2021 14:52:52 - INFO - __main__ - Step 9590: {'lr': 0.000496763198618177, 'samples': 1841280, 'steps': 9589, 'loss/train': 1.192988395690918} -08/30/2021 14:52:53 - INFO - __main__ - Step 9591: {'lr': 0.0004967623473836032, 'samples': 1841472, 'steps': 9590, 'loss/train': 1.9897503852844238} -08/30/2021 14:52:54 - INFO - __main__ - Step 9592: {'lr': 0.0004967614960378421, 'samples': 1841664, 'steps': 9591, 'loss/train': 1.6394896507263184} -08/30/2021 14:52:55 - INFO - __main__ - Step 9593: {'lr': 0.000496760644580894, 'samples': 1841856, 'steps': 9592, 'loss/train': 1.881445288658142} -08/30/2021 14:52:55 - INFO - __main__ - Step 9594: {'lr': 0.0004967597930127595, 'samples': 1842048, 'steps': 9593, 'loss/train': 3.591984987258911} -08/30/2021 14:52:56 - INFO - __main__ - Step 9595: {'lr': 0.0004967589413334387, 'samples': 1842240, 'steps': 9594, 'loss/train': 1.8645308017730713} -08/30/2021 14:52:56 - INFO - __main__ - Step 9596: {'lr': 0.0004967580895429322, 'samples': 1842432, 'steps': 9595, 'loss/train': 1.7857896089553833} -08/30/2021 14:52:57 - INFO - __main__ - Step 9597: {'lr': 0.0004967572376412405, 'samples': 1842624, 'steps': 9596, 'loss/train': 2.2183992862701416} -08/30/2021 14:52:58 - INFO - __main__ - Step 9598: {'lr': 0.0004967563856283636, 'samples': 1842816, 'steps': 9597, 'loss/train': 1.6056443452835083} -08/30/2021 14:52:58 - INFO - __main__ - Step 9599: {'lr': 0.000496755533504302, 'samples': 1843008, 'steps': 9598, 'loss/train': 1.9285104274749756} -08/30/2021 14:52:59 - INFO - __main__ - Step 9600: {'lr': 0.0004967546812690563, 'samples': 1843200, 'steps': 9599, 'loss/train': 2.4664130210876465} -08/30/2021 14:52:59 - INFO - __main__ - Step 9601: {'lr': 0.0004967538289226267, 'samples': 1843392, 'steps': 9600, 'loss/train': 2.390072822570801} -08/30/2021 14:52:59 - INFO - __main__ - Step 9602: {'lr': 0.0004967529764650137, 'samples': 1843584, 'steps': 9601, 'loss/train': 1.3265252113342285} -08/30/2021 14:53:01 - INFO - __main__ - Step 9603: {'lr': 0.0004967521238962175, 'samples': 1843776, 'steps': 9602, 'loss/train': 2.01141095161438} -08/30/2021 14:53:01 - INFO - __main__ - Step 9604: {'lr': 0.0004967512712162387, 'samples': 1843968, 'steps': 9603, 'loss/train': 1.1177914142608643} -08/30/2021 14:53:02 - INFO - __main__ - Step 9605: {'lr': 0.0004967504184250775, 'samples': 1844160, 'steps': 9604, 'loss/train': 1.9945052862167358} -08/30/2021 14:53:02 - INFO - __main__ - Step 9606: {'lr': 0.0004967495655227344, 'samples': 1844352, 'steps': 9605, 'loss/train': 2.2381575107574463} -08/30/2021 14:53:02 - INFO - __main__ - Step 9607: {'lr': 0.0004967487125092098, 'samples': 1844544, 'steps': 9606, 'loss/train': 1.798716425895691} -08/30/2021 14:53:04 - INFO - __main__ - Step 9608: {'lr': 0.0004967478593845041, 'samples': 1844736, 'steps': 9607, 'loss/train': 1.7776857614517212} -08/30/2021 14:53:04 - INFO - __main__ - Step 9609: {'lr': 0.0004967470061486175, 'samples': 1844928, 'steps': 9608, 'loss/train': 1.7392473220825195} -08/30/2021 14:53:05 - INFO - __main__ - Step 9610: {'lr': 0.0004967461528015506, 'samples': 1845120, 'steps': 9609, 'loss/train': 1.9466431140899658} -08/30/2021 14:53:05 - INFO - __main__ - Step 9611: {'lr': 0.0004967452993433036, 'samples': 1845312, 'steps': 9610, 'loss/train': 1.838362216949463} -08/30/2021 14:53:05 - INFO - __main__ - Step 9612: {'lr': 0.0004967444457738769, 'samples': 1845504, 'steps': 9611, 'loss/train': 0.1852114498615265} -08/30/2021 14:53:07 - INFO - __main__ - Step 9613: {'lr': 0.0004967435920932711, 'samples': 1845696, 'steps': 9612, 'loss/train': 2.0451154708862305} -08/30/2021 14:53:07 - INFO - __main__ - Step 9614: {'lr': 0.0004967427383014865, 'samples': 1845888, 'steps': 9613, 'loss/train': 0.8990710973739624} -08/30/2021 14:53:08 - INFO - __main__ - Step 9615: {'lr': 0.0004967418843985233, 'samples': 1846080, 'steps': 9614, 'loss/train': 1.021018624305725} -08/30/2021 14:53:08 - INFO - __main__ - Step 9616: {'lr': 0.0004967410303843821, 'samples': 1846272, 'steps': 9615, 'loss/train': 1.8680695295333862} -08/30/2021 14:53:08 - INFO - __main__ - Step 9617: {'lr': 0.0004967401762590631, 'samples': 1846464, 'steps': 9616, 'loss/train': 1.7404403686523438} -08/30/2021 14:53:10 - INFO - __main__ - Step 9618: {'lr': 0.0004967393220225668, 'samples': 1846656, 'steps': 9617, 'loss/train': 2.0626628398895264} -08/30/2021 14:53:10 - INFO - __main__ - Step 9619: {'lr': 0.0004967384676748936, 'samples': 1846848, 'steps': 9618, 'loss/train': 2.7807576656341553} -08/30/2021 14:53:11 - INFO - __main__ - Step 9620: {'lr': 0.0004967376132160438, 'samples': 1847040, 'steps': 9619, 'loss/train': 2.164260149002075} -08/30/2021 14:53:11 - INFO - __main__ - Step 9621: {'lr': 0.000496736758646018, 'samples': 1847232, 'steps': 9620, 'loss/train': 1.8069162368774414} -08/30/2021 14:53:11 - INFO - __main__ - Step 9622: {'lr': 0.0004967359039648163, 'samples': 1847424, 'steps': 9621, 'loss/train': 1.8062012195587158} -08/30/2021 14:53:13 - INFO - __main__ - Step 9623: {'lr': 0.0004967350491724392, 'samples': 1847616, 'steps': 9622, 'loss/train': 1.4811952114105225} -08/30/2021 14:53:13 - INFO - __main__ - Step 9624: {'lr': 0.0004967341942688872, 'samples': 1847808, 'steps': 9623, 'loss/train': 2.2838680744171143} -08/30/2021 14:53:14 - INFO - __main__ - Step 9625: {'lr': 0.0004967333392541604, 'samples': 1848000, 'steps': 9624, 'loss/train': 1.7904081344604492} -08/30/2021 14:53:14 - INFO - __main__ - Step 9626: {'lr': 0.0004967324841282596, 'samples': 1848192, 'steps': 9625, 'loss/train': 2.0094234943389893} -08/30/2021 14:53:14 - INFO - __main__ - Step 9627: {'lr': 0.0004967316288911847, 'samples': 1848384, 'steps': 9626, 'loss/train': 2.010408401489258} -08/30/2021 14:53:16 - INFO - __main__ - Step 9628: {'lr': 0.0004967307735429365, 'samples': 1848576, 'steps': 9627, 'loss/train': 1.8527088165283203} -08/30/2021 14:53:17 - INFO - __main__ - Step 9629: {'lr': 0.0004967299180835153, 'samples': 1848768, 'steps': 9628, 'loss/train': 1.859185814857483} -08/30/2021 14:53:17 - INFO - __main__ - Step 9630: {'lr': 0.0004967290625129212, 'samples': 1848960, 'steps': 9629, 'loss/train': 1.5661931037902832} -08/30/2021 14:53:17 - INFO - __main__ - Step 9631: {'lr': 0.0004967282068311548, 'samples': 1849152, 'steps': 9630, 'loss/train': 1.8538151979446411} -08/30/2021 14:53:18 - INFO - __main__ - Step 9632: {'lr': 0.0004967273510382166, 'samples': 1849344, 'steps': 9631, 'loss/train': 1.946212887763977} -08/30/2021 14:53:18 - INFO - __main__ - Step 9633: {'lr': 0.0004967264951341069, 'samples': 1849536, 'steps': 9632, 'loss/train': 1.5135653018951416} -08/30/2021 14:53:20 - INFO - __main__ - Step 9634: {'lr': 0.0004967256391188258, 'samples': 1849728, 'steps': 9633, 'loss/train': 0.2908616065979004} -08/30/2021 14:53:20 - INFO - __main__ - Step 9635: {'lr': 0.0004967247829923742, 'samples': 1849920, 'steps': 9634, 'loss/train': 1.8376696109771729} -08/30/2021 14:53:20 - INFO - __main__ - Step 9636: {'lr': 0.0004967239267547521, 'samples': 1850112, 'steps': 9635, 'loss/train': 1.7155654430389404} -08/30/2021 14:53:21 - INFO - __main__ - Step 9637: {'lr': 0.00049672307040596, 'samples': 1850304, 'steps': 9636, 'loss/train': 1.8015106916427612} -08/30/2021 14:53:21 - INFO - __main__ - Step 9638: {'lr': 0.0004967222139459983, 'samples': 1850496, 'steps': 9637, 'loss/train': 1.6642169952392578} -08/30/2021 14:53:23 - INFO - __main__ - Step 9639: {'lr': 0.0004967213573748674, 'samples': 1850688, 'steps': 9638, 'loss/train': 2.2503201961517334} -08/30/2021 14:53:24 - INFO - __main__ - Step 9640: {'lr': 0.0004967205006925677, 'samples': 1850880, 'steps': 9639, 'loss/train': 1.7300949096679688} -08/30/2021 14:53:24 - INFO - __main__ - Step 9641: {'lr': 0.0004967196438990995, 'samples': 1851072, 'steps': 9640, 'loss/train': 1.4293779134750366} -08/30/2021 14:53:24 - INFO - __main__ - Step 9642: {'lr': 0.0004967187869944632, 'samples': 1851264, 'steps': 9641, 'loss/train': 2.84515380859375} -08/30/2021 14:53:25 - INFO - __main__ - Step 9643: {'lr': 0.0004967179299786593, 'samples': 1851456, 'steps': 9642, 'loss/train': 1.5416079759597778} -08/30/2021 14:53:25 - INFO - __main__ - Step 9644: {'lr': 0.000496717072851688, 'samples': 1851648, 'steps': 9643, 'loss/train': 1.9394845962524414} -08/30/2021 14:53:27 - INFO - __main__ - Step 9645: {'lr': 0.0004967162156135499, 'samples': 1851840, 'steps': 9644, 'loss/train': 2.371034860610962} -08/30/2021 14:53:27 - INFO - __main__ - Step 9646: {'lr': 0.0004967153582642452, 'samples': 1852032, 'steps': 9645, 'loss/train': 1.4911154508590698} -08/30/2021 14:53:27 - INFO - __main__ - Step 9647: {'lr': 0.0004967145008037744, 'samples': 1852224, 'steps': 9646, 'loss/train': 2.4870901107788086} -08/30/2021 14:53:28 - INFO - __main__ - Step 9648: {'lr': 0.000496713643232138, 'samples': 1852416, 'steps': 9647, 'loss/train': 2.0515434741973877} -08/30/2021 14:53:28 - INFO - __main__ - Step 9649: {'lr': 0.000496712785549336, 'samples': 1852608, 'steps': 9648, 'loss/train': 2.0488858222961426} -08/30/2021 14:53:30 - INFO - __main__ - Step 9650: {'lr': 0.0004967119277553692, 'samples': 1852800, 'steps': 9649, 'loss/train': 1.652200698852539} -08/30/2021 14:53:30 - INFO - __main__ - Step 9651: {'lr': 0.0004967110698502377, 'samples': 1852992, 'steps': 9650, 'loss/train': 1.6506527662277222} -08/30/2021 14:53:31 - INFO - __main__ - Step 9652: {'lr': 0.000496710211833942, 'samples': 1853184, 'steps': 9651, 'loss/train': 1.3091411590576172} -08/30/2021 14:53:31 - INFO - __main__ - Step 9653: {'lr': 0.0004967093537064825, 'samples': 1853376, 'steps': 9652, 'loss/train': 2.4822838306427} -08/30/2021 14:53:31 - INFO - __main__ - Step 9654: {'lr': 0.0004967084954678597, 'samples': 1853568, 'steps': 9653, 'loss/train': 1.5479607582092285} -08/30/2021 14:53:33 - INFO - __main__ - Step 9655: {'lr': 0.0004967076371180738, 'samples': 1853760, 'steps': 9654, 'loss/train': 1.7819963693618774} -08/30/2021 14:53:33 - INFO - __main__ - Step 9656: {'lr': 0.0004967067786571251, 'samples': 1853952, 'steps': 9655, 'loss/train': 0.712238609790802} -08/30/2021 14:53:34 - INFO - __main__ - Step 9657: {'lr': 0.0004967059200850142, 'samples': 1854144, 'steps': 9656, 'loss/train': 1.739729881286621} -08/30/2021 14:53:34 - INFO - __main__ - Step 9658: {'lr': 0.0004967050614017415, 'samples': 1854336, 'steps': 9657, 'loss/train': 0.6492201089859009} -08/30/2021 14:53:35 - INFO - __main__ - Step 9659: {'lr': 0.0004967042026073073, 'samples': 1854528, 'steps': 9658, 'loss/train': 2.296637773513794} -08/30/2021 14:53:35 - INFO - __main__ - Step 9660: {'lr': 0.000496703343701712, 'samples': 1854720, 'steps': 9659, 'loss/train': 1.7050857543945312} -08/30/2021 14:53:36 - INFO - __main__ - Step 9661: {'lr': 0.0004967024846849558, 'samples': 1854912, 'steps': 9660, 'loss/train': 1.9776008129119873} -08/30/2021 14:53:37 - INFO - __main__ - Step 9662: {'lr': 0.0004967016255570394, 'samples': 1855104, 'steps': 9661, 'loss/train': 0.28526273369789124} -08/30/2021 14:53:37 - INFO - __main__ - Step 9663: {'lr': 0.0004967007663179632, 'samples': 1855296, 'steps': 9662, 'loss/train': 0.7856886982917786} -08/30/2021 14:53:38 - INFO - __main__ - Step 9664: {'lr': 0.0004966999069677272, 'samples': 1855488, 'steps': 9663, 'loss/train': 1.9313335418701172} -08/30/2021 14:53:38 - INFO - __main__ - Step 9665: {'lr': 0.0004966990475063321, 'samples': 1855680, 'steps': 9664, 'loss/train': 1.558266282081604} -08/30/2021 14:53:39 - INFO - __main__ - Step 9666: {'lr': 0.0004966981879337783, 'samples': 1855872, 'steps': 9665, 'loss/train': 1.5345159769058228} -08/30/2021 14:53:40 - INFO - __main__ - Step 9667: {'lr': 0.0004966973282500661, 'samples': 1856064, 'steps': 9666, 'loss/train': 1.8651546239852905} -08/30/2021 14:53:40 - INFO - __main__ - Step 9668: {'lr': 0.0004966964684551958, 'samples': 1856256, 'steps': 9667, 'loss/train': 1.5681730508804321} -08/30/2021 14:53:40 - INFO - __main__ - Step 9669: {'lr': 0.0004966956085491679, 'samples': 1856448, 'steps': 9668, 'loss/train': 1.5579904317855835} -08/30/2021 14:53:41 - INFO - __main__ - Step 9670: {'lr': 0.0004966947485319828, 'samples': 1856640, 'steps': 9669, 'loss/train': 1.712479829788208} -08/30/2021 14:53:42 - INFO - __main__ - Step 9671: {'lr': 0.0004966938884036408, 'samples': 1856832, 'steps': 9670, 'loss/train': 1.6334211826324463} -08/30/2021 14:53:43 - INFO - __main__ - Step 9672: {'lr': 0.0004966930281641423, 'samples': 1857024, 'steps': 9671, 'loss/train': 3.4267959594726562} -08/30/2021 14:53:43 - INFO - __main__ - Step 9673: {'lr': 0.0004966921678134879, 'samples': 1857216, 'steps': 9672, 'loss/train': 1.9703158140182495} -08/30/2021 14:53:44 - INFO - __main__ - Step 9674: {'lr': 0.0004966913073516777, 'samples': 1857408, 'steps': 9673, 'loss/train': 2.0359699726104736} -08/30/2021 14:53:44 - INFO - __main__ - Step 9675: {'lr': 0.0004966904467787123, 'samples': 1857600, 'steps': 9674, 'loss/train': 2.0441136360168457} -08/30/2021 14:53:44 - INFO - __main__ - Step 9676: {'lr': 0.0004966895860945918, 'samples': 1857792, 'steps': 9675, 'loss/train': 2.440521717071533} -08/30/2021 14:53:46 - INFO - __main__ - Step 9677: {'lr': 0.0004966887252993169, 'samples': 1857984, 'steps': 9676, 'loss/train': 1.7095386981964111} -08/30/2021 14:53:47 - INFO - __main__ - Step 9678: {'lr': 0.0004966878643928879, 'samples': 1858176, 'steps': 9677, 'loss/train': 1.8088562488555908} -08/30/2021 14:53:47 - INFO - __main__ - Step 9679: {'lr': 0.0004966870033753051, 'samples': 1858368, 'steps': 9678, 'loss/train': 2.0200352668762207} -08/30/2021 14:53:47 - INFO - __main__ - Step 9680: {'lr': 0.0004966861422465689, 'samples': 1858560, 'steps': 9679, 'loss/train': 0.2883291244506836} -08/30/2021 14:53:48 - INFO - __main__ - Step 9681: {'lr': 0.0004966852810066798, 'samples': 1858752, 'steps': 9680, 'loss/train': 2.0641093254089355} -08/30/2021 14:53:49 - INFO - __main__ - Step 9682: {'lr': 0.0004966844196556382, 'samples': 1858944, 'steps': 9681, 'loss/train': 1.7363930940628052} -08/30/2021 14:53:50 - INFO - __main__ - Step 9683: {'lr': 0.0004966835581934442, 'samples': 1859136, 'steps': 9682, 'loss/train': 1.9491764307022095} -08/30/2021 14:53:50 - INFO - __main__ - Step 9684: {'lr': 0.0004966826966200985, 'samples': 1859328, 'steps': 9683, 'loss/train': 1.997516393661499} -08/30/2021 14:53:50 - INFO - __main__ - Step 9685: {'lr': 0.0004966818349356015, 'samples': 1859520, 'steps': 9684, 'loss/train': 2.0222957134246826} -08/30/2021 14:53:51 - INFO - __main__ - Step 9686: {'lr': 0.0004966809731399533, 'samples': 1859712, 'steps': 9685, 'loss/train': 1.3625972270965576} -08/30/2021 14:53:52 - INFO - __main__ - Step 9687: {'lr': 0.0004966801112331545, 'samples': 1859904, 'steps': 9686, 'loss/train': 1.7286548614501953} -08/30/2021 14:53:53 - INFO - __main__ - Step 9688: {'lr': 0.0004966792492152054, 'samples': 1860096, 'steps': 9687, 'loss/train': 1.8468976020812988} -08/30/2021 14:53:53 - INFO - __main__ - Step 9689: {'lr': 0.0004966783870861066, 'samples': 1860288, 'steps': 9688, 'loss/train': 2.112144947052002} -08/30/2021 14:53:54 - INFO - __main__ - Step 9690: {'lr': 0.0004966775248458582, 'samples': 1860480, 'steps': 9689, 'loss/train': 1.7111119031906128} -08/30/2021 14:53:54 - INFO - __main__ - Step 9691: {'lr': 0.0004966766624944607, 'samples': 1860672, 'steps': 9690, 'loss/train': 1.796911597251892} -08/30/2021 14:53:54 - INFO - __main__ - Step 9692: {'lr': 0.0004966758000319147, 'samples': 1860864, 'steps': 9691, 'loss/train': 2.128903865814209} -08/30/2021 14:53:57 - INFO - __main__ - Step 9693: {'lr': 0.0004966749374582202, 'samples': 1861056, 'steps': 9692, 'loss/train': 1.1706323623657227} -08/30/2021 14:53:57 - INFO - __main__ - Step 9694: {'lr': 0.0004966740747733778, 'samples': 1861248, 'steps': 9693, 'loss/train': 1.07637619972229} -08/30/2021 14:53:57 - INFO - __main__ - Step 9695: {'lr': 0.0004966732119773879, 'samples': 1861440, 'steps': 9694, 'loss/train': 0.9190359711647034} -08/30/2021 14:53:58 - INFO - __main__ - Step 9696: {'lr': 0.0004966723490702509, 'samples': 1861632, 'steps': 9695, 'loss/train': 1.8705346584320068} -08/30/2021 14:53:58 - INFO - __main__ - Step 9697: {'lr': 0.000496671486051967, 'samples': 1861824, 'steps': 9696, 'loss/train': 1.7523695230484009} -08/30/2021 14:54:00 - INFO - __main__ - Step 9698: {'lr': 0.0004966706229225368, 'samples': 1862016, 'steps': 9697, 'loss/train': 2.006720542907715} -08/30/2021 14:54:00 - INFO - __main__ - Step 9699: {'lr': 0.0004966697596819607, 'samples': 1862208, 'steps': 9698, 'loss/train': 1.9750852584838867} -08/30/2021 14:54:01 - INFO - __main__ - Step 9700: {'lr': 0.0004966688963302389, 'samples': 1862400, 'steps': 9699, 'loss/train': 2.217642307281494} -08/30/2021 14:54:01 - INFO - __main__ - Step 9701: {'lr': 0.000496668032867372, 'samples': 1862592, 'steps': 9700, 'loss/train': 2.213373899459839} -08/30/2021 14:54:01 - INFO - __main__ - Step 9702: {'lr': 0.0004966671692933603, 'samples': 1862784, 'steps': 9701, 'loss/train': 1.9149820804595947} -08/30/2021 14:54:03 - INFO - __main__ - Step 9703: {'lr': 0.0004966663056082041, 'samples': 1862976, 'steps': 9702, 'loss/train': 1.9143811464309692} -08/30/2021 14:54:03 - INFO - __main__ - Step 9704: {'lr': 0.0004966654418119039, 'samples': 1863168, 'steps': 9703, 'loss/train': 1.3695147037506104} -08/30/2021 14:54:04 - INFO - __main__ - Step 9705: {'lr': 0.00049666457790446, 'samples': 1863360, 'steps': 9704, 'loss/train': 2.261863946914673} -08/30/2021 14:54:04 - INFO - __main__ - Step 9706: {'lr': 0.000496663713885873, 'samples': 1863552, 'steps': 9705, 'loss/train': 1.9517362117767334} -08/30/2021 14:54:04 - INFO - __main__ - Step 9707: {'lr': 0.0004966628497561431, 'samples': 1863744, 'steps': 9706, 'loss/train': 2.2061758041381836} -08/30/2021 14:54:06 - INFO - __main__ - Step 9708: {'lr': 0.0004966619855152706, 'samples': 1863936, 'steps': 9707, 'loss/train': 1.8381626605987549} -08/30/2021 14:54:06 - INFO - __main__ - Step 9709: {'lr': 0.0004966611211632561, 'samples': 1864128, 'steps': 9708, 'loss/train': 3.0681979656219482} -08/30/2021 14:54:07 - INFO - __main__ - Step 9710: {'lr': 0.0004966602567000999, 'samples': 1864320, 'steps': 9709, 'loss/train': 1.9511271715164185} -08/30/2021 14:54:07 - INFO - __main__ - Step 9711: {'lr': 0.0004966593921258023, 'samples': 1864512, 'steps': 9710, 'loss/train': 2.433972120285034} -08/30/2021 14:54:07 - INFO - __main__ - Step 9712: {'lr': 0.000496658527440364, 'samples': 1864704, 'steps': 9711, 'loss/train': 1.9139094352722168} -08/30/2021 14:54:08 - INFO - __main__ - Step 9713: {'lr': 0.000496657662643785, 'samples': 1864896, 'steps': 9712, 'loss/train': 1.9728235006332397} -08/30/2021 14:54:09 - INFO - __main__ - Step 9714: {'lr': 0.000496656797736066, 'samples': 1865088, 'steps': 9713, 'loss/train': 2.6217501163482666} -08/30/2021 14:54:10 - INFO - __main__ - Step 9715: {'lr': 0.0004966559327172071, 'samples': 1865280, 'steps': 9714, 'loss/train': 2.076709270477295} -08/30/2021 14:54:10 - INFO - __main__ - Step 9716: {'lr': 0.0004966550675872089, 'samples': 1865472, 'steps': 9715, 'loss/train': 2.4587104320526123} -08/30/2021 14:54:10 - INFO - __main__ - Step 9717: {'lr': 0.0004966542023460718, 'samples': 1865664, 'steps': 9716, 'loss/train': 2.441128969192505} -08/30/2021 14:54:11 - INFO - __main__ - Step 9718: {'lr': 0.000496653336993796, 'samples': 1865856, 'steps': 9717, 'loss/train': 1.9450116157531738} -08/30/2021 14:54:12 - INFO - __main__ - Step 9719: {'lr': 0.0004966524715303821, 'samples': 1866048, 'steps': 9718, 'loss/train': 2.079266309738159} -08/30/2021 14:54:13 - INFO - __main__ - Step 9720: {'lr': 0.0004966516059558304, 'samples': 1866240, 'steps': 9719, 'loss/train': 1.6373075246810913} -08/30/2021 14:54:13 - INFO - __main__ - Step 9721: {'lr': 0.0004966507402701413, 'samples': 1866432, 'steps': 9720, 'loss/train': 1.7225592136383057} -08/30/2021 14:54:14 - INFO - __main__ - Step 9722: {'lr': 0.0004966498744733151, 'samples': 1866624, 'steps': 9721, 'loss/train': 2.1595609188079834} -08/30/2021 14:54:14 - INFO - __main__ - Step 9723: {'lr': 0.0004966490085653523, 'samples': 1866816, 'steps': 9722, 'loss/train': 1.6869670152664185} -08/30/2021 14:54:15 - INFO - __main__ - Step 9724: {'lr': 0.0004966481425462533, 'samples': 1867008, 'steps': 9723, 'loss/train': 0.24262908101081848} -08/30/2021 14:54:16 - INFO - __main__ - Step 9725: {'lr': 0.0004966472764160183, 'samples': 1867200, 'steps': 9724, 'loss/train': 1.9964102506637573} -08/30/2021 14:54:16 - INFO - __main__ - Step 9726: {'lr': 0.000496646410174648, 'samples': 1867392, 'steps': 9725, 'loss/train': 4.726476669311523} -08/30/2021 14:54:17 - INFO - __main__ - Step 9727: {'lr': 0.0004966455438221427, 'samples': 1867584, 'steps': 9726, 'loss/train': 1.2921795845031738} -08/30/2021 14:54:17 - INFO - __main__ - Step 9728: {'lr': 0.0004966446773585026, 'samples': 1867776, 'steps': 9727, 'loss/train': 2.107571840286255} -08/30/2021 14:54:18 - INFO - __main__ - Step 9729: {'lr': 0.0004966438107837283, 'samples': 1867968, 'steps': 9728, 'loss/train': 6.637866973876953} -08/30/2021 14:54:19 - INFO - __main__ - Step 9730: {'lr': 0.00049664294409782, 'samples': 1868160, 'steps': 9729, 'loss/train': 2.1792266368865967} -08/30/2021 14:54:19 - INFO - __main__ - Step 9731: {'lr': 0.0004966420773007782, 'samples': 1868352, 'steps': 9730, 'loss/train': 1.0178474187850952} -08/30/2021 14:54:20 - INFO - __main__ - Step 9732: {'lr': 0.0004966412103926034, 'samples': 1868544, 'steps': 9731, 'loss/train': 1.7584015130996704} -08/30/2021 14:54:20 - INFO - __main__ - Step 9733: {'lr': 0.0004966403433732958, 'samples': 1868736, 'steps': 9732, 'loss/train': 1.9877625703811646} -08/30/2021 14:54:22 - INFO - __main__ - Step 9734: {'lr': 0.0004966394762428559, 'samples': 1868928, 'steps': 9733, 'loss/train': 1.9409760236740112} -08/30/2021 14:54:22 - INFO - __main__ - Step 9735: {'lr': 0.0004966386090012841, 'samples': 1869120, 'steps': 9734, 'loss/train': 1.9843204021453857} -08/30/2021 14:54:22 - INFO - __main__ - Step 9736: {'lr': 0.0004966377416485806, 'samples': 1869312, 'steps': 9735, 'loss/train': 1.9466495513916016} -08/30/2021 14:54:23 - INFO - __main__ - Step 9737: {'lr': 0.0004966368741847461, 'samples': 1869504, 'steps': 9736, 'loss/train': 1.8497463464736938} -08/30/2021 14:54:23 - INFO - __main__ - Step 9738: {'lr': 0.0004966360066097807, 'samples': 1869696, 'steps': 9737, 'loss/train': 1.6434361934661865} -08/30/2021 14:54:23 - INFO - __main__ - Step 9739: {'lr': 0.0004966351389236851, 'samples': 1869888, 'steps': 9738, 'loss/train': 0.1551797240972519} -08/30/2021 14:54:25 - INFO - __main__ - Step 9740: {'lr': 0.0004966342711264593, 'samples': 1870080, 'steps': 9739, 'loss/train': 0.14922592043876648} -08/30/2021 14:54:25 - INFO - __main__ - Step 9741: {'lr': 0.000496633403218104, 'samples': 1870272, 'steps': 9740, 'loss/train': 1.4524890184402466} -08/30/2021 14:54:26 - INFO - __main__ - Step 9742: {'lr': 0.0004966325351986195, 'samples': 1870464, 'steps': 9741, 'loss/train': 1.8672969341278076} -08/30/2021 14:54:26 - INFO - __main__ - Step 9743: {'lr': 0.0004966316670680062, 'samples': 1870656, 'steps': 9742, 'loss/train': 1.6861193180084229} -08/30/2021 14:54:26 - INFO - __main__ - Step 9744: {'lr': 0.0004966307988262644, 'samples': 1870848, 'steps': 9743, 'loss/train': 2.0013606548309326} -08/30/2021 14:54:28 - INFO - __main__ - Step 9745: {'lr': 0.0004966299304733947, 'samples': 1871040, 'steps': 9744, 'loss/train': 2.092226028442383} -08/30/2021 14:54:29 - INFO - __main__ - Step 9746: {'lr': 0.0004966290620093972, 'samples': 1871232, 'steps': 9745, 'loss/train': 2.124173879623413} -08/30/2021 14:54:29 - INFO - __main__ - Step 9747: {'lr': 0.0004966281934342725, 'samples': 1871424, 'steps': 9746, 'loss/train': 1.5140055418014526} -08/30/2021 14:54:29 - INFO - __main__ - Step 9748: {'lr': 0.000496627324748021, 'samples': 1871616, 'steps': 9747, 'loss/train': 1.7213398218154907} -08/30/2021 14:54:30 - INFO - __main__ - Step 9749: {'lr': 0.000496626455950643, 'samples': 1871808, 'steps': 9748, 'loss/train': 1.8757199048995972} -08/30/2021 14:54:32 - INFO - __main__ - Step 9750: {'lr': 0.000496625587042139, 'samples': 1872000, 'steps': 9749, 'loss/train': 1.5113251209259033} -08/30/2021 14:54:32 - INFO - __main__ - Step 9751: {'lr': 0.0004966247180225092, 'samples': 1872192, 'steps': 9750, 'loss/train': 1.7895302772521973} -08/30/2021 14:54:32 - INFO - __main__ - Step 9752: {'lr': 0.0004966238488917542, 'samples': 1872384, 'steps': 9751, 'loss/train': 1.876662254333496} -08/30/2021 14:54:33 - INFO - __main__ - Step 9753: {'lr': 0.0004966229796498742, 'samples': 1872576, 'steps': 9752, 'loss/train': 1.9065462350845337} -08/30/2021 14:54:33 - INFO - __main__ - Step 9754: {'lr': 0.0004966221102968698, 'samples': 1872768, 'steps': 9753, 'loss/train': 1.8621559143066406} -08/30/2021 14:54:33 - INFO - __main__ - Step 9755: {'lr': 0.0004966212408327412, 'samples': 1872960, 'steps': 9754, 'loss/train': 1.696763038635254} -08/30/2021 14:54:35 - INFO - __main__ - Step 9756: {'lr': 0.0004966203712574889, 'samples': 1873152, 'steps': 9755, 'loss/train': 1.6754891872406006} -08/30/2021 14:54:35 - INFO - __main__ - Step 9757: {'lr': 0.0004966195015711132, 'samples': 1873344, 'steps': 9756, 'loss/train': 2.2423617839813232} -08/30/2021 14:54:36 - INFO - __main__ - Step 9758: {'lr': 0.0004966186317736146, 'samples': 1873536, 'steps': 9757, 'loss/train': 2.1737141609191895} -08/30/2021 14:54:36 - INFO - __main__ - Step 9759: {'lr': 0.0004966177618649935, 'samples': 1873728, 'steps': 9758, 'loss/train': 1.8301485776901245} -08/30/2021 14:54:36 - INFO - __main__ - Step 9760: {'lr': 0.0004966168918452503, 'samples': 1873920, 'steps': 9759, 'loss/train': 1.9839552640914917} -08/30/2021 14:54:38 - INFO - __main__ - Step 9761: {'lr': 0.0004966160217143852, 'samples': 1874112, 'steps': 9760, 'loss/train': 1.8732393980026245} -08/30/2021 14:54:38 - INFO - __main__ - Step 9762: {'lr': 0.0004966151514723988, 'samples': 1874304, 'steps': 9761, 'loss/train': 1.56182062625885} -08/30/2021 14:54:39 - INFO - __main__ - Step 9763: {'lr': 0.0004966142811192914, 'samples': 1874496, 'steps': 9762, 'loss/train': 1.9897133111953735} -08/30/2021 14:54:39 - INFO - __main__ - Step 9764: {'lr': 0.0004966134106550634, 'samples': 1874688, 'steps': 9763, 'loss/train': 1.981635332107544} -08/30/2021 14:54:40 - INFO - __main__ - Step 9765: {'lr': 0.0004966125400797152, 'samples': 1874880, 'steps': 9764, 'loss/train': 1.4501882791519165} -08/30/2021 14:54:41 - INFO - __main__ - Step 9766: {'lr': 0.0004966116693932472, 'samples': 1875072, 'steps': 9765, 'loss/train': 1.7068828344345093} -08/30/2021 14:54:42 - INFO - __main__ - Step 9767: {'lr': 0.0004966107985956598, 'samples': 1875264, 'steps': 9766, 'loss/train': 2.004703998565674} -08/30/2021 14:54:42 - INFO - __main__ - Step 9768: {'lr': 0.0004966099276869534, 'samples': 1875456, 'steps': 9767, 'loss/train': 1.7816212177276611} -08/30/2021 14:54:42 - INFO - __main__ - Step 9769: {'lr': 0.0004966090566671283, 'samples': 1875648, 'steps': 9768, 'loss/train': 1.9179739952087402} -08/30/2021 14:54:43 - INFO - __main__ - Step 9770: {'lr': 0.000496608185536185, 'samples': 1875840, 'steps': 9769, 'loss/train': 2.208346366882324} -08/30/2021 14:54:44 - INFO - __main__ - Step 9771: {'lr': 0.0004966073142941239, 'samples': 1876032, 'steps': 9770, 'loss/train': 2.0073368549346924} -08/30/2021 14:54:45 - INFO - __main__ - Step 9772: {'lr': 0.0004966064429409452, 'samples': 1876224, 'steps': 9771, 'loss/train': 1.1819682121276855} -08/30/2021 14:54:45 - INFO - __main__ - Step 9773: {'lr': 0.0004966055714766496, 'samples': 1876416, 'steps': 9772, 'loss/train': 2.517453670501709} -08/30/2021 14:54:45 - INFO - __main__ - Step 9774: {'lr': 0.0004966046999012373, 'samples': 1876608, 'steps': 9773, 'loss/train': 1.1560664176940918} -08/30/2021 14:54:46 - INFO - __main__ - Step 9775: {'lr': 0.0004966038282147087, 'samples': 1876800, 'steps': 9774, 'loss/train': 1.7246750593185425} -08/30/2021 14:54:47 - INFO - __main__ - Step 9776: {'lr': 0.0004966029564170643, 'samples': 1876992, 'steps': 9775, 'loss/train': 1.8625199794769287} -08/30/2021 14:54:48 - INFO - __main__ - Step 9777: {'lr': 0.0004966020845083044, 'samples': 1877184, 'steps': 9776, 'loss/train': 1.667828917503357} -08/30/2021 14:54:48 - INFO - __main__ - Step 9778: {'lr': 0.0004966012124884292, 'samples': 1877376, 'steps': 9777, 'loss/train': 1.385165810585022} -08/30/2021 14:54:48 - INFO - __main__ - Step 9779: {'lr': 0.0004966003403574395, 'samples': 1877568, 'steps': 9778, 'loss/train': 2.03983998298645} -08/30/2021 14:54:49 - INFO - __main__ - Step 9780: {'lr': 0.0004965994681153355, 'samples': 1877760, 'steps': 9779, 'loss/train': 2.0109755992889404} -08/30/2021 14:54:50 - INFO - __main__ - Step 9781: {'lr': 0.0004965985957621175, 'samples': 1877952, 'steps': 9780, 'loss/train': 2.1260452270507812} -08/30/2021 14:54:50 - INFO - __main__ - Step 9782: {'lr': 0.0004965977232977861, 'samples': 1878144, 'steps': 9781, 'loss/train': 1.8748568296432495} -08/30/2021 14:54:51 - INFO - __main__ - Step 9783: {'lr': 0.0004965968507223414, 'samples': 1878336, 'steps': 9782, 'loss/train': 2.1814732551574707} -08/30/2021 14:54:51 - INFO - __main__ - Step 9784: {'lr': 0.000496595978035784, 'samples': 1878528, 'steps': 9783, 'loss/train': 1.618996500968933} -08/30/2021 14:54:51 - INFO - __main__ - Step 9785: {'lr': 0.0004965951052381144, 'samples': 1878720, 'steps': 9784, 'loss/train': 2.164748191833496} -08/30/2021 14:54:53 - INFO - __main__ - Step 9786: {'lr': 0.0004965942323293328, 'samples': 1878912, 'steps': 9785, 'loss/train': 1.624773621559143} -08/30/2021 14:54:53 - INFO - __main__ - Step 9787: {'lr': 0.0004965933593094395, 'samples': 1879104, 'steps': 9786, 'loss/train': 2.1712048053741455} -08/30/2021 14:54:54 - INFO - __main__ - Step 9788: {'lr': 0.0004965924861784352, 'samples': 1879296, 'steps': 9787, 'loss/train': 1.660886526107788} -08/30/2021 14:54:54 - INFO - __main__ - Step 9789: {'lr': 0.0004965916129363201, 'samples': 1879488, 'steps': 9788, 'loss/train': 1.4098634719848633} -08/30/2021 14:54:55 - INFO - __main__ - Step 9790: {'lr': 0.0004965907395830945, 'samples': 1879680, 'steps': 9789, 'loss/train': 1.5025256872177124} -08/30/2021 14:54:56 - INFO - __main__ - Step 9791: {'lr': 0.000496589866118759, 'samples': 1879872, 'steps': 9790, 'loss/train': 1.7650216817855835} -08/30/2021 14:54:56 - INFO - __main__ - Step 9792: {'lr': 0.000496588992543314, 'samples': 1880064, 'steps': 9791, 'loss/train': 1.3867985010147095} -08/30/2021 14:54:57 - INFO - __main__ - Step 9793: {'lr': 0.0004965881188567597, 'samples': 1880256, 'steps': 9792, 'loss/train': 1.0742295980453491} -08/30/2021 14:54:57 - INFO - __main__ - Step 9794: {'lr': 0.0004965872450590965, 'samples': 1880448, 'steps': 9793, 'loss/train': 2.1396424770355225} -08/30/2021 14:54:58 - INFO - __main__ - Step 9795: {'lr': 0.0004965863711503251, 'samples': 1880640, 'steps': 9794, 'loss/train': 1.7687004804611206} -08/30/2021 14:54:58 - INFO - __main__ - Step 9796: {'lr': 0.0004965854971304457, 'samples': 1880832, 'steps': 9795, 'loss/train': 1.7895843982696533} -08/30/2021 14:54:59 - INFO - __main__ - Step 9797: {'lr': 0.0004965846229994586, 'samples': 1881024, 'steps': 9796, 'loss/train': 1.84823477268219} -08/30/2021 14:55:00 - INFO - __main__ - Step 9798: {'lr': 0.0004965837487573641, 'samples': 1881216, 'steps': 9797, 'loss/train': 1.886412501335144} -08/30/2021 14:55:00 - INFO - __main__ - Step 9799: {'lr': 0.000496582874404163, 'samples': 1881408, 'steps': 9798, 'loss/train': 1.9770792722702026} -08/30/2021 14:55:01 - INFO - __main__ - Step 9800: {'lr': 0.0004965819999398554, 'samples': 1881600, 'steps': 9799, 'loss/train': 2.7488694190979004} -08/30/2021 14:55:01 - INFO - __main__ - Step 9801: {'lr': 0.0004965811253644418, 'samples': 1881792, 'steps': 9800, 'loss/train': 2.4854705333709717} -08/30/2021 14:55:03 - INFO - __main__ - Step 9802: {'lr': 0.0004965802506779225, 'samples': 1881984, 'steps': 9801, 'loss/train': 1.3518996238708496} -08/30/2021 14:55:04 - INFO - __main__ - Step 9803: {'lr': 0.0004965793758802978, 'samples': 1882176, 'steps': 9802, 'loss/train': 1.8334020376205444} -08/30/2021 14:55:04 - INFO - __main__ - Step 9804: {'lr': 0.0004965785009715684, 'samples': 1882368, 'steps': 9803, 'loss/train': 1.8531948328018188} -08/30/2021 14:55:04 - INFO - __main__ - Step 9805: {'lr': 0.0004965776259517345, 'samples': 1882560, 'steps': 9804, 'loss/train': 1.7855840921401978} -08/30/2021 14:55:05 - INFO - __main__ - Step 9806: {'lr': 0.0004965767508207966, 'samples': 1882752, 'steps': 9805, 'loss/train': 2.297307014465332} -08/30/2021 14:55:06 - INFO - __main__ - Step 9807: {'lr': 0.000496575875578755, 'samples': 1882944, 'steps': 9806, 'loss/train': 1.3045541048049927} -08/30/2021 14:55:07 - INFO - __main__ - Step 9808: {'lr': 0.00049657500022561, 'samples': 1883136, 'steps': 9807, 'loss/train': 1.8016923666000366} -08/30/2021 14:55:07 - INFO - __main__ - Step 9809: {'lr': 0.0004965741247613622, 'samples': 1883328, 'steps': 9808, 'loss/train': 2.0325369834899902} -08/30/2021 14:55:07 - INFO - __main__ - Step 9810: {'lr': 0.0004965732491860119, 'samples': 1883520, 'steps': 9809, 'loss/train': 2.054710626602173} -08/30/2021 14:55:08 - INFO - __main__ - Step 9811: {'lr': 0.0004965723734995594, 'samples': 1883712, 'steps': 9810, 'loss/train': 1.7265582084655762} -08/30/2021 14:55:08 - INFO - __main__ - Step 9812: {'lr': 0.0004965714977020053, 'samples': 1883904, 'steps': 9811, 'loss/train': 2.0104353427886963} -08/30/2021 14:55:10 - INFO - __main__ - Step 9813: {'lr': 0.0004965706217933499, 'samples': 1884096, 'steps': 9812, 'loss/train': 1.5940203666687012} -08/30/2021 14:55:10 - INFO - __main__ - Step 9814: {'lr': 0.0004965697457735936, 'samples': 1884288, 'steps': 9813, 'loss/train': 1.9238561391830444} -08/30/2021 14:55:11 - INFO - __main__ - Step 9815: {'lr': 0.0004965688696427366, 'samples': 1884480, 'steps': 9814, 'loss/train': 1.7064625024795532} -08/30/2021 14:55:11 - INFO - __main__ - Step 9816: {'lr': 0.0004965679934007797, 'samples': 1884672, 'steps': 9815, 'loss/train': 1.8641884326934814} -08/30/2021 14:55:11 - INFO - __main__ - Step 9817: {'lr': 0.0004965671170477229, 'samples': 1884864, 'steps': 9816, 'loss/train': 0.137808158993721} -08/30/2021 14:55:13 - INFO - __main__ - Step 9818: {'lr': 0.0004965662405835668, 'samples': 1885056, 'steps': 9817, 'loss/train': 1.7908711433410645} -08/30/2021 14:55:13 - INFO - __main__ - Step 9819: {'lr': 0.0004965653640083118, 'samples': 1885248, 'steps': 9818, 'loss/train': 1.8567848205566406} -08/30/2021 14:55:14 - INFO - __main__ - Step 9820: {'lr': 0.0004965644873219583, 'samples': 1885440, 'steps': 9819, 'loss/train': 1.9928535223007202} -08/30/2021 14:55:14 - INFO - __main__ - Step 9821: {'lr': 0.0004965636105245066, 'samples': 1885632, 'steps': 9820, 'loss/train': 1.633752465248108} -08/30/2021 14:55:14 - INFO - __main__ - Step 9822: {'lr': 0.000496562733615957, 'samples': 1885824, 'steps': 9821, 'loss/train': 1.330245852470398} -08/30/2021 14:55:16 - INFO - __main__ - Step 9823: {'lr': 0.0004965618565963102, 'samples': 1886016, 'steps': 9822, 'loss/train': 1.980771780014038} -08/30/2021 14:55:16 - INFO - __main__ - Step 9824: {'lr': 0.0004965609794655664, 'samples': 1886208, 'steps': 9823, 'loss/train': 1.154754877090454} -08/30/2021 14:55:17 - INFO - __main__ - Step 9825: {'lr': 0.0004965601022237261, 'samples': 1886400, 'steps': 9824, 'loss/train': 1.9220635890960693} -08/30/2021 14:55:17 - INFO - __main__ - Step 9826: {'lr': 0.0004965592248707895, 'samples': 1886592, 'steps': 9825, 'loss/train': 1.9596201181411743} -08/30/2021 14:55:17 - INFO - __main__ - Step 9827: {'lr': 0.0004965583474067571, 'samples': 1886784, 'steps': 9826, 'loss/train': 1.6688120365142822} -08/30/2021 14:55:19 - INFO - __main__ - Step 9828: {'lr': 0.0004965574698316294, 'samples': 1886976, 'steps': 9827, 'loss/train': 1.6392722129821777} -08/30/2021 14:55:20 - INFO - __main__ - Step 9829: {'lr': 0.0004965565921454067, 'samples': 1887168, 'steps': 9828, 'loss/train': 1.8479280471801758} -08/30/2021 14:55:20 - INFO - __main__ - Step 9830: {'lr': 0.0004965557143480893, 'samples': 1887360, 'steps': 9829, 'loss/train': 2.1281254291534424} -08/30/2021 14:55:20 - INFO - __main__ - Step 9831: {'lr': 0.0004965548364396779, 'samples': 1887552, 'steps': 9830, 'loss/train': 1.7769168615341187} -08/30/2021 14:55:21 - INFO - __main__ - Step 9832: {'lr': 0.0004965539584201725, 'samples': 1887744, 'steps': 9831, 'loss/train': 2.1063497066497803} -08/30/2021 14:55:22 - INFO - __main__ - Step 9833: {'lr': 0.0004965530802895738, 'samples': 1887936, 'steps': 9832, 'loss/train': 2.6677818298339844} -08/30/2021 14:55:23 - INFO - __main__ - Step 9834: {'lr': 0.000496552202047882, 'samples': 1888128, 'steps': 9833, 'loss/train': 1.7689239978790283} -08/30/2021 14:55:23 - INFO - __main__ - Step 9835: {'lr': 0.0004965513236950977, 'samples': 1888320, 'steps': 9834, 'loss/train': 1.2834495306015015} -08/30/2021 14:55:23 - INFO - __main__ - Step 9836: {'lr': 0.0004965504452312211, 'samples': 1888512, 'steps': 9835, 'loss/train': 2.4768779277801514} -08/30/2021 14:55:24 - INFO - __main__ - Step 9837: {'lr': 0.0004965495666562527, 'samples': 1888704, 'steps': 9836, 'loss/train': 2.052020788192749} -08/30/2021 14:55:25 - INFO - __main__ - Step 9838: {'lr': 0.0004965486879701928, 'samples': 1888896, 'steps': 9837, 'loss/train': 1.5721266269683838} -08/30/2021 14:55:26 - INFO - __main__ - Step 9839: {'lr': 0.000496547809173042, 'samples': 1889088, 'steps': 9838, 'loss/train': 1.5373854637145996} -08/30/2021 14:55:26 - INFO - __main__ - Step 9840: {'lr': 0.0004965469302648005, 'samples': 1889280, 'steps': 9839, 'loss/train': 1.5755141973495483} -08/30/2021 14:55:26 - INFO - __main__ - Step 9841: {'lr': 0.0004965460512454688, 'samples': 1889472, 'steps': 9840, 'loss/train': 2.2881150245666504} -08/30/2021 14:55:27 - INFO - __main__ - Step 9842: {'lr': 0.0004965451721150471, 'samples': 1889664, 'steps': 9841, 'loss/train': 1.7578301429748535} -08/30/2021 14:55:27 - INFO - __main__ - Step 9843: {'lr': 0.0004965442928735361, 'samples': 1889856, 'steps': 9842, 'loss/train': 1.351906418800354} -08/30/2021 14:55:29 - INFO - __main__ - Step 9844: {'lr': 0.000496543413520936, 'samples': 1890048, 'steps': 9843, 'loss/train': 1.3496830463409424} -08/30/2021 14:55:29 - INFO - __main__ - Step 9845: {'lr': 0.0004965425340572472, 'samples': 1890240, 'steps': 9844, 'loss/train': 2.4627909660339355} -08/30/2021 14:55:29 - INFO - __main__ - Step 9846: {'lr': 0.0004965416544824703, 'samples': 1890432, 'steps': 9845, 'loss/train': 2.1591267585754395} -08/30/2021 14:55:30 - INFO - __main__ - Step 9847: {'lr': 0.0004965407747966053, 'samples': 1890624, 'steps': 9846, 'loss/train': 1.8776334524154663} -08/30/2021 14:55:30 - INFO - __main__ - Step 9848: {'lr': 0.000496539894999653, 'samples': 1890816, 'steps': 9847, 'loss/train': 2.76639461517334} -08/30/2021 14:55:32 - INFO - __main__ - Step 9849: {'lr': 0.0004965390150916136, 'samples': 1891008, 'steps': 9848, 'loss/train': 1.2349870204925537} -08/30/2021 14:55:32 - INFO - __main__ - Step 9850: {'lr': 0.0004965381350724874, 'samples': 1891200, 'steps': 9849, 'loss/train': 1.6132527589797974} -08/30/2021 14:55:32 - INFO - __main__ - Step 9851: {'lr': 0.000496537254942275, 'samples': 1891392, 'steps': 9850, 'loss/train': 1.6223324537277222} -08/30/2021 14:55:33 - INFO - __main__ - Step 9852: {'lr': 0.0004965363747009767, 'samples': 1891584, 'steps': 9851, 'loss/train': 0.2330079823732376} -08/30/2021 14:55:33 - INFO - __main__ - Step 9853: {'lr': 0.000496535494348593, 'samples': 1891776, 'steps': 9852, 'loss/train': 1.5762956142425537} -08/30/2021 14:55:35 - INFO - __main__ - Step 9854: {'lr': 0.0004965346138851241, 'samples': 1891968, 'steps': 9853, 'loss/train': 1.8432313203811646} -08/30/2021 14:55:36 - INFO - __main__ - Step 9855: {'lr': 0.0004965337333105706, 'samples': 1892160, 'steps': 9854, 'loss/train': 2.1151010990142822} -08/30/2021 14:55:36 - INFO - __main__ - Step 9856: {'lr': 0.0004965328526249328, 'samples': 1892352, 'steps': 9855, 'loss/train': 1.7464637756347656} -08/30/2021 14:55:36 - INFO - __main__ - Step 9857: {'lr': 0.000496531971828211, 'samples': 1892544, 'steps': 9856, 'loss/train': 1.6803183555603027} -08/30/2021 14:55:37 - INFO - __main__ - Step 9858: {'lr': 0.0004965310909204058, 'samples': 1892736, 'steps': 9857, 'loss/train': 1.2403587102890015} -08/30/2021 14:55:39 - INFO - __main__ - Step 9859: {'lr': 0.0004965302099015175, 'samples': 1892928, 'steps': 9858, 'loss/train': 2.3438684940338135} -08/30/2021 14:55:39 - INFO - __main__ - Step 9860: {'lr': 0.0004965293287715464, 'samples': 1893120, 'steps': 9859, 'loss/train': 1.7576836347579956} -08/30/2021 14:55:40 - INFO - __main__ - Step 9861: {'lr': 0.0004965284475304931, 'samples': 1893312, 'steps': 9860, 'loss/train': 1.1783772706985474} -08/30/2021 14:55:40 - INFO - __main__ - Step 9862: {'lr': 0.0004965275661783579, 'samples': 1893504, 'steps': 9861, 'loss/train': 0.9311202168464661} -08/30/2021 14:55:41 - INFO - __main__ - Step 9863: {'lr': 0.0004965266847151411, 'samples': 1893696, 'steps': 9862, 'loss/train': 1.0494866371154785} -08/30/2021 14:55:41 - INFO - __main__ - Step 9864: {'lr': 0.0004965258031408432, 'samples': 1893888, 'steps': 9863, 'loss/train': 0.23961587250232697} -08/30/2021 14:55:41 - INFO - __main__ - Step 9865: {'lr': 0.0004965249214554645, 'samples': 1894080, 'steps': 9864, 'loss/train': 1.5181031227111816} -08/30/2021 14:55:43 - INFO - __main__ - Step 9866: {'lr': 0.0004965240396590055, 'samples': 1894272, 'steps': 9865, 'loss/train': 2.282358407974243} -08/30/2021 14:55:43 - INFO - __main__ - Step 9867: {'lr': 0.0004965231577514666, 'samples': 1894464, 'steps': 9866, 'loss/train': 1.474616527557373} -08/30/2021 14:55:44 - INFO - __main__ - Step 9868: {'lr': 0.0004965222757328482, 'samples': 1894656, 'steps': 9867, 'loss/train': 1.6655150651931763} -08/30/2021 14:55:44 - INFO - __main__ - Step 9869: {'lr': 0.0004965213936031507, 'samples': 1894848, 'steps': 9868, 'loss/train': 1.9786831140518188} -08/30/2021 14:55:44 - INFO - __main__ - Step 9870: {'lr': 0.0004965205113623744, 'samples': 1895040, 'steps': 9869, 'loss/train': 1.7262904644012451} -08/30/2021 14:55:46 - INFO - __main__ - Step 9871: {'lr': 0.0004965196290105197, 'samples': 1895232, 'steps': 9870, 'loss/train': 2.089165210723877} -08/30/2021 14:55:46 - INFO - __main__ - Step 9872: {'lr': 0.0004965187465475873, 'samples': 1895424, 'steps': 9871, 'loss/train': 2.1268012523651123} -08/30/2021 14:55:47 - INFO - __main__ - Step 9873: {'lr': 0.0004965178639735772, 'samples': 1895616, 'steps': 9872, 'loss/train': 1.8712267875671387} -08/30/2021 14:55:47 - INFO - __main__ - Step 9874: {'lr': 0.0004965169812884898, 'samples': 1895808, 'steps': 9873, 'loss/train': 2.069993734359741} -08/30/2021 14:55:47 - INFO - __main__ - Step 9875: {'lr': 0.0004965160984923259, 'samples': 1896000, 'steps': 9874, 'loss/train': 1.7645589113235474} -08/30/2021 14:55:49 - INFO - __main__ - Step 9876: {'lr': 0.0004965152155850855, 'samples': 1896192, 'steps': 9875, 'loss/train': 1.3823093175888062} -08/30/2021 14:55:49 - INFO - __main__ - Step 9877: {'lr': 0.0004965143325667692, 'samples': 1896384, 'steps': 9876, 'loss/train': 2.205920696258545} -08/30/2021 14:55:50 - INFO - __main__ - Step 9878: {'lr': 0.0004965134494373773, 'samples': 1896576, 'steps': 9877, 'loss/train': 2.026207208633423} -08/30/2021 14:55:50 - INFO - __main__ - Step 9879: {'lr': 0.0004965125661969103, 'samples': 1896768, 'steps': 9878, 'loss/train': 2.5216455459594727} -08/30/2021 14:55:50 - INFO - __main__ - Step 9880: {'lr': 0.0004965116828453685, 'samples': 1896960, 'steps': 9879, 'loss/train': 1.4107859134674072} -08/30/2021 14:55:52 - INFO - __main__ - Step 9881: {'lr': 0.0004965107993827524, 'samples': 1897152, 'steps': 9880, 'loss/train': 0.6729925870895386} -08/30/2021 14:55:52 - INFO - __main__ - Step 9882: {'lr': 0.0004965099158090624, 'samples': 1897344, 'steps': 9881, 'loss/train': 2.0988662242889404} -08/30/2021 14:55:53 - INFO - __main__ - Step 9883: {'lr': 0.0004965090321242987, 'samples': 1897536, 'steps': 9882, 'loss/train': 2.131324052810669} -08/30/2021 14:55:53 - INFO - __main__ - Step 9884: {'lr': 0.0004965081483284618, 'samples': 1897728, 'steps': 9883, 'loss/train': 1.6686666011810303} -08/30/2021 14:55:53 - INFO - __main__ - Step 9885: {'lr': 0.0004965072644215522, 'samples': 1897920, 'steps': 9884, 'loss/train': 1.809524655342102} -08/30/2021 14:55:55 - INFO - __main__ - Step 9886: {'lr': 0.0004965063804035703, 'samples': 1898112, 'steps': 9885, 'loss/train': 1.9635182619094849} -08/30/2021 14:55:55 - INFO - __main__ - Step 9887: {'lr': 0.0004965054962745163, 'samples': 1898304, 'steps': 9886, 'loss/train': 2.151871681213379} -08/30/2021 14:55:56 - INFO - __main__ - Step 9888: {'lr': 0.0004965046120343908, 'samples': 1898496, 'steps': 9887, 'loss/train': 1.6386842727661133} -08/30/2021 14:55:56 - INFO - __main__ - Step 9889: {'lr': 0.0004965037276831942, 'samples': 1898688, 'steps': 9888, 'loss/train': 0.20835186541080475} -08/30/2021 14:55:56 - INFO - __main__ - Step 9890: {'lr': 0.0004965028432209267, 'samples': 1898880, 'steps': 9889, 'loss/train': 1.7828727960586548} -08/30/2021 14:55:58 - INFO - __main__ - Step 9891: {'lr': 0.0004965019586475888, 'samples': 1899072, 'steps': 9890, 'loss/train': 2.0863196849823} -08/30/2021 14:55:58 - INFO - __main__ - Step 9892: {'lr': 0.000496501073963181, 'samples': 1899264, 'steps': 9891, 'loss/train': 1.5739202499389648} -08/30/2021 14:55:59 - INFO - __main__ - Step 9893: {'lr': 0.0004965001891677037, 'samples': 1899456, 'steps': 9892, 'loss/train': 1.9914906024932861} -08/30/2021 14:55:59 - INFO - __main__ - Step 9894: {'lr': 0.000496499304261157, 'samples': 1899648, 'steps': 9893, 'loss/train': 1.992610216140747} -08/30/2021 14:56:00 - INFO - __main__ - Step 9895: {'lr': 0.0004964984192435417, 'samples': 1899840, 'steps': 9894, 'loss/train': 1.7929564714431763} -08/30/2021 14:56:00 - INFO - __main__ - Step 9896: {'lr': 0.000496497534114858, 'samples': 1900032, 'steps': 9895, 'loss/train': 1.3171859979629517} -08/30/2021 14:56:02 - INFO - __main__ - Step 9897: {'lr': 0.0004964966488751062, 'samples': 1900224, 'steps': 9896, 'loss/train': 1.057159423828125} -08/30/2021 14:56:02 - INFO - __main__ - Step 9898: {'lr': 0.000496495763524287, 'samples': 1900416, 'steps': 9897, 'loss/train': 2.5412673950195312} -08/30/2021 14:56:03 - INFO - __main__ - Step 9899: {'lr': 0.0004964948780624005, 'samples': 1900608, 'steps': 9898, 'loss/train': 1.423126220703125} -08/30/2021 14:56:03 - INFO - __main__ - Step 9900: {'lr': 0.0004964939924894472, 'samples': 1900800, 'steps': 9899, 'loss/train': 0.8339024186134338} -08/30/2021 14:56:03 - INFO - __main__ - Step 9901: {'lr': 0.0004964931068054274, 'samples': 1900992, 'steps': 9900, 'loss/train': 1.9488730430603027} -08/30/2021 14:56:04 - INFO - __main__ - Step 9902: {'lr': 0.0004964922210103418, 'samples': 1901184, 'steps': 9901, 'loss/train': 1.639295220375061} -08/30/2021 14:56:05 - INFO - __main__ - Step 9903: {'lr': 0.0004964913351041905, 'samples': 1901376, 'steps': 9902, 'loss/train': 1.8759537935256958} -08/30/2021 14:56:06 - INFO - __main__ - Step 9904: {'lr': 0.000496490449086974, 'samples': 1901568, 'steps': 9903, 'loss/train': 2.187781572341919} -08/30/2021 14:56:06 - INFO - __main__ - Step 9905: {'lr': 0.0004964895629586928, 'samples': 1901760, 'steps': 9904, 'loss/train': 1.7618857622146606} -08/30/2021 14:56:06 - INFO - __main__ - Step 9906: {'lr': 0.0004964886767193471, 'samples': 1901952, 'steps': 9905, 'loss/train': 0.11265911161899567} -08/30/2021 14:56:07 - INFO - __main__ - Step 9907: {'lr': 0.0004964877903689375, 'samples': 1902144, 'steps': 9906, 'loss/train': 1.943421483039856} -08/30/2021 14:56:09 - INFO - __main__ - Step 9908: {'lr': 0.0004964869039074643, 'samples': 1902336, 'steps': 9907, 'loss/train': 1.5840805768966675} -08/30/2021 14:56:09 - INFO - __main__ - Step 9909: {'lr': 0.000496486017334928, 'samples': 1902528, 'steps': 9908, 'loss/train': 1.8387268781661987} -08/30/2021 14:56:09 - INFO - __main__ - Step 9910: {'lr': 0.0004964851306513287, 'samples': 1902720, 'steps': 9909, 'loss/train': 2.056471824645996} -08/30/2021 14:56:10 - INFO - __main__ - Step 9911: {'lr': 0.0004964842438566671, 'samples': 1902912, 'steps': 9910, 'loss/train': 2.14296817779541} -08/30/2021 14:56:10 - INFO - __main__ - Step 9912: {'lr': 0.0004964833569509434, 'samples': 1903104, 'steps': 9911, 'loss/train': 0.1421142816543579} -08/30/2021 14:56:12 - INFO - __main__ - Step 9913: {'lr': 0.0004964824699341582, 'samples': 1903296, 'steps': 9912, 'loss/train': 1.7805852890014648} -08/30/2021 14:56:13 - INFO - __main__ - Step 9914: {'lr': 0.0004964815828063118, 'samples': 1903488, 'steps': 9913, 'loss/train': 1.9573044776916504} -08/30/2021 14:56:13 - INFO - __main__ - Step 9915: {'lr': 0.0004964806955674046, 'samples': 1903680, 'steps': 9914, 'loss/train': 1.6270732879638672} -08/30/2021 14:56:14 - INFO - __main__ - Step 9916: {'lr': 0.0004964798082174371, 'samples': 1903872, 'steps': 9915, 'loss/train': 1.7032448053359985} -08/30/2021 14:56:14 - INFO - __main__ - Step 9917: {'lr': 0.0004964789207564094, 'samples': 1904064, 'steps': 9916, 'loss/train': 6.233009338378906} -08/30/2021 14:56:16 - INFO - __main__ - Step 9918: {'lr': 0.0004964780331843223, 'samples': 1904256, 'steps': 9917, 'loss/train': 1.977447271347046} -08/30/2021 14:56:17 - INFO - __main__ - Step 9919: {'lr': 0.0004964771455011758, 'samples': 1904448, 'steps': 9918, 'loss/train': 1.8892210721969604} -08/30/2021 14:56:17 - INFO - __main__ - Step 9920: {'lr': 0.0004964762577069707, 'samples': 1904640, 'steps': 9919, 'loss/train': 0.3782086670398712} -08/30/2021 14:56:17 - INFO - __main__ - Step 9921: {'lr': 0.0004964753698017071, 'samples': 1904832, 'steps': 9920, 'loss/train': 1.2212785482406616} -08/30/2021 14:56:18 - INFO - __main__ - Step 9922: {'lr': 0.0004964744817853855, 'samples': 1905024, 'steps': 9921, 'loss/train': 1.2019864320755005} -08/30/2021 14:56:18 - INFO - __main__ - Step 9923: {'lr': 0.0004964735936580063, 'samples': 1905216, 'steps': 9922, 'loss/train': 1.9790148735046387} -08/30/2021 14:56:20 - INFO - __main__ - Step 9924: {'lr': 0.00049647270541957, 'samples': 1905408, 'steps': 9923, 'loss/train': 0.15961384773254395} -08/30/2021 14:56:20 - INFO - __main__ - Step 9925: {'lr': 0.0004964718170700767, 'samples': 1905600, 'steps': 9924, 'loss/train': 1.9123448133468628} -08/30/2021 14:56:20 - INFO - __main__ - Step 9926: {'lr': 0.0004964709286095271, 'samples': 1905792, 'steps': 9925, 'loss/train': 1.9273356199264526} -08/30/2021 14:56:21 - INFO - __main__ - Step 9927: {'lr': 0.0004964700400379215, 'samples': 1905984, 'steps': 9926, 'loss/train': 1.5638554096221924} -08/30/2021 14:56:21 - INFO - __main__ - Step 9928: {'lr': 0.0004964691513552604, 'samples': 1906176, 'steps': 9927, 'loss/train': 2.2048823833465576} -08/30/2021 14:56:23 - INFO - __main__ - Step 9929: {'lr': 0.000496468262561544, 'samples': 1906368, 'steps': 9928, 'loss/train': 1.6114774942398071} -08/30/2021 14:56:23 - INFO - __main__ - Step 9930: {'lr': 0.0004964673736567728, 'samples': 1906560, 'steps': 9929, 'loss/train': 2.6401917934417725} -08/30/2021 14:56:23 - INFO - __main__ - Step 9931: {'lr': 0.0004964664846409473, 'samples': 1906752, 'steps': 9930, 'loss/train': 1.914066195487976} -08/30/2021 14:56:24 - INFO - __main__ - Step 9932: {'lr': 0.0004964655955140677, 'samples': 1906944, 'steps': 9931, 'loss/train': 1.8376495838165283} -08/30/2021 14:56:24 - INFO - __main__ - Step 9933: {'lr': 0.0004964647062761345, 'samples': 1907136, 'steps': 9932, 'loss/train': 1.5977219343185425} -08/30/2021 14:56:26 - INFO - __main__ - Step 9934: {'lr': 0.0004964638169271482, 'samples': 1907328, 'steps': 9933, 'loss/train': 2.038529396057129} -08/30/2021 14:56:26 - INFO - __main__ - Step 9935: {'lr': 0.0004964629274671091, 'samples': 1907520, 'steps': 9934, 'loss/train': 1.771410346031189} -08/30/2021 14:56:26 - INFO - __main__ - Step 9936: {'lr': 0.0004964620378960175, 'samples': 1907712, 'steps': 9935, 'loss/train': 1.7764892578125} -08/30/2021 14:56:27 - INFO - __main__ - Step 9937: {'lr': 0.000496461148213874, 'samples': 1907904, 'steps': 9936, 'loss/train': 1.1905723810195923} -08/30/2021 14:56:27 - INFO - __main__ - Step 9938: {'lr': 0.0004964602584206788, 'samples': 1908096, 'steps': 9937, 'loss/train': 1.829355001449585} -08/30/2021 14:56:29 - INFO - __main__ - Step 9939: {'lr': 0.0004964593685164326, 'samples': 1908288, 'steps': 9938, 'loss/train': 2.1132514476776123} -08/30/2021 14:56:29 - INFO - __main__ - Step 9940: {'lr': 0.0004964584785011355, 'samples': 1908480, 'steps': 9939, 'loss/train': 2.7216434478759766} -08/30/2021 14:56:29 - INFO - __main__ - Step 9941: {'lr': 0.000496457588374788, 'samples': 1908672, 'steps': 9940, 'loss/train': 1.8941521644592285} -08/30/2021 14:56:30 - INFO - __main__ - Step 9942: {'lr': 0.0004964566981373905, 'samples': 1908864, 'steps': 9941, 'loss/train': 1.9584522247314453} -08/30/2021 14:56:30 - INFO - __main__ - Step 9943: {'lr': 0.0004964558077889435, 'samples': 1909056, 'steps': 9942, 'loss/train': 2.0020854473114014} -08/30/2021 14:56:32 - INFO - __main__ - Step 9944: {'lr': 0.0004964549173294472, 'samples': 1909248, 'steps': 9943, 'loss/train': 1.4657632112503052} -08/30/2021 14:56:32 - INFO - __main__ - Step 9945: {'lr': 0.0004964540267589023, 'samples': 1909440, 'steps': 9944, 'loss/train': 1.6888188123703003} -08/30/2021 14:56:32 - INFO - __main__ - Step 9946: {'lr': 0.0004964531360773088, 'samples': 1909632, 'steps': 9945, 'loss/train': 1.991836667060852} -08/30/2021 14:56:33 - INFO - __main__ - Step 9947: {'lr': 0.0004964522452846675, 'samples': 1909824, 'steps': 9946, 'loss/train': 1.441489577293396} -08/30/2021 14:56:33 - INFO - __main__ - Step 9948: {'lr': 0.0004964513543809785, 'samples': 1910016, 'steps': 9947, 'loss/train': 1.6609220504760742} -08/30/2021 14:56:35 - INFO - __main__ - Step 9949: {'lr': 0.0004964504633662424, 'samples': 1910208, 'steps': 9948, 'loss/train': 2.0449202060699463} -08/30/2021 14:56:35 - INFO - __main__ - Step 9950: {'lr': 0.0004964495722404595, 'samples': 1910400, 'steps': 9949, 'loss/train': 1.8106787204742432} -08/30/2021 14:56:36 - INFO - __main__ - Step 9951: {'lr': 0.0004964486810036301, 'samples': 1910592, 'steps': 9950, 'loss/train': 1.1692430973052979} -08/30/2021 14:56:36 - INFO - __main__ - Step 9952: {'lr': 0.000496447789655755, 'samples': 1910784, 'steps': 9951, 'loss/train': 0.809981644153595} -08/30/2021 14:56:36 - INFO - __main__ - Step 9953: {'lr': 0.0004964468981968341, 'samples': 1910976, 'steps': 9952, 'loss/train': 1.773395299911499} -08/30/2021 14:56:38 - INFO - __main__ - Step 9954: {'lr': 0.0004964460066268681, 'samples': 1911168, 'steps': 9953, 'loss/train': 1.162157416343689} -08/30/2021 14:56:38 - INFO - __main__ - Step 9955: {'lr': 0.0004964451149458573, 'samples': 1911360, 'steps': 9954, 'loss/train': 1.6730577945709229} -08/30/2021 14:56:39 - INFO - __main__ - Step 9956: {'lr': 0.0004964442231538023, 'samples': 1911552, 'steps': 9955, 'loss/train': 1.6550753116607666} -08/30/2021 14:56:39 - INFO - __main__ - Step 9957: {'lr': 0.000496443331250703, 'samples': 1911744, 'steps': 9956, 'loss/train': 1.7674018144607544} -08/30/2021 14:56:39 - INFO - __main__ - Step 9958: {'lr': 0.0004964424392365604, 'samples': 1911936, 'steps': 9957, 'loss/train': 1.8954929113388062} -08/30/2021 14:56:40 - INFO - __main__ - Step 9959: {'lr': 0.0004964415471113747, 'samples': 1912128, 'steps': 9958, 'loss/train': 1.3786265850067139} -08/30/2021 14:56:41 - INFO - __main__ - Step 9960: {'lr': 0.0004964406548751461, 'samples': 1912320, 'steps': 9959, 'loss/train': 2.2502574920654297} -08/30/2021 14:56:42 - INFO - __main__ - Step 9961: {'lr': 0.0004964397625278751, 'samples': 1912512, 'steps': 9960, 'loss/train': 1.9674396514892578} -08/30/2021 14:56:42 - INFO - __main__ - Step 9962: {'lr': 0.0004964388700695623, 'samples': 1912704, 'steps': 9961, 'loss/train': 1.7398422956466675} -08/30/2021 14:56:42 - INFO - __main__ - Step 9963: {'lr': 0.0004964379775002078, 'samples': 1912896, 'steps': 9962, 'loss/train': 1.7798408269882202} -08/30/2021 14:56:43 - INFO - __main__ - Step 9964: {'lr': 0.0004964370848198122, 'samples': 1913088, 'steps': 9963, 'loss/train': 1.5920237302780151} -08/30/2021 14:56:45 - INFO - __main__ - Step 9965: {'lr': 0.0004964361920283759, 'samples': 1913280, 'steps': 9964, 'loss/train': 1.7673590183258057} -08/30/2021 14:56:45 - INFO - __main__ - Step 9966: {'lr': 0.0004964352991258992, 'samples': 1913472, 'steps': 9965, 'loss/train': 1.5249208211898804} -08/30/2021 14:56:45 - INFO - __main__ - Step 9967: {'lr': 0.0004964344061123826, 'samples': 1913664, 'steps': 9966, 'loss/train': 1.9139293432235718} -08/30/2021 14:56:46 - INFO - __main__ - Step 9968: {'lr': 0.0004964335129878264, 'samples': 1913856, 'steps': 9967, 'loss/train': 1.420186161994934} -08/30/2021 14:56:46 - INFO - __main__ - Step 9969: {'lr': 0.0004964326197522311, 'samples': 1914048, 'steps': 9968, 'loss/train': 1.9627630710601807} -08/30/2021 14:56:48 - INFO - __main__ - Step 9970: {'lr': 0.0004964317264055971, 'samples': 1914240, 'steps': 9969, 'loss/train': 1.156221866607666} -08/30/2021 14:56:48 - INFO - __main__ - Step 9971: {'lr': 0.0004964308329479247, 'samples': 1914432, 'steps': 9970, 'loss/train': 1.1966806650161743} -08/30/2021 14:56:48 - INFO - __main__ - Step 9972: {'lr': 0.0004964299393792143, 'samples': 1914624, 'steps': 9971, 'loss/train': 1.853172779083252} -08/30/2021 14:56:49 - INFO - __main__ - Step 9973: {'lr': 0.0004964290456994666, 'samples': 1914816, 'steps': 9972, 'loss/train': 1.675586462020874} -08/30/2021 14:56:49 - INFO - __main__ - Step 9974: {'lr': 0.0004964281519086816, 'samples': 1915008, 'steps': 9973, 'loss/train': 2.259634256362915} -08/30/2021 14:56:51 - INFO - __main__ - Step 9975: {'lr': 0.0004964272580068599, 'samples': 1915200, 'steps': 9974, 'loss/train': 1.6877899169921875} -08/30/2021 14:56:51 - INFO - __main__ - Step 9976: {'lr': 0.0004964263639940018, 'samples': 1915392, 'steps': 9975, 'loss/train': 1.482268214225769} -08/30/2021 14:56:51 - INFO - __main__ - Step 9977: {'lr': 0.000496425469870108, 'samples': 1915584, 'steps': 9976, 'loss/train': 1.7324260473251343} -08/30/2021 14:56:52 - INFO - __main__ - Step 9978: {'lr': 0.0004964245756351786, 'samples': 1915776, 'steps': 9977, 'loss/train': 1.5633198022842407} -08/30/2021 14:56:52 - INFO - __main__ - Step 9979: {'lr': 0.000496423681289214, 'samples': 1915968, 'steps': 9978, 'loss/train': 1.7842503786087036} -08/30/2021 14:56:53 - INFO - __main__ - Step 9980: {'lr': 0.0004964227868322148, 'samples': 1916160, 'steps': 9979, 'loss/train': 1.7017784118652344} -08/30/2021 14:56:54 - INFO - __main__ - Step 9981: {'lr': 0.0004964218922641812, 'samples': 1916352, 'steps': 9980, 'loss/train': 1.4904532432556152} -08/30/2021 14:56:54 - INFO - __main__ - Step 9982: {'lr': 0.0004964209975851137, 'samples': 1916544, 'steps': 9981, 'loss/train': 1.8057057857513428} -08/30/2021 14:56:55 - INFO - __main__ - Step 9983: {'lr': 0.0004964201027950129, 'samples': 1916736, 'steps': 9982, 'loss/train': 1.4644185304641724} -08/30/2021 14:56:55 - INFO - __main__ - Step 9984: {'lr': 0.0004964192078938788, 'samples': 1916928, 'steps': 9983, 'loss/train': 1.6545456647872925} -08/30/2021 14:56:57 - INFO - __main__ - Step 9985: {'lr': 0.0004964183128817121, 'samples': 1917120, 'steps': 9984, 'loss/train': 1.7370964288711548} -08/30/2021 14:56:57 - INFO - __main__ - Step 9986: {'lr': 0.000496417417758513, 'samples': 1917312, 'steps': 9985, 'loss/train': 2.379159927368164} -08/30/2021 14:56:57 - INFO - __main__ - Step 9987: {'lr': 0.000496416522524282, 'samples': 1917504, 'steps': 9986, 'loss/train': 1.9058454036712646} -08/30/2021 14:56:58 - INFO - __main__ - Step 9988: {'lr': 0.0004964156271790197, 'samples': 1917696, 'steps': 9987, 'loss/train': 1.170692801475525} -08/30/2021 14:56:58 - INFO - __main__ - Step 9989: {'lr': 0.0004964147317227262, 'samples': 1917888, 'steps': 9988, 'loss/train': 1.8171964883804321} -08/30/2021 14:56:59 - INFO - __main__ - Step 9990: {'lr': 0.000496413836155402, 'samples': 1918080, 'steps': 9989, 'loss/train': 1.9222526550292969} -08/30/2021 14:57:00 - INFO - __main__ - Step 9991: {'lr': 0.0004964129404770476, 'samples': 1918272, 'steps': 9990, 'loss/train': 1.1143251657485962} -08/30/2021 14:57:00 - INFO - __main__ - Step 9992: {'lr': 0.0004964120446876633, 'samples': 1918464, 'steps': 9991, 'loss/train': 1.8447924852371216} -08/30/2021 14:57:01 - INFO - __main__ - Step 9993: {'lr': 0.0004964111487872495, 'samples': 1918656, 'steps': 9992, 'loss/train': 2.0372166633605957} -08/30/2021 14:57:01 - INFO - __main__ - Step 9994: {'lr': 0.0004964102527758067, 'samples': 1918848, 'steps': 9993, 'loss/train': 1.631529688835144} -08/30/2021 14:57:01 - INFO - __main__ - Step 9995: {'lr': 0.0004964093566533352, 'samples': 1919040, 'steps': 9994, 'loss/train': 1.91537344455719} -08/30/2021 14:57:03 - INFO - __main__ - Step 9996: {'lr': 0.0004964084604198354, 'samples': 1919232, 'steps': 9995, 'loss/train': 1.7254267930984497} -08/30/2021 14:57:03 - INFO - __main__ - Step 9997: {'lr': 0.0004964075640753079, 'samples': 1919424, 'steps': 9996, 'loss/train': 1.6130692958831787} -08/30/2021 14:57:04 - INFO - __main__ - Step 9998: {'lr': 0.0004964066676197528, 'samples': 1919616, 'steps': 9997, 'loss/train': 1.1783849000930786} -08/30/2021 14:57:04 - INFO - __main__ - Step 9999: {'lr': 0.0004964057710531707, 'samples': 1919808, 'steps': 9998, 'loss/train': 1.6470781564712524} -08/30/2021 14:57:04 - INFO - __main__ - Step 10000: {'lr': 0.0004964048743755621, 'samples': 1920000, 'steps': 9999, 'loss/train': 1.5546714067459106} -08/30/2021 14:57:06 - INFO - __main__ - Step 10001: {'lr': 0.0004964039775869272, 'samples': 1920192, 'steps': 10000, 'loss/train': 1.6607551574707031} -08/30/2021 14:57:06 - INFO - __main__ - Step 10002: {'lr': 0.0004964030806872664, 'samples': 1920384, 'steps': 10001, 'loss/train': 2.0873374938964844} -08/30/2021 14:57:07 - INFO - __main__ - Step 10003: {'lr': 0.0004964021836765802, 'samples': 1920576, 'steps': 10002, 'loss/train': 2.0015244483947754} -08/30/2021 14:57:07 - INFO - __main__ - Step 10004: {'lr': 0.000496401286554869, 'samples': 1920768, 'steps': 10003, 'loss/train': 1.5208274126052856} -08/30/2021 14:57:07 - INFO - __main__ - Step 10005: {'lr': 0.000496400389322133, 'samples': 1920960, 'steps': 10004, 'loss/train': 2.051011562347412} -08/30/2021 14:57:09 - INFO - __main__ - Step 10006: {'lr': 0.000496399491978373, 'samples': 1921152, 'steps': 10005, 'loss/train': 2.166624069213867} -08/30/2021 14:57:10 - INFO - __main__ - Step 10007: {'lr': 0.0004963985945235891, 'samples': 1921344, 'steps': 10006, 'loss/train': 4.9143900871276855} -08/30/2021 14:57:10 - INFO - __main__ - Step 10008: {'lr': 0.0004963976969577819, 'samples': 1921536, 'steps': 10007, 'loss/train': 2.3767783641815186} -08/30/2021 14:57:10 - INFO - __main__ - Step 10009: {'lr': 0.0004963967992809516, 'samples': 1921728, 'steps': 10008, 'loss/train': 0.2657642662525177} -08/30/2021 14:57:11 - INFO - __main__ - Step 10010: {'lr': 0.0004963959014930988, 'samples': 1921920, 'steps': 10009, 'loss/train': 2.181117534637451} -08/30/2021 14:57:12 - INFO - __main__ - Step 10011: {'lr': 0.0004963950035942237, 'samples': 1922112, 'steps': 10010, 'loss/train': 2.0658130645751953} -08/30/2021 14:57:13 - INFO - __main__ - Step 10012: {'lr': 0.0004963941055843268, 'samples': 1922304, 'steps': 10011, 'loss/train': 1.91506028175354} -08/30/2021 14:57:13 - INFO - __main__ - Step 10013: {'lr': 0.0004963932074634087, 'samples': 1922496, 'steps': 10012, 'loss/train': 1.8211382627487183} -08/30/2021 14:57:13 - INFO - __main__ - Step 10014: {'lr': 0.0004963923092314694, 'samples': 1922688, 'steps': 10013, 'loss/train': 1.928120493888855} -08/30/2021 14:57:14 - INFO - __main__ - Step 10015: {'lr': 0.0004963914108885097, 'samples': 1922880, 'steps': 10014, 'loss/train': 1.6316910982131958} -08/30/2021 14:57:15 - INFO - __main__ - Step 10016: {'lr': 0.0004963905124345297, 'samples': 1923072, 'steps': 10015, 'loss/train': 1.9263784885406494} -08/30/2021 14:57:16 - INFO - __main__ - Step 10017: {'lr': 0.00049638961386953, 'samples': 1923264, 'steps': 10016, 'loss/train': 1.7138534784317017} -08/30/2021 14:57:16 - INFO - __main__ - Step 10018: {'lr': 0.000496388715193511, 'samples': 1923456, 'steps': 10017, 'loss/train': 1.8585059642791748} -08/30/2021 14:57:16 - INFO - __main__ - Step 10019: {'lr': 0.000496387816406473, 'samples': 1923648, 'steps': 10018, 'loss/train': 2.00970458984375} -08/30/2021 14:57:17 - INFO - __main__ - Step 10020: {'lr': 0.0004963869175084164, 'samples': 1923840, 'steps': 10019, 'loss/train': 1.9403449296951294} -08/30/2021 14:57:17 - INFO - __main__ - Step 10021: {'lr': 0.0004963860184993416, 'samples': 1924032, 'steps': 10020, 'loss/train': 1.5665193796157837} -08/30/2021 14:57:19 - INFO - __main__ - Step 10022: {'lr': 0.0004963851193792492, 'samples': 1924224, 'steps': 10021, 'loss/train': 1.9872945547103882} -08/30/2021 14:57:20 - INFO - __main__ - Step 10023: {'lr': 0.0004963842201481394, 'samples': 1924416, 'steps': 10022, 'loss/train': 2.0834667682647705} -08/30/2021 14:57:20 - INFO - __main__ - Step 10024: {'lr': 0.0004963833208060128, 'samples': 1924608, 'steps': 10023, 'loss/train': 2.122685432434082} -08/30/2021 14:57:20 - INFO - __main__ - Step 10025: {'lr': 0.0004963824213528696, 'samples': 1924800, 'steps': 10024, 'loss/train': 2.247332811355591} -08/30/2021 14:57:21 - INFO - __main__ - Step 10026: {'lr': 0.0004963815217887102, 'samples': 1924992, 'steps': 10025, 'loss/train': 1.3828188180923462} -08/30/2021 14:57:22 - INFO - __main__ - Step 10027: {'lr': 0.0004963806221135351, 'samples': 1925184, 'steps': 10026, 'loss/train': 3.7562947273254395} -08/30/2021 14:57:23 - INFO - __main__ - Step 10028: {'lr': 0.0004963797223273448, 'samples': 1925376, 'steps': 10027, 'loss/train': 1.1838608980178833} -08/30/2021 14:57:23 - INFO - __main__ - Step 10029: {'lr': 0.0004963788224301395, 'samples': 1925568, 'steps': 10028, 'loss/train': 1.8303600549697876} -08/30/2021 14:57:23 - INFO - __main__ - Step 10030: {'lr': 0.0004963779224219197, 'samples': 1925760, 'steps': 10029, 'loss/train': 1.9881763458251953} -08/30/2021 14:57:24 - INFO - __main__ - Step 10031: {'lr': 0.0004963770223026858, 'samples': 1925952, 'steps': 10030, 'loss/train': 1.942649006843567} -08/30/2021 14:57:25 - INFO - __main__ - Step 10032: {'lr': 0.0004963761220724384, 'samples': 1926144, 'steps': 10031, 'loss/train': 1.647000789642334} -08/30/2021 14:57:25 - INFO - __main__ - Step 10033: {'lr': 0.0004963752217311775, 'samples': 1926336, 'steps': 10032, 'loss/train': 1.5193215608596802} -08/30/2021 14:57:26 - INFO - __main__ - Step 10034: {'lr': 0.0004963743212789038, 'samples': 1926528, 'steps': 10033, 'loss/train': 2.008763551712036} -08/30/2021 14:57:26 - INFO - __main__ - Step 10035: {'lr': 0.0004963734207156178, 'samples': 1926720, 'steps': 10034, 'loss/train': 1.6514290571212769} -08/30/2021 14:57:26 - INFO - __main__ - Step 10036: {'lr': 0.0004963725200413195, 'samples': 1926912, 'steps': 10035, 'loss/train': 1.63376784324646} -08/30/2021 14:57:28 - INFO - __main__ - Step 10037: {'lr': 0.0004963716192560097, 'samples': 1927104, 'steps': 10036, 'loss/train': 1.6030821800231934} -08/30/2021 14:57:28 - INFO - __main__ - Step 10038: {'lr': 0.0004963707183596885, 'samples': 1927296, 'steps': 10037, 'loss/train': 1.554940938949585} -08/30/2021 14:57:29 - INFO - __main__ - Step 10039: {'lr': 0.0004963698173523566, 'samples': 1927488, 'steps': 10038, 'loss/train': 2.125246047973633} -08/30/2021 14:57:29 - INFO - __main__ - Step 10040: {'lr': 0.0004963689162340142, 'samples': 1927680, 'steps': 10039, 'loss/train': 1.491138219833374} -08/30/2021 14:57:30 - INFO - __main__ - Step 10041: {'lr': 0.0004963680150046618, 'samples': 1927872, 'steps': 10040, 'loss/train': 1.8210960626602173} -08/30/2021 14:57:31 - INFO - __main__ - Step 10042: {'lr': 0.0004963671136642997, 'samples': 1928064, 'steps': 10041, 'loss/train': 1.8418312072753906} -08/30/2021 14:57:32 - INFO - __main__ - Step 10043: {'lr': 0.0004963662122129284, 'samples': 1928256, 'steps': 10042, 'loss/train': 0.6766268610954285} -08/30/2021 14:57:32 - INFO - __main__ - Step 10044: {'lr': 0.0004963653106505483, 'samples': 1928448, 'steps': 10043, 'loss/train': 1.8348647356033325} -08/30/2021 14:57:32 - INFO - __main__ - Step 10045: {'lr': 0.0004963644089771598, 'samples': 1928640, 'steps': 10044, 'loss/train': 2.135529041290283} -08/30/2021 14:57:33 - INFO - __main__ - Step 10046: {'lr': 0.0004963635071927633, 'samples': 1928832, 'steps': 10045, 'loss/train': 1.9546533823013306} -08/30/2021 14:57:34 - INFO - __main__ - Step 10047: {'lr': 0.0004963626052973592, 'samples': 1929024, 'steps': 10046, 'loss/train': 1.526484489440918} -08/30/2021 14:57:35 - INFO - __main__ - Step 10048: {'lr': 0.0004963617032909479, 'samples': 1929216, 'steps': 10047, 'loss/train': 1.817151427268982} -08/30/2021 14:57:35 - INFO - __main__ - Step 10049: {'lr': 0.0004963608011735298, 'samples': 1929408, 'steps': 10048, 'loss/train': 1.9247368574142456} -08/30/2021 14:57:35 - INFO - __main__ - Step 10050: {'lr': 0.0004963598989451053, 'samples': 1929600, 'steps': 10049, 'loss/train': 1.6581131219863892} -08/30/2021 14:57:36 - INFO - __main__ - Step 10051: {'lr': 0.000496358996605675, 'samples': 1929792, 'steps': 10050, 'loss/train': 1.4466031789779663} -08/30/2021 14:57:37 - INFO - __main__ - Step 10052: {'lr': 0.0004963580941552391, 'samples': 1929984, 'steps': 10051, 'loss/train': 1.6546374559402466} -08/30/2021 14:57:38 - INFO - __main__ - Step 10053: {'lr': 0.0004963571915937979, 'samples': 1930176, 'steps': 10052, 'loss/train': 2.0494463443756104} -08/30/2021 14:57:38 - INFO - __main__ - Step 10054: {'lr': 0.000496356288921352, 'samples': 1930368, 'steps': 10053, 'loss/train': 1.6917833089828491} -08/30/2021 14:57:38 - INFO - __main__ - Step 10055: {'lr': 0.0004963553861379018, 'samples': 1930560, 'steps': 10054, 'loss/train': 1.950510859489441} -08/30/2021 14:57:39 - INFO - __main__ - Step 10056: {'lr': 0.0004963544832434476, 'samples': 1930752, 'steps': 10055, 'loss/train': 1.8846999406814575} -08/30/2021 14:57:40 - INFO - __main__ - Step 10057: {'lr': 0.00049635358023799, 'samples': 1930944, 'steps': 10056, 'loss/train': 1.5036273002624512} -08/30/2021 14:57:41 - INFO - __main__ - Step 10058: {'lr': 0.0004963526771215291, 'samples': 1931136, 'steps': 10057, 'loss/train': 1.988438606262207} -08/30/2021 14:57:41 - INFO - __main__ - Step 10059: {'lr': 0.0004963517738940656, 'samples': 1931328, 'steps': 10058, 'loss/train': 2.1263527870178223} -08/30/2021 14:57:41 - INFO - __main__ - Step 10060: {'lr': 0.0004963508705555998, 'samples': 1931520, 'steps': 10059, 'loss/train': 2.0561323165893555} -08/30/2021 14:57:42 - INFO - __main__ - Step 10061: {'lr': 0.000496349967106132, 'samples': 1931712, 'steps': 10060, 'loss/train': 1.9084632396697998} -08/30/2021 14:57:43 - INFO - __main__ - Step 10062: {'lr': 0.0004963490635456629, 'samples': 1931904, 'steps': 10061, 'loss/train': 2.1884217262268066} -08/30/2021 14:57:44 - INFO - __main__ - Step 10063: {'lr': 0.0004963481598741925, 'samples': 1932096, 'steps': 10062, 'loss/train': 1.8260231018066406} -08/30/2021 14:57:44 - INFO - __main__ - Step 10064: {'lr': 0.0004963472560917216, 'samples': 1932288, 'steps': 10063, 'loss/train': 2.044750213623047} -08/30/2021 14:57:44 - INFO - __main__ - Step 10065: {'lr': 0.0004963463521982503, 'samples': 1932480, 'steps': 10064, 'loss/train': 1.5723226070404053} -08/30/2021 14:57:45 - INFO - __main__ - Step 10066: {'lr': 0.0004963454481937791, 'samples': 1932672, 'steps': 10065, 'loss/train': 2.119046688079834} -08/30/2021 14:57:46 - INFO - __main__ - Step 10067: {'lr': 0.0004963445440783086, 'samples': 1932864, 'steps': 10066, 'loss/train': 1.9843782186508179} -08/30/2021 14:57:47 - INFO - __main__ - Step 10068: {'lr': 0.0004963436398518389, 'samples': 1933056, 'steps': 10067, 'loss/train': 1.5568156242370605} -08/30/2021 14:57:47 - INFO - __main__ - Step 10069: {'lr': 0.0004963427355143706, 'samples': 1933248, 'steps': 10068, 'loss/train': 1.9988080263137817} -08/30/2021 14:57:47 - INFO - __main__ - Step 10070: {'lr': 0.0004963418310659041, 'samples': 1933440, 'steps': 10069, 'loss/train': 1.257478952407837} -08/30/2021 14:57:48 - INFO - __main__ - Step 10071: {'lr': 0.0004963409265064398, 'samples': 1933632, 'steps': 10070, 'loss/train': 0.793785810470581} -08/30/2021 14:57:48 - INFO - __main__ - Step 10072: {'lr': 0.0004963400218359781, 'samples': 1933824, 'steps': 10071, 'loss/train': 1.8985668420791626} -08/30/2021 14:57:50 - INFO - __main__ - Step 10073: {'lr': 0.0004963391170545193, 'samples': 1934016, 'steps': 10072, 'loss/train': 0.1252242475748062} -08/30/2021 14:57:50 - INFO - __main__ - Step 10074: {'lr': 0.0004963382121620639, 'samples': 1934208, 'steps': 10073, 'loss/train': 2.0857741832733154} -08/30/2021 14:57:50 - INFO - __main__ - Step 10075: {'lr': 0.0004963373071586123, 'samples': 1934400, 'steps': 10074, 'loss/train': 2.034210443496704} -08/30/2021 14:57:51 - INFO - __main__ - Step 10076: {'lr': 0.000496336402044165, 'samples': 1934592, 'steps': 10075, 'loss/train': 1.6108455657958984} -08/30/2021 14:57:51 - INFO - __main__ - Step 10077: {'lr': 0.0004963354968187222, 'samples': 1934784, 'steps': 10076, 'loss/train': 2.5568816661834717} -08/30/2021 14:57:53 - INFO - __main__ - Step 10078: {'lr': 0.0004963345914822845, 'samples': 1934976, 'steps': 10077, 'loss/train': 1.9205923080444336} -08/30/2021 14:57:54 - INFO - __main__ - Step 10079: {'lr': 0.0004963336860348521, 'samples': 1935168, 'steps': 10078, 'loss/train': 1.9299153089523315} -08/30/2021 14:57:54 - INFO - __main__ - Step 10080: {'lr': 0.0004963327804764257, 'samples': 1935360, 'steps': 10079, 'loss/train': 1.9766066074371338} -08/30/2021 14:57:54 - INFO - __main__ - Step 10081: {'lr': 0.0004963318748070056, 'samples': 1935552, 'steps': 10080, 'loss/train': 1.97420334815979} -08/30/2021 14:57:55 - INFO - __main__ - Step 10082: {'lr': 0.0004963309690265921, 'samples': 1935744, 'steps': 10081, 'loss/train': 1.6910001039505005} -08/30/2021 14:57:56 - INFO - __main__ - Step 10083: {'lr': 0.0004963300631351856, 'samples': 1935936, 'steps': 10082, 'loss/train': 1.0413610935211182} -08/30/2021 14:57:57 - INFO - __main__ - Step 10084: {'lr': 0.0004963291571327866, 'samples': 1936128, 'steps': 10083, 'loss/train': 1.5702033042907715} -08/30/2021 14:57:57 - INFO - __main__ - Step 10085: {'lr': 0.0004963282510193955, 'samples': 1936320, 'steps': 10084, 'loss/train': 1.4221917390823364} -08/30/2021 14:57:57 - INFO - __main__ - Step 10086: {'lr': 0.0004963273447950126, 'samples': 1936512, 'steps': 10085, 'loss/train': 1.863145112991333} -08/30/2021 14:57:58 - INFO - __main__ - Step 10087: {'lr': 0.0004963264384596386, 'samples': 1936704, 'steps': 10086, 'loss/train': 2.041637659072876} -08/30/2021 14:57:59 - INFO - __main__ - Step 10088: {'lr': 0.0004963255320132735, 'samples': 1936896, 'steps': 10087, 'loss/train': 1.5413753986358643} -08/30/2021 14:58:00 - INFO - __main__ - Step 10089: {'lr': 0.0004963246254559181, 'samples': 1937088, 'steps': 10088, 'loss/train': 1.2902778387069702} -08/30/2021 14:58:00 - INFO - __main__ - Step 10090: {'lr': 0.0004963237187875724, 'samples': 1937280, 'steps': 10089, 'loss/train': 1.2422256469726562} -08/30/2021 14:58:00 - INFO - __main__ - Step 10091: {'lr': 0.0004963228120082372, 'samples': 1937472, 'steps': 10090, 'loss/train': 2.091702461242676} -08/30/2021 14:58:01 - INFO - __main__ - Step 10092: {'lr': 0.0004963219051179127, 'samples': 1937664, 'steps': 10091, 'loss/train': 2.056105852127075} -08/30/2021 14:58:02 - INFO - __main__ - Step 10093: {'lr': 0.0004963209981165993, 'samples': 1937856, 'steps': 10092, 'loss/train': 1.5542057752609253} -08/30/2021 14:58:03 - INFO - __main__ - Step 10094: {'lr': 0.0004963200910042976, 'samples': 1938048, 'steps': 10093, 'loss/train': 1.575708270072937} -08/30/2021 14:58:03 - INFO - __main__ - Step 10095: {'lr': 0.0004963191837810077, 'samples': 1938240, 'steps': 10094, 'loss/train': 2.1271841526031494} -08/30/2021 14:58:03 - INFO - __main__ - Step 10096: {'lr': 0.0004963182764467303, 'samples': 1938432, 'steps': 10095, 'loss/train': 0.9086203575134277} -08/30/2021 14:58:04 - INFO - __main__ - Step 10097: {'lr': 0.0004963173690014656, 'samples': 1938624, 'steps': 10096, 'loss/train': 1.4094364643096924} -08/30/2021 14:58:05 - INFO - __main__ - Step 10098: {'lr': 0.0004963164614452142, 'samples': 1938816, 'steps': 10097, 'loss/train': 2.0525710582733154} -08/30/2021 14:58:06 - INFO - __main__ - Step 10099: {'lr': 0.0004963155537779764, 'samples': 1939008, 'steps': 10098, 'loss/train': 2.0697312355041504} -08/30/2021 14:58:06 - INFO - __main__ - Step 10100: {'lr': 0.0004963146459997525, 'samples': 1939200, 'steps': 10099, 'loss/train': 1.7506622076034546} -08/30/2021 14:58:07 - INFO - __main__ - Step 10101: {'lr': 0.0004963137381105431, 'samples': 1939392, 'steps': 10100, 'loss/train': 1.7772756814956665} -08/30/2021 14:58:07 - INFO - __main__ - Step 10102: {'lr': 0.0004963128301103485, 'samples': 1939584, 'steps': 10101, 'loss/train': 1.4139899015426636} -08/30/2021 14:58:07 - INFO - __main__ - Step 10103: {'lr': 0.0004963119219991691, 'samples': 1939776, 'steps': 10102, 'loss/train': 2.061192750930786} -08/30/2021 14:58:09 - INFO - __main__ - Step 10104: {'lr': 0.0004963110137770054, 'samples': 1939968, 'steps': 10103, 'loss/train': 1.6963818073272705} -08/30/2021 14:58:09 - INFO - __main__ - Step 10105: {'lr': 0.0004963101054438578, 'samples': 1940160, 'steps': 10104, 'loss/train': 2.4496877193450928} -08/30/2021 14:58:10 - INFO - __main__ - Step 10106: {'lr': 0.0004963091969997265, 'samples': 1940352, 'steps': 10105, 'loss/train': 1.8720544576644897} -08/30/2021 14:58:10 - INFO - __main__ - Step 10107: {'lr': 0.0004963082884446123, 'samples': 1940544, 'steps': 10106, 'loss/train': 1.7878438234329224} -08/30/2021 14:58:10 - INFO - __main__ - Step 10108: {'lr': 0.0004963073797785153, 'samples': 1940736, 'steps': 10107, 'loss/train': 1.8549368381500244} -08/30/2021 14:58:12 - INFO - __main__ - Step 10109: {'lr': 0.000496306471001436, 'samples': 1940928, 'steps': 10108, 'loss/train': 2.173051595687866} -08/30/2021 14:58:12 - INFO - __main__ - Step 10110: {'lr': 0.0004963055621133748, 'samples': 1941120, 'steps': 10109, 'loss/train': 2.741757392883301} -08/30/2021 14:58:13 - INFO - __main__ - Step 10111: {'lr': 0.0004963046531143321, 'samples': 1941312, 'steps': 10110, 'loss/train': 1.8910725116729736} -08/30/2021 14:58:13 - INFO - __main__ - Step 10112: {'lr': 0.0004963037440043083, 'samples': 1941504, 'steps': 10111, 'loss/train': 2.3466920852661133} -08/30/2021 14:58:13 - INFO - __main__ - Step 10113: {'lr': 0.0004963028347833038, 'samples': 1941696, 'steps': 10112, 'loss/train': 1.580188512802124} -08/30/2021 14:58:15 - INFO - __main__ - Step 10114: {'lr': 0.0004963019254513191, 'samples': 1941888, 'steps': 10113, 'loss/train': 1.651946783065796} -08/30/2021 14:58:15 - INFO - __main__ - Step 10115: {'lr': 0.0004963010160083546, 'samples': 1942080, 'steps': 10114, 'loss/train': 1.6463650465011597} -08/30/2021 14:58:16 - INFO - __main__ - Step 10116: {'lr': 0.0004963001064544106, 'samples': 1942272, 'steps': 10115, 'loss/train': 2.0618479251861572} -08/30/2021 14:58:16 - INFO - __main__ - Step 10117: {'lr': 0.0004962991967894876, 'samples': 1942464, 'steps': 10116, 'loss/train': 1.668412208557129} -08/30/2021 14:58:16 - INFO - __main__ - Step 10118: {'lr': 0.0004962982870135859, 'samples': 1942656, 'steps': 10117, 'loss/train': 2.3173820972442627} -08/30/2021 14:58:18 - INFO - __main__ - Step 10119: {'lr': 0.0004962973771267061, 'samples': 1942848, 'steps': 10118, 'loss/train': 1.8275506496429443} -08/30/2021 14:58:18 - INFO - __main__ - Step 10120: {'lr': 0.0004962964671288484, 'samples': 1943040, 'steps': 10119, 'loss/train': 1.7746307849884033} -08/30/2021 14:58:19 - INFO - __main__ - Step 10121: {'lr': 0.0004962955570200135, 'samples': 1943232, 'steps': 10120, 'loss/train': 1.8133124113082886} -08/30/2021 14:58:19 - INFO - __main__ - Step 10122: {'lr': 0.0004962946468002014, 'samples': 1943424, 'steps': 10121, 'loss/train': 1.0313243865966797} -08/30/2021 14:58:20 - INFO - __main__ - Step 10123: {'lr': 0.0004962937364694129, 'samples': 1943616, 'steps': 10122, 'loss/train': 2.112544059753418} -08/30/2021 14:58:21 - INFO - __main__ - Step 10124: {'lr': 0.0004962928260276481, 'samples': 1943808, 'steps': 10123, 'loss/train': 2.061617374420166} -08/30/2021 14:58:21 - INFO - __main__ - Step 10125: {'lr': 0.0004962919154749077, 'samples': 1944000, 'steps': 10124, 'loss/train': 2.033141851425171} -08/30/2021 14:58:22 - INFO - __main__ - Step 10126: {'lr': 0.0004962910048111919, 'samples': 1944192, 'steps': 10125, 'loss/train': 1.267006754875183} -08/30/2021 14:58:22 - INFO - __main__ - Step 10127: {'lr': 0.0004962900940365012, 'samples': 1944384, 'steps': 10126, 'loss/train': 2.104240894317627} -08/30/2021 14:58:22 - INFO - __main__ - Step 10128: {'lr': 0.0004962891831508359, 'samples': 1944576, 'steps': 10127, 'loss/train': 1.6723476648330688} -08/30/2021 14:58:25 - INFO - __main__ - Step 10129: {'lr': 0.0004962882721541965, 'samples': 1944768, 'steps': 10128, 'loss/train': 2.021334409713745} -08/30/2021 14:58:25 - INFO - __main__ - Step 10130: {'lr': 0.0004962873610465835, 'samples': 1944960, 'steps': 10129, 'loss/train': 1.295798420906067} -08/30/2021 14:58:26 - INFO - __main__ - Step 10131: {'lr': 0.0004962864498279972, 'samples': 1945152, 'steps': 10130, 'loss/train': 2.0763285160064697} -08/30/2021 14:58:26 - INFO - __main__ - Step 10132: {'lr': 0.000496285538498438, 'samples': 1945344, 'steps': 10131, 'loss/train': 2.2645416259765625} -08/30/2021 14:58:26 - INFO - __main__ - Step 10133: {'lr': 0.0004962846270579062, 'samples': 1945536, 'steps': 10132, 'loss/train': 3.4351065158843994} -08/30/2021 14:58:27 - INFO - __main__ - Step 10134: {'lr': 0.0004962837155064025, 'samples': 1945728, 'steps': 10133, 'loss/train': 1.7721301317214966} -08/30/2021 14:58:28 - INFO - __main__ - Step 10135: {'lr': 0.0004962828038439272, 'samples': 1945920, 'steps': 10134, 'loss/train': 1.7989479303359985} -08/30/2021 14:58:29 - INFO - __main__ - Step 10136: {'lr': 0.0004962818920704805, 'samples': 1946112, 'steps': 10135, 'loss/train': 1.469241976737976} -08/30/2021 14:58:29 - INFO - __main__ - Step 10137: {'lr': 0.0004962809801860632, 'samples': 1946304, 'steps': 10136, 'loss/train': 1.559409737586975} -08/30/2021 14:58:29 - INFO - __main__ - Step 10138: {'lr': 0.0004962800681906753, 'samples': 1946496, 'steps': 10137, 'loss/train': 1.8546239137649536} -08/30/2021 14:58:30 - INFO - __main__ - Step 10139: {'lr': 0.0004962791560843175, 'samples': 1946688, 'steps': 10138, 'loss/train': 1.006983757019043} -08/30/2021 14:58:31 - INFO - __main__ - Step 10140: {'lr': 0.00049627824386699, 'samples': 1946880, 'steps': 10139, 'loss/train': 1.4265390634536743} -08/30/2021 14:58:31 - INFO - __main__ - Step 10141: {'lr': 0.0004962773315386935, 'samples': 1947072, 'steps': 10140, 'loss/train': 1.695970058441162} -08/30/2021 14:58:32 - INFO - __main__ - Step 10142: {'lr': 0.0004962764190994282, 'samples': 1947264, 'steps': 10141, 'loss/train': 2.147231101989746} -08/30/2021 14:58:32 - INFO - __main__ - Step 10143: {'lr': 0.0004962755065491944, 'samples': 1947456, 'steps': 10142, 'loss/train': 2.2169349193573} -08/30/2021 14:58:32 - INFO - __main__ - Step 10144: {'lr': 0.0004962745938879928, 'samples': 1947648, 'steps': 10143, 'loss/train': 1.2095531225204468} -08/30/2021 14:58:34 - INFO - __main__ - Step 10145: {'lr': 0.0004962736811158236, 'samples': 1947840, 'steps': 10144, 'loss/train': 1.8546603918075562} -08/30/2021 14:58:34 - INFO - __main__ - Step 10146: {'lr': 0.0004962727682326873, 'samples': 1948032, 'steps': 10145, 'loss/train': 2.2555429935455322} -08/30/2021 14:58:35 - INFO - __main__ - Step 10147: {'lr': 0.0004962718552385843, 'samples': 1948224, 'steps': 10146, 'loss/train': 2.1229538917541504} -08/30/2021 14:58:35 - INFO - __main__ - Step 10148: {'lr': 0.000496270942133515, 'samples': 1948416, 'steps': 10147, 'loss/train': 2.273806095123291} -08/30/2021 14:58:35 - INFO - __main__ - Step 10149: {'lr': 0.0004962700289174798, 'samples': 1948608, 'steps': 10148, 'loss/train': 1.9142259359359741} -08/30/2021 14:58:37 - INFO - __main__ - Step 10150: {'lr': 0.0004962691155904791, 'samples': 1948800, 'steps': 10149, 'loss/train': 1.9062116146087646} -08/30/2021 14:58:38 - INFO - __main__ - Step 10151: {'lr': 0.0004962682021525134, 'samples': 1948992, 'steps': 10150, 'loss/train': 1.9266009330749512} -08/30/2021 14:58:38 - INFO - __main__ - Step 10152: {'lr': 0.000496267288603583, 'samples': 1949184, 'steps': 10151, 'loss/train': 1.9904824495315552} -08/30/2021 14:58:38 - INFO - __main__ - Step 10153: {'lr': 0.0004962663749436883, 'samples': 1949376, 'steps': 10152, 'loss/train': 1.9961860179901123} -08/30/2021 14:58:39 - INFO - __main__ - Step 10154: {'lr': 0.0004962654611728299, 'samples': 1949568, 'steps': 10153, 'loss/train': 2.2490758895874023} -08/30/2021 14:58:41 - INFO - __main__ - Step 10155: {'lr': 0.000496264547291008, 'samples': 1949760, 'steps': 10154, 'loss/train': 0.6669377088546753} -08/30/2021 14:58:42 - INFO - __main__ - Step 10156: {'lr': 0.0004962636332982232, 'samples': 1949952, 'steps': 10155, 'loss/train': 1.332995057106018} -08/30/2021 14:58:42 - INFO - __main__ - Step 10157: {'lr': 0.0004962627191944756, 'samples': 1950144, 'steps': 10156, 'loss/train': 1.3511934280395508} -08/30/2021 14:58:42 - INFO - __main__ - Step 10158: {'lr': 0.000496261804979766, 'samples': 1950336, 'steps': 10157, 'loss/train': 1.125753402709961} -08/30/2021 14:58:43 - INFO - __main__ - Step 10159: {'lr': 0.0004962608906540946, 'samples': 1950528, 'steps': 10158, 'loss/train': 1.8245738744735718} -08/30/2021 14:58:43 - INFO - __main__ - Step 10160: {'lr': 0.0004962599762174618, 'samples': 1950720, 'steps': 10159, 'loss/train': 2.2537107467651367} -08/30/2021 14:58:45 - INFO - __main__ - Step 10161: {'lr': 0.0004962590616698681, 'samples': 1950912, 'steps': 10160, 'loss/train': 1.7657158374786377} -08/30/2021 14:58:45 - INFO - __main__ - Step 10162: {'lr': 0.0004962581470113138, 'samples': 1951104, 'steps': 10161, 'loss/train': 1.1433213949203491} -08/30/2021 14:58:45 - INFO - __main__ - Step 10163: {'lr': 0.0004962572322417994, 'samples': 1951296, 'steps': 10162, 'loss/train': 1.5990948677062988} -08/30/2021 14:58:46 - INFO - __main__ - Step 10164: {'lr': 0.0004962563173613254, 'samples': 1951488, 'steps': 10163, 'loss/train': 1.731681227684021} -08/30/2021 14:58:46 - INFO - __main__ - Step 10165: {'lr': 0.000496255402369892, 'samples': 1951680, 'steps': 10164, 'loss/train': 1.8948761224746704} -08/30/2021 14:58:48 - INFO - __main__ - Step 10166: {'lr': 0.0004962544872674997, 'samples': 1951872, 'steps': 10165, 'loss/train': 1.9159555435180664} -08/30/2021 14:58:48 - INFO - __main__ - Step 10167: {'lr': 0.000496253572054149, 'samples': 1952064, 'steps': 10166, 'loss/train': 1.0995639562606812} -08/30/2021 14:58:48 - INFO - __main__ - Step 10168: {'lr': 0.0004962526567298402, 'samples': 1952256, 'steps': 10167, 'loss/train': 1.8773449659347534} -08/30/2021 14:58:49 - INFO - __main__ - Step 10169: {'lr': 0.0004962517412945738, 'samples': 1952448, 'steps': 10168, 'loss/train': 2.614912986755371} -08/30/2021 14:58:49 - INFO - __main__ - Step 10170: {'lr': 0.00049625082574835, 'samples': 1952640, 'steps': 10169, 'loss/train': 1.9321526288986206} -08/30/2021 14:58:51 - INFO - __main__ - Step 10171: {'lr': 0.0004962499100911696, 'samples': 1952832, 'steps': 10170, 'loss/train': 2.2004430294036865} -08/30/2021 14:58:51 - INFO - __main__ - Step 10172: {'lr': 0.0004962489943230326, 'samples': 1953024, 'steps': 10171, 'loss/train': 2.0654022693634033} -08/30/2021 14:58:52 - INFO - __main__ - Step 10173: {'lr': 0.0004962480784439397, 'samples': 1953216, 'steps': 10172, 'loss/train': 0.2123950868844986} -08/30/2021 14:58:52 - INFO - __main__ - Step 10174: {'lr': 0.0004962471624538913, 'samples': 1953408, 'steps': 10173, 'loss/train': 1.478588342666626} -08/30/2021 14:58:52 - INFO - __main__ - Step 10175: {'lr': 0.0004962462463528875, 'samples': 1953600, 'steps': 10174, 'loss/train': 2.060807704925537} -08/30/2021 14:58:53 - INFO - __main__ - Step 10176: {'lr': 0.0004962453301409291, 'samples': 1953792, 'steps': 10175, 'loss/train': 1.8203874826431274} -08/30/2021 14:58:54 - INFO - __main__ - Step 10177: {'lr': 0.0004962444138180164, 'samples': 1953984, 'steps': 10176, 'loss/train': 2.0431928634643555} -08/30/2021 14:58:55 - INFO - __main__ - Step 10178: {'lr': 0.0004962434973841497, 'samples': 1954176, 'steps': 10177, 'loss/train': 1.9818137884140015} -08/30/2021 14:58:55 - INFO - __main__ - Step 10179: {'lr': 0.0004962425808393295, 'samples': 1954368, 'steps': 10178, 'loss/train': 1.7735495567321777} -08/30/2021 14:58:55 - INFO - __main__ - Step 10180: {'lr': 0.000496241664183556, 'samples': 1954560, 'steps': 10179, 'loss/train': 1.8552825450897217} -08/30/2021 14:58:56 - INFO - __main__ - Step 10181: {'lr': 0.0004962407474168301, 'samples': 1954752, 'steps': 10180, 'loss/train': 1.430060863494873} -08/30/2021 14:58:58 - INFO - __main__ - Step 10182: {'lr': 0.0004962398305391518, 'samples': 1954944, 'steps': 10181, 'loss/train': 2.282010555267334} -08/30/2021 14:58:58 - INFO - __main__ - Step 10183: {'lr': 0.0004962389135505217, 'samples': 1955136, 'steps': 10182, 'loss/train': 1.7378416061401367} -08/30/2021 14:58:58 - INFO - __main__ - Step 10184: {'lr': 0.00049623799645094, 'samples': 1955328, 'steps': 10183, 'loss/train': 1.8816922903060913} -08/30/2021 14:58:59 - INFO - __main__ - Step 10185: {'lr': 0.0004962370792404073, 'samples': 1955520, 'steps': 10184, 'loss/train': 1.8497915267944336} -08/30/2021 14:58:59 - INFO - __main__ - Step 10186: {'lr': 0.000496236161918924, 'samples': 1955712, 'steps': 10185, 'loss/train': 1.3993608951568604} -08/30/2021 14:59:01 - INFO - __main__ - Step 10187: {'lr': 0.0004962352444864904, 'samples': 1955904, 'steps': 10186, 'loss/train': 1.2489163875579834} -08/30/2021 14:59:01 - INFO - __main__ - Step 10188: {'lr': 0.0004962343269431072, 'samples': 1956096, 'steps': 10187, 'loss/train': 2.148186683654785} -08/30/2021 14:59:01 - INFO - __main__ - Step 10189: {'lr': 0.0004962334092887744, 'samples': 1956288, 'steps': 10188, 'loss/train': 1.3455642461776733} -08/30/2021 14:59:02 - INFO - __main__ - Step 10190: {'lr': 0.0004962324915234928, 'samples': 1956480, 'steps': 10189, 'loss/train': 1.4936561584472656} -08/30/2021 14:59:02 - INFO - __main__ - Step 10191: {'lr': 0.0004962315736472626, 'samples': 1956672, 'steps': 10190, 'loss/train': 1.494005560874939} -08/30/2021 14:59:04 - INFO - __main__ - Step 10192: {'lr': 0.0004962306556600842, 'samples': 1956864, 'steps': 10191, 'loss/train': 1.1978964805603027} -08/30/2021 14:59:04 - INFO - __main__ - Step 10193: {'lr': 0.0004962297375619581, 'samples': 1957056, 'steps': 10192, 'loss/train': 2.197383403778076} -08/30/2021 14:59:04 - INFO - __main__ - Step 10194: {'lr': 0.0004962288193528846, 'samples': 1957248, 'steps': 10193, 'loss/train': 1.8029744625091553} -08/30/2021 14:59:05 - INFO - __main__ - Step 10195: {'lr': 0.0004962279010328642, 'samples': 1957440, 'steps': 10194, 'loss/train': 1.7458617687225342} -08/30/2021 14:59:05 - INFO - __main__ - Step 10196: {'lr': 0.0004962269826018974, 'samples': 1957632, 'steps': 10195, 'loss/train': 2.464775562286377} -08/30/2021 14:59:06 - INFO - __main__ - Step 10197: {'lr': 0.0004962260640599845, 'samples': 1957824, 'steps': 10196, 'loss/train': 1.7174395322799683} -08/30/2021 14:59:07 - INFO - __main__ - Step 10198: {'lr': 0.0004962251454071259, 'samples': 1958016, 'steps': 10197, 'loss/train': 1.703747272491455} -08/30/2021 14:59:07 - INFO - __main__ - Step 10199: {'lr': 0.0004962242266433221, 'samples': 1958208, 'steps': 10198, 'loss/train': 1.5412509441375732} -08/30/2021 14:59:08 - INFO - __main__ - Step 10200: {'lr': 0.0004962233077685734, 'samples': 1958400, 'steps': 10199, 'loss/train': 2.7553746700286865} -08/30/2021 14:59:08 - INFO - __main__ - Step 10201: {'lr': 0.0004962223887828803, 'samples': 1958592, 'steps': 10200, 'loss/train': 1.7935335636138916} -08/30/2021 14:59:08 - INFO - __main__ - Step 10202: {'lr': 0.0004962214696862432, 'samples': 1958784, 'steps': 10201, 'loss/train': 2.0126538276672363} -08/30/2021 14:59:10 - INFO - __main__ - Step 10203: {'lr': 0.0004962205504786626, 'samples': 1958976, 'steps': 10202, 'loss/train': 1.3321278095245361} -08/30/2021 14:59:10 - INFO - __main__ - Step 10204: {'lr': 0.0004962196311601386, 'samples': 1959168, 'steps': 10203, 'loss/train': 1.842808485031128} -08/30/2021 14:59:11 - INFO - __main__ - Step 10205: {'lr': 0.000496218711730672, 'samples': 1959360, 'steps': 10204, 'loss/train': 1.4248859882354736} -08/30/2021 14:59:11 - INFO - __main__ - Step 10206: {'lr': 0.000496217792190263, 'samples': 1959552, 'steps': 10205, 'loss/train': 1.6323902606964111} -08/30/2021 14:59:11 - INFO - __main__ - Step 10207: {'lr': 0.0004962168725389121, 'samples': 1959744, 'steps': 10206, 'loss/train': 2.1328465938568115} -08/30/2021 14:59:13 - INFO - __main__ - Step 10208: {'lr': 0.0004962159527766196, 'samples': 1959936, 'steps': 10207, 'loss/train': 1.3635426759719849} -08/30/2021 14:59:13 - INFO - __main__ - Step 10209: {'lr': 0.000496215032903386, 'samples': 1960128, 'steps': 10208, 'loss/train': 2.454707622528076} -08/30/2021 14:59:14 - INFO - __main__ - Step 10210: {'lr': 0.0004962141129192118, 'samples': 1960320, 'steps': 10209, 'loss/train': 2.0520107746124268} -08/30/2021 14:59:14 - INFO - __main__ - Step 10211: {'lr': 0.0004962131928240972, 'samples': 1960512, 'steps': 10210, 'loss/train': 1.4252179861068726} -08/30/2021 14:59:14 - INFO - __main__ - Step 10212: {'lr': 0.0004962122726180428, 'samples': 1960704, 'steps': 10211, 'loss/train': 2.0074338912963867} -08/30/2021 14:59:16 - INFO - __main__ - Step 10213: {'lr': 0.000496211352301049, 'samples': 1960896, 'steps': 10212, 'loss/train': 1.5113064050674438} -08/30/2021 14:59:17 - INFO - __main__ - Step 10214: {'lr': 0.0004962104318731161, 'samples': 1961088, 'steps': 10213, 'loss/train': 1.8424110412597656} -08/30/2021 14:59:17 - INFO - __main__ - Step 10215: {'lr': 0.0004962095113342445, 'samples': 1961280, 'steps': 10214, 'loss/train': 1.7881007194519043} -08/30/2021 14:59:17 - INFO - __main__ - Step 10216: {'lr': 0.0004962085906844348, 'samples': 1961472, 'steps': 10215, 'loss/train': 1.9657223224639893} -08/30/2021 14:59:18 - INFO - __main__ - Step 10217: {'lr': 0.0004962076699236873, 'samples': 1961664, 'steps': 10216, 'loss/train': 1.7973517179489136} -08/30/2021 14:59:19 - INFO - __main__ - Step 10218: {'lr': 0.0004962067490520024, 'samples': 1961856, 'steps': 10217, 'loss/train': 1.897365689277649} -08/30/2021 14:59:20 - INFO - __main__ - Step 10219: {'lr': 0.0004962058280693805, 'samples': 1962048, 'steps': 10218, 'loss/train': 2.0293540954589844} -08/30/2021 14:59:20 - INFO - __main__ - Step 10220: {'lr': 0.0004962049069758221, 'samples': 1962240, 'steps': 10219, 'loss/train': 1.0238850116729736} -08/30/2021 14:59:20 - INFO - __main__ - Step 10221: {'lr': 0.0004962039857713276, 'samples': 1962432, 'steps': 10220, 'loss/train': 1.2621748447418213} -08/30/2021 14:59:21 - INFO - __main__ - Step 10222: {'lr': 0.0004962030644558974, 'samples': 1962624, 'steps': 10221, 'loss/train': 1.9189428091049194} -08/30/2021 14:59:22 - INFO - __main__ - Step 10223: {'lr': 0.0004962021430295319, 'samples': 1962816, 'steps': 10222, 'loss/train': 1.4690589904785156} -08/30/2021 14:59:22 - INFO - __main__ - Step 10224: {'lr': 0.0004962012214922314, 'samples': 1963008, 'steps': 10223, 'loss/train': 1.8067803382873535} -08/30/2021 14:59:23 - INFO - __main__ - Step 10225: {'lr': 0.0004962002998439966, 'samples': 1963200, 'steps': 10224, 'loss/train': 2.0416476726531982} -08/30/2021 14:59:23 - INFO - __main__ - Step 10226: {'lr': 0.0004961993780848276, 'samples': 1963392, 'steps': 10225, 'loss/train': 2.1884548664093018} -08/30/2021 14:59:24 - INFO - __main__ - Step 10227: {'lr': 0.000496198456214725, 'samples': 1963584, 'steps': 10226, 'loss/train': 1.9522669315338135} -08/30/2021 14:59:24 - INFO - __main__ - Step 10228: {'lr': 0.0004961975342336891, 'samples': 1963776, 'steps': 10227, 'loss/train': 1.6798677444458008} -08/30/2021 14:59:26 - INFO - __main__ - Step 10229: {'lr': 0.0004961966121417204, 'samples': 1963968, 'steps': 10228, 'loss/train': 1.9442551136016846} -08/30/2021 14:59:26 - INFO - __main__ - Step 10230: {'lr': 0.0004961956899388195, 'samples': 1964160, 'steps': 10229, 'loss/train': 2.0396888256073} -08/30/2021 14:59:26 - INFO - __main__ - Step 10231: {'lr': 0.0004961947676249864, 'samples': 1964352, 'steps': 10230, 'loss/train': 1.2092286348342896} -08/30/2021 14:59:27 - INFO - __main__ - Step 10232: {'lr': 0.0004961938452002218, 'samples': 1964544, 'steps': 10231, 'loss/train': 1.9337029457092285} -08/30/2021 14:59:27 - INFO - __main__ - Step 10233: {'lr': 0.0004961929226645261, 'samples': 1964736, 'steps': 10232, 'loss/train': 1.5241643190383911} -08/30/2021 14:59:29 - INFO - __main__ - Step 10234: {'lr': 0.0004961920000178996, 'samples': 1964928, 'steps': 10233, 'loss/train': 0.17785747349262238} -08/30/2021 14:59:30 - INFO - __main__ - Step 10235: {'lr': 0.0004961910772603429, 'samples': 1965120, 'steps': 10234, 'loss/train': 1.5663559436798096} -08/30/2021 14:59:30 - INFO - __main__ - Step 10236: {'lr': 0.0004961901543918563, 'samples': 1965312, 'steps': 10235, 'loss/train': 1.8163416385650635} -08/30/2021 14:59:30 - INFO - __main__ - Step 10237: {'lr': 0.0004961892314124401, 'samples': 1965504, 'steps': 10236, 'loss/train': 0.13995641469955444} -08/30/2021 14:59:31 - INFO - __main__ - Step 10238: {'lr': 0.0004961883083220948, 'samples': 1965696, 'steps': 10237, 'loss/train': 1.5841563940048218} -08/30/2021 14:59:32 - INFO - __main__ - Step 10239: {'lr': 0.0004961873851208209, 'samples': 1965888, 'steps': 10238, 'loss/train': 1.8104028701782227} -08/30/2021 14:59:33 - INFO - __main__ - Step 10240: {'lr': 0.0004961864618086188, 'samples': 1966080, 'steps': 10239, 'loss/train': 1.8419852256774902} -08/30/2021 14:59:33 - INFO - __main__ - Step 10241: {'lr': 0.0004961855383854889, 'samples': 1966272, 'steps': 10240, 'loss/train': 1.3559045791625977} -08/30/2021 14:59:33 - INFO - __main__ - Step 10242: {'lr': 0.0004961846148514315, 'samples': 1966464, 'steps': 10241, 'loss/train': 1.6722393035888672} -08/30/2021 14:59:34 - INFO - __main__ - Step 10243: {'lr': 0.0004961836912064472, 'samples': 1966656, 'steps': 10242, 'loss/train': 2.03438401222229} -08/30/2021 14:59:34 - INFO - __main__ - Step 10244: {'lr': 0.0004961827674505363, 'samples': 1966848, 'steps': 10243, 'loss/train': 1.5678279399871826} -08/30/2021 14:59:36 - INFO - __main__ - Step 10245: {'lr': 0.0004961818435836993, 'samples': 1967040, 'steps': 10244, 'loss/train': 1.594085693359375} -08/30/2021 14:59:36 - INFO - __main__ - Step 10246: {'lr': 0.0004961809196059365, 'samples': 1967232, 'steps': 10245, 'loss/train': 1.276477336883545} -08/30/2021 14:59:37 - INFO - __main__ - Step 10247: {'lr': 0.0004961799955172483, 'samples': 1967424, 'steps': 10246, 'loss/train': 1.8070474863052368} -08/30/2021 14:59:37 - INFO - __main__ - Step 10248: {'lr': 0.0004961790713176353, 'samples': 1967616, 'steps': 10247, 'loss/train': 2.1185221672058105} -08/30/2021 14:59:37 - INFO - __main__ - Step 10249: {'lr': 0.0004961781470070978, 'samples': 1967808, 'steps': 10248, 'loss/train': 1.6459875106811523} -08/30/2021 14:59:39 - INFO - __main__ - Step 10250: {'lr': 0.0004961772225856362, 'samples': 1968000, 'steps': 10249, 'loss/train': 2.2528064250946045} -08/30/2021 14:59:39 - INFO - __main__ - Step 10251: {'lr': 0.0004961762980532509, 'samples': 1968192, 'steps': 10250, 'loss/train': 1.6697717905044556} -08/30/2021 14:59:40 - INFO - __main__ - Step 10252: {'lr': 0.0004961753734099425, 'samples': 1968384, 'steps': 10251, 'loss/train': 1.2199863195419312} -08/30/2021 14:59:40 - INFO - __main__ - Step 10253: {'lr': 0.0004961744486557112, 'samples': 1968576, 'steps': 10252, 'loss/train': 1.805417776107788} -08/30/2021 14:59:40 - INFO - __main__ - Step 10254: {'lr': 0.0004961735237905574, 'samples': 1968768, 'steps': 10253, 'loss/train': 1.678693175315857} -08/30/2021 14:59:42 - INFO - __main__ - Step 10255: {'lr': 0.0004961725988144816, 'samples': 1968960, 'steps': 10254, 'loss/train': 1.8911503553390503} -08/30/2021 14:59:42 - INFO - __main__ - Step 10256: {'lr': 0.0004961716737274844, 'samples': 1969152, 'steps': 10255, 'loss/train': 2.1664628982543945} -08/30/2021 14:59:43 - INFO - __main__ - Step 10257: {'lr': 0.0004961707485295659, 'samples': 1969344, 'steps': 10256, 'loss/train': 1.5524919033050537} -08/30/2021 14:59:43 - INFO - __main__ - Step 10258: {'lr': 0.0004961698232207268, 'samples': 1969536, 'steps': 10257, 'loss/train': 2.3951942920684814} -08/30/2021 14:59:44 - INFO - __main__ - Step 10259: {'lr': 0.0004961688978009672, 'samples': 1969728, 'steps': 10258, 'loss/train': 1.9480458498001099} -08/30/2021 14:59:44 - INFO - __main__ - Step 10260: {'lr': 0.0004961679722702879, 'samples': 1969920, 'steps': 10259, 'loss/train': 1.864726185798645} -08/30/2021 14:59:45 - INFO - __main__ - Step 10261: {'lr': 0.0004961670466286889, 'samples': 1970112, 'steps': 10260, 'loss/train': 1.902874231338501} -08/30/2021 14:59:46 - INFO - __main__ - Step 10262: {'lr': 0.000496166120876171, 'samples': 1970304, 'steps': 10261, 'loss/train': 1.6221438646316528} -08/30/2021 14:59:46 - INFO - __main__ - Step 10263: {'lr': 0.0004961651950127343, 'samples': 1970496, 'steps': 10262, 'loss/train': 1.7727737426757812} -08/30/2021 14:59:46 - INFO - __main__ - Step 10264: {'lr': 0.0004961642690383794, 'samples': 1970688, 'steps': 10263, 'loss/train': 2.0062689781188965} -08/30/2021 14:59:47 - INFO - __main__ - Step 10265: {'lr': 0.0004961633429531068, 'samples': 1970880, 'steps': 10264, 'loss/train': 1.6899843215942383} -08/30/2021 14:59:48 - INFO - __main__ - Step 10266: {'lr': 0.0004961624167569166, 'samples': 1971072, 'steps': 10265, 'loss/train': 1.6278786659240723} -08/30/2021 14:59:49 - INFO - __main__ - Step 10267: {'lr': 0.0004961614904498095, 'samples': 1971264, 'steps': 10266, 'loss/train': 1.3537687063217163} -08/30/2021 14:59:49 - INFO - __main__ - Step 10268: {'lr': 0.0004961605640317858, 'samples': 1971456, 'steps': 10267, 'loss/train': 2.5009100437164307} -08/30/2021 14:59:50 - INFO - __main__ - Step 10269: {'lr': 0.0004961596375028461, 'samples': 1971648, 'steps': 10268, 'loss/train': 1.6418747901916504} -08/30/2021 14:59:50 - INFO - __main__ - Step 10270: {'lr': 0.0004961587108629906, 'samples': 1971840, 'steps': 10269, 'loss/train': 2.304105758666992} -08/30/2021 14:59:51 - INFO - __main__ - Step 10271: {'lr': 0.0004961577841122197, 'samples': 1972032, 'steps': 10270, 'loss/train': 1.972224235534668} -08/30/2021 14:59:52 - INFO - __main__ - Step 10272: {'lr': 0.000496156857250534, 'samples': 1972224, 'steps': 10271, 'loss/train': 1.9679875373840332} -08/30/2021 14:59:52 - INFO - __main__ - Step 10273: {'lr': 0.0004961559302779338, 'samples': 1972416, 'steps': 10272, 'loss/train': 1.7676537036895752} -08/30/2021 14:59:53 - INFO - __main__ - Step 10274: {'lr': 0.0004961550031944194, 'samples': 1972608, 'steps': 10273, 'loss/train': 1.8500806093215942} -08/30/2021 14:59:53 - INFO - __main__ - Step 10275: {'lr': 0.0004961540759999914, 'samples': 1972800, 'steps': 10274, 'loss/train': 1.77291738986969} -08/30/2021 14:59:55 - INFO - __main__ - Step 10276: {'lr': 0.0004961531486946502, 'samples': 1972992, 'steps': 10275, 'loss/train': 1.9960471391677856} -08/30/2021 14:59:55 - INFO - __main__ - Step 10277: {'lr': 0.0004961522212783962, 'samples': 1973184, 'steps': 10276, 'loss/train': 1.7660590410232544} -08/30/2021 14:59:56 - INFO - __main__ - Step 10278: {'lr': 0.00049615129375123, 'samples': 1973376, 'steps': 10277, 'loss/train': 1.6322904825210571} -08/30/2021 14:59:56 - INFO - __main__ - Step 10279: {'lr': 0.0004961503661131515, 'samples': 1973568, 'steps': 10278, 'loss/train': 1.6495939493179321} -08/30/2021 14:59:56 - INFO - __main__ - Step 10280: {'lr': 0.0004961494383641616, 'samples': 1973760, 'steps': 10279, 'loss/train': 0.3866509795188904} -08/30/2021 14:59:57 - INFO - __main__ - Step 10281: {'lr': 0.0004961485105042606, 'samples': 1973952, 'steps': 10280, 'loss/train': 0.7199074029922485} -08/30/2021 14:59:59 - INFO - __main__ - Step 10282: {'lr': 0.0004961475825334488, 'samples': 1974144, 'steps': 10281, 'loss/train': 1.5392190217971802} -08/30/2021 14:59:59 - INFO - __main__ - Step 10283: {'lr': 0.0004961466544517267, 'samples': 1974336, 'steps': 10282, 'loss/train': 2.1678366661071777} -08/30/2021 15:00:00 - INFO - __main__ - Step 10284: {'lr': 0.0004961457262590948, 'samples': 1974528, 'steps': 10283, 'loss/train': 1.7925416231155396} -08/30/2021 15:00:00 - INFO - __main__ - Step 10285: {'lr': 0.0004961447979555533, 'samples': 1974720, 'steps': 10284, 'loss/train': 2.2487778663635254} -08/30/2021 15:00:00 - INFO - __main__ - Step 10286: {'lr': 0.000496143869541103, 'samples': 1974912, 'steps': 10285, 'loss/train': 1.3042547702789307} -08/30/2021 15:00:01 - INFO - __main__ - Step 10287: {'lr': 0.0004961429410157437, 'samples': 1975104, 'steps': 10286, 'loss/train': 1.5594148635864258} -08/30/2021 15:00:02 - INFO - __main__ - Step 10288: {'lr': 0.0004961420123794764, 'samples': 1975296, 'steps': 10287, 'loss/train': 2.6012120246887207} -08/30/2021 15:00:03 - INFO - __main__ - Step 10289: {'lr': 0.0004961410836323014, 'samples': 1975488, 'steps': 10288, 'loss/train': 2.121105670928955} -08/30/2021 15:00:03 - INFO - __main__ - Step 10290: {'lr': 0.0004961401547742189, 'samples': 1975680, 'steps': 10289, 'loss/train': 2.434382915496826} -08/30/2021 15:00:03 - INFO - __main__ - Step 10291: {'lr': 0.0004961392258052294, 'samples': 1975872, 'steps': 10290, 'loss/train': 1.2272709608078003} -08/30/2021 15:00:04 - INFO - __main__ - Step 10292: {'lr': 0.0004961382967253335, 'samples': 1976064, 'steps': 10291, 'loss/train': 2.383918285369873} -08/30/2021 15:00:06 - INFO - __main__ - Step 10293: {'lr': 0.0004961373675345315, 'samples': 1976256, 'steps': 10292, 'loss/train': 2.726109266281128} -08/30/2021 15:00:06 - INFO - __main__ - Step 10294: {'lr': 0.0004961364382328236, 'samples': 1976448, 'steps': 10293, 'loss/train': 1.2619708776474} -08/30/2021 15:00:06 - INFO - __main__ - Step 10295: {'lr': 0.0004961355088202106, 'samples': 1976640, 'steps': 10294, 'loss/train': 2.0212178230285645} -08/30/2021 15:00:07 - INFO - __main__ - Step 10296: {'lr': 0.0004961345792966926, 'samples': 1976832, 'steps': 10295, 'loss/train': 2.1003832817077637} -08/30/2021 15:00:07 - INFO - __main__ - Step 10297: {'lr': 0.0004961336496622702, 'samples': 1977024, 'steps': 10296, 'loss/train': 1.3134616613388062} -08/30/2021 15:00:09 - INFO - __main__ - Step 10298: {'lr': 0.0004961327199169438, 'samples': 1977216, 'steps': 10297, 'loss/train': 1.7765445709228516} -08/30/2021 15:00:09 - INFO - __main__ - Step 10299: {'lr': 0.0004961317900607138, 'samples': 1977408, 'steps': 10298, 'loss/train': 2.0218944549560547} -08/30/2021 15:00:09 - INFO - __main__ - Step 10300: {'lr': 0.0004961308600935807, 'samples': 1977600, 'steps': 10299, 'loss/train': 0.15296944975852966} -08/30/2021 15:00:10 - INFO - __main__ - Step 10301: {'lr': 0.0004961299300155446, 'samples': 1977792, 'steps': 10300, 'loss/train': 1.8994289636611938} -08/30/2021 15:00:10 - INFO - __main__ - Step 10302: {'lr': 0.0004961289998266064, 'samples': 1977984, 'steps': 10301, 'loss/train': 1.953522801399231} -08/30/2021 15:00:12 - INFO - __main__ - Step 10303: {'lr': 0.0004961280695267662, 'samples': 1978176, 'steps': 10302, 'loss/train': 1.8934563398361206} -08/30/2021 15:00:12 - INFO - __main__ - Step 10304: {'lr': 0.0004961271391160243, 'samples': 1978368, 'steps': 10303, 'loss/train': 1.4899977445602417} -08/30/2021 15:00:12 - INFO - __main__ - Step 10305: {'lr': 0.0004961262085943815, 'samples': 1978560, 'steps': 10304, 'loss/train': 2.116154193878174} -08/30/2021 15:00:13 - INFO - __main__ - Step 10306: {'lr': 0.000496125277961838, 'samples': 1978752, 'steps': 10305, 'loss/train': 2.0883262157440186} -08/30/2021 15:00:13 - INFO - __main__ - Step 10307: {'lr': 0.0004961243472183942, 'samples': 1978944, 'steps': 10306, 'loss/train': 1.5113731622695923} -08/30/2021 15:00:15 - INFO - __main__ - Step 10308: {'lr': 0.0004961234163640507, 'samples': 1979136, 'steps': 10307, 'loss/train': 2.18200421333313} -08/30/2021 15:00:15 - INFO - __main__ - Step 10309: {'lr': 0.0004961224853988076, 'samples': 1979328, 'steps': 10308, 'loss/train': 1.2948338985443115} -08/30/2021 15:00:16 - INFO - __main__ - Step 10310: {'lr': 0.0004961215543226657, 'samples': 1979520, 'steps': 10309, 'loss/train': 1.7266885042190552} -08/30/2021 15:00:16 - INFO - __main__ - Step 10311: {'lr': 0.0004961206231356251, 'samples': 1979712, 'steps': 10310, 'loss/train': 2.103034257888794} -08/30/2021 15:00:16 - INFO - __main__ - Step 10312: {'lr': 0.0004961196918376864, 'samples': 1979904, 'steps': 10311, 'loss/train': 0.7564037442207336} -08/30/2021 15:00:18 - INFO - __main__ - Step 10313: {'lr': 0.0004961187604288498, 'samples': 1980096, 'steps': 10312, 'loss/train': 1.8156440258026123} -08/30/2021 15:00:18 - INFO - __main__ - Step 10314: {'lr': 0.0004961178289091161, 'samples': 1980288, 'steps': 10313, 'loss/train': 1.8133211135864258} -08/30/2021 15:00:18 - INFO - __main__ - Step 10315: {'lr': 0.0004961168972784855, 'samples': 1980480, 'steps': 10314, 'loss/train': 1.6111654043197632} -08/30/2021 15:00:19 - INFO - __main__ - Step 10316: {'lr': 0.0004961159655369582, 'samples': 1980672, 'steps': 10315, 'loss/train': 1.7434855699539185} -08/30/2021 15:00:19 - INFO - __main__ - Step 10317: {'lr': 0.0004961150336845351, 'samples': 1980864, 'steps': 10316, 'loss/train': 1.8589189052581787} -08/30/2021 15:00:21 - INFO - __main__ - Step 10318: {'lr': 0.0004961141017212162, 'samples': 1981056, 'steps': 10317, 'loss/train': 1.2972108125686646} -08/30/2021 15:00:21 - INFO - __main__ - Step 10319: {'lr': 0.0004961131696470021, 'samples': 1981248, 'steps': 10318, 'loss/train': 0.16804327070713043} -08/30/2021 15:00:22 - INFO - __main__ - Step 10320: {'lr': 0.0004961122374618933, 'samples': 1981440, 'steps': 10319, 'loss/train': 1.0443837642669678} -08/30/2021 15:00:22 - INFO - __main__ - Step 10321: {'lr': 0.00049611130516589, 'samples': 1981632, 'steps': 10320, 'loss/train': 2.0743186473846436} -08/30/2021 15:00:22 - INFO - __main__ - Step 10322: {'lr': 0.0004961103727589929, 'samples': 1981824, 'steps': 10321, 'loss/train': 2.1763031482696533} -08/30/2021 15:00:23 - INFO - __main__ - Step 10323: {'lr': 0.0004961094402412021, 'samples': 1982016, 'steps': 10322, 'loss/train': 1.3292943239212036} -08/30/2021 15:00:24 - INFO - __main__ - Step 10324: {'lr': 0.0004961085076125182, 'samples': 1982208, 'steps': 10323, 'loss/train': 2.464029550552368} -08/30/2021 15:00:25 - INFO - __main__ - Step 10325: {'lr': 0.0004961075748729418, 'samples': 1982400, 'steps': 10324, 'loss/train': 1.8568816184997559} -08/30/2021 15:00:25 - INFO - __main__ - Step 10326: {'lr': 0.0004961066420224729, 'samples': 1982592, 'steps': 10325, 'loss/train': 1.8566415309906006} -08/30/2021 15:00:26 - INFO - __main__ - Step 10327: {'lr': 0.0004961057090611123, 'samples': 1982784, 'steps': 10326, 'loss/train': 1.667598843574524} -08/30/2021 15:00:26 - INFO - __main__ - Step 10328: {'lr': 0.0004961047759888601, 'samples': 1982976, 'steps': 10327, 'loss/train': 1.8366225957870483} -08/30/2021 15:00:27 - INFO - __main__ - Step 10329: {'lr': 0.000496103842805717, 'samples': 1983168, 'steps': 10328, 'loss/train': 0.7898144125938416} -08/30/2021 15:00:28 - INFO - __main__ - Step 10330: {'lr': 0.0004961029095116833, 'samples': 1983360, 'steps': 10329, 'loss/train': 1.4821635484695435} -08/30/2021 15:00:28 - INFO - __main__ - Step 10331: {'lr': 0.0004961019761067594, 'samples': 1983552, 'steps': 10330, 'loss/train': 1.6974904537200928} -08/30/2021 15:00:29 - INFO - __main__ - Step 10332: {'lr': 0.0004961010425909458, 'samples': 1983744, 'steps': 10331, 'loss/train': 1.7204148769378662} -08/30/2021 15:00:29 - INFO - __main__ - Step 10333: {'lr': 0.0004961001089642428, 'samples': 1983936, 'steps': 10332, 'loss/train': 1.5524461269378662} -08/30/2021 15:00:30 - INFO - __main__ - Step 10334: {'lr': 0.000496099175226651, 'samples': 1984128, 'steps': 10333, 'loss/train': 2.2729852199554443} -08/30/2021 15:00:31 - INFO - __main__ - Step 10335: {'lr': 0.0004960982413781705, 'samples': 1984320, 'steps': 10334, 'loss/train': 2.2635409832000732} -08/30/2021 15:00:31 - INFO - __main__ - Step 10336: {'lr': 0.0004960973074188021, 'samples': 1984512, 'steps': 10335, 'loss/train': 2.2586538791656494} -08/30/2021 15:00:32 - INFO - __main__ - Step 10337: {'lr': 0.000496096373348546, 'samples': 1984704, 'steps': 10336, 'loss/train': 1.6437163352966309} -08/30/2021 15:00:32 - INFO - __main__ - Step 10338: {'lr': 0.0004960954391674026, 'samples': 1984896, 'steps': 10337, 'loss/train': 1.271201491355896} -08/30/2021 15:00:34 - INFO - __main__ - Step 10339: {'lr': 0.0004960945048753725, 'samples': 1985088, 'steps': 10338, 'loss/train': 1.8340805768966675} -08/30/2021 15:00:35 - INFO - __main__ - Step 10340: {'lr': 0.000496093570472456, 'samples': 1985280, 'steps': 10339, 'loss/train': 1.3790926933288574} -08/30/2021 15:00:35 - INFO - __main__ - Step 10341: {'lr': 0.0004960926359586535, 'samples': 1985472, 'steps': 10340, 'loss/train': 1.9897993803024292} -08/30/2021 15:00:35 - INFO - __main__ - Step 10342: {'lr': 0.0004960917013339656, 'samples': 1985664, 'steps': 10341, 'loss/train': 2.4562790393829346} -08/30/2021 15:00:36 - INFO - __main__ - Step 10343: {'lr': 0.0004960907665983923, 'samples': 1985856, 'steps': 10342, 'loss/train': 0.17296990752220154} -08/30/2021 15:00:36 - INFO - __main__ - Step 10344: {'lr': 0.0004960898317519345, 'samples': 1986048, 'steps': 10343, 'loss/train': 1.7110241651535034} -08/30/2021 15:00:38 - INFO - __main__ - Step 10345: {'lr': 0.0004960888967945924, 'samples': 1986240, 'steps': 10344, 'loss/train': 2.053333282470703} -08/30/2021 15:00:38 - INFO - __main__ - Step 10346: {'lr': 0.0004960879617263664, 'samples': 1986432, 'steps': 10345, 'loss/train': 1.8550726175308228} -08/30/2021 15:00:38 - INFO - __main__ - Step 10347: {'lr': 0.000496087026547257, 'samples': 1986624, 'steps': 10346, 'loss/train': 1.9350652694702148} -08/30/2021 15:00:39 - INFO - __main__ - Step 10348: {'lr': 0.0004960860912572645, 'samples': 1986816, 'steps': 10347, 'loss/train': 1.3675235509872437} -08/30/2021 15:00:39 - INFO - __main__ - Step 10349: {'lr': 0.0004960851558563895, 'samples': 1987008, 'steps': 10348, 'loss/train': 1.7497878074645996} -08/30/2021 15:00:41 - INFO - __main__ - Step 10350: {'lr': 0.0004960842203446322, 'samples': 1987200, 'steps': 10349, 'loss/train': 1.941586971282959} -08/30/2021 15:00:42 - INFO - __main__ - Step 10351: {'lr': 0.0004960832847219933, 'samples': 1987392, 'steps': 10350, 'loss/train': 2.722203493118286} -08/30/2021 15:00:42 - INFO - __main__ - Step 10352: {'lr': 0.000496082348988473, 'samples': 1987584, 'steps': 10351, 'loss/train': 1.4358041286468506} -08/30/2021 15:00:42 - INFO - __main__ - Step 10353: {'lr': 0.0004960814131440717, 'samples': 1987776, 'steps': 10352, 'loss/train': 1.8353437185287476} -08/30/2021 15:00:43 - INFO - __main__ - Step 10354: {'lr': 0.0004960804771887901, 'samples': 1987968, 'steps': 10353, 'loss/train': 2.3006680011749268} -08/30/2021 15:00:43 - INFO - __main__ - Step 10355: {'lr': 0.0004960795411226283, 'samples': 1988160, 'steps': 10354, 'loss/train': 3.0335726737976074} -08/30/2021 15:00:43 - INFO - __main__ - Step 10356: {'lr': 0.0004960786049455868, 'samples': 1988352, 'steps': 10355, 'loss/train': 2.2150301933288574} -08/30/2021 15:00:45 - INFO - __main__ - Step 10357: {'lr': 0.0004960776686576663, 'samples': 1988544, 'steps': 10356, 'loss/train': 1.997801661491394} -08/30/2021 15:00:45 - INFO - __main__ - Step 10358: {'lr': 0.0004960767322588668, 'samples': 1988736, 'steps': 10357, 'loss/train': 2.2359557151794434} -08/30/2021 15:00:46 - INFO - __main__ - Step 10359: {'lr': 0.000496075795749189, 'samples': 1988928, 'steps': 10358, 'loss/train': 2.1683826446533203} -08/30/2021 15:00:46 - INFO - __main__ - Step 10360: {'lr': 0.0004960748591286332, 'samples': 1989120, 'steps': 10359, 'loss/train': 1.3156667947769165} -08/30/2021 15:00:46 - INFO - __main__ - Step 10361: {'lr': 0.0004960739223971999, 'samples': 1989312, 'steps': 10360, 'loss/train': 1.5570313930511475} -08/30/2021 15:00:48 - INFO - __main__ - Step 10362: {'lr': 0.0004960729855548895, 'samples': 1989504, 'steps': 10361, 'loss/train': 2.5488858222961426} -08/30/2021 15:00:48 - INFO - __main__ - Step 10363: {'lr': 0.0004960720486017025, 'samples': 1989696, 'steps': 10362, 'loss/train': 2.133307695388794} -08/30/2021 15:00:49 - INFO - __main__ - Step 10364: {'lr': 0.0004960711115376391, 'samples': 1989888, 'steps': 10363, 'loss/train': 2.004369020462036} -08/30/2021 15:00:49 - INFO - __main__ - Step 10365: {'lr': 0.0004960701743626999, 'samples': 1990080, 'steps': 10364, 'loss/train': 1.4569731950759888} -08/30/2021 15:00:49 - INFO - __main__ - Step 10366: {'lr': 0.0004960692370768853, 'samples': 1990272, 'steps': 10365, 'loss/train': 2.0143885612487793} -08/30/2021 15:00:51 - INFO - __main__ - Step 10367: {'lr': 0.0004960682996801956, 'samples': 1990464, 'steps': 10366, 'loss/train': 1.5447354316711426} -08/30/2021 15:00:51 - INFO - __main__ - Step 10368: {'lr': 0.0004960673621726314, 'samples': 1990656, 'steps': 10367, 'loss/train': 0.3495093286037445} -08/30/2021 15:00:52 - INFO - __main__ - Step 10369: {'lr': 0.000496066424554193, 'samples': 1990848, 'steps': 10368, 'loss/train': 1.817546010017395} -08/30/2021 15:00:52 - INFO - __main__ - Step 10370: {'lr': 0.0004960654868248809, 'samples': 1991040, 'steps': 10369, 'loss/train': 2.059018135070801} -08/30/2021 15:00:53 - INFO - __main__ - Step 10371: {'lr': 0.0004960645489846955, 'samples': 1991232, 'steps': 10370, 'loss/train': 2.0338845252990723} -08/30/2021 15:00:54 - INFO - __main__ - Step 10372: {'lr': 0.0004960636110336371, 'samples': 1991424, 'steps': 10371, 'loss/train': 2.1590704917907715} -08/30/2021 15:00:55 - INFO - __main__ - Step 10373: {'lr': 0.0004960626729717064, 'samples': 1991616, 'steps': 10372, 'loss/train': 1.9552867412567139} -08/30/2021 15:00:55 - INFO - __main__ - Step 10374: {'lr': 0.0004960617347989036, 'samples': 1991808, 'steps': 10373, 'loss/train': 1.9777945280075073} -08/30/2021 15:00:55 - INFO - __main__ - Step 10375: {'lr': 0.0004960607965152292, 'samples': 1992000, 'steps': 10374, 'loss/train': 2.2696774005889893} -08/30/2021 15:00:56 - INFO - __main__ - Step 10376: {'lr': 0.0004960598581206835, 'samples': 1992192, 'steps': 10375, 'loss/train': 1.7620307207107544} -08/30/2021 15:00:57 - INFO - __main__ - Step 10377: {'lr': 0.000496058919615267, 'samples': 1992384, 'steps': 10376, 'loss/train': 1.7011475563049316} -08/30/2021 15:00:58 - INFO - __main__ - Step 10378: {'lr': 0.0004960579809989803, 'samples': 1992576, 'steps': 10377, 'loss/train': 2.0998213291168213} -08/30/2021 15:00:58 - INFO - __main__ - Step 10379: {'lr': 0.0004960570422718237, 'samples': 1992768, 'steps': 10378, 'loss/train': 1.3776031732559204} -08/30/2021 15:00:58 - INFO - __main__ - Step 10380: {'lr': 0.0004960561034337975, 'samples': 1992960, 'steps': 10379, 'loss/train': 2.4718332290649414} -08/30/2021 15:00:59 - INFO - __main__ - Step 10381: {'lr': 0.0004960551644849022, 'samples': 1993152, 'steps': 10380, 'loss/train': 2.3681163787841797} -08/30/2021 15:01:00 - INFO - __main__ - Step 10382: {'lr': 0.0004960542254251382, 'samples': 1993344, 'steps': 10381, 'loss/train': 1.9731279611587524} -08/30/2021 15:01:01 - INFO - __main__ - Step 10383: {'lr': 0.0004960532862545061, 'samples': 1993536, 'steps': 10382, 'loss/train': 1.7828351259231567} -08/30/2021 15:01:01 - INFO - __main__ - Step 10384: {'lr': 0.0004960523469730061, 'samples': 1993728, 'steps': 10383, 'loss/train': 1.567101001739502} -08/30/2021 15:01:01 - INFO - __main__ - Step 10385: {'lr': 0.0004960514075806387, 'samples': 1993920, 'steps': 10384, 'loss/train': 1.9627090692520142} -08/30/2021 15:01:02 - INFO - __main__ - Step 10386: {'lr': 0.0004960504680774043, 'samples': 1994112, 'steps': 10385, 'loss/train': 1.5318666696548462} -08/30/2021 15:01:02 - INFO - __main__ - Step 10387: {'lr': 0.0004960495284633034, 'samples': 1994304, 'steps': 10386, 'loss/train': 2.256319046020508} -08/30/2021 15:01:04 - INFO - __main__ - Step 10388: {'lr': 0.0004960485887383363, 'samples': 1994496, 'steps': 10387, 'loss/train': 2.194608688354492} -08/30/2021 15:01:05 - INFO - __main__ - Step 10389: {'lr': 0.0004960476489025037, 'samples': 1994688, 'steps': 10388, 'loss/train': 1.449400544166565} -08/30/2021 15:01:05 - INFO - __main__ - Step 10390: {'lr': 0.0004960467089558057, 'samples': 1994880, 'steps': 10389, 'loss/train': 1.9933476448059082} -08/30/2021 15:01:06 - INFO - __main__ - Step 10391: {'lr': 0.0004960457688982428, 'samples': 1995072, 'steps': 10390, 'loss/train': 1.4009701013565063} -08/30/2021 15:01:06 - INFO - __main__ - Step 10392: {'lr': 0.0004960448287298156, 'samples': 1995264, 'steps': 10391, 'loss/train': 1.9637444019317627} -08/30/2021 15:01:06 - INFO - __main__ - Step 10393: {'lr': 0.0004960438884505242, 'samples': 1995456, 'steps': 10392, 'loss/train': 0.5234134793281555} -08/30/2021 15:01:08 - INFO - __main__ - Step 10394: {'lr': 0.0004960429480603694, 'samples': 1995648, 'steps': 10393, 'loss/train': 0.3800166845321655} -08/30/2021 15:01:09 - INFO - __main__ - Step 10395: {'lr': 0.0004960420075593515, 'samples': 1995840, 'steps': 10394, 'loss/train': 1.6070040464401245} -08/30/2021 15:01:09 - INFO - __main__ - Step 10396: {'lr': 0.0004960410669474708, 'samples': 1996032, 'steps': 10395, 'loss/train': 2.3613502979278564} -08/30/2021 15:01:10 - INFO - __main__ - Step 10397: {'lr': 0.0004960401262247277, 'samples': 1996224, 'steps': 10396, 'loss/train': 2.0823814868927} -08/30/2021 15:01:10 - INFO - __main__ - Step 10398: {'lr': 0.0004960391853911228, 'samples': 1996416, 'steps': 10397, 'loss/train': 1.2456631660461426} -08/30/2021 15:01:10 - INFO - __main__ - Step 10399: {'lr': 0.0004960382444466564, 'samples': 1996608, 'steps': 10398, 'loss/train': 1.2787742614746094} -08/30/2021 15:01:12 - INFO - __main__ - Step 10400: {'lr': 0.0004960373033913289, 'samples': 1996800, 'steps': 10399, 'loss/train': 1.6688364744186401} -08/30/2021 15:01:12 - INFO - __main__ - Step 10401: {'lr': 0.0004960363622251409, 'samples': 1996992, 'steps': 10400, 'loss/train': 1.5278105735778809} -08/30/2021 15:01:13 - INFO - __main__ - Step 10402: {'lr': 0.0004960354209480927, 'samples': 1997184, 'steps': 10401, 'loss/train': 2.1272647380828857} -08/30/2021 15:01:13 - INFO - __main__ - Step 10403: {'lr': 0.0004960344795601847, 'samples': 1997376, 'steps': 10402, 'loss/train': 1.744810938835144} -08/30/2021 15:01:13 - INFO - __main__ - Step 10404: {'lr': 0.0004960335380614174, 'samples': 1997568, 'steps': 10403, 'loss/train': 1.9196399450302124} -08/30/2021 15:01:15 - INFO - __main__ - Step 10405: {'lr': 0.0004960325964517912, 'samples': 1997760, 'steps': 10404, 'loss/train': 0.2159660905599594} -08/30/2021 15:01:15 - INFO - __main__ - Step 10406: {'lr': 0.0004960316547313064, 'samples': 1997952, 'steps': 10405, 'loss/train': 1.7362682819366455} -08/30/2021 15:01:16 - INFO - __main__ - Step 10407: {'lr': 0.0004960307128999636, 'samples': 1998144, 'steps': 10406, 'loss/train': 0.17416583001613617} -08/30/2021 15:01:16 - INFO - __main__ - Step 10408: {'lr': 0.0004960297709577632, 'samples': 1998336, 'steps': 10407, 'loss/train': 1.4828909635543823} -08/30/2021 15:01:17 - INFO - __main__ - Step 10409: {'lr': 0.0004960288289047054, 'samples': 1998528, 'steps': 10408, 'loss/train': 1.8124011754989624} -08/30/2021 15:01:18 - INFO - __main__ - Step 10410: {'lr': 0.000496027886740791, 'samples': 1998720, 'steps': 10409, 'loss/train': 2.082686424255371} -08/30/2021 15:01:19 - INFO - __main__ - Step 10411: {'lr': 0.0004960269444660201, 'samples': 1998912, 'steps': 10410, 'loss/train': 1.58790922164917} -08/30/2021 15:01:19 - INFO - __main__ - Step 10412: {'lr': 0.0004960260020803934, 'samples': 1999104, 'steps': 10411, 'loss/train': 1.5263381004333496} -08/30/2021 15:01:19 - INFO - __main__ - Step 10413: {'lr': 0.0004960250595839111, 'samples': 1999296, 'steps': 10412, 'loss/train': 1.935903549194336} -08/30/2021 15:01:20 - INFO - __main__ - Step 10414: {'lr': 0.0004960241169765737, 'samples': 1999488, 'steps': 10413, 'loss/train': 2.782301902770996} -08/30/2021 15:01:20 - INFO - __main__ - Step 10415: {'lr': 0.0004960231742583817, 'samples': 1999680, 'steps': 10414, 'loss/train': 1.631529450416565} -08/30/2021 15:01:22 - INFO - __main__ - Step 10416: {'lr': 0.0004960222314293354, 'samples': 1999872, 'steps': 10415, 'loss/train': 2.455029010772705} -08/30/2021 15:01:22 - INFO - __main__ - Step 10417: {'lr': 0.0004960212884894353, 'samples': 2000064, 'steps': 10416, 'loss/train': 2.097196340560913} -08/30/2021 15:01:22 - INFO - __main__ - Step 10418: {'lr': 0.0004960203454386817, 'samples': 2000256, 'steps': 10417, 'loss/train': 2.1052653789520264} -08/30/2021 15:01:23 - INFO - __main__ - Step 10419: {'lr': 0.0004960194022770753, 'samples': 2000448, 'steps': 10418, 'loss/train': 2.01723051071167} -08/30/2021 15:01:23 - INFO - __main__ - Step 10420: {'lr': 0.0004960184590046162, 'samples': 2000640, 'steps': 10419, 'loss/train': 3.389378070831299} -08/30/2021 15:01:25 - INFO - __main__ - Step 10421: {'lr': 0.0004960175156213051, 'samples': 2000832, 'steps': 10420, 'loss/train': 1.6210967302322388} -08/30/2021 15:01:25 - INFO - __main__ - Step 10422: {'lr': 0.0004960165721271422, 'samples': 2001024, 'steps': 10421, 'loss/train': 2.0531251430511475} -08/30/2021 15:01:26 - INFO - __main__ - Step 10423: {'lr': 0.000496015628522128, 'samples': 2001216, 'steps': 10422, 'loss/train': 1.0741275548934937} -08/30/2021 15:01:26 - INFO - __main__ - Step 10424: {'lr': 0.000496014684806263, 'samples': 2001408, 'steps': 10423, 'loss/train': 2.350569009780884} -08/30/2021 15:01:26 - INFO - __main__ - Step 10425: {'lr': 0.0004960137409795477, 'samples': 2001600, 'steps': 10424, 'loss/train': 0.19224587082862854} -08/30/2021 15:01:28 - INFO - __main__ - Step 10426: {'lr': 0.0004960127970419822, 'samples': 2001792, 'steps': 10425, 'loss/train': 2.09647274017334} -08/30/2021 15:01:28 - INFO - __main__ - Step 10427: {'lr': 0.0004960118529935674, 'samples': 2001984, 'steps': 10426, 'loss/train': 1.908085823059082} -08/30/2021 15:01:29 - INFO - __main__ - Step 10428: {'lr': 0.0004960109088343032, 'samples': 2002176, 'steps': 10427, 'loss/train': 1.8560950756072998} -08/30/2021 15:01:29 - INFO - __main__ - Step 10429: {'lr': 0.0004960099645641903, 'samples': 2002368, 'steps': 10428, 'loss/train': 3.4126241207122803} -08/30/2021 15:01:29 - INFO - __main__ - Step 10430: {'lr': 0.0004960090201832293, 'samples': 2002560, 'steps': 10429, 'loss/train': 1.7569758892059326} -08/30/2021 15:01:31 - INFO - __main__ - Step 10431: {'lr': 0.0004960080756914203, 'samples': 2002752, 'steps': 10430, 'loss/train': 1.8876203298568726} -08/30/2021 15:01:31 - INFO - __main__ - Step 10432: {'lr': 0.0004960071310887638, 'samples': 2002944, 'steps': 10431, 'loss/train': 1.8103290796279907} -08/30/2021 15:01:32 - INFO - __main__ - Step 10433: {'lr': 0.0004960061863752604, 'samples': 2003136, 'steps': 10432, 'loss/train': 0.9473888278007507} -08/30/2021 15:01:32 - INFO - __main__ - Step 10434: {'lr': 0.0004960052415509103, 'samples': 2003328, 'steps': 10433, 'loss/train': 0.2175418883562088} -08/30/2021 15:01:32 - INFO - __main__ - Step 10435: {'lr': 0.0004960042966157141, 'samples': 2003520, 'steps': 10434, 'loss/train': 1.807892084121704} -08/30/2021 15:01:34 - INFO - __main__ - Step 10436: {'lr': 0.0004960033515696722, 'samples': 2003712, 'steps': 10435, 'loss/train': 2.193671703338623} -08/30/2021 15:01:35 - INFO - __main__ - Step 10437: {'lr': 0.0004960024064127849, 'samples': 2003904, 'steps': 10436, 'loss/train': 0.8680984973907471} -08/30/2021 15:01:35 - INFO - __main__ - Step 10438: {'lr': 0.0004960014611450527, 'samples': 2004096, 'steps': 10437, 'loss/train': 1.7945085763931274} -08/30/2021 15:01:35 - INFO - __main__ - Step 10439: {'lr': 0.0004960005157664762, 'samples': 2004288, 'steps': 10438, 'loss/train': 1.8623465299606323} -08/30/2021 15:01:36 - INFO - __main__ - Step 10440: {'lr': 0.0004959995702770555, 'samples': 2004480, 'steps': 10439, 'loss/train': 1.8561207056045532} -08/30/2021 15:01:37 - INFO - __main__ - Step 10441: {'lr': 0.0004959986246767913, 'samples': 2004672, 'steps': 10440, 'loss/train': 1.9420788288116455} -08/30/2021 15:01:38 - INFO - __main__ - Step 10442: {'lr': 0.0004959976789656838, 'samples': 2004864, 'steps': 10441, 'loss/train': 2.0702946186065674} -08/30/2021 15:01:38 - INFO - __main__ - Step 10443: {'lr': 0.0004959967331437336, 'samples': 2005056, 'steps': 10442, 'loss/train': 1.6848121881484985} -08/30/2021 15:01:38 - INFO - __main__ - Step 10444: {'lr': 0.0004959957872109411, 'samples': 2005248, 'steps': 10443, 'loss/train': 1.9728987216949463} -08/30/2021 15:01:39 - INFO - __main__ - Step 10445: {'lr': 0.0004959948411673066, 'samples': 2005440, 'steps': 10444, 'loss/train': 1.6918926239013672} -08/30/2021 15:01:39 - INFO - __main__ - Step 10446: {'lr': 0.0004959938950128308, 'samples': 2005632, 'steps': 10445, 'loss/train': 1.0344536304473877} -08/30/2021 15:01:41 - INFO - __main__ - Step 10447: {'lr': 0.0004959929487475138, 'samples': 2005824, 'steps': 10446, 'loss/train': 1.6557822227478027} -08/30/2021 15:01:41 - INFO - __main__ - Step 10448: {'lr': 0.0004959920023713563, 'samples': 2006016, 'steps': 10447, 'loss/train': 2.1298668384552} -08/30/2021 15:01:41 - INFO - __main__ - Step 10449: {'lr': 0.0004959910558843584, 'samples': 2006208, 'steps': 10448, 'loss/train': 2.1713783740997314} -08/30/2021 15:01:42 - INFO - __main__ - Step 10450: {'lr': 0.0004959901092865208, 'samples': 2006400, 'steps': 10449, 'loss/train': 1.8460066318511963} -08/30/2021 15:01:42 - INFO - __main__ - Step 10451: {'lr': 0.0004959891625778438, 'samples': 2006592, 'steps': 10450, 'loss/train': 1.6569113731384277} -08/30/2021 15:01:44 - INFO - __main__ - Step 10452: {'lr': 0.0004959882157583281, 'samples': 2006784, 'steps': 10451, 'loss/train': 1.660936951637268} -08/30/2021 15:01:45 - INFO - __main__ - Step 10453: {'lr': 0.0004959872688279737, 'samples': 2006976, 'steps': 10452, 'loss/train': 2.017768144607544} -08/30/2021 15:01:45 - INFO - __main__ - Step 10454: {'lr': 0.0004959863217867814, 'samples': 2007168, 'steps': 10453, 'loss/train': 1.8957213163375854} -08/30/2021 15:01:45 - INFO - __main__ - Step 10455: {'lr': 0.0004959853746347513, 'samples': 2007360, 'steps': 10454, 'loss/train': 1.0855712890625} -08/30/2021 15:01:46 - INFO - __main__ - Step 10456: {'lr': 0.0004959844273718841, 'samples': 2007552, 'steps': 10455, 'loss/train': 1.6310032606124878} -08/30/2021 15:01:48 - INFO - __main__ - Step 10457: {'lr': 0.00049598347999818, 'samples': 2007744, 'steps': 10456, 'loss/train': 1.9456843137741089} -08/30/2021 15:01:48 - INFO - __main__ - Step 10458: {'lr': 0.0004959825325136396, 'samples': 2007936, 'steps': 10457, 'loss/train': 1.8384852409362793} -08/30/2021 15:01:49 - INFO - __main__ - Step 10459: {'lr': 0.0004959815849182633, 'samples': 2008128, 'steps': 10458, 'loss/train': 2.7311923503875732} -08/30/2021 15:01:49 - INFO - __main__ - Step 10460: {'lr': 0.0004959806372120515, 'samples': 2008320, 'steps': 10459, 'loss/train': 1.7400085926055908} -08/30/2021 15:01:49 - INFO - __main__ - Step 10461: {'lr': 0.0004959796893950045, 'samples': 2008512, 'steps': 10460, 'loss/train': 2.2166435718536377} -08/30/2021 15:01:50 - INFO - __main__ - Step 10462: {'lr': 0.0004959787414671229, 'samples': 2008704, 'steps': 10461, 'loss/train': 0.8627303838729858} -08/30/2021 15:01:51 - INFO - __main__ - Step 10463: {'lr': 0.000495977793428407, 'samples': 2008896, 'steps': 10462, 'loss/train': 0.1974806934595108} -08/30/2021 15:01:52 - INFO - __main__ - Step 10464: {'lr': 0.0004959768452788575, 'samples': 2009088, 'steps': 10463, 'loss/train': 2.158440351486206} -08/30/2021 15:01:52 - INFO - __main__ - Step 10465: {'lr': 0.0004959758970184745, 'samples': 2009280, 'steps': 10464, 'loss/train': 1.5986219644546509} -08/30/2021 15:01:52 - INFO - __main__ - Step 10466: {'lr': 0.0004959749486472587, 'samples': 2009472, 'steps': 10465, 'loss/train': 1.4605861902236938} -08/30/2021 15:01:53 - INFO - __main__ - Step 10467: {'lr': 0.0004959740001652102, 'samples': 2009664, 'steps': 10466, 'loss/train': 2.0068705081939697} -08/30/2021 15:01:54 - INFO - __main__ - Step 10468: {'lr': 0.0004959730515723298, 'samples': 2009856, 'steps': 10467, 'loss/train': 2.039984703063965} -08/30/2021 15:01:55 - INFO - __main__ - Step 10469: {'lr': 0.0004959721028686175, 'samples': 2010048, 'steps': 10468, 'loss/train': 2.137545585632324} -08/30/2021 15:01:55 - INFO - __main__ - Step 10470: {'lr': 0.0004959711540540741, 'samples': 2010240, 'steps': 10469, 'loss/train': 1.297655701637268} -08/30/2021 15:01:56 - INFO - __main__ - Step 10471: {'lr': 0.0004959702051286999, 'samples': 2010432, 'steps': 10470, 'loss/train': 0.3394823968410492} -08/30/2021 15:01:56 - INFO - __main__ - Step 10472: {'lr': 0.0004959692560924954, 'samples': 2010624, 'steps': 10471, 'loss/train': 2.455857515335083} -08/30/2021 15:01:57 - INFO - __main__ - Step 10473: {'lr': 0.0004959683069454608, 'samples': 2010816, 'steps': 10472, 'loss/train': 2.466825246810913} -08/30/2021 15:01:58 - INFO - __main__ - Step 10474: {'lr': 0.0004959673576875967, 'samples': 2011008, 'steps': 10473, 'loss/train': 1.654446005821228} -08/30/2021 15:01:58 - INFO - __main__ - Step 10475: {'lr': 0.0004959664083189035, 'samples': 2011200, 'steps': 10474, 'loss/train': 1.4932245016098022} -08/30/2021 15:01:59 - INFO - __main__ - Step 10476: {'lr': 0.0004959654588393818, 'samples': 2011392, 'steps': 10475, 'loss/train': 1.8561971187591553} -08/30/2021 15:01:59 - INFO - __main__ - Step 10477: {'lr': 0.0004959645092490316, 'samples': 2011584, 'steps': 10476, 'loss/train': 1.9416553974151611} -08/30/2021 15:02:00 - INFO - __main__ - Step 10478: {'lr': 0.0004959635595478537, 'samples': 2011776, 'steps': 10477, 'loss/train': 2.313185930252075} -08/30/2021 15:02:01 - INFO - __main__ - Step 10479: {'lr': 0.0004959626097358485, 'samples': 2011968, 'steps': 10478, 'loss/train': 1.9820820093154907} -08/30/2021 15:02:01 - INFO - __main__ - Step 10480: {'lr': 0.0004959616598130162, 'samples': 2012160, 'steps': 10479, 'loss/train': 2.019428253173828} -08/30/2021 15:02:02 - INFO - __main__ - Step 10481: {'lr': 0.0004959607097793575, 'samples': 2012352, 'steps': 10480, 'loss/train': 2.0295042991638184} -08/30/2021 15:02:02 - INFO - __main__ - Step 10482: {'lr': 0.0004959597596348726, 'samples': 2012544, 'steps': 10481, 'loss/train': 1.7402756214141846} -08/30/2021 15:02:03 - INFO - __main__ - Step 10483: {'lr': 0.0004959588093795621, 'samples': 2012736, 'steps': 10482, 'loss/train': 1.6770402193069458} -08/30/2021 15:02:04 - INFO - __main__ - Step 10484: {'lr': 0.0004959578590134262, 'samples': 2012928, 'steps': 10483, 'loss/train': 1.5392616987228394} -08/30/2021 15:02:04 - INFO - __main__ - Step 10485: {'lr': 0.0004959569085364657, 'samples': 2013120, 'steps': 10484, 'loss/train': 1.9837473630905151} -08/30/2021 15:02:05 - INFO - __main__ - Step 10486: {'lr': 0.0004959559579486807, 'samples': 2013312, 'steps': 10485, 'loss/train': 1.8422056436538696} -08/30/2021 15:02:05 - INFO - __main__ - Step 10487: {'lr': 0.0004959550072500718, 'samples': 2013504, 'steps': 10486, 'loss/train': 1.5745959281921387} -08/30/2021 15:02:05 - INFO - __main__ - Step 10488: {'lr': 0.0004959540564406393, 'samples': 2013696, 'steps': 10487, 'loss/train': 1.6322102546691895} -08/30/2021 15:02:07 - INFO - __main__ - Step 10489: {'lr': 0.0004959531055203837, 'samples': 2013888, 'steps': 10488, 'loss/train': 2.0236124992370605} -08/30/2021 15:02:07 - INFO - __main__ - Step 10490: {'lr': 0.0004959521544893055, 'samples': 2014080, 'steps': 10489, 'loss/train': 1.785768985748291} -08/30/2021 15:02:08 - INFO - __main__ - Step 10491: {'lr': 0.000495951203347405, 'samples': 2014272, 'steps': 10490, 'loss/train': 1.6534106731414795} -08/30/2021 15:02:08 - INFO - __main__ - Step 10492: {'lr': 0.0004959502520946827, 'samples': 2014464, 'steps': 10491, 'loss/train': 0.2743142247200012} -08/30/2021 15:02:08 - INFO - __main__ - Step 10493: {'lr': 0.000495949300731139, 'samples': 2014656, 'steps': 10492, 'loss/train': 1.8411226272583008} -08/30/2021 15:02:10 - INFO - __main__ - Step 10494: {'lr': 0.0004959483492567744, 'samples': 2014848, 'steps': 10493, 'loss/train': 2.1134486198425293} -08/30/2021 15:02:10 - INFO - __main__ - Step 10495: {'lr': 0.0004959473976715892, 'samples': 2015040, 'steps': 10494, 'loss/train': 1.650178074836731} -08/30/2021 15:02:11 - INFO - __main__ - Step 10496: {'lr': 0.0004959464459755839, 'samples': 2015232, 'steps': 10495, 'loss/train': 1.9412351846694946} -08/30/2021 15:02:11 - INFO - __main__ - Step 10497: {'lr': 0.0004959454941687589, 'samples': 2015424, 'steps': 10496, 'loss/train': 2.2524361610412598} -08/30/2021 15:02:11 - INFO - __main__ - Step 10498: {'lr': 0.0004959445422511148, 'samples': 2015616, 'steps': 10497, 'loss/train': 1.2734662294387817} -08/30/2021 15:02:13 - INFO - __main__ - Step 10499: {'lr': 0.0004959435902226517, 'samples': 2015808, 'steps': 10498, 'loss/train': 1.9825326204299927} -08/30/2021 15:02:13 - INFO - __main__ - Step 10500: {'lr': 0.0004959426380833703, 'samples': 2016000, 'steps': 10499, 'loss/train': 2.5058553218841553} -08/30/2021 15:02:14 - INFO - __main__ - Step 10501: {'lr': 0.0004959416858332709, 'samples': 2016192, 'steps': 10500, 'loss/train': 0.8799305558204651} -08/30/2021 15:02:14 - INFO - __main__ - Step 10502: {'lr': 0.000495940733472354, 'samples': 2016384, 'steps': 10501, 'loss/train': 2.027930498123169} -08/30/2021 15:02:14 - INFO - __main__ - Step 10503: {'lr': 0.00049593978100062, 'samples': 2016576, 'steps': 10502, 'loss/train': 1.6999003887176514} -08/30/2021 15:02:17 - INFO - __main__ - Step 10504: {'lr': 0.0004959388284180694, 'samples': 2016768, 'steps': 10503, 'loss/train': 1.9339839220046997} -08/30/2021 15:02:17 - INFO - __main__ - Step 10505: {'lr': 0.0004959378757247024, 'samples': 2016960, 'steps': 10504, 'loss/train': 1.9652814865112305} -08/30/2021 15:02:17 - INFO - __main__ - Step 10506: {'lr': 0.0004959369229205197, 'samples': 2017152, 'steps': 10505, 'loss/train': 1.5221179723739624} -08/30/2021 15:02:18 - INFO - __main__ - Step 10507: {'lr': 0.0004959359700055216, 'samples': 2017344, 'steps': 10506, 'loss/train': 2.0980300903320312} -08/30/2021 15:02:18 - INFO - __main__ - Step 10508: {'lr': 0.0004959350169797085, 'samples': 2017536, 'steps': 10507, 'loss/train': 2.3725430965423584} -08/30/2021 15:02:20 - INFO - __main__ - Step 10509: {'lr': 0.000495934063843081, 'samples': 2017728, 'steps': 10508, 'loss/train': 1.781004548072815} -08/30/2021 15:02:20 - INFO - __main__ - Step 10510: {'lr': 0.0004959331105956393, 'samples': 2017920, 'steps': 10509, 'loss/train': 1.3632245063781738} -08/30/2021 15:02:21 - INFO - __main__ - Step 10511: {'lr': 0.000495932157237384, 'samples': 2018112, 'steps': 10510, 'loss/train': 1.4666327238082886} -08/30/2021 15:02:21 - INFO - __main__ - Step 10512: {'lr': 0.0004959312037683154, 'samples': 2018304, 'steps': 10511, 'loss/train': 1.8845940828323364} -08/30/2021 15:02:21 - INFO - __main__ - Step 10513: {'lr': 0.0004959302501884341, 'samples': 2018496, 'steps': 10512, 'loss/train': 1.7574174404144287} -08/30/2021 15:02:22 - INFO - __main__ - Step 10514: {'lr': 0.0004959292964977403, 'samples': 2018688, 'steps': 10513, 'loss/train': 0.6841381788253784} -08/30/2021 15:02:23 - INFO - __main__ - Step 10515: {'lr': 0.0004959283426962345, 'samples': 2018880, 'steps': 10514, 'loss/train': 2.153968334197998} -08/30/2021 15:02:24 - INFO - __main__ - Step 10516: {'lr': 0.0004959273887839175, 'samples': 2019072, 'steps': 10515, 'loss/train': 1.4942861795425415} -08/30/2021 15:02:24 - INFO - __main__ - Step 10517: {'lr': 0.000495926434760789, 'samples': 2019264, 'steps': 10516, 'loss/train': 1.9657281637191772} -08/30/2021 15:02:24 - INFO - __main__ - Step 10518: {'lr': 0.0004959254806268501, 'samples': 2019456, 'steps': 10517, 'loss/train': 2.0604641437530518} -08/30/2021 15:02:25 - INFO - __main__ - Step 10519: {'lr': 0.0004959245263821009, 'samples': 2019648, 'steps': 10518, 'loss/train': 1.4639756679534912} -08/30/2021 15:02:26 - INFO - __main__ - Step 10520: {'lr': 0.0004959235720265419, 'samples': 2019840, 'steps': 10519, 'loss/train': 2.400418281555176} -08/30/2021 15:02:27 - INFO - __main__ - Step 10521: {'lr': 0.0004959226175601736, 'samples': 2020032, 'steps': 10520, 'loss/train': 2.2565877437591553} -08/30/2021 15:02:27 - INFO - __main__ - Step 10522: {'lr': 0.0004959216629829964, 'samples': 2020224, 'steps': 10521, 'loss/train': 1.641075849533081} -08/30/2021 15:02:27 - INFO - __main__ - Step 10523: {'lr': 0.0004959207082950105, 'samples': 2020416, 'steps': 10522, 'loss/train': 1.942132592201233} -08/30/2021 15:02:28 - INFO - __main__ - Step 10524: {'lr': 0.0004959197534962166, 'samples': 2020608, 'steps': 10523, 'loss/train': 1.78141450881958} -08/30/2021 15:02:29 - INFO - __main__ - Step 10525: {'lr': 0.0004959187985866152, 'samples': 2020800, 'steps': 10524, 'loss/train': 2.446502208709717} -08/30/2021 15:02:30 - INFO - __main__ - Step 10526: {'lr': 0.0004959178435662064, 'samples': 2020992, 'steps': 10525, 'loss/train': 2.1773462295532227} -08/30/2021 15:02:30 - INFO - __main__ - Step 10527: {'lr': 0.0004959168884349909, 'samples': 2021184, 'steps': 10526, 'loss/train': 2.262411117553711} -08/30/2021 15:02:31 - INFO - __main__ - Step 10528: {'lr': 0.0004959159331929691, 'samples': 2021376, 'steps': 10527, 'loss/train': 0.8106072545051575} -08/30/2021 15:02:31 - INFO - __main__ - Step 10529: {'lr': 0.0004959149778401412, 'samples': 2021568, 'steps': 10528, 'loss/train': 1.9869590997695923} -08/30/2021 15:02:32 - INFO - __main__ - Step 10530: {'lr': 0.000495914022376508, 'samples': 2021760, 'steps': 10529, 'loss/train': 1.2052595615386963} -08/30/2021 15:02:33 - INFO - __main__ - Step 10531: {'lr': 0.0004959130668020696, 'samples': 2021952, 'steps': 10530, 'loss/train': 1.4175198078155518} -08/30/2021 15:02:33 - INFO - __main__ - Step 10532: {'lr': 0.0004959121111168266, 'samples': 2022144, 'steps': 10531, 'loss/train': 1.635396957397461} -08/30/2021 15:02:34 - INFO - __main__ - Step 10533: {'lr': 0.0004959111553207794, 'samples': 2022336, 'steps': 10532, 'loss/train': 1.8357553482055664} -08/30/2021 15:02:34 - INFO - __main__ - Step 10534: {'lr': 0.0004959101994139284, 'samples': 2022528, 'steps': 10533, 'loss/train': 1.7777599096298218} -08/30/2021 15:02:34 - INFO - __main__ - Step 10535: {'lr': 0.0004959092433962742, 'samples': 2022720, 'steps': 10534, 'loss/train': 2.3951852321624756} -08/30/2021 15:02:36 - INFO - __main__ - Step 10536: {'lr': 0.0004959082872678169, 'samples': 2022912, 'steps': 10535, 'loss/train': 2.1775715351104736} -08/30/2021 15:02:36 - INFO - __main__ - Step 10537: {'lr': 0.0004959073310285572, 'samples': 2023104, 'steps': 10536, 'loss/train': 1.9282255172729492} -08/30/2021 15:02:37 - INFO - __main__ - Step 10538: {'lr': 0.0004959063746784955, 'samples': 2023296, 'steps': 10537, 'loss/train': 1.8154288530349731} -08/30/2021 15:02:37 - INFO - __main__ - Step 10539: {'lr': 0.0004959054182176321, 'samples': 2023488, 'steps': 10538, 'loss/train': 1.49866783618927} -08/30/2021 15:02:37 - INFO - __main__ - Step 10540: {'lr': 0.0004959044616459676, 'samples': 2023680, 'steps': 10539, 'loss/train': 1.614794135093689} -08/30/2021 15:02:39 - INFO - __main__ - Step 10541: {'lr': 0.0004959035049635023, 'samples': 2023872, 'steps': 10540, 'loss/train': 1.7843995094299316} -08/30/2021 15:02:39 - INFO - __main__ - Step 10542: {'lr': 0.0004959025481702366, 'samples': 2024064, 'steps': 10541, 'loss/train': 1.7165087461471558} -08/30/2021 15:02:40 - INFO - __main__ - Step 10543: {'lr': 0.0004959015912661712, 'samples': 2024256, 'steps': 10542, 'loss/train': 1.9312180280685425} -08/30/2021 15:02:40 - INFO - __main__ - Step 10544: {'lr': 0.0004959006342513062, 'samples': 2024448, 'steps': 10543, 'loss/train': 1.9411728382110596} -08/30/2021 15:02:40 - INFO - __main__ - Step 10545: {'lr': 0.0004958996771256422, 'samples': 2024640, 'steps': 10544, 'loss/train': 1.5995982885360718} -08/30/2021 15:02:42 - INFO - __main__ - Step 10546: {'lr': 0.0004958987198891796, 'samples': 2024832, 'steps': 10545, 'loss/train': 2.497468948364258} -08/30/2021 15:02:42 - INFO - __main__ - Step 10547: {'lr': 0.0004958977625419187, 'samples': 2025024, 'steps': 10546, 'loss/train': 1.703046202659607} -08/30/2021 15:02:43 - INFO - __main__ - Step 10548: {'lr': 0.0004958968050838603, 'samples': 2025216, 'steps': 10547, 'loss/train': 3.0953104496002197} -08/30/2021 15:02:43 - INFO - __main__ - Step 10549: {'lr': 0.0004958958475150044, 'samples': 2025408, 'steps': 10548, 'loss/train': 3.4171063899993896} -08/30/2021 15:02:44 - INFO - __main__ - Step 10550: {'lr': 0.0004958948898353516, 'samples': 2025600, 'steps': 10549, 'loss/train': 1.3698984384536743} -08/30/2021 15:02:45 - INFO - __main__ - Step 10551: {'lr': 0.0004958939320449026, 'samples': 2025792, 'steps': 10550, 'loss/train': 1.527429461479187} -08/30/2021 15:02:45 - INFO - __main__ - Step 10552: {'lr': 0.0004958929741436574, 'samples': 2025984, 'steps': 10551, 'loss/train': 1.6819144487380981} -08/30/2021 15:02:46 - INFO - __main__ - Step 10553: {'lr': 0.0004958920161316167, 'samples': 2026176, 'steps': 10552, 'loss/train': 1.7151061296463013} -08/30/2021 15:02:46 - INFO - __main__ - Step 10554: {'lr': 0.0004958910580087808, 'samples': 2026368, 'steps': 10553, 'loss/train': 1.8407119512557983} -08/30/2021 15:02:46 - INFO - __main__ - Step 10555: {'lr': 0.0004958900997751502, 'samples': 2026560, 'steps': 10554, 'loss/train': 1.6887060403823853} -08/30/2021 15:02:48 - INFO - __main__ - Step 10556: {'lr': 0.0004958891414307253, 'samples': 2026752, 'steps': 10555, 'loss/train': 1.3946881294250488} -08/30/2021 15:02:49 - INFO - __main__ - Step 10557: {'lr': 0.0004958881829755066, 'samples': 2026944, 'steps': 10556, 'loss/train': 1.9798439741134644} -08/30/2021 15:02:49 - INFO - __main__ - Step 10558: {'lr': 0.0004958872244094944, 'samples': 2027136, 'steps': 10557, 'loss/train': 0.20437650382518768} -08/30/2021 15:02:49 - INFO - __main__ - Step 10559: {'lr': 0.0004958862657326893, 'samples': 2027328, 'steps': 10558, 'loss/train': 2.201343297958374} -08/30/2021 15:02:50 - INFO - __main__ - Step 10560: {'lr': 0.0004958853069450916, 'samples': 2027520, 'steps': 10559, 'loss/train': 1.8643922805786133} -08/30/2021 15:02:50 - INFO - __main__ - Step 10561: {'lr': 0.0004958843480467017, 'samples': 2027712, 'steps': 10560, 'loss/train': 0.7602496147155762} -08/30/2021 15:02:52 - INFO - __main__ - Step 10562: {'lr': 0.0004958833890375202, 'samples': 2027904, 'steps': 10561, 'loss/train': 1.807782769203186} -08/30/2021 15:02:52 - INFO - __main__ - Step 10563: {'lr': 0.0004958824299175474, 'samples': 2028096, 'steps': 10562, 'loss/train': 2.3995413780212402} -08/30/2021 15:02:53 - INFO - __main__ - Step 10564: {'lr': 0.0004958814706867838, 'samples': 2028288, 'steps': 10563, 'loss/train': 1.6300077438354492} -08/30/2021 15:02:53 - INFO - __main__ - Step 10565: {'lr': 0.0004958805113452298, 'samples': 2028480, 'steps': 10564, 'loss/train': 1.9002076387405396} -08/30/2021 15:02:53 - INFO - __main__ - Step 10566: {'lr': 0.0004958795518928858, 'samples': 2028672, 'steps': 10565, 'loss/train': 1.4706333875656128} -08/30/2021 15:02:55 - INFO - __main__ - Step 10567: {'lr': 0.0004958785923297522, 'samples': 2028864, 'steps': 10566, 'loss/train': 2.03666090965271} -08/30/2021 15:02:55 - INFO - __main__ - Step 10568: {'lr': 0.0004958776326558298, 'samples': 2029056, 'steps': 10567, 'loss/train': 2.123552083969116} -08/30/2021 15:02:56 - INFO - __main__ - Step 10569: {'lr': 0.0004958766728711184, 'samples': 2029248, 'steps': 10568, 'loss/train': 1.7179365158081055} -08/30/2021 15:02:56 - INFO - __main__ - Step 10570: {'lr': 0.000495875712975619, 'samples': 2029440, 'steps': 10569, 'loss/train': 0.7491295337677002} -08/30/2021 15:02:56 - INFO - __main__ - Step 10571: {'lr': 0.0004958747529693316, 'samples': 2029632, 'steps': 10570, 'loss/train': 1.47507643699646} -08/30/2021 15:02:58 - INFO - __main__ - Step 10572: {'lr': 0.000495873792852257, 'samples': 2029824, 'steps': 10571, 'loss/train': 2.0478882789611816} -08/30/2021 15:02:58 - INFO - __main__ - Step 10573: {'lr': 0.0004958728326243954, 'samples': 2030016, 'steps': 10572, 'loss/train': 1.4584681987762451} -08/30/2021 15:02:59 - INFO - __main__ - Step 10574: {'lr': 0.0004958718722857473, 'samples': 2030208, 'steps': 10573, 'loss/train': 1.727081298828125} -08/30/2021 15:02:59 - INFO - __main__ - Step 10575: {'lr': 0.0004958709118363131, 'samples': 2030400, 'steps': 10574, 'loss/train': 2.439725399017334} -08/30/2021 15:02:59 - INFO - __main__ - Step 10576: {'lr': 0.0004958699512760933, 'samples': 2030592, 'steps': 10575, 'loss/train': 2.0526723861694336} -08/30/2021 15:03:01 - INFO - __main__ - Step 10577: {'lr': 0.0004958689906050882, 'samples': 2030784, 'steps': 10576, 'loss/train': 1.855075716972351} -08/30/2021 15:03:01 - INFO - __main__ - Step 10578: {'lr': 0.0004958680298232983, 'samples': 2030976, 'steps': 10577, 'loss/train': 1.7913870811462402} -08/30/2021 15:03:02 - INFO - __main__ - Step 10579: {'lr': 0.0004958670689307242, 'samples': 2031168, 'steps': 10578, 'loss/train': 1.8129478693008423} -08/30/2021 15:03:02 - INFO - __main__ - Step 10580: {'lr': 0.0004958661079273662, 'samples': 2031360, 'steps': 10579, 'loss/train': 2.041513681411743} -08/30/2021 15:03:02 - INFO - __main__ - Step 10581: {'lr': 0.0004958651468132246, 'samples': 2031552, 'steps': 10580, 'loss/train': 1.4812042713165283} -08/30/2021 15:03:04 - INFO - __main__ - Step 10582: {'lr': 0.0004958641855883001, 'samples': 2031744, 'steps': 10581, 'loss/train': 1.9945106506347656} -08/30/2021 15:03:04 - INFO - __main__ - Step 10583: {'lr': 0.0004958632242525929, 'samples': 2031936, 'steps': 10582, 'loss/train': 2.056206226348877} -08/30/2021 15:03:05 - INFO - __main__ - Step 10584: {'lr': 0.0004958622628061035, 'samples': 2032128, 'steps': 10583, 'loss/train': 1.8133273124694824} -08/30/2021 15:03:05 - INFO - __main__ - Step 10585: {'lr': 0.0004958613012488324, 'samples': 2032320, 'steps': 10584, 'loss/train': 1.2229818105697632} -08/30/2021 15:03:05 - INFO - __main__ - Step 10586: {'lr': 0.00049586033958078, 'samples': 2032512, 'steps': 10585, 'loss/train': 1.4508144855499268} -08/30/2021 15:03:07 - INFO - __main__ - Step 10587: {'lr': 0.0004958593778019468, 'samples': 2032704, 'steps': 10586, 'loss/train': 1.7170994281768799} -08/30/2021 15:03:08 - INFO - __main__ - Step 10588: {'lr': 0.0004958584159123331, 'samples': 2032896, 'steps': 10587, 'loss/train': 1.9261326789855957} -08/30/2021 15:03:08 - INFO - __main__ - Step 10589: {'lr': 0.0004958574539119392, 'samples': 2033088, 'steps': 10588, 'loss/train': 1.8346456289291382} -08/30/2021 15:03:09 - INFO - __main__ - Step 10590: {'lr': 0.0004958564918007659, 'samples': 2033280, 'steps': 10589, 'loss/train': 1.7016843557357788} -08/30/2021 15:03:09 - INFO - __main__ - Step 10591: {'lr': 0.0004958555295788135, 'samples': 2033472, 'steps': 10590, 'loss/train': 2.2442336082458496} -08/30/2021 15:03:09 - INFO - __main__ - Step 10592: {'lr': 0.0004958545672460824, 'samples': 2033664, 'steps': 10591, 'loss/train': 1.699468970298767} -08/30/2021 15:03:11 - INFO - __main__ - Step 10593: {'lr': 0.0004958536048025729, 'samples': 2033856, 'steps': 10592, 'loss/train': 1.7041306495666504} -08/30/2021 15:03:11 - INFO - __main__ - Step 10594: {'lr': 0.0004958526422482857, 'samples': 2034048, 'steps': 10593, 'loss/train': 1.6113286018371582} -08/30/2021 15:03:12 - INFO - __main__ - Step 10595: {'lr': 0.000495851679583221, 'samples': 2034240, 'steps': 10594, 'loss/train': 1.5139615535736084} -08/30/2021 15:03:12 - INFO - __main__ - Step 10596: {'lr': 0.0004958507168073793, 'samples': 2034432, 'steps': 10595, 'loss/train': 1.9657795429229736} -08/30/2021 15:03:12 - INFO - __main__ - Step 10597: {'lr': 0.0004958497539207611, 'samples': 2034624, 'steps': 10596, 'loss/train': 1.6898196935653687} -08/30/2021 15:03:14 - INFO - __main__ - Step 10598: {'lr': 0.0004958487909233669, 'samples': 2034816, 'steps': 10597, 'loss/train': 1.334596872329712} -08/30/2021 15:03:15 - INFO - __main__ - Step 10599: {'lr': 0.0004958478278151969, 'samples': 2035008, 'steps': 10598, 'loss/train': 2.027326822280884} -08/30/2021 15:03:15 - INFO - __main__ - Step 10600: {'lr': 0.0004958468645962517, 'samples': 2035200, 'steps': 10599, 'loss/train': 1.7834383249282837} -08/30/2021 15:03:15 - INFO - __main__ - Step 10601: {'lr': 0.0004958459012665317, 'samples': 2035392, 'steps': 10600, 'loss/train': 2.2354843616485596} -08/30/2021 15:03:16 - INFO - __main__ - Step 10602: {'lr': 0.0004958449378260374, 'samples': 2035584, 'steps': 10601, 'loss/train': 1.237476110458374} -08/30/2021 15:03:16 - INFO - __main__ - Step 10603: {'lr': 0.000495843974274769, 'samples': 2035776, 'steps': 10602, 'loss/train': 2.2609970569610596} -08/30/2021 15:03:18 - INFO - __main__ - Step 10604: {'lr': 0.0004958430106127272, 'samples': 2035968, 'steps': 10603, 'loss/train': 1.93257474899292} -08/30/2021 15:03:18 - INFO - __main__ - Step 10605: {'lr': 0.0004958420468399123, 'samples': 2036160, 'steps': 10604, 'loss/train': 2.401864528656006} -08/30/2021 15:03:18 - INFO - __main__ - Step 10606: {'lr': 0.0004958410829563248, 'samples': 2036352, 'steps': 10605, 'loss/train': 1.4825185537338257} -08/30/2021 15:03:19 - INFO - __main__ - Step 10607: {'lr': 0.0004958401189619652, 'samples': 2036544, 'steps': 10606, 'loss/train': 2.18910813331604} -08/30/2021 15:03:19 - INFO - __main__ - Step 10608: {'lr': 0.0004958391548568336, 'samples': 2036736, 'steps': 10607, 'loss/train': 1.8769748210906982} -08/30/2021 15:03:21 - INFO - __main__ - Step 10609: {'lr': 0.0004958381906409308, 'samples': 2036928, 'steps': 10608, 'loss/train': 2.0168251991271973} -08/30/2021 15:03:21 - INFO - __main__ - Step 10610: {'lr': 0.0004958372263142571, 'samples': 2037120, 'steps': 10609, 'loss/train': 2.0536816120147705} -08/30/2021 15:03:21 - INFO - __main__ - Step 10611: {'lr': 0.0004958362618768129, 'samples': 2037312, 'steps': 10610, 'loss/train': 2.5476222038269043} -08/30/2021 15:03:22 - INFO - __main__ - Step 10612: {'lr': 0.0004958352973285987, 'samples': 2037504, 'steps': 10611, 'loss/train': 0.4447791576385498} -08/30/2021 15:03:22 - INFO - __main__ - Step 10613: {'lr': 0.000495834332669615, 'samples': 2037696, 'steps': 10612, 'loss/train': 2.6342968940734863} -08/30/2021 15:03:24 - INFO - __main__ - Step 10614: {'lr': 0.0004958333678998622, 'samples': 2037888, 'steps': 10613, 'loss/train': 2.205479860305786} -08/30/2021 15:03:25 - INFO - __main__ - Step 10615: {'lr': 0.0004958324030193404, 'samples': 2038080, 'steps': 10614, 'loss/train': 0.6903966069221497} -08/30/2021 15:03:25 - INFO - __main__ - Step 10616: {'lr': 0.0004958314380280504, 'samples': 2038272, 'steps': 10615, 'loss/train': 1.73091459274292} -08/30/2021 15:03:25 - INFO - __main__ - Step 10617: {'lr': 0.0004958304729259927, 'samples': 2038464, 'steps': 10616, 'loss/train': 1.6818708181381226} -08/30/2021 15:03:26 - INFO - __main__ - Step 10618: {'lr': 0.0004958295077131674, 'samples': 2038656, 'steps': 10617, 'loss/train': 1.7798888683319092} -08/30/2021 15:03:27 - INFO - __main__ - Step 10619: {'lr': 0.0004958285423895752, 'samples': 2038848, 'steps': 10618, 'loss/train': 1.265381932258606} -08/30/2021 15:03:28 - INFO - __main__ - Step 10620: {'lr': 0.0004958275769552165, 'samples': 2039040, 'steps': 10619, 'loss/train': 1.98273766040802} -08/30/2021 15:03:28 - INFO - __main__ - Step 10621: {'lr': 0.0004958266114100917, 'samples': 2039232, 'steps': 10620, 'loss/train': 2.1460537910461426} -08/30/2021 15:03:28 - INFO - __main__ - Step 10622: {'lr': 0.0004958256457542011, 'samples': 2039424, 'steps': 10621, 'loss/train': 1.9756097793579102} -08/30/2021 15:03:29 - INFO - __main__ - Step 10623: {'lr': 0.0004958246799875453, 'samples': 2039616, 'steps': 10622, 'loss/train': 2.048715591430664} -08/30/2021 15:03:31 - INFO - __main__ - Step 10624: {'lr': 0.0004958237141101247, 'samples': 2039808, 'steps': 10623, 'loss/train': 2.2093610763549805} -08/30/2021 15:03:32 - INFO - __main__ - Step 10625: {'lr': 0.0004958227481219399, 'samples': 2040000, 'steps': 10624, 'loss/train': 1.5564757585525513} -08/30/2021 15:03:32 - INFO - __main__ - Step 10626: {'lr': 0.0004958217820229909, 'samples': 2040192, 'steps': 10625, 'loss/train': 2.1298341751098633} -08/30/2021 15:03:32 - INFO - __main__ - Step 10627: {'lr': 0.0004958208158132785, 'samples': 2040384, 'steps': 10626, 'loss/train': 1.748016595840454} -08/30/2021 15:03:33 - INFO - __main__ - Step 10628: {'lr': 0.000495819849492803, 'samples': 2040576, 'steps': 10627, 'loss/train': 1.7894550561904907} -08/30/2021 15:03:33 - INFO - __main__ - Step 10629: {'lr': 0.0004958188830615649, 'samples': 2040768, 'steps': 10628, 'loss/train': 2.3215763568878174} -08/30/2021 15:03:33 - INFO - __main__ - Step 10630: {'lr': 0.0004958179165195646, 'samples': 2040960, 'steps': 10629, 'loss/train': 1.9983327388763428} -08/30/2021 15:03:34 - INFO - __main__ - Step 10631: {'lr': 0.0004958169498668026, 'samples': 2041152, 'steps': 10630, 'loss/train': 2.1977379322052} -08/30/2021 15:03:35 - INFO - __main__ - Step 10632: {'lr': 0.0004958159831032793, 'samples': 2041344, 'steps': 10631, 'loss/train': 2.129565477371216} -08/30/2021 15:03:36 - INFO - __main__ - Step 10633: {'lr': 0.000495815016228995, 'samples': 2041536, 'steps': 10632, 'loss/train': 2.476797103881836} -08/30/2021 15:03:36 - INFO - __main__ - Step 10634: {'lr': 0.0004958140492439502, 'samples': 2041728, 'steps': 10633, 'loss/train': 2.1424500942230225} -08/30/2021 15:03:36 - INFO - __main__ - Step 10635: {'lr': 0.0004958130821481455, 'samples': 2041920, 'steps': 10634, 'loss/train': 1.9851062297821045} -08/30/2021 15:03:37 - INFO - __main__ - Step 10636: {'lr': 0.0004958121149415812, 'samples': 2042112, 'steps': 10635, 'loss/train': 1.7994110584259033} -08/30/2021 15:03:38 - INFO - __main__ - Step 10637: {'lr': 0.0004958111476242577, 'samples': 2042304, 'steps': 10636, 'loss/train': 2.2752678394317627} -08/30/2021 15:03:39 - INFO - __main__ - Step 10638: {'lr': 0.0004958101801961755, 'samples': 2042496, 'steps': 10637, 'loss/train': 2.3514392375946045} -08/30/2021 15:03:39 - INFO - __main__ - Step 10639: {'lr': 0.0004958092126573352, 'samples': 2042688, 'steps': 10638, 'loss/train': 2.0725250244140625} -08/30/2021 15:03:40 - INFO - __main__ - Step 10640: {'lr': 0.0004958082450077369, 'samples': 2042880, 'steps': 10639, 'loss/train': 2.194011926651001} -08/30/2021 15:03:40 - INFO - __main__ - Step 10641: {'lr': 0.0004958072772473812, 'samples': 2043072, 'steps': 10640, 'loss/train': 1.7174255847930908} -08/30/2021 15:03:40 - INFO - __main__ - Step 10642: {'lr': 0.0004958063093762684, 'samples': 2043264, 'steps': 10641, 'loss/train': 2.1803905963897705} -08/30/2021 15:03:42 - INFO - __main__ - Step 10643: {'lr': 0.0004958053413943993, 'samples': 2043456, 'steps': 10642, 'loss/train': 1.8791708946228027} -08/30/2021 15:03:42 - INFO - __main__ - Step 10644: {'lr': 0.0004958043733017741, 'samples': 2043648, 'steps': 10643, 'loss/train': 1.8752700090408325} -08/30/2021 15:03:43 - INFO - __main__ - Step 10645: {'lr': 0.0004958034050983932, 'samples': 2043840, 'steps': 10644, 'loss/train': 1.724615454673767} -08/30/2021 15:03:43 - INFO - __main__ - Step 10646: {'lr': 0.0004958024367842569, 'samples': 2044032, 'steps': 10645, 'loss/train': 1.894936442375183} -08/30/2021 15:03:44 - INFO - __main__ - Step 10647: {'lr': 0.000495801468359366, 'samples': 2044224, 'steps': 10646, 'loss/train': 2.294870615005493} -08/30/2021 15:03:45 - INFO - __main__ - Step 10648: {'lr': 0.0004958004998237207, 'samples': 2044416, 'steps': 10647, 'loss/train': 2.764667510986328} -08/30/2021 15:03:46 - INFO - __main__ - Step 10649: {'lr': 0.0004957995311773215, 'samples': 2044608, 'steps': 10648, 'loss/train': 6.3452253341674805} -08/30/2021 15:03:46 - INFO - __main__ - Step 10650: {'lr': 0.0004957985624201688, 'samples': 2044800, 'steps': 10649, 'loss/train': 1.8892719745635986} -08/30/2021 15:03:46 - INFO - __main__ - Step 10651: {'lr': 0.0004957975935522632, 'samples': 2044992, 'steps': 10650, 'loss/train': 0.9367871284484863} -08/30/2021 15:03:47 - INFO - __main__ - Step 10652: {'lr': 0.0004957966245736048, 'samples': 2045184, 'steps': 10651, 'loss/train': 1.7667204141616821} -08/30/2021 15:03:48 - INFO - __main__ - Step 10653: {'lr': 0.0004957956554841943, 'samples': 2045376, 'steps': 10652, 'loss/train': 1.3119536638259888} -08/30/2021 15:03:49 - INFO - __main__ - Step 10654: {'lr': 0.0004957946862840321, 'samples': 2045568, 'steps': 10653, 'loss/train': 2.294827938079834} -08/30/2021 15:03:49 - INFO - __main__ - Step 10655: {'lr': 0.0004957937169731186, 'samples': 2045760, 'steps': 10654, 'loss/train': 1.4760403633117676} -08/30/2021 15:03:49 - INFO - __main__ - Step 10656: {'lr': 0.0004957927475514542, 'samples': 2045952, 'steps': 10655, 'loss/train': 1.6929547786712646} -08/30/2021 15:03:50 - INFO - __main__ - Step 10657: {'lr': 0.0004957917780190395, 'samples': 2046144, 'steps': 10656, 'loss/train': 2.8597707748413086} -08/30/2021 15:03:51 - INFO - __main__ - Step 10658: {'lr': 0.0004957908083758747, 'samples': 2046336, 'steps': 10657, 'loss/train': 1.512115240097046} -08/30/2021 15:03:52 - INFO - __main__ - Step 10659: {'lr': 0.0004957898386219603, 'samples': 2046528, 'steps': 10658, 'loss/train': 2.175381660461426} -08/30/2021 15:03:52 - INFO - __main__ - Step 10660: {'lr': 0.000495788868757297, 'samples': 2046720, 'steps': 10659, 'loss/train': 1.9193998575210571} -08/30/2021 15:03:52 - INFO - __main__ - Step 10661: {'lr': 0.0004957878987818849, 'samples': 2046912, 'steps': 10660, 'loss/train': 2.146965742111206} -08/30/2021 15:03:53 - INFO - __main__ - Step 10662: {'lr': 0.0004957869286957246, 'samples': 2047104, 'steps': 10661, 'loss/train': 2.098656415939331} -08/30/2021 15:03:53 - INFO - __main__ - Step 10663: {'lr': 0.0004957859584988164, 'samples': 2047296, 'steps': 10662, 'loss/train': 1.5975902080535889} -08/30/2021 15:03:55 - INFO - __main__ - Step 10664: {'lr': 0.0004957849881911609, 'samples': 2047488, 'steps': 10663, 'loss/train': 1.6310983896255493} -08/30/2021 15:03:55 - INFO - __main__ - Step 10665: {'lr': 0.0004957840177727585, 'samples': 2047680, 'steps': 10664, 'loss/train': 1.9936878681182861} -08/30/2021 15:03:56 - INFO - __main__ - Step 10666: {'lr': 0.0004957830472436097, 'samples': 2047872, 'steps': 10665, 'loss/train': 1.8515408039093018} -08/30/2021 15:03:56 - INFO - __main__ - Step 10667: {'lr': 0.0004957820766037147, 'samples': 2048064, 'steps': 10666, 'loss/train': 1.6449856758117676} -08/30/2021 15:03:56 - INFO - __main__ - Step 10668: {'lr': 0.0004957811058530742, 'samples': 2048256, 'steps': 10667, 'loss/train': 1.3918766975402832} -08/30/2021 15:03:58 - INFO - __main__ - Step 10669: {'lr': 0.0004957801349916884, 'samples': 2048448, 'steps': 10668, 'loss/train': 0.8530736565589905} -08/30/2021 15:03:59 - INFO - __main__ - Step 10670: {'lr': 0.000495779164019558, 'samples': 2048640, 'steps': 10669, 'loss/train': 1.6328083276748657} -08/30/2021 15:03:59 - INFO - __main__ - Step 10671: {'lr': 0.0004957781929366832, 'samples': 2048832, 'steps': 10670, 'loss/train': 1.8257925510406494} -08/30/2021 15:03:59 - INFO - __main__ - Step 10672: {'lr': 0.0004957772217430646, 'samples': 2049024, 'steps': 10671, 'loss/train': 1.3351576328277588} -08/30/2021 15:04:00 - INFO - __main__ - Step 10673: {'lr': 0.0004957762504387025, 'samples': 2049216, 'steps': 10672, 'loss/train': 1.3350465297698975} -08/30/2021 15:04:01 - INFO - __main__ - Step 10674: {'lr': 0.0004957752790235976, 'samples': 2049408, 'steps': 10673, 'loss/train': 2.212059259414673} -08/30/2021 15:04:02 - INFO - __main__ - Step 10675: {'lr': 0.00049577430749775, 'samples': 2049600, 'steps': 10674, 'loss/train': 2.780787229537964} -08/30/2021 15:04:02 - INFO - __main__ - Step 10676: {'lr': 0.0004957733358611602, 'samples': 2049792, 'steps': 10675, 'loss/train': 1.6459110975265503} -08/30/2021 15:04:02 - INFO - __main__ - Step 10677: {'lr': 0.0004957723641138289, 'samples': 2049984, 'steps': 10676, 'loss/train': 1.5592550039291382} -08/30/2021 15:04:03 - INFO - __main__ - Step 10678: {'lr': 0.0004957713922557563, 'samples': 2050176, 'steps': 10677, 'loss/train': 1.8758960962295532} -08/30/2021 15:04:03 - INFO - __main__ - Step 10679: {'lr': 0.0004957704202869429, 'samples': 2050368, 'steps': 10678, 'loss/train': 2.0165200233459473} -08/30/2021 15:04:05 - INFO - __main__ - Step 10680: {'lr': 0.0004957694482073891, 'samples': 2050560, 'steps': 10679, 'loss/train': 2.3360977172851562} -08/30/2021 15:04:05 - INFO - __main__ - Step 10681: {'lr': 0.0004957684760170955, 'samples': 2050752, 'steps': 10680, 'loss/train': 1.9172230958938599} -08/30/2021 15:04:05 - INFO - __main__ - Step 10682: {'lr': 0.0004957675037160624, 'samples': 2050944, 'steps': 10681, 'loss/train': 1.6415748596191406} -08/30/2021 15:04:06 - INFO - __main__ - Step 10683: {'lr': 0.0004957665313042902, 'samples': 2051136, 'steps': 10682, 'loss/train': 1.8189716339111328} -08/30/2021 15:04:06 - INFO - __main__ - Step 10684: {'lr': 0.0004957655587817793, 'samples': 2051328, 'steps': 10683, 'loss/train': 2.129347324371338} -08/30/2021 15:04:08 - INFO - __main__ - Step 10685: {'lr': 0.0004957645861485304, 'samples': 2051520, 'steps': 10684, 'loss/train': 1.7494794130325317} -08/30/2021 15:04:08 - INFO - __main__ - Step 10686: {'lr': 0.0004957636134045437, 'samples': 2051712, 'steps': 10685, 'loss/train': 1.7605416774749756} -08/30/2021 15:04:08 - INFO - __main__ - Step 10687: {'lr': 0.0004957626405498196, 'samples': 2051904, 'steps': 10686, 'loss/train': 2.2078678607940674} -08/30/2021 15:04:09 - INFO - __main__ - Step 10688: {'lr': 0.0004957616675843588, 'samples': 2052096, 'steps': 10687, 'loss/train': 1.554547667503357} -08/30/2021 15:04:09 - INFO - __main__ - Step 10689: {'lr': 0.0004957606945081615, 'samples': 2052288, 'steps': 10688, 'loss/train': 1.8485602140426636} -08/30/2021 15:04:11 - INFO - __main__ - Step 10690: {'lr': 0.0004957597213212284, 'samples': 2052480, 'steps': 10689, 'loss/train': 2.1953125} -08/30/2021 15:04:11 - INFO - __main__ - Step 10691: {'lr': 0.0004957587480235595, 'samples': 2052672, 'steps': 10690, 'loss/train': 1.8529311418533325} -08/30/2021 15:04:12 - INFO - __main__ - Step 10692: {'lr': 0.0004957577746151556, 'samples': 2052864, 'steps': 10691, 'loss/train': 0.44848647713661194} -08/30/2021 15:04:12 - INFO - __main__ - Step 10693: {'lr': 0.0004957568010960171, 'samples': 2053056, 'steps': 10692, 'loss/train': 0.3356359899044037} -08/30/2021 15:04:12 - INFO - __main__ - Step 10694: {'lr': 0.0004957558274661444, 'samples': 2053248, 'steps': 10693, 'loss/train': 1.0516051054000854} -08/30/2021 15:04:13 - INFO - __main__ - Step 10695: {'lr': 0.0004957548537255378, 'samples': 2053440, 'steps': 10694, 'loss/train': 0.15695035457611084} -08/30/2021 15:04:14 - INFO - __main__ - Step 10696: {'lr': 0.000495753879874198, 'samples': 2053632, 'steps': 10695, 'loss/train': 1.8583338260650635} -08/30/2021 15:04:15 - INFO - __main__ - Step 10697: {'lr': 0.0004957529059121251, 'samples': 2053824, 'steps': 10696, 'loss/train': 1.9161690473556519} -08/30/2021 15:04:15 - INFO - __main__ - Step 10698: {'lr': 0.0004957519318393199, 'samples': 2054016, 'steps': 10697, 'loss/train': 2.220370054244995} -08/30/2021 15:04:15 - INFO - __main__ - Step 10699: {'lr': 0.0004957509576557826, 'samples': 2054208, 'steps': 10698, 'loss/train': 1.381768822669983} -08/30/2021 15:04:16 - INFO - __main__ - Step 10700: {'lr': 0.0004957499833615137, 'samples': 2054400, 'steps': 10699, 'loss/train': 1.659382700920105} -08/30/2021 15:04:17 - INFO - __main__ - Step 10701: {'lr': 0.0004957490089565137, 'samples': 2054592, 'steps': 10700, 'loss/train': 1.5124784708023071} -08/30/2021 15:04:18 - INFO - __main__ - Step 10702: {'lr': 0.0004957480344407829, 'samples': 2054784, 'steps': 10701, 'loss/train': 1.7778509855270386} -08/30/2021 15:04:18 - INFO - __main__ - Step 10703: {'lr': 0.0004957470598143218, 'samples': 2054976, 'steps': 10702, 'loss/train': 1.084619164466858} -08/30/2021 15:04:18 - INFO - __main__ - Step 10704: {'lr': 0.000495746085077131, 'samples': 2055168, 'steps': 10703, 'loss/train': 1.7560259103775024} -08/30/2021 15:04:19 - INFO - __main__ - Step 10705: {'lr': 0.0004957451102292108, 'samples': 2055360, 'steps': 10704, 'loss/train': 1.4236453771591187} -08/30/2021 15:04:20 - INFO - __main__ - Step 10706: {'lr': 0.0004957441352705616, 'samples': 2055552, 'steps': 10705, 'loss/train': 2.126816987991333} -08/30/2021 15:04:20 - INFO - __main__ - Step 10707: {'lr': 0.0004957431602011839, 'samples': 2055744, 'steps': 10706, 'loss/train': 1.8676573038101196} -08/30/2021 15:04:21 - INFO - __main__ - Step 10708: {'lr': 0.0004957421850210781, 'samples': 2055936, 'steps': 10707, 'loss/train': 1.5977020263671875} -08/30/2021 15:04:21 - INFO - __main__ - Step 10709: {'lr': 0.0004957412097302446, 'samples': 2056128, 'steps': 10708, 'loss/train': 1.7649636268615723} -08/30/2021 15:04:22 - INFO - __main__ - Step 10710: {'lr': 0.000495740234328684, 'samples': 2056320, 'steps': 10709, 'loss/train': 1.82119882106781} -08/30/2021 15:04:23 - INFO - __main__ - Step 10711: {'lr': 0.0004957392588163967, 'samples': 2056512, 'steps': 10710, 'loss/train': 1.584668517112732} -08/30/2021 15:04:23 - INFO - __main__ - Step 10712: {'lr': 0.000495738283193383, 'samples': 2056704, 'steps': 10711, 'loss/train': 1.978911280632019} -08/30/2021 15:04:24 - INFO - __main__ - Step 10713: {'lr': 0.0004957373074596434, 'samples': 2056896, 'steps': 10712, 'loss/train': 1.8620069026947021} -08/30/2021 15:04:24 - INFO - __main__ - Step 10714: {'lr': 0.0004957363316151784, 'samples': 2057088, 'steps': 10713, 'loss/train': 2.139443874359131} -08/30/2021 15:04:25 - INFO - __main__ - Step 10715: {'lr': 0.0004957353556599884, 'samples': 2057280, 'steps': 10714, 'loss/train': 1.900222897529602} -08/30/2021 15:04:26 - INFO - __main__ - Step 10716: {'lr': 0.0004957343795940738, 'samples': 2057472, 'steps': 10715, 'loss/train': 1.6313177347183228} -08/30/2021 15:04:27 - INFO - __main__ - Step 10717: {'lr': 0.0004957334034174351, 'samples': 2057664, 'steps': 10716, 'loss/train': 1.8593275547027588} -08/30/2021 15:04:27 - INFO - __main__ - Step 10718: {'lr': 0.0004957324271300728, 'samples': 2057856, 'steps': 10717, 'loss/train': 1.7024364471435547} -08/30/2021 15:04:27 - INFO - __main__ - Step 10719: {'lr': 0.0004957314507319871, 'samples': 2058048, 'steps': 10718, 'loss/train': 1.9018559455871582} -08/30/2021 15:04:28 - INFO - __main__ - Step 10720: {'lr': 0.0004957304742231787, 'samples': 2058240, 'steps': 10719, 'loss/train': 2.215010643005371} -08/30/2021 15:04:29 - INFO - __main__ - Step 10721: {'lr': 0.0004957294976036479, 'samples': 2058432, 'steps': 10720, 'loss/train': 2.1520371437072754} -08/30/2021 15:04:30 - INFO - __main__ - Step 10722: {'lr': 0.0004957285208733953, 'samples': 2058624, 'steps': 10721, 'loss/train': 1.8115051984786987} -08/30/2021 15:04:30 - INFO - __main__ - Step 10723: {'lr': 0.0004957275440324211, 'samples': 2058816, 'steps': 10722, 'loss/train': 1.914891242980957} -08/30/2021 15:04:30 - INFO - __main__ - Step 10724: {'lr': 0.0004957265670807258, 'samples': 2059008, 'steps': 10723, 'loss/train': 1.5794235467910767} -08/30/2021 15:04:31 - INFO - __main__ - Step 10725: {'lr': 0.0004957255900183101, 'samples': 2059200, 'steps': 10724, 'loss/train': 1.5233807563781738} -08/30/2021 15:04:33 - INFO - __main__ - Step 10726: {'lr': 0.000495724612845174, 'samples': 2059392, 'steps': 10725, 'loss/train': 2.3213930130004883} -08/30/2021 15:04:33 - INFO - __main__ - Step 10727: {'lr': 0.0004957236355613184, 'samples': 2059584, 'steps': 10726, 'loss/train': 1.919843316078186} -08/30/2021 15:04:33 - INFO - __main__ - Step 10728: {'lr': 0.0004957226581667434, 'samples': 2059776, 'steps': 10727, 'loss/train': 1.8233662843704224} -08/30/2021 15:04:34 - INFO - __main__ - Step 10729: {'lr': 0.0004957216806614496, 'samples': 2059968, 'steps': 10728, 'loss/train': 1.996636152267456} -08/30/2021 15:04:34 - INFO - __main__ - Step 10730: {'lr': 0.0004957207030454374, 'samples': 2060160, 'steps': 10729, 'loss/train': 1.5340129137039185} -08/30/2021 15:04:36 - INFO - __main__ - Step 10731: {'lr': 0.0004957197253187073, 'samples': 2060352, 'steps': 10730, 'loss/train': 2.3949286937713623} -08/30/2021 15:04:36 - INFO - __main__ - Step 10732: {'lr': 0.0004957187474812595, 'samples': 2060544, 'steps': 10731, 'loss/train': 1.8444056510925293} -08/30/2021 15:04:36 - INFO - __main__ - Step 10733: {'lr': 0.0004957177695330948, 'samples': 2060736, 'steps': 10732, 'loss/train': 2.0066213607788086} -08/30/2021 15:04:37 - INFO - __main__ - Step 10734: {'lr': 0.0004957167914742134, 'samples': 2060928, 'steps': 10733, 'loss/train': 2.3742356300354004} -08/30/2021 15:04:37 - INFO - __main__ - Step 10735: {'lr': 0.0004957158133046158, 'samples': 2061120, 'steps': 10734, 'loss/train': 1.9590860605239868} -08/30/2021 15:04:39 - INFO - __main__ - Step 10736: {'lr': 0.0004957148350243025, 'samples': 2061312, 'steps': 10735, 'loss/train': 1.4728792905807495} -08/30/2021 15:04:39 - INFO - __main__ - Step 10737: {'lr': 0.0004957138566332738, 'samples': 2061504, 'steps': 10736, 'loss/train': 1.831321358680725} -08/30/2021 15:04:39 - INFO - __main__ - Step 10738: {'lr': 0.0004957128781315303, 'samples': 2061696, 'steps': 10737, 'loss/train': 2.2706210613250732} -08/30/2021 15:04:40 - INFO - __main__ - Step 10739: {'lr': 0.0004957118995190723, 'samples': 2061888, 'steps': 10738, 'loss/train': 1.7025460004806519} -08/30/2021 15:04:40 - INFO - __main__ - Step 10740: {'lr': 0.0004957109207959004, 'samples': 2062080, 'steps': 10739, 'loss/train': 1.8625162839889526} -08/30/2021 15:04:41 - INFO - __main__ - Step 10741: {'lr': 0.0004957099419620149, 'samples': 2062272, 'steps': 10740, 'loss/train': 1.711644172668457} -08/30/2021 15:04:42 - INFO - __main__ - Step 10742: {'lr': 0.0004957089630174163, 'samples': 2062464, 'steps': 10741, 'loss/train': 1.967525839805603} -08/30/2021 15:04:43 - INFO - __main__ - Step 10743: {'lr': 0.0004957079839621051, 'samples': 2062656, 'steps': 10742, 'loss/train': 2.0031445026397705} -08/30/2021 15:04:43 - INFO - __main__ - Step 10744: {'lr': 0.0004957070047960816, 'samples': 2062848, 'steps': 10743, 'loss/train': 1.391197919845581} -08/30/2021 15:04:43 - INFO - __main__ - Step 10745: {'lr': 0.0004957060255193462, 'samples': 2063040, 'steps': 10744, 'loss/train': 1.7929103374481201} -08/30/2021 15:04:44 - INFO - __main__ - Step 10746: {'lr': 0.0004957050461318997, 'samples': 2063232, 'steps': 10745, 'loss/train': 1.8188024759292603} -08/30/2021 15:04:45 - INFO - __main__ - Step 10747: {'lr': 0.0004957040666337422, 'samples': 2063424, 'steps': 10746, 'loss/train': 2.108142614364624} -08/30/2021 15:04:46 - INFO - __main__ - Step 10748: {'lr': 0.0004957030870248742, 'samples': 2063616, 'steps': 10747, 'loss/train': 2.050351142883301} -08/30/2021 15:04:46 - INFO - __main__ - Step 10749: {'lr': 0.0004957021073052962, 'samples': 2063808, 'steps': 10748, 'loss/train': 2.325164556503296} -08/30/2021 15:04:46 - INFO - __main__ - Step 10750: {'lr': 0.0004957011274750086, 'samples': 2064000, 'steps': 10749, 'loss/train': 6.031447410583496} -08/30/2021 15:04:47 - INFO - __main__ - Step 10751: {'lr': 0.0004957001475340119, 'samples': 2064192, 'steps': 10750, 'loss/train': 1.8415454626083374} -08/30/2021 15:04:48 - INFO - __main__ - Step 10752: {'lr': 0.0004956991674823065, 'samples': 2064384, 'steps': 10751, 'loss/train': 1.3722048997879028} -08/30/2021 15:04:49 - INFO - __main__ - Step 10753: {'lr': 0.0004956981873198928, 'samples': 2064576, 'steps': 10752, 'loss/train': 1.9432214498519897} -08/30/2021 15:04:49 - INFO - __main__ - Step 10754: {'lr': 0.0004956972070467712, 'samples': 2064768, 'steps': 10753, 'loss/train': 1.7503266334533691} -08/30/2021 15:04:49 - INFO - __main__ - Step 10755: {'lr': 0.0004956962266629424, 'samples': 2064960, 'steps': 10754, 'loss/train': 1.7071924209594727} -08/30/2021 15:04:50 - INFO - __main__ - Step 10756: {'lr': 0.0004956952461684066, 'samples': 2065152, 'steps': 10755, 'loss/train': 2.0466485023498535} -08/30/2021 15:04:51 - INFO - __main__ - Step 10757: {'lr': 0.0004956942655631644, 'samples': 2065344, 'steps': 10756, 'loss/train': 1.9296818971633911} -08/30/2021 15:04:52 - INFO - __main__ - Step 10758: {'lr': 0.0004956932848472161, 'samples': 2065536, 'steps': 10757, 'loss/train': 2.400909662246704} -08/30/2021 15:04:52 - INFO - __main__ - Step 10759: {'lr': 0.0004956923040205622, 'samples': 2065728, 'steps': 10758, 'loss/train': 1.9308323860168457} -08/30/2021 15:04:52 - INFO - __main__ - Step 10760: {'lr': 0.0004956913230832031, 'samples': 2065920, 'steps': 10759, 'loss/train': 2.390636682510376} -08/30/2021 15:04:53 - INFO - __main__ - Step 10761: {'lr': 0.0004956903420351393, 'samples': 2066112, 'steps': 10760, 'loss/train': 1.8706105947494507} -08/30/2021 15:04:53 - INFO - __main__ - Step 10762: {'lr': 0.0004956893608763713, 'samples': 2066304, 'steps': 10761, 'loss/train': 1.8931701183319092} -08/30/2021 15:04:55 - INFO - __main__ - Step 10763: {'lr': 0.0004956883796068993, 'samples': 2066496, 'steps': 10762, 'loss/train': 1.5289864540100098} -08/30/2021 15:04:55 - INFO - __main__ - Step 10764: {'lr': 0.000495687398226724, 'samples': 2066688, 'steps': 10763, 'loss/train': 2.0399932861328125} -08/30/2021 15:04:56 - INFO - __main__ - Step 10765: {'lr': 0.0004956864167358458, 'samples': 2066880, 'steps': 10764, 'loss/train': 1.2210923433303833} -08/30/2021 15:04:56 - INFO - __main__ - Step 10766: {'lr': 0.000495685435134265, 'samples': 2067072, 'steps': 10765, 'loss/train': 0.17922018468379974} -08/30/2021 15:04:56 - INFO - __main__ - Step 10767: {'lr': 0.0004956844534219822, 'samples': 2067264, 'steps': 10766, 'loss/train': 1.8820480108261108} -08/30/2021 15:04:58 - INFO - __main__ - Step 10768: {'lr': 0.0004956834715989977, 'samples': 2067456, 'steps': 10767, 'loss/train': 1.8264802694320679} -08/30/2021 15:04:58 - INFO - __main__ - Step 10769: {'lr': 0.0004956824896653122, 'samples': 2067648, 'steps': 10768, 'loss/train': 2.1791439056396484} -08/30/2021 15:04:59 - INFO - __main__ - Step 10770: {'lr': 0.0004956815076209257, 'samples': 2067840, 'steps': 10769, 'loss/train': 2.34114146232605} -08/30/2021 15:04:59 - INFO - __main__ - Step 10771: {'lr': 0.0004956805254658391, 'samples': 2068032, 'steps': 10770, 'loss/train': 1.9452028274536133} -08/30/2021 15:04:59 - INFO - __main__ - Step 10772: {'lr': 0.0004956795432000526, 'samples': 2068224, 'steps': 10771, 'loss/train': 1.3862152099609375} -08/30/2021 15:05:01 - INFO - __main__ - Step 10773: {'lr': 0.0004956785608235667, 'samples': 2068416, 'steps': 10772, 'loss/train': 1.6177400350570679} -08/30/2021 15:05:01 - INFO - __main__ - Step 10774: {'lr': 0.0004956775783363817, 'samples': 2068608, 'steps': 10773, 'loss/train': 2.16396427154541} -08/30/2021 15:05:02 - INFO - __main__ - Step 10775: {'lr': 0.0004956765957384984, 'samples': 2068800, 'steps': 10774, 'loss/train': 1.21666419506073} -08/30/2021 15:05:02 - INFO - __main__ - Step 10776: {'lr': 0.0004956756130299169, 'samples': 2068992, 'steps': 10775, 'loss/train': 2.0430588722229004} -08/30/2021 15:05:03 - INFO - __main__ - Step 10777: {'lr': 0.0004956746302106378, 'samples': 2069184, 'steps': 10776, 'loss/train': 1.5963610410690308} -08/30/2021 15:05:03 - INFO - __main__ - Step 10778: {'lr': 0.0004956736472806614, 'samples': 2069376, 'steps': 10777, 'loss/train': 0.8859256505966187} -08/30/2021 15:05:05 - INFO - __main__ - Step 10779: {'lr': 0.0004956726642399883, 'samples': 2069568, 'steps': 10778, 'loss/train': 1.70272958278656} -08/30/2021 15:05:05 - INFO - __main__ - Step 10780: {'lr': 0.0004956716810886189, 'samples': 2069760, 'steps': 10779, 'loss/train': 1.4417139291763306} -08/30/2021 15:05:06 - INFO - __main__ - Step 10781: {'lr': 0.0004956706978265536, 'samples': 2069952, 'steps': 10780, 'loss/train': 1.981103539466858} -08/30/2021 15:05:06 - INFO - __main__ - Step 10782: {'lr': 0.0004956697144537929, 'samples': 2070144, 'steps': 10781, 'loss/train': 1.9347819089889526} -08/30/2021 15:05:07 - INFO - __main__ - Step 10783: {'lr': 0.0004956687309703372, 'samples': 2070336, 'steps': 10782, 'loss/train': 1.5819716453552246} -08/30/2021 15:05:08 - INFO - __main__ - Step 10784: {'lr': 0.0004956677473761871, 'samples': 2070528, 'steps': 10783, 'loss/train': 1.8309073448181152} -08/30/2021 15:05:09 - INFO - __main__ - Step 10785: {'lr': 0.0004956667636713427, 'samples': 2070720, 'steps': 10784, 'loss/train': 2.0952024459838867} -08/30/2021 15:05:09 - INFO - __main__ - Step 10786: {'lr': 0.0004956657798558047, 'samples': 2070912, 'steps': 10785, 'loss/train': 1.7727491855621338} -08/30/2021 15:05:10 - INFO - __main__ - Step 10787: {'lr': 0.0004956647959295735, 'samples': 2071104, 'steps': 10786, 'loss/train': 1.6489266157150269} -08/30/2021 15:05:10 - INFO - __main__ - Step 10788: {'lr': 0.0004956638118926495, 'samples': 2071296, 'steps': 10787, 'loss/train': 2.277691125869751} -08/30/2021 15:05:10 - INFO - __main__ - Step 10789: {'lr': 0.0004956628277450333, 'samples': 2071488, 'steps': 10788, 'loss/train': 0.22366197407245636} -08/30/2021 15:05:12 - INFO - __main__ - Step 10790: {'lr': 0.0004956618434867251, 'samples': 2071680, 'steps': 10789, 'loss/train': 0.8237656354904175} -08/30/2021 15:05:13 - INFO - __main__ - Step 10791: {'lr': 0.0004956608591177256, 'samples': 2071872, 'steps': 10790, 'loss/train': 1.5902841091156006} -08/30/2021 15:05:13 - INFO - __main__ - Step 10792: {'lr': 0.0004956598746380349, 'samples': 2072064, 'steps': 10791, 'loss/train': 2.4441492557525635} -08/30/2021 15:05:13 - INFO - __main__ - Step 10793: {'lr': 0.0004956588900476538, 'samples': 2072256, 'steps': 10792, 'loss/train': 1.6774741411209106} -08/30/2021 15:05:14 - INFO - __main__ - Step 10794: {'lr': 0.0004956579053465826, 'samples': 2072448, 'steps': 10793, 'loss/train': 1.44629967212677} -08/30/2021 15:05:15 - INFO - __main__ - Step 10795: {'lr': 0.0004956569205348217, 'samples': 2072640, 'steps': 10794, 'loss/train': 2.2983968257904053} -08/30/2021 15:05:16 - INFO - __main__ - Step 10796: {'lr': 0.0004956559356123717, 'samples': 2072832, 'steps': 10795, 'loss/train': 1.6858317852020264} -08/30/2021 15:05:16 - INFO - __main__ - Step 10797: {'lr': 0.0004956549505792327, 'samples': 2073024, 'steps': 10796, 'loss/train': 1.852107286453247} -08/30/2021 15:05:16 - INFO - __main__ - Step 10798: {'lr': 0.0004956539654354055, 'samples': 2073216, 'steps': 10797, 'loss/train': 1.9083333015441895} -08/30/2021 15:05:17 - INFO - __main__ - Step 10799: {'lr': 0.0004956529801808904, 'samples': 2073408, 'steps': 10798, 'loss/train': 2.384979486465454} -08/30/2021 15:05:18 - INFO - __main__ - Step 10800: {'lr': 0.0004956519948156879, 'samples': 2073600, 'steps': 10799, 'loss/train': 1.8847366571426392} -08/30/2021 15:05:19 - INFO - __main__ - Step 10801: {'lr': 0.0004956510093397983, 'samples': 2073792, 'steps': 10800, 'loss/train': 1.7802255153656006} -08/30/2021 15:05:19 - INFO - __main__ - Step 10802: {'lr': 0.0004956500237532222, 'samples': 2073984, 'steps': 10801, 'loss/train': 2.1447055339813232} -08/30/2021 15:05:19 - INFO - __main__ - Step 10803: {'lr': 0.0004956490380559601, 'samples': 2074176, 'steps': 10802, 'loss/train': 1.235166072845459} -08/30/2021 15:05:20 - INFO - __main__ - Step 10804: {'lr': 0.0004956480522480121, 'samples': 2074368, 'steps': 10803, 'loss/train': 1.3955796957015991} -08/30/2021 15:05:20 - INFO - __main__ - Step 10805: {'lr': 0.000495647066329379, 'samples': 2074560, 'steps': 10804, 'loss/train': 1.908759355545044} -08/30/2021 15:05:21 - INFO - __main__ - Step 10806: {'lr': 0.0004956460803000612, 'samples': 2074752, 'steps': 10805, 'loss/train': 2.0857725143432617} -08/30/2021 15:05:22 - INFO - __main__ - Step 10807: {'lr': 0.0004956450941600589, 'samples': 2074944, 'steps': 10806, 'loss/train': 1.4821279048919678} -08/30/2021 15:05:22 - INFO - __main__ - Step 10808: {'lr': 0.0004956441079093729, 'samples': 2075136, 'steps': 10807, 'loss/train': 1.3489822149276733} -08/30/2021 15:05:23 - INFO - __main__ - Step 10809: {'lr': 0.0004956431215480034, 'samples': 2075328, 'steps': 10808, 'loss/train': 1.640360713005066} -08/30/2021 15:05:23 - INFO - __main__ - Step 10810: {'lr': 0.0004956421350759508, 'samples': 2075520, 'steps': 10809, 'loss/train': 1.8221944570541382} -08/30/2021 15:05:25 - INFO - __main__ - Step 10811: {'lr': 0.0004956411484932158, 'samples': 2075712, 'steps': 10810, 'loss/train': 2.3182005882263184} -08/30/2021 15:05:25 - INFO - __main__ - Step 10812: {'lr': 0.0004956401617997985, 'samples': 2075904, 'steps': 10811, 'loss/train': 1.3666365146636963} -08/30/2021 15:05:25 - INFO - __main__ - Step 10813: {'lr': 0.0004956391749956997, 'samples': 2076096, 'steps': 10812, 'loss/train': 2.203580141067505} -08/30/2021 15:05:26 - INFO - __main__ - Step 10814: {'lr': 0.0004956381880809195, 'samples': 2076288, 'steps': 10813, 'loss/train': 1.4165306091308594} -08/30/2021 15:05:26 - INFO - __main__ - Step 10815: {'lr': 0.0004956372010554587, 'samples': 2076480, 'steps': 10814, 'loss/train': 1.9504467248916626} -08/30/2021 15:05:28 - INFO - __main__ - Step 10816: {'lr': 0.0004956362139193174, 'samples': 2076672, 'steps': 10815, 'loss/train': 1.3715782165527344} -08/30/2021 15:05:29 - INFO - __main__ - Step 10817: {'lr': 0.0004956352266724964, 'samples': 2076864, 'steps': 10816, 'loss/train': 1.748165249824524} -08/30/2021 15:05:29 - INFO - __main__ - Step 10818: {'lr': 0.0004956342393149959, 'samples': 2077056, 'steps': 10817, 'loss/train': 1.8582464456558228} -08/30/2021 15:05:29 - INFO - __main__ - Step 10819: {'lr': 0.0004956332518468163, 'samples': 2077248, 'steps': 10818, 'loss/train': 2.4562318325042725} -08/30/2021 15:05:30 - INFO - __main__ - Step 10820: {'lr': 0.0004956322642679583, 'samples': 2077440, 'steps': 10819, 'loss/train': 1.5791183710098267} -08/30/2021 15:05:30 - INFO - __main__ - Step 10821: {'lr': 0.000495631276578422, 'samples': 2077632, 'steps': 10820, 'loss/train': 2.010395050048828} -08/30/2021 15:05:31 - INFO - __main__ - Step 10822: {'lr': 0.0004956302887782082, 'samples': 2077824, 'steps': 10821, 'loss/train': 3.501922607421875} -08/30/2021 15:05:32 - INFO - __main__ - Step 10823: {'lr': 0.0004956293008673172, 'samples': 2078016, 'steps': 10822, 'loss/train': 1.802160382270813} -08/30/2021 15:05:32 - INFO - __main__ - Step 10824: {'lr': 0.0004956283128457493, 'samples': 2078208, 'steps': 10823, 'loss/train': 0.9121621251106262} -08/30/2021 15:05:33 - INFO - __main__ - Step 10825: {'lr': 0.0004956273247135051, 'samples': 2078400, 'steps': 10824, 'loss/train': 1.7308368682861328} -08/30/2021 15:05:33 - INFO - __main__ - Step 10826: {'lr': 0.0004956263364705851, 'samples': 2078592, 'steps': 10825, 'loss/train': 2.583685874938965} -08/30/2021 15:05:34 - INFO - __main__ - Step 10827: {'lr': 0.0004956253481169895, 'samples': 2078784, 'steps': 10826, 'loss/train': 1.3237332105636597} -08/30/2021 15:05:35 - INFO - __main__ - Step 10828: {'lr': 0.0004956243596527191, 'samples': 2078976, 'steps': 10827, 'loss/train': 1.858522891998291} -08/30/2021 15:05:35 - INFO - __main__ - Step 10829: {'lr': 0.000495623371077774, 'samples': 2079168, 'steps': 10828, 'loss/train': 1.7161418199539185} -08/30/2021 15:05:36 - INFO - __main__ - Step 10830: {'lr': 0.000495622382392155, 'samples': 2079360, 'steps': 10829, 'loss/train': 1.9857534170150757} -08/30/2021 15:05:36 - INFO - __main__ - Step 10831: {'lr': 0.0004956213935958621, 'samples': 2079552, 'steps': 10830, 'loss/train': 2.1369400024414062} -08/30/2021 15:05:38 - INFO - __main__ - Step 10832: {'lr': 0.0004956204046888961, 'samples': 2079744, 'steps': 10831, 'loss/train': 2.037320137023926} -08/30/2021 15:05:38 - INFO - __main__ - Step 10833: {'lr': 0.0004956194156712574, 'samples': 2079936, 'steps': 10832, 'loss/train': 2.415008068084717} -08/30/2021 15:05:39 - INFO - __main__ - Step 10834: {'lr': 0.0004956184265429463, 'samples': 2080128, 'steps': 10833, 'loss/train': 1.4726933240890503} -08/30/2021 15:05:39 - INFO - __main__ - Step 10835: {'lr': 0.0004956174373039634, 'samples': 2080320, 'steps': 10834, 'loss/train': 1.9649070501327515} -08/30/2021 15:05:40 - INFO - __main__ - Step 10836: {'lr': 0.0004956164479543089, 'samples': 2080512, 'steps': 10835, 'loss/train': 1.7382912635803223} -08/30/2021 15:05:41 - INFO - __main__ - Step 10837: {'lr': 0.0004956154584939836, 'samples': 2080704, 'steps': 10836, 'loss/train': 1.7427713871002197} -08/30/2021 15:05:41 - INFO - __main__ - Step 10838: {'lr': 0.0004956144689229877, 'samples': 2080896, 'steps': 10837, 'loss/train': 1.9309769868850708} -08/30/2021 15:05:42 - INFO - __main__ - Step 10839: {'lr': 0.0004956134792413218, 'samples': 2081088, 'steps': 10838, 'loss/train': 1.404088020324707} -08/30/2021 15:05:42 - INFO - __main__ - Step 10840: {'lr': 0.0004956124894489861, 'samples': 2081280, 'steps': 10839, 'loss/train': 1.8259860277175903} -08/30/2021 15:05:43 - INFO - __main__ - Step 10841: {'lr': 0.0004956114995459813, 'samples': 2081472, 'steps': 10840, 'loss/train': 2.3432869911193848} -08/30/2021 15:05:44 - INFO - __main__ - Step 10842: {'lr': 0.0004956105095323077, 'samples': 2081664, 'steps': 10841, 'loss/train': 1.6931630373001099} -08/30/2021 15:05:44 - INFO - __main__ - Step 10843: {'lr': 0.0004956095194079658, 'samples': 2081856, 'steps': 10842, 'loss/train': 1.7168824672698975} -08/30/2021 15:05:45 - INFO - __main__ - Step 10844: {'lr': 0.000495608529172956, 'samples': 2082048, 'steps': 10843, 'loss/train': 1.6522506475448608} -08/30/2021 15:05:45 - INFO - __main__ - Step 10845: {'lr': 0.0004956075388272789, 'samples': 2082240, 'steps': 10844, 'loss/train': 1.83405601978302} -08/30/2021 15:05:46 - INFO - __main__ - Step 10846: {'lr': 0.0004956065483709348, 'samples': 2082432, 'steps': 10845, 'loss/train': 1.6893846988677979} -08/30/2021 15:05:47 - INFO - __main__ - Step 10847: {'lr': 0.0004956055578039241, 'samples': 2082624, 'steps': 10846, 'loss/train': 1.9587448835372925} -08/30/2021 15:05:48 - INFO - __main__ - Step 10848: {'lr': 0.0004956045671262475, 'samples': 2082816, 'steps': 10847, 'loss/train': 1.714124083518982} -08/30/2021 15:05:48 - INFO - __main__ - Step 10849: {'lr': 0.0004956035763379051, 'samples': 2083008, 'steps': 10848, 'loss/train': 1.9753811359405518} -08/30/2021 15:05:48 - INFO - __main__ - Step 10850: {'lr': 0.0004956025854388976, 'samples': 2083200, 'steps': 10849, 'loss/train': 1.519775152206421} -08/30/2021 15:05:49 - INFO - __main__ - Step 10851: {'lr': 0.0004956015944292253, 'samples': 2083392, 'steps': 10850, 'loss/train': 2.0994579792022705} -08/30/2021 15:05:49 - INFO - __main__ - Step 10852: {'lr': 0.0004956006033088888, 'samples': 2083584, 'steps': 10851, 'loss/train': 1.41232430934906} -08/30/2021 15:05:50 - INFO - __main__ - Step 10853: {'lr': 0.0004955996120778884, 'samples': 2083776, 'steps': 10852, 'loss/train': 1.8957570791244507} -08/30/2021 15:05:51 - INFO - __main__ - Step 10854: {'lr': 0.0004955986207362246, 'samples': 2083968, 'steps': 10853, 'loss/train': 1.628380537033081} -08/30/2021 15:05:51 - INFO - __main__ - Step 10855: {'lr': 0.0004955976292838979, 'samples': 2084160, 'steps': 10854, 'loss/train': 1.215693473815918} -08/30/2021 15:05:52 - INFO - __main__ - Step 10856: {'lr': 0.0004955966377209086, 'samples': 2084352, 'steps': 10855, 'loss/train': 2.0183258056640625} -08/30/2021 15:05:52 - INFO - __main__ - Step 10857: {'lr': 0.0004955956460472573, 'samples': 2084544, 'steps': 10856, 'loss/train': 1.1334675550460815} -08/30/2021 15:05:53 - INFO - __main__ - Step 10858: {'lr': 0.0004955946542629444, 'samples': 2084736, 'steps': 10857, 'loss/train': 2.163619041442871} -08/30/2021 15:05:54 - INFO - __main__ - Step 10859: {'lr': 0.0004955936623679703, 'samples': 2084928, 'steps': 10858, 'loss/train': 2.0362842082977295} -08/30/2021 15:05:54 - INFO - __main__ - Step 10860: {'lr': 0.0004955926703623356, 'samples': 2085120, 'steps': 10859, 'loss/train': 2.509580373764038} -08/30/2021 15:05:55 - INFO - __main__ - Step 10861: {'lr': 0.0004955916782460405, 'samples': 2085312, 'steps': 10860, 'loss/train': 1.321964144706726} -08/30/2021 15:05:55 - INFO - __main__ - Step 10862: {'lr': 0.0004955906860190857, 'samples': 2085504, 'steps': 10861, 'loss/train': 1.9093550443649292} -08/30/2021 15:05:56 - INFO - __main__ - Step 10863: {'lr': 0.0004955896936814714, 'samples': 2085696, 'steps': 10862, 'loss/train': 1.8934608697891235} -08/30/2021 15:05:57 - INFO - __main__ - Step 10864: {'lr': 0.0004955887012331982, 'samples': 2085888, 'steps': 10863, 'loss/train': 1.4681134223937988} -08/30/2021 15:05:57 - INFO - __main__ - Step 10865: {'lr': 0.0004955877086742666, 'samples': 2086080, 'steps': 10864, 'loss/train': 1.4558637142181396} -08/30/2021 15:05:58 - INFO - __main__ - Step 10866: {'lr': 0.0004955867160046769, 'samples': 2086272, 'steps': 10865, 'loss/train': 1.5033838748931885} -08/30/2021 15:05:58 - INFO - __main__ - Step 10867: {'lr': 0.0004955857232244297, 'samples': 2086464, 'steps': 10866, 'loss/train': 1.7385921478271484} -08/30/2021 15:05:59 - INFO - __main__ - Step 10868: {'lr': 0.0004955847303335253, 'samples': 2086656, 'steps': 10867, 'loss/train': 1.893783450126648} -08/30/2021 15:06:00 - INFO - __main__ - Step 10869: {'lr': 0.0004955837373319641, 'samples': 2086848, 'steps': 10868, 'loss/train': 1.7365012168884277} -08/30/2021 15:06:00 - INFO - __main__ - Step 10870: {'lr': 0.0004955827442197468, 'samples': 2087040, 'steps': 10869, 'loss/train': 2.0834131240844727} -08/30/2021 15:06:00 - INFO - __main__ - Step 10871: {'lr': 0.0004955817509968737, 'samples': 2087232, 'steps': 10870, 'loss/train': 1.402953863143921} -08/30/2021 15:06:01 - INFO - __main__ - Step 10872: {'lr': 0.0004955807576633452, 'samples': 2087424, 'steps': 10871, 'loss/train': 1.8041726350784302} -08/30/2021 15:06:02 - INFO - __main__ - Step 10873: {'lr': 0.0004955797642191618, 'samples': 2087616, 'steps': 10872, 'loss/train': 1.912751317024231} -08/30/2021 15:06:03 - INFO - __main__ - Step 10874: {'lr': 0.000495578770664324, 'samples': 2087808, 'steps': 10873, 'loss/train': 1.5906606912612915} -08/30/2021 15:06:03 - INFO - __main__ - Step 10875: {'lr': 0.0004955777769988322, 'samples': 2088000, 'steps': 10874, 'loss/train': 1.8554505109786987} -08/30/2021 15:06:04 - INFO - __main__ - Step 10876: {'lr': 0.0004955767832226868, 'samples': 2088192, 'steps': 10875, 'loss/train': 1.8426434993743896} -08/30/2021 15:06:04 - INFO - __main__ - Step 10877: {'lr': 0.0004955757893358884, 'samples': 2088384, 'steps': 10876, 'loss/train': 1.6191202402114868} -08/30/2021 15:06:05 - INFO - __main__ - Step 10878: {'lr': 0.0004955747953384372, 'samples': 2088576, 'steps': 10877, 'loss/train': 1.8443479537963867} -08/30/2021 15:06:06 - INFO - __main__ - Step 10879: {'lr': 0.0004955738012303338, 'samples': 2088768, 'steps': 10878, 'loss/train': 1.4832504987716675} -08/30/2021 15:06:06 - INFO - __main__ - Step 10880: {'lr': 0.0004955728070115787, 'samples': 2088960, 'steps': 10879, 'loss/train': 1.53128981590271} -08/30/2021 15:06:07 - INFO - __main__ - Step 10881: {'lr': 0.0004955718126821722, 'samples': 2089152, 'steps': 10880, 'loss/train': 1.054487943649292} -08/30/2021 15:06:07 - INFO - __main__ - Step 10882: {'lr': 0.0004955708182421149, 'samples': 2089344, 'steps': 10881, 'loss/train': 1.8855987787246704} -08/30/2021 15:06:07 - INFO - __main__ - Step 10883: {'lr': 0.0004955698236914071, 'samples': 2089536, 'steps': 10882, 'loss/train': 1.1770527362823486} -08/30/2021 15:06:09 - INFO - __main__ - Step 10884: {'lr': 0.0004955688290300494, 'samples': 2089728, 'steps': 10883, 'loss/train': 2.011972427368164} -08/30/2021 15:06:09 - INFO - __main__ - Step 10885: {'lr': 0.0004955678342580421, 'samples': 2089920, 'steps': 10884, 'loss/train': 1.6012986898422241} -08/30/2021 15:06:10 - INFO - __main__ - Step 10886: {'lr': 0.0004955668393753858, 'samples': 2090112, 'steps': 10885, 'loss/train': 1.8417295217514038} -08/30/2021 15:06:10 - INFO - __main__ - Step 10887: {'lr': 0.0004955658443820809, 'samples': 2090304, 'steps': 10886, 'loss/train': 1.6421327590942383} -08/30/2021 15:06:10 - INFO - __main__ - Step 10888: {'lr': 0.0004955648492781277, 'samples': 2090496, 'steps': 10887, 'loss/train': 1.7306485176086426} -08/30/2021 15:06:12 - INFO - __main__ - Step 10889: {'lr': 0.0004955638540635269, 'samples': 2090688, 'steps': 10888, 'loss/train': 2.8198189735412598} -08/30/2021 15:06:13 - INFO - __main__ - Step 10890: {'lr': 0.0004955628587382788, 'samples': 2090880, 'steps': 10889, 'loss/train': 1.3991672992706299} -08/30/2021 15:06:13 - INFO - __main__ - Step 10891: {'lr': 0.0004955618633023837, 'samples': 2091072, 'steps': 10890, 'loss/train': 1.8839037418365479} -08/30/2021 15:06:14 - INFO - __main__ - Step 10892: {'lr': 0.0004955608677558424, 'samples': 2091264, 'steps': 10891, 'loss/train': 2.153796434402466} -08/30/2021 15:06:14 - INFO - __main__ - Step 10893: {'lr': 0.0004955598720986551, 'samples': 2091456, 'steps': 10892, 'loss/train': 1.9644924402236938} -08/30/2021 15:06:16 - INFO - __main__ - Step 10894: {'lr': 0.0004955588763308223, 'samples': 2091648, 'steps': 10893, 'loss/train': 1.9918394088745117} -08/30/2021 15:06:16 - INFO - __main__ - Step 10895: {'lr': 0.0004955578804523445, 'samples': 2091840, 'steps': 10894, 'loss/train': 1.637222170829773} -08/30/2021 15:06:16 - INFO - __main__ - Step 10896: {'lr': 0.000495556884463222, 'samples': 2092032, 'steps': 10895, 'loss/train': 1.9392727613449097} -08/30/2021 15:06:17 - INFO - __main__ - Step 10897: {'lr': 0.0004955558883634555, 'samples': 2092224, 'steps': 10896, 'loss/train': 1.738175392150879} -08/30/2021 15:06:17 - INFO - __main__ - Step 10898: {'lr': 0.0004955548921530452, 'samples': 2092416, 'steps': 10897, 'loss/train': 1.5670162439346313} -08/30/2021 15:06:19 - INFO - __main__ - Step 10899: {'lr': 0.0004955538958319917, 'samples': 2092608, 'steps': 10898, 'loss/train': 1.8713189363479614} -08/30/2021 15:06:19 - INFO - __main__ - Step 10900: {'lr': 0.0004955528994002954, 'samples': 2092800, 'steps': 10899, 'loss/train': 0.1321968138217926} -08/30/2021 15:06:20 - INFO - __main__ - Step 10901: {'lr': 0.0004955519028579568, 'samples': 2092992, 'steps': 10900, 'loss/train': 1.6792168617248535} -08/30/2021 15:06:20 - INFO - __main__ - Step 10902: {'lr': 0.0004955509062049763, 'samples': 2093184, 'steps': 10901, 'loss/train': 1.908568263053894} -08/30/2021 15:06:20 - INFO - __main__ - Step 10903: {'lr': 0.0004955499094413542, 'samples': 2093376, 'steps': 10902, 'loss/train': 1.5589418411254883} -08/30/2021 15:06:22 - INFO - __main__ - Step 10904: {'lr': 0.0004955489125670912, 'samples': 2093568, 'steps': 10903, 'loss/train': 1.966796875} -08/30/2021 15:06:23 - INFO - __main__ - Step 10905: {'lr': 0.0004955479155821877, 'samples': 2093760, 'steps': 10904, 'loss/train': 1.5975741147994995} -08/30/2021 15:06:23 - INFO - __main__ - Step 10906: {'lr': 0.000495546918486644, 'samples': 2093952, 'steps': 10905, 'loss/train': 2.3270199298858643} -08/30/2021 15:06:23 - INFO - __main__ - Step 10907: {'lr': 0.0004955459212804607, 'samples': 2094144, 'steps': 10906, 'loss/train': 1.711856484413147} -08/30/2021 15:06:24 - INFO - __main__ - Step 10908: {'lr': 0.0004955449239636382, 'samples': 2094336, 'steps': 10907, 'loss/train': 0.9151084423065186} -08/30/2021 15:06:24 - INFO - __main__ - Step 10909: {'lr': 0.000495543926536177, 'samples': 2094528, 'steps': 10908, 'loss/train': 0.19393007457256317} -08/30/2021 15:06:26 - INFO - __main__ - Step 10910: {'lr': 0.0004955429289980774, 'samples': 2094720, 'steps': 10909, 'loss/train': 1.8715108633041382} -08/30/2021 15:06:26 - INFO - __main__ - Step 10911: {'lr': 0.00049554193134934, 'samples': 2094912, 'steps': 10910, 'loss/train': 1.3734896183013916} -08/30/2021 15:06:26 - INFO - __main__ - Step 10912: {'lr': 0.0004955409335899651, 'samples': 2095104, 'steps': 10911, 'loss/train': 1.781131625175476} -08/30/2021 15:06:27 - INFO - __main__ - Step 10913: {'lr': 0.0004955399357199534, 'samples': 2095296, 'steps': 10912, 'loss/train': 1.7393033504486084} -08/30/2021 15:06:27 - INFO - __main__ - Step 10914: {'lr': 0.0004955389377393051, 'samples': 2095488, 'steps': 10913, 'loss/train': 1.8202251195907593} -08/30/2021 15:06:29 - INFO - __main__ - Step 10915: {'lr': 0.0004955379396480207, 'samples': 2095680, 'steps': 10914, 'loss/train': 1.7318600416183472} -08/30/2021 15:06:29 - INFO - __main__ - Step 10916: {'lr': 0.0004955369414461007, 'samples': 2095872, 'steps': 10915, 'loss/train': 1.7824913263320923} -08/30/2021 15:06:29 - INFO - __main__ - Step 10917: {'lr': 0.0004955359431335456, 'samples': 2096064, 'steps': 10916, 'loss/train': 1.9956517219543457} -08/30/2021 15:06:30 - INFO - __main__ - Step 10918: {'lr': 0.0004955349447103559, 'samples': 2096256, 'steps': 10917, 'loss/train': 1.4670724868774414} -08/30/2021 15:06:30 - INFO - __main__ - Step 10919: {'lr': 0.0004955339461765318, 'samples': 2096448, 'steps': 10918, 'loss/train': 1.981136441230774} -08/30/2021 15:06:31 - INFO - __main__ - Step 10920: {'lr': 0.0004955329475320739, 'samples': 2096640, 'steps': 10919, 'loss/train': 1.8170489072799683} -08/30/2021 15:06:32 - INFO - __main__ - Step 10921: {'lr': 0.0004955319487769827, 'samples': 2096832, 'steps': 10920, 'loss/train': 1.0184874534606934} -08/30/2021 15:06:33 - INFO - __main__ - Step 10922: {'lr': 0.0004955309499112586, 'samples': 2097024, 'steps': 10921, 'loss/train': 1.5790601968765259} -08/30/2021 15:06:33 - INFO - __main__ - Step 10923: {'lr': 0.000495529950934902, 'samples': 2097216, 'steps': 10922, 'loss/train': 0.7173398733139038} -08/30/2021 15:06:34 - INFO - __main__ - Step 10924: {'lr': 0.0004955289518479134, 'samples': 2097408, 'steps': 10923, 'loss/train': 0.11908797174692154} -08/30/2021 15:06:34 - INFO - __main__ - Step 10925: {'lr': 0.0004955279526502931, 'samples': 2097600, 'steps': 10924, 'loss/train': 1.7190030813217163} -08/30/2021 15:06:34 - INFO - __main__ - Step 10926: {'lr': 0.0004955269533420419, 'samples': 2097792, 'steps': 10925, 'loss/train': 1.594948172569275} -08/30/2021 15:06:36 - INFO - __main__ - Step 10927: {'lr': 0.00049552595392316, 'samples': 2097984, 'steps': 10926, 'loss/train': 1.4549708366394043} -08/30/2021 15:06:36 - INFO - __main__ - Step 10928: {'lr': 0.0004955249543936479, 'samples': 2098176, 'steps': 10927, 'loss/train': 1.8931047916412354} -08/30/2021 15:06:37 - INFO - __main__ - Step 10929: {'lr': 0.000495523954753506, 'samples': 2098368, 'steps': 10928, 'loss/train': 1.5164992809295654} -08/30/2021 15:06:37 - INFO - __main__ - Step 10930: {'lr': 0.0004955229550027347, 'samples': 2098560, 'steps': 10929, 'loss/train': 1.9918193817138672} -08/30/2021 15:06:37 - INFO - __main__ - Step 10931: {'lr': 0.0004955219551413347, 'samples': 2098752, 'steps': 10930, 'loss/train': 1.8009387254714966} -08/30/2021 15:06:39 - INFO - __main__ - Step 10932: {'lr': 0.0004955209551693063, 'samples': 2098944, 'steps': 10931, 'loss/train': 1.9979090690612793} -08/30/2021 15:06:39 - INFO - __main__ - Step 10933: {'lr': 0.0004955199550866498, 'samples': 2099136, 'steps': 10932, 'loss/train': 1.3799176216125488} -08/30/2021 15:06:40 - INFO - __main__ - Step 10934: {'lr': 0.000495518954893366, 'samples': 2099328, 'steps': 10933, 'loss/train': 2.3226423263549805} -08/30/2021 15:06:40 - INFO - __main__ - Step 10935: {'lr': 0.000495517954589455, 'samples': 2099520, 'steps': 10934, 'loss/train': 1.6888556480407715} -08/30/2021 15:06:40 - INFO - __main__ - Step 10936: {'lr': 0.0004955169541749173, 'samples': 2099712, 'steps': 10935, 'loss/train': 1.7350400686264038} -08/30/2021 15:06:42 - INFO - __main__ - Step 10937: {'lr': 0.0004955159536497536, 'samples': 2099904, 'steps': 10936, 'loss/train': 1.9043257236480713} -08/30/2021 15:06:42 - INFO - __main__ - Step 10938: {'lr': 0.0004955149530139643, 'samples': 2100096, 'steps': 10937, 'loss/train': 1.8911716938018799} -08/30/2021 15:06:43 - INFO - __main__ - Step 10939: {'lr': 0.0004955139522675496, 'samples': 2100288, 'steps': 10938, 'loss/train': 1.575310468673706} -08/30/2021 15:06:43 - INFO - __main__ - Step 10940: {'lr': 0.0004955129514105101, 'samples': 2100480, 'steps': 10939, 'loss/train': 2.421666383743286} -08/30/2021 15:06:43 - INFO - __main__ - Step 10941: {'lr': 0.0004955119504428464, 'samples': 2100672, 'steps': 10940, 'loss/train': 1.5355712175369263} -08/30/2021 15:06:45 - INFO - __main__ - Step 10942: {'lr': 0.0004955109493645587, 'samples': 2100864, 'steps': 10941, 'loss/train': 1.5693624019622803} -08/30/2021 15:06:46 - INFO - __main__ - Step 10943: {'lr': 0.0004955099481756475, 'samples': 2101056, 'steps': 10942, 'loss/train': 2.2295072078704834} -08/30/2021 15:06:46 - INFO - __main__ - Step 10944: {'lr': 0.0004955089468761133, 'samples': 2101248, 'steps': 10943, 'loss/train': 2.020923614501953} -08/30/2021 15:06:47 - INFO - __main__ - Step 10945: {'lr': 0.0004955079454659567, 'samples': 2101440, 'steps': 10944, 'loss/train': 1.5080363750457764} -08/30/2021 15:06:47 - INFO - __main__ - Step 10946: {'lr': 0.0004955069439451778, 'samples': 2101632, 'steps': 10945, 'loss/train': 1.6412315368652344} -08/30/2021 15:06:48 - INFO - __main__ - Step 10947: {'lr': 0.0004955059423137774, 'samples': 2101824, 'steps': 10946, 'loss/train': 2.3839101791381836} -08/30/2021 15:06:49 - INFO - __main__ - Step 10948: {'lr': 0.0004955049405717558, 'samples': 2102016, 'steps': 10947, 'loss/train': 1.5545134544372559} -08/30/2021 15:06:49 - INFO - __main__ - Step 10949: {'lr': 0.0004955039387191135, 'samples': 2102208, 'steps': 10948, 'loss/train': 2.256082773208618} -08/30/2021 15:06:50 - INFO - __main__ - Step 10950: {'lr': 0.0004955029367558508, 'samples': 2102400, 'steps': 10949, 'loss/train': 2.0131309032440186} -08/30/2021 15:06:50 - INFO - __main__ - Step 10951: {'lr': 0.0004955019346819684, 'samples': 2102592, 'steps': 10950, 'loss/train': 1.2138655185699463} -08/30/2021 15:06:52 - INFO - __main__ - Step 10952: {'lr': 0.0004955009324974666, 'samples': 2102784, 'steps': 10951, 'loss/train': 1.7613660097122192} -08/30/2021 15:06:53 - INFO - __main__ - Step 10953: {'lr': 0.0004954999302023458, 'samples': 2102976, 'steps': 10952, 'loss/train': 2.2590949535369873} -08/30/2021 15:06:53 - INFO - __main__ - Step 10954: {'lr': 0.0004954989277966064, 'samples': 2103168, 'steps': 10953, 'loss/train': 0.3394987881183624} -08/30/2021 15:06:53 - INFO - __main__ - Step 10955: {'lr': 0.0004954979252802491, 'samples': 2103360, 'steps': 10954, 'loss/train': 1.7576954364776611} -08/30/2021 15:06:54 - INFO - __main__ - Step 10956: {'lr': 0.0004954969226532743, 'samples': 2103552, 'steps': 10955, 'loss/train': 2.596856117248535} -08/30/2021 15:06:54 - INFO - __main__ - Step 10957: {'lr': 0.0004954959199156824, 'samples': 2103744, 'steps': 10956, 'loss/train': 2.258389472961426} -08/30/2021 15:06:54 - INFO - __main__ - Step 10958: {'lr': 0.0004954949170674736, 'samples': 2103936, 'steps': 10957, 'loss/train': 1.8016879558563232} -08/30/2021 15:06:56 - INFO - __main__ - Step 10959: {'lr': 0.0004954939141086488, 'samples': 2104128, 'steps': 10958, 'loss/train': 1.6330764293670654} -08/30/2021 15:06:56 - INFO - __main__ - Step 10960: {'lr': 0.0004954929110392081, 'samples': 2104320, 'steps': 10959, 'loss/train': 1.2186224460601807} -08/30/2021 15:06:57 - INFO - __main__ - Step 10961: {'lr': 0.0004954919078591521, 'samples': 2104512, 'steps': 10960, 'loss/train': 1.5763354301452637} -08/30/2021 15:06:57 - INFO - __main__ - Step 10962: {'lr': 0.0004954909045684812, 'samples': 2104704, 'steps': 10961, 'loss/train': 2.034541130065918} -08/30/2021 15:06:58 - INFO - __main__ - Step 10963: {'lr': 0.000495489901167196, 'samples': 2104896, 'steps': 10962, 'loss/train': 1.691429615020752} -08/30/2021 15:06:59 - INFO - __main__ - Step 10964: {'lr': 0.0004954888976552968, 'samples': 2105088, 'steps': 10963, 'loss/train': 1.9321132898330688} -08/30/2021 15:07:00 - INFO - __main__ - Step 10965: {'lr': 0.0004954878940327841, 'samples': 2105280, 'steps': 10964, 'loss/train': 2.259718418121338} -08/30/2021 15:07:00 - INFO - __main__ - Step 10966: {'lr': 0.0004954868902996582, 'samples': 2105472, 'steps': 10965, 'loss/train': 2.1547393798828125} -08/30/2021 15:07:00 - INFO - __main__ - Step 10967: {'lr': 0.0004954858864559199, 'samples': 2105664, 'steps': 10966, 'loss/train': 1.9617149829864502} -08/30/2021 15:07:01 - INFO - __main__ - Step 10968: {'lr': 0.0004954848825015694, 'samples': 2105856, 'steps': 10967, 'loss/train': 1.6756328344345093} -08/30/2021 15:07:02 - INFO - __main__ - Step 10969: {'lr': 0.0004954838784366071, 'samples': 2106048, 'steps': 10968, 'loss/train': 0.9359736442565918} -08/30/2021 15:07:02 - INFO - __main__ - Step 10970: {'lr': 0.0004954828742610336, 'samples': 2106240, 'steps': 10969, 'loss/train': 2.3840291500091553} -08/30/2021 15:07:03 - INFO - __main__ - Step 10971: {'lr': 0.0004954818699748493, 'samples': 2106432, 'steps': 10970, 'loss/train': 1.601196527481079} -08/30/2021 15:07:03 - INFO - __main__ - Step 10972: {'lr': 0.0004954808655780546, 'samples': 2106624, 'steps': 10971, 'loss/train': 1.8679625988006592} -08/30/2021 15:07:03 - INFO - __main__ - Step 10973: {'lr': 0.0004954798610706502, 'samples': 2106816, 'steps': 10972, 'loss/train': 1.8949376344680786} -08/30/2021 15:07:04 - INFO - __main__ - Step 10974: {'lr': 0.0004954788564526362, 'samples': 2107008, 'steps': 10973, 'loss/train': 1.9796686172485352} -08/30/2021 15:07:05 - INFO - __main__ - Step 10975: {'lr': 0.0004954778517240133, 'samples': 2107200, 'steps': 10974, 'loss/train': 1.6100986003875732} -08/30/2021 15:07:06 - INFO - __main__ - Step 10976: {'lr': 0.0004954768468847818, 'samples': 2107392, 'steps': 10975, 'loss/train': 1.5986541509628296} -08/30/2021 15:07:06 - INFO - __main__ - Step 10977: {'lr': 0.0004954758419349422, 'samples': 2107584, 'steps': 10976, 'loss/train': 2.278153896331787} -08/30/2021 15:07:07 - INFO - __main__ - Step 10978: {'lr': 0.000495474836874495, 'samples': 2107776, 'steps': 10977, 'loss/train': 1.215874433517456} -08/30/2021 15:07:07 - INFO - __main__ - Step 10979: {'lr': 0.0004954738317034408, 'samples': 2107968, 'steps': 10978, 'loss/train': 2.0640335083007812} -08/30/2021 15:07:08 - INFO - __main__ - Step 10980: {'lr': 0.0004954728264217796, 'samples': 2108160, 'steps': 10979, 'loss/train': 2.2727065086364746} -08/30/2021 15:07:09 - INFO - __main__ - Step 10981: {'lr': 0.0004954718210295123, 'samples': 2108352, 'steps': 10980, 'loss/train': 1.4322324991226196} -08/30/2021 15:07:09 - INFO - __main__ - Step 10982: {'lr': 0.0004954708155266392, 'samples': 2108544, 'steps': 10981, 'loss/train': 1.4696931838989258} -08/30/2021 15:07:09 - INFO - __main__ - Step 10983: {'lr': 0.0004954698099131606, 'samples': 2108736, 'steps': 10982, 'loss/train': 1.9921832084655762} -08/30/2021 15:07:10 - INFO - __main__ - Step 10984: {'lr': 0.0004954688041890772, 'samples': 2108928, 'steps': 10983, 'loss/train': 1.360575795173645} -08/30/2021 15:07:12 - INFO - __main__ - Step 10985: {'lr': 0.0004954677983543893, 'samples': 2109120, 'steps': 10984, 'loss/train': 1.0472240447998047} -08/30/2021 15:07:12 - INFO - __main__ - Step 10986: {'lr': 0.0004954667924090974, 'samples': 2109312, 'steps': 10985, 'loss/train': 2.046184778213501} -08/30/2021 15:07:13 - INFO - __main__ - Step 10987: {'lr': 0.000495465786353202, 'samples': 2109504, 'steps': 10986, 'loss/train': 0.4741063117980957} -08/30/2021 15:07:13 - INFO - __main__ - Step 10988: {'lr': 0.0004954647801867035, 'samples': 2109696, 'steps': 10987, 'loss/train': 1.2116178274154663} -08/30/2021 15:07:13 - INFO - __main__ - Step 10989: {'lr': 0.0004954637739096023, 'samples': 2109888, 'steps': 10988, 'loss/train': 1.4974844455718994} -08/30/2021 15:07:14 - INFO - __main__ - Step 10990: {'lr': 0.0004954627675218989, 'samples': 2110080, 'steps': 10989, 'loss/train': 0.41842901706695557} -08/30/2021 15:07:15 - INFO - __main__ - Step 10991: {'lr': 0.0004954617610235939, 'samples': 2110272, 'steps': 10990, 'loss/train': 0.5526917576789856} -08/30/2021 15:07:16 - INFO - __main__ - Step 10992: {'lr': 0.0004954607544146875, 'samples': 2110464, 'steps': 10991, 'loss/train': 1.8407448530197144} -08/30/2021 15:07:16 - INFO - __main__ - Step 10993: {'lr': 0.0004954597476951804, 'samples': 2110656, 'steps': 10992, 'loss/train': 2.113936185836792} -08/30/2021 15:07:16 - INFO - __main__ - Step 10994: {'lr': 0.0004954587408650727, 'samples': 2110848, 'steps': 10993, 'loss/train': 1.3653898239135742} -08/30/2021 15:07:17 - INFO - __main__ - Step 10995: {'lr': 0.0004954577339243652, 'samples': 2111040, 'steps': 10994, 'loss/train': 1.7567837238311768} -08/30/2021 15:07:19 - INFO - __main__ - Step 10996: {'lr': 0.0004954567268730582, 'samples': 2111232, 'steps': 10995, 'loss/train': 2.195679187774658} -08/30/2021 15:07:19 - INFO - __main__ - Step 10997: {'lr': 0.0004954557197111522, 'samples': 2111424, 'steps': 10996, 'loss/train': 1.7838292121887207} -08/30/2021 15:07:20 - INFO - __main__ - Step 10998: {'lr': 0.0004954547124386477, 'samples': 2111616, 'steps': 10997, 'loss/train': 1.5152627229690552} -08/30/2021 15:07:20 - INFO - __main__ - Step 10999: {'lr': 0.0004954537050555451, 'samples': 2111808, 'steps': 10998, 'loss/train': 1.8554701805114746} -08/30/2021 15:07:20 - INFO - __main__ - Step 11000: {'lr': 0.0004954526975618447, 'samples': 2112000, 'steps': 10999, 'loss/train': 2.9708855152130127} -08/30/2021 15:07:22 - INFO - __main__ - Step 11001: {'lr': 0.0004954516899575473, 'samples': 2112192, 'steps': 11000, 'loss/train': 2.17421817779541} -08/30/2021 15:07:22 - INFO - __main__ - Step 11002: {'lr': 0.000495450682242653, 'samples': 2112384, 'steps': 11001, 'loss/train': 1.5058897733688354} -08/30/2021 15:07:23 - INFO - __main__ - Step 11003: {'lr': 0.0004954496744171624, 'samples': 2112576, 'steps': 11002, 'loss/train': 1.8715373277664185} -08/30/2021 15:07:23 - INFO - __main__ - Step 11004: {'lr': 0.0004954486664810762, 'samples': 2112768, 'steps': 11003, 'loss/train': 1.563541054725647} -08/30/2021 15:07:23 - INFO - __main__ - Step 11005: {'lr': 0.0004954476584343945, 'samples': 2112960, 'steps': 11004, 'loss/train': 1.8025926351547241} -08/30/2021 15:07:24 - INFO - __main__ - Step 11006: {'lr': 0.0004954466502771178, 'samples': 2113152, 'steps': 11005, 'loss/train': 2.0239102840423584} -08/30/2021 15:07:25 - INFO - __main__ - Step 11007: {'lr': 0.0004954456420092466, 'samples': 2113344, 'steps': 11006, 'loss/train': 1.1946940422058105} -08/30/2021 15:07:26 - INFO - __main__ - Step 11008: {'lr': 0.0004954446336307814, 'samples': 2113536, 'steps': 11007, 'loss/train': 2.891005277633667} -08/30/2021 15:07:26 - INFO - __main__ - Step 11009: {'lr': 0.0004954436251417227, 'samples': 2113728, 'steps': 11008, 'loss/train': 2.0502946376800537} -08/30/2021 15:07:27 - INFO - __main__ - Step 11010: {'lr': 0.0004954426165420709, 'samples': 2113920, 'steps': 11009, 'loss/train': 2.938062906265259} -08/30/2021 15:07:27 - INFO - __main__ - Step 11011: {'lr': 0.0004954416078318263, 'samples': 2114112, 'steps': 11010, 'loss/train': 1.9612449407577515} -08/30/2021 15:07:29 - INFO - __main__ - Step 11012: {'lr': 0.0004954405990109897, 'samples': 2114304, 'steps': 11011, 'loss/train': 1.929292917251587} -08/30/2021 15:07:29 - INFO - __main__ - Step 11013: {'lr': 0.0004954395900795611, 'samples': 2114496, 'steps': 11012, 'loss/train': 1.0514862537384033} -08/30/2021 15:07:30 - INFO - __main__ - Step 11014: {'lr': 0.0004954385810375415, 'samples': 2114688, 'steps': 11013, 'loss/train': 1.8498998880386353} -08/30/2021 15:07:30 - INFO - __main__ - Step 11015: {'lr': 0.0004954375718849308, 'samples': 2114880, 'steps': 11014, 'loss/train': 1.6812744140625} -08/30/2021 15:07:30 - INFO - __main__ - Step 11016: {'lr': 0.0004954365626217299, 'samples': 2115072, 'steps': 11015, 'loss/train': 1.5532358884811401} -08/30/2021 15:07:31 - INFO - __main__ - Step 11017: {'lr': 0.0004954355532479391, 'samples': 2115264, 'steps': 11016, 'loss/train': 1.8510565757751465} -08/30/2021 15:07:32 - INFO - __main__ - Step 11018: {'lr': 0.0004954345437635587, 'samples': 2115456, 'steps': 11017, 'loss/train': 1.8996973037719727} -08/30/2021 15:07:33 - INFO - __main__ - Step 11019: {'lr': 0.0004954335341685893, 'samples': 2115648, 'steps': 11018, 'loss/train': 1.0813733339309692} -08/30/2021 15:07:33 - INFO - __main__ - Step 11020: {'lr': 0.0004954325244630315, 'samples': 2115840, 'steps': 11019, 'loss/train': 0.32894089818000793} -08/30/2021 15:07:33 - INFO - __main__ - Step 11021: {'lr': 0.0004954315146468854, 'samples': 2116032, 'steps': 11020, 'loss/train': 2.2050979137420654} -08/30/2021 15:07:34 - INFO - __main__ - Step 11022: {'lr': 0.0004954305047201517, 'samples': 2116224, 'steps': 11021, 'loss/train': 1.703669548034668} -08/30/2021 15:07:36 - INFO - __main__ - Step 11023: {'lr': 0.0004954294946828308, 'samples': 2116416, 'steps': 11022, 'loss/train': 1.627677083015442} -08/30/2021 15:07:36 - INFO - __main__ - Step 11024: {'lr': 0.0004954284845349232, 'samples': 2116608, 'steps': 11023, 'loss/train': 2.1991710662841797} -08/30/2021 15:07:36 - INFO - __main__ - Step 11025: {'lr': 0.0004954274742764292, 'samples': 2116800, 'steps': 11024, 'loss/train': 2.265136957168579} -08/30/2021 15:07:37 - INFO - __main__ - Step 11026: {'lr': 0.0004954264639073495, 'samples': 2116992, 'steps': 11025, 'loss/train': 1.7266194820404053} -08/30/2021 15:07:37 - INFO - __main__ - Step 11027: {'lr': 0.0004954254534276843, 'samples': 2117184, 'steps': 11026, 'loss/train': 1.9154466390609741} -08/30/2021 15:07:38 - INFO - __main__ - Step 11028: {'lr': 0.0004954244428374343, 'samples': 2117376, 'steps': 11027, 'loss/train': 2.7888379096984863} -08/30/2021 15:07:39 - INFO - __main__ - Step 11029: {'lr': 0.0004954234321365998, 'samples': 2117568, 'steps': 11028, 'loss/train': 2.136707305908203} -08/30/2021 15:07:39 - INFO - __main__ - Step 11030: {'lr': 0.0004954224213251813, 'samples': 2117760, 'steps': 11029, 'loss/train': 1.9650870561599731} -08/30/2021 15:07:40 - INFO - __main__ - Step 11031: {'lr': 0.0004954214104031791, 'samples': 2117952, 'steps': 11030, 'loss/train': 1.2592624425888062} -08/30/2021 15:07:40 - INFO - __main__ - Step 11032: {'lr': 0.0004954203993705939, 'samples': 2118144, 'steps': 11031, 'loss/train': 1.9525206089019775} -08/30/2021 15:07:40 - INFO - __main__ - Step 11033: {'lr': 0.0004954193882274261, 'samples': 2118336, 'steps': 11032, 'loss/train': 2.9623115062713623} -08/30/2021 15:07:42 - INFO - __main__ - Step 11034: {'lr': 0.000495418376973676, 'samples': 2118528, 'steps': 11033, 'loss/train': 1.8920893669128418} -08/30/2021 15:07:42 - INFO - __main__ - Step 11035: {'lr': 0.0004954173656093443, 'samples': 2118720, 'steps': 11034, 'loss/train': 2.404442071914673} -08/30/2021 15:07:43 - INFO - __main__ - Step 11036: {'lr': 0.0004954163541344312, 'samples': 2118912, 'steps': 11035, 'loss/train': 2.047079563140869} -08/30/2021 15:07:43 - INFO - __main__ - Step 11037: {'lr': 0.0004954153425489374, 'samples': 2119104, 'steps': 11036, 'loss/train': 1.9804679155349731} -08/30/2021 15:07:43 - INFO - __main__ - Step 11038: {'lr': 0.0004954143308528631, 'samples': 2119296, 'steps': 11037, 'loss/train': 1.642622947692871} -08/30/2021 15:07:45 - INFO - __main__ - Step 11039: {'lr': 0.000495413319046209, 'samples': 2119488, 'steps': 11038, 'loss/train': 1.897440791130066} -08/30/2021 15:07:45 - INFO - __main__ - Step 11040: {'lr': 0.0004954123071289754, 'samples': 2119680, 'steps': 11039, 'loss/train': 2.106625556945801} -08/30/2021 15:07:46 - INFO - __main__ - Step 11041: {'lr': 0.0004954112951011628, 'samples': 2119872, 'steps': 11040, 'loss/train': 2.0594820976257324} -08/30/2021 15:07:46 - INFO - __main__ - Step 11042: {'lr': 0.0004954102829627717, 'samples': 2120064, 'steps': 11041, 'loss/train': 2.2841925621032715} -08/30/2021 15:07:46 - INFO - __main__ - Step 11043: {'lr': 0.0004954092707138024, 'samples': 2120256, 'steps': 11042, 'loss/train': 1.6776620149612427} -08/30/2021 15:07:48 - INFO - __main__ - Step 11044: {'lr': 0.0004954082583542557, 'samples': 2120448, 'steps': 11043, 'loss/train': 1.779884934425354} -08/30/2021 15:07:48 - INFO - __main__ - Step 11045: {'lr': 0.0004954072458841315, 'samples': 2120640, 'steps': 11044, 'loss/train': 1.9558268785476685} -08/30/2021 15:07:49 - INFO - __main__ - Step 11046: {'lr': 0.0004954062333034308, 'samples': 2120832, 'steps': 11045, 'loss/train': 2.6233487129211426} -08/30/2021 15:07:49 - INFO - __main__ - Step 11047: {'lr': 0.0004954052206121538, 'samples': 2121024, 'steps': 11046, 'loss/train': 2.042098045349121} -08/30/2021 15:07:49 - INFO - __main__ - Step 11048: {'lr': 0.000495404207810301, 'samples': 2121216, 'steps': 11047, 'loss/train': 1.839972972869873} -08/30/2021 15:07:50 - INFO - __main__ - Step 11049: {'lr': 0.0004954031948978729, 'samples': 2121408, 'steps': 11048, 'loss/train': 1.4205790758132935} -08/30/2021 15:07:51 - INFO - __main__ - Step 11050: {'lr': 0.0004954021818748698, 'samples': 2121600, 'steps': 11049, 'loss/train': 2.023576259613037} -08/30/2021 15:07:52 - INFO - __main__ - Step 11051: {'lr': 0.0004954011687412923, 'samples': 2121792, 'steps': 11050, 'loss/train': 2.613823890686035} -08/30/2021 15:07:52 - INFO - __main__ - Step 11052: {'lr': 0.0004954001554971409, 'samples': 2121984, 'steps': 11051, 'loss/train': 1.4308427572250366} -08/30/2021 15:07:53 - INFO - __main__ - Step 11053: {'lr': 0.0004953991421424159, 'samples': 2122176, 'steps': 11052, 'loss/train': 2.029387950897217} -08/30/2021 15:07:53 - INFO - __main__ - Step 11054: {'lr': 0.0004953981286771178, 'samples': 2122368, 'steps': 11053, 'loss/train': 0.22284691035747528} -08/30/2021 15:07:54 - INFO - __main__ - Step 11055: {'lr': 0.0004953971151012471, 'samples': 2122560, 'steps': 11054, 'loss/train': 0.20293185114860535} -08/30/2021 15:07:55 - INFO - __main__ - Step 11056: {'lr': 0.0004953961014148043, 'samples': 2122752, 'steps': 11055, 'loss/train': 1.7698132991790771} -08/30/2021 15:07:56 - INFO - __main__ - Step 11057: {'lr': 0.0004953950876177897, 'samples': 2122944, 'steps': 11056, 'loss/train': 2.290742874145508} -08/30/2021 15:07:56 - INFO - __main__ - Step 11058: {'lr': 0.000495394073710204, 'samples': 2123136, 'steps': 11057, 'loss/train': 1.5787354707717896} -08/30/2021 15:07:57 - INFO - __main__ - Step 11059: {'lr': 0.0004953930596920474, 'samples': 2123328, 'steps': 11058, 'loss/train': 2.0530502796173096} -08/30/2021 15:07:57 - INFO - __main__ - Step 11060: {'lr': 0.0004953920455633206, 'samples': 2123520, 'steps': 11059, 'loss/train': 1.7764960527420044} -08/30/2021 15:07:59 - INFO - __main__ - Step 11061: {'lr': 0.0004953910313240239, 'samples': 2123712, 'steps': 11060, 'loss/train': 2.048180341720581} -08/30/2021 15:07:59 - INFO - __main__ - Step 11062: {'lr': 0.0004953900169741577, 'samples': 2123904, 'steps': 11061, 'loss/train': 1.8457850217819214} -08/30/2021 15:07:59 - INFO - __main__ - Step 11063: {'lr': 0.0004953890025137226, 'samples': 2124096, 'steps': 11062, 'loss/train': 2.0374860763549805} -08/30/2021 15:08:00 - INFO - __main__ - Step 11064: {'lr': 0.000495387987942719, 'samples': 2124288, 'steps': 11063, 'loss/train': 1.988455891609192} -08/30/2021 15:08:00 - INFO - __main__ - Step 11065: {'lr': 0.0004953869732611474, 'samples': 2124480, 'steps': 11064, 'loss/train': 2.169694662094116} -08/30/2021 15:08:02 - INFO - __main__ - Step 11066: {'lr': 0.0004953859584690081, 'samples': 2124672, 'steps': 11065, 'loss/train': 2.019395589828491} -08/30/2021 15:08:02 - INFO - __main__ - Step 11067: {'lr': 0.0004953849435663018, 'samples': 2124864, 'steps': 11066, 'loss/train': 2.0245816707611084} -08/30/2021 15:08:02 - INFO - __main__ - Step 11068: {'lr': 0.0004953839285530287, 'samples': 2125056, 'steps': 11067, 'loss/train': 1.5807219743728638} -08/30/2021 15:08:03 - INFO - __main__ - Step 11069: {'lr': 0.0004953829134291895, 'samples': 2125248, 'steps': 11068, 'loss/train': 2.100602388381958} -08/30/2021 15:08:03 - INFO - __main__ - Step 11070: {'lr': 0.0004953818981947845, 'samples': 2125440, 'steps': 11069, 'loss/train': 2.384111166000366} -08/30/2021 15:08:05 - INFO - __main__ - Step 11071: {'lr': 0.0004953808828498142, 'samples': 2125632, 'steps': 11070, 'loss/train': 1.9089192152023315} -08/30/2021 15:08:05 - INFO - __main__ - Step 11072: {'lr': 0.0004953798673942791, 'samples': 2125824, 'steps': 11071, 'loss/train': 1.695746660232544} -08/30/2021 15:08:05 - INFO - __main__ - Step 11073: {'lr': 0.0004953788518281796, 'samples': 2126016, 'steps': 11072, 'loss/train': 2.089404821395874} -08/30/2021 15:08:06 - INFO - __main__ - Step 11074: {'lr': 0.0004953778361515163, 'samples': 2126208, 'steps': 11073, 'loss/train': 0.22820700705051422} -08/30/2021 15:08:06 - INFO - __main__ - Step 11075: {'lr': 0.0004953768203642893, 'samples': 2126400, 'steps': 11074, 'loss/train': 2.138831377029419} -08/30/2021 15:08:08 - INFO - __main__ - Step 11076: {'lr': 0.0004953758044664994, 'samples': 2126592, 'steps': 11075, 'loss/train': 2.0137264728546143} -08/30/2021 15:08:09 - INFO - __main__ - Step 11077: {'lr': 0.0004953747884581469, 'samples': 2126784, 'steps': 11076, 'loss/train': 1.7807413339614868} -08/30/2021 15:08:09 - INFO - __main__ - Step 11078: {'lr': 0.0004953737723392324, 'samples': 2126976, 'steps': 11077, 'loss/train': 1.8768905401229858} -08/30/2021 15:08:09 - INFO - __main__ - Step 11079: {'lr': 0.0004953727561097562, 'samples': 2127168, 'steps': 11078, 'loss/train': 0.15849746763706207} -08/30/2021 15:08:10 - INFO - __main__ - Step 11080: {'lr': 0.0004953717397697189, 'samples': 2127360, 'steps': 11079, 'loss/train': 2.526132583618164} -08/30/2021 15:08:10 - INFO - __main__ - Step 11081: {'lr': 0.0004953707233191207, 'samples': 2127552, 'steps': 11080, 'loss/train': 1.420319676399231} -08/30/2021 15:08:11 - INFO - __main__ - Step 11082: {'lr': 0.0004953697067579624, 'samples': 2127744, 'steps': 11081, 'loss/train': 0.12702490389347076} -08/30/2021 15:08:12 - INFO - __main__ - Step 11083: {'lr': 0.0004953686900862442, 'samples': 2127936, 'steps': 11082, 'loss/train': 1.7738608121871948} -08/30/2021 15:08:12 - INFO - __main__ - Step 11084: {'lr': 0.0004953676733039668, 'samples': 2128128, 'steps': 11083, 'loss/train': 1.782198190689087} -08/30/2021 15:08:13 - INFO - __main__ - Step 11085: {'lr': 0.0004953666564111303, 'samples': 2128320, 'steps': 11084, 'loss/train': 1.7017955780029297} -08/30/2021 15:08:13 - INFO - __main__ - Step 11086: {'lr': 0.0004953656394077355, 'samples': 2128512, 'steps': 11085, 'loss/train': 1.9793652296066284} -08/30/2021 15:08:13 - INFO - __main__ - Step 11087: {'lr': 0.0004953646222937828, 'samples': 2128704, 'steps': 11086, 'loss/train': 1.6664254665374756} -08/30/2021 15:08:15 - INFO - __main__ - Step 11088: {'lr': 0.0004953636050692724, 'samples': 2128896, 'steps': 11087, 'loss/train': 2.2110068798065186} -08/30/2021 15:08:15 - INFO - __main__ - Step 11089: {'lr': 0.0004953625877342051, 'samples': 2129088, 'steps': 11088, 'loss/train': 1.5275801420211792} -08/30/2021 15:08:16 - INFO - __main__ - Step 11090: {'lr': 0.0004953615702885812, 'samples': 2129280, 'steps': 11089, 'loss/train': 2.0113110542297363} -08/30/2021 15:08:16 - INFO - __main__ - Step 11091: {'lr': 0.0004953605527324011, 'samples': 2129472, 'steps': 11090, 'loss/train': 1.7620744705200195} -08/30/2021 15:08:16 - INFO - __main__ - Step 11092: {'lr': 0.0004953595350656653, 'samples': 2129664, 'steps': 11091, 'loss/train': 1.4105721712112427} -08/30/2021 15:08:18 - INFO - __main__ - Step 11093: {'lr': 0.0004953585172883743, 'samples': 2129856, 'steps': 11092, 'loss/train': 2.1221680641174316} -08/30/2021 15:08:19 - INFO - __main__ - Step 11094: {'lr': 0.0004953574994005286, 'samples': 2130048, 'steps': 11093, 'loss/train': 2.283801317214966} -08/30/2021 15:08:19 - INFO - __main__ - Step 11095: {'lr': 0.0004953564814021285, 'samples': 2130240, 'steps': 11094, 'loss/train': 2.1612584590911865} -08/30/2021 15:08:19 - INFO - __main__ - Step 11096: {'lr': 0.0004953554632931746, 'samples': 2130432, 'steps': 11095, 'loss/train': 2.52555775642395} -08/30/2021 15:08:20 - INFO - __main__ - Step 11097: {'lr': 0.0004953544450736674, 'samples': 2130624, 'steps': 11096, 'loss/train': 1.6636079549789429} -08/30/2021 15:08:21 - INFO - __main__ - Step 11098: {'lr': 0.0004953534267436072, 'samples': 2130816, 'steps': 11097, 'loss/train': 2.2485923767089844} -08/30/2021 15:08:22 - INFO - __main__ - Step 11099: {'lr': 0.0004953524083029945, 'samples': 2131008, 'steps': 11098, 'loss/train': 1.338276743888855} -08/30/2021 15:08:22 - INFO - __main__ - Step 11100: {'lr': 0.0004953513897518298, 'samples': 2131200, 'steps': 11099, 'loss/train': 2.069579601287842} -08/30/2021 15:08:22 - INFO - __main__ - Step 11101: {'lr': 0.0004953503710901136, 'samples': 2131392, 'steps': 11100, 'loss/train': 1.864101767539978} -08/30/2021 15:08:23 - INFO - __main__ - Step 11102: {'lr': 0.0004953493523178463, 'samples': 2131584, 'steps': 11101, 'loss/train': 1.582018256187439} -08/30/2021 15:08:24 - INFO - __main__ - Step 11103: {'lr': 0.0004953483334350283, 'samples': 2131776, 'steps': 11102, 'loss/train': 1.651454210281372} -08/30/2021 15:08:25 - INFO - __main__ - Step 11104: {'lr': 0.0004953473144416602, 'samples': 2131968, 'steps': 11103, 'loss/train': 1.8541146516799927} -08/30/2021 15:08:25 - INFO - __main__ - Step 11105: {'lr': 0.0004953462953377424, 'samples': 2132160, 'steps': 11104, 'loss/train': 1.8567306995391846} -08/30/2021 15:08:25 - INFO - __main__ - Step 11106: {'lr': 0.0004953452761232753, 'samples': 2132352, 'steps': 11105, 'loss/train': 2.2671186923980713} -08/30/2021 15:08:26 - INFO - __main__ - Step 11107: {'lr': 0.0004953442567982593, 'samples': 2132544, 'steps': 11106, 'loss/train': 1.8087079524993896} -08/30/2021 15:08:28 - INFO - __main__ - Step 11108: {'lr': 0.0004953432373626951, 'samples': 2132736, 'steps': 11107, 'loss/train': 1.1706079244613647} -08/30/2021 15:08:29 - INFO - __main__ - Step 11109: {'lr': 0.0004953422178165831, 'samples': 2132928, 'steps': 11108, 'loss/train': 1.936245322227478} -08/30/2021 15:08:29 - INFO - __main__ - Step 11110: {'lr': 0.0004953411981599235, 'samples': 2133120, 'steps': 11109, 'loss/train': 1.7550830841064453} -08/30/2021 15:08:29 - INFO - __main__ - Step 11111: {'lr': 0.0004953401783927171, 'samples': 2133312, 'steps': 11110, 'loss/train': 1.4070396423339844} -08/30/2021 15:08:30 - INFO - __main__ - Step 11112: {'lr': 0.000495339158514964, 'samples': 2133504, 'steps': 11111, 'loss/train': 0.23815692961215973} -08/30/2021 15:08:30 - INFO - __main__ - Step 11113: {'lr': 0.0004953381385266651, 'samples': 2133696, 'steps': 11112, 'loss/train': 1.2586719989776611} -08/30/2021 15:08:31 - INFO - __main__ - Step 11114: {'lr': 0.0004953371184278205, 'samples': 2133888, 'steps': 11113, 'loss/train': 1.926695466041565} -08/30/2021 15:08:32 - INFO - __main__ - Step 11115: {'lr': 0.0004953360982184308, 'samples': 2134080, 'steps': 11114, 'loss/train': 1.8673443794250488} -08/30/2021 15:08:32 - INFO - __main__ - Step 11116: {'lr': 0.0004953350778984963, 'samples': 2134272, 'steps': 11115, 'loss/train': 1.7017509937286377} -08/30/2021 15:08:33 - INFO - __main__ - Step 11117: {'lr': 0.0004953340574680177, 'samples': 2134464, 'steps': 11116, 'loss/train': 2.141362428665161} -08/30/2021 15:08:33 - INFO - __main__ - Step 11118: {'lr': 0.0004953330369269955, 'samples': 2134656, 'steps': 11117, 'loss/train': 1.6088838577270508} -08/30/2021 15:08:35 - INFO - __main__ - Step 11119: {'lr': 0.0004953320162754298, 'samples': 2134848, 'steps': 11118, 'loss/train': 0.1882239282131195} -08/30/2021 15:08:35 - INFO - __main__ - Step 11120: {'lr': 0.0004953309955133214, 'samples': 2135040, 'steps': 11119, 'loss/train': 1.9355123043060303} -08/30/2021 15:08:35 - INFO - __main__ - Step 11121: {'lr': 0.0004953299746406707, 'samples': 2135232, 'steps': 11120, 'loss/train': 1.5760687589645386} -08/30/2021 15:08:36 - INFO - __main__ - Step 11122: {'lr': 0.000495328953657478, 'samples': 2135424, 'steps': 11121, 'loss/train': 0.14006000757217407} -08/30/2021 15:08:36 - INFO - __main__ - Step 11123: {'lr': 0.0004953279325637438, 'samples': 2135616, 'steps': 11122, 'loss/train': 1.6309653520584106} -08/30/2021 15:08:38 - INFO - __main__ - Step 11124: {'lr': 0.0004953269113594687, 'samples': 2135808, 'steps': 11123, 'loss/train': 1.455532193183899} -08/30/2021 15:08:38 - INFO - __main__ - Step 11125: {'lr': 0.0004953258900446531, 'samples': 2136000, 'steps': 11124, 'loss/train': 2.2158398628234863} -08/30/2021 15:08:38 - INFO - __main__ - Step 11126: {'lr': 0.0004953248686192975, 'samples': 2136192, 'steps': 11125, 'loss/train': 1.9556537866592407} -08/30/2021 15:08:39 - INFO - __main__ - Step 11127: {'lr': 0.0004953238470834022, 'samples': 2136384, 'steps': 11126, 'loss/train': 1.7583212852478027} -08/30/2021 15:08:39 - INFO - __main__ - Step 11128: {'lr': 0.0004953228254369677, 'samples': 2136576, 'steps': 11127, 'loss/train': 1.7490719556808472} -08/30/2021 15:08:41 - INFO - __main__ - Step 11129: {'lr': 0.0004953218036799946, 'samples': 2136768, 'steps': 11128, 'loss/train': 1.490636944770813} -08/30/2021 15:08:41 - INFO - __main__ - Step 11130: {'lr': 0.0004953207818124833, 'samples': 2136960, 'steps': 11129, 'loss/train': 2.097973108291626} -08/30/2021 15:08:41 - INFO - __main__ - Step 11131: {'lr': 0.0004953197598344342, 'samples': 2137152, 'steps': 11130, 'loss/train': 2.425636053085327} -08/30/2021 15:08:42 - INFO - __main__ - Step 11132: {'lr': 0.0004953187377458478, 'samples': 2137344, 'steps': 11131, 'loss/train': 1.5264713764190674} -08/30/2021 15:08:42 - INFO - __main__ - Step 11133: {'lr': 0.0004953177155467246, 'samples': 2137536, 'steps': 11132, 'loss/train': 1.6516380310058594} -08/30/2021 15:08:44 - INFO - __main__ - Step 11134: {'lr': 0.0004953166932370651, 'samples': 2137728, 'steps': 11133, 'loss/train': 1.5329843759536743} -08/30/2021 15:08:44 - INFO - __main__ - Step 11135: {'lr': 0.0004953156708168695, 'samples': 2137920, 'steps': 11134, 'loss/train': 1.7588341236114502} -08/30/2021 15:08:44 - INFO - __main__ - Step 11136: {'lr': 0.0004953146482861385, 'samples': 2138112, 'steps': 11135, 'loss/train': 2.2730307579040527} -08/30/2021 15:08:45 - INFO - __main__ - Step 11137: {'lr': 0.0004953136256448725, 'samples': 2138304, 'steps': 11136, 'loss/train': 1.6751506328582764} -08/30/2021 15:08:45 - INFO - __main__ - Step 11138: {'lr': 0.0004953126028930721, 'samples': 2138496, 'steps': 11137, 'loss/train': 1.8939454555511475} -08/30/2021 15:08:45 - INFO - __main__ - Step 11139: {'lr': 0.0004953115800307375, 'samples': 2138688, 'steps': 11138, 'loss/train': 1.992057204246521} -08/30/2021 15:08:47 - INFO - __main__ - Step 11140: {'lr': 0.0004953105570578693, 'samples': 2138880, 'steps': 11139, 'loss/train': 1.5404541492462158} -08/30/2021 15:08:47 - INFO - __main__ - Step 11141: {'lr': 0.000495309533974468, 'samples': 2139072, 'steps': 11140, 'loss/train': 1.944646954536438} -08/30/2021 15:08:48 - INFO - __main__ - Step 11142: {'lr': 0.0004953085107805339, 'samples': 2139264, 'steps': 11141, 'loss/train': 1.9030653238296509} -08/30/2021 15:08:48 - INFO - __main__ - Step 11143: {'lr': 0.0004953074874760677, 'samples': 2139456, 'steps': 11142, 'loss/train': 2.5180866718292236} -08/30/2021 15:08:48 - INFO - __main__ - Step 11144: {'lr': 0.0004953064640610697, 'samples': 2139648, 'steps': 11143, 'loss/train': 1.5613799095153809} -08/30/2021 15:08:50 - INFO - __main__ - Step 11145: {'lr': 0.0004953054405355404, 'samples': 2139840, 'steps': 11144, 'loss/train': 1.4012560844421387} -08/30/2021 15:08:51 - INFO - __main__ - Step 11146: {'lr': 0.0004953044168994802, 'samples': 2140032, 'steps': 11145, 'loss/train': 0.13021203875541687} -08/30/2021 15:08:51 - INFO - __main__ - Step 11147: {'lr': 0.0004953033931528897, 'samples': 2140224, 'steps': 11146, 'loss/train': 1.2138471603393555} -08/30/2021 15:08:51 - INFO - __main__ - Step 11148: {'lr': 0.0004953023692957691, 'samples': 2140416, 'steps': 11147, 'loss/train': 1.539682149887085} -08/30/2021 15:08:52 - INFO - __main__ - Step 11149: {'lr': 0.0004953013453281193, 'samples': 2140608, 'steps': 11148, 'loss/train': 2.223832845687866} -08/30/2021 15:08:53 - INFO - __main__ - Step 11150: {'lr': 0.0004953003212499403, 'samples': 2140800, 'steps': 11149, 'loss/train': 2.070180654525757} -08/30/2021 15:08:54 - INFO - __main__ - Step 11151: {'lr': 0.0004952992970612328, 'samples': 2140992, 'steps': 11150, 'loss/train': 2.378373146057129} -08/30/2021 15:08:54 - INFO - __main__ - Step 11152: {'lr': 0.0004952982727619973, 'samples': 2141184, 'steps': 11151, 'loss/train': 2.1110410690307617} -08/30/2021 15:08:54 - INFO - __main__ - Step 11153: {'lr': 0.000495297248352234, 'samples': 2141376, 'steps': 11152, 'loss/train': 1.975611686706543} -08/30/2021 15:08:55 - INFO - __main__ - Step 11154: {'lr': 0.0004952962238319436, 'samples': 2141568, 'steps': 11153, 'loss/train': 1.8950594663619995} -08/30/2021 15:08:57 - INFO - __main__ - Step 11155: {'lr': 0.0004952951992011266, 'samples': 2141760, 'steps': 11154, 'loss/train': 1.828566074371338} -08/30/2021 15:08:58 - INFO - __main__ - Step 11156: {'lr': 0.0004952941744597834, 'samples': 2141952, 'steps': 11155, 'loss/train': 2.4585282802581787} -08/30/2021 15:08:58 - INFO - __main__ - Step 11157: {'lr': 0.0004952931496079143, 'samples': 2142144, 'steps': 11156, 'loss/train': 0.4626551568508148} -08/30/2021 15:08:58 - INFO - __main__ - Step 11158: {'lr': 0.00049529212464552, 'samples': 2142336, 'steps': 11157, 'loss/train': 1.9143321514129639} -08/30/2021 15:08:59 - INFO - __main__ - Step 11159: {'lr': 0.0004952910995726008, 'samples': 2142528, 'steps': 11158, 'loss/train': 1.5643495321273804} -08/30/2021 15:08:59 - INFO - __main__ - Step 11160: {'lr': 0.0004952900743891573, 'samples': 2142720, 'steps': 11159, 'loss/train': 0.9213781356811523} -08/30/2021 15:08:59 - INFO - __main__ - Step 11161: {'lr': 0.0004952890490951898, 'samples': 2142912, 'steps': 11160, 'loss/train': 0.9682077765464783} -08/30/2021 15:09:01 - INFO - __main__ - Step 11162: {'lr': 0.0004952880236906988, 'samples': 2143104, 'steps': 11161, 'loss/train': 1.2100898027420044} -08/30/2021 15:09:01 - INFO - __main__ - Step 11163: {'lr': 0.0004952869981756848, 'samples': 2143296, 'steps': 11162, 'loss/train': 1.7945683002471924} -08/30/2021 15:09:02 - INFO - __main__ - Step 11164: {'lr': 0.0004952859725501484, 'samples': 2143488, 'steps': 11163, 'loss/train': 2.1535260677337646} -08/30/2021 15:09:02 - INFO - __main__ - Step 11165: {'lr': 0.0004952849468140898, 'samples': 2143680, 'steps': 11164, 'loss/train': 1.7730416059494019} -08/30/2021 15:09:03 - INFO - __main__ - Step 11166: {'lr': 0.0004952839209675096, 'samples': 2143872, 'steps': 11165, 'loss/train': 1.5191484689712524} -08/30/2021 15:09:04 - INFO - __main__ - Step 11167: {'lr': 0.0004952828950104083, 'samples': 2144064, 'steps': 11166, 'loss/train': 0.5176580548286438} -08/30/2021 15:09:05 - INFO - __main__ - Step 11168: {'lr': 0.0004952818689427863, 'samples': 2144256, 'steps': 11167, 'loss/train': 1.9282982349395752} -08/30/2021 15:09:05 - INFO - __main__ - Step 11169: {'lr': 0.0004952808427646441, 'samples': 2144448, 'steps': 11168, 'loss/train': 1.4896656274795532} -08/30/2021 15:09:06 - INFO - __main__ - Step 11170: {'lr': 0.000495279816475982, 'samples': 2144640, 'steps': 11169, 'loss/train': 1.80918550491333} -08/30/2021 15:09:06 - INFO - __main__ - Step 11171: {'lr': 0.0004952787900768008, 'samples': 2144832, 'steps': 11170, 'loss/train': 1.5024809837341309} -08/30/2021 15:09:08 - INFO - __main__ - Step 11172: {'lr': 0.0004952777635671006, 'samples': 2145024, 'steps': 11171, 'loss/train': 2.058274030685425} -08/30/2021 15:09:08 - INFO - __main__ - Step 11173: {'lr': 0.0004952767369468821, 'samples': 2145216, 'steps': 11172, 'loss/train': 1.8573354482650757} -08/30/2021 15:09:08 - INFO - __main__ - Step 11174: {'lr': 0.0004952757102161457, 'samples': 2145408, 'steps': 11173, 'loss/train': 1.9735442399978638} -08/30/2021 15:09:09 - INFO - __main__ - Step 11175: {'lr': 0.0004952746833748918, 'samples': 2145600, 'steps': 11174, 'loss/train': 1.7319947481155396} -08/30/2021 15:09:09 - INFO - __main__ - Step 11176: {'lr': 0.0004952736564231209, 'samples': 2145792, 'steps': 11175, 'loss/train': 1.817901611328125} -08/30/2021 15:09:11 - INFO - __main__ - Step 11177: {'lr': 0.0004952726293608335, 'samples': 2145984, 'steps': 11176, 'loss/train': 2.117215633392334} -08/30/2021 15:09:11 - INFO - __main__ - Step 11178: {'lr': 0.0004952716021880301, 'samples': 2146176, 'steps': 11177, 'loss/train': 1.3609068393707275} -08/30/2021 15:09:11 - INFO - __main__ - Step 11179: {'lr': 0.0004952705749047111, 'samples': 2146368, 'steps': 11178, 'loss/train': 1.5699869394302368} -08/30/2021 15:09:12 - INFO - __main__ - Step 11180: {'lr': 0.0004952695475108768, 'samples': 2146560, 'steps': 11179, 'loss/train': 1.5526151657104492} -08/30/2021 15:09:12 - INFO - __main__ - Step 11181: {'lr': 0.000495268520006528, 'samples': 2146752, 'steps': 11180, 'loss/train': 1.577141284942627} -08/30/2021 15:09:14 - INFO - __main__ - Step 11182: {'lr': 0.000495267492391665, 'samples': 2146944, 'steps': 11181, 'loss/train': 2.015547752380371} -08/30/2021 15:09:14 - INFO - __main__ - Step 11183: {'lr': 0.0004952664646662882, 'samples': 2147136, 'steps': 11182, 'loss/train': 1.9722617864608765} -08/30/2021 15:09:15 - INFO - __main__ - Step 11184: {'lr': 0.000495265436830398, 'samples': 2147328, 'steps': 11183, 'loss/train': 1.9817020893096924} -08/30/2021 15:09:15 - INFO - __main__ - Step 11185: {'lr': 0.0004952644088839951, 'samples': 2147520, 'steps': 11184, 'loss/train': 2.0684518814086914} -08/30/2021 15:09:15 - INFO - __main__ - Step 11186: {'lr': 0.0004952633808270797, 'samples': 2147712, 'steps': 11185, 'loss/train': 1.2863656282424927} -08/30/2021 15:09:16 - INFO - __main__ - Step 11187: {'lr': 0.0004952623526596526, 'samples': 2147904, 'steps': 11186, 'loss/train': 1.9380815029144287} -08/30/2021 15:09:17 - INFO - __main__ - Step 11188: {'lr': 0.000495261324381714, 'samples': 2148096, 'steps': 11187, 'loss/train': 1.7953402996063232} -08/30/2021 15:09:18 - INFO - __main__ - Step 11189: {'lr': 0.0004952602959932644, 'samples': 2148288, 'steps': 11188, 'loss/train': 2.091665029525757} -08/30/2021 15:09:18 - INFO - __main__ - Step 11190: {'lr': 0.0004952592674943043, 'samples': 2148480, 'steps': 11189, 'loss/train': 1.566051959991455} -08/30/2021 15:09:18 - INFO - __main__ - Step 11191: {'lr': 0.0004952582388848343, 'samples': 2148672, 'steps': 11190, 'loss/train': 1.6068222522735596} -08/30/2021 15:09:19 - INFO - __main__ - Step 11192: {'lr': 0.0004952572101648545, 'samples': 2148864, 'steps': 11191, 'loss/train': 1.6725513935089111} -08/30/2021 15:09:20 - INFO - __main__ - Step 11193: {'lr': 0.0004952561813343657, 'samples': 2149056, 'steps': 11192, 'loss/train': 1.7708979845046997} -08/30/2021 15:09:21 - INFO - __main__ - Step 11194: {'lr': 0.0004952551523933682, 'samples': 2149248, 'steps': 11193, 'loss/train': 1.3797221183776855} -08/30/2021 15:09:21 - INFO - __main__ - Step 11195: {'lr': 0.0004952541233418626, 'samples': 2149440, 'steps': 11194, 'loss/train': 1.7353644371032715} -08/30/2021 15:09:21 - INFO - __main__ - Step 11196: {'lr': 0.0004952530941798492, 'samples': 2149632, 'steps': 11195, 'loss/train': 1.5461173057556152} -08/30/2021 15:09:22 - INFO - __main__ - Step 11197: {'lr': 0.0004952520649073286, 'samples': 2149824, 'steps': 11196, 'loss/train': 1.756289005279541} -08/30/2021 15:09:23 - INFO - __main__ - Step 11198: {'lr': 0.0004952510355243012, 'samples': 2150016, 'steps': 11197, 'loss/train': 1.3803040981292725} -08/30/2021 15:09:24 - INFO - __main__ - Step 11199: {'lr': 0.0004952500060307674, 'samples': 2150208, 'steps': 11198, 'loss/train': 2.0660104751586914} -08/30/2021 15:09:25 - INFO - __main__ - Step 11200: {'lr': 0.0004952489764267278, 'samples': 2150400, 'steps': 11199, 'loss/train': 1.9330822229385376} -08/30/2021 15:09:25 - INFO - __main__ - Step 11201: {'lr': 0.0004952479467121827, 'samples': 2150592, 'steps': 11200, 'loss/train': 6.268353462219238} -08/30/2021 15:09:25 - INFO - __main__ - Step 11202: {'lr': 0.0004952469168871327, 'samples': 2150784, 'steps': 11201, 'loss/train': 6.152014255523682} -08/30/2021 15:09:26 - INFO - __main__ - Step 11203: {'lr': 0.0004952458869515782, 'samples': 2150976, 'steps': 11202, 'loss/train': 3.165759801864624} -08/30/2021 15:09:28 - INFO - __main__ - Step 11204: {'lr': 0.0004952448569055198, 'samples': 2151168, 'steps': 11203, 'loss/train': 1.6261491775512695} -08/30/2021 15:09:28 - INFO - __main__ - Step 11205: {'lr': 0.0004952438267489578, 'samples': 2151360, 'steps': 11204, 'loss/train': 1.5949993133544922} -08/30/2021 15:09:29 - INFO - __main__ - Step 11206: {'lr': 0.0004952427964818927, 'samples': 2151552, 'steps': 11205, 'loss/train': 0.1325102001428604} -08/30/2021 15:09:29 - INFO - __main__ - Step 11207: {'lr': 0.0004952417661043249, 'samples': 2151744, 'steps': 11206, 'loss/train': 1.750083088874817} -08/30/2021 15:09:29 - INFO - __main__ - Step 11208: {'lr': 0.0004952407356162551, 'samples': 2151936, 'steps': 11207, 'loss/train': 1.6897622346878052} -08/30/2021 15:09:30 - INFO - __main__ - Step 11209: {'lr': 0.0004952397050176835, 'samples': 2152128, 'steps': 11208, 'loss/train': 1.6857823133468628} -08/30/2021 15:09:30 - INFO - __main__ - Step 11210: {'lr': 0.0004952386743086107, 'samples': 2152320, 'steps': 11209, 'loss/train': 1.4603480100631714} -08/30/2021 15:09:32 - INFO - __main__ - Step 11211: {'lr': 0.0004952376434890372, 'samples': 2152512, 'steps': 11210, 'loss/train': 1.1289713382720947} -08/30/2021 15:09:32 - INFO - __main__ - Step 11212: {'lr': 0.0004952366125589633, 'samples': 2152704, 'steps': 11211, 'loss/train': 2.1865925788879395} -08/30/2021 15:09:33 - INFO - __main__ - Step 11213: {'lr': 0.0004952355815183897, 'samples': 2152896, 'steps': 11212, 'loss/train': 1.869810700416565} -08/30/2021 15:09:33 - INFO - __main__ - Step 11214: {'lr': 0.0004952345503673166, 'samples': 2153088, 'steps': 11213, 'loss/train': 0.21112875640392303} -08/30/2021 15:09:33 - INFO - __main__ - Step 11215: {'lr': 0.0004952335191057447, 'samples': 2153280, 'steps': 11214, 'loss/train': 2.077345371246338} -08/30/2021 15:09:35 - INFO - __main__ - Step 11216: {'lr': 0.0004952324877336743, 'samples': 2153472, 'steps': 11215, 'loss/train': 2.015061855316162} -08/30/2021 15:09:35 - INFO - __main__ - Step 11217: {'lr': 0.0004952314562511059, 'samples': 2153664, 'steps': 11216, 'loss/train': 1.6336077451705933} -08/30/2021 15:09:36 - INFO - __main__ - Step 11218: {'lr': 0.00049523042465804, 'samples': 2153856, 'steps': 11217, 'loss/train': 1.9728543758392334} -08/30/2021 15:09:36 - INFO - __main__ - Step 11219: {'lr': 0.0004952293929544771, 'samples': 2154048, 'steps': 11218, 'loss/train': 1.814045786857605} -08/30/2021 15:09:36 - INFO - __main__ - Step 11220: {'lr': 0.0004952283611404176, 'samples': 2154240, 'steps': 11219, 'loss/train': 1.9692790508270264} -08/30/2021 15:09:39 - INFO - __main__ - Step 11221: {'lr': 0.0004952273292158619, 'samples': 2154432, 'steps': 11220, 'loss/train': 1.3120520114898682} -08/30/2021 15:09:39 - INFO - __main__ - Step 11222: {'lr': 0.0004952262971808106, 'samples': 2154624, 'steps': 11221, 'loss/train': 1.9009259939193726} -08/30/2021 15:09:40 - INFO - __main__ - Step 11223: {'lr': 0.0004952252650352642, 'samples': 2154816, 'steps': 11222, 'loss/train': 2.608480215072632} -08/30/2021 15:09:40 - INFO - __main__ - Step 11224: {'lr': 0.000495224232779223, 'samples': 2155008, 'steps': 11223, 'loss/train': 1.6276488304138184} -08/30/2021 15:09:40 - INFO - __main__ - Step 11225: {'lr': 0.0004952232004126876, 'samples': 2155200, 'steps': 11224, 'loss/train': 2.3533132076263428} -08/30/2021 15:09:41 - INFO - __main__ - Step 11226: {'lr': 0.0004952221679356583, 'samples': 2155392, 'steps': 11225, 'loss/train': 1.5897690057754517} -08/30/2021 15:09:42 - INFO - __main__ - Step 11227: {'lr': 0.0004952211353481358, 'samples': 2155584, 'steps': 11226, 'loss/train': 2.033146858215332} -08/30/2021 15:09:43 - INFO - __main__ - Step 11228: {'lr': 0.0004952201026501204, 'samples': 2155776, 'steps': 11227, 'loss/train': 2.0458672046661377} -08/30/2021 15:09:43 - INFO - __main__ - Step 11229: {'lr': 0.0004952190698416126, 'samples': 2155968, 'steps': 11228, 'loss/train': 1.9060672521591187} -08/30/2021 15:09:43 - INFO - __main__ - Step 11230: {'lr': 0.0004952180369226129, 'samples': 2156160, 'steps': 11229, 'loss/train': 2.1047184467315674} -08/30/2021 15:09:44 - INFO - __main__ - Step 11231: {'lr': 0.0004952170038931217, 'samples': 2156352, 'steps': 11230, 'loss/train': 1.7409850358963013} -08/30/2021 15:09:45 - INFO - __main__ - Step 11232: {'lr': 0.0004952159707531395, 'samples': 2156544, 'steps': 11231, 'loss/train': 2.201941728591919} -08/30/2021 15:09:46 - INFO - __main__ - Step 11233: {'lr': 0.0004952149375026668, 'samples': 2156736, 'steps': 11232, 'loss/train': 1.949341058731079} -08/30/2021 15:09:46 - INFO - __main__ - Step 11234: {'lr': 0.000495213904141704, 'samples': 2156928, 'steps': 11233, 'loss/train': 2.10192608833313} -08/30/2021 15:09:46 - INFO - __main__ - Step 11235: {'lr': 0.0004952128706702516, 'samples': 2157120, 'steps': 11234, 'loss/train': 1.432446002960205} -08/30/2021 15:09:47 - INFO - __main__ - Step 11236: {'lr': 0.0004952118370883101, 'samples': 2157312, 'steps': 11235, 'loss/train': 1.860512137413025} -08/30/2021 15:09:48 - INFO - __main__ - Step 11237: {'lr': 0.0004952108033958798, 'samples': 2157504, 'steps': 11236, 'loss/train': 1.7600961923599243} -08/30/2021 15:09:49 - INFO - __main__ - Step 11238: {'lr': 0.0004952097695929614, 'samples': 2157696, 'steps': 11237, 'loss/train': 1.8075411319732666} -08/30/2021 15:09:49 - INFO - __main__ - Step 11239: {'lr': 0.0004952087356795553, 'samples': 2157888, 'steps': 11238, 'loss/train': 1.9469932317733765} -08/30/2021 15:09:49 - INFO - __main__ - Step 11240: {'lr': 0.0004952077016556619, 'samples': 2158080, 'steps': 11239, 'loss/train': 2.207625389099121} -08/30/2021 15:09:50 - INFO - __main__ - Step 11241: {'lr': 0.0004952066675212816, 'samples': 2158272, 'steps': 11240, 'loss/train': 1.5010963678359985} -08/30/2021 15:09:50 - INFO - __main__ - Step 11242: {'lr': 0.0004952056332764151, 'samples': 2158464, 'steps': 11241, 'loss/train': 1.7851382493972778} -08/30/2021 15:09:52 - INFO - __main__ - Step 11243: {'lr': 0.0004952045989210627, 'samples': 2158656, 'steps': 11242, 'loss/train': 1.4927185773849487} -08/30/2021 15:09:52 - INFO - __main__ - Step 11244: {'lr': 0.0004952035644552249, 'samples': 2158848, 'steps': 11243, 'loss/train': 1.7379070520401} -08/30/2021 15:09:53 - INFO - __main__ - Step 11245: {'lr': 0.000495202529878902, 'samples': 2159040, 'steps': 11244, 'loss/train': 1.5175026655197144} -08/30/2021 15:09:53 - INFO - __main__ - Step 11246: {'lr': 0.0004952014951920948, 'samples': 2159232, 'steps': 11245, 'loss/train': 1.0634227991104126} -08/30/2021 15:09:53 - INFO - __main__ - Step 11247: {'lr': 0.0004952004603948034, 'samples': 2159424, 'steps': 11246, 'loss/train': 1.5533729791641235} -08/30/2021 15:09:55 - INFO - __main__ - Step 11248: {'lr': 0.0004951994254870286, 'samples': 2159616, 'steps': 11247, 'loss/train': 2.3674063682556152} -08/30/2021 15:09:55 - INFO - __main__ - Step 11249: {'lr': 0.0004951983904687708, 'samples': 2159808, 'steps': 11248, 'loss/train': 1.8283774852752686} -08/30/2021 15:09:56 - INFO - __main__ - Step 11250: {'lr': 0.0004951973553400303, 'samples': 2160000, 'steps': 11249, 'loss/train': 1.98063325881958} -08/30/2021 15:09:56 - INFO - __main__ - Step 11251: {'lr': 0.0004951963201008077, 'samples': 2160192, 'steps': 11250, 'loss/train': 1.6316938400268555} -08/30/2021 15:09:56 - INFO - __main__ - Step 11252: {'lr': 0.0004951952847511033, 'samples': 2160384, 'steps': 11251, 'loss/train': 1.882524013519287} -08/30/2021 15:09:57 - INFO - __main__ - Step 11253: {'lr': 0.0004951942492909177, 'samples': 2160576, 'steps': 11252, 'loss/train': 2.1029202938079834} -08/30/2021 15:09:58 - INFO - __main__ - Step 11254: {'lr': 0.0004951932137202515, 'samples': 2160768, 'steps': 11253, 'loss/train': 1.8152189254760742} -08/30/2021 15:09:59 - INFO - __main__ - Step 11255: {'lr': 0.0004951921780391049, 'samples': 2160960, 'steps': 11254, 'loss/train': 0.2853429615497589} -08/30/2021 15:09:59 - INFO - __main__ - Step 11256: {'lr': 0.0004951911422474785, 'samples': 2161152, 'steps': 11255, 'loss/train': 1.8781239986419678} -08/30/2021 15:10:00 - INFO - __main__ - Step 11257: {'lr': 0.0004951901063453728, 'samples': 2161344, 'steps': 11256, 'loss/train': 1.6769670248031616} -08/30/2021 15:10:00 - INFO - __main__ - Step 11258: {'lr': 0.0004951890703327883, 'samples': 2161536, 'steps': 11257, 'loss/train': 1.7944586277008057} -08/30/2021 15:10:01 - INFO - __main__ - Step 11259: {'lr': 0.0004951880342097251, 'samples': 2161728, 'steps': 11258, 'loss/train': 2.091442823410034} -08/30/2021 15:10:02 - INFO - __main__ - Step 11260: {'lr': 0.0004951869979761842, 'samples': 2161920, 'steps': 11259, 'loss/train': 2.2156801223754883} -08/30/2021 15:10:02 - INFO - __main__ - Step 11261: {'lr': 0.0004951859616321658, 'samples': 2162112, 'steps': 11260, 'loss/train': 1.9757577180862427} -08/30/2021 15:10:03 - INFO - __main__ - Step 11262: {'lr': 0.0004951849251776703, 'samples': 2162304, 'steps': 11261, 'loss/train': 1.3211166858673096} -08/30/2021 15:10:03 - INFO - __main__ - Step 11263: {'lr': 0.0004951838886126983, 'samples': 2162496, 'steps': 11262, 'loss/train': 1.3247021436691284} -08/30/2021 15:10:04 - INFO - __main__ - Step 11264: {'lr': 0.0004951828519372503, 'samples': 2162688, 'steps': 11263, 'loss/train': 1.8176363706588745} -08/30/2021 15:10:05 - INFO - __main__ - Step 11265: {'lr': 0.0004951818151513267, 'samples': 2162880, 'steps': 11264, 'loss/train': 1.9629976749420166} -08/30/2021 15:10:05 - INFO - __main__ - Step 11266: {'lr': 0.0004951807782549277, 'samples': 2163072, 'steps': 11265, 'loss/train': 1.8665183782577515} -08/30/2021 15:10:05 - INFO - __main__ - Step 11267: {'lr': 0.0004951797412480544, 'samples': 2163264, 'steps': 11266, 'loss/train': 2.1557822227478027} -08/30/2021 15:10:06 - INFO - __main__ - Step 11268: {'lr': 0.0004951787041307066, 'samples': 2163456, 'steps': 11267, 'loss/train': 1.923411250114441} -08/30/2021 15:10:07 - INFO - __main__ - Step 11269: {'lr': 0.0004951776669028851, 'samples': 2163648, 'steps': 11268, 'loss/train': 2.5946178436279297} -08/30/2021 15:10:08 - INFO - __main__ - Step 11270: {'lr': 0.0004951766295645904, 'samples': 2163840, 'steps': 11269, 'loss/train': 1.7681535482406616} -08/30/2021 15:10:08 - INFO - __main__ - Step 11271: {'lr': 0.000495175592115823, 'samples': 2164032, 'steps': 11270, 'loss/train': 1.0833417177200317} -08/30/2021 15:10:09 - INFO - __main__ - Step 11272: {'lr': 0.0004951745545565831, 'samples': 2164224, 'steps': 11271, 'loss/train': 1.4488327503204346} -08/30/2021 15:10:09 - INFO - __main__ - Step 11273: {'lr': 0.0004951735168868713, 'samples': 2164416, 'steps': 11272, 'loss/train': 1.5733282566070557} -08/30/2021 15:10:11 - INFO - __main__ - Step 11274: {'lr': 0.0004951724791066881, 'samples': 2164608, 'steps': 11273, 'loss/train': 1.629154086112976} -08/30/2021 15:10:11 - INFO - __main__ - Step 11275: {'lr': 0.0004951714412160342, 'samples': 2164800, 'steps': 11274, 'loss/train': 1.9060413837432861} -08/30/2021 15:10:12 - INFO - __main__ - Step 11276: {'lr': 0.0004951704032149096, 'samples': 2164992, 'steps': 11275, 'loss/train': 1.9716060161590576} -08/30/2021 15:10:12 - INFO - __main__ - Step 11277: {'lr': 0.000495169365103315, 'samples': 2165184, 'steps': 11276, 'loss/train': 2.704251766204834} -08/30/2021 15:10:12 - INFO - __main__ - Step 11278: {'lr': 0.0004951683268812511, 'samples': 2165376, 'steps': 11277, 'loss/train': 1.8629169464111328} -08/30/2021 15:10:13 - INFO - __main__ - Step 11279: {'lr': 0.0004951672885487178, 'samples': 2165568, 'steps': 11278, 'loss/train': 1.880487084388733} -08/30/2021 15:10:13 - INFO - __main__ - Step 11280: {'lr': 0.0004951662501057161, 'samples': 2165760, 'steps': 11279, 'loss/train': 2.465620994567871} -08/30/2021 15:10:15 - INFO - __main__ - Step 11281: {'lr': 0.0004951652115522462, 'samples': 2165952, 'steps': 11280, 'loss/train': 1.8681460618972778} -08/30/2021 15:10:16 - INFO - __main__ - Step 11282: {'lr': 0.0004951641728883087, 'samples': 2166144, 'steps': 11281, 'loss/train': 1.5482832193374634} -08/30/2021 15:10:16 - INFO - __main__ - Step 11283: {'lr': 0.000495163134113904, 'samples': 2166336, 'steps': 11282, 'loss/train': 1.5466859340667725} -08/30/2021 15:10:16 - INFO - __main__ - Step 11284: {'lr': 0.0004951620952290325, 'samples': 2166528, 'steps': 11283, 'loss/train': 1.0799888372421265} -08/30/2021 15:10:17 - INFO - __main__ - Step 11285: {'lr': 0.0004951610562336949, 'samples': 2166720, 'steps': 11284, 'loss/train': 1.5446174144744873} -08/30/2021 15:10:18 - INFO - __main__ - Step 11286: {'lr': 0.0004951600171278914, 'samples': 2166912, 'steps': 11285, 'loss/train': 2.0954701900482178} -08/30/2021 15:10:19 - INFO - __main__ - Step 11287: {'lr': 0.0004951589779116225, 'samples': 2167104, 'steps': 11286, 'loss/train': 1.807062029838562} -08/30/2021 15:10:19 - INFO - __main__ - Step 11288: {'lr': 0.0004951579385848889, 'samples': 2167296, 'steps': 11287, 'loss/train': 1.0833994150161743} -08/30/2021 15:10:19 - INFO - __main__ - Step 11289: {'lr': 0.0004951568991476908, 'samples': 2167488, 'steps': 11288, 'loss/train': 1.6628488302230835} -08/30/2021 15:10:20 - INFO - __main__ - Step 11290: {'lr': 0.0004951558596000289, 'samples': 2167680, 'steps': 11289, 'loss/train': 1.7167960405349731} -08/30/2021 15:10:21 - INFO - __main__ - Step 11291: {'lr': 0.0004951548199419035, 'samples': 2167872, 'steps': 11290, 'loss/train': 1.8201220035552979} -08/30/2021 15:10:22 - INFO - __main__ - Step 11292: {'lr': 0.0004951537801733152, 'samples': 2168064, 'steps': 11291, 'loss/train': 1.7071702480316162} -08/30/2021 15:10:22 - INFO - __main__ - Step 11293: {'lr': 0.0004951527402942643, 'samples': 2168256, 'steps': 11292, 'loss/train': 1.5277527570724487} -08/30/2021 15:10:23 - INFO - __main__ - Step 11294: {'lr': 0.0004951517003047512, 'samples': 2168448, 'steps': 11293, 'loss/train': 2.013002872467041} -08/30/2021 15:10:23 - INFO - __main__ - Step 11295: {'lr': 0.0004951506602047767, 'samples': 2168640, 'steps': 11294, 'loss/train': 1.782727837562561} -08/30/2021 15:10:24 - INFO - __main__ - Step 11296: {'lr': 0.0004951496199943412, 'samples': 2168832, 'steps': 11295, 'loss/train': 2.2067103385925293} -08/30/2021 15:10:25 - INFO - __main__ - Step 11297: {'lr': 0.0004951485796734448, 'samples': 2169024, 'steps': 11296, 'loss/train': 1.5037710666656494} -08/30/2021 15:10:25 - INFO - __main__ - Step 11298: {'lr': 0.0004951475392420884, 'samples': 2169216, 'steps': 11297, 'loss/train': 1.933862328529358} -08/30/2021 15:10:26 - INFO - __main__ - Step 11299: {'lr': 0.0004951464987002724, 'samples': 2169408, 'steps': 11298, 'loss/train': 2.2062699794769287} -08/30/2021 15:10:26 - INFO - __main__ - Step 11300: {'lr': 0.000495145458047997, 'samples': 2169600, 'steps': 11299, 'loss/train': 1.884720802307129} -08/30/2021 15:10:26 - INFO - __main__ - Step 11301: {'lr': 0.0004951444172852629, 'samples': 2169792, 'steps': 11300, 'loss/train': 1.504366397857666} -08/30/2021 15:10:28 - INFO - __main__ - Step 11302: {'lr': 0.0004951433764120705, 'samples': 2169984, 'steps': 11301, 'loss/train': 1.9274585247039795} -08/30/2021 15:10:28 - INFO - __main__ - Step 11303: {'lr': 0.0004951423354284202, 'samples': 2170176, 'steps': 11302, 'loss/train': 1.6363259553909302} -08/30/2021 15:10:29 - INFO - __main__ - Step 11304: {'lr': 0.0004951412943343126, 'samples': 2170368, 'steps': 11303, 'loss/train': 1.5677433013916016} -08/30/2021 15:10:29 - INFO - __main__ - Step 11305: {'lr': 0.0004951402531297482, 'samples': 2170560, 'steps': 11304, 'loss/train': 1.9196350574493408} -08/30/2021 15:10:29 - INFO - __main__ - Step 11306: {'lr': 0.0004951392118147273, 'samples': 2170752, 'steps': 11305, 'loss/train': 1.9655555486679077} -08/30/2021 15:10:31 - INFO - __main__ - Step 11307: {'lr': 0.0004951381703892506, 'samples': 2170944, 'steps': 11306, 'loss/train': 1.900527000427246} -08/30/2021 15:10:31 - INFO - __main__ - Step 11308: {'lr': 0.0004951371288533182, 'samples': 2171136, 'steps': 11307, 'loss/train': 6.5954670906066895} -08/30/2021 15:10:32 - INFO - __main__ - Step 11309: {'lr': 0.0004951360872069309, 'samples': 2171328, 'steps': 11308, 'loss/train': 1.617108941078186} -08/30/2021 15:10:32 - INFO - __main__ - Step 11310: {'lr': 0.0004951350454500891, 'samples': 2171520, 'steps': 11309, 'loss/train': 1.9250389337539673} -08/30/2021 15:10:32 - INFO - __main__ - Step 11311: {'lr': 0.0004951340035827932, 'samples': 2171712, 'steps': 11310, 'loss/train': 1.5192028284072876} -08/30/2021 15:10:33 - INFO - __main__ - Step 11312: {'lr': 0.0004951329616050437, 'samples': 2171904, 'steps': 11311, 'loss/train': 1.6938209533691406} -08/30/2021 15:10:34 - INFO - __main__ - Step 11313: {'lr': 0.000495131919516841, 'samples': 2172096, 'steps': 11312, 'loss/train': 0.6564881801605225} -08/30/2021 15:10:35 - INFO - __main__ - Step 11314: {'lr': 0.0004951308773181856, 'samples': 2172288, 'steps': 11313, 'loss/train': 1.6009490489959717} -08/30/2021 15:10:35 - INFO - __main__ - Step 11315: {'lr': 0.0004951298350090782, 'samples': 2172480, 'steps': 11314, 'loss/train': 2.257167339324951} -08/30/2021 15:10:35 - INFO - __main__ - Step 11316: {'lr': 0.000495128792589519, 'samples': 2172672, 'steps': 11315, 'loss/train': 1.8359655141830444} -08/30/2021 15:10:36 - INFO - __main__ - Step 11317: {'lr': 0.0004951277500595085, 'samples': 2172864, 'steps': 11316, 'loss/train': 2.183683395385742} -08/30/2021 15:10:37 - INFO - __main__ - Step 11318: {'lr': 0.0004951267074190473, 'samples': 2173056, 'steps': 11317, 'loss/train': 1.9519745111465454} -08/30/2021 15:10:38 - INFO - __main__ - Step 11319: {'lr': 0.0004951256646681356, 'samples': 2173248, 'steps': 11318, 'loss/train': 2.677309036254883} -08/30/2021 15:10:38 - INFO - __main__ - Step 11320: {'lr': 0.0004951246218067744, 'samples': 2173440, 'steps': 11319, 'loss/train': 2.2664835453033447} -08/30/2021 15:10:38 - INFO - __main__ - Step 11321: {'lr': 0.0004951235788349636, 'samples': 2173632, 'steps': 11320, 'loss/train': 1.917419672012329} -08/30/2021 15:10:39 - INFO - __main__ - Step 11322: {'lr': 0.0004951225357527038, 'samples': 2173824, 'steps': 11321, 'loss/train': 2.0854012966156006} -08/30/2021 15:10:40 - INFO - __main__ - Step 11323: {'lr': 0.0004951214925599957, 'samples': 2174016, 'steps': 11322, 'loss/train': 0.2760118246078491} -08/30/2021 15:10:41 - INFO - __main__ - Step 11324: {'lr': 0.0004951204492568397, 'samples': 2174208, 'steps': 11323, 'loss/train': 1.9507191181182861} -08/30/2021 15:10:41 - INFO - __main__ - Step 11325: {'lr': 0.0004951194058432361, 'samples': 2174400, 'steps': 11324, 'loss/train': 2.103816270828247} -08/30/2021 15:10:41 - INFO - __main__ - Step 11326: {'lr': 0.0004951183623191855, 'samples': 2174592, 'steps': 11325, 'loss/train': 2.3394269943237305} -08/30/2021 15:10:42 - INFO - __main__ - Step 11327: {'lr': 0.0004951173186846884, 'samples': 2174784, 'steps': 11326, 'loss/train': 0.3999486565589905} -08/30/2021 15:10:44 - INFO - __main__ - Step 11328: {'lr': 0.0004951162749397452, 'samples': 2174976, 'steps': 11327, 'loss/train': 1.5916470289230347} -08/30/2021 15:10:44 - INFO - __main__ - Step 11329: {'lr': 0.0004951152310843564, 'samples': 2175168, 'steps': 11328, 'loss/train': 1.4261094331741333} -08/30/2021 15:10:44 - INFO - __main__ - Step 11330: {'lr': 0.0004951141871185224, 'samples': 2175360, 'steps': 11329, 'loss/train': 1.7575404644012451} -08/30/2021 15:10:45 - INFO - __main__ - Step 11331: {'lr': 0.0004951131430422438, 'samples': 2175552, 'steps': 11330, 'loss/train': 2.1405422687530518} -08/30/2021 15:10:45 - INFO - __main__ - Step 11332: {'lr': 0.0004951120988555209, 'samples': 2175744, 'steps': 11331, 'loss/train': 1.8434191942214966} -08/30/2021 15:10:45 - INFO - __main__ - Step 11333: {'lr': 0.0004951110545583543, 'samples': 2175936, 'steps': 11332, 'loss/train': 1.2429536581039429} -08/30/2021 15:10:47 - INFO - __main__ - Step 11334: {'lr': 0.0004951100101507445, 'samples': 2176128, 'steps': 11333, 'loss/train': 0.1674688160419464} -08/30/2021 15:10:48 - INFO - __main__ - Step 11335: {'lr': 0.0004951089656326919, 'samples': 2176320, 'steps': 11334, 'loss/train': 1.6125035285949707} -08/30/2021 15:10:48 - INFO - __main__ - Step 11336: {'lr': 0.0004951079210041969, 'samples': 2176512, 'steps': 11335, 'loss/train': 1.5547882318496704} -08/30/2021 15:10:49 - INFO - __main__ - Step 11337: {'lr': 0.0004951068762652602, 'samples': 2176704, 'steps': 11336, 'loss/train': 1.0038021802902222} -08/30/2021 15:10:49 - INFO - __main__ - Step 11338: {'lr': 0.000495105831415882, 'samples': 2176896, 'steps': 11337, 'loss/train': 2.2198216915130615} -08/30/2021 15:10:50 - INFO - __main__ - Step 11339: {'lr': 0.0004951047864560629, 'samples': 2177088, 'steps': 11338, 'loss/train': 1.911068081855774} -08/30/2021 15:10:51 - INFO - __main__ - Step 11340: {'lr': 0.0004951037413858034, 'samples': 2177280, 'steps': 11339, 'loss/train': 1.9215306043624878} -08/30/2021 15:10:51 - INFO - __main__ - Step 11341: {'lr': 0.000495102696205104, 'samples': 2177472, 'steps': 11340, 'loss/train': 1.4014047384262085} -08/30/2021 15:10:51 - INFO - __main__ - Step 11342: {'lr': 0.000495101650913965, 'samples': 2177664, 'steps': 11341, 'loss/train': 1.8121275901794434} -08/30/2021 15:10:52 - INFO - __main__ - Step 11343: {'lr': 0.000495100605512387, 'samples': 2177856, 'steps': 11342, 'loss/train': 1.7509299516677856} -08/30/2021 15:10:53 - INFO - __main__ - Step 11344: {'lr': 0.0004950995600003705, 'samples': 2178048, 'steps': 11343, 'loss/train': 1.6537495851516724} -08/30/2021 15:10:54 - INFO - __main__ - Step 11345: {'lr': 0.0004950985143779159, 'samples': 2178240, 'steps': 11344, 'loss/train': 0.7755739688873291} -08/30/2021 15:10:54 - INFO - __main__ - Step 11346: {'lr': 0.0004950974686450237, 'samples': 2178432, 'steps': 11345, 'loss/train': 1.8410006761550903} -08/30/2021 15:10:54 - INFO - __main__ - Step 11347: {'lr': 0.0004950964228016944, 'samples': 2178624, 'steps': 11346, 'loss/train': 1.2583353519439697} -08/30/2021 15:10:55 - INFO - __main__ - Step 11348: {'lr': 0.0004950953768479284, 'samples': 2178816, 'steps': 11347, 'loss/train': 1.8307527303695679} -08/30/2021 15:10:57 - INFO - __main__ - Step 11349: {'lr': 0.0004950943307837261, 'samples': 2179008, 'steps': 11348, 'loss/train': 1.7371530532836914} -08/30/2021 15:10:57 - INFO - __main__ - Step 11350: {'lr': 0.0004950932846090882, 'samples': 2179200, 'steps': 11349, 'loss/train': 1.1253018379211426} -08/30/2021 15:10:58 - INFO - __main__ - Step 11351: {'lr': 0.000495092238324015, 'samples': 2179392, 'steps': 11350, 'loss/train': 1.8747700452804565} -08/30/2021 15:10:58 - INFO - __main__ - Step 11352: {'lr': 0.0004950911919285071, 'samples': 2179584, 'steps': 11351, 'loss/train': 1.7259424924850464} -08/30/2021 15:10:58 - INFO - __main__ - Step 11353: {'lr': 0.0004950901454225647, 'samples': 2179776, 'steps': 11352, 'loss/train': 1.6113831996917725} -08/30/2021 15:10:59 - INFO - __main__ - Step 11354: {'lr': 0.0004950890988061886, 'samples': 2179968, 'steps': 11353, 'loss/train': 0.8323259949684143} -08/30/2021 15:11:00 - INFO - __main__ - Step 11355: {'lr': 0.0004950880520793791, 'samples': 2180160, 'steps': 11354, 'loss/train': 0.23962008953094482} -08/30/2021 15:11:01 - INFO - __main__ - Step 11356: {'lr': 0.0004950870052421368, 'samples': 2180352, 'steps': 11355, 'loss/train': 2.2951104640960693} -08/30/2021 15:11:01 - INFO - __main__ - Step 11357: {'lr': 0.000495085958294462, 'samples': 2180544, 'steps': 11356, 'loss/train': 1.816585898399353} -08/30/2021 15:11:01 - INFO - __main__ - Step 11358: {'lr': 0.0004950849112363553, 'samples': 2180736, 'steps': 11357, 'loss/train': 2.080604314804077} -08/30/2021 15:11:02 - INFO - __main__ - Step 11359: {'lr': 0.000495083864067817, 'samples': 2180928, 'steps': 11358, 'loss/train': 1.6112520694732666} -08/30/2021 15:11:03 - INFO - __main__ - Step 11360: {'lr': 0.0004950828167888478, 'samples': 2181120, 'steps': 11359, 'loss/train': 1.975584864616394} -08/30/2021 15:11:04 - INFO - __main__ - Step 11361: {'lr': 0.0004950817693994481, 'samples': 2181312, 'steps': 11360, 'loss/train': 1.4203985929489136} -08/30/2021 15:11:04 - INFO - __main__ - Step 11362: {'lr': 0.0004950807218996182, 'samples': 2181504, 'steps': 11361, 'loss/train': 1.7508667707443237} -08/30/2021 15:11:04 - INFO - __main__ - Step 11363: {'lr': 0.0004950796742893588, 'samples': 2181696, 'steps': 11362, 'loss/train': 1.8694329261779785} -08/30/2021 15:11:05 - INFO - __main__ - Step 11364: {'lr': 0.0004950786265686702, 'samples': 2181888, 'steps': 11363, 'loss/train': 2.099109411239624} -08/30/2021 15:11:06 - INFO - __main__ - Step 11365: {'lr': 0.000495077578737553, 'samples': 2182080, 'steps': 11364, 'loss/train': 1.7561641931533813} -08/30/2021 15:11:07 - INFO - __main__ - Step 11366: {'lr': 0.0004950765307960076, 'samples': 2182272, 'steps': 11365, 'loss/train': 2.115619659423828} -08/30/2021 15:11:07 - INFO - __main__ - Step 11367: {'lr': 0.0004950754827440346, 'samples': 2182464, 'steps': 11366, 'loss/train': 2.081895112991333} -08/30/2021 15:11:07 - INFO - __main__ - Step 11368: {'lr': 0.0004950744345816342, 'samples': 2182656, 'steps': 11367, 'loss/train': 2.2468907833099365} -08/30/2021 15:11:08 - INFO - __main__ - Step 11369: {'lr': 0.0004950733863088072, 'samples': 2182848, 'steps': 11368, 'loss/train': 1.8041374683380127} -08/30/2021 15:11:09 - INFO - __main__ - Step 11370: {'lr': 0.0004950723379255538, 'samples': 2183040, 'steps': 11369, 'loss/train': 1.4568737745285034} -08/30/2021 15:11:10 - INFO - __main__ - Step 11371: {'lr': 0.0004950712894318748, 'samples': 2183232, 'steps': 11370, 'loss/train': 1.7635802030563354} -08/30/2021 15:11:10 - INFO - __main__ - Step 11372: {'lr': 0.0004950702408277702, 'samples': 2183424, 'steps': 11371, 'loss/train': 1.8993170261383057} -08/30/2021 15:11:10 - INFO - __main__ - Step 11373: {'lr': 0.0004950691921132409, 'samples': 2183616, 'steps': 11372, 'loss/train': 1.6851987838745117} -08/30/2021 15:11:11 - INFO - __main__ - Step 11374: {'lr': 0.000495068143288287, 'samples': 2183808, 'steps': 11373, 'loss/train': 1.5347603559494019} -08/30/2021 15:11:12 - INFO - __main__ - Step 11375: {'lr': 0.0004950670943529094, 'samples': 2184000, 'steps': 11374, 'loss/train': 0.24422170221805573} -08/30/2021 15:11:12 - INFO - __main__ - Step 11376: {'lr': 0.0004950660453071082, 'samples': 2184192, 'steps': 11375, 'loss/train': 1.4798616170883179} -08/30/2021 15:11:13 - INFO - __main__ - Step 11377: {'lr': 0.0004950649961508841, 'samples': 2184384, 'steps': 11376, 'loss/train': 1.8383647203445435} -08/30/2021 15:11:13 - INFO - __main__ - Step 11378: {'lr': 0.0004950639468842375, 'samples': 2184576, 'steps': 11377, 'loss/train': 1.9406672716140747} -08/30/2021 15:11:14 - INFO - __main__ - Step 11379: {'lr': 0.0004950628975071688, 'samples': 2184768, 'steps': 11378, 'loss/train': 1.8875216245651245} -08/30/2021 15:11:14 - INFO - __main__ - Step 11380: {'lr': 0.0004950618480196785, 'samples': 2184960, 'steps': 11379, 'loss/train': 2.387690305709839} -08/30/2021 15:11:15 - INFO - __main__ - Step 11381: {'lr': 0.0004950607984217674, 'samples': 2185152, 'steps': 11380, 'loss/train': 1.5684969425201416} -08/30/2021 15:11:16 - INFO - __main__ - Step 11382: {'lr': 0.0004950597487134354, 'samples': 2185344, 'steps': 11381, 'loss/train': 1.6480615139007568} -08/30/2021 15:11:16 - INFO - __main__ - Step 11383: {'lr': 0.0004950586988946834, 'samples': 2185536, 'steps': 11382, 'loss/train': 1.244276523590088} -08/30/2021 15:11:17 - INFO - __main__ - Step 11384: {'lr': 0.0004950576489655116, 'samples': 2185728, 'steps': 11383, 'loss/train': 1.6742000579833984} -08/30/2021 15:11:17 - INFO - __main__ - Step 11385: {'lr': 0.0004950565989259207, 'samples': 2185920, 'steps': 11384, 'loss/train': 4.0317583084106445} -08/30/2021 15:11:19 - INFO - __main__ - Step 11386: {'lr': 0.000495055548775911, 'samples': 2186112, 'steps': 11385, 'loss/train': 1.1463463306427002} -08/30/2021 15:11:19 - INFO - __main__ - Step 11387: {'lr': 0.0004950544985154831, 'samples': 2186304, 'steps': 11386, 'loss/train': 2.13299298286438} -08/30/2021 15:11:20 - INFO - __main__ - Step 11388: {'lr': 0.0004950534481446375, 'samples': 2186496, 'steps': 11387, 'loss/train': 1.6333603858947754} -08/30/2021 15:11:20 - INFO - __main__ - Step 11389: {'lr': 0.0004950523976633745, 'samples': 2186688, 'steps': 11388, 'loss/train': 1.558982253074646} -08/30/2021 15:11:21 - INFO - __main__ - Step 11390: {'lr': 0.0004950513470716947, 'samples': 2186880, 'steps': 11389, 'loss/train': 1.686103105545044} -08/30/2021 15:11:22 - INFO - __main__ - Step 11391: {'lr': 0.0004950502963695985, 'samples': 2187072, 'steps': 11390, 'loss/train': 1.4806197881698608} -08/30/2021 15:11:22 - INFO - __main__ - Step 11392: {'lr': 0.0004950492455570865, 'samples': 2187264, 'steps': 11391, 'loss/train': 1.9360294342041016} -08/30/2021 15:11:23 - INFO - __main__ - Step 11393: {'lr': 0.000495048194634159, 'samples': 2187456, 'steps': 11392, 'loss/train': 1.743755578994751} -08/30/2021 15:11:23 - INFO - __main__ - Step 11394: {'lr': 0.0004950471436008167, 'samples': 2187648, 'steps': 11393, 'loss/train': 1.9910410642623901} -08/30/2021 15:11:24 - INFO - __main__ - Step 11395: {'lr': 0.0004950460924570598, 'samples': 2187840, 'steps': 11394, 'loss/train': 1.5394583940505981} -08/30/2021 15:11:25 - INFO - __main__ - Step 11396: {'lr': 0.0004950450412028889, 'samples': 2188032, 'steps': 11395, 'loss/train': 2.050934314727783} -08/30/2021 15:11:26 - INFO - __main__ - Step 11397: {'lr': 0.0004950439898383047, 'samples': 2188224, 'steps': 11396, 'loss/train': 1.9023692607879639} -08/30/2021 15:11:26 - INFO - __main__ - Step 11398: {'lr': 0.0004950429383633073, 'samples': 2188416, 'steps': 11397, 'loss/train': 1.5343270301818848} -08/30/2021 15:11:26 - INFO - __main__ - Step 11399: {'lr': 0.0004950418867778973, 'samples': 2188608, 'steps': 11398, 'loss/train': 1.8388445377349854} -08/30/2021 15:11:27 - INFO - __main__ - Step 11400: {'lr': 0.0004950408350820752, 'samples': 2188800, 'steps': 11399, 'loss/train': 1.4250836372375488} -08/30/2021 15:11:28 - INFO - __main__ - Step 11401: {'lr': 0.0004950397832758415, 'samples': 2188992, 'steps': 11400, 'loss/train': 1.785843849182129} -08/30/2021 15:11:29 - INFO - __main__ - Step 11402: {'lr': 0.0004950387313591968, 'samples': 2189184, 'steps': 11401, 'loss/train': 1.565565824508667} -08/30/2021 15:11:29 - INFO - __main__ - Step 11403: {'lr': 0.0004950376793321413, 'samples': 2189376, 'steps': 11402, 'loss/train': 1.7468514442443848} -08/30/2021 15:11:29 - INFO - __main__ - Step 11404: {'lr': 0.0004950366271946756, 'samples': 2189568, 'steps': 11403, 'loss/train': 2.0025267601013184} -08/30/2021 15:11:30 - INFO - __main__ - Step 11405: {'lr': 0.0004950355749468001, 'samples': 2189760, 'steps': 11404, 'loss/train': 1.8536142110824585} -08/30/2021 15:11:30 - INFO - __main__ - Step 11406: {'lr': 0.0004950345225885155, 'samples': 2189952, 'steps': 11405, 'loss/train': 0.2752886414527893} -08/30/2021 15:11:32 - INFO - __main__ - Step 11407: {'lr': 0.0004950334701198222, 'samples': 2190144, 'steps': 11406, 'loss/train': 2.00809383392334} -08/30/2021 15:11:32 - INFO - __main__ - Step 11408: {'lr': 0.0004950324175407204, 'samples': 2190336, 'steps': 11407, 'loss/train': 1.8668293952941895} -08/30/2021 15:11:33 - INFO - __main__ - Step 11409: {'lr': 0.0004950313648512108, 'samples': 2190528, 'steps': 11408, 'loss/train': 1.761200189590454} -08/30/2021 15:11:33 - INFO - __main__ - Step 11410: {'lr': 0.0004950303120512939, 'samples': 2190720, 'steps': 11409, 'loss/train': 2.185830593109131} -08/30/2021 15:11:33 - INFO - __main__ - Step 11411: {'lr': 0.0004950292591409701, 'samples': 2190912, 'steps': 11410, 'loss/train': 1.8082395792007446} -08/30/2021 15:11:35 - INFO - __main__ - Step 11412: {'lr': 0.0004950282061202399, 'samples': 2191104, 'steps': 11411, 'loss/train': 1.9240211248397827} -08/30/2021 15:11:35 - INFO - __main__ - Step 11413: {'lr': 0.0004950271529891038, 'samples': 2191296, 'steps': 11412, 'loss/train': 2.0106911659240723} -08/30/2021 15:11:35 - INFO - __main__ - Step 11414: {'lr': 0.0004950260997475623, 'samples': 2191488, 'steps': 11413, 'loss/train': 2.187958002090454} -08/30/2021 15:11:36 - INFO - __main__ - Step 11415: {'lr': 0.0004950250463956157, 'samples': 2191680, 'steps': 11414, 'loss/train': 1.452856421470642} -08/30/2021 15:11:36 - INFO - __main__ - Step 11416: {'lr': 0.0004950239929332646, 'samples': 2191872, 'steps': 11415, 'loss/train': 1.5508602857589722} -08/30/2021 15:11:38 - INFO - __main__ - Step 11417: {'lr': 0.0004950229393605095, 'samples': 2192064, 'steps': 11416, 'loss/train': 1.605417013168335} -08/30/2021 15:11:38 - INFO - __main__ - Step 11418: {'lr': 0.0004950218856773509, 'samples': 2192256, 'steps': 11417, 'loss/train': 1.8712059259414673} -08/30/2021 15:11:38 - INFO - __main__ - Step 11419: {'lr': 0.0004950208318837892, 'samples': 2192448, 'steps': 11418, 'loss/train': 1.351062297821045} -08/30/2021 15:11:39 - INFO - __main__ - Step 11420: {'lr': 0.0004950197779798248, 'samples': 2192640, 'steps': 11419, 'loss/train': 2.036375045776367} -08/30/2021 15:11:39 - INFO - __main__ - Step 11421: {'lr': 0.0004950187239654584, 'samples': 2192832, 'steps': 11420, 'loss/train': 1.9271739721298218} -08/30/2021 15:11:40 - INFO - __main__ - Step 11422: {'lr': 0.0004950176698406903, 'samples': 2193024, 'steps': 11421, 'loss/train': 1.716298222541809} -08/30/2021 15:11:41 - INFO - __main__ - Step 11423: {'lr': 0.000495016615605521, 'samples': 2193216, 'steps': 11422, 'loss/train': 1.8552886247634888} -08/30/2021 15:11:41 - INFO - __main__ - Step 11424: {'lr': 0.0004950155612599511, 'samples': 2193408, 'steps': 11423, 'loss/train': 1.9429852962493896} -08/30/2021 15:11:42 - INFO - __main__ - Step 11425: {'lr': 0.0004950145068039808, 'samples': 2193600, 'steps': 11424, 'loss/train': 1.621841311454773} -08/30/2021 15:11:42 - INFO - __main__ - Step 11426: {'lr': 0.0004950134522376108, 'samples': 2193792, 'steps': 11425, 'loss/train': 1.1670444011688232} -08/30/2021 15:11:44 - INFO - __main__ - Step 11427: {'lr': 0.0004950123975608415, 'samples': 2193984, 'steps': 11426, 'loss/train': 1.1248893737792969} -08/30/2021 15:11:44 - INFO - __main__ - Step 11428: {'lr': 0.0004950113427736734, 'samples': 2194176, 'steps': 11427, 'loss/train': 1.8337293863296509} -08/30/2021 15:11:44 - INFO - __main__ - Step 11429: {'lr': 0.000495010287876107, 'samples': 2194368, 'steps': 11428, 'loss/train': 1.7891881465911865} -08/30/2021 15:11:45 - INFO - __main__ - Step 11430: {'lr': 0.0004950092328681428, 'samples': 2194560, 'steps': 11429, 'loss/train': 1.9474878311157227} -08/30/2021 15:11:45 - INFO - __main__ - Step 11431: {'lr': 0.0004950081777497812, 'samples': 2194752, 'steps': 11430, 'loss/train': 0.9480117559432983} -08/30/2021 15:11:47 - INFO - __main__ - Step 11432: {'lr': 0.0004950071225210226, 'samples': 2194944, 'steps': 11431, 'loss/train': 1.7373414039611816} -08/30/2021 15:11:47 - INFO - __main__ - Step 11433: {'lr': 0.0004950060671818676, 'samples': 2195136, 'steps': 11432, 'loss/train': 1.7810802459716797} -08/30/2021 15:11:47 - INFO - __main__ - Step 11434: {'lr': 0.0004950050117323167, 'samples': 2195328, 'steps': 11433, 'loss/train': 0.7894968390464783} -08/30/2021 15:11:48 - INFO - __main__ - Step 11435: {'lr': 0.0004950039561723703, 'samples': 2195520, 'steps': 11434, 'loss/train': 1.410385012626648} -08/30/2021 15:11:48 - INFO - __main__ - Step 11436: {'lr': 0.0004950029005020289, 'samples': 2195712, 'steps': 11435, 'loss/train': 1.2500255107879639} -08/30/2021 15:11:50 - INFO - __main__ - Step 11437: {'lr': 0.0004950018447212929, 'samples': 2195904, 'steps': 11436, 'loss/train': 2.069624423980713} -08/30/2021 15:11:51 - INFO - __main__ - Step 11438: {'lr': 0.000495000788830163, 'samples': 2196096, 'steps': 11437, 'loss/train': 2.014286994934082} -08/30/2021 15:11:51 - INFO - __main__ - Step 11439: {'lr': 0.0004949997328286394, 'samples': 2196288, 'steps': 11438, 'loss/train': 1.1920604705810547} -08/30/2021 15:11:51 - INFO - __main__ - Step 11440: {'lr': 0.0004949986767167228, 'samples': 2196480, 'steps': 11439, 'loss/train': 1.7225277423858643} -08/30/2021 15:11:52 - INFO - __main__ - Step 11441: {'lr': 0.0004949976204944135, 'samples': 2196672, 'steps': 11440, 'loss/train': 1.8489760160446167} -08/30/2021 15:11:52 - INFO - __main__ - Step 11442: {'lr': 0.0004949965641617121, 'samples': 2196864, 'steps': 11441, 'loss/train': 1.3143986463546753} -08/30/2021 15:11:53 - INFO - __main__ - Step 11443: {'lr': 0.000494995507718619, 'samples': 2197056, 'steps': 11442, 'loss/train': 2.4320342540740967} -08/30/2021 15:11:54 - INFO - __main__ - Step 11444: {'lr': 0.0004949944511651347, 'samples': 2197248, 'steps': 11443, 'loss/train': 1.6460480690002441} -08/30/2021 15:11:54 - INFO - __main__ - Step 11445: {'lr': 0.0004949933945012597, 'samples': 2197440, 'steps': 11444, 'loss/train': 2.2736902236938477} -08/30/2021 15:11:55 - INFO - __main__ - Step 11446: {'lr': 0.0004949923377269945, 'samples': 2197632, 'steps': 11445, 'loss/train': 1.8962833881378174} -08/30/2021 15:11:55 - INFO - __main__ - Step 11447: {'lr': 0.0004949912808423394, 'samples': 2197824, 'steps': 11446, 'loss/train': 1.2450982332229614} -08/30/2021 15:11:57 - INFO - __main__ - Step 11448: {'lr': 0.000494990223847295, 'samples': 2198016, 'steps': 11447, 'loss/train': 1.5632365942001343} -08/30/2021 15:11:57 - INFO - __main__ - Step 11449: {'lr': 0.000494989166741862, 'samples': 2198208, 'steps': 11448, 'loss/train': 1.8916257619857788} -08/30/2021 15:11:57 - INFO - __main__ - Step 11450: {'lr': 0.0004949881095260405, 'samples': 2198400, 'steps': 11449, 'loss/train': 1.5801581144332886} -08/30/2021 15:11:58 - INFO - __main__ - Step 11451: {'lr': 0.0004949870521998312, 'samples': 2198592, 'steps': 11450, 'loss/train': 1.127855658531189} -08/30/2021 15:11:58 - INFO - __main__ - Step 11452: {'lr': 0.0004949859947632344, 'samples': 2198784, 'steps': 11451, 'loss/train': 1.5080382823944092} -08/30/2021 15:12:00 - INFO - __main__ - Step 11453: {'lr': 0.0004949849372162509, 'samples': 2198976, 'steps': 11452, 'loss/train': 1.588152289390564} -08/30/2021 15:12:00 - INFO - __main__ - Step 11454: {'lr': 0.0004949838795588808, 'samples': 2199168, 'steps': 11453, 'loss/train': 1.9238343238830566} -08/30/2021 15:12:00 - INFO - __main__ - Step 11455: {'lr': 0.0004949828217911248, 'samples': 2199360, 'steps': 11454, 'loss/train': 1.08119535446167} -08/30/2021 15:12:01 - INFO - __main__ - Step 11456: {'lr': 0.0004949817639129832, 'samples': 2199552, 'steps': 11455, 'loss/train': 1.9389153718948364} -08/30/2021 15:12:01 - INFO - __main__ - Step 11457: {'lr': 0.0004949807059244568, 'samples': 2199744, 'steps': 11456, 'loss/train': 1.6951968669891357} -08/30/2021 15:12:03 - INFO - __main__ - Step 11458: {'lr': 0.0004949796478255458, 'samples': 2199936, 'steps': 11457, 'loss/train': 1.8409918546676636} -08/30/2021 15:12:04 - INFO - __main__ - Step 11459: {'lr': 0.0004949785896162507, 'samples': 2200128, 'steps': 11458, 'loss/train': 0.18376825749874115} -08/30/2021 15:12:04 - INFO - __main__ - Step 11460: {'lr': 0.0004949775312965721, 'samples': 2200320, 'steps': 11459, 'loss/train': 0.5928048491477966} -08/30/2021 15:12:04 - INFO - __main__ - Step 11461: {'lr': 0.0004949764728665103, 'samples': 2200512, 'steps': 11460, 'loss/train': 2.0808823108673096} -08/30/2021 15:12:05 - INFO - __main__ - Step 11462: {'lr': 0.000494975414326066, 'samples': 2200704, 'steps': 11461, 'loss/train': 1.1502190828323364} -08/30/2021 15:12:05 - INFO - __main__ - Step 11463: {'lr': 0.0004949743556752395, 'samples': 2200896, 'steps': 11462, 'loss/train': 2.22263240814209} -08/30/2021 15:12:06 - INFO - __main__ - Step 11464: {'lr': 0.0004949732969140313, 'samples': 2201088, 'steps': 11463, 'loss/train': 1.1926612854003906} -08/30/2021 15:12:07 - INFO - __main__ - Step 11465: {'lr': 0.000494972238042442, 'samples': 2201280, 'steps': 11464, 'loss/train': 1.6181837320327759} -08/30/2021 15:12:07 - INFO - __main__ - Step 11466: {'lr': 0.0004949711790604719, 'samples': 2201472, 'steps': 11465, 'loss/train': 2.271275520324707} -08/30/2021 15:12:08 - INFO - __main__ - Step 11467: {'lr': 0.0004949701199681217, 'samples': 2201664, 'steps': 11466, 'loss/train': 2.116138458251953} -08/30/2021 15:12:08 - INFO - __main__ - Step 11468: {'lr': 0.0004949690607653916, 'samples': 2201856, 'steps': 11467, 'loss/train': 2.0212857723236084} -08/30/2021 15:12:08 - INFO - __main__ - Step 11469: {'lr': 0.0004949680014522822, 'samples': 2202048, 'steps': 11468, 'loss/train': 2.1533942222595215} -08/30/2021 15:12:10 - INFO - __main__ - Step 11470: {'lr': 0.0004949669420287941, 'samples': 2202240, 'steps': 11469, 'loss/train': 1.9581927061080933} -08/30/2021 15:12:10 - INFO - __main__ - Step 11471: {'lr': 0.0004949658824949277, 'samples': 2202432, 'steps': 11470, 'loss/train': 1.466626763343811} -08/30/2021 15:12:11 - INFO - __main__ - Step 11472: {'lr': 0.0004949648228506834, 'samples': 2202624, 'steps': 11471, 'loss/train': 2.671245574951172} -08/30/2021 15:12:11 - INFO - __main__ - Step 11473: {'lr': 0.0004949637630960618, 'samples': 2202816, 'steps': 11472, 'loss/train': 1.816586971282959} -08/30/2021 15:12:11 - INFO - __main__ - Step 11474: {'lr': 0.0004949627032310632, 'samples': 2203008, 'steps': 11473, 'loss/train': 2.005235195159912} -08/30/2021 15:12:13 - INFO - __main__ - Step 11475: {'lr': 0.0004949616432556882, 'samples': 2203200, 'steps': 11474, 'loss/train': 1.8697184324264526} -08/30/2021 15:12:13 - INFO - __main__ - Step 11476: {'lr': 0.0004949605831699373, 'samples': 2203392, 'steps': 11475, 'loss/train': 1.800644874572754} -08/30/2021 15:12:14 - INFO - __main__ - Step 11477: {'lr': 0.000494959522973811, 'samples': 2203584, 'steps': 11476, 'loss/train': 2.8131799697875977} -08/30/2021 15:12:14 - INFO - __main__ - Step 11478: {'lr': 0.0004949584626673096, 'samples': 2203776, 'steps': 11477, 'loss/train': 1.9296927452087402} -08/30/2021 15:12:14 - INFO - __main__ - Step 11479: {'lr': 0.0004949574022504338, 'samples': 2203968, 'steps': 11478, 'loss/train': 2.1797196865081787} -08/30/2021 15:12:15 - INFO - __main__ - Step 11480: {'lr': 0.0004949563417231838, 'samples': 2204160, 'steps': 11479, 'loss/train': 1.968984842300415} -08/30/2021 15:12:16 - INFO - __main__ - Step 11481: {'lr': 0.0004949552810855605, 'samples': 2204352, 'steps': 11480, 'loss/train': 1.8311598300933838} -08/30/2021 15:12:17 - INFO - __main__ - Step 11482: {'lr': 0.000494954220337564, 'samples': 2204544, 'steps': 11481, 'loss/train': 2.0590016841888428} -08/30/2021 15:12:17 - INFO - __main__ - Step 11483: {'lr': 0.0004949531594791948, 'samples': 2204736, 'steps': 11482, 'loss/train': 2.3185112476348877} -08/30/2021 15:12:18 - INFO - __main__ - Step 11484: {'lr': 0.0004949520985104536, 'samples': 2204928, 'steps': 11483, 'loss/train': 3.4016640186309814} -08/30/2021 15:12:18 - INFO - __main__ - Step 11485: {'lr': 0.0004949510374313409, 'samples': 2205120, 'steps': 11484, 'loss/train': 2.110018014907837} -08/30/2021 15:12:19 - INFO - __main__ - Step 11486: {'lr': 0.0004949499762418568, 'samples': 2205312, 'steps': 11485, 'loss/train': 1.697204828262329} -08/30/2021 15:12:20 - INFO - __main__ - Step 11487: {'lr': 0.0004949489149420021, 'samples': 2205504, 'steps': 11486, 'loss/train': 1.617307424545288} -08/30/2021 15:12:20 - INFO - __main__ - Step 11488: {'lr': 0.0004949478535317773, 'samples': 2205696, 'steps': 11487, 'loss/train': 2.041067600250244} -08/30/2021 15:12:21 - INFO - __main__ - Step 11489: {'lr': 0.0004949467920111827, 'samples': 2205888, 'steps': 11488, 'loss/train': 1.648711919784546} -08/30/2021 15:12:21 - INFO - __main__ - Step 11490: {'lr': 0.0004949457303802189, 'samples': 2206080, 'steps': 11489, 'loss/train': 2.0404109954833984} -08/30/2021 15:12:22 - INFO - __main__ - Step 11491: {'lr': 0.0004949446686388862, 'samples': 2206272, 'steps': 11490, 'loss/train': 2.035813093185425} -08/30/2021 15:12:23 - INFO - __main__ - Step 11492: {'lr': 0.0004949436067871854, 'samples': 2206464, 'steps': 11491, 'loss/train': 1.2325630187988281} -08/30/2021 15:12:23 - INFO - __main__ - Step 11493: {'lr': 0.0004949425448251166, 'samples': 2206656, 'steps': 11492, 'loss/train': 1.953182578086853} -08/30/2021 15:12:24 - INFO - __main__ - Step 11494: {'lr': 0.0004949414827526805, 'samples': 2206848, 'steps': 11493, 'loss/train': 1.9621326923370361} -08/30/2021 15:12:24 - INFO - __main__ - Step 11495: {'lr': 0.0004949404205698777, 'samples': 2207040, 'steps': 11494, 'loss/train': 2.5060646533966064} -08/30/2021 15:12:26 - INFO - __main__ - Step 11496: {'lr': 0.0004949393582767084, 'samples': 2207232, 'steps': 11495, 'loss/train': 1.8357990980148315} -08/30/2021 15:12:27 - INFO - __main__ - Step 11497: {'lr': 0.0004949382958731733, 'samples': 2207424, 'steps': 11496, 'loss/train': 0.8789867758750916} -08/30/2021 15:12:27 - INFO - __main__ - Step 11498: {'lr': 0.0004949372333592728, 'samples': 2207616, 'steps': 11497, 'loss/train': 1.5982937812805176} -08/30/2021 15:12:27 - INFO - __main__ - Step 11499: {'lr': 0.0004949361707350072, 'samples': 2207808, 'steps': 11498, 'loss/train': 1.4534696340560913} -08/30/2021 15:12:28 - INFO - __main__ - Step 11500: {'lr': 0.0004949351080003773, 'samples': 2208000, 'steps': 11499, 'loss/train': 2.250380516052246} -08/30/2021 15:12:29 - INFO - __main__ - Step 11501: {'lr': 0.0004949340451553833, 'samples': 2208192, 'steps': 11500, 'loss/train': 1.8547236919403076} -08/30/2021 15:12:30 - INFO - __main__ - Step 11502: {'lr': 0.0004949329822000259, 'samples': 2208384, 'steps': 11501, 'loss/train': 1.9595515727996826} -08/30/2021 15:12:30 - INFO - __main__ - Step 11503: {'lr': 0.0004949319191343053, 'samples': 2208576, 'steps': 11502, 'loss/train': 1.8780261278152466} -08/30/2021 15:12:30 - INFO - __main__ - Step 11504: {'lr': 0.0004949308559582224, 'samples': 2208768, 'steps': 11503, 'loss/train': 2.0255348682403564} -08/30/2021 15:12:31 - INFO - __main__ - Step 11505: {'lr': 0.0004949297926717772, 'samples': 2208960, 'steps': 11504, 'loss/train': 1.9734972715377808} -08/30/2021 15:12:32 - INFO - __main__ - Step 11506: {'lr': 0.0004949287292749705, 'samples': 2209152, 'steps': 11505, 'loss/train': 2.2389514446258545} -08/30/2021 15:12:33 - INFO - __main__ - Step 11507: {'lr': 0.0004949276657678028, 'samples': 2209344, 'steps': 11506, 'loss/train': 1.9121968746185303} -08/30/2021 15:12:33 - INFO - __main__ - Step 11508: {'lr': 0.0004949266021502744, 'samples': 2209536, 'steps': 11507, 'loss/train': 2.019136428833008} -08/30/2021 15:12:34 - INFO - __main__ - Step 11509: {'lr': 0.0004949255384223859, 'samples': 2209728, 'steps': 11508, 'loss/train': 1.6755554676055908} -08/30/2021 15:12:34 - INFO - __main__ - Step 11510: {'lr': 0.0004949244745841377, 'samples': 2209920, 'steps': 11509, 'loss/train': 1.882054090499878} -08/30/2021 15:12:34 - INFO - __main__ - Step 11511: {'lr': 0.0004949234106355302, 'samples': 2210112, 'steps': 11510, 'loss/train': 2.2465193271636963} -08/30/2021 15:12:36 - INFO - __main__ - Step 11512: {'lr': 0.0004949223465765642, 'samples': 2210304, 'steps': 11511, 'loss/train': 0.22742246091365814} -08/30/2021 15:12:36 - INFO - __main__ - Step 11513: {'lr': 0.0004949212824072398, 'samples': 2210496, 'steps': 11512, 'loss/train': 2.0608224868774414} -08/30/2021 15:12:36 - INFO - __main__ - Step 11514: {'lr': 0.0004949202181275577, 'samples': 2210688, 'steps': 11513, 'loss/train': 2.3194799423217773} -08/30/2021 15:12:37 - INFO - __main__ - Step 11515: {'lr': 0.0004949191537375184, 'samples': 2210880, 'steps': 11514, 'loss/train': 1.2681190967559814} -08/30/2021 15:12:37 - INFO - __main__ - Step 11516: {'lr': 0.0004949180892371223, 'samples': 2211072, 'steps': 11515, 'loss/train': 2.259357213973999} -08/30/2021 15:12:39 - INFO - __main__ - Step 11517: {'lr': 0.0004949170246263697, 'samples': 2211264, 'steps': 11516, 'loss/train': 2.110447645187378} -08/30/2021 15:12:40 - INFO - __main__ - Step 11518: {'lr': 0.0004949159599052614, 'samples': 2211456, 'steps': 11517, 'loss/train': 1.9945828914642334} -08/30/2021 15:12:40 - INFO - __main__ - Step 11519: {'lr': 0.0004949148950737978, 'samples': 2211648, 'steps': 11518, 'loss/train': 1.3599166870117188} -08/30/2021 15:12:40 - INFO - __main__ - Step 11520: {'lr': 0.0004949138301319793, 'samples': 2211840, 'steps': 11519, 'loss/train': 1.9862539768218994} -08/30/2021 15:12:41 - INFO - __main__ - Step 11521: {'lr': 0.0004949127650798063, 'samples': 2212032, 'steps': 11520, 'loss/train': 1.6792529821395874} -08/30/2021 15:12:42 - INFO - __main__ - Step 11522: {'lr': 0.0004949116999172795, 'samples': 2212224, 'steps': 11521, 'loss/train': 0.1359776258468628} -08/30/2021 15:12:43 - INFO - __main__ - Step 11523: {'lr': 0.0004949106346443992, 'samples': 2212416, 'steps': 11522, 'loss/train': 1.5791847705841064} -08/30/2021 15:12:43 - INFO - __main__ - Step 11524: {'lr': 0.0004949095692611661, 'samples': 2212608, 'steps': 11523, 'loss/train': 1.855224847793579} -08/30/2021 15:12:43 - INFO - __main__ - Step 11525: {'lr': 0.0004949085037675803, 'samples': 2212800, 'steps': 11524, 'loss/train': 0.5812322497367859} -08/30/2021 15:12:44 - INFO - __main__ - Step 11526: {'lr': 0.0004949074381636427, 'samples': 2212992, 'steps': 11525, 'loss/train': 1.8495157957077026} -08/30/2021 15:12:45 - INFO - __main__ - Step 11527: {'lr': 0.0004949063724493534, 'samples': 2213184, 'steps': 11526, 'loss/train': 1.6610225439071655} -08/30/2021 15:12:46 - INFO - __main__ - Step 11528: {'lr': 0.0004949053066247133, 'samples': 2213376, 'steps': 11527, 'loss/train': 1.7594808340072632} -08/30/2021 15:12:46 - INFO - __main__ - Step 11529: {'lr': 0.0004949042406897225, 'samples': 2213568, 'steps': 11528, 'loss/train': 1.9221631288528442} -08/30/2021 15:12:46 - INFO - __main__ - Step 11530: {'lr': 0.0004949031746443816, 'samples': 2213760, 'steps': 11529, 'loss/train': 2.2979493141174316} -08/30/2021 15:12:47 - INFO - __main__ - Step 11531: {'lr': 0.0004949021084886912, 'samples': 2213952, 'steps': 11530, 'loss/train': 1.7816247940063477} -08/30/2021 15:12:47 - INFO - __main__ - Step 11532: {'lr': 0.0004949010422226517, 'samples': 2214144, 'steps': 11531, 'loss/train': 1.6920993328094482} -08/30/2021 15:12:48 - INFO - __main__ - Step 11533: {'lr': 0.0004948999758462634, 'samples': 2214336, 'steps': 11532, 'loss/train': 1.6868573427200317} -08/30/2021 15:12:49 - INFO - __main__ - Step 11534: {'lr': 0.000494898909359527, 'samples': 2214528, 'steps': 11533, 'loss/train': 1.9775546789169312} -08/30/2021 15:12:49 - INFO - __main__ - Step 11535: {'lr': 0.0004948978427624431, 'samples': 2214720, 'steps': 11534, 'loss/train': 1.809630274772644} -08/30/2021 15:12:50 - INFO - __main__ - Step 11536: {'lr': 0.0004948967760550119, 'samples': 2214912, 'steps': 11535, 'loss/train': 1.6731148958206177} -08/30/2021 15:12:50 - INFO - __main__ - Step 11537: {'lr': 0.000494895709237234, 'samples': 2215104, 'steps': 11536, 'loss/train': 0.14407263696193695} -08/30/2021 15:12:52 - INFO - __main__ - Step 11538: {'lr': 0.0004948946423091099, 'samples': 2215296, 'steps': 11537, 'loss/train': 1.6394861936569214} -08/30/2021 15:12:52 - INFO - __main__ - Step 11539: {'lr': 0.0004948935752706401, 'samples': 2215488, 'steps': 11538, 'loss/train': 1.3665229082107544} -08/30/2021 15:12:52 - INFO - __main__ - Step 11540: {'lr': 0.0004948925081218248, 'samples': 2215680, 'steps': 11539, 'loss/train': 1.4844862222671509} -08/30/2021 15:12:53 - INFO - __main__ - Step 11541: {'lr': 0.000494891440862665, 'samples': 2215872, 'steps': 11540, 'loss/train': 1.7068301439285278} -08/30/2021 15:12:53 - INFO - __main__ - Step 11542: {'lr': 0.0004948903734931608, 'samples': 2216064, 'steps': 11541, 'loss/train': 1.3557708263397217} -08/30/2021 15:12:55 - INFO - __main__ - Step 11543: {'lr': 0.0004948893060133128, 'samples': 2216256, 'steps': 11542, 'loss/train': 0.9980223178863525} -08/30/2021 15:12:56 - INFO - __main__ - Step 11544: {'lr': 0.0004948882384231213, 'samples': 2216448, 'steps': 11543, 'loss/train': 1.9851670265197754} -08/30/2021 15:12:56 - INFO - __main__ - Step 11545: {'lr': 0.0004948871707225871, 'samples': 2216640, 'steps': 11544, 'loss/train': 1.6814534664154053} -08/30/2021 15:12:56 - INFO - __main__ - Step 11546: {'lr': 0.0004948861029117104, 'samples': 2216832, 'steps': 11545, 'loss/train': 2.059412717819214} -08/30/2021 15:12:57 - INFO - __main__ - Step 11547: {'lr': 0.0004948850349904919, 'samples': 2217024, 'steps': 11546, 'loss/train': 1.3900164365768433} -08/30/2021 15:12:57 - INFO - __main__ - Step 11548: {'lr': 0.0004948839669589319, 'samples': 2217216, 'steps': 11547, 'loss/train': 2.05084228515625} -08/30/2021 15:12:57 - INFO - __main__ - Step 11549: {'lr': 0.000494882898817031, 'samples': 2217408, 'steps': 11548, 'loss/train': 0.1329517364501953} -08/30/2021 15:12:59 - INFO - __main__ - Step 11550: {'lr': 0.0004948818305647897, 'samples': 2217600, 'steps': 11549, 'loss/train': 0.5742965340614319} -08/30/2021 15:13:00 - INFO - __main__ - Step 11551: {'lr': 0.0004948807622022083, 'samples': 2217792, 'steps': 11550, 'loss/train': 1.0276354551315308} -08/30/2021 15:13:00 - INFO - __main__ - Step 11552: {'lr': 0.0004948796937292875, 'samples': 2217984, 'steps': 11551, 'loss/train': 2.0554378032684326} -08/30/2021 15:13:01 - INFO - __main__ - Step 11553: {'lr': 0.0004948786251460277, 'samples': 2218176, 'steps': 11552, 'loss/train': 1.0231890678405762} -08/30/2021 15:13:01 - INFO - __main__ - Step 11554: {'lr': 0.0004948775564524294, 'samples': 2218368, 'steps': 11553, 'loss/train': 1.4752169847488403} -08/30/2021 15:13:03 - INFO - __main__ - Step 11555: {'lr': 0.000494876487648493, 'samples': 2218560, 'steps': 11554, 'loss/train': 1.8001103401184082} -08/30/2021 15:13:03 - INFO - __main__ - Step 11556: {'lr': 0.0004948754187342189, 'samples': 2218752, 'steps': 11555, 'loss/train': 1.4499326944351196} -08/30/2021 15:13:03 - INFO - __main__ - Step 11557: {'lr': 0.0004948743497096079, 'samples': 2218944, 'steps': 11556, 'loss/train': 1.8420255184173584} -08/30/2021 15:13:04 - INFO - __main__ - Step 11558: {'lr': 0.0004948732805746604, 'samples': 2219136, 'steps': 11557, 'loss/train': 2.243739128112793} -08/30/2021 15:13:04 - INFO - __main__ - Step 11559: {'lr': 0.0004948722113293766, 'samples': 2219328, 'steps': 11558, 'loss/train': 1.9791109561920166} -08/30/2021 15:13:06 - INFO - __main__ - Step 11560: {'lr': 0.000494871141973757, 'samples': 2219520, 'steps': 11559, 'loss/train': 1.691980242729187} -08/30/2021 15:13:06 - INFO - __main__ - Step 11561: {'lr': 0.0004948700725078025, 'samples': 2219712, 'steps': 11560, 'loss/train': 1.6796391010284424} -08/30/2021 15:13:06 - INFO - __main__ - Step 11562: {'lr': 0.0004948690029315133, 'samples': 2219904, 'steps': 11561, 'loss/train': 2.0924324989318848} -08/30/2021 15:13:07 - INFO - __main__ - Step 11563: {'lr': 0.0004948679332448899, 'samples': 2220096, 'steps': 11562, 'loss/train': 1.923234224319458} -08/30/2021 15:13:07 - INFO - __main__ - Step 11564: {'lr': 0.0004948668634479327, 'samples': 2220288, 'steps': 11563, 'loss/train': 1.7105976343154907} -08/30/2021 15:13:09 - INFO - __main__ - Step 11565: {'lr': 0.0004948657935406423, 'samples': 2220480, 'steps': 11564, 'loss/train': 1.4222297668457031} -08/30/2021 15:13:09 - INFO - __main__ - Step 11566: {'lr': 0.0004948647235230192, 'samples': 2220672, 'steps': 11565, 'loss/train': 0.7465553283691406} -08/30/2021 15:13:09 - INFO - __main__ - Step 11567: {'lr': 0.0004948636533950638, 'samples': 2220864, 'steps': 11566, 'loss/train': 1.5538454055786133} -08/30/2021 15:13:10 - INFO - __main__ - Step 11568: {'lr': 0.0004948625831567766, 'samples': 2221056, 'steps': 11567, 'loss/train': 1.9415048360824585} -08/30/2021 15:13:10 - INFO - __main__ - Step 11569: {'lr': 0.000494861512808158, 'samples': 2221248, 'steps': 11568, 'loss/train': 0.1553996354341507} -08/30/2021 15:13:12 - INFO - __main__ - Step 11570: {'lr': 0.0004948604423492088, 'samples': 2221440, 'steps': 11569, 'loss/train': 1.7491966485977173} -08/30/2021 15:13:12 - INFO - __main__ - Step 11571: {'lr': 0.0004948593717799292, 'samples': 2221632, 'steps': 11570, 'loss/train': 2.1043777465820312} -08/30/2021 15:13:13 - INFO - __main__ - Step 11572: {'lr': 0.0004948583011003196, 'samples': 2221824, 'steps': 11571, 'loss/train': 1.8829469680786133} -08/30/2021 15:13:13 - INFO - __main__ - Step 11573: {'lr': 0.0004948572303103808, 'samples': 2222016, 'steps': 11572, 'loss/train': 1.7994927167892456} -08/30/2021 15:13:13 - INFO - __main__ - Step 11574: {'lr': 0.0004948561594101129, 'samples': 2222208, 'steps': 11573, 'loss/train': 0.2517626881599426} -08/30/2021 15:13:15 - INFO - __main__ - Step 11575: {'lr': 0.0004948550883995168, 'samples': 2222400, 'steps': 11574, 'loss/train': 1.8151077032089233} -08/30/2021 15:13:15 - INFO - __main__ - Step 11576: {'lr': 0.0004948540172785927, 'samples': 2222592, 'steps': 11575, 'loss/train': 1.1062935590744019} -08/30/2021 15:13:16 - INFO - __main__ - Step 11577: {'lr': 0.0004948529460473412, 'samples': 2222784, 'steps': 11576, 'loss/train': 1.9714395999908447} -08/30/2021 15:13:16 - INFO - __main__ - Step 11578: {'lr': 0.0004948518747057626, 'samples': 2222976, 'steps': 11577, 'loss/train': 2.0570592880249023} -08/30/2021 15:13:17 - INFO - __main__ - Step 11579: {'lr': 0.0004948508032538578, 'samples': 2223168, 'steps': 11578, 'loss/train': 1.7397583723068237} -08/30/2021 15:13:19 - INFO - __main__ - Step 11580: {'lr': 0.0004948497316916267, 'samples': 2223360, 'steps': 11579, 'loss/train': 1.615159273147583} -08/30/2021 15:13:20 - INFO - __main__ - Step 11581: {'lr': 0.0004948486600190702, 'samples': 2223552, 'steps': 11580, 'loss/train': 1.557171106338501} -08/30/2021 15:13:20 - INFO - __main__ - Step 11582: {'lr': 0.0004948475882361888, 'samples': 2223744, 'steps': 11581, 'loss/train': 1.523047685623169} -08/30/2021 15:13:20 - INFO - __main__ - Step 11583: {'lr': 0.0004948465163429828, 'samples': 2223936, 'steps': 11582, 'loss/train': 1.893827199935913} -08/30/2021 15:13:21 - INFO - __main__ - Step 11584: {'lr': 0.0004948454443394527, 'samples': 2224128, 'steps': 11583, 'loss/train': 2.1726720333099365} -08/30/2021 15:13:21 - INFO - __main__ - Step 11585: {'lr': 0.000494844372225599, 'samples': 2224320, 'steps': 11584, 'loss/train': 1.9161070585250854} -08/30/2021 15:13:21 - INFO - __main__ - Step 11586: {'lr': 0.0004948433000014222, 'samples': 2224512, 'steps': 11585, 'loss/train': 1.873349666595459} -08/30/2021 15:13:22 - INFO - __main__ - Step 11587: {'lr': 0.0004948422276669228, 'samples': 2224704, 'steps': 11586, 'loss/train': 1.187298059463501} -08/30/2021 15:13:23 - INFO - __main__ - Step 11588: {'lr': 0.0004948411552221012, 'samples': 2224896, 'steps': 11587, 'loss/train': 1.4286316633224487} -08/30/2021 15:13:24 - INFO - __main__ - Step 11589: {'lr': 0.000494840082666958, 'samples': 2225088, 'steps': 11588, 'loss/train': 1.7936506271362305} -08/30/2021 15:13:24 - INFO - __main__ - Step 11590: {'lr': 0.0004948390100014937, 'samples': 2225280, 'steps': 11589, 'loss/train': 1.4247270822525024} -08/30/2021 15:13:24 - INFO - __main__ - Step 11591: {'lr': 0.0004948379372257086, 'samples': 2225472, 'steps': 11590, 'loss/train': 1.708005428314209} -08/30/2021 15:13:25 - INFO - __main__ - Step 11592: {'lr': 0.0004948368643396035, 'samples': 2225664, 'steps': 11591, 'loss/train': 2.1636524200439453} -08/30/2021 15:13:27 - INFO - __main__ - Step 11593: {'lr': 0.0004948357913431786, 'samples': 2225856, 'steps': 11592, 'loss/train': 2.1388227939605713} -08/30/2021 15:13:27 - INFO - __main__ - Step 11594: {'lr': 0.0004948347182364344, 'samples': 2226048, 'steps': 11593, 'loss/train': 2.0362439155578613} -08/30/2021 15:13:27 - INFO - __main__ - Step 11595: {'lr': 0.0004948336450193715, 'samples': 2226240, 'steps': 11594, 'loss/train': 1.5221621990203857} -08/30/2021 15:13:28 - INFO - __main__ - Step 11596: {'lr': 0.0004948325716919904, 'samples': 2226432, 'steps': 11595, 'loss/train': 1.754105806350708} -08/30/2021 15:13:28 - INFO - __main__ - Step 11597: {'lr': 0.0004948314982542914, 'samples': 2226624, 'steps': 11596, 'loss/train': 1.9655364751815796} -08/30/2021 15:13:28 - INFO - __main__ - Step 11598: {'lr': 0.0004948304247062752, 'samples': 2226816, 'steps': 11597, 'loss/train': 1.792184591293335} -08/30/2021 15:13:30 - INFO - __main__ - Step 11599: {'lr': 0.0004948293510479421, 'samples': 2227008, 'steps': 11598, 'loss/train': 0.968758761882782} -08/30/2021 15:13:31 - INFO - __main__ - Step 11600: {'lr': 0.0004948282772792927, 'samples': 2227200, 'steps': 11599, 'loss/train': 1.2551875114440918} -08/30/2021 15:13:31 - INFO - __main__ - Step 11601: {'lr': 0.0004948272034003275, 'samples': 2227392, 'steps': 11600, 'loss/train': 1.6902942657470703} -08/30/2021 15:13:31 - INFO - __main__ - Step 11602: {'lr': 0.000494826129411047, 'samples': 2227584, 'steps': 11601, 'loss/train': 0.12489646673202515} -08/30/2021 15:13:32 - INFO - __main__ - Step 11603: {'lr': 0.0004948250553114516, 'samples': 2227776, 'steps': 11602, 'loss/train': 0.17888374626636505} -08/30/2021 15:13:32 - INFO - __main__ - Step 11604: {'lr': 0.0004948239811015416, 'samples': 2227968, 'steps': 11603, 'loss/train': 1.967453956604004} -08/30/2021 15:13:34 - INFO - __main__ - Step 11605: {'lr': 0.0004948229067813179, 'samples': 2228160, 'steps': 11604, 'loss/train': 1.8223035335540771} -08/30/2021 15:13:35 - INFO - __main__ - Step 11606: {'lr': 0.0004948218323507807, 'samples': 2228352, 'steps': 11605, 'loss/train': 2.1264188289642334} -08/30/2021 15:13:35 - INFO - __main__ - Step 11607: {'lr': 0.0004948207578099306, 'samples': 2228544, 'steps': 11606, 'loss/train': 1.6417908668518066} -08/30/2021 15:13:36 - INFO - __main__ - Step 11608: {'lr': 0.000494819683158768, 'samples': 2228736, 'steps': 11607, 'loss/train': 2.1653733253479004} -08/30/2021 15:13:36 - INFO - __main__ - Step 11609: {'lr': 0.0004948186083972934, 'samples': 2228928, 'steps': 11608, 'loss/train': 0.1120835468173027} -08/30/2021 15:13:38 - INFO - __main__ - Step 11610: {'lr': 0.0004948175335255075, 'samples': 2229120, 'steps': 11609, 'loss/train': 1.5846641063690186} -08/30/2021 15:13:38 - INFO - __main__ - Step 11611: {'lr': 0.0004948164585434104, 'samples': 2229312, 'steps': 11610, 'loss/train': 1.7049683332443237} -08/30/2021 15:13:38 - INFO - __main__ - Step 11612: {'lr': 0.0004948153834510028, 'samples': 2229504, 'steps': 11611, 'loss/train': 0.3726326823234558} -08/30/2021 15:13:39 - INFO - __main__ - Step 11613: {'lr': 0.0004948143082482852, 'samples': 2229696, 'steps': 11612, 'loss/train': 1.0084137916564941} -08/30/2021 15:13:39 - INFO - __main__ - Step 11614: {'lr': 0.0004948132329352582, 'samples': 2229888, 'steps': 11613, 'loss/train': 2.300612688064575} -08/30/2021 15:13:39 - INFO - __main__ - Step 11615: {'lr': 0.0004948121575119219, 'samples': 2230080, 'steps': 11614, 'loss/train': 2.115280866622925} -08/30/2021 15:13:41 - INFO - __main__ - Step 11616: {'lr': 0.0004948110819782771, 'samples': 2230272, 'steps': 11615, 'loss/train': 1.264095664024353} -08/30/2021 15:13:41 - INFO - __main__ - Step 11617: {'lr': 0.0004948100063343243, 'samples': 2230464, 'steps': 11616, 'loss/train': 1.8612920045852661} -08/30/2021 15:13:42 - INFO - __main__ - Step 11618: {'lr': 0.0004948089305800638, 'samples': 2230656, 'steps': 11617, 'loss/train': 2.0519583225250244} -08/30/2021 15:13:42 - INFO - __main__ - Step 11619: {'lr': 0.0004948078547154962, 'samples': 2230848, 'steps': 11618, 'loss/train': 0.6256502866744995} -08/30/2021 15:13:42 - INFO - __main__ - Step 11620: {'lr': 0.0004948067787406219, 'samples': 2231040, 'steps': 11619, 'loss/train': 1.9627830982208252} -08/30/2021 15:13:44 - INFO - __main__ - Step 11621: {'lr': 0.0004948057026554415, 'samples': 2231232, 'steps': 11620, 'loss/train': 1.6287304162979126} -08/30/2021 15:13:45 - INFO - __main__ - Step 11622: {'lr': 0.0004948046264599554, 'samples': 2231424, 'steps': 11621, 'loss/train': 1.494590401649475} -08/30/2021 15:13:45 - INFO - __main__ - Step 11623: {'lr': 0.0004948035501541641, 'samples': 2231616, 'steps': 11622, 'loss/train': 1.9254127740859985} -08/30/2021 15:13:45 - INFO - __main__ - Step 11624: {'lr': 0.0004948024737380681, 'samples': 2231808, 'steps': 11623, 'loss/train': 1.5182067155838013} -08/30/2021 15:13:46 - INFO - __main__ - Step 11625: {'lr': 0.000494801397211668, 'samples': 2232000, 'steps': 11624, 'loss/train': 2.621610641479492} -08/30/2021 15:13:47 - INFO - __main__ - Step 11626: {'lr': 0.000494800320574964, 'samples': 2232192, 'steps': 11625, 'loss/train': 1.7660281658172607} -08/30/2021 15:13:47 - INFO - __main__ - Step 11627: {'lr': 0.0004947992438279568, 'samples': 2232384, 'steps': 11626, 'loss/train': 2.1557624340057373} -08/30/2021 15:13:48 - INFO - __main__ - Step 11628: {'lr': 0.0004947981669706469, 'samples': 2232576, 'steps': 11627, 'loss/train': 1.7714815139770508} -08/30/2021 15:13:48 - INFO - __main__ - Step 11629: {'lr': 0.0004947970900030346, 'samples': 2232768, 'steps': 11628, 'loss/train': 1.6118674278259277} -08/30/2021 15:13:49 - INFO - __main__ - Step 11630: {'lr': 0.0004947960129251206, 'samples': 2232960, 'steps': 11629, 'loss/train': 1.5114624500274658} -08/30/2021 15:13:50 - INFO - __main__ - Step 11631: {'lr': 0.0004947949357369054, 'samples': 2233152, 'steps': 11630, 'loss/train': 2.224601984024048} -08/30/2021 15:13:51 - INFO - __main__ - Step 11632: {'lr': 0.0004947938584383892, 'samples': 2233344, 'steps': 11631, 'loss/train': 1.7478086948394775} -08/30/2021 15:13:51 - INFO - __main__ - Step 11633: {'lr': 0.0004947927810295728, 'samples': 2233536, 'steps': 11632, 'loss/train': 1.528768539428711} -08/30/2021 15:13:51 - INFO - __main__ - Step 11634: {'lr': 0.0004947917035104564, 'samples': 2233728, 'steps': 11633, 'loss/train': 1.2400212287902832} -08/30/2021 15:13:52 - INFO - __main__ - Step 11635: {'lr': 0.0004947906258810407, 'samples': 2233920, 'steps': 11634, 'loss/train': 1.4715408086776733} -08/30/2021 15:13:52 - INFO - __main__ - Step 11636: {'lr': 0.0004947895481413262, 'samples': 2234112, 'steps': 11635, 'loss/train': 2.0533626079559326} -08/30/2021 15:13:53 - INFO - __main__ - Step 11637: {'lr': 0.0004947884702913133, 'samples': 2234304, 'steps': 11636, 'loss/train': 2.067622184753418} -08/30/2021 15:13:54 - INFO - __main__ - Step 11638: {'lr': 0.0004947873923310024, 'samples': 2234496, 'steps': 11637, 'loss/train': 1.6045129299163818} -08/30/2021 15:13:54 - INFO - __main__ - Step 11639: {'lr': 0.0004947863142603941, 'samples': 2234688, 'steps': 11638, 'loss/train': 1.6627546548843384} -08/30/2021 15:13:55 - INFO - __main__ - Step 11640: {'lr': 0.0004947852360794889, 'samples': 2234880, 'steps': 11639, 'loss/train': 2.2203850746154785} -08/30/2021 15:13:55 - INFO - __main__ - Step 11641: {'lr': 0.0004947841577882873, 'samples': 2235072, 'steps': 11640, 'loss/train': 1.6208118200302124} -08/30/2021 15:13:56 - INFO - __main__ - Step 11642: {'lr': 0.0004947830793867896, 'samples': 2235264, 'steps': 11641, 'loss/train': 2.3141238689422607} -08/30/2021 15:13:57 - INFO - __main__ - Step 11643: {'lr': 0.0004947820008749965, 'samples': 2235456, 'steps': 11642, 'loss/train': 1.8353108167648315} -08/30/2021 15:13:57 - INFO - __main__ - Step 11644: {'lr': 0.0004947809222529084, 'samples': 2235648, 'steps': 11643, 'loss/train': 1.8872349262237549} -08/30/2021 15:13:58 - INFO - __main__ - Step 11645: {'lr': 0.0004947798435205258, 'samples': 2235840, 'steps': 11644, 'loss/train': 0.762294352054596} -08/30/2021 15:13:58 - INFO - __main__ - Step 11646: {'lr': 0.0004947787646778491, 'samples': 2236032, 'steps': 11645, 'loss/train': 1.9617986679077148} -08/30/2021 15:13:59 - INFO - __main__ - Step 11647: {'lr': 0.0004947776857248791, 'samples': 2236224, 'steps': 11646, 'loss/train': 2.2141122817993164} -08/30/2021 15:14:00 - INFO - __main__ - Step 11648: {'lr': 0.0004947766066616157, 'samples': 2236416, 'steps': 11647, 'loss/train': 1.7058207988739014} -08/30/2021 15:14:00 - INFO - __main__ - Step 11649: {'lr': 0.00049477552748806, 'samples': 2236608, 'steps': 11648, 'loss/train': 1.2439918518066406} -08/30/2021 15:14:01 - INFO - __main__ - Step 11650: {'lr': 0.0004947744482042122, 'samples': 2236800, 'steps': 11649, 'loss/train': 1.9238418340682983} -08/30/2021 15:14:01 - INFO - __main__ - Step 11651: {'lr': 0.0004947733688100728, 'samples': 2236992, 'steps': 11650, 'loss/train': 2.2920732498168945} -08/30/2021 15:14:02 - INFO - __main__ - Step 11652: {'lr': 0.0004947722893056423, 'samples': 2237184, 'steps': 11651, 'loss/train': 1.3203538656234741} -08/30/2021 15:14:03 - INFO - __main__ - Step 11653: {'lr': 0.0004947712096909211, 'samples': 2237376, 'steps': 11652, 'loss/train': 0.6121887564659119} -08/30/2021 15:14:03 - INFO - __main__ - Step 11654: {'lr': 0.0004947701299659097, 'samples': 2237568, 'steps': 11653, 'loss/train': 1.4888660907745361} -08/30/2021 15:14:04 - INFO - __main__ - Step 11655: {'lr': 0.0004947690501306088, 'samples': 2237760, 'steps': 11654, 'loss/train': 1.632535457611084} -08/30/2021 15:14:04 - INFO - __main__ - Step 11656: {'lr': 0.0004947679701850187, 'samples': 2237952, 'steps': 11655, 'loss/train': 1.8257781267166138} -08/30/2021 15:14:06 - INFO - __main__ - Step 11657: {'lr': 0.00049476689012914, 'samples': 2238144, 'steps': 11656, 'loss/train': 0.2034396082162857} -08/30/2021 15:14:07 - INFO - __main__ - Step 11658: {'lr': 0.0004947658099629731, 'samples': 2238336, 'steps': 11657, 'loss/train': 1.9989336729049683} -08/30/2021 15:14:07 - INFO - __main__ - Step 11659: {'lr': 0.0004947647296865184, 'samples': 2238528, 'steps': 11658, 'loss/train': 1.2351003885269165} -08/30/2021 15:14:07 - INFO - __main__ - Step 11660: {'lr': 0.0004947636492997765, 'samples': 2238720, 'steps': 11659, 'loss/train': 2.5555813312530518} -08/30/2021 15:14:08 - INFO - __main__ - Step 11661: {'lr': 0.0004947625688027479, 'samples': 2238912, 'steps': 11660, 'loss/train': 1.8151615858078003} -08/30/2021 15:14:10 - INFO - __main__ - Step 11662: {'lr': 0.0004947614881954332, 'samples': 2239104, 'steps': 11661, 'loss/train': 2.078401803970337} -08/30/2021 15:14:10 - INFO - __main__ - Step 11663: {'lr': 0.0004947604074778325, 'samples': 2239296, 'steps': 11662, 'loss/train': 1.3901219367980957} -08/30/2021 15:14:11 - INFO - __main__ - Step 11664: {'lr': 0.0004947593266499468, 'samples': 2239488, 'steps': 11663, 'loss/train': 1.5410958528518677} -08/30/2021 15:14:11 - INFO - __main__ - Step 11665: {'lr': 0.0004947582457117762, 'samples': 2239680, 'steps': 11664, 'loss/train': 2.3159220218658447} -08/30/2021 15:14:11 - INFO - __main__ - Step 11666: {'lr': 0.0004947571646633214, 'samples': 2239872, 'steps': 11665, 'loss/train': 2.055731773376465} -08/30/2021 15:14:12 - INFO - __main__ - Step 11667: {'lr': 0.0004947560835045826, 'samples': 2240064, 'steps': 11666, 'loss/train': 1.9062695503234863} -08/30/2021 15:14:12 - INFO - __main__ - Step 11668: {'lr': 0.0004947550022355606, 'samples': 2240256, 'steps': 11667, 'loss/train': 1.2207061052322388} -08/30/2021 15:14:13 - INFO - __main__ - Step 11669: {'lr': 0.0004947539208562558, 'samples': 2240448, 'steps': 11668, 'loss/train': 4.36484956741333} -08/30/2021 15:14:14 - INFO - __main__ - Step 11670: {'lr': 0.0004947528393666686, 'samples': 2240640, 'steps': 11669, 'loss/train': 1.8936094045639038} -08/30/2021 15:14:14 - INFO - __main__ - Step 11671: {'lr': 0.0004947517577667996, 'samples': 2240832, 'steps': 11670, 'loss/train': 1.8972687721252441} -08/30/2021 15:14:15 - INFO - __main__ - Step 11672: {'lr': 0.0004947506760566492, 'samples': 2241024, 'steps': 11671, 'loss/train': 1.72401762008667} -08/30/2021 15:14:15 - INFO - __main__ - Step 11673: {'lr': 0.0004947495942362179, 'samples': 2241216, 'steps': 11672, 'loss/train': 1.4126760959625244} -08/30/2021 15:14:16 - INFO - __main__ - Step 11674: {'lr': 0.0004947485123055063, 'samples': 2241408, 'steps': 11673, 'loss/train': 1.4695552587509155} -08/30/2021 15:14:17 - INFO - __main__ - Step 11675: {'lr': 0.0004947474302645147, 'samples': 2241600, 'steps': 11674, 'loss/train': 0.6995078921318054} -08/30/2021 15:14:17 - INFO - __main__ - Step 11676: {'lr': 0.0004947463481132438, 'samples': 2241792, 'steps': 11675, 'loss/train': 1.9622925519943237} -08/30/2021 15:14:18 - INFO - __main__ - Step 11677: {'lr': 0.0004947452658516938, 'samples': 2241984, 'steps': 11676, 'loss/train': 2.2733633518218994} -08/30/2021 15:14:18 - INFO - __main__ - Step 11678: {'lr': 0.0004947441834798655, 'samples': 2242176, 'steps': 11677, 'loss/train': 1.803637146949768} -08/30/2021 15:14:18 - INFO - __main__ - Step 11679: {'lr': 0.0004947431009977592, 'samples': 2242368, 'steps': 11678, 'loss/train': 1.917235255241394} -08/30/2021 15:14:20 - INFO - __main__ - Step 11680: {'lr': 0.0004947420184053755, 'samples': 2242560, 'steps': 11679, 'loss/train': 2.0380828380584717} -08/30/2021 15:14:20 - INFO - __main__ - Step 11681: {'lr': 0.0004947409357027148, 'samples': 2242752, 'steps': 11680, 'loss/train': 1.8402788639068604} -08/30/2021 15:14:21 - INFO - __main__ - Step 11682: {'lr': 0.0004947398528897775, 'samples': 2242944, 'steps': 11681, 'loss/train': 1.9232163429260254} -08/30/2021 15:14:21 - INFO - __main__ - Step 11683: {'lr': 0.0004947387699665643, 'samples': 2243136, 'steps': 11682, 'loss/train': 1.3994172811508179} -08/30/2021 15:14:21 - INFO - __main__ - Step 11684: {'lr': 0.0004947376869330755, 'samples': 2243328, 'steps': 11683, 'loss/train': 1.7823961973190308} -08/30/2021 15:14:23 - INFO - __main__ - Step 11685: {'lr': 0.0004947366037893118, 'samples': 2243520, 'steps': 11684, 'loss/train': 1.9779433012008667} -08/30/2021 15:14:23 - INFO - __main__ - Step 11686: {'lr': 0.0004947355205352735, 'samples': 2243712, 'steps': 11685, 'loss/train': 1.882994294166565} -08/30/2021 15:14:24 - INFO - __main__ - Step 11687: {'lr': 0.0004947344371709611, 'samples': 2243904, 'steps': 11686, 'loss/train': 1.4967868328094482} -08/30/2021 15:14:24 - INFO - __main__ - Step 11688: {'lr': 0.0004947333536963753, 'samples': 2244096, 'steps': 11687, 'loss/train': 1.9321844577789307} -08/30/2021 15:14:24 - INFO - __main__ - Step 11689: {'lr': 0.0004947322701115163, 'samples': 2244288, 'steps': 11688, 'loss/train': 1.6577965021133423} -08/30/2021 15:14:26 - INFO - __main__ - Step 11690: {'lr': 0.0004947311864163847, 'samples': 2244480, 'steps': 11689, 'loss/train': 0.9276034235954285} -08/30/2021 15:14:27 - INFO - __main__ - Step 11691: {'lr': 0.000494730102610981, 'samples': 2244672, 'steps': 11690, 'loss/train': 1.8576034307479858} -08/30/2021 15:14:27 - INFO - __main__ - Step 11692: {'lr': 0.0004947290186953057, 'samples': 2244864, 'steps': 11691, 'loss/train': 1.895569920539856} -08/30/2021 15:14:27 - INFO - __main__ - Step 11693: {'lr': 0.0004947279346693594, 'samples': 2245056, 'steps': 11692, 'loss/train': 0.344992071390152} -08/30/2021 15:14:28 - INFO - __main__ - Step 11694: {'lr': 0.0004947268505331424, 'samples': 2245248, 'steps': 11693, 'loss/train': 1.5632882118225098} -08/30/2021 15:14:29 - INFO - __main__ - Step 11695: {'lr': 0.0004947257662866551, 'samples': 2245440, 'steps': 11694, 'loss/train': 5.149719715118408} -08/30/2021 15:14:30 - INFO - __main__ - Step 11696: {'lr': 0.0004947246819298984, 'samples': 2245632, 'steps': 11695, 'loss/train': 1.6019090414047241} -08/30/2021 15:14:30 - INFO - __main__ - Step 11697: {'lr': 0.0004947235974628723, 'samples': 2245824, 'steps': 11696, 'loss/train': 2.453235149383545} -08/30/2021 15:14:30 - INFO - __main__ - Step 11698: {'lr': 0.0004947225128855777, 'samples': 2246016, 'steps': 11697, 'loss/train': 1.7662475109100342} -08/30/2021 15:14:31 - INFO - __main__ - Step 11699: {'lr': 0.0004947214281980149, 'samples': 2246208, 'steps': 11698, 'loss/train': 2.8919992446899414} -08/30/2021 15:14:32 - INFO - __main__ - Step 11700: {'lr': 0.0004947203434001843, 'samples': 2246400, 'steps': 11699, 'loss/train': 1.7070711851119995} -08/30/2021 15:14:33 - INFO - __main__ - Step 11701: {'lr': 0.0004947192584920866, 'samples': 2246592, 'steps': 11700, 'loss/train': 1.8991669416427612} -08/30/2021 15:14:33 - INFO - __main__ - Step 11702: {'lr': 0.000494718173473722, 'samples': 2246784, 'steps': 11701, 'loss/train': 1.8828164339065552} -08/30/2021 15:14:33 - INFO - __main__ - Step 11703: {'lr': 0.0004947170883450913, 'samples': 2246976, 'steps': 11702, 'loss/train': 1.6286585330963135} -08/30/2021 15:14:34 - INFO - __main__ - Step 11704: {'lr': 0.000494716003106195, 'samples': 2247168, 'steps': 11703, 'loss/train': 1.7860980033874512} -08/30/2021 15:14:34 - INFO - __main__ - Step 11705: {'lr': 0.0004947149177570332, 'samples': 2247360, 'steps': 11704, 'loss/train': 1.9631855487823486} -08/30/2021 15:14:35 - INFO - __main__ - Step 11706: {'lr': 0.0004947138322976067, 'samples': 2247552, 'steps': 11705, 'loss/train': 1.9514325857162476} -08/30/2021 15:14:36 - INFO - __main__ - Step 11707: {'lr': 0.000494712746727916, 'samples': 2247744, 'steps': 11706, 'loss/train': 2.257874011993408} -08/30/2021 15:14:36 - INFO - __main__ - Step 11708: {'lr': 0.0004947116610479614, 'samples': 2247936, 'steps': 11707, 'loss/train': 1.631121277809143} -08/30/2021 15:14:37 - INFO - __main__ - Step 11709: {'lr': 0.0004947105752577436, 'samples': 2248128, 'steps': 11708, 'loss/train': 1.3235853910446167} -08/30/2021 15:14:37 - INFO - __main__ - Step 11710: {'lr': 0.0004947094893572629, 'samples': 2248320, 'steps': 11709, 'loss/train': 1.4561848640441895} -08/30/2021 15:14:38 - INFO - __main__ - Step 11711: {'lr': 0.00049470840334652, 'samples': 2248512, 'steps': 11710, 'loss/train': 1.8853501081466675} -08/30/2021 15:14:39 - INFO - __main__ - Step 11712: {'lr': 0.0004947073172255151, 'samples': 2248704, 'steps': 11711, 'loss/train': 1.6063880920410156} -08/30/2021 15:14:39 - INFO - __main__ - Step 11713: {'lr': 0.000494706230994249, 'samples': 2248896, 'steps': 11712, 'loss/train': 1.1136841773986816} -08/30/2021 15:14:40 - INFO - __main__ - Step 11714: {'lr': 0.000494705144652722, 'samples': 2249088, 'steps': 11713, 'loss/train': 2.184231996536255} -08/30/2021 15:14:40 - INFO - __main__ - Step 11715: {'lr': 0.0004947040582009346, 'samples': 2249280, 'steps': 11714, 'loss/train': 1.7813596725463867} -08/30/2021 15:14:42 - INFO - __main__ - Step 11716: {'lr': 0.0004947029716388875, 'samples': 2249472, 'steps': 11715, 'loss/train': 2.1649110317230225} -08/30/2021 15:14:42 - INFO - __main__ - Step 11717: {'lr': 0.0004947018849665809, 'samples': 2249664, 'steps': 11716, 'loss/train': 1.8251116275787354} -08/30/2021 15:14:43 - INFO - __main__ - Step 11718: {'lr': 0.0004947007981840153, 'samples': 2249856, 'steps': 11717, 'loss/train': 2.155564546585083} -08/30/2021 15:14:43 - INFO - __main__ - Step 11719: {'lr': 0.0004946997112911914, 'samples': 2250048, 'steps': 11718, 'loss/train': 1.1258002519607544} -08/30/2021 15:14:43 - INFO - __main__ - Step 11720: {'lr': 0.0004946986242881096, 'samples': 2250240, 'steps': 11719, 'loss/train': 1.8737475872039795} -08/30/2021 15:14:45 - INFO - __main__ - Step 11721: {'lr': 0.0004946975371747704, 'samples': 2250432, 'steps': 11720, 'loss/train': 1.9213136434555054} -08/30/2021 15:14:45 - INFO - __main__ - Step 11722: {'lr': 0.0004946964499511742, 'samples': 2250624, 'steps': 11721, 'loss/train': 1.68390691280365} -08/30/2021 15:14:46 - INFO - __main__ - Step 11723: {'lr': 0.0004946953626173216, 'samples': 2250816, 'steps': 11722, 'loss/train': 0.8829115629196167} -08/30/2021 15:14:46 - INFO - __main__ - Step 11724: {'lr': 0.0004946942751732129, 'samples': 2251008, 'steps': 11723, 'loss/train': 2.01387095451355} -08/30/2021 15:14:46 - INFO - __main__ - Step 11725: {'lr': 0.000494693187618849, 'samples': 2251200, 'steps': 11724, 'loss/train': 0.17464707791805267} -08/30/2021 15:14:48 - INFO - __main__ - Step 11726: {'lr': 0.0004946920999542299, 'samples': 2251392, 'steps': 11725, 'loss/train': 2.0406157970428467} -08/30/2021 15:14:49 - INFO - __main__ - Step 11727: {'lr': 0.0004946910121793564, 'samples': 2251584, 'steps': 11726, 'loss/train': 1.7692480087280273} -08/30/2021 15:14:49 - INFO - __main__ - Step 11728: {'lr': 0.0004946899242942289, 'samples': 2251776, 'steps': 11727, 'loss/train': 1.89846932888031} -08/30/2021 15:14:50 - INFO - __main__ - Step 11729: {'lr': 0.000494688836298848, 'samples': 2251968, 'steps': 11728, 'loss/train': 2.0183138847351074} -08/30/2021 15:14:50 - INFO - __main__ - Step 11730: {'lr': 0.0004946877481932139, 'samples': 2252160, 'steps': 11729, 'loss/train': 1.7410293817520142} -08/30/2021 15:14:50 - INFO - __main__ - Step 11731: {'lr': 0.0004946866599773274, 'samples': 2252352, 'steps': 11730, 'loss/train': 1.5501283407211304} -08/30/2021 15:14:52 - INFO - __main__ - Step 11732: {'lr': 0.0004946855716511888, 'samples': 2252544, 'steps': 11731, 'loss/train': 0.4122734069824219} -08/30/2021 15:14:53 - INFO - __main__ - Step 11733: {'lr': 0.0004946844832147987, 'samples': 2252736, 'steps': 11732, 'loss/train': 0.14123785495758057} -08/30/2021 15:14:53 - INFO - __main__ - Step 11734: {'lr': 0.0004946833946681575, 'samples': 2252928, 'steps': 11733, 'loss/train': 1.3744008541107178} -08/30/2021 15:14:53 - INFO - __main__ - Step 11735: {'lr': 0.0004946823060112658, 'samples': 2253120, 'steps': 11734, 'loss/train': 1.4184517860412598} -08/30/2021 15:14:54 - INFO - __main__ - Step 11736: {'lr': 0.000494681217244124, 'samples': 2253312, 'steps': 11735, 'loss/train': 1.8464114665985107} -08/30/2021 15:14:54 - INFO - __main__ - Step 11737: {'lr': 0.0004946801283667326, 'samples': 2253504, 'steps': 11736, 'loss/train': 1.6429179906845093} -08/30/2021 15:14:56 - INFO - __main__ - Step 11738: {'lr': 0.0004946790393790921, 'samples': 2253696, 'steps': 11737, 'loss/train': 1.7506275177001953} -08/30/2021 15:14:56 - INFO - __main__ - Step 11739: {'lr': 0.0004946779502812031, 'samples': 2253888, 'steps': 11738, 'loss/train': 2.6980814933776855} -08/30/2021 15:14:57 - INFO - __main__ - Step 11740: {'lr': 0.0004946768610730659, 'samples': 2254080, 'steps': 11739, 'loss/train': 1.2672038078308105} -08/30/2021 15:14:57 - INFO - __main__ - Step 11741: {'lr': 0.0004946757717546812, 'samples': 2254272, 'steps': 11740, 'loss/train': 1.8932408094406128} -08/30/2021 15:14:57 - INFO - __main__ - Step 11742: {'lr': 0.0004946746823260491, 'samples': 2254464, 'steps': 11741, 'loss/train': 0.5532539486885071} -08/30/2021 15:14:58 - INFO - __main__ - Step 11743: {'lr': 0.0004946735927871706, 'samples': 2254656, 'steps': 11742, 'loss/train': 1.672285795211792} -08/30/2021 15:14:59 - INFO - __main__ - Step 11744: {'lr': 0.0004946725031380459, 'samples': 2254848, 'steps': 11743, 'loss/train': 1.7819613218307495} -08/30/2021 15:14:59 - INFO - __main__ - Step 11745: {'lr': 0.0004946714133786756, 'samples': 2255040, 'steps': 11744, 'loss/train': 1.6214816570281982} -08/30/2021 15:15:00 - INFO - __main__ - Step 11746: {'lr': 0.00049467032350906, 'samples': 2255232, 'steps': 11745, 'loss/train': 2.1793644428253174} -08/30/2021 15:15:00 - INFO - __main__ - Step 11747: {'lr': 0.0004946692335291999, 'samples': 2255424, 'steps': 11746, 'loss/train': 2.0590147972106934} -08/30/2021 15:15:00 - INFO - __main__ - Step 11748: {'lr': 0.0004946681434390955, 'samples': 2255616, 'steps': 11747, 'loss/train': 2.3604531288146973} -08/30/2021 15:15:02 - INFO - __main__ - Step 11749: {'lr': 0.0004946670532387474, 'samples': 2255808, 'steps': 11748, 'loss/train': 2.0560808181762695} -08/30/2021 15:15:02 - INFO - __main__ - Step 11750: {'lr': 0.0004946659629281561, 'samples': 2256000, 'steps': 11749, 'loss/train': 1.992100477218628} -08/30/2021 15:15:03 - INFO - __main__ - Step 11751: {'lr': 0.0004946648725073222, 'samples': 2256192, 'steps': 11750, 'loss/train': 1.704413890838623} -08/30/2021 15:15:03 - INFO - __main__ - Step 11752: {'lr': 0.0004946637819762459, 'samples': 2256384, 'steps': 11751, 'loss/train': 1.4175366163253784} -08/30/2021 15:15:03 - INFO - __main__ - Step 11753: {'lr': 0.000494662691334928, 'samples': 2256576, 'steps': 11752, 'loss/train': 1.1848088502883911} -08/30/2021 15:15:05 - INFO - __main__ - Step 11754: {'lr': 0.0004946616005833689, 'samples': 2256768, 'steps': 11753, 'loss/train': 1.4894793033599854} -08/30/2021 15:15:05 - INFO - __main__ - Step 11755: {'lr': 0.0004946605097215691, 'samples': 2256960, 'steps': 11754, 'loss/train': 1.7255768775939941} -08/30/2021 15:15:06 - INFO - __main__ - Step 11756: {'lr': 0.0004946594187495289, 'samples': 2257152, 'steps': 11755, 'loss/train': 1.7005902528762817} -08/30/2021 15:15:06 - INFO - __main__ - Step 11757: {'lr': 0.0004946583276672489, 'samples': 2257344, 'steps': 11756, 'loss/train': 1.6552094221115112} -08/30/2021 15:15:06 - INFO - __main__ - Step 11758: {'lr': 0.0004946572364747298, 'samples': 2257536, 'steps': 11757, 'loss/train': 2.274648666381836} -08/30/2021 15:15:08 - INFO - __main__ - Step 11759: {'lr': 0.0004946561451719719, 'samples': 2257728, 'steps': 11758, 'loss/train': 2.040285587310791} -08/30/2021 15:15:09 - INFO - __main__ - Step 11760: {'lr': 0.0004946550537589757, 'samples': 2257920, 'steps': 11759, 'loss/train': 2.1042490005493164} -08/30/2021 15:15:09 - INFO - __main__ - Step 11761: {'lr': 0.0004946539622357417, 'samples': 2258112, 'steps': 11760, 'loss/train': 1.696751356124878} -08/30/2021 15:15:10 - INFO - __main__ - Step 11762: {'lr': 0.0004946528706022703, 'samples': 2258304, 'steps': 11761, 'loss/train': 1.9341208934783936} -08/30/2021 15:15:10 - INFO - __main__ - Step 11763: {'lr': 0.0004946517788585622, 'samples': 2258496, 'steps': 11762, 'loss/train': 2.3381707668304443} -08/30/2021 15:15:11 - INFO - __main__ - Step 11764: {'lr': 0.0004946506870046178, 'samples': 2258688, 'steps': 11763, 'loss/train': 2.199601650238037} -08/30/2021 15:15:12 - INFO - __main__ - Step 11765: {'lr': 0.0004946495950404375, 'samples': 2258880, 'steps': 11764, 'loss/train': 1.7529102563858032} -08/30/2021 15:15:12 - INFO - __main__ - Step 11766: {'lr': 0.0004946485029660219, 'samples': 2259072, 'steps': 11765, 'loss/train': 1.9411066770553589} -08/30/2021 15:15:13 - INFO - __main__ - Step 11767: {'lr': 0.0004946474107813715, 'samples': 2259264, 'steps': 11766, 'loss/train': 1.7289375066757202} -08/30/2021 15:15:13 - INFO - __main__ - Step 11768: {'lr': 0.0004946463184864867, 'samples': 2259456, 'steps': 11767, 'loss/train': 1.5154902935028076} -08/30/2021 15:15:15 - INFO - __main__ - Step 11769: {'lr': 0.000494645226081368, 'samples': 2259648, 'steps': 11768, 'loss/train': 1.7412127256393433} -08/30/2021 15:15:15 - INFO - __main__ - Step 11770: {'lr': 0.000494644133566016, 'samples': 2259840, 'steps': 11769, 'loss/train': 1.731998324394226} -08/30/2021 15:15:15 - INFO - __main__ - Step 11771: {'lr': 0.0004946430409404311, 'samples': 2260032, 'steps': 11770, 'loss/train': 0.18437843024730682} -08/30/2021 15:15:16 - INFO - __main__ - Step 11772: {'lr': 0.0004946419482046139, 'samples': 2260224, 'steps': 11771, 'loss/train': 2.0941176414489746} -08/30/2021 15:15:16 - INFO - __main__ - Step 11773: {'lr': 0.0004946408553585648, 'samples': 2260416, 'steps': 11772, 'loss/train': 2.2236886024475098} -08/30/2021 15:15:18 - INFO - __main__ - Step 11774: {'lr': 0.0004946397624022843, 'samples': 2260608, 'steps': 11773, 'loss/train': 2.299236536026001} -08/30/2021 15:15:18 - INFO - __main__ - Step 11775: {'lr': 0.0004946386693357728, 'samples': 2260800, 'steps': 11774, 'loss/train': 1.7870864868164062} -08/30/2021 15:15:18 - INFO - __main__ - Step 11776: {'lr': 0.0004946375761590309, 'samples': 2260992, 'steps': 11775, 'loss/train': 1.6457983255386353} -08/30/2021 15:15:19 - INFO - __main__ - Step 11777: {'lr': 0.0004946364828720592, 'samples': 2261184, 'steps': 11776, 'loss/train': 1.8843894004821777} -08/30/2021 15:15:19 - INFO - __main__ - Step 11778: {'lr': 0.000494635389474858, 'samples': 2261376, 'steps': 11777, 'loss/train': 2.5461606979370117} -08/30/2021 15:15:21 - INFO - __main__ - Step 11779: {'lr': 0.0004946342959674278, 'samples': 2261568, 'steps': 11778, 'loss/train': 1.298263430595398} -08/30/2021 15:15:21 - INFO - __main__ - Step 11780: {'lr': 0.0004946332023497693, 'samples': 2261760, 'steps': 11779, 'loss/train': 1.4017049074172974} -08/30/2021 15:15:21 - INFO - __main__ - Step 11781: {'lr': 0.0004946321086218828, 'samples': 2261952, 'steps': 11780, 'loss/train': 3.3718361854553223} -08/30/2021 15:15:22 - INFO - __main__ - Step 11782: {'lr': 0.0004946310147837689, 'samples': 2262144, 'steps': 11781, 'loss/train': 1.831998348236084} -08/30/2021 15:15:22 - INFO - __main__ - Step 11783: {'lr': 0.0004946299208354279, 'samples': 2262336, 'steps': 11782, 'loss/train': 1.3627289533615112} -08/30/2021 15:15:24 - INFO - __main__ - Step 11784: {'lr': 0.0004946288267768605, 'samples': 2262528, 'steps': 11783, 'loss/train': 2.2675211429595947} -08/30/2021 15:15:24 - INFO - __main__ - Step 11785: {'lr': 0.0004946277326080672, 'samples': 2262720, 'steps': 11784, 'loss/train': 1.698428988456726} -08/30/2021 15:15:24 - INFO - __main__ - Step 11786: {'lr': 0.0004946266383290483, 'samples': 2262912, 'steps': 11785, 'loss/train': 2.13415265083313} -08/30/2021 15:15:25 - INFO - __main__ - Step 11787: {'lr': 0.0004946255439398045, 'samples': 2263104, 'steps': 11786, 'loss/train': 1.7996593713760376} -08/30/2021 15:15:25 - INFO - __main__ - Step 11788: {'lr': 0.0004946244494403361, 'samples': 2263296, 'steps': 11787, 'loss/train': 1.7397469282150269} -08/30/2021 15:15:26 - INFO - __main__ - Step 11789: {'lr': 0.0004946233548306438, 'samples': 2263488, 'steps': 11788, 'loss/train': 1.4018193483352661} -08/30/2021 15:15:27 - INFO - __main__ - Step 11790: {'lr': 0.000494622260110728, 'samples': 2263680, 'steps': 11789, 'loss/train': 1.829760193824768} -08/30/2021 15:15:28 - INFO - __main__ - Step 11791: {'lr': 0.0004946211652805891, 'samples': 2263872, 'steps': 11790, 'loss/train': 1.2616387605667114} -08/30/2021 15:15:28 - INFO - __main__ - Step 11792: {'lr': 0.0004946200703402278, 'samples': 2264064, 'steps': 11791, 'loss/train': 2.205960750579834} -08/30/2021 15:15:28 - INFO - __main__ - Step 11793: {'lr': 0.0004946189752896443, 'samples': 2264256, 'steps': 11792, 'loss/train': 2.12526798248291} -08/30/2021 15:15:29 - INFO - __main__ - Step 11794: {'lr': 0.0004946178801288394, 'samples': 2264448, 'steps': 11793, 'loss/train': 1.6127997636795044} -08/30/2021 15:15:30 - INFO - __main__ - Step 11795: {'lr': 0.0004946167848578134, 'samples': 2264640, 'steps': 11794, 'loss/train': 1.4849432706832886} -08/30/2021 15:15:31 - INFO - __main__ - Step 11796: {'lr': 0.0004946156894765669, 'samples': 2264832, 'steps': 11795, 'loss/train': 2.4573872089385986} -08/30/2021 15:15:31 - INFO - __main__ - Step 11797: {'lr': 0.0004946145939851004, 'samples': 2265024, 'steps': 11796, 'loss/train': 1.4694702625274658} -08/30/2021 15:15:32 - INFO - __main__ - Step 11798: {'lr': 0.0004946134983834142, 'samples': 2265216, 'steps': 11797, 'loss/train': 0.4310687482357025} -08/30/2021 15:15:32 - INFO - __main__ - Step 11799: {'lr': 0.0004946124026715089, 'samples': 2265408, 'steps': 11798, 'loss/train': 1.533728837966919} -08/30/2021 15:15:34 - INFO - __main__ - Step 11800: {'lr': 0.0004946113068493851, 'samples': 2265600, 'steps': 11799, 'loss/train': 1.7493268251419067} -08/30/2021 15:15:34 - INFO - __main__ - Step 11801: {'lr': 0.0004946102109170433, 'samples': 2265792, 'steps': 11800, 'loss/train': 1.5623968839645386} -08/30/2021 15:15:35 - INFO - __main__ - Step 11802: {'lr': 0.0004946091148744838, 'samples': 2265984, 'steps': 11801, 'loss/train': 1.8144017457962036} -08/30/2021 15:15:35 - INFO - __main__ - Step 11803: {'lr': 0.0004946080187217072, 'samples': 2266176, 'steps': 11802, 'loss/train': 0.19895613193511963} -08/30/2021 15:15:35 - INFO - __main__ - Step 11804: {'lr': 0.0004946069224587141, 'samples': 2266368, 'steps': 11803, 'loss/train': 1.3789323568344116} -08/30/2021 15:15:37 - INFO - __main__ - Step 11805: {'lr': 0.0004946058260855049, 'samples': 2266560, 'steps': 11804, 'loss/train': 1.8440556526184082} -08/30/2021 15:15:38 - INFO - __main__ - Step 11806: {'lr': 0.00049460472960208, 'samples': 2266752, 'steps': 11805, 'loss/train': 2.2906994819641113} -08/30/2021 15:15:38 - INFO - __main__ - Step 11807: {'lr': 0.00049460363300844, 'samples': 2266944, 'steps': 11806, 'loss/train': 1.9607677459716797} -08/30/2021 15:15:38 - INFO - __main__ - Step 11808: {'lr': 0.0004946025363045854, 'samples': 2267136, 'steps': 11807, 'loss/train': 2.244109630584717} -08/30/2021 15:15:39 - INFO - __main__ - Step 11809: {'lr': 0.0004946014394905167, 'samples': 2267328, 'steps': 11808, 'loss/train': 1.970001220703125} -08/30/2021 15:15:39 - INFO - __main__ - Step 11810: {'lr': 0.0004946003425662343, 'samples': 2267520, 'steps': 11809, 'loss/train': 0.0902596190571785} -08/30/2021 15:15:39 - INFO - __main__ - Step 11811: {'lr': 0.0004945992455317389, 'samples': 2267712, 'steps': 11810, 'loss/train': 0.5853404998779297} -08/30/2021 15:15:41 - INFO - __main__ - Step 11812: {'lr': 0.0004945981483870307, 'samples': 2267904, 'steps': 11811, 'loss/train': 1.6543635129928589} -08/30/2021 15:15:41 - INFO - __main__ - Step 11813: {'lr': 0.0004945970511321104, 'samples': 2268096, 'steps': 11812, 'loss/train': 1.7412084341049194} -08/30/2021 15:15:42 - INFO - __main__ - Step 11814: {'lr': 0.0004945959537669784, 'samples': 2268288, 'steps': 11813, 'loss/train': 1.5137156248092651} -08/30/2021 15:15:42 - INFO - __main__ - Step 11815: {'lr': 0.0004945948562916353, 'samples': 2268480, 'steps': 11814, 'loss/train': 2.1057684421539307} -08/30/2021 15:15:43 - INFO - __main__ - Step 11816: {'lr': 0.0004945937587060815, 'samples': 2268672, 'steps': 11815, 'loss/train': 1.7500317096710205} -08/30/2021 15:15:45 - INFO - __main__ - Step 11817: {'lr': 0.0004945926610103175, 'samples': 2268864, 'steps': 11816, 'loss/train': 2.100980281829834} -08/30/2021 15:15:45 - INFO - __main__ - Step 11818: {'lr': 0.0004945915632043439, 'samples': 2269056, 'steps': 11817, 'loss/train': 1.5017176866531372} -08/30/2021 15:15:46 - INFO - __main__ - Step 11819: {'lr': 0.0004945904652881611, 'samples': 2269248, 'steps': 11818, 'loss/train': 1.8831287622451782} -08/30/2021 15:15:46 - INFO - __main__ - Step 11820: {'lr': 0.0004945893672617695, 'samples': 2269440, 'steps': 11819, 'loss/train': 2.4403114318847656} -08/30/2021 15:15:46 - INFO - __main__ - Step 11821: {'lr': 0.0004945882691251699, 'samples': 2269632, 'steps': 11820, 'loss/train': 2.021946668624878} -08/30/2021 15:15:48 - INFO - __main__ - Step 11822: {'lr': 0.0004945871708783625, 'samples': 2269824, 'steps': 11821, 'loss/train': 2.088178873062134} -08/30/2021 15:15:48 - INFO - __main__ - Step 11823: {'lr': 0.0004945860725213477, 'samples': 2270016, 'steps': 11822, 'loss/train': 1.171350121498108} -08/30/2021 15:15:49 - INFO - __main__ - Step 11824: {'lr': 0.0004945849740541265, 'samples': 2270208, 'steps': 11823, 'loss/train': 1.861392855644226} -08/30/2021 15:15:49 - INFO - __main__ - Step 11825: {'lr': 0.000494583875476699, 'samples': 2270400, 'steps': 11824, 'loss/train': 2.1119577884674072} -08/30/2021 15:15:49 - INFO - __main__ - Step 11826: {'lr': 0.0004945827767890657, 'samples': 2270592, 'steps': 11825, 'loss/train': 1.9140068292617798} -08/30/2021 15:15:50 - INFO - __main__ - Step 11827: {'lr': 0.0004945816779912272, 'samples': 2270784, 'steps': 11826, 'loss/train': 1.7558281421661377} -08/30/2021 15:15:51 - INFO - __main__ - Step 11828: {'lr': 0.000494580579083184, 'samples': 2270976, 'steps': 11827, 'loss/train': 1.6848113536834717} -08/30/2021 15:15:51 - INFO - __main__ - Step 11829: {'lr': 0.0004945794800649366, 'samples': 2271168, 'steps': 11828, 'loss/train': 1.7365353107452393} -08/30/2021 15:15:52 - INFO - __main__ - Step 11830: {'lr': 0.0004945783809364853, 'samples': 2271360, 'steps': 11829, 'loss/train': 1.7429718971252441} -08/30/2021 15:15:52 - INFO - __main__ - Step 11831: {'lr': 0.0004945772816978309, 'samples': 2271552, 'steps': 11830, 'loss/train': 2.4146013259887695} -08/30/2021 15:15:52 - INFO - __main__ - Step 11832: {'lr': 0.0004945761823489737, 'samples': 2271744, 'steps': 11831, 'loss/train': 1.812188982963562} -08/30/2021 15:15:54 - INFO - __main__ - Step 11833: {'lr': 0.0004945750828899144, 'samples': 2271936, 'steps': 11832, 'loss/train': 1.648162841796875} -08/30/2021 15:15:54 - INFO - __main__ - Step 11834: {'lr': 0.0004945739833206531, 'samples': 2272128, 'steps': 11833, 'loss/train': 2.069950580596924} -08/30/2021 15:15:55 - INFO - __main__ - Step 11835: {'lr': 0.0004945728836411907, 'samples': 2272320, 'steps': 11834, 'loss/train': 2.2438645362854004} -08/30/2021 15:15:55 - INFO - __main__ - Step 11836: {'lr': 0.0004945717838515275, 'samples': 2272512, 'steps': 11835, 'loss/train': 1.9432957172393799} -08/30/2021 15:15:55 - INFO - __main__ - Step 11837: {'lr': 0.0004945706839516639, 'samples': 2272704, 'steps': 11836, 'loss/train': 1.6880847215652466} -08/30/2021 15:15:57 - INFO - __main__ - Step 11838: {'lr': 0.0004945695839416006, 'samples': 2272896, 'steps': 11837, 'loss/train': 1.4829120635986328} -08/30/2021 15:15:57 - INFO - __main__ - Step 11839: {'lr': 0.0004945684838213382, 'samples': 2273088, 'steps': 11838, 'loss/train': 2.03684139251709} -08/30/2021 15:15:58 - INFO - __main__ - Step 11840: {'lr': 0.0004945673835908767, 'samples': 2273280, 'steps': 11839, 'loss/train': 1.7222049236297607} -08/30/2021 15:15:58 - INFO - __main__ - Step 11841: {'lr': 0.0004945662832502171, 'samples': 2273472, 'steps': 11840, 'loss/train': 1.6915655136108398} -08/30/2021 15:15:58 - INFO - __main__ - Step 11842: {'lr': 0.0004945651827993597, 'samples': 2273664, 'steps': 11841, 'loss/train': 2.2450461387634277} -08/30/2021 15:16:00 - INFO - __main__ - Step 11843: {'lr': 0.000494564082238305, 'samples': 2273856, 'steps': 11842, 'loss/train': 1.5833274126052856} -08/30/2021 15:16:00 - INFO - __main__ - Step 11844: {'lr': 0.0004945629815670535, 'samples': 2274048, 'steps': 11843, 'loss/train': 1.8316855430603027} -08/30/2021 15:16:01 - INFO - __main__ - Step 11845: {'lr': 0.0004945618807856056, 'samples': 2274240, 'steps': 11844, 'loss/train': 1.6846545934677124} -08/30/2021 15:16:01 - INFO - __main__ - Step 11846: {'lr': 0.000494560779893962, 'samples': 2274432, 'steps': 11845, 'loss/train': 2.065723180770874} -08/30/2021 15:16:01 - INFO - __main__ - Step 11847: {'lr': 0.0004945596788921231, 'samples': 2274624, 'steps': 11846, 'loss/train': 1.5155576467514038} -08/30/2021 15:16:03 - INFO - __main__ - Step 11848: {'lr': 0.0004945585777800893, 'samples': 2274816, 'steps': 11847, 'loss/train': 2.3535053730010986} -08/30/2021 15:16:04 - INFO - __main__ - Step 11849: {'lr': 0.0004945574765578612, 'samples': 2275008, 'steps': 11848, 'loss/train': 1.3265169858932495} -08/30/2021 15:16:04 - INFO - __main__ - Step 11850: {'lr': 0.0004945563752254393, 'samples': 2275200, 'steps': 11849, 'loss/train': 0.10267017036676407} -08/30/2021 15:16:04 - INFO - __main__ - Step 11851: {'lr': 0.000494555273782824, 'samples': 2275392, 'steps': 11850, 'loss/train': 1.8187745809555054} -08/30/2021 15:16:05 - INFO - __main__ - Step 11852: {'lr': 0.000494554172230016, 'samples': 2275584, 'steps': 11851, 'loss/train': 1.3680561780929565} -08/30/2021 15:16:05 - INFO - __main__ - Step 11853: {'lr': 0.0004945530705670156, 'samples': 2275776, 'steps': 11852, 'loss/train': 2.0712554454803467} -08/30/2021 15:16:07 - INFO - __main__ - Step 11854: {'lr': 0.0004945519687938234, 'samples': 2275968, 'steps': 11853, 'loss/train': 0.8978202939033508} -08/30/2021 15:16:08 - INFO - __main__ - Step 11855: {'lr': 0.0004945508669104397, 'samples': 2276160, 'steps': 11854, 'loss/train': 1.6371419429779053} -08/30/2021 15:16:08 - INFO - __main__ - Step 11856: {'lr': 0.0004945497649168654, 'samples': 2276352, 'steps': 11855, 'loss/train': 1.8161147832870483} -08/30/2021 15:16:08 - INFO - __main__ - Step 11857: {'lr': 0.0004945486628131006, 'samples': 2276544, 'steps': 11856, 'loss/train': 1.4968148469924927} -08/30/2021 15:16:09 - INFO - __main__ - Step 11858: {'lr': 0.0004945475605991459, 'samples': 2276736, 'steps': 11857, 'loss/train': 1.6238117218017578} -08/30/2021 15:16:10 - INFO - __main__ - Step 11859: {'lr': 0.0004945464582750019, 'samples': 2276928, 'steps': 11858, 'loss/train': 1.0893546342849731} -08/30/2021 15:16:11 - INFO - __main__ - Step 11860: {'lr': 0.000494545355840669, 'samples': 2277120, 'steps': 11859, 'loss/train': 0.9706990122795105} -08/30/2021 15:16:11 - INFO - __main__ - Step 11861: {'lr': 0.0004945442532961478, 'samples': 2277312, 'steps': 11860, 'loss/train': 1.086559534072876} -08/30/2021 15:16:11 - INFO - __main__ - Step 11862: {'lr': 0.0004945431506414386, 'samples': 2277504, 'steps': 11861, 'loss/train': 1.9632014036178589} -08/30/2021 15:16:12 - INFO - __main__ - Step 11863: {'lr': 0.0004945420478765422, 'samples': 2277696, 'steps': 11862, 'loss/train': 1.5190651416778564} -08/30/2021 15:16:12 - INFO - __main__ - Step 11864: {'lr': 0.0004945409450014588, 'samples': 2277888, 'steps': 11863, 'loss/train': 0.6566113829612732} -08/30/2021 15:16:14 - INFO - __main__ - Step 11865: {'lr': 0.0004945398420161892, 'samples': 2278080, 'steps': 11864, 'loss/train': 1.752700924873352} -08/30/2021 15:16:15 - INFO - __main__ - Step 11866: {'lr': 0.0004945387389207335, 'samples': 2278272, 'steps': 11865, 'loss/train': 1.5283820629119873} -08/30/2021 15:16:15 - INFO - __main__ - Step 11867: {'lr': 0.0004945376357150926, 'samples': 2278464, 'steps': 11866, 'loss/train': 2.3288278579711914} -08/30/2021 15:16:15 - INFO - __main__ - Step 11868: {'lr': 0.0004945365323992668, 'samples': 2278656, 'steps': 11867, 'loss/train': 1.4412542581558228} -08/30/2021 15:16:16 - INFO - __main__ - Step 11869: {'lr': 0.0004945354289732565, 'samples': 2278848, 'steps': 11868, 'loss/train': 1.701159119606018} -08/30/2021 15:16:17 - INFO - __main__ - Step 11870: {'lr': 0.0004945343254370623, 'samples': 2279040, 'steps': 11869, 'loss/train': 2.2766289710998535} -08/30/2021 15:16:18 - INFO - __main__ - Step 11871: {'lr': 0.0004945332217906848, 'samples': 2279232, 'steps': 11870, 'loss/train': 1.0289002656936646} -08/30/2021 15:16:19 - INFO - __main__ - Step 11872: {'lr': 0.0004945321180341244, 'samples': 2279424, 'steps': 11871, 'loss/train': 1.8550326824188232} -08/30/2021 15:16:19 - INFO - __main__ - Step 11873: {'lr': 0.0004945310141673816, 'samples': 2279616, 'steps': 11872, 'loss/train': 1.3300050497055054} -08/30/2021 15:16:19 - INFO - __main__ - Step 11874: {'lr': 0.0004945299101904568, 'samples': 2279808, 'steps': 11873, 'loss/train': 1.3555680513381958} -08/30/2021 15:16:21 - INFO - __main__ - Step 11875: {'lr': 0.0004945288061033507, 'samples': 2280000, 'steps': 11874, 'loss/train': 1.2853432893753052} -08/30/2021 15:16:21 - INFO - __main__ - Step 11876: {'lr': 0.0004945277019060637, 'samples': 2280192, 'steps': 11875, 'loss/train': 1.9826915264129639} -08/30/2021 15:16:22 - INFO - __main__ - Step 11877: {'lr': 0.0004945265975985962, 'samples': 2280384, 'steps': 11876, 'loss/train': 1.8472506999969482} -08/30/2021 15:16:22 - INFO - __main__ - Step 11878: {'lr': 0.0004945254931809489, 'samples': 2280576, 'steps': 11877, 'loss/train': 1.9365565776824951} -08/30/2021 15:16:22 - INFO - __main__ - Step 11879: {'lr': 0.000494524388653122, 'samples': 2280768, 'steps': 11878, 'loss/train': 1.9993367195129395} -08/30/2021 15:16:24 - INFO - __main__ - Step 11880: {'lr': 0.0004945232840151164, 'samples': 2280960, 'steps': 11879, 'loss/train': 2.090670347213745} -08/30/2021 15:16:24 - INFO - __main__ - Step 11881: {'lr': 0.0004945221792669322, 'samples': 2281152, 'steps': 11880, 'loss/train': 1.2670029401779175} -08/30/2021 15:16:25 - INFO - __main__ - Step 11882: {'lr': 0.0004945210744085702, 'samples': 2281344, 'steps': 11881, 'loss/train': 1.4060724973678589} -08/30/2021 15:16:25 - INFO - __main__ - Step 11883: {'lr': 0.0004945199694400308, 'samples': 2281536, 'steps': 11882, 'loss/train': 1.7131822109222412} -08/30/2021 15:16:25 - INFO - __main__ - Step 11884: {'lr': 0.0004945188643613144, 'samples': 2281728, 'steps': 11883, 'loss/train': 2.860826253890991} -08/30/2021 15:16:26 - INFO - __main__ - Step 11885: {'lr': 0.0004945177591724216, 'samples': 2281920, 'steps': 11884, 'loss/train': 2.138678789138794} -08/30/2021 15:16:28 - INFO - __main__ - Step 11886: {'lr': 0.0004945166538733529, 'samples': 2282112, 'steps': 11885, 'loss/train': 2.2239696979522705} -08/30/2021 15:16:28 - INFO - __main__ - Step 11887: {'lr': 0.0004945155484641087, 'samples': 2282304, 'steps': 11886, 'loss/train': 1.3135066032409668} -08/30/2021 15:16:28 - INFO - __main__ - Step 11888: {'lr': 0.0004945144429446897, 'samples': 2282496, 'steps': 11887, 'loss/train': 1.7199856042861938} -08/30/2021 15:16:29 - INFO - __main__ - Step 11889: {'lr': 0.000494513337315096, 'samples': 2282688, 'steps': 11888, 'loss/train': 2.244947671890259} -08/30/2021 15:16:29 - INFO - __main__ - Step 11890: {'lr': 0.0004945122315753286, 'samples': 2282880, 'steps': 11889, 'loss/train': 0.1160358339548111} -08/30/2021 15:16:29 - INFO - __main__ - Step 11891: {'lr': 0.0004945111257253877, 'samples': 2283072, 'steps': 11890, 'loss/train': 1.718772292137146} -08/30/2021 15:16:31 - INFO - __main__ - Step 11892: {'lr': 0.0004945100197652738, 'samples': 2283264, 'steps': 11891, 'loss/train': 1.8626842498779297} -08/30/2021 15:16:32 - INFO - __main__ - Step 11893: {'lr': 0.0004945089136949876, 'samples': 2283456, 'steps': 11892, 'loss/train': 1.7901222705841064} -08/30/2021 15:16:32 - INFO - __main__ - Step 11894: {'lr': 0.0004945078075145292, 'samples': 2283648, 'steps': 11893, 'loss/train': 1.7418882846832275} -08/30/2021 15:16:32 - INFO - __main__ - Step 11895: {'lr': 0.0004945067012238996, 'samples': 2283840, 'steps': 11894, 'loss/train': 1.9788968563079834} -08/30/2021 15:16:33 - INFO - __main__ - Step 11896: {'lr': 0.000494505594823099, 'samples': 2284032, 'steps': 11895, 'loss/train': 2.1579482555389404} -08/30/2021 15:16:34 - INFO - __main__ - Step 11897: {'lr': 0.0004945044883121279, 'samples': 2284224, 'steps': 11896, 'loss/train': 2.1536645889282227} -08/30/2021 15:16:35 - INFO - __main__ - Step 11898: {'lr': 0.0004945033816909868, 'samples': 2284416, 'steps': 11897, 'loss/train': 1.8212894201278687} -08/30/2021 15:16:35 - INFO - __main__ - Step 11899: {'lr': 0.0004945022749596764, 'samples': 2284608, 'steps': 11898, 'loss/train': 1.8418039083480835} -08/30/2021 15:16:35 - INFO - __main__ - Step 11900: {'lr': 0.000494501168118197, 'samples': 2284800, 'steps': 11899, 'loss/train': 2.2023589611053467} -08/30/2021 15:16:36 - INFO - __main__ - Step 11901: {'lr': 0.0004945000611665491, 'samples': 2284992, 'steps': 11900, 'loss/train': 0.8514636754989624} -08/30/2021 15:16:37 - INFO - __main__ - Step 11902: {'lr': 0.0004944989541047333, 'samples': 2285184, 'steps': 11901, 'loss/train': 1.9046348333358765} -08/30/2021 15:16:38 - INFO - __main__ - Step 11903: {'lr': 0.0004944978469327499, 'samples': 2285376, 'steps': 11902, 'loss/train': 2.3624885082244873} -08/30/2021 15:16:38 - INFO - __main__ - Step 11904: {'lr': 0.0004944967396505998, 'samples': 2285568, 'steps': 11903, 'loss/train': 2.0583996772766113} -08/30/2021 15:16:38 - INFO - __main__ - Step 11905: {'lr': 0.000494495632258283, 'samples': 2285760, 'steps': 11904, 'loss/train': 1.5278751850128174} -08/30/2021 15:16:39 - INFO - __main__ - Step 11906: {'lr': 0.0004944945247558004, 'samples': 2285952, 'steps': 11905, 'loss/train': 1.9481247663497925} -08/30/2021 15:16:40 - INFO - __main__ - Step 11907: {'lr': 0.0004944934171431522, 'samples': 2286144, 'steps': 11906, 'loss/train': 2.091527223587036} -08/30/2021 15:16:41 - INFO - __main__ - Step 11908: {'lr': 0.0004944923094203391, 'samples': 2286336, 'steps': 11907, 'loss/train': 1.9200574159622192} -08/30/2021 15:16:41 - INFO - __main__ - Step 11909: {'lr': 0.0004944912015873616, 'samples': 2286528, 'steps': 11908, 'loss/train': 1.7044814825057983} -08/30/2021 15:16:41 - INFO - __main__ - Step 11910: {'lr': 0.0004944900936442201, 'samples': 2286720, 'steps': 11909, 'loss/train': 1.9967432022094727} -08/30/2021 15:16:42 - INFO - __main__ - Step 11911: {'lr': 0.000494488985590915, 'samples': 2286912, 'steps': 11910, 'loss/train': 1.1475468873977661} -08/30/2021 15:16:43 - INFO - __main__ - Step 11912: {'lr': 0.0004944878774274472, 'samples': 2287104, 'steps': 11911, 'loss/train': 2.161979913711548} -08/30/2021 15:16:44 - INFO - __main__ - Step 11913: {'lr': 0.0004944867691538167, 'samples': 2287296, 'steps': 11912, 'loss/train': 1.6226567029953003} -08/30/2021 15:16:44 - INFO - __main__ - Step 11914: {'lr': 0.0004944856607700243, 'samples': 2287488, 'steps': 11913, 'loss/train': 1.9641687870025635} -08/30/2021 15:16:44 - INFO - __main__ - Step 11915: {'lr': 0.0004944845522760706, 'samples': 2287680, 'steps': 11914, 'loss/train': 1.3493125438690186} -08/30/2021 15:16:45 - INFO - __main__ - Step 11916: {'lr': 0.0004944834436719557, 'samples': 2287872, 'steps': 11915, 'loss/train': 1.9325021505355835} -08/30/2021 15:16:47 - INFO - __main__ - Step 11917: {'lr': 0.0004944823349576805, 'samples': 2288064, 'steps': 11916, 'loss/train': 1.6535131931304932} -08/30/2021 15:16:47 - INFO - __main__ - Step 11918: {'lr': 0.0004944812261332452, 'samples': 2288256, 'steps': 11917, 'loss/train': 1.7490426301956177} -08/30/2021 15:16:48 - INFO - __main__ - Step 11919: {'lr': 0.0004944801171986505, 'samples': 2288448, 'steps': 11918, 'loss/train': 2.1977345943450928} -08/30/2021 15:16:48 - INFO - __main__ - Step 11920: {'lr': 0.0004944790081538969, 'samples': 2288640, 'steps': 11919, 'loss/train': 1.394598364830017} -08/30/2021 15:16:48 - INFO - __main__ - Step 11921: {'lr': 0.0004944778989989847, 'samples': 2288832, 'steps': 11920, 'loss/train': 1.4951305389404297} -08/30/2021 15:16:49 - INFO - __main__ - Step 11922: {'lr': 0.0004944767897339146, 'samples': 2289024, 'steps': 11921, 'loss/train': 1.8019953966140747} -08/30/2021 15:16:51 - INFO - __main__ - Step 11923: {'lr': 0.000494475680358687, 'samples': 2289216, 'steps': 11922, 'loss/train': 2.575214147567749} -08/30/2021 15:16:51 - INFO - __main__ - Step 11924: {'lr': 0.0004944745708733025, 'samples': 2289408, 'steps': 11923, 'loss/train': 1.8814994096755981} -08/30/2021 15:16:52 - INFO - __main__ - Step 11925: {'lr': 0.0004944734612777615, 'samples': 2289600, 'steps': 11924, 'loss/train': 1.3159366846084595} -08/30/2021 15:16:52 - INFO - __main__ - Step 11926: {'lr': 0.0004944723515720645, 'samples': 2289792, 'steps': 11925, 'loss/train': 1.339134693145752} -08/30/2021 15:16:53 - INFO - __main__ - Step 11927: {'lr': 0.000494471241756212, 'samples': 2289984, 'steps': 11926, 'loss/train': 1.8326565027236938} -08/30/2021 15:16:53 - INFO - __main__ - Step 11928: {'lr': 0.0004944701318302046, 'samples': 2290176, 'steps': 11927, 'loss/train': 1.7587428092956543} -08/30/2021 15:16:54 - INFO - __main__ - Step 11929: {'lr': 0.0004944690217940427, 'samples': 2290368, 'steps': 11928, 'loss/train': 1.8818683624267578} -08/30/2021 15:16:55 - INFO - __main__ - Step 11930: {'lr': 0.0004944679116477269, 'samples': 2290560, 'steps': 11929, 'loss/train': 1.6216456890106201} -08/30/2021 15:16:55 - INFO - __main__ - Step 11931: {'lr': 0.0004944668013912575, 'samples': 2290752, 'steps': 11930, 'loss/train': 4.033947944641113} -08/30/2021 15:16:56 - INFO - __main__ - Step 11932: {'lr': 0.0004944656910246352, 'samples': 2290944, 'steps': 11931, 'loss/train': 1.6390389204025269} -08/30/2021 15:16:56 - INFO - __main__ - Step 11933: {'lr': 0.0004944645805478605, 'samples': 2291136, 'steps': 11932, 'loss/train': 2.1255385875701904} -08/30/2021 15:16:58 - INFO - __main__ - Step 11934: {'lr': 0.0004944634699609338, 'samples': 2291328, 'steps': 11933, 'loss/train': 2.00468373298645} -08/30/2021 15:16:59 - INFO - __main__ - Step 11935: {'lr': 0.0004944623592638555, 'samples': 2291520, 'steps': 11934, 'loss/train': 1.8242744207382202} -08/30/2021 15:16:59 - INFO - __main__ - Step 11936: {'lr': 0.0004944612484566263, 'samples': 2291712, 'steps': 11935, 'loss/train': 1.6638684272766113} -08/30/2021 15:16:59 - INFO - __main__ - Step 11937: {'lr': 0.0004944601375392467, 'samples': 2291904, 'steps': 11936, 'loss/train': 1.7676445245742798} -08/30/2021 15:17:00 - INFO - __main__ - Step 11938: {'lr': 0.000494459026511717, 'samples': 2292096, 'steps': 11937, 'loss/train': 1.9250776767730713} -08/30/2021 15:17:00 - INFO - __main__ - Step 11939: {'lr': 0.000494457915374038, 'samples': 2292288, 'steps': 11938, 'loss/train': 0.27478641271591187} -08/30/2021 15:17:00 - INFO - __main__ - Step 11940: {'lr': 0.00049445680412621, 'samples': 2292480, 'steps': 11939, 'loss/train': 0.22299745678901672} -08/30/2021 15:17:02 - INFO - __main__ - Step 11941: {'lr': 0.0004944556927682335, 'samples': 2292672, 'steps': 11940, 'loss/train': 0.11953985691070557} -08/30/2021 15:17:02 - INFO - __main__ - Step 11942: {'lr': 0.000494454581300109, 'samples': 2292864, 'steps': 11941, 'loss/train': 1.916543960571289} -08/30/2021 15:17:03 - INFO - __main__ - Step 11943: {'lr': 0.0004944534697218371, 'samples': 2293056, 'steps': 11942, 'loss/train': 1.9661853313446045} -08/30/2021 15:17:03 - INFO - __main__ - Step 11944: {'lr': 0.0004944523580334183, 'samples': 2293248, 'steps': 11943, 'loss/train': 1.1564851999282837} -08/30/2021 15:17:03 - INFO - __main__ - Step 11945: {'lr': 0.0004944512462348528, 'samples': 2293440, 'steps': 11944, 'loss/train': 0.4339814782142639} -08/30/2021 15:17:05 - INFO - __main__ - Step 11946: {'lr': 0.0004944501343261416, 'samples': 2293632, 'steps': 11945, 'loss/train': 2.549010753631592} -08/30/2021 15:17:05 - INFO - __main__ - Step 11947: {'lr': 0.0004944490223072848, 'samples': 2293824, 'steps': 11946, 'loss/train': 1.7171857357025146} -08/30/2021 15:17:06 - INFO - __main__ - Step 11948: {'lr': 0.0004944479101782831, 'samples': 2294016, 'steps': 11947, 'loss/train': 1.3282312154769897} -08/30/2021 15:17:06 - INFO - __main__ - Step 11949: {'lr': 0.0004944467979391369, 'samples': 2294208, 'steps': 11948, 'loss/train': 1.839789628982544} -08/30/2021 15:17:06 - INFO - __main__ - Step 11950: {'lr': 0.0004944456855898469, 'samples': 2294400, 'steps': 11949, 'loss/train': 1.7644050121307373} -08/30/2021 15:17:08 - INFO - __main__ - Step 11951: {'lr': 0.0004944445731304133, 'samples': 2294592, 'steps': 11950, 'loss/train': 2.0731210708618164} -08/30/2021 15:17:08 - INFO - __main__ - Step 11952: {'lr': 0.0004944434605608367, 'samples': 2294784, 'steps': 11951, 'loss/train': 2.1134634017944336} -08/30/2021 15:17:09 - INFO - __main__ - Step 11953: {'lr': 0.0004944423478811177, 'samples': 2294976, 'steps': 11952, 'loss/train': 1.8561817407608032} -08/30/2021 15:17:09 - INFO - __main__ - Step 11954: {'lr': 0.0004944412350912567, 'samples': 2295168, 'steps': 11953, 'loss/train': 1.8143947124481201} -08/30/2021 15:17:09 - INFO - __main__ - Step 11955: {'lr': 0.0004944401221912544, 'samples': 2295360, 'steps': 11954, 'loss/train': 1.742327332496643} -08/30/2021 15:17:10 - INFO - __main__ - Step 11956: {'lr': 0.0004944390091811111, 'samples': 2295552, 'steps': 11955, 'loss/train': 1.770018219947815} -08/30/2021 15:17:11 - INFO - __main__ - Step 11957: {'lr': 0.0004944378960608272, 'samples': 2295744, 'steps': 11956, 'loss/train': 1.9021027088165283} -08/30/2021 15:17:12 - INFO - __main__ - Step 11958: {'lr': 0.0004944367828304035, 'samples': 2295936, 'steps': 11957, 'loss/train': 1.9084395170211792} -08/30/2021 15:17:12 - INFO - __main__ - Step 11959: {'lr': 0.0004944356694898404, 'samples': 2296128, 'steps': 11958, 'loss/train': 1.5890378952026367} -08/30/2021 15:17:13 - INFO - __main__ - Step 11960: {'lr': 0.0004944345560391382, 'samples': 2296320, 'steps': 11959, 'loss/train': 1.9585572481155396} -08/30/2021 15:17:13 - INFO - __main__ - Step 11961: {'lr': 0.0004944334424782977, 'samples': 2296512, 'steps': 11960, 'loss/train': 2.0318806171417236} -08/30/2021 15:17:15 - INFO - __main__ - Step 11962: {'lr': 0.0004944323288073192, 'samples': 2296704, 'steps': 11961, 'loss/train': 1.6990612745285034} -08/30/2021 15:17:15 - INFO - __main__ - Step 11963: {'lr': 0.0004944312150262033, 'samples': 2296896, 'steps': 11962, 'loss/train': 2.077442169189453} -08/30/2021 15:17:15 - INFO - __main__ - Step 11964: {'lr': 0.0004944301011349505, 'samples': 2297088, 'steps': 11963, 'loss/train': 1.551512360572815} -08/30/2021 15:17:16 - INFO - __main__ - Step 11965: {'lr': 0.0004944289871335612, 'samples': 2297280, 'steps': 11964, 'loss/train': 1.5474135875701904} -08/30/2021 15:17:16 - INFO - __main__ - Step 11966: {'lr': 0.0004944278730220359, 'samples': 2297472, 'steps': 11965, 'loss/train': 4.930060863494873} -08/30/2021 15:17:18 - INFO - __main__ - Step 11967: {'lr': 0.0004944267588003754, 'samples': 2297664, 'steps': 11966, 'loss/train': 1.3303277492523193} -08/30/2021 15:17:18 - INFO - __main__ - Step 11968: {'lr': 0.0004944256444685798, 'samples': 2297856, 'steps': 11967, 'loss/train': 2.613445520401001} -08/30/2021 15:17:18 - INFO - __main__ - Step 11969: {'lr': 0.0004944245300266498, 'samples': 2298048, 'steps': 11968, 'loss/train': 1.755059838294983} -08/30/2021 15:17:19 - INFO - __main__ - Step 11970: {'lr': 0.0004944234154745859, 'samples': 2298240, 'steps': 11969, 'loss/train': 2.520012617111206} -08/30/2021 15:17:19 - INFO - __main__ - Step 11971: {'lr': 0.0004944223008123886, 'samples': 2298432, 'steps': 11970, 'loss/train': 1.772457242012024} -08/30/2021 15:17:21 - INFO - __main__ - Step 11972: {'lr': 0.0004944211860400582, 'samples': 2298624, 'steps': 11971, 'loss/train': 2.64841628074646} -08/30/2021 15:17:21 - INFO - __main__ - Step 11973: {'lr': 0.0004944200711575956, 'samples': 2298816, 'steps': 11972, 'loss/train': 2.3025026321411133} -08/30/2021 15:17:21 - INFO - __main__ - Step 11974: {'lr': 0.0004944189561650011, 'samples': 2299008, 'steps': 11973, 'loss/train': 1.9383209943771362} -08/30/2021 15:17:22 - INFO - __main__ - Step 11975: {'lr': 0.0004944178410622751, 'samples': 2299200, 'steps': 11974, 'loss/train': 2.0031256675720215} -08/30/2021 15:17:22 - INFO - __main__ - Step 11976: {'lr': 0.0004944167258494181, 'samples': 2299392, 'steps': 11975, 'loss/train': 1.6150741577148438} -08/30/2021 15:17:24 - INFO - __main__ - Step 11977: {'lr': 0.0004944156105264308, 'samples': 2299584, 'steps': 11976, 'loss/train': 1.7885252237319946} -08/30/2021 15:17:24 - INFO - __main__ - Step 11978: {'lr': 0.0004944144950933137, 'samples': 2299776, 'steps': 11977, 'loss/train': 1.420885682106018} -08/30/2021 15:17:24 - INFO - __main__ - Step 11979: {'lr': 0.000494413379550067, 'samples': 2299968, 'steps': 11978, 'loss/train': 1.8487935066223145} -08/30/2021 15:17:25 - INFO - __main__ - Step 11980: {'lr': 0.0004944122638966916, 'samples': 2300160, 'steps': 11979, 'loss/train': 1.9244537353515625} -08/30/2021 15:17:25 - INFO - __main__ - Step 11981: {'lr': 0.0004944111481331876, 'samples': 2300352, 'steps': 11980, 'loss/train': 1.6892220973968506} -08/30/2021 15:17:26 - INFO - __main__ - Step 11982: {'lr': 0.0004944100322595558, 'samples': 2300544, 'steps': 11981, 'loss/train': 1.8874355554580688} -08/30/2021 15:17:27 - INFO - __main__ - Step 11983: {'lr': 0.0004944089162757968, 'samples': 2300736, 'steps': 11982, 'loss/train': 1.6030975580215454} -08/30/2021 15:17:28 - INFO - __main__ - Step 11984: {'lr': 0.0004944078001819106, 'samples': 2300928, 'steps': 11983, 'loss/train': 1.707241415977478} -08/30/2021 15:17:28 - INFO - __main__ - Step 11985: {'lr': 0.0004944066839778983, 'samples': 2301120, 'steps': 11984, 'loss/train': 1.5362730026245117} -08/30/2021 15:17:29 - INFO - __main__ - Step 11986: {'lr': 0.0004944055676637599, 'samples': 2301312, 'steps': 11985, 'loss/train': 1.617297887802124} -08/30/2021 15:17:29 - INFO - __main__ - Step 11987: {'lr': 0.0004944044512394962, 'samples': 2301504, 'steps': 11986, 'loss/train': 2.1507620811462402} -08/30/2021 15:17:31 - INFO - __main__ - Step 11988: {'lr': 0.0004944033347051076, 'samples': 2301696, 'steps': 11987, 'loss/train': 1.9792611598968506} -08/30/2021 15:17:31 - INFO - __main__ - Step 11989: {'lr': 0.0004944022180605947, 'samples': 2301888, 'steps': 11988, 'loss/train': 1.146347999572754} -08/30/2021 15:17:31 - INFO - __main__ - Step 11990: {'lr': 0.0004944011013059579, 'samples': 2302080, 'steps': 11989, 'loss/train': 1.4543150663375854} -08/30/2021 15:17:32 - INFO - __main__ - Step 11991: {'lr': 0.0004943999844411977, 'samples': 2302272, 'steps': 11990, 'loss/train': 2.1181256771087646} -08/30/2021 15:17:32 - INFO - __main__ - Step 11992: {'lr': 0.0004943988674663147, 'samples': 2302464, 'steps': 11991, 'loss/train': 2.086256980895996} -08/30/2021 15:17:34 - INFO - __main__ - Step 11993: {'lr': 0.0004943977503813092, 'samples': 2302656, 'steps': 11992, 'loss/train': 2.1037232875823975} -08/30/2021 15:17:34 - INFO - __main__ - Step 11994: {'lr': 0.000494396633186182, 'samples': 2302848, 'steps': 11993, 'loss/train': 2.0811357498168945} -08/30/2021 15:17:34 - INFO - __main__ - Step 11995: {'lr': 0.0004943955158809334, 'samples': 2303040, 'steps': 11994, 'loss/train': 1.6144832372665405} -08/30/2021 15:17:35 - INFO - __main__ - Step 11996: {'lr': 0.0004943943984655639, 'samples': 2303232, 'steps': 11995, 'loss/train': 1.6353332996368408} -08/30/2021 15:17:35 - INFO - __main__ - Step 11997: {'lr': 0.0004943932809400741, 'samples': 2303424, 'steps': 11996, 'loss/train': 2.0281214714050293} -08/30/2021 15:17:37 - INFO - __main__ - Step 11998: {'lr': 0.0004943921633044644, 'samples': 2303616, 'steps': 11997, 'loss/train': 1.399830937385559} -08/30/2021 15:17:37 - INFO - __main__ - Step 11999: {'lr': 0.0004943910455587354, 'samples': 2303808, 'steps': 11998, 'loss/train': 1.625523328781128} -08/30/2021 15:17:37 - INFO - __main__ - Step 12000: {'lr': 0.0004943899277028877, 'samples': 2304000, 'steps': 11999, 'loss/train': 1.9747083187103271} -08/30/2021 15:17:38 - INFO - __main__ - Step 12001: {'lr': 0.0004943888097369216, 'samples': 2304192, 'steps': 12000, 'loss/train': 1.6894176006317139} -08/30/2021 15:17:38 - INFO - __main__ - Step 12002: {'lr': 0.0004943876916608375, 'samples': 2304384, 'steps': 12001, 'loss/train': 1.666957974433899} -08/30/2021 15:17:40 - INFO - __main__ - Step 12003: {'lr': 0.0004943865734746364, 'samples': 2304576, 'steps': 12002, 'loss/train': 1.9539308547973633} -08/30/2021 15:17:40 - INFO - __main__ - Step 12004: {'lr': 0.0004943854551783182, 'samples': 2304768, 'steps': 12003, 'loss/train': 2.365431070327759} -08/30/2021 15:17:40 - INFO - __main__ - Step 12005: {'lr': 0.0004943843367718838, 'samples': 2304960, 'steps': 12004, 'loss/train': 1.2316572666168213} -08/30/2021 15:17:41 - INFO - __main__ - Step 12006: {'lr': 0.0004943832182553336, 'samples': 2305152, 'steps': 12005, 'loss/train': 1.4853630065917969} -08/30/2021 15:17:41 - INFO - __main__ - Step 12007: {'lr': 0.000494382099628668, 'samples': 2305344, 'steps': 12006, 'loss/train': 1.1035212278366089} -08/30/2021 15:17:43 - INFO - __main__ - Step 12008: {'lr': 0.0004943809808918877, 'samples': 2305536, 'steps': 12007, 'loss/train': 1.5442581176757812} -08/30/2021 15:17:44 - INFO - __main__ - Step 12009: {'lr': 0.000494379862044993, 'samples': 2305728, 'steps': 12008, 'loss/train': 2.388361692428589} -08/30/2021 15:17:44 - INFO - __main__ - Step 12010: {'lr': 0.0004943787430879846, 'samples': 2305920, 'steps': 12009, 'loss/train': 1.524498701095581} -08/30/2021 15:17:44 - INFO - __main__ - Step 12011: {'lr': 0.0004943776240208628, 'samples': 2306112, 'steps': 12010, 'loss/train': 1.300168752670288} -08/30/2021 15:17:45 - INFO - __main__ - Step 12012: {'lr': 0.0004943765048436283, 'samples': 2306304, 'steps': 12011, 'loss/train': 1.6063472032546997} -08/30/2021 15:17:45 - INFO - __main__ - Step 12013: {'lr': 0.0004943753855562815, 'samples': 2306496, 'steps': 12012, 'loss/train': 1.5207185745239258} -08/30/2021 15:17:45 - INFO - __main__ - Step 12014: {'lr': 0.000494374266158823, 'samples': 2306688, 'steps': 12013, 'loss/train': 0.12340107560157776} -08/30/2021 15:17:47 - INFO - __main__ - Step 12015: {'lr': 0.0004943731466512531, 'samples': 2306880, 'steps': 12014, 'loss/train': 1.4685721397399902} -08/30/2021 15:17:47 - INFO - __main__ - Step 12016: {'lr': 0.0004943720270335724, 'samples': 2307072, 'steps': 12015, 'loss/train': 2.2033302783966064} -08/30/2021 15:17:48 - INFO - __main__ - Step 12017: {'lr': 0.0004943709073057816, 'samples': 2307264, 'steps': 12016, 'loss/train': 2.157628059387207} -08/30/2021 15:17:48 - INFO - __main__ - Step 12018: {'lr': 0.000494369787467881, 'samples': 2307456, 'steps': 12017, 'loss/train': 6.126431941986084} -08/30/2021 15:17:48 - INFO - __main__ - Step 12019: {'lr': 0.000494368667519871, 'samples': 2307648, 'steps': 12018, 'loss/train': 1.3012217283248901} -08/30/2021 15:17:50 - INFO - __main__ - Step 12020: {'lr': 0.0004943675474617524, 'samples': 2307840, 'steps': 12019, 'loss/train': 1.4627915620803833} -08/30/2021 15:17:51 - INFO - __main__ - Step 12021: {'lr': 0.0004943664272935255, 'samples': 2308032, 'steps': 12020, 'loss/train': 1.4414600133895874} -08/30/2021 15:17:51 - INFO - __main__ - Step 12022: {'lr': 0.0004943653070151909, 'samples': 2308224, 'steps': 12021, 'loss/train': 1.6685082912445068} -08/30/2021 15:17:52 - INFO - __main__ - Step 12023: {'lr': 0.000494364186626749, 'samples': 2308416, 'steps': 12022, 'loss/train': 1.2931737899780273} -08/30/2021 15:17:52 - INFO - __main__ - Step 12024: {'lr': 0.0004943630661282004, 'samples': 2308608, 'steps': 12023, 'loss/train': 0.8000673651695251} -08/30/2021 15:17:52 - INFO - __main__ - Step 12025: {'lr': 0.0004943619455195456, 'samples': 2308800, 'steps': 12024, 'loss/train': 0.7814105153083801} -08/30/2021 15:17:54 - INFO - __main__ - Step 12026: {'lr': 0.000494360824800785, 'samples': 2308992, 'steps': 12025, 'loss/train': 0.7187609672546387} -08/30/2021 15:17:55 - INFO - __main__ - Step 12027: {'lr': 0.0004943597039719192, 'samples': 2309184, 'steps': 12026, 'loss/train': 1.802985429763794} -08/30/2021 15:17:55 - INFO - __main__ - Step 12028: {'lr': 0.0004943585830329487, 'samples': 2309376, 'steps': 12027, 'loss/train': 2.038097620010376} -08/30/2021 15:17:55 - INFO - __main__ - Step 12029: {'lr': 0.0004943574619838741, 'samples': 2309568, 'steps': 12028, 'loss/train': 1.644842505455017} -08/30/2021 15:17:56 - INFO - __main__ - Step 12030: {'lr': 0.0004943563408246957, 'samples': 2309760, 'steps': 12029, 'loss/train': 1.4243265390396118} -08/30/2021 15:17:57 - INFO - __main__ - Step 12031: {'lr': 0.000494355219555414, 'samples': 2309952, 'steps': 12030, 'loss/train': 1.8283549547195435} -08/30/2021 15:17:58 - INFO - __main__ - Step 12032: {'lr': 0.0004943540981760298, 'samples': 2310144, 'steps': 12031, 'loss/train': 2.287456750869751} -08/30/2021 15:17:58 - INFO - __main__ - Step 12033: {'lr': 0.0004943529766865434, 'samples': 2310336, 'steps': 12032, 'loss/train': 2.2850167751312256} -08/30/2021 15:17:58 - INFO - __main__ - Step 12034: {'lr': 0.0004943518550869552, 'samples': 2310528, 'steps': 12033, 'loss/train': 1.8853846788406372} -08/30/2021 15:17:59 - INFO - __main__ - Step 12035: {'lr': 0.0004943507333772659, 'samples': 2310720, 'steps': 12034, 'loss/train': 1.424363613128662} -08/30/2021 15:17:59 - INFO - __main__ - Step 12036: {'lr': 0.0004943496115574758, 'samples': 2310912, 'steps': 12035, 'loss/train': 0.38498976826667786} -08/30/2021 15:18:01 - INFO - __main__ - Step 12037: {'lr': 0.0004943484896275857, 'samples': 2311104, 'steps': 12036, 'loss/train': 1.6763032674789429} -08/30/2021 15:18:02 - INFO - __main__ - Step 12038: {'lr': 0.0004943473675875959, 'samples': 2311296, 'steps': 12037, 'loss/train': 1.6160004138946533} -08/30/2021 15:18:02 - INFO - __main__ - Step 12039: {'lr': 0.0004943462454375069, 'samples': 2311488, 'steps': 12038, 'loss/train': 1.7438759803771973} -08/30/2021 15:18:02 - INFO - __main__ - Step 12040: {'lr': 0.0004943451231773192, 'samples': 2311680, 'steps': 12039, 'loss/train': 1.6552613973617554} -08/30/2021 15:18:03 - INFO - __main__ - Step 12041: {'lr': 0.0004943440008070336, 'samples': 2311872, 'steps': 12040, 'loss/train': 1.7740602493286133} -08/30/2021 15:18:04 - INFO - __main__ - Step 12042: {'lr': 0.0004943428783266502, 'samples': 2312064, 'steps': 12041, 'loss/train': 1.8296421766281128} -08/30/2021 15:18:05 - INFO - __main__ - Step 12043: {'lr': 0.0004943417557361696, 'samples': 2312256, 'steps': 12042, 'loss/train': 2.170560359954834} -08/30/2021 15:18:05 - INFO - __main__ - Step 12044: {'lr': 0.0004943406330355925, 'samples': 2312448, 'steps': 12043, 'loss/train': 2.164201259613037} -08/30/2021 15:18:05 - INFO - __main__ - Step 12045: {'lr': 0.0004943395102249192, 'samples': 2312640, 'steps': 12044, 'loss/train': 1.9016125202178955} -08/30/2021 15:18:06 - INFO - __main__ - Step 12046: {'lr': 0.0004943383873041503, 'samples': 2312832, 'steps': 12045, 'loss/train': 0.9587546586990356} -08/30/2021 15:18:07 - INFO - __main__ - Step 12047: {'lr': 0.0004943372642732864, 'samples': 2313024, 'steps': 12046, 'loss/train': 1.6233153343200684} -08/30/2021 15:18:08 - INFO - __main__ - Step 12048: {'lr': 0.0004943361411323277, 'samples': 2313216, 'steps': 12047, 'loss/train': 1.6164321899414062} -08/30/2021 15:18:08 - INFO - __main__ - Step 12049: {'lr': 0.0004943350178812751, 'samples': 2313408, 'steps': 12048, 'loss/train': 1.4530580043792725} -08/30/2021 15:18:08 - INFO - __main__ - Step 12050: {'lr': 0.0004943338945201288, 'samples': 2313600, 'steps': 12049, 'loss/train': 2.2362661361694336} -08/30/2021 15:18:09 - INFO - __main__ - Step 12051: {'lr': 0.0004943327710488894, 'samples': 2313792, 'steps': 12050, 'loss/train': 1.9938535690307617} -08/30/2021 15:18:10 - INFO - __main__ - Step 12052: {'lr': 0.0004943316474675575, 'samples': 2313984, 'steps': 12051, 'loss/train': 1.6572089195251465} -08/30/2021 15:18:11 - INFO - __main__ - Step 12053: {'lr': 0.0004943305237761335, 'samples': 2314176, 'steps': 12052, 'loss/train': 1.9264360666275024} -08/30/2021 15:18:11 - INFO - __main__ - Step 12054: {'lr': 0.0004943293999746179, 'samples': 2314368, 'steps': 12053, 'loss/train': 5.252533912658691} -08/30/2021 15:18:11 - INFO - __main__ - Step 12055: {'lr': 0.0004943282760630114, 'samples': 2314560, 'steps': 12054, 'loss/train': 2.003549337387085} -08/30/2021 15:18:12 - INFO - __main__ - Step 12056: {'lr': 0.0004943271520413141, 'samples': 2314752, 'steps': 12055, 'loss/train': 1.935607671737671} -08/30/2021 15:18:12 - INFO - __main__ - Step 12057: {'lr': 0.0004943260279095269, 'samples': 2314944, 'steps': 12056, 'loss/train': 2.268451452255249} -08/30/2021 15:18:14 - INFO - __main__ - Step 12058: {'lr': 0.0004943249036676501, 'samples': 2315136, 'steps': 12057, 'loss/train': 1.9314218759536743} -08/30/2021 15:18:14 - INFO - __main__ - Step 12059: {'lr': 0.0004943237793156844, 'samples': 2315328, 'steps': 12058, 'loss/train': 1.8404067754745483} -08/30/2021 15:18:15 - INFO - __main__ - Step 12060: {'lr': 0.00049432265485363, 'samples': 2315520, 'steps': 12059, 'loss/train': 1.3859785795211792} -08/30/2021 15:18:15 - INFO - __main__ - Step 12061: {'lr': 0.0004943215302814877, 'samples': 2315712, 'steps': 12060, 'loss/train': 0.191435769200325} -08/30/2021 15:18:15 - INFO - __main__ - Step 12062: {'lr': 0.0004943204055992579, 'samples': 2315904, 'steps': 12061, 'loss/train': 1.8861454725265503} -08/30/2021 15:18:17 - INFO - __main__ - Step 12063: {'lr': 0.0004943192808069411, 'samples': 2316096, 'steps': 12062, 'loss/train': 1.554942011833191} -08/30/2021 15:18:17 - INFO - __main__ - Step 12064: {'lr': 0.0004943181559045378, 'samples': 2316288, 'steps': 12063, 'loss/train': 2.055192470550537} -08/30/2021 15:18:18 - INFO - __main__ - Step 12065: {'lr': 0.0004943170308920483, 'samples': 2316480, 'steps': 12064, 'loss/train': 1.8513082265853882} -08/30/2021 15:18:18 - INFO - __main__ - Step 12066: {'lr': 0.0004943159057694736, 'samples': 2316672, 'steps': 12065, 'loss/train': 1.7051243782043457} -08/30/2021 15:18:19 - INFO - __main__ - Step 12067: {'lr': 0.0004943147805368138, 'samples': 2316864, 'steps': 12066, 'loss/train': 0.13096553087234497} -08/30/2021 15:18:20 - INFO - __main__ - Step 12068: {'lr': 0.0004943136551940695, 'samples': 2317056, 'steps': 12067, 'loss/train': 2.0382769107818604} -08/30/2021 15:18:20 - INFO - __main__ - Step 12069: {'lr': 0.0004943125297412413, 'samples': 2317248, 'steps': 12068, 'loss/train': 2.5085906982421875} -08/30/2021 15:18:21 - INFO - __main__ - Step 12070: {'lr': 0.0004943114041783296, 'samples': 2317440, 'steps': 12069, 'loss/train': 1.7958232164382935} -08/30/2021 15:18:21 - INFO - __main__ - Step 12071: {'lr': 0.000494310278505335, 'samples': 2317632, 'steps': 12070, 'loss/train': 1.4741815328598022} -08/30/2021 15:18:22 - INFO - __main__ - Step 12072: {'lr': 0.0004943091527222579, 'samples': 2317824, 'steps': 12071, 'loss/train': 1.7163307666778564} -08/30/2021 15:18:23 - INFO - __main__ - Step 12073: {'lr': 0.0004943080268290989, 'samples': 2318016, 'steps': 12072, 'loss/train': 1.750003695487976} -08/30/2021 15:18:23 - INFO - __main__ - Step 12074: {'lr': 0.0004943069008258584, 'samples': 2318208, 'steps': 12073, 'loss/train': 1.5996164083480835} -08/30/2021 15:18:24 - INFO - __main__ - Step 12075: {'lr': 0.0004943057747125371, 'samples': 2318400, 'steps': 12074, 'loss/train': 1.823594093322754} -08/30/2021 15:18:24 - INFO - __main__ - Step 12076: {'lr': 0.0004943046484891352, 'samples': 2318592, 'steps': 12075, 'loss/train': 1.444747805595398} -08/30/2021 15:18:24 - INFO - __main__ - Step 12077: {'lr': 0.0004943035221556536, 'samples': 2318784, 'steps': 12076, 'loss/train': 1.5687693357467651} -08/30/2021 15:18:26 - INFO - __main__ - Step 12078: {'lr': 0.0004943023957120926, 'samples': 2318976, 'steps': 12077, 'loss/train': 1.819845199584961} -08/30/2021 15:18:27 - INFO - __main__ - Step 12079: {'lr': 0.0004943012691584526, 'samples': 2319168, 'steps': 12078, 'loss/train': 1.7982951402664185} -08/30/2021 15:18:27 - INFO - __main__ - Step 12080: {'lr': 0.0004943001424947343, 'samples': 2319360, 'steps': 12079, 'loss/train': 0.7677766680717468} -08/30/2021 15:18:27 - INFO - __main__ - Step 12081: {'lr': 0.000494299015720938, 'samples': 2319552, 'steps': 12080, 'loss/train': 1.7462985515594482} -08/30/2021 15:18:28 - INFO - __main__ - Step 12082: {'lr': 0.0004942978888370645, 'samples': 2319744, 'steps': 12081, 'loss/train': 1.373520851135254} -08/30/2021 15:18:29 - INFO - __main__ - Step 12083: {'lr': 0.000494296761843114, 'samples': 2319936, 'steps': 12082, 'loss/train': 1.4659006595611572} -08/30/2021 15:18:30 - INFO - __main__ - Step 12084: {'lr': 0.0004942956347390872, 'samples': 2320128, 'steps': 12083, 'loss/train': 1.479794979095459} -08/30/2021 15:18:30 - INFO - __main__ - Step 12085: {'lr': 0.0004942945075249845, 'samples': 2320320, 'steps': 12084, 'loss/train': 1.0551555156707764} -08/30/2021 15:18:30 - INFO - __main__ - Step 12086: {'lr': 0.0004942933802008066, 'samples': 2320512, 'steps': 12085, 'loss/train': 1.9779893159866333} -08/30/2021 15:18:31 - INFO - __main__ - Step 12087: {'lr': 0.0004942922527665538, 'samples': 2320704, 'steps': 12086, 'loss/train': 1.4531564712524414} -08/30/2021 15:18:31 - INFO - __main__ - Step 12088: {'lr': 0.0004942911252222267, 'samples': 2320896, 'steps': 12087, 'loss/train': 1.9168614149093628} -08/30/2021 15:18:32 - INFO - __main__ - Step 12089: {'lr': 0.0004942899975678257, 'samples': 2321088, 'steps': 12088, 'loss/train': 1.192571759223938} -08/30/2021 15:18:33 - INFO - __main__ - Step 12090: {'lr': 0.0004942888698033515, 'samples': 2321280, 'steps': 12089, 'loss/train': 1.5015541315078735} -08/30/2021 15:18:33 - INFO - __main__ - Step 12091: {'lr': 0.0004942877419288045, 'samples': 2321472, 'steps': 12090, 'loss/train': 1.565805435180664} -08/30/2021 15:18:34 - INFO - __main__ - Step 12092: {'lr': 0.0004942866139441851, 'samples': 2321664, 'steps': 12091, 'loss/train': 1.1745671033859253} -08/30/2021 15:18:34 - INFO - __main__ - Step 12093: {'lr': 0.0004942854858494941, 'samples': 2321856, 'steps': 12092, 'loss/train': 1.6281485557556152} -08/30/2021 15:18:36 - INFO - __main__ - Step 12094: {'lr': 0.0004942843576447316, 'samples': 2322048, 'steps': 12093, 'loss/train': 1.7991557121276855} -08/30/2021 15:18:37 - INFO - __main__ - Step 12095: {'lr': 0.0004942832293298986, 'samples': 2322240, 'steps': 12094, 'loss/train': 1.21683669090271} -08/30/2021 15:18:37 - INFO - __main__ - Step 12096: {'lr': 0.0004942821009049952, 'samples': 2322432, 'steps': 12095, 'loss/train': 1.626397967338562} -08/30/2021 15:18:37 - INFO - __main__ - Step 12097: {'lr': 0.0004942809723700221, 'samples': 2322624, 'steps': 12096, 'loss/train': 1.7386540174484253} -08/30/2021 15:18:38 - INFO - __main__ - Step 12098: {'lr': 0.0004942798437249797, 'samples': 2322816, 'steps': 12097, 'loss/train': 1.600664734840393} -08/30/2021 15:18:39 - INFO - __main__ - Step 12099: {'lr': 0.0004942787149698687, 'samples': 2323008, 'steps': 12098, 'loss/train': 2.1354129314422607} -08/30/2021 15:18:40 - INFO - __main__ - Step 12100: {'lr': 0.0004942775861046893, 'samples': 2323200, 'steps': 12099, 'loss/train': 1.0666619539260864} -08/30/2021 15:18:40 - INFO - __main__ - Step 12101: {'lr': 0.0004942764571294422, 'samples': 2323392, 'steps': 12100, 'loss/train': 1.6054303646087646} -08/30/2021 15:18:40 - INFO - __main__ - Step 12102: {'lr': 0.0004942753280441281, 'samples': 2323584, 'steps': 12101, 'loss/train': 2.294025421142578} -08/30/2021 15:18:41 - INFO - __main__ - Step 12103: {'lr': 0.0004942741988487471, 'samples': 2323776, 'steps': 12102, 'loss/train': 1.8871198892593384} -08/30/2021 15:18:42 - INFO - __main__ - Step 12104: {'lr': 0.0004942730695433001, 'samples': 2323968, 'steps': 12103, 'loss/train': 0.6726149916648865} -08/30/2021 15:18:42 - INFO - __main__ - Step 12105: {'lr': 0.0004942719401277873, 'samples': 2324160, 'steps': 12104, 'loss/train': 1.5810009241104126} -08/30/2021 15:18:43 - INFO - __main__ - Step 12106: {'lr': 0.0004942708106022094, 'samples': 2324352, 'steps': 12105, 'loss/train': 1.3863474130630493} -08/30/2021 15:18:43 - INFO - __main__ - Step 12107: {'lr': 0.0004942696809665668, 'samples': 2324544, 'steps': 12106, 'loss/train': 1.8221224546432495} -08/30/2021 15:18:44 - INFO - __main__ - Step 12108: {'lr': 0.0004942685512208599, 'samples': 2324736, 'steps': 12107, 'loss/train': 1.6639631986618042} -08/30/2021 15:18:45 - INFO - __main__ - Step 12109: {'lr': 0.0004942674213650896, 'samples': 2324928, 'steps': 12108, 'loss/train': 1.747971773147583} -08/30/2021 15:18:46 - INFO - __main__ - Step 12110: {'lr': 0.000494266291399256, 'samples': 2325120, 'steps': 12109, 'loss/train': 2.1878867149353027} -08/30/2021 15:18:46 - INFO - __main__ - Step 12111: {'lr': 0.0004942651613233599, 'samples': 2325312, 'steps': 12110, 'loss/train': 1.359521508216858} -08/30/2021 15:18:46 - INFO - __main__ - Step 12112: {'lr': 0.0004942640311374017, 'samples': 2325504, 'steps': 12111, 'loss/train': 1.5496395826339722} -08/30/2021 15:18:47 - INFO - __main__ - Step 12113: {'lr': 0.0004942629008413818, 'samples': 2325696, 'steps': 12112, 'loss/train': 1.916627049446106} -08/30/2021 15:18:48 - INFO - __main__ - Step 12114: {'lr': 0.0004942617704353008, 'samples': 2325888, 'steps': 12113, 'loss/train': 1.8518034219741821} -08/30/2021 15:18:49 - INFO - __main__ - Step 12115: {'lr': 0.0004942606399191593, 'samples': 2326080, 'steps': 12114, 'loss/train': 2.5131680965423584} -08/30/2021 15:18:49 - INFO - __main__ - Step 12116: {'lr': 0.0004942595092929577, 'samples': 2326272, 'steps': 12115, 'loss/train': 1.6142479181289673} -08/30/2021 15:18:50 - INFO - __main__ - Step 12117: {'lr': 0.0004942583785566965, 'samples': 2326464, 'steps': 12116, 'loss/train': 1.4931957721710205} -08/30/2021 15:18:50 - INFO - __main__ - Step 12118: {'lr': 0.0004942572477103763, 'samples': 2326656, 'steps': 12117, 'loss/train': 1.6612237691879272} -08/30/2021 15:18:51 - INFO - __main__ - Step 12119: {'lr': 0.0004942561167539975, 'samples': 2326848, 'steps': 12118, 'loss/train': 1.540592908859253} -08/30/2021 15:18:52 - INFO - __main__ - Step 12120: {'lr': 0.0004942549856875606, 'samples': 2327040, 'steps': 12119, 'loss/train': 1.9624732732772827} -08/30/2021 15:18:52 - INFO - __main__ - Step 12121: {'lr': 0.0004942538545110663, 'samples': 2327232, 'steps': 12120, 'loss/train': 1.8401318788528442} -08/30/2021 15:18:53 - INFO - __main__ - Step 12122: {'lr': 0.0004942527232245149, 'samples': 2327424, 'steps': 12121, 'loss/train': 1.9509354829788208} -08/30/2021 15:18:53 - INFO - __main__ - Step 12123: {'lr': 0.0004942515918279071, 'samples': 2327616, 'steps': 12122, 'loss/train': 1.8921127319335938} -08/30/2021 15:18:54 - INFO - __main__ - Step 12124: {'lr': 0.0004942504603212433, 'samples': 2327808, 'steps': 12123, 'loss/train': 1.6281896829605103} -08/30/2021 15:18:55 - INFO - __main__ - Step 12125: {'lr': 0.0004942493287045239, 'samples': 2328000, 'steps': 12124, 'loss/train': 1.2714658975601196} -08/30/2021 15:18:55 - INFO - __main__ - Step 12126: {'lr': 0.0004942481969777495, 'samples': 2328192, 'steps': 12125, 'loss/train': 1.8391683101654053} -08/30/2021 15:18:55 - INFO - __main__ - Step 12127: {'lr': 0.0004942470651409207, 'samples': 2328384, 'steps': 12126, 'loss/train': 1.2472349405288696} -08/30/2021 15:18:56 - INFO - __main__ - Step 12128: {'lr': 0.000494245933194038, 'samples': 2328576, 'steps': 12127, 'loss/train': 1.6282511949539185} -08/30/2021 15:18:57 - INFO - __main__ - Step 12129: {'lr': 0.0004942448011371018, 'samples': 2328768, 'steps': 12128, 'loss/train': 1.464552879333496} -08/30/2021 15:18:58 - INFO - __main__ - Step 12130: {'lr': 0.0004942436689701126, 'samples': 2328960, 'steps': 12129, 'loss/train': 1.3245165348052979} -08/30/2021 15:18:58 - INFO - __main__ - Step 12131: {'lr': 0.000494242536693071, 'samples': 2329152, 'steps': 12130, 'loss/train': 1.7746152877807617} -08/30/2021 15:18:58 - INFO - __main__ - Step 12132: {'lr': 0.0004942414043059776, 'samples': 2329344, 'steps': 12131, 'loss/train': 1.863704800605774} -08/30/2021 15:18:59 - INFO - __main__ - Step 12133: {'lr': 0.0004942402718088326, 'samples': 2329536, 'steps': 12132, 'loss/train': 1.7185570001602173} -08/30/2021 15:19:00 - INFO - __main__ - Step 12134: {'lr': 0.0004942391392016368, 'samples': 2329728, 'steps': 12133, 'loss/train': 1.7659586668014526} -08/30/2021 15:19:01 - INFO - __main__ - Step 12135: {'lr': 0.0004942380064843906, 'samples': 2329920, 'steps': 12134, 'loss/train': 1.9427530765533447} -08/30/2021 15:19:01 - INFO - __main__ - Step 12136: {'lr': 0.0004942368736570946, 'samples': 2330112, 'steps': 12135, 'loss/train': 1.532886028289795} -08/30/2021 15:19:02 - INFO - __main__ - Step 12137: {'lr': 0.0004942357407197491, 'samples': 2330304, 'steps': 12136, 'loss/train': 0.5886409282684326} -08/30/2021 15:19:02 - INFO - __main__ - Step 12138: {'lr': 0.0004942346076723548, 'samples': 2330496, 'steps': 12137, 'loss/train': 0.3196311593055725} -08/30/2021 15:19:04 - INFO - __main__ - Step 12139: {'lr': 0.0004942334745149122, 'samples': 2330688, 'steps': 12138, 'loss/train': 1.8268685340881348} -08/30/2021 15:19:04 - INFO - __main__ - Step 12140: {'lr': 0.0004942323412474218, 'samples': 2330880, 'steps': 12139, 'loss/train': 2.045480966567993} -08/30/2021 15:19:05 - INFO - __main__ - Step 12141: {'lr': 0.000494231207869884, 'samples': 2331072, 'steps': 12140, 'loss/train': 1.5094717741012573} -08/30/2021 15:19:05 - INFO - __main__ - Step 12142: {'lr': 0.0004942300743822993, 'samples': 2331264, 'steps': 12141, 'loss/train': 1.67244553565979} -08/30/2021 15:19:05 - INFO - __main__ - Step 12143: {'lr': 0.0004942289407846684, 'samples': 2331456, 'steps': 12142, 'loss/train': 1.5462299585342407} -08/30/2021 15:19:06 - INFO - __main__ - Step 12144: {'lr': 0.0004942278070769917, 'samples': 2331648, 'steps': 12143, 'loss/train': 0.135407492518425} -08/30/2021 15:19:08 - INFO - __main__ - Step 12145: {'lr': 0.0004942266732592697, 'samples': 2331840, 'steps': 12144, 'loss/train': 1.4855194091796875} -08/30/2021 15:19:08 - INFO - __main__ - Step 12146: {'lr': 0.0004942255393315029, 'samples': 2332032, 'steps': 12145, 'loss/train': 1.9162156581878662} -08/30/2021 15:19:09 - INFO - __main__ - Step 12147: {'lr': 0.000494224405293692, 'samples': 2332224, 'steps': 12146, 'loss/train': 1.5435060262680054} -08/30/2021 15:19:09 - INFO - __main__ - Step 12148: {'lr': 0.0004942232711458372, 'samples': 2332416, 'steps': 12147, 'loss/train': 0.9427946209907532} -08/30/2021 15:19:09 - INFO - __main__ - Step 12149: {'lr': 0.0004942221368879391, 'samples': 2332608, 'steps': 12148, 'loss/train': 1.492453694343567} -08/30/2021 15:19:11 - INFO - __main__ - Step 12150: {'lr': 0.0004942210025199985, 'samples': 2332800, 'steps': 12149, 'loss/train': 1.6069821119308472} -08/30/2021 15:19:11 - INFO - __main__ - Step 12151: {'lr': 0.0004942198680420155, 'samples': 2332992, 'steps': 12150, 'loss/train': 1.6264772415161133} -08/30/2021 15:19:12 - INFO - __main__ - Step 12152: {'lr': 0.0004942187334539908, 'samples': 2333184, 'steps': 12151, 'loss/train': 1.6122090816497803} -08/30/2021 15:19:12 - INFO - __main__ - Step 12153: {'lr': 0.0004942175987559251, 'samples': 2333376, 'steps': 12152, 'loss/train': 1.3487244844436646} -08/30/2021 15:19:12 - INFO - __main__ - Step 12154: {'lr': 0.0004942164639478185, 'samples': 2333568, 'steps': 12153, 'loss/train': 1.9462392330169678} -08/30/2021 15:19:14 - INFO - __main__ - Step 12155: {'lr': 0.0004942153290296718, 'samples': 2333760, 'steps': 12154, 'loss/train': 2.1020166873931885} -08/30/2021 15:19:14 - INFO - __main__ - Step 12156: {'lr': 0.0004942141940014854, 'samples': 2333952, 'steps': 12155, 'loss/train': 2.0489957332611084} -08/30/2021 15:19:15 - INFO - __main__ - Step 12157: {'lr': 0.0004942130588632599, 'samples': 2334144, 'steps': 12156, 'loss/train': 2.6077041625976562} -08/30/2021 15:19:15 - INFO - __main__ - Step 12158: {'lr': 0.0004942119236149958, 'samples': 2334336, 'steps': 12157, 'loss/train': 1.9298309087753296} -08/30/2021 15:19:15 - INFO - __main__ - Step 12159: {'lr': 0.0004942107882566936, 'samples': 2334528, 'steps': 12158, 'loss/train': 1.816013216972351} -08/30/2021 15:19:17 - INFO - __main__ - Step 12160: {'lr': 0.0004942096527883538, 'samples': 2334720, 'steps': 12159, 'loss/train': 1.7926967144012451} -08/30/2021 15:19:17 - INFO - __main__ - Step 12161: {'lr': 0.0004942085172099768, 'samples': 2334912, 'steps': 12160, 'loss/train': 1.8809715509414673} -08/30/2021 15:19:18 - INFO - __main__ - Step 12162: {'lr': 0.0004942073815215632, 'samples': 2335104, 'steps': 12161, 'loss/train': 2.161996364593506} -08/30/2021 15:19:18 - INFO - __main__ - Step 12163: {'lr': 0.0004942062457231136, 'samples': 2335296, 'steps': 12162, 'loss/train': 1.6908721923828125} -08/30/2021 15:19:18 - INFO - __main__ - Step 12164: {'lr': 0.0004942051098146284, 'samples': 2335488, 'steps': 12163, 'loss/train': 1.698455810546875} -08/30/2021 15:19:20 - INFO - __main__ - Step 12165: {'lr': 0.0004942039737961081, 'samples': 2335680, 'steps': 12164, 'loss/train': 1.7169294357299805} -08/30/2021 15:19:20 - INFO - __main__ - Step 12166: {'lr': 0.0004942028376675533, 'samples': 2335872, 'steps': 12165, 'loss/train': 1.8420363664627075} -08/30/2021 15:19:21 - INFO - __main__ - Step 12167: {'lr': 0.0004942017014289645, 'samples': 2336064, 'steps': 12166, 'loss/train': 2.1549808979034424} -08/30/2021 15:19:21 - INFO - __main__ - Step 12168: {'lr': 0.0004942005650803421, 'samples': 2336256, 'steps': 12167, 'loss/train': 1.9457118511199951} -08/30/2021 15:19:21 - INFO - __main__ - Step 12169: {'lr': 0.0004941994286216867, 'samples': 2336448, 'steps': 12168, 'loss/train': 1.997660756111145} -08/30/2021 15:19:23 - INFO - __main__ - Step 12170: {'lr': 0.0004941982920529989, 'samples': 2336640, 'steps': 12169, 'loss/train': 0.12547174096107483} -08/30/2021 15:19:23 - INFO - __main__ - Step 12171: {'lr': 0.0004941971553742791, 'samples': 2336832, 'steps': 12170, 'loss/train': 1.582919716835022} -08/30/2021 15:19:24 - INFO - __main__ - Step 12172: {'lr': 0.0004941960185855278, 'samples': 2337024, 'steps': 12171, 'loss/train': 1.3614516258239746} -08/30/2021 15:19:24 - INFO - __main__ - Step 12173: {'lr': 0.0004941948816867455, 'samples': 2337216, 'steps': 12172, 'loss/train': 1.503619909286499} -08/30/2021 15:19:24 - INFO - __main__ - Step 12174: {'lr': 0.0004941937446779328, 'samples': 2337408, 'steps': 12173, 'loss/train': 1.5388134717941284} -08/30/2021 15:19:26 - INFO - __main__ - Step 12175: {'lr': 0.0004941926075590901, 'samples': 2337600, 'steps': 12174, 'loss/train': 1.9619473218917847} -08/30/2021 15:19:26 - INFO - __main__ - Step 12176: {'lr': 0.0004941914703302181, 'samples': 2337792, 'steps': 12175, 'loss/train': 1.6383063793182373} -08/30/2021 15:19:27 - INFO - __main__ - Step 12177: {'lr': 0.0004941903329913172, 'samples': 2337984, 'steps': 12176, 'loss/train': 0.8161340355873108} -08/30/2021 15:19:27 - INFO - __main__ - Step 12178: {'lr': 0.0004941891955423878, 'samples': 2338176, 'steps': 12177, 'loss/train': 1.8237727880477905} -08/30/2021 15:19:27 - INFO - __main__ - Step 12179: {'lr': 0.0004941880579834306, 'samples': 2338368, 'steps': 12178, 'loss/train': 2.046415328979492} -08/30/2021 15:19:29 - INFO - __main__ - Step 12180: {'lr': 0.0004941869203144459, 'samples': 2338560, 'steps': 12179, 'loss/train': 1.5539066791534424} -08/30/2021 15:19:29 - INFO - __main__ - Step 12181: {'lr': 0.0004941857825354344, 'samples': 2338752, 'steps': 12180, 'loss/train': 2.091731071472168} -08/30/2021 15:19:30 - INFO - __main__ - Step 12182: {'lr': 0.0004941846446463966, 'samples': 2338944, 'steps': 12181, 'loss/train': 1.92172372341156} -08/30/2021 15:19:30 - INFO - __main__ - Step 12183: {'lr': 0.000494183506647333, 'samples': 2339136, 'steps': 12182, 'loss/train': 1.6249258518218994} -08/30/2021 15:19:30 - INFO - __main__ - Step 12184: {'lr': 0.000494182368538244, 'samples': 2339328, 'steps': 12183, 'loss/train': 1.3668913841247559} -08/30/2021 15:19:31 - INFO - __main__ - Step 12185: {'lr': 0.0004941812303191302, 'samples': 2339520, 'steps': 12184, 'loss/train': 1.7039155960083008} -08/30/2021 15:19:32 - INFO - __main__ - Step 12186: {'lr': 0.0004941800919899921, 'samples': 2339712, 'steps': 12185, 'loss/train': 1.3259013891220093} -08/30/2021 15:19:33 - INFO - __main__ - Step 12187: {'lr': 0.0004941789535508303, 'samples': 2339904, 'steps': 12186, 'loss/train': 1.8849434852600098} -08/30/2021 15:19:33 - INFO - __main__ - Step 12188: {'lr': 0.0004941778150016451, 'samples': 2340096, 'steps': 12187, 'loss/train': 1.3777295351028442} -08/30/2021 15:19:33 - INFO - __main__ - Step 12189: {'lr': 0.0004941766763424373, 'samples': 2340288, 'steps': 12188, 'loss/train': 1.2483760118484497} -08/30/2021 15:19:34 - INFO - __main__ - Step 12190: {'lr': 0.0004941755375732071, 'samples': 2340480, 'steps': 12189, 'loss/train': 2.1583364009857178} -08/30/2021 15:19:35 - INFO - __main__ - Step 12191: {'lr': 0.0004941743986939553, 'samples': 2340672, 'steps': 12190, 'loss/train': 1.2722080945968628} -08/30/2021 15:19:36 - INFO - __main__ - Step 12192: {'lr': 0.0004941732597046822, 'samples': 2340864, 'steps': 12191, 'loss/train': 1.8975012302398682} -08/30/2021 15:19:36 - INFO - __main__ - Step 12193: {'lr': 0.0004941721206053885, 'samples': 2341056, 'steps': 12192, 'loss/train': 1.4381009340286255} -08/30/2021 15:19:36 - INFO - __main__ - Step 12194: {'lr': 0.0004941709813960745, 'samples': 2341248, 'steps': 12193, 'loss/train': 1.772352933883667} -08/30/2021 15:19:37 - INFO - __main__ - Step 12195: {'lr': 0.0004941698420767408, 'samples': 2341440, 'steps': 12194, 'loss/train': 1.7654757499694824} -08/30/2021 15:19:39 - INFO - __main__ - Step 12196: {'lr': 0.0004941687026473881, 'samples': 2341632, 'steps': 12195, 'loss/train': 1.6286343336105347} -08/30/2021 15:19:39 - INFO - __main__ - Step 12197: {'lr': 0.0004941675631080166, 'samples': 2341824, 'steps': 12196, 'loss/train': 2.1513400077819824} -08/30/2021 15:19:40 - INFO - __main__ - Step 12198: {'lr': 0.000494166423458627, 'samples': 2342016, 'steps': 12197, 'loss/train': 0.1918555647134781} -08/30/2021 15:19:40 - INFO - __main__ - Step 12199: {'lr': 0.0004941652836992198, 'samples': 2342208, 'steps': 12198, 'loss/train': 2.00239634513855} -08/30/2021 15:19:40 - INFO - __main__ - Step 12200: {'lr': 0.0004941641438297955, 'samples': 2342400, 'steps': 12199, 'loss/train': 2.297025203704834} -08/30/2021 15:19:42 - INFO - __main__ - Step 12201: {'lr': 0.0004941630038503545, 'samples': 2342592, 'steps': 12200, 'loss/train': 1.8913379907608032} -08/30/2021 15:19:42 - INFO - __main__ - Step 12202: {'lr': 0.0004941618637608976, 'samples': 2342784, 'steps': 12201, 'loss/train': 1.133849024772644} -08/30/2021 15:19:43 - INFO - __main__ - Step 12203: {'lr': 0.000494160723561425, 'samples': 2342976, 'steps': 12202, 'loss/train': 1.7795054912567139} -08/30/2021 15:19:43 - INFO - __main__ - Step 12204: {'lr': 0.0004941595832519374, 'samples': 2343168, 'steps': 12203, 'loss/train': 1.6500552892684937} -08/30/2021 15:19:43 - INFO - __main__ - Step 12205: {'lr': 0.0004941584428324352, 'samples': 2343360, 'steps': 12204, 'loss/train': 1.7131215333938599} -08/30/2021 15:19:45 - INFO - __main__ - Step 12206: {'lr': 0.000494157302302919, 'samples': 2343552, 'steps': 12205, 'loss/train': 1.3454593420028687} -08/30/2021 15:19:46 - INFO - __main__ - Step 12207: {'lr': 0.0004941561616633893, 'samples': 2343744, 'steps': 12206, 'loss/train': 2.19356632232666} -08/30/2021 15:19:46 - INFO - __main__ - Step 12208: {'lr': 0.0004941550209138466, 'samples': 2343936, 'steps': 12207, 'loss/train': 1.1932798624038696} -08/30/2021 15:19:46 - INFO - __main__ - Step 12209: {'lr': 0.0004941538800542915, 'samples': 2344128, 'steps': 12208, 'loss/train': 1.4473735094070435} -08/30/2021 15:19:47 - INFO - __main__ - Step 12210: {'lr': 0.0004941527390847243, 'samples': 2344320, 'steps': 12209, 'loss/train': 1.747239589691162} -08/30/2021 15:19:47 - INFO - __main__ - Step 12211: {'lr': 0.0004941515980051457, 'samples': 2344512, 'steps': 12210, 'loss/train': 1.310584545135498} -08/30/2021 15:19:48 - INFO - __main__ - Step 12212: {'lr': 0.0004941504568155561, 'samples': 2344704, 'steps': 12211, 'loss/train': 2.0716114044189453} -08/30/2021 15:19:49 - INFO - __main__ - Step 12213: {'lr': 0.0004941493155159562, 'samples': 2344896, 'steps': 12212, 'loss/train': 1.9429436922073364} -08/30/2021 15:19:49 - INFO - __main__ - Step 12214: {'lr': 0.0004941481741063462, 'samples': 2345088, 'steps': 12213, 'loss/train': 1.6388980150222778} -08/30/2021 15:19:50 - INFO - __main__ - Step 12215: {'lr': 0.000494147032586727, 'samples': 2345280, 'steps': 12214, 'loss/train': 1.7224280834197998} -08/30/2021 15:19:50 - INFO - __main__ - Step 12216: {'lr': 0.0004941458909570988, 'samples': 2345472, 'steps': 12215, 'loss/train': 1.334747314453125} -08/30/2021 15:19:52 - INFO - __main__ - Step 12217: {'lr': 0.0004941447492174622, 'samples': 2345664, 'steps': 12216, 'loss/train': 1.5395238399505615} -08/30/2021 15:19:52 - INFO - __main__ - Step 12218: {'lr': 0.0004941436073678179, 'samples': 2345856, 'steps': 12217, 'loss/train': 1.8215900659561157} -08/30/2021 15:19:52 - INFO - __main__ - Step 12219: {'lr': 0.0004941424654081661, 'samples': 2346048, 'steps': 12218, 'loss/train': 1.6174993515014648} -08/30/2021 15:19:53 - INFO - __main__ - Step 12220: {'lr': 0.0004941413233385075, 'samples': 2346240, 'steps': 12219, 'loss/train': 1.6133155822753906} -08/30/2021 15:19:53 - INFO - __main__ - Step 12221: {'lr': 0.0004941401811588426, 'samples': 2346432, 'steps': 12220, 'loss/train': 1.8205928802490234} -08/30/2021 15:19:55 - INFO - __main__ - Step 12222: {'lr': 0.0004941390388691719, 'samples': 2346624, 'steps': 12221, 'loss/train': 1.6221952438354492} -08/30/2021 15:19:55 - INFO - __main__ - Step 12223: {'lr': 0.0004941378964694959, 'samples': 2346816, 'steps': 12222, 'loss/train': 0.200674906373024} -08/30/2021 15:19:55 - INFO - __main__ - Step 12224: {'lr': 0.0004941367539598152, 'samples': 2347008, 'steps': 12223, 'loss/train': 1.7082698345184326} -08/30/2021 15:19:56 - INFO - __main__ - Step 12225: {'lr': 0.0004941356113401301, 'samples': 2347200, 'steps': 12224, 'loss/train': 2.0742337703704834} -08/30/2021 15:19:56 - INFO - __main__ - Step 12226: {'lr': 0.0004941344686104414, 'samples': 2347392, 'steps': 12225, 'loss/train': 2.614518165588379} -08/30/2021 15:19:57 - INFO - __main__ - Step 12227: {'lr': 0.0004941333257707495, 'samples': 2347584, 'steps': 12226, 'loss/train': 1.2951313257217407} -08/30/2021 15:19:58 - INFO - __main__ - Step 12228: {'lr': 0.0004941321828210548, 'samples': 2347776, 'steps': 12227, 'loss/train': 2.0186338424682617} -08/30/2021 15:19:58 - INFO - __main__ - Step 12229: {'lr': 0.000494131039761358, 'samples': 2347968, 'steps': 12228, 'loss/train': 1.534130334854126} -08/30/2021 15:19:59 - INFO - __main__ - Step 12230: {'lr': 0.0004941298965916594, 'samples': 2348160, 'steps': 12229, 'loss/train': 1.3590337038040161} -08/30/2021 15:19:59 - INFO - __main__ - Step 12231: {'lr': 0.0004941287533119597, 'samples': 2348352, 'steps': 12230, 'loss/train': 1.7603479623794556} -08/30/2021 15:20:01 - INFO - __main__ - Step 12232: {'lr': 0.0004941276099222593, 'samples': 2348544, 'steps': 12231, 'loss/train': 1.6896908283233643} -08/30/2021 15:20:01 - INFO - __main__ - Step 12233: {'lr': 0.0004941264664225589, 'samples': 2348736, 'steps': 12232, 'loss/train': 1.9289885759353638} -08/30/2021 15:20:01 - INFO - __main__ - Step 12234: {'lr': 0.0004941253228128588, 'samples': 2348928, 'steps': 12233, 'loss/train': 1.995834231376648} -08/30/2021 15:20:02 - INFO - __main__ - Step 12235: {'lr': 0.0004941241790931595, 'samples': 2349120, 'steps': 12234, 'loss/train': 2.0375280380249023} -08/30/2021 15:20:02 - INFO - __main__ - Step 12236: {'lr': 0.0004941230352634617, 'samples': 2349312, 'steps': 12235, 'loss/train': 1.4215041399002075} -08/30/2021 15:20:03 - INFO - __main__ - Step 12237: {'lr': 0.0004941218913237658, 'samples': 2349504, 'steps': 12236, 'loss/train': 1.9986791610717773} -08/30/2021 15:20:04 - INFO - __main__ - Step 12238: {'lr': 0.0004941207472740724, 'samples': 2349696, 'steps': 12237, 'loss/train': 1.5555988550186157} -08/30/2021 15:20:04 - INFO - __main__ - Step 12239: {'lr': 0.000494119603114382, 'samples': 2349888, 'steps': 12238, 'loss/train': 1.4673455953598022} -08/30/2021 15:20:05 - INFO - __main__ - Step 12240: {'lr': 0.000494118458844695, 'samples': 2350080, 'steps': 12239, 'loss/train': 1.7984997034072876} -08/30/2021 15:20:05 - INFO - __main__ - Step 12241: {'lr': 0.0004941173144650119, 'samples': 2350272, 'steps': 12240, 'loss/train': 1.2752575874328613} -08/30/2021 15:20:06 - INFO - __main__ - Step 12242: {'lr': 0.0004941161699753335, 'samples': 2350464, 'steps': 12241, 'loss/train': 0.7331043481826782} -08/30/2021 15:20:07 - INFO - __main__ - Step 12243: {'lr': 0.00049411502537566, 'samples': 2350656, 'steps': 12242, 'loss/train': 1.6997778415679932} -08/30/2021 15:20:07 - INFO - __main__ - Step 12244: {'lr': 0.0004941138806659921, 'samples': 2350848, 'steps': 12243, 'loss/train': 1.990111231803894} -08/30/2021 15:20:08 - INFO - __main__ - Step 12245: {'lr': 0.00049411273584633, 'samples': 2351040, 'steps': 12244, 'loss/train': 0.49503204226493835} -08/30/2021 15:20:08 - INFO - __main__ - Step 12246: {'lr': 0.0004941115909166748, 'samples': 2351232, 'steps': 12245, 'loss/train': 3.0827579498291016} -08/30/2021 15:20:08 - INFO - __main__ - Step 12247: {'lr': 0.0004941104458770266, 'samples': 2351424, 'steps': 12246, 'loss/train': 2.4586760997772217} -08/30/2021 15:20:10 - INFO - __main__ - Step 12248: {'lr': 0.0004941093007273859, 'samples': 2351616, 'steps': 12247, 'loss/train': 1.9005318880081177} -08/30/2021 15:20:10 - INFO - __main__ - Step 12249: {'lr': 0.0004941081554677534, 'samples': 2351808, 'steps': 12248, 'loss/train': 2.209047317504883} -08/30/2021 15:20:11 - INFO - __main__ - Step 12250: {'lr': 0.0004941070100981295, 'samples': 2352000, 'steps': 12249, 'loss/train': 1.7038828134536743} -08/30/2021 15:20:11 - INFO - __main__ - Step 12251: {'lr': 0.0004941058646185148, 'samples': 2352192, 'steps': 12250, 'loss/train': 1.8614627122879028} -08/30/2021 15:20:12 - INFO - __main__ - Step 12252: {'lr': 0.0004941047190289096, 'samples': 2352384, 'steps': 12251, 'loss/train': 1.5548309087753296} -08/30/2021 15:20:13 - INFO - __main__ - Step 12253: {'lr': 0.0004941035733293148, 'samples': 2352576, 'steps': 12252, 'loss/train': 1.694841980934143} -08/30/2021 15:20:14 - INFO - __main__ - Step 12254: {'lr': 0.0004941024275197305, 'samples': 2352768, 'steps': 12253, 'loss/train': 1.6687698364257812} -08/30/2021 15:20:15 - INFO - __main__ - Step 12255: {'lr': 0.0004941012816001575, 'samples': 2352960, 'steps': 12254, 'loss/train': 1.4105418920516968} -08/30/2021 15:20:15 - INFO - __main__ - Step 12256: {'lr': 0.0004941001355705963, 'samples': 2353152, 'steps': 12255, 'loss/train': 1.5553321838378906} -08/30/2021 15:20:15 - INFO - __main__ - Step 12257: {'lr': 0.0004940989894310473, 'samples': 2353344, 'steps': 12256, 'loss/train': 1.8310878276824951} -08/30/2021 15:20:17 - INFO - __main__ - Step 12258: {'lr': 0.000494097843181511, 'samples': 2353536, 'steps': 12257, 'loss/train': 2.332899570465088} -08/30/2021 15:20:17 - INFO - __main__ - Step 12259: {'lr': 0.0004940966968219881, 'samples': 2353728, 'steps': 12258, 'loss/train': 2.1879830360412598} -08/30/2021 15:20:18 - INFO - __main__ - Step 12260: {'lr': 0.0004940955503524789, 'samples': 2353920, 'steps': 12259, 'loss/train': 0.9828661680221558} -08/30/2021 15:20:18 - INFO - __main__ - Step 12261: {'lr': 0.000494094403772984, 'samples': 2354112, 'steps': 12260, 'loss/train': 1.3328101634979248} -08/30/2021 15:20:18 - INFO - __main__ - Step 12262: {'lr': 0.0004940932570835039, 'samples': 2354304, 'steps': 12261, 'loss/train': 0.5736973881721497} -08/30/2021 15:20:19 - INFO - __main__ - Step 12263: {'lr': 0.0004940921102840393, 'samples': 2354496, 'steps': 12262, 'loss/train': 1.9213297367095947} -08/30/2021 15:20:20 - INFO - __main__ - Step 12264: {'lr': 0.0004940909633745905, 'samples': 2354688, 'steps': 12263, 'loss/train': 0.4872017204761505} -08/30/2021 15:20:21 - INFO - __main__ - Step 12265: {'lr': 0.000494089816355158, 'samples': 2354880, 'steps': 12264, 'loss/train': 1.5357216596603394} -08/30/2021 15:20:21 - INFO - __main__ - Step 12266: {'lr': 0.0004940886692257424, 'samples': 2355072, 'steps': 12265, 'loss/train': 1.768714427947998} -08/30/2021 15:20:21 - INFO - __main__ - Step 12267: {'lr': 0.0004940875219863443, 'samples': 2355264, 'steps': 12266, 'loss/train': 1.309556007385254} -08/30/2021 15:20:22 - INFO - __main__ - Step 12268: {'lr': 0.0004940863746369641, 'samples': 2355456, 'steps': 12267, 'loss/train': 1.784734845161438} -08/30/2021 15:20:24 - INFO - __main__ - Step 12269: {'lr': 0.0004940852271776023, 'samples': 2355648, 'steps': 12268, 'loss/train': 1.2673885822296143} -08/30/2021 15:20:24 - INFO - __main__ - Step 12270: {'lr': 0.0004940840796082594, 'samples': 2355840, 'steps': 12269, 'loss/train': 1.6234240531921387} -08/30/2021 15:20:24 - INFO - __main__ - Step 12271: {'lr': 0.0004940829319289361, 'samples': 2356032, 'steps': 12270, 'loss/train': 1.8377019166946411} -08/30/2021 15:20:25 - INFO - __main__ - Step 12272: {'lr': 0.0004940817841396327, 'samples': 2356224, 'steps': 12271, 'loss/train': 1.2662084102630615} -08/30/2021 15:20:25 - INFO - __main__ - Step 12273: {'lr': 0.0004940806362403499, 'samples': 2356416, 'steps': 12272, 'loss/train': 1.339592695236206} -08/30/2021 15:20:25 - INFO - __main__ - Step 12274: {'lr': 0.0004940794882310882, 'samples': 2356608, 'steps': 12273, 'loss/train': 1.7002252340316772} -08/30/2021 15:20:26 - INFO - __main__ - Step 12275: {'lr': 0.000494078340111848, 'samples': 2356800, 'steps': 12274, 'loss/train': 2.020940065383911} -08/30/2021 15:20:27 - INFO - __main__ - Step 12276: {'lr': 0.0004940771918826298, 'samples': 2356992, 'steps': 12275, 'loss/train': 1.9736751317977905} -08/30/2021 15:20:28 - INFO - __main__ - Step 12277: {'lr': 0.0004940760435434341, 'samples': 2357184, 'steps': 12276, 'loss/train': 1.4225600957870483} -08/30/2021 15:20:28 - INFO - __main__ - Step 12278: {'lr': 0.0004940748950942618, 'samples': 2357376, 'steps': 12277, 'loss/train': 1.7238681316375732} -08/30/2021 15:20:29 - INFO - __main__ - Step 12279: {'lr': 0.0004940737465351128, 'samples': 2357568, 'steps': 12278, 'loss/train': 1.6024529933929443} -08/30/2021 15:20:29 - INFO - __main__ - Step 12280: {'lr': 0.0004940725978659881, 'samples': 2357760, 'steps': 12279, 'loss/train': 1.577825903892517} -08/30/2021 15:20:31 - INFO - __main__ - Step 12281: {'lr': 0.000494071449086888, 'samples': 2357952, 'steps': 12280, 'loss/train': 2.065798282623291} -08/30/2021 15:20:31 - INFO - __main__ - Step 12282: {'lr': 0.0004940703001978131, 'samples': 2358144, 'steps': 12281, 'loss/train': 1.089477777481079} -08/30/2021 15:20:31 - INFO - __main__ - Step 12283: {'lr': 0.0004940691511987639, 'samples': 2358336, 'steps': 12282, 'loss/train': 1.8239578008651733} -08/30/2021 15:20:32 - INFO - __main__ - Step 12284: {'lr': 0.0004940680020897409, 'samples': 2358528, 'steps': 12283, 'loss/train': 1.7185299396514893} -08/30/2021 15:20:32 - INFO - __main__ - Step 12285: {'lr': 0.0004940668528707446, 'samples': 2358720, 'steps': 12284, 'loss/train': 1.0978227853775024} -08/30/2021 15:20:32 - INFO - __main__ - Step 12286: {'lr': 0.0004940657035417755, 'samples': 2358912, 'steps': 12285, 'loss/train': 2.4013559818267822} -08/30/2021 15:20:34 - INFO - __main__ - Step 12287: {'lr': 0.0004940645541028343, 'samples': 2359104, 'steps': 12286, 'loss/train': 1.9952807426452637} -08/30/2021 15:20:34 - INFO - __main__ - Step 12288: {'lr': 0.0004940634045539213, 'samples': 2359296, 'steps': 12287, 'loss/train': 1.9006563425064087} -08/30/2021 15:20:35 - INFO - __main__ - Step 12289: {'lr': 0.000494062254895037, 'samples': 2359488, 'steps': 12288, 'loss/train': 1.5698041915893555} -08/30/2021 15:20:35 - INFO - __main__ - Step 12290: {'lr': 0.0004940611051261822, 'samples': 2359680, 'steps': 12289, 'loss/train': 1.6416971683502197} -08/30/2021 15:20:35 - INFO - __main__ - Step 12291: {'lr': 0.000494059955247357, 'samples': 2359872, 'steps': 12290, 'loss/train': 1.372291088104248} -08/30/2021 15:20:37 - INFO - __main__ - Step 12292: {'lr': 0.0004940588052585624, 'samples': 2360064, 'steps': 12291, 'loss/train': 1.3547165393829346} -08/30/2021 15:20:37 - INFO - __main__ - Step 12293: {'lr': 0.0004940576551597985, 'samples': 2360256, 'steps': 12292, 'loss/train': 2.036637544631958} -08/30/2021 15:20:38 - INFO - __main__ - Step 12294: {'lr': 0.000494056504951066, 'samples': 2360448, 'steps': 12293, 'loss/train': 1.5060285329818726} -08/30/2021 15:20:38 - INFO - __main__ - Step 12295: {'lr': 0.0004940553546323655, 'samples': 2360640, 'steps': 12294, 'loss/train': 1.766244888305664} -08/30/2021 15:20:38 - INFO - __main__ - Step 12296: {'lr': 0.0004940542042036974, 'samples': 2360832, 'steps': 12295, 'loss/train': 1.63885498046875} -08/30/2021 15:20:40 - INFO - __main__ - Step 12297: {'lr': 0.0004940530536650621, 'samples': 2361024, 'steps': 12296, 'loss/train': 1.6277042627334595} -08/30/2021 15:20:40 - INFO - __main__ - Step 12298: {'lr': 0.0004940519030164605, 'samples': 2361216, 'steps': 12297, 'loss/train': 1.5816974639892578} -08/30/2021 15:20:41 - INFO - __main__ - Step 12299: {'lr': 0.0004940507522578927, 'samples': 2361408, 'steps': 12298, 'loss/train': 1.8461530208587646} -08/30/2021 15:20:41 - INFO - __main__ - Step 12300: {'lr': 0.0004940496013893594, 'samples': 2361600, 'steps': 12299, 'loss/train': 2.1077511310577393} -08/30/2021 15:20:41 - INFO - __main__ - Step 12301: {'lr': 0.0004940484504108612, 'samples': 2361792, 'steps': 12300, 'loss/train': 1.92961585521698} -08/30/2021 15:20:43 - INFO - __main__ - Step 12302: {'lr': 0.0004940472993223985, 'samples': 2361984, 'steps': 12301, 'loss/train': 1.577030897140503} -08/30/2021 15:20:44 - INFO - __main__ - Step 12303: {'lr': 0.0004940461481239719, 'samples': 2362176, 'steps': 12302, 'loss/train': 1.322467565536499} -08/30/2021 15:20:44 - INFO - __main__ - Step 12304: {'lr': 0.0004940449968155818, 'samples': 2362368, 'steps': 12303, 'loss/train': 2.117222547531128} -08/30/2021 15:20:44 - INFO - __main__ - Step 12305: {'lr': 0.0004940438453972288, 'samples': 2362560, 'steps': 12304, 'loss/train': 1.5622693300247192} -08/30/2021 15:20:45 - INFO - __main__ - Step 12306: {'lr': 0.0004940426938689135, 'samples': 2362752, 'steps': 12305, 'loss/train': 1.739802598953247} -08/30/2021 15:20:47 - INFO - __main__ - Step 12307: {'lr': 0.0004940415422306361, 'samples': 2362944, 'steps': 12306, 'loss/train': 1.2217721939086914} -08/30/2021 15:20:47 - INFO - __main__ - Step 12308: {'lr': 0.0004940403904823976, 'samples': 2363136, 'steps': 12307, 'loss/train': 1.8506790399551392} -08/30/2021 15:20:48 - INFO - __main__ - Step 12309: {'lr': 0.0004940392386241981, 'samples': 2363328, 'steps': 12308, 'loss/train': 2.1373562812805176} -08/30/2021 15:20:48 - INFO - __main__ - Step 12310: {'lr': 0.0004940380866560384, 'samples': 2363520, 'steps': 12309, 'loss/train': 1.64629328250885} -08/30/2021 15:20:48 - INFO - __main__ - Step 12311: {'lr': 0.0004940369345779187, 'samples': 2363712, 'steps': 12310, 'loss/train': 1.8088691234588623} -08/30/2021 15:20:50 - INFO - __main__ - Step 12312: {'lr': 0.00049403578238984, 'samples': 2363904, 'steps': 12311, 'loss/train': 1.6565057039260864} -08/30/2021 15:20:50 - INFO - __main__ - Step 12313: {'lr': 0.0004940346300918024, 'samples': 2364096, 'steps': 12312, 'loss/train': 2.030160903930664} -08/30/2021 15:20:51 - INFO - __main__ - Step 12314: {'lr': 0.0004940334776838065, 'samples': 2364288, 'steps': 12313, 'loss/train': 1.8640719652175903} -08/30/2021 15:20:51 - INFO - __main__ - Step 12315: {'lr': 0.000494032325165853, 'samples': 2364480, 'steps': 12314, 'loss/train': 2.038550615310669} -08/30/2021 15:20:51 - INFO - __main__ - Step 12316: {'lr': 0.0004940311725379423, 'samples': 2364672, 'steps': 12315, 'loss/train': 1.426437497138977} -08/30/2021 15:20:52 - INFO - __main__ - Step 12317: {'lr': 0.0004940300198000748, 'samples': 2364864, 'steps': 12316, 'loss/train': 1.886391282081604} -08/30/2021 15:20:53 - INFO - __main__ - Step 12318: {'lr': 0.0004940288669522513, 'samples': 2365056, 'steps': 12317, 'loss/train': 2.6517083644866943} -08/30/2021 15:20:54 - INFO - __main__ - Step 12319: {'lr': 0.000494027713994472, 'samples': 2365248, 'steps': 12318, 'loss/train': 1.4126795530319214} -08/30/2021 15:20:54 - INFO - __main__ - Step 12320: {'lr': 0.0004940265609267377, 'samples': 2365440, 'steps': 12319, 'loss/train': 1.5219357013702393} -08/30/2021 15:20:54 - INFO - __main__ - Step 12321: {'lr': 0.0004940254077490487, 'samples': 2365632, 'steps': 12320, 'loss/train': 1.2527730464935303} -08/30/2021 15:20:55 - INFO - __main__ - Step 12322: {'lr': 0.0004940242544614056, 'samples': 2365824, 'steps': 12321, 'loss/train': 2.077793836593628} -08/30/2021 15:20:56 - INFO - __main__ - Step 12323: {'lr': 0.0004940231010638091, 'samples': 2366016, 'steps': 12322, 'loss/train': 1.6778231859207153} -08/30/2021 15:20:57 - INFO - __main__ - Step 12324: {'lr': 0.0004940219475562593, 'samples': 2366208, 'steps': 12323, 'loss/train': 1.868173599243164} -08/30/2021 15:20:57 - INFO - __main__ - Step 12325: {'lr': 0.0004940207939387573, 'samples': 2366400, 'steps': 12324, 'loss/train': 2.4082648754119873} -08/30/2021 15:20:57 - INFO - __main__ - Step 12326: {'lr': 0.0004940196402113031, 'samples': 2366592, 'steps': 12325, 'loss/train': 1.8570210933685303} -08/30/2021 15:20:58 - INFO - __main__ - Step 12327: {'lr': 0.0004940184863738975, 'samples': 2366784, 'steps': 12326, 'loss/train': 2.2421019077301025} -08/30/2021 15:20:59 - INFO - __main__ - Step 12328: {'lr': 0.0004940173324265407, 'samples': 2366976, 'steps': 12327, 'loss/train': 2.0102992057800293} -08/30/2021 15:21:00 - INFO - __main__ - Step 12329: {'lr': 0.0004940161783692338, 'samples': 2367168, 'steps': 12328, 'loss/train': 1.3427133560180664} -08/30/2021 15:21:00 - INFO - __main__ - Step 12330: {'lr': 0.0004940150242019768, 'samples': 2367360, 'steps': 12329, 'loss/train': 1.481920838356018} -08/30/2021 15:21:01 - INFO - __main__ - Step 12331: {'lr': 0.0004940138699247704, 'samples': 2367552, 'steps': 12330, 'loss/train': 2.420530319213867} -08/30/2021 15:21:01 - INFO - __main__ - Step 12332: {'lr': 0.0004940127155376151, 'samples': 2367744, 'steps': 12331, 'loss/train': 1.4439826011657715} -08/30/2021 15:21:02 - INFO - __main__ - Step 12333: {'lr': 0.0004940115610405114, 'samples': 2367936, 'steps': 12332, 'loss/train': 1.0832420587539673} -08/30/2021 15:21:03 - INFO - __main__ - Step 12334: {'lr': 0.0004940104064334599, 'samples': 2368128, 'steps': 12333, 'loss/train': 1.490478277206421} -08/30/2021 15:21:03 - INFO - __main__ - Step 12335: {'lr': 0.0004940092517164612, 'samples': 2368320, 'steps': 12334, 'loss/train': 1.9114985466003418} -08/30/2021 15:21:04 - INFO - __main__ - Step 12336: {'lr': 0.0004940080968895155, 'samples': 2368512, 'steps': 12335, 'loss/train': 1.3063796758651733} -08/30/2021 15:21:04 - INFO - __main__ - Step 12337: {'lr': 0.0004940069419526236, 'samples': 2368704, 'steps': 12336, 'loss/train': 1.779631495475769} -08/30/2021 15:21:04 - INFO - __main__ - Step 12338: {'lr': 0.0004940057869057859, 'samples': 2368896, 'steps': 12337, 'loss/train': 2.4336724281311035} -08/30/2021 15:21:06 - INFO - __main__ - Step 12339: {'lr': 0.000494004631749003, 'samples': 2369088, 'steps': 12338, 'loss/train': 2.139826774597168} -08/30/2021 15:21:06 - INFO - __main__ - Step 12340: {'lr': 0.0004940034764822754, 'samples': 2369280, 'steps': 12339, 'loss/train': 1.249495029449463} -08/30/2021 15:21:07 - INFO - __main__ - Step 12341: {'lr': 0.0004940023211056036, 'samples': 2369472, 'steps': 12340, 'loss/train': 1.9051568508148193} -08/30/2021 15:21:07 - INFO - __main__ - Step 12342: {'lr': 0.0004940011656189881, 'samples': 2369664, 'steps': 12341, 'loss/train': 1.901642084121704} -08/30/2021 15:21:07 - INFO - __main__ - Step 12343: {'lr': 0.0004940000100224295, 'samples': 2369856, 'steps': 12342, 'loss/train': 1.8271327018737793} -08/30/2021 15:21:09 - INFO - __main__ - Step 12344: {'lr': 0.0004939988543159282, 'samples': 2370048, 'steps': 12343, 'loss/train': 2.083096742630005} -08/30/2021 15:21:10 - INFO - __main__ - Step 12345: {'lr': 0.0004939976984994847, 'samples': 2370240, 'steps': 12344, 'loss/train': 0.5472157001495361} -08/30/2021 15:21:10 - INFO - __main__ - Step 12346: {'lr': 0.0004939965425730996, 'samples': 2370432, 'steps': 12345, 'loss/train': 1.6035313606262207} -08/30/2021 15:21:10 - INFO - __main__ - Step 12347: {'lr': 0.0004939953865367735, 'samples': 2370624, 'steps': 12346, 'loss/train': 1.7876683473587036} -08/30/2021 15:21:11 - INFO - __main__ - Step 12348: {'lr': 0.0004939942303905069, 'samples': 2370816, 'steps': 12347, 'loss/train': 1.195544719696045} -08/30/2021 15:21:11 - INFO - __main__ - Step 12349: {'lr': 0.0004939930741343002, 'samples': 2371008, 'steps': 12348, 'loss/train': 1.6651946306228638} -08/30/2021 15:21:13 - INFO - __main__ - Step 12350: {'lr': 0.000493991917768154, 'samples': 2371200, 'steps': 12349, 'loss/train': 1.0392279624938965} -08/30/2021 15:21:13 - INFO - __main__ - Step 12351: {'lr': 0.0004939907612920688, 'samples': 2371392, 'steps': 12350, 'loss/train': 1.6462291479110718} -08/30/2021 15:21:13 - INFO - __main__ - Step 12352: {'lr': 0.0004939896047060451, 'samples': 2371584, 'steps': 12351, 'loss/train': 1.5832334756851196} -08/30/2021 15:21:14 - INFO - __main__ - Step 12353: {'lr': 0.0004939884480100836, 'samples': 2371776, 'steps': 12352, 'loss/train': 1.5563801527023315} -08/30/2021 15:21:14 - INFO - __main__ - Step 12354: {'lr': 0.0004939872912041844, 'samples': 2371968, 'steps': 12353, 'loss/train': 1.5932083129882812} -08/30/2021 15:21:16 - INFO - __main__ - Step 12355: {'lr': 0.0004939861342883485, 'samples': 2372160, 'steps': 12354, 'loss/train': 1.953323245048523} -08/30/2021 15:21:16 - INFO - __main__ - Step 12356: {'lr': 0.0004939849772625761, 'samples': 2372352, 'steps': 12355, 'loss/train': 1.797263503074646} -08/30/2021 15:21:17 - INFO - __main__ - Step 12357: {'lr': 0.0004939838201268679, 'samples': 2372544, 'steps': 12356, 'loss/train': 1.5991339683532715} -08/30/2021 15:21:17 - INFO - __main__ - Step 12358: {'lr': 0.0004939826628812244, 'samples': 2372736, 'steps': 12357, 'loss/train': 1.9488673210144043} -08/30/2021 15:21:17 - INFO - __main__ - Step 12359: {'lr': 0.000493981505525646, 'samples': 2372928, 'steps': 12358, 'loss/train': 1.513182282447815} -08/30/2021 15:21:18 - INFO - __main__ - Step 12360: {'lr': 0.0004939803480601333, 'samples': 2373120, 'steps': 12359, 'loss/train': 2.8466885089874268} -08/30/2021 15:21:20 - INFO - __main__ - Step 12361: {'lr': 0.0004939791904846869, 'samples': 2373312, 'steps': 12360, 'loss/train': 1.4838905334472656} -08/30/2021 15:21:20 - INFO - __main__ - Step 12362: {'lr': 0.0004939780327993072, 'samples': 2373504, 'steps': 12361, 'loss/train': 1.9791806936264038} -08/30/2021 15:21:21 - INFO - __main__ - Step 12363: {'lr': 0.0004939768750039946, 'samples': 2373696, 'steps': 12362, 'loss/train': 1.3516241312026978} -08/30/2021 15:21:21 - INFO - __main__ - Step 12364: {'lr': 0.00049397571709875, 'samples': 2373888, 'steps': 12363, 'loss/train': 1.4593547582626343} -08/30/2021 15:21:21 - INFO - __main__ - Step 12365: {'lr': 0.0004939745590835736, 'samples': 2374080, 'steps': 12364, 'loss/train': 1.6037418842315674} -08/30/2021 15:21:23 - INFO - __main__ - Step 12366: {'lr': 0.0004939734009584661, 'samples': 2374272, 'steps': 12365, 'loss/train': 1.8691282272338867} -08/30/2021 15:21:23 - INFO - __main__ - Step 12367: {'lr': 0.0004939722427234279, 'samples': 2374464, 'steps': 12366, 'loss/train': 1.6306006908416748} -08/30/2021 15:21:24 - INFO - __main__ - Step 12368: {'lr': 0.0004939710843784596, 'samples': 2374656, 'steps': 12367, 'loss/train': 2.2240822315216064} -08/30/2021 15:21:24 - INFO - __main__ - Step 12369: {'lr': 0.0004939699259235617, 'samples': 2374848, 'steps': 12368, 'loss/train': 1.5180351734161377} -08/30/2021 15:21:24 - INFO - __main__ - Step 12370: {'lr': 0.0004939687673587346, 'samples': 2375040, 'steps': 12369, 'loss/train': 1.2453733682632446} -08/30/2021 15:21:26 - INFO - __main__ - Step 12371: {'lr': 0.0004939676086839791, 'samples': 2375232, 'steps': 12370, 'loss/train': 1.4904848337173462} -08/30/2021 15:21:26 - INFO - __main__ - Step 12372: {'lr': 0.0004939664498992955, 'samples': 2375424, 'steps': 12371, 'loss/train': 1.5308938026428223} -08/30/2021 15:21:27 - INFO - __main__ - Step 12373: {'lr': 0.0004939652910046844, 'samples': 2375616, 'steps': 12372, 'loss/train': 1.7801154851913452} -08/30/2021 15:21:27 - INFO - __main__ - Step 12374: {'lr': 0.0004939641320001462, 'samples': 2375808, 'steps': 12373, 'loss/train': 1.9854333400726318} -08/30/2021 15:21:27 - INFO - __main__ - Step 12375: {'lr': 0.0004939629728856817, 'samples': 2376000, 'steps': 12374, 'loss/train': 1.6718435287475586} -08/30/2021 15:21:29 - INFO - __main__ - Step 12376: {'lr': 0.0004939618136612911, 'samples': 2376192, 'steps': 12375, 'loss/train': 1.6842349767684937} -08/30/2021 15:21:29 - INFO - __main__ - Step 12377: {'lr': 0.0004939606543269751, 'samples': 2376384, 'steps': 12376, 'loss/train': 1.6865808963775635} -08/30/2021 15:21:30 - INFO - __main__ - Step 12378: {'lr': 0.0004939594948827343, 'samples': 2376576, 'steps': 12377, 'loss/train': 2.005328893661499} -08/30/2021 15:21:30 - INFO - __main__ - Step 12379: {'lr': 0.000493958335328569, 'samples': 2376768, 'steps': 12378, 'loss/train': 2.3254377841949463} -08/30/2021 15:21:31 - INFO - __main__ - Step 12380: {'lr': 0.0004939571756644799, 'samples': 2376960, 'steps': 12379, 'loss/train': 1.0390169620513916} -08/30/2021 15:21:31 - INFO - __main__ - Step 12381: {'lr': 0.0004939560158904675, 'samples': 2377152, 'steps': 12380, 'loss/train': 1.4461275339126587} -08/30/2021 15:21:32 - INFO - __main__ - Step 12382: {'lr': 0.0004939548560065322, 'samples': 2377344, 'steps': 12381, 'loss/train': 1.4545270204544067} -08/30/2021 15:21:33 - INFO - __main__ - Step 12383: {'lr': 0.0004939536960126746, 'samples': 2377536, 'steps': 12382, 'loss/train': 1.4851293563842773} -08/30/2021 15:21:33 - INFO - __main__ - Step 12384: {'lr': 0.0004939525359088953, 'samples': 2377728, 'steps': 12383, 'loss/train': 1.9911237955093384} -08/30/2021 15:21:34 - INFO - __main__ - Step 12385: {'lr': 0.0004939513756951946, 'samples': 2377920, 'steps': 12384, 'loss/train': 2.0675361156463623} -08/30/2021 15:21:34 - INFO - __main__ - Step 12386: {'lr': 0.0004939502153715733, 'samples': 2378112, 'steps': 12385, 'loss/train': 1.9893680810928345} -08/30/2021 15:21:36 - INFO - __main__ - Step 12387: {'lr': 0.0004939490549380318, 'samples': 2378304, 'steps': 12386, 'loss/train': 1.779490351676941} -08/30/2021 15:21:36 - INFO - __main__ - Step 12388: {'lr': 0.0004939478943945706, 'samples': 2378496, 'steps': 12387, 'loss/train': 1.7265629768371582} -08/30/2021 15:21:37 - INFO - __main__ - Step 12389: {'lr': 0.0004939467337411903, 'samples': 2378688, 'steps': 12388, 'loss/train': 1.4875437021255493} -08/30/2021 15:21:37 - INFO - __main__ - Step 12390: {'lr': 0.0004939455729778912, 'samples': 2378880, 'steps': 12389, 'loss/train': 0.10893329232931137} -08/30/2021 15:21:37 - INFO - __main__ - Step 12391: {'lr': 0.0004939444121046741, 'samples': 2379072, 'steps': 12390, 'loss/train': 1.4834707975387573} -08/30/2021 15:21:38 - INFO - __main__ - Step 12392: {'lr': 0.0004939432511215395, 'samples': 2379264, 'steps': 12391, 'loss/train': 1.798765778541565} -08/30/2021 15:21:39 - INFO - __main__ - Step 12393: {'lr': 0.0004939420900284876, 'samples': 2379456, 'steps': 12392, 'loss/train': 2.3325815200805664} -08/30/2021 15:21:40 - INFO - __main__ - Step 12394: {'lr': 0.0004939409288255194, 'samples': 2379648, 'steps': 12393, 'loss/train': 1.9942257404327393} -08/30/2021 15:21:40 - INFO - __main__ - Step 12395: {'lr': 0.000493939767512635, 'samples': 2379840, 'steps': 12394, 'loss/train': 1.1501344442367554} -08/30/2021 15:21:40 - INFO - __main__ - Step 12396: {'lr': 0.0004939386060898353, 'samples': 2380032, 'steps': 12395, 'loss/train': 2.169787883758545} -08/30/2021 15:21:41 - INFO - __main__ - Step 12397: {'lr': 0.0004939374445571206, 'samples': 2380224, 'steps': 12396, 'loss/train': 1.9157381057739258} -08/30/2021 15:21:42 - INFO - __main__ - Step 12398: {'lr': 0.0004939362829144913, 'samples': 2380416, 'steps': 12397, 'loss/train': 1.526296854019165} -08/30/2021 15:21:43 - INFO - __main__ - Step 12399: {'lr': 0.0004939351211619481, 'samples': 2380608, 'steps': 12398, 'loss/train': 1.5075287818908691} -08/30/2021 15:21:43 - INFO - __main__ - Step 12400: {'lr': 0.0004939339592994916, 'samples': 2380800, 'steps': 12399, 'loss/train': 1.858720302581787} -08/30/2021 15:21:44 - INFO - __main__ - Step 12401: {'lr': 0.0004939327973271222, 'samples': 2380992, 'steps': 12400, 'loss/train': 1.6559598445892334} -08/30/2021 15:21:44 - INFO - __main__ - Step 12402: {'lr': 0.0004939316352448403, 'samples': 2381184, 'steps': 12401, 'loss/train': 1.5791690349578857} -08/30/2021 15:21:46 - INFO - __main__ - Step 12403: {'lr': 0.0004939304730526467, 'samples': 2381376, 'steps': 12402, 'loss/train': 2.0456554889678955} -08/30/2021 15:21:46 - INFO - __main__ - Step 12404: {'lr': 0.0004939293107505418, 'samples': 2381568, 'steps': 12403, 'loss/train': 1.1767677068710327} -08/30/2021 15:21:47 - INFO - __main__ - Step 12405: {'lr': 0.0004939281483385261, 'samples': 2381760, 'steps': 12404, 'loss/train': 1.947377324104309} -08/30/2021 15:21:47 - INFO - __main__ - Step 12406: {'lr': 0.0004939269858166001, 'samples': 2381952, 'steps': 12405, 'loss/train': 0.2319193184375763} -08/30/2021 15:21:47 - INFO - __main__ - Step 12407: {'lr': 0.0004939258231847644, 'samples': 2382144, 'steps': 12406, 'loss/train': 1.9935581684112549} -08/30/2021 15:21:49 - INFO - __main__ - Step 12408: {'lr': 0.0004939246604430195, 'samples': 2382336, 'steps': 12407, 'loss/train': 1.9596755504608154} -08/30/2021 15:21:50 - INFO - __main__ - Step 12409: {'lr': 0.0004939234975913659, 'samples': 2382528, 'steps': 12408, 'loss/train': 1.8188401460647583} -08/30/2021 15:21:50 - INFO - __main__ - Step 12410: {'lr': 0.0004939223346298042, 'samples': 2382720, 'steps': 12409, 'loss/train': 1.6885244846343994} -08/30/2021 15:21:50 - INFO - __main__ - Step 12411: {'lr': 0.0004939211715583347, 'samples': 2382912, 'steps': 12410, 'loss/train': 1.8496094942092896} -08/30/2021 15:21:51 - INFO - __main__ - Step 12412: {'lr': 0.0004939200083769582, 'samples': 2383104, 'steps': 12411, 'loss/train': 1.5743927955627441} -08/30/2021 15:21:52 - INFO - __main__ - Step 12413: {'lr': 0.000493918845085675, 'samples': 2383296, 'steps': 12412, 'loss/train': 1.727419137954712} -08/30/2021 15:21:53 - INFO - __main__ - Step 12414: {'lr': 0.000493917681684486, 'samples': 2383488, 'steps': 12413, 'loss/train': 1.1140133142471313} -08/30/2021 15:21:53 - INFO - __main__ - Step 12415: {'lr': 0.0004939165181733911, 'samples': 2383680, 'steps': 12414, 'loss/train': 0.8899873495101929} -08/30/2021 15:21:54 - INFO - __main__ - Step 12416: {'lr': 0.0004939153545523914, 'samples': 2383872, 'steps': 12415, 'loss/train': 0.7002155780792236} -08/30/2021 15:21:54 - INFO - __main__ - Step 12417: {'lr': 0.0004939141908214871, 'samples': 2384064, 'steps': 12416, 'loss/train': 1.9062436819076538} -08/30/2021 15:21:54 - INFO - __main__ - Step 12418: {'lr': 0.000493913026980679, 'samples': 2384256, 'steps': 12417, 'loss/train': 0.7851493954658508} -08/30/2021 15:21:56 - INFO - __main__ - Step 12419: {'lr': 0.0004939118630299672, 'samples': 2384448, 'steps': 12418, 'loss/train': 1.919806718826294} -08/30/2021 15:21:57 - INFO - __main__ - Step 12420: {'lr': 0.0004939106989693527, 'samples': 2384640, 'steps': 12419, 'loss/train': 0.9437406659126282} -08/30/2021 15:21:57 - INFO - __main__ - Step 12421: {'lr': 0.0004939095347988357, 'samples': 2384832, 'steps': 12420, 'loss/train': 1.8690074682235718} -08/30/2021 15:21:57 - INFO - __main__ - Step 12422: {'lr': 0.0004939083705184169, 'samples': 2385024, 'steps': 12421, 'loss/train': 2.076601266860962} -08/30/2021 15:21:58 - INFO - __main__ - Step 12423: {'lr': 0.0004939072061280967, 'samples': 2385216, 'steps': 12422, 'loss/train': 1.6892462968826294} -08/30/2021 15:22:00 - INFO - __main__ - Step 12424: {'lr': 0.0004939060416278756, 'samples': 2385408, 'steps': 12423, 'loss/train': 1.4793415069580078} -08/30/2021 15:22:00 - INFO - __main__ - Step 12425: {'lr': 0.0004939048770177543, 'samples': 2385600, 'steps': 12424, 'loss/train': 1.83730947971344} -08/30/2021 15:22:00 - INFO - __main__ - Step 12426: {'lr': 0.0004939037122977332, 'samples': 2385792, 'steps': 12425, 'loss/train': 2.017552137374878} -08/30/2021 15:22:01 - INFO - __main__ - Step 12427: {'lr': 0.0004939025474678129, 'samples': 2385984, 'steps': 12426, 'loss/train': 0.09431283921003342} -08/30/2021 15:22:01 - INFO - __main__ - Step 12428: {'lr': 0.0004939013825279939, 'samples': 2386176, 'steps': 12427, 'loss/train': 2.293602228164673} -08/30/2021 15:22:02 - INFO - __main__ - Step 12429: {'lr': 0.0004939002174782766, 'samples': 2386368, 'steps': 12428, 'loss/train': 1.7615902423858643} -08/30/2021 15:22:03 - INFO - __main__ - Step 12430: {'lr': 0.0004938990523186616, 'samples': 2386560, 'steps': 12429, 'loss/train': 0.1607472151517868} -08/30/2021 15:22:04 - INFO - __main__ - Step 12431: {'lr': 0.0004938978870491495, 'samples': 2386752, 'steps': 12430, 'loss/train': 2.0253050327301025} -08/30/2021 15:22:04 - INFO - __main__ - Step 12432: {'lr': 0.0004938967216697409, 'samples': 2386944, 'steps': 12431, 'loss/train': 1.1702685356140137} -08/30/2021 15:22:05 - INFO - __main__ - Step 12433: {'lr': 0.0004938955561804361, 'samples': 2387136, 'steps': 12432, 'loss/train': 1.8104138374328613} -08/30/2021 15:22:05 - INFO - __main__ - Step 12434: {'lr': 0.0004938943905812357, 'samples': 2387328, 'steps': 12433, 'loss/train': 0.1371229588985443} -08/30/2021 15:22:05 - INFO - __main__ - Step 12435: {'lr': 0.0004938932248721401, 'samples': 2387520, 'steps': 12434, 'loss/train': 0.5494178533554077} -08/30/2021 15:22:07 - INFO - __main__ - Step 12436: {'lr': 0.0004938920590531503, 'samples': 2387712, 'steps': 12435, 'loss/train': 1.388697624206543} -08/30/2021 15:22:07 - INFO - __main__ - Step 12437: {'lr': 0.0004938908931242663, 'samples': 2387904, 'steps': 12436, 'loss/train': 1.370986819267273} -08/30/2021 15:22:08 - INFO - __main__ - Step 12438: {'lr': 0.0004938897270854889, 'samples': 2388096, 'steps': 12437, 'loss/train': 1.4781913757324219} -08/30/2021 15:22:08 - INFO - __main__ - Step 12439: {'lr': 0.0004938885609368184, 'samples': 2388288, 'steps': 12438, 'loss/train': 1.5946956872940063} -08/30/2021 15:22:08 - INFO - __main__ - Step 12440: {'lr': 0.0004938873946782557, 'samples': 2388480, 'steps': 12439, 'loss/train': 1.0407694578170776} -08/30/2021 15:22:10 - INFO - __main__ - Step 12441: {'lr': 0.000493886228309801, 'samples': 2388672, 'steps': 12440, 'loss/train': 2.2493369579315186} -08/30/2021 15:22:10 - INFO - __main__ - Step 12442: {'lr': 0.0004938850618314549, 'samples': 2388864, 'steps': 12441, 'loss/train': 2.3278608322143555} -08/30/2021 15:22:11 - INFO - __main__ - Step 12443: {'lr': 0.000493883895243218, 'samples': 2389056, 'steps': 12442, 'loss/train': 1.4713679552078247} -08/30/2021 15:22:11 - INFO - __main__ - Step 12444: {'lr': 0.0004938827285450908, 'samples': 2389248, 'steps': 12443, 'loss/train': 1.7078709602355957} -08/30/2021 15:22:11 - INFO - __main__ - Step 12445: {'lr': 0.0004938815617370737, 'samples': 2389440, 'steps': 12444, 'loss/train': 1.4049808979034424} -08/30/2021 15:22:13 - INFO - __main__ - Step 12446: {'lr': 0.0004938803948191674, 'samples': 2389632, 'steps': 12445, 'loss/train': 0.1803952008485794} -08/30/2021 15:22:13 - INFO - __main__ - Step 12447: {'lr': 0.0004938792277913724, 'samples': 2389824, 'steps': 12446, 'loss/train': 1.6435493230819702} -08/30/2021 15:22:13 - INFO - __main__ - Step 12448: {'lr': 0.0004938780606536891, 'samples': 2390016, 'steps': 12447, 'loss/train': 1.762094497680664} -08/30/2021 15:22:14 - INFO - __main__ - Step 12449: {'lr': 0.0004938768934061182, 'samples': 2390208, 'steps': 12448, 'loss/train': 1.5482165813446045} -08/30/2021 15:22:14 - INFO - __main__ - Step 12450: {'lr': 0.0004938757260486601, 'samples': 2390400, 'steps': 12449, 'loss/train': 1.4777065515518188} -08/30/2021 15:22:16 - INFO - __main__ - Step 12451: {'lr': 0.0004938745585813153, 'samples': 2390592, 'steps': 12450, 'loss/train': 1.2664315700531006} -08/30/2021 15:22:16 - INFO - __main__ - Step 12452: {'lr': 0.0004938733910040845, 'samples': 2390784, 'steps': 12451, 'loss/train': 1.8675448894500732} -08/30/2021 15:22:17 - INFO - __main__ - Step 12453: {'lr': 0.000493872223316968, 'samples': 2390976, 'steps': 12452, 'loss/train': 1.7587313652038574} -08/30/2021 15:22:17 - INFO - __main__ - Step 12454: {'lr': 0.0004938710555199664, 'samples': 2391168, 'steps': 12453, 'loss/train': 2.098862648010254} -08/30/2021 15:22:17 - INFO - __main__ - Step 12455: {'lr': 0.0004938698876130804, 'samples': 2391360, 'steps': 12454, 'loss/train': 1.8751031160354614} -08/30/2021 15:22:18 - INFO - __main__ - Step 12456: {'lr': 0.0004938687195963104, 'samples': 2391552, 'steps': 12455, 'loss/train': 1.2401816844940186} -08/30/2021 15:22:19 - INFO - __main__ - Step 12457: {'lr': 0.0004938675514696569, 'samples': 2391744, 'steps': 12456, 'loss/train': 1.090671181678772} -08/30/2021 15:22:20 - INFO - __main__ - Step 12458: {'lr': 0.0004938663832331204, 'samples': 2391936, 'steps': 12457, 'loss/train': 1.8153104782104492} -08/30/2021 15:22:20 - INFO - __main__ - Step 12459: {'lr': 0.0004938652148867014, 'samples': 2392128, 'steps': 12458, 'loss/train': 1.4731745719909668} -08/30/2021 15:22:21 - INFO - __main__ - Step 12460: {'lr': 0.0004938640464304006, 'samples': 2392320, 'steps': 12459, 'loss/train': 2.171313524246216} -08/30/2021 15:22:21 - INFO - __main__ - Step 12461: {'lr': 0.0004938628778642185, 'samples': 2392512, 'steps': 12460, 'loss/train': 1.8743846416473389} -08/30/2021 15:22:23 - INFO - __main__ - Step 12462: {'lr': 0.0004938617091881554, 'samples': 2392704, 'steps': 12461, 'loss/train': 1.378425121307373} -08/30/2021 15:22:23 - INFO - __main__ - Step 12463: {'lr': 0.000493860540402212, 'samples': 2392896, 'steps': 12462, 'loss/train': 2.4345130920410156} -08/30/2021 15:22:23 - INFO - __main__ - Step 12464: {'lr': 0.0004938593715063888, 'samples': 2393088, 'steps': 12463, 'loss/train': 0.23290377855300903} -08/30/2021 15:22:24 - INFO - __main__ - Step 12465: {'lr': 0.0004938582025006864, 'samples': 2393280, 'steps': 12464, 'loss/train': 2.8235154151916504} -08/30/2021 15:22:24 - INFO - __main__ - Step 12466: {'lr': 0.0004938570333851052, 'samples': 2393472, 'steps': 12465, 'loss/train': 1.8025381565093994} -08/30/2021 15:22:26 - INFO - __main__ - Step 12467: {'lr': 0.0004938558641596458, 'samples': 2393664, 'steps': 12466, 'loss/train': 1.8506377935409546} -08/30/2021 15:22:26 - INFO - __main__ - Step 12468: {'lr': 0.0004938546948243087, 'samples': 2393856, 'steps': 12467, 'loss/train': 1.8140132427215576} -08/30/2021 15:22:26 - INFO - __main__ - Step 12469: {'lr': 0.0004938535253790944, 'samples': 2394048, 'steps': 12468, 'loss/train': 1.4851552248001099} -08/30/2021 15:22:27 - INFO - __main__ - Step 12470: {'lr': 0.0004938523558240035, 'samples': 2394240, 'steps': 12469, 'loss/train': 1.7355839014053345} -08/30/2021 15:22:27 - INFO - __main__ - Step 12471: {'lr': 0.0004938511861590365, 'samples': 2394432, 'steps': 12470, 'loss/train': 1.5451091527938843} -08/30/2021 15:22:30 - INFO - __main__ - Step 12472: {'lr': 0.000493850016384194, 'samples': 2394624, 'steps': 12471, 'loss/train': 1.8238810300827026} -08/30/2021 15:22:31 - INFO - __main__ - Step 12473: {'lr': 0.0004938488464994764, 'samples': 2394816, 'steps': 12472, 'loss/train': 0.9098502397537231} -08/30/2021 15:22:31 - INFO - __main__ - Step 12474: {'lr': 0.0004938476765048842, 'samples': 2395008, 'steps': 12473, 'loss/train': 0.8234099745750427} -08/30/2021 15:22:31 - INFO - __main__ - Step 12475: {'lr': 0.0004938465064004181, 'samples': 2395200, 'steps': 12474, 'loss/train': 0.6922528147697449} -08/30/2021 15:22:32 - INFO - __main__ - Step 12476: {'lr': 0.0004938453361860785, 'samples': 2395392, 'steps': 12475, 'loss/train': 1.9006537199020386} -08/30/2021 15:22:32 - INFO - __main__ - Step 12477: {'lr': 0.0004938441658618659, 'samples': 2395584, 'steps': 12476, 'loss/train': 1.4312968254089355} -08/30/2021 15:22:34 - INFO - __main__ - Step 12478: {'lr': 0.0004938429954277809, 'samples': 2395776, 'steps': 12477, 'loss/train': 2.016352653503418} -08/30/2021 15:22:34 - INFO - __main__ - Step 12479: {'lr': 0.000493841824883824, 'samples': 2395968, 'steps': 12478, 'loss/train': 2.184368848800659} -08/30/2021 15:22:35 - INFO - __main__ - Step 12480: {'lr': 0.0004938406542299956, 'samples': 2396160, 'steps': 12479, 'loss/train': 1.658437967300415} -08/30/2021 15:22:35 - INFO - __main__ - Step 12481: {'lr': 0.0004938394834662966, 'samples': 2396352, 'steps': 12480, 'loss/train': 0.22018125653266907} -08/30/2021 15:22:35 - INFO - __main__ - Step 12482: {'lr': 0.0004938383125927272, 'samples': 2396544, 'steps': 12481, 'loss/train': 2.0617432594299316} -08/30/2021 15:22:36 - INFO - __main__ - Step 12483: {'lr': 0.0004938371416092881, 'samples': 2396736, 'steps': 12482, 'loss/train': 1.5849149227142334} -08/30/2021 15:22:37 - INFO - __main__ - Step 12484: {'lr': 0.0004938359705159796, 'samples': 2396928, 'steps': 12483, 'loss/train': 1.7631844282150269} -08/30/2021 15:22:38 - INFO - __main__ - Step 12485: {'lr': 0.0004938347993128025, 'samples': 2397120, 'steps': 12484, 'loss/train': 1.6862891912460327} -08/30/2021 15:22:38 - INFO - __main__ - Step 12486: {'lr': 0.0004938336279997571, 'samples': 2397312, 'steps': 12485, 'loss/train': 1.6655131578445435} -08/30/2021 15:22:39 - INFO - __main__ - Step 12487: {'lr': 0.0004938324565768441, 'samples': 2397504, 'steps': 12486, 'loss/train': 1.7845306396484375} -08/30/2021 15:22:39 - INFO - __main__ - Step 12488: {'lr': 0.0004938312850440639, 'samples': 2397696, 'steps': 12487, 'loss/train': 0.5651407837867737} -08/30/2021 15:22:40 - INFO - __main__ - Step 12489: {'lr': 0.0004938301134014172, 'samples': 2397888, 'steps': 12488, 'loss/train': 0.9216361045837402} -08/30/2021 15:22:41 - INFO - __main__ - Step 12490: {'lr': 0.0004938289416489042, 'samples': 2398080, 'steps': 12489, 'loss/train': 1.7292640209197998} -08/30/2021 15:22:41 - INFO - __main__ - Step 12491: {'lr': 0.0004938277697865259, 'samples': 2398272, 'steps': 12490, 'loss/train': 1.921535611152649} -08/30/2021 15:22:42 - INFO - __main__ - Step 12492: {'lr': 0.0004938265978142824, 'samples': 2398464, 'steps': 12491, 'loss/train': 1.4806448221206665} -08/30/2021 15:22:42 - INFO - __main__ - Step 12493: {'lr': 0.0004938254257321745, 'samples': 2398656, 'steps': 12492, 'loss/train': 2.1684815883636475} -08/30/2021 15:22:43 - INFO - __main__ - Step 12494: {'lr': 0.0004938242535402025, 'samples': 2398848, 'steps': 12493, 'loss/train': 1.8698049783706665} -08/30/2021 15:22:44 - INFO - __main__ - Step 12495: {'lr': 0.0004938230812383672, 'samples': 2399040, 'steps': 12494, 'loss/train': 1.7525417804718018} -08/30/2021 15:22:44 - INFO - __main__ - Step 12496: {'lr': 0.0004938219088266688, 'samples': 2399232, 'steps': 12495, 'loss/train': 2.0826210975646973} -08/30/2021 15:22:44 - INFO - __main__ - Step 12497: {'lr': 0.0004938207363051082, 'samples': 2399424, 'steps': 12496, 'loss/train': 1.6311655044555664} -08/30/2021 15:22:45 - INFO - __main__ - Step 12498: {'lr': 0.0004938195636736857, 'samples': 2399616, 'steps': 12497, 'loss/train': 1.8564714193344116} -08/30/2021 15:22:46 - INFO - __main__ - Step 12499: {'lr': 0.0004938183909324017, 'samples': 2399808, 'steps': 12498, 'loss/train': 2.4576282501220703} -08/30/2021 15:22:47 - INFO - __main__ - Step 12500: {'lr': 0.0004938172180812571, 'samples': 2400000, 'steps': 12499, 'loss/train': 1.2565624713897705} -08/30/2021 15:22:47 - INFO - __main__ - Step 12501: {'lr': 0.000493816045120252, 'samples': 2400192, 'steps': 12500, 'loss/train': 1.589972972869873} -08/30/2021 15:22:48 - INFO - __main__ - Step 12502: {'lr': 0.0004938148720493873, 'samples': 2400384, 'steps': 12501, 'loss/train': 1.6916298866271973} -08/30/2021 15:22:48 - INFO - __main__ - Step 12503: {'lr': 0.0004938136988686634, 'samples': 2400576, 'steps': 12502, 'loss/train': 1.5743650197982788} -08/30/2021 15:22:48 - INFO - __main__ - Step 12504: {'lr': 0.0004938125255780808, 'samples': 2400768, 'steps': 12503, 'loss/train': 1.841348648071289} -08/30/2021 15:22:50 - INFO - __main__ - Step 12505: {'lr': 0.0004938113521776401, 'samples': 2400960, 'steps': 12504, 'loss/train': 1.791174054145813} -08/30/2021 15:22:50 - INFO - __main__ - Step 12506: {'lr': 0.0004938101786673416, 'samples': 2401152, 'steps': 12505, 'loss/train': 1.8853627443313599} -08/30/2021 15:22:51 - INFO - __main__ - Step 12507: {'lr': 0.0004938090050471861, 'samples': 2401344, 'steps': 12506, 'loss/train': 1.1951075792312622} -08/30/2021 15:22:51 - INFO - __main__ - Step 12508: {'lr': 0.000493807831317174, 'samples': 2401536, 'steps': 12507, 'loss/train': 1.2089728116989136} -08/30/2021 15:22:51 - INFO - __main__ - Step 12509: {'lr': 0.0004938066574773058, 'samples': 2401728, 'steps': 12508, 'loss/train': 1.4420223236083984} -08/30/2021 15:22:53 - INFO - __main__ - Step 12510: {'lr': 0.0004938054835275822, 'samples': 2401920, 'steps': 12509, 'loss/train': 1.7887407541275024} -08/30/2021 15:22:53 - INFO - __main__ - Step 12511: {'lr': 0.0004938043094680036, 'samples': 2402112, 'steps': 12510, 'loss/train': 1.6452138423919678} -08/30/2021 15:22:54 - INFO - __main__ - Step 12512: {'lr': 0.0004938031352985704, 'samples': 2402304, 'steps': 12511, 'loss/train': 1.6797332763671875} -08/30/2021 15:22:54 - INFO - __main__ - Step 12513: {'lr': 0.0004938019610192835, 'samples': 2402496, 'steps': 12512, 'loss/train': 1.5179246664047241} -08/30/2021 15:22:54 - INFO - __main__ - Step 12514: {'lr': 0.0004938007866301429, 'samples': 2402688, 'steps': 12513, 'loss/train': 1.9688055515289307} -08/30/2021 15:22:56 - INFO - __main__ - Step 12515: {'lr': 0.0004937996121311496, 'samples': 2402880, 'steps': 12514, 'loss/train': 1.907478928565979} -08/30/2021 15:22:56 - INFO - __main__ - Step 12516: {'lr': 0.000493798437522304, 'samples': 2403072, 'steps': 12515, 'loss/train': 1.7711124420166016} -08/30/2021 15:22:56 - INFO - __main__ - Step 12517: {'lr': 0.0004937972628036065, 'samples': 2403264, 'steps': 12516, 'loss/train': 1.4934422969818115} -08/30/2021 15:22:57 - INFO - __main__ - Step 12518: {'lr': 0.0004937960879750578, 'samples': 2403456, 'steps': 12517, 'loss/train': 1.4428638219833374} -08/30/2021 15:22:57 - INFO - __main__ - Step 12519: {'lr': 0.0004937949130366582, 'samples': 2403648, 'steps': 12518, 'loss/train': 1.6491045951843262} -08/30/2021 15:22:59 - INFO - __main__ - Step 12520: {'lr': 0.0004937937379884085, 'samples': 2403840, 'steps': 12519, 'loss/train': 1.5070687532424927} -08/30/2021 15:22:59 - INFO - __main__ - Step 12521: {'lr': 0.0004937925628303091, 'samples': 2404032, 'steps': 12520, 'loss/train': 1.9181841611862183} -08/30/2021 15:22:59 - INFO - __main__ - Step 12522: {'lr': 0.0004937913875623605, 'samples': 2404224, 'steps': 12521, 'loss/train': 1.913568139076233} -08/30/2021 15:23:00 - INFO - __main__ - Step 12523: {'lr': 0.0004937902121845633, 'samples': 2404416, 'steps': 12522, 'loss/train': 1.7699967622756958} -08/30/2021 15:23:00 - INFO - __main__ - Step 12524: {'lr': 0.000493789036696918, 'samples': 2404608, 'steps': 12523, 'loss/train': 1.8491734266281128} -08/30/2021 15:23:02 - INFO - __main__ - Step 12525: {'lr': 0.000493787861099425, 'samples': 2404800, 'steps': 12524, 'loss/train': 1.6258100271224976} -08/30/2021 15:23:02 - INFO - __main__ - Step 12526: {'lr': 0.0004937866853920851, 'samples': 2404992, 'steps': 12525, 'loss/train': 2.2164700031280518} -08/30/2021 15:23:02 - INFO - __main__ - Step 12527: {'lr': 0.0004937855095748985, 'samples': 2405184, 'steps': 12526, 'loss/train': 1.8664838075637817} -08/30/2021 15:23:03 - INFO - __main__ - Step 12528: {'lr': 0.0004937843336478661, 'samples': 2405376, 'steps': 12527, 'loss/train': 1.4773613214492798} -08/30/2021 15:23:03 - INFO - __main__ - Step 12529: {'lr': 0.0004937831576109881, 'samples': 2405568, 'steps': 12528, 'loss/train': 2.0828826427459717} -08/30/2021 15:23:05 - INFO - __main__ - Step 12530: {'lr': 0.0004937819814642653, 'samples': 2405760, 'steps': 12529, 'loss/train': 2.1169567108154297} -08/30/2021 15:23:06 - INFO - __main__ - Step 12531: {'lr': 0.000493780805207698, 'samples': 2405952, 'steps': 12530, 'loss/train': 1.6626170873641968} -08/30/2021 15:23:06 - INFO - __main__ - Step 12532: {'lr': 0.000493779628841287, 'samples': 2406144, 'steps': 12531, 'loss/train': 0.2646285593509674} -08/30/2021 15:23:06 - INFO - __main__ - Step 12533: {'lr': 0.0004937784523650324, 'samples': 2406336, 'steps': 12532, 'loss/train': 1.410550832748413} -08/30/2021 15:23:07 - INFO - __main__ - Step 12534: {'lr': 0.0004937772757789352, 'samples': 2406528, 'steps': 12533, 'loss/train': 1.9159671068191528} -08/30/2021 15:23:08 - INFO - __main__ - Step 12535: {'lr': 0.0004937760990829956, 'samples': 2406720, 'steps': 12534, 'loss/train': 1.1231690645217896} -08/30/2021 15:23:09 - INFO - __main__ - Step 12536: {'lr': 0.0004937749222772143, 'samples': 2406912, 'steps': 12535, 'loss/train': 1.831701636314392} -08/30/2021 15:23:09 - INFO - __main__ - Step 12537: {'lr': 0.0004937737453615918, 'samples': 2407104, 'steps': 12536, 'loss/train': 1.8218296766281128} -08/30/2021 15:23:09 - INFO - __main__ - Step 12538: {'lr': 0.0004937725683361286, 'samples': 2407296, 'steps': 12537, 'loss/train': 1.5685603618621826} -08/30/2021 15:23:10 - INFO - __main__ - Step 12539: {'lr': 0.0004937713912008252, 'samples': 2407488, 'steps': 12538, 'loss/train': 1.727821946144104} -08/30/2021 15:23:10 - INFO - __main__ - Step 12540: {'lr': 0.0004937702139556822, 'samples': 2407680, 'steps': 12539, 'loss/train': 1.4807853698730469} -08/30/2021 15:23:11 - INFO - __main__ - Step 12541: {'lr': 0.0004937690366007, 'samples': 2407872, 'steps': 12540, 'loss/train': 1.8320239782333374} -08/30/2021 15:23:12 - INFO - __main__ - Step 12542: {'lr': 0.0004937678591358794, 'samples': 2408064, 'steps': 12541, 'loss/train': 1.73628568649292} -08/30/2021 15:23:12 - INFO - __main__ - Step 12543: {'lr': 0.0004937666815612207, 'samples': 2408256, 'steps': 12542, 'loss/train': 1.7498762607574463} -08/30/2021 15:23:12 - INFO - __main__ - Step 12544: {'lr': 0.0004937655038767245, 'samples': 2408448, 'steps': 12543, 'loss/train': 2.125943183898926} -08/30/2021 15:23:13 - INFO - __main__ - Step 12545: {'lr': 0.0004937643260823914, 'samples': 2408640, 'steps': 12544, 'loss/train': 1.7223514318466187} -08/30/2021 15:23:14 - INFO - __main__ - Step 12546: {'lr': 0.0004937631481782218, 'samples': 2408832, 'steps': 12545, 'loss/train': 1.3177604675292969} -08/30/2021 15:23:15 - INFO - __main__ - Step 12547: {'lr': 0.0004937619701642162, 'samples': 2409024, 'steps': 12546, 'loss/train': 1.0912584066390991} -08/30/2021 15:23:15 - INFO - __main__ - Step 12548: {'lr': 0.0004937607920403752, 'samples': 2409216, 'steps': 12547, 'loss/train': 1.5156407356262207} -08/30/2021 15:23:16 - INFO - __main__ - Step 12549: {'lr': 0.0004937596138066996, 'samples': 2409408, 'steps': 12548, 'loss/train': 0.5244348049163818} -08/30/2021 15:23:16 - INFO - __main__ - Step 12550: {'lr': 0.0004937584354631894, 'samples': 2409600, 'steps': 12549, 'loss/train': 0.5477697849273682} -08/30/2021 15:23:18 - INFO - __main__ - Step 12551: {'lr': 0.0004937572570098455, 'samples': 2409792, 'steps': 12550, 'loss/train': 1.8346753120422363} -08/30/2021 15:23:18 - INFO - __main__ - Step 12552: {'lr': 0.0004937560784466685, 'samples': 2409984, 'steps': 12551, 'loss/train': 2.2612287998199463} -08/30/2021 15:23:18 - INFO - __main__ - Step 12553: {'lr': 0.0004937548997736586, 'samples': 2410176, 'steps': 12552, 'loss/train': 1.7875642776489258} -08/30/2021 15:23:19 - INFO - __main__ - Step 12554: {'lr': 0.0004937537209908165, 'samples': 2410368, 'steps': 12553, 'loss/train': 1.822165846824646} -08/30/2021 15:23:19 - INFO - __main__ - Step 12555: {'lr': 0.0004937525420981428, 'samples': 2410560, 'steps': 12554, 'loss/train': 1.816356897354126} -08/30/2021 15:23:20 - INFO - __main__ - Step 12556: {'lr': 0.0004937513630956379, 'samples': 2410752, 'steps': 12555, 'loss/train': 1.835490107536316} -08/30/2021 15:23:21 - INFO - __main__ - Step 12557: {'lr': 0.0004937501839833024, 'samples': 2410944, 'steps': 12556, 'loss/train': 2.248667001724243} -08/30/2021 15:23:22 - INFO - __main__ - Step 12558: {'lr': 0.0004937490047611369, 'samples': 2411136, 'steps': 12557, 'loss/train': 1.3210731744766235} -08/30/2021 15:23:22 - INFO - __main__ - Step 12559: {'lr': 0.0004937478254291418, 'samples': 2411328, 'steps': 12558, 'loss/train': 1.8700735569000244} -08/30/2021 15:23:22 - INFO - __main__ - Step 12560: {'lr': 0.0004937466459873178, 'samples': 2411520, 'steps': 12559, 'loss/train': 2.178784132003784} -08/30/2021 15:23:23 - INFO - __main__ - Step 12561: {'lr': 0.0004937454664356652, 'samples': 2411712, 'steps': 12560, 'loss/train': 1.6456546783447266} -08/30/2021 15:23:24 - INFO - __main__ - Step 12562: {'lr': 0.0004937442867741848, 'samples': 2411904, 'steps': 12561, 'loss/train': 1.9860590696334839} -08/30/2021 15:23:25 - INFO - __main__ - Step 12563: {'lr': 0.0004937431070028768, 'samples': 2412096, 'steps': 12562, 'loss/train': 2.0442144870758057} -08/30/2021 15:23:25 - INFO - __main__ - Step 12564: {'lr': 0.0004937419271217419, 'samples': 2412288, 'steps': 12563, 'loss/train': 1.8291712999343872} -08/30/2021 15:23:25 - INFO - __main__ - Step 12565: {'lr': 0.0004937407471307807, 'samples': 2412480, 'steps': 12564, 'loss/train': 1.5600214004516602} -08/30/2021 15:23:26 - INFO - __main__ - Step 12566: {'lr': 0.0004937395670299938, 'samples': 2412672, 'steps': 12565, 'loss/train': 1.662540078163147} -08/30/2021 15:23:27 - INFO - __main__ - Step 12567: {'lr': 0.0004937383868193815, 'samples': 2412864, 'steps': 12566, 'loss/train': 2.447221279144287} -08/30/2021 15:23:28 - INFO - __main__ - Step 12568: {'lr': 0.0004937372064989445, 'samples': 2413056, 'steps': 12567, 'loss/train': 1.4903484582901} -08/30/2021 15:23:28 - INFO - __main__ - Step 12569: {'lr': 0.0004937360260686833, 'samples': 2413248, 'steps': 12568, 'loss/train': 1.952978491783142} -08/30/2021 15:23:28 - INFO - __main__ - Step 12570: {'lr': 0.0004937348455285983, 'samples': 2413440, 'steps': 12569, 'loss/train': 1.8628313541412354} -08/30/2021 15:23:29 - INFO - __main__ - Step 12571: {'lr': 0.0004937336648786903, 'samples': 2413632, 'steps': 12570, 'loss/train': 1.6591362953186035} -08/30/2021 15:23:30 - INFO - __main__ - Step 12572: {'lr': 0.0004937324841189595, 'samples': 2413824, 'steps': 12571, 'loss/train': 2.9854345321655273} -08/30/2021 15:23:31 - INFO - __main__ - Step 12573: {'lr': 0.0004937313032494068, 'samples': 2414016, 'steps': 12572, 'loss/train': 1.566379189491272} -08/30/2021 15:23:31 - INFO - __main__ - Step 12574: {'lr': 0.0004937301222700324, 'samples': 2414208, 'steps': 12573, 'loss/train': 1.1759110689163208} -08/30/2021 15:23:31 - INFO - __main__ - Step 12575: {'lr': 0.0004937289411808369, 'samples': 2414400, 'steps': 12574, 'loss/train': 0.8813082575798035} -08/30/2021 15:23:32 - INFO - __main__ - Step 12576: {'lr': 0.000493727759981821, 'samples': 2414592, 'steps': 12575, 'loss/train': 1.5776596069335938} -08/30/2021 15:23:33 - INFO - __main__ - Step 12577: {'lr': 0.0004937265786729851, 'samples': 2414784, 'steps': 12576, 'loss/train': 0.5332491993904114} -08/30/2021 15:23:34 - INFO - __main__ - Step 12578: {'lr': 0.0004937253972543298, 'samples': 2414976, 'steps': 12577, 'loss/train': 1.688797950744629} -08/30/2021 15:23:34 - INFO - __main__ - Step 12579: {'lr': 0.0004937242157258555, 'samples': 2415168, 'steps': 12578, 'loss/train': 2.6554276943206787} -08/30/2021 15:23:35 - INFO - __main__ - Step 12580: {'lr': 0.000493723034087563, 'samples': 2415360, 'steps': 12579, 'loss/train': 1.850439429283142} -08/30/2021 15:23:35 - INFO - __main__ - Step 12581: {'lr': 0.0004937218523394525, 'samples': 2415552, 'steps': 12580, 'loss/train': 1.299819827079773} -08/30/2021 15:23:35 - INFO - __main__ - Step 12582: {'lr': 0.0004937206704815248, 'samples': 2415744, 'steps': 12581, 'loss/train': 1.8108617067337036} -08/30/2021 15:23:37 - INFO - __main__ - Step 12583: {'lr': 0.0004937194885137803, 'samples': 2415936, 'steps': 12582, 'loss/train': 2.009592294692993} -08/30/2021 15:23:38 - INFO - __main__ - Step 12584: {'lr': 0.0004937183064362196, 'samples': 2416128, 'steps': 12583, 'loss/train': 1.7571768760681152} -08/30/2021 15:23:38 - INFO - __main__ - Step 12585: {'lr': 0.0004937171242488431, 'samples': 2416320, 'steps': 12584, 'loss/train': 2.422935962677002} -08/30/2021 15:23:38 - INFO - __main__ - Step 12586: {'lr': 0.0004937159419516515, 'samples': 2416512, 'steps': 12585, 'loss/train': 1.5480355024337769} -08/30/2021 15:23:39 - INFO - __main__ - Step 12587: {'lr': 0.0004937147595446452, 'samples': 2416704, 'steps': 12586, 'loss/train': 1.3654075860977173} -08/30/2021 15:23:40 - INFO - __main__ - Step 12588: {'lr': 0.0004937135770278248, 'samples': 2416896, 'steps': 12587, 'loss/train': 1.9075508117675781} -08/30/2021 15:23:41 - INFO - __main__ - Step 12589: {'lr': 0.0004937123944011908, 'samples': 2417088, 'steps': 12588, 'loss/train': 1.8653266429901123} -08/30/2021 15:23:41 - INFO - __main__ - Step 12590: {'lr': 0.0004937112116647439, 'samples': 2417280, 'steps': 12589, 'loss/train': 1.9763001203536987} -08/30/2021 15:23:41 - INFO - __main__ - Step 12591: {'lr': 0.0004937100288184843, 'samples': 2417472, 'steps': 12590, 'loss/train': 0.810440182685852} -08/30/2021 15:23:42 - INFO - __main__ - Step 12592: {'lr': 0.0004937088458624128, 'samples': 2417664, 'steps': 12591, 'loss/train': 1.4978715181350708} -08/30/2021 15:23:43 - INFO - __main__ - Step 12593: {'lr': 0.0004937076627965299, 'samples': 2417856, 'steps': 12592, 'loss/train': 1.519140601158142} -08/30/2021 15:23:44 - INFO - __main__ - Step 12594: {'lr': 0.000493706479620836, 'samples': 2418048, 'steps': 12593, 'loss/train': 1.8998225927352905} -08/30/2021 15:23:44 - INFO - __main__ - Step 12595: {'lr': 0.0004937052963353318, 'samples': 2418240, 'steps': 12594, 'loss/train': 2.019606828689575} -08/30/2021 15:23:45 - INFO - __main__ - Step 12596: {'lr': 0.0004937041129400177, 'samples': 2418432, 'steps': 12595, 'loss/train': 1.3530529737472534} -08/30/2021 15:23:45 - INFO - __main__ - Step 12597: {'lr': 0.0004937029294348943, 'samples': 2418624, 'steps': 12596, 'loss/train': 1.3625153303146362} -08/30/2021 15:23:46 - INFO - __main__ - Step 12598: {'lr': 0.0004937017458199621, 'samples': 2418816, 'steps': 12597, 'loss/train': 1.8002816438674927} -08/30/2021 15:23:47 - INFO - __main__ - Step 12599: {'lr': 0.0004937005620952217, 'samples': 2419008, 'steps': 12598, 'loss/train': 1.3398879766464233} -08/30/2021 15:23:47 - INFO - __main__ - Step 12600: {'lr': 0.0004936993782606735, 'samples': 2419200, 'steps': 12599, 'loss/train': 1.5852748155593872} -08/30/2021 15:23:48 - INFO - __main__ - Step 12601: {'lr': 0.0004936981943163182, 'samples': 2419392, 'steps': 12600, 'loss/train': 1.806483268737793} -08/30/2021 15:23:48 - INFO - __main__ - Step 12602: {'lr': 0.0004936970102621563, 'samples': 2419584, 'steps': 12601, 'loss/train': 1.811933159828186} -08/30/2021 15:23:50 - INFO - __main__ - Step 12603: {'lr': 0.0004936958260981883, 'samples': 2419776, 'steps': 12602, 'loss/train': 1.9197443723678589} -08/30/2021 15:23:50 - INFO - __main__ - Step 12604: {'lr': 0.0004936946418244146, 'samples': 2419968, 'steps': 12603, 'loss/train': 1.1525815725326538} -08/30/2021 15:23:51 - INFO - __main__ - Step 12605: {'lr': 0.000493693457440836, 'samples': 2420160, 'steps': 12604, 'loss/train': 2.6090035438537598} -08/30/2021 15:23:51 - INFO - __main__ - Step 12606: {'lr': 0.0004936922729474526, 'samples': 2420352, 'steps': 12605, 'loss/train': 1.2480660676956177} -08/30/2021 15:23:51 - INFO - __main__ - Step 12607: {'lr': 0.0004936910883442655, 'samples': 2420544, 'steps': 12606, 'loss/train': 1.8558886051177979} -08/30/2021 15:23:52 - INFO - __main__ - Step 12608: {'lr': 0.0004936899036312749, 'samples': 2420736, 'steps': 12607, 'loss/train': 1.8366355895996094} -08/30/2021 15:23:53 - INFO - __main__ - Step 12609: {'lr': 0.0004936887188084813, 'samples': 2420928, 'steps': 12608, 'loss/train': 1.5720945596694946} -08/30/2021 15:23:54 - INFO - __main__ - Step 12610: {'lr': 0.0004936875338758855, 'samples': 2421120, 'steps': 12609, 'loss/train': 1.534041404724121} -08/30/2021 15:23:54 - INFO - __main__ - Step 12611: {'lr': 0.0004936863488334877, 'samples': 2421312, 'steps': 12610, 'loss/train': 1.8757835626602173} -08/30/2021 15:23:55 - INFO - __main__ - Step 12612: {'lr': 0.0004936851636812886, 'samples': 2421504, 'steps': 12611, 'loss/train': 1.5210860967636108} -08/30/2021 15:23:55 - INFO - __main__ - Step 12613: {'lr': 0.0004936839784192888, 'samples': 2421696, 'steps': 12612, 'loss/train': 1.7473598718643188} -08/30/2021 15:23:57 - INFO - __main__ - Step 12614: {'lr': 0.0004936827930474887, 'samples': 2421888, 'steps': 12613, 'loss/train': 0.2659986615180969} -08/30/2021 15:23:57 - INFO - __main__ - Step 12615: {'lr': 0.0004936816075658889, 'samples': 2422080, 'steps': 12614, 'loss/train': 1.3665947914123535} -08/30/2021 15:23:58 - INFO - __main__ - Step 12616: {'lr': 0.00049368042197449, 'samples': 2422272, 'steps': 12615, 'loss/train': 1.896285057067871} -08/30/2021 15:23:58 - INFO - __main__ - Step 12617: {'lr': 0.0004936792362732924, 'samples': 2422464, 'steps': 12616, 'loss/train': 1.6242717504501343} -08/30/2021 15:23:58 - INFO - __main__ - Step 12618: {'lr': 0.0004936780504622967, 'samples': 2422656, 'steps': 12617, 'loss/train': 0.108314648270607} -08/30/2021 15:24:00 - INFO - __main__ - Step 12619: {'lr': 0.0004936768645415033, 'samples': 2422848, 'steps': 12618, 'loss/train': 1.9631596803665161} -08/30/2021 15:24:00 - INFO - __main__ - Step 12620: {'lr': 0.0004936756785109131, 'samples': 2423040, 'steps': 12619, 'loss/train': 1.9854191541671753} -08/30/2021 15:24:01 - INFO - __main__ - Step 12621: {'lr': 0.0004936744923705263, 'samples': 2423232, 'steps': 12620, 'loss/train': 2.0630979537963867} -08/30/2021 15:24:01 - INFO - __main__ - Step 12622: {'lr': 0.0004936733061203435, 'samples': 2423424, 'steps': 12621, 'loss/train': 2.102893114089966} -08/30/2021 15:24:01 - INFO - __main__ - Step 12623: {'lr': 0.0004936721197603653, 'samples': 2423616, 'steps': 12622, 'loss/train': 1.8399444818496704} -08/30/2021 15:24:03 - INFO - __main__ - Step 12624: {'lr': 0.0004936709332905923, 'samples': 2423808, 'steps': 12623, 'loss/train': 2.204284429550171} -08/30/2021 15:24:03 - INFO - __main__ - Step 12625: {'lr': 0.0004936697467110248, 'samples': 2424000, 'steps': 12624, 'loss/train': 1.6818745136260986} -08/30/2021 15:24:03 - INFO - __main__ - Step 12626: {'lr': 0.0004936685600216635, 'samples': 2424192, 'steps': 12625, 'loss/train': 1.5752936601638794} -08/30/2021 15:24:04 - INFO - __main__ - Step 12627: {'lr': 0.0004936673732225088, 'samples': 2424384, 'steps': 12626, 'loss/train': 1.9554191827774048} -08/30/2021 15:24:04 - INFO - __main__ - Step 12628: {'lr': 0.0004936661863135615, 'samples': 2424576, 'steps': 12627, 'loss/train': 1.9483890533447266} -08/30/2021 15:24:04 - INFO - __main__ - Step 12629: {'lr': 0.000493664999294822, 'samples': 2424768, 'steps': 12628, 'loss/train': 1.863869309425354} -08/30/2021 15:24:06 - INFO - __main__ - Step 12630: {'lr': 0.0004936638121662908, 'samples': 2424960, 'steps': 12629, 'loss/train': 1.722177505493164} -08/30/2021 15:24:07 - INFO - __main__ - Step 12631: {'lr': 0.0004936626249279683, 'samples': 2425152, 'steps': 12630, 'loss/train': 0.61997389793396} -08/30/2021 15:24:07 - INFO - __main__ - Step 12632: {'lr': 0.0004936614375798553, 'samples': 2425344, 'steps': 12631, 'loss/train': 1.797813892364502} -08/30/2021 15:24:07 - INFO - __main__ - Step 12633: {'lr': 0.0004936602501219522, 'samples': 2425536, 'steps': 12632, 'loss/train': 1.9456511735916138} -08/30/2021 15:24:08 - INFO - __main__ - Step 12634: {'lr': 0.0004936590625542595, 'samples': 2425728, 'steps': 12633, 'loss/train': 1.688139796257019} -08/30/2021 15:24:10 - INFO - __main__ - Step 12635: {'lr': 0.0004936578748767779, 'samples': 2425920, 'steps': 12634, 'loss/train': 1.8951882123947144} -08/30/2021 15:24:10 - INFO - __main__ - Step 12636: {'lr': 0.0004936566870895078, 'samples': 2426112, 'steps': 12635, 'loss/train': 1.5163230895996094} -08/30/2021 15:24:11 - INFO - __main__ - Step 12637: {'lr': 0.0004936554991924496, 'samples': 2426304, 'steps': 12636, 'loss/train': 1.1690499782562256} -08/30/2021 15:24:11 - INFO - __main__ - Step 12638: {'lr': 0.0004936543111856041, 'samples': 2426496, 'steps': 12637, 'loss/train': 1.6015605926513672} -08/30/2021 15:24:11 - INFO - __main__ - Step 12639: {'lr': 0.0004936531230689717, 'samples': 2426688, 'steps': 12638, 'loss/train': 1.7503412961959839} -08/30/2021 15:24:13 - INFO - __main__ - Step 12640: {'lr': 0.000493651934842553, 'samples': 2426880, 'steps': 12639, 'loss/train': 1.9404630661010742} -08/30/2021 15:24:13 - INFO - __main__ - Step 12641: {'lr': 0.0004936507465063486, 'samples': 2427072, 'steps': 12640, 'loss/train': 1.403029441833496} -08/30/2021 15:24:14 - INFO - __main__ - Step 12642: {'lr': 0.0004936495580603588, 'samples': 2427264, 'steps': 12641, 'loss/train': 1.5929763317108154} -08/30/2021 15:24:14 - INFO - __main__ - Step 12643: {'lr': 0.0004936483695045842, 'samples': 2427456, 'steps': 12642, 'loss/train': 0.18132981657981873} -08/30/2021 15:24:15 - INFO - __main__ - Step 12644: {'lr': 0.0004936471808390254, 'samples': 2427648, 'steps': 12643, 'loss/train': 0.9389256834983826} -08/30/2021 15:24:15 - INFO - __main__ - Step 12645: {'lr': 0.0004936459920636832, 'samples': 2427840, 'steps': 12644, 'loss/train': 1.2691066265106201} -08/30/2021 15:24:16 - INFO - __main__ - Step 12646: {'lr': 0.0004936448031785576, 'samples': 2428032, 'steps': 12645, 'loss/train': 1.7338886260986328} -08/30/2021 15:24:17 - INFO - __main__ - Step 12647: {'lr': 0.0004936436141836496, 'samples': 2428224, 'steps': 12646, 'loss/train': 1.61439049243927} -08/30/2021 15:24:17 - INFO - __main__ - Step 12648: {'lr': 0.0004936424250789594, 'samples': 2428416, 'steps': 12647, 'loss/train': 2.189393997192383} -08/30/2021 15:24:18 - INFO - __main__ - Step 12649: {'lr': 0.0004936412358644878, 'samples': 2428608, 'steps': 12648, 'loss/train': 1.6907033920288086} -08/30/2021 15:24:18 - INFO - __main__ - Step 12650: {'lr': 0.0004936400465402351, 'samples': 2428800, 'steps': 12649, 'loss/train': 2.043912649154663} -08/30/2021 15:24:20 - INFO - __main__ - Step 12651: {'lr': 0.0004936388571062021, 'samples': 2428992, 'steps': 12650, 'loss/train': 2.0402636528015137} -08/30/2021 15:24:21 - INFO - __main__ - Step 12652: {'lr': 0.0004936376675623892, 'samples': 2429184, 'steps': 12651, 'loss/train': 1.9127482175827026} -08/30/2021 15:24:21 - INFO - __main__ - Step 12653: {'lr': 0.0004936364779087967, 'samples': 2429376, 'steps': 12652, 'loss/train': 0.11245076358318329} -08/30/2021 15:24:21 - INFO - __main__ - Step 12654: {'lr': 0.0004936352881454256, 'samples': 2429568, 'steps': 12653, 'loss/train': 0.10869347304105759} -08/30/2021 15:24:22 - INFO - __main__ - Step 12655: {'lr': 0.000493634098272276, 'samples': 2429760, 'steps': 12654, 'loss/train': 1.4098806381225586} -08/30/2021 15:24:22 - INFO - __main__ - Step 12656: {'lr': 0.0004936329082893488, 'samples': 2429952, 'steps': 12655, 'loss/train': 1.5289244651794434} -08/30/2021 15:24:22 - INFO - __main__ - Step 12657: {'lr': 0.0004936317181966443, 'samples': 2430144, 'steps': 12656, 'loss/train': 1.7236436605453491} -08/30/2021 15:24:24 - INFO - __main__ - Step 12658: {'lr': 0.000493630527994163, 'samples': 2430336, 'steps': 12657, 'loss/train': 1.7598484754562378} -08/30/2021 15:24:24 - INFO - __main__ - Step 12659: {'lr': 0.0004936293376819058, 'samples': 2430528, 'steps': 12658, 'loss/train': 1.7739248275756836} -08/30/2021 15:24:25 - INFO - __main__ - Step 12660: {'lr': 0.0004936281472598728, 'samples': 2430720, 'steps': 12659, 'loss/train': 1.8535062074661255} -08/30/2021 15:24:25 - INFO - __main__ - Step 12661: {'lr': 0.0004936269567280648, 'samples': 2430912, 'steps': 12660, 'loss/train': 1.5991106033325195} -08/30/2021 15:24:25 - INFO - __main__ - Step 12662: {'lr': 0.0004936257660864822, 'samples': 2431104, 'steps': 12661, 'loss/train': 1.926518201828003} -08/30/2021 15:24:27 - INFO - __main__ - Step 12663: {'lr': 0.0004936245753351256, 'samples': 2431296, 'steps': 12662, 'loss/train': 1.5261632204055786} -08/30/2021 15:24:27 - INFO - __main__ - Step 12664: {'lr': 0.0004936233844739955, 'samples': 2431488, 'steps': 12663, 'loss/train': 1.7146270275115967} -08/30/2021 15:24:28 - INFO - __main__ - Step 12665: {'lr': 0.0004936221935030924, 'samples': 2431680, 'steps': 12664, 'loss/train': 1.2206121683120728} -08/30/2021 15:24:28 - INFO - __main__ - Step 12666: {'lr': 0.000493621002422417, 'samples': 2431872, 'steps': 12665, 'loss/train': 0.9639013409614563} -08/30/2021 15:24:28 - INFO - __main__ - Step 12667: {'lr': 0.0004936198112319698, 'samples': 2432064, 'steps': 12666, 'loss/train': 2.054918050765991} -08/30/2021 15:24:30 - INFO - __main__ - Step 12668: {'lr': 0.0004936186199317511, 'samples': 2432256, 'steps': 12667, 'loss/train': 1.744736909866333} -08/30/2021 15:24:30 - INFO - __main__ - Step 12669: {'lr': 0.0004936174285217618, 'samples': 2432448, 'steps': 12668, 'loss/train': 1.7439709901809692} -08/30/2021 15:24:31 - INFO - __main__ - Step 12670: {'lr': 0.0004936162370020021, 'samples': 2432640, 'steps': 12669, 'loss/train': 1.9177600145339966} -08/30/2021 15:24:31 - INFO - __main__ - Step 12671: {'lr': 0.0004936150453724727, 'samples': 2432832, 'steps': 12670, 'loss/train': 1.896408200263977} -08/30/2021 15:24:31 - INFO - __main__ - Step 12672: {'lr': 0.0004936138536331742, 'samples': 2433024, 'steps': 12671, 'loss/train': 2.183018207550049} -08/30/2021 15:24:33 - INFO - __main__ - Step 12673: {'lr': 0.000493612661784107, 'samples': 2433216, 'steps': 12672, 'loss/train': 1.9232347011566162} -08/30/2021 15:24:34 - INFO - __main__ - Step 12674: {'lr': 0.0004936114698252717, 'samples': 2433408, 'steps': 12673, 'loss/train': 0.4394769072532654} -08/30/2021 15:24:34 - INFO - __main__ - Step 12675: {'lr': 0.0004936102777566688, 'samples': 2433600, 'steps': 12674, 'loss/train': 1.6537195444107056} -08/30/2021 15:24:34 - INFO - __main__ - Step 12676: {'lr': 0.0004936090855782989, 'samples': 2433792, 'steps': 12675, 'loss/train': 1.8253090381622314} -08/30/2021 15:24:35 - INFO - __main__ - Step 12677: {'lr': 0.0004936078932901625, 'samples': 2433984, 'steps': 12676, 'loss/train': 1.7961907386779785} -08/30/2021 15:24:36 - INFO - __main__ - Step 12678: {'lr': 0.0004936067008922602, 'samples': 2434176, 'steps': 12677, 'loss/train': 1.5258166790008545} -08/30/2021 15:24:37 - INFO - __main__ - Step 12679: {'lr': 0.0004936055083845924, 'samples': 2434368, 'steps': 12678, 'loss/train': 1.9338176250457764} -08/30/2021 15:24:37 - INFO - __main__ - Step 12680: {'lr': 0.0004936043157671597, 'samples': 2434560, 'steps': 12679, 'loss/train': 1.5246820449829102} -08/30/2021 15:24:37 - INFO - __main__ - Step 12681: {'lr': 0.0004936031230399628, 'samples': 2434752, 'steps': 12680, 'loss/train': 2.037579298019409} -08/30/2021 15:24:38 - INFO - __main__ - Step 12682: {'lr': 0.000493601930203002, 'samples': 2434944, 'steps': 12681, 'loss/train': 1.7349222898483276} -08/30/2021 15:24:38 - INFO - __main__ - Step 12683: {'lr': 0.0004936007372562778, 'samples': 2435136, 'steps': 12682, 'loss/train': 1.0998066663742065} -08/30/2021 15:24:40 - INFO - __main__ - Step 12684: {'lr': 0.0004935995441997911, 'samples': 2435328, 'steps': 12683, 'loss/train': 2.121187210083008} -08/30/2021 15:24:40 - INFO - __main__ - Step 12685: {'lr': 0.000493598351033542, 'samples': 2435520, 'steps': 12684, 'loss/train': 1.8788855075836182} -08/30/2021 15:24:40 - INFO - __main__ - Step 12686: {'lr': 0.0004935971577575313, 'samples': 2435712, 'steps': 12685, 'loss/train': 2.2197322845458984} -08/30/2021 15:24:41 - INFO - __main__ - Step 12687: {'lr': 0.0004935959643717595, 'samples': 2435904, 'steps': 12686, 'loss/train': 1.721380591392517} -08/30/2021 15:24:41 - INFO - __main__ - Step 12688: {'lr': 0.0004935947708762272, 'samples': 2436096, 'steps': 12687, 'loss/train': 2.050400733947754} -08/30/2021 15:24:43 - INFO - __main__ - Step 12689: {'lr': 0.0004935935772709348, 'samples': 2436288, 'steps': 12688, 'loss/train': 1.7758708000183105} -08/30/2021 15:24:43 - INFO - __main__ - Step 12690: {'lr': 0.0004935923835558829, 'samples': 2436480, 'steps': 12689, 'loss/train': 1.0109050273895264} -08/30/2021 15:24:44 - INFO - __main__ - Step 12691: {'lr': 0.0004935911897310719, 'samples': 2436672, 'steps': 12690, 'loss/train': 1.314550518989563} -08/30/2021 15:24:44 - INFO - __main__ - Step 12692: {'lr': 0.0004935899957965027, 'samples': 2436864, 'steps': 12691, 'loss/train': 1.9543402194976807} -08/30/2021 15:24:44 - INFO - __main__ - Step 12693: {'lr': 0.0004935888017521754, 'samples': 2437056, 'steps': 12692, 'loss/train': 1.5407357215881348} -08/30/2021 15:24:46 - INFO - __main__ - Step 12694: {'lr': 0.0004935876075980908, 'samples': 2437248, 'steps': 12693, 'loss/train': 1.6913949251174927} -08/30/2021 15:24:47 - INFO - __main__ - Step 12695: {'lr': 0.0004935864133342495, 'samples': 2437440, 'steps': 12694, 'loss/train': 1.5512062311172485} -08/30/2021 15:24:47 - INFO - __main__ - Step 12696: {'lr': 0.0004935852189606517, 'samples': 2437632, 'steps': 12695, 'loss/train': 1.8069430589675903} -08/30/2021 15:24:48 - INFO - __main__ - Step 12697: {'lr': 0.0004935840244772984, 'samples': 2437824, 'steps': 12696, 'loss/train': 1.825741171836853} -08/30/2021 15:24:48 - INFO - __main__ - Step 12698: {'lr': 0.0004935828298841898, 'samples': 2438016, 'steps': 12697, 'loss/train': 1.56669020652771} -08/30/2021 15:24:49 - INFO - __main__ - Step 12699: {'lr': 0.0004935816351813265, 'samples': 2438208, 'steps': 12698, 'loss/train': 1.4825313091278076} -08/30/2021 15:24:50 - INFO - __main__ - Step 12700: {'lr': 0.0004935804403687091, 'samples': 2438400, 'steps': 12699, 'loss/train': 1.686589002609253} -08/30/2021 15:24:50 - INFO - __main__ - Step 12701: {'lr': 0.0004935792454463381, 'samples': 2438592, 'steps': 12700, 'loss/train': 1.9009692668914795} -08/30/2021 15:24:51 - INFO - __main__ - Step 12702: {'lr': 0.000493578050414214, 'samples': 2438784, 'steps': 12701, 'loss/train': 0.9109597206115723} -08/30/2021 15:24:51 - INFO - __main__ - Step 12703: {'lr': 0.0004935768552723375, 'samples': 2438976, 'steps': 12702, 'loss/train': 1.5171445608139038} -08/30/2021 15:24:52 - INFO - __main__ - Step 12704: {'lr': 0.000493575660020709, 'samples': 2439168, 'steps': 12703, 'loss/train': 1.1090315580368042} -08/30/2021 15:24:53 - INFO - __main__ - Step 12705: {'lr': 0.000493574464659329, 'samples': 2439360, 'steps': 12704, 'loss/train': 1.2787632942199707} -08/30/2021 15:24:53 - INFO - __main__ - Step 12706: {'lr': 0.0004935732691881981, 'samples': 2439552, 'steps': 12705, 'loss/train': 1.6112338304519653} -08/30/2021 15:24:54 - INFO - __main__ - Step 12707: {'lr': 0.0004935720736073169, 'samples': 2439744, 'steps': 12706, 'loss/train': 1.8073229789733887} -08/30/2021 15:24:54 - INFO - __main__ - Step 12708: {'lr': 0.0004935708779166859, 'samples': 2439936, 'steps': 12707, 'loss/train': 1.8363302946090698} -08/30/2021 15:24:56 - INFO - __main__ - Step 12709: {'lr': 0.0004935696821163056, 'samples': 2440128, 'steps': 12708, 'loss/train': 1.8159846067428589} -08/30/2021 15:24:57 - INFO - __main__ - Step 12710: {'lr': 0.0004935684862061766, 'samples': 2440320, 'steps': 12709, 'loss/train': 1.759819746017456} -08/30/2021 15:24:57 - INFO - __main__ - Step 12711: {'lr': 0.0004935672901862993, 'samples': 2440512, 'steps': 12710, 'loss/train': 2.3868110179901123} -08/30/2021 15:24:57 - INFO - __main__ - Step 12712: {'lr': 0.0004935660940566744, 'samples': 2440704, 'steps': 12711, 'loss/train': 1.9664065837860107} -08/30/2021 15:24:58 - INFO - __main__ - Step 12713: {'lr': 0.0004935648978173024, 'samples': 2440896, 'steps': 12712, 'loss/train': 2.251214027404785} -08/30/2021 15:24:58 - INFO - __main__ - Step 12714: {'lr': 0.0004935637014681837, 'samples': 2441088, 'steps': 12713, 'loss/train': 1.8730881214141846} -08/30/2021 15:25:00 - INFO - __main__ - Step 12715: {'lr': 0.0004935625050093191, 'samples': 2441280, 'steps': 12714, 'loss/train': 2.399866819381714} -08/30/2021 15:25:00 - INFO - __main__ - Step 12716: {'lr': 0.000493561308440709, 'samples': 2441472, 'steps': 12715, 'loss/train': 1.6971989870071411} -08/30/2021 15:25:00 - INFO - __main__ - Step 12717: {'lr': 0.0004935601117623538, 'samples': 2441664, 'steps': 12716, 'loss/train': 2.003096580505371} -08/30/2021 15:25:01 - INFO - __main__ - Step 12718: {'lr': 0.0004935589149742542, 'samples': 2441856, 'steps': 12717, 'loss/train': 2.3252768516540527} -08/30/2021 15:25:01 - INFO - __main__ - Step 12719: {'lr': 0.0004935577180764108, 'samples': 2442048, 'steps': 12718, 'loss/train': 1.8923490047454834} -08/30/2021 15:25:04 - INFO - __main__ - Step 12720: {'lr': 0.000493556521068824, 'samples': 2442240, 'steps': 12719, 'loss/train': 2.1121156215667725} -08/30/2021 15:25:04 - INFO - __main__ - Step 12721: {'lr': 0.0004935553239514943, 'samples': 2442432, 'steps': 12720, 'loss/train': 1.3137507438659668} -08/30/2021 15:25:04 - INFO - __main__ - Step 12722: {'lr': 0.0004935541267244225, 'samples': 2442624, 'steps': 12721, 'loss/train': 1.5639243125915527} -08/30/2021 15:25:05 - INFO - __main__ - Step 12723: {'lr': 0.0004935529293876088, 'samples': 2442816, 'steps': 12722, 'loss/train': 1.3681550025939941} -08/30/2021 15:25:05 - INFO - __main__ - Step 12724: {'lr': 0.000493551731941054, 'samples': 2443008, 'steps': 12723, 'loss/train': 2.215101718902588} -08/30/2021 15:25:05 - INFO - __main__ - Step 12725: {'lr': 0.0004935505343847586, 'samples': 2443200, 'steps': 12724, 'loss/train': 0.5666799545288086} -08/30/2021 15:25:06 - INFO - __main__ - Step 12726: {'lr': 0.000493549336718723, 'samples': 2443392, 'steps': 12725, 'loss/train': 1.3400561809539795} -08/30/2021 15:25:08 - INFO - __main__ - Step 12727: {'lr': 0.0004935481389429479, 'samples': 2443584, 'steps': 12726, 'loss/train': 3.0213704109191895} -08/30/2021 15:25:08 - INFO - __main__ - Step 12728: {'lr': 0.0004935469410574337, 'samples': 2443776, 'steps': 12727, 'loss/train': 2.337177038192749} -08/30/2021 15:25:09 - INFO - __main__ - Step 12729: {'lr': 0.000493545743062181, 'samples': 2443968, 'steps': 12728, 'loss/train': 2.118790864944458} -08/30/2021 15:25:09 - INFO - __main__ - Step 12730: {'lr': 0.0004935445449571903, 'samples': 2444160, 'steps': 12729, 'loss/train': 0.36622175574302673} -08/30/2021 15:25:09 - INFO - __main__ - Step 12731: {'lr': 0.0004935433467424624, 'samples': 2444352, 'steps': 12730, 'loss/train': 2.5760347843170166} -08/30/2021 15:25:10 - INFO - __main__ - Step 12732: {'lr': 0.0004935421484179974, 'samples': 2444544, 'steps': 12731, 'loss/train': 1.9112876653671265} -08/30/2021 15:25:11 - INFO - __main__ - Step 12733: {'lr': 0.0004935409499837962, 'samples': 2444736, 'steps': 12732, 'loss/train': 0.34345391392707825} -08/30/2021 15:25:12 - INFO - __main__ - Step 12734: {'lr': 0.0004935397514398591, 'samples': 2444928, 'steps': 12733, 'loss/train': 2.2672271728515625} -08/30/2021 15:25:12 - INFO - __main__ - Step 12735: {'lr': 0.0004935385527861869, 'samples': 2445120, 'steps': 12734, 'loss/train': 2.1733508110046387} -08/30/2021 15:25:12 - INFO - __main__ - Step 12736: {'lr': 0.0004935373540227798, 'samples': 2445312, 'steps': 12735, 'loss/train': 1.9029417037963867} -08/30/2021 15:25:13 - INFO - __main__ - Step 12737: {'lr': 0.0004935361551496387, 'samples': 2445504, 'steps': 12736, 'loss/train': 2.114182472229004} -08/30/2021 15:25:14 - INFO - __main__ - Step 12738: {'lr': 0.0004935349561667638, 'samples': 2445696, 'steps': 12737, 'loss/train': 2.133676290512085} -08/30/2021 15:25:15 - INFO - __main__ - Step 12739: {'lr': 0.000493533757074156, 'samples': 2445888, 'steps': 12738, 'loss/train': 5.65504789352417} -08/30/2021 15:25:15 - INFO - __main__ - Step 12740: {'lr': 0.0004935325578718155, 'samples': 2446080, 'steps': 12739, 'loss/train': 2.1850454807281494} -08/30/2021 15:25:15 - INFO - __main__ - Step 12741: {'lr': 0.000493531358559743, 'samples': 2446272, 'steps': 12740, 'loss/train': 1.9255011081695557} -08/30/2021 15:25:16 - INFO - __main__ - Step 12742: {'lr': 0.0004935301591379391, 'samples': 2446464, 'steps': 12741, 'loss/train': 1.9801987409591675} -08/30/2021 15:25:17 - INFO - __main__ - Step 12743: {'lr': 0.0004935289596064042, 'samples': 2446656, 'steps': 12742, 'loss/train': 0.8448387980461121} -08/30/2021 15:25:17 - INFO - __main__ - Step 12744: {'lr': 0.0004935277599651389, 'samples': 2446848, 'steps': 12743, 'loss/train': 3.033478021621704} -08/30/2021 15:25:18 - INFO - __main__ - Step 12745: {'lr': 0.0004935265602141437, 'samples': 2447040, 'steps': 12744, 'loss/train': 1.927393913269043} -08/30/2021 15:25:18 - INFO - __main__ - Step 12746: {'lr': 0.0004935253603534193, 'samples': 2447232, 'steps': 12745, 'loss/train': 1.9398053884506226} -08/30/2021 15:25:19 - INFO - __main__ - Step 12747: {'lr': 0.0004935241603829661, 'samples': 2447424, 'steps': 12746, 'loss/train': 1.4622310400009155} -08/30/2021 15:25:21 - INFO - __main__ - Step 12748: {'lr': 0.0004935229603027847, 'samples': 2447616, 'steps': 12747, 'loss/train': 2.3264105319976807} -08/30/2021 15:25:21 - INFO - __main__ - Step 12749: {'lr': 0.0004935217601128755, 'samples': 2447808, 'steps': 12748, 'loss/train': 2.2108681201934814} -08/30/2021 15:25:22 - INFO - __main__ - Step 12750: {'lr': 0.0004935205598132393, 'samples': 2448000, 'steps': 12749, 'loss/train': 2.0789570808410645} -08/30/2021 15:25:22 - INFO - __main__ - Step 12751: {'lr': 0.0004935193594038764, 'samples': 2448192, 'steps': 12750, 'loss/train': 1.9540125131607056} -08/30/2021 15:25:22 - INFO - __main__ - Step 12752: {'lr': 0.0004935181588847876, 'samples': 2448384, 'steps': 12751, 'loss/train': 1.6292519569396973} -08/30/2021 15:25:24 - INFO - __main__ - Step 12753: {'lr': 0.0004935169582559731, 'samples': 2448576, 'steps': 12752, 'loss/train': 2.6580960750579834} -08/30/2021 15:25:24 - INFO - __main__ - Step 12754: {'lr': 0.0004935157575174336, 'samples': 2448768, 'steps': 12753, 'loss/train': 1.4992064237594604} -08/30/2021 15:25:24 - INFO - __main__ - Step 12755: {'lr': 0.0004935145566691698, 'samples': 2448960, 'steps': 12754, 'loss/train': 1.9568040370941162} -08/30/2021 15:25:25 - INFO - __main__ - Step 12756: {'lr': 0.000493513355711182, 'samples': 2449152, 'steps': 12755, 'loss/train': 1.905815601348877} -08/30/2021 15:25:25 - INFO - __main__ - Step 12757: {'lr': 0.0004935121546434708, 'samples': 2449344, 'steps': 12756, 'loss/train': 1.869763970375061} -08/30/2021 15:25:25 - INFO - __main__ - Step 12758: {'lr': 0.0004935109534660368, 'samples': 2449536, 'steps': 12757, 'loss/train': 2.1079020500183105} -08/30/2021 15:25:27 - INFO - __main__ - Step 12759: {'lr': 0.0004935097521788805, 'samples': 2449728, 'steps': 12758, 'loss/train': 1.1101970672607422} -08/30/2021 15:25:27 - INFO - __main__ - Step 12760: {'lr': 0.0004935085507820026, 'samples': 2449920, 'steps': 12759, 'loss/train': 1.996029019355774} -08/30/2021 15:25:28 - INFO - __main__ - Step 12761: {'lr': 0.0004935073492754034, 'samples': 2450112, 'steps': 12760, 'loss/train': 1.956479787826538} -08/30/2021 15:25:28 - INFO - __main__ - Step 12762: {'lr': 0.0004935061476590835, 'samples': 2450304, 'steps': 12761, 'loss/train': 2.4640419483184814} -08/30/2021 15:25:29 - INFO - __main__ - Step 12763: {'lr': 0.0004935049459330437, 'samples': 2450496, 'steps': 12762, 'loss/train': 2.0030322074890137} -08/30/2021 15:25:30 - INFO - __main__ - Step 12764: {'lr': 0.0004935037440972841, 'samples': 2450688, 'steps': 12763, 'loss/train': 1.5955910682678223} -08/30/2021 15:25:30 - INFO - __main__ - Step 12765: {'lr': 0.0004935025421518056, 'samples': 2450880, 'steps': 12764, 'loss/train': 1.809960961341858} -08/30/2021 15:25:31 - INFO - __main__ - Step 12766: {'lr': 0.0004935013400966086, 'samples': 2451072, 'steps': 12765, 'loss/train': 1.6778466701507568} -08/30/2021 15:25:31 - INFO - __main__ - Step 12767: {'lr': 0.0004935001379316935, 'samples': 2451264, 'steps': 12766, 'loss/train': 1.922008752822876} -08/30/2021 15:25:31 - INFO - __main__ - Step 12768: {'lr': 0.0004934989356570611, 'samples': 2451456, 'steps': 12767, 'loss/train': 2.5410382747650146} -08/30/2021 15:25:33 - INFO - __main__ - Step 12769: {'lr': 0.0004934977332727118, 'samples': 2451648, 'steps': 12768, 'loss/train': 2.064488410949707} -08/30/2021 15:25:33 - INFO - __main__ - Step 12770: {'lr': 0.0004934965307786464, 'samples': 2451840, 'steps': 12769, 'loss/train': 1.5209386348724365} -08/30/2021 15:25:34 - INFO - __main__ - Step 12771: {'lr': 0.0004934953281748649, 'samples': 2452032, 'steps': 12770, 'loss/train': 1.9649244546890259} -08/30/2021 15:25:34 - INFO - __main__ - Step 12772: {'lr': 0.0004934941254613684, 'samples': 2452224, 'steps': 12771, 'loss/train': 1.8762067556381226} -08/30/2021 15:25:35 - INFO - __main__ - Step 12773: {'lr': 0.0004934929226381572, 'samples': 2452416, 'steps': 12772, 'loss/train': 1.9542076587677002} -08/30/2021 15:25:36 - INFO - __main__ - Step 12774: {'lr': 0.0004934917197052317, 'samples': 2452608, 'steps': 12773, 'loss/train': 1.2381634712219238} -08/30/2021 15:25:37 - INFO - __main__ - Step 12775: {'lr': 0.0004934905166625926, 'samples': 2452800, 'steps': 12774, 'loss/train': 1.5721044540405273} -08/30/2021 15:25:37 - INFO - __main__ - Step 12776: {'lr': 0.0004934893135102405, 'samples': 2452992, 'steps': 12775, 'loss/train': 2.069021224975586} -08/30/2021 15:25:37 - INFO - __main__ - Step 12777: {'lr': 0.0004934881102481759, 'samples': 2453184, 'steps': 12776, 'loss/train': 1.5824388265609741} -08/30/2021 15:25:38 - INFO - __main__ - Step 12778: {'lr': 0.0004934869068763992, 'samples': 2453376, 'steps': 12777, 'loss/train': 1.8608088493347168} -08/30/2021 15:25:38 - INFO - __main__ - Step 12779: {'lr': 0.0004934857033949112, 'samples': 2453568, 'steps': 12778, 'loss/train': 1.4795398712158203} -08/30/2021 15:25:40 - INFO - __main__ - Step 12780: {'lr': 0.0004934844998037122, 'samples': 2453760, 'steps': 12779, 'loss/train': 0.2948019802570343} -08/30/2021 15:25:40 - INFO - __main__ - Step 12781: {'lr': 0.0004934832961028028, 'samples': 2453952, 'steps': 12780, 'loss/train': 2.3595540523529053} -08/30/2021 15:25:40 - INFO - __main__ - Step 12782: {'lr': 0.0004934820922921836, 'samples': 2454144, 'steps': 12781, 'loss/train': 1.6248605251312256} -08/30/2021 15:25:41 - INFO - __main__ - Step 12783: {'lr': 0.0004934808883718553, 'samples': 2454336, 'steps': 12782, 'loss/train': 1.213696837425232} -08/30/2021 15:25:41 - INFO - __main__ - Step 12784: {'lr': 0.0004934796843418181, 'samples': 2454528, 'steps': 12783, 'loss/train': 2.4891302585601807} -08/30/2021 15:25:43 - INFO - __main__ - Step 12785: {'lr': 0.0004934784802020728, 'samples': 2454720, 'steps': 12784, 'loss/train': 1.2858890295028687} -08/30/2021 15:25:43 - INFO - __main__ - Step 12786: {'lr': 0.0004934772759526198, 'samples': 2454912, 'steps': 12785, 'loss/train': 0.19185945391654968} -08/30/2021 15:25:44 - INFO - __main__ - Step 12787: {'lr': 0.0004934760715934597, 'samples': 2455104, 'steps': 12786, 'loss/train': 1.5422052145004272} -08/30/2021 15:25:44 - INFO - __main__ - Step 12788: {'lr': 0.0004934748671245931, 'samples': 2455296, 'steps': 12787, 'loss/train': 1.79157292842865} -08/30/2021 15:25:44 - INFO - __main__ - Step 12789: {'lr': 0.0004934736625460203, 'samples': 2455488, 'steps': 12788, 'loss/train': 1.1268810033798218} -08/30/2021 15:25:45 - INFO - __main__ - Step 12790: {'lr': 0.0004934724578577422, 'samples': 2455680, 'steps': 12789, 'loss/train': 1.5829182863235474} -08/30/2021 15:25:46 - INFO - __main__ - Step 12791: {'lr': 0.0004934712530597591, 'samples': 2455872, 'steps': 12790, 'loss/train': 1.360123872756958} -08/30/2021 15:25:47 - INFO - __main__ - Step 12792: {'lr': 0.0004934700481520717, 'samples': 2456064, 'steps': 12791, 'loss/train': 1.7475991249084473} -08/30/2021 15:25:47 - INFO - __main__ - Step 12793: {'lr': 0.0004934688431346804, 'samples': 2456256, 'steps': 12792, 'loss/train': 1.7553184032440186} -08/30/2021 15:25:48 - INFO - __main__ - Step 12794: {'lr': 0.0004934676380075857, 'samples': 2456448, 'steps': 12793, 'loss/train': 1.767801284790039} -08/30/2021 15:25:48 - INFO - __main__ - Step 12795: {'lr': 0.0004934664327707884, 'samples': 2456640, 'steps': 12794, 'loss/train': 1.4440882205963135} -08/30/2021 15:25:49 - INFO - __main__ - Step 12796: {'lr': 0.0004934652274242888, 'samples': 2456832, 'steps': 12795, 'loss/train': 2.174332857131958} -08/30/2021 15:25:50 - INFO - __main__ - Step 12797: {'lr': 0.0004934640219680875, 'samples': 2457024, 'steps': 12796, 'loss/train': 1.8413528203964233} -08/30/2021 15:25:50 - INFO - __main__ - Step 12798: {'lr': 0.0004934628164021851, 'samples': 2457216, 'steps': 12797, 'loss/train': 2.294133424758911} -08/30/2021 15:25:51 - INFO - __main__ - Step 12799: {'lr': 0.0004934616107265821, 'samples': 2457408, 'steps': 12798, 'loss/train': 2.405320882797241} -08/30/2021 15:25:51 - INFO - __main__ - Step 12800: {'lr': 0.0004934604049412791, 'samples': 2457600, 'steps': 12799, 'loss/train': 2.5989420413970947} -08/30/2021 15:25:53 - INFO - __main__ - Step 12801: {'lr': 0.0004934591990462766, 'samples': 2457792, 'steps': 12800, 'loss/train': 1.8813281059265137} -08/30/2021 15:25:53 - INFO - __main__ - Step 12802: {'lr': 0.0004934579930415751, 'samples': 2457984, 'steps': 12801, 'loss/train': 2.196131944656372} -08/30/2021 15:25:53 - INFO - __main__ - Step 12803: {'lr': 0.0004934567869271751, 'samples': 2458176, 'steps': 12802, 'loss/train': 1.6211522817611694} -08/30/2021 15:25:54 - INFO - __main__ - Step 12804: {'lr': 0.0004934555807030774, 'samples': 2458368, 'steps': 12803, 'loss/train': 2.0689356327056885} -08/30/2021 15:25:54 - INFO - __main__ - Step 12805: {'lr': 0.0004934543743692822, 'samples': 2458560, 'steps': 12804, 'loss/train': 1.8443782329559326} -08/30/2021 15:25:57 - INFO - __main__ - Step 12806: {'lr': 0.0004934531679257903, 'samples': 2458752, 'steps': 12805, 'loss/train': 1.8418288230895996} -08/30/2021 15:25:57 - INFO - __main__ - Step 12807: {'lr': 0.0004934519613726022, 'samples': 2458944, 'steps': 12806, 'loss/train': 1.5568180084228516} -08/30/2021 15:25:58 - INFO - __main__ - Step 12808: {'lr': 0.0004934507547097183, 'samples': 2459136, 'steps': 12807, 'loss/train': 1.6972455978393555} -08/30/2021 15:25:58 - INFO - __main__ - Step 12809: {'lr': 0.0004934495479371393, 'samples': 2459328, 'steps': 12808, 'loss/train': 1.9759559631347656} -08/30/2021 15:25:58 - INFO - __main__ - Step 12810: {'lr': 0.0004934483410548658, 'samples': 2459520, 'steps': 12809, 'loss/train': 1.7882384061813354} -08/30/2021 15:25:59 - INFO - __main__ - Step 12811: {'lr': 0.0004934471340628981, 'samples': 2459712, 'steps': 12810, 'loss/train': 1.5598998069763184} -08/30/2021 15:26:00 - INFO - __main__ - Step 12812: {'lr': 0.000493445926961237, 'samples': 2459904, 'steps': 12811, 'loss/train': 2.299872398376465} -08/30/2021 15:26:01 - INFO - __main__ - Step 12813: {'lr': 0.0004934447197498828, 'samples': 2460096, 'steps': 12812, 'loss/train': 1.3567181825637817} -08/30/2021 15:26:01 - INFO - __main__ - Step 12814: {'lr': 0.0004934435124288362, 'samples': 2460288, 'steps': 12813, 'loss/train': 1.9463375806808472} -08/30/2021 15:26:02 - INFO - __main__ - Step 12815: {'lr': 0.0004934423049980977, 'samples': 2460480, 'steps': 12814, 'loss/train': 2.5686609745025635} -08/30/2021 15:26:02 - INFO - __main__ - Step 12816: {'lr': 0.0004934410974576679, 'samples': 2460672, 'steps': 12815, 'loss/train': 2.101588487625122} -08/30/2021 15:26:04 - INFO - __main__ - Step 12817: {'lr': 0.0004934398898075472, 'samples': 2460864, 'steps': 12816, 'loss/train': 1.9919829368591309} -08/30/2021 15:26:04 - INFO - __main__ - Step 12818: {'lr': 0.0004934386820477363, 'samples': 2461056, 'steps': 12817, 'loss/train': 2.2948756217956543} -08/30/2021 15:26:05 - INFO - __main__ - Step 12819: {'lr': 0.0004934374741782357, 'samples': 2461248, 'steps': 12818, 'loss/train': 0.21224519610404968} -08/30/2021 15:26:05 - INFO - __main__ - Step 12820: {'lr': 0.000493436266199046, 'samples': 2461440, 'steps': 12819, 'loss/train': 2.1891863346099854} -08/30/2021 15:26:05 - INFO - __main__ - Step 12821: {'lr': 0.0004934350581101676, 'samples': 2461632, 'steps': 12820, 'loss/train': 2.082596778869629} -08/30/2021 15:26:07 - INFO - __main__ - Step 12822: {'lr': 0.0004934338499116011, 'samples': 2461824, 'steps': 12821, 'loss/train': 2.3154423236846924} -08/30/2021 15:26:08 - INFO - __main__ - Step 12823: {'lr': 0.0004934326416033471, 'samples': 2462016, 'steps': 12822, 'loss/train': 1.5506004095077515} -08/30/2021 15:26:08 - INFO - __main__ - Step 12824: {'lr': 0.0004934314331854061, 'samples': 2462208, 'steps': 12823, 'loss/train': 1.188932180404663} -08/30/2021 15:26:08 - INFO - __main__ - Step 12825: {'lr': 0.0004934302246577786, 'samples': 2462400, 'steps': 12824, 'loss/train': 0.27423277497291565} -08/30/2021 15:26:09 - INFO - __main__ - Step 12826: {'lr': 0.0004934290160204652, 'samples': 2462592, 'steps': 12825, 'loss/train': 0.6592503786087036} -08/30/2021 15:26:09 - INFO - __main__ - Step 12827: {'lr': 0.0004934278072734666, 'samples': 2462784, 'steps': 12826, 'loss/train': 1.895760178565979} -08/30/2021 15:26:11 - INFO - __main__ - Step 12828: {'lr': 0.000493426598416783, 'samples': 2462976, 'steps': 12827, 'loss/train': 1.7769666910171509} -08/30/2021 15:26:11 - INFO - __main__ - Step 12829: {'lr': 0.0004934253894504152, 'samples': 2463168, 'steps': 12828, 'loss/train': 2.225257635116577} -08/30/2021 15:26:11 - INFO - __main__ - Step 12830: {'lr': 0.0004934241803743637, 'samples': 2463360, 'steps': 12829, 'loss/train': 1.3340060710906982} -08/30/2021 15:26:12 - INFO - __main__ - Step 12831: {'lr': 0.000493422971188629, 'samples': 2463552, 'steps': 12830, 'loss/train': 1.8774023056030273} -08/30/2021 15:26:12 - INFO - __main__ - Step 12832: {'lr': 0.0004934217618932117, 'samples': 2463744, 'steps': 12831, 'loss/train': 1.8951119184494019} -08/30/2021 15:26:14 - INFO - __main__ - Step 12833: {'lr': 0.0004934205524881123, 'samples': 2463936, 'steps': 12832, 'loss/train': 1.9925721883773804} -08/30/2021 15:26:14 - INFO - __main__ - Step 12834: {'lr': 0.0004934193429733312, 'samples': 2464128, 'steps': 12833, 'loss/train': 2.1481235027313232} -08/30/2021 15:26:14 - INFO - __main__ - Step 12835: {'lr': 0.0004934181333488693, 'samples': 2464320, 'steps': 12834, 'loss/train': 1.726758360862732} -08/30/2021 15:26:15 - INFO - __main__ - Step 12836: {'lr': 0.0004934169236147268, 'samples': 2464512, 'steps': 12835, 'loss/train': 1.7222379446029663} -08/30/2021 15:26:15 - INFO - __main__ - Step 12837: {'lr': 0.0004934157137709044, 'samples': 2464704, 'steps': 12836, 'loss/train': 2.0570788383483887} -08/30/2021 15:26:15 - INFO - __main__ - Step 12838: {'lr': 0.0004934145038174028, 'samples': 2464896, 'steps': 12837, 'loss/train': 1.9421387910842896} -08/30/2021 15:26:17 - INFO - __main__ - Step 12839: {'lr': 0.0004934132937542223, 'samples': 2465088, 'steps': 12838, 'loss/train': 2.1006321907043457} -08/30/2021 15:26:18 - INFO - __main__ - Step 12840: {'lr': 0.0004934120835813634, 'samples': 2465280, 'steps': 12839, 'loss/train': 1.5314640998840332} -08/30/2021 15:26:18 - INFO - __main__ - Step 12841: {'lr': 0.0004934108732988269, 'samples': 2465472, 'steps': 12840, 'loss/train': 1.9027420282363892} -08/30/2021 15:26:18 - INFO - __main__ - Step 12842: {'lr': 0.0004934096629066133, 'samples': 2465664, 'steps': 12841, 'loss/train': 2.09247088432312} -08/30/2021 15:26:19 - INFO - __main__ - Step 12843: {'lr': 0.0004934084524047229, 'samples': 2465856, 'steps': 12842, 'loss/train': 2.0536134243011475} -08/30/2021 15:26:20 - INFO - __main__ - Step 12844: {'lr': 0.0004934072417931564, 'samples': 2466048, 'steps': 12843, 'loss/train': 2.0693199634552} -08/30/2021 15:26:21 - INFO - __main__ - Step 12845: {'lr': 0.0004934060310719145, 'samples': 2466240, 'steps': 12844, 'loss/train': 1.6274563074111938} -08/30/2021 15:26:21 - INFO - __main__ - Step 12846: {'lr': 0.0004934048202409974, 'samples': 2466432, 'steps': 12845, 'loss/train': 1.8991349935531616} -08/30/2021 15:26:22 - INFO - __main__ - Step 12847: {'lr': 0.000493403609300406, 'samples': 2466624, 'steps': 12846, 'loss/train': 1.8625999689102173} -08/30/2021 15:26:22 - INFO - __main__ - Step 12848: {'lr': 0.0004934023982501406, 'samples': 2466816, 'steps': 12847, 'loss/train': 1.3336262702941895} -08/30/2021 15:26:22 - INFO - __main__ - Step 12849: {'lr': 0.000493401187090202, 'samples': 2467008, 'steps': 12848, 'loss/train': 1.5156720876693726} -08/30/2021 15:26:24 - INFO - __main__ - Step 12850: {'lr': 0.0004933999758205904, 'samples': 2467200, 'steps': 12849, 'loss/train': 2.161287307739258} -08/30/2021 15:26:24 - INFO - __main__ - Step 12851: {'lr': 0.0004933987644413066, 'samples': 2467392, 'steps': 12850, 'loss/train': 2.1711788177490234} -08/30/2021 15:26:24 - INFO - __main__ - Step 12852: {'lr': 0.0004933975529523511, 'samples': 2467584, 'steps': 12851, 'loss/train': 2.485257625579834} -08/30/2021 15:26:25 - INFO - __main__ - Step 12853: {'lr': 0.0004933963413537244, 'samples': 2467776, 'steps': 12852, 'loss/train': 2.2051398754119873} -08/30/2021 15:26:25 - INFO - __main__ - Step 12854: {'lr': 0.000493395129645427, 'samples': 2467968, 'steps': 12853, 'loss/train': 0.40571528673171997} -08/30/2021 15:26:27 - INFO - __main__ - Step 12855: {'lr': 0.0004933939178274596, 'samples': 2468160, 'steps': 12854, 'loss/train': 2.2921669483184814} -08/30/2021 15:26:28 - INFO - __main__ - Step 12856: {'lr': 0.0004933927058998226, 'samples': 2468352, 'steps': 12855, 'loss/train': 0.5320433378219604} -08/30/2021 15:26:28 - INFO - __main__ - Step 12857: {'lr': 0.0004933914938625166, 'samples': 2468544, 'steps': 12856, 'loss/train': 0.6518922448158264} -08/30/2021 15:26:29 - INFO - __main__ - Step 12858: {'lr': 0.0004933902817155422, 'samples': 2468736, 'steps': 12857, 'loss/train': 0.6996716260910034} -08/30/2021 15:26:29 - INFO - __main__ - Step 12859: {'lr': 0.0004933890694588998, 'samples': 2468928, 'steps': 12858, 'loss/train': 2.0849716663360596} -08/30/2021 15:26:29 - INFO - __main__ - Step 12860: {'lr': 0.0004933878570925901, 'samples': 2469120, 'steps': 12859, 'loss/train': 1.9486299753189087} -08/30/2021 15:26:31 - INFO - __main__ - Step 12861: {'lr': 0.0004933866446166136, 'samples': 2469312, 'steps': 12860, 'loss/train': 1.7212613821029663} -08/30/2021 15:26:32 - INFO - __main__ - Step 12862: {'lr': 0.0004933854320309708, 'samples': 2469504, 'steps': 12861, 'loss/train': 1.654227375984192} -08/30/2021 15:26:32 - INFO - __main__ - Step 12863: {'lr': 0.0004933842193356624, 'samples': 2469696, 'steps': 12862, 'loss/train': 2.332019329071045} -08/30/2021 15:26:33 - INFO - __main__ - Step 12864: {'lr': 0.0004933830065306887, 'samples': 2469888, 'steps': 12863, 'loss/train': 1.7721030712127686} -08/30/2021 15:26:33 - INFO - __main__ - Step 12865: {'lr': 0.0004933817936160504, 'samples': 2470080, 'steps': 12864, 'loss/train': 1.8317217826843262} -08/30/2021 15:26:33 - INFO - __main__ - Step 12866: {'lr': 0.0004933805805917479, 'samples': 2470272, 'steps': 12865, 'loss/train': 1.6601803302764893} -08/30/2021 15:26:35 - INFO - __main__ - Step 12867: {'lr': 0.000493379367457782, 'samples': 2470464, 'steps': 12866, 'loss/train': 2.19952130317688} -08/30/2021 15:26:36 - INFO - __main__ - Step 12868: {'lr': 0.0004933781542141532, 'samples': 2470656, 'steps': 12867, 'loss/train': 1.25111722946167} -08/30/2021 15:26:36 - INFO - __main__ - Step 12869: {'lr': 0.0004933769408608618, 'samples': 2470848, 'steps': 12868, 'loss/train': 1.9844472408294678} -08/30/2021 15:26:36 - INFO - __main__ - Step 12870: {'lr': 0.0004933757273979086, 'samples': 2471040, 'steps': 12869, 'loss/train': 1.5841888189315796} -08/30/2021 15:26:37 - INFO - __main__ - Step 12871: {'lr': 0.0004933745138252939, 'samples': 2471232, 'steps': 12870, 'loss/train': 1.4705384969711304} -08/30/2021 15:26:38 - INFO - __main__ - Step 12872: {'lr': 0.0004933733001430186, 'samples': 2471424, 'steps': 12871, 'loss/train': 0.19169384241104126} -08/30/2021 15:26:39 - INFO - __main__ - Step 12873: {'lr': 0.000493372086351083, 'samples': 2471616, 'steps': 12872, 'loss/train': 1.6319408416748047} -08/30/2021 15:26:39 - INFO - __main__ - Step 12874: {'lr': 0.0004933708724494877, 'samples': 2471808, 'steps': 12873, 'loss/train': 1.8161916732788086} -08/30/2021 15:26:39 - INFO - __main__ - Step 12875: {'lr': 0.0004933696584382331, 'samples': 2472000, 'steps': 12874, 'loss/train': 1.2566332817077637} -08/30/2021 15:26:40 - INFO - __main__ - Step 12876: {'lr': 0.00049336844431732, 'samples': 2472192, 'steps': 12875, 'loss/train': 2.009991407394409} -08/30/2021 15:26:41 - INFO - __main__ - Step 12877: {'lr': 0.0004933672300867488, 'samples': 2472384, 'steps': 12876, 'loss/train': 1.9428919553756714} -08/30/2021 15:26:42 - INFO - __main__ - Step 12878: {'lr': 0.0004933660157465202, 'samples': 2472576, 'steps': 12877, 'loss/train': 1.9996424913406372} -08/30/2021 15:26:42 - INFO - __main__ - Step 12879: {'lr': 0.0004933648012966344, 'samples': 2472768, 'steps': 12878, 'loss/train': 1.4289755821228027} -08/30/2021 15:26:42 - INFO - __main__ - Step 12880: {'lr': 0.0004933635867370923, 'samples': 2472960, 'steps': 12879, 'loss/train': 1.3390545845031738} -08/30/2021 15:26:43 - INFO - __main__ - Step 12881: {'lr': 0.0004933623720678944, 'samples': 2473152, 'steps': 12880, 'loss/train': 1.5453749895095825} -08/30/2021 15:26:44 - INFO - __main__ - Step 12882: {'lr': 0.000493361157289041, 'samples': 2473344, 'steps': 12881, 'loss/train': 2.0054750442504883} -08/30/2021 15:26:45 - INFO - __main__ - Step 12883: {'lr': 0.000493359942400533, 'samples': 2473536, 'steps': 12882, 'loss/train': 1.3292654752731323} -08/30/2021 15:26:45 - INFO - __main__ - Step 12884: {'lr': 0.0004933587274023706, 'samples': 2473728, 'steps': 12883, 'loss/train': 2.0311615467071533} -08/30/2021 15:26:45 - INFO - __main__ - Step 12885: {'lr': 0.0004933575122945547, 'samples': 2473920, 'steps': 12884, 'loss/train': 1.31778883934021} -08/30/2021 15:26:46 - INFO - __main__ - Step 12886: {'lr': 0.0004933562970770855, 'samples': 2474112, 'steps': 12885, 'loss/train': 1.9492117166519165} -08/30/2021 15:26:47 - INFO - __main__ - Step 12887: {'lr': 0.0004933550817499638, 'samples': 2474304, 'steps': 12886, 'loss/train': 1.905481219291687} -08/30/2021 15:26:48 - INFO - __main__ - Step 12888: {'lr': 0.00049335386631319, 'samples': 2474496, 'steps': 12887, 'loss/train': 1.9886780977249146} -08/30/2021 15:26:48 - INFO - __main__ - Step 12889: {'lr': 0.0004933526507667648, 'samples': 2474688, 'steps': 12888, 'loss/train': 1.90106201171875} -08/30/2021 15:26:48 - INFO - __main__ - Step 12890: {'lr': 0.0004933514351106885, 'samples': 2474880, 'steps': 12889, 'loss/train': 2.4388670921325684} -08/30/2021 15:26:49 - INFO - __main__ - Step 12891: {'lr': 0.0004933502193449618, 'samples': 2475072, 'steps': 12890, 'loss/train': 1.6792958974838257} -08/30/2021 15:26:50 - INFO - __main__ - Step 12892: {'lr': 0.0004933490034695853, 'samples': 2475264, 'steps': 12891, 'loss/train': 1.1208237409591675} -08/30/2021 15:26:51 - INFO - __main__ - Step 12893: {'lr': 0.0004933477874845595, 'samples': 2475456, 'steps': 12892, 'loss/train': 0.9411040544509888} -08/30/2021 15:26:51 - INFO - __main__ - Step 12894: {'lr': 0.000493346571389885, 'samples': 2475648, 'steps': 12893, 'loss/train': 1.7961270809173584} -08/30/2021 15:26:51 - INFO - __main__ - Step 12895: {'lr': 0.0004933453551855622, 'samples': 2475840, 'steps': 12894, 'loss/train': 0.7018240094184875} -08/30/2021 15:26:52 - INFO - __main__ - Step 12896: {'lr': 0.0004933441388715919, 'samples': 2476032, 'steps': 12895, 'loss/train': 1.3613004684448242} -08/30/2021 15:26:52 - INFO - __main__ - Step 12897: {'lr': 0.0004933429224479743, 'samples': 2476224, 'steps': 12896, 'loss/train': 1.989190697669983} -08/30/2021 15:26:53 - INFO - __main__ - Step 12898: {'lr': 0.0004933417059147102, 'samples': 2476416, 'steps': 12897, 'loss/train': 1.6655298471450806} -08/30/2021 15:26:54 - INFO - __main__ - Step 12899: {'lr': 0.0004933404892718, 'samples': 2476608, 'steps': 12898, 'loss/train': 1.571376919746399} -08/30/2021 15:26:54 - INFO - __main__ - Step 12900: {'lr': 0.0004933392725192444, 'samples': 2476800, 'steps': 12899, 'loss/train': 1.7903738021850586} -08/30/2021 15:26:55 - INFO - __main__ - Step 12901: {'lr': 0.000493338055657044, 'samples': 2476992, 'steps': 12900, 'loss/train': 2.3699591159820557} -08/30/2021 15:26:55 - INFO - __main__ - Step 12902: {'lr': 0.0004933368386851991, 'samples': 2477184, 'steps': 12901, 'loss/train': 1.7695090770721436} -08/30/2021 15:26:57 - INFO - __main__ - Step 12903: {'lr': 0.0004933356216037104, 'samples': 2477376, 'steps': 12902, 'loss/train': 1.897432804107666} -08/30/2021 15:26:57 - INFO - __main__ - Step 12904: {'lr': 0.0004933344044125784, 'samples': 2477568, 'steps': 12903, 'loss/train': 2.428956985473633} -08/30/2021 15:26:57 - INFO - __main__ - Step 12905: {'lr': 0.0004933331871118037, 'samples': 2477760, 'steps': 12904, 'loss/train': 1.5634547472000122} -08/30/2021 15:26:58 - INFO - __main__ - Step 12906: {'lr': 0.0004933319697013869, 'samples': 2477952, 'steps': 12905, 'loss/train': 1.5574288368225098} -08/30/2021 15:26:58 - INFO - __main__ - Step 12907: {'lr': 0.0004933307521813282, 'samples': 2478144, 'steps': 12906, 'loss/train': 1.9178047180175781} -08/30/2021 15:27:00 - INFO - __main__ - Step 12908: {'lr': 0.0004933295345516287, 'samples': 2478336, 'steps': 12907, 'loss/train': 1.6965242624282837} -08/30/2021 15:27:00 - INFO - __main__ - Step 12909: {'lr': 0.0004933283168122886, 'samples': 2478528, 'steps': 12908, 'loss/train': 2.1432430744171143} -08/30/2021 15:27:00 - INFO - __main__ - Step 12910: {'lr': 0.0004933270989633084, 'samples': 2478720, 'steps': 12909, 'loss/train': 1.492651104927063} -08/30/2021 15:27:01 - INFO - __main__ - Step 12911: {'lr': 0.0004933258810046889, 'samples': 2478912, 'steps': 12910, 'loss/train': 2.094221591949463} -08/30/2021 15:27:01 - INFO - __main__ - Step 12912: {'lr': 0.0004933246629364304, 'samples': 2479104, 'steps': 12911, 'loss/train': 1.8227078914642334} -08/30/2021 15:27:03 - INFO - __main__ - Step 12913: {'lr': 0.0004933234447585337, 'samples': 2479296, 'steps': 12912, 'loss/train': 1.4459824562072754} -08/30/2021 15:27:04 - INFO - __main__ - Step 12914: {'lr': 0.0004933222264709991, 'samples': 2479488, 'steps': 12913, 'loss/train': 1.6463892459869385} -08/30/2021 15:27:04 - INFO - __main__ - Step 12915: {'lr': 0.0004933210080738273, 'samples': 2479680, 'steps': 12914, 'loss/train': 1.5907765626907349} -08/30/2021 15:27:04 - INFO - __main__ - Step 12916: {'lr': 0.0004933197895670187, 'samples': 2479872, 'steps': 12915, 'loss/train': 1.5506144762039185} -08/30/2021 15:27:05 - INFO - __main__ - Step 12917: {'lr': 0.0004933185709505741, 'samples': 2480064, 'steps': 12916, 'loss/train': 2.120018482208252} -08/30/2021 15:27:05 - INFO - __main__ - Step 12918: {'lr': 0.0004933173522244939, 'samples': 2480256, 'steps': 12917, 'loss/train': 1.5343645811080933} -08/30/2021 15:27:07 - INFO - __main__ - Step 12919: {'lr': 0.0004933161333887786, 'samples': 2480448, 'steps': 12918, 'loss/train': 1.7413872480392456} -08/30/2021 15:27:07 - INFO - __main__ - Step 12920: {'lr': 0.0004933149144434288, 'samples': 2480640, 'steps': 12919, 'loss/train': 1.8250689506530762} -08/30/2021 15:27:07 - INFO - __main__ - Step 12921: {'lr': 0.0004933136953884451, 'samples': 2480832, 'steps': 12920, 'loss/train': 1.645958423614502} -08/30/2021 15:27:08 - INFO - __main__ - Step 12922: {'lr': 0.0004933124762238279, 'samples': 2481024, 'steps': 12921, 'loss/train': 1.9412498474121094} -08/30/2021 15:27:08 - INFO - __main__ - Step 12923: {'lr': 0.000493311256949578, 'samples': 2481216, 'steps': 12922, 'loss/train': 1.5907375812530518} -08/30/2021 15:27:10 - INFO - __main__ - Step 12924: {'lr': 0.0004933100375656957, 'samples': 2481408, 'steps': 12923, 'loss/train': 0.8259760737419128} -08/30/2021 15:27:10 - INFO - __main__ - Step 12925: {'lr': 0.0004933088180721817, 'samples': 2481600, 'steps': 12924, 'loss/train': 1.698560357093811} -08/30/2021 15:27:10 - INFO - __main__ - Step 12926: {'lr': 0.0004933075984690365, 'samples': 2481792, 'steps': 12925, 'loss/train': 2.067666530609131} -08/30/2021 15:27:11 - INFO - __main__ - Step 12927: {'lr': 0.0004933063787562606, 'samples': 2481984, 'steps': 12926, 'loss/train': 2.4630961418151855} -08/30/2021 15:27:11 - INFO - __main__ - Step 12928: {'lr': 0.0004933051589338547, 'samples': 2482176, 'steps': 12927, 'loss/train': 1.671011209487915} -08/30/2021 15:27:13 - INFO - __main__ - Step 12929: {'lr': 0.0004933039390018192, 'samples': 2482368, 'steps': 12928, 'loss/train': 1.714061975479126} -08/30/2021 15:27:13 - INFO - __main__ - Step 12930: {'lr': 0.0004933027189601547, 'samples': 2482560, 'steps': 12929, 'loss/train': 1.7152819633483887} -08/30/2021 15:27:13 - INFO - __main__ - Step 12931: {'lr': 0.0004933014988088616, 'samples': 2482752, 'steps': 12930, 'loss/train': 1.3183889389038086} -08/30/2021 15:27:14 - INFO - __main__ - Step 12932: {'lr': 0.0004933002785479408, 'samples': 2482944, 'steps': 12931, 'loss/train': 0.16766878962516785} -08/30/2021 15:27:14 - INFO - __main__ - Step 12933: {'lr': 0.0004932990581773926, 'samples': 2483136, 'steps': 12932, 'loss/train': 2.2817769050598145} -08/30/2021 15:27:16 - INFO - __main__ - Step 12934: {'lr': 0.0004932978376972175, 'samples': 2483328, 'steps': 12933, 'loss/train': 1.4748798608779907} -08/30/2021 15:27:16 - INFO - __main__ - Step 12935: {'lr': 0.0004932966171074163, 'samples': 2483520, 'steps': 12934, 'loss/train': 1.686767816543579} -08/30/2021 15:27:16 - INFO - __main__ - Step 12936: {'lr': 0.0004932953964079893, 'samples': 2483712, 'steps': 12935, 'loss/train': 1.5524197816848755} -08/30/2021 15:27:17 - INFO - __main__ - Step 12937: {'lr': 0.0004932941755989372, 'samples': 2483904, 'steps': 12936, 'loss/train': 2.500237464904785} -08/30/2021 15:27:17 - INFO - __main__ - Step 12938: {'lr': 0.0004932929546802605, 'samples': 2484096, 'steps': 12937, 'loss/train': 1.6547746658325195} -08/30/2021 15:27:19 - INFO - __main__ - Step 12939: {'lr': 0.0004932917336519597, 'samples': 2484288, 'steps': 12938, 'loss/train': 0.5372771620750427} -08/30/2021 15:27:19 - INFO - __main__ - Step 12940: {'lr': 0.0004932905125140354, 'samples': 2484480, 'steps': 12939, 'loss/train': 1.3921217918395996} -08/30/2021 15:27:20 - INFO - __main__ - Step 12941: {'lr': 0.0004932892912664882, 'samples': 2484672, 'steps': 12940, 'loss/train': 1.3276793956756592} -08/30/2021 15:27:20 - INFO - __main__ - Step 12942: {'lr': 0.0004932880699093186, 'samples': 2484864, 'steps': 12941, 'loss/train': 1.8124228715896606} -08/30/2021 15:27:20 - INFO - __main__ - Step 12943: {'lr': 0.0004932868484425271, 'samples': 2485056, 'steps': 12942, 'loss/train': 0.16740307211875916} -08/30/2021 15:27:21 - INFO - __main__ - Step 12944: {'lr': 0.0004932856268661143, 'samples': 2485248, 'steps': 12943, 'loss/train': 1.3268613815307617} -08/30/2021 15:27:21 - INFO - __main__ - Step 12945: {'lr': 0.0004932844051800808, 'samples': 2485440, 'steps': 12944, 'loss/train': 2.3583836555480957} -08/30/2021 15:27:23 - INFO - __main__ - Step 12946: {'lr': 0.000493283183384427, 'samples': 2485632, 'steps': 12945, 'loss/train': 2.23337984085083} -08/30/2021 15:27:23 - INFO - __main__ - Step 12947: {'lr': 0.0004932819614791537, 'samples': 2485824, 'steps': 12946, 'loss/train': 1.7928889989852905} -08/30/2021 15:27:23 - INFO - __main__ - Step 12948: {'lr': 0.0004932807394642612, 'samples': 2486016, 'steps': 12947, 'loss/train': 1.3809243440628052} -08/30/2021 15:27:24 - INFO - __main__ - Step 12949: {'lr': 0.0004932795173397501, 'samples': 2486208, 'steps': 12948, 'loss/train': 1.9425253868103027} -08/30/2021 15:27:24 - INFO - __main__ - Step 12950: {'lr': 0.0004932782951056211, 'samples': 2486400, 'steps': 12949, 'loss/train': 2.1360065937042236} -08/30/2021 15:27:26 - INFO - __main__ - Step 12951: {'lr': 0.0004932770727618747, 'samples': 2486592, 'steps': 12950, 'loss/train': 2.145446538925171} -08/30/2021 15:27:26 - INFO - __main__ - Step 12952: {'lr': 0.0004932758503085114, 'samples': 2486784, 'steps': 12951, 'loss/train': 1.6578941345214844} -08/30/2021 15:27:26 - INFO - __main__ - Step 12953: {'lr': 0.0004932746277455317, 'samples': 2486976, 'steps': 12952, 'loss/train': 1.815985083580017} -08/30/2021 15:27:27 - INFO - __main__ - Step 12954: {'lr': 0.0004932734050729362, 'samples': 2487168, 'steps': 12953, 'loss/train': 1.4310932159423828} -08/30/2021 15:27:27 - INFO - __main__ - Step 12955: {'lr': 0.0004932721822907255, 'samples': 2487360, 'steps': 12954, 'loss/train': 1.784164309501648} -08/30/2021 15:27:29 - INFO - __main__ - Step 12956: {'lr': 0.0004932709593989, 'samples': 2487552, 'steps': 12955, 'loss/train': 2.0219085216522217} -08/30/2021 15:27:29 - INFO - __main__ - Step 12957: {'lr': 0.0004932697363974604, 'samples': 2487744, 'steps': 12956, 'loss/train': 1.3164905309677124} -08/30/2021 15:27:29 - INFO - __main__ - Step 12958: {'lr': 0.0004932685132864072, 'samples': 2487936, 'steps': 12957, 'loss/train': 1.2794688940048218} -08/30/2021 15:27:30 - INFO - __main__ - Step 12959: {'lr': 0.0004932672900657411, 'samples': 2488128, 'steps': 12958, 'loss/train': 1.6962989568710327} -08/30/2021 15:27:30 - INFO - __main__ - Step 12960: {'lr': 0.0004932660667354623, 'samples': 2488320, 'steps': 12959, 'loss/train': 1.8925210237503052} -08/30/2021 15:27:32 - INFO - __main__ - Step 12961: {'lr': 0.0004932648432955717, 'samples': 2488512, 'steps': 12960, 'loss/train': 1.7702349424362183} -08/30/2021 15:27:32 - INFO - __main__ - Step 12962: {'lr': 0.0004932636197460698, 'samples': 2488704, 'steps': 12961, 'loss/train': 1.7371070384979248} -08/30/2021 15:27:32 - INFO - __main__ - Step 12963: {'lr': 0.0004932623960869569, 'samples': 2488896, 'steps': 12962, 'loss/train': 1.5402714014053345} -08/30/2021 15:27:33 - INFO - __main__ - Step 12964: {'lr': 0.0004932611723182338, 'samples': 2489088, 'steps': 12963, 'loss/train': 1.582326054573059} -08/30/2021 15:27:33 - INFO - __main__ - Step 12965: {'lr': 0.000493259948439901, 'samples': 2489280, 'steps': 12964, 'loss/train': 1.4854434728622437} -08/30/2021 15:27:35 - INFO - __main__ - Step 12966: {'lr': 0.0004932587244519589, 'samples': 2489472, 'steps': 12965, 'loss/train': 2.4423863887786865} -08/30/2021 15:27:35 - INFO - __main__ - Step 12967: {'lr': 0.0004932575003544083, 'samples': 2489664, 'steps': 12966, 'loss/train': 1.630094051361084} -08/30/2021 15:27:35 - INFO - __main__ - Step 12968: {'lr': 0.0004932562761472496, 'samples': 2489856, 'steps': 12967, 'loss/train': 2.0432162284851074} -08/30/2021 15:27:36 - INFO - __main__ - Step 12969: {'lr': 0.0004932550518304833, 'samples': 2490048, 'steps': 12968, 'loss/train': 2.013092517852783} -08/30/2021 15:27:36 - INFO - __main__ - Step 12970: {'lr': 0.0004932538274041101, 'samples': 2490240, 'steps': 12969, 'loss/train': 1.8890380859375} -08/30/2021 15:27:38 - INFO - __main__ - Step 12971: {'lr': 0.0004932526028681304, 'samples': 2490432, 'steps': 12970, 'loss/train': 1.1682820320129395} -08/30/2021 15:27:38 - INFO - __main__ - Step 12972: {'lr': 0.0004932513782225449, 'samples': 2490624, 'steps': 12971, 'loss/train': 1.8650240898132324} -08/30/2021 15:27:39 - INFO - __main__ - Step 12973: {'lr': 0.000493250153467354, 'samples': 2490816, 'steps': 12972, 'loss/train': 1.0635807514190674} -08/30/2021 15:27:39 - INFO - __main__ - Step 12974: {'lr': 0.0004932489286025584, 'samples': 2491008, 'steps': 12973, 'loss/train': 1.5997942686080933} -08/30/2021 15:27:39 - INFO - __main__ - Step 12975: {'lr': 0.0004932477036281586, 'samples': 2491200, 'steps': 12974, 'loss/train': 2.061941623687744} -08/30/2021 15:27:40 - INFO - __main__ - Step 12976: {'lr': 0.0004932464785441552, 'samples': 2491392, 'steps': 12975, 'loss/train': 2.1151795387268066} -08/30/2021 15:27:41 - INFO - __main__ - Step 12977: {'lr': 0.0004932452533505486, 'samples': 2491584, 'steps': 12976, 'loss/train': 2.0156846046447754} -08/30/2021 15:27:42 - INFO - __main__ - Step 12978: {'lr': 0.0004932440280473395, 'samples': 2491776, 'steps': 12977, 'loss/train': 1.2708879709243774} -08/30/2021 15:27:42 - INFO - __main__ - Step 12979: {'lr': 0.0004932428026345282, 'samples': 2491968, 'steps': 12978, 'loss/train': 1.660595178604126} -08/30/2021 15:27:42 - INFO - __main__ - Step 12980: {'lr': 0.0004932415771121157, 'samples': 2492160, 'steps': 12979, 'loss/train': 1.8325729370117188} -08/30/2021 15:27:43 - INFO - __main__ - Step 12981: {'lr': 0.0004932403514801021, 'samples': 2492352, 'steps': 12980, 'loss/train': 1.737576961517334} -08/30/2021 15:27:45 - INFO - __main__ - Step 12982: {'lr': 0.0004932391257384883, 'samples': 2492544, 'steps': 12981, 'loss/train': 1.7842106819152832} -08/30/2021 15:27:45 - INFO - __main__ - Step 12983: {'lr': 0.0004932378998872746, 'samples': 2492736, 'steps': 12982, 'loss/train': 2.11392879486084} -08/30/2021 15:27:46 - INFO - __main__ - Step 12984: {'lr': 0.0004932366739264618, 'samples': 2492928, 'steps': 12983, 'loss/train': 1.9216110706329346} -08/30/2021 15:27:46 - INFO - __main__ - Step 12985: {'lr': 0.0004932354478560502, 'samples': 2493120, 'steps': 12984, 'loss/train': 2.0142393112182617} -08/30/2021 15:27:47 - INFO - __main__ - Step 12986: {'lr': 0.0004932342216760405, 'samples': 2493312, 'steps': 12985, 'loss/train': 0.9964456558227539} -08/30/2021 15:27:47 - INFO - __main__ - Step 12987: {'lr': 0.0004932329953864331, 'samples': 2493504, 'steps': 12986, 'loss/train': 1.4187933206558228} -08/30/2021 15:27:49 - INFO - __main__ - Step 12988: {'lr': 0.0004932317689872287, 'samples': 2493696, 'steps': 12987, 'loss/train': 1.1365156173706055} -08/30/2021 15:27:49 - INFO - __main__ - Step 12989: {'lr': 0.000493230542478428, 'samples': 2493888, 'steps': 12988, 'loss/train': 1.653011679649353} -08/30/2021 15:27:49 - INFO - __main__ - Step 12990: {'lr': 0.0004932293158600312, 'samples': 2494080, 'steps': 12989, 'loss/train': 1.5194389820098877} -08/30/2021 15:27:50 - INFO - __main__ - Step 12991: {'lr': 0.0004932280891320391, 'samples': 2494272, 'steps': 12990, 'loss/train': 1.7696212530136108} -08/30/2021 15:27:50 - INFO - __main__ - Step 12992: {'lr': 0.0004932268622944521, 'samples': 2494464, 'steps': 12991, 'loss/train': 1.1499416828155518} -08/30/2021 15:27:50 - INFO - __main__ - Step 12993: {'lr': 0.0004932256353472709, 'samples': 2494656, 'steps': 12992, 'loss/train': 0.48234203457832336} -08/30/2021 15:27:52 - INFO - __main__ - Step 12994: {'lr': 0.0004932244082904959, 'samples': 2494848, 'steps': 12993, 'loss/train': 2.079378128051758} -08/30/2021 15:27:52 - INFO - __main__ - Step 12995: {'lr': 0.0004932231811241278, 'samples': 2495040, 'steps': 12994, 'loss/train': 1.7509737014770508} -08/30/2021 15:27:53 - INFO - __main__ - Step 12996: {'lr': 0.0004932219538481672, 'samples': 2495232, 'steps': 12995, 'loss/train': 2.2721691131591797} -08/30/2021 15:27:53 - INFO - __main__ - Step 12997: {'lr': 0.0004932207264626143, 'samples': 2495424, 'steps': 12996, 'loss/train': 2.0370490550994873} -08/30/2021 15:27:53 - INFO - __main__ - Step 12998: {'lr': 0.00049321949896747, 'samples': 2495616, 'steps': 12997, 'loss/train': 1.7114466428756714} -08/30/2021 15:27:55 - INFO - __main__ - Step 12999: {'lr': 0.0004932182713627348, 'samples': 2495808, 'steps': 12998, 'loss/train': 0.8038334250450134} -08/30/2021 15:27:56 - INFO - __main__ - Step 13000: {'lr': 0.0004932170436484091, 'samples': 2496000, 'steps': 12999, 'loss/train': 2.0671768188476562} -08/30/2021 15:27:56 - INFO - __main__ - Step 13001: {'lr': 0.0004932158158244937, 'samples': 2496192, 'steps': 13000, 'loss/train': 2.1165475845336914} -08/30/2021 15:27:56 - INFO - __main__ - Step 13002: {'lr': 0.0004932145878909889, 'samples': 2496384, 'steps': 13001, 'loss/train': 1.4926173686981201} -08/30/2021 15:27:57 - INFO - __main__ - Step 13003: {'lr': 0.0004932133598478953, 'samples': 2496576, 'steps': 13002, 'loss/train': 2.1384963989257812} -08/30/2021 15:27:58 - INFO - __main__ - Step 13004: {'lr': 0.0004932121316952136, 'samples': 2496768, 'steps': 13003, 'loss/train': 2.163433313369751} -08/30/2021 15:27:59 - INFO - __main__ - Step 13005: {'lr': 0.0004932109034329442, 'samples': 2496960, 'steps': 13004, 'loss/train': 1.7609907388687134} -08/30/2021 15:27:59 - INFO - __main__ - Step 13006: {'lr': 0.0004932096750610879, 'samples': 2497152, 'steps': 13005, 'loss/train': 2.1369967460632324} -08/30/2021 15:27:59 - INFO - __main__ - Step 13007: {'lr': 0.0004932084465796449, 'samples': 2497344, 'steps': 13006, 'loss/train': 1.5515129566192627} -08/30/2021 15:28:00 - INFO - __main__ - Step 13008: {'lr': 0.000493207217988616, 'samples': 2497536, 'steps': 13007, 'loss/train': 1.4073905944824219} -08/30/2021 15:28:01 - INFO - __main__ - Step 13009: {'lr': 0.0004932059892880016, 'samples': 2497728, 'steps': 13008, 'loss/train': 1.4713689088821411} -08/30/2021 15:28:02 - INFO - __main__ - Step 13010: {'lr': 0.0004932047604778025, 'samples': 2497920, 'steps': 13009, 'loss/train': 1.11771821975708} -08/30/2021 15:28:02 - INFO - __main__ - Step 13011: {'lr': 0.0004932035315580188, 'samples': 2498112, 'steps': 13010, 'loss/train': 2.0724284648895264} -08/30/2021 15:28:02 - INFO - __main__ - Step 13012: {'lr': 0.0004932023025286516, 'samples': 2498304, 'steps': 13011, 'loss/train': 2.1573293209075928} -08/30/2021 15:28:03 - INFO - __main__ - Step 13013: {'lr': 0.0004932010733897012, 'samples': 2498496, 'steps': 13012, 'loss/train': 1.907956838607788} -08/30/2021 15:28:04 - INFO - __main__ - Step 13014: {'lr': 0.000493199844141168, 'samples': 2498688, 'steps': 13013, 'loss/train': 1.34544837474823} -08/30/2021 15:28:05 - INFO - __main__ - Step 13015: {'lr': 0.0004931986147830527, 'samples': 2498880, 'steps': 13014, 'loss/train': 1.8426891565322876} -08/30/2021 15:28:05 - INFO - __main__ - Step 13016: {'lr': 0.000493197385315356, 'samples': 2499072, 'steps': 13015, 'loss/train': 2.1983206272125244} -08/30/2021 15:28:05 - INFO - __main__ - Step 13017: {'lr': 0.0004931961557380782, 'samples': 2499264, 'steps': 13016, 'loss/train': 1.6161142587661743} -08/30/2021 15:28:06 - INFO - __main__ - Step 13018: {'lr': 0.00049319492605122, 'samples': 2499456, 'steps': 13017, 'loss/train': 1.5326571464538574} -08/30/2021 15:28:07 - INFO - __main__ - Step 13019: {'lr': 0.000493193696254782, 'samples': 2499648, 'steps': 13018, 'loss/train': 1.9193850755691528} -08/30/2021 15:28:08 - INFO - __main__ - Step 13020: {'lr': 0.0004931924663487646, 'samples': 2499840, 'steps': 13019, 'loss/train': 0.864918053150177} -08/30/2021 15:28:08 - INFO - __main__ - Step 13021: {'lr': 0.0004931912363331683, 'samples': 2500032, 'steps': 13020, 'loss/train': 1.8274675607681274} -08/30/2021 15:28:08 - INFO - __main__ - Step 13022: {'lr': 0.000493190006207994, 'samples': 2500224, 'steps': 13021, 'loss/train': 1.7764897346496582} -08/30/2021 15:28:09 - INFO - __main__ - Step 13023: {'lr': 0.0004931887759732419, 'samples': 2500416, 'steps': 13022, 'loss/train': 1.5352623462677002} -08/30/2021 15:28:11 - INFO - __main__ - Step 13024: {'lr': 0.0004931875456289128, 'samples': 2500608, 'steps': 13023, 'loss/train': 1.5049412250518799} -08/30/2021 15:28:11 - INFO - __main__ - Step 13025: {'lr': 0.000493186315175007, 'samples': 2500800, 'steps': 13024, 'loss/train': 2.0036520957946777} -08/30/2021 15:28:12 - INFO - __main__ - Step 13026: {'lr': 0.0004931850846115253, 'samples': 2500992, 'steps': 13025, 'loss/train': 1.5592503547668457} -08/30/2021 15:28:12 - INFO - __main__ - Step 13027: {'lr': 0.0004931838539384681, 'samples': 2501184, 'steps': 13026, 'loss/train': 1.9943856000900269} -08/30/2021 15:28:12 - INFO - __main__ - Step 13028: {'lr': 0.0004931826231558361, 'samples': 2501376, 'steps': 13027, 'loss/train': 1.7973827123641968} -08/30/2021 15:28:14 - INFO - __main__ - Step 13029: {'lr': 0.0004931813922636297, 'samples': 2501568, 'steps': 13028, 'loss/train': 1.706641435623169} -08/30/2021 15:28:14 - INFO - __main__ - Step 13030: {'lr': 0.0004931801612618494, 'samples': 2501760, 'steps': 13029, 'loss/train': 1.7919440269470215} -08/30/2021 15:28:15 - INFO - __main__ - Step 13031: {'lr': 0.0004931789301504961, 'samples': 2501952, 'steps': 13030, 'loss/train': 2.379535675048828} -08/30/2021 15:28:15 - INFO - __main__ - Step 13032: {'lr': 0.00049317769892957, 'samples': 2502144, 'steps': 13031, 'loss/train': 1.557008981704712} -08/30/2021 15:28:15 - INFO - __main__ - Step 13033: {'lr': 0.0004931764675990718, 'samples': 2502336, 'steps': 13032, 'loss/train': 1.3330165147781372} -08/30/2021 15:28:16 - INFO - __main__ - Step 13034: {'lr': 0.000493175236159002, 'samples': 2502528, 'steps': 13033, 'loss/train': 1.2604204416275024} -08/30/2021 15:28:17 - INFO - __main__ - Step 13035: {'lr': 0.0004931740046093612, 'samples': 2502720, 'steps': 13034, 'loss/train': 1.5593136548995972} -08/30/2021 15:28:18 - INFO - __main__ - Step 13036: {'lr': 0.0004931727729501499, 'samples': 2502912, 'steps': 13035, 'loss/train': 1.4550620317459106} -08/30/2021 15:28:18 - INFO - __main__ - Step 13037: {'lr': 0.0004931715411813689, 'samples': 2503104, 'steps': 13036, 'loss/train': 1.0847595930099487} -08/30/2021 15:28:18 - INFO - __main__ - Step 13038: {'lr': 0.0004931703093030183, 'samples': 2503296, 'steps': 13037, 'loss/train': 2.3429133892059326} -08/30/2021 15:28:19 - INFO - __main__ - Step 13039: {'lr': 0.0004931690773150991, 'samples': 2503488, 'steps': 13038, 'loss/train': 1.7359956502914429} -08/30/2021 15:28:20 - INFO - __main__ - Step 13040: {'lr': 0.0004931678452176116, 'samples': 2503680, 'steps': 13039, 'loss/train': 1.437747836112976} -08/30/2021 15:28:21 - INFO - __main__ - Step 13041: {'lr': 0.0004931666130105563, 'samples': 2503872, 'steps': 13040, 'loss/train': 1.7497220039367676} -08/30/2021 15:28:21 - INFO - __main__ - Step 13042: {'lr': 0.0004931653806939341, 'samples': 2504064, 'steps': 13041, 'loss/train': 1.897395372390747} -08/30/2021 15:28:21 - INFO - __main__ - Step 13043: {'lr': 0.0004931641482677452, 'samples': 2504256, 'steps': 13042, 'loss/train': 1.0215831995010376} -08/30/2021 15:28:22 - INFO - __main__ - Step 13044: {'lr': 0.0004931629157319904, 'samples': 2504448, 'steps': 13043, 'loss/train': 2.220050096511841} -08/30/2021 15:28:22 - INFO - __main__ - Step 13045: {'lr': 0.00049316168308667, 'samples': 2504640, 'steps': 13044, 'loss/train': 0.17489831149578094} -08/30/2021 15:28:24 - INFO - __main__ - Step 13046: {'lr': 0.0004931604503317846, 'samples': 2504832, 'steps': 13045, 'loss/train': 1.2778693437576294} -08/30/2021 15:28:24 - INFO - __main__ - Step 13047: {'lr': 0.0004931592174673351, 'samples': 2505024, 'steps': 13046, 'loss/train': 1.2653385400772095} -08/30/2021 15:28:25 - INFO - __main__ - Step 13048: {'lr': 0.0004931579844933218, 'samples': 2505216, 'steps': 13047, 'loss/train': 2.0661964416503906} -08/30/2021 15:28:25 - INFO - __main__ - Step 13049: {'lr': 0.0004931567514097451, 'samples': 2505408, 'steps': 13048, 'loss/train': 1.877793312072754} -08/30/2021 15:28:25 - INFO - __main__ - Step 13050: {'lr': 0.0004931555182166059, 'samples': 2505600, 'steps': 13049, 'loss/train': 1.6688730716705322} -08/30/2021 15:28:27 - INFO - __main__ - Step 13051: {'lr': 0.0004931542849139044, 'samples': 2505792, 'steps': 13050, 'loss/train': 2.4740827083587646} -08/30/2021 15:28:27 - INFO - __main__ - Step 13052: {'lr': 0.0004931530515016415, 'samples': 2505984, 'steps': 13051, 'loss/train': 1.5523220300674438} -08/30/2021 15:28:28 - INFO - __main__ - Step 13053: {'lr': 0.0004931518179798175, 'samples': 2506176, 'steps': 13052, 'loss/train': 1.5974029302597046} -08/30/2021 15:28:28 - INFO - __main__ - Step 13054: {'lr': 0.000493150584348433, 'samples': 2506368, 'steps': 13053, 'loss/train': 1.7093305587768555} -08/30/2021 15:28:28 - INFO - __main__ - Step 13055: {'lr': 0.0004931493506074886, 'samples': 2506560, 'steps': 13054, 'loss/train': 1.8807342052459717} -08/30/2021 15:28:30 - INFO - __main__ - Step 13056: {'lr': 0.0004931481167569849, 'samples': 2506752, 'steps': 13055, 'loss/train': 2.1391303539276123} -08/30/2021 15:28:30 - INFO - __main__ - Step 13057: {'lr': 0.0004931468827969223, 'samples': 2506944, 'steps': 13056, 'loss/train': 1.5391812324523926} -08/30/2021 15:28:31 - INFO - __main__ - Step 13058: {'lr': 0.0004931456487273017, 'samples': 2507136, 'steps': 13057, 'loss/train': 1.659219741821289} -08/30/2021 15:28:31 - INFO - __main__ - Step 13059: {'lr': 0.0004931444145481233, 'samples': 2507328, 'steps': 13058, 'loss/train': 1.429943323135376} -08/30/2021 15:28:31 - INFO - __main__ - Step 13060: {'lr': 0.0004931431802593877, 'samples': 2507520, 'steps': 13059, 'loss/train': 1.8401118516921997} -08/30/2021 15:28:33 - INFO - __main__ - Step 13061: {'lr': 0.0004931419458610956, 'samples': 2507712, 'steps': 13060, 'loss/train': 1.9002833366394043} -08/30/2021 15:28:33 - INFO - __main__ - Step 13062: {'lr': 0.0004931407113532476, 'samples': 2507904, 'steps': 13061, 'loss/train': 1.1754478216171265} -08/30/2021 15:28:33 - INFO - __main__ - Step 13063: {'lr': 0.000493139476735844, 'samples': 2508096, 'steps': 13062, 'loss/train': 1.7957676649093628} -08/30/2021 15:28:34 - INFO - __main__ - Step 13064: {'lr': 0.0004931382420088855, 'samples': 2508288, 'steps': 13063, 'loss/train': 1.8040765523910522} -08/30/2021 15:28:34 - INFO - __main__ - Step 13065: {'lr': 0.0004931370071723728, 'samples': 2508480, 'steps': 13064, 'loss/train': 1.305092453956604} -08/30/2021 15:28:36 - INFO - __main__ - Step 13066: {'lr': 0.0004931357722263061, 'samples': 2508672, 'steps': 13065, 'loss/train': 1.7021839618682861} -08/30/2021 15:28:36 - INFO - __main__ - Step 13067: {'lr': 0.0004931345371706863, 'samples': 2508864, 'steps': 13066, 'loss/train': 2.398237943649292} -08/30/2021 15:28:36 - INFO - __main__ - Step 13068: {'lr': 0.0004931333020055139, 'samples': 2509056, 'steps': 13067, 'loss/train': 2.0597445964813232} -08/30/2021 15:28:37 - INFO - __main__ - Step 13069: {'lr': 0.0004931320667307893, 'samples': 2509248, 'steps': 13068, 'loss/train': 2.1479623317718506} -08/30/2021 15:28:37 - INFO - __main__ - Step 13070: {'lr': 0.0004931308313465132, 'samples': 2509440, 'steps': 13069, 'loss/train': 1.5970937013626099} -08/30/2021 15:28:39 - INFO - __main__ - Step 13071: {'lr': 0.000493129595852686, 'samples': 2509632, 'steps': 13070, 'loss/train': 1.9472614526748657} -08/30/2021 15:28:39 - INFO - __main__ - Step 13072: {'lr': 0.0004931283602493084, 'samples': 2509824, 'steps': 13071, 'loss/train': 1.283542275428772} -08/30/2021 15:28:40 - INFO - __main__ - Step 13073: {'lr': 0.0004931271245363809, 'samples': 2510016, 'steps': 13072, 'loss/train': 1.7467390298843384} -08/30/2021 15:28:40 - INFO - __main__ - Step 13074: {'lr': 0.0004931258887139041, 'samples': 2510208, 'steps': 13073, 'loss/train': 0.3075007200241089} -08/30/2021 15:28:40 - INFO - __main__ - Step 13075: {'lr': 0.0004931246527818785, 'samples': 2510400, 'steps': 13074, 'loss/train': 1.9166795015335083} -08/30/2021 15:28:42 - INFO - __main__ - Step 13076: {'lr': 0.0004931234167403047, 'samples': 2510592, 'steps': 13075, 'loss/train': 1.3028392791748047} -08/30/2021 15:28:42 - INFO - __main__ - Step 13077: {'lr': 0.0004931221805891833, 'samples': 2510784, 'steps': 13076, 'loss/train': 1.6634352207183838} -08/30/2021 15:28:43 - INFO - __main__ - Step 13078: {'lr': 0.0004931209443285147, 'samples': 2510976, 'steps': 13077, 'loss/train': 1.9077144861221313} -08/30/2021 15:28:43 - INFO - __main__ - Step 13079: {'lr': 0.0004931197079582996, 'samples': 2511168, 'steps': 13078, 'loss/train': 1.5824267864227295} -08/30/2021 15:28:43 - INFO - __main__ - Step 13080: {'lr': 0.0004931184714785385, 'samples': 2511360, 'steps': 13079, 'loss/train': 1.7552483081817627} -08/30/2021 15:28:45 - INFO - __main__ - Step 13081: {'lr': 0.000493117234889232, 'samples': 2511552, 'steps': 13080, 'loss/train': 1.94263756275177} -08/30/2021 15:28:46 - INFO - __main__ - Step 13082: {'lr': 0.0004931159981903805, 'samples': 2511744, 'steps': 13081, 'loss/train': 1.7694244384765625} -08/30/2021 15:28:46 - INFO - __main__ - Step 13083: {'lr': 0.0004931147613819848, 'samples': 2511936, 'steps': 13082, 'loss/train': 2.3691859245300293} -08/30/2021 15:28:47 - INFO - __main__ - Step 13084: {'lr': 0.0004931135244640453, 'samples': 2512128, 'steps': 13083, 'loss/train': 1.850730061531067} -08/30/2021 15:28:47 - INFO - __main__ - Step 13085: {'lr': 0.0004931122874365627, 'samples': 2512320, 'steps': 13084, 'loss/train': 1.9314231872558594} -08/30/2021 15:28:47 - INFO - __main__ - Step 13086: {'lr': 0.0004931110502995374, 'samples': 2512512, 'steps': 13085, 'loss/train': 2.1539690494537354} -08/30/2021 15:28:49 - INFO - __main__ - Step 13087: {'lr': 0.0004931098130529699, 'samples': 2512704, 'steps': 13086, 'loss/train': 2.0296292304992676} -08/30/2021 15:28:49 - INFO - __main__ - Step 13088: {'lr': 0.000493108575696861, 'samples': 2512896, 'steps': 13087, 'loss/train': 1.527732491493225} -08/30/2021 15:28:50 - INFO - __main__ - Step 13089: {'lr': 0.0004931073382312111, 'samples': 2513088, 'steps': 13088, 'loss/train': 1.7371238470077515} -08/30/2021 15:28:50 - INFO - __main__ - Step 13090: {'lr': 0.0004931061006560207, 'samples': 2513280, 'steps': 13089, 'loss/train': 1.9282242059707642} -08/30/2021 15:28:50 - INFO - __main__ - Step 13091: {'lr': 0.0004931048629712905, 'samples': 2513472, 'steps': 13090, 'loss/train': 1.2753441333770752} -08/30/2021 15:28:52 - INFO - __main__ - Step 13092: {'lr': 0.000493103625177021, 'samples': 2513664, 'steps': 13091, 'loss/train': 1.8101255893707275} -08/30/2021 15:28:52 - INFO - __main__ - Step 13093: {'lr': 0.0004931023872732128, 'samples': 2513856, 'steps': 13092, 'loss/train': 1.4918361902236938} -08/30/2021 15:28:53 - INFO - __main__ - Step 13094: {'lr': 0.0004931011492598664, 'samples': 2514048, 'steps': 13093, 'loss/train': 1.029206395149231} -08/30/2021 15:28:53 - INFO - __main__ - Step 13095: {'lr': 0.0004930999111369824, 'samples': 2514240, 'steps': 13094, 'loss/train': 1.8578993082046509} -08/30/2021 15:28:53 - INFO - __main__ - Step 13096: {'lr': 0.0004930986729045613, 'samples': 2514432, 'steps': 13095, 'loss/train': 1.5148252248764038} -08/30/2021 15:28:55 - INFO - __main__ - Step 13097: {'lr': 0.0004930974345626036, 'samples': 2514624, 'steps': 13096, 'loss/train': 1.5347464084625244} -08/30/2021 15:28:55 - INFO - __main__ - Step 13098: {'lr': 0.00049309619611111, 'samples': 2514816, 'steps': 13097, 'loss/train': 1.093123197555542} -08/30/2021 15:28:56 - INFO - __main__ - Step 13099: {'lr': 0.000493094957550081, 'samples': 2515008, 'steps': 13098, 'loss/train': 1.668910264968872} -08/30/2021 15:28:56 - INFO - __main__ - Step 13100: {'lr': 0.0004930937188795172, 'samples': 2515200, 'steps': 13099, 'loss/train': 1.6206682920455933} -08/30/2021 15:28:56 - INFO - __main__ - Step 13101: {'lr': 0.0004930924800994192, 'samples': 2515392, 'steps': 13100, 'loss/train': 1.2876331806182861} -08/30/2021 15:28:58 - INFO - __main__ - Step 13102: {'lr': 0.0004930912412097874, 'samples': 2515584, 'steps': 13101, 'loss/train': 1.5982943773269653} -08/30/2021 15:28:58 - INFO - __main__ - Step 13103: {'lr': 0.0004930900022106224, 'samples': 2515776, 'steps': 13102, 'loss/train': 0.8433182835578918} -08/30/2021 15:28:59 - INFO - __main__ - Step 13104: {'lr': 0.0004930887631019248, 'samples': 2515968, 'steps': 13103, 'loss/train': 1.2797197103500366} -08/30/2021 15:28:59 - INFO - __main__ - Step 13105: {'lr': 0.0004930875238836951, 'samples': 2516160, 'steps': 13104, 'loss/train': 1.6055853366851807} -08/30/2021 15:28:59 - INFO - __main__ - Step 13106: {'lr': 0.000493086284555934, 'samples': 2516352, 'steps': 13105, 'loss/train': 1.447858452796936} -08/30/2021 15:29:00 - INFO - __main__ - Step 13107: {'lr': 0.0004930850451186421, 'samples': 2516544, 'steps': 13106, 'loss/train': 1.67668879032135} -08/30/2021 15:29:01 - INFO - __main__ - Step 13108: {'lr': 0.0004930838055718196, 'samples': 2516736, 'steps': 13107, 'loss/train': 1.573887825012207} -08/30/2021 15:29:02 - INFO - __main__ - Step 13109: {'lr': 0.0004930825659154674, 'samples': 2516928, 'steps': 13108, 'loss/train': 1.8749699592590332} -08/30/2021 15:29:02 - INFO - __main__ - Step 13110: {'lr': 0.000493081326149586, 'samples': 2517120, 'steps': 13109, 'loss/train': 0.5593264698982239} -08/30/2021 15:29:02 - INFO - __main__ - Step 13111: {'lr': 0.0004930800862741758, 'samples': 2517312, 'steps': 13110, 'loss/train': 1.6479274034500122} -08/30/2021 15:29:03 - INFO - __main__ - Step 13112: {'lr': 0.0004930788462892375, 'samples': 2517504, 'steps': 13111, 'loss/train': 1.4467664957046509} -08/30/2021 15:29:04 - INFO - __main__ - Step 13113: {'lr': 0.0004930776061947716, 'samples': 2517696, 'steps': 13112, 'loss/train': 0.14597637951374054} -08/30/2021 15:29:05 - INFO - __main__ - Step 13114: {'lr': 0.0004930763659907788, 'samples': 2517888, 'steps': 13113, 'loss/train': 1.8421238660812378} -08/30/2021 15:29:05 - INFO - __main__ - Step 13115: {'lr': 0.0004930751256772593, 'samples': 2518080, 'steps': 13114, 'loss/train': 2.404543876647949} -08/30/2021 15:29:05 - INFO - __main__ - Step 13116: {'lr': 0.0004930738852542141, 'samples': 2518272, 'steps': 13115, 'loss/train': 1.7245795726776123} -08/30/2021 15:29:06 - INFO - __main__ - Step 13117: {'lr': 0.0004930726447216435, 'samples': 2518464, 'steps': 13116, 'loss/train': 0.9352125525474548} -08/30/2021 15:29:07 - INFO - __main__ - Step 13118: {'lr': 0.0004930714040795481, 'samples': 2518656, 'steps': 13117, 'loss/train': 1.5468991994857788} -08/30/2021 15:29:08 - INFO - __main__ - Step 13119: {'lr': 0.0004930701633279285, 'samples': 2518848, 'steps': 13118, 'loss/train': 1.8813652992248535} -08/30/2021 15:29:08 - INFO - __main__ - Step 13120: {'lr': 0.0004930689224667853, 'samples': 2519040, 'steps': 13119, 'loss/train': 1.510832667350769} -08/30/2021 15:29:08 - INFO - __main__ - Step 13121: {'lr': 0.0004930676814961189, 'samples': 2519232, 'steps': 13120, 'loss/train': 1.934361457824707} -08/30/2021 15:29:09 - INFO - __main__ - Step 13122: {'lr': 0.00049306644041593, 'samples': 2519424, 'steps': 13121, 'loss/train': 1.4233644008636475} -08/30/2021 15:29:10 - INFO - __main__ - Step 13123: {'lr': 0.0004930651992262191, 'samples': 2519616, 'steps': 13122, 'loss/train': 1.3029298782348633} -08/30/2021 15:29:11 - INFO - __main__ - Step 13124: {'lr': 0.0004930639579269866, 'samples': 2519808, 'steps': 13123, 'loss/train': 1.943230152130127} -08/30/2021 15:29:11 - INFO - __main__ - Step 13125: {'lr': 0.0004930627165182335, 'samples': 2520000, 'steps': 13124, 'loss/train': 1.8684998750686646} -08/30/2021 15:29:11 - INFO - __main__ - Step 13126: {'lr': 0.00049306147499996, 'samples': 2520192, 'steps': 13125, 'loss/train': 1.570236325263977} -08/30/2021 15:29:12 - INFO - __main__ - Step 13127: {'lr': 0.0004930602333721667, 'samples': 2520384, 'steps': 13126, 'loss/train': 1.9651436805725098} -08/30/2021 15:29:13 - INFO - __main__ - Step 13128: {'lr': 0.0004930589916348542, 'samples': 2520576, 'steps': 13127, 'loss/train': 1.6157217025756836} -08/30/2021 15:29:14 - INFO - __main__ - Step 13129: {'lr': 0.0004930577497880231, 'samples': 2520768, 'steps': 13128, 'loss/train': 1.955784797668457} -08/30/2021 15:29:14 - INFO - __main__ - Step 13130: {'lr': 0.000493056507831674, 'samples': 2520960, 'steps': 13129, 'loss/train': 1.4171680212020874} -08/30/2021 15:29:14 - INFO - __main__ - Step 13131: {'lr': 0.0004930552657658073, 'samples': 2521152, 'steps': 13130, 'loss/train': 1.706404209136963} -08/30/2021 15:29:15 - INFO - __main__ - Step 13132: {'lr': 0.0004930540235904237, 'samples': 2521344, 'steps': 13131, 'loss/train': 0.4153987169265747} -08/30/2021 15:29:17 - INFO - __main__ - Step 13133: {'lr': 0.0004930527813055237, 'samples': 2521536, 'steps': 13132, 'loss/train': 1.846850037574768} -08/30/2021 15:29:18 - INFO - __main__ - Step 13134: {'lr': 0.0004930515389111078, 'samples': 2521728, 'steps': 13133, 'loss/train': 0.9846248030662537} -08/30/2021 15:29:18 - INFO - __main__ - Step 13135: {'lr': 0.0004930502964071767, 'samples': 2521920, 'steps': 13134, 'loss/train': 1.8380756378173828} -08/30/2021 15:29:18 - INFO - __main__ - Step 13136: {'lr': 0.0004930490537937309, 'samples': 2522112, 'steps': 13135, 'loss/train': 1.9091602563858032} -08/30/2021 15:29:19 - INFO - __main__ - Step 13137: {'lr': 0.0004930478110707709, 'samples': 2522304, 'steps': 13136, 'loss/train': 1.7970647811889648} -08/30/2021 15:29:19 - INFO - __main__ - Step 13138: {'lr': 0.0004930465682382973, 'samples': 2522496, 'steps': 13137, 'loss/train': 1.3530611991882324} -08/30/2021 15:29:21 - INFO - __main__ - Step 13139: {'lr': 0.0004930453252963107, 'samples': 2522688, 'steps': 13138, 'loss/train': 1.371092677116394} -08/30/2021 15:29:21 - INFO - __main__ - Step 13140: {'lr': 0.0004930440822448115, 'samples': 2522880, 'steps': 13139, 'loss/train': 1.1301995515823364} -08/30/2021 15:29:21 - INFO - __main__ - Step 13141: {'lr': 0.0004930428390838006, 'samples': 2523072, 'steps': 13140, 'loss/train': 1.8004950284957886} -08/30/2021 15:29:22 - INFO - __main__ - Step 13142: {'lr': 0.0004930415958132782, 'samples': 2523264, 'steps': 13141, 'loss/train': 1.6366088390350342} -08/30/2021 15:29:22 - INFO - __main__ - Step 13143: {'lr': 0.0004930403524332451, 'samples': 2523456, 'steps': 13142, 'loss/train': 1.5675653219223022} -08/30/2021 15:29:22 - INFO - __main__ - Step 13144: {'lr': 0.0004930391089437017, 'samples': 2523648, 'steps': 13143, 'loss/train': 0.7293281555175781} -08/30/2021 15:29:24 - INFO - __main__ - Step 13145: {'lr': 0.0004930378653446487, 'samples': 2523840, 'steps': 13144, 'loss/train': 2.0169146060943604} -08/30/2021 15:29:25 - INFO - __main__ - Step 13146: {'lr': 0.0004930366216360865, 'samples': 2524032, 'steps': 13145, 'loss/train': 0.2024550586938858} -08/30/2021 15:29:25 - INFO - __main__ - Step 13147: {'lr': 0.0004930353778180158, 'samples': 2524224, 'steps': 13146, 'loss/train': 1.6575980186462402} -08/30/2021 15:29:25 - INFO - __main__ - Step 13148: {'lr': 0.0004930341338904371, 'samples': 2524416, 'steps': 13147, 'loss/train': 1.7918614149093628} -08/30/2021 15:29:26 - INFO - __main__ - Step 13149: {'lr': 0.000493032889853351, 'samples': 2524608, 'steps': 13148, 'loss/train': 1.5911606550216675} -08/30/2021 15:29:27 - INFO - __main__ - Step 13150: {'lr': 0.0004930316457067579, 'samples': 2524800, 'steps': 13149, 'loss/train': 2.0211563110351562} -08/30/2021 15:29:28 - INFO - __main__ - Step 13151: {'lr': 0.0004930304014506586, 'samples': 2524992, 'steps': 13150, 'loss/train': 1.477755069732666} -08/30/2021 15:29:28 - INFO - __main__ - Step 13152: {'lr': 0.0004930291570850536, 'samples': 2525184, 'steps': 13151, 'loss/train': 1.3428807258605957} -08/30/2021 15:29:28 - INFO - __main__ - Step 13153: {'lr': 0.0004930279126099433, 'samples': 2525376, 'steps': 13152, 'loss/train': 1.9181922674179077} -08/30/2021 15:29:29 - INFO - __main__ - Step 13154: {'lr': 0.0004930266680253284, 'samples': 2525568, 'steps': 13153, 'loss/train': 2.255140542984009} -08/30/2021 15:29:31 - INFO - __main__ - Step 13155: {'lr': 0.0004930254233312095, 'samples': 2525760, 'steps': 13154, 'loss/train': 1.7637264728546143} -08/30/2021 15:29:31 - INFO - __main__ - Step 13156: {'lr': 0.000493024178527587, 'samples': 2525952, 'steps': 13155, 'loss/train': 1.082656741142273} -08/30/2021 15:29:32 - INFO - __main__ - Step 13157: {'lr': 0.0004930229336144616, 'samples': 2526144, 'steps': 13156, 'loss/train': 0.9817512631416321} -08/30/2021 15:29:32 - INFO - __main__ - Step 13158: {'lr': 0.0004930216885918339, 'samples': 2526336, 'steps': 13157, 'loss/train': 0.7919743061065674} -08/30/2021 15:29:32 - INFO - __main__ - Step 13159: {'lr': 0.0004930204434597042, 'samples': 2526528, 'steps': 13158, 'loss/train': 0.7817718386650085} -08/30/2021 15:29:33 - INFO - __main__ - Step 13160: {'lr': 0.0004930191982180734, 'samples': 2526720, 'steps': 13159, 'loss/train': 1.6986939907073975} -08/30/2021 15:29:34 - INFO - __main__ - Step 13161: {'lr': 0.0004930179528669418, 'samples': 2526912, 'steps': 13160, 'loss/train': 2.3518199920654297} -08/30/2021 15:29:35 - INFO - __main__ - Step 13162: {'lr': 0.0004930167074063101, 'samples': 2527104, 'steps': 13161, 'loss/train': 1.8200459480285645} -08/30/2021 15:29:35 - INFO - __main__ - Step 13163: {'lr': 0.0004930154618361789, 'samples': 2527296, 'steps': 13162, 'loss/train': 1.7531898021697998} -08/30/2021 15:29:35 - INFO - __main__ - Step 13164: {'lr': 0.0004930142161565486, 'samples': 2527488, 'steps': 13163, 'loss/train': 1.6355242729187012} -08/30/2021 15:29:36 - INFO - __main__ - Step 13165: {'lr': 0.0004930129703674198, 'samples': 2527680, 'steps': 13164, 'loss/train': 1.484022855758667} -08/30/2021 15:29:36 - INFO - __main__ - Step 13166: {'lr': 0.0004930117244687931, 'samples': 2527872, 'steps': 13165, 'loss/train': 1.532153844833374} -08/30/2021 15:29:38 - INFO - __main__ - Step 13167: {'lr': 0.0004930104784606692, 'samples': 2528064, 'steps': 13166, 'loss/train': 0.9530429840087891} -08/30/2021 15:29:38 - INFO - __main__ - Step 13168: {'lr': 0.0004930092323430484, 'samples': 2528256, 'steps': 13167, 'loss/train': 1.9393770694732666} -08/30/2021 15:29:38 - INFO - __main__ - Step 13169: {'lr': 0.0004930079861159315, 'samples': 2528448, 'steps': 13168, 'loss/train': 1.4961903095245361} -08/30/2021 15:29:39 - INFO - __main__ - Step 13170: {'lr': 0.0004930067397793188, 'samples': 2528640, 'steps': 13169, 'loss/train': 1.5230586528778076} -08/30/2021 15:29:39 - INFO - __main__ - Step 13171: {'lr': 0.0004930054933332111, 'samples': 2528832, 'steps': 13170, 'loss/train': 1.8054306507110596} -08/30/2021 15:29:40 - INFO - __main__ - Step 13172: {'lr': 0.0004930042467776089, 'samples': 2529024, 'steps': 13171, 'loss/train': 1.5270925760269165} -08/30/2021 15:29:41 - INFO - __main__ - Step 13173: {'lr': 0.0004930030001125128, 'samples': 2529216, 'steps': 13172, 'loss/train': 2.004761219024658} -08/30/2021 15:29:41 - INFO - __main__ - Step 13174: {'lr': 0.000493001753337923, 'samples': 2529408, 'steps': 13173, 'loss/train': 1.9755587577819824} -08/30/2021 15:29:42 - INFO - __main__ - Step 13175: {'lr': 0.0004930005064538406, 'samples': 2529600, 'steps': 13174, 'loss/train': 1.6368324756622314} -08/30/2021 15:29:42 - INFO - __main__ - Step 13176: {'lr': 0.0004929992594602659, 'samples': 2529792, 'steps': 13175, 'loss/train': 2.0778143405914307} -08/30/2021 15:29:44 - INFO - __main__ - Step 13177: {'lr': 0.0004929980123571995, 'samples': 2529984, 'steps': 13176, 'loss/train': 1.456868290901184} -08/30/2021 15:29:44 - INFO - __main__ - Step 13178: {'lr': 0.000492996765144642, 'samples': 2530176, 'steps': 13177, 'loss/train': 1.6746386289596558} -08/30/2021 15:29:44 - INFO - __main__ - Step 13179: {'lr': 0.0004929955178225938, 'samples': 2530368, 'steps': 13178, 'loss/train': 1.5261129140853882} -08/30/2021 15:29:45 - INFO - __main__ - Step 13180: {'lr': 0.0004929942703910556, 'samples': 2530560, 'steps': 13179, 'loss/train': 1.931277871131897} -08/30/2021 15:29:45 - INFO - __main__ - Step 13181: {'lr': 0.0004929930228500279, 'samples': 2530752, 'steps': 13180, 'loss/train': 1.0765554904937744} -08/30/2021 15:29:46 - INFO - __main__ - Step 13182: {'lr': 0.0004929917751995114, 'samples': 2530944, 'steps': 13181, 'loss/train': 1.4679514169692993} -08/30/2021 15:29:47 - INFO - __main__ - Step 13183: {'lr': 0.0004929905274395064, 'samples': 2531136, 'steps': 13182, 'loss/train': 1.5988885164260864} -08/30/2021 15:29:47 - INFO - __main__ - Step 13184: {'lr': 0.0004929892795700137, 'samples': 2531328, 'steps': 13183, 'loss/train': 1.6287188529968262} -08/30/2021 15:29:48 - INFO - __main__ - Step 13185: {'lr': 0.0004929880315910338, 'samples': 2531520, 'steps': 13184, 'loss/train': 2.115199565887451} -08/30/2021 15:29:48 - INFO - __main__ - Step 13186: {'lr': 0.0004929867835025672, 'samples': 2531712, 'steps': 13185, 'loss/train': 1.7262567281723022} -08/30/2021 15:29:49 - INFO - __main__ - Step 13187: {'lr': 0.0004929855353046145, 'samples': 2531904, 'steps': 13186, 'loss/train': 2.0716159343719482} -08/30/2021 15:29:50 - INFO - __main__ - Step 13188: {'lr': 0.0004929842869971763, 'samples': 2532096, 'steps': 13187, 'loss/train': 1.6969057321548462} -08/30/2021 15:29:51 - INFO - __main__ - Step 13189: {'lr': 0.000492983038580253, 'samples': 2532288, 'steps': 13188, 'loss/train': 1.133381962776184} -08/30/2021 15:29:51 - INFO - __main__ - Step 13190: {'lr': 0.0004929817900538455, 'samples': 2532480, 'steps': 13189, 'loss/train': 1.6991007328033447} -08/30/2021 15:29:52 - INFO - __main__ - Step 13191: {'lr': 0.000492980541417954, 'samples': 2532672, 'steps': 13190, 'loss/train': 2.106668472290039} -08/30/2021 15:29:52 - INFO - __main__ - Step 13192: {'lr': 0.0004929792926725794, 'samples': 2532864, 'steps': 13191, 'loss/train': 1.9648419618606567} -08/30/2021 15:29:54 - INFO - __main__ - Step 13193: {'lr': 0.000492978043817722, 'samples': 2533056, 'steps': 13192, 'loss/train': 1.5465891361236572} -08/30/2021 15:29:54 - INFO - __main__ - Step 13194: {'lr': 0.0004929767948533823, 'samples': 2533248, 'steps': 13193, 'loss/train': 0.7830932140350342} -08/30/2021 15:29:54 - INFO - __main__ - Step 13195: {'lr': 0.0004929755457795612, 'samples': 2533440, 'steps': 13194, 'loss/train': 1.7344844341278076} -08/30/2021 15:29:55 - INFO - __main__ - Step 13196: {'lr': 0.0004929742965962589, 'samples': 2533632, 'steps': 13195, 'loss/train': 1.909066081047058} -08/30/2021 15:29:55 - INFO - __main__ - Step 13197: {'lr': 0.0004929730473034763, 'samples': 2533824, 'steps': 13196, 'loss/train': 1.7170289754867554} -08/30/2021 15:29:55 - INFO - __main__ - Step 13198: {'lr': 0.0004929717979012136, 'samples': 2534016, 'steps': 13197, 'loss/train': 1.6677168607711792} -08/30/2021 15:29:57 - INFO - __main__ - Step 13199: {'lr': 0.0004929705483894717, 'samples': 2534208, 'steps': 13198, 'loss/train': 1.4450730085372925} -08/30/2021 15:29:57 - INFO - __main__ - Step 13200: {'lr': 0.000492969298768251, 'samples': 2534400, 'steps': 13199, 'loss/train': 1.698410987854004} -08/30/2021 15:29:58 - INFO - __main__ - Step 13201: {'lr': 0.000492968049037552, 'samples': 2534592, 'steps': 13200, 'loss/train': 2.3205251693725586} -08/30/2021 15:29:58 - INFO - __main__ - Step 13202: {'lr': 0.0004929667991973754, 'samples': 2534784, 'steps': 13201, 'loss/train': 1.383763313293457} -08/30/2021 15:29:58 - INFO - __main__ - Step 13203: {'lr': 0.0004929655492477218, 'samples': 2534976, 'steps': 13202, 'loss/train': 2.1142139434814453} -08/30/2021 15:30:00 - INFO - __main__ - Step 13204: {'lr': 0.0004929642991885916, 'samples': 2535168, 'steps': 13203, 'loss/train': 1.5923293828964233} -08/30/2021 15:30:01 - INFO - __main__ - Step 13205: {'lr': 0.0004929630490199854, 'samples': 2535360, 'steps': 13204, 'loss/train': 1.6323366165161133} -08/30/2021 15:30:01 - INFO - __main__ - Step 13206: {'lr': 0.0004929617987419039, 'samples': 2535552, 'steps': 13205, 'loss/train': 1.70604407787323} -08/30/2021 15:30:01 - INFO - __main__ - Step 13207: {'lr': 0.0004929605483543474, 'samples': 2535744, 'steps': 13206, 'loss/train': 1.908188819885254} -08/30/2021 15:30:02 - INFO - __main__ - Step 13208: {'lr': 0.0004929592978573168, 'samples': 2535936, 'steps': 13207, 'loss/train': 0.18984326720237732} -08/30/2021 15:30:03 - INFO - __main__ - Step 13209: {'lr': 0.0004929580472508124, 'samples': 2536128, 'steps': 13208, 'loss/train': 1.8235244750976562} -08/30/2021 15:30:04 - INFO - __main__ - Step 13210: {'lr': 0.0004929567965348347, 'samples': 2536320, 'steps': 13209, 'loss/train': 1.8458211421966553} -08/30/2021 15:30:04 - INFO - __main__ - Step 13211: {'lr': 0.0004929555457093847, 'samples': 2536512, 'steps': 13210, 'loss/train': 1.812822699546814} -08/30/2021 15:30:05 - INFO - __main__ - Step 13212: {'lr': 0.0004929542947744625, 'samples': 2536704, 'steps': 13211, 'loss/train': 2.154083728790283} -08/30/2021 15:30:05 - INFO - __main__ - Step 13213: {'lr': 0.0004929530437300689, 'samples': 2536896, 'steps': 13212, 'loss/train': 1.3480331897735596} -08/30/2021 15:30:05 - INFO - __main__ - Step 13214: {'lr': 0.0004929517925762045, 'samples': 2537088, 'steps': 13213, 'loss/train': 1.5183898210525513} -08/30/2021 15:30:07 - INFO - __main__ - Step 13215: {'lr': 0.0004929505413128696, 'samples': 2537280, 'steps': 13214, 'loss/train': 0.8376405835151672} -08/30/2021 15:30:07 - INFO - __main__ - Step 13216: {'lr': 0.000492949289940065, 'samples': 2537472, 'steps': 13215, 'loss/train': 1.357436180114746} -08/30/2021 15:30:08 - INFO - __main__ - Step 13217: {'lr': 0.0004929480384577912, 'samples': 2537664, 'steps': 13216, 'loss/train': 1.9467532634735107} -08/30/2021 15:30:08 - INFO - __main__ - Step 13218: {'lr': 0.0004929467868660487, 'samples': 2537856, 'steps': 13217, 'loss/train': 1.9680449962615967} -08/30/2021 15:30:08 - INFO - __main__ - Step 13219: {'lr': 0.0004929455351648383, 'samples': 2538048, 'steps': 13218, 'loss/train': 1.0793286561965942} -08/30/2021 15:30:10 - INFO - __main__ - Step 13220: {'lr': 0.0004929442833541603, 'samples': 2538240, 'steps': 13219, 'loss/train': 2.0653204917907715} -08/30/2021 15:30:10 - INFO - __main__ - Step 13221: {'lr': 0.0004929430314340154, 'samples': 2538432, 'steps': 13220, 'loss/train': 2.175964593887329} -08/30/2021 15:30:11 - INFO - __main__ - Step 13222: {'lr': 0.000492941779404404, 'samples': 2538624, 'steps': 13221, 'loss/train': 1.3470433950424194} -08/30/2021 15:30:11 - INFO - __main__ - Step 13223: {'lr': 0.0004929405272653269, 'samples': 2538816, 'steps': 13222, 'loss/train': 1.9551588296890259} -08/30/2021 15:30:11 - INFO - __main__ - Step 13224: {'lr': 0.0004929392750167845, 'samples': 2539008, 'steps': 13223, 'loss/train': 1.7434378862380981} -08/30/2021 15:30:13 - INFO - __main__ - Step 13225: {'lr': 0.0004929380226587774, 'samples': 2539200, 'steps': 13224, 'loss/train': 1.5585001707077026} -08/30/2021 15:30:14 - INFO - __main__ - Step 13226: {'lr': 0.0004929367701913062, 'samples': 2539392, 'steps': 13225, 'loss/train': 1.1908096075057983} -08/30/2021 15:30:14 - INFO - __main__ - Step 13227: {'lr': 0.0004929355176143714, 'samples': 2539584, 'steps': 13226, 'loss/train': 1.8879069089889526} -08/30/2021 15:30:14 - INFO - __main__ - Step 13228: {'lr': 0.0004929342649279736, 'samples': 2539776, 'steps': 13227, 'loss/train': 1.9522531032562256} -08/30/2021 15:30:15 - INFO - __main__ - Step 13229: {'lr': 0.0004929330121321134, 'samples': 2539968, 'steps': 13228, 'loss/train': 1.3740723133087158} -08/30/2021 15:30:15 - INFO - __main__ - Step 13230: {'lr': 0.0004929317592267913, 'samples': 2540160, 'steps': 13229, 'loss/train': 2.5365686416625977} -08/30/2021 15:30:17 - INFO - __main__ - Step 13231: {'lr': 0.000492930506212008, 'samples': 2540352, 'steps': 13230, 'loss/train': 1.5278126001358032} -08/30/2021 15:30:18 - INFO - __main__ - Step 13232: {'lr': 0.0004929292530877638, 'samples': 2540544, 'steps': 13231, 'loss/train': 1.9534343481063843} -08/30/2021 15:30:18 - INFO - __main__ - Step 13233: {'lr': 0.0004929279998540596, 'samples': 2540736, 'steps': 13232, 'loss/train': 1.5942615270614624} -08/30/2021 15:30:19 - INFO - __main__ - Step 13234: {'lr': 0.0004929267465108956, 'samples': 2540928, 'steps': 13233, 'loss/train': 2.1778907775878906} -08/30/2021 15:30:19 - INFO - __main__ - Step 13235: {'lr': 0.0004929254930582728, 'samples': 2541120, 'steps': 13234, 'loss/train': 1.9903875589370728} -08/30/2021 15:30:19 - INFO - __main__ - Step 13236: {'lr': 0.0004929242394961914, 'samples': 2541312, 'steps': 13235, 'loss/train': 1.5462241172790527} -08/30/2021 15:30:21 - INFO - __main__ - Step 13237: {'lr': 0.000492922985824652, 'samples': 2541504, 'steps': 13236, 'loss/train': 0.9284600615501404} -08/30/2021 15:30:21 - INFO - __main__ - Step 13238: {'lr': 0.0004929217320436553, 'samples': 2541696, 'steps': 13237, 'loss/train': 1.269327163696289} -08/30/2021 15:30:22 - INFO - __main__ - Step 13239: {'lr': 0.0004929204781532018, 'samples': 2541888, 'steps': 13238, 'loss/train': 0.7098487019538879} -08/30/2021 15:30:22 - INFO - __main__ - Step 13240: {'lr': 0.0004929192241532921, 'samples': 2542080, 'steps': 13239, 'loss/train': 1.7692023515701294} -08/30/2021 15:30:22 - INFO - __main__ - Step 13241: {'lr': 0.0004929179700439269, 'samples': 2542272, 'steps': 13240, 'loss/train': 0.8944202661514282} -08/30/2021 15:30:24 - INFO - __main__ - Step 13242: {'lr': 0.0004929167158251065, 'samples': 2542464, 'steps': 13241, 'loss/train': 2.1399567127227783} -08/30/2021 15:30:24 - INFO - __main__ - Step 13243: {'lr': 0.0004929154614968315, 'samples': 2542656, 'steps': 13242, 'loss/train': 1.815641164779663} -08/30/2021 15:30:25 - INFO - __main__ - Step 13244: {'lr': 0.0004929142070591026, 'samples': 2542848, 'steps': 13243, 'loss/train': 1.5281676054000854} -08/30/2021 15:30:25 - INFO - __main__ - Step 13245: {'lr': 0.0004929129525119203, 'samples': 2543040, 'steps': 13244, 'loss/train': 1.5754562616348267} -08/30/2021 15:30:25 - INFO - __main__ - Step 13246: {'lr': 0.0004929116978552851, 'samples': 2543232, 'steps': 13245, 'loss/train': 1.7237863540649414} -08/30/2021 15:30:27 - INFO - __main__ - Step 13247: {'lr': 0.0004929104430891978, 'samples': 2543424, 'steps': 13246, 'loss/train': 1.7179235219955444} -08/30/2021 15:30:27 - INFO - __main__ - Step 13248: {'lr': 0.0004929091882136587, 'samples': 2543616, 'steps': 13247, 'loss/train': 1.0756183862686157} -08/30/2021 15:30:28 - INFO - __main__ - Step 13249: {'lr': 0.0004929079332286685, 'samples': 2543808, 'steps': 13248, 'loss/train': 1.8723208904266357} -08/30/2021 15:30:28 - INFO - __main__ - Step 13250: {'lr': 0.0004929066781342277, 'samples': 2544000, 'steps': 13249, 'loss/train': 1.806351900100708} -08/30/2021 15:30:28 - INFO - __main__ - Step 13251: {'lr': 0.0004929054229303369, 'samples': 2544192, 'steps': 13250, 'loss/train': 1.8154417276382446} -08/30/2021 15:30:29 - INFO - __main__ - Step 13252: {'lr': 0.0004929041676169967, 'samples': 2544384, 'steps': 13251, 'loss/train': 1.8198550939559937} -08/30/2021 15:30:31 - INFO - __main__ - Step 13253: {'lr': 0.0004929029121942077, 'samples': 2544576, 'steps': 13252, 'loss/train': 1.9762464761734009} -08/30/2021 15:30:31 - INFO - __main__ - Step 13254: {'lr': 0.0004929016566619703, 'samples': 2544768, 'steps': 13253, 'loss/train': 0.40915924310684204} -08/30/2021 15:30:32 - INFO - __main__ - Step 13255: {'lr': 0.0004929004010202851, 'samples': 2544960, 'steps': 13254, 'loss/train': 0.6848592162132263} -08/30/2021 15:30:32 - INFO - __main__ - Step 13256: {'lr': 0.0004928991452691528, 'samples': 2545152, 'steps': 13255, 'loss/train': 1.5487536191940308} -08/30/2021 15:30:32 - INFO - __main__ - Step 13257: {'lr': 0.0004928978894085739, 'samples': 2545344, 'steps': 13256, 'loss/train': 1.764366626739502} -08/30/2021 15:30:34 - INFO - __main__ - Step 13258: {'lr': 0.000492896633438549, 'samples': 2545536, 'steps': 13257, 'loss/train': 1.4504001140594482} -08/30/2021 15:30:34 - INFO - __main__ - Step 13259: {'lr': 0.0004928953773590785, 'samples': 2545728, 'steps': 13258, 'loss/train': 1.9216653108596802} -08/30/2021 15:30:35 - INFO - __main__ - Step 13260: {'lr': 0.0004928941211701632, 'samples': 2545920, 'steps': 13259, 'loss/train': 2.251816987991333} -08/30/2021 15:30:35 - INFO - __main__ - Step 13261: {'lr': 0.0004928928648718035, 'samples': 2546112, 'steps': 13260, 'loss/train': 1.874138593673706} -08/30/2021 15:30:35 - INFO - __main__ - Step 13262: {'lr': 0.0004928916084640001, 'samples': 2546304, 'steps': 13261, 'loss/train': 2.1850218772888184} -08/30/2021 15:30:37 - INFO - __main__ - Step 13263: {'lr': 0.0004928903519467534, 'samples': 2546496, 'steps': 13262, 'loss/train': 1.3525229692459106} -08/30/2021 15:30:37 - INFO - __main__ - Step 13264: {'lr': 0.0004928890953200641, 'samples': 2546688, 'steps': 13263, 'loss/train': 2.343693494796753} -08/30/2021 15:30:38 - INFO - __main__ - Step 13265: {'lr': 0.0004928878385839327, 'samples': 2546880, 'steps': 13264, 'loss/train': 1.8137409687042236} -08/30/2021 15:30:38 - INFO - __main__ - Step 13266: {'lr': 0.0004928865817383597, 'samples': 2547072, 'steps': 13265, 'loss/train': 1.2084486484527588} -08/30/2021 15:30:38 - INFO - __main__ - Step 13267: {'lr': 0.0004928853247833459, 'samples': 2547264, 'steps': 13266, 'loss/train': 1.4776631593704224} -08/30/2021 15:30:40 - INFO - __main__ - Step 13268: {'lr': 0.0004928840677188918, 'samples': 2547456, 'steps': 13267, 'loss/train': 1.9044543504714966} -08/30/2021 15:30:41 - INFO - __main__ - Step 13269: {'lr': 0.0004928828105449977, 'samples': 2547648, 'steps': 13268, 'loss/train': 1.7458200454711914} -08/30/2021 15:30:41 - INFO - __main__ - Step 13270: {'lr': 0.0004928815532616644, 'samples': 2547840, 'steps': 13269, 'loss/train': 1.4329379796981812} -08/30/2021 15:30:42 - INFO - __main__ - Step 13271: {'lr': 0.0004928802958688924, 'samples': 2548032, 'steps': 13270, 'loss/train': 1.7306426763534546} -08/30/2021 15:30:42 - INFO - __main__ - Step 13272: {'lr': 0.0004928790383666823, 'samples': 2548224, 'steps': 13271, 'loss/train': 0.7937204241752625} -08/30/2021 15:30:42 - INFO - __main__ - Step 13273: {'lr': 0.0004928777807550348, 'samples': 2548416, 'steps': 13272, 'loss/train': 1.482376217842102} -08/30/2021 15:30:44 - INFO - __main__ - Step 13274: {'lr': 0.0004928765230339502, 'samples': 2548608, 'steps': 13273, 'loss/train': 1.8877966403961182} -08/30/2021 15:30:45 - INFO - __main__ - Step 13275: {'lr': 0.000492875265203429, 'samples': 2548800, 'steps': 13274, 'loss/train': 1.852259635925293} -08/30/2021 15:30:45 - INFO - __main__ - Step 13276: {'lr': 0.0004928740072634722, 'samples': 2548992, 'steps': 13275, 'loss/train': 1.7160547971725464} -08/30/2021 15:30:45 - INFO - __main__ - Step 13277: {'lr': 0.0004928727492140801, 'samples': 2549184, 'steps': 13276, 'loss/train': 1.6651161909103394} -08/30/2021 15:30:46 - INFO - __main__ - Step 13278: {'lr': 0.0004928714910552533, 'samples': 2549376, 'steps': 13277, 'loss/train': 1.5182185173034668} -08/30/2021 15:30:48 - INFO - __main__ - Step 13279: {'lr': 0.0004928702327869922, 'samples': 2549568, 'steps': 13278, 'loss/train': 2.057767391204834} -08/30/2021 15:30:48 - INFO - __main__ - Step 13280: {'lr': 0.0004928689744092976, 'samples': 2549760, 'steps': 13279, 'loss/train': 1.9808582067489624} -08/30/2021 15:30:48 - INFO - __main__ - Step 13281: {'lr': 0.0004928677159221701, 'samples': 2549952, 'steps': 13280, 'loss/train': 2.1056995391845703} -08/30/2021 15:30:49 - INFO - __main__ - Step 13282: {'lr': 0.00049286645732561, 'samples': 2550144, 'steps': 13281, 'loss/train': 1.766992449760437} -08/30/2021 15:30:49 - INFO - __main__ - Step 13283: {'lr': 0.0004928651986196181, 'samples': 2550336, 'steps': 13282, 'loss/train': 1.5733379125595093} -08/30/2021 15:30:51 - INFO - __main__ - Step 13284: {'lr': 0.0004928639398041948, 'samples': 2550528, 'steps': 13283, 'loss/train': 0.18167980015277863} -08/30/2021 15:30:52 - INFO - __main__ - Step 13285: {'lr': 0.0004928626808793409, 'samples': 2550720, 'steps': 13284, 'loss/train': 1.9902777671813965} -08/30/2021 15:30:52 - INFO - __main__ - Step 13286: {'lr': 0.0004928614218450568, 'samples': 2550912, 'steps': 13285, 'loss/train': 0.9557822942733765} -08/30/2021 15:30:52 - INFO - __main__ - Step 13287: {'lr': 0.000492860162701343, 'samples': 2551104, 'steps': 13286, 'loss/train': 1.8120317459106445} -08/30/2021 15:30:53 - INFO - __main__ - Step 13288: {'lr': 0.0004928589034482001, 'samples': 2551296, 'steps': 13287, 'loss/train': 1.8779343366622925} -08/30/2021 15:30:54 - INFO - __main__ - Step 13289: {'lr': 0.000492857644085629, 'samples': 2551488, 'steps': 13288, 'loss/train': 1.497378945350647} -08/30/2021 15:30:55 - INFO - __main__ - Step 13290: {'lr': 0.0004928563846136296, 'samples': 2551680, 'steps': 13289, 'loss/train': 1.435523509979248} -08/30/2021 15:30:55 - INFO - __main__ - Step 13291: {'lr': 0.0004928551250322032, 'samples': 2551872, 'steps': 13290, 'loss/train': 1.588564395904541} -08/30/2021 15:30:55 - INFO - __main__ - Step 13292: {'lr': 0.0004928538653413499, 'samples': 2552064, 'steps': 13291, 'loss/train': 2.1687352657318115} -08/30/2021 15:30:56 - INFO - __main__ - Step 13293: {'lr': 0.0004928526055410704, 'samples': 2552256, 'steps': 13292, 'loss/train': 1.9012430906295776} -08/30/2021 15:30:56 - INFO - __main__ - Step 13294: {'lr': 0.0004928513456313653, 'samples': 2552448, 'steps': 13293, 'loss/train': 1.6171404123306274} -08/30/2021 15:30:58 - INFO - __main__ - Step 13295: {'lr': 0.000492850085612235, 'samples': 2552640, 'steps': 13294, 'loss/train': 1.7512423992156982} -08/30/2021 15:30:58 - INFO - __main__ - Step 13296: {'lr': 0.0004928488254836804, 'samples': 2552832, 'steps': 13295, 'loss/train': 2.2569284439086914} -08/30/2021 15:30:58 - INFO - __main__ - Step 13297: {'lr': 0.0004928475652457017, 'samples': 2553024, 'steps': 13296, 'loss/train': 2.118741750717163} -08/30/2021 15:30:59 - INFO - __main__ - Step 13298: {'lr': 0.0004928463048982998, 'samples': 2553216, 'steps': 13297, 'loss/train': 1.2525237798690796} -08/30/2021 15:30:59 - INFO - __main__ - Step 13299: {'lr': 0.0004928450444414749, 'samples': 2553408, 'steps': 13298, 'loss/train': 1.3978713750839233} -08/30/2021 15:31:00 - INFO - __main__ - Step 13300: {'lr': 0.0004928437838752278, 'samples': 2553600, 'steps': 13299, 'loss/train': 1.324633240699768} -08/30/2021 15:31:01 - INFO - __main__ - Step 13301: {'lr': 0.0004928425231995593, 'samples': 2553792, 'steps': 13300, 'loss/train': 1.0953269004821777} -08/30/2021 15:31:01 - INFO - __main__ - Step 13302: {'lr': 0.0004928412624144694, 'samples': 2553984, 'steps': 13301, 'loss/train': 2.4973647594451904} -08/30/2021 15:31:02 - INFO - __main__ - Step 13303: {'lr': 0.0004928400015199591, 'samples': 2554176, 'steps': 13302, 'loss/train': 1.8358838558197021} -08/30/2021 15:31:02 - INFO - __main__ - Step 13304: {'lr': 0.0004928387405160288, 'samples': 2554368, 'steps': 13303, 'loss/train': 1.4225980043411255} -08/30/2021 15:31:03 - INFO - __main__ - Step 13305: {'lr': 0.0004928374794026792, 'samples': 2554560, 'steps': 13304, 'loss/train': 2.1696431636810303} -08/30/2021 15:31:04 - INFO - __main__ - Step 13306: {'lr': 0.0004928362181799107, 'samples': 2554752, 'steps': 13305, 'loss/train': 1.1681604385375977} -08/30/2021 15:31:04 - INFO - __main__ - Step 13307: {'lr': 0.0004928349568477239, 'samples': 2554944, 'steps': 13306, 'loss/train': 2.1276936531066895} -08/30/2021 15:31:05 - INFO - __main__ - Step 13308: {'lr': 0.0004928336954061195, 'samples': 2555136, 'steps': 13307, 'loss/train': 2.125086784362793} -08/30/2021 15:31:05 - INFO - __main__ - Step 13309: {'lr': 0.000492832433855098, 'samples': 2555328, 'steps': 13308, 'loss/train': 1.6042321920394897} -08/30/2021 15:31:07 - INFO - __main__ - Step 13310: {'lr': 0.0004928311721946599, 'samples': 2555520, 'steps': 13309, 'loss/train': 2.4290051460266113} -08/30/2021 15:31:07 - INFO - __main__ - Step 13311: {'lr': 0.0004928299104248059, 'samples': 2555712, 'steps': 13310, 'loss/train': 1.592270016670227} -08/30/2021 15:31:07 - INFO - __main__ - Step 13312: {'lr': 0.0004928286485455365, 'samples': 2555904, 'steps': 13311, 'loss/train': 1.0809060335159302} -08/30/2021 15:31:08 - INFO - __main__ - Step 13313: {'lr': 0.0004928273865568521, 'samples': 2556096, 'steps': 13312, 'loss/train': 1.4615657329559326} -08/30/2021 15:31:08 - INFO - __main__ - Step 13314: {'lr': 0.0004928261244587536, 'samples': 2556288, 'steps': 13313, 'loss/train': 1.2980906963348389} -08/30/2021 15:31:08 - INFO - __main__ - Step 13315: {'lr': 0.0004928248622512412, 'samples': 2556480, 'steps': 13314, 'loss/train': 1.498451590538025} -08/30/2021 15:31:11 - INFO - __main__ - Step 13316: {'lr': 0.0004928235999343159, 'samples': 2556672, 'steps': 13315, 'loss/train': 2.0136260986328125} -08/30/2021 15:31:11 - INFO - __main__ - Step 13317: {'lr': 0.0004928223375079778, 'samples': 2556864, 'steps': 13316, 'loss/train': 1.6528249979019165} -08/30/2021 15:31:12 - INFO - __main__ - Step 13318: {'lr': 0.0004928210749722278, 'samples': 2557056, 'steps': 13317, 'loss/train': 1.390761137008667} -08/30/2021 15:31:12 - INFO - __main__ - Step 13319: {'lr': 0.0004928198123270664, 'samples': 2557248, 'steps': 13318, 'loss/train': 1.7772823572158813} -08/30/2021 15:31:13 - INFO - __main__ - Step 13320: {'lr': 0.0004928185495724942, 'samples': 2557440, 'steps': 13319, 'loss/train': 1.8425750732421875} -08/30/2021 15:31:13 - INFO - __main__ - Step 13321: {'lr': 0.0004928172867085115, 'samples': 2557632, 'steps': 13320, 'loss/train': 1.2989501953125} -08/30/2021 15:31:13 - INFO - __main__ - Step 13322: {'lr': 0.0004928160237351192, 'samples': 2557824, 'steps': 13321, 'loss/train': 1.7174687385559082} -08/30/2021 15:31:15 - INFO - __main__ - Step 13323: {'lr': 0.0004928147606523179, 'samples': 2558016, 'steps': 13322, 'loss/train': 1.8456381559371948} -08/30/2021 15:31:15 - INFO - __main__ - Step 13324: {'lr': 0.0004928134974601078, 'samples': 2558208, 'steps': 13323, 'loss/train': 1.8499038219451904} -08/30/2021 15:31:16 - INFO - __main__ - Step 13325: {'lr': 0.0004928122341584897, 'samples': 2558400, 'steps': 13324, 'loss/train': 1.5015943050384521} -08/30/2021 15:31:16 - INFO - __main__ - Step 13326: {'lr': 0.0004928109707474643, 'samples': 2558592, 'steps': 13325, 'loss/train': 1.7252732515335083} -08/30/2021 15:31:16 - INFO - __main__ - Step 13327: {'lr': 0.0004928097072270319, 'samples': 2558784, 'steps': 13326, 'loss/train': 1.6393089294433594} -08/30/2021 15:31:18 - INFO - __main__ - Step 13328: {'lr': 0.0004928084435971932, 'samples': 2558976, 'steps': 13327, 'loss/train': 1.2961522340774536} -08/30/2021 15:31:18 - INFO - __main__ - Step 13329: {'lr': 0.0004928071798579488, 'samples': 2559168, 'steps': 13328, 'loss/train': 1.9010658264160156} -08/30/2021 15:31:19 - INFO - __main__ - Step 13330: {'lr': 0.0004928059160092993, 'samples': 2559360, 'steps': 13329, 'loss/train': 3.0207693576812744} -08/30/2021 15:31:19 - INFO - __main__ - Step 13331: {'lr': 0.000492804652051245, 'samples': 2559552, 'steps': 13330, 'loss/train': 1.5045816898345947} -08/30/2021 15:31:19 - INFO - __main__ - Step 13332: {'lr': 0.0004928033879837868, 'samples': 2559744, 'steps': 13331, 'loss/train': 2.1083710193634033} -08/30/2021 15:31:21 - INFO - __main__ - Step 13333: {'lr': 0.0004928021238069251, 'samples': 2559936, 'steps': 13332, 'loss/train': 1.9268851280212402} -08/30/2021 15:31:21 - INFO - __main__ - Step 13334: {'lr': 0.0004928008595206605, 'samples': 2560128, 'steps': 13333, 'loss/train': 2.03450608253479} -08/30/2021 15:31:22 - INFO - __main__ - Step 13335: {'lr': 0.0004927995951249937, 'samples': 2560320, 'steps': 13334, 'loss/train': 1.4016634225845337} -08/30/2021 15:31:22 - INFO - __main__ - Step 13336: {'lr': 0.0004927983306199251, 'samples': 2560512, 'steps': 13335, 'loss/train': 1.840184211730957} -08/30/2021 15:31:22 - INFO - __main__ - Step 13337: {'lr': 0.0004927970660054552, 'samples': 2560704, 'steps': 13336, 'loss/train': 2.3702948093414307} -08/30/2021 15:31:24 - INFO - __main__ - Step 13338: {'lr': 0.0004927958012815849, 'samples': 2560896, 'steps': 13337, 'loss/train': 1.7123851776123047} -08/30/2021 15:31:25 - INFO - __main__ - Step 13339: {'lr': 0.0004927945364483144, 'samples': 2561088, 'steps': 13338, 'loss/train': 1.6064941883087158} -08/30/2021 15:31:25 - INFO - __main__ - Step 13340: {'lr': 0.0004927932715056444, 'samples': 2561280, 'steps': 13339, 'loss/train': 1.7054412364959717} -08/30/2021 15:31:25 - INFO - __main__ - Step 13341: {'lr': 0.0004927920064535756, 'samples': 2561472, 'steps': 13340, 'loss/train': 1.9482789039611816} -08/30/2021 15:31:26 - INFO - __main__ - Step 13342: {'lr': 0.0004927907412921084, 'samples': 2561664, 'steps': 13341, 'loss/train': 2.082087516784668} -08/30/2021 15:31:26 - INFO - __main__ - Step 13343: {'lr': 0.0004927894760212435, 'samples': 2561856, 'steps': 13342, 'loss/train': 2.1705963611602783} -08/30/2021 15:31:28 - INFO - __main__ - Step 13344: {'lr': 0.0004927882106409813, 'samples': 2562048, 'steps': 13343, 'loss/train': 1.5502218008041382} -08/30/2021 15:31:28 - INFO - __main__ - Step 13345: {'lr': 0.0004927869451513226, 'samples': 2562240, 'steps': 13344, 'loss/train': 1.7382903099060059} -08/30/2021 15:31:28 - INFO - __main__ - Step 13346: {'lr': 0.0004927856795522678, 'samples': 2562432, 'steps': 13345, 'loss/train': 1.8929860591888428} -08/30/2021 15:31:29 - INFO - __main__ - Step 13347: {'lr': 0.0004927844138438175, 'samples': 2562624, 'steps': 13346, 'loss/train': 2.2494239807128906} -08/30/2021 15:31:29 - INFO - __main__ - Step 13348: {'lr': 0.0004927831480259723, 'samples': 2562816, 'steps': 13347, 'loss/train': 1.2005528211593628} -08/30/2021 15:31:31 - INFO - __main__ - Step 13349: {'lr': 0.0004927818820987328, 'samples': 2563008, 'steps': 13348, 'loss/train': 1.6468842029571533} -08/30/2021 15:31:31 - INFO - __main__ - Step 13350: {'lr': 0.0004927806160620995, 'samples': 2563200, 'steps': 13349, 'loss/train': 3.6370012760162354} -08/30/2021 15:31:32 - INFO - __main__ - Step 13351: {'lr': 0.0004927793499160729, 'samples': 2563392, 'steps': 13350, 'loss/train': 1.8585752248764038} -08/30/2021 15:31:32 - INFO - __main__ - Step 13352: {'lr': 0.000492778083660654, 'samples': 2563584, 'steps': 13351, 'loss/train': 1.6590094566345215} -08/30/2021 15:31:32 - INFO - __main__ - Step 13353: {'lr': 0.0004927768172958427, 'samples': 2563776, 'steps': 13352, 'loss/train': 2.0702600479125977} -08/30/2021 15:31:34 - INFO - __main__ - Step 13354: {'lr': 0.00049277555082164, 'samples': 2563968, 'steps': 13353, 'loss/train': 2.8682162761688232} -08/30/2021 15:31:35 - INFO - __main__ - Step 13355: {'lr': 0.0004927742842380465, 'samples': 2564160, 'steps': 13354, 'loss/train': 2.250650644302368} -08/30/2021 15:31:35 - INFO - __main__ - Step 13356: {'lr': 0.0004927730175450626, 'samples': 2564352, 'steps': 13355, 'loss/train': 1.4539607763290405} -08/30/2021 15:31:35 - INFO - __main__ - Step 13357: {'lr': 0.0004927717507426887, 'samples': 2564544, 'steps': 13356, 'loss/train': 2.3869025707244873} -08/30/2021 15:31:36 - INFO - __main__ - Step 13358: {'lr': 0.0004927704838309259, 'samples': 2564736, 'steps': 13357, 'loss/train': 0.7346906661987305} -08/30/2021 15:31:36 - INFO - __main__ - Step 13359: {'lr': 0.0004927692168097743, 'samples': 2564928, 'steps': 13358, 'loss/train': 0.4545074701309204} -08/30/2021 15:31:38 - INFO - __main__ - Step 13360: {'lr': 0.0004927679496792347, 'samples': 2565120, 'steps': 13359, 'loss/train': 1.3047525882720947} -08/30/2021 15:31:38 - INFO - __main__ - Step 13361: {'lr': 0.0004927666824393076, 'samples': 2565312, 'steps': 13360, 'loss/train': 2.1561946868896484} -08/30/2021 15:31:38 - INFO - __main__ - Step 13362: {'lr': 0.0004927654150899937, 'samples': 2565504, 'steps': 13361, 'loss/train': 2.065976858139038} -08/30/2021 15:31:39 - INFO - __main__ - Step 13363: {'lr': 0.0004927641476312932, 'samples': 2565696, 'steps': 13362, 'loss/train': 1.631472110748291} -08/30/2021 15:31:39 - INFO - __main__ - Step 13364: {'lr': 0.000492762880063207, 'samples': 2565888, 'steps': 13363, 'loss/train': 1.8592429161071777} -08/30/2021 15:31:40 - INFO - __main__ - Step 13365: {'lr': 0.0004927616123857357, 'samples': 2566080, 'steps': 13364, 'loss/train': 1.8340822458267212} -08/30/2021 15:31:41 - INFO - __main__ - Step 13366: {'lr': 0.0004927603445988797, 'samples': 2566272, 'steps': 13365, 'loss/train': 1.757806658744812} -08/30/2021 15:31:41 - INFO - __main__ - Step 13367: {'lr': 0.0004927590767026396, 'samples': 2566464, 'steps': 13366, 'loss/train': 2.1953835487365723} -08/30/2021 15:31:42 - INFO - __main__ - Step 13368: {'lr': 0.0004927578086970161, 'samples': 2566656, 'steps': 13367, 'loss/train': 1.2725802659988403} -08/30/2021 15:31:42 - INFO - __main__ - Step 13369: {'lr': 0.0004927565405820096, 'samples': 2566848, 'steps': 13368, 'loss/train': 1.6763789653778076} -08/30/2021 15:31:43 - INFO - __main__ - Step 13370: {'lr': 0.0004927552723576207, 'samples': 2567040, 'steps': 13369, 'loss/train': 1.4753245115280151} -08/30/2021 15:31:44 - INFO - __main__ - Step 13371: {'lr': 0.0004927540040238501, 'samples': 2567232, 'steps': 13370, 'loss/train': 1.8064439296722412} -08/30/2021 15:31:44 - INFO - __main__ - Step 13372: {'lr': 0.0004927527355806983, 'samples': 2567424, 'steps': 13371, 'loss/train': 1.9299222230911255} -08/30/2021 15:31:45 - INFO - __main__ - Step 13373: {'lr': 0.0004927514670281659, 'samples': 2567616, 'steps': 13372, 'loss/train': 2.529559373855591} -08/30/2021 15:31:45 - INFO - __main__ - Step 13374: {'lr': 0.0004927501983662534, 'samples': 2567808, 'steps': 13373, 'loss/train': 1.4066401720046997} -08/30/2021 15:31:47 - INFO - __main__ - Step 13375: {'lr': 0.0004927489295949613, 'samples': 2568000, 'steps': 13374, 'loss/train': 1.5471380949020386} -08/30/2021 15:31:47 - INFO - __main__ - Step 13376: {'lr': 0.0004927476607142904, 'samples': 2568192, 'steps': 13375, 'loss/train': 1.9019792079925537} -08/30/2021 15:31:47 - INFO - __main__ - Step 13377: {'lr': 0.0004927463917242411, 'samples': 2568384, 'steps': 13376, 'loss/train': 0.1306307017803192} -08/30/2021 15:31:48 - INFO - __main__ - Step 13378: {'lr': 0.0004927451226248141, 'samples': 2568576, 'steps': 13377, 'loss/train': 1.5481854677200317} -08/30/2021 15:31:48 - INFO - __main__ - Step 13379: {'lr': 0.0004927438534160098, 'samples': 2568768, 'steps': 13378, 'loss/train': 1.2974473237991333} -08/30/2021 15:31:49 - INFO - __main__ - Step 13380: {'lr': 0.0004927425840978289, 'samples': 2568960, 'steps': 13379, 'loss/train': 1.4157050848007202} -08/30/2021 15:31:50 - INFO - __main__ - Step 13381: {'lr': 0.0004927413146702719, 'samples': 2569152, 'steps': 13380, 'loss/train': 1.8663315773010254} -08/30/2021 15:31:50 - INFO - __main__ - Step 13382: {'lr': 0.0004927400451333394, 'samples': 2569344, 'steps': 13381, 'loss/train': 2.2063639163970947} -08/30/2021 15:31:51 - INFO - __main__ - Step 13383: {'lr': 0.0004927387754870321, 'samples': 2569536, 'steps': 13382, 'loss/train': 2.020737648010254} -08/30/2021 15:31:51 - INFO - __main__ - Step 13384: {'lr': 0.0004927375057313504, 'samples': 2569728, 'steps': 13383, 'loss/train': 1.731574535369873} -08/30/2021 15:31:53 - INFO - __main__ - Step 13385: {'lr': 0.0004927362358662948, 'samples': 2569920, 'steps': 13384, 'loss/train': 2.4749715328216553} -08/30/2021 15:31:53 - INFO - __main__ - Step 13386: {'lr': 0.0004927349658918662, 'samples': 2570112, 'steps': 13385, 'loss/train': 1.827108383178711} -08/30/2021 15:31:54 - INFO - __main__ - Step 13387: {'lr': 0.0004927336958080648, 'samples': 2570304, 'steps': 13386, 'loss/train': 0.7441443800926208} -08/30/2021 15:31:54 - INFO - __main__ - Step 13388: {'lr': 0.0004927324256148914, 'samples': 2570496, 'steps': 13387, 'loss/train': 1.480206847190857} -08/30/2021 15:31:54 - INFO - __main__ - Step 13389: {'lr': 0.0004927311553123465, 'samples': 2570688, 'steps': 13388, 'loss/train': 1.9811094999313354} -08/30/2021 15:31:56 - INFO - __main__ - Step 13390: {'lr': 0.0004927298849004307, 'samples': 2570880, 'steps': 13389, 'loss/train': 2.4168450832366943} -08/30/2021 15:31:57 - INFO - __main__ - Step 13391: {'lr': 0.0004927286143791447, 'samples': 2571072, 'steps': 13390, 'loss/train': 1.5338354110717773} -08/30/2021 15:31:57 - INFO - __main__ - Step 13392: {'lr': 0.0004927273437484888, 'samples': 2571264, 'steps': 13391, 'loss/train': 2.638021230697632} -08/30/2021 15:31:57 - INFO - __main__ - Step 13393: {'lr': 0.0004927260730084636, 'samples': 2571456, 'steps': 13392, 'loss/train': 1.6690860986709595} -08/30/2021 15:31:58 - INFO - __main__ - Step 13394: {'lr': 0.0004927248021590699, 'samples': 2571648, 'steps': 13393, 'loss/train': 1.7890369892120361} -08/30/2021 15:31:58 - INFO - __main__ - Step 13395: {'lr': 0.0004927235312003082, 'samples': 2571840, 'steps': 13394, 'loss/train': 1.6572185754776} -08/30/2021 15:32:00 - INFO - __main__ - Step 13396: {'lr': 0.0004927222601321789, 'samples': 2572032, 'steps': 13395, 'loss/train': 1.8415395021438599} -08/30/2021 15:32:00 - INFO - __main__ - Step 13397: {'lr': 0.0004927209889546828, 'samples': 2572224, 'steps': 13396, 'loss/train': 1.4626591205596924} -08/30/2021 15:32:01 - INFO - __main__ - Step 13398: {'lr': 0.0004927197176678203, 'samples': 2572416, 'steps': 13397, 'loss/train': 1.4553471803665161} -08/30/2021 15:32:01 - INFO - __main__ - Step 13399: {'lr': 0.000492718446271592, 'samples': 2572608, 'steps': 13398, 'loss/train': 1.4588000774383545} -08/30/2021 15:32:01 - INFO - __main__ - Step 13400: {'lr': 0.0004927171747659986, 'samples': 2572800, 'steps': 13399, 'loss/train': 1.9691166877746582} -08/30/2021 15:32:03 - INFO - __main__ - Step 13401: {'lr': 0.0004927159031510405, 'samples': 2572992, 'steps': 13400, 'loss/train': 1.2933005094528198} -08/30/2021 15:32:03 - INFO - __main__ - Step 13402: {'lr': 0.0004927146314267184, 'samples': 2573184, 'steps': 13401, 'loss/train': 1.8195914030075073} -08/30/2021 15:32:04 - INFO - __main__ - Step 13403: {'lr': 0.000492713359593033, 'samples': 2573376, 'steps': 13402, 'loss/train': 1.3688124418258667} -08/30/2021 15:32:04 - INFO - __main__ - Step 13404: {'lr': 0.0004927120876499846, 'samples': 2573568, 'steps': 13403, 'loss/train': 1.0743030309677124} -08/30/2021 15:32:04 - INFO - __main__ - Step 13405: {'lr': 0.0004927108155975738, 'samples': 2573760, 'steps': 13404, 'loss/train': 0.2135283201932907} -08/30/2021 15:32:06 - INFO - __main__ - Step 13406: {'lr': 0.0004927095434358012, 'samples': 2573952, 'steps': 13405, 'loss/train': 1.4170094728469849} -08/30/2021 15:32:06 - INFO - __main__ - Step 13407: {'lr': 0.0004927082711646676, 'samples': 2574144, 'steps': 13406, 'loss/train': 1.9869948625564575} -08/30/2021 15:32:07 - INFO - __main__ - Step 13408: {'lr': 0.0004927069987841733, 'samples': 2574336, 'steps': 13407, 'loss/train': 1.0781617164611816} -08/30/2021 15:32:07 - INFO - __main__ - Step 13409: {'lr': 0.0004927057262943189, 'samples': 2574528, 'steps': 13408, 'loss/train': 2.1366934776306152} -08/30/2021 15:32:07 - INFO - __main__ - Step 13410: {'lr': 0.0004927044536951052, 'samples': 2574720, 'steps': 13409, 'loss/train': 1.9036860466003418} -08/30/2021 15:32:09 - INFO - __main__ - Step 13411: {'lr': 0.0004927031809865324, 'samples': 2574912, 'steps': 13410, 'loss/train': 1.7845879793167114} -08/30/2021 15:32:09 - INFO - __main__ - Step 13412: {'lr': 0.0004927019081686015, 'samples': 2575104, 'steps': 13411, 'loss/train': 1.9031624794006348} -08/30/2021 15:32:10 - INFO - __main__ - Step 13413: {'lr': 0.0004927006352413128, 'samples': 2575296, 'steps': 13412, 'loss/train': 1.0926494598388672} -08/30/2021 15:32:10 - INFO - __main__ - Step 13414: {'lr': 0.000492699362204667, 'samples': 2575488, 'steps': 13413, 'loss/train': 1.0936707258224487} -08/30/2021 15:32:10 - INFO - __main__ - Step 13415: {'lr': 0.0004926980890586645, 'samples': 2575680, 'steps': 13414, 'loss/train': 1.6012905836105347} -08/30/2021 15:32:12 - INFO - __main__ - Step 13416: {'lr': 0.000492696815803306, 'samples': 2575872, 'steps': 13415, 'loss/train': 1.9375407695770264} -08/30/2021 15:32:12 - INFO - __main__ - Step 13417: {'lr': 0.0004926955424385921, 'samples': 2576064, 'steps': 13416, 'loss/train': 1.780282974243164} -08/30/2021 15:32:13 - INFO - __main__ - Step 13418: {'lr': 0.0004926942689645234, 'samples': 2576256, 'steps': 13417, 'loss/train': 0.8918399810791016} -08/30/2021 15:32:13 - INFO - __main__ - Step 13419: {'lr': 0.0004926929953811003, 'samples': 2576448, 'steps': 13418, 'loss/train': 1.4750359058380127} -08/30/2021 15:32:13 - INFO - __main__ - Step 13420: {'lr': 0.0004926917216883235, 'samples': 2576640, 'steps': 13419, 'loss/train': 1.820640206336975} -08/30/2021 15:32:15 - INFO - __main__ - Step 13421: {'lr': 0.0004926904478861937, 'samples': 2576832, 'steps': 13420, 'loss/train': 1.9349567890167236} -08/30/2021 15:32:15 - INFO - __main__ - Step 13422: {'lr': 0.0004926891739747111, 'samples': 2577024, 'steps': 13421, 'loss/train': 2.1062088012695312} -08/30/2021 15:32:16 - INFO - __main__ - Step 13423: {'lr': 0.0004926878999538766, 'samples': 2577216, 'steps': 13422, 'loss/train': 1.8544186353683472} -08/30/2021 15:32:16 - INFO - __main__ - Step 13424: {'lr': 0.0004926866258236907, 'samples': 2577408, 'steps': 13423, 'loss/train': 2.040912389755249} -08/30/2021 15:32:16 - INFO - __main__ - Step 13425: {'lr': 0.000492685351584154, 'samples': 2577600, 'steps': 13424, 'loss/train': 1.3988056182861328} -08/30/2021 15:32:18 - INFO - __main__ - Step 13426: {'lr': 0.000492684077235267, 'samples': 2577792, 'steps': 13425, 'loss/train': 0.15480317175388336} -08/30/2021 15:32:18 - INFO - __main__ - Step 13427: {'lr': 0.0004926828027770302, 'samples': 2577984, 'steps': 13426, 'loss/train': 1.557691216468811} -08/30/2021 15:32:19 - INFO - __main__ - Step 13428: {'lr': 0.0004926815282094443, 'samples': 2578176, 'steps': 13427, 'loss/train': 1.267248272895813} -08/30/2021 15:32:19 - INFO - __main__ - Step 13429: {'lr': 0.00049268025353251, 'samples': 2578368, 'steps': 13428, 'loss/train': 1.7829160690307617} -08/30/2021 15:32:19 - INFO - __main__ - Step 13430: {'lr': 0.0004926789787462276, 'samples': 2578560, 'steps': 13429, 'loss/train': 1.8831775188446045} -08/30/2021 15:32:21 - INFO - __main__ - Step 13431: {'lr': 0.0004926777038505978, 'samples': 2578752, 'steps': 13430, 'loss/train': 2.025161027908325} -08/30/2021 15:32:22 - INFO - __main__ - Step 13432: {'lr': 0.0004926764288456212, 'samples': 2578944, 'steps': 13431, 'loss/train': 1.5182650089263916} -08/30/2021 15:32:22 - INFO - __main__ - Step 13433: {'lr': 0.0004926751537312982, 'samples': 2579136, 'steps': 13432, 'loss/train': 2.0059070587158203} -08/30/2021 15:32:22 - INFO - __main__ - Step 13434: {'lr': 0.0004926738785076297, 'samples': 2579328, 'steps': 13433, 'loss/train': 1.5889866352081299} -08/30/2021 15:32:23 - INFO - __main__ - Step 13435: {'lr': 0.000492672603174616, 'samples': 2579520, 'steps': 13434, 'loss/train': 1.8432821035385132} -08/30/2021 15:32:23 - INFO - __main__ - Step 13436: {'lr': 0.0004926713277322579, 'samples': 2579712, 'steps': 13435, 'loss/train': 1.587931513786316} -08/30/2021 15:32:25 - INFO - __main__ - Step 13437: {'lr': 0.0004926700521805557, 'samples': 2579904, 'steps': 13436, 'loss/train': 0.8050898909568787} -08/30/2021 15:32:25 - INFO - __main__ - Step 13438: {'lr': 0.0004926687765195102, 'samples': 2580096, 'steps': 13437, 'loss/train': 1.083593487739563} -08/30/2021 15:32:26 - INFO - __main__ - Step 13439: {'lr': 0.0004926675007491218, 'samples': 2580288, 'steps': 13438, 'loss/train': 1.3361473083496094} -08/30/2021 15:32:26 - INFO - __main__ - Step 13440: {'lr': 0.0004926662248693912, 'samples': 2580480, 'steps': 13439, 'loss/train': 2.625636577606201} -08/30/2021 15:32:26 - INFO - __main__ - Step 13441: {'lr': 0.000492664948880319, 'samples': 2580672, 'steps': 13440, 'loss/train': 0.5153382420539856} -08/30/2021 15:32:28 - INFO - __main__ - Step 13442: {'lr': 0.0004926636727819057, 'samples': 2580864, 'steps': 13441, 'loss/train': 1.1688904762268066} -08/30/2021 15:32:28 - INFO - __main__ - Step 13443: {'lr': 0.0004926623965741519, 'samples': 2581056, 'steps': 13442, 'loss/train': 0.3777546286582947} -08/30/2021 15:32:29 - INFO - __main__ - Step 13444: {'lr': 0.0004926611202570582, 'samples': 2581248, 'steps': 13443, 'loss/train': 2.0682897567749023} -08/30/2021 15:32:29 - INFO - __main__ - Step 13445: {'lr': 0.0004926598438306252, 'samples': 2581440, 'steps': 13444, 'loss/train': 1.3861676454544067} -08/30/2021 15:32:29 - INFO - __main__ - Step 13446: {'lr': 0.0004926585672948532, 'samples': 2581632, 'steps': 13445, 'loss/train': 1.8295286893844604} -08/30/2021 15:32:32 - INFO - __main__ - Step 13447: {'lr': 0.0004926572906497432, 'samples': 2581824, 'steps': 13446, 'loss/train': 2.2387988567352295} -08/30/2021 15:32:32 - INFO - __main__ - Step 13448: {'lr': 0.0004926560138952955, 'samples': 2582016, 'steps': 13447, 'loss/train': 1.6616758108139038} -08/30/2021 15:32:32 - INFO - __main__ - Step 13449: {'lr': 0.0004926547370315106, 'samples': 2582208, 'steps': 13448, 'loss/train': 1.9965187311172485} -08/30/2021 15:32:33 - INFO - __main__ - Step 13450: {'lr': 0.0004926534600583894, 'samples': 2582400, 'steps': 13449, 'loss/train': 1.5119333267211914} -08/30/2021 15:32:33 - INFO - __main__ - Step 13451: {'lr': 0.0004926521829759323, 'samples': 2582592, 'steps': 13450, 'loss/train': 0.17454367876052856} -08/30/2021 15:32:35 - INFO - __main__ - Step 13452: {'lr': 0.0004926509057841397, 'samples': 2582784, 'steps': 13451, 'loss/train': 0.9735919237136841} -08/30/2021 15:32:35 - INFO - __main__ - Step 13453: {'lr': 0.0004926496284830125, 'samples': 2582976, 'steps': 13452, 'loss/train': 1.9807783365249634} -08/30/2021 15:32:36 - INFO - __main__ - Step 13454: {'lr': 0.0004926483510725511, 'samples': 2583168, 'steps': 13453, 'loss/train': 2.1969621181488037} -08/30/2021 15:32:36 - INFO - __main__ - Step 13455: {'lr': 0.000492647073552756, 'samples': 2583360, 'steps': 13454, 'loss/train': 1.5524709224700928} -08/30/2021 15:32:36 - INFO - __main__ - Step 13456: {'lr': 0.000492645795923628, 'samples': 2583552, 'steps': 13455, 'loss/train': 1.983012318611145} -08/30/2021 15:32:37 - INFO - __main__ - Step 13457: {'lr': 0.0004926445181851675, 'samples': 2583744, 'steps': 13456, 'loss/train': 1.7045586109161377} -08/30/2021 15:32:38 - INFO - __main__ - Step 13458: {'lr': 0.0004926432403373752, 'samples': 2583936, 'steps': 13457, 'loss/train': 0.1535819172859192} -08/30/2021 15:32:39 - INFO - __main__ - Step 13459: {'lr': 0.0004926419623802515, 'samples': 2584128, 'steps': 13458, 'loss/train': 2.1512367725372314} -08/30/2021 15:32:39 - INFO - __main__ - Step 13460: {'lr': 0.0004926406843137971, 'samples': 2584320, 'steps': 13459, 'loss/train': 1.4353790283203125} -08/30/2021 15:32:40 - INFO - __main__ - Step 13461: {'lr': 0.0004926394061380126, 'samples': 2584512, 'steps': 13460, 'loss/train': 1.5081475973129272} -08/30/2021 15:32:40 - INFO - __main__ - Step 13462: {'lr': 0.0004926381278528984, 'samples': 2584704, 'steps': 13461, 'loss/train': 1.1380120515823364} -08/30/2021 15:32:42 - INFO - __main__ - Step 13463: {'lr': 0.0004926368494584553, 'samples': 2584896, 'steps': 13462, 'loss/train': 0.14483055472373962} -08/30/2021 15:32:42 - INFO - __main__ - Step 13464: {'lr': 0.0004926355709546838, 'samples': 2585088, 'steps': 13463, 'loss/train': 1.4653459787368774} -08/30/2021 15:32:43 - INFO - __main__ - Step 13465: {'lr': 0.0004926342923415844, 'samples': 2585280, 'steps': 13464, 'loss/train': 1.9759973287582397} -08/30/2021 15:32:43 - INFO - __main__ - Step 13466: {'lr': 0.0004926330136191577, 'samples': 2585472, 'steps': 13465, 'loss/train': 1.9447349309921265} -08/30/2021 15:32:43 - INFO - __main__ - Step 13467: {'lr': 0.0004926317347874044, 'samples': 2585664, 'steps': 13466, 'loss/train': 3.166593074798584} -08/30/2021 15:32:44 - INFO - __main__ - Step 13468: {'lr': 0.000492630455846325, 'samples': 2585856, 'steps': 13467, 'loss/train': 0.10132548213005066} -08/30/2021 15:32:45 - INFO - __main__ - Step 13469: {'lr': 0.0004926291767959199, 'samples': 2586048, 'steps': 13468, 'loss/train': 1.5672332048416138} -08/30/2021 15:32:46 - INFO - __main__ - Step 13470: {'lr': 0.00049262789763619, 'samples': 2586240, 'steps': 13469, 'loss/train': 1.7698413133621216} -08/30/2021 15:32:46 - INFO - __main__ - Step 13471: {'lr': 0.0004926266183671356, 'samples': 2586432, 'steps': 13470, 'loss/train': 2.4681591987609863} -08/30/2021 15:32:46 - INFO - __main__ - Step 13472: {'lr': 0.0004926253389887575, 'samples': 2586624, 'steps': 13471, 'loss/train': 1.5869358777999878} -08/30/2021 15:32:47 - INFO - __main__ - Step 13473: {'lr': 0.0004926240595010561, 'samples': 2586816, 'steps': 13472, 'loss/train': 1.713945746421814} -08/30/2021 15:32:48 - INFO - __main__ - Step 13474: {'lr': 0.000492622779904032, 'samples': 2587008, 'steps': 13473, 'loss/train': 1.8002439737319946} -08/30/2021 15:32:49 - INFO - __main__ - Step 13475: {'lr': 0.000492621500197686, 'samples': 2587200, 'steps': 13474, 'loss/train': 1.5905848741531372} -08/30/2021 15:32:49 - INFO - __main__ - Step 13476: {'lr': 0.0004926202203820182, 'samples': 2587392, 'steps': 13475, 'loss/train': 1.6016812324523926} -08/30/2021 15:32:49 - INFO - __main__ - Step 13477: {'lr': 0.0004926189404570297, 'samples': 2587584, 'steps': 13476, 'loss/train': 1.763638973236084} -08/30/2021 15:32:50 - INFO - __main__ - Step 13478: {'lr': 0.0004926176604227208, 'samples': 2587776, 'steps': 13477, 'loss/train': 2.030625343322754} -08/30/2021 15:32:51 - INFO - __main__ - Step 13479: {'lr': 0.0004926163802790922, 'samples': 2587968, 'steps': 13478, 'loss/train': 2.518698215484619} -08/30/2021 15:32:52 - INFO - __main__ - Step 13480: {'lr': 0.0004926151000261442, 'samples': 2588160, 'steps': 13479, 'loss/train': 1.3181692361831665} -08/30/2021 15:32:52 - INFO - __main__ - Step 13481: {'lr': 0.0004926138196638777, 'samples': 2588352, 'steps': 13480, 'loss/train': 1.6662728786468506} -08/30/2021 15:32:52 - INFO - __main__ - Step 13482: {'lr': 0.0004926125391922932, 'samples': 2588544, 'steps': 13481, 'loss/train': 1.7330400943756104} -08/30/2021 15:32:53 - INFO - __main__ - Step 13483: {'lr': 0.0004926112586113912, 'samples': 2588736, 'steps': 13482, 'loss/train': 1.8911123275756836} -08/30/2021 15:32:55 - INFO - __main__ - Step 13484: {'lr': 0.0004926099779211723, 'samples': 2588928, 'steps': 13483, 'loss/train': 1.4070862531661987} -08/30/2021 15:32:55 - INFO - __main__ - Step 13485: {'lr': 0.0004926086971216371, 'samples': 2589120, 'steps': 13484, 'loss/train': 1.8312996625900269} -08/30/2021 15:32:55 - INFO - __main__ - Step 13486: {'lr': 0.0004926074162127862, 'samples': 2589312, 'steps': 13485, 'loss/train': 1.3259183168411255} -08/30/2021 15:32:56 - INFO - __main__ - Step 13487: {'lr': 0.0004926061351946201, 'samples': 2589504, 'steps': 13486, 'loss/train': 1.5153173208236694} -08/30/2021 15:32:56 - INFO - __main__ - Step 13488: {'lr': 0.0004926048540671394, 'samples': 2589696, 'steps': 13487, 'loss/train': 0.09712362289428711} -08/30/2021 15:32:56 - INFO - __main__ - Step 13489: {'lr': 0.0004926035728303447, 'samples': 2589888, 'steps': 13488, 'loss/train': 1.635308027267456} -08/30/2021 15:32:57 - INFO - __main__ - Step 13490: {'lr': 0.0004926022914842366, 'samples': 2590080, 'steps': 13489, 'loss/train': 1.9806077480316162} -08/30/2021 15:32:58 - INFO - __main__ - Step 13491: {'lr': 0.0004926010100288156, 'samples': 2590272, 'steps': 13490, 'loss/train': 2.0295376777648926} -08/30/2021 15:32:59 - INFO - __main__ - Step 13492: {'lr': 0.0004925997284640823, 'samples': 2590464, 'steps': 13491, 'loss/train': 1.9048993587493896} -08/30/2021 15:32:59 - INFO - __main__ - Step 13493: {'lr': 0.0004925984467900374, 'samples': 2590656, 'steps': 13492, 'loss/train': 1.0696717500686646} -08/30/2021 15:32:59 - INFO - __main__ - Step 13494: {'lr': 0.0004925971650066814, 'samples': 2590848, 'steps': 13493, 'loss/train': 1.2702785730361938} -08/30/2021 15:33:00 - INFO - __main__ - Step 13495: {'lr': 0.0004925958831140147, 'samples': 2591040, 'steps': 13494, 'loss/train': 1.4568878412246704} -08/30/2021 15:33:01 - INFO - __main__ - Step 13496: {'lr': 0.0004925946011120382, 'samples': 2591232, 'steps': 13495, 'loss/train': 0.07764939963817596} -08/30/2021 15:33:02 - INFO - __main__ - Step 13497: {'lr': 0.0004925933190007523, 'samples': 2591424, 'steps': 13496, 'loss/train': 1.8755857944488525} -08/30/2021 15:33:02 - INFO - __main__ - Step 13498: {'lr': 0.0004925920367801575, 'samples': 2591616, 'steps': 13497, 'loss/train': 1.6979717016220093} -08/30/2021 15:33:02 - INFO - __main__ - Step 13499: {'lr': 0.0004925907544502545, 'samples': 2591808, 'steps': 13498, 'loss/train': 2.2595162391662598} -08/30/2021 15:33:03 - INFO - __main__ - Step 13500: {'lr': 0.000492589472011044, 'samples': 2592000, 'steps': 13499, 'loss/train': 1.2787915468215942} -08/30/2021 15:33:04 - INFO - __main__ - Step 13501: {'lr': 0.0004925881894625263, 'samples': 2592192, 'steps': 13500, 'loss/train': 1.5989959239959717} -08/30/2021 15:33:05 - INFO - __main__ - Step 13502: {'lr': 0.0004925869068047021, 'samples': 2592384, 'steps': 13501, 'loss/train': 1.7259631156921387} -08/30/2021 15:33:05 - INFO - __main__ - Step 13503: {'lr': 0.000492585624037572, 'samples': 2592576, 'steps': 13502, 'loss/train': 1.824569582939148} -08/30/2021 15:33:05 - INFO - __main__ - Step 13504: {'lr': 0.0004925843411611366, 'samples': 2592768, 'steps': 13503, 'loss/train': 1.6618465185165405} -08/30/2021 15:33:06 - INFO - __main__ - Step 13505: {'lr': 0.0004925830581753964, 'samples': 2592960, 'steps': 13504, 'loss/train': 1.47261643409729} -08/30/2021 15:33:08 - INFO - __main__ - Step 13506: {'lr': 0.000492581775080352, 'samples': 2593152, 'steps': 13505, 'loss/train': 1.3551136255264282} -08/30/2021 15:33:08 - INFO - __main__ - Step 13507: {'lr': 0.000492580491876004, 'samples': 2593344, 'steps': 13506, 'loss/train': 1.8640018701553345} -08/30/2021 15:33:09 - INFO - __main__ - Step 13508: {'lr': 0.000492579208562353, 'samples': 2593536, 'steps': 13507, 'loss/train': 0.9833238124847412} -08/30/2021 15:33:09 - INFO - __main__ - Step 13509: {'lr': 0.0004925779251393995, 'samples': 2593728, 'steps': 13508, 'loss/train': 1.9962507486343384} -08/30/2021 15:33:09 - INFO - __main__ - Step 13510: {'lr': 0.0004925766416071441, 'samples': 2593920, 'steps': 13509, 'loss/train': 0.13176283240318298} -08/30/2021 15:33:11 - INFO - __main__ - Step 13511: {'lr': 0.0004925753579655876, 'samples': 2594112, 'steps': 13510, 'loss/train': 1.688368797302246} -08/30/2021 15:33:11 - INFO - __main__ - Step 13512: {'lr': 0.0004925740742147302, 'samples': 2594304, 'steps': 13511, 'loss/train': 1.932279109954834} -08/30/2021 15:33:12 - INFO - __main__ - Step 13513: {'lr': 0.0004925727903545727, 'samples': 2594496, 'steps': 13512, 'loss/train': 1.8428903818130493} -08/30/2021 15:33:12 - INFO - __main__ - Step 13514: {'lr': 0.0004925715063851157, 'samples': 2594688, 'steps': 13513, 'loss/train': 2.994810104370117} -08/30/2021 15:33:12 - INFO - __main__ - Step 13515: {'lr': 0.0004925702223063597, 'samples': 2594880, 'steps': 13514, 'loss/train': 1.7586320638656616} -08/30/2021 15:33:14 - INFO - __main__ - Step 13516: {'lr': 0.0004925689381183052, 'samples': 2595072, 'steps': 13515, 'loss/train': 1.5178900957107544} -08/30/2021 15:33:14 - INFO - __main__ - Step 13517: {'lr': 0.0004925676538209531, 'samples': 2595264, 'steps': 13516, 'loss/train': 1.4516875743865967} -08/30/2021 15:33:15 - INFO - __main__ - Step 13518: {'lr': 0.0004925663694143036, 'samples': 2595456, 'steps': 13517, 'loss/train': 0.3572317063808441} -08/30/2021 15:33:15 - INFO - __main__ - Step 13519: {'lr': 0.0004925650848983575, 'samples': 2595648, 'steps': 13518, 'loss/train': 5.944174766540527} -08/30/2021 15:33:15 - INFO - __main__ - Step 13520: {'lr': 0.0004925638002731153, 'samples': 2595840, 'steps': 13519, 'loss/train': 3.11750864982605} -08/30/2021 15:33:16 - INFO - __main__ - Step 13521: {'lr': 0.0004925625155385775, 'samples': 2596032, 'steps': 13520, 'loss/train': 2.209549903869629} -08/30/2021 15:33:17 - INFO - __main__ - Step 13522: {'lr': 0.0004925612306947449, 'samples': 2596224, 'steps': 13521, 'loss/train': 2.039141893386841} -08/30/2021 15:33:18 - INFO - __main__ - Step 13523: {'lr': 0.0004925599457416179, 'samples': 2596416, 'steps': 13522, 'loss/train': 1.6940282583236694} -08/30/2021 15:33:18 - INFO - __main__ - Step 13524: {'lr': 0.0004925586606791972, 'samples': 2596608, 'steps': 13523, 'loss/train': 1.8162835836410522} -08/30/2021 15:33:18 - INFO - __main__ - Step 13525: {'lr': 0.0004925573755074832, 'samples': 2596800, 'steps': 13524, 'loss/train': 1.530030608177185} -08/30/2021 15:33:19 - INFO - __main__ - Step 13526: {'lr': 0.0004925560902264766, 'samples': 2596992, 'steps': 13525, 'loss/train': 1.6636945009231567} -08/30/2021 15:33:20 - INFO - __main__ - Step 13527: {'lr': 0.000492554804836178, 'samples': 2597184, 'steps': 13526, 'loss/train': 1.7782299518585205} -08/30/2021 15:33:21 - INFO - __main__ - Step 13528: {'lr': 0.000492553519336588, 'samples': 2597376, 'steps': 13527, 'loss/train': 1.6822110414505005} -08/30/2021 15:33:21 - INFO - __main__ - Step 13529: {'lr': 0.000492552233727707, 'samples': 2597568, 'steps': 13528, 'loss/train': 1.5328527688980103} -08/30/2021 15:33:21 - INFO - __main__ - Step 13530: {'lr': 0.0004925509480095358, 'samples': 2597760, 'steps': 13529, 'loss/train': 1.6794860363006592} -08/30/2021 15:33:22 - INFO - __main__ - Step 13531: {'lr': 0.0004925496621820749, 'samples': 2597952, 'steps': 13530, 'loss/train': 1.9116847515106201} -08/30/2021 15:33:24 - INFO - __main__ - Step 13532: {'lr': 0.0004925483762453249, 'samples': 2598144, 'steps': 13531, 'loss/train': 1.8638628721237183} -08/30/2021 15:33:24 - INFO - __main__ - Step 13533: {'lr': 0.0004925470901992863, 'samples': 2598336, 'steps': 13532, 'loss/train': 1.8651126623153687} -08/30/2021 15:33:24 - INFO - __main__ - Step 13534: {'lr': 0.0004925458040439596, 'samples': 2598528, 'steps': 13533, 'loss/train': 1.7516535520553589} -08/30/2021 15:33:25 - INFO - __main__ - Step 13535: {'lr': 0.0004925445177793457, 'samples': 2598720, 'steps': 13534, 'loss/train': 3.865978956222534} -08/30/2021 15:33:25 - INFO - __main__ - Step 13536: {'lr': 0.0004925432314054448, 'samples': 2598912, 'steps': 13535, 'loss/train': 1.8925580978393555} -08/30/2021 15:33:25 - INFO - __main__ - Step 13537: {'lr': 0.0004925419449222578, 'samples': 2599104, 'steps': 13536, 'loss/train': 0.10232044756412506} -08/30/2021 15:33:27 - INFO - __main__ - Step 13538: {'lr': 0.0004925406583297851, 'samples': 2599296, 'steps': 13537, 'loss/train': 1.7366762161254883} -08/30/2021 15:33:27 - INFO - __main__ - Step 13539: {'lr': 0.0004925393716280274, 'samples': 2599488, 'steps': 13538, 'loss/train': 1.4790434837341309} -08/30/2021 15:33:28 - INFO - __main__ - Step 13540: {'lr': 0.0004925380848169851, 'samples': 2599680, 'steps': 13539, 'loss/train': 1.6714898347854614} -08/30/2021 15:33:28 - INFO - __main__ - Step 13541: {'lr': 0.0004925367978966588, 'samples': 2599872, 'steps': 13540, 'loss/train': 1.2758488655090332} -08/30/2021 15:33:28 - INFO - __main__ - Step 13542: {'lr': 0.0004925355108670493, 'samples': 2600064, 'steps': 13541, 'loss/train': 1.4123115539550781} -08/30/2021 15:33:30 - INFO - __main__ - Step 13543: {'lr': 0.0004925342237281571, 'samples': 2600256, 'steps': 13542, 'loss/train': 1.858891487121582} -08/30/2021 15:33:30 - INFO - __main__ - Step 13544: {'lr': 0.0004925329364799825, 'samples': 2600448, 'steps': 13543, 'loss/train': 1.4883283376693726} -08/30/2021 15:33:31 - INFO - __main__ - Step 13545: {'lr': 0.0004925316491225265, 'samples': 2600640, 'steps': 13544, 'loss/train': 1.4505428075790405} -08/30/2021 15:33:31 - INFO - __main__ - Step 13546: {'lr': 0.0004925303616557893, 'samples': 2600832, 'steps': 13545, 'loss/train': 2.4108376502990723} -08/30/2021 15:33:31 - INFO - __main__ - Step 13547: {'lr': 0.0004925290740797718, 'samples': 2601024, 'steps': 13546, 'loss/train': 2.0243844985961914} -08/30/2021 15:33:32 - INFO - __main__ - Step 13548: {'lr': 0.0004925277863944745, 'samples': 2601216, 'steps': 13547, 'loss/train': 1.008447527885437} -08/30/2021 15:33:33 - INFO - __main__ - Step 13549: {'lr': 0.0004925264985998978, 'samples': 2601408, 'steps': 13548, 'loss/train': 2.024259328842163} -08/30/2021 15:33:34 - INFO - __main__ - Step 13550: {'lr': 0.0004925252106960425, 'samples': 2601600, 'steps': 13549, 'loss/train': 1.6532448530197144} -08/30/2021 15:33:34 - INFO - __main__ - Step 13551: {'lr': 0.000492523922682909, 'samples': 2601792, 'steps': 13550, 'loss/train': 0.10432249307632446} -08/30/2021 15:33:35 - INFO - __main__ - Step 13552: {'lr': 0.0004925226345604979, 'samples': 2601984, 'steps': 13551, 'loss/train': 2.243321418762207} -08/30/2021 15:33:35 - INFO - __main__ - Step 13553: {'lr': 0.0004925213463288099, 'samples': 2602176, 'steps': 13552, 'loss/train': 1.8855124711990356} -08/30/2021 15:33:36 - INFO - __main__ - Step 13554: {'lr': 0.0004925200579878456, 'samples': 2602368, 'steps': 13553, 'loss/train': 1.4332842826843262} -08/30/2021 15:33:37 - INFO - __main__ - Step 13555: {'lr': 0.0004925187695376055, 'samples': 2602560, 'steps': 13554, 'loss/train': 1.4411249160766602} -08/30/2021 15:33:37 - INFO - __main__ - Step 13556: {'lr': 0.0004925174809780901, 'samples': 2602752, 'steps': 13555, 'loss/train': 1.4498666524887085} -08/30/2021 15:33:38 - INFO - __main__ - Step 13557: {'lr': 0.0004925161923093001, 'samples': 2602944, 'steps': 13556, 'loss/train': 1.8133999109268188} -08/30/2021 15:33:38 - INFO - __main__ - Step 13558: {'lr': 0.000492514903531236, 'samples': 2603136, 'steps': 13557, 'loss/train': 1.8084253072738647} -08/30/2021 15:33:40 - INFO - __main__ - Step 13559: {'lr': 0.0004925136146438986, 'samples': 2603328, 'steps': 13558, 'loss/train': 1.520235538482666} -08/30/2021 15:33:41 - INFO - __main__ - Step 13560: {'lr': 0.0004925123256472881, 'samples': 2603520, 'steps': 13559, 'loss/train': 1.945859432220459} -08/30/2021 15:33:41 - INFO - __main__ - Step 13561: {'lr': 0.0004925110365414054, 'samples': 2603712, 'steps': 13560, 'loss/train': 1.7827258110046387} -08/30/2021 15:33:42 - INFO - __main__ - Step 13562: {'lr': 0.0004925097473262509, 'samples': 2603904, 'steps': 13561, 'loss/train': 1.188539743423462} -08/30/2021 15:33:42 - INFO - __main__ - Step 13563: {'lr': 0.0004925084580018253, 'samples': 2604096, 'steps': 13562, 'loss/train': 2.1434900760650635} -08/30/2021 15:33:42 - INFO - __main__ - Step 13564: {'lr': 0.0004925071685681292, 'samples': 2604288, 'steps': 13563, 'loss/train': 2.2147574424743652} -08/30/2021 15:33:44 - INFO - __main__ - Step 13565: {'lr': 0.000492505879025163, 'samples': 2604480, 'steps': 13564, 'loss/train': 0.2813052237033844} -08/30/2021 15:33:44 - INFO - __main__ - Step 13566: {'lr': 0.0004925045893729274, 'samples': 2604672, 'steps': 13565, 'loss/train': 1.7352817058563232} -08/30/2021 15:33:45 - INFO - __main__ - Step 13567: {'lr': 0.000492503299611423, 'samples': 2604864, 'steps': 13566, 'loss/train': 1.5272668600082397} -08/30/2021 15:33:45 - INFO - __main__ - Step 13568: {'lr': 0.0004925020097406504, 'samples': 2605056, 'steps': 13567, 'loss/train': 2.014237880706787} -08/30/2021 15:33:46 - INFO - __main__ - Step 13569: {'lr': 0.00049250071976061, 'samples': 2605248, 'steps': 13568, 'loss/train': 1.9641761779785156} -08/30/2021 15:33:47 - INFO - __main__ - Step 13570: {'lr': 0.0004924994296713026, 'samples': 2605440, 'steps': 13569, 'loss/train': 1.3411521911621094} -08/30/2021 15:33:47 - INFO - __main__ - Step 13571: {'lr': 0.0004924981394727288, 'samples': 2605632, 'steps': 13570, 'loss/train': 2.0921950340270996} -08/30/2021 15:33:48 - INFO - __main__ - Step 13572: {'lr': 0.0004924968491648889, 'samples': 2605824, 'steps': 13571, 'loss/train': 1.5525544881820679} -08/30/2021 15:33:48 - INFO - __main__ - Step 13573: {'lr': 0.0004924955587477837, 'samples': 2606016, 'steps': 13572, 'loss/train': 1.8229926824569702} -08/30/2021 15:33:49 - INFO - __main__ - Step 13574: {'lr': 0.0004924942682214138, 'samples': 2606208, 'steps': 13573, 'loss/train': 1.407418131828308} -08/30/2021 15:33:50 - INFO - __main__ - Step 13575: {'lr': 0.0004924929775857798, 'samples': 2606400, 'steps': 13574, 'loss/train': 1.6291581392288208} -08/30/2021 15:33:51 - INFO - __main__ - Step 13576: {'lr': 0.0004924916868408821, 'samples': 2606592, 'steps': 13575, 'loss/train': 1.8845282793045044} -08/30/2021 15:33:51 - INFO - __main__ - Step 13577: {'lr': 0.0004924903959867214, 'samples': 2606784, 'steps': 13576, 'loss/train': 2.195474624633789} -08/30/2021 15:33:51 - INFO - __main__ - Step 13578: {'lr': 0.0004924891050232984, 'samples': 2606976, 'steps': 13577, 'loss/train': 2.0111098289489746} -08/30/2021 15:33:52 - INFO - __main__ - Step 13579: {'lr': 0.0004924878139506134, 'samples': 2607168, 'steps': 13578, 'loss/train': 1.620241403579712} -08/30/2021 15:33:52 - INFO - __main__ - Step 13580: {'lr': 0.0004924865227686671, 'samples': 2607360, 'steps': 13579, 'loss/train': 1.8174797296524048} -08/30/2021 15:33:53 - INFO - __main__ - Step 13581: {'lr': 0.0004924852314774602, 'samples': 2607552, 'steps': 13580, 'loss/train': 1.1066776514053345} -08/30/2021 15:33:54 - INFO - __main__ - Step 13582: {'lr': 0.0004924839400769932, 'samples': 2607744, 'steps': 13581, 'loss/train': 1.4693632125854492} -08/30/2021 15:33:54 - INFO - __main__ - Step 13583: {'lr': 0.0004924826485672667, 'samples': 2607936, 'steps': 13582, 'loss/train': 1.5049018859863281} -08/30/2021 15:33:55 - INFO - __main__ - Step 13584: {'lr': 0.0004924813569482812, 'samples': 2608128, 'steps': 13583, 'loss/train': 1.9511942863464355} -08/30/2021 15:33:55 - INFO - __main__ - Step 13585: {'lr': 0.0004924800652200373, 'samples': 2608320, 'steps': 13584, 'loss/train': 1.3383973836898804} -08/30/2021 15:33:57 - INFO - __main__ - Step 13586: {'lr': 0.0004924787733825357, 'samples': 2608512, 'steps': 13585, 'loss/train': 1.1023023128509521} -08/30/2021 15:33:57 - INFO - __main__ - Step 13587: {'lr': 0.0004924774814357768, 'samples': 2608704, 'steps': 13586, 'loss/train': 1.8889728784561157} -08/30/2021 15:33:57 - INFO - __main__ - Step 13588: {'lr': 0.0004924761893797615, 'samples': 2608896, 'steps': 13587, 'loss/train': 2.334665060043335} -08/30/2021 15:33:58 - INFO - __main__ - Step 13589: {'lr': 0.00049247489721449, 'samples': 2609088, 'steps': 13588, 'loss/train': 1.6174975633621216} -08/30/2021 15:33:58 - INFO - __main__ - Step 13590: {'lr': 0.0004924736049399631, 'samples': 2609280, 'steps': 13589, 'loss/train': 1.8216828107833862} -08/30/2021 15:34:00 - INFO - __main__ - Step 13591: {'lr': 0.0004924723125561813, 'samples': 2609472, 'steps': 13590, 'loss/train': 1.5053640604019165} -08/30/2021 15:34:00 - INFO - __main__ - Step 13592: {'lr': 0.0004924710200631453, 'samples': 2609664, 'steps': 13591, 'loss/train': 1.7296819686889648} -08/30/2021 15:34:01 - INFO - __main__ - Step 13593: {'lr': 0.0004924697274608556, 'samples': 2609856, 'steps': 13592, 'loss/train': 1.9816350936889648} -08/30/2021 15:34:01 - INFO - __main__ - Step 13594: {'lr': 0.0004924684347493126, 'samples': 2610048, 'steps': 13593, 'loss/train': 1.0792206525802612} -08/30/2021 15:34:01 - INFO - __main__ - Step 13595: {'lr': 0.0004924671419285172, 'samples': 2610240, 'steps': 13594, 'loss/train': 1.7045694589614868} -08/30/2021 15:34:03 - INFO - __main__ - Step 13596: {'lr': 0.0004924658489984699, 'samples': 2610432, 'steps': 13595, 'loss/train': 2.1342239379882812} -08/30/2021 15:34:03 - INFO - __main__ - Step 13597: {'lr': 0.0004924645559591712, 'samples': 2610624, 'steps': 13596, 'loss/train': 1.6696661710739136} -08/30/2021 15:34:03 - INFO - __main__ - Step 13598: {'lr': 0.0004924632628106217, 'samples': 2610816, 'steps': 13597, 'loss/train': 1.7132092714309692} -08/30/2021 15:34:04 - INFO - __main__ - Step 13599: {'lr': 0.000492461969552822, 'samples': 2611008, 'steps': 13598, 'loss/train': 0.9362173080444336} -08/30/2021 15:34:04 - INFO - __main__ - Step 13600: {'lr': 0.0004924606761857726, 'samples': 2611200, 'steps': 13599, 'loss/train': 1.4645830392837524} -08/30/2021 15:34:06 - INFO - __main__ - Step 13601: {'lr': 0.0004924593827094744, 'samples': 2611392, 'steps': 13600, 'loss/train': 1.4075853824615479} -08/30/2021 15:34:06 - INFO - __main__ - Step 13602: {'lr': 0.0004924580891239274, 'samples': 2611584, 'steps': 13601, 'loss/train': 1.5761439800262451} -08/30/2021 15:34:06 - INFO - __main__ - Step 13603: {'lr': 0.0004924567954291328, 'samples': 2611776, 'steps': 13602, 'loss/train': 1.1367765665054321} -08/30/2021 15:34:07 - INFO - __main__ - Step 13604: {'lr': 0.0004924555016250908, 'samples': 2611968, 'steps': 13603, 'loss/train': 1.0156999826431274} -08/30/2021 15:34:07 - INFO - __main__ - Step 13605: {'lr': 0.0004924542077118021, 'samples': 2612160, 'steps': 13604, 'loss/train': 1.5204416513442993} -08/30/2021 15:34:09 - INFO - __main__ - Step 13606: {'lr': 0.0004924529136892673, 'samples': 2612352, 'steps': 13605, 'loss/train': 1.3079928159713745} -08/30/2021 15:34:09 - INFO - __main__ - Step 13607: {'lr': 0.0004924516195574869, 'samples': 2612544, 'steps': 13606, 'loss/train': 5.3268280029296875} -08/30/2021 15:34:09 - INFO - __main__ - Step 13608: {'lr': 0.0004924503253164614, 'samples': 2612736, 'steps': 13607, 'loss/train': 0.18579594790935516} -08/30/2021 15:34:10 - INFO - __main__ - Step 13609: {'lr': 0.0004924490309661918, 'samples': 2612928, 'steps': 13608, 'loss/train': 1.557999849319458} -08/30/2021 15:34:10 - INFO - __main__ - Step 13610: {'lr': 0.0004924477365066783, 'samples': 2613120, 'steps': 13609, 'loss/train': 0.18215464055538177} -08/30/2021 15:34:12 - INFO - __main__ - Step 13611: {'lr': 0.0004924464419379217, 'samples': 2613312, 'steps': 13610, 'loss/train': 1.7966129779815674} -08/30/2021 15:34:12 - INFO - __main__ - Step 13612: {'lr': 0.0004924451472599222, 'samples': 2613504, 'steps': 13611, 'loss/train': 1.552573323249817} -08/30/2021 15:34:12 - INFO - __main__ - Step 13613: {'lr': 0.000492443852472681, 'samples': 2613696, 'steps': 13612, 'loss/train': 1.795635461807251} -08/30/2021 15:34:13 - INFO - __main__ - Step 13614: {'lr': 0.000492442557576198, 'samples': 2613888, 'steps': 13613, 'loss/train': 1.6038355827331543} -08/30/2021 15:34:13 - INFO - __main__ - Step 13615: {'lr': 0.0004924412625704744, 'samples': 2614080, 'steps': 13614, 'loss/train': 2.2988336086273193} -08/30/2021 15:34:15 - INFO - __main__ - Step 13616: {'lr': 0.0004924399674555103, 'samples': 2614272, 'steps': 13615, 'loss/train': 1.9128919839859009} -08/30/2021 15:34:16 - INFO - __main__ - Step 13617: {'lr': 0.0004924386722313066, 'samples': 2614464, 'steps': 13616, 'loss/train': 1.461970329284668} -08/30/2021 15:34:16 - INFO - __main__ - Step 13618: {'lr': 0.0004924373768978638, 'samples': 2614656, 'steps': 13617, 'loss/train': 1.7205674648284912} -08/30/2021 15:34:16 - INFO - __main__ - Step 13619: {'lr': 0.0004924360814551825, 'samples': 2614848, 'steps': 13618, 'loss/train': 1.3666102886199951} -08/30/2021 15:34:17 - INFO - __main__ - Step 13620: {'lr': 0.0004924347859032631, 'samples': 2615040, 'steps': 13619, 'loss/train': 2.179389476776123} -08/30/2021 15:34:17 - INFO - __main__ - Step 13621: {'lr': 0.0004924334902421065, 'samples': 2615232, 'steps': 13620, 'loss/train': 2.01278018951416} -08/30/2021 15:34:19 - INFO - __main__ - Step 13622: {'lr': 0.0004924321944717129, 'samples': 2615424, 'steps': 13621, 'loss/train': 0.9595762491226196} -08/30/2021 15:34:19 - INFO - __main__ - Step 13623: {'lr': 0.0004924308985920832, 'samples': 2615616, 'steps': 13622, 'loss/train': 2.0263359546661377} -08/30/2021 15:34:19 - INFO - __main__ - Step 13624: {'lr': 0.0004924296026032179, 'samples': 2615808, 'steps': 13623, 'loss/train': 1.9515252113342285} -08/30/2021 15:34:20 - INFO - __main__ - Step 13625: {'lr': 0.0004924283065051176, 'samples': 2616000, 'steps': 13624, 'loss/train': 1.8134857416152954} -08/30/2021 15:34:20 - INFO - __main__ - Step 13626: {'lr': 0.0004924270102977827, 'samples': 2616192, 'steps': 13625, 'loss/train': 1.8927422761917114} -08/30/2021 15:34:22 - INFO - __main__ - Step 13627: {'lr': 0.0004924257139812141, 'samples': 2616384, 'steps': 13626, 'loss/train': 1.8158823251724243} -08/30/2021 15:34:22 - INFO - __main__ - Step 13628: {'lr': 0.0004924244175554121, 'samples': 2616576, 'steps': 13627, 'loss/train': 1.0761092901229858} -08/30/2021 15:34:22 - INFO - __main__ - Step 13629: {'lr': 0.0004924231210203775, 'samples': 2616768, 'steps': 13628, 'loss/train': 1.7435681819915771} -08/30/2021 15:34:23 - INFO - __main__ - Step 13630: {'lr': 0.0004924218243761106, 'samples': 2616960, 'steps': 13629, 'loss/train': 1.5496809482574463} -08/30/2021 15:34:23 - INFO - __main__ - Step 13631: {'lr': 0.0004924205276226123, 'samples': 2617152, 'steps': 13630, 'loss/train': 2.409818649291992} -08/30/2021 15:34:25 - INFO - __main__ - Step 13632: {'lr': 0.000492419230759883, 'samples': 2617344, 'steps': 13631, 'loss/train': 0.7975999712944031} -08/30/2021 15:34:25 - INFO - __main__ - Step 13633: {'lr': 0.0004924179337879234, 'samples': 2617536, 'steps': 13632, 'loss/train': 1.728769063949585} -08/30/2021 15:34:26 - INFO - __main__ - Step 13634: {'lr': 0.000492416636706734, 'samples': 2617728, 'steps': 13633, 'loss/train': 1.2326794862747192} -08/30/2021 15:34:26 - INFO - __main__ - Step 13635: {'lr': 0.0004924153395163153, 'samples': 2617920, 'steps': 13634, 'loss/train': 1.1788344383239746} -08/30/2021 15:34:27 - INFO - __main__ - Step 13636: {'lr': 0.0004924140422166681, 'samples': 2618112, 'steps': 13635, 'loss/train': 1.7727967500686646} -08/30/2021 15:34:27 - INFO - __main__ - Step 13637: {'lr': 0.0004924127448077929, 'samples': 2618304, 'steps': 13636, 'loss/train': 1.20018470287323} -08/30/2021 15:34:29 - INFO - __main__ - Step 13638: {'lr': 0.0004924114472896902, 'samples': 2618496, 'steps': 13637, 'loss/train': 1.5733697414398193} -08/30/2021 15:34:29 - INFO - __main__ - Step 13639: {'lr': 0.0004924101496623606, 'samples': 2618688, 'steps': 13638, 'loss/train': 1.8506971597671509} -08/30/2021 15:34:30 - INFO - __main__ - Step 13640: {'lr': 0.0004924088519258049, 'samples': 2618880, 'steps': 13639, 'loss/train': 1.184861421585083} -08/30/2021 15:34:30 - INFO - __main__ - Step 13641: {'lr': 0.0004924075540800233, 'samples': 2619072, 'steps': 13640, 'loss/train': 1.7108304500579834} -08/30/2021 15:34:30 - INFO - __main__ - Step 13642: {'lr': 0.0004924062561250167, 'samples': 2619264, 'steps': 13641, 'loss/train': 1.9534341096878052} -08/30/2021 15:34:31 - INFO - __main__ - Step 13643: {'lr': 0.0004924049580607855, 'samples': 2619456, 'steps': 13642, 'loss/train': 0.7120783925056458} -08/30/2021 15:34:32 - INFO - __main__ - Step 13644: {'lr': 0.0004924036598873305, 'samples': 2619648, 'steps': 13643, 'loss/train': 0.24787519872188568} -08/30/2021 15:34:33 - INFO - __main__ - Step 13645: {'lr': 0.0004924023616046521, 'samples': 2619840, 'steps': 13644, 'loss/train': 1.3333410024642944} -08/30/2021 15:34:33 - INFO - __main__ - Step 13646: {'lr': 0.000492401063212751, 'samples': 2620032, 'steps': 13645, 'loss/train': 0.9179432988166809} -08/30/2021 15:34:33 - INFO - __main__ - Step 13647: {'lr': 0.0004923997647116276, 'samples': 2620224, 'steps': 13646, 'loss/train': 1.2959872484207153} -08/30/2021 15:34:34 - INFO - __main__ - Step 13648: {'lr': 0.0004923984661012827, 'samples': 2620416, 'steps': 13647, 'loss/train': 1.8445854187011719} -08/30/2021 15:34:35 - INFO - __main__ - Step 13649: {'lr': 0.0004923971673817167, 'samples': 2620608, 'steps': 13648, 'loss/train': 1.988378643989563} -08/30/2021 15:34:36 - INFO - __main__ - Step 13650: {'lr': 0.0004923958685529303, 'samples': 2620800, 'steps': 13649, 'loss/train': 1.8842787742614746} -08/30/2021 15:34:36 - INFO - __main__ - Step 13651: {'lr': 0.0004923945696149241, 'samples': 2620992, 'steps': 13650, 'loss/train': 1.9136470556259155} -08/30/2021 15:34:36 - INFO - __main__ - Step 13652: {'lr': 0.0004923932705676986, 'samples': 2621184, 'steps': 13651, 'loss/train': 1.5448200702667236} -08/30/2021 15:34:37 - INFO - __main__ - Step 13653: {'lr': 0.0004923919714112545, 'samples': 2621376, 'steps': 13652, 'loss/train': 1.7074371576309204} -08/30/2021 15:34:38 - INFO - __main__ - Step 13654: {'lr': 0.0004923906721455922, 'samples': 2621568, 'steps': 13653, 'loss/train': 1.8044511079788208} -08/30/2021 15:34:39 - INFO - __main__ - Step 13655: {'lr': 0.0004923893727707125, 'samples': 2621760, 'steps': 13654, 'loss/train': 1.8527477979660034} -08/30/2021 15:34:39 - INFO - __main__ - Step 13656: {'lr': 0.0004923880732866159, 'samples': 2621952, 'steps': 13655, 'loss/train': 1.6376972198486328} -08/30/2021 15:34:39 - INFO - __main__ - Step 13657: {'lr': 0.0004923867736933029, 'samples': 2622144, 'steps': 13656, 'loss/train': 1.3884831666946411} -08/30/2021 15:34:40 - INFO - __main__ - Step 13658: {'lr': 0.0004923854739907743, 'samples': 2622336, 'steps': 13657, 'loss/train': 1.9756426811218262} -08/30/2021 15:34:41 - INFO - __main__ - Step 13659: {'lr': 0.0004923841741790304, 'samples': 2622528, 'steps': 13658, 'loss/train': 1.6669288873672485} -08/30/2021 15:34:42 - INFO - __main__ - Step 13660: {'lr': 0.0004923828742580719, 'samples': 2622720, 'steps': 13659, 'loss/train': 1.7132149934768677} -08/30/2021 15:34:42 - INFO - __main__ - Step 13661: {'lr': 0.0004923815742278996, 'samples': 2622912, 'steps': 13660, 'loss/train': 1.8713726997375488} -08/30/2021 15:34:42 - INFO - __main__ - Step 13662: {'lr': 0.0004923802740885139, 'samples': 2623104, 'steps': 13661, 'loss/train': 1.4689429998397827} -08/30/2021 15:34:43 - INFO - __main__ - Step 13663: {'lr': 0.0004923789738399152, 'samples': 2623296, 'steps': 13662, 'loss/train': 1.1093848943710327} -08/30/2021 15:34:43 - INFO - __main__ - Step 13664: {'lr': 0.0004923776734821044, 'samples': 2623488, 'steps': 13663, 'loss/train': 1.5304033756256104} -08/30/2021 15:34:45 - INFO - __main__ - Step 13665: {'lr': 0.0004923763730150819, 'samples': 2623680, 'steps': 13664, 'loss/train': 1.599599003791809} -08/30/2021 15:34:45 - INFO - __main__ - Step 13666: {'lr': 0.0004923750724388483, 'samples': 2623872, 'steps': 13665, 'loss/train': 1.955889105796814} -08/30/2021 15:34:46 - INFO - __main__ - Step 13667: {'lr': 0.0004923737717534044, 'samples': 2624064, 'steps': 13666, 'loss/train': 2.132965087890625} -08/30/2021 15:34:46 - INFO - __main__ - Step 13668: {'lr': 0.0004923724709587504, 'samples': 2624256, 'steps': 13667, 'loss/train': 1.6331837177276611} -08/30/2021 15:34:46 - INFO - __main__ - Step 13669: {'lr': 0.0004923711700548873, 'samples': 2624448, 'steps': 13668, 'loss/train': 1.400579810142517} -08/30/2021 15:34:48 - INFO - __main__ - Step 13670: {'lr': 0.0004923698690418154, 'samples': 2624640, 'steps': 13669, 'loss/train': 1.7198896408081055} -08/30/2021 15:34:48 - INFO - __main__ - Step 13671: {'lr': 0.0004923685679195355, 'samples': 2624832, 'steps': 13670, 'loss/train': 2.168217420578003} -08/30/2021 15:34:49 - INFO - __main__ - Step 13672: {'lr': 0.0004923672666880479, 'samples': 2625024, 'steps': 13671, 'loss/train': 1.213516116142273} -08/30/2021 15:34:49 - INFO - __main__ - Step 13673: {'lr': 0.0004923659653473533, 'samples': 2625216, 'steps': 13672, 'loss/train': 1.551790475845337} -08/30/2021 15:34:50 - INFO - __main__ - Step 13674: {'lr': 0.0004923646638974524, 'samples': 2625408, 'steps': 13673, 'loss/train': 2.2469582557678223} -08/30/2021 15:34:51 - INFO - __main__ - Step 13675: {'lr': 0.0004923633623383459, 'samples': 2625600, 'steps': 13674, 'loss/train': 1.7807055711746216} -08/30/2021 15:34:52 - INFO - __main__ - Step 13676: {'lr': 0.0004923620606700341, 'samples': 2625792, 'steps': 13675, 'loss/train': 1.5575268268585205} -08/30/2021 15:34:52 - INFO - __main__ - Step 13677: {'lr': 0.0004923607588925177, 'samples': 2625984, 'steps': 13676, 'loss/train': 2.6210319995880127} -08/30/2021 15:34:52 - INFO - __main__ - Step 13678: {'lr': 0.0004923594570057972, 'samples': 2626176, 'steps': 13677, 'loss/train': 2.1359925270080566} -08/30/2021 15:34:53 - INFO - __main__ - Step 13679: {'lr': 0.0004923581550098733, 'samples': 2626368, 'steps': 13678, 'loss/train': 0.1307481974363327} -08/30/2021 15:34:55 - INFO - __main__ - Step 13680: {'lr': 0.0004923568529047466, 'samples': 2626560, 'steps': 13679, 'loss/train': 1.6401782035827637} -08/30/2021 15:34:55 - INFO - __main__ - Step 13681: {'lr': 0.0004923555506904176, 'samples': 2626752, 'steps': 13680, 'loss/train': 0.12490972131490707} -08/30/2021 15:34:56 - INFO - __main__ - Step 13682: {'lr': 0.0004923542483668869, 'samples': 2626944, 'steps': 13681, 'loss/train': 0.09010914713144302} -08/30/2021 15:34:56 - INFO - __main__ - Step 13683: {'lr': 0.0004923529459341553, 'samples': 2627136, 'steps': 13682, 'loss/train': 1.6802605390548706} -08/30/2021 15:34:56 - INFO - __main__ - Step 13684: {'lr': 0.000492351643392223, 'samples': 2627328, 'steps': 13683, 'loss/train': 1.671370506286621} -08/30/2021 15:34:57 - INFO - __main__ - Step 13685: {'lr': 0.0004923503407410908, 'samples': 2627520, 'steps': 13684, 'loss/train': 1.8083133697509766} -08/30/2021 15:34:57 - INFO - __main__ - Step 13686: {'lr': 0.0004923490379807594, 'samples': 2627712, 'steps': 13685, 'loss/train': 0.9506597518920898} -08/30/2021 15:34:58 - INFO - __main__ - Step 13687: {'lr': 0.0004923477351112291, 'samples': 2627904, 'steps': 13686, 'loss/train': 2.1542840003967285} -08/30/2021 15:34:59 - INFO - __main__ - Step 13688: {'lr': 0.0004923464321325008, 'samples': 2628096, 'steps': 13687, 'loss/train': 1.3836222887039185} -08/30/2021 15:34:59 - INFO - __main__ - Step 13689: {'lr': 0.0004923451290445749, 'samples': 2628288, 'steps': 13688, 'loss/train': 1.8518695831298828} -08/30/2021 15:35:00 - INFO - __main__ - Step 13690: {'lr': 0.000492343825847452, 'samples': 2628480, 'steps': 13689, 'loss/train': 1.8045462369918823} -08/30/2021 15:35:00 - INFO - __main__ - Step 13691: {'lr': 0.0004923425225411328, 'samples': 2628672, 'steps': 13690, 'loss/train': 1.5389764308929443} -08/30/2021 15:35:02 - INFO - __main__ - Step 13692: {'lr': 0.0004923412191256176, 'samples': 2628864, 'steps': 13691, 'loss/train': 2.1948177814483643} -08/30/2021 15:35:03 - INFO - __main__ - Step 13693: {'lr': 0.0004923399156009073, 'samples': 2629056, 'steps': 13692, 'loss/train': 1.0094873905181885} -08/30/2021 15:35:03 - INFO - __main__ - Step 13694: {'lr': 0.0004923386119670024, 'samples': 2629248, 'steps': 13693, 'loss/train': 0.15823443233966827} -08/30/2021 15:35:03 - INFO - __main__ - Step 13695: {'lr': 0.0004923373082239035, 'samples': 2629440, 'steps': 13694, 'loss/train': 0.6393691301345825} -08/30/2021 15:35:04 - INFO - __main__ - Step 13696: {'lr': 0.000492336004371611, 'samples': 2629632, 'steps': 13695, 'loss/train': 1.8347361087799072} -08/30/2021 15:35:06 - INFO - __main__ - Step 13697: {'lr': 0.0004923347004101257, 'samples': 2629824, 'steps': 13696, 'loss/train': 1.632712483406067} -08/30/2021 15:35:06 - INFO - __main__ - Step 13698: {'lr': 0.0004923333963394482, 'samples': 2630016, 'steps': 13697, 'loss/train': 1.9935790300369263} -08/30/2021 15:35:06 - INFO - __main__ - Step 13699: {'lr': 0.000492332092159579, 'samples': 2630208, 'steps': 13698, 'loss/train': 1.5431437492370605} -08/30/2021 15:35:07 - INFO - __main__ - Step 13700: {'lr': 0.0004923307878705186, 'samples': 2630400, 'steps': 13699, 'loss/train': 1.884891152381897} -08/30/2021 15:35:07 - INFO - __main__ - Step 13701: {'lr': 0.0004923294834722678, 'samples': 2630592, 'steps': 13700, 'loss/train': 1.852683424949646} -08/30/2021 15:35:07 - INFO - __main__ - Step 13702: {'lr': 0.000492328178964827, 'samples': 2630784, 'steps': 13701, 'loss/train': 1.8306818008422852} -08/30/2021 15:35:09 - INFO - __main__ - Step 13703: {'lr': 0.0004923268743481969, 'samples': 2630976, 'steps': 13702, 'loss/train': 0.10214895755052567} -08/30/2021 15:35:10 - INFO - __main__ - Step 13704: {'lr': 0.000492325569622378, 'samples': 2631168, 'steps': 13703, 'loss/train': 1.338849663734436} -08/30/2021 15:35:10 - INFO - __main__ - Step 13705: {'lr': 0.0004923242647873709, 'samples': 2631360, 'steps': 13704, 'loss/train': 2.2124781608581543} -08/30/2021 15:35:10 - INFO - __main__ - Step 13706: {'lr': 0.0004923229598431763, 'samples': 2631552, 'steps': 13705, 'loss/train': 1.8244792222976685} -08/30/2021 15:35:11 - INFO - __main__ - Step 13707: {'lr': 0.0004923216547897948, 'samples': 2631744, 'steps': 13706, 'loss/train': 1.1003340482711792} -08/30/2021 15:35:12 - INFO - __main__ - Step 13708: {'lr': 0.0004923203496272267, 'samples': 2631936, 'steps': 13707, 'loss/train': 1.254780888557434} -08/30/2021 15:35:12 - INFO - __main__ - Step 13709: {'lr': 0.0004923190443554729, 'samples': 2632128, 'steps': 13708, 'loss/train': 1.9208908081054688} -08/30/2021 15:35:13 - INFO - __main__ - Step 13710: {'lr': 0.0004923177389745339, 'samples': 2632320, 'steps': 13709, 'loss/train': 1.4887737035751343} -08/30/2021 15:35:13 - INFO - __main__ - Step 13711: {'lr': 0.0004923164334844103, 'samples': 2632512, 'steps': 13710, 'loss/train': 1.7068501710891724} -08/30/2021 15:35:13 - INFO - __main__ - Step 13712: {'lr': 0.0004923151278851025, 'samples': 2632704, 'steps': 13711, 'loss/train': 2.020146131515503} -08/30/2021 15:35:15 - INFO - __main__ - Step 13713: {'lr': 0.0004923138221766114, 'samples': 2632896, 'steps': 13712, 'loss/train': 1.5657011270523071} -08/30/2021 15:35:16 - INFO - __main__ - Step 13714: {'lr': 0.0004923125163589373, 'samples': 2633088, 'steps': 13713, 'loss/train': 2.091078758239746} -08/30/2021 15:35:16 - INFO - __main__ - Step 13715: {'lr': 0.0004923112104320811, 'samples': 2633280, 'steps': 13714, 'loss/train': 1.5669457912445068} -08/30/2021 15:35:16 - INFO - __main__ - Step 13716: {'lr': 0.000492309904396043, 'samples': 2633472, 'steps': 13715, 'loss/train': 1.9935438632965088} -08/30/2021 15:35:17 - INFO - __main__ - Step 13717: {'lr': 0.0004923085982508239, 'samples': 2633664, 'steps': 13716, 'loss/train': 1.3683717250823975} -08/30/2021 15:35:17 - INFO - __main__ - Step 13718: {'lr': 0.0004923072919964243, 'samples': 2633856, 'steps': 13717, 'loss/train': 5.963078498840332} -08/30/2021 15:35:19 - INFO - __main__ - Step 13719: {'lr': 0.0004923059856328447, 'samples': 2634048, 'steps': 13718, 'loss/train': 2.031951427459717} -08/30/2021 15:35:19 - INFO - __main__ - Step 13720: {'lr': 0.0004923046791600859, 'samples': 2634240, 'steps': 13719, 'loss/train': 1.8273379802703857} -08/30/2021 15:35:19 - INFO - __main__ - Step 13721: {'lr': 0.0004923033725781482, 'samples': 2634432, 'steps': 13720, 'loss/train': 1.4259757995605469} -08/30/2021 15:35:20 - INFO - __main__ - Step 13722: {'lr': 0.0004923020658870324, 'samples': 2634624, 'steps': 13721, 'loss/train': 1.7631014585494995} -08/30/2021 15:35:20 - INFO - __main__ - Step 13723: {'lr': 0.000492300759086739, 'samples': 2634816, 'steps': 13722, 'loss/train': 2.193504571914673} -08/30/2021 15:35:22 - INFO - __main__ - Step 13724: {'lr': 0.0004922994521772687, 'samples': 2635008, 'steps': 13723, 'loss/train': 2.0830652713775635} -08/30/2021 15:35:22 - INFO - __main__ - Step 13725: {'lr': 0.000492298145158622, 'samples': 2635200, 'steps': 13724, 'loss/train': 2.2276597023010254} -08/30/2021 15:35:23 - INFO - __main__ - Step 13726: {'lr': 0.0004922968380307994, 'samples': 2635392, 'steps': 13725, 'loss/train': 2.376321315765381} -08/30/2021 15:35:23 - INFO - __main__ - Step 13727: {'lr': 0.0004922955307938016, 'samples': 2635584, 'steps': 13726, 'loss/train': 1.9856606721878052} -08/30/2021 15:35:23 - INFO - __main__ - Step 13728: {'lr': 0.0004922942234476292, 'samples': 2635776, 'steps': 13727, 'loss/train': 2.001293420791626} -08/30/2021 15:35:25 - INFO - __main__ - Step 13729: {'lr': 0.0004922929159922828, 'samples': 2635968, 'steps': 13728, 'loss/train': 1.4641457796096802} -08/30/2021 15:35:25 - INFO - __main__ - Step 13730: {'lr': 0.0004922916084277629, 'samples': 2636160, 'steps': 13729, 'loss/train': 2.233157157897949} -08/30/2021 15:35:26 - INFO - __main__ - Step 13731: {'lr': 0.0004922903007540701, 'samples': 2636352, 'steps': 13730, 'loss/train': 1.1955019235610962} -08/30/2021 15:35:26 - INFO - __main__ - Step 13732: {'lr': 0.0004922889929712051, 'samples': 2636544, 'steps': 13731, 'loss/train': 2.0497384071350098} -08/30/2021 15:35:26 - INFO - __main__ - Step 13733: {'lr': 0.0004922876850791684, 'samples': 2636736, 'steps': 13732, 'loss/train': 1.1751309633255005} -08/30/2021 15:35:28 - INFO - __main__ - Step 13734: {'lr': 0.0004922863770779606, 'samples': 2636928, 'steps': 13733, 'loss/train': 1.266606092453003} -08/30/2021 15:35:28 - INFO - __main__ - Step 13735: {'lr': 0.0004922850689675823, 'samples': 2637120, 'steps': 13734, 'loss/train': 2.1586008071899414} -08/30/2021 15:35:29 - INFO - __main__ - Step 13736: {'lr': 0.0004922837607480341, 'samples': 2637312, 'steps': 13735, 'loss/train': 1.6889420747756958} -08/30/2021 15:35:29 - INFO - __main__ - Step 13737: {'lr': 0.0004922824524193166, 'samples': 2637504, 'steps': 13736, 'loss/train': 0.9684352278709412} -08/30/2021 15:35:29 - INFO - __main__ - Step 13738: {'lr': 0.0004922811439814303, 'samples': 2637696, 'steps': 13737, 'loss/train': 2.1781835556030273} -08/30/2021 15:35:30 - INFO - __main__ - Step 13739: {'lr': 0.0004922798354343758, 'samples': 2637888, 'steps': 13738, 'loss/train': 1.8887906074523926} -08/30/2021 15:35:32 - INFO - __main__ - Step 13740: {'lr': 0.0004922785267781539, 'samples': 2638080, 'steps': 13739, 'loss/train': 1.4249500036239624} -08/30/2021 15:35:32 - INFO - __main__ - Step 13741: {'lr': 0.000492277218012765, 'samples': 2638272, 'steps': 13740, 'loss/train': 1.7357696294784546} -08/30/2021 15:35:32 - INFO - __main__ - Step 13742: {'lr': 0.0004922759091382097, 'samples': 2638464, 'steps': 13741, 'loss/train': 1.5921028852462769} -08/30/2021 15:35:33 - INFO - __main__ - Step 13743: {'lr': 0.0004922746001544885, 'samples': 2638656, 'steps': 13742, 'loss/train': 1.498734474182129} -08/30/2021 15:35:33 - INFO - __main__ - Step 13744: {'lr': 0.0004922732910616023, 'samples': 2638848, 'steps': 13743, 'loss/train': 1.9081112146377563} -08/30/2021 15:35:33 - INFO - __main__ - Step 13745: {'lr': 0.0004922719818595514, 'samples': 2639040, 'steps': 13744, 'loss/train': 1.339704990386963} -08/30/2021 15:35:35 - INFO - __main__ - Step 13746: {'lr': 0.0004922706725483364, 'samples': 2639232, 'steps': 13745, 'loss/train': 2.2559444904327393} -08/30/2021 15:35:35 - INFO - __main__ - Step 13747: {'lr': 0.0004922693631279581, 'samples': 2639424, 'steps': 13746, 'loss/train': 1.1486022472381592} -08/30/2021 15:35:36 - INFO - __main__ - Step 13748: {'lr': 0.000492268053598417, 'samples': 2639616, 'steps': 13747, 'loss/train': 1.211904764175415} -08/30/2021 15:35:36 - INFO - __main__ - Step 13749: {'lr': 0.0004922667439597136, 'samples': 2639808, 'steps': 13748, 'loss/train': 1.418578863143921} -08/30/2021 15:35:36 - INFO - __main__ - Step 13750: {'lr': 0.0004922654342118484, 'samples': 2640000, 'steps': 13749, 'loss/train': 1.3844101428985596} -08/30/2021 15:35:38 - INFO - __main__ - Step 13751: {'lr': 0.0004922641243548223, 'samples': 2640192, 'steps': 13750, 'loss/train': 1.8498740196228027} -08/30/2021 15:35:38 - INFO - __main__ - Step 13752: {'lr': 0.0004922628143886358, 'samples': 2640384, 'steps': 13751, 'loss/train': 1.6858294010162354} -08/30/2021 15:35:39 - INFO - __main__ - Step 13753: {'lr': 0.0004922615043132892, 'samples': 2640576, 'steps': 13752, 'loss/train': 1.8434538841247559} -08/30/2021 15:35:39 - INFO - __main__ - Step 13754: {'lr': 0.0004922601941287835, 'samples': 2640768, 'steps': 13753, 'loss/train': 0.7334967851638794} -08/30/2021 15:35:39 - INFO - __main__ - Step 13755: {'lr': 0.0004922588838351189, 'samples': 2640960, 'steps': 13754, 'loss/train': 1.306587815284729} -08/30/2021 15:35:41 - INFO - __main__ - Step 13756: {'lr': 0.0004922575734322963, 'samples': 2641152, 'steps': 13755, 'loss/train': 2.007366180419922} -08/30/2021 15:35:41 - INFO - __main__ - Step 13757: {'lr': 0.0004922562629203161, 'samples': 2641344, 'steps': 13756, 'loss/train': 2.00295090675354} -08/30/2021 15:35:42 - INFO - __main__ - Step 13758: {'lr': 0.0004922549522991791, 'samples': 2641536, 'steps': 13757, 'loss/train': 1.7510627508163452} -08/30/2021 15:35:42 - INFO - __main__ - Step 13759: {'lr': 0.0004922536415688856, 'samples': 2641728, 'steps': 13758, 'loss/train': 1.7219719886779785} -08/30/2021 15:35:43 - INFO - __main__ - Step 13760: {'lr': 0.0004922523307294364, 'samples': 2641920, 'steps': 13759, 'loss/train': 0.19753147661685944} -08/30/2021 15:35:44 - INFO - __main__ - Step 13761: {'lr': 0.0004922510197808321, 'samples': 2642112, 'steps': 13760, 'loss/train': 1.529544472694397} -08/30/2021 15:35:44 - INFO - __main__ - Step 13762: {'lr': 0.0004922497087230732, 'samples': 2642304, 'steps': 13761, 'loss/train': 1.213055968284607} -08/30/2021 15:35:45 - INFO - __main__ - Step 13763: {'lr': 0.0004922483975561603, 'samples': 2642496, 'steps': 13762, 'loss/train': 2.152477502822876} -08/30/2021 15:35:45 - INFO - __main__ - Step 13764: {'lr': 0.000492247086280094, 'samples': 2642688, 'steps': 13763, 'loss/train': 2.0268726348876953} -08/30/2021 15:35:45 - INFO - __main__ - Step 13765: {'lr': 0.0004922457748948749, 'samples': 2642880, 'steps': 13764, 'loss/train': 2.165783166885376} -08/30/2021 15:35:47 - INFO - __main__ - Step 13766: {'lr': 0.0004922444634005037, 'samples': 2643072, 'steps': 13765, 'loss/train': 2.0102698802948} -08/30/2021 15:35:47 - INFO - __main__ - Step 13767: {'lr': 0.0004922431517969808, 'samples': 2643264, 'steps': 13766, 'loss/train': 1.9530229568481445} -08/30/2021 15:35:48 - INFO - __main__ - Step 13768: {'lr': 0.0004922418400843068, 'samples': 2643456, 'steps': 13767, 'loss/train': 1.5066810846328735} -08/30/2021 15:35:48 - INFO - __main__ - Step 13769: {'lr': 0.0004922405282624825, 'samples': 2643648, 'steps': 13768, 'loss/train': 1.6222310066223145} -08/30/2021 15:35:48 - INFO - __main__ - Step 13770: {'lr': 0.0004922392163315083, 'samples': 2643840, 'steps': 13769, 'loss/train': 1.7509607076644897} -08/30/2021 15:35:50 - INFO - __main__ - Step 13771: {'lr': 0.0004922379042913848, 'samples': 2644032, 'steps': 13770, 'loss/train': 1.8124586343765259} -08/30/2021 15:35:50 - INFO - __main__ - Step 13772: {'lr': 0.0004922365921421126, 'samples': 2644224, 'steps': 13771, 'loss/train': 1.820056676864624} -08/30/2021 15:35:51 - INFO - __main__ - Step 13773: {'lr': 0.0004922352798836924, 'samples': 2644416, 'steps': 13772, 'loss/train': 1.8008754253387451} -08/30/2021 15:35:51 - INFO - __main__ - Step 13774: {'lr': 0.0004922339675161248, 'samples': 2644608, 'steps': 13773, 'loss/train': 1.695332646369934} -08/30/2021 15:35:51 - INFO - __main__ - Step 13775: {'lr': 0.0004922326550394102, 'samples': 2644800, 'steps': 13774, 'loss/train': 1.359049916267395} -08/30/2021 15:35:54 - INFO - __main__ - Step 13776: {'lr': 0.0004922313424535494, 'samples': 2644992, 'steps': 13775, 'loss/train': 1.735809326171875} -08/30/2021 15:35:55 - INFO - __main__ - Step 13777: {'lr': 0.0004922300297585428, 'samples': 2645184, 'steps': 13776, 'loss/train': 1.83517587184906} -08/30/2021 15:35:55 - INFO - __main__ - Step 13778: {'lr': 0.0004922287169543911, 'samples': 2645376, 'steps': 13777, 'loss/train': 1.6809149980545044} -08/30/2021 15:35:55 - INFO - __main__ - Step 13779: {'lr': 0.0004922274040410949, 'samples': 2645568, 'steps': 13778, 'loss/train': 0.24220360815525055} -08/30/2021 15:35:56 - INFO - __main__ - Step 13780: {'lr': 0.0004922260910186548, 'samples': 2645760, 'steps': 13779, 'loss/train': 0.3392987847328186} -08/30/2021 15:35:57 - INFO - __main__ - Step 13781: {'lr': 0.0004922247778870714, 'samples': 2645952, 'steps': 13780, 'loss/train': 2.3549277782440186} -08/30/2021 15:35:58 - INFO - __main__ - Step 13782: {'lr': 0.0004922234646463451, 'samples': 2646144, 'steps': 13781, 'loss/train': 1.7731692790985107} -08/30/2021 15:35:58 - INFO - __main__ - Step 13783: {'lr': 0.0004922221512964767, 'samples': 2646336, 'steps': 13782, 'loss/train': 2.125839948654175} -08/30/2021 15:35:59 - INFO - __main__ - Step 13784: {'lr': 0.0004922208378374668, 'samples': 2646528, 'steps': 13783, 'loss/train': 1.2620468139648438} -08/30/2021 15:35:59 - INFO - __main__ - Step 13785: {'lr': 0.0004922195242693159, 'samples': 2646720, 'steps': 13784, 'loss/train': 0.20281535387039185} -08/30/2021 15:35:59 - INFO - __main__ - Step 13786: {'lr': 0.0004922182105920246, 'samples': 2646912, 'steps': 13785, 'loss/train': 0.11585058271884918} -08/30/2021 15:36:01 - INFO - __main__ - Step 13787: {'lr': 0.0004922168968055935, 'samples': 2647104, 'steps': 13786, 'loss/train': 1.6856178045272827} -08/30/2021 15:36:01 - INFO - __main__ - Step 13788: {'lr': 0.0004922155829100233, 'samples': 2647296, 'steps': 13787, 'loss/train': 1.5219813585281372} -08/30/2021 15:36:02 - INFO - __main__ - Step 13789: {'lr': 0.0004922142689053144, 'samples': 2647488, 'steps': 13788, 'loss/train': 1.7836838960647583} -08/30/2021 15:36:02 - INFO - __main__ - Step 13790: {'lr': 0.0004922129547914675, 'samples': 2647680, 'steps': 13789, 'loss/train': 1.9570887088775635} -08/30/2021 15:36:03 - INFO - __main__ - Step 13791: {'lr': 0.0004922116405684832, 'samples': 2647872, 'steps': 13790, 'loss/train': 1.0402331352233887} -08/30/2021 15:36:04 - INFO - __main__ - Step 13792: {'lr': 0.0004922103262363621, 'samples': 2648064, 'steps': 13791, 'loss/train': 1.649842381477356} -08/30/2021 15:36:05 - INFO - __main__ - Step 13793: {'lr': 0.0004922090117951047, 'samples': 2648256, 'steps': 13792, 'loss/train': 0.8131370544433594} -08/30/2021 15:36:05 - INFO - __main__ - Step 13794: {'lr': 0.0004922076972447117, 'samples': 2648448, 'steps': 13793, 'loss/train': 2.0038375854492188} -08/30/2021 15:36:05 - INFO - __main__ - Step 13795: {'lr': 0.0004922063825851836, 'samples': 2648640, 'steps': 13794, 'loss/train': 1.4933514595031738} -08/30/2021 15:36:06 - INFO - __main__ - Step 13796: {'lr': 0.0004922050678165211, 'samples': 2648832, 'steps': 13795, 'loss/train': 1.5484554767608643} -08/30/2021 15:36:06 - INFO - __main__ - Step 13797: {'lr': 0.0004922037529387247, 'samples': 2649024, 'steps': 13796, 'loss/train': 1.4274927377700806} -08/30/2021 15:36:08 - INFO - __main__ - Step 13798: {'lr': 0.000492202437951795, 'samples': 2649216, 'steps': 13797, 'loss/train': 1.2743474245071411} -08/30/2021 15:36:08 - INFO - __main__ - Step 13799: {'lr': 0.0004922011228557327, 'samples': 2649408, 'steps': 13798, 'loss/train': 1.3631792068481445} -08/30/2021 15:36:08 - INFO - __main__ - Step 13800: {'lr': 0.0004921998076505383, 'samples': 2649600, 'steps': 13799, 'loss/train': 1.6608229875564575} -08/30/2021 15:36:09 - INFO - __main__ - Step 13801: {'lr': 0.0004921984923362124, 'samples': 2649792, 'steps': 13800, 'loss/train': 0.8246711492538452} -08/30/2021 15:36:09 - INFO - __main__ - Step 13802: {'lr': 0.0004921971769127555, 'samples': 2649984, 'steps': 13801, 'loss/train': 1.6632049083709717} -08/30/2021 15:36:11 - INFO - __main__ - Step 13803: {'lr': 0.0004921958613801683, 'samples': 2650176, 'steps': 13802, 'loss/train': 0.21885547041893005} -08/30/2021 15:36:11 - INFO - __main__ - Step 13804: {'lr': 0.0004921945457384516, 'samples': 2650368, 'steps': 13803, 'loss/train': 0.9048483967781067} -08/30/2021 15:36:11 - INFO - __main__ - Step 13805: {'lr': 0.0004921932299876055, 'samples': 2650560, 'steps': 13804, 'loss/train': 1.8860636949539185} -08/30/2021 15:36:12 - INFO - __main__ - Step 13806: {'lr': 0.000492191914127631, 'samples': 2650752, 'steps': 13805, 'loss/train': 1.522040605545044} -08/30/2021 15:36:12 - INFO - __main__ - Step 13807: {'lr': 0.0004921905981585286, 'samples': 2650944, 'steps': 13806, 'loss/train': 1.6715176105499268} -08/30/2021 15:36:14 - INFO - __main__ - Step 13808: {'lr': 0.0004921892820802988, 'samples': 2651136, 'steps': 13807, 'loss/train': 2.209564685821533} -08/30/2021 15:36:14 - INFO - __main__ - Step 13809: {'lr': 0.0004921879658929422, 'samples': 2651328, 'steps': 13808, 'loss/train': 1.5849223136901855} -08/30/2021 15:36:14 - INFO - __main__ - Step 13810: {'lr': 0.0004921866495964594, 'samples': 2651520, 'steps': 13809, 'loss/train': 1.9061890840530396} -08/30/2021 15:36:15 - INFO - __main__ - Step 13811: {'lr': 0.0004921853331908512, 'samples': 2651712, 'steps': 13810, 'loss/train': 1.5075124502182007} -08/30/2021 15:36:15 - INFO - __main__ - Step 13812: {'lr': 0.000492184016676118, 'samples': 2651904, 'steps': 13811, 'loss/train': 1.7688640356063843} -08/30/2021 15:36:17 - INFO - __main__ - Step 13813: {'lr': 0.0004921827000522603, 'samples': 2652096, 'steps': 13812, 'loss/train': 1.7393929958343506} -08/30/2021 15:36:17 - INFO - __main__ - Step 13814: {'lr': 0.0004921813833192788, 'samples': 2652288, 'steps': 13813, 'loss/train': 1.659746766090393} -08/30/2021 15:36:17 - INFO - __main__ - Step 13815: {'lr': 0.0004921800664771743, 'samples': 2652480, 'steps': 13814, 'loss/train': 1.9074373245239258} -08/30/2021 15:36:18 - INFO - __main__ - Step 13816: {'lr': 0.0004921787495259471, 'samples': 2652672, 'steps': 13815, 'loss/train': 1.6964482069015503} -08/30/2021 15:36:18 - INFO - __main__ - Step 13817: {'lr': 0.0004921774324655978, 'samples': 2652864, 'steps': 13816, 'loss/train': 1.5799070596694946} -08/30/2021 15:36:19 - INFO - __main__ - Step 13818: {'lr': 0.0004921761152961271, 'samples': 2653056, 'steps': 13817, 'loss/train': 2.1930577754974365} -08/30/2021 15:36:20 - INFO - __main__ - Step 13819: {'lr': 0.0004921747980175357, 'samples': 2653248, 'steps': 13818, 'loss/train': 1.612560510635376} -08/30/2021 15:36:20 - INFO - __main__ - Step 13820: {'lr': 0.0004921734806298241, 'samples': 2653440, 'steps': 13819, 'loss/train': 1.8078802824020386} -08/30/2021 15:36:21 - INFO - __main__ - Step 13821: {'lr': 0.0004921721631329927, 'samples': 2653632, 'steps': 13820, 'loss/train': 1.85303795337677} -08/30/2021 15:36:21 - INFO - __main__ - Step 13822: {'lr': 0.0004921708455270424, 'samples': 2653824, 'steps': 13821, 'loss/train': 1.341817855834961} -08/30/2021 15:36:21 - INFO - __main__ - Step 13823: {'lr': 0.0004921695278119736, 'samples': 2654016, 'steps': 13822, 'loss/train': 1.5608800649642944} -08/30/2021 15:36:23 - INFO - __main__ - Step 13824: {'lr': 0.0004921682099877869, 'samples': 2654208, 'steps': 13823, 'loss/train': 1.3948137760162354} -08/30/2021 15:36:23 - INFO - __main__ - Step 13825: {'lr': 0.000492166892054483, 'samples': 2654400, 'steps': 13824, 'loss/train': 1.2661569118499756} -08/30/2021 15:36:24 - INFO - __main__ - Step 13826: {'lr': 0.0004921655740120623, 'samples': 2654592, 'steps': 13825, 'loss/train': 1.4389091730117798} -08/30/2021 15:36:24 - INFO - __main__ - Step 13827: {'lr': 0.0004921642558605257, 'samples': 2654784, 'steps': 13826, 'loss/train': 0.37669238448143005} -08/30/2021 15:36:25 - INFO - __main__ - Step 13828: {'lr': 0.0004921629375998736, 'samples': 2654976, 'steps': 13827, 'loss/train': 0.6892330050468445} -08/30/2021 15:36:26 - INFO - __main__ - Step 13829: {'lr': 0.0004921616192301065, 'samples': 2655168, 'steps': 13828, 'loss/train': 1.7391256093978882} -08/30/2021 15:36:27 - INFO - __main__ - Step 13830: {'lr': 0.0004921603007512253, 'samples': 2655360, 'steps': 13829, 'loss/train': 2.2470057010650635} -08/30/2021 15:36:27 - INFO - __main__ - Step 13831: {'lr': 0.0004921589821632302, 'samples': 2655552, 'steps': 13830, 'loss/train': 2.3947322368621826} -08/30/2021 15:36:27 - INFO - __main__ - Step 13832: {'lr': 0.0004921576634661221, 'samples': 2655744, 'steps': 13831, 'loss/train': 1.621037483215332} -08/30/2021 15:36:28 - INFO - __main__ - Step 13833: {'lr': 0.0004921563446599015, 'samples': 2655936, 'steps': 13832, 'loss/train': 0.7523802518844604} -08/30/2021 15:36:30 - INFO - __main__ - Step 13834: {'lr': 0.000492155025744569, 'samples': 2656128, 'steps': 13833, 'loss/train': 1.4243792295455933} -08/30/2021 15:36:31 - INFO - __main__ - Step 13835: {'lr': 0.0004921537067201252, 'samples': 2656320, 'steps': 13834, 'loss/train': 1.2156262397766113} -08/30/2021 15:36:31 - INFO - __main__ - Step 13836: {'lr': 0.0004921523875865706, 'samples': 2656512, 'steps': 13835, 'loss/train': 1.4866888523101807} -08/30/2021 15:36:31 - INFO - __main__ - Step 13837: {'lr': 0.000492151068343906, 'samples': 2656704, 'steps': 13836, 'loss/train': 1.5981640815734863} -08/30/2021 15:36:32 - INFO - __main__ - Step 13838: {'lr': 0.0004921497489921318, 'samples': 2656896, 'steps': 13837, 'loss/train': 1.5347036123275757} -08/30/2021 15:36:33 - INFO - __main__ - Step 13839: {'lr': 0.0004921484295312485, 'samples': 2657088, 'steps': 13838, 'loss/train': 2.1072139739990234} -08/30/2021 15:36:33 - INFO - __main__ - Step 13840: {'lr': 0.0004921471099612571, 'samples': 2657280, 'steps': 13839, 'loss/train': 1.8525291681289673} -08/30/2021 15:36:34 - INFO - __main__ - Step 13841: {'lr': 0.0004921457902821578, 'samples': 2657472, 'steps': 13840, 'loss/train': 1.9629462957382202} -08/30/2021 15:36:34 - INFO - __main__ - Step 13842: {'lr': 0.0004921444704939514, 'samples': 2657664, 'steps': 13841, 'loss/train': 1.8306949138641357} -08/30/2021 15:36:34 - INFO - __main__ - Step 13843: {'lr': 0.0004921431505966384, 'samples': 2657856, 'steps': 13842, 'loss/train': 1.860345482826233} -08/30/2021 15:36:36 - INFO - __main__ - Step 13844: {'lr': 0.0004921418305902194, 'samples': 2658048, 'steps': 13843, 'loss/train': 0.7579705715179443} -08/30/2021 15:36:36 - INFO - __main__ - Step 13845: {'lr': 0.0004921405104746951, 'samples': 2658240, 'steps': 13844, 'loss/train': 1.740308165550232} -08/30/2021 15:36:37 - INFO - __main__ - Step 13846: {'lr': 0.0004921391902500661, 'samples': 2658432, 'steps': 13845, 'loss/train': 2.0427796840667725} -08/30/2021 15:36:37 - INFO - __main__ - Step 13847: {'lr': 0.0004921378699163328, 'samples': 2658624, 'steps': 13846, 'loss/train': 1.9733552932739258} -08/30/2021 15:36:37 - INFO - __main__ - Step 13848: {'lr': 0.0004921365494734959, 'samples': 2658816, 'steps': 13847, 'loss/train': 1.2051162719726562} -08/30/2021 15:36:39 - INFO - __main__ - Step 13849: {'lr': 0.0004921352289215561, 'samples': 2659008, 'steps': 13848, 'loss/train': 1.9503183364868164} -08/30/2021 15:36:40 - INFO - __main__ - Step 13850: {'lr': 0.0004921339082605137, 'samples': 2659200, 'steps': 13849, 'loss/train': 0.5631958842277527} -08/30/2021 15:36:40 - INFO - __main__ - Step 13851: {'lr': 0.0004921325874903697, 'samples': 2659392, 'steps': 13850, 'loss/train': 3.191243886947632} -08/30/2021 15:36:40 - INFO - __main__ - Step 13852: {'lr': 0.0004921312666111245, 'samples': 2659584, 'steps': 13851, 'loss/train': 1.1803581714630127} -08/30/2021 15:36:41 - INFO - __main__ - Step 13853: {'lr': 0.0004921299456227785, 'samples': 2659776, 'steps': 13852, 'loss/train': 2.2592413425445557} -08/30/2021 15:36:41 - INFO - __main__ - Step 13854: {'lr': 0.0004921286245253327, 'samples': 2659968, 'steps': 13853, 'loss/train': 1.7450721263885498} -08/30/2021 15:36:43 - INFO - __main__ - Step 13855: {'lr': 0.0004921273033187874, 'samples': 2660160, 'steps': 13854, 'loss/train': 2.659731388092041} -08/30/2021 15:36:43 - INFO - __main__ - Step 13856: {'lr': 0.0004921259820031431, 'samples': 2660352, 'steps': 13855, 'loss/train': 1.5547701120376587} -08/30/2021 15:36:43 - INFO - __main__ - Step 13857: {'lr': 0.0004921246605784008, 'samples': 2660544, 'steps': 13856, 'loss/train': 1.8264232873916626} -08/30/2021 15:36:44 - INFO - __main__ - Step 13858: {'lr': 0.0004921233390445608, 'samples': 2660736, 'steps': 13857, 'loss/train': 1.5676571130752563} -08/30/2021 15:36:44 - INFO - __main__ - Step 13859: {'lr': 0.0004921220174016238, 'samples': 2660928, 'steps': 13858, 'loss/train': 2.17057728767395} -08/30/2021 15:36:46 - INFO - __main__ - Step 13860: {'lr': 0.0004921206956495903, 'samples': 2661120, 'steps': 13859, 'loss/train': 1.4273568391799927} -08/30/2021 15:36:46 - INFO - __main__ - Step 13861: {'lr': 0.000492119373788461, 'samples': 2661312, 'steps': 13860, 'loss/train': 1.8180774450302124} -08/30/2021 15:36:46 - INFO - __main__ - Step 13862: {'lr': 0.0004921180518182363, 'samples': 2661504, 'steps': 13861, 'loss/train': 1.031244158744812} -08/30/2021 15:36:47 - INFO - __main__ - Step 13863: {'lr': 0.0004921167297389171, 'samples': 2661696, 'steps': 13862, 'loss/train': 1.8788319826126099} -08/30/2021 15:36:47 - INFO - __main__ - Step 13864: {'lr': 0.0004921154075505038, 'samples': 2661888, 'steps': 13863, 'loss/train': 1.8196581602096558} -08/30/2021 15:36:49 - INFO - __main__ - Step 13865: {'lr': 0.0004921140852529969, 'samples': 2662080, 'steps': 13864, 'loss/train': 1.7515127658843994} -08/30/2021 15:36:49 - INFO - __main__ - Step 13866: {'lr': 0.0004921127628463972, 'samples': 2662272, 'steps': 13865, 'loss/train': 1.7796953916549683} -08/30/2021 15:36:50 - INFO - __main__ - Step 13867: {'lr': 0.0004921114403307053, 'samples': 2662464, 'steps': 13866, 'loss/train': 0.07805261760950089} -08/30/2021 15:36:50 - INFO - __main__ - Step 13868: {'lr': 0.0004921101177059218, 'samples': 2662656, 'steps': 13867, 'loss/train': 1.6172711849212646} -08/30/2021 15:36:50 - INFO - __main__ - Step 13869: {'lr': 0.0004921087949720471, 'samples': 2662848, 'steps': 13868, 'loss/train': 1.4609322547912598} -08/30/2021 15:36:51 - INFO - __main__ - Step 13870: {'lr': 0.0004921074721290819, 'samples': 2663040, 'steps': 13869, 'loss/train': 1.6962738037109375} -08/30/2021 15:36:52 - INFO - __main__ - Step 13871: {'lr': 0.0004921061491770268, 'samples': 2663232, 'steps': 13870, 'loss/train': 2.0180251598358154} -08/30/2021 15:36:53 - INFO - __main__ - Step 13872: {'lr': 0.0004921048261158825, 'samples': 2663424, 'steps': 13871, 'loss/train': 1.196499228477478} -08/30/2021 15:36:53 - INFO - __main__ - Step 13873: {'lr': 0.0004921035029456493, 'samples': 2663616, 'steps': 13872, 'loss/train': 1.5539485216140747} -08/30/2021 15:36:53 - INFO - __main__ - Step 13874: {'lr': 0.0004921021796663282, 'samples': 2663808, 'steps': 13873, 'loss/train': 1.5859588384628296} -08/30/2021 15:36:54 - INFO - __main__ - Step 13875: {'lr': 0.0004921008562779195, 'samples': 2664000, 'steps': 13874, 'loss/train': 2.119206190109253} -08/30/2021 15:36:55 - INFO - __main__ - Step 13876: {'lr': 0.0004920995327804239, 'samples': 2664192, 'steps': 13875, 'loss/train': 1.698654294013977} -08/30/2021 15:36:56 - INFO - __main__ - Step 13877: {'lr': 0.000492098209173842, 'samples': 2664384, 'steps': 13876, 'loss/train': 1.9036214351654053} -08/30/2021 15:36:56 - INFO - __main__ - Step 13878: {'lr': 0.0004920968854581745, 'samples': 2664576, 'steps': 13877, 'loss/train': 1.3836435079574585} -08/30/2021 15:36:56 - INFO - __main__ - Step 13879: {'lr': 0.0004920955616334216, 'samples': 2664768, 'steps': 13878, 'loss/train': 1.2148957252502441} -08/30/2021 15:36:57 - INFO - __main__ - Step 13880: {'lr': 0.0004920942376995844, 'samples': 2664960, 'steps': 13879, 'loss/train': 1.7520737648010254} -08/30/2021 15:36:58 - INFO - __main__ - Step 13881: {'lr': 0.0004920929136566632, 'samples': 2665152, 'steps': 13880, 'loss/train': 1.4705777168273926} -08/30/2021 15:36:59 - INFO - __main__ - Step 13882: {'lr': 0.0004920915895046587, 'samples': 2665344, 'steps': 13881, 'loss/train': 1.2839056253433228} -08/30/2021 15:36:59 - INFO - __main__ - Step 13883: {'lr': 0.0004920902652435715, 'samples': 2665536, 'steps': 13882, 'loss/train': 1.5503829717636108} -08/30/2021 15:36:59 - INFO - __main__ - Step 13884: {'lr': 0.0004920889408734021, 'samples': 2665728, 'steps': 13883, 'loss/train': 2.0199179649353027} -08/30/2021 15:37:00 - INFO - __main__ - Step 13885: {'lr': 0.0004920876163941511, 'samples': 2665920, 'steps': 13884, 'loss/train': 1.7413121461868286} -08/30/2021 15:37:02 - INFO - __main__ - Step 13886: {'lr': 0.0004920862918058192, 'samples': 2666112, 'steps': 13885, 'loss/train': 1.861501693725586} -08/30/2021 15:37:02 - INFO - __main__ - Step 13887: {'lr': 0.000492084967108407, 'samples': 2666304, 'steps': 13886, 'loss/train': 1.5949935913085938} -08/30/2021 15:37:03 - INFO - __main__ - Step 13888: {'lr': 0.000492083642301915, 'samples': 2666496, 'steps': 13887, 'loss/train': 2.0910377502441406} -08/30/2021 15:37:03 - INFO - __main__ - Step 13889: {'lr': 0.0004920823173863439, 'samples': 2666688, 'steps': 13888, 'loss/train': 0.0696505680680275} -08/30/2021 15:37:04 - INFO - __main__ - Step 13890: {'lr': 0.0004920809923616942, 'samples': 2666880, 'steps': 13889, 'loss/train': 0.8083196878433228} -08/30/2021 15:37:04 - INFO - __main__ - Step 13891: {'lr': 0.0004920796672279666, 'samples': 2667072, 'steps': 13890, 'loss/train': 1.207556128501892} -08/30/2021 15:37:05 - INFO - __main__ - Step 13892: {'lr': 0.0004920783419851615, 'samples': 2667264, 'steps': 13891, 'loss/train': 1.9331567287445068} -08/30/2021 15:37:06 - INFO - __main__ - Step 13893: {'lr': 0.0004920770166332798, 'samples': 2667456, 'steps': 13892, 'loss/train': 1.6196753978729248} -08/30/2021 15:37:06 - INFO - __main__ - Step 13894: {'lr': 0.0004920756911723219, 'samples': 2667648, 'steps': 13893, 'loss/train': 1.9326804876327515} -08/30/2021 15:37:06 - INFO - __main__ - Step 13895: {'lr': 0.0004920743656022884, 'samples': 2667840, 'steps': 13894, 'loss/train': 1.6578922271728516} -08/30/2021 15:37:07 - INFO - __main__ - Step 13896: {'lr': 0.0004920730399231799, 'samples': 2668032, 'steps': 13895, 'loss/train': 1.6116663217544556} -08/30/2021 15:37:07 - INFO - __main__ - Step 13897: {'lr': 0.000492071714134997, 'samples': 2668224, 'steps': 13896, 'loss/train': 1.697620153427124} -08/30/2021 15:37:09 - INFO - __main__ - Step 13898: {'lr': 0.0004920703882377403, 'samples': 2668416, 'steps': 13897, 'loss/train': 1.84322190284729} -08/30/2021 15:37:09 - INFO - __main__ - Step 13899: {'lr': 0.0004920690622314105, 'samples': 2668608, 'steps': 13898, 'loss/train': 2.862149953842163} -08/30/2021 15:37:10 - INFO - __main__ - Step 13900: {'lr': 0.0004920677361160081, 'samples': 2668800, 'steps': 13899, 'loss/train': 1.6132988929748535} -08/30/2021 15:37:10 - INFO - __main__ - Step 13901: {'lr': 0.0004920664098915337, 'samples': 2668992, 'steps': 13900, 'loss/train': 0.9476858377456665} -08/30/2021 15:37:10 - INFO - __main__ - Step 13902: {'lr': 0.000492065083557988, 'samples': 2669184, 'steps': 13901, 'loss/train': 1.6156305074691772} -08/30/2021 15:37:12 - INFO - __main__ - Step 13903: {'lr': 0.0004920637571153713, 'samples': 2669376, 'steps': 13902, 'loss/train': 1.4620449542999268} -08/30/2021 15:37:12 - INFO - __main__ - Step 13904: {'lr': 0.0004920624305636846, 'samples': 2669568, 'steps': 13903, 'loss/train': 1.3141453266143799} -08/30/2021 15:37:12 - INFO - __main__ - Step 13905: {'lr': 0.0004920611039029283, 'samples': 2669760, 'steps': 13904, 'loss/train': 0.782860279083252} -08/30/2021 15:37:13 - INFO - __main__ - Step 13906: {'lr': 0.0004920597771331029, 'samples': 2669952, 'steps': 13905, 'loss/train': 2.0047669410705566} -08/30/2021 15:37:13 - INFO - __main__ - Step 13907: {'lr': 0.0004920584502542091, 'samples': 2670144, 'steps': 13906, 'loss/train': 1.9071727991104126} -08/30/2021 15:37:15 - INFO - __main__ - Step 13908: {'lr': 0.0004920571232662475, 'samples': 2670336, 'steps': 13907, 'loss/train': 3.6241841316223145} -08/30/2021 15:37:15 - INFO - __main__ - Step 13909: {'lr': 0.0004920557961692188, 'samples': 2670528, 'steps': 13908, 'loss/train': 1.6944514513015747} -08/30/2021 15:37:15 - INFO - __main__ - Step 13910: {'lr': 0.0004920544689631233, 'samples': 2670720, 'steps': 13909, 'loss/train': 1.308904767036438} -08/30/2021 15:37:16 - INFO - __main__ - Step 13911: {'lr': 0.000492053141647962, 'samples': 2670912, 'steps': 13910, 'loss/train': 1.8157734870910645} -08/30/2021 15:37:16 - INFO - __main__ - Step 13912: {'lr': 0.0004920518142237352, 'samples': 2671104, 'steps': 13911, 'loss/train': 2.1475274562835693} -08/30/2021 15:37:18 - INFO - __main__ - Step 13913: {'lr': 0.0004920504866904436, 'samples': 2671296, 'steps': 13912, 'loss/train': 1.5949275493621826} -08/30/2021 15:37:18 - INFO - __main__ - Step 13914: {'lr': 0.0004920491590480878, 'samples': 2671488, 'steps': 13913, 'loss/train': 1.5115959644317627} -08/30/2021 15:37:19 - INFO - __main__ - Step 13915: {'lr': 0.0004920478312966683, 'samples': 2671680, 'steps': 13914, 'loss/train': 1.5728046894073486} -08/30/2021 15:37:19 - INFO - __main__ - Step 13916: {'lr': 0.0004920465034361859, 'samples': 2671872, 'steps': 13915, 'loss/train': 1.8880095481872559} -08/30/2021 15:37:19 - INFO - __main__ - Step 13917: {'lr': 0.000492045175466641, 'samples': 2672064, 'steps': 13916, 'loss/train': 1.8674532175064087} -08/30/2021 15:37:21 - INFO - __main__ - Step 13918: {'lr': 0.0004920438473880344, 'samples': 2672256, 'steps': 13917, 'loss/train': 1.7776989936828613} -08/30/2021 15:37:21 - INFO - __main__ - Step 13919: {'lr': 0.0004920425192003663, 'samples': 2672448, 'steps': 13918, 'loss/train': 1.404813528060913} -08/30/2021 15:37:22 - INFO - __main__ - Step 13920: {'lr': 0.0004920411909036379, 'samples': 2672640, 'steps': 13919, 'loss/train': 1.480295181274414} -08/30/2021 15:37:22 - INFO - __main__ - Step 13921: {'lr': 0.0004920398624978493, 'samples': 2672832, 'steps': 13920, 'loss/train': 1.4315030574798584} -08/30/2021 15:37:22 - INFO - __main__ - Step 13922: {'lr': 0.0004920385339830012, 'samples': 2673024, 'steps': 13921, 'loss/train': 1.4261845350265503} -08/30/2021 15:37:23 - INFO - __main__ - Step 13923: {'lr': 0.0004920372053590945, 'samples': 2673216, 'steps': 13922, 'loss/train': 2.091437339782715} -08/30/2021 15:37:24 - INFO - __main__ - Step 13924: {'lr': 0.0004920358766261294, 'samples': 2673408, 'steps': 13923, 'loss/train': 1.374764323234558} -08/30/2021 15:37:25 - INFO - __main__ - Step 13925: {'lr': 0.0004920345477841067, 'samples': 2673600, 'steps': 13924, 'loss/train': 1.987488031387329} -08/30/2021 15:37:25 - INFO - __main__ - Step 13926: {'lr': 0.000492033218833027, 'samples': 2673792, 'steps': 13925, 'loss/train': 2.5749735832214355} -08/30/2021 15:37:25 - INFO - __main__ - Step 13927: {'lr': 0.0004920318897728909, 'samples': 2673984, 'steps': 13926, 'loss/train': 1.9229964017868042} -08/30/2021 15:37:26 - INFO - __main__ - Step 13928: {'lr': 0.0004920305606036988, 'samples': 2674176, 'steps': 13927, 'loss/train': 2.0174031257629395} -08/30/2021 15:37:27 - INFO - __main__ - Step 13929: {'lr': 0.0004920292313254516, 'samples': 2674368, 'steps': 13928, 'loss/train': 1.2086713314056396} -08/30/2021 15:37:28 - INFO - __main__ - Step 13930: {'lr': 0.0004920279019381497, 'samples': 2674560, 'steps': 13929, 'loss/train': 1.6760241985321045} -08/30/2021 15:37:28 - INFO - __main__ - Step 13931: {'lr': 0.0004920265724417938, 'samples': 2674752, 'steps': 13930, 'loss/train': 1.5668439865112305} -08/30/2021 15:37:28 - INFO - __main__ - Step 13932: {'lr': 0.0004920252428363845, 'samples': 2674944, 'steps': 13931, 'loss/train': 1.283671259880066} -08/30/2021 15:37:29 - INFO - __main__ - Step 13933: {'lr': 0.0004920239131219223, 'samples': 2675136, 'steps': 13932, 'loss/train': 0.7934750318527222} -08/30/2021 15:37:30 - INFO - __main__ - Step 13934: {'lr': 0.0004920225832984079, 'samples': 2675328, 'steps': 13933, 'loss/train': 1.6775068044662476} -08/30/2021 15:37:31 - INFO - __main__ - Step 13935: {'lr': 0.0004920212533658419, 'samples': 2675520, 'steps': 13934, 'loss/train': 1.5483037233352661} -08/30/2021 15:37:31 - INFO - __main__ - Step 13936: {'lr': 0.0004920199233242247, 'samples': 2675712, 'steps': 13935, 'loss/train': 1.383685827255249} -08/30/2021 15:37:31 - INFO - __main__ - Step 13937: {'lr': 0.0004920185931735572, 'samples': 2675904, 'steps': 13936, 'loss/train': 1.6135034561157227} -08/30/2021 15:37:32 - INFO - __main__ - Step 13938: {'lr': 0.0004920172629138399, 'samples': 2676096, 'steps': 13937, 'loss/train': 1.8389533758163452} -08/30/2021 15:37:32 - INFO - __main__ - Step 13939: {'lr': 0.0004920159325450731, 'samples': 2676288, 'steps': 13938, 'loss/train': 5.266563892364502} -08/30/2021 15:37:34 - INFO - __main__ - Step 13940: {'lr': 0.0004920146020672578, 'samples': 2676480, 'steps': 13939, 'loss/train': 2.102337598800659} -08/30/2021 15:37:35 - INFO - __main__ - Step 13941: {'lr': 0.0004920132714803946, 'samples': 2676672, 'steps': 13940, 'loss/train': 1.7820079326629639} -08/30/2021 15:37:35 - INFO - __main__ - Step 13942: {'lr': 0.0004920119407844838, 'samples': 2676864, 'steps': 13941, 'loss/train': 1.3730963468551636} -08/30/2021 15:37:35 - INFO - __main__ - Step 13943: {'lr': 0.0004920106099795262, 'samples': 2677056, 'steps': 13942, 'loss/train': 1.7216168642044067} -08/30/2021 15:37:36 - INFO - __main__ - Step 13944: {'lr': 0.0004920092790655224, 'samples': 2677248, 'steps': 13943, 'loss/train': 1.7423903942108154} -08/30/2021 15:37:37 - INFO - __main__ - Step 13945: {'lr': 0.0004920079480424728, 'samples': 2677440, 'steps': 13944, 'loss/train': 1.3568315505981445} -08/30/2021 15:37:38 - INFO - __main__ - Step 13946: {'lr': 0.0004920066169103783, 'samples': 2677632, 'steps': 13945, 'loss/train': 1.8082294464111328} -08/30/2021 15:37:38 - INFO - __main__ - Step 13947: {'lr': 0.0004920052856692394, 'samples': 2677824, 'steps': 13946, 'loss/train': 0.3955638110637665} -08/30/2021 15:37:38 - INFO - __main__ - Step 13948: {'lr': 0.0004920039543190565, 'samples': 2678016, 'steps': 13947, 'loss/train': 2.1612000465393066} -08/30/2021 15:37:39 - INFO - __main__ - Step 13949: {'lr': 0.0004920026228598303, 'samples': 2678208, 'steps': 13948, 'loss/train': 2.3141117095947266} -08/30/2021 15:37:40 - INFO - __main__ - Step 13950: {'lr': 0.0004920012912915616, 'samples': 2678400, 'steps': 13949, 'loss/train': 1.8165549039840698} -08/30/2021 15:37:41 - INFO - __main__ - Step 13951: {'lr': 0.0004919999596142508, 'samples': 2678592, 'steps': 13950, 'loss/train': 1.9764556884765625} -08/30/2021 15:37:41 - INFO - __main__ - Step 13952: {'lr': 0.0004919986278278986, 'samples': 2678784, 'steps': 13951, 'loss/train': 1.7947592735290527} -08/30/2021 15:37:42 - INFO - __main__ - Step 13953: {'lr': 0.0004919972959325055, 'samples': 2678976, 'steps': 13952, 'loss/train': 0.1696995049715042} -08/30/2021 15:37:42 - INFO - __main__ - Step 13954: {'lr': 0.0004919959639280722, 'samples': 2679168, 'steps': 13953, 'loss/train': 1.772992491722107} -08/30/2021 15:37:44 - INFO - __main__ - Step 13955: {'lr': 0.0004919946318145992, 'samples': 2679360, 'steps': 13954, 'loss/train': 1.8060719966888428} -08/30/2021 15:37:44 - INFO - __main__ - Step 13956: {'lr': 0.0004919932995920872, 'samples': 2679552, 'steps': 13955, 'loss/train': 1.8740953207015991} -08/30/2021 15:37:44 - INFO - __main__ - Step 13957: {'lr': 0.0004919919672605366, 'samples': 2679744, 'steps': 13956, 'loss/train': 1.5823982954025269} -08/30/2021 15:37:45 - INFO - __main__ - Step 13958: {'lr': 0.0004919906348199483, 'samples': 2679936, 'steps': 13957, 'loss/train': 1.7188812494277954} -08/30/2021 15:37:45 - INFO - __main__ - Step 13959: {'lr': 0.0004919893022703228, 'samples': 2680128, 'steps': 13958, 'loss/train': 2.2183656692504883} -08/30/2021 15:37:45 - INFO - __main__ - Step 13960: {'lr': 0.0004919879696116605, 'samples': 2680320, 'steps': 13959, 'loss/train': 1.7986222505569458} -08/30/2021 15:37:47 - INFO - __main__ - Step 13961: {'lr': 0.0004919866368439624, 'samples': 2680512, 'steps': 13960, 'loss/train': 1.681349754333496} -08/30/2021 15:37:47 - INFO - __main__ - Step 13962: {'lr': 0.0004919853039672287, 'samples': 2680704, 'steps': 13961, 'loss/train': 1.8460050821304321} -08/30/2021 15:37:48 - INFO - __main__ - Step 13963: {'lr': 0.00049198397098146, 'samples': 2680896, 'steps': 13962, 'loss/train': 1.95518159866333} -08/30/2021 15:37:48 - INFO - __main__ - Step 13964: {'lr': 0.0004919826378866573, 'samples': 2681088, 'steps': 13963, 'loss/train': 1.8929909467697144} -08/30/2021 15:37:48 - INFO - __main__ - Step 13965: {'lr': 0.0004919813046828209, 'samples': 2681280, 'steps': 13964, 'loss/train': 1.0597758293151855} -08/30/2021 15:37:50 - INFO - __main__ - Step 13966: {'lr': 0.0004919799713699514, 'samples': 2681472, 'steps': 13965, 'loss/train': 1.583213210105896} -08/30/2021 15:37:50 - INFO - __main__ - Step 13967: {'lr': 0.0004919786379480494, 'samples': 2681664, 'steps': 13966, 'loss/train': 1.4857362508773804} -08/30/2021 15:37:51 - INFO - __main__ - Step 13968: {'lr': 0.0004919773044171158, 'samples': 2681856, 'steps': 13967, 'loss/train': 1.5280898809432983} -08/30/2021 15:37:51 - INFO - __main__ - Step 13969: {'lr': 0.0004919759707771507, 'samples': 2682048, 'steps': 13968, 'loss/train': 1.9612340927124023} -08/30/2021 15:37:51 - INFO - __main__ - Step 13970: {'lr': 0.0004919746370281551, 'samples': 2682240, 'steps': 13969, 'loss/train': 1.8146198987960815} -08/30/2021 15:37:53 - INFO - __main__ - Step 13971: {'lr': 0.0004919733031701295, 'samples': 2682432, 'steps': 13970, 'loss/train': 1.1746950149536133} -08/30/2021 15:37:54 - INFO - __main__ - Step 13972: {'lr': 0.0004919719692030743, 'samples': 2682624, 'steps': 13971, 'loss/train': 0.9985931515693665} -08/30/2021 15:37:54 - INFO - __main__ - Step 13973: {'lr': 0.0004919706351269904, 'samples': 2682816, 'steps': 13972, 'loss/train': 1.7299377918243408} -08/30/2021 15:37:54 - INFO - __main__ - Step 13974: {'lr': 0.0004919693009418782, 'samples': 2683008, 'steps': 13973, 'loss/train': 1.6628096103668213} -08/30/2021 15:37:55 - INFO - __main__ - Step 13975: {'lr': 0.0004919679666477384, 'samples': 2683200, 'steps': 13974, 'loss/train': 1.7094441652297974} -08/30/2021 15:37:55 - INFO - __main__ - Step 13976: {'lr': 0.0004919666322445715, 'samples': 2683392, 'steps': 13975, 'loss/train': 1.5595203638076782} -08/30/2021 15:37:57 - INFO - __main__ - Step 13977: {'lr': 0.0004919652977323783, 'samples': 2683584, 'steps': 13976, 'loss/train': 3.2277538776397705} -08/30/2021 15:37:57 - INFO - __main__ - Step 13978: {'lr': 0.0004919639631111592, 'samples': 2683776, 'steps': 13977, 'loss/train': 1.7416126728057861} -08/30/2021 15:37:58 - INFO - __main__ - Step 13979: {'lr': 0.0004919626283809149, 'samples': 2683968, 'steps': 13978, 'loss/train': 2.1867125034332275} -08/30/2021 15:37:58 - INFO - __main__ - Step 13980: {'lr': 0.0004919612935416459, 'samples': 2684160, 'steps': 13979, 'loss/train': 2.0710060596466064} -08/30/2021 15:37:58 - INFO - __main__ - Step 13981: {'lr': 0.000491959958593353, 'samples': 2684352, 'steps': 13980, 'loss/train': 1.9789578914642334} -08/30/2021 15:37:59 - INFO - __main__ - Step 13982: {'lr': 0.0004919586235360365, 'samples': 2684544, 'steps': 13981, 'loss/train': 2.061649799346924} -08/30/2021 15:38:00 - INFO - __main__ - Step 13983: {'lr': 0.0004919572883696974, 'samples': 2684736, 'steps': 13982, 'loss/train': 0.13816119730472565} -08/30/2021 15:38:01 - INFO - __main__ - Step 13984: {'lr': 0.0004919559530943359, 'samples': 2684928, 'steps': 13983, 'loss/train': 2.414689064025879} -08/30/2021 15:38:01 - INFO - __main__ - Step 13985: {'lr': 0.0004919546177099528, 'samples': 2685120, 'steps': 13984, 'loss/train': 1.581223964691162} -08/30/2021 15:38:01 - INFO - __main__ - Step 13986: {'lr': 0.0004919532822165487, 'samples': 2685312, 'steps': 13985, 'loss/train': 1.731987476348877} -08/30/2021 15:38:02 - INFO - __main__ - Step 13987: {'lr': 0.0004919519466141242, 'samples': 2685504, 'steps': 13986, 'loss/train': 1.7833051681518555} -08/30/2021 15:38:04 - INFO - __main__ - Step 13988: {'lr': 0.0004919506109026799, 'samples': 2685696, 'steps': 13987, 'loss/train': 1.6730360984802246} -08/30/2021 15:38:04 - INFO - __main__ - Step 13989: {'lr': 0.0004919492750822163, 'samples': 2685888, 'steps': 13988, 'loss/train': 1.2312800884246826} -08/30/2021 15:38:05 - INFO - __main__ - Step 13990: {'lr': 0.0004919479391527343, 'samples': 2686080, 'steps': 13989, 'loss/train': 1.9871710538864136} -08/30/2021 15:38:05 - INFO - __main__ - Step 13991: {'lr': 0.0004919466031142342, 'samples': 2686272, 'steps': 13990, 'loss/train': 1.8162356615066528} -08/30/2021 15:38:06 - INFO - __main__ - Step 13992: {'lr': 0.0004919452669667166, 'samples': 2686464, 'steps': 13991, 'loss/train': 1.7460132837295532} -08/30/2021 15:38:06 - INFO - __main__ - Step 13993: {'lr': 0.0004919439307101822, 'samples': 2686656, 'steps': 13992, 'loss/train': 1.6586244106292725} -08/30/2021 15:38:07 - INFO - __main__ - Step 13994: {'lr': 0.0004919425943446317, 'samples': 2686848, 'steps': 13993, 'loss/train': 0.23169642686843872} -08/30/2021 15:38:08 - INFO - __main__ - Step 13995: {'lr': 0.0004919412578700654, 'samples': 2687040, 'steps': 13994, 'loss/train': 2.336965322494507} -08/30/2021 15:38:08 - INFO - __main__ - Step 13996: {'lr': 0.0004919399212864843, 'samples': 2687232, 'steps': 13995, 'loss/train': 1.0330415964126587} -08/30/2021 15:38:09 - INFO - __main__ - Step 13997: {'lr': 0.0004919385845938888, 'samples': 2687424, 'steps': 13996, 'loss/train': 1.7321889400482178} -08/30/2021 15:38:09 - INFO - __main__ - Step 13998: {'lr': 0.0004919372477922794, 'samples': 2687616, 'steps': 13997, 'loss/train': 1.6030454635620117} -08/30/2021 15:38:11 - INFO - __main__ - Step 13999: {'lr': 0.0004919359108816569, 'samples': 2687808, 'steps': 13998, 'loss/train': 1.7427433729171753} -08/30/2021 15:38:12 - INFO - __main__ - Step 14000: {'lr': 0.0004919345738620218, 'samples': 2688000, 'steps': 13999, 'loss/train': 1.8576711416244507} -08/30/2021 15:38:12 - INFO - __main__ - Step 14001: {'lr': 0.0004919332367333747, 'samples': 2688192, 'steps': 14000, 'loss/train': 1.4826809167861938} -08/30/2021 15:38:12 - INFO - __main__ - Step 14002: {'lr': 0.0004919318994957162, 'samples': 2688384, 'steps': 14001, 'loss/train': 1.815764307975769} -08/30/2021 15:38:13 - INFO - __main__ - Step 14003: {'lr': 0.0004919305621490469, 'samples': 2688576, 'steps': 14002, 'loss/train': 2.4873239994049072} -08/30/2021 15:38:13 - INFO - __main__ - Step 14004: {'lr': 0.0004919292246933675, 'samples': 2688768, 'steps': 14003, 'loss/train': 1.6412919759750366} -08/30/2021 15:38:15 - INFO - __main__ - Step 14005: {'lr': 0.0004919278871286785, 'samples': 2688960, 'steps': 14004, 'loss/train': 2.0664548873901367} -08/30/2021 15:38:15 - INFO - __main__ - Step 14006: {'lr': 0.0004919265494549805, 'samples': 2689152, 'steps': 14005, 'loss/train': 2.6249313354492188} -08/30/2021 15:38:16 - INFO - __main__ - Step 14007: {'lr': 0.0004919252116722742, 'samples': 2689344, 'steps': 14006, 'loss/train': 1.8031655550003052} -08/30/2021 15:38:16 - INFO - __main__ - Step 14008: {'lr': 0.0004919238737805601, 'samples': 2689536, 'steps': 14007, 'loss/train': 0.16975277662277222} -08/30/2021 15:38:17 - INFO - __main__ - Step 14009: {'lr': 0.0004919225357798387, 'samples': 2689728, 'steps': 14008, 'loss/train': 1.5877736806869507} -08/30/2021 15:38:18 - INFO - __main__ - Step 14010: {'lr': 0.000491921197670111, 'samples': 2689920, 'steps': 14009, 'loss/train': 1.8153903484344482} -08/30/2021 15:38:18 - INFO - __main__ - Step 14011: {'lr': 0.0004919198594513771, 'samples': 2690112, 'steps': 14010, 'loss/train': 1.5196207761764526} -08/30/2021 15:38:19 - INFO - __main__ - Step 14012: {'lr': 0.0004919185211236379, 'samples': 2690304, 'steps': 14011, 'loss/train': 1.0222389698028564} -08/30/2021 15:38:19 - INFO - __main__ - Step 14013: {'lr': 0.000491917182686894, 'samples': 2690496, 'steps': 14012, 'loss/train': 1.8241993188858032} -08/30/2021 15:38:19 - INFO - __main__ - Step 14014: {'lr': 0.0004919158441411459, 'samples': 2690688, 'steps': 14013, 'loss/train': 1.7418286800384521} -08/30/2021 15:38:21 - INFO - __main__ - Step 14015: {'lr': 0.0004919145054863943, 'samples': 2690880, 'steps': 14014, 'loss/train': 1.3573681116104126} -08/30/2021 15:38:21 - INFO - __main__ - Step 14016: {'lr': 0.0004919131667226398, 'samples': 2691072, 'steps': 14015, 'loss/train': 1.9249037504196167} -08/30/2021 15:38:22 - INFO - __main__ - Step 14017: {'lr': 0.0004919118278498828, 'samples': 2691264, 'steps': 14016, 'loss/train': 1.7148103713989258} -08/30/2021 15:38:22 - INFO - __main__ - Step 14018: {'lr': 0.0004919104888681242, 'samples': 2691456, 'steps': 14017, 'loss/train': 2.0112602710723877} -08/30/2021 15:38:22 - INFO - __main__ - Step 14019: {'lr': 0.0004919091497773643, 'samples': 2691648, 'steps': 14018, 'loss/train': 1.5301368236541748} -08/30/2021 15:38:24 - INFO - __main__ - Step 14020: {'lr': 0.0004919078105776041, 'samples': 2691840, 'steps': 14019, 'loss/train': 0.8327675461769104} -08/30/2021 15:38:24 - INFO - __main__ - Step 14021: {'lr': 0.0004919064712688439, 'samples': 2692032, 'steps': 14020, 'loss/train': 1.8283535242080688} -08/30/2021 15:38:25 - INFO - __main__ - Step 14022: {'lr': 0.0004919051318510844, 'samples': 2692224, 'steps': 14021, 'loss/train': 1.206780195236206} -08/30/2021 15:38:25 - INFO - __main__ - Step 14023: {'lr': 0.0004919037923243261, 'samples': 2692416, 'steps': 14022, 'loss/train': 0.09630504250526428} -08/30/2021 15:38:25 - INFO - __main__ - Step 14024: {'lr': 0.0004919024526885697, 'samples': 2692608, 'steps': 14023, 'loss/train': 1.8012055158615112} -08/30/2021 15:38:27 - INFO - __main__ - Step 14025: {'lr': 0.0004919011129438158, 'samples': 2692800, 'steps': 14024, 'loss/train': 1.7135487794876099} -08/30/2021 15:38:27 - INFO - __main__ - Step 14026: {'lr': 0.0004918997730900649, 'samples': 2692992, 'steps': 14025, 'loss/train': 1.7016279697418213} -08/30/2021 15:38:28 - INFO - __main__ - Step 14027: {'lr': 0.0004918984331273178, 'samples': 2693184, 'steps': 14026, 'loss/train': 1.536525845527649} -08/30/2021 15:38:28 - INFO - __main__ - Step 14028: {'lr': 0.0004918970930555751, 'samples': 2693376, 'steps': 14027, 'loss/train': 1.658823013305664} -08/30/2021 15:38:28 - INFO - __main__ - Step 14029: {'lr': 0.0004918957528748371, 'samples': 2693568, 'steps': 14028, 'loss/train': 1.4102813005447388} -08/30/2021 15:38:30 - INFO - __main__ - Step 14030: {'lr': 0.0004918944125851047, 'samples': 2693760, 'steps': 14029, 'loss/train': 1.7518928050994873} -08/30/2021 15:38:31 - INFO - __main__ - Step 14031: {'lr': 0.0004918930721863784, 'samples': 2693952, 'steps': 14030, 'loss/train': 1.562180519104004} -08/30/2021 15:38:31 - INFO - __main__ - Step 14032: {'lr': 0.0004918917316786589, 'samples': 2694144, 'steps': 14031, 'loss/train': 1.6976679563522339} -08/30/2021 15:38:31 - INFO - __main__ - Step 14033: {'lr': 0.0004918903910619465, 'samples': 2694336, 'steps': 14032, 'loss/train': 1.5939868688583374} -08/30/2021 15:38:32 - INFO - __main__ - Step 14034: {'lr': 0.0004918890503362422, 'samples': 2694528, 'steps': 14033, 'loss/train': 1.6739760637283325} -08/30/2021 15:38:32 - INFO - __main__ - Step 14035: {'lr': 0.0004918877095015465, 'samples': 2694720, 'steps': 14034, 'loss/train': 3.0974340438842773} -08/30/2021 15:38:33 - INFO - __main__ - Step 14036: {'lr': 0.0004918863685578598, 'samples': 2694912, 'steps': 14035, 'loss/train': 0.43638405203819275} -08/30/2021 15:38:34 - INFO - __main__ - Step 14037: {'lr': 0.0004918850275051829, 'samples': 2695104, 'steps': 14036, 'loss/train': 0.8242853879928589} -08/30/2021 15:38:34 - INFO - __main__ - Step 14038: {'lr': 0.0004918836863435162, 'samples': 2695296, 'steps': 14037, 'loss/train': 1.301469326019287} -08/30/2021 15:38:35 - INFO - __main__ - Step 14039: {'lr': 0.0004918823450728606, 'samples': 2695488, 'steps': 14038, 'loss/train': 1.672101616859436} -08/30/2021 15:38:35 - INFO - __main__ - Step 14040: {'lr': 0.0004918810036932164, 'samples': 2695680, 'steps': 14039, 'loss/train': 1.5688748359680176} -08/30/2021 15:38:37 - INFO - __main__ - Step 14041: {'lr': 0.0004918796622045844, 'samples': 2695872, 'steps': 14040, 'loss/train': 0.8930960893630981} -08/30/2021 15:38:37 - INFO - __main__ - Step 14042: {'lr': 0.0004918783206069652, 'samples': 2696064, 'steps': 14041, 'loss/train': 0.10164300352334976} -08/30/2021 15:38:37 - INFO - __main__ - Step 14043: {'lr': 0.0004918769789003593, 'samples': 2696256, 'steps': 14042, 'loss/train': 1.9629344940185547} -08/30/2021 15:38:38 - INFO - __main__ - Step 14044: {'lr': 0.0004918756370847674, 'samples': 2696448, 'steps': 14043, 'loss/train': 1.7223443984985352} -08/30/2021 15:38:38 - INFO - __main__ - Step 14045: {'lr': 0.0004918742951601902, 'samples': 2696640, 'steps': 14044, 'loss/train': 2.261448383331299} -08/30/2021 15:38:40 - INFO - __main__ - Step 14046: {'lr': 0.000491872953126628, 'samples': 2696832, 'steps': 14045, 'loss/train': 2.6446807384490967} -08/30/2021 15:38:40 - INFO - __main__ - Step 14047: {'lr': 0.0004918716109840817, 'samples': 2697024, 'steps': 14046, 'loss/train': 1.6899405717849731} -08/30/2021 15:38:40 - INFO - __main__ - Step 14048: {'lr': 0.0004918702687325517, 'samples': 2697216, 'steps': 14047, 'loss/train': 1.8066340684890747} -08/30/2021 15:38:41 - INFO - __main__ - Step 14049: {'lr': 0.0004918689263720388, 'samples': 2697408, 'steps': 14048, 'loss/train': 1.766615390777588} -08/30/2021 15:38:41 - INFO - __main__ - Step 14050: {'lr': 0.0004918675839025434, 'samples': 2697600, 'steps': 14049, 'loss/train': 2.1533803939819336} -08/30/2021 15:38:44 - INFO - __main__ - Step 14051: {'lr': 0.0004918662413240662, 'samples': 2697792, 'steps': 14050, 'loss/train': 1.5729386806488037} -08/30/2021 15:38:44 - INFO - __main__ - Step 14052: {'lr': 0.0004918648986366078, 'samples': 2697984, 'steps': 14051, 'loss/train': 1.3882887363433838} -08/30/2021 15:38:44 - INFO - __main__ - Step 14053: {'lr': 0.0004918635558401687, 'samples': 2698176, 'steps': 14052, 'loss/train': 1.6236763000488281} -08/30/2021 15:38:45 - INFO - __main__ - Step 14054: {'lr': 0.0004918622129347498, 'samples': 2698368, 'steps': 14053, 'loss/train': 2.609205961227417} -08/30/2021 15:38:45 - INFO - __main__ - Step 14055: {'lr': 0.0004918608699203515, 'samples': 2698560, 'steps': 14054, 'loss/train': 1.5624489784240723} -08/30/2021 15:38:45 - INFO - __main__ - Step 14056: {'lr': 0.0004918595267969744, 'samples': 2698752, 'steps': 14055, 'loss/train': 1.3526252508163452} -08/30/2021 15:38:47 - INFO - __main__ - Step 14057: {'lr': 0.0004918581835646191, 'samples': 2698944, 'steps': 14056, 'loss/train': 1.87291419506073} -08/30/2021 15:38:47 - INFO - __main__ - Step 14058: {'lr': 0.0004918568402232863, 'samples': 2699136, 'steps': 14057, 'loss/train': 1.5407071113586426} -08/30/2021 15:38:48 - INFO - __main__ - Step 14059: {'lr': 0.0004918554967729764, 'samples': 2699328, 'steps': 14058, 'loss/train': 1.3131482601165771} -08/30/2021 15:38:48 - INFO - __main__ - Step 14060: {'lr': 0.0004918541532136902, 'samples': 2699520, 'steps': 14059, 'loss/train': 0.9513907432556152} -08/30/2021 15:38:48 - INFO - __main__ - Step 14061: {'lr': 0.0004918528095454283, 'samples': 2699712, 'steps': 14060, 'loss/train': 1.919915795326233} -08/30/2021 15:38:49 - INFO - __main__ - Step 14062: {'lr': 0.0004918514657681913, 'samples': 2699904, 'steps': 14061, 'loss/train': 1.270890235900879} -08/30/2021 15:38:50 - INFO - __main__ - Step 14063: {'lr': 0.0004918501218819796, 'samples': 2700096, 'steps': 14062, 'loss/train': 1.272247552871704} -08/30/2021 15:38:51 - INFO - __main__ - Step 14064: {'lr': 0.0004918487778867941, 'samples': 2700288, 'steps': 14063, 'loss/train': 2.140005111694336} -08/30/2021 15:38:51 - INFO - __main__ - Step 14065: {'lr': 0.0004918474337826353, 'samples': 2700480, 'steps': 14064, 'loss/train': 1.036586880683899} -08/30/2021 15:38:51 - INFO - __main__ - Step 14066: {'lr': 0.0004918460895695037, 'samples': 2700672, 'steps': 14065, 'loss/train': 1.626570701599121} -08/30/2021 15:38:52 - INFO - __main__ - Step 14067: {'lr': 0.0004918447452474, 'samples': 2700864, 'steps': 14066, 'loss/train': 1.351240634918213} -08/30/2021 15:38:53 - INFO - __main__ - Step 14068: {'lr': 0.0004918434008163247, 'samples': 2701056, 'steps': 14067, 'loss/train': 1.6912751197814941} -08/30/2021 15:38:54 - INFO - __main__ - Step 14069: {'lr': 0.0004918420562762786, 'samples': 2701248, 'steps': 14068, 'loss/train': 1.9792084693908691} -08/30/2021 15:38:54 - INFO - __main__ - Step 14070: {'lr': 0.0004918407116272622, 'samples': 2701440, 'steps': 14069, 'loss/train': 1.7819777727127075} -08/30/2021 15:38:54 - INFO - __main__ - Step 14071: {'lr': 0.000491839366869276, 'samples': 2701632, 'steps': 14070, 'loss/train': 1.1663535833358765} -08/30/2021 15:38:55 - INFO - __main__ - Step 14072: {'lr': 0.000491838022002321, 'samples': 2701824, 'steps': 14071, 'loss/train': 2.1723740100860596} -08/30/2021 15:38:56 - INFO - __main__ - Step 14073: {'lr': 0.0004918366770263972, 'samples': 2702016, 'steps': 14072, 'loss/train': 1.923164963722229} -08/30/2021 15:38:57 - INFO - __main__ - Step 14074: {'lr': 0.0004918353319415057, 'samples': 2702208, 'steps': 14073, 'loss/train': 1.9491578340530396} -08/30/2021 15:38:57 - INFO - __main__ - Step 14075: {'lr': 0.0004918339867476469, 'samples': 2702400, 'steps': 14074, 'loss/train': 1.578508734703064} -08/30/2021 15:38:57 - INFO - __main__ - Step 14076: {'lr': 0.0004918326414448214, 'samples': 2702592, 'steps': 14075, 'loss/train': 0.5960631966590881} -08/30/2021 15:38:58 - INFO - __main__ - Step 14077: {'lr': 0.0004918312960330299, 'samples': 2702784, 'steps': 14076, 'loss/train': 1.7320919036865234} -08/30/2021 15:38:59 - INFO - __main__ - Step 14078: {'lr': 0.0004918299505122729, 'samples': 2702976, 'steps': 14077, 'loss/train': 1.436476469039917} -08/30/2021 15:39:00 - INFO - __main__ - Step 14079: {'lr': 0.000491828604882551, 'samples': 2703168, 'steps': 14078, 'loss/train': 1.8881703615188599} -08/30/2021 15:39:00 - INFO - __main__ - Step 14080: {'lr': 0.0004918272591438649, 'samples': 2703360, 'steps': 14079, 'loss/train': 1.6356626749038696} -08/30/2021 15:39:01 - INFO - __main__ - Step 14081: {'lr': 0.0004918259132962153, 'samples': 2703552, 'steps': 14080, 'loss/train': 1.0681535005569458} -08/30/2021 15:39:01 - INFO - __main__ - Step 14082: {'lr': 0.0004918245673396025, 'samples': 2703744, 'steps': 14081, 'loss/train': 2.058180570602417} -08/30/2021 15:39:01 - INFO - __main__ - Step 14083: {'lr': 0.0004918232212740274, 'samples': 2703936, 'steps': 14082, 'loss/train': 1.0928046703338623} -08/30/2021 15:39:03 - INFO - __main__ - Step 14084: {'lr': 0.0004918218750994904, 'samples': 2704128, 'steps': 14083, 'loss/train': 1.6999531984329224} -08/30/2021 15:39:03 - INFO - __main__ - Step 14085: {'lr': 0.0004918205288159923, 'samples': 2704320, 'steps': 14084, 'loss/train': 1.7699096202850342} -08/30/2021 15:39:04 - INFO - __main__ - Step 14086: {'lr': 0.0004918191824235335, 'samples': 2704512, 'steps': 14085, 'loss/train': 1.5534898042678833} -08/30/2021 15:39:04 - INFO - __main__ - Step 14087: {'lr': 0.0004918178359221147, 'samples': 2704704, 'steps': 14086, 'loss/train': 1.5937029123306274} -08/30/2021 15:39:04 - INFO - __main__ - Step 14088: {'lr': 0.0004918164893117366, 'samples': 2704896, 'steps': 14087, 'loss/train': 1.4823368787765503} -08/30/2021 15:39:06 - INFO - __main__ - Step 14089: {'lr': 0.0004918151425923996, 'samples': 2705088, 'steps': 14088, 'loss/train': 1.1469001770019531} -08/30/2021 15:39:06 - INFO - __main__ - Step 14090: {'lr': 0.0004918137957641046, 'samples': 2705280, 'steps': 14089, 'loss/train': 0.939859926700592} -08/30/2021 15:39:07 - INFO - __main__ - Step 14091: {'lr': 0.000491812448826852, 'samples': 2705472, 'steps': 14090, 'loss/train': 0.8698261380195618} -08/30/2021 15:39:07 - INFO - __main__ - Step 14092: {'lr': 0.0004918111017806424, 'samples': 2705664, 'steps': 14091, 'loss/train': 1.6383382081985474} -08/30/2021 15:39:07 - INFO - __main__ - Step 14093: {'lr': 0.0004918097546254764, 'samples': 2705856, 'steps': 14092, 'loss/train': 2.0791850090026855} -08/30/2021 15:39:09 - INFO - __main__ - Step 14094: {'lr': 0.0004918084073613547, 'samples': 2706048, 'steps': 14093, 'loss/train': 2.0904128551483154} -08/30/2021 15:39:09 - INFO - __main__ - Step 14095: {'lr': 0.0004918070599882778, 'samples': 2706240, 'steps': 14094, 'loss/train': 1.762641429901123} -08/30/2021 15:39:10 - INFO - __main__ - Step 14096: {'lr': 0.0004918057125062465, 'samples': 2706432, 'steps': 14095, 'loss/train': 1.576412320137024} -08/30/2021 15:39:10 - INFO - __main__ - Step 14097: {'lr': 0.0004918043649152612, 'samples': 2706624, 'steps': 14096, 'loss/train': 1.2938681840896606} -08/30/2021 15:39:10 - INFO - __main__ - Step 14098: {'lr': 0.0004918030172153225, 'samples': 2706816, 'steps': 14097, 'loss/train': 1.8019441366195679} -08/30/2021 15:39:12 - INFO - __main__ - Step 14099: {'lr': 0.0004918016694064313, 'samples': 2707008, 'steps': 14098, 'loss/train': 1.796257495880127} -08/30/2021 15:39:12 - INFO - __main__ - Step 14100: {'lr': 0.0004918003214885877, 'samples': 2707200, 'steps': 14099, 'loss/train': 1.3860641717910767} -08/30/2021 15:39:13 - INFO - __main__ - Step 14101: {'lr': 0.0004917989734617928, 'samples': 2707392, 'steps': 14100, 'loss/train': 0.7811518311500549} -08/30/2021 15:39:13 - INFO - __main__ - Step 14102: {'lr': 0.0004917976253260471, 'samples': 2707584, 'steps': 14101, 'loss/train': 1.9318650960922241} -08/30/2021 15:39:13 - INFO - __main__ - Step 14103: {'lr': 0.000491796277081351, 'samples': 2707776, 'steps': 14102, 'loss/train': 2.0168838500976562} -08/30/2021 15:39:16 - INFO - __main__ - Step 14104: {'lr': 0.0004917949287277052, 'samples': 2707968, 'steps': 14103, 'loss/train': 2.3239035606384277} -08/30/2021 15:39:16 - INFO - __main__ - Step 14105: {'lr': 0.0004917935802651104, 'samples': 2708160, 'steps': 14104, 'loss/train': 1.8436191082000732} -08/30/2021 15:39:17 - INFO - __main__ - Step 14106: {'lr': 0.0004917922316935671, 'samples': 2708352, 'steps': 14105, 'loss/train': 1.6571234464645386} -08/30/2021 15:39:17 - INFO - __main__ - Step 14107: {'lr': 0.000491790883013076, 'samples': 2708544, 'steps': 14106, 'loss/train': 1.3560878038406372} -08/30/2021 15:39:17 - INFO - __main__ - Step 14108: {'lr': 0.0004917895342236377, 'samples': 2708736, 'steps': 14107, 'loss/train': 0.08560151606798172} -08/30/2021 15:39:18 - INFO - __main__ - Step 14109: {'lr': 0.0004917881853252527, 'samples': 2708928, 'steps': 14108, 'loss/train': 1.4498388767242432} -08/30/2021 15:39:19 - INFO - __main__ - Step 14110: {'lr': 0.0004917868363179216, 'samples': 2709120, 'steps': 14109, 'loss/train': 2.0461947917938232} -08/30/2021 15:39:20 - INFO - __main__ - Step 14111: {'lr': 0.0004917854872016451, 'samples': 2709312, 'steps': 14110, 'loss/train': 1.3963159322738647} -08/30/2021 15:39:20 - INFO - __main__ - Step 14112: {'lr': 0.000491784137976424, 'samples': 2709504, 'steps': 14111, 'loss/train': 1.5421956777572632} -08/30/2021 15:39:20 - INFO - __main__ - Step 14113: {'lr': 0.0004917827886422586, 'samples': 2709696, 'steps': 14112, 'loss/train': 1.673872709274292} -08/30/2021 15:39:21 - INFO - __main__ - Step 14114: {'lr': 0.0004917814391991494, 'samples': 2709888, 'steps': 14113, 'loss/train': 2.0303893089294434} -08/30/2021 15:39:22 - INFO - __main__ - Step 14115: {'lr': 0.0004917800896470974, 'samples': 2710080, 'steps': 14114, 'loss/train': 1.528775930404663} -08/30/2021 15:39:23 - INFO - __main__ - Step 14116: {'lr': 0.000491778739986103, 'samples': 2710272, 'steps': 14115, 'loss/train': 1.8756296634674072} -08/30/2021 15:39:23 - INFO - __main__ - Step 14117: {'lr': 0.0004917773902161669, 'samples': 2710464, 'steps': 14116, 'loss/train': 2.3668806552886963} -08/30/2021 15:39:23 - INFO - __main__ - Step 14118: {'lr': 0.0004917760403372895, 'samples': 2710656, 'steps': 14117, 'loss/train': 2.0578255653381348} -08/30/2021 15:39:24 - INFO - __main__ - Step 14119: {'lr': 0.0004917746903494717, 'samples': 2710848, 'steps': 14118, 'loss/train': 1.6370103359222412} -08/30/2021 15:39:25 - INFO - __main__ - Step 14120: {'lr': 0.0004917733402527138, 'samples': 2711040, 'steps': 14119, 'loss/train': 1.6128284931182861} -08/30/2021 15:39:26 - INFO - __main__ - Step 14121: {'lr': 0.0004917719900470167, 'samples': 2711232, 'steps': 14120, 'loss/train': 1.5568597316741943} -08/30/2021 15:39:26 - INFO - __main__ - Step 14122: {'lr': 0.0004917706397323808, 'samples': 2711424, 'steps': 14121, 'loss/train': 1.3538464307785034} -08/30/2021 15:39:27 - INFO - __main__ - Step 14123: {'lr': 0.0004917692893088067, 'samples': 2711616, 'steps': 14122, 'loss/train': 0.16965769231319427} -08/30/2021 15:39:27 - INFO - __main__ - Step 14124: {'lr': 0.0004917679387762952, 'samples': 2711808, 'steps': 14123, 'loss/train': 1.666258692741394} -08/30/2021 15:39:28 - INFO - __main__ - Step 14125: {'lr': 0.0004917665881348467, 'samples': 2712000, 'steps': 14124, 'loss/train': 1.620166540145874} -08/30/2021 15:39:29 - INFO - __main__ - Step 14126: {'lr': 0.000491765237384462, 'samples': 2712192, 'steps': 14125, 'loss/train': 1.5839182138442993} -08/30/2021 15:39:29 - INFO - __main__ - Step 14127: {'lr': 0.0004917638865251416, 'samples': 2712384, 'steps': 14126, 'loss/train': 1.9082685708999634} -08/30/2021 15:39:30 - INFO - __main__ - Step 14128: {'lr': 0.0004917625355568861, 'samples': 2712576, 'steps': 14127, 'loss/train': 2.201725482940674} -08/30/2021 15:39:30 - INFO - __main__ - Step 14129: {'lr': 0.0004917611844796962, 'samples': 2712768, 'steps': 14128, 'loss/train': 1.6258965730667114} -08/30/2021 15:39:30 - INFO - __main__ - Step 14130: {'lr': 0.0004917598332935724, 'samples': 2712960, 'steps': 14129, 'loss/train': 1.4448388814926147} -08/30/2021 15:39:32 - INFO - __main__ - Step 14131: {'lr': 0.0004917584819985153, 'samples': 2713152, 'steps': 14130, 'loss/train': 1.4698928594589233} -08/30/2021 15:39:32 - INFO - __main__ - Step 14132: {'lr': 0.0004917571305945256, 'samples': 2713344, 'steps': 14131, 'loss/train': 1.5409729480743408} -08/30/2021 15:39:33 - INFO - __main__ - Step 14133: {'lr': 0.0004917557790816039, 'samples': 2713536, 'steps': 14132, 'loss/train': 1.8997957706451416} -08/30/2021 15:39:33 - INFO - __main__ - Step 14134: {'lr': 0.0004917544274597507, 'samples': 2713728, 'steps': 14133, 'loss/train': 1.914629340171814} -08/30/2021 15:39:33 - INFO - __main__ - Step 14135: {'lr': 0.0004917530757289668, 'samples': 2713920, 'steps': 14134, 'loss/train': 1.625847339630127} -08/30/2021 15:39:35 - INFO - __main__ - Step 14136: {'lr': 0.0004917517238892526, 'samples': 2714112, 'steps': 14135, 'loss/train': 2.0104947090148926} -08/30/2021 15:39:36 - INFO - __main__ - Step 14137: {'lr': 0.0004917503719406087, 'samples': 2714304, 'steps': 14136, 'loss/train': 0.09295482188463211} -08/30/2021 15:39:36 - INFO - __main__ - Step 14138: {'lr': 0.000491749019883036, 'samples': 2714496, 'steps': 14137, 'loss/train': 0.12390390038490295} -08/30/2021 15:39:37 - INFO - __main__ - Step 14139: {'lr': 0.0004917476677165349, 'samples': 2714688, 'steps': 14138, 'loss/train': 1.3897292613983154} -08/30/2021 15:39:37 - INFO - __main__ - Step 14140: {'lr': 0.0004917463154411059, 'samples': 2714880, 'steps': 14139, 'loss/train': 1.7671445608139038} -08/30/2021 15:39:37 - INFO - __main__ - Step 14141: {'lr': 0.0004917449630567499, 'samples': 2715072, 'steps': 14140, 'loss/train': 1.804566740989685} -08/30/2021 15:39:39 - INFO - __main__ - Step 14142: {'lr': 0.0004917436105634673, 'samples': 2715264, 'steps': 14141, 'loss/train': 1.5026624202728271} -08/30/2021 15:39:39 - INFO - __main__ - Step 14143: {'lr': 0.0004917422579612587, 'samples': 2715456, 'steps': 14142, 'loss/train': 1.7232012748718262} -08/30/2021 15:39:40 - INFO - __main__ - Step 14144: {'lr': 0.0004917409052501248, 'samples': 2715648, 'steps': 14143, 'loss/train': 1.2619420289993286} -08/30/2021 15:39:40 - INFO - __main__ - Step 14145: {'lr': 0.0004917395524300661, 'samples': 2715840, 'steps': 14144, 'loss/train': 1.1857624053955078} -08/30/2021 15:39:40 - INFO - __main__ - Step 14146: {'lr': 0.0004917381995010834, 'samples': 2716032, 'steps': 14145, 'loss/train': 1.8339183330535889} -08/30/2021 15:39:42 - INFO - __main__ - Step 14147: {'lr': 0.0004917368464631772, 'samples': 2716224, 'steps': 14146, 'loss/train': 1.0906007289886475} -08/30/2021 15:39:42 - INFO - __main__ - Step 14148: {'lr': 0.0004917354933163481, 'samples': 2716416, 'steps': 14147, 'loss/train': 1.5463742017745972} -08/30/2021 15:39:43 - INFO - __main__ - Step 14149: {'lr': 0.0004917341400605967, 'samples': 2716608, 'steps': 14148, 'loss/train': 1.2037752866744995} -08/30/2021 15:39:43 - INFO - __main__ - Step 14150: {'lr': 0.0004917327866959236, 'samples': 2716800, 'steps': 14149, 'loss/train': 1.5649795532226562} -08/30/2021 15:39:44 - INFO - __main__ - Step 14151: {'lr': 0.0004917314332223295, 'samples': 2716992, 'steps': 14150, 'loss/train': 2.0070488452911377} -08/30/2021 15:39:44 - INFO - __main__ - Step 14152: {'lr': 0.0004917300796398148, 'samples': 2717184, 'steps': 14151, 'loss/train': 1.3868390321731567} -08/30/2021 15:39:45 - INFO - __main__ - Step 14153: {'lr': 0.0004917287259483805, 'samples': 2717376, 'steps': 14152, 'loss/train': 3.9668636322021484} -08/30/2021 15:39:46 - INFO - __main__ - Step 14154: {'lr': 0.0004917273721480268, 'samples': 2717568, 'steps': 14153, 'loss/train': 2.3048255443573} -08/30/2021 15:39:46 - INFO - __main__ - Step 14155: {'lr': 0.0004917260182387545, 'samples': 2717760, 'steps': 14154, 'loss/train': 1.8597017526626587} -08/30/2021 15:39:46 - INFO - __main__ - Step 14156: {'lr': 0.0004917246642205642, 'samples': 2717952, 'steps': 14155, 'loss/train': 1.8402026891708374} -08/30/2021 15:39:47 - INFO - __main__ - Step 14157: {'lr': 0.0004917233100934565, 'samples': 2718144, 'steps': 14156, 'loss/train': 1.6949419975280762} -08/30/2021 15:39:49 - INFO - __main__ - Step 14158: {'lr': 0.0004917219558574319, 'samples': 2718336, 'steps': 14157, 'loss/train': 1.4849724769592285} -08/30/2021 15:39:49 - INFO - __main__ - Step 14159: {'lr': 0.0004917206015124913, 'samples': 2718528, 'steps': 14158, 'loss/train': 1.8341007232666016} -08/30/2021 15:39:50 - INFO - __main__ - Step 14160: {'lr': 0.000491719247058635, 'samples': 2718720, 'steps': 14159, 'loss/train': 1.6200454235076904} -08/30/2021 15:39:50 - INFO - __main__ - Step 14161: {'lr': 0.0004917178924958638, 'samples': 2718912, 'steps': 14160, 'loss/train': 1.7147324085235596} -08/30/2021 15:39:50 - INFO - __main__ - Step 14162: {'lr': 0.0004917165378241782, 'samples': 2719104, 'steps': 14161, 'loss/train': 1.798283576965332} -08/30/2021 15:39:52 - INFO - __main__ - Step 14163: {'lr': 0.0004917151830435789, 'samples': 2719296, 'steps': 14162, 'loss/train': 1.7082637548446655} -08/30/2021 15:39:52 - INFO - __main__ - Step 14164: {'lr': 0.0004917138281540664, 'samples': 2719488, 'steps': 14163, 'loss/train': 1.2861160039901733} -08/30/2021 15:39:53 - INFO - __main__ - Step 14165: {'lr': 0.0004917124731556415, 'samples': 2719680, 'steps': 14164, 'loss/train': 1.4616657495498657} -08/30/2021 15:39:53 - INFO - __main__ - Step 14166: {'lr': 0.0004917111180483046, 'samples': 2719872, 'steps': 14165, 'loss/train': 1.669005274772644} -08/30/2021 15:39:53 - INFO - __main__ - Step 14167: {'lr': 0.0004917097628320564, 'samples': 2720064, 'steps': 14166, 'loss/train': 1.6722915172576904} -08/30/2021 15:39:55 - INFO - __main__ - Step 14168: {'lr': 0.0004917084075068975, 'samples': 2720256, 'steps': 14167, 'loss/train': 2.3572487831115723} -08/30/2021 15:39:55 - INFO - __main__ - Step 14169: {'lr': 0.0004917070520728286, 'samples': 2720448, 'steps': 14168, 'loss/train': 1.9552350044250488} -08/30/2021 15:39:56 - INFO - __main__ - Step 14170: {'lr': 0.0004917056965298501, 'samples': 2720640, 'steps': 14169, 'loss/train': 1.7678080797195435} -08/30/2021 15:39:56 - INFO - __main__ - Step 14171: {'lr': 0.0004917043408779629, 'samples': 2720832, 'steps': 14170, 'loss/train': 1.659894585609436} -08/30/2021 15:39:56 - INFO - __main__ - Step 14172: {'lr': 0.0004917029851171674, 'samples': 2721024, 'steps': 14171, 'loss/train': 1.7558727264404297} -08/30/2021 15:39:58 - INFO - __main__ - Step 14173: {'lr': 0.0004917016292474642, 'samples': 2721216, 'steps': 14172, 'loss/train': 2.1233808994293213} -08/30/2021 15:39:58 - INFO - __main__ - Step 14174: {'lr': 0.000491700273268854, 'samples': 2721408, 'steps': 14173, 'loss/train': 1.6767710447311401} -08/30/2021 15:39:59 - INFO - __main__ - Step 14175: {'lr': 0.0004916989171813374, 'samples': 2721600, 'steps': 14174, 'loss/train': 1.980328917503357} -08/30/2021 15:39:59 - INFO - __main__ - Step 14176: {'lr': 0.000491697560984915, 'samples': 2721792, 'steps': 14175, 'loss/train': 1.541935682296753} -08/30/2021 15:39:59 - INFO - __main__ - Step 14177: {'lr': 0.0004916962046795874, 'samples': 2721984, 'steps': 14176, 'loss/train': 1.7506691217422485} -08/30/2021 15:40:01 - INFO - __main__ - Step 14178: {'lr': 0.0004916948482653553, 'samples': 2722176, 'steps': 14177, 'loss/train': 1.729347586631775} -08/30/2021 15:40:01 - INFO - __main__ - Step 14179: {'lr': 0.0004916934917422191, 'samples': 2722368, 'steps': 14178, 'loss/train': 1.5602684020996094} -08/30/2021 15:40:02 - INFO - __main__ - Step 14180: {'lr': 0.0004916921351101796, 'samples': 2722560, 'steps': 14179, 'loss/train': 1.8815113306045532} -08/30/2021 15:40:02 - INFO - __main__ - Step 14181: {'lr': 0.0004916907783692374, 'samples': 2722752, 'steps': 14180, 'loss/train': 1.4521411657333374} -08/30/2021 15:40:02 - INFO - __main__ - Step 14182: {'lr': 0.000491689421519393, 'samples': 2722944, 'steps': 14181, 'loss/train': 0.0882885530591011} -08/30/2021 15:40:04 - INFO - __main__ - Step 14183: {'lr': 0.0004916880645606471, 'samples': 2723136, 'steps': 14182, 'loss/train': 2.0369925498962402} -08/30/2021 15:40:04 - INFO - __main__ - Step 14184: {'lr': 0.0004916867074930002, 'samples': 2723328, 'steps': 14183, 'loss/train': 1.6349990367889404} -08/30/2021 15:40:05 - INFO - __main__ - Step 14185: {'lr': 0.0004916853503164531, 'samples': 2723520, 'steps': 14184, 'loss/train': 1.890197992324829} -08/30/2021 15:40:05 - INFO - __main__ - Step 14186: {'lr': 0.0004916839930310063, 'samples': 2723712, 'steps': 14185, 'loss/train': 1.398798942565918} -08/30/2021 15:40:05 - INFO - __main__ - Step 14187: {'lr': 0.0004916826356366605, 'samples': 2723904, 'steps': 14186, 'loss/train': 1.4671858549118042} -08/30/2021 15:40:06 - INFO - __main__ - Step 14188: {'lr': 0.0004916812781334161, 'samples': 2724096, 'steps': 14187, 'loss/train': 1.8269046545028687} -08/30/2021 15:40:07 - INFO - __main__ - Step 14189: {'lr': 0.0004916799205212739, 'samples': 2724288, 'steps': 14188, 'loss/train': 1.612385630607605} -08/30/2021 15:40:08 - INFO - __main__ - Step 14190: {'lr': 0.0004916785628002345, 'samples': 2724480, 'steps': 14189, 'loss/train': 1.8590627908706665} -08/30/2021 15:40:08 - INFO - __main__ - Step 14191: {'lr': 0.0004916772049702984, 'samples': 2724672, 'steps': 14190, 'loss/train': 1.6657508611679077} -08/30/2021 15:40:08 - INFO - __main__ - Step 14192: {'lr': 0.0004916758470314662, 'samples': 2724864, 'steps': 14191, 'loss/train': 1.6730341911315918} -08/30/2021 15:40:09 - INFO - __main__ - Step 14193: {'lr': 0.0004916744889837388, 'samples': 2725056, 'steps': 14192, 'loss/train': 1.5481258630752563} -08/30/2021 15:40:10 - INFO - __main__ - Step 14194: {'lr': 0.0004916731308271165, 'samples': 2725248, 'steps': 14193, 'loss/train': 1.7963457107543945} -08/30/2021 15:40:11 - INFO - __main__ - Step 14195: {'lr': 0.0004916717725616, 'samples': 2725440, 'steps': 14194, 'loss/train': 1.623094916343689} -08/30/2021 15:40:11 - INFO - __main__ - Step 14196: {'lr': 0.0004916704141871899, 'samples': 2725632, 'steps': 14195, 'loss/train': 1.7807375192642212} -08/30/2021 15:40:11 - INFO - __main__ - Step 14197: {'lr': 0.000491669055703887, 'samples': 2725824, 'steps': 14196, 'loss/train': 1.500786542892456} -08/30/2021 15:40:12 - INFO - __main__ - Step 14198: {'lr': 0.0004916676971116916, 'samples': 2726016, 'steps': 14197, 'loss/train': 0.9933580756187439} -08/30/2021 15:40:13 - INFO - __main__ - Step 14199: {'lr': 0.0004916663384106045, 'samples': 2726208, 'steps': 14198, 'loss/train': 0.9632720947265625} -08/30/2021 15:40:14 - INFO - __main__ - Step 14200: {'lr': 0.0004916649796006263, 'samples': 2726400, 'steps': 14199, 'loss/train': 1.751441478729248} -08/30/2021 15:40:14 - INFO - __main__ - Step 14201: {'lr': 0.0004916636206817575, 'samples': 2726592, 'steps': 14200, 'loss/train': 1.7866759300231934} -08/30/2021 15:40:14 - INFO - __main__ - Step 14202: {'lr': 0.0004916622616539988, 'samples': 2726784, 'steps': 14201, 'loss/train': 1.6616225242614746} -08/30/2021 15:40:15 - INFO - __main__ - Step 14203: {'lr': 0.000491660902517351, 'samples': 2726976, 'steps': 14202, 'loss/train': 1.58908212184906} -08/30/2021 15:40:16 - INFO - __main__ - Step 14204: {'lr': 0.0004916595432718143, 'samples': 2727168, 'steps': 14203, 'loss/train': 1.4164177179336548} -08/30/2021 15:40:17 - INFO - __main__ - Step 14205: {'lr': 0.0004916581839173897, 'samples': 2727360, 'steps': 14204, 'loss/train': 1.7263103723526} -08/30/2021 15:40:17 - INFO - __main__ - Step 14206: {'lr': 0.0004916568244540776, 'samples': 2727552, 'steps': 14205, 'loss/train': 1.6879026889801025} -08/30/2021 15:40:17 - INFO - __main__ - Step 14207: {'lr': 0.0004916554648818787, 'samples': 2727744, 'steps': 14206, 'loss/train': 1.2350469827651978} -08/30/2021 15:40:18 - INFO - __main__ - Step 14208: {'lr': 0.0004916541052007936, 'samples': 2727936, 'steps': 14207, 'loss/train': 0.9809690713882446} -08/30/2021 15:40:20 - INFO - __main__ - Step 14209: {'lr': 0.0004916527454108227, 'samples': 2728128, 'steps': 14208, 'loss/train': 1.7045831680297852} -08/30/2021 15:40:20 - INFO - __main__ - Step 14210: {'lr': 0.0004916513855119669, 'samples': 2728320, 'steps': 14209, 'loss/train': 1.4296053647994995} -08/30/2021 15:40:21 - INFO - __main__ - Step 14211: {'lr': 0.0004916500255042268, 'samples': 2728512, 'steps': 14210, 'loss/train': 0.5579972267150879} -08/30/2021 15:40:21 - INFO - __main__ - Step 14212: {'lr': 0.0004916486653876029, 'samples': 2728704, 'steps': 14211, 'loss/train': 1.7848087549209595} -08/30/2021 15:40:21 - INFO - __main__ - Step 14213: {'lr': 0.0004916473051620958, 'samples': 2728896, 'steps': 14212, 'loss/train': 1.980293869972229} -08/30/2021 15:40:23 - INFO - __main__ - Step 14214: {'lr': 0.0004916459448277062, 'samples': 2729088, 'steps': 14213, 'loss/train': 1.9483768939971924} -08/30/2021 15:40:23 - INFO - __main__ - Step 14215: {'lr': 0.0004916445843844346, 'samples': 2729280, 'steps': 14214, 'loss/train': 1.2159225940704346} -08/30/2021 15:40:24 - INFO - __main__ - Step 14216: {'lr': 0.0004916432238322818, 'samples': 2729472, 'steps': 14215, 'loss/train': 0.19944612681865692} -08/30/2021 15:40:24 - INFO - __main__ - Step 14217: {'lr': 0.0004916418631712481, 'samples': 2729664, 'steps': 14216, 'loss/train': 2.559760570526123} -08/30/2021 15:40:24 - INFO - __main__ - Step 14218: {'lr': 0.0004916405024013344, 'samples': 2729856, 'steps': 14217, 'loss/train': 1.8995834589004517} -08/30/2021 15:40:27 - INFO - __main__ - Step 14219: {'lr': 0.0004916391415225413, 'samples': 2730048, 'steps': 14218, 'loss/train': 1.6571044921875} -08/30/2021 15:40:27 - INFO - __main__ - Step 14220: {'lr': 0.0004916377805348692, 'samples': 2730240, 'steps': 14219, 'loss/train': 1.1118005514144897} -08/30/2021 15:40:28 - INFO - __main__ - Step 14221: {'lr': 0.000491636419438319, 'samples': 2730432, 'steps': 14220, 'loss/train': 0.6850120425224304} -08/30/2021 15:40:28 - INFO - __main__ - Step 14222: {'lr': 0.000491635058232891, 'samples': 2730624, 'steps': 14221, 'loss/train': 0.6429716944694519} -08/30/2021 15:40:28 - INFO - __main__ - Step 14223: {'lr': 0.0004916336969185861, 'samples': 2730816, 'steps': 14222, 'loss/train': 0.6164513230323792} -08/30/2021 15:40:29 - INFO - __main__ - Step 14224: {'lr': 0.0004916323354954047, 'samples': 2731008, 'steps': 14223, 'loss/train': 1.9105051755905151} -08/30/2021 15:40:30 - INFO - __main__ - Step 14225: {'lr': 0.0004916309739633475, 'samples': 2731200, 'steps': 14224, 'loss/train': 1.7779122591018677} -08/30/2021 15:40:31 - INFO - __main__ - Step 14226: {'lr': 0.0004916296123224151, 'samples': 2731392, 'steps': 14225, 'loss/train': 1.6873564720153809} -08/30/2021 15:40:31 - INFO - __main__ - Step 14227: {'lr': 0.0004916282505726082, 'samples': 2731584, 'steps': 14226, 'loss/train': 1.4683501720428467} -08/30/2021 15:40:32 - INFO - __main__ - Step 14228: {'lr': 0.0004916268887139272, 'samples': 2731776, 'steps': 14227, 'loss/train': 0.12098906189203262} -08/30/2021 15:40:32 - INFO - __main__ - Step 14229: {'lr': 0.000491625526746373, 'samples': 2731968, 'steps': 14228, 'loss/train': 1.8777852058410645} -08/30/2021 15:40:33 - INFO - __main__ - Step 14230: {'lr': 0.000491624164669946, 'samples': 2732160, 'steps': 14229, 'loss/train': 1.4158958196640015} -08/30/2021 15:40:34 - INFO - __main__ - Step 14231: {'lr': 0.0004916228024846469, 'samples': 2732352, 'steps': 14230, 'loss/train': 0.4140443503856659} -08/30/2021 15:40:34 - INFO - __main__ - Step 14232: {'lr': 0.0004916214401904763, 'samples': 2732544, 'steps': 14231, 'loss/train': 1.8795267343521118} -08/30/2021 15:40:34 - INFO - __main__ - Step 14233: {'lr': 0.0004916200777874348, 'samples': 2732736, 'steps': 14232, 'loss/train': 1.7342122793197632} -08/30/2021 15:40:35 - INFO - __main__ - Step 14234: {'lr': 0.000491618715275523, 'samples': 2732928, 'steps': 14233, 'loss/train': 1.5589019060134888} -08/30/2021 15:40:37 - INFO - __main__ - Step 14235: {'lr': 0.0004916173526547415, 'samples': 2733120, 'steps': 14234, 'loss/train': 1.8375165462493896} -08/30/2021 15:40:37 - INFO - __main__ - Step 14236: {'lr': 0.000491615989925091, 'samples': 2733312, 'steps': 14235, 'loss/train': 1.63279128074646} -08/30/2021 15:40:37 - INFO - __main__ - Step 14237: {'lr': 0.0004916146270865721, 'samples': 2733504, 'steps': 14236, 'loss/train': 0.2016444057226181} -08/30/2021 15:40:38 - INFO - __main__ - Step 14238: {'lr': 0.0004916132641391854, 'samples': 2733696, 'steps': 14237, 'loss/train': 1.4945404529571533} -08/30/2021 15:40:38 - INFO - __main__ - Step 14239: {'lr': 0.0004916119010829314, 'samples': 2733888, 'steps': 14238, 'loss/train': 1.5928460359573364} -08/30/2021 15:40:40 - INFO - __main__ - Step 14240: {'lr': 0.0004916105379178108, 'samples': 2734080, 'steps': 14239, 'loss/train': 1.9532207250595093} -08/30/2021 15:40:40 - INFO - __main__ - Step 14241: {'lr': 0.0004916091746438243, 'samples': 2734272, 'steps': 14240, 'loss/train': 2.2842166423797607} -08/30/2021 15:40:40 - INFO - __main__ - Step 14242: {'lr': 0.0004916078112609724, 'samples': 2734464, 'steps': 14241, 'loss/train': 1.407718300819397} -08/30/2021 15:40:41 - INFO - __main__ - Step 14243: {'lr': 0.0004916064477692557, 'samples': 2734656, 'steps': 14242, 'loss/train': 1.682555913925171} -08/30/2021 15:40:41 - INFO - __main__ - Step 14244: {'lr': 0.0004916050841686748, 'samples': 2734848, 'steps': 14243, 'loss/train': 1.3194701671600342} -08/30/2021 15:40:43 - INFO - __main__ - Step 14245: {'lr': 0.0004916037204592306, 'samples': 2735040, 'steps': 14244, 'loss/train': 1.6163827180862427} -08/30/2021 15:40:43 - INFO - __main__ - Step 14246: {'lr': 0.0004916023566409233, 'samples': 2735232, 'steps': 14245, 'loss/train': 1.799128770828247} -08/30/2021 15:40:43 - INFO - __main__ - Step 14247: {'lr': 0.0004916009927137538, 'samples': 2735424, 'steps': 14246, 'loss/train': 1.4250456094741821} -08/30/2021 15:40:44 - INFO - __main__ - Step 14248: {'lr': 0.0004915996286777226, 'samples': 2735616, 'steps': 14247, 'loss/train': 1.5041444301605225} -08/30/2021 15:40:44 - INFO - __main__ - Step 14249: {'lr': 0.0004915982645328304, 'samples': 2735808, 'steps': 14248, 'loss/train': 1.6152318716049194} -08/30/2021 15:40:44 - INFO - __main__ - Step 14250: {'lr': 0.0004915969002790777, 'samples': 2736000, 'steps': 14249, 'loss/train': 2.0096380710601807} -08/30/2021 15:40:46 - INFO - __main__ - Step 14251: {'lr': 0.0004915955359164651, 'samples': 2736192, 'steps': 14250, 'loss/train': 1.9248408079147339} -08/30/2021 15:40:46 - INFO - __main__ - Step 14252: {'lr': 0.0004915941714449933, 'samples': 2736384, 'steps': 14251, 'loss/train': 0.09167566150426865} -08/30/2021 15:40:47 - INFO - __main__ - Step 14253: {'lr': 0.000491592806864663, 'samples': 2736576, 'steps': 14252, 'loss/train': 2.085392475128174} -08/30/2021 15:40:47 - INFO - __main__ - Step 14254: {'lr': 0.0004915914421754746, 'samples': 2736768, 'steps': 14253, 'loss/train': 1.867599606513977} -08/30/2021 15:40:48 - INFO - __main__ - Step 14255: {'lr': 0.0004915900773774289, 'samples': 2736960, 'steps': 14254, 'loss/train': 1.4897617101669312} -08/30/2021 15:40:49 - INFO - __main__ - Step 14256: {'lr': 0.0004915887124705263, 'samples': 2737152, 'steps': 14255, 'loss/train': 1.184784173965454} -08/30/2021 15:40:49 - INFO - __main__ - Step 14257: {'lr': 0.0004915873474547677, 'samples': 2737344, 'steps': 14256, 'loss/train': 1.953404426574707} -08/30/2021 15:40:50 - INFO - __main__ - Step 14258: {'lr': 0.0004915859823301535, 'samples': 2737536, 'steps': 14257, 'loss/train': 1.5674388408660889} -08/30/2021 15:40:50 - INFO - __main__ - Step 14259: {'lr': 0.0004915846170966845, 'samples': 2737728, 'steps': 14258, 'loss/train': 1.546112060546875} -08/30/2021 15:40:51 - INFO - __main__ - Step 14260: {'lr': 0.000491583251754361, 'samples': 2737920, 'steps': 14259, 'loss/train': 1.146052360534668} -08/30/2021 15:40:52 - INFO - __main__ - Step 14261: {'lr': 0.0004915818863031839, 'samples': 2738112, 'steps': 14260, 'loss/train': 1.3799189329147339} -08/30/2021 15:40:52 - INFO - __main__ - Step 14262: {'lr': 0.0004915805207431537, 'samples': 2738304, 'steps': 14261, 'loss/train': 1.8515392541885376} -08/30/2021 15:40:53 - INFO - __main__ - Step 14263: {'lr': 0.0004915791550742712, 'samples': 2738496, 'steps': 14262, 'loss/train': 1.4869722127914429} -08/30/2021 15:40:53 - INFO - __main__ - Step 14264: {'lr': 0.0004915777892965368, 'samples': 2738688, 'steps': 14263, 'loss/train': 0.8241997957229614} -08/30/2021 15:40:53 - INFO - __main__ - Step 14265: {'lr': 0.0004915764234099511, 'samples': 2738880, 'steps': 14264, 'loss/train': 1.3659237623214722} -08/30/2021 15:40:55 - INFO - __main__ - Step 14266: {'lr': 0.0004915750574145148, 'samples': 2739072, 'steps': 14265, 'loss/train': 1.5381276607513428} -08/30/2021 15:40:55 - INFO - __main__ - Step 14267: {'lr': 0.0004915736913102285, 'samples': 2739264, 'steps': 14266, 'loss/train': 1.520689845085144} -08/30/2021 15:40:56 - INFO - __main__ - Step 14268: {'lr': 0.0004915723250970928, 'samples': 2739456, 'steps': 14267, 'loss/train': 2.185713529586792} -08/30/2021 15:40:56 - INFO - __main__ - Step 14269: {'lr': 0.0004915709587751084, 'samples': 2739648, 'steps': 14268, 'loss/train': 11.970024108886719} -08/30/2021 15:40:57 - INFO - __main__ - Step 14270: {'lr': 0.0004915695923442759, 'samples': 2739840, 'steps': 14269, 'loss/train': 0.8003661632537842} -08/30/2021 15:40:59 - INFO - __main__ - Step 14271: {'lr': 0.0004915682258045958, 'samples': 2740032, 'steps': 14270, 'loss/train': 1.5905641317367554} -08/30/2021 15:40:59 - INFO - __main__ - Step 14272: {'lr': 0.0004915668591560688, 'samples': 2740224, 'steps': 14271, 'loss/train': 2.2194135189056396} -08/30/2021 15:40:59 - INFO - __main__ - Step 14273: {'lr': 0.0004915654923986955, 'samples': 2740416, 'steps': 14272, 'loss/train': 1.8407152891159058} -08/30/2021 15:41:00 - INFO - __main__ - Step 14274: {'lr': 0.0004915641255324764, 'samples': 2740608, 'steps': 14273, 'loss/train': 1.638126015663147} -08/30/2021 15:41:00 - INFO - __main__ - Step 14275: {'lr': 0.0004915627585574124, 'samples': 2740800, 'steps': 14274, 'loss/train': 1.9308607578277588} -08/30/2021 15:41:01 - INFO - __main__ - Step 14276: {'lr': 0.0004915613914735038, 'samples': 2740992, 'steps': 14275, 'loss/train': 1.8504908084869385} -08/30/2021 15:41:02 - INFO - __main__ - Step 14277: {'lr': 0.0004915600242807516, 'samples': 2741184, 'steps': 14276, 'loss/train': 0.22727176547050476} -08/30/2021 15:41:02 - INFO - __main__ - Step 14278: {'lr': 0.000491558656979156, 'samples': 2741376, 'steps': 14277, 'loss/train': 5.502272129058838} -08/30/2021 15:41:03 - INFO - __main__ - Step 14279: {'lr': 0.0004915572895687179, 'samples': 2741568, 'steps': 14278, 'loss/train': 1.881693720817566} -08/30/2021 15:41:03 - INFO - __main__ - Step 14280: {'lr': 0.0004915559220494376, 'samples': 2741760, 'steps': 14279, 'loss/train': 1.9186737537384033} -08/30/2021 15:41:03 - INFO - __main__ - Step 14281: {'lr': 0.0004915545544213161, 'samples': 2741952, 'steps': 14280, 'loss/train': 1.2309820652008057} -08/30/2021 15:41:05 - INFO - __main__ - Step 14282: {'lr': 0.0004915531866843539, 'samples': 2742144, 'steps': 14281, 'loss/train': 2.065537452697754} -08/30/2021 15:41:06 - INFO - __main__ - Step 14283: {'lr': 0.0004915518188385514, 'samples': 2742336, 'steps': 14282, 'loss/train': 1.8233487606048584} -08/30/2021 15:41:06 - INFO - __main__ - Step 14284: {'lr': 0.0004915504508839095, 'samples': 2742528, 'steps': 14283, 'loss/train': 1.5087192058563232} -08/30/2021 15:41:06 - INFO - __main__ - Step 14285: {'lr': 0.0004915490828204287, 'samples': 2742720, 'steps': 14284, 'loss/train': 1.539300560951233} -08/30/2021 15:41:07 - INFO - __main__ - Step 14286: {'lr': 0.0004915477146481095, 'samples': 2742912, 'steps': 14285, 'loss/train': 1.836625576019287} -08/30/2021 15:41:08 - INFO - __main__ - Step 14287: {'lr': 0.0004915463463669527, 'samples': 2743104, 'steps': 14286, 'loss/train': 0.992317795753479} -08/30/2021 15:41:09 - INFO - __main__ - Step 14288: {'lr': 0.0004915449779769589, 'samples': 2743296, 'steps': 14287, 'loss/train': 1.8336970806121826} -08/30/2021 15:41:09 - INFO - __main__ - Step 14289: {'lr': 0.0004915436094781285, 'samples': 2743488, 'steps': 14288, 'loss/train': 2.112403392791748} -08/30/2021 15:41:09 - INFO - __main__ - Step 14290: {'lr': 0.0004915422408704624, 'samples': 2743680, 'steps': 14289, 'loss/train': 1.8381317853927612} -08/30/2021 15:41:10 - INFO - __main__ - Step 14291: {'lr': 0.0004915408721539612, 'samples': 2743872, 'steps': 14290, 'loss/train': 1.4352819919586182} -08/30/2021 15:41:10 - INFO - __main__ - Step 14292: {'lr': 0.0004915395033286251, 'samples': 2744064, 'steps': 14291, 'loss/train': 1.2204521894454956} -08/30/2021 15:41:12 - INFO - __main__ - Step 14293: {'lr': 0.0004915381343944552, 'samples': 2744256, 'steps': 14292, 'loss/train': 1.5716047286987305} -08/30/2021 15:41:12 - INFO - __main__ - Step 14294: {'lr': 0.0004915367653514521, 'samples': 2744448, 'steps': 14293, 'loss/train': 1.7927772998809814} -08/30/2021 15:41:12 - INFO - __main__ - Step 14295: {'lr': 0.0004915353961996161, 'samples': 2744640, 'steps': 14294, 'loss/train': 2.267578125} -08/30/2021 15:41:13 - INFO - __main__ - Step 14296: {'lr': 0.000491534026938948, 'samples': 2744832, 'steps': 14295, 'loss/train': 1.5962440967559814} -08/30/2021 15:41:13 - INFO - __main__ - Step 14297: {'lr': 0.0004915326575694484, 'samples': 2745024, 'steps': 14296, 'loss/train': 1.5142970085144043} -08/30/2021 15:41:15 - INFO - __main__ - Step 14298: {'lr': 0.0004915312880911178, 'samples': 2745216, 'steps': 14297, 'loss/train': 1.996443748474121} -08/30/2021 15:41:15 - INFO - __main__ - Step 14299: {'lr': 0.000491529918503957, 'samples': 2745408, 'steps': 14298, 'loss/train': 1.968015432357788} -08/30/2021 15:41:15 - INFO - __main__ - Step 14300: {'lr': 0.0004915285488079666, 'samples': 2745600, 'steps': 14299, 'loss/train': 1.713179349899292} -08/30/2021 15:41:16 - INFO - __main__ - Step 14301: {'lr': 0.0004915271790031471, 'samples': 2745792, 'steps': 14300, 'loss/train': 2.0385515689849854} -08/30/2021 15:41:16 - INFO - __main__ - Step 14302: {'lr': 0.0004915258090894993, 'samples': 2745984, 'steps': 14301, 'loss/train': 1.9879531860351562} -08/30/2021 15:41:17 - INFO - __main__ - Step 14303: {'lr': 0.0004915244390670236, 'samples': 2746176, 'steps': 14302, 'loss/train': 1.8816629648208618} -08/30/2021 15:41:18 - INFO - __main__ - Step 14304: {'lr': 0.0004915230689357206, 'samples': 2746368, 'steps': 14303, 'loss/train': 2.0318562984466553} -08/30/2021 15:41:18 - INFO - __main__ - Step 14305: {'lr': 0.0004915216986955913, 'samples': 2746560, 'steps': 14304, 'loss/train': 2.043475389480591} -08/30/2021 15:41:19 - INFO - __main__ - Step 14306: {'lr': 0.0004915203283466359, 'samples': 2746752, 'steps': 14305, 'loss/train': 1.5072704553604126} -08/30/2021 15:41:19 - INFO - __main__ - Step 14307: {'lr': 0.0004915189578888552, 'samples': 2746944, 'steps': 14306, 'loss/train': 1.5600268840789795} -08/30/2021 15:41:21 - INFO - __main__ - Step 14308: {'lr': 0.0004915175873222497, 'samples': 2747136, 'steps': 14307, 'loss/train': 1.9318269491195679} -08/30/2021 15:41:21 - INFO - __main__ - Step 14309: {'lr': 0.0004915162166468201, 'samples': 2747328, 'steps': 14308, 'loss/train': 1.7547612190246582} -08/30/2021 15:41:22 - INFO - __main__ - Step 14310: {'lr': 0.0004915148458625671, 'samples': 2747520, 'steps': 14309, 'loss/train': 1.6511695384979248} -08/30/2021 15:41:22 - INFO - __main__ - Step 14311: {'lr': 0.0004915134749694912, 'samples': 2747712, 'steps': 14310, 'loss/train': 1.975413203239441} -08/30/2021 15:41:22 - INFO - __main__ - Step 14312: {'lr': 0.000491512103967593, 'samples': 2747904, 'steps': 14311, 'loss/train': 1.1436662673950195} -08/30/2021 15:41:23 - INFO - __main__ - Step 14313: {'lr': 0.0004915107328568733, 'samples': 2748096, 'steps': 14312, 'loss/train': 0.17707191407680511} -08/30/2021 15:41:24 - INFO - __main__ - Step 14314: {'lr': 0.0004915093616373326, 'samples': 2748288, 'steps': 14313, 'loss/train': 0.571360170841217} -08/30/2021 15:41:25 - INFO - __main__ - Step 14315: {'lr': 0.0004915079903089714, 'samples': 2748480, 'steps': 14314, 'loss/train': 1.20900559425354} -08/30/2021 15:41:25 - INFO - __main__ - Step 14316: {'lr': 0.0004915066188717905, 'samples': 2748672, 'steps': 14315, 'loss/train': 1.5505168437957764} -08/30/2021 15:41:26 - INFO - __main__ - Step 14317: {'lr': 0.0004915052473257904, 'samples': 2748864, 'steps': 14316, 'loss/train': 1.903862476348877} -08/30/2021 15:41:26 - INFO - __main__ - Step 14318: {'lr': 0.0004915038756709717, 'samples': 2749056, 'steps': 14317, 'loss/train': 1.8158437013626099} -08/30/2021 15:41:27 - INFO - __main__ - Step 14319: {'lr': 0.0004915025039073352, 'samples': 2749248, 'steps': 14318, 'loss/train': 1.8041901588439941} -08/30/2021 15:41:28 - INFO - __main__ - Step 14320: {'lr': 0.0004915011320348814, 'samples': 2749440, 'steps': 14319, 'loss/train': 2.1272006034851074} -08/30/2021 15:41:28 - INFO - __main__ - Step 14321: {'lr': 0.0004914997600536108, 'samples': 2749632, 'steps': 14320, 'loss/train': 1.5176854133605957} -08/30/2021 15:41:29 - INFO - __main__ - Step 14322: {'lr': 0.0004914983879635242, 'samples': 2749824, 'steps': 14321, 'loss/train': 1.4800630807876587} -08/30/2021 15:41:29 - INFO - __main__ - Step 14323: {'lr': 0.0004914970157646222, 'samples': 2750016, 'steps': 14322, 'loss/train': 1.5841407775878906} -08/30/2021 15:41:31 - INFO - __main__ - Step 14324: {'lr': 0.0004914956434569054, 'samples': 2750208, 'steps': 14323, 'loss/train': 1.765442967414856} -08/30/2021 15:41:31 - INFO - __main__ - Step 14325: {'lr': 0.0004914942710403743, 'samples': 2750400, 'steps': 14324, 'loss/train': 1.7265383005142212} -08/30/2021 15:41:32 - INFO - __main__ - Step 14326: {'lr': 0.0004914928985150296, 'samples': 2750592, 'steps': 14325, 'loss/train': 1.7524030208587646} -08/30/2021 15:41:32 - INFO - __main__ - Step 14327: {'lr': 0.0004914915258808719, 'samples': 2750784, 'steps': 14326, 'loss/train': 2.004016160964966} -08/30/2021 15:41:32 - INFO - __main__ - Step 14328: {'lr': 0.0004914901531379019, 'samples': 2750976, 'steps': 14327, 'loss/train': 1.2179161310195923} -08/30/2021 15:41:34 - INFO - __main__ - Step 14329: {'lr': 0.0004914887802861201, 'samples': 2751168, 'steps': 14328, 'loss/train': 1.6710330247879028} -08/30/2021 15:41:34 - INFO - __main__ - Step 14330: {'lr': 0.0004914874073255273, 'samples': 2751360, 'steps': 14329, 'loss/train': 2.0541014671325684} -08/30/2021 15:41:35 - INFO - __main__ - Step 14331: {'lr': 0.0004914860342561239, 'samples': 2751552, 'steps': 14330, 'loss/train': 2.1631600856781006} -08/30/2021 15:41:35 - INFO - __main__ - Step 14332: {'lr': 0.0004914846610779107, 'samples': 2751744, 'steps': 14331, 'loss/train': 1.567399024963379} -08/30/2021 15:41:35 - INFO - __main__ - Step 14333: {'lr': 0.0004914832877908881, 'samples': 2751936, 'steps': 14332, 'loss/train': 2.012059211730957} -08/30/2021 15:41:37 - INFO - __main__ - Step 14334: {'lr': 0.0004914819143950571, 'samples': 2752128, 'steps': 14333, 'loss/train': 1.7972086668014526} -08/30/2021 15:41:37 - INFO - __main__ - Step 14335: {'lr': 0.0004914805408904179, 'samples': 2752320, 'steps': 14334, 'loss/train': 1.19582998752594} -08/30/2021 15:41:38 - INFO - __main__ - Step 14336: {'lr': 0.0004914791672769713, 'samples': 2752512, 'steps': 14335, 'loss/train': 1.9483637809753418} -08/30/2021 15:41:38 - INFO - __main__ - Step 14337: {'lr': 0.000491477793554718, 'samples': 2752704, 'steps': 14336, 'loss/train': 1.8428703546524048} -08/30/2021 15:41:38 - INFO - __main__ - Step 14338: {'lr': 0.0004914764197236584, 'samples': 2752896, 'steps': 14337, 'loss/train': 1.7327208518981934} -08/30/2021 15:41:39 - INFO - __main__ - Step 14339: {'lr': 0.0004914750457837933, 'samples': 2753088, 'steps': 14338, 'loss/train': 1.4848452806472778} -08/30/2021 15:41:40 - INFO - __main__ - Step 14340: {'lr': 0.0004914736717351233, 'samples': 2753280, 'steps': 14339, 'loss/train': 1.6279864311218262} -08/30/2021 15:41:41 - INFO - __main__ - Step 14341: {'lr': 0.000491472297577649, 'samples': 2753472, 'steps': 14340, 'loss/train': 1.8970388174057007} -08/30/2021 15:41:41 - INFO - __main__ - Step 14342: {'lr': 0.000491470923311371, 'samples': 2753664, 'steps': 14341, 'loss/train': 1.8129960298538208} -08/30/2021 15:41:41 - INFO - __main__ - Step 14343: {'lr': 0.0004914695489362899, 'samples': 2753856, 'steps': 14342, 'loss/train': 1.3674474954605103} -08/30/2021 15:41:42 - INFO - __main__ - Step 14344: {'lr': 0.0004914681744524064, 'samples': 2754048, 'steps': 14343, 'loss/train': 1.4709528684616089} -08/30/2021 15:41:43 - INFO - __main__ - Step 14345: {'lr': 0.0004914667998597211, 'samples': 2754240, 'steps': 14344, 'loss/train': 1.3310235738754272} -08/30/2021 15:41:44 - INFO - __main__ - Step 14346: {'lr': 0.0004914654251582344, 'samples': 2754432, 'steps': 14345, 'loss/train': 2.2530410289764404} -08/30/2021 15:41:44 - INFO - __main__ - Step 14347: {'lr': 0.0004914640503479473, 'samples': 2754624, 'steps': 14346, 'loss/train': 1.4643199443817139} -08/30/2021 15:41:45 - INFO - __main__ - Step 14348: {'lr': 0.0004914626754288601, 'samples': 2754816, 'steps': 14347, 'loss/train': 1.0527572631835938} -08/30/2021 15:41:45 - INFO - __main__ - Step 14349: {'lr': 0.0004914613004009736, 'samples': 2755008, 'steps': 14348, 'loss/train': 1.3456844091415405} -08/30/2021 15:41:46 - INFO - __main__ - Step 14350: {'lr': 0.0004914599252642884, 'samples': 2755200, 'steps': 14349, 'loss/train': 1.5882034301757812} -08/30/2021 15:41:47 - INFO - __main__ - Step 14351: {'lr': 0.000491458550018805, 'samples': 2755392, 'steps': 14350, 'loss/train': 1.6092170476913452} -08/30/2021 15:41:47 - INFO - __main__ - Step 14352: {'lr': 0.0004914571746645242, 'samples': 2755584, 'steps': 14351, 'loss/train': 1.8229730129241943} -08/30/2021 15:41:47 - INFO - __main__ - Step 14353: {'lr': 0.0004914557992014465, 'samples': 2755776, 'steps': 14352, 'loss/train': 1.7088993787765503} -08/30/2021 15:41:48 - INFO - __main__ - Step 14354: {'lr': 0.0004914544236295725, 'samples': 2755968, 'steps': 14353, 'loss/train': 1.7496505975723267} -08/30/2021 15:41:49 - INFO - __main__ - Step 14355: {'lr': 0.0004914530479489029, 'samples': 2756160, 'steps': 14354, 'loss/train': 2.1107027530670166} -08/30/2021 15:41:50 - INFO - __main__ - Step 14356: {'lr': 0.0004914516721594382, 'samples': 2756352, 'steps': 14355, 'loss/train': 1.5025612115859985} -08/30/2021 15:41:50 - INFO - __main__ - Step 14357: {'lr': 0.0004914502962611792, 'samples': 2756544, 'steps': 14356, 'loss/train': 2.0511035919189453} -08/30/2021 15:41:51 - INFO - __main__ - Step 14358: {'lr': 0.0004914489202541264, 'samples': 2756736, 'steps': 14357, 'loss/train': 1.1436680555343628} -08/30/2021 15:41:51 - INFO - __main__ - Step 14359: {'lr': 0.0004914475441382804, 'samples': 2756928, 'steps': 14358, 'loss/train': 1.7909042835235596} -08/30/2021 15:41:52 - INFO - __main__ - Step 14360: {'lr': 0.0004914461679136419, 'samples': 2757120, 'steps': 14359, 'loss/train': 2.647141695022583} -08/30/2021 15:41:53 - INFO - __main__ - Step 14361: {'lr': 0.0004914447915802115, 'samples': 2757312, 'steps': 14360, 'loss/train': 1.8089959621429443} -08/30/2021 15:41:53 - INFO - __main__ - Step 14362: {'lr': 0.0004914434151379898, 'samples': 2757504, 'steps': 14361, 'loss/train': 1.717605471611023} -08/30/2021 15:41:54 - INFO - __main__ - Step 14363: {'lr': 0.0004914420385869773, 'samples': 2757696, 'steps': 14362, 'loss/train': 1.586990475654602} -08/30/2021 15:41:54 - INFO - __main__ - Step 14364: {'lr': 0.0004914406619271749, 'samples': 2757888, 'steps': 14363, 'loss/train': 1.747564435005188} -08/30/2021 15:41:54 - INFO - __main__ - Step 14365: {'lr': 0.0004914392851585829, 'samples': 2758080, 'steps': 14364, 'loss/train': 1.7078890800476074} -08/30/2021 15:41:56 - INFO - __main__ - Step 14366: {'lr': 0.0004914379082812023, 'samples': 2758272, 'steps': 14365, 'loss/train': 1.7765601873397827} -08/30/2021 15:41:56 - INFO - __main__ - Step 14367: {'lr': 0.0004914365312950333, 'samples': 2758464, 'steps': 14366, 'loss/train': 1.6005475521087646} -08/30/2021 15:41:56 - INFO - __main__ - Step 14368: {'lr': 0.0004914351542000768, 'samples': 2758656, 'steps': 14367, 'loss/train': 1.6172153949737549} -08/30/2021 15:41:57 - INFO - __main__ - Step 14369: {'lr': 0.0004914337769963334, 'samples': 2758848, 'steps': 14368, 'loss/train': 1.952616810798645} -08/30/2021 15:41:57 - INFO - __main__ - Step 14370: {'lr': 0.0004914323996838036, 'samples': 2759040, 'steps': 14369, 'loss/train': 1.992571234703064} -08/30/2021 15:41:59 - INFO - __main__ - Step 14371: {'lr': 0.0004914310222624881, 'samples': 2759232, 'steps': 14370, 'loss/train': 2.0507609844207764} -08/30/2021 15:41:59 - INFO - __main__ - Step 14372: {'lr': 0.0004914296447323875, 'samples': 2759424, 'steps': 14371, 'loss/train': 1.6695152521133423} -08/30/2021 15:42:00 - INFO - __main__ - Step 14373: {'lr': 0.0004914282670935025, 'samples': 2759616, 'steps': 14372, 'loss/train': 1.9530751705169678} -08/30/2021 15:42:00 - INFO - __main__ - Step 14374: {'lr': 0.0004914268893458336, 'samples': 2759808, 'steps': 14373, 'loss/train': 1.5470737218856812} -08/30/2021 15:42:00 - INFO - __main__ - Step 14375: {'lr': 0.0004914255114893814, 'samples': 2760000, 'steps': 14374, 'loss/train': 1.6123696565628052} -08/30/2021 15:42:02 - INFO - __main__ - Step 14376: {'lr': 0.0004914241335241467, 'samples': 2760192, 'steps': 14375, 'loss/train': 1.5364497900009155} -08/30/2021 15:42:02 - INFO - __main__ - Step 14377: {'lr': 0.0004914227554501299, 'samples': 2760384, 'steps': 14376, 'loss/train': 1.3919613361358643} -08/30/2021 15:42:03 - INFO - __main__ - Step 14378: {'lr': 0.0004914213772673319, 'samples': 2760576, 'steps': 14377, 'loss/train': 1.6869041919708252} -08/30/2021 15:42:03 - INFO - __main__ - Step 14379: {'lr': 0.0004914199989757529, 'samples': 2760768, 'steps': 14378, 'loss/train': 1.5844998359680176} -08/30/2021 15:42:04 - INFO - __main__ - Step 14380: {'lr': 0.000491418620575394, 'samples': 2760960, 'steps': 14379, 'loss/train': 1.8117092847824097} -08/30/2021 15:42:04 - INFO - __main__ - Step 14381: {'lr': 0.0004914172420662556, 'samples': 2761152, 'steps': 14380, 'loss/train': 1.4020788669586182} -08/30/2021 15:42:06 - INFO - __main__ - Step 14382: {'lr': 0.0004914158634483381, 'samples': 2761344, 'steps': 14381, 'loss/train': 6.557975769042969} -08/30/2021 15:42:07 - INFO - __main__ - Step 14383: {'lr': 0.0004914144847216425, 'samples': 2761536, 'steps': 14382, 'loss/train': 1.495499849319458} -08/30/2021 15:42:07 - INFO - __main__ - Step 14384: {'lr': 0.0004914131058861693, 'samples': 2761728, 'steps': 14383, 'loss/train': 1.9853951930999756} -08/30/2021 15:42:07 - INFO - __main__ - Step 14385: {'lr': 0.000491411726941919, 'samples': 2761920, 'steps': 14384, 'loss/train': 1.6249979734420776} -08/30/2021 15:42:08 - INFO - __main__ - Step 14386: {'lr': 0.0004914103478888922, 'samples': 2762112, 'steps': 14385, 'loss/train': 1.6414304971694946} -08/30/2021 15:42:09 - INFO - __main__ - Step 14387: {'lr': 0.0004914089687270898, 'samples': 2762304, 'steps': 14386, 'loss/train': 1.6743136644363403} -08/30/2021 15:42:10 - INFO - __main__ - Step 14388: {'lr': 0.0004914075894565122, 'samples': 2762496, 'steps': 14387, 'loss/train': 2.039595603942871} -08/30/2021 15:42:10 - INFO - __main__ - Step 14389: {'lr': 0.00049140621007716, 'samples': 2762688, 'steps': 14388, 'loss/train': 0.9971103072166443} -08/30/2021 15:42:10 - INFO - __main__ - Step 14390: {'lr': 0.0004914048305890339, 'samples': 2762880, 'steps': 14389, 'loss/train': 0.6940599679946899} -08/30/2021 15:42:11 - INFO - __main__ - Step 14391: {'lr': 0.0004914034509921345, 'samples': 2763072, 'steps': 14390, 'loss/train': 1.2802982330322266} -08/30/2021 15:42:12 - INFO - __main__ - Step 14392: {'lr': 0.0004914020712864626, 'samples': 2763264, 'steps': 14391, 'loss/train': 1.6955795288085938} -08/30/2021 15:42:12 - INFO - __main__ - Step 14393: {'lr': 0.0004914006914720184, 'samples': 2763456, 'steps': 14392, 'loss/train': 1.7631808519363403} -08/30/2021 15:42:13 - INFO - __main__ - Step 14394: {'lr': 0.0004913993115488029, 'samples': 2763648, 'steps': 14393, 'loss/train': 1.2318246364593506} -08/30/2021 15:42:13 - INFO - __main__ - Step 14395: {'lr': 0.0004913979315168167, 'samples': 2763840, 'steps': 14394, 'loss/train': 1.6404566764831543} -08/30/2021 15:42:13 - INFO - __main__ - Step 14396: {'lr': 0.0004913965513760601, 'samples': 2764032, 'steps': 14395, 'loss/train': 1.5663487911224365} -08/30/2021 15:42:15 - INFO - __main__ - Step 14397: {'lr': 0.0004913951711265341, 'samples': 2764224, 'steps': 14396, 'loss/train': 1.854474425315857} -08/30/2021 15:42:15 - INFO - __main__ - Step 14398: {'lr': 0.0004913937907682391, 'samples': 2764416, 'steps': 14397, 'loss/train': 2.02028751373291} -08/30/2021 15:42:16 - INFO - __main__ - Step 14399: {'lr': 0.0004913924103011757, 'samples': 2764608, 'steps': 14398, 'loss/train': 1.9994747638702393} -08/30/2021 15:42:16 - INFO - __main__ - Step 14400: {'lr': 0.0004913910297253448, 'samples': 2764800, 'steps': 14399, 'loss/train': 2.0656163692474365} -08/30/2021 15:42:16 - INFO - __main__ - Step 14401: {'lr': 0.0004913896490407467, 'samples': 2764992, 'steps': 14400, 'loss/train': 2.1407995223999023} -08/30/2021 15:42:18 - INFO - __main__ - Step 14402: {'lr': 0.0004913882682473821, 'samples': 2765184, 'steps': 14401, 'loss/train': 1.5955979824066162} -08/30/2021 15:42:18 - INFO - __main__ - Step 14403: {'lr': 0.0004913868873452519, 'samples': 2765376, 'steps': 14402, 'loss/train': 1.9759739637374878} -08/30/2021 15:42:19 - INFO - __main__ - Step 14404: {'lr': 0.0004913855063343563, 'samples': 2765568, 'steps': 14403, 'loss/train': 1.3353103399276733} -08/30/2021 15:42:19 - INFO - __main__ - Step 14405: {'lr': 0.0004913841252146961, 'samples': 2765760, 'steps': 14404, 'loss/train': 1.6983386278152466} -08/30/2021 15:42:20 - INFO - __main__ - Step 14406: {'lr': 0.000491382743986272, 'samples': 2765952, 'steps': 14405, 'loss/train': 1.600548505783081} -08/30/2021 15:42:20 - INFO - __main__ - Step 14407: {'lr': 0.0004913813626490845, 'samples': 2766144, 'steps': 14406, 'loss/train': 1.7812741994857788} -08/30/2021 15:42:21 - INFO - __main__ - Step 14408: {'lr': 0.0004913799812031343, 'samples': 2766336, 'steps': 14407, 'loss/train': 1.9552769660949707} -08/30/2021 15:42:22 - INFO - __main__ - Step 14409: {'lr': 0.0004913785996484221, 'samples': 2766528, 'steps': 14408, 'loss/train': 1.6603641510009766} -08/30/2021 15:42:22 - INFO - __main__ - Step 14410: {'lr': 0.0004913772179849483, 'samples': 2766720, 'steps': 14409, 'loss/train': 1.7005271911621094} -08/30/2021 15:42:22 - INFO - __main__ - Step 14411: {'lr': 0.0004913758362127137, 'samples': 2766912, 'steps': 14410, 'loss/train': 2.074171543121338} -08/30/2021 15:42:23 - INFO - __main__ - Step 14412: {'lr': 0.0004913744543317189, 'samples': 2767104, 'steps': 14411, 'loss/train': 1.8987823724746704} -08/30/2021 15:42:24 - INFO - __main__ - Step 14413: {'lr': 0.0004913730723419645, 'samples': 2767296, 'steps': 14412, 'loss/train': 1.542839527130127} -08/30/2021 15:42:25 - INFO - __main__ - Step 14414: {'lr': 0.000491371690243451, 'samples': 2767488, 'steps': 14413, 'loss/train': 1.8802578449249268} -08/30/2021 15:42:25 - INFO - __main__ - Step 14415: {'lr': 0.0004913703080361793, 'samples': 2767680, 'steps': 14414, 'loss/train': 1.681760549545288} -08/30/2021 15:42:25 - INFO - __main__ - Step 14416: {'lr': 0.0004913689257201499, 'samples': 2767872, 'steps': 14415, 'loss/train': 1.4980852603912354} -08/30/2021 15:42:26 - INFO - __main__ - Step 14417: {'lr': 0.0004913675432953633, 'samples': 2768064, 'steps': 14416, 'loss/train': 1.130185604095459} -08/30/2021 15:42:26 - INFO - __main__ - Step 14418: {'lr': 0.0004913661607618202, 'samples': 2768256, 'steps': 14417, 'loss/train': 1.6542071104049683} -08/30/2021 15:42:28 - INFO - __main__ - Step 14419: {'lr': 0.0004913647781195212, 'samples': 2768448, 'steps': 14418, 'loss/train': 1.6528840065002441} -08/30/2021 15:42:28 - INFO - __main__ - Step 14420: {'lr': 0.000491363395368467, 'samples': 2768640, 'steps': 14419, 'loss/train': 1.2821459770202637} -08/30/2021 15:42:29 - INFO - __main__ - Step 14421: {'lr': 0.0004913620125086581, 'samples': 2768832, 'steps': 14420, 'loss/train': 2.111851453781128} -08/30/2021 15:42:29 - INFO - __main__ - Step 14422: {'lr': 0.0004913606295400953, 'samples': 2769024, 'steps': 14421, 'loss/train': 2.1326797008514404} -08/30/2021 15:42:29 - INFO - __main__ - Step 14423: {'lr': 0.000491359246462779, 'samples': 2769216, 'steps': 14422, 'loss/train': 2.0644469261169434} -08/30/2021 15:42:31 - INFO - __main__ - Step 14424: {'lr': 0.0004913578632767101, 'samples': 2769408, 'steps': 14423, 'loss/train': 1.1016974449157715} -08/30/2021 15:42:31 - INFO - __main__ - Step 14425: {'lr': 0.0004913564799818891, 'samples': 2769600, 'steps': 14424, 'loss/train': 1.6002943515777588} -08/30/2021 15:42:32 - INFO - __main__ - Step 14426: {'lr': 0.0004913550965783165, 'samples': 2769792, 'steps': 14425, 'loss/train': 1.3188844919204712} -08/30/2021 15:42:32 - INFO - __main__ - Step 14427: {'lr': 0.000491353713065993, 'samples': 2769984, 'steps': 14426, 'loss/train': 1.687347412109375} -08/30/2021 15:42:32 - INFO - __main__ - Step 14428: {'lr': 0.0004913523294449193, 'samples': 2770176, 'steps': 14427, 'loss/train': 1.5591503381729126} -08/30/2021 15:42:34 - INFO - __main__ - Step 14429: {'lr': 0.0004913509457150959, 'samples': 2770368, 'steps': 14428, 'loss/train': 1.6258282661437988} -08/30/2021 15:42:35 - INFO - __main__ - Step 14430: {'lr': 0.0004913495618765235, 'samples': 2770560, 'steps': 14429, 'loss/train': 1.6587992906570435} -08/30/2021 15:42:35 - INFO - __main__ - Step 14431: {'lr': 0.0004913481779292027, 'samples': 2770752, 'steps': 14430, 'loss/train': 1.442101240158081} -08/30/2021 15:42:35 - INFO - __main__ - Step 14432: {'lr': 0.0004913467938731341, 'samples': 2770944, 'steps': 14431, 'loss/train': 1.6395477056503296} -08/30/2021 15:42:36 - INFO - __main__ - Step 14433: {'lr': 0.0004913454097083185, 'samples': 2771136, 'steps': 14432, 'loss/train': 1.3623318672180176} -08/30/2021 15:42:36 - INFO - __main__ - Step 14434: {'lr': 0.0004913440254347563, 'samples': 2771328, 'steps': 14433, 'loss/train': 1.7937641143798828} -08/30/2021 15:42:38 - INFO - __main__ - Step 14435: {'lr': 0.0004913426410524482, 'samples': 2771520, 'steps': 14434, 'loss/train': 0.3770926594734192} -08/30/2021 15:42:38 - INFO - __main__ - Step 14436: {'lr': 0.0004913412565613948, 'samples': 2771712, 'steps': 14435, 'loss/train': 1.848724126815796} -08/30/2021 15:42:39 - INFO - __main__ - Step 14437: {'lr': 0.0004913398719615968, 'samples': 2771904, 'steps': 14436, 'loss/train': 1.6998211145401} -08/30/2021 15:42:39 - INFO - __main__ - Step 14438: {'lr': 0.0004913384872530548, 'samples': 2772096, 'steps': 14437, 'loss/train': 1.955406665802002} -08/30/2021 15:42:39 - INFO - __main__ - Step 14439: {'lr': 0.0004913371024357694, 'samples': 2772288, 'steps': 14438, 'loss/train': 2.1819000244140625} -08/30/2021 15:42:41 - INFO - __main__ - Step 14440: {'lr': 0.0004913357175097412, 'samples': 2772480, 'steps': 14439, 'loss/train': 1.3407856225967407} -08/30/2021 15:42:41 - INFO - __main__ - Step 14441: {'lr': 0.0004913343324749708, 'samples': 2772672, 'steps': 14440, 'loss/train': 2.3821146488189697} -08/30/2021 15:42:42 - INFO - __main__ - Step 14442: {'lr': 0.000491332947331459, 'samples': 2772864, 'steps': 14441, 'loss/train': 2.2518422603607178} -08/30/2021 15:42:42 - INFO - __main__ - Step 14443: {'lr': 0.0004913315620792061, 'samples': 2773056, 'steps': 14442, 'loss/train': 1.3385586738586426} -08/30/2021 15:42:42 - INFO - __main__ - Step 14444: {'lr': 0.0004913301767182131, 'samples': 2773248, 'steps': 14443, 'loss/train': 1.8875072002410889} -08/30/2021 15:42:44 - INFO - __main__ - Step 14445: {'lr': 0.0004913287912484804, 'samples': 2773440, 'steps': 14444, 'loss/train': 1.8578765392303467} -08/30/2021 15:42:45 - INFO - __main__ - Step 14446: {'lr': 0.0004913274056700087, 'samples': 2773632, 'steps': 14445, 'loss/train': 1.2141847610473633} -08/30/2021 15:42:45 - INFO - __main__ - Step 14447: {'lr': 0.0004913260199827986, 'samples': 2773824, 'steps': 14446, 'loss/train': 1.3405717611312866} -08/30/2021 15:42:46 - INFO - __main__ - Step 14448: {'lr': 0.0004913246341868506, 'samples': 2774016, 'steps': 14447, 'loss/train': 1.4121546745300293} -08/30/2021 15:42:46 - INFO - __main__ - Step 14449: {'lr': 0.0004913232482821656, 'samples': 2774208, 'steps': 14448, 'loss/train': 1.3116148710250854} -08/30/2021 15:42:46 - INFO - __main__ - Step 14450: {'lr': 0.0004913218622687439, 'samples': 2774400, 'steps': 14449, 'loss/train': 3.291533946990967} -08/30/2021 15:42:47 - INFO - __main__ - Step 14451: {'lr': 0.0004913204761465864, 'samples': 2774592, 'steps': 14450, 'loss/train': 0.10549765825271606} -08/30/2021 15:42:48 - INFO - __main__ - Step 14452: {'lr': 0.0004913190899156936, 'samples': 2774784, 'steps': 14451, 'loss/train': 1.6932841539382935} -08/30/2021 15:42:49 - INFO - __main__ - Step 14453: {'lr': 0.0004913177035760661, 'samples': 2774976, 'steps': 14452, 'loss/train': 2.2363641262054443} -08/30/2021 15:42:49 - INFO - __main__ - Step 14454: {'lr': 0.0004913163171277046, 'samples': 2775168, 'steps': 14453, 'loss/train': 1.5592412948608398} -08/30/2021 15:42:49 - INFO - __main__ - Step 14455: {'lr': 0.0004913149305706097, 'samples': 2775360, 'steps': 14454, 'loss/train': 1.3753920793533325} -08/30/2021 15:42:50 - INFO - __main__ - Step 14456: {'lr': 0.0004913135439047821, 'samples': 2775552, 'steps': 14455, 'loss/train': 1.8267714977264404} -08/30/2021 15:42:51 - INFO - __main__ - Step 14457: {'lr': 0.0004913121571302222, 'samples': 2775744, 'steps': 14456, 'loss/train': 2.6834311485290527} -08/30/2021 15:42:52 - INFO - __main__ - Step 14458: {'lr': 0.0004913107702469308, 'samples': 2775936, 'steps': 14457, 'loss/train': 2.420761823654175} -08/30/2021 15:42:52 - INFO - __main__ - Step 14459: {'lr': 0.0004913093832549085, 'samples': 2776128, 'steps': 14458, 'loss/train': 2.002096652984619} -08/30/2021 15:42:52 - INFO - __main__ - Step 14460: {'lr': 0.000491307996154156, 'samples': 2776320, 'steps': 14459, 'loss/train': 1.5985876321792603} -08/30/2021 15:42:53 - INFO - __main__ - Step 14461: {'lr': 0.0004913066089446737, 'samples': 2776512, 'steps': 14460, 'loss/train': 1.7746468782424927} -08/30/2021 15:42:54 - INFO - __main__ - Step 14462: {'lr': 0.0004913052216264624, 'samples': 2776704, 'steps': 14461, 'loss/train': 1.565679907798767} -08/30/2021 15:42:55 - INFO - __main__ - Step 14463: {'lr': 0.0004913038341995227, 'samples': 2776896, 'steps': 14462, 'loss/train': 1.2869205474853516} -08/30/2021 15:42:55 - INFO - __main__ - Step 14464: {'lr': 0.0004913024466638553, 'samples': 2777088, 'steps': 14463, 'loss/train': 1.9432456493377686} -08/30/2021 15:42:56 - INFO - __main__ - Step 14465: {'lr': 0.0004913010590194607, 'samples': 2777280, 'steps': 14464, 'loss/train': 1.7373874187469482} -08/30/2021 15:42:56 - INFO - __main__ - Step 14466: {'lr': 0.0004912996712663396, 'samples': 2777472, 'steps': 14465, 'loss/train': 0.2349952906370163} -08/30/2021 15:42:58 - INFO - __main__ - Step 14467: {'lr': 0.0004912982834044924, 'samples': 2777664, 'steps': 14466, 'loss/train': 1.9728477001190186} -08/30/2021 15:42:58 - INFO - __main__ - Step 14468: {'lr': 0.0004912968954339202, 'samples': 2777856, 'steps': 14467, 'loss/train': 1.616193413734436} -08/30/2021 15:42:58 - INFO - __main__ - Step 14469: {'lr': 0.0004912955073546231, 'samples': 2778048, 'steps': 14468, 'loss/train': 1.854647159576416} -08/30/2021 15:42:59 - INFO - __main__ - Step 14470: {'lr': 0.0004912941191666021, 'samples': 2778240, 'steps': 14469, 'loss/train': 1.7872931957244873} -08/30/2021 15:42:59 - INFO - __main__ - Step 14471: {'lr': 0.0004912927308698576, 'samples': 2778432, 'steps': 14470, 'loss/train': 1.5087742805480957} -08/30/2021 15:42:59 - INFO - __main__ - Step 14472: {'lr': 0.0004912913424643904, 'samples': 2778624, 'steps': 14471, 'loss/train': 2.019666910171509} -08/30/2021 15:43:01 - INFO - __main__ - Step 14473: {'lr': 0.0004912899539502011, 'samples': 2778816, 'steps': 14472, 'loss/train': 1.479892373085022} -08/30/2021 15:43:01 - INFO - __main__ - Step 14474: {'lr': 0.0004912885653272902, 'samples': 2779008, 'steps': 14473, 'loss/train': 2.0292649269104004} -08/30/2021 15:43:02 - INFO - __main__ - Step 14475: {'lr': 0.0004912871765956583, 'samples': 2779200, 'steps': 14474, 'loss/train': 1.6204290390014648} -08/30/2021 15:43:02 - INFO - __main__ - Step 14476: {'lr': 0.0004912857877553062, 'samples': 2779392, 'steps': 14475, 'loss/train': 1.3374171257019043} -08/30/2021 15:43:02 - INFO - __main__ - Step 14477: {'lr': 0.0004912843988062345, 'samples': 2779584, 'steps': 14476, 'loss/train': 1.354299545288086} -08/30/2021 15:43:04 - INFO - __main__ - Step 14478: {'lr': 0.0004912830097484437, 'samples': 2779776, 'steps': 14477, 'loss/train': 1.3030502796173096} -08/30/2021 15:43:05 - INFO - __main__ - Step 14479: {'lr': 0.0004912816205819346, 'samples': 2779968, 'steps': 14478, 'loss/train': 1.8572869300842285} -08/30/2021 15:43:05 - INFO - __main__ - Step 14480: {'lr': 0.0004912802313067076, 'samples': 2780160, 'steps': 14479, 'loss/train': 1.7414358854293823} -08/30/2021 15:43:05 - INFO - __main__ - Step 14481: {'lr': 0.0004912788419227635, 'samples': 2780352, 'steps': 14480, 'loss/train': 0.28012627363204956} -08/30/2021 15:43:06 - INFO - __main__ - Step 14482: {'lr': 0.000491277452430103, 'samples': 2780544, 'steps': 14481, 'loss/train': 1.5621333122253418} -08/30/2021 15:43:07 - INFO - __main__ - Step 14483: {'lr': 0.0004912760628287264, 'samples': 2780736, 'steps': 14482, 'loss/train': 1.1264241933822632} -08/30/2021 15:43:08 - INFO - __main__ - Step 14484: {'lr': 0.0004912746731186346, 'samples': 2780928, 'steps': 14483, 'loss/train': 1.716565489768982} -08/30/2021 15:43:08 - INFO - __main__ - Step 14485: {'lr': 0.0004912732832998281, 'samples': 2781120, 'steps': 14484, 'loss/train': 1.7526382207870483} -08/30/2021 15:43:08 - INFO - __main__ - Step 14486: {'lr': 0.0004912718933723077, 'samples': 2781312, 'steps': 14485, 'loss/train': 1.299196481704712} -08/30/2021 15:43:09 - INFO - __main__ - Step 14487: {'lr': 0.0004912705033360738, 'samples': 2781504, 'steps': 14486, 'loss/train': 2.215812921524048} -08/30/2021 15:43:11 - INFO - __main__ - Step 14488: {'lr': 0.0004912691131911272, 'samples': 2781696, 'steps': 14487, 'loss/train': 2.1676204204559326} -08/30/2021 15:43:11 - INFO - __main__ - Step 14489: {'lr': 0.0004912677229374684, 'samples': 2781888, 'steps': 14488, 'loss/train': 2.0206358432769775} -08/30/2021 15:43:12 - INFO - __main__ - Step 14490: {'lr': 0.0004912663325750982, 'samples': 2782080, 'steps': 14489, 'loss/train': 1.6100986003875732} -08/30/2021 15:43:12 - INFO - __main__ - Step 14491: {'lr': 0.000491264942104017, 'samples': 2782272, 'steps': 14490, 'loss/train': 1.6361287832260132} -08/30/2021 15:43:12 - INFO - __main__ - Step 14492: {'lr': 0.0004912635515242257, 'samples': 2782464, 'steps': 14491, 'loss/train': 1.7629488706588745} -08/30/2021 15:43:13 - INFO - __main__ - Step 14493: {'lr': 0.0004912621608357246, 'samples': 2782656, 'steps': 14492, 'loss/train': 1.7426536083221436} -08/30/2021 15:43:14 - INFO - __main__ - Step 14494: {'lr': 0.0004912607700385146, 'samples': 2782848, 'steps': 14493, 'loss/train': 2.1075809001922607} -08/30/2021 15:43:15 - INFO - __main__ - Step 14495: {'lr': 0.0004912593791325962, 'samples': 2783040, 'steps': 14494, 'loss/train': 1.903563141822815} -08/30/2021 15:43:15 - INFO - __main__ - Step 14496: {'lr': 0.00049125798811797, 'samples': 2783232, 'steps': 14495, 'loss/train': 1.6912320852279663} -08/30/2021 15:43:15 - INFO - __main__ - Step 14497: {'lr': 0.0004912565969946367, 'samples': 2783424, 'steps': 14496, 'loss/train': 1.7569342851638794} -08/30/2021 15:43:16 - INFO - __main__ - Step 14498: {'lr': 0.0004912552057625969, 'samples': 2783616, 'steps': 14497, 'loss/train': 1.7169954776763916} -08/30/2021 15:43:17 - INFO - __main__ - Step 14499: {'lr': 0.0004912538144218512, 'samples': 2783808, 'steps': 14498, 'loss/train': 1.592843770980835} -08/30/2021 15:43:18 - INFO - __main__ - Step 14500: {'lr': 0.0004912524229724002, 'samples': 2784000, 'steps': 14499, 'loss/train': 1.4646787643432617} -08/30/2021 15:43:18 - INFO - __main__ - Step 14501: {'lr': 0.0004912510314142447, 'samples': 2784192, 'steps': 14500, 'loss/train': 1.7538471221923828} -08/30/2021 15:43:18 - INFO - __main__ - Step 14502: {'lr': 0.0004912496397473852, 'samples': 2784384, 'steps': 14501, 'loss/train': 2.0602452754974365} -08/30/2021 15:43:19 - INFO - __main__ - Step 14503: {'lr': 0.0004912482479718223, 'samples': 2784576, 'steps': 14502, 'loss/train': 1.6451038122177124} -08/30/2021 15:43:20 - INFO - __main__ - Step 14504: {'lr': 0.0004912468560875566, 'samples': 2784768, 'steps': 14503, 'loss/train': 1.4356677532196045} -08/30/2021 15:43:21 - INFO - __main__ - Step 14505: {'lr': 0.0004912454640945889, 'samples': 2784960, 'steps': 14504, 'loss/train': 2.1461522579193115} -08/30/2021 15:43:21 - INFO - __main__ - Step 14506: {'lr': 0.0004912440719929196, 'samples': 2785152, 'steps': 14505, 'loss/train': 1.3326867818832397} -08/30/2021 15:43:21 - INFO - __main__ - Step 14507: {'lr': 0.0004912426797825495, 'samples': 2785344, 'steps': 14506, 'loss/train': 1.4029852151870728} -08/30/2021 15:43:22 - INFO - __main__ - Step 14508: {'lr': 0.0004912412874634792, 'samples': 2785536, 'steps': 14507, 'loss/train': 2.0477237701416016} -08/30/2021 15:43:23 - INFO - __main__ - Step 14509: {'lr': 0.0004912398950357094, 'samples': 2785728, 'steps': 14508, 'loss/train': 1.2198266983032227} -08/30/2021 15:43:24 - INFO - __main__ - Step 14510: {'lr': 0.0004912385024992404, 'samples': 2785920, 'steps': 14509, 'loss/train': 2.0874016284942627} -08/30/2021 15:43:24 - INFO - __main__ - Step 14511: {'lr': 0.0004912371098540733, 'samples': 2786112, 'steps': 14510, 'loss/train': 5.1942620277404785} -08/30/2021 15:43:25 - INFO - __main__ - Step 14512: {'lr': 0.0004912357171002082, 'samples': 2786304, 'steps': 14511, 'loss/train': 3.4363343715667725} -08/30/2021 15:43:25 - INFO - __main__ - Step 14513: {'lr': 0.0004912343242376462, 'samples': 2786496, 'steps': 14512, 'loss/train': 2.5290675163269043} -08/30/2021 15:43:25 - INFO - __main__ - Step 14514: {'lr': 0.0004912329312663877, 'samples': 2786688, 'steps': 14513, 'loss/train': 2.168471574783325} -08/30/2021 15:43:27 - INFO - __main__ - Step 14515: {'lr': 0.0004912315381864333, 'samples': 2786880, 'steps': 14514, 'loss/train': 1.8507919311523438} -08/30/2021 15:43:27 - INFO - __main__ - Step 14516: {'lr': 0.0004912301449977837, 'samples': 2787072, 'steps': 14515, 'loss/train': 1.9655901193618774} -08/30/2021 15:43:28 - INFO - __main__ - Step 14517: {'lr': 0.0004912287517004397, 'samples': 2787264, 'steps': 14516, 'loss/train': 1.8701720237731934} -08/30/2021 15:43:28 - INFO - __main__ - Step 14518: {'lr': 0.0004912273582944015, 'samples': 2787456, 'steps': 14517, 'loss/train': 1.980516791343689} -08/30/2021 15:43:28 - INFO - __main__ - Step 14519: {'lr': 0.0004912259647796701, 'samples': 2787648, 'steps': 14518, 'loss/train': 1.4434527158737183} -08/30/2021 15:43:29 - INFO - __main__ - Step 14520: {'lr': 0.000491224571156246, 'samples': 2787840, 'steps': 14519, 'loss/train': 1.8004525899887085} -08/30/2021 15:43:30 - INFO - __main__ - Step 14521: {'lr': 0.0004912231774241298, 'samples': 2788032, 'steps': 14520, 'loss/train': 1.748858094215393} -08/30/2021 15:43:31 - INFO - __main__ - Step 14522: {'lr': 0.0004912217835833222, 'samples': 2788224, 'steps': 14521, 'loss/train': 1.8290034532546997} -08/30/2021 15:43:31 - INFO - __main__ - Step 14523: {'lr': 0.0004912203896338238, 'samples': 2788416, 'steps': 14522, 'loss/train': 1.771354079246521} -08/30/2021 15:43:31 - INFO - __main__ - Step 14524: {'lr': 0.0004912189955756351, 'samples': 2788608, 'steps': 14523, 'loss/train': 2.1499438285827637} -08/30/2021 15:43:32 - INFO - __main__ - Step 14525: {'lr': 0.000491217601408757, 'samples': 2788800, 'steps': 14524, 'loss/train': 1.9782694578170776} -08/30/2021 15:43:33 - INFO - __main__ - Step 14526: {'lr': 0.0004912162071331898, 'samples': 2788992, 'steps': 14525, 'loss/train': 1.9178650379180908} -08/30/2021 15:43:34 - INFO - __main__ - Step 14527: {'lr': 0.0004912148127489345, 'samples': 2789184, 'steps': 14526, 'loss/train': 1.8704619407653809} -08/30/2021 15:43:34 - INFO - __main__ - Step 14528: {'lr': 0.0004912134182559913, 'samples': 2789376, 'steps': 14527, 'loss/train': 1.8732547760009766} -08/30/2021 15:43:34 - INFO - __main__ - Step 14529: {'lr': 0.0004912120236543611, 'samples': 2789568, 'steps': 14528, 'loss/train': 1.8324247598648071} -08/30/2021 15:43:35 - INFO - __main__ - Step 14530: {'lr': 0.0004912106289440446, 'samples': 2789760, 'steps': 14529, 'loss/train': 1.3917843103408813} -08/30/2021 15:43:36 - INFO - __main__ - Step 14531: {'lr': 0.0004912092341250422, 'samples': 2789952, 'steps': 14530, 'loss/train': 2.2684664726257324} -08/30/2021 15:43:37 - INFO - __main__ - Step 14532: {'lr': 0.0004912078391973547, 'samples': 2790144, 'steps': 14531, 'loss/train': 1.54881751537323} -08/30/2021 15:43:37 - INFO - __main__ - Step 14533: {'lr': 0.0004912064441609827, 'samples': 2790336, 'steps': 14532, 'loss/train': 1.2664347887039185} -08/30/2021 15:43:37 - INFO - __main__ - Step 14534: {'lr': 0.0004912050490159268, 'samples': 2790528, 'steps': 14533, 'loss/train': 1.573196530342102} -08/30/2021 15:43:38 - INFO - __main__ - Step 14535: {'lr': 0.0004912036537621877, 'samples': 2790720, 'steps': 14534, 'loss/train': 1.3205132484436035} -08/30/2021 15:43:38 - INFO - __main__ - Step 14536: {'lr': 0.0004912022583997658, 'samples': 2790912, 'steps': 14535, 'loss/train': 2.139380931854248} -08/30/2021 15:43:40 - INFO - __main__ - Step 14537: {'lr': 0.0004912008629286619, 'samples': 2791104, 'steps': 14536, 'loss/train': 0.3022192716598511} -08/30/2021 15:43:40 - INFO - __main__ - Step 14538: {'lr': 0.0004911994673488766, 'samples': 2791296, 'steps': 14537, 'loss/train': 1.9566104412078857} -08/30/2021 15:43:40 - INFO - __main__ - Step 14539: {'lr': 0.0004911980716604107, 'samples': 2791488, 'steps': 14538, 'loss/train': 1.9875560998916626} -08/30/2021 15:43:41 - INFO - __main__ - Step 14540: {'lr': 0.0004911966758632645, 'samples': 2791680, 'steps': 14539, 'loss/train': 1.564862847328186} -08/30/2021 15:43:41 - INFO - __main__ - Step 14541: {'lr': 0.000491195279957439, 'samples': 2791872, 'steps': 14540, 'loss/train': 1.498392939567566} -08/30/2021 15:43:44 - INFO - __main__ - Step 14542: {'lr': 0.0004911938839429344, 'samples': 2792064, 'steps': 14541, 'loss/train': 1.539810061454773} -08/30/2021 15:43:45 - INFO - __main__ - Step 14543: {'lr': 0.0004911924878197517, 'samples': 2792256, 'steps': 14542, 'loss/train': 2.13578200340271} -08/30/2021 15:43:45 - INFO - __main__ - Step 14544: {'lr': 0.0004911910915878913, 'samples': 2792448, 'steps': 14543, 'loss/train': 1.6552116870880127} -08/30/2021 15:43:45 - INFO - __main__ - Step 14545: {'lr': 0.000491189695247354, 'samples': 2792640, 'steps': 14544, 'loss/train': 1.9474873542785645} -08/30/2021 15:43:46 - INFO - __main__ - Step 14546: {'lr': 0.0004911882987981404, 'samples': 2792832, 'steps': 14545, 'loss/train': 1.9455745220184326} -08/30/2021 15:43:46 - INFO - __main__ - Step 14547: {'lr': 0.0004911869022402508, 'samples': 2793024, 'steps': 14546, 'loss/train': 2.396836757659912} -08/30/2021 15:43:47 - INFO - __main__ - Step 14548: {'lr': 0.0004911855055736863, 'samples': 2793216, 'steps': 14547, 'loss/train': 0.6741005182266235} -08/30/2021 15:43:47 - INFO - __main__ - Step 14549: {'lr': 0.0004911841087984473, 'samples': 2793408, 'steps': 14548, 'loss/train': 0.5657904744148254} -08/30/2021 15:43:48 - INFO - __main__ - Step 14550: {'lr': 0.0004911827119145345, 'samples': 2793600, 'steps': 14549, 'loss/train': 0.5266324281692505} -08/30/2021 15:43:49 - INFO - __main__ - Step 14551: {'lr': 0.0004911813149219485, 'samples': 2793792, 'steps': 14550, 'loss/train': 2.2867889404296875} -08/30/2021 15:43:49 - INFO - __main__ - Step 14552: {'lr': 0.0004911799178206899, 'samples': 2793984, 'steps': 14551, 'loss/train': 1.652372121810913} -08/30/2021 15:43:50 - INFO - __main__ - Step 14553: {'lr': 0.0004911785206107592, 'samples': 2794176, 'steps': 14552, 'loss/train': 1.2229183912277222} -08/30/2021 15:43:50 - INFO - __main__ - Step 14554: {'lr': 0.0004911771232921575, 'samples': 2794368, 'steps': 14553, 'loss/train': 1.9569799900054932} -08/30/2021 15:43:52 - INFO - __main__ - Step 14555: {'lr': 0.0004911757258648849, 'samples': 2794560, 'steps': 14554, 'loss/train': 1.7661128044128418} -08/30/2021 15:43:52 - INFO - __main__ - Step 14556: {'lr': 0.0004911743283289423, 'samples': 2794752, 'steps': 14555, 'loss/train': 1.9324421882629395} -08/30/2021 15:43:52 - INFO - __main__ - Step 14557: {'lr': 0.0004911729306843302, 'samples': 2794944, 'steps': 14556, 'loss/train': 1.7198010683059692} -08/30/2021 15:43:53 - INFO - __main__ - Step 14558: {'lr': 0.0004911715329310493, 'samples': 2795136, 'steps': 14557, 'loss/train': 2.081277847290039} -08/30/2021 15:43:53 - INFO - __main__ - Step 14559: {'lr': 0.0004911701350691002, 'samples': 2795328, 'steps': 14558, 'loss/train': 1.5989199876785278} -08/30/2021 15:43:55 - INFO - __main__ - Step 14560: {'lr': 0.0004911687370984836, 'samples': 2795520, 'steps': 14559, 'loss/train': 1.6618127822875977} -08/30/2021 15:43:55 - INFO - __main__ - Step 14561: {'lr': 0.0004911673390192002, 'samples': 2795712, 'steps': 14560, 'loss/train': 1.6317024230957031} -08/30/2021 15:43:55 - INFO - __main__ - Step 14562: {'lr': 0.0004911659408312505, 'samples': 2795904, 'steps': 14561, 'loss/train': 1.6831574440002441} -08/30/2021 15:43:56 - INFO - __main__ - Step 14563: {'lr': 0.000491164542534635, 'samples': 2796096, 'steps': 14562, 'loss/train': 1.9227943420410156} -08/30/2021 15:43:56 - INFO - __main__ - Step 14564: {'lr': 0.0004911631441293546, 'samples': 2796288, 'steps': 14563, 'loss/train': 1.221450686454773} -08/30/2021 15:43:57 - INFO - __main__ - Step 14565: {'lr': 0.0004911617456154097, 'samples': 2796480, 'steps': 14564, 'loss/train': 1.5972568988800049} -08/30/2021 15:43:58 - INFO - __main__ - Step 14566: {'lr': 0.0004911603469928012, 'samples': 2796672, 'steps': 14565, 'loss/train': 1.9297749996185303} -08/30/2021 15:43:59 - INFO - __main__ - Step 14567: {'lr': 0.0004911589482615294, 'samples': 2796864, 'steps': 14566, 'loss/train': 0.8215628862380981} -08/30/2021 15:43:59 - INFO - __main__ - Step 14568: {'lr': 0.0004911575494215952, 'samples': 2797056, 'steps': 14567, 'loss/train': 2.0217251777648926} -08/30/2021 15:43:59 - INFO - __main__ - Step 14569: {'lr': 0.0004911561504729992, 'samples': 2797248, 'steps': 14568, 'loss/train': 1.7546579837799072} -08/30/2021 15:44:00 - INFO - __main__ - Step 14570: {'lr': 0.0004911547514157417, 'samples': 2797440, 'steps': 14569, 'loss/train': 1.7044743299484253} -08/30/2021 15:44:01 - INFO - __main__ - Step 14571: {'lr': 0.0004911533522498239, 'samples': 2797632, 'steps': 14570, 'loss/train': 2.543809652328491} -08/30/2021 15:44:02 - INFO - __main__ - Step 14572: {'lr': 0.0004911519529752459, 'samples': 2797824, 'steps': 14571, 'loss/train': 2.1772594451904297} -08/30/2021 15:44:02 - INFO - __main__ - Step 14573: {'lr': 0.0004911505535920086, 'samples': 2798016, 'steps': 14572, 'loss/train': 1.947395920753479} -08/30/2021 15:44:02 - INFO - __main__ - Step 14574: {'lr': 0.0004911491541001126, 'samples': 2798208, 'steps': 14573, 'loss/train': 2.5584192276000977} -08/30/2021 15:44:03 - INFO - __main__ - Step 14575: {'lr': 0.0004911477544995585, 'samples': 2798400, 'steps': 14574, 'loss/train': 1.6723089218139648} -08/30/2021 15:44:04 - INFO - __main__ - Step 14576: {'lr': 0.000491146354790347, 'samples': 2798592, 'steps': 14575, 'loss/train': 2.1901209354400635} -08/30/2021 15:44:04 - INFO - __main__ - Step 14577: {'lr': 0.0004911449549724786, 'samples': 2798784, 'steps': 14576, 'loss/train': 1.4071576595306396} -08/30/2021 15:44:05 - INFO - __main__ - Step 14578: {'lr': 0.0004911435550459541, 'samples': 2798976, 'steps': 14577, 'loss/train': 1.4971303939819336} -08/30/2021 15:44:05 - INFO - __main__ - Step 14579: {'lr': 0.0004911421550107739, 'samples': 2799168, 'steps': 14578, 'loss/train': 1.8599587678909302} -08/30/2021 15:44:06 - INFO - __main__ - Step 14580: {'lr': 0.0004911407548669389, 'samples': 2799360, 'steps': 14579, 'loss/train': 2.2231287956237793} -08/30/2021 15:44:07 - INFO - __main__ - Step 14581: {'lr': 0.0004911393546144495, 'samples': 2799552, 'steps': 14580, 'loss/train': 1.9813406467437744} -08/30/2021 15:44:07 - INFO - __main__ - Step 14582: {'lr': 0.0004911379542533065, 'samples': 2799744, 'steps': 14581, 'loss/train': 1.5219194889068604} -08/30/2021 15:44:08 - INFO - __main__ - Step 14583: {'lr': 0.0004911365537835105, 'samples': 2799936, 'steps': 14582, 'loss/train': 1.6899129152297974} -08/30/2021 15:44:08 - INFO - __main__ - Step 14584: {'lr': 0.000491135153205062, 'samples': 2800128, 'steps': 14583, 'loss/train': 1.8255943059921265} -08/30/2021 15:44:09 - INFO - __main__ - Step 14585: {'lr': 0.0004911337525179616, 'samples': 2800320, 'steps': 14584, 'loss/train': 1.802324652671814} -08/30/2021 15:44:10 - INFO - __main__ - Step 14586: {'lr': 0.0004911323517222103, 'samples': 2800512, 'steps': 14585, 'loss/train': 1.627037763595581} -08/30/2021 15:44:11 - INFO - __main__ - Step 14587: {'lr': 0.0004911309508178084, 'samples': 2800704, 'steps': 14586, 'loss/train': 1.3630696535110474} -08/30/2021 15:44:11 - INFO - __main__ - Step 14588: {'lr': 0.0004911295498047565, 'samples': 2800896, 'steps': 14587, 'loss/train': 1.8996014595031738} -08/30/2021 15:44:12 - INFO - __main__ - Step 14589: {'lr': 0.0004911281486830554, 'samples': 2801088, 'steps': 14588, 'loss/train': 2.2303671836853027} -08/30/2021 15:44:12 - INFO - __main__ - Step 14590: {'lr': 0.0004911267474527058, 'samples': 2801280, 'steps': 14589, 'loss/train': 1.1725919246673584} -08/30/2021 15:44:12 - INFO - __main__ - Step 14591: {'lr': 0.000491125346113708, 'samples': 2801472, 'steps': 14590, 'loss/train': 1.1614854335784912} -08/30/2021 15:44:14 - INFO - __main__ - Step 14592: {'lr': 0.000491123944666063, 'samples': 2801664, 'steps': 14591, 'loss/train': 2.026860475540161} -08/30/2021 15:44:14 - INFO - __main__ - Step 14593: {'lr': 0.0004911225431097712, 'samples': 2801856, 'steps': 14592, 'loss/train': 1.815241813659668} -08/30/2021 15:44:15 - INFO - __main__ - Step 14594: {'lr': 0.0004911211414448333, 'samples': 2802048, 'steps': 14593, 'loss/train': 1.818095326423645} -08/30/2021 15:44:15 - INFO - __main__ - Step 14595: {'lr': 0.0004911197396712501, 'samples': 2802240, 'steps': 14594, 'loss/train': 1.7291560173034668} -08/30/2021 15:44:15 - INFO - __main__ - Step 14596: {'lr': 0.0004911183377890218, 'samples': 2802432, 'steps': 14595, 'loss/train': 1.8934985399246216} -08/30/2021 15:44:17 - INFO - __main__ - Step 14597: {'lr': 0.0004911169357981496, 'samples': 2802624, 'steps': 14596, 'loss/train': 1.3341199159622192} -08/30/2021 15:44:17 - INFO - __main__ - Step 14598: {'lr': 0.0004911155336986335, 'samples': 2802816, 'steps': 14597, 'loss/train': 1.5891129970550537} -08/30/2021 15:44:18 - INFO - __main__ - Step 14599: {'lr': 0.0004911141314904747, 'samples': 2803008, 'steps': 14598, 'loss/train': 1.7796026468276978} -08/30/2021 15:44:18 - INFO - __main__ - Step 14600: {'lr': 0.0004911127291736735, 'samples': 2803200, 'steps': 14599, 'loss/train': 4.444014549255371} -08/30/2021 15:44:18 - INFO - __main__ - Step 14601: {'lr': 0.0004911113267482307, 'samples': 2803392, 'steps': 14600, 'loss/train': 1.5700595378875732} -08/30/2021 15:44:19 - INFO - __main__ - Step 14602: {'lr': 0.0004911099242141467, 'samples': 2803584, 'steps': 14601, 'loss/train': 1.9138917922973633} -08/30/2021 15:44:21 - INFO - __main__ - Step 14603: {'lr': 0.0004911085215714224, 'samples': 2803776, 'steps': 14602, 'loss/train': 1.6377992630004883} -08/30/2021 15:44:21 - INFO - __main__ - Step 14604: {'lr': 0.0004911071188200584, 'samples': 2803968, 'steps': 14603, 'loss/train': 1.746010184288025} -08/30/2021 15:44:21 - INFO - __main__ - Step 14605: {'lr': 0.0004911057159600551, 'samples': 2804160, 'steps': 14604, 'loss/train': 1.6858192682266235} -08/30/2021 15:44:22 - INFO - __main__ - Step 14606: {'lr': 0.0004911043129914133, 'samples': 2804352, 'steps': 14605, 'loss/train': 2.0764570236206055} -08/30/2021 15:44:22 - INFO - __main__ - Step 14607: {'lr': 0.0004911029099141336, 'samples': 2804544, 'steps': 14606, 'loss/train': 1.961524248123169} -08/30/2021 15:44:24 - INFO - __main__ - Step 14608: {'lr': 0.0004911015067282168, 'samples': 2804736, 'steps': 14607, 'loss/train': 1.7911008596420288} -08/30/2021 15:44:24 - INFO - __main__ - Step 14609: {'lr': 0.0004911001034336633, 'samples': 2804928, 'steps': 14608, 'loss/train': 1.6780343055725098} -08/30/2021 15:44:24 - INFO - __main__ - Step 14610: {'lr': 0.0004910987000304737, 'samples': 2805120, 'steps': 14609, 'loss/train': 1.8911654949188232} -08/30/2021 15:44:25 - INFO - __main__ - Step 14611: {'lr': 0.0004910972965186488, 'samples': 2805312, 'steps': 14610, 'loss/train': 2.0743560791015625} -08/30/2021 15:44:25 - INFO - __main__ - Step 14612: {'lr': 0.0004910958928981893, 'samples': 2805504, 'steps': 14611, 'loss/train': 1.5017342567443848} -08/30/2021 15:44:27 - INFO - __main__ - Step 14613: {'lr': 0.0004910944891690956, 'samples': 2805696, 'steps': 14612, 'loss/train': 1.7243694067001343} -08/30/2021 15:44:27 - INFO - __main__ - Step 14614: {'lr': 0.0004910930853313686, 'samples': 2805888, 'steps': 14613, 'loss/train': 1.8691600561141968} -08/30/2021 15:44:27 - INFO - __main__ - Step 14615: {'lr': 0.0004910916813850086, 'samples': 2806080, 'steps': 14614, 'loss/train': 1.6921037435531616} -08/30/2021 15:44:28 - INFO - __main__ - Step 14616: {'lr': 0.0004910902773300164, 'samples': 2806272, 'steps': 14615, 'loss/train': 1.556960940361023} -08/30/2021 15:44:28 - INFO - __main__ - Step 14617: {'lr': 0.0004910888731663928, 'samples': 2806464, 'steps': 14616, 'loss/train': 1.6416927576065063} -08/30/2021 15:44:30 - INFO - __main__ - Step 14618: {'lr': 0.0004910874688941381, 'samples': 2806656, 'steps': 14617, 'loss/train': 1.4495739936828613} -08/30/2021 15:44:30 - INFO - __main__ - Step 14619: {'lr': 0.0004910860645132532, 'samples': 2806848, 'steps': 14618, 'loss/train': 2.184468984603882} -08/30/2021 15:44:30 - INFO - __main__ - Step 14620: {'lr': 0.0004910846600237386, 'samples': 2807040, 'steps': 14619, 'loss/train': 1.7852646112442017} -08/30/2021 15:44:31 - INFO - __main__ - Step 14621: {'lr': 0.0004910832554255951, 'samples': 2807232, 'steps': 14620, 'loss/train': 1.9583921432495117} -08/30/2021 15:44:31 - INFO - __main__ - Step 14622: {'lr': 0.0004910818507188231, 'samples': 2807424, 'steps': 14621, 'loss/train': 1.8207911252975464} -08/30/2021 15:44:33 - INFO - __main__ - Step 14623: {'lr': 0.0004910804459034233, 'samples': 2807616, 'steps': 14622, 'loss/train': 1.994828701019287} -08/30/2021 15:44:33 - INFO - __main__ - Step 14624: {'lr': 0.0004910790409793965, 'samples': 2807808, 'steps': 14623, 'loss/train': 1.6754604578018188} -08/30/2021 15:44:34 - INFO - __main__ - Step 14625: {'lr': 0.000491077635946743, 'samples': 2808000, 'steps': 14624, 'loss/train': 1.3960660696029663} -08/30/2021 15:44:34 - INFO - __main__ - Step 14626: {'lr': 0.0004910762308054638, 'samples': 2808192, 'steps': 14625, 'loss/train': 1.5810043811798096} -08/30/2021 15:44:34 - INFO - __main__ - Step 14627: {'lr': 0.0004910748255555593, 'samples': 2808384, 'steps': 14626, 'loss/train': 1.9512444734573364} -08/30/2021 15:44:36 - INFO - __main__ - Step 14628: {'lr': 0.0004910734201970302, 'samples': 2808576, 'steps': 14627, 'loss/train': 1.7666977643966675} -08/30/2021 15:44:36 - INFO - __main__ - Step 14629: {'lr': 0.0004910720147298772, 'samples': 2808768, 'steps': 14628, 'loss/train': 1.2753146886825562} -08/30/2021 15:44:37 - INFO - __main__ - Step 14630: {'lr': 0.0004910706091541009, 'samples': 2808960, 'steps': 14629, 'loss/train': 0.964402973651886} -08/30/2021 15:44:37 - INFO - __main__ - Step 14631: {'lr': 0.0004910692034697018, 'samples': 2809152, 'steps': 14630, 'loss/train': 1.3130466938018799} -08/30/2021 15:44:37 - INFO - __main__ - Step 14632: {'lr': 0.0004910677976766807, 'samples': 2809344, 'steps': 14631, 'loss/train': 1.5554542541503906} -08/30/2021 15:44:38 - INFO - __main__ - Step 14633: {'lr': 0.0004910663917750382, 'samples': 2809536, 'steps': 14632, 'loss/train': 1.7356388568878174} -08/30/2021 15:44:39 - INFO - __main__ - Step 14634: {'lr': 0.0004910649857647748, 'samples': 2809728, 'steps': 14633, 'loss/train': 1.9776718616485596} -08/30/2021 15:44:40 - INFO - __main__ - Step 14635: {'lr': 0.0004910635796458913, 'samples': 2809920, 'steps': 14634, 'loss/train': 2.3299033641815186} -08/30/2021 15:44:40 - INFO - __main__ - Step 14636: {'lr': 0.0004910621734183882, 'samples': 2810112, 'steps': 14635, 'loss/train': 2.086420774459839} -08/30/2021 15:44:40 - INFO - __main__ - Step 14637: {'lr': 0.0004910607670822663, 'samples': 2810304, 'steps': 14636, 'loss/train': 1.181735873222351} -08/30/2021 15:44:41 - INFO - __main__ - Step 14638: {'lr': 0.0004910593606375261, 'samples': 2810496, 'steps': 14637, 'loss/train': 1.4632714986801147} -08/30/2021 15:44:41 - INFO - __main__ - Step 14639: {'lr': 0.0004910579540841683, 'samples': 2810688, 'steps': 14638, 'loss/train': 2.17461895942688} -08/30/2021 15:44:43 - INFO - __main__ - Step 14640: {'lr': 0.0004910565474221934, 'samples': 2810880, 'steps': 14639, 'loss/train': 1.7071837186813354} -08/30/2021 15:44:43 - INFO - __main__ - Step 14641: {'lr': 0.0004910551406516022, 'samples': 2811072, 'steps': 14640, 'loss/train': 1.1795498132705688} -08/30/2021 15:44:43 - INFO - __main__ - Step 14642: {'lr': 0.0004910537337723954, 'samples': 2811264, 'steps': 14641, 'loss/train': 1.0120351314544678} -08/30/2021 15:44:44 - INFO - __main__ - Step 14643: {'lr': 0.0004910523267845733, 'samples': 2811456, 'steps': 14642, 'loss/train': 2.166316270828247} -08/30/2021 15:44:44 - INFO - __main__ - Step 14644: {'lr': 0.0004910509196881369, 'samples': 2811648, 'steps': 14643, 'loss/train': 1.7520242929458618} -08/30/2021 15:44:46 - INFO - __main__ - Step 14645: {'lr': 0.0004910495124830866, 'samples': 2811840, 'steps': 14644, 'loss/train': 0.8346025347709656} -08/30/2021 15:44:46 - INFO - __main__ - Step 14646: {'lr': 0.0004910481051694231, 'samples': 2812032, 'steps': 14645, 'loss/train': 2.275949478149414} -08/30/2021 15:44:46 - INFO - __main__ - Step 14647: {'lr': 0.0004910466977471471, 'samples': 2812224, 'steps': 14646, 'loss/train': 1.7611808776855469} -08/30/2021 15:44:47 - INFO - __main__ - Step 14648: {'lr': 0.0004910452902162592, 'samples': 2812416, 'steps': 14647, 'loss/train': 2.085137367248535} -08/30/2021 15:44:47 - INFO - __main__ - Step 14649: {'lr': 0.0004910438825767599, 'samples': 2812608, 'steps': 14648, 'loss/train': 2.0280754566192627} -08/30/2021 15:44:49 - INFO - __main__ - Step 14650: {'lr': 0.00049104247482865, 'samples': 2812800, 'steps': 14649, 'loss/train': 1.8058545589447021} -08/30/2021 15:44:49 - INFO - __main__ - Step 14651: {'lr': 0.0004910410669719301, 'samples': 2812992, 'steps': 14650, 'loss/train': 1.3903549909591675} -08/30/2021 15:44:49 - INFO - __main__ - Step 14652: {'lr': 0.0004910396590066008, 'samples': 2813184, 'steps': 14651, 'loss/train': 2.116035223007202} -08/30/2021 15:44:50 - INFO - __main__ - Step 14653: {'lr': 0.0004910382509326627, 'samples': 2813376, 'steps': 14652, 'loss/train': 1.607561707496643} -08/30/2021 15:44:50 - INFO - __main__ - Step 14654: {'lr': 0.0004910368427501166, 'samples': 2813568, 'steps': 14653, 'loss/train': 1.5568851232528687} -08/30/2021 15:44:52 - INFO - __main__ - Step 14655: {'lr': 0.000491035434458963, 'samples': 2813760, 'steps': 14654, 'loss/train': 1.773860216140747} -08/30/2021 15:44:53 - INFO - __main__ - Step 14656: {'lr': 0.0004910340260592024, 'samples': 2813952, 'steps': 14655, 'loss/train': 1.6594730615615845} -08/30/2021 15:44:53 - INFO - __main__ - Step 14657: {'lr': 0.0004910326175508357, 'samples': 2814144, 'steps': 14656, 'loss/train': 1.91238272190094} -08/30/2021 15:44:54 - INFO - __main__ - Step 14658: {'lr': 0.0004910312089338634, 'samples': 2814336, 'steps': 14657, 'loss/train': 1.8704928159713745} -08/30/2021 15:44:54 - INFO - __main__ - Step 14659: {'lr': 0.0004910298002082863, 'samples': 2814528, 'steps': 14658, 'loss/train': 2.0522892475128174} -08/30/2021 15:44:54 - INFO - __main__ - Step 14660: {'lr': 0.0004910283913741047, 'samples': 2814720, 'steps': 14659, 'loss/train': 1.9995373487472534} -08/30/2021 15:44:56 - INFO - __main__ - Step 14661: {'lr': 0.0004910269824313194, 'samples': 2814912, 'steps': 14660, 'loss/train': 0.10485048592090607} -08/30/2021 15:44:57 - INFO - __main__ - Step 14662: {'lr': 0.0004910255733799312, 'samples': 2815104, 'steps': 14661, 'loss/train': 1.678443431854248} -08/30/2021 15:44:57 - INFO - __main__ - Step 14663: {'lr': 0.0004910241642199406, 'samples': 2815296, 'steps': 14662, 'loss/train': 1.8793506622314453} -08/30/2021 15:44:57 - INFO - __main__ - Step 14664: {'lr': 0.0004910227549513481, 'samples': 2815488, 'steps': 14663, 'loss/train': 1.6896947622299194} -08/30/2021 15:44:58 - INFO - __main__ - Step 14665: {'lr': 0.0004910213455741546, 'samples': 2815680, 'steps': 14664, 'loss/train': 1.2330312728881836} -08/30/2021 15:44:59 - INFO - __main__ - Step 14666: {'lr': 0.0004910199360883605, 'samples': 2815872, 'steps': 14665, 'loss/train': 0.17734304070472717} -08/30/2021 15:45:00 - INFO - __main__ - Step 14667: {'lr': 0.0004910185264939667, 'samples': 2816064, 'steps': 14666, 'loss/train': 1.6526727676391602} -08/30/2021 15:45:00 - INFO - __main__ - Step 14668: {'lr': 0.0004910171167909734, 'samples': 2816256, 'steps': 14667, 'loss/train': 1.6394777297973633} -08/30/2021 15:45:00 - INFO - __main__ - Step 14669: {'lr': 0.0004910157069793816, 'samples': 2816448, 'steps': 14668, 'loss/train': 1.6216762065887451} -08/30/2021 15:45:01 - INFO - __main__ - Step 14670: {'lr': 0.000491014297059192, 'samples': 2816640, 'steps': 14669, 'loss/train': 1.1892478466033936} -08/30/2021 15:45:02 - INFO - __main__ - Step 14671: {'lr': 0.000491012887030405, 'samples': 2816832, 'steps': 14670, 'loss/train': 1.829420566558838} -08/30/2021 15:45:02 - INFO - __main__ - Step 14672: {'lr': 0.0004910114768930212, 'samples': 2817024, 'steps': 14671, 'loss/train': 1.589525818824768} -08/30/2021 15:45:03 - INFO - __main__ - Step 14673: {'lr': 0.0004910100666470415, 'samples': 2817216, 'steps': 14672, 'loss/train': 1.4008476734161377} -08/30/2021 15:45:03 - INFO - __main__ - Step 14674: {'lr': 0.0004910086562924663, 'samples': 2817408, 'steps': 14673, 'loss/train': 1.9427365064620972} -08/30/2021 15:45:03 - INFO - __main__ - Step 14675: {'lr': 0.0004910072458292963, 'samples': 2817600, 'steps': 14674, 'loss/train': 1.1250696182250977} -08/30/2021 15:45:05 - INFO - __main__ - Step 14676: {'lr': 0.0004910058352575322, 'samples': 2817792, 'steps': 14675, 'loss/train': 1.6572259664535522} -08/30/2021 15:45:06 - INFO - __main__ - Step 14677: {'lr': 0.0004910044245771745, 'samples': 2817984, 'steps': 14676, 'loss/train': 1.3050671815872192} -08/30/2021 15:45:06 - INFO - __main__ - Step 14678: {'lr': 0.0004910030137882241, 'samples': 2818176, 'steps': 14677, 'loss/train': 1.45987868309021} -08/30/2021 15:45:06 - INFO - __main__ - Step 14679: {'lr': 0.0004910016028906813, 'samples': 2818368, 'steps': 14678, 'loss/train': 1.8911447525024414} -08/30/2021 15:45:07 - INFO - __main__ - Step 14680: {'lr': 0.000491000191884547, 'samples': 2818560, 'steps': 14679, 'loss/train': 1.4819631576538086} -08/30/2021 15:45:07 - INFO - __main__ - Step 14681: {'lr': 0.0004909987807698217, 'samples': 2818752, 'steps': 14680, 'loss/train': 1.9897003173828125} -08/30/2021 15:45:09 - INFO - __main__ - Step 14682: {'lr': 0.000490997369546506, 'samples': 2818944, 'steps': 14681, 'loss/train': 1.1989651918411255} -08/30/2021 15:45:09 - INFO - __main__ - Step 14683: {'lr': 0.0004909959582146007, 'samples': 2819136, 'steps': 14682, 'loss/train': 1.6224522590637207} -08/30/2021 15:45:09 - INFO - __main__ - Step 14684: {'lr': 0.0004909945467741063, 'samples': 2819328, 'steps': 14683, 'loss/train': 1.3895024061203003} -08/30/2021 15:45:10 - INFO - __main__ - Step 14685: {'lr': 0.0004909931352250235, 'samples': 2819520, 'steps': 14684, 'loss/train': 1.818917989730835} -08/30/2021 15:45:10 - INFO - __main__ - Step 14686: {'lr': 0.0004909917235673529, 'samples': 2819712, 'steps': 14685, 'loss/train': 1.71416437625885} -08/30/2021 15:45:13 - INFO - __main__ - Step 14687: {'lr': 0.0004909903118010951, 'samples': 2819904, 'steps': 14686, 'loss/train': 0.31285062432289124} -08/30/2021 15:45:13 - INFO - __main__ - Step 14688: {'lr': 0.0004909888999262509, 'samples': 2820096, 'steps': 14687, 'loss/train': 1.394999623298645} -08/30/2021 15:45:14 - INFO - __main__ - Step 14689: {'lr': 0.0004909874879428207, 'samples': 2820288, 'steps': 14688, 'loss/train': 1.726932406425476} -08/30/2021 15:45:14 - INFO - __main__ - Step 14690: {'lr': 0.0004909860758508052, 'samples': 2820480, 'steps': 14689, 'loss/train': 1.9724937677383423} -08/30/2021 15:45:15 - INFO - __main__ - Step 14691: {'lr': 0.0004909846636502053, 'samples': 2820672, 'steps': 14690, 'loss/train': 1.2475253343582153} -08/30/2021 15:45:15 - INFO - __main__ - Step 14692: {'lr': 0.0004909832513410213, 'samples': 2820864, 'steps': 14691, 'loss/train': 0.6993420720100403} -08/30/2021 15:45:15 - INFO - __main__ - Step 14693: {'lr': 0.000490981838923254, 'samples': 2821056, 'steps': 14692, 'loss/train': 0.6544314026832581} -08/30/2021 15:45:17 - INFO - __main__ - Step 14694: {'lr': 0.000490980426396904, 'samples': 2821248, 'steps': 14693, 'loss/train': 0.6051246523857117} -08/30/2021 15:45:17 - INFO - __main__ - Step 14695: {'lr': 0.0004909790137619719, 'samples': 2821440, 'steps': 14694, 'loss/train': 1.8594558238983154} -08/30/2021 15:45:18 - INFO - __main__ - Step 14696: {'lr': 0.0004909776010184585, 'samples': 2821632, 'steps': 14695, 'loss/train': 1.3099099397659302} -08/30/2021 15:45:18 - INFO - __main__ - Step 14697: {'lr': 0.0004909761881663642, 'samples': 2821824, 'steps': 14696, 'loss/train': 0.8243240118026733} -08/30/2021 15:45:18 - INFO - __main__ - Step 14698: {'lr': 0.0004909747752056897, 'samples': 2822016, 'steps': 14697, 'loss/train': 1.732924461364746} -08/30/2021 15:45:20 - INFO - __main__ - Step 14699: {'lr': 0.0004909733621364358, 'samples': 2822208, 'steps': 14698, 'loss/train': 1.355660319328308} -08/30/2021 15:45:20 - INFO - __main__ - Step 14700: {'lr': 0.0004909719489586029, 'samples': 2822400, 'steps': 14699, 'loss/train': 1.5890251398086548} -08/30/2021 15:45:21 - INFO - __main__ - Step 14701: {'lr': 0.0004909705356721919, 'samples': 2822592, 'steps': 14700, 'loss/train': 1.6387518644332886} -08/30/2021 15:45:21 - INFO - __main__ - Step 14702: {'lr': 0.0004909691222772032, 'samples': 2822784, 'steps': 14701, 'loss/train': 1.9046984910964966} -08/30/2021 15:45:21 - INFO - __main__ - Step 14703: {'lr': 0.0004909677087736375, 'samples': 2822976, 'steps': 14702, 'loss/train': 2.410398006439209} -08/30/2021 15:45:23 - INFO - __main__ - Step 14704: {'lr': 0.0004909662951614955, 'samples': 2823168, 'steps': 14703, 'loss/train': 2.110142469406128} -08/30/2021 15:45:24 - INFO - __main__ - Step 14705: {'lr': 0.0004909648814407779, 'samples': 2823360, 'steps': 14704, 'loss/train': 1.9797699451446533} -08/30/2021 15:45:24 - INFO - __main__ - Step 14706: {'lr': 0.0004909634676114851, 'samples': 2823552, 'steps': 14705, 'loss/train': 0.40343761444091797} -08/30/2021 15:45:24 - INFO - __main__ - Step 14707: {'lr': 0.000490962053673618, 'samples': 2823744, 'steps': 14706, 'loss/train': 2.281370162963867} -08/30/2021 15:45:25 - INFO - __main__ - Step 14708: {'lr': 0.0004909606396271771, 'samples': 2823936, 'steps': 14707, 'loss/train': 1.9501404762268066} -08/30/2021 15:45:25 - INFO - __main__ - Step 14709: {'lr': 0.000490959225472163, 'samples': 2824128, 'steps': 14708, 'loss/train': 2.140007734298706} -08/30/2021 15:45:26 - INFO - __main__ - Step 14710: {'lr': 0.0004909578112085764, 'samples': 2824320, 'steps': 14709, 'loss/train': 1.8393839597702026} -08/30/2021 15:45:27 - INFO - __main__ - Step 14711: {'lr': 0.0004909563968364179, 'samples': 2824512, 'steps': 14710, 'loss/train': 1.8584641218185425} -08/30/2021 15:45:27 - INFO - __main__ - Step 14712: {'lr': 0.0004909549823556883, 'samples': 2824704, 'steps': 14711, 'loss/train': 1.9532889127731323} -08/30/2021 15:45:28 - INFO - __main__ - Step 14713: {'lr': 0.000490953567766388, 'samples': 2824896, 'steps': 14712, 'loss/train': 1.585712194442749} -08/30/2021 15:45:28 - INFO - __main__ - Step 14714: {'lr': 0.0004909521530685177, 'samples': 2825088, 'steps': 14713, 'loss/train': 2.0731117725372314} -08/30/2021 15:45:29 - INFO - __main__ - Step 14715: {'lr': 0.0004909507382620782, 'samples': 2825280, 'steps': 14714, 'loss/train': 2.686898946762085} -08/30/2021 15:45:30 - INFO - __main__ - Step 14716: {'lr': 0.0004909493233470699, 'samples': 2825472, 'steps': 14715, 'loss/train': 1.6656004190444946} -08/30/2021 15:45:30 - INFO - __main__ - Step 14717: {'lr': 0.0004909479083234936, 'samples': 2825664, 'steps': 14716, 'loss/train': 1.4297140836715698} -08/30/2021 15:45:31 - INFO - __main__ - Step 14718: {'lr': 0.0004909464931913499, 'samples': 2825856, 'steps': 14717, 'loss/train': 2.172856569290161} -08/30/2021 15:45:31 - INFO - __main__ - Step 14719: {'lr': 0.0004909450779506393, 'samples': 2826048, 'steps': 14718, 'loss/train': 1.8576105833053589} -08/30/2021 15:45:33 - INFO - __main__ - Step 14720: {'lr': 0.0004909436626013628, 'samples': 2826240, 'steps': 14719, 'loss/train': 2.227588653564453} -08/30/2021 15:45:33 - INFO - __main__ - Step 14721: {'lr': 0.0004909422471435207, 'samples': 2826432, 'steps': 14720, 'loss/train': 0.9746146202087402} -08/30/2021 15:45:34 - INFO - __main__ - Step 14722: {'lr': 0.0004909408315771136, 'samples': 2826624, 'steps': 14721, 'loss/train': 1.4908896684646606} -08/30/2021 15:45:34 - INFO - __main__ - Step 14723: {'lr': 0.0004909394159021425, 'samples': 2826816, 'steps': 14722, 'loss/train': 1.2262314558029175} -08/30/2021 15:45:34 - INFO - __main__ - Step 14724: {'lr': 0.0004909380001186077, 'samples': 2827008, 'steps': 14723, 'loss/train': 1.6169757843017578} -08/30/2021 15:45:36 - INFO - __main__ - Step 14725: {'lr': 0.00049093658422651, 'samples': 2827200, 'steps': 14724, 'loss/train': 1.6944632530212402} -08/30/2021 15:45:36 - INFO - __main__ - Step 14726: {'lr': 0.00049093516822585, 'samples': 2827392, 'steps': 14725, 'loss/train': 1.458341121673584} -08/30/2021 15:45:37 - INFO - __main__ - Step 14727: {'lr': 0.0004909337521166282, 'samples': 2827584, 'steps': 14726, 'loss/train': 2.004753351211548} -08/30/2021 15:45:37 - INFO - __main__ - Step 14728: {'lr': 0.0004909323358988455, 'samples': 2827776, 'steps': 14727, 'loss/train': 0.2734319269657135} -08/30/2021 15:45:37 - INFO - __main__ - Step 14729: {'lr': 0.0004909309195725024, 'samples': 2827968, 'steps': 14728, 'loss/train': 2.0499861240386963} -08/30/2021 15:45:38 - INFO - __main__ - Step 14730: {'lr': 0.0004909295031375996, 'samples': 2828160, 'steps': 14729, 'loss/train': 1.128167748451233} -08/30/2021 15:45:40 - INFO - __main__ - Step 14731: {'lr': 0.0004909280865941375, 'samples': 2828352, 'steps': 14730, 'loss/train': 1.9347211122512817} -08/30/2021 15:45:40 - INFO - __main__ - Step 14732: {'lr': 0.0004909266699421171, 'samples': 2828544, 'steps': 14731, 'loss/train': 2.115064859390259} -08/30/2021 15:45:40 - INFO - __main__ - Step 14733: {'lr': 0.0004909252531815388, 'samples': 2828736, 'steps': 14732, 'loss/train': 2.062617540359497} -08/30/2021 15:45:41 - INFO - __main__ - Step 14734: {'lr': 0.0004909238363124033, 'samples': 2828928, 'steps': 14733, 'loss/train': 2.1753149032592773} -08/30/2021 15:45:41 - INFO - __main__ - Step 14735: {'lr': 0.0004909224193347112, 'samples': 2829120, 'steps': 14734, 'loss/train': 1.2242854833602905} -08/30/2021 15:45:43 - INFO - __main__ - Step 14736: {'lr': 0.0004909210022484633, 'samples': 2829312, 'steps': 14735, 'loss/train': 1.9963405132293701} -08/30/2021 15:45:43 - INFO - __main__ - Step 14737: {'lr': 0.00049091958505366, 'samples': 2829504, 'steps': 14736, 'loss/train': 1.435778021812439} -08/30/2021 15:45:44 - INFO - __main__ - Step 14738: {'lr': 0.000490918167750302, 'samples': 2829696, 'steps': 14737, 'loss/train': 0.13562822341918945} -08/30/2021 15:45:44 - INFO - __main__ - Step 14739: {'lr': 0.00049091675033839, 'samples': 2829888, 'steps': 14738, 'loss/train': 1.2889208793640137} -08/30/2021 15:45:44 - INFO - __main__ - Step 14740: {'lr': 0.0004909153328179248, 'samples': 2830080, 'steps': 14739, 'loss/train': 2.167332410812378} -08/30/2021 15:45:45 - INFO - __main__ - Step 14741: {'lr': 0.0004909139151889067, 'samples': 2830272, 'steps': 14740, 'loss/train': 1.9671624898910522} -08/30/2021 15:45:46 - INFO - __main__ - Step 14742: {'lr': 0.0004909124974513366, 'samples': 2830464, 'steps': 14741, 'loss/train': 1.864754557609558} -08/30/2021 15:45:47 - INFO - __main__ - Step 14743: {'lr': 0.000490911079605215, 'samples': 2830656, 'steps': 14742, 'loss/train': 1.824412226676941} -08/30/2021 15:45:47 - INFO - __main__ - Step 14744: {'lr': 0.0004909096616505426, 'samples': 2830848, 'steps': 14743, 'loss/train': 0.8528931140899658} -08/30/2021 15:45:48 - INFO - __main__ - Step 14745: {'lr': 0.00049090824358732, 'samples': 2831040, 'steps': 14744, 'loss/train': 1.975135326385498} -08/30/2021 15:45:48 - INFO - __main__ - Step 14746: {'lr': 0.0004909068254155479, 'samples': 2831232, 'steps': 14745, 'loss/train': 1.5108544826507568} -08/30/2021 15:45:50 - INFO - __main__ - Step 14747: {'lr': 0.0004909054071352269, 'samples': 2831424, 'steps': 14746, 'loss/train': 1.790999412536621} -08/30/2021 15:45:50 - INFO - __main__ - Step 14748: {'lr': 0.0004909039887463576, 'samples': 2831616, 'steps': 14747, 'loss/train': 1.9513864517211914} -08/30/2021 15:45:51 - INFO - __main__ - Step 14749: {'lr': 0.0004909025702489407, 'samples': 2831808, 'steps': 14748, 'loss/train': 0.9044994115829468} -08/30/2021 15:45:51 - INFO - __main__ - Step 14750: {'lr': 0.0004909011516429768, 'samples': 2832000, 'steps': 14749, 'loss/train': 1.6430326700210571} -08/30/2021 15:45:51 - INFO - __main__ - Step 14751: {'lr': 0.0004908997329284667, 'samples': 2832192, 'steps': 14750, 'loss/train': 1.896259069442749} -08/30/2021 15:45:52 - INFO - __main__ - Step 14752: {'lr': 0.0004908983141054107, 'samples': 2832384, 'steps': 14751, 'loss/train': 2.2090365886688232} -08/30/2021 15:45:53 - INFO - __main__ - Step 14753: {'lr': 0.0004908968951738098, 'samples': 2832576, 'steps': 14752, 'loss/train': 2.1068897247314453} -08/30/2021 15:45:54 - INFO - __main__ - Step 14754: {'lr': 0.0004908954761336643, 'samples': 2832768, 'steps': 14753, 'loss/train': 1.7195020914077759} -08/30/2021 15:45:54 - INFO - __main__ - Step 14755: {'lr': 0.0004908940569849751, 'samples': 2832960, 'steps': 14754, 'loss/train': 3.5167717933654785} -08/30/2021 15:45:54 - INFO - __main__ - Step 14756: {'lr': 0.0004908926377277428, 'samples': 2833152, 'steps': 14755, 'loss/train': 1.8004331588745117} -08/30/2021 15:45:55 - INFO - __main__ - Step 14757: {'lr': 0.000490891218361968, 'samples': 2833344, 'steps': 14756, 'loss/train': 1.5686569213867188} -08/30/2021 15:45:56 - INFO - __main__ - Step 14758: {'lr': 0.0004908897988876512, 'samples': 2833536, 'steps': 14757, 'loss/train': 2.927267551422119} -08/30/2021 15:45:57 - INFO - __main__ - Step 14759: {'lr': 0.0004908883793047934, 'samples': 2833728, 'steps': 14758, 'loss/train': 1.738626480102539} -08/30/2021 15:45:57 - INFO - __main__ - Step 14760: {'lr': 0.0004908869596133948, 'samples': 2833920, 'steps': 14759, 'loss/train': 1.6574175357818604} -08/30/2021 15:45:58 - INFO - __main__ - Step 14761: {'lr': 0.0004908855398134563, 'samples': 2834112, 'steps': 14760, 'loss/train': 2.0832979679107666} -08/30/2021 15:45:58 - INFO - __main__ - Step 14762: {'lr': 0.0004908841199049785, 'samples': 2834304, 'steps': 14761, 'loss/train': 1.847208023071289} -08/30/2021 15:46:00 - INFO - __main__ - Step 14763: {'lr': 0.0004908826998879621, 'samples': 2834496, 'steps': 14762, 'loss/train': 1.6407380104064941} -08/30/2021 15:46:00 - INFO - __main__ - Step 14764: {'lr': 0.0004908812797624077, 'samples': 2834688, 'steps': 14763, 'loss/train': 2.1208245754241943} -08/30/2021 15:46:00 - INFO - __main__ - Step 14765: {'lr': 0.0004908798595283159, 'samples': 2834880, 'steps': 14764, 'loss/train': 2.920278549194336} -08/30/2021 15:46:01 - INFO - __main__ - Step 14766: {'lr': 0.0004908784391856872, 'samples': 2835072, 'steps': 14765, 'loss/train': 1.6570030450820923} -08/30/2021 15:46:01 - INFO - __main__ - Step 14767: {'lr': 0.0004908770187345225, 'samples': 2835264, 'steps': 14766, 'loss/train': 1.491756796836853} -08/30/2021 15:46:01 - INFO - __main__ - Step 14768: {'lr': 0.0004908755981748223, 'samples': 2835456, 'steps': 14767, 'loss/train': 2.148419141769409} -08/30/2021 15:46:03 - INFO - __main__ - Step 14769: {'lr': 0.0004908741775065873, 'samples': 2835648, 'steps': 14768, 'loss/train': 1.8597686290740967} -08/30/2021 15:46:03 - INFO - __main__ - Step 14770: {'lr': 0.0004908727567298181, 'samples': 2835840, 'steps': 14769, 'loss/train': 1.5146944522857666} -08/30/2021 15:46:04 - INFO - __main__ - Step 14771: {'lr': 0.0004908713358445154, 'samples': 2836032, 'steps': 14770, 'loss/train': 1.489193320274353} -08/30/2021 15:46:04 - INFO - __main__ - Step 14772: {'lr': 0.0004908699148506797, 'samples': 2836224, 'steps': 14771, 'loss/train': 2.9027161598205566} -08/30/2021 15:46:04 - INFO - __main__ - Step 14773: {'lr': 0.0004908684937483119, 'samples': 2836416, 'steps': 14772, 'loss/train': 1.098861813545227} -08/30/2021 15:46:06 - INFO - __main__ - Step 14774: {'lr': 0.0004908670725374122, 'samples': 2836608, 'steps': 14773, 'loss/train': 1.5781524181365967} -08/30/2021 15:46:06 - INFO - __main__ - Step 14775: {'lr': 0.0004908656512179817, 'samples': 2836800, 'steps': 14774, 'loss/train': 1.9069923162460327} -08/30/2021 15:46:07 - INFO - __main__ - Step 14776: {'lr': 0.0004908642297900209, 'samples': 2836992, 'steps': 14775, 'loss/train': 1.7256543636322021} -08/30/2021 15:46:07 - INFO - __main__ - Step 14777: {'lr': 0.0004908628082535303, 'samples': 2837184, 'steps': 14776, 'loss/train': 1.6065256595611572} -08/30/2021 15:46:07 - INFO - __main__ - Step 14778: {'lr': 0.0004908613866085106, 'samples': 2837376, 'steps': 14777, 'loss/train': 1.8986363410949707} -08/30/2021 15:46:09 - INFO - __main__ - Step 14779: {'lr': 0.0004908599648549626, 'samples': 2837568, 'steps': 14778, 'loss/train': 2.2807629108428955} -08/30/2021 15:46:09 - INFO - __main__ - Step 14780: {'lr': 0.0004908585429928867, 'samples': 2837760, 'steps': 14779, 'loss/train': 1.5258680582046509} -08/30/2021 15:46:10 - INFO - __main__ - Step 14781: {'lr': 0.0004908571210222837, 'samples': 2837952, 'steps': 14780, 'loss/train': 1.6942903995513916} -08/30/2021 15:46:10 - INFO - __main__ - Step 14782: {'lr': 0.0004908556989431543, 'samples': 2838144, 'steps': 14781, 'loss/train': 1.432295322418213} -08/30/2021 15:46:10 - INFO - __main__ - Step 14783: {'lr': 0.0004908542767554988, 'samples': 2838336, 'steps': 14782, 'loss/train': 1.9186686277389526} -08/30/2021 15:46:12 - INFO - __main__ - Step 14784: {'lr': 0.0004908528544593184, 'samples': 2838528, 'steps': 14783, 'loss/train': 1.4333107471466064} -08/30/2021 15:46:12 - INFO - __main__ - Step 14785: {'lr': 0.0004908514320546132, 'samples': 2838720, 'steps': 14784, 'loss/train': 0.1518404483795166} -08/30/2021 15:46:13 - INFO - __main__ - Step 14786: {'lr': 0.000490850009541384, 'samples': 2838912, 'steps': 14785, 'loss/train': 1.9479858875274658} -08/30/2021 15:46:13 - INFO - __main__ - Step 14787: {'lr': 0.0004908485869196317, 'samples': 2839104, 'steps': 14786, 'loss/train': 1.773112416267395} -08/30/2021 15:46:13 - INFO - __main__ - Step 14788: {'lr': 0.0004908471641893566, 'samples': 2839296, 'steps': 14787, 'loss/train': 1.6422818899154663} -08/30/2021 15:46:15 - INFO - __main__ - Step 14789: {'lr': 0.0004908457413505596, 'samples': 2839488, 'steps': 14788, 'loss/train': 1.4594115018844604} -08/30/2021 15:46:15 - INFO - __main__ - Step 14790: {'lr': 0.0004908443184032411, 'samples': 2839680, 'steps': 14789, 'loss/train': 1.9129072427749634} -08/30/2021 15:46:16 - INFO - __main__ - Step 14791: {'lr': 0.0004908428953474019, 'samples': 2839872, 'steps': 14790, 'loss/train': 1.6468173265457153} -08/30/2021 15:46:16 - INFO - __main__ - Step 14792: {'lr': 0.0004908414721830427, 'samples': 2840064, 'steps': 14791, 'loss/train': 1.5827839374542236} -08/30/2021 15:46:16 - INFO - __main__ - Step 14793: {'lr': 0.000490840048910164, 'samples': 2840256, 'steps': 14792, 'loss/train': 1.5768771171569824} -08/30/2021 15:46:18 - INFO - __main__ - Step 14794: {'lr': 0.0004908386255287664, 'samples': 2840448, 'steps': 14793, 'loss/train': 1.356516718864441} -08/30/2021 15:46:19 - INFO - __main__ - Step 14795: {'lr': 0.0004908372020388508, 'samples': 2840640, 'steps': 14794, 'loss/train': 1.7304892539978027} -08/30/2021 15:46:19 - INFO - __main__ - Step 14796: {'lr': 0.0004908357784404175, 'samples': 2840832, 'steps': 14795, 'loss/train': 1.7871992588043213} -08/30/2021 15:46:19 - INFO - __main__ - Step 14797: {'lr': 0.0004908343547334674, 'samples': 2841024, 'steps': 14796, 'loss/train': 0.23681989312171936} -08/30/2021 15:46:20 - INFO - __main__ - Step 14798: {'lr': 0.0004908329309180011, 'samples': 2841216, 'steps': 14797, 'loss/train': 2.157694101333618} -08/30/2021 15:46:22 - INFO - __main__ - Step 14799: {'lr': 0.0004908315069940191, 'samples': 2841408, 'steps': 14798, 'loss/train': 2.138364553451538} -08/30/2021 15:46:22 - INFO - __main__ - Step 14800: {'lr': 0.0004908300829615222, 'samples': 2841600, 'steps': 14799, 'loss/train': 1.54379403591156} -08/30/2021 15:46:23 - INFO - __main__ - Step 14801: {'lr': 0.000490828658820511, 'samples': 2841792, 'steps': 14800, 'loss/train': 1.8878065347671509} -08/30/2021 15:46:23 - INFO - __main__ - Step 14802: {'lr': 0.0004908272345709861, 'samples': 2841984, 'steps': 14801, 'loss/train': 1.5881515741348267} -08/30/2021 15:46:23 - INFO - __main__ - Step 14803: {'lr': 0.0004908258102129481, 'samples': 2842176, 'steps': 14802, 'loss/train': 1.6217010021209717} -08/30/2021 15:46:24 - INFO - __main__ - Step 14804: {'lr': 0.0004908243857463978, 'samples': 2842368, 'steps': 14803, 'loss/train': 1.1415027379989624} -08/30/2021 15:46:25 - INFO - __main__ - Step 14805: {'lr': 0.0004908229611713357, 'samples': 2842560, 'steps': 14804, 'loss/train': 1.365323781967163} -08/30/2021 15:46:26 - INFO - __main__ - Step 14806: {'lr': 0.0004908215364877625, 'samples': 2842752, 'steps': 14805, 'loss/train': 2.133239269256592} -08/30/2021 15:46:26 - INFO - __main__ - Step 14807: {'lr': 0.0004908201116956788, 'samples': 2842944, 'steps': 14806, 'loss/train': 1.3232611417770386} -08/30/2021 15:46:26 - INFO - __main__ - Step 14808: {'lr': 0.0004908186867950854, 'samples': 2843136, 'steps': 14807, 'loss/train': 2.03147292137146} -08/30/2021 15:46:27 - INFO - __main__ - Step 14809: {'lr': 0.0004908172617859826, 'samples': 2843328, 'steps': 14808, 'loss/train': 1.729400396347046} -08/30/2021 15:46:28 - INFO - __main__ - Step 14810: {'lr': 0.0004908158366683714, 'samples': 2843520, 'steps': 14809, 'loss/train': 1.1836036443710327} -08/30/2021 15:46:28 - INFO - __main__ - Step 14811: {'lr': 0.0004908144114422523, 'samples': 2843712, 'steps': 14810, 'loss/train': 1.562010407447815} -08/30/2021 15:46:29 - INFO - __main__ - Step 14812: {'lr': 0.000490812986107626, 'samples': 2843904, 'steps': 14811, 'loss/train': 1.824299931526184} -08/30/2021 15:46:29 - INFO - __main__ - Step 14813: {'lr': 0.000490811560664493, 'samples': 2844096, 'steps': 14812, 'loss/train': 1.4921859502792358} -08/30/2021 15:46:30 - INFO - __main__ - Step 14814: {'lr': 0.000490810135112854, 'samples': 2844288, 'steps': 14813, 'loss/train': 1.8960782289505005} -08/30/2021 15:46:31 - INFO - __main__ - Step 14815: {'lr': 0.0004908087094527097, 'samples': 2844480, 'steps': 14814, 'loss/train': 1.6396292448043823} -08/30/2021 15:46:31 - INFO - __main__ - Step 14816: {'lr': 0.0004908072836840607, 'samples': 2844672, 'steps': 14815, 'loss/train': 1.745307445526123} -08/30/2021 15:46:32 - INFO - __main__ - Step 14817: {'lr': 0.0004908058578069077, 'samples': 2844864, 'steps': 14816, 'loss/train': 1.9213478565216064} -08/30/2021 15:46:32 - INFO - __main__ - Step 14818: {'lr': 0.0004908044318212512, 'samples': 2845056, 'steps': 14817, 'loss/train': 1.8593806028366089} -08/30/2021 15:46:32 - INFO - __main__ - Step 14819: {'lr': 0.000490803005727092, 'samples': 2845248, 'steps': 14818, 'loss/train': 1.5759621858596802} -08/30/2021 15:46:34 - INFO - __main__ - Step 14820: {'lr': 0.0004908015795244307, 'samples': 2845440, 'steps': 14819, 'loss/train': 0.7184984683990479} -08/30/2021 15:46:34 - INFO - __main__ - Step 14821: {'lr': 0.0004908001532132679, 'samples': 2845632, 'steps': 14820, 'loss/train': 1.781602382659912} -08/30/2021 15:46:35 - INFO - __main__ - Step 14822: {'lr': 0.0004907987267936042, 'samples': 2845824, 'steps': 14821, 'loss/train': 1.566272497177124} -08/30/2021 15:46:35 - INFO - __main__ - Step 14823: {'lr': 0.0004907973002654404, 'samples': 2846016, 'steps': 14822, 'loss/train': 1.946954607963562} -08/30/2021 15:46:35 - INFO - __main__ - Step 14824: {'lr': 0.0004907958736287771, 'samples': 2846208, 'steps': 14823, 'loss/train': 1.6509966850280762} -08/30/2021 15:46:36 - INFO - __main__ - Step 14825: {'lr': 0.0004907944468836148, 'samples': 2846400, 'steps': 14824, 'loss/train': 0.7784429788589478} -08/30/2021 15:46:37 - INFO - __main__ - Step 14826: {'lr': 0.0004907930200299543, 'samples': 2846592, 'steps': 14825, 'loss/train': 1.9518537521362305} -08/30/2021 15:46:38 - INFO - __main__ - Step 14827: {'lr': 0.0004907915930677961, 'samples': 2846784, 'steps': 14826, 'loss/train': 1.9460275173187256} -08/30/2021 15:46:38 - INFO - __main__ - Step 14828: {'lr': 0.000490790165997141, 'samples': 2846976, 'steps': 14827, 'loss/train': 1.861189603805542} -08/30/2021 15:46:39 - INFO - __main__ - Step 14829: {'lr': 0.0004907887388179896, 'samples': 2847168, 'steps': 14828, 'loss/train': 1.3093841075897217} -08/30/2021 15:46:39 - INFO - __main__ - Step 14830: {'lr': 0.0004907873115303424, 'samples': 2847360, 'steps': 14829, 'loss/train': 1.8715815544128418} -08/30/2021 15:46:40 - INFO - __main__ - Step 14831: {'lr': 0.0004907858841342002, 'samples': 2847552, 'steps': 14830, 'loss/train': 1.680856466293335} -08/30/2021 15:46:41 - INFO - __main__ - Step 14832: {'lr': 0.0004907844566295637, 'samples': 2847744, 'steps': 14831, 'loss/train': 1.2978127002716064} -08/30/2021 15:46:41 - INFO - __main__ - Step 14833: {'lr': 0.0004907830290164332, 'samples': 2847936, 'steps': 14832, 'loss/train': 0.87298583984375} -08/30/2021 15:46:41 - INFO - __main__ - Step 14834: {'lr': 0.0004907816012948098, 'samples': 2848128, 'steps': 14833, 'loss/train': 1.9467687606811523} -08/30/2021 15:46:42 - INFO - __main__ - Step 14835: {'lr': 0.0004907801734646938, 'samples': 2848320, 'steps': 14834, 'loss/train': 1.938592553138733} -08/30/2021 15:46:43 - INFO - __main__ - Step 14836: {'lr': 0.000490778745526086, 'samples': 2848512, 'steps': 14835, 'loss/train': 1.41289484500885} -08/30/2021 15:46:44 - INFO - __main__ - Step 14837: {'lr': 0.000490777317478987, 'samples': 2848704, 'steps': 14836, 'loss/train': 1.4709492921829224} -08/30/2021 15:46:44 - INFO - __main__ - Step 14838: {'lr': 0.0004907758893233975, 'samples': 2848896, 'steps': 14837, 'loss/train': 1.7636767625808716} -08/30/2021 15:46:44 - INFO - __main__ - Step 14839: {'lr': 0.0004907744610593181, 'samples': 2849088, 'steps': 14838, 'loss/train': 2.2299578189849854} -08/30/2021 15:46:45 - INFO - __main__ - Step 14840: {'lr': 0.0004907730326867495, 'samples': 2849280, 'steps': 14839, 'loss/train': 1.736441731452942} -08/30/2021 15:46:46 - INFO - __main__ - Step 14841: {'lr': 0.0004907716042056921, 'samples': 2849472, 'steps': 14840, 'loss/train': 1.7323708534240723} -08/30/2021 15:46:47 - INFO - __main__ - Step 14842: {'lr': 0.0004907701756161469, 'samples': 2849664, 'steps': 14841, 'loss/train': 1.5519299507141113} -08/30/2021 15:46:47 - INFO - __main__ - Step 14843: {'lr': 0.0004907687469181143, 'samples': 2849856, 'steps': 14842, 'loss/train': 1.7373147010803223} -08/30/2021 15:46:47 - INFO - __main__ - Step 14844: {'lr': 0.000490767318111595, 'samples': 2850048, 'steps': 14843, 'loss/train': 1.595334768295288} -08/30/2021 15:46:48 - INFO - __main__ - Step 14845: {'lr': 0.0004907658891965897, 'samples': 2850240, 'steps': 14844, 'loss/train': 2.56266713142395} -08/30/2021 15:46:50 - INFO - __main__ - Step 14846: {'lr': 0.000490764460173099, 'samples': 2850432, 'steps': 14845, 'loss/train': 2.260747194290161} -08/30/2021 15:46:50 - INFO - __main__ - Step 14847: {'lr': 0.0004907630310411236, 'samples': 2850624, 'steps': 14846, 'loss/train': 1.8458120822906494} -08/30/2021 15:46:51 - INFO - __main__ - Step 14848: {'lr': 0.000490761601800664, 'samples': 2850816, 'steps': 14847, 'loss/train': 1.4040337800979614} -08/30/2021 15:46:51 - INFO - __main__ - Step 14849: {'lr': 0.000490760172451721, 'samples': 2851008, 'steps': 14848, 'loss/train': 1.395462989807129} -08/30/2021 15:46:51 - INFO - __main__ - Step 14850: {'lr': 0.0004907587429942952, 'samples': 2851200, 'steps': 14849, 'loss/train': 1.7758604288101196} -08/30/2021 15:46:52 - INFO - __main__ - Step 14851: {'lr': 0.0004907573134283872, 'samples': 2851392, 'steps': 14850, 'loss/train': 0.34356027841567993} -08/30/2021 15:46:54 - INFO - __main__ - Step 14852: {'lr': 0.0004907558837539976, 'samples': 2851584, 'steps': 14851, 'loss/train': 0.09492310881614685} -08/30/2021 15:46:54 - INFO - __main__ - Step 14853: {'lr': 0.0004907544539711272, 'samples': 2851776, 'steps': 14852, 'loss/train': 2.0711779594421387} -08/30/2021 15:46:54 - INFO - __main__ - Step 14854: {'lr': 0.0004907530240797765, 'samples': 2851968, 'steps': 14853, 'loss/train': 1.9771314859390259} -08/30/2021 15:46:55 - INFO - __main__ - Step 14855: {'lr': 0.0004907515940799463, 'samples': 2852160, 'steps': 14854, 'loss/train': 1.5970083475112915} -08/30/2021 15:46:55 - INFO - __main__ - Step 14856: {'lr': 0.000490750163971637, 'samples': 2852352, 'steps': 14855, 'loss/train': 2.4142673015594482} -08/30/2021 15:46:57 - INFO - __main__ - Step 14857: {'lr': 0.0004907487337548495, 'samples': 2852544, 'steps': 14856, 'loss/train': 1.8362771272659302} -08/30/2021 15:46:57 - INFO - __main__ - Step 14858: {'lr': 0.0004907473034295843, 'samples': 2852736, 'steps': 14857, 'loss/train': 1.6539779901504517} -08/30/2021 15:46:57 - INFO - __main__ - Step 14859: {'lr': 0.0004907458729958422, 'samples': 2852928, 'steps': 14858, 'loss/train': 1.4540634155273438} -08/30/2021 15:46:58 - INFO - __main__ - Step 14860: {'lr': 0.0004907444424536235, 'samples': 2853120, 'steps': 14859, 'loss/train': 2.2673745155334473} -08/30/2021 15:46:58 - INFO - __main__ - Step 14861: {'lr': 0.0004907430118029293, 'samples': 2853312, 'steps': 14860, 'loss/train': 1.9660253524780273} -08/30/2021 15:47:00 - INFO - __main__ - Step 14862: {'lr': 0.0004907415810437598, 'samples': 2853504, 'steps': 14861, 'loss/train': 1.8410143852233887} -08/30/2021 15:47:00 - INFO - __main__ - Step 14863: {'lr': 0.0004907401501761159, 'samples': 2853696, 'steps': 14862, 'loss/train': 1.4958369731903076} -08/30/2021 15:47:00 - INFO - __main__ - Step 14864: {'lr': 0.0004907387191999984, 'samples': 2853888, 'steps': 14863, 'loss/train': 1.8503696918487549} -08/30/2021 15:47:01 - INFO - __main__ - Step 14865: {'lr': 0.0004907372881154075, 'samples': 2854080, 'steps': 14864, 'loss/train': 2.0514066219329834} -08/30/2021 15:47:01 - INFO - __main__ - Step 14866: {'lr': 0.0004907358569223442, 'samples': 2854272, 'steps': 14865, 'loss/train': 1.3077809810638428} -08/30/2021 15:47:01 - INFO - __main__ - Step 14867: {'lr': 0.000490734425620809, 'samples': 2854464, 'steps': 14866, 'loss/train': 1.553786039352417} -08/30/2021 15:47:03 - INFO - __main__ - Step 14868: {'lr': 0.0004907329942108027, 'samples': 2854656, 'steps': 14867, 'loss/train': 1.9677926301956177} -08/30/2021 15:47:04 - INFO - __main__ - Step 14869: {'lr': 0.0004907315626923258, 'samples': 2854848, 'steps': 14868, 'loss/train': 2.0620124340057373} -08/30/2021 15:47:04 - INFO - __main__ - Step 14870: {'lr': 0.0004907301310653789, 'samples': 2855040, 'steps': 14869, 'loss/train': 2.2896623611450195} -08/30/2021 15:47:04 - INFO - __main__ - Step 14871: {'lr': 0.0004907286993299627, 'samples': 2855232, 'steps': 14870, 'loss/train': 2.145505666732788} -08/30/2021 15:47:05 - INFO - __main__ - Step 14872: {'lr': 0.0004907272674860779, 'samples': 2855424, 'steps': 14871, 'loss/train': 1.4551688432693481} -08/30/2021 15:47:06 - INFO - __main__ - Step 14873: {'lr': 0.0004907258355337251, 'samples': 2855616, 'steps': 14872, 'loss/train': 1.6255871057510376} -08/30/2021 15:47:06 - INFO - __main__ - Step 14874: {'lr': 0.0004907244034729049, 'samples': 2855808, 'steps': 14873, 'loss/train': 2.0014379024505615} -08/30/2021 15:47:07 - INFO - __main__ - Step 14875: {'lr': 0.0004907229713036181, 'samples': 2856000, 'steps': 14874, 'loss/train': 1.3547459840774536} -08/30/2021 15:47:07 - INFO - __main__ - Step 14876: {'lr': 0.0004907215390258652, 'samples': 2856192, 'steps': 14875, 'loss/train': 0.11287747323513031} -08/30/2021 15:47:08 - INFO - __main__ - Step 14877: {'lr': 0.0004907201066396469, 'samples': 2856384, 'steps': 14876, 'loss/train': 1.8825775384902954} -08/30/2021 15:47:09 - INFO - __main__ - Step 14878: {'lr': 0.0004907186741449638, 'samples': 2856576, 'steps': 14877, 'loss/train': 1.454063892364502} -08/30/2021 15:47:09 - INFO - __main__ - Step 14879: {'lr': 0.0004907172415418166, 'samples': 2856768, 'steps': 14878, 'loss/train': 1.7126121520996094} -08/30/2021 15:47:10 - INFO - __main__ - Step 14880: {'lr': 0.0004907158088302059, 'samples': 2856960, 'steps': 14879, 'loss/train': 2.1869077682495117} -08/30/2021 15:47:10 - INFO - __main__ - Step 14881: {'lr': 0.0004907143760101325, 'samples': 2857152, 'steps': 14880, 'loss/train': 1.6359323263168335} -08/30/2021 15:47:11 - INFO - __main__ - Step 14882: {'lr': 0.0004907129430815968, 'samples': 2857344, 'steps': 14881, 'loss/train': 1.8957350254058838} -08/30/2021 15:47:12 - INFO - __main__ - Step 14883: {'lr': 0.0004907115100445996, 'samples': 2857536, 'steps': 14882, 'loss/train': 1.642533302307129} -08/30/2021 15:47:12 - INFO - __main__ - Step 14884: {'lr': 0.0004907100768991415, 'samples': 2857728, 'steps': 14883, 'loss/train': 1.667534351348877} -08/30/2021 15:47:13 - INFO - __main__ - Step 14885: {'lr': 0.0004907086436452231, 'samples': 2857920, 'steps': 14884, 'loss/train': 1.2480792999267578} -08/30/2021 15:47:13 - INFO - __main__ - Step 14886: {'lr': 0.0004907072102828451, 'samples': 2858112, 'steps': 14885, 'loss/train': 1.7617106437683105} -08/30/2021 15:47:14 - INFO - __main__ - Step 14887: {'lr': 0.0004907057768120082, 'samples': 2858304, 'steps': 14886, 'loss/train': 1.7082254886627197} -08/30/2021 15:47:15 - INFO - __main__ - Step 14888: {'lr': 0.000490704343232713, 'samples': 2858496, 'steps': 14887, 'loss/train': 1.3154035806655884} -08/30/2021 15:47:16 - INFO - __main__ - Step 14889: {'lr': 0.0004907029095449602, 'samples': 2858688, 'steps': 14888, 'loss/train': 1.9118108749389648} -08/30/2021 15:47:16 - INFO - __main__ - Step 14890: {'lr': 0.0004907014757487503, 'samples': 2858880, 'steps': 14889, 'loss/train': 1.3688138723373413} -08/30/2021 15:47:16 - INFO - __main__ - Step 14891: {'lr': 0.0004907000418440839, 'samples': 2859072, 'steps': 14890, 'loss/train': 1.8967663049697876} -08/30/2021 15:47:17 - INFO - __main__ - Step 14892: {'lr': 0.000490698607830962, 'samples': 2859264, 'steps': 14891, 'loss/train': 1.5738953351974487} -08/30/2021 15:47:17 - INFO - __main__ - Step 14893: {'lr': 0.0004906971737093849, 'samples': 2859456, 'steps': 14892, 'loss/train': 2.4357826709747314} -08/30/2021 15:47:19 - INFO - __main__ - Step 14894: {'lr': 0.0004906957394793534, 'samples': 2859648, 'steps': 14893, 'loss/train': 2.1864922046661377} -08/30/2021 15:47:19 - INFO - __main__ - Step 14895: {'lr': 0.0004906943051408682, 'samples': 2859840, 'steps': 14894, 'loss/train': 1.4296636581420898} -08/30/2021 15:47:19 - INFO - __main__ - Step 14896: {'lr': 0.0004906928706939296, 'samples': 2860032, 'steps': 14895, 'loss/train': 2.200885057449341} -08/30/2021 15:47:20 - INFO - __main__ - Step 14897: {'lr': 0.0004906914361385387, 'samples': 2860224, 'steps': 14896, 'loss/train': 0.5324799418449402} -08/30/2021 15:47:20 - INFO - __main__ - Step 14898: {'lr': 0.0004906900014746959, 'samples': 2860416, 'steps': 14897, 'loss/train': 1.1619032621383667} -08/30/2021 15:47:22 - INFO - __main__ - Step 14899: {'lr': 0.000490688566702402, 'samples': 2860608, 'steps': 14898, 'loss/train': 1.9572542905807495} -08/30/2021 15:47:22 - INFO - __main__ - Step 14900: {'lr': 0.0004906871318216575, 'samples': 2860800, 'steps': 14899, 'loss/train': 1.9340944290161133} -08/30/2021 15:47:22 - INFO - __main__ - Step 14901: {'lr': 0.000490685696832463, 'samples': 2860992, 'steps': 14900, 'loss/train': 1.7831494808197021} -08/30/2021 15:47:23 - INFO - __main__ - Step 14902: {'lr': 0.0004906842617348193, 'samples': 2861184, 'steps': 14901, 'loss/train': 1.7678884267807007} -08/30/2021 15:47:23 - INFO - __main__ - Step 14903: {'lr': 0.000490682826528727, 'samples': 2861376, 'steps': 14902, 'loss/train': 1.1274467706680298} -08/30/2021 15:47:24 - INFO - __main__ - Step 14904: {'lr': 0.0004906813912141868, 'samples': 2861568, 'steps': 14903, 'loss/train': 1.6408709287643433} -08/30/2021 15:47:25 - INFO - __main__ - Step 14905: {'lr': 0.0004906799557911992, 'samples': 2861760, 'steps': 14904, 'loss/train': 1.5663658380508423} -08/30/2021 15:47:25 - INFO - __main__ - Step 14906: {'lr': 0.0004906785202597649, 'samples': 2861952, 'steps': 14905, 'loss/train': 2.121103525161743} -08/30/2021 15:47:26 - INFO - __main__ - Step 14907: {'lr': 0.0004906770846198846, 'samples': 2862144, 'steps': 14906, 'loss/train': 1.4484742879867554} -08/30/2021 15:47:26 - INFO - __main__ - Step 14908: {'lr': 0.0004906756488715589, 'samples': 2862336, 'steps': 14907, 'loss/train': 1.4668267965316772} -08/30/2021 15:47:28 - INFO - __main__ - Step 14909: {'lr': 0.0004906742130147884, 'samples': 2862528, 'steps': 14908, 'loss/train': 1.9839438199996948} -08/30/2021 15:47:29 - INFO - __main__ - Step 14910: {'lr': 0.0004906727770495739, 'samples': 2862720, 'steps': 14909, 'loss/train': 1.2441987991333008} -08/30/2021 15:47:29 - INFO - __main__ - Step 14911: {'lr': 0.000490671340975916, 'samples': 2862912, 'steps': 14910, 'loss/train': 1.6728696823120117} -08/30/2021 15:47:29 - INFO - __main__ - Step 14912: {'lr': 0.0004906699047938153, 'samples': 2863104, 'steps': 14911, 'loss/train': 1.10178804397583} -08/30/2021 15:47:30 - INFO - __main__ - Step 14913: {'lr': 0.0004906684685032724, 'samples': 2863296, 'steps': 14912, 'loss/train': 1.5558502674102783} -08/30/2021 15:47:31 - INFO - __main__ - Step 14914: {'lr': 0.0004906670321042881, 'samples': 2863488, 'steps': 14913, 'loss/train': 1.8439747095108032} -08/30/2021 15:47:32 - INFO - __main__ - Step 14915: {'lr': 0.0004906655955968628, 'samples': 2863680, 'steps': 14914, 'loss/train': 1.6044782400131226} -08/30/2021 15:47:32 - INFO - __main__ - Step 14916: {'lr': 0.0004906641589809973, 'samples': 2863872, 'steps': 14915, 'loss/train': 1.4196702241897583} -08/30/2021 15:47:33 - INFO - __main__ - Step 14917: {'lr': 0.0004906627222566924, 'samples': 2864064, 'steps': 14916, 'loss/train': 1.9430594444274902} -08/30/2021 15:47:33 - INFO - __main__ - Step 14918: {'lr': 0.0004906612854239485, 'samples': 2864256, 'steps': 14917, 'loss/train': 1.3791557550430298} -08/30/2021 15:47:33 - INFO - __main__ - Step 14919: {'lr': 0.0004906598484827663, 'samples': 2864448, 'steps': 14918, 'loss/train': 1.1848090887069702} -08/30/2021 15:47:35 - INFO - __main__ - Step 14920: {'lr': 0.0004906584114331465, 'samples': 2864640, 'steps': 14919, 'loss/train': 1.3372910022735596} -08/30/2021 15:47:35 - INFO - __main__ - Step 14921: {'lr': 0.0004906569742750899, 'samples': 2864832, 'steps': 14920, 'loss/train': 1.316491723060608} -08/30/2021 15:47:35 - INFO - __main__ - Step 14922: {'lr': 0.0004906555370085968, 'samples': 2865024, 'steps': 14921, 'loss/train': 1.4104100465774536} -08/30/2021 15:47:36 - INFO - __main__ - Step 14923: {'lr': 0.000490654099633668, 'samples': 2865216, 'steps': 14922, 'loss/train': 1.2647488117218018} -08/30/2021 15:47:36 - INFO - __main__ - Step 14924: {'lr': 0.0004906526621503043, 'samples': 2865408, 'steps': 14923, 'loss/train': 1.5276551246643066} -08/30/2021 15:47:38 - INFO - __main__ - Step 14925: {'lr': 0.0004906512245585062, 'samples': 2865600, 'steps': 14924, 'loss/train': 1.7782212495803833} -08/30/2021 15:47:38 - INFO - __main__ - Step 14926: {'lr': 0.0004906497868582743, 'samples': 2865792, 'steps': 14925, 'loss/train': 0.7870326638221741} -08/30/2021 15:47:39 - INFO - __main__ - Step 14927: {'lr': 0.0004906483490496093, 'samples': 2865984, 'steps': 14926, 'loss/train': 2.2952516078948975} -08/30/2021 15:47:39 - INFO - __main__ - Step 14928: {'lr': 0.000490646911132512, 'samples': 2866176, 'steps': 14927, 'loss/train': 2.0275893211364746} -08/30/2021 15:47:39 - INFO - __main__ - Step 14929: {'lr': 0.0004906454731069828, 'samples': 2866368, 'steps': 14928, 'loss/train': 1.9735183715820312} -08/30/2021 15:47:41 - INFO - __main__ - Step 14930: {'lr': 0.0004906440349730226, 'samples': 2866560, 'steps': 14929, 'loss/train': 2.132662534713745} -08/30/2021 15:47:41 - INFO - __main__ - Step 14931: {'lr': 0.0004906425967306317, 'samples': 2866752, 'steps': 14930, 'loss/train': 1.2584959268569946} -08/30/2021 15:47:42 - INFO - __main__ - Step 14932: {'lr': 0.0004906411583798112, 'samples': 2866944, 'steps': 14931, 'loss/train': 3.4257090091705322} -08/30/2021 15:47:42 - INFO - __main__ - Step 14933: {'lr': 0.0004906397199205614, 'samples': 2867136, 'steps': 14932, 'loss/train': 1.8130868673324585} -08/30/2021 15:47:42 - INFO - __main__ - Step 14934: {'lr': 0.000490638281352883, 'samples': 2867328, 'steps': 14933, 'loss/train': 1.9742066860198975} -08/30/2021 15:47:44 - INFO - __main__ - Step 14935: {'lr': 0.0004906368426767767, 'samples': 2867520, 'steps': 14934, 'loss/train': 1.6100530624389648} -08/30/2021 15:47:45 - INFO - __main__ - Step 14936: {'lr': 0.0004906354038922432, 'samples': 2867712, 'steps': 14935, 'loss/train': 2.1630990505218506} -08/30/2021 15:47:45 - INFO - __main__ - Step 14937: {'lr': 0.000490633964999283, 'samples': 2867904, 'steps': 14936, 'loss/train': 2.1897051334381104} -08/30/2021 15:47:45 - INFO - __main__ - Step 14938: {'lr': 0.000490632525997897, 'samples': 2868096, 'steps': 14937, 'loss/train': 1.8568459749221802} -08/30/2021 15:47:46 - INFO - __main__ - Step 14939: {'lr': 0.0004906310868880856, 'samples': 2868288, 'steps': 14938, 'loss/train': 1.7828978300094604} -08/30/2021 15:47:46 - INFO - __main__ - Step 14940: {'lr': 0.0004906296476698496, 'samples': 2868480, 'steps': 14939, 'loss/train': 1.3063057661056519} -08/30/2021 15:47:48 - INFO - __main__ - Step 14941: {'lr': 0.0004906282083431897, 'samples': 2868672, 'steps': 14940, 'loss/train': 1.8772317171096802} -08/30/2021 15:47:48 - INFO - __main__ - Step 14942: {'lr': 0.0004906267689081063, 'samples': 2868864, 'steps': 14941, 'loss/train': 0.2673923075199127} -08/30/2021 15:47:49 - INFO - __main__ - Step 14943: {'lr': 0.0004906253293646002, 'samples': 2869056, 'steps': 14942, 'loss/train': 1.1200165748596191} -08/30/2021 15:47:49 - INFO - __main__ - Step 14944: {'lr': 0.0004906238897126721, 'samples': 2869248, 'steps': 14943, 'loss/train': 1.26520836353302} -08/30/2021 15:47:49 - INFO - __main__ - Step 14945: {'lr': 0.0004906224499523225, 'samples': 2869440, 'steps': 14944, 'loss/train': 2.1648335456848145} -08/30/2021 15:47:51 - INFO - __main__ - Step 14946: {'lr': 0.0004906210100835522, 'samples': 2869632, 'steps': 14945, 'loss/train': 1.5770320892333984} -08/30/2021 15:47:51 - INFO - __main__ - Step 14947: {'lr': 0.0004906195701063617, 'samples': 2869824, 'steps': 14946, 'loss/train': 2.1350629329681396} -08/30/2021 15:47:52 - INFO - __main__ - Step 14948: {'lr': 0.0004906181300207518, 'samples': 2870016, 'steps': 14947, 'loss/train': 0.7200288772583008} -08/30/2021 15:47:52 - INFO - __main__ - Step 14949: {'lr': 0.0004906166898267231, 'samples': 2870208, 'steps': 14948, 'loss/train': 1.9455991983413696} -08/30/2021 15:47:52 - INFO - __main__ - Step 14950: {'lr': 0.0004906152495242763, 'samples': 2870400, 'steps': 14949, 'loss/train': 1.9666111469268799} -08/30/2021 15:47:54 - INFO - __main__ - Step 14951: {'lr': 0.0004906138091134118, 'samples': 2870592, 'steps': 14950, 'loss/train': 1.8162511587142944} -08/30/2021 15:47:54 - INFO - __main__ - Step 14952: {'lr': 0.0004906123685941306, 'samples': 2870784, 'steps': 14951, 'loss/train': 2.864201784133911} -08/30/2021 15:47:55 - INFO - __main__ - Step 14953: {'lr': 0.000490610927966433, 'samples': 2870976, 'steps': 14952, 'loss/train': 2.0321316719055176} -08/30/2021 15:47:55 - INFO - __main__ - Step 14954: {'lr': 0.00049060948723032, 'samples': 2871168, 'steps': 14953, 'loss/train': 1.412567138671875} -08/30/2021 15:47:56 - INFO - __main__ - Step 14955: {'lr': 0.000490608046385792, 'samples': 2871360, 'steps': 14954, 'loss/train': 0.8047583699226379} -08/30/2021 15:47:57 - INFO - __main__ - Step 14956: {'lr': 0.0004906066054328498, 'samples': 2871552, 'steps': 14955, 'loss/train': 1.4855256080627441} -08/30/2021 15:47:57 - INFO - __main__ - Step 14957: {'lr': 0.0004906051643714939, 'samples': 2871744, 'steps': 14956, 'loss/train': 2.1654229164123535} -08/30/2021 15:47:58 - INFO - __main__ - Step 14958: {'lr': 0.000490603723201725, 'samples': 2871936, 'steps': 14957, 'loss/train': 1.1873350143432617} -08/30/2021 15:47:58 - INFO - __main__ - Step 14959: {'lr': 0.0004906022819235438, 'samples': 2872128, 'steps': 14958, 'loss/train': 1.7369675636291504} -08/30/2021 15:47:59 - INFO - __main__ - Step 14960: {'lr': 0.000490600840536951, 'samples': 2872320, 'steps': 14959, 'loss/train': 1.7949846982955933} -08/30/2021 15:48:01 - INFO - __main__ - Step 14961: {'lr': 0.0004905993990419471, 'samples': 2872512, 'steps': 14960, 'loss/train': 1.988272786140442} -08/30/2021 15:48:01 - INFO - __main__ - Step 14962: {'lr': 0.0004905979574385328, 'samples': 2872704, 'steps': 14961, 'loss/train': 2.0101239681243896} -08/30/2021 15:48:01 - INFO - __main__ - Step 14963: {'lr': 0.0004905965157267088, 'samples': 2872896, 'steps': 14962, 'loss/train': 1.64951491355896} -08/30/2021 15:48:02 - INFO - __main__ - Step 14964: {'lr': 0.0004905950739064758, 'samples': 2873088, 'steps': 14963, 'loss/train': 1.8198285102844238} -08/30/2021 15:48:02 - INFO - __main__ - Step 14965: {'lr': 0.0004905936319778343, 'samples': 2873280, 'steps': 14964, 'loss/train': 1.8101497888565063} -08/30/2021 15:48:02 - INFO - __main__ - Step 14966: {'lr': 0.000490592189940785, 'samples': 2873472, 'steps': 14965, 'loss/train': 1.6880543231964111} -08/30/2021 15:48:04 - INFO - __main__ - Step 14967: {'lr': 0.0004905907477953286, 'samples': 2873664, 'steps': 14966, 'loss/train': 1.7889503240585327} -08/30/2021 15:48:04 - INFO - __main__ - Step 14968: {'lr': 0.0004905893055414658, 'samples': 2873856, 'steps': 14967, 'loss/train': 1.9825594425201416} -08/30/2021 15:48:05 - INFO - __main__ - Step 14969: {'lr': 0.0004905878631791971, 'samples': 2874048, 'steps': 14968, 'loss/train': 1.815059781074524} -08/30/2021 15:48:05 - INFO - __main__ - Step 14970: {'lr': 0.0004905864207085232, 'samples': 2874240, 'steps': 14969, 'loss/train': 1.415787935256958} -08/30/2021 15:48:07 - INFO - __main__ - Step 14971: {'lr': 0.0004905849781294448, 'samples': 2874432, 'steps': 14970, 'loss/train': 1.7248291969299316} -08/30/2021 15:48:07 - INFO - __main__ - Step 14972: {'lr': 0.0004905835354419625, 'samples': 2874624, 'steps': 14971, 'loss/train': 1.9839503765106201} -08/30/2021 15:48:07 - INFO - __main__ - Step 14973: {'lr': 0.0004905820926460769, 'samples': 2874816, 'steps': 14972, 'loss/train': 1.7970905303955078} -08/30/2021 15:48:08 - INFO - __main__ - Step 14974: {'lr': 0.0004905806497417888, 'samples': 2875008, 'steps': 14973, 'loss/train': 1.7530096769332886} -08/30/2021 15:48:08 - INFO - __main__ - Step 14975: {'lr': 0.0004905792067290988, 'samples': 2875200, 'steps': 14974, 'loss/train': 1.4415957927703857} -08/30/2021 15:48:08 - INFO - __main__ - Step 14976: {'lr': 0.0004905777636080075, 'samples': 2875392, 'steps': 14975, 'loss/train': 1.703970193862915} -08/30/2021 15:48:10 - INFO - __main__ - Step 14977: {'lr': 0.0004905763203785157, 'samples': 2875584, 'steps': 14976, 'loss/train': 1.4527407884597778} -08/30/2021 15:48:10 - INFO - __main__ - Step 14978: {'lr': 0.0004905748770406237, 'samples': 2875776, 'steps': 14977, 'loss/train': 1.8297884464263916} -08/30/2021 15:48:11 - INFO - __main__ - Step 14979: {'lr': 0.0004905734335943325, 'samples': 2875968, 'steps': 14978, 'loss/train': 2.642838478088379} -08/30/2021 15:48:11 - INFO - __main__ - Step 14980: {'lr': 0.0004905719900396426, 'samples': 2876160, 'steps': 14979, 'loss/train': 1.9550862312316895} -08/30/2021 15:48:11 - INFO - __main__ - Step 14981: {'lr': 0.0004905705463765546, 'samples': 2876352, 'steps': 14980, 'loss/train': 2.4028172492980957} -08/30/2021 15:48:13 - INFO - __main__ - Step 14982: {'lr': 0.0004905691026050692, 'samples': 2876544, 'steps': 14981, 'loss/train': 0.9124690890312195} -08/30/2021 15:48:13 - INFO - __main__ - Step 14983: {'lr': 0.0004905676587251873, 'samples': 2876736, 'steps': 14982, 'loss/train': 1.3576433658599854} -08/30/2021 15:48:14 - INFO - __main__ - Step 14984: {'lr': 0.0004905662147369091, 'samples': 2876928, 'steps': 14983, 'loss/train': 1.7100127935409546} -08/30/2021 15:48:14 - INFO - __main__ - Step 14985: {'lr': 0.0004905647706402356, 'samples': 2877120, 'steps': 14984, 'loss/train': 1.6217868328094482} -08/30/2021 15:48:14 - INFO - __main__ - Step 14986: {'lr': 0.0004905633264351673, 'samples': 2877312, 'steps': 14985, 'loss/train': 1.4821100234985352} -08/30/2021 15:48:16 - INFO - __main__ - Step 14987: {'lr': 0.0004905618821217048, 'samples': 2877504, 'steps': 14986, 'loss/train': 2.151357412338257} -08/30/2021 15:48:16 - INFO - __main__ - Step 14988: {'lr': 0.0004905604376998489, 'samples': 2877696, 'steps': 14987, 'loss/train': 1.3934756517410278} -08/30/2021 15:48:17 - INFO - __main__ - Step 14989: {'lr': 0.0004905589931696002, 'samples': 2877888, 'steps': 14988, 'loss/train': 1.4435477256774902} -08/30/2021 15:48:17 - INFO - __main__ - Step 14990: {'lr': 0.0004905575485309593, 'samples': 2878080, 'steps': 14989, 'loss/train': 1.2365061044692993} -08/30/2021 15:48:17 - INFO - __main__ - Step 14991: {'lr': 0.0004905561037839269, 'samples': 2878272, 'steps': 14990, 'loss/train': 0.9699716567993164} -08/30/2021 15:48:19 - INFO - __main__ - Step 14992: {'lr': 0.0004905546589285036, 'samples': 2878464, 'steps': 14991, 'loss/train': 1.7452621459960938} -08/30/2021 15:48:19 - INFO - __main__ - Step 14993: {'lr': 0.0004905532139646901, 'samples': 2878656, 'steps': 14992, 'loss/train': 1.7208856344223022} -08/30/2021 15:48:20 - INFO - __main__ - Step 14994: {'lr': 0.000490551768892487, 'samples': 2878848, 'steps': 14993, 'loss/train': 1.2783823013305664} -08/30/2021 15:48:20 - INFO - __main__ - Step 14995: {'lr': 0.000490550323711895, 'samples': 2879040, 'steps': 14994, 'loss/train': 2.156923532485962} -08/30/2021 15:48:20 - INFO - __main__ - Step 14996: {'lr': 0.0004905488784229147, 'samples': 2879232, 'steps': 14995, 'loss/train': 1.968981385231018} -08/30/2021 15:48:23 - INFO - __main__ - Step 14997: {'lr': 0.000490547433025547, 'samples': 2879424, 'steps': 14996, 'loss/train': 1.880060076713562} -08/30/2021 15:48:23 - INFO - __main__ - Step 14998: {'lr': 0.0004905459875197921, 'samples': 2879616, 'steps': 14997, 'loss/train': 1.4786137342453003} -08/30/2021 15:48:23 - INFO - __main__ - Step 14999: {'lr': 0.000490544541905651, 'samples': 2879808, 'steps': 14998, 'loss/train': 0.6797895431518555} -08/30/2021 15:48:24 - INFO - __main__ - Step 15000: {'lr': 0.0004905430961831242, 'samples': 2880000, 'steps': 14999, 'loss/train': 0.09316903352737427} -08/30/2021 15:48:24 - INFO - __main__ - Evaluating model checkpoint -08/30/2021 15:57:02 - INFO - __main__ - Step 15000: {'loss/eval': 1.5676782131195068, 'perplexity': 4.795501232147217} -08/30/2021 15:57:02 - INFO - __main__ - Saving model checkpoint -08/30/2021 15:57:37 - INFO - __main__ - Step 15001: {'lr': 0.0004905416503522123, 'samples': 2880192, 'steps': 15000, 'loss/train': 0.08897807449102402} -08/30/2021 15:57:37 - INFO - __main__ - Step 15002: {'lr': 0.0004905402044129162, 'samples': 2880384, 'steps': 15001, 'loss/train': 1.7169634103775024} -08/30/2021 15:57:38 - INFO - __main__ - Step 15003: {'lr': 0.0004905387583652363, 'samples': 2880576, 'steps': 15002, 'loss/train': 2.079348564147949} -08/30/2021 15:57:39 - INFO - __main__ - Step 15004: {'lr': 0.0004905373122091734, 'samples': 2880768, 'steps': 15003, 'loss/train': 1.7418956756591797} -08/30/2021 15:57:40 - INFO - __main__ - Step 15005: {'lr': 0.0004905358659447281, 'samples': 2880960, 'steps': 15004, 'loss/train': 1.5207520723342896} -08/30/2021 15:57:40 - INFO - __main__ - Step 15006: {'lr': 0.000490534419571901, 'samples': 2881152, 'steps': 15005, 'loss/train': 1.5853830575942993} -08/30/2021 15:57:40 - INFO - __main__ - Step 15007: {'lr': 0.0004905329730906929, 'samples': 2881344, 'steps': 15006, 'loss/train': 1.8985745906829834} -08/30/2021 15:57:41 - INFO - __main__ - Step 15008: {'lr': 0.0004905315265011043, 'samples': 2881536, 'steps': 15007, 'loss/train': 1.9557712078094482} -08/30/2021 15:57:42 - INFO - __main__ - Step 15009: {'lr': 0.0004905300798031359, 'samples': 2881728, 'steps': 15008, 'loss/train': 1.9216936826705933} -08/30/2021 15:57:43 - INFO - __main__ - Step 15010: {'lr': 0.0004905286329967883, 'samples': 2881920, 'steps': 15009, 'loss/train': 1.2003295421600342} -08/30/2021 15:57:43 - INFO - __main__ - Step 15011: {'lr': 0.0004905271860820622, 'samples': 2882112, 'steps': 15010, 'loss/train': 2.3111867904663086} -08/30/2021 15:57:43 - INFO - __main__ - Step 15012: {'lr': 0.0004905257390589585, 'samples': 2882304, 'steps': 15011, 'loss/train': 1.5301975011825562} -08/30/2021 15:57:44 - INFO - __main__ - Step 15013: {'lr': 0.0004905242919274774, 'samples': 2882496, 'steps': 15012, 'loss/train': 1.2972427606582642} -08/30/2021 15:57:45 - INFO - __main__ - Step 15014: {'lr': 0.0004905228446876197, 'samples': 2882688, 'steps': 15013, 'loss/train': 1.50941002368927} -08/30/2021 15:57:46 - INFO - __main__ - Step 15015: {'lr': 0.0004905213973393863, 'samples': 2882880, 'steps': 15014, 'loss/train': 1.6621195077896118} -08/30/2021 15:57:46 - INFO - __main__ - Step 15016: {'lr': 0.0004905199498827776, 'samples': 2883072, 'steps': 15015, 'loss/train': 1.812369704246521} -08/30/2021 15:57:46 - INFO - __main__ - Step 15017: {'lr': 0.0004905185023177942, 'samples': 2883264, 'steps': 15016, 'loss/train': 1.7890472412109375} -08/30/2021 15:57:47 - INFO - __main__ - Step 15018: {'lr': 0.0004905170546444371, 'samples': 2883456, 'steps': 15017, 'loss/train': 1.4666922092437744} -08/30/2021 15:57:49 - INFO - __main__ - Step 15019: {'lr': 0.0004905156068627065, 'samples': 2883648, 'steps': 15018, 'loss/train': 1.536946177482605} -08/30/2021 15:57:49 - INFO - __main__ - Step 15020: {'lr': 0.0004905141589726035, 'samples': 2883840, 'steps': 15019, 'loss/train': 1.8957767486572266} -08/30/2021 15:57:50 - INFO - __main__ - Step 15021: {'lr': 0.0004905127109741284, 'samples': 2884032, 'steps': 15020, 'loss/train': 1.2258646488189697} -08/30/2021 15:57:50 - INFO - __main__ - Step 15022: {'lr': 0.000490511262867282, 'samples': 2884224, 'steps': 15021, 'loss/train': 1.2116807699203491} -08/30/2021 15:57:50 - INFO - __main__ - Step 15023: {'lr': 0.000490509814652065, 'samples': 2884416, 'steps': 15022, 'loss/train': 1.846852421760559} -08/30/2021 15:57:52 - INFO - __main__ - Step 15024: {'lr': 0.0004905083663284779, 'samples': 2884608, 'steps': 15023, 'loss/train': 1.4833589792251587} -08/30/2021 15:57:52 - INFO - __main__ - Step 15025: {'lr': 0.0004905069178965214, 'samples': 2884800, 'steps': 15024, 'loss/train': 1.6528632640838623} -08/30/2021 15:57:53 - INFO - __main__ - Step 15026: {'lr': 0.0004905054693561963, 'samples': 2884992, 'steps': 15025, 'loss/train': 1.6975077390670776} -08/30/2021 15:57:53 - INFO - __main__ - Step 15027: {'lr': 0.0004905040207075032, 'samples': 2885184, 'steps': 15026, 'loss/train': 1.3338165283203125} -08/30/2021 15:57:53 - INFO - __main__ - Step 15028: {'lr': 0.0004905025719504426, 'samples': 2885376, 'steps': 15027, 'loss/train': 1.818396806716919} -08/30/2021 15:57:54 - INFO - __main__ - Step 15029: {'lr': 0.0004905011230850152, 'samples': 2885568, 'steps': 15028, 'loss/train': 1.5168710947036743} -08/30/2021 15:57:56 - INFO - __main__ - Step 15030: {'lr': 0.0004904996741112218, 'samples': 2885760, 'steps': 15029, 'loss/train': 1.5877747535705566} -08/30/2021 15:57:56 - INFO - __main__ - Step 15031: {'lr': 0.0004904982250290629, 'samples': 2885952, 'steps': 15030, 'loss/train': 1.7008051872253418} -08/30/2021 15:57:56 - INFO - __main__ - Step 15032: {'lr': 0.0004904967758385393, 'samples': 2886144, 'steps': 15031, 'loss/train': 1.7522859573364258} -08/30/2021 15:57:57 - INFO - __main__ - Step 15033: {'lr': 0.0004904953265396515, 'samples': 2886336, 'steps': 15032, 'loss/train': 0.14056184887886047} -08/30/2021 15:57:57 - INFO - __main__ - Step 15034: {'lr': 0.0004904938771324002, 'samples': 2886528, 'steps': 15033, 'loss/train': 1.7451437711715698} -08/30/2021 15:57:59 - INFO - __main__ - Step 15035: {'lr': 0.0004904924276167861, 'samples': 2886720, 'steps': 15034, 'loss/train': 1.7355155944824219} -08/30/2021 15:57:59 - INFO - __main__ - Step 15036: {'lr': 0.0004904909779928099, 'samples': 2886912, 'steps': 15035, 'loss/train': 1.4620782136917114} -08/30/2021 15:57:59 - INFO - __main__ - Step 15037: {'lr': 0.000490489528260472, 'samples': 2887104, 'steps': 15036, 'loss/train': 0.44157060980796814} -08/30/2021 15:58:00 - INFO - __main__ - Step 15038: {'lr': 0.0004904880784197734, 'samples': 2887296, 'steps': 15037, 'loss/train': 1.6056537628173828} -08/30/2021 15:58:00 - INFO - __main__ - Step 15039: {'lr': 0.0004904866284707144, 'samples': 2887488, 'steps': 15038, 'loss/train': 2.031805992126465} -08/30/2021 15:58:02 - INFO - __main__ - Step 15040: {'lr': 0.000490485178413296, 'samples': 2887680, 'steps': 15039, 'loss/train': 1.5526639223098755} -08/30/2021 15:58:02 - INFO - __main__ - Step 15041: {'lr': 0.0004904837282475186, 'samples': 2887872, 'steps': 15040, 'loss/train': 2.158902406692505} -08/30/2021 15:58:03 - INFO - __main__ - Step 15042: {'lr': 0.000490482277973383, 'samples': 2888064, 'steps': 15041, 'loss/train': 1.7040448188781738} -08/30/2021 15:58:03 - INFO - __main__ - Step 15043: {'lr': 0.0004904808275908898, 'samples': 2888256, 'steps': 15042, 'loss/train': 0.609427809715271} -08/30/2021 15:58:03 - INFO - __main__ - Step 15044: {'lr': 0.0004904793771000396, 'samples': 2888448, 'steps': 15043, 'loss/train': 1.9580683708190918} -08/30/2021 15:58:05 - INFO - __main__ - Step 15045: {'lr': 0.0004904779265008331, 'samples': 2888640, 'steps': 15044, 'loss/train': 1.416972041130066} -08/30/2021 15:58:05 - INFO - __main__ - Step 15046: {'lr': 0.000490476475793271, 'samples': 2888832, 'steps': 15045, 'loss/train': 1.914841890335083} -08/30/2021 15:58:06 - INFO - __main__ - Step 15047: {'lr': 0.0004904750249773538, 'samples': 2889024, 'steps': 15046, 'loss/train': 1.60141122341156} -08/30/2021 15:58:06 - INFO - __main__ - Step 15048: {'lr': 0.0004904735740530825, 'samples': 2889216, 'steps': 15047, 'loss/train': 1.4357203245162964} -08/30/2021 15:58:06 - INFO - __main__ - Step 15049: {'lr': 0.0004904721230204573, 'samples': 2889408, 'steps': 15048, 'loss/train': 2.2410624027252197} -08/30/2021 15:58:08 - INFO - __main__ - Step 15050: {'lr': 0.0004904706718794791, 'samples': 2889600, 'steps': 15049, 'loss/train': 1.1474930047988892} -08/30/2021 15:58:09 - INFO - __main__ - Step 15051: {'lr': 0.0004904692206301487, 'samples': 2889792, 'steps': 15050, 'loss/train': 1.4560447931289673} -08/30/2021 15:58:09 - INFO - __main__ - Step 15052: {'lr': 0.0004904677692724664, 'samples': 2889984, 'steps': 15051, 'loss/train': 1.4431084394454956} -08/30/2021 15:58:09 - INFO - __main__ - Step 15053: {'lr': 0.000490466317806433, 'samples': 2890176, 'steps': 15052, 'loss/train': 1.6216411590576172} -08/30/2021 15:58:10 - INFO - __main__ - Step 15054: {'lr': 0.0004904648662320493, 'samples': 2890368, 'steps': 15053, 'loss/train': 0.1565411537885666} -08/30/2021 15:58:11 - INFO - __main__ - Step 15055: {'lr': 0.0004904634145493159, 'samples': 2890560, 'steps': 15054, 'loss/train': 1.1482092142105103} -08/30/2021 15:58:12 - INFO - __main__ - Step 15056: {'lr': 0.0004904619627582332, 'samples': 2890752, 'steps': 15055, 'loss/train': 1.7334765195846558} -08/30/2021 15:58:12 - INFO - __main__ - Step 15057: {'lr': 0.0004904605108588023, 'samples': 2890944, 'steps': 15056, 'loss/train': 1.4141312837600708} -08/30/2021 15:58:12 - INFO - __main__ - Step 15058: {'lr': 0.0004904590588510234, 'samples': 2891136, 'steps': 15057, 'loss/train': 1.9265528917312622} -08/30/2021 15:58:13 - INFO - __main__ - Step 15059: {'lr': 0.0004904576067348975, 'samples': 2891328, 'steps': 15058, 'loss/train': 2.2109851837158203} -08/30/2021 15:58:13 - INFO - __main__ - Step 15060: {'lr': 0.000490456154510425, 'samples': 2891520, 'steps': 15059, 'loss/train': 2.0628292560577393} -08/30/2021 15:58:15 - INFO - __main__ - Step 15061: {'lr': 0.0004904547021776067, 'samples': 2891712, 'steps': 15060, 'loss/train': 1.9347633123397827} -08/30/2021 15:58:15 - INFO - __main__ - Step 15062: {'lr': 0.0004904532497364432, 'samples': 2891904, 'steps': 15061, 'loss/train': 1.5641708374023438} -08/30/2021 15:58:15 - INFO - __main__ - Step 15063: {'lr': 0.0004904517971869352, 'samples': 2892096, 'steps': 15062, 'loss/train': 1.079559326171875} -08/30/2021 15:58:16 - INFO - __main__ - Step 15064: {'lr': 0.0004904503445290833, 'samples': 2892288, 'steps': 15063, 'loss/train': 1.13528573513031} -08/30/2021 15:58:16 - INFO - __main__ - Step 15065: {'lr': 0.0004904488917628882, 'samples': 2892480, 'steps': 15064, 'loss/train': 2.182119607925415} -08/30/2021 15:58:18 - INFO - __main__ - Step 15066: {'lr': 0.0004904474388883507, 'samples': 2892672, 'steps': 15065, 'loss/train': 1.4964021444320679} -08/30/2021 15:58:18 - INFO - __main__ - Step 15067: {'lr': 0.000490445985905471, 'samples': 2892864, 'steps': 15066, 'loss/train': 1.062370777130127} -08/30/2021 15:58:18 - INFO - __main__ - Step 15068: {'lr': 0.0004904445328142503, 'samples': 2893056, 'steps': 15067, 'loss/train': 0.9581953287124634} -08/30/2021 15:58:19 - INFO - __main__ - Step 15069: {'lr': 0.0004904430796146889, 'samples': 2893248, 'steps': 15068, 'loss/train': 1.8068184852600098} -08/30/2021 15:58:19 - INFO - __main__ - Step 15070: {'lr': 0.0004904416263067876, 'samples': 2893440, 'steps': 15069, 'loss/train': 1.8006515502929688} -08/30/2021 15:58:21 - INFO - __main__ - Step 15071: {'lr': 0.0004904401728905469, 'samples': 2893632, 'steps': 15070, 'loss/train': 1.647088646888733} -08/30/2021 15:58:22 - INFO - __main__ - Step 15072: {'lr': 0.0004904387193659677, 'samples': 2893824, 'steps': 15071, 'loss/train': 1.7353768348693848} -08/30/2021 15:58:22 - INFO - __main__ - Step 15073: {'lr': 0.0004904372657330504, 'samples': 2894016, 'steps': 15072, 'loss/train': 1.6333556175231934} -08/30/2021 15:58:22 - INFO - __main__ - Step 15074: {'lr': 0.0004904358119917959, 'samples': 2894208, 'steps': 15073, 'loss/train': 1.9115346670150757} -08/30/2021 15:58:23 - INFO - __main__ - Step 15075: {'lr': 0.0004904343581422047, 'samples': 2894400, 'steps': 15074, 'loss/train': 1.6262946128845215} -08/30/2021 15:58:24 - INFO - __main__ - Step 15076: {'lr': 0.0004904329041842774, 'samples': 2894592, 'steps': 15075, 'loss/train': 2.36826229095459} -08/30/2021 15:58:25 - INFO - __main__ - Step 15077: {'lr': 0.0004904314501180148, 'samples': 2894784, 'steps': 15076, 'loss/train': 1.9142673015594482} -08/30/2021 15:58:25 - INFO - __main__ - Step 15078: {'lr': 0.0004904299959434175, 'samples': 2894976, 'steps': 15077, 'loss/train': 1.7328768968582153} -08/30/2021 15:58:25 - INFO - __main__ - Step 15079: {'lr': 0.0004904285416604862, 'samples': 2895168, 'steps': 15078, 'loss/train': 1.6171680688858032} -08/30/2021 15:58:26 - INFO - __main__ - Step 15080: {'lr': 0.0004904270872692215, 'samples': 2895360, 'steps': 15079, 'loss/train': 2.092799663543701} -08/30/2021 15:58:27 - INFO - __main__ - Step 15081: {'lr': 0.0004904256327696241, 'samples': 2895552, 'steps': 15080, 'loss/train': 1.2302974462509155} -08/30/2021 15:58:28 - INFO - __main__ - Step 15082: {'lr': 0.0004904241781616945, 'samples': 2895744, 'steps': 15081, 'loss/train': 1.1482905149459839} -08/30/2021 15:58:28 - INFO - __main__ - Step 15083: {'lr': 0.0004904227234454335, 'samples': 2895936, 'steps': 15082, 'loss/train': 1.9209469556808472} -08/30/2021 15:58:28 - INFO - __main__ - Step 15084: {'lr': 0.0004904212686208418, 'samples': 2896128, 'steps': 15083, 'loss/train': 2.028625011444092} -08/30/2021 15:58:29 - INFO - __main__ - Step 15085: {'lr': 0.00049041981368792, 'samples': 2896320, 'steps': 15084, 'loss/train': 1.8900392055511475} -08/30/2021 15:58:29 - INFO - __main__ - Step 15086: {'lr': 0.0004904183586466686, 'samples': 2896512, 'steps': 15085, 'loss/train': 2.02756404876709} -08/30/2021 15:58:31 - INFO - __main__ - Step 15087: {'lr': 0.0004904169034970885, 'samples': 2896704, 'steps': 15086, 'loss/train': 1.0059603452682495} -08/30/2021 15:58:31 - INFO - __main__ - Step 15088: {'lr': 0.0004904154482391803, 'samples': 2896896, 'steps': 15087, 'loss/train': 1.565056562423706} -08/30/2021 15:58:31 - INFO - __main__ - Step 15089: {'lr': 0.0004904139928729445, 'samples': 2897088, 'steps': 15088, 'loss/train': 1.6708370447158813} -08/30/2021 15:58:32 - INFO - __main__ - Step 15090: {'lr': 0.0004904125373983819, 'samples': 2897280, 'steps': 15089, 'loss/train': 1.9066559076309204} -08/30/2021 15:58:32 - INFO - __main__ - Step 15091: {'lr': 0.0004904110818154931, 'samples': 2897472, 'steps': 15090, 'loss/train': 1.757454514503479} -08/30/2021 15:58:33 - INFO - __main__ - Step 15092: {'lr': 0.0004904096261242789, 'samples': 2897664, 'steps': 15091, 'loss/train': 1.1484358310699463} -08/30/2021 15:58:34 - INFO - __main__ - Step 15093: {'lr': 0.0004904081703247397, 'samples': 2897856, 'steps': 15092, 'loss/train': 1.4675343036651611} -08/30/2021 15:58:34 - INFO - __main__ - Step 15094: {'lr': 0.0004904067144168763, 'samples': 2898048, 'steps': 15093, 'loss/train': 1.3540998697280884} -08/30/2021 15:58:35 - INFO - __main__ - Step 15095: {'lr': 0.0004904052584006895, 'samples': 2898240, 'steps': 15094, 'loss/train': 2.115405321121216} -08/30/2021 15:58:35 - INFO - __main__ - Step 15096: {'lr': 0.0004904038022761797, 'samples': 2898432, 'steps': 15095, 'loss/train': 1.7329566478729248} -08/30/2021 15:58:36 - INFO - __main__ - Step 15097: {'lr': 0.0004904023460433475, 'samples': 2898624, 'steps': 15096, 'loss/train': 1.617341160774231} -08/30/2021 15:58:37 - INFO - __main__ - Step 15098: {'lr': 0.0004904008897021939, 'samples': 2898816, 'steps': 15097, 'loss/train': 1.7051061391830444} -08/30/2021 15:58:37 - INFO - __main__ - Step 15099: {'lr': 0.0004903994332527193, 'samples': 2899008, 'steps': 15098, 'loss/train': 1.9150274991989136} -08/30/2021 15:58:38 - INFO - __main__ - Step 15100: {'lr': 0.0004903979766949244, 'samples': 2899200, 'steps': 15099, 'loss/train': 2.107600450515747} -08/30/2021 15:58:38 - INFO - __main__ - Step 15101: {'lr': 0.00049039652002881, 'samples': 2899392, 'steps': 15100, 'loss/train': 2.323913335800171} -08/30/2021 15:58:39 - INFO - __main__ - Step 15102: {'lr': 0.0004903950632543766, 'samples': 2899584, 'steps': 15101, 'loss/train': 1.8349885940551758} -08/30/2021 15:58:40 - INFO - __main__ - Step 15103: {'lr': 0.0004903936063716248, 'samples': 2899776, 'steps': 15102, 'loss/train': 1.3465237617492676} -08/30/2021 15:58:40 - INFO - __main__ - Step 15104: {'lr': 0.0004903921493805554, 'samples': 2899968, 'steps': 15103, 'loss/train': 1.4871973991394043} -08/30/2021 15:58:41 - INFO - __main__ - Step 15105: {'lr': 0.000490390692281169, 'samples': 2900160, 'steps': 15104, 'loss/train': 1.7064441442489624} -08/30/2021 15:58:41 - INFO - __main__ - Step 15106: {'lr': 0.0004903892350734663, 'samples': 2900352, 'steps': 15105, 'loss/train': 1.973088264465332} -08/30/2021 15:58:43 - INFO - __main__ - Step 15107: {'lr': 0.0004903877777574479, 'samples': 2900544, 'steps': 15106, 'loss/train': 1.91025710105896} -08/30/2021 15:58:43 - INFO - __main__ - Step 15108: {'lr': 0.0004903863203331145, 'samples': 2900736, 'steps': 15107, 'loss/train': 1.796217441558838} -08/30/2021 15:58:43 - INFO - __main__ - Step 15109: {'lr': 0.0004903848628004667, 'samples': 2900928, 'steps': 15108, 'loss/train': 1.2699918746948242} -08/30/2021 15:58:44 - INFO - __main__ - Step 15110: {'lr': 0.0004903834051595052, 'samples': 2901120, 'steps': 15109, 'loss/train': 1.7588151693344116} -08/30/2021 15:58:44 - INFO - __main__ - Step 15111: {'lr': 0.0004903819474102306, 'samples': 2901312, 'steps': 15110, 'loss/train': 1.5148886442184448} -08/30/2021 15:58:45 - INFO - __main__ - Step 15112: {'lr': 0.0004903804895526437, 'samples': 2901504, 'steps': 15111, 'loss/train': 1.8466156721115112} -08/30/2021 15:58:46 - INFO - __main__ - Step 15113: {'lr': 0.0004903790315867449, 'samples': 2901696, 'steps': 15112, 'loss/train': 1.7272372245788574} -08/30/2021 15:58:46 - INFO - __main__ - Step 15114: {'lr': 0.0004903775735125352, 'samples': 2901888, 'steps': 15113, 'loss/train': 1.9933096170425415} -08/30/2021 15:58:47 - INFO - __main__ - Step 15115: {'lr': 0.0004903761153300149, 'samples': 2902080, 'steps': 15114, 'loss/train': 0.09477217495441437} -08/30/2021 15:58:47 - INFO - __main__ - Step 15116: {'lr': 0.000490374657039185, 'samples': 2902272, 'steps': 15115, 'loss/train': 1.6263753175735474} -08/30/2021 15:58:49 - INFO - __main__ - Step 15117: {'lr': 0.0004903731986400459, 'samples': 2902464, 'steps': 15116, 'loss/train': 1.6342326402664185} -08/30/2021 15:58:50 - INFO - __main__ - Step 15118: {'lr': 0.0004903717401325983, 'samples': 2902656, 'steps': 15117, 'loss/train': 2.0062599182128906} -08/30/2021 15:58:50 - INFO - __main__ - Step 15119: {'lr': 0.000490370281516843, 'samples': 2902848, 'steps': 15118, 'loss/train': 1.5492897033691406} -08/30/2021 15:58:50 - INFO - __main__ - Step 15120: {'lr': 0.0004903688227927806, 'samples': 2903040, 'steps': 15119, 'loss/train': 1.9500274658203125} -08/30/2021 15:58:51 - INFO - __main__ - Step 15121: {'lr': 0.0004903673639604116, 'samples': 2903232, 'steps': 15120, 'loss/train': 1.6372621059417725} -08/30/2021 15:58:51 - INFO - __main__ - Step 15122: {'lr': 0.0004903659050197369, 'samples': 2903424, 'steps': 15121, 'loss/train': 2.0835390090942383} -08/30/2021 15:58:51 - INFO - __main__ - Step 15123: {'lr': 0.0004903644459707569, 'samples': 2903616, 'steps': 15122, 'loss/train': 1.7659131288528442} -08/30/2021 15:58:54 - INFO - __main__ - Step 15124: {'lr': 0.0004903629868134725, 'samples': 2903808, 'steps': 15123, 'loss/train': 1.7020103931427002} -08/30/2021 15:58:54 - INFO - __main__ - Step 15125: {'lr': 0.0004903615275478841, 'samples': 2904000, 'steps': 15124, 'loss/train': 1.284178614616394} -08/30/2021 15:58:55 - INFO - __main__ - Step 15126: {'lr': 0.0004903600681739926, 'samples': 2904192, 'steps': 15125, 'loss/train': 0.15328308939933777} -08/30/2021 15:58:55 - INFO - __main__ - Step 15127: {'lr': 0.0004903586086917986, 'samples': 2904384, 'steps': 15126, 'loss/train': 1.4526680707931519} -08/30/2021 15:58:55 - INFO - __main__ - Step 15128: {'lr': 0.0004903571491013027, 'samples': 2904576, 'steps': 15127, 'loss/train': 1.530230164527893} -08/30/2021 15:58:56 - INFO - __main__ - Step 15129: {'lr': 0.0004903556894025055, 'samples': 2904768, 'steps': 15128, 'loss/train': 0.06229347363114357} -08/30/2021 15:58:57 - INFO - __main__ - Step 15130: {'lr': 0.0004903542295954077, 'samples': 2904960, 'steps': 15129, 'loss/train': 1.8654475212097168} -08/30/2021 15:58:58 - INFO - __main__ - Step 15131: {'lr': 0.0004903527696800102, 'samples': 2905152, 'steps': 15130, 'loss/train': 1.4783753156661987} -08/30/2021 15:58:58 - INFO - __main__ - Step 15132: {'lr': 0.0004903513096563133, 'samples': 2905344, 'steps': 15131, 'loss/train': 0.13516157865524292} -08/30/2021 15:58:59 - INFO - __main__ - Step 15133: {'lr': 0.0004903498495243178, 'samples': 2905536, 'steps': 15132, 'loss/train': 1.6506235599517822} -08/30/2021 15:58:59 - INFO - __main__ - Step 15134: {'lr': 0.0004903483892840244, 'samples': 2905728, 'steps': 15133, 'loss/train': 4.622920513153076} -08/30/2021 15:59:00 - INFO - __main__ - Step 15135: {'lr': 0.0004903469289354338, 'samples': 2905920, 'steps': 15134, 'loss/train': 1.3137805461883545} -08/30/2021 15:59:01 - INFO - __main__ - Step 15136: {'lr': 0.0004903454684785465, 'samples': 2906112, 'steps': 15135, 'loss/train': 1.9431031942367554} -08/30/2021 15:59:01 - INFO - __main__ - Step 15137: {'lr': 0.0004903440079133633, 'samples': 2906304, 'steps': 15136, 'loss/train': 2.1094818115234375} -08/30/2021 15:59:02 - INFO - __main__ - Step 15138: {'lr': 0.0004903425472398846, 'samples': 2906496, 'steps': 15137, 'loss/train': 1.6039923429489136} -08/30/2021 15:59:02 - INFO - __main__ - Step 15139: {'lr': 0.0004903410864581115, 'samples': 2906688, 'steps': 15138, 'loss/train': 2.016150951385498} -08/30/2021 15:59:02 - INFO - __main__ - Step 15140: {'lr': 0.0004903396255680443, 'samples': 2906880, 'steps': 15139, 'loss/train': 1.7691010236740112} -08/30/2021 15:59:04 - INFO - __main__ - Step 15141: {'lr': 0.0004903381645696838, 'samples': 2907072, 'steps': 15140, 'loss/train': 0.2667216360569} -08/30/2021 15:59:04 - INFO - __main__ - Step 15142: {'lr': 0.0004903367034630307, 'samples': 2907264, 'steps': 15141, 'loss/train': 1.5593140125274658} -08/30/2021 15:59:05 - INFO - __main__ - Step 15143: {'lr': 0.0004903352422480855, 'samples': 2907456, 'steps': 15142, 'loss/train': 1.4108080863952637} -08/30/2021 15:59:05 - INFO - __main__ - Step 15144: {'lr': 0.000490333780924849, 'samples': 2907648, 'steps': 15143, 'loss/train': 1.7154890298843384} -08/30/2021 15:59:05 - INFO - __main__ - Step 15145: {'lr': 0.0004903323194933218, 'samples': 2907840, 'steps': 15144, 'loss/train': 1.3250635862350464} -08/30/2021 15:59:07 - INFO - __main__ - Step 15146: {'lr': 0.0004903308579535045, 'samples': 2908032, 'steps': 15145, 'loss/train': 1.4927868843078613} -08/30/2021 15:59:07 - INFO - __main__ - Step 15147: {'lr': 0.0004903293963053979, 'samples': 2908224, 'steps': 15146, 'loss/train': 1.4518280029296875} -08/30/2021 15:59:08 - INFO - __main__ - Step 15148: {'lr': 0.0004903279345490026, 'samples': 2908416, 'steps': 15147, 'loss/train': 1.5175867080688477} -08/30/2021 15:59:08 - INFO - __main__ - Step 15149: {'lr': 0.0004903264726843191, 'samples': 2908608, 'steps': 15148, 'loss/train': 1.6642018556594849} -08/30/2021 15:59:08 - INFO - __main__ - Step 15150: {'lr': 0.0004903250107113483, 'samples': 2908800, 'steps': 15149, 'loss/train': 1.3926502466201782} -08/30/2021 15:59:10 - INFO - __main__ - Step 15151: {'lr': 0.0004903235486300908, 'samples': 2908992, 'steps': 15150, 'loss/train': 1.6689372062683105} -08/30/2021 15:59:10 - INFO - __main__ - Step 15152: {'lr': 0.0004903220864405471, 'samples': 2909184, 'steps': 15151, 'loss/train': 1.4074832201004028} -08/30/2021 15:59:11 - INFO - __main__ - Step 15153: {'lr': 0.000490320624142718, 'samples': 2909376, 'steps': 15152, 'loss/train': 1.8029906749725342} -08/30/2021 15:59:11 - INFO - __main__ - Step 15154: {'lr': 0.0004903191617366043, 'samples': 2909568, 'steps': 15153, 'loss/train': 2.1712491512298584} -08/30/2021 15:59:12 - INFO - __main__ - Step 15155: {'lr': 0.0004903176992222063, 'samples': 2909760, 'steps': 15154, 'loss/train': 1.6152732372283936} -08/30/2021 15:59:13 - INFO - __main__ - Step 15156: {'lr': 0.000490316236599525, 'samples': 2909952, 'steps': 15155, 'loss/train': 1.0634926557540894} -08/30/2021 15:59:14 - INFO - __main__ - Step 15157: {'lr': 0.0004903147738685609, 'samples': 2910144, 'steps': 15156, 'loss/train': 1.811274766921997} -08/30/2021 15:59:14 - INFO - __main__ - Step 15158: {'lr': 0.0004903133110293145, 'samples': 2910336, 'steps': 15157, 'loss/train': 1.590394139289856} -08/30/2021 15:59:14 - INFO - __main__ - Step 15159: {'lr': 0.0004903118480817868, 'samples': 2910528, 'steps': 15158, 'loss/train': 1.6736689805984497} -08/30/2021 15:59:15 - INFO - __main__ - Step 15160: {'lr': 0.0004903103850259781, 'samples': 2910720, 'steps': 15159, 'loss/train': 1.409801721572876} -08/30/2021 15:59:16 - INFO - __main__ - Step 15161: {'lr': 0.0004903089218618895, 'samples': 2910912, 'steps': 15160, 'loss/train': 1.5411909818649292} -08/30/2021 15:59:16 - INFO - __main__ - Step 15162: {'lr': 0.0004903074585895212, 'samples': 2911104, 'steps': 15161, 'loss/train': 2.174487590789795} -08/30/2021 15:59:17 - INFO - __main__ - Step 15163: {'lr': 0.0004903059952088742, 'samples': 2911296, 'steps': 15162, 'loss/train': 1.5213121175765991} -08/30/2021 15:59:17 - INFO - __main__ - Step 15164: {'lr': 0.0004903045317199489, 'samples': 2911488, 'steps': 15163, 'loss/train': 1.627817153930664} -08/30/2021 15:59:18 - INFO - __main__ - Step 15165: {'lr': 0.0004903030681227463, 'samples': 2911680, 'steps': 15164, 'loss/train': 1.5124437808990479} -08/30/2021 15:59:19 - INFO - __main__ - Step 15166: {'lr': 0.0004903016044172666, 'samples': 2911872, 'steps': 15165, 'loss/train': 1.874131441116333} -08/30/2021 15:59:19 - INFO - __main__ - Step 15167: {'lr': 0.0004903001406035109, 'samples': 2912064, 'steps': 15166, 'loss/train': 1.0103309154510498} -08/30/2021 15:59:20 - INFO - __main__ - Step 15168: {'lr': 0.0004902986766814795, 'samples': 2912256, 'steps': 15167, 'loss/train': 1.9327702522277832} -08/30/2021 15:59:20 - INFO - __main__ - Step 15169: {'lr': 0.0004902972126511734, 'samples': 2912448, 'steps': 15168, 'loss/train': 2.031543493270874} -08/30/2021 15:59:20 - INFO - __main__ - Step 15170: {'lr': 0.0004902957485125929, 'samples': 2912640, 'steps': 15169, 'loss/train': 2.0452992916107178} -08/30/2021 15:59:21 - INFO - __main__ - Step 15171: {'lr': 0.0004902942842657389, 'samples': 2912832, 'steps': 15170, 'loss/train': 1.6215959787368774} -08/30/2021 15:59:22 - INFO - __main__ - Step 15172: {'lr': 0.0004902928199106121, 'samples': 2913024, 'steps': 15171, 'loss/train': 1.258383870124817} -08/30/2021 15:59:23 - INFO - __main__ - Step 15173: {'lr': 0.000490291355447213, 'samples': 2913216, 'steps': 15172, 'loss/train': 1.4947481155395508} -08/30/2021 15:59:23 - INFO - __main__ - Step 15174: {'lr': 0.0004902898908755424, 'samples': 2913408, 'steps': 15173, 'loss/train': 2.7635366916656494} -08/30/2021 15:59:23 - INFO - __main__ - Step 15175: {'lr': 0.0004902884261956007, 'samples': 2913600, 'steps': 15174, 'loss/train': 1.5870851278305054} -08/30/2021 15:59:24 - INFO - __main__ - Step 15176: {'lr': 0.0004902869614073889, 'samples': 2913792, 'steps': 15175, 'loss/train': 1.5923242568969727} -08/30/2021 15:59:25 - INFO - __main__ - Step 15177: {'lr': 0.0004902854965109074, 'samples': 2913984, 'steps': 15176, 'loss/train': 1.8057106733322144} -08/30/2021 15:59:26 - INFO - __main__ - Step 15178: {'lr': 0.0004902840315061571, 'samples': 2914176, 'steps': 15177, 'loss/train': 1.4928910732269287} -08/30/2021 15:59:26 - INFO - __main__ - Step 15179: {'lr': 0.0004902825663931384, 'samples': 2914368, 'steps': 15178, 'loss/train': 1.6890974044799805} -08/30/2021 15:59:27 - INFO - __main__ - Step 15180: {'lr': 0.0004902811011718521, 'samples': 2914560, 'steps': 15179, 'loss/train': 1.528063416481018} -08/30/2021 15:59:27 - INFO - __main__ - Step 15181: {'lr': 0.0004902796358422989, 'samples': 2914752, 'steps': 15180, 'loss/train': 2.985886812210083} -08/30/2021 15:59:27 - INFO - __main__ - Step 15182: {'lr': 0.0004902781704044793, 'samples': 2914944, 'steps': 15181, 'loss/train': 1.86506187915802} -08/30/2021 15:59:29 - INFO - __main__ - Step 15183: {'lr': 0.0004902767048583942, 'samples': 2915136, 'steps': 15182, 'loss/train': 1.3643348217010498} -08/30/2021 15:59:30 - INFO - __main__ - Step 15184: {'lr': 0.000490275239204044, 'samples': 2915328, 'steps': 15183, 'loss/train': 1.420096516609192} -08/30/2021 15:59:30 - INFO - __main__ - Step 15185: {'lr': 0.0004902737734414296, 'samples': 2915520, 'steps': 15184, 'loss/train': 1.7147296667099} -08/30/2021 15:59:31 - INFO - __main__ - Step 15186: {'lr': 0.0004902723075705514, 'samples': 2915712, 'steps': 15185, 'loss/train': 2.1276416778564453} -08/30/2021 15:59:31 - INFO - __main__ - Step 15187: {'lr': 0.0004902708415914103, 'samples': 2915904, 'steps': 15186, 'loss/train': 0.7894248366355896} -08/30/2021 15:59:32 - INFO - __main__ - Step 15188: {'lr': 0.0004902693755040069, 'samples': 2916096, 'steps': 15187, 'loss/train': 1.9741934537887573} -08/30/2021 15:59:33 - INFO - __main__ - Step 15189: {'lr': 0.0004902679093083418, 'samples': 2916288, 'steps': 15188, 'loss/train': 1.7528294324874878} -08/30/2021 15:59:33 - INFO - __main__ - Step 15190: {'lr': 0.0004902664430044156, 'samples': 2916480, 'steps': 15189, 'loss/train': 1.6628696918487549} -08/30/2021 15:59:34 - INFO - __main__ - Step 15191: {'lr': 0.0004902649765922292, 'samples': 2916672, 'steps': 15190, 'loss/train': 1.560943841934204} -08/30/2021 15:59:34 - INFO - __main__ - Step 15192: {'lr': 0.0004902635100717831, 'samples': 2916864, 'steps': 15191, 'loss/train': 1.5229425430297852} -08/30/2021 15:59:36 - INFO - __main__ - Step 15193: {'lr': 0.0004902620434430778, 'samples': 2917056, 'steps': 15192, 'loss/train': 2.1835124492645264} -08/30/2021 15:59:36 - INFO - __main__ - Step 15194: {'lr': 0.0004902605767061142, 'samples': 2917248, 'steps': 15193, 'loss/train': 1.9095793962478638} -08/30/2021 15:59:36 - INFO - __main__ - Step 15195: {'lr': 0.000490259109860893, 'samples': 2917440, 'steps': 15194, 'loss/train': 1.4937175512313843} -08/30/2021 15:59:37 - INFO - __main__ - Step 15196: {'lr': 0.0004902576429074146, 'samples': 2917632, 'steps': 15195, 'loss/train': 0.872139036655426} -08/30/2021 15:59:37 - INFO - __main__ - Step 15197: {'lr': 0.0004902561758456799, 'samples': 2917824, 'steps': 15196, 'loss/train': 1.0893328189849854} -08/30/2021 15:59:39 - INFO - __main__ - Step 15198: {'lr': 0.0004902547086756895, 'samples': 2918016, 'steps': 15197, 'loss/train': 1.9009952545166016} -08/30/2021 15:59:39 - INFO - __main__ - Step 15199: {'lr': 0.000490253241397444, 'samples': 2918208, 'steps': 15198, 'loss/train': 1.7882243394851685} -08/30/2021 15:59:39 - INFO - __main__ - Step 15200: {'lr': 0.0004902517740109441, 'samples': 2918400, 'steps': 15199, 'loss/train': 2.0170230865478516} -08/30/2021 15:59:40 - INFO - __main__ - Step 15201: {'lr': 0.0004902503065161905, 'samples': 2918592, 'steps': 15200, 'loss/train': 1.1906795501708984} -08/30/2021 15:59:40 - INFO - __main__ - Step 15202: {'lr': 0.0004902488389131837, 'samples': 2918784, 'steps': 15201, 'loss/train': 1.0520771741867065} -08/30/2021 15:59:42 - INFO - __main__ - Step 15203: {'lr': 0.0004902473712019246, 'samples': 2918976, 'steps': 15202, 'loss/train': 1.7138489484786987} -08/30/2021 15:59:42 - INFO - __main__ - Step 15204: {'lr': 0.0004902459033824137, 'samples': 2919168, 'steps': 15203, 'loss/train': 1.5838242769241333} -08/30/2021 15:59:42 - INFO - __main__ - Step 15205: {'lr': 0.0004902444354546516, 'samples': 2919360, 'steps': 15204, 'loss/train': 1.8327378034591675} -08/30/2021 15:59:43 - INFO - __main__ - Step 15206: {'lr': 0.0004902429674186392, 'samples': 2919552, 'steps': 15205, 'loss/train': 1.8911542892456055} -08/30/2021 15:59:43 - INFO - __main__ - Step 15207: {'lr': 0.000490241499274377, 'samples': 2919744, 'steps': 15206, 'loss/train': 1.6966699361801147} -08/30/2021 15:59:43 - INFO - __main__ - Step 15208: {'lr': 0.0004902400310218657, 'samples': 2919936, 'steps': 15207, 'loss/train': 1.6051431894302368} -08/30/2021 15:59:45 - INFO - __main__ - Step 15209: {'lr': 0.0004902385626611059, 'samples': 2920128, 'steps': 15208, 'loss/train': 1.5678776502609253} -08/30/2021 15:59:45 - INFO - __main__ - Step 15210: {'lr': 0.0004902370941920984, 'samples': 2920320, 'steps': 15209, 'loss/train': 1.2162106037139893} -08/30/2021 15:59:46 - INFO - __main__ - Step 15211: {'lr': 0.0004902356256148437, 'samples': 2920512, 'steps': 15210, 'loss/train': 1.455880045890808} -08/30/2021 15:59:46 - INFO - __main__ - Step 15212: {'lr': 0.0004902341569293425, 'samples': 2920704, 'steps': 15211, 'loss/train': 1.459934949874878} -08/30/2021 15:59:46 - INFO - __main__ - Step 15213: {'lr': 0.0004902326881355955, 'samples': 2920896, 'steps': 15212, 'loss/train': 1.446386456489563} -08/30/2021 15:59:48 - INFO - __main__ - Step 15214: {'lr': 0.0004902312192336034, 'samples': 2921088, 'steps': 15213, 'loss/train': 1.5584096908569336} -08/30/2021 15:59:48 - INFO - __main__ - Step 15215: {'lr': 0.000490229750223367, 'samples': 2921280, 'steps': 15214, 'loss/train': 0.9233636260032654} -08/30/2021 15:59:49 - INFO - __main__ - Step 15216: {'lr': 0.0004902282811048864, 'samples': 2921472, 'steps': 15215, 'loss/train': 1.0606367588043213} -08/30/2021 15:59:49 - INFO - __main__ - Step 15217: {'lr': 0.000490226811878163, 'samples': 2921664, 'steps': 15216, 'loss/train': 1.704091191291809} -08/30/2021 15:59:50 - INFO - __main__ - Step 15218: {'lr': 0.0004902253425431969, 'samples': 2921856, 'steps': 15217, 'loss/train': 1.7339808940887451} -08/30/2021 15:59:51 - INFO - __main__ - Step 15219: {'lr': 0.000490223873099989, 'samples': 2922048, 'steps': 15218, 'loss/train': 2.1102333068847656} -08/30/2021 15:59:51 - INFO - __main__ - Step 15220: {'lr': 0.00049022240354854, 'samples': 2922240, 'steps': 15219, 'loss/train': 1.6153285503387451} -08/30/2021 15:59:52 - INFO - __main__ - Step 15221: {'lr': 0.0004902209338888503, 'samples': 2922432, 'steps': 15220, 'loss/train': 2.018859386444092} -08/30/2021 15:59:52 - INFO - __main__ - Step 15222: {'lr': 0.000490219464120921, 'samples': 2922624, 'steps': 15221, 'loss/train': 0.7686914205551147} -08/30/2021 15:59:53 - INFO - __main__ - Step 15223: {'lr': 0.0004902179942447524, 'samples': 2922816, 'steps': 15222, 'loss/train': 0.8456284999847412} -08/30/2021 15:59:54 - INFO - __main__ - Step 15224: {'lr': 0.0004902165242603452, 'samples': 2923008, 'steps': 15223, 'loss/train': 1.8118358850479126} -08/30/2021 15:59:54 - INFO - __main__ - Step 15225: {'lr': 0.0004902150541677003, 'samples': 2923200, 'steps': 15224, 'loss/train': 1.6165413856506348} -08/30/2021 15:59:55 - INFO - __main__ - Step 15226: {'lr': 0.0004902135839668181, 'samples': 2923392, 'steps': 15225, 'loss/train': 1.4570969343185425} -08/30/2021 15:59:55 - INFO - __main__ - Step 15227: {'lr': 0.0004902121136576994, 'samples': 2923584, 'steps': 15226, 'loss/train': 2.010981559753418} -08/30/2021 15:59:55 - INFO - __main__ - Step 15228: {'lr': 0.0004902106432403448, 'samples': 2923776, 'steps': 15227, 'loss/train': 2.0917279720306396} -08/30/2021 15:59:56 - INFO - __main__ - Step 15229: {'lr': 0.0004902091727147551, 'samples': 2923968, 'steps': 15228, 'loss/train': 1.145888090133667} -08/30/2021 15:59:57 - INFO - __main__ - Step 15230: {'lr': 0.0004902077020809307, 'samples': 2924160, 'steps': 15229, 'loss/train': 1.5485759973526} -08/30/2021 15:59:58 - INFO - __main__ - Step 15231: {'lr': 0.0004902062313388725, 'samples': 2924352, 'steps': 15230, 'loss/train': 1.5448799133300781} -08/30/2021 15:59:58 - INFO - __main__ - Step 15232: {'lr': 0.0004902047604885811, 'samples': 2924544, 'steps': 15231, 'loss/train': 1.6722486019134521} -08/30/2021 15:59:58 - INFO - __main__ - Step 15233: {'lr': 0.0004902032895300571, 'samples': 2924736, 'steps': 15232, 'loss/train': 1.3838722705841064} -08/30/2021 15:59:59 - INFO - __main__ - Step 15234: {'lr': 0.0004902018184633012, 'samples': 2924928, 'steps': 15233, 'loss/train': 0.8554103374481201} -08/30/2021 16:00:01 - INFO - __main__ - Step 15235: {'lr': 0.0004902003472883141, 'samples': 2925120, 'steps': 15234, 'loss/train': 1.9881125688552856} -08/30/2021 16:00:01 - INFO - __main__ - Step 15236: {'lr': 0.0004901988760050964, 'samples': 2925312, 'steps': 15235, 'loss/train': 1.5846076011657715} -08/30/2021 16:00:02 - INFO - __main__ - Step 15237: {'lr': 0.0004901974046136488, 'samples': 2925504, 'steps': 15236, 'loss/train': 2.070047378540039} -08/30/2021 16:00:02 - INFO - __main__ - Step 15238: {'lr': 0.000490195933113972, 'samples': 2925696, 'steps': 15237, 'loss/train': 1.5535564422607422} -08/30/2021 16:00:02 - INFO - __main__ - Step 15239: {'lr': 0.0004901944615060665, 'samples': 2925888, 'steps': 15238, 'loss/train': 1.2036014795303345} -08/30/2021 16:00:04 - INFO - __main__ - Step 15240: {'lr': 0.0004901929897899331, 'samples': 2926080, 'steps': 15239, 'loss/train': 1.620802402496338} -08/30/2021 16:00:05 - INFO - __main__ - Step 15241: {'lr': 0.0004901915179655726, 'samples': 2926272, 'steps': 15240, 'loss/train': 1.8651938438415527} -08/30/2021 16:00:05 - INFO - __main__ - Step 15242: {'lr': 0.0004901900460329853, 'samples': 2926464, 'steps': 15241, 'loss/train': 1.6313143968582153} -08/30/2021 16:00:05 - INFO - __main__ - Step 15243: {'lr': 0.0004901885739921723, 'samples': 2926656, 'steps': 15242, 'loss/train': 2.0313265323638916} -08/30/2021 16:00:06 - INFO - __main__ - Step 15244: {'lr': 0.0004901871018431339, 'samples': 2926848, 'steps': 15243, 'loss/train': 1.65639066696167} -08/30/2021 16:00:06 - INFO - __main__ - Step 15245: {'lr': 0.0004901856295858708, 'samples': 2927040, 'steps': 15244, 'loss/train': 1.7966381311416626} -08/30/2021 16:00:08 - INFO - __main__ - Step 15246: {'lr': 0.0004901841572203839, 'samples': 2927232, 'steps': 15245, 'loss/train': 1.388607382774353} -08/30/2021 16:00:08 - INFO - __main__ - Step 15247: {'lr': 0.0004901826847466738, 'samples': 2927424, 'steps': 15246, 'loss/train': 1.3225113153457642} -08/30/2021 16:00:09 - INFO - __main__ - Step 15248: {'lr': 0.000490181212164741, 'samples': 2927616, 'steps': 15247, 'loss/train': 1.9013538360595703} -08/30/2021 16:00:09 - INFO - __main__ - Step 15249: {'lr': 0.0004901797394745861, 'samples': 2927808, 'steps': 15248, 'loss/train': 1.9068899154663086} -08/30/2021 16:00:09 - INFO - __main__ - Step 15250: {'lr': 0.0004901782666762102, 'samples': 2928000, 'steps': 15249, 'loss/train': 0.07610747218132019} -08/30/2021 16:00:10 - INFO - __main__ - Step 15251: {'lr': 0.0004901767937696135, 'samples': 2928192, 'steps': 15250, 'loss/train': 1.5153677463531494} -08/30/2021 16:00:11 - INFO - __main__ - Step 15252: {'lr': 0.0004901753207547969, 'samples': 2928384, 'steps': 15251, 'loss/train': 1.294348955154419} -08/30/2021 16:00:11 - INFO - __main__ - Step 15253: {'lr': 0.000490173847631761, 'samples': 2928576, 'steps': 15252, 'loss/train': 1.6863707304000854} -08/30/2021 16:00:12 - INFO - __main__ - Step 15254: {'lr': 0.0004901723744005065, 'samples': 2928768, 'steps': 15253, 'loss/train': 1.673261284828186} -08/30/2021 16:00:12 - INFO - __main__ - Step 15255: {'lr': 0.0004901709010610339, 'samples': 2928960, 'steps': 15254, 'loss/train': 1.7124124765396118} -08/30/2021 16:00:12 - INFO - __main__ - Step 15256: {'lr': 0.0004901694276133441, 'samples': 2929152, 'steps': 15255, 'loss/train': 2.0685617923736572} -08/30/2021 16:00:14 - INFO - __main__ - Step 15257: {'lr': 0.0004901679540574377, 'samples': 2929344, 'steps': 15256, 'loss/train': 1.9410738945007324} -08/30/2021 16:00:14 - INFO - __main__ - Step 15258: {'lr': 0.0004901664803933153, 'samples': 2929536, 'steps': 15257, 'loss/train': 2.0417656898498535} -08/30/2021 16:00:15 - INFO - __main__ - Step 15259: {'lr': 0.0004901650066209775, 'samples': 2929728, 'steps': 15258, 'loss/train': 1.6134295463562012} -08/30/2021 16:00:15 - INFO - __main__ - Step 15260: {'lr': 0.0004901635327404252, 'samples': 2929920, 'steps': 15259, 'loss/train': 1.9462106227874756} -08/30/2021 16:00:15 - INFO - __main__ - Step 15261: {'lr': 0.0004901620587516587, 'samples': 2930112, 'steps': 15260, 'loss/train': 1.2231272459030151} -08/30/2021 16:00:17 - INFO - __main__ - Step 15262: {'lr': 0.0004901605846546791, 'samples': 2930304, 'steps': 15261, 'loss/train': 1.6867084503173828} -08/30/2021 16:00:18 - INFO - __main__ - Step 15263: {'lr': 0.0004901591104494868, 'samples': 2930496, 'steps': 15262, 'loss/train': 1.9147292375564575} -08/30/2021 16:00:18 - INFO - __main__ - Step 15264: {'lr': 0.0004901576361360825, 'samples': 2930688, 'steps': 15263, 'loss/train': 2.208069086074829} -08/30/2021 16:00:18 - INFO - __main__ - Step 15265: {'lr': 0.0004901561617144667, 'samples': 2930880, 'steps': 15264, 'loss/train': 1.3121311664581299} -08/30/2021 16:00:19 - INFO - __main__ - Step 15266: {'lr': 0.0004901546871846405, 'samples': 2931072, 'steps': 15265, 'loss/train': 2.051281690597534} -08/30/2021 16:00:20 - INFO - __main__ - Step 15267: {'lr': 0.0004901532125466041, 'samples': 2931264, 'steps': 15266, 'loss/train': 0.10278207808732986} -08/30/2021 16:00:21 - INFO - __main__ - Step 15268: {'lr': 0.0004901517378003584, 'samples': 2931456, 'steps': 15267, 'loss/train': 1.8167712688446045} -08/30/2021 16:00:21 - INFO - __main__ - Step 15269: {'lr': 0.0004901502629459042, 'samples': 2931648, 'steps': 15268, 'loss/train': 1.5532091856002808} -08/30/2021 16:00:22 - INFO - __main__ - Step 15270: {'lr': 0.000490148787983242, 'samples': 2931840, 'steps': 15269, 'loss/train': 2.1325762271881104} -08/30/2021 16:00:22 - INFO - __main__ - Step 15271: {'lr': 0.0004901473129123723, 'samples': 2932032, 'steps': 15270, 'loss/train': 1.9315848350524902} -08/30/2021 16:00:22 - INFO - __main__ - Step 15272: {'lr': 0.0004901458377332959, 'samples': 2932224, 'steps': 15271, 'loss/train': 0.2822628319263458} -08/30/2021 16:00:24 - INFO - __main__ - Step 15273: {'lr': 0.0004901443624460136, 'samples': 2932416, 'steps': 15272, 'loss/train': 1.6238374710083008} -08/30/2021 16:00:24 - INFO - __main__ - Step 15274: {'lr': 0.000490142887050526, 'samples': 2932608, 'steps': 15273, 'loss/train': 2.0749807357788086} -08/30/2021 16:00:25 - INFO - __main__ - Step 15275: {'lr': 0.0004901414115468335, 'samples': 2932800, 'steps': 15274, 'loss/train': 2.2964682579040527} -08/30/2021 16:00:25 - INFO - __main__ - Step 15276: {'lr': 0.0004901399359349372, 'samples': 2932992, 'steps': 15275, 'loss/train': 1.9444867372512817} -08/30/2021 16:00:25 - INFO - __main__ - Step 15277: {'lr': 0.0004901384602148376, 'samples': 2933184, 'steps': 15276, 'loss/train': 1.6872153282165527} -08/30/2021 16:00:27 - INFO - __main__ - Step 15278: {'lr': 0.0004901369843865351, 'samples': 2933376, 'steps': 15277, 'loss/train': 1.8935812711715698} -08/30/2021 16:00:27 - INFO - __main__ - Step 15279: {'lr': 0.0004901355084500307, 'samples': 2933568, 'steps': 15278, 'loss/train': 3.2335526943206787} -08/30/2021 16:00:28 - INFO - __main__ - Step 15280: {'lr': 0.000490134032405325, 'samples': 2933760, 'steps': 15279, 'loss/train': 1.9136563539505005} -08/30/2021 16:00:28 - INFO - __main__ - Step 15281: {'lr': 0.0004901325562524185, 'samples': 2933952, 'steps': 15280, 'loss/train': 1.8464934825897217} -08/30/2021 16:00:28 - INFO - __main__ - Step 15282: {'lr': 0.0004901310799913121, 'samples': 2934144, 'steps': 15281, 'loss/train': 1.439648151397705} -08/30/2021 16:00:30 - INFO - __main__ - Step 15283: {'lr': 0.0004901296036220062, 'samples': 2934336, 'steps': 15282, 'loss/train': 1.7032266855239868} -08/30/2021 16:00:30 - INFO - __main__ - Step 15284: {'lr': 0.0004901281271445016, 'samples': 2934528, 'steps': 15283, 'loss/train': 1.8631856441497803} -08/30/2021 16:00:31 - INFO - __main__ - Step 15285: {'lr': 0.000490126650558799, 'samples': 2934720, 'steps': 15284, 'loss/train': 2.1576526165008545} -08/30/2021 16:00:31 - INFO - __main__ - Step 15286: {'lr': 0.000490125173864899, 'samples': 2934912, 'steps': 15285, 'loss/train': 1.8573395013809204} -08/30/2021 16:00:31 - INFO - __main__ - Step 15287: {'lr': 0.0004901236970628024, 'samples': 2935104, 'steps': 15286, 'loss/train': 1.9123634099960327} -08/30/2021 16:00:33 - INFO - __main__ - Step 15288: {'lr': 0.0004901222201525099, 'samples': 2935296, 'steps': 15287, 'loss/train': 2.1508285999298096} -08/30/2021 16:00:34 - INFO - __main__ - Step 15289: {'lr': 0.0004901207431340218, 'samples': 2935488, 'steps': 15288, 'loss/train': 1.8390781879425049} -08/30/2021 16:00:34 - INFO - __main__ - Step 15290: {'lr': 0.000490119266007339, 'samples': 2935680, 'steps': 15289, 'loss/train': 1.6442031860351562} -08/30/2021 16:00:34 - INFO - __main__ - Step 15291: {'lr': 0.0004901177887724623, 'samples': 2935872, 'steps': 15290, 'loss/train': 2.0264084339141846} -08/30/2021 16:00:35 - INFO - __main__ - Step 15292: {'lr': 0.0004901163114293921, 'samples': 2936064, 'steps': 15291, 'loss/train': 1.4709222316741943} -08/30/2021 16:00:35 - INFO - __main__ - Step 15293: {'lr': 0.0004901148339781293, 'samples': 2936256, 'steps': 15292, 'loss/train': 1.3401129245758057} -08/30/2021 16:00:37 - INFO - __main__ - Step 15294: {'lr': 0.0004901133564186744, 'samples': 2936448, 'steps': 15293, 'loss/train': 1.8701170682907104} -08/30/2021 16:00:38 - INFO - __main__ - Step 15295: {'lr': 0.0004901118787510281, 'samples': 2936640, 'steps': 15294, 'loss/train': 1.311923861503601} -08/30/2021 16:00:38 - INFO - __main__ - Step 15296: {'lr': 0.0004901104009751912, 'samples': 2936832, 'steps': 15295, 'loss/train': 1.8409775495529175} -08/30/2021 16:00:39 - INFO - __main__ - Step 15297: {'lr': 0.0004901089230911642, 'samples': 2937024, 'steps': 15296, 'loss/train': 1.8538223505020142} -08/30/2021 16:00:39 - INFO - __main__ - Step 15298: {'lr': 0.0004901074450989479, 'samples': 2937216, 'steps': 15297, 'loss/train': 1.9554061889648438} -08/30/2021 16:00:41 - INFO - __main__ - Step 15299: {'lr': 0.0004901059669985427, 'samples': 2937408, 'steps': 15298, 'loss/train': 0.32535094022750854} -08/30/2021 16:00:41 - INFO - __main__ - Step 15300: {'lr': 0.0004901044887899496, 'samples': 2937600, 'steps': 15299, 'loss/train': 1.4372743368148804} -08/30/2021 16:00:41 - INFO - __main__ - Step 15301: {'lr': 0.0004901030104731691, 'samples': 2937792, 'steps': 15300, 'loss/train': 1.6454297304153442} -08/30/2021 16:00:42 - INFO - __main__ - Step 15302: {'lr': 0.0004901015320482019, 'samples': 2937984, 'steps': 15301, 'loss/train': 2.1553637981414795} -08/30/2021 16:00:42 - INFO - __main__ - Step 15303: {'lr': 0.0004901000535150486, 'samples': 2938176, 'steps': 15302, 'loss/train': 1.8293977975845337} -08/30/2021 16:00:44 - INFO - __main__ - Step 15304: {'lr': 0.0004900985748737101, 'samples': 2938368, 'steps': 15303, 'loss/train': 2.0799834728240967} -08/30/2021 16:00:44 - INFO - __main__ - Step 15305: {'lr': 0.0004900970961241866, 'samples': 2938560, 'steps': 15304, 'loss/train': 2.3479645252227783} -08/30/2021 16:00:45 - INFO - __main__ - Step 15306: {'lr': 0.0004900956172664792, 'samples': 2938752, 'steps': 15305, 'loss/train': 1.979406714439392} -08/30/2021 16:00:45 - INFO - __main__ - Step 15307: {'lr': 0.0004900941383005884, 'samples': 2938944, 'steps': 15306, 'loss/train': 2.0431814193725586} -08/30/2021 16:00:45 - INFO - __main__ - Step 15308: {'lr': 0.0004900926592265149, 'samples': 2939136, 'steps': 15307, 'loss/train': 1.457631230354309} -08/30/2021 16:00:47 - INFO - __main__ - Step 15309: {'lr': 0.0004900911800442593, 'samples': 2939328, 'steps': 15308, 'loss/train': 1.8405603170394897} -08/30/2021 16:00:47 - INFO - __main__ - Step 15310: {'lr': 0.0004900897007538225, 'samples': 2939520, 'steps': 15309, 'loss/train': 1.909132480621338} -08/30/2021 16:00:48 - INFO - __main__ - Step 15311: {'lr': 0.0004900882213552049, 'samples': 2939712, 'steps': 15310, 'loss/train': 2.91546893119812} -08/30/2021 16:00:48 - INFO - __main__ - Step 15312: {'lr': 0.0004900867418484072, 'samples': 2939904, 'steps': 15311, 'loss/train': 1.8374571800231934} -08/30/2021 16:00:48 - INFO - __main__ - Step 15313: {'lr': 0.0004900852622334301, 'samples': 2940096, 'steps': 15312, 'loss/train': 1.6467686891555786} -08/30/2021 16:00:49 - INFO - __main__ - Step 15314: {'lr': 0.0004900837825102743, 'samples': 2940288, 'steps': 15313, 'loss/train': 0.1568973809480667} -08/30/2021 16:00:50 - INFO - __main__ - Step 15315: {'lr': 0.0004900823026789405, 'samples': 2940480, 'steps': 15314, 'loss/train': 1.7074110507965088} -08/30/2021 16:00:51 - INFO - __main__ - Step 15316: {'lr': 0.0004900808227394293, 'samples': 2940672, 'steps': 15315, 'loss/train': 1.5589522123336792} -08/30/2021 16:00:51 - INFO - __main__ - Step 15317: {'lr': 0.0004900793426917412, 'samples': 2940864, 'steps': 15316, 'loss/train': 1.637278437614441} -08/30/2021 16:00:52 - INFO - __main__ - Step 15318: {'lr': 0.0004900778625358774, 'samples': 2941056, 'steps': 15317, 'loss/train': 1.842742919921875} -08/30/2021 16:00:52 - INFO - __main__ - Step 15319: {'lr': 0.000490076382271838, 'samples': 2941248, 'steps': 15318, 'loss/train': 1.6763697862625122} -08/30/2021 16:00:53 - INFO - __main__ - Step 15320: {'lr': 0.0004900749018996238, 'samples': 2941440, 'steps': 15319, 'loss/train': 1.5344160795211792} -08/30/2021 16:00:54 - INFO - __main__ - Step 15321: {'lr': 0.0004900734214192358, 'samples': 2941632, 'steps': 15320, 'loss/train': 2.8766956329345703} -08/30/2021 16:00:54 - INFO - __main__ - Step 15322: {'lr': 0.0004900719408306743, 'samples': 2941824, 'steps': 15321, 'loss/train': 2.0137224197387695} -08/30/2021 16:00:54 - INFO - __main__ - Step 15323: {'lr': 0.0004900704601339401, 'samples': 2942016, 'steps': 15322, 'loss/train': 2.109374761581421} -08/30/2021 16:00:55 - INFO - __main__ - Step 15324: {'lr': 0.0004900689793290339, 'samples': 2942208, 'steps': 15323, 'loss/train': 1.5553075075149536} -08/30/2021 16:00:56 - INFO - __main__ - Step 15325: {'lr': 0.0004900674984159562, 'samples': 2942400, 'steps': 15324, 'loss/train': 1.4952634572982788} -08/30/2021 16:00:57 - INFO - __main__ - Step 15326: {'lr': 0.0004900660173947079, 'samples': 2942592, 'steps': 15325, 'loss/train': 0.48776811361312866} -08/30/2021 16:00:57 - INFO - __main__ - Step 15327: {'lr': 0.0004900645362652895, 'samples': 2942784, 'steps': 15326, 'loss/train': 1.2803184986114502} -08/30/2021 16:00:57 - INFO - __main__ - Step 15328: {'lr': 0.0004900630550277018, 'samples': 2942976, 'steps': 15327, 'loss/train': 1.2247620820999146} -08/30/2021 16:00:58 - INFO - __main__ - Step 15329: {'lr': 0.0004900615736819452, 'samples': 2943168, 'steps': 15328, 'loss/train': 1.6304024457931519} -08/30/2021 16:00:59 - INFO - __main__ - Step 15330: {'lr': 0.0004900600922280207, 'samples': 2943360, 'steps': 15329, 'loss/train': 1.6658141613006592} -08/30/2021 16:01:00 - INFO - __main__ - Step 15331: {'lr': 0.0004900586106659289, 'samples': 2943552, 'steps': 15330, 'loss/train': 2.2869555950164795} -08/30/2021 16:01:00 - INFO - __main__ - Step 15332: {'lr': 0.0004900571289956703, 'samples': 2943744, 'steps': 15331, 'loss/train': 1.738834023475647} -08/30/2021 16:01:01 - INFO - __main__ - Step 15333: {'lr': 0.0004900556472172457, 'samples': 2943936, 'steps': 15332, 'loss/train': 1.7425967454910278} -08/30/2021 16:01:01 - INFO - __main__ - Step 15334: {'lr': 0.0004900541653306557, 'samples': 2944128, 'steps': 15333, 'loss/train': 1.44273042678833} -08/30/2021 16:01:02 - INFO - __main__ - Step 15335: {'lr': 0.0004900526833359009, 'samples': 2944320, 'steps': 15334, 'loss/train': 1.672918677330017} -08/30/2021 16:01:03 - INFO - __main__ - Step 15336: {'lr': 0.0004900512012329822, 'samples': 2944512, 'steps': 15335, 'loss/train': 1.6832565069198608} -08/30/2021 16:01:03 - INFO - __main__ - Step 15337: {'lr': 0.0004900497190219002, 'samples': 2944704, 'steps': 15336, 'loss/train': 1.8559441566467285} -08/30/2021 16:01:04 - INFO - __main__ - Step 15338: {'lr': 0.0004900482367026554, 'samples': 2944896, 'steps': 15337, 'loss/train': 1.5720969438552856} -08/30/2021 16:01:04 - INFO - __main__ - Step 15339: {'lr': 0.0004900467542752485, 'samples': 2945088, 'steps': 15338, 'loss/train': 2.4836173057556152} -08/30/2021 16:01:04 - INFO - __main__ - Step 15340: {'lr': 0.0004900452717396803, 'samples': 2945280, 'steps': 15339, 'loss/train': 2.947153091430664} -08/30/2021 16:01:06 - INFO - __main__ - Step 15341: {'lr': 0.0004900437890959515, 'samples': 2945472, 'steps': 15340, 'loss/train': 2.604426145553589} -08/30/2021 16:01:07 - INFO - __main__ - Step 15342: {'lr': 0.0004900423063440625, 'samples': 2945664, 'steps': 15341, 'loss/train': 2.2659289836883545} -08/30/2021 16:01:07 - INFO - __main__ - Step 15343: {'lr': 0.0004900408234840142, 'samples': 2945856, 'steps': 15342, 'loss/train': 0.302096426486969} -08/30/2021 16:01:07 - INFO - __main__ - Step 15344: {'lr': 0.0004900393405158073, 'samples': 2946048, 'steps': 15343, 'loss/train': 1.3263083696365356} -08/30/2021 16:01:08 - INFO - __main__ - Step 15345: {'lr': 0.0004900378574394423, 'samples': 2946240, 'steps': 15344, 'loss/train': 0.3805118203163147} -08/30/2021 16:01:10 - INFO - __main__ - Step 15346: {'lr': 0.00049003637425492, 'samples': 2946432, 'steps': 15345, 'loss/train': 2.1891603469848633} -08/30/2021 16:01:10 - INFO - __main__ - Step 15347: {'lr': 0.0004900348909622409, 'samples': 2946624, 'steps': 15346, 'loss/train': 1.907754898071289} -08/30/2021 16:01:10 - INFO - __main__ - Step 15348: {'lr': 0.0004900334075614059, 'samples': 2946816, 'steps': 15347, 'loss/train': 2.2687036991119385} -08/30/2021 16:01:11 - INFO - __main__ - Step 15349: {'lr': 0.0004900319240524155, 'samples': 2947008, 'steps': 15348, 'loss/train': 1.630103349685669} -08/30/2021 16:01:11 - INFO - __main__ - Step 15350: {'lr': 0.0004900304404352704, 'samples': 2947200, 'steps': 15349, 'loss/train': 1.5954492092132568} -08/30/2021 16:01:13 - INFO - __main__ - Step 15351: {'lr': 0.0004900289567099713, 'samples': 2947392, 'steps': 15350, 'loss/train': 0.9392467737197876} -08/30/2021 16:01:13 - INFO - __main__ - Step 15352: {'lr': 0.000490027472876519, 'samples': 2947584, 'steps': 15351, 'loss/train': 1.7012474536895752} -08/30/2021 16:01:13 - INFO - __main__ - Step 15353: {'lr': 0.0004900259889349138, 'samples': 2947776, 'steps': 15352, 'loss/train': 2.369603395462036} -08/30/2021 16:01:14 - INFO - __main__ - Step 15354: {'lr': 0.0004900245048851567, 'samples': 2947968, 'steps': 15353, 'loss/train': 2.3797850608825684} -08/30/2021 16:01:14 - INFO - __main__ - Step 15355: {'lr': 0.0004900230207272483, 'samples': 2948160, 'steps': 15354, 'loss/train': 1.4411885738372803} -08/30/2021 16:01:16 - INFO - __main__ - Step 15356: {'lr': 0.000490021536461189, 'samples': 2948352, 'steps': 15355, 'loss/train': 1.212572455406189} -08/30/2021 16:01:16 - INFO - __main__ - Step 15357: {'lr': 0.00049002005208698, 'samples': 2948544, 'steps': 15356, 'loss/train': 1.9965567588806152} -08/30/2021 16:01:16 - INFO - __main__ - Step 15358: {'lr': 0.0004900185676046214, 'samples': 2948736, 'steps': 15357, 'loss/train': 1.5751240253448486} -08/30/2021 16:01:17 - INFO - __main__ - Step 15359: {'lr': 0.0004900170830141144, 'samples': 2948928, 'steps': 15358, 'loss/train': 2.052021026611328} -08/30/2021 16:01:17 - INFO - __main__ - Step 15360: {'lr': 0.0004900155983154592, 'samples': 2949120, 'steps': 15359, 'loss/train': 1.865669846534729} -08/30/2021 16:01:19 - INFO - __main__ - Step 15361: {'lr': 0.0004900141135086569, 'samples': 2949312, 'steps': 15360, 'loss/train': 1.7544538974761963} -08/30/2021 16:01:19 - INFO - __main__ - Step 15362: {'lr': 0.0004900126285937077, 'samples': 2949504, 'steps': 15361, 'loss/train': 1.7860257625579834} -08/30/2021 16:01:19 - INFO - __main__ - Step 15363: {'lr': 0.0004900111435706127, 'samples': 2949696, 'steps': 15362, 'loss/train': 1.7874385118484497} -08/30/2021 16:01:20 - INFO - __main__ - Step 15364: {'lr': 0.0004900096584393723, 'samples': 2949888, 'steps': 15363, 'loss/train': 2.277987241744995} -08/30/2021 16:01:20 - INFO - __main__ - Step 15365: {'lr': 0.0004900081731999872, 'samples': 2950080, 'steps': 15364, 'loss/train': 1.8814116716384888} -08/30/2021 16:01:23 - INFO - __main__ - Step 15366: {'lr': 0.0004900066878524582, 'samples': 2950272, 'steps': 15365, 'loss/train': 1.7960764169692993} -08/30/2021 16:01:23 - INFO - __main__ - Step 15367: {'lr': 0.0004900052023967859, 'samples': 2950464, 'steps': 15366, 'loss/train': 1.2443969249725342} -08/30/2021 16:01:23 - INFO - __main__ - Step 15368: {'lr': 0.0004900037168329709, 'samples': 2950656, 'steps': 15367, 'loss/train': 1.445622444152832} -08/30/2021 16:01:24 - INFO - __main__ - Step 15369: {'lr': 0.000490002231161014, 'samples': 2950848, 'steps': 15368, 'loss/train': 2.6704702377319336} -08/30/2021 16:01:24 - INFO - __main__ - Step 15370: {'lr': 0.0004900007453809157, 'samples': 2951040, 'steps': 15369, 'loss/train': 3.144233465194702} -08/30/2021 16:01:25 - INFO - __main__ - Step 15371: {'lr': 0.0004899992594926769, 'samples': 2951232, 'steps': 15370, 'loss/train': 3.3713228702545166} -08/30/2021 16:01:25 - INFO - __main__ - Step 15372: {'lr': 0.000489997773496298, 'samples': 2951424, 'steps': 15371, 'loss/train': 3.7108395099639893} -08/30/2021 16:01:25 - INFO - __main__ - Step 15373: {'lr': 0.0004899962873917798, 'samples': 2951616, 'steps': 15372, 'loss/train': 2.2490532398223877} -08/30/2021 16:01:27 - INFO - __main__ - Step 15374: {'lr': 0.000489994801179123, 'samples': 2951808, 'steps': 15373, 'loss/train': 1.7610284090042114} -08/30/2021 16:01:27 - INFO - __main__ - Step 15375: {'lr': 0.0004899933148583284, 'samples': 2952000, 'steps': 15374, 'loss/train': 2.233377456665039} -08/30/2021 16:01:27 - INFO - __main__ - Step 15376: {'lr': 0.0004899918284293964, 'samples': 2952192, 'steps': 15375, 'loss/train': 1.900270938873291} -08/30/2021 16:01:28 - INFO - __main__ - Step 15377: {'lr': 0.0004899903418923278, 'samples': 2952384, 'steps': 15376, 'loss/train': 1.764028787612915} -08/30/2021 16:01:28 - INFO - __main__ - Step 15378: {'lr': 0.0004899888552471232, 'samples': 2952576, 'steps': 15377, 'loss/train': 1.6459065675735474} -08/30/2021 16:01:30 - INFO - __main__ - Step 15379: {'lr': 0.0004899873684937833, 'samples': 2952768, 'steps': 15378, 'loss/train': 1.967921257019043} -08/30/2021 16:01:30 - INFO - __main__ - Step 15380: {'lr': 0.0004899858816323089, 'samples': 2952960, 'steps': 15379, 'loss/train': 1.7271283864974976} -08/30/2021 16:01:30 - INFO - __main__ - Step 15381: {'lr': 0.0004899843946627006, 'samples': 2953152, 'steps': 15380, 'loss/train': 1.5563031435012817} -08/30/2021 16:01:31 - INFO - __main__ - Step 15382: {'lr': 0.0004899829075849589, 'samples': 2953344, 'steps': 15381, 'loss/train': 1.7910250425338745} -08/30/2021 16:01:31 - INFO - __main__ - Step 15383: {'lr': 0.0004899814203990847, 'samples': 2953536, 'steps': 15382, 'loss/train': 1.7405543327331543} -08/30/2021 16:01:33 - INFO - __main__ - Step 15384: {'lr': 0.0004899799331050785, 'samples': 2953728, 'steps': 15383, 'loss/train': 2.0326998233795166} -08/30/2021 16:01:33 - INFO - __main__ - Step 15385: {'lr': 0.0004899784457029411, 'samples': 2953920, 'steps': 15384, 'loss/train': 1.8632278442382812} -08/30/2021 16:01:34 - INFO - __main__ - Step 15386: {'lr': 0.000489976958192673, 'samples': 2954112, 'steps': 15385, 'loss/train': 1.770098328590393} -08/30/2021 16:01:34 - INFO - __main__ - Step 15387: {'lr': 0.0004899754705742752, 'samples': 2954304, 'steps': 15386, 'loss/train': 1.867549180984497} -08/30/2021 16:01:34 - INFO - __main__ - Step 15388: {'lr': 0.0004899739828477481, 'samples': 2954496, 'steps': 15387, 'loss/train': 1.5787196159362793} -08/30/2021 16:01:36 - INFO - __main__ - Step 15389: {'lr': 0.0004899724950130923, 'samples': 2954688, 'steps': 15388, 'loss/train': 1.854261040687561} -08/30/2021 16:01:36 - INFO - __main__ - Step 15390: {'lr': 0.0004899710070703087, 'samples': 2954880, 'steps': 15389, 'loss/train': 4.427979946136475} -08/30/2021 16:01:37 - INFO - __main__ - Step 15391: {'lr': 0.0004899695190193978, 'samples': 2955072, 'steps': 15390, 'loss/train': 1.817335605621338} -08/30/2021 16:01:37 - INFO - __main__ - Step 15392: {'lr': 0.0004899680308603604, 'samples': 2955264, 'steps': 15391, 'loss/train': 1.8148187398910522} -08/30/2021 16:01:37 - INFO - __main__ - Step 15393: {'lr': 0.000489966542593197, 'samples': 2955456, 'steps': 15392, 'loss/train': 1.0594487190246582} -08/30/2021 16:01:39 - INFO - __main__ - Step 15394: {'lr': 0.0004899650542179085, 'samples': 2955648, 'steps': 15393, 'loss/train': 1.8477115631103516} -08/30/2021 16:01:39 - INFO - __main__ - Step 15395: {'lr': 0.0004899635657344954, 'samples': 2955840, 'steps': 15394, 'loss/train': 0.6730448603630066} -08/30/2021 16:01:40 - INFO - __main__ - Step 15396: {'lr': 0.0004899620771429585, 'samples': 2956032, 'steps': 15395, 'loss/train': 1.3027268648147583} -08/30/2021 16:01:40 - INFO - __main__ - Step 15397: {'lr': 0.0004899605884432983, 'samples': 2956224, 'steps': 15396, 'loss/train': 2.2151174545288086} -08/30/2021 16:01:40 - INFO - __main__ - Step 15398: {'lr': 0.0004899590996355155, 'samples': 2956416, 'steps': 15397, 'loss/train': 1.4743446111679077} -08/30/2021 16:01:41 - INFO - __main__ - Step 15399: {'lr': 0.000489957610719611, 'samples': 2956608, 'steps': 15398, 'loss/train': 2.064164161682129} -08/30/2021 16:01:43 - INFO - __main__ - Step 15400: {'lr': 0.0004899561216955852, 'samples': 2956800, 'steps': 15399, 'loss/train': 1.038681149482727} -08/30/2021 16:01:43 - INFO - __main__ - Step 15401: {'lr': 0.0004899546325634388, 'samples': 2956992, 'steps': 15400, 'loss/train': 1.3875161409378052} -08/30/2021 16:01:43 - INFO - __main__ - Step 15402: {'lr': 0.0004899531433231728, 'samples': 2957184, 'steps': 15401, 'loss/train': 2.049558639526367} -08/30/2021 16:01:44 - INFO - __main__ - Step 15403: {'lr': 0.0004899516539747874, 'samples': 2957376, 'steps': 15402, 'loss/train': 2.8670461177825928} -08/30/2021 16:01:44 - INFO - __main__ - Step 15404: {'lr': 0.0004899501645182835, 'samples': 2957568, 'steps': 15403, 'loss/train': 1.763898491859436} -08/30/2021 16:01:47 - INFO - __main__ - Step 15405: {'lr': 0.0004899486749536618, 'samples': 2957760, 'steps': 15404, 'loss/train': 1.6202975511550903} -08/30/2021 16:01:47 - INFO - __main__ - Step 15406: {'lr': 0.000489947185280923, 'samples': 2957952, 'steps': 15405, 'loss/train': 1.525149941444397} -08/30/2021 16:01:47 - INFO - __main__ - Step 15407: {'lr': 0.0004899456955000676, 'samples': 2958144, 'steps': 15406, 'loss/train': 2.3715343475341797} -08/30/2021 16:01:48 - INFO - __main__ - Step 15408: {'lr': 0.0004899442056110964, 'samples': 2958336, 'steps': 15407, 'loss/train': 0.917862057685852} -08/30/2021 16:01:48 - INFO - __main__ - Step 15409: {'lr': 0.00048994271561401, 'samples': 2958528, 'steps': 15408, 'loss/train': 0.7670138478279114} -08/30/2021 16:01:48 - INFO - __main__ - Step 15410: {'lr': 0.0004899412255088091, 'samples': 2958720, 'steps': 15409, 'loss/train': 0.6514217853546143} -08/30/2021 16:01:50 - INFO - __main__ - Step 15411: {'lr': 0.0004899397352954945, 'samples': 2958912, 'steps': 15410, 'loss/train': 1.4594303369522095} -08/30/2021 16:01:50 - INFO - __main__ - Step 15412: {'lr': 0.0004899382449740667, 'samples': 2959104, 'steps': 15411, 'loss/train': 1.6789549589157104} -08/30/2021 16:01:51 - INFO - __main__ - Step 15413: {'lr': 0.0004899367545445264, 'samples': 2959296, 'steps': 15412, 'loss/train': 1.2324168682098389} -08/30/2021 16:01:51 - INFO - __main__ - Step 15414: {'lr': 0.0004899352640068743, 'samples': 2959488, 'steps': 15413, 'loss/train': 1.689152717590332} -08/30/2021 16:01:51 - INFO - __main__ - Step 15415: {'lr': 0.0004899337733611113, 'samples': 2959680, 'steps': 15414, 'loss/train': 2.1103951930999756} -08/30/2021 16:01:53 - INFO - __main__ - Step 15416: {'lr': 0.0004899322826072375, 'samples': 2959872, 'steps': 15415, 'loss/train': 1.8710706233978271} -08/30/2021 16:01:54 - INFO - __main__ - Step 15417: {'lr': 0.0004899307917452542, 'samples': 2960064, 'steps': 15416, 'loss/train': 2.642216205596924} -08/30/2021 16:01:54 - INFO - __main__ - Step 15418: {'lr': 0.0004899293007751616, 'samples': 2960256, 'steps': 15417, 'loss/train': 1.8343582153320312} -08/30/2021 16:01:54 - INFO - __main__ - Step 15419: {'lr': 0.0004899278096969605, 'samples': 2960448, 'steps': 15418, 'loss/train': 2.05309796333313} -08/30/2021 16:01:55 - INFO - __main__ - Step 15420: {'lr': 0.0004899263185106518, 'samples': 2960640, 'steps': 15419, 'loss/train': 1.5433604717254639} -08/30/2021 16:01:55 - INFO - __main__ - Step 15421: {'lr': 0.000489924827216236, 'samples': 2960832, 'steps': 15420, 'loss/train': 2.4911468029022217} -08/30/2021 16:01:57 - INFO - __main__ - Step 15422: {'lr': 0.0004899233358137137, 'samples': 2961024, 'steps': 15421, 'loss/train': 2.5839223861694336} -08/30/2021 16:01:57 - INFO - __main__ - Step 15423: {'lr': 0.0004899218443030857, 'samples': 2961216, 'steps': 15422, 'loss/train': 1.6599600315093994} -08/30/2021 16:01:57 - INFO - __main__ - Step 15424: {'lr': 0.0004899203526843526, 'samples': 2961408, 'steps': 15423, 'loss/train': 2.8455517292022705} -08/30/2021 16:01:58 - INFO - __main__ - Step 15425: {'lr': 0.000489918860957515, 'samples': 2961600, 'steps': 15424, 'loss/train': 1.2354341745376587} -08/30/2021 16:01:58 - INFO - __main__ - Step 15426: {'lr': 0.0004899173691225737, 'samples': 2961792, 'steps': 15425, 'loss/train': 1.9968653917312622} -08/30/2021 16:02:00 - INFO - __main__ - Step 15427: {'lr': 0.0004899158771795295, 'samples': 2961984, 'steps': 15426, 'loss/train': 1.388020634651184} -08/30/2021 16:02:00 - INFO - __main__ - Step 15428: {'lr': 0.0004899143851283827, 'samples': 2962176, 'steps': 15427, 'loss/train': 1.0337297916412354} -08/30/2021 16:02:01 - INFO - __main__ - Step 15429: {'lr': 0.0004899128929691343, 'samples': 2962368, 'steps': 15428, 'loss/train': 0.4183272421360016} -08/30/2021 16:02:01 - INFO - __main__ - Step 15430: {'lr': 0.0004899114007017849, 'samples': 2962560, 'steps': 15429, 'loss/train': 1.970598578453064} -08/30/2021 16:02:02 - INFO - __main__ - Step 15431: {'lr': 0.000489909908326335, 'samples': 2962752, 'steps': 15430, 'loss/train': 1.612714171409607} -08/30/2021 16:02:03 - INFO - __main__ - Step 15432: {'lr': 0.0004899084158427855, 'samples': 2962944, 'steps': 15431, 'loss/train': 1.9569873809814453} -08/30/2021 16:02:03 - INFO - __main__ - Step 15433: {'lr': 0.0004899069232511368, 'samples': 2963136, 'steps': 15432, 'loss/train': 1.9313437938690186} -08/30/2021 16:02:04 - INFO - __main__ - Step 15434: {'lr': 0.0004899054305513899, 'samples': 2963328, 'steps': 15433, 'loss/train': 1.5398770570755005} -08/30/2021 16:02:04 - INFO - __main__ - Step 15435: {'lr': 0.0004899039377435452, 'samples': 2963520, 'steps': 15434, 'loss/train': 1.5831071138381958} -08/30/2021 16:02:04 - INFO - __main__ - Step 15436: {'lr': 0.0004899024448276036, 'samples': 2963712, 'steps': 15435, 'loss/train': 1.657619833946228} -08/30/2021 16:02:06 - INFO - __main__ - Step 15437: {'lr': 0.0004899009518035657, 'samples': 2963904, 'steps': 15436, 'loss/train': 1.9374465942382812} -08/30/2021 16:02:06 - INFO - __main__ - Step 15438: {'lr': 0.000489899458671432, 'samples': 2964096, 'steps': 15437, 'loss/train': 1.7268048524856567} -08/30/2021 16:02:07 - INFO - __main__ - Step 15439: {'lr': 0.0004898979654312034, 'samples': 2964288, 'steps': 15438, 'loss/train': 2.1226131916046143} -08/30/2021 16:02:07 - INFO - __main__ - Step 15440: {'lr': 0.0004898964720828804, 'samples': 2964480, 'steps': 15439, 'loss/train': 1.9830279350280762} -08/30/2021 16:02:07 - INFO - __main__ - Step 15441: {'lr': 0.0004898949786264638, 'samples': 2964672, 'steps': 15440, 'loss/train': 1.5021300315856934} -08/30/2021 16:02:08 - INFO - __main__ - Step 15442: {'lr': 0.0004898934850619542, 'samples': 2964864, 'steps': 15441, 'loss/train': 1.5217854976654053} -08/30/2021 16:02:09 - INFO - __main__ - Step 15443: {'lr': 0.0004898919913893522, 'samples': 2965056, 'steps': 15442, 'loss/train': 1.356797456741333} -08/30/2021 16:02:10 - INFO - __main__ - Step 15444: {'lr': 0.0004898904976086588, 'samples': 2965248, 'steps': 15443, 'loss/train': 1.2115391492843628} -08/30/2021 16:02:10 - INFO - __main__ - Step 15445: {'lr': 0.0004898890037198743, 'samples': 2965440, 'steps': 15444, 'loss/train': 2.0368924140930176} -08/30/2021 16:02:11 - INFO - __main__ - Step 15446: {'lr': 0.0004898875097229995, 'samples': 2965632, 'steps': 15445, 'loss/train': 1.4779425859451294} -08/30/2021 16:02:11 - INFO - __main__ - Step 15447: {'lr': 0.0004898860156180351, 'samples': 2965824, 'steps': 15446, 'loss/train': 0.7495663166046143} -08/30/2021 16:02:12 - INFO - __main__ - Step 15448: {'lr': 0.0004898845214049818, 'samples': 2966016, 'steps': 15447, 'loss/train': 1.6176329851150513} -08/30/2021 16:02:13 - INFO - __main__ - Step 15449: {'lr': 0.0004898830270838403, 'samples': 2966208, 'steps': 15448, 'loss/train': 1.2131174802780151} -08/30/2021 16:02:13 - INFO - __main__ - Step 15450: {'lr': 0.0004898815326546111, 'samples': 2966400, 'steps': 15449, 'loss/train': 1.6455386877059937} -08/30/2021 16:02:14 - INFO - __main__ - Step 15451: {'lr': 0.0004898800381172951, 'samples': 2966592, 'steps': 15450, 'loss/train': 1.2084242105484009} -08/30/2021 16:02:14 - INFO - __main__ - Step 15452: {'lr': 0.0004898785434718927, 'samples': 2966784, 'steps': 15451, 'loss/train': 1.802215337753296} -08/30/2021 16:02:16 - INFO - __main__ - Step 15453: {'lr': 0.0004898770487184047, 'samples': 2966976, 'steps': 15452, 'loss/train': 1.7267192602157593} -08/30/2021 16:02:16 - INFO - __main__ - Step 15454: {'lr': 0.000489875553856832, 'samples': 2967168, 'steps': 15453, 'loss/train': 2.06032133102417} -08/30/2021 16:02:16 - INFO - __main__ - Step 15455: {'lr': 0.000489874058887175, 'samples': 2967360, 'steps': 15454, 'loss/train': 2.269136428833008} -08/30/2021 16:02:17 - INFO - __main__ - Step 15456: {'lr': 0.0004898725638094345, 'samples': 2967552, 'steps': 15455, 'loss/train': 1.7237387895584106} -08/30/2021 16:02:17 - INFO - __main__ - Step 15457: {'lr': 0.0004898710686236109, 'samples': 2967744, 'steps': 15456, 'loss/train': 2.390012264251709} -08/30/2021 16:02:17 - INFO - __main__ - Step 15458: {'lr': 0.0004898695733297054, 'samples': 2967936, 'steps': 15457, 'loss/train': 1.067933201789856} -08/30/2021 16:02:19 - INFO - __main__ - Step 15459: {'lr': 0.0004898680779277182, 'samples': 2968128, 'steps': 15458, 'loss/train': 1.0919665098190308} -08/30/2021 16:02:20 - INFO - __main__ - Step 15460: {'lr': 0.0004898665824176502, 'samples': 2968320, 'steps': 15459, 'loss/train': 1.6166990995407104} -08/30/2021 16:02:20 - INFO - __main__ - Step 15461: {'lr': 0.000489865086799502, 'samples': 2968512, 'steps': 15460, 'loss/train': 6.107758045196533} -08/30/2021 16:02:21 - INFO - __main__ - Step 15462: {'lr': 0.0004898635910732743, 'samples': 2968704, 'steps': 15461, 'loss/train': 1.7005637884140015} -08/30/2021 16:02:21 - INFO - __main__ - Step 15463: {'lr': 0.0004898620952389677, 'samples': 2968896, 'steps': 15462, 'loss/train': 1.6844971179962158} -08/30/2021 16:02:22 - INFO - __main__ - Step 15464: {'lr': 0.000489860599296583, 'samples': 2969088, 'steps': 15463, 'loss/train': 1.0527204275131226} -08/30/2021 16:02:23 - INFO - __main__ - Step 15465: {'lr': 0.0004898591032461208, 'samples': 2969280, 'steps': 15464, 'loss/train': 0.9791547060012817} -08/30/2021 16:02:23 - INFO - __main__ - Step 15466: {'lr': 0.0004898576070875818, 'samples': 2969472, 'steps': 15465, 'loss/train': 1.6744648218154907} -08/30/2021 16:02:24 - INFO - __main__ - Step 15467: {'lr': 0.0004898561108209667, 'samples': 2969664, 'steps': 15466, 'loss/train': 1.3549813032150269} -08/30/2021 16:02:24 - INFO - __main__ - Step 15468: {'lr': 0.0004898546144462762, 'samples': 2969856, 'steps': 15467, 'loss/train': 1.7299755811691284} -08/30/2021 16:02:25 - INFO - __main__ - Step 15469: {'lr': 0.0004898531179635108, 'samples': 2970048, 'steps': 15468, 'loss/train': 2.0573878288269043} -08/30/2021 16:02:26 - INFO - __main__ - Step 15470: {'lr': 0.0004898516213726712, 'samples': 2970240, 'steps': 15469, 'loss/train': 1.1556767225265503} -08/30/2021 16:02:26 - INFO - __main__ - Step 15471: {'lr': 0.0004898501246737583, 'samples': 2970432, 'steps': 15470, 'loss/train': 1.9659992456436157} -08/30/2021 16:02:26 - INFO - __main__ - Step 15472: {'lr': 0.0004898486278667725, 'samples': 2970624, 'steps': 15471, 'loss/train': 2.3629324436187744} -08/30/2021 16:02:27 - INFO - __main__ - Step 15473: {'lr': 0.0004898471309517148, 'samples': 2970816, 'steps': 15472, 'loss/train': 1.8187549114227295} -08/30/2021 16:02:29 - INFO - __main__ - Step 15474: {'lr': 0.0004898456339285857, 'samples': 2971008, 'steps': 15473, 'loss/train': 1.479103446006775} -08/30/2021 16:02:29 - INFO - __main__ - Step 15475: {'lr': 0.0004898441367973856, 'samples': 2971200, 'steps': 15474, 'loss/train': 1.9135509729385376} -08/30/2021 16:02:30 - INFO - __main__ - Step 15476: {'lr': 0.0004898426395581156, 'samples': 2971392, 'steps': 15475, 'loss/train': 1.8636592626571655} -08/30/2021 16:02:30 - INFO - __main__ - Step 15477: {'lr': 0.0004898411422107762, 'samples': 2971584, 'steps': 15476, 'loss/train': 1.3952314853668213} -08/30/2021 16:02:31 - INFO - __main__ - Step 15478: {'lr': 0.0004898396447553681, 'samples': 2971776, 'steps': 15477, 'loss/train': 2.1136181354522705} -08/30/2021 16:02:31 - INFO - __main__ - Step 15479: {'lr': 0.000489838147191892, 'samples': 2971968, 'steps': 15478, 'loss/train': 1.599002718925476} -08/30/2021 16:02:31 - INFO - __main__ - Step 15480: {'lr': 0.0004898366495203483, 'samples': 2972160, 'steps': 15479, 'loss/train': 1.0923447608947754} -08/30/2021 16:02:34 - INFO - __main__ - Step 15481: {'lr': 0.0004898351517407381, 'samples': 2972352, 'steps': 15480, 'loss/train': 0.9394541382789612} -08/30/2021 16:02:35 - INFO - __main__ - Step 15482: {'lr': 0.0004898336538530619, 'samples': 2972544, 'steps': 15481, 'loss/train': 1.670491337776184} -08/30/2021 16:02:35 - INFO - __main__ - Step 15483: {'lr': 0.0004898321558573203, 'samples': 2972736, 'steps': 15482, 'loss/train': 1.520904302597046} -08/30/2021 16:02:35 - INFO - __main__ - Step 15484: {'lr': 0.000489830657753514, 'samples': 2972928, 'steps': 15483, 'loss/train': 0.9412619471549988} -08/30/2021 16:02:36 - INFO - __main__ - Step 15485: {'lr': 0.0004898291595416438, 'samples': 2973120, 'steps': 15484, 'loss/train': 1.2993401288986206} -08/30/2021 16:02:36 - INFO - __main__ - Step 15486: {'lr': 0.0004898276612217102, 'samples': 2973312, 'steps': 15485, 'loss/train': 3.5321402549743652} -08/30/2021 16:02:36 - INFO - __main__ - Step 15487: {'lr': 0.0004898261627937139, 'samples': 2973504, 'steps': 15486, 'loss/train': 4.29628324508667} -08/30/2021 16:02:37 - INFO - __main__ - Step 15488: {'lr': 0.0004898246642576559, 'samples': 2973696, 'steps': 15487, 'loss/train': 4.206449508666992} -08/30/2021 16:02:38 - INFO - __main__ - Step 15489: {'lr': 0.0004898231656135362, 'samples': 2973888, 'steps': 15488, 'loss/train': 3.173597812652588} -08/30/2021 16:02:39 - INFO - __main__ - Step 15490: {'lr': 0.0004898216668613562, 'samples': 2974080, 'steps': 15489, 'loss/train': 2.2753357887268066} -08/30/2021 16:02:39 - INFO - __main__ - Step 15491: {'lr': 0.0004898201680011161, 'samples': 2974272, 'steps': 15490, 'loss/train': 1.9113277196884155} -08/30/2021 16:02:39 - INFO - __main__ - Step 15492: {'lr': 0.0004898186690328168, 'samples': 2974464, 'steps': 15491, 'loss/train': 1.8918006420135498} -08/30/2021 16:02:40 - INFO - __main__ - Step 15493: {'lr': 0.000489817169956459, 'samples': 2974656, 'steps': 15492, 'loss/train': 1.9345825910568237} -08/30/2021 16:02:42 - INFO - __main__ - Step 15494: {'lr': 0.0004898156707720432, 'samples': 2974848, 'steps': 15493, 'loss/train': 2.1934449672698975} -08/30/2021 16:02:42 - INFO - __main__ - Step 15495: {'lr': 0.0004898141714795701, 'samples': 2975040, 'steps': 15494, 'loss/train': 1.4573293924331665} -08/30/2021 16:02:43 - INFO - __main__ - Step 15496: {'lr': 0.0004898126720790405, 'samples': 2975232, 'steps': 15495, 'loss/train': 2.0083725452423096} -08/30/2021 16:02:43 - INFO - __main__ - Step 15497: {'lr': 0.0004898111725704549, 'samples': 2975424, 'steps': 15496, 'loss/train': 2.119008779525757} -08/30/2021 16:02:43 - INFO - __main__ - Step 15498: {'lr': 0.0004898096729538142, 'samples': 2975616, 'steps': 15497, 'loss/train': 1.5298768281936646} -08/30/2021 16:02:44 - INFO - __main__ - Step 15499: {'lr': 0.000489808173229119, 'samples': 2975808, 'steps': 15498, 'loss/train': 2.387995958328247} -08/30/2021 16:02:44 - INFO - __main__ - Step 15500: {'lr': 0.0004898066733963699, 'samples': 2976000, 'steps': 15499, 'loss/train': 1.9597584009170532} -08/30/2021 16:02:45 - INFO - __main__ - Step 15501: {'lr': 0.0004898051734555676, 'samples': 2976192, 'steps': 15500, 'loss/train': 2.040754795074463} -08/30/2021 16:02:46 - INFO - __main__ - Step 15502: {'lr': 0.0004898036734067127, 'samples': 2976384, 'steps': 15501, 'loss/train': 1.9665862321853638} -08/30/2021 16:02:46 - INFO - __main__ - Step 15503: {'lr': 0.000489802173249806, 'samples': 2976576, 'steps': 15502, 'loss/train': 1.9422433376312256} -08/30/2021 16:02:47 - INFO - __main__ - Step 15504: {'lr': 0.0004898006729848482, 'samples': 2976768, 'steps': 15503, 'loss/train': 2.226653575897217} -08/30/2021 16:02:47 - INFO - __main__ - Step 15505: {'lr': 0.0004897991726118399, 'samples': 2976960, 'steps': 15504, 'loss/train': 2.4603707790374756} -08/30/2021 16:02:49 - INFO - __main__ - Step 15506: {'lr': 0.0004897976721307818, 'samples': 2977152, 'steps': 15505, 'loss/train': 1.1228480339050293} -08/30/2021 16:02:49 - INFO - __main__ - Step 15507: {'lr': 0.0004897961715416746, 'samples': 2977344, 'steps': 15506, 'loss/train': 1.8973417282104492} -08/30/2021 16:02:50 - INFO - __main__ - Step 15508: {'lr': 0.0004897946708445189, 'samples': 2977536, 'steps': 15507, 'loss/train': 4.241513729095459} -08/30/2021 16:02:50 - INFO - __main__ - Step 15509: {'lr': 0.0004897931700393154, 'samples': 2977728, 'steps': 15508, 'loss/train': 2.953615665435791} -08/30/2021 16:02:50 - INFO - __main__ - Step 15510: {'lr': 0.0004897916691260648, 'samples': 2977920, 'steps': 15509, 'loss/train': 2.6631486415863037} -08/30/2021 16:02:51 - INFO - __main__ - Step 15511: {'lr': 0.0004897901681047679, 'samples': 2978112, 'steps': 15510, 'loss/train': 1.7656136751174927} -08/30/2021 16:02:53 - INFO - __main__ - Step 15512: {'lr': 0.0004897886669754251, 'samples': 2978304, 'steps': 15511, 'loss/train': 1.8558725118637085} -08/30/2021 16:02:53 - INFO - __main__ - Step 15513: {'lr': 0.0004897871657380373, 'samples': 2978496, 'steps': 15512, 'loss/train': 2.337657928466797} -08/30/2021 16:02:54 - INFO - __main__ - Step 15514: {'lr': 0.0004897856643926051, 'samples': 2978688, 'steps': 15513, 'loss/train': 2.785068988800049} -08/30/2021 16:02:54 - INFO - __main__ - Step 15515: {'lr': 0.0004897841629391291, 'samples': 2978880, 'steps': 15514, 'loss/train': 2.09179949760437} -08/30/2021 16:02:54 - INFO - __main__ - Step 15516: {'lr': 0.0004897826613776101, 'samples': 2979072, 'steps': 15515, 'loss/train': 2.7315292358398438} -08/30/2021 16:02:56 - INFO - __main__ - Step 15517: {'lr': 0.0004897811597080488, 'samples': 2979264, 'steps': 15516, 'loss/train': 2.242156744003296} -08/30/2021 16:02:56 - INFO - __main__ - Step 15518: {'lr': 0.0004897796579304458, 'samples': 2979456, 'steps': 15517, 'loss/train': 2.1583588123321533} -08/30/2021 16:02:57 - INFO - __main__ - Step 15519: {'lr': 0.0004897781560448017, 'samples': 2979648, 'steps': 15518, 'loss/train': 1.82471764087677} -08/30/2021 16:02:57 - INFO - __main__ - Step 15520: {'lr': 0.0004897766540511173, 'samples': 2979840, 'steps': 15519, 'loss/train': 0.4177507758140564} -08/30/2021 16:02:57 - INFO - __main__ - Step 15521: {'lr': 0.0004897751519493933, 'samples': 2980032, 'steps': 15520, 'loss/train': 2.0823662281036377} -08/30/2021 16:02:58 - INFO - __main__ - Step 15522: {'lr': 0.0004897736497396303, 'samples': 2980224, 'steps': 15521, 'loss/train': 2.7419381141662598} -08/30/2021 16:03:00 - INFO - __main__ - Step 15523: {'lr': 0.000489772147421829, 'samples': 2980416, 'steps': 15522, 'loss/train': 2.4459147453308105} -08/30/2021 16:03:00 - INFO - __main__ - Step 15524: {'lr': 0.0004897706449959899, 'samples': 2980608, 'steps': 15523, 'loss/train': 2.3358840942382812} -08/30/2021 16:03:00 - INFO - __main__ - Step 15525: {'lr': 0.000489769142462114, 'samples': 2980800, 'steps': 15524, 'loss/train': 1.6837490797042847} -08/30/2021 16:03:01 - INFO - __main__ - Step 15526: {'lr': 0.0004897676398202018, 'samples': 2980992, 'steps': 15525, 'loss/train': 2.7207229137420654} -08/30/2021 16:03:01 - INFO - __main__ - Step 15527: {'lr': 0.000489766137070254, 'samples': 2981184, 'steps': 15526, 'loss/train': 1.6504679918289185} -08/30/2021 16:03:02 - INFO - __main__ - Step 15528: {'lr': 0.0004897646342122713, 'samples': 2981376, 'steps': 15527, 'loss/train': 0.8819839954376221} -08/30/2021 16:03:03 - INFO - __main__ - Step 15529: {'lr': 0.0004897631312462544, 'samples': 2981568, 'steps': 15528, 'loss/train': 1.7353520393371582} -08/30/2021 16:03:03 - INFO - __main__ - Step 15530: {'lr': 0.0004897616281722038, 'samples': 2981760, 'steps': 15529, 'loss/train': 2.0722784996032715} -08/30/2021 16:03:04 - INFO - __main__ - Step 15531: {'lr': 0.0004897601249901204, 'samples': 2981952, 'steps': 15530, 'loss/train': 1.614208698272705} -08/30/2021 16:03:04 - INFO - __main__ - Step 15532: {'lr': 0.0004897586217000047, 'samples': 2982144, 'steps': 15531, 'loss/train': 2.2137129306793213} -08/30/2021 16:03:06 - INFO - __main__ - Step 15533: {'lr': 0.0004897571183018576, 'samples': 2982336, 'steps': 15532, 'loss/train': 2.5601062774658203} -08/30/2021 16:03:06 - INFO - __main__ - Step 15534: {'lr': 0.0004897556147956796, 'samples': 2982528, 'steps': 15533, 'loss/train': 1.969010591506958} -08/30/2021 16:03:06 - INFO - __main__ - Step 15535: {'lr': 0.0004897541111814714, 'samples': 2982720, 'steps': 15534, 'loss/train': 1.4815599918365479} -08/30/2021 16:03:07 - INFO - __main__ - Step 15536: {'lr': 0.0004897526074592337, 'samples': 2982912, 'steps': 15535, 'loss/train': 2.658247470855713} -08/30/2021 16:03:07 - INFO - __main__ - Step 15537: {'lr': 0.0004897511036289671, 'samples': 2983104, 'steps': 15536, 'loss/train': 1.8597320318222046} -08/30/2021 16:03:09 - INFO - __main__ - Step 15538: {'lr': 0.0004897495996906725, 'samples': 2983296, 'steps': 15537, 'loss/train': 1.9959858655929565} -08/30/2021 16:03:09 - INFO - __main__ - Step 15539: {'lr': 0.0004897480956443503, 'samples': 2983488, 'steps': 15538, 'loss/train': 1.9335285425186157} -08/30/2021 16:03:10 - INFO - __main__ - Step 15540: {'lr': 0.0004897465914900013, 'samples': 2983680, 'steps': 15539, 'loss/train': 2.258700370788574} -08/30/2021 16:03:10 - INFO - __main__ - Step 15541: {'lr': 0.0004897450872276263, 'samples': 2983872, 'steps': 15540, 'loss/train': 1.6229095458984375} -08/30/2021 16:03:10 - INFO - __main__ - Step 15542: {'lr': 0.0004897435828572258, 'samples': 2984064, 'steps': 15541, 'loss/train': 1.8740934133529663} -08/30/2021 16:03:11 - INFO - __main__ - Step 15543: {'lr': 0.0004897420783788006, 'samples': 2984256, 'steps': 15542, 'loss/train': 0.48658761382102966} -08/30/2021 16:03:12 - INFO - __main__ - Step 15544: {'lr': 0.0004897405737923511, 'samples': 2984448, 'steps': 15543, 'loss/train': 1.3301993608474731} -08/30/2021 16:03:13 - INFO - __main__ - Step 15545: {'lr': 0.0004897390690978785, 'samples': 2984640, 'steps': 15544, 'loss/train': 2.144516944885254} -08/30/2021 16:03:13 - INFO - __main__ - Step 15546: {'lr': 0.000489737564295383, 'samples': 2984832, 'steps': 15545, 'loss/train': 1.8909426927566528} -08/30/2021 16:03:13 - INFO - __main__ - Step 15547: {'lr': 0.0004897360593848655, 'samples': 2985024, 'steps': 15546, 'loss/train': 2.0608294010162354} -08/30/2021 16:03:14 - INFO - __main__ - Step 15548: {'lr': 0.0004897345543663266, 'samples': 2985216, 'steps': 15547, 'loss/train': 1.966789722442627} -08/30/2021 16:03:15 - INFO - __main__ - Step 15549: {'lr': 0.000489733049239767, 'samples': 2985408, 'steps': 15548, 'loss/train': 2.0603878498077393} -08/30/2021 16:03:16 - INFO - __main__ - Step 15550: {'lr': 0.0004897315440051874, 'samples': 2985600, 'steps': 15549, 'loss/train': 1.5398551225662231} -08/30/2021 16:03:16 - INFO - __main__ - Step 15551: {'lr': 0.0004897300386625885, 'samples': 2985792, 'steps': 15550, 'loss/train': 1.3343030214309692} -08/30/2021 16:03:16 - INFO - __main__ - Step 15552: {'lr': 0.0004897285332119709, 'samples': 2985984, 'steps': 15551, 'loss/train': 1.5717535018920898} -08/30/2021 16:03:17 - INFO - __main__ - Step 15553: {'lr': 0.0004897270276533355, 'samples': 2986176, 'steps': 15552, 'loss/train': 1.6205661296844482} -08/30/2021 16:03:18 - INFO - __main__ - Step 15554: {'lr': 0.0004897255219866825, 'samples': 2986368, 'steps': 15553, 'loss/train': 1.9927802085876465} -08/30/2021 16:03:19 - INFO - __main__ - Step 15555: {'lr': 0.000489724016212013, 'samples': 2986560, 'steps': 15554, 'loss/train': 2.115006446838379} -08/30/2021 16:03:19 - INFO - __main__ - Step 15556: {'lr': 0.0004897225103293277, 'samples': 2986752, 'steps': 15555, 'loss/train': 1.4051820039749146} -08/30/2021 16:03:19 - INFO - __main__ - Step 15557: {'lr': 0.0004897210043386269, 'samples': 2986944, 'steps': 15556, 'loss/train': 1.575562834739685} -08/30/2021 16:03:20 - INFO - __main__ - Step 15558: {'lr': 0.0004897194982399117, 'samples': 2987136, 'steps': 15557, 'loss/train': 1.874578595161438} -08/30/2021 16:03:21 - INFO - __main__ - Step 15559: {'lr': 0.0004897179920331826, 'samples': 2987328, 'steps': 15558, 'loss/train': 1.6472991704940796} -08/30/2021 16:03:22 - INFO - __main__ - Step 15560: {'lr': 0.0004897164857184401, 'samples': 2987520, 'steps': 15559, 'loss/train': 1.7609413862228394} -08/30/2021 16:03:22 - INFO - __main__ - Step 15561: {'lr': 0.0004897149792956852, 'samples': 2987712, 'steps': 15560, 'loss/train': 2.2637219429016113} -08/30/2021 16:03:22 - INFO - __main__ - Step 15562: {'lr': 0.0004897134727649184, 'samples': 2987904, 'steps': 15561, 'loss/train': 1.636091947555542} -08/30/2021 16:03:23 - INFO - __main__ - Step 15563: {'lr': 0.0004897119661261403, 'samples': 2988096, 'steps': 15562, 'loss/train': 1.4694645404815674} -08/30/2021 16:03:24 - INFO - __main__ - Step 15564: {'lr': 0.0004897104593793518, 'samples': 2988288, 'steps': 15563, 'loss/train': 1.817311406135559} -08/30/2021 16:03:25 - INFO - __main__ - Step 15565: {'lr': 0.0004897089525245535, 'samples': 2988480, 'steps': 15564, 'loss/train': 2.0266592502593994} -08/30/2021 16:03:25 - INFO - __main__ - Step 15566: {'lr': 0.000489707445561746, 'samples': 2988672, 'steps': 15565, 'loss/train': 1.5361164808273315} -08/30/2021 16:03:25 - INFO - __main__ - Step 15567: {'lr': 0.0004897059384909299, 'samples': 2988864, 'steps': 15566, 'loss/train': 2.2441718578338623} -08/30/2021 16:03:26 - INFO - __main__ - Step 15568: {'lr': 0.0004897044313121061, 'samples': 2989056, 'steps': 15567, 'loss/train': 1.7525969743728638} -08/30/2021 16:03:28 - INFO - __main__ - Step 15569: {'lr': 0.0004897029240252753, 'samples': 2989248, 'steps': 15568, 'loss/train': 2.4664337635040283} -08/30/2021 16:03:28 - INFO - __main__ - Step 15570: {'lr': 0.000489701416630438, 'samples': 2989440, 'steps': 15569, 'loss/train': 1.9209808111190796} -08/30/2021 16:03:29 - INFO - __main__ - Step 15571: {'lr': 0.0004896999091275948, 'samples': 2989632, 'steps': 15570, 'loss/train': 0.6832961440086365} -08/30/2021 16:03:29 - INFO - __main__ - Step 15572: {'lr': 0.0004896984015167466, 'samples': 2989824, 'steps': 15571, 'loss/train': 1.6293202638626099} -08/30/2021 16:03:29 - INFO - __main__ - Step 15573: {'lr': 0.0004896968937978941, 'samples': 2990016, 'steps': 15572, 'loss/train': 1.7801684141159058} -08/30/2021 16:03:31 - INFO - __main__ - Step 15574: {'lr': 0.0004896953859710379, 'samples': 2990208, 'steps': 15573, 'loss/train': 1.8957176208496094} -08/30/2021 16:03:31 - INFO - __main__ - Step 15575: {'lr': 0.0004896938780361784, 'samples': 2990400, 'steps': 15574, 'loss/train': 1.351629614830017} -08/30/2021 16:03:32 - INFO - __main__ - Step 15576: {'lr': 0.0004896923699933167, 'samples': 2990592, 'steps': 15575, 'loss/train': 1.7757244110107422} -08/30/2021 16:03:32 - INFO - __main__ - Step 15577: {'lr': 0.0004896908618424533, 'samples': 2990784, 'steps': 15576, 'loss/train': 0.904737651348114} -08/30/2021 16:03:32 - INFO - __main__ - Step 15578: {'lr': 0.0004896893535835889, 'samples': 2990976, 'steps': 15577, 'loss/train': 1.9108182191848755} -08/30/2021 16:03:34 - INFO - __main__ - Step 15579: {'lr': 0.0004896878452167241, 'samples': 2991168, 'steps': 15578, 'loss/train': 1.9039455652236938} -08/30/2021 16:03:35 - INFO - __main__ - Step 15580: {'lr': 0.0004896863367418598, 'samples': 2991360, 'steps': 15579, 'loss/train': 1.4533703327178955} -08/30/2021 16:03:35 - INFO - __main__ - Step 15581: {'lr': 0.0004896848281589966, 'samples': 2991552, 'steps': 15580, 'loss/train': 1.8411744832992554} -08/30/2021 16:03:35 - INFO - __main__ - Step 15582: {'lr': 0.0004896833194681349, 'samples': 2991744, 'steps': 15581, 'loss/train': 1.028562307357788} -08/30/2021 16:03:36 - INFO - __main__ - Step 15583: {'lr': 0.0004896818106692757, 'samples': 2991936, 'steps': 15582, 'loss/train': 1.3289109468460083} -08/30/2021 16:03:36 - INFO - __main__ - Step 15584: {'lr': 0.0004896803017624196, 'samples': 2992128, 'steps': 15583, 'loss/train': 2.1643829345703125} -08/30/2021 16:03:38 - INFO - __main__ - Step 15585: {'lr': 0.0004896787927475671, 'samples': 2992320, 'steps': 15584, 'loss/train': 1.8471970558166504} -08/30/2021 16:03:38 - INFO - __main__ - Step 15586: {'lr': 0.0004896772836247192, 'samples': 2992512, 'steps': 15585, 'loss/train': 0.6814278960227966} -08/30/2021 16:03:38 - INFO - __main__ - Step 15587: {'lr': 0.0004896757743938764, 'samples': 2992704, 'steps': 15586, 'loss/train': 1.236244559288025} -08/30/2021 16:03:39 - INFO - __main__ - Step 15588: {'lr': 0.0004896742650550393, 'samples': 2992896, 'steps': 15587, 'loss/train': 0.9975184202194214} -08/30/2021 16:03:39 - INFO - __main__ - Step 15589: {'lr': 0.0004896727556082086, 'samples': 2993088, 'steps': 15588, 'loss/train': 1.2266881465911865} -08/30/2021 16:03:41 - INFO - __main__ - Step 15590: {'lr': 0.0004896712460533854, 'samples': 2993280, 'steps': 15589, 'loss/train': 1.6080315113067627} -08/30/2021 16:03:41 - INFO - __main__ - Step 15591: {'lr': 0.0004896697363905697, 'samples': 2993472, 'steps': 15590, 'loss/train': 1.8571051359176636} -08/30/2021 16:03:41 - INFO - __main__ - Step 15592: {'lr': 0.0004896682266197626, 'samples': 2993664, 'steps': 15591, 'loss/train': 1.597836971282959} -08/30/2021 16:03:42 - INFO - __main__ - Step 15593: {'lr': 0.0004896667167409648, 'samples': 2993856, 'steps': 15592, 'loss/train': 1.7377614974975586} -08/30/2021 16:03:42 - INFO - __main__ - Step 15594: {'lr': 0.0004896652067541767, 'samples': 2994048, 'steps': 15593, 'loss/train': 2.089097738265991} -08/30/2021 16:03:44 - INFO - __main__ - Step 15595: {'lr': 0.0004896636966593993, 'samples': 2994240, 'steps': 15594, 'loss/train': 1.5005847215652466} -08/30/2021 16:03:44 - INFO - __main__ - Step 15596: {'lr': 0.0004896621864566331, 'samples': 2994432, 'steps': 15595, 'loss/train': 1.8175733089447021} -08/30/2021 16:03:44 - INFO - __main__ - Step 15597: {'lr': 0.0004896606761458788, 'samples': 2994624, 'steps': 15596, 'loss/train': 2.0225472450256348} -08/30/2021 16:03:45 - INFO - __main__ - Step 15598: {'lr': 0.0004896591657271371, 'samples': 2994816, 'steps': 15597, 'loss/train': 1.8359782695770264} -08/30/2021 16:03:45 - INFO - __main__ - Step 15599: {'lr': 0.0004896576552004087, 'samples': 2995008, 'steps': 15598, 'loss/train': 1.9440196752548218} -08/30/2021 16:03:47 - INFO - __main__ - Step 15600: {'lr': 0.0004896561445656943, 'samples': 2995200, 'steps': 15599, 'loss/train': 1.7889635562896729} -08/30/2021 16:03:47 - INFO - __main__ - Step 15601: {'lr': 0.0004896546338229945, 'samples': 2995392, 'steps': 15600, 'loss/train': 1.71900475025177} -08/30/2021 16:03:47 - INFO - __main__ - Step 15602: {'lr': 0.00048965312297231, 'samples': 2995584, 'steps': 15601, 'loss/train': 1.3022347688674927} -08/30/2021 16:03:48 - INFO - __main__ - Step 15603: {'lr': 0.0004896516120136415, 'samples': 2995776, 'steps': 15602, 'loss/train': 1.4900071620941162} -08/30/2021 16:03:48 - INFO - __main__ - Step 15604: {'lr': 0.0004896501009469896, 'samples': 2995968, 'steps': 15603, 'loss/train': 1.9007580280303955} -08/30/2021 16:03:50 - INFO - __main__ - Step 15605: {'lr': 0.0004896485897723552, 'samples': 2996160, 'steps': 15604, 'loss/train': 1.6240850687026978} -08/30/2021 16:03:50 - INFO - __main__ - Step 15606: {'lr': 0.0004896470784897388, 'samples': 2996352, 'steps': 15605, 'loss/train': 1.648932933807373} -08/30/2021 16:03:50 - INFO - __main__ - Step 15607: {'lr': 0.0004896455670991411, 'samples': 2996544, 'steps': 15606, 'loss/train': 2.3295695781707764} -08/30/2021 16:03:51 - INFO - __main__ - Step 15608: {'lr': 0.0004896440556005628, 'samples': 2996736, 'steps': 15607, 'loss/train': 1.33921480178833} -08/30/2021 16:03:51 - INFO - __main__ - Step 15609: {'lr': 0.0004896425439940047, 'samples': 2996928, 'steps': 15608, 'loss/train': 2.26648211479187} -08/30/2021 16:03:52 - INFO - __main__ - Step 15610: {'lr': 0.0004896410322794673, 'samples': 2997120, 'steps': 15609, 'loss/train': 2.101055145263672} -08/30/2021 16:03:53 - INFO - __main__ - Step 15611: {'lr': 0.0004896395204569512, 'samples': 2997312, 'steps': 15610, 'loss/train': 1.5403823852539062} -08/30/2021 16:03:54 - INFO - __main__ - Step 15612: {'lr': 0.0004896380085264573, 'samples': 2997504, 'steps': 15611, 'loss/train': 1.9643793106079102} -08/30/2021 16:03:54 - INFO - __main__ - Step 15613: {'lr': 0.0004896364964879864, 'samples': 2997696, 'steps': 15612, 'loss/train': 1.3354697227478027} -08/30/2021 16:03:54 - INFO - __main__ - Step 15614: {'lr': 0.0004896349843415389, 'samples': 2997888, 'steps': 15613, 'loss/train': 1.8205819129943848} -08/30/2021 16:03:55 - INFO - __main__ - Step 15615: {'lr': 0.0004896334720871156, 'samples': 2998080, 'steps': 15614, 'loss/train': 1.1578238010406494} -08/30/2021 16:03:57 - INFO - __main__ - Step 15616: {'lr': 0.0004896319597247169, 'samples': 2998272, 'steps': 15615, 'loss/train': 1.310843586921692} -08/30/2021 16:03:57 - INFO - __main__ - Step 15617: {'lr': 0.0004896304472543439, 'samples': 2998464, 'steps': 15616, 'loss/train': 1.4455901384353638} -08/30/2021 16:03:57 - INFO - __main__ - Step 15618: {'lr': 0.0004896289346759973, 'samples': 2998656, 'steps': 15617, 'loss/train': 2.1688995361328125} -08/30/2021 16:03:58 - INFO - __main__ - Step 15619: {'lr': 0.0004896274219896773, 'samples': 2998848, 'steps': 15618, 'loss/train': 1.1482386589050293} -08/30/2021 16:03:58 - INFO - __main__ - Step 15620: {'lr': 0.000489625909195385, 'samples': 2999040, 'steps': 15619, 'loss/train': 1.9774795770645142} -08/30/2021 16:04:00 - INFO - __main__ - Step 15621: {'lr': 0.0004896243962931211, 'samples': 2999232, 'steps': 15620, 'loss/train': 1.5860469341278076} -08/30/2021 16:04:01 - INFO - __main__ - Step 15622: {'lr': 0.0004896228832828861, 'samples': 2999424, 'steps': 15621, 'loss/train': 1.7794502973556519} -08/30/2021 16:04:01 - INFO - __main__ - Step 15623: {'lr': 0.0004896213701646806, 'samples': 2999616, 'steps': 15622, 'loss/train': 1.5514764785766602} -08/30/2021 16:04:01 - INFO - __main__ - Step 15624: {'lr': 0.0004896198569385055, 'samples': 2999808, 'steps': 15623, 'loss/train': 1.6653560400009155} -08/30/2021 16:04:02 - INFO - __main__ - Step 15625: {'lr': 0.0004896183436043613, 'samples': 3000000, 'steps': 15624, 'loss/train': 1.218605875968933} -08/30/2021 16:04:03 - INFO - __main__ - Step 15626: {'lr': 0.0004896168301622488, 'samples': 3000192, 'steps': 15625, 'loss/train': 1.5329443216323853} -08/30/2021 16:04:04 - INFO - __main__ - Step 15627: {'lr': 0.0004896153166121688, 'samples': 3000384, 'steps': 15626, 'loss/train': 2.0231528282165527} -08/30/2021 16:04:04 - INFO - __main__ - Step 15628: {'lr': 0.0004896138029541217, 'samples': 3000576, 'steps': 15627, 'loss/train': 2.0275752544403076} -08/30/2021 16:04:04 - INFO - __main__ - Step 15629: {'lr': 0.0004896122891881083, 'samples': 3000768, 'steps': 15628, 'loss/train': 1.9274102449417114} -08/30/2021 16:04:05 - INFO - __main__ - Step 15630: {'lr': 0.0004896107753141293, 'samples': 3000960, 'steps': 15629, 'loss/train': 1.6786177158355713} -08/30/2021 16:04:06 - INFO - __main__ - Step 15631: {'lr': 0.0004896092613321854, 'samples': 3001152, 'steps': 15630, 'loss/train': 1.7088583707809448} -08/30/2021 16:04:07 - INFO - __main__ - Step 15632: {'lr': 0.0004896077472422773, 'samples': 3001344, 'steps': 15631, 'loss/train': 1.5837279558181763} -08/30/2021 16:04:07 - INFO - __main__ - Step 15633: {'lr': 0.0004896062330444057, 'samples': 3001536, 'steps': 15632, 'loss/train': 1.5668208599090576} -08/30/2021 16:04:07 - INFO - __main__ - Step 15634: {'lr': 0.0004896047187385711, 'samples': 3001728, 'steps': 15633, 'loss/train': 1.3298778533935547} -08/30/2021 16:04:08 - INFO - __main__ - Step 15635: {'lr': 0.0004896032043247744, 'samples': 3001920, 'steps': 15634, 'loss/train': 1.4978915452957153} -08/30/2021 16:04:09 - INFO - __main__ - Step 15636: {'lr': 0.0004896016898030161, 'samples': 3002112, 'steps': 15635, 'loss/train': 1.8773466348648071} -08/30/2021 16:04:09 - INFO - __main__ - Step 15637: {'lr': 0.0004896001751732971, 'samples': 3002304, 'steps': 15636, 'loss/train': 1.8856909275054932} -08/30/2021 16:04:10 - INFO - __main__ - Step 15638: {'lr': 0.0004895986604356178, 'samples': 3002496, 'steps': 15637, 'loss/train': 1.6762871742248535} -08/30/2021 16:04:10 - INFO - __main__ - Step 15639: {'lr': 0.0004895971455899792, 'samples': 3002688, 'steps': 15638, 'loss/train': 1.5342628955841064} -08/30/2021 16:04:10 - INFO - __main__ - Step 15640: {'lr': 0.0004895956306363818, 'samples': 3002880, 'steps': 15639, 'loss/train': 2.096414804458618} -08/30/2021 16:04:11 - INFO - __main__ - Step 15641: {'lr': 0.0004895941155748263, 'samples': 3003072, 'steps': 15640, 'loss/train': 1.8845845460891724} -08/30/2021 16:04:12 - INFO - __main__ - Step 15642: {'lr': 0.0004895926004053133, 'samples': 3003264, 'steps': 15641, 'loss/train': 1.309841275215149} -08/30/2021 16:04:13 - INFO - __main__ - Step 15643: {'lr': 0.0004895910851278436, 'samples': 3003456, 'steps': 15642, 'loss/train': 1.4342775344848633} -08/30/2021 16:04:13 - INFO - __main__ - Step 15644: {'lr': 0.0004895895697424179, 'samples': 3003648, 'steps': 15643, 'loss/train': 1.3895652294158936} -08/30/2021 16:04:14 - INFO - __main__ - Step 15645: {'lr': 0.0004895880542490369, 'samples': 3003840, 'steps': 15644, 'loss/train': 1.7355033159255981} -08/30/2021 16:04:14 - INFO - __main__ - Step 15646: {'lr': 0.0004895865386477011, 'samples': 3004032, 'steps': 15645, 'loss/train': 1.8758642673492432} -08/30/2021 16:04:15 - INFO - __main__ - Step 15647: {'lr': 0.0004895850229384113, 'samples': 3004224, 'steps': 15646, 'loss/train': 1.4401111602783203} -08/30/2021 16:04:16 - INFO - __main__ - Step 15648: {'lr': 0.0004895835071211682, 'samples': 3004416, 'steps': 15647, 'loss/train': 1.859441876411438} -08/30/2021 16:04:16 - INFO - __main__ - Step 15649: {'lr': 0.0004895819911959725, 'samples': 3004608, 'steps': 15648, 'loss/train': 1.9605817794799805} -08/30/2021 16:04:16 - INFO - __main__ - Step 15650: {'lr': 0.0004895804751628249, 'samples': 3004800, 'steps': 15649, 'loss/train': 2.3211185932159424} -08/30/2021 16:04:17 - INFO - __main__ - Step 15651: {'lr': 0.0004895789590217259, 'samples': 3004992, 'steps': 15650, 'loss/train': 1.648622751235962} -08/30/2021 16:04:18 - INFO - __main__ - Step 15652: {'lr': 0.0004895774427726764, 'samples': 3005184, 'steps': 15651, 'loss/train': 1.631855845451355} -08/30/2021 16:04:19 - INFO - __main__ - Step 15653: {'lr': 0.000489575926415677, 'samples': 3005376, 'steps': 15652, 'loss/train': 1.496962070465088} -08/30/2021 16:04:19 - INFO - __main__ - Step 15654: {'lr': 0.0004895744099507284, 'samples': 3005568, 'steps': 15653, 'loss/train': 1.2107460498809814} -08/30/2021 16:04:20 - INFO - __main__ - Step 15655: {'lr': 0.0004895728933778313, 'samples': 3005760, 'steps': 15654, 'loss/train': 1.797992467880249} -08/30/2021 16:04:20 - INFO - __main__ - Step 15656: {'lr': 0.0004895713766969863, 'samples': 3005952, 'steps': 15655, 'loss/train': 1.4545979499816895} -08/30/2021 16:04:21 - INFO - __main__ - Step 15657: {'lr': 0.0004895698599081942, 'samples': 3006144, 'steps': 15656, 'loss/train': 1.5968542098999023} -08/30/2021 16:04:22 - INFO - __main__ - Step 15658: {'lr': 0.0004895683430114555, 'samples': 3006336, 'steps': 15657, 'loss/train': 3.075434923171997} -08/30/2021 16:04:22 - INFO - __main__ - Step 15659: {'lr': 0.0004895668260067711, 'samples': 3006528, 'steps': 15658, 'loss/train': 1.7385143041610718} -08/30/2021 16:04:23 - INFO - __main__ - Step 15660: {'lr': 0.0004895653088941416, 'samples': 3006720, 'steps': 15659, 'loss/train': 1.9182649850845337} -08/30/2021 16:04:23 - INFO - __main__ - Step 15661: {'lr': 0.0004895637916735675, 'samples': 3006912, 'steps': 15660, 'loss/train': 1.7979016304016113} -08/30/2021 16:04:25 - INFO - __main__ - Step 15662: {'lr': 0.0004895622743450497, 'samples': 3007104, 'steps': 15661, 'loss/train': 1.7512699365615845} -08/30/2021 16:04:25 - INFO - __main__ - Step 15663: {'lr': 0.000489560756908589, 'samples': 3007296, 'steps': 15662, 'loss/train': 0.8430560827255249} -08/30/2021 16:04:25 - INFO - __main__ - Step 15664: {'lr': 0.0004895592393641858, 'samples': 3007488, 'steps': 15663, 'loss/train': 1.425565242767334} -08/30/2021 16:04:26 - INFO - __main__ - Step 15665: {'lr': 0.0004895577217118408, 'samples': 3007680, 'steps': 15664, 'loss/train': 1.679845929145813} -08/30/2021 16:04:26 - INFO - __main__ - Step 15666: {'lr': 0.000489556203951555, 'samples': 3007872, 'steps': 15665, 'loss/train': 1.8205928802490234} -08/30/2021 16:04:26 - INFO - __main__ - Step 15667: {'lr': 0.0004895546860833287, 'samples': 3008064, 'steps': 15666, 'loss/train': 1.5674464702606201} -08/30/2021 16:04:28 - INFO - __main__ - Step 15668: {'lr': 0.000489553168107163, 'samples': 3008256, 'steps': 15667, 'loss/train': 2.0820534229278564} -08/30/2021 16:04:29 - INFO - __main__ - Step 15669: {'lr': 0.0004895516500230581, 'samples': 3008448, 'steps': 15668, 'loss/train': 1.8909108638763428} -08/30/2021 16:04:29 - INFO - __main__ - Step 15670: {'lr': 0.000489550131831015, 'samples': 3008640, 'steps': 15669, 'loss/train': 1.6744166612625122} -08/30/2021 16:04:29 - INFO - __main__ - Step 15671: {'lr': 0.0004895486135310343, 'samples': 3008832, 'steps': 15670, 'loss/train': 1.5791500806808472} -08/30/2021 16:04:30 - INFO - __main__ - Step 15672: {'lr': 0.0004895470951231166, 'samples': 3009024, 'steps': 15671, 'loss/train': 1.5914665460586548} -08/30/2021 16:04:31 - INFO - __main__ - Step 15673: {'lr': 0.0004895455766072629, 'samples': 3009216, 'steps': 15672, 'loss/train': 0.410793662071228} -08/30/2021 16:04:32 - INFO - __main__ - Step 15674: {'lr': 0.0004895440579834736, 'samples': 3009408, 'steps': 15673, 'loss/train': 1.7942060232162476} -08/30/2021 16:04:32 - INFO - __main__ - Step 15675: {'lr': 0.0004895425392517493, 'samples': 3009600, 'steps': 15674, 'loss/train': 1.6709843873977661} -08/30/2021 16:04:32 - INFO - __main__ - Step 15676: {'lr': 0.0004895410204120909, 'samples': 3009792, 'steps': 15675, 'loss/train': 1.6655640602111816} -08/30/2021 16:04:33 - INFO - __main__ - Step 15677: {'lr': 0.000489539501464499, 'samples': 3009984, 'steps': 15676, 'loss/train': 1.4968088865280151} -08/30/2021 16:04:35 - INFO - __main__ - Step 15678: {'lr': 0.0004895379824089743, 'samples': 3010176, 'steps': 15677, 'loss/train': 2.078408718109131} -08/30/2021 16:04:35 - INFO - __main__ - Step 15679: {'lr': 0.0004895364632455175, 'samples': 3010368, 'steps': 15678, 'loss/train': 1.7145956754684448} -08/30/2021 16:04:36 - INFO - __main__ - Step 15680: {'lr': 0.0004895349439741292, 'samples': 3010560, 'steps': 15679, 'loss/train': 2.807765483856201} -08/30/2021 16:04:36 - INFO - __main__ - Step 15681: {'lr': 0.0004895334245948103, 'samples': 3010752, 'steps': 15680, 'loss/train': 2.011272430419922} -08/30/2021 16:04:36 - INFO - __main__ - Step 15682: {'lr': 0.0004895319051075612, 'samples': 3010944, 'steps': 15681, 'loss/train': 1.902477741241455} -08/30/2021 16:04:38 - INFO - __main__ - Step 15683: {'lr': 0.0004895303855123828, 'samples': 3011136, 'steps': 15682, 'loss/train': 1.9463393688201904} -08/30/2021 16:04:38 - INFO - __main__ - Step 15684: {'lr': 0.0004895288658092757, 'samples': 3011328, 'steps': 15683, 'loss/train': 1.6282411813735962} -08/30/2021 16:04:39 - INFO - __main__ - Step 15685: {'lr': 0.0004895273459982406, 'samples': 3011520, 'steps': 15684, 'loss/train': 1.6483428478240967} -08/30/2021 16:04:39 - INFO - __main__ - Step 15686: {'lr': 0.0004895258260792781, 'samples': 3011712, 'steps': 15685, 'loss/train': 1.8689420223236084} -08/30/2021 16:04:39 - INFO - __main__ - Step 15687: {'lr': 0.0004895243060523889, 'samples': 3011904, 'steps': 15686, 'loss/train': 1.473405122756958} -08/30/2021 16:04:41 - INFO - __main__ - Step 15688: {'lr': 0.0004895227859175739, 'samples': 3012096, 'steps': 15687, 'loss/train': 1.5170730352401733} -08/30/2021 16:04:42 - INFO - __main__ - Step 15689: {'lr': 0.0004895212656748336, 'samples': 3012288, 'steps': 15688, 'loss/train': 0.24248376488685608} -08/30/2021 16:04:42 - INFO - __main__ - Step 15690: {'lr': 0.0004895197453241687, 'samples': 3012480, 'steps': 15689, 'loss/train': 2.572460174560547} -08/30/2021 16:04:43 - INFO - __main__ - Step 15691: {'lr': 0.0004895182248655798, 'samples': 3012672, 'steps': 15690, 'loss/train': 1.790162205696106} -08/30/2021 16:04:43 - INFO - __main__ - Step 15692: {'lr': 0.0004895167042990678, 'samples': 3012864, 'steps': 15691, 'loss/train': 1.0607959032058716} -08/30/2021 16:04:44 - INFO - __main__ - Step 15693: {'lr': 0.0004895151836246332, 'samples': 3013056, 'steps': 15692, 'loss/train': 1.7529367208480835} -08/30/2021 16:04:45 - INFO - __main__ - Step 15694: {'lr': 0.0004895136628422767, 'samples': 3013248, 'steps': 15693, 'loss/train': 1.3572545051574707} -08/30/2021 16:04:45 - INFO - __main__ - Step 15695: {'lr': 0.0004895121419519992, 'samples': 3013440, 'steps': 15694, 'loss/train': 1.9496676921844482} -08/30/2021 16:04:45 - INFO - __main__ - Step 15696: {'lr': 0.0004895106209538011, 'samples': 3013632, 'steps': 15695, 'loss/train': 1.5155653953552246} -08/30/2021 16:04:46 - INFO - __main__ - Step 15697: {'lr': 0.0004895090998476833, 'samples': 3013824, 'steps': 15696, 'loss/train': 1.7715060710906982} -08/30/2021 16:04:47 - INFO - __main__ - Step 15698: {'lr': 0.0004895075786336463, 'samples': 3014016, 'steps': 15697, 'loss/train': 2.041308879852295} -08/30/2021 16:04:48 - INFO - __main__ - Step 15699: {'lr': 0.000489506057311691, 'samples': 3014208, 'steps': 15698, 'loss/train': 1.2994133234024048} -08/30/2021 16:04:48 - INFO - __main__ - Step 15700: {'lr': 0.0004895045358818179, 'samples': 3014400, 'steps': 15699, 'loss/train': 1.5458451509475708} -08/30/2021 16:04:48 - INFO - __main__ - Step 15701: {'lr': 0.0004895030143440278, 'samples': 3014592, 'steps': 15700, 'loss/train': 2.004124164581299} -08/30/2021 16:04:49 - INFO - __main__ - Step 15702: {'lr': 0.0004895014926983212, 'samples': 3014784, 'steps': 15701, 'loss/train': 1.2008405923843384} -08/30/2021 16:04:49 - INFO - __main__ - Step 15703: {'lr': 0.0004894999709446991, 'samples': 3014976, 'steps': 15702, 'loss/train': 1.6882003545761108} -08/30/2021 16:04:51 - INFO - __main__ - Step 15704: {'lr': 0.0004894984490831619, 'samples': 3015168, 'steps': 15703, 'loss/train': 1.5917606353759766} -08/30/2021 16:04:51 - INFO - __main__ - Step 15705: {'lr': 0.0004894969271137104, 'samples': 3015360, 'steps': 15704, 'loss/train': 0.23126155138015747} -08/30/2021 16:04:52 - INFO - __main__ - Step 15706: {'lr': 0.0004894954050363452, 'samples': 3015552, 'steps': 15705, 'loss/train': 1.0706652402877808} -08/30/2021 16:04:52 - INFO - __main__ - Step 15707: {'lr': 0.0004894938828510672, 'samples': 3015744, 'steps': 15706, 'loss/train': 1.2698158025741577} -08/30/2021 16:04:53 - INFO - __main__ - Step 15708: {'lr': 0.000489492360557877, 'samples': 3015936, 'steps': 15707, 'loss/train': 0.8350092768669128} -08/30/2021 16:04:53 - INFO - __main__ - Step 15709: {'lr': 0.0004894908381567751, 'samples': 3016128, 'steps': 15708, 'loss/train': 2.3612992763519287} -08/30/2021 16:04:54 - INFO - __main__ - Step 15710: {'lr': 0.0004894893156477623, 'samples': 3016320, 'steps': 15709, 'loss/train': 1.7201426029205322} -08/30/2021 16:04:55 - INFO - __main__ - Step 15711: {'lr': 0.0004894877930308395, 'samples': 3016512, 'steps': 15710, 'loss/train': 1.4212003946304321} -08/30/2021 16:04:55 - INFO - __main__ - Step 15712: {'lr': 0.0004894862703060071, 'samples': 3016704, 'steps': 15711, 'loss/train': 2.0885603427886963} -08/30/2021 16:04:55 - INFO - __main__ - Step 15713: {'lr': 0.0004894847474732658, 'samples': 3016896, 'steps': 15712, 'loss/train': 2.1898651123046875} -08/30/2021 16:04:56 - INFO - __main__ - Step 15714: {'lr': 0.0004894832245326165, 'samples': 3017088, 'steps': 15713, 'loss/train': 1.267521619796753} -08/30/2021 16:04:57 - INFO - __main__ - Step 15715: {'lr': 0.0004894817014840597, 'samples': 3017280, 'steps': 15714, 'loss/train': 1.5059354305267334} -08/30/2021 16:04:58 - INFO - __main__ - Step 15716: {'lr': 0.0004894801783275961, 'samples': 3017472, 'steps': 15715, 'loss/train': 1.5661461353302002} -08/30/2021 16:04:58 - INFO - __main__ - Step 15717: {'lr': 0.0004894786550632264, 'samples': 3017664, 'steps': 15716, 'loss/train': 1.3200610876083374} -08/30/2021 16:04:58 - INFO - __main__ - Step 15718: {'lr': 0.0004894771316909514, 'samples': 3017856, 'steps': 15717, 'loss/train': 1.5051206350326538} -08/30/2021 16:04:59 - INFO - __main__ - Step 15719: {'lr': 0.0004894756082107717, 'samples': 3018048, 'steps': 15718, 'loss/train': 1.4719260931015015} -08/30/2021 16:05:00 - INFO - __main__ - Step 15720: {'lr': 0.0004894740846226879, 'samples': 3018240, 'steps': 15719, 'loss/train': 1.7230294942855835} -08/30/2021 16:05:01 - INFO - __main__ - Step 15721: {'lr': 0.0004894725609267009, 'samples': 3018432, 'steps': 15720, 'loss/train': 1.6836109161376953} -08/30/2021 16:05:01 - INFO - __main__ - Step 15722: {'lr': 0.0004894710371228111, 'samples': 3018624, 'steps': 15721, 'loss/train': 2.2346858978271484} -08/30/2021 16:05:02 - INFO - __main__ - Step 15723: {'lr': 0.0004894695132110196, 'samples': 3018816, 'steps': 15722, 'loss/train': 1.240833044052124} -08/30/2021 16:05:02 - INFO - __main__ - Step 15724: {'lr': 0.0004894679891913266, 'samples': 3019008, 'steps': 15723, 'loss/train': 1.9928617477416992} -08/30/2021 16:05:02 - INFO - __main__ - Step 15725: {'lr': 0.000489466465063733, 'samples': 3019200, 'steps': 15724, 'loss/train': 1.71743905544281} -08/30/2021 16:05:04 - INFO - __main__ - Step 15726: {'lr': 0.0004894649408282396, 'samples': 3019392, 'steps': 15725, 'loss/train': 1.3347309827804565} -08/30/2021 16:05:04 - INFO - __main__ - Step 15727: {'lr': 0.000489463416484847, 'samples': 3019584, 'steps': 15726, 'loss/train': 2.6286916732788086} -08/30/2021 16:05:05 - INFO - __main__ - Step 15728: {'lr': 0.0004894618920335558, 'samples': 3019776, 'steps': 15727, 'loss/train': 1.3679033517837524} -08/30/2021 16:05:05 - INFO - __main__ - Step 15729: {'lr': 0.0004894603674743668, 'samples': 3019968, 'steps': 15728, 'loss/train': 1.9781831502914429} -08/30/2021 16:05:05 - INFO - __main__ - Step 15730: {'lr': 0.0004894588428072808, 'samples': 3020160, 'steps': 15729, 'loss/train': 2.1462972164154053} -08/30/2021 16:05:07 - INFO - __main__ - Step 15731: {'lr': 0.0004894573180322982, 'samples': 3020352, 'steps': 15730, 'loss/train': 1.7896645069122314} -08/30/2021 16:05:08 - INFO - __main__ - Step 15732: {'lr': 0.0004894557931494199, 'samples': 3020544, 'steps': 15731, 'loss/train': 1.843048334121704} -08/30/2021 16:05:08 - INFO - __main__ - Step 15733: {'lr': 0.0004894542681586465, 'samples': 3020736, 'steps': 15732, 'loss/train': 1.7974251508712769} -08/30/2021 16:05:09 - INFO - __main__ - Step 15734: {'lr': 0.0004894527430599786, 'samples': 3020928, 'steps': 15733, 'loss/train': 1.9471001625061035} -08/30/2021 16:05:09 - INFO - __main__ - Step 15735: {'lr': 0.0004894512178534171, 'samples': 3021120, 'steps': 15734, 'loss/train': 1.8450522422790527} -08/30/2021 16:05:10 - INFO - __main__ - Step 15736: {'lr': 0.0004894496925389625, 'samples': 3021312, 'steps': 15735, 'loss/train': 1.952476143836975} -08/30/2021 16:05:11 - INFO - __main__ - Step 15737: {'lr': 0.0004894481671166155, 'samples': 3021504, 'steps': 15736, 'loss/train': 1.9185781478881836} -08/30/2021 16:05:11 - INFO - __main__ - Step 15738: {'lr': 0.0004894466415863771, 'samples': 3021696, 'steps': 15737, 'loss/train': 1.8842803239822388} -08/30/2021 16:05:12 - INFO - __main__ - Step 15739: {'lr': 0.0004894451159482476, 'samples': 3021888, 'steps': 15738, 'loss/train': 1.6598477363586426} -08/30/2021 16:05:12 - INFO - __main__ - Step 15740: {'lr': 0.0004894435902022277, 'samples': 3022080, 'steps': 15739, 'loss/train': 2.236760139465332} -08/30/2021 16:05:14 - INFO - __main__ - Step 15741: {'lr': 0.0004894420643483184, 'samples': 3022272, 'steps': 15740, 'loss/train': 1.7471964359283447} -08/30/2021 16:05:14 - INFO - __main__ - Step 15742: {'lr': 0.0004894405383865201, 'samples': 3022464, 'steps': 15741, 'loss/train': 1.1105577945709229} -08/30/2021 16:05:15 - INFO - __main__ - Step 15743: {'lr': 0.0004894390123168337, 'samples': 3022656, 'steps': 15742, 'loss/train': 1.852920413017273} -08/30/2021 16:05:15 - INFO - __main__ - Step 15744: {'lr': 0.0004894374861392596, 'samples': 3022848, 'steps': 15743, 'loss/train': 1.7588038444519043} -08/30/2021 16:05:15 - INFO - __main__ - Step 15745: {'lr': 0.0004894359598537987, 'samples': 3023040, 'steps': 15744, 'loss/train': 1.2188833951950073} -08/30/2021 16:05:17 - INFO - __main__ - Step 15746: {'lr': 0.0004894344334604517, 'samples': 3023232, 'steps': 15745, 'loss/train': 1.872450590133667} -08/30/2021 16:05:17 - INFO - __main__ - Step 15747: {'lr': 0.0004894329069592192, 'samples': 3023424, 'steps': 15746, 'loss/train': 1.7818655967712402} -08/30/2021 16:05:18 - INFO - __main__ - Step 15748: {'lr': 0.000489431380350102, 'samples': 3023616, 'steps': 15747, 'loss/train': 1.5086807012557983} -08/30/2021 16:05:18 - INFO - __main__ - Step 15749: {'lr': 0.0004894298536331007, 'samples': 3023808, 'steps': 15748, 'loss/train': 1.1315829753875732} -08/30/2021 16:05:18 - INFO - __main__ - Step 15750: {'lr': 0.000489428326808216, 'samples': 3024000, 'steps': 15749, 'loss/train': 1.984466314315796} -08/30/2021 16:05:20 - INFO - __main__ - Step 15751: {'lr': 0.0004894267998754486, 'samples': 3024192, 'steps': 15750, 'loss/train': 2.230523109436035} -08/30/2021 16:05:20 - INFO - __main__ - Step 15752: {'lr': 0.0004894252728347992, 'samples': 3024384, 'steps': 15751, 'loss/train': 1.0668296813964844} -08/30/2021 16:05:21 - INFO - __main__ - Step 15753: {'lr': 0.0004894237456862684, 'samples': 3024576, 'steps': 15752, 'loss/train': 2.916994333267212} -08/30/2021 16:05:21 - INFO - __main__ - Step 15754: {'lr': 0.000489422218429857, 'samples': 3024768, 'steps': 15753, 'loss/train': 1.766281247138977} -08/30/2021 16:05:21 - INFO - __main__ - Step 15755: {'lr': 0.0004894206910655656, 'samples': 3024960, 'steps': 15754, 'loss/train': 2.572554349899292} -08/30/2021 16:05:23 - INFO - __main__ - Step 15756: {'lr': 0.0004894191635933949, 'samples': 3025152, 'steps': 15755, 'loss/train': 1.671134114265442} -08/30/2021 16:05:23 - INFO - __main__ - Step 15757: {'lr': 0.0004894176360133456, 'samples': 3025344, 'steps': 15756, 'loss/train': 1.7096961736679077} -08/30/2021 16:05:24 - INFO - __main__ - Step 15758: {'lr': 0.0004894161083254186, 'samples': 3025536, 'steps': 15757, 'loss/train': 1.6784322261810303} -08/30/2021 16:05:24 - INFO - __main__ - Step 15759: {'lr': 0.0004894145805296143, 'samples': 3025728, 'steps': 15758, 'loss/train': 2.076785087585449} -08/30/2021 16:05:24 - INFO - __main__ - Step 15760: {'lr': 0.0004894130526259334, 'samples': 3025920, 'steps': 15759, 'loss/train': 1.7659324407577515} -08/30/2021 16:05:26 - INFO - __main__ - Step 15761: {'lr': 0.0004894115246143768, 'samples': 3026112, 'steps': 15760, 'loss/train': 0.3448126018047333} -08/30/2021 16:05:26 - INFO - __main__ - Step 15762: {'lr': 0.0004894099964949449, 'samples': 3026304, 'steps': 15761, 'loss/train': 2.420470714569092} -08/30/2021 16:05:27 - INFO - __main__ - Step 15763: {'lr': 0.0004894084682676387, 'samples': 3026496, 'steps': 15762, 'loss/train': 2.1055173873901367} -08/30/2021 16:05:27 - INFO - __main__ - Step 15764: {'lr': 0.0004894069399324586, 'samples': 3026688, 'steps': 15763, 'loss/train': 1.9874101877212524} -08/30/2021 16:05:27 - INFO - __main__ - Step 15765: {'lr': 0.0004894054114894055, 'samples': 3026880, 'steps': 15764, 'loss/train': 1.9154988527297974} -08/30/2021 16:05:28 - INFO - __main__ - Step 15766: {'lr': 0.00048940388293848, 'samples': 3027072, 'steps': 15765, 'loss/train': 1.456554889678955} -08/30/2021 16:05:29 - INFO - __main__ - Step 15767: {'lr': 0.000489402354279683, 'samples': 3027264, 'steps': 15766, 'loss/train': 1.8956642150878906} -08/30/2021 16:05:30 - INFO - __main__ - Step 15768: {'lr': 0.0004894008255130147, 'samples': 3027456, 'steps': 15767, 'loss/train': 1.8803777694702148} -08/30/2021 16:05:30 - INFO - __main__ - Step 15769: {'lr': 0.0004893992966384762, 'samples': 3027648, 'steps': 15768, 'loss/train': 1.9418342113494873} -08/30/2021 16:05:30 - INFO - __main__ - Step 15770: {'lr': 0.0004893977676560682, 'samples': 3027840, 'steps': 15769, 'loss/train': 1.8949304819107056} -08/30/2021 16:05:31 - INFO - __main__ - Step 15771: {'lr': 0.000489396238565791, 'samples': 3028032, 'steps': 15770, 'loss/train': 0.8951969146728516} -08/30/2021 16:05:32 - INFO - __main__ - Step 15772: {'lr': 0.0004893947093676458, 'samples': 3028224, 'steps': 15771, 'loss/train': 1.8372505903244019} -08/30/2021 16:05:33 - INFO - __main__ - Step 15773: {'lr': 0.0004893931800616329, 'samples': 3028416, 'steps': 15772, 'loss/train': 2.0663514137268066} -08/30/2021 16:05:33 - INFO - __main__ - Step 15774: {'lr': 0.0004893916506477532, 'samples': 3028608, 'steps': 15773, 'loss/train': 1.3187042474746704} -08/30/2021 16:05:33 - INFO - __main__ - Step 15775: {'lr': 0.0004893901211260073, 'samples': 3028800, 'steps': 15774, 'loss/train': 2.269486665725708} -08/30/2021 16:05:34 - INFO - __main__ - Step 15776: {'lr': 0.0004893885914963958, 'samples': 3028992, 'steps': 15775, 'loss/train': 1.5242422819137573} -08/30/2021 16:05:35 - INFO - __main__ - Step 15777: {'lr': 0.0004893870617589196, 'samples': 3029184, 'steps': 15776, 'loss/train': 1.0224928855895996} -08/30/2021 16:05:36 - INFO - __main__ - Step 15778: {'lr': 0.0004893855319135791, 'samples': 3029376, 'steps': 15777, 'loss/train': 1.6880754232406616} -08/30/2021 16:05:36 - INFO - __main__ - Step 15779: {'lr': 0.0004893840019603754, 'samples': 3029568, 'steps': 15778, 'loss/train': 1.4016624689102173} -08/30/2021 16:05:36 - INFO - __main__ - Step 15780: {'lr': 0.0004893824718993088, 'samples': 3029760, 'steps': 15779, 'loss/train': 1.8057093620300293} -08/30/2021 16:05:37 - INFO - __main__ - Step 15781: {'lr': 0.0004893809417303803, 'samples': 3029952, 'steps': 15780, 'loss/train': 1.8039134740829468} -08/30/2021 16:05:39 - INFO - __main__ - Step 15782: {'lr': 0.0004893794114535905, 'samples': 3030144, 'steps': 15781, 'loss/train': 1.7117946147918701} -08/30/2021 16:05:39 - INFO - __main__ - Step 15783: {'lr': 0.0004893778810689399, 'samples': 3030336, 'steps': 15782, 'loss/train': 1.8342255353927612} -08/30/2021 16:05:39 - INFO - __main__ - Step 15784: {'lr': 0.0004893763505764292, 'samples': 3030528, 'steps': 15783, 'loss/train': 1.4451026916503906} -08/30/2021 16:05:40 - INFO - __main__ - Step 15785: {'lr': 0.0004893748199760594, 'samples': 3030720, 'steps': 15784, 'loss/train': 0.1269480586051941} -08/30/2021 16:05:40 - INFO - __main__ - Step 15786: {'lr': 0.0004893732892678309, 'samples': 3030912, 'steps': 15785, 'loss/train': 1.6834965944290161} -08/30/2021 16:05:40 - INFO - __main__ - Step 15787: {'lr': 0.0004893717584517445, 'samples': 3031104, 'steps': 15786, 'loss/train': 0.7068189978599548} -08/30/2021 16:05:42 - INFO - __main__ - Step 15788: {'lr': 0.000489370227527801, 'samples': 3031296, 'steps': 15787, 'loss/train': 0.6516126990318298} -08/30/2021 16:05:43 - INFO - __main__ - Step 15789: {'lr': 0.0004893686964960009, 'samples': 3031488, 'steps': 15788, 'loss/train': 1.4837327003479004} -08/30/2021 16:05:43 - INFO - __main__ - Step 15790: {'lr': 0.0004893671653563448, 'samples': 3031680, 'steps': 15789, 'loss/train': 2.016655445098877} -08/30/2021 16:05:44 - INFO - __main__ - Step 15791: {'lr': 0.0004893656341088338, 'samples': 3031872, 'steps': 15790, 'loss/train': 1.369646430015564} -08/30/2021 16:05:44 - INFO - __main__ - Step 15792: {'lr': 0.0004893641027534682, 'samples': 3032064, 'steps': 15791, 'loss/train': 1.9633276462554932} -08/30/2021 16:05:46 - INFO - __main__ - Step 15793: {'lr': 0.0004893625712902489, 'samples': 3032256, 'steps': 15792, 'loss/train': 1.4365977048873901} -08/30/2021 16:05:46 - INFO - __main__ - Step 15794: {'lr': 0.0004893610397191764, 'samples': 3032448, 'steps': 15793, 'loss/train': 1.6184943914413452} -08/30/2021 16:05:46 - INFO - __main__ - Step 15795: {'lr': 0.0004893595080402517, 'samples': 3032640, 'steps': 15794, 'loss/train': 1.0569422245025635} -08/30/2021 16:05:47 - INFO - __main__ - Step 15796: {'lr': 0.0004893579762534751, 'samples': 3032832, 'steps': 15795, 'loss/train': 1.966475486755371} -08/30/2021 16:05:47 - INFO - __main__ - Step 15797: {'lr': 0.0004893564443588476, 'samples': 3033024, 'steps': 15796, 'loss/train': 1.7992537021636963} -08/30/2021 16:05:49 - INFO - __main__ - Step 15798: {'lr': 0.0004893549123563697, 'samples': 3033216, 'steps': 15797, 'loss/train': 1.788185477256775} -08/30/2021 16:05:49 - INFO - __main__ - Step 15799: {'lr': 0.0004893533802460422, 'samples': 3033408, 'steps': 15798, 'loss/train': 1.57007896900177} -08/30/2021 16:05:49 - INFO - __main__ - Step 15800: {'lr': 0.0004893518480278658, 'samples': 3033600, 'steps': 15799, 'loss/train': 2.435354232788086} -08/30/2021 16:05:50 - INFO - __main__ - Step 15801: {'lr': 0.0004893503157018412, 'samples': 3033792, 'steps': 15800, 'loss/train': 1.724379301071167} -08/30/2021 16:05:50 - INFO - __main__ - Step 15802: {'lr': 0.000489348783267969, 'samples': 3033984, 'steps': 15801, 'loss/train': 1.6994962692260742} -08/30/2021 16:05:50 - INFO - __main__ - Step 15803: {'lr': 0.0004893472507262499, 'samples': 3034176, 'steps': 15802, 'loss/train': 2.779169797897339} -08/30/2021 16:05:52 - INFO - __main__ - Step 15804: {'lr': 0.0004893457180766846, 'samples': 3034368, 'steps': 15803, 'loss/train': 1.732416033744812} -08/30/2021 16:05:53 - INFO - __main__ - Step 15805: {'lr': 0.0004893441853192739, 'samples': 3034560, 'steps': 15804, 'loss/train': 1.6029468774795532} -08/30/2021 16:05:53 - INFO - __main__ - Step 15806: {'lr': 0.0004893426524540183, 'samples': 3034752, 'steps': 15805, 'loss/train': 2.099090099334717} -08/30/2021 16:05:53 - INFO - __main__ - Step 15807: {'lr': 0.0004893411194809186, 'samples': 3034944, 'steps': 15806, 'loss/train': 1.7839194536209106} -08/30/2021 16:05:54 - INFO - __main__ - Step 15808: {'lr': 0.0004893395863999755, 'samples': 3035136, 'steps': 15807, 'loss/train': 1.5603755712509155} -08/30/2021 16:05:55 - INFO - __main__ - Step 15809: {'lr': 0.0004893380532111898, 'samples': 3035328, 'steps': 15808, 'loss/train': 1.5778244733810425} -08/30/2021 16:05:56 - INFO - __main__ - Step 15810: {'lr': 0.0004893365199145619, 'samples': 3035520, 'steps': 15809, 'loss/train': 1.8768761157989502} -08/30/2021 16:05:56 - INFO - __main__ - Step 15811: {'lr': 0.0004893349865100927, 'samples': 3035712, 'steps': 15810, 'loss/train': 1.9645310640335083} -08/30/2021 16:05:56 - INFO - __main__ - Step 15812: {'lr': 0.0004893334529977828, 'samples': 3035904, 'steps': 15811, 'loss/train': 1.8728632926940918} -08/30/2021 16:05:57 - INFO - __main__ - Step 15813: {'lr': 0.0004893319193776331, 'samples': 3036096, 'steps': 15812, 'loss/train': 1.7371985912322998} -08/30/2021 16:05:58 - INFO - __main__ - Step 15814: {'lr': 0.000489330385649644, 'samples': 3036288, 'steps': 15813, 'loss/train': 1.9565091133117676} -08/30/2021 16:05:59 - INFO - __main__ - Step 15815: {'lr': 0.0004893288518138163, 'samples': 3036480, 'steps': 15814, 'loss/train': 1.8143585920333862} -08/30/2021 16:05:59 - INFO - __main__ - Step 15816: {'lr': 0.0004893273178701508, 'samples': 3036672, 'steps': 15815, 'loss/train': 1.7400017976760864} -08/30/2021 16:05:59 - INFO - __main__ - Step 15817: {'lr': 0.0004893257838186481, 'samples': 3036864, 'steps': 15816, 'loss/train': 2.777813673019409} -08/30/2021 16:06:00 - INFO - __main__ - Step 15818: {'lr': 0.0004893242496593089, 'samples': 3037056, 'steps': 15817, 'loss/train': 2.0366008281707764} -08/30/2021 16:06:01 - INFO - __main__ - Step 15819: {'lr': 0.0004893227153921338, 'samples': 3037248, 'steps': 15818, 'loss/train': 1.7623364925384521} -08/30/2021 16:06:02 - INFO - __main__ - Step 15820: {'lr': 0.0004893211810171237, 'samples': 3037440, 'steps': 15819, 'loss/train': 1.1324254274368286} -08/30/2021 16:06:02 - INFO - __main__ - Step 15821: {'lr': 0.0004893196465342791, 'samples': 3037632, 'steps': 15820, 'loss/train': 2.2985141277313232} -08/30/2021 16:06:02 - INFO - __main__ - Step 15822: {'lr': 0.0004893181119436007, 'samples': 3037824, 'steps': 15821, 'loss/train': 1.7648950815200806} -08/30/2021 16:06:03 - INFO - __main__ - Step 15823: {'lr': 0.0004893165772450893, 'samples': 3038016, 'steps': 15822, 'loss/train': 1.7349241971969604} -08/30/2021 16:06:04 - INFO - __main__ - Step 15824: {'lr': 0.0004893150424387456, 'samples': 3038208, 'steps': 15823, 'loss/train': 1.8271968364715576} -08/30/2021 16:06:05 - INFO - __main__ - Step 15825: {'lr': 0.0004893135075245702, 'samples': 3038400, 'steps': 15824, 'loss/train': 1.7137402296066284} -08/30/2021 16:06:05 - INFO - __main__ - Step 15826: {'lr': 0.0004893119725025639, 'samples': 3038592, 'steps': 15825, 'loss/train': 1.4959312677383423} -08/30/2021 16:06:06 - INFO - __main__ - Step 15827: {'lr': 0.0004893104373727272, 'samples': 3038784, 'steps': 15826, 'loss/train': 1.7496213912963867} -08/30/2021 16:06:06 - INFO - __main__ - Step 15828: {'lr': 0.0004893089021350609, 'samples': 3038976, 'steps': 15827, 'loss/train': 1.48745596408844} -08/30/2021 16:06:07 - INFO - __main__ - Step 15829: {'lr': 0.0004893073667895658, 'samples': 3039168, 'steps': 15828, 'loss/train': 0.20793157815933228} -08/30/2021 16:06:08 - INFO - __main__ - Step 15830: {'lr': 0.0004893058313362424, 'samples': 3039360, 'steps': 15829, 'loss/train': 2.057208776473999} -08/30/2021 16:06:08 - INFO - __main__ - Step 15831: {'lr': 0.0004893042957750916, 'samples': 3039552, 'steps': 15830, 'loss/train': 1.514568567276001} -08/30/2021 16:06:09 - INFO - __main__ - Step 15832: {'lr': 0.0004893027601061138, 'samples': 3039744, 'steps': 15831, 'loss/train': 1.5174131393432617} -08/30/2021 16:06:09 - INFO - __main__ - Step 15833: {'lr': 0.00048930122432931, 'samples': 3039936, 'steps': 15832, 'loss/train': 1.8271756172180176} -08/30/2021 16:06:09 - INFO - __main__ - Step 15834: {'lr': 0.0004892996884446807, 'samples': 3040128, 'steps': 15833, 'loss/train': 1.2590651512145996} -08/30/2021 16:06:11 - INFO - __main__ - Step 15835: {'lr': 0.0004892981524522267, 'samples': 3040320, 'steps': 15834, 'loss/train': 1.8676629066467285} -08/30/2021 16:06:12 - INFO - __main__ - Step 15836: {'lr': 0.0004892966163519487, 'samples': 3040512, 'steps': 15835, 'loss/train': 1.9099675416946411} -08/30/2021 16:06:12 - INFO - __main__ - Step 15837: {'lr': 0.0004892950801438472, 'samples': 3040704, 'steps': 15836, 'loss/train': 1.5653126239776611} -08/30/2021 16:06:12 - INFO - __main__ - Step 15838: {'lr': 0.0004892935438279231, 'samples': 3040896, 'steps': 15837, 'loss/train': 1.9078892469406128} -08/30/2021 16:06:13 - INFO - __main__ - Step 15839: {'lr': 0.0004892920074041771, 'samples': 3041088, 'steps': 15838, 'loss/train': 1.8621835708618164} -08/30/2021 16:06:13 - INFO - __main__ - Step 15840: {'lr': 0.0004892904708726096, 'samples': 3041280, 'steps': 15839, 'loss/train': 1.7209863662719727} -08/30/2021 16:06:15 - INFO - __main__ - Step 15841: {'lr': 0.0004892889342332218, 'samples': 3041472, 'steps': 15840, 'loss/train': 1.2462749481201172} -08/30/2021 16:06:16 - INFO - __main__ - Step 15842: {'lr': 0.000489287397486014, 'samples': 3041664, 'steps': 15841, 'loss/train': 1.5948426723480225} -08/30/2021 16:06:16 - INFO - __main__ - Step 15843: {'lr': 0.0004892858606309868, 'samples': 3041856, 'steps': 15842, 'loss/train': 1.6169359683990479} -08/30/2021 16:06:16 - INFO - __main__ - Step 15844: {'lr': 0.0004892843236681412, 'samples': 3042048, 'steps': 15843, 'loss/train': 1.8096169233322144} -08/30/2021 16:06:17 - INFO - __main__ - Step 15845: {'lr': 0.0004892827865974779, 'samples': 3042240, 'steps': 15844, 'loss/train': 1.927626609802246} -08/30/2021 16:06:18 - INFO - __main__ - Step 15846: {'lr': 0.0004892812494189973, 'samples': 3042432, 'steps': 15845, 'loss/train': 1.567002534866333} -08/30/2021 16:06:19 - INFO - __main__ - Step 15847: {'lr': 0.0004892797121327003, 'samples': 3042624, 'steps': 15846, 'loss/train': 1.6373697519302368} -08/30/2021 16:06:19 - INFO - __main__ - Step 15848: {'lr': 0.0004892781747385876, 'samples': 3042816, 'steps': 15847, 'loss/train': 1.892551064491272} -08/30/2021 16:06:19 - INFO - __main__ - Step 15849: {'lr': 0.0004892766372366598, 'samples': 3043008, 'steps': 15848, 'loss/train': 2.0063562393188477} -08/30/2021 16:06:20 - INFO - __main__ - Step 15850: {'lr': 0.0004892750996269177, 'samples': 3043200, 'steps': 15849, 'loss/train': 2.2678918838500977} -08/30/2021 16:06:21 - INFO - __main__ - Step 15851: {'lr': 0.0004892735619093618, 'samples': 3043392, 'steps': 15850, 'loss/train': 2.7943601608276367} -08/30/2021 16:06:22 - INFO - __main__ - Step 15852: {'lr': 0.0004892720240839931, 'samples': 3043584, 'steps': 15851, 'loss/train': 1.4127070903778076} -08/30/2021 16:06:22 - INFO - __main__ - Step 15853: {'lr': 0.0004892704861508121, 'samples': 3043776, 'steps': 15852, 'loss/train': 2.1591296195983887} -08/30/2021 16:06:22 - INFO - __main__ - Step 15854: {'lr': 0.0004892689481098193, 'samples': 3043968, 'steps': 15853, 'loss/train': 2.0167603492736816} -08/30/2021 16:06:23 - INFO - __main__ - Step 15855: {'lr': 0.0004892674099610158, 'samples': 3044160, 'steps': 15854, 'loss/train': 1.6414259672164917} -08/30/2021 16:06:24 - INFO - __main__ - Step 15856: {'lr': 0.000489265871704402, 'samples': 3044352, 'steps': 15855, 'loss/train': 6.075537204742432} -08/30/2021 16:06:25 - INFO - __main__ - Step 15857: {'lr': 0.0004892643333399788, 'samples': 3044544, 'steps': 15856, 'loss/train': 1.768763780593872} -08/30/2021 16:06:25 - INFO - __main__ - Step 15858: {'lr': 0.0004892627948677467, 'samples': 3044736, 'steps': 15857, 'loss/train': 1.0978754758834839} -08/30/2021 16:06:26 - INFO - __main__ - Step 15859: {'lr': 0.0004892612562877066, 'samples': 3044928, 'steps': 15858, 'loss/train': 2.134469509124756} -08/30/2021 16:06:26 - INFO - __main__ - Step 15860: {'lr': 0.0004892597175998589, 'samples': 3045120, 'steps': 15859, 'loss/train': 2.2281742095947266} -08/30/2021 16:06:26 - INFO - __main__ - Step 15861: {'lr': 0.0004892581788042045, 'samples': 3045312, 'steps': 15860, 'loss/train': 1.843698263168335} -08/30/2021 16:06:28 - INFO - __main__ - Step 15862: {'lr': 0.0004892566399007441, 'samples': 3045504, 'steps': 15861, 'loss/train': 0.2343396246433258} -08/30/2021 16:06:28 - INFO - __main__ - Step 15863: {'lr': 0.0004892551008894784, 'samples': 3045696, 'steps': 15862, 'loss/train': 0.3301844000816345} -08/30/2021 16:06:29 - INFO - __main__ - Step 15864: {'lr': 0.0004892535617704079, 'samples': 3045888, 'steps': 15863, 'loss/train': 1.5133025646209717} -08/30/2021 16:06:29 - INFO - __main__ - Step 15865: {'lr': 0.0004892520225435336, 'samples': 3046080, 'steps': 15864, 'loss/train': 1.9222338199615479} -08/30/2021 16:06:29 - INFO - __main__ - Step 15866: {'lr': 0.000489250483208856, 'samples': 3046272, 'steps': 15865, 'loss/train': 1.7021836042404175} -08/30/2021 16:06:31 - INFO - __main__ - Step 15867: {'lr': 0.0004892489437663758, 'samples': 3046464, 'steps': 15866, 'loss/train': 0.7320907115936279} -08/30/2021 16:06:31 - INFO - __main__ - Step 15868: {'lr': 0.0004892474042160936, 'samples': 3046656, 'steps': 15867, 'loss/train': 2.1231696605682373} -08/30/2021 16:06:32 - INFO - __main__ - Step 15869: {'lr': 0.0004892458645580103, 'samples': 3046848, 'steps': 15868, 'loss/train': 1.857272982597351} -08/30/2021 16:06:32 - INFO - __main__ - Step 15870: {'lr': 0.0004892443247921265, 'samples': 3047040, 'steps': 15869, 'loss/train': 1.4664748907089233} -08/30/2021 16:06:33 - INFO - __main__ - Step 15871: {'lr': 0.0004892427849184428, 'samples': 3047232, 'steps': 15870, 'loss/train': 1.3892543315887451} -08/30/2021 16:06:34 - INFO - __main__ - Step 15872: {'lr': 0.0004892412449369602, 'samples': 3047424, 'steps': 15871, 'loss/train': 0.11538084596395493} -08/30/2021 16:06:34 - INFO - __main__ - Step 15873: {'lr': 0.0004892397048476791, 'samples': 3047616, 'steps': 15872, 'loss/train': 1.4485125541687012} -08/30/2021 16:06:35 - INFO - __main__ - Step 15874: {'lr': 0.0004892381646506002, 'samples': 3047808, 'steps': 15873, 'loss/train': 2.0320661067962646} -08/30/2021 16:06:35 - INFO - __main__ - Step 15875: {'lr': 0.0004892366243457244, 'samples': 3048000, 'steps': 15874, 'loss/train': 1.4326623678207397} -08/30/2021 16:06:36 - INFO - __main__ - Step 15876: {'lr': 0.0004892350839330522, 'samples': 3048192, 'steps': 15875, 'loss/train': 1.6021592617034912} -08/30/2021 16:06:37 - INFO - __main__ - Step 15877: {'lr': 0.0004892335434125844, 'samples': 3048384, 'steps': 15876, 'loss/train': 1.6339194774627686} -08/30/2021 16:06:38 - INFO - __main__ - Step 15878: {'lr': 0.0004892320027843216, 'samples': 3048576, 'steps': 15877, 'loss/train': 1.673117756843567} -08/30/2021 16:06:38 - INFO - __main__ - Step 15879: {'lr': 0.0004892304620482646, 'samples': 3048768, 'steps': 15878, 'loss/train': 1.6826636791229248} -08/30/2021 16:06:38 - INFO - __main__ - Step 15880: {'lr': 0.000489228921204414, 'samples': 3048960, 'steps': 15879, 'loss/train': 1.749036192893982} -08/30/2021 16:06:39 - INFO - __main__ - Step 15881: {'lr': 0.0004892273802527706, 'samples': 3049152, 'steps': 15880, 'loss/train': 0.9491150975227356} -08/30/2021 16:06:40 - INFO - __main__ - Step 15882: {'lr': 0.000489225839193335, 'samples': 3049344, 'steps': 15881, 'loss/train': 2.020514488220215} -08/30/2021 16:06:41 - INFO - __main__ - Step 15883: {'lr': 0.0004892242980261079, 'samples': 3049536, 'steps': 15882, 'loss/train': 1.8321619033813477} -08/30/2021 16:06:41 - INFO - __main__ - Step 15884: {'lr': 0.0004892227567510901, 'samples': 3049728, 'steps': 15883, 'loss/train': 0.1489810347557068} -08/30/2021 16:06:41 - INFO - __main__ - Step 15885: {'lr': 0.0004892212153682822, 'samples': 3049920, 'steps': 15884, 'loss/train': 1.6919065713882446} -08/30/2021 16:06:42 - INFO - __main__ - Step 15886: {'lr': 0.0004892196738776848, 'samples': 3050112, 'steps': 15885, 'loss/train': 1.034507393836975} -08/30/2021 16:06:43 - INFO - __main__ - Step 15887: {'lr': 0.0004892181322792989, 'samples': 3050304, 'steps': 15886, 'loss/train': 1.7606680393218994} -08/30/2021 16:06:44 - INFO - __main__ - Step 15888: {'lr': 0.0004892165905731248, 'samples': 3050496, 'steps': 15887, 'loss/train': 1.3945250511169434} -08/30/2021 16:06:44 - INFO - __main__ - Step 15889: {'lr': 0.0004892150487591635, 'samples': 3050688, 'steps': 15888, 'loss/train': 1.6292153596878052} -08/30/2021 16:06:44 - INFO - __main__ - Step 15890: {'lr': 0.0004892135068374156, 'samples': 3050880, 'steps': 15889, 'loss/train': 1.4689536094665527} -08/30/2021 16:06:45 - INFO - __main__ - Step 15891: {'lr': 0.0004892119648078817, 'samples': 3051072, 'steps': 15890, 'loss/train': 1.9595842361450195} -08/30/2021 16:06:47 - INFO - __main__ - Step 15892: {'lr': 0.0004892104226705627, 'samples': 3051264, 'steps': 15891, 'loss/train': 1.322706937789917} -08/30/2021 16:06:47 - INFO - __main__ - Step 15893: {'lr': 0.0004892088804254591, 'samples': 3051456, 'steps': 15892, 'loss/train': 1.619107961654663} -08/30/2021 16:06:48 - INFO - __main__ - Step 15894: {'lr': 0.0004892073380725716, 'samples': 3051648, 'steps': 15893, 'loss/train': 1.9878965616226196} -08/30/2021 16:06:48 - INFO - __main__ - Step 15895: {'lr': 0.0004892057956119012, 'samples': 3051840, 'steps': 15894, 'loss/train': 1.452697515487671} -08/30/2021 16:06:48 - INFO - __main__ - Step 15896: {'lr': 0.0004892042530434482, 'samples': 3052032, 'steps': 15895, 'loss/train': 1.6216015815734863} -08/30/2021 16:06:49 - INFO - __main__ - Step 15897: {'lr': 0.0004892027103672134, 'samples': 3052224, 'steps': 15896, 'loss/train': 1.6163655519485474} -08/30/2021 16:06:50 - INFO - __main__ - Step 15898: {'lr': 0.0004892011675831976, 'samples': 3052416, 'steps': 15897, 'loss/train': 0.8906508684158325} -08/30/2021 16:06:51 - INFO - __main__ - Step 15899: {'lr': 0.0004891996246914014, 'samples': 3052608, 'steps': 15898, 'loss/train': 1.6975879669189453} -08/30/2021 16:06:51 - INFO - __main__ - Step 15900: {'lr': 0.0004891980816918257, 'samples': 3052800, 'steps': 15899, 'loss/train': 0.37823686003685} -08/30/2021 16:06:51 - INFO - __main__ - Step 15901: {'lr': 0.0004891965385844709, 'samples': 3052992, 'steps': 15900, 'loss/train': 1.9129810333251953} -08/30/2021 16:06:52 - INFO - __main__ - Step 15902: {'lr': 0.0004891949953693378, 'samples': 3053184, 'steps': 15901, 'loss/train': 1.1313961744308472} -08/30/2021 16:06:53 - INFO - __main__ - Step 15903: {'lr': 0.0004891934520464273, 'samples': 3053376, 'steps': 15902, 'loss/train': 1.218643069267273} -08/30/2021 16:06:54 - INFO - __main__ - Step 15904: {'lr': 0.0004891919086157398, 'samples': 3053568, 'steps': 15903, 'loss/train': 2.356090784072876} -08/30/2021 16:06:54 - INFO - __main__ - Step 15905: {'lr': 0.000489190365077276, 'samples': 3053760, 'steps': 15904, 'loss/train': 1.6718299388885498} -08/30/2021 16:06:54 - INFO - __main__ - Step 15906: {'lr': 0.0004891888214310369, 'samples': 3053952, 'steps': 15905, 'loss/train': 1.7623941898345947} -08/30/2021 16:06:55 - INFO - __main__ - Step 15907: {'lr': 0.000489187277677023, 'samples': 3054144, 'steps': 15906, 'loss/train': 1.8284597396850586} -08/30/2021 16:06:56 - INFO - __main__ - Step 15908: {'lr': 0.000489185733815235, 'samples': 3054336, 'steps': 15907, 'loss/train': 1.508117437362671} -08/30/2021 16:06:57 - INFO - __main__ - Step 15909: {'lr': 0.0004891841898456735, 'samples': 3054528, 'steps': 15908, 'loss/train': 1.4869719743728638} -08/30/2021 16:06:57 - INFO - __main__ - Step 15910: {'lr': 0.0004891826457683394, 'samples': 3054720, 'steps': 15909, 'loss/train': 1.608035683631897} -08/30/2021 16:06:57 - INFO - __main__ - Step 15911: {'lr': 0.0004891811015832332, 'samples': 3054912, 'steps': 15910, 'loss/train': 1.6275404691696167} -08/30/2021 16:06:58 - INFO - __main__ - Step 15912: {'lr': 0.0004891795572903557, 'samples': 3055104, 'steps': 15911, 'loss/train': 1.6273819208145142} -08/30/2021 16:06:59 - INFO - __main__ - Step 15913: {'lr': 0.0004891780128897077, 'samples': 3055296, 'steps': 15912, 'loss/train': 1.4007941484451294} -08/30/2021 16:07:00 - INFO - __main__ - Step 15914: {'lr': 0.0004891764683812896, 'samples': 3055488, 'steps': 15913, 'loss/train': 1.4682165384292603} -08/30/2021 16:07:00 - INFO - __main__ - Step 15915: {'lr': 0.0004891749237651024, 'samples': 3055680, 'steps': 15914, 'loss/train': 1.6606872081756592} -08/30/2021 16:07:00 - INFO - __main__ - Step 15916: {'lr': 0.0004891733790411466, 'samples': 3055872, 'steps': 15915, 'loss/train': 1.191284418106079} -08/30/2021 16:07:01 - INFO - __main__ - Step 15917: {'lr': 0.000489171834209423, 'samples': 3056064, 'steps': 15916, 'loss/train': 1.778518557548523} -08/30/2021 16:07:03 - INFO - __main__ - Step 15918: {'lr': 0.0004891702892699323, 'samples': 3056256, 'steps': 15917, 'loss/train': 1.8627073764801025} -08/30/2021 16:07:03 - INFO - __main__ - Step 15919: {'lr': 0.0004891687442226751, 'samples': 3056448, 'steps': 15918, 'loss/train': 1.9882503747940063} -08/30/2021 16:07:04 - INFO - __main__ - Step 15920: {'lr': 0.0004891671990676522, 'samples': 3056640, 'steps': 15919, 'loss/train': 2.7746639251708984} -08/30/2021 16:07:04 - INFO - __main__ - Step 15921: {'lr': 0.0004891656538048642, 'samples': 3056832, 'steps': 15920, 'loss/train': 2.682562828063965} -08/30/2021 16:07:04 - INFO - __main__ - Step 15922: {'lr': 0.0004891641084343118, 'samples': 3057024, 'steps': 15921, 'loss/train': 1.0898919105529785} -08/30/2021 16:07:05 - INFO - __main__ - Step 15923: {'lr': 0.0004891625629559959, 'samples': 3057216, 'steps': 15922, 'loss/train': 1.7425451278686523} -08/30/2021 16:07:05 - INFO - __main__ - Step 15924: {'lr': 0.0004891610173699169, 'samples': 3057408, 'steps': 15923, 'loss/train': 1.8265413045883179} -08/30/2021 16:07:07 - INFO - __main__ - Step 15925: {'lr': 0.0004891594716760757, 'samples': 3057600, 'steps': 15924, 'loss/train': 2.081162214279175} -08/30/2021 16:07:07 - INFO - __main__ - Step 15926: {'lr': 0.0004891579258744728, 'samples': 3057792, 'steps': 15925, 'loss/train': 1.856448769569397} -08/30/2021 16:07:07 - INFO - __main__ - Step 15927: {'lr': 0.0004891563799651092, 'samples': 3057984, 'steps': 15926, 'loss/train': 2.0374579429626465} -08/30/2021 16:07:08 - INFO - __main__ - Step 15928: {'lr': 0.0004891548339479854, 'samples': 3058176, 'steps': 15927, 'loss/train': 1.7977981567382812} -08/30/2021 16:07:08 - INFO - __main__ - Step 15929: {'lr': 0.0004891532878231021, 'samples': 3058368, 'steps': 15928, 'loss/train': 1.543886423110962} -08/30/2021 16:07:10 - INFO - __main__ - Step 15930: {'lr': 0.00048915174159046, 'samples': 3058560, 'steps': 15929, 'loss/train': 1.049500584602356} -08/30/2021 16:07:10 - INFO - __main__ - Step 15931: {'lr': 0.0004891501952500599, 'samples': 3058752, 'steps': 15930, 'loss/train': 1.4056872129440308} -08/30/2021 16:07:10 - INFO - __main__ - Step 15932: {'lr': 0.0004891486488019023, 'samples': 3058944, 'steps': 15931, 'loss/train': 1.9798353910446167} -08/30/2021 16:07:11 - INFO - __main__ - Step 15933: {'lr': 0.000489147102245988, 'samples': 3059136, 'steps': 15932, 'loss/train': 0.31406834721565247} -08/30/2021 16:07:11 - INFO - __main__ - Step 15934: {'lr': 0.0004891455555823179, 'samples': 3059328, 'steps': 15933, 'loss/train': 2.054659605026245} -08/30/2021 16:07:13 - INFO - __main__ - Step 15935: {'lr': 0.0004891440088108923, 'samples': 3059520, 'steps': 15934, 'loss/train': 2.25657320022583} -08/30/2021 16:07:13 - INFO - __main__ - Step 15936: {'lr': 0.0004891424619317121, 'samples': 3059712, 'steps': 15935, 'loss/train': 1.7731446027755737} -08/30/2021 16:07:13 - INFO - __main__ - Step 15937: {'lr': 0.000489140914944778, 'samples': 3059904, 'steps': 15936, 'loss/train': 1.6978503465652466} -08/30/2021 16:07:14 - INFO - __main__ - Step 15938: {'lr': 0.0004891393678500909, 'samples': 3060096, 'steps': 15937, 'loss/train': 1.7160401344299316} -08/30/2021 16:07:14 - INFO - __main__ - Step 15939: {'lr': 0.0004891378206476511, 'samples': 3060288, 'steps': 15938, 'loss/train': 0.48282942175865173} -08/30/2021 16:07:14 - INFO - __main__ - Step 15940: {'lr': 0.0004891362733374595, 'samples': 3060480, 'steps': 15939, 'loss/train': 1.8949224948883057} -08/30/2021 16:07:17 - INFO - __main__ - Step 15941: {'lr': 0.0004891347259195168, 'samples': 3060672, 'steps': 15940, 'loss/train': 1.5520035028457642} -08/30/2021 16:07:17 - INFO - __main__ - Step 15942: {'lr': 0.0004891331783938238, 'samples': 3060864, 'steps': 15941, 'loss/train': 1.6616119146347046} -08/30/2021 16:07:18 - INFO - __main__ - Step 15943: {'lr': 0.000489131630760381, 'samples': 3061056, 'steps': 15942, 'loss/train': 1.7089266777038574} -08/30/2021 16:07:18 - INFO - __main__ - Step 15944: {'lr': 0.000489130083019189, 'samples': 3061248, 'steps': 15943, 'loss/train': 2.1419475078582764} -08/30/2021 16:07:18 - INFO - __main__ - Step 15945: {'lr': 0.000489128535170249, 'samples': 3061440, 'steps': 15944, 'loss/train': 1.6969479322433472} -08/30/2021 16:07:19 - INFO - __main__ - Step 15946: {'lr': 0.0004891269872135611, 'samples': 3061632, 'steps': 15945, 'loss/train': 1.1622493267059326} -08/30/2021 16:07:19 - INFO - __main__ - Step 15947: {'lr': 0.0004891254391491264, 'samples': 3061824, 'steps': 15946, 'loss/train': 1.6910468339920044} -08/30/2021 16:07:21 - INFO - __main__ - Step 15948: {'lr': 0.0004891238909769454, 'samples': 3062016, 'steps': 15947, 'loss/train': 1.6272855997085571} -08/30/2021 16:07:21 - INFO - __main__ - Step 15949: {'lr': 0.0004891223426970189, 'samples': 3062208, 'steps': 15948, 'loss/train': 1.7621570825576782} -08/30/2021 16:07:21 - INFO - __main__ - Step 15950: {'lr': 0.0004891207943093476, 'samples': 3062400, 'steps': 15949, 'loss/train': 0.6291665434837341} -08/30/2021 16:07:22 - INFO - __main__ - Step 15951: {'lr': 0.000489119245813932, 'samples': 3062592, 'steps': 15950, 'loss/train': 1.1066741943359375} -08/30/2021 16:07:22 - INFO - __main__ - Step 15952: {'lr': 0.0004891176972107731, 'samples': 3062784, 'steps': 15951, 'loss/train': 1.4184036254882812} -08/30/2021 16:07:24 - INFO - __main__ - Step 15953: {'lr': 0.0004891161484998715, 'samples': 3062976, 'steps': 15952, 'loss/train': 1.664896011352539} -08/30/2021 16:07:25 - INFO - __main__ - Step 15954: {'lr': 0.0004891145996812279, 'samples': 3063168, 'steps': 15953, 'loss/train': 1.8335856199264526} -08/30/2021 16:07:25 - INFO - __main__ - Step 15955: {'lr': 0.0004891130507548427, 'samples': 3063360, 'steps': 15954, 'loss/train': 1.547168254852295} -08/30/2021 16:07:25 - INFO - __main__ - Step 15956: {'lr': 0.000489111501720717, 'samples': 3063552, 'steps': 15955, 'loss/train': 1.9942551851272583} -08/30/2021 16:07:26 - INFO - __main__ - Step 15957: {'lr': 0.0004891099525788514, 'samples': 3063744, 'steps': 15956, 'loss/train': 1.791953206062317} -08/30/2021 16:07:26 - INFO - __main__ - Step 15958: {'lr': 0.0004891084033292464, 'samples': 3063936, 'steps': 15957, 'loss/train': 1.6415573358535767} -08/30/2021 16:07:28 - INFO - __main__ - Step 15959: {'lr': 0.0004891068539719031, 'samples': 3064128, 'steps': 15958, 'loss/train': 1.894308090209961} -08/30/2021 16:07:28 - INFO - __main__ - Step 15960: {'lr': 0.0004891053045068217, 'samples': 3064320, 'steps': 15959, 'loss/train': 2.062399387359619} -08/30/2021 16:07:28 - INFO - __main__ - Step 15961: {'lr': 0.0004891037549340032, 'samples': 3064512, 'steps': 15960, 'loss/train': 1.6622875928878784} -08/30/2021 16:07:29 - INFO - __main__ - Step 15962: {'lr': 0.0004891022052534482, 'samples': 3064704, 'steps': 15961, 'loss/train': 1.6348267793655396} -08/30/2021 16:07:29 - INFO - __main__ - Step 15963: {'lr': 0.0004891006554651574, 'samples': 3064896, 'steps': 15962, 'loss/train': 1.1106070280075073} -08/30/2021 16:07:31 - INFO - __main__ - Step 15964: {'lr': 0.0004890991055691318, 'samples': 3065088, 'steps': 15963, 'loss/train': 1.455451488494873} -08/30/2021 16:07:31 - INFO - __main__ - Step 15965: {'lr': 0.0004890975555653716, 'samples': 3065280, 'steps': 15964, 'loss/train': 1.4749478101730347} -08/30/2021 16:07:31 - INFO - __main__ - Step 15966: {'lr': 0.0004890960054538778, 'samples': 3065472, 'steps': 15965, 'loss/train': 1.6150314807891846} -08/30/2021 16:07:32 - INFO - __main__ - Step 15967: {'lr': 0.000489094455234651, 'samples': 3065664, 'steps': 15966, 'loss/train': 0.3192380368709564} -08/30/2021 16:07:32 - INFO - __main__ - Step 15968: {'lr': 0.0004890929049076919, 'samples': 3065856, 'steps': 15967, 'loss/train': 1.7374497652053833} -08/30/2021 16:07:34 - INFO - __main__ - Step 15969: {'lr': 0.0004890913544730013, 'samples': 3066048, 'steps': 15968, 'loss/train': 1.5663126707077026} -08/30/2021 16:07:35 - INFO - __main__ - Step 15970: {'lr': 0.0004890898039305798, 'samples': 3066240, 'steps': 15969, 'loss/train': 1.9863234758377075} -08/30/2021 16:07:35 - INFO - __main__ - Step 15971: {'lr': 0.000489088253280428, 'samples': 3066432, 'steps': 15970, 'loss/train': 1.812970519065857} -08/30/2021 16:07:35 - INFO - __main__ - Step 15972: {'lr': 0.0004890867025225469, 'samples': 3066624, 'steps': 15971, 'loss/train': 1.6286590099334717} -08/30/2021 16:07:36 - INFO - __main__ - Step 15973: {'lr': 0.000489085151656937, 'samples': 3066816, 'steps': 15972, 'loss/train': 2.0572667121887207} -08/30/2021 16:07:37 - INFO - __main__ - Step 15974: {'lr': 0.000489083600683599, 'samples': 3067008, 'steps': 15973, 'loss/train': 0.20823699235916138} -08/30/2021 16:07:37 - INFO - __main__ - Step 15975: {'lr': 0.0004890820496025335, 'samples': 3067200, 'steps': 15974, 'loss/train': 2.290116310119629} -08/30/2021 16:07:38 - INFO - __main__ - Step 15976: {'lr': 0.0004890804984137415, 'samples': 3067392, 'steps': 15975, 'loss/train': 1.6490013599395752} -08/30/2021 16:07:38 - INFO - __main__ - Step 15977: {'lr': 0.0004890789471172233, 'samples': 3067584, 'steps': 15976, 'loss/train': 1.6396937370300293} -08/30/2021 16:07:38 - INFO - __main__ - Step 15978: {'lr': 0.00048907739571298, 'samples': 3067776, 'steps': 15977, 'loss/train': 1.9426047801971436} -08/30/2021 16:07:39 - INFO - __main__ - Step 15979: {'lr': 0.000489075844201012, 'samples': 3067968, 'steps': 15978, 'loss/train': 1.6522164344787598} -08/30/2021 16:07:40 - INFO - __main__ - Step 15980: {'lr': 0.0004890742925813202, 'samples': 3068160, 'steps': 15979, 'loss/train': 1.8167675733566284} -08/30/2021 16:07:41 - INFO - __main__ - Step 15981: {'lr': 0.0004890727408539051, 'samples': 3068352, 'steps': 15980, 'loss/train': 1.2056710720062256} -08/30/2021 16:07:41 - INFO - __main__ - Step 15982: {'lr': 0.0004890711890187676, 'samples': 3068544, 'steps': 15981, 'loss/train': 2.293987274169922} -08/30/2021 16:07:42 - INFO - __main__ - Step 15983: {'lr': 0.0004890696370759085, 'samples': 3068736, 'steps': 15982, 'loss/train': 1.3528395891189575} -08/30/2021 16:07:42 - INFO - __main__ - Step 15984: {'lr': 0.0004890680850253281, 'samples': 3068928, 'steps': 15983, 'loss/train': 1.4105851650238037} -08/30/2021 16:07:43 - INFO - __main__ - Step 15985: {'lr': 0.0004890665328670273, 'samples': 3069120, 'steps': 15984, 'loss/train': 1.8543025255203247} -08/30/2021 16:07:44 - INFO - __main__ - Step 15986: {'lr': 0.0004890649806010067, 'samples': 3069312, 'steps': 15985, 'loss/train': 0.3930068612098694} -08/30/2021 16:07:44 - INFO - __main__ - Step 15987: {'lr': 0.0004890634282272673, 'samples': 3069504, 'steps': 15986, 'loss/train': 1.812916874885559} -08/30/2021 16:07:45 - INFO - __main__ - Step 15988: {'lr': 0.0004890618757458096, 'samples': 3069696, 'steps': 15987, 'loss/train': 1.3969653844833374} -08/30/2021 16:07:45 - INFO - __main__ - Step 15989: {'lr': 0.0004890603231566343, 'samples': 3069888, 'steps': 15988, 'loss/train': 1.9779038429260254} -08/30/2021 16:07:47 - INFO - __main__ - Step 15990: {'lr': 0.000489058770459742, 'samples': 3070080, 'steps': 15989, 'loss/train': 1.6323916912078857} -08/30/2021 16:07:47 - INFO - __main__ - Step 15991: {'lr': 0.0004890572176551337, 'samples': 3070272, 'steps': 15990, 'loss/train': 1.7052792310714722} -08/30/2021 16:07:47 - INFO - __main__ - Step 15992: {'lr': 0.0004890556647428097, 'samples': 3070464, 'steps': 15991, 'loss/train': 1.92897629737854} -08/30/2021 16:07:48 - INFO - __main__ - Step 15993: {'lr': 0.0004890541117227711, 'samples': 3070656, 'steps': 15992, 'loss/train': 1.7285797595977783} -08/30/2021 16:07:48 - INFO - __main__ - Step 15994: {'lr': 0.0004890525585950181, 'samples': 3070848, 'steps': 15993, 'loss/train': 1.4235693216323853} -08/30/2021 16:07:48 - INFO - __main__ - Step 15995: {'lr': 0.000489051005359552, 'samples': 3071040, 'steps': 15994, 'loss/train': 0.4631354510784149} -08/30/2021 16:07:50 - INFO - __main__ - Step 15996: {'lr': 0.0004890494520163731, 'samples': 3071232, 'steps': 15995, 'loss/train': 4.9341912269592285} -08/30/2021 16:07:50 - INFO - __main__ - Step 15997: {'lr': 0.0004890478985654823, 'samples': 3071424, 'steps': 15996, 'loss/train': 1.2674771547317505} -08/30/2021 16:07:51 - INFO - __main__ - Step 15998: {'lr': 0.0004890463450068801, 'samples': 3071616, 'steps': 15997, 'loss/train': 1.4238637685775757} -08/30/2021 16:07:51 - INFO - __main__ - Step 15999: {'lr': 0.0004890447913405673, 'samples': 3071808, 'steps': 15998, 'loss/train': 1.9229238033294678} -08/30/2021 16:07:51 - INFO - __main__ - Step 16000: {'lr': 0.0004890432375665447, 'samples': 3072000, 'steps': 15999, 'loss/train': 2.1698992252349854} -08/30/2021 16:07:53 - INFO - __main__ - Step 16001: {'lr': 0.0004890416836848127, 'samples': 3072192, 'steps': 16000, 'loss/train': 1.5063798427581787} -08/30/2021 16:07:53 - INFO - __main__ - Step 16002: {'lr': 0.0004890401296953723, 'samples': 3072384, 'steps': 16001, 'loss/train': 1.455306887626648} -08/30/2021 16:07:54 - INFO - __main__ - Step 16003: {'lr': 0.0004890385755982243, 'samples': 3072576, 'steps': 16002, 'loss/train': 1.368117094039917} -08/30/2021 16:07:54 - INFO - __main__ - Step 16004: {'lr': 0.0004890370213933691, 'samples': 3072768, 'steps': 16003, 'loss/train': 1.1363060474395752} -08/30/2021 16:07:54 - INFO - __main__ - Step 16005: {'lr': 0.0004890354670808074, 'samples': 3072960, 'steps': 16004, 'loss/train': 1.667634129524231} -08/30/2021 16:07:57 - INFO - __main__ - Step 16006: {'lr': 0.0004890339126605401, 'samples': 3073152, 'steps': 16005, 'loss/train': 1.5886671543121338} -08/30/2021 16:07:57 - INFO - __main__ - Step 16007: {'lr': 0.0004890323581325677, 'samples': 3073344, 'steps': 16006, 'loss/train': 1.4568320512771606} -08/30/2021 16:07:57 - INFO - __main__ - Step 16008: {'lr': 0.0004890308034968911, 'samples': 3073536, 'steps': 16007, 'loss/train': 1.618986964225769} -08/30/2021 16:07:58 - INFO - __main__ - Step 16009: {'lr': 0.0004890292487535108, 'samples': 3073728, 'steps': 16008, 'loss/train': 1.9119718074798584} -08/30/2021 16:07:58 - INFO - __main__ - Step 16010: {'lr': 0.0004890276939024278, 'samples': 3073920, 'steps': 16009, 'loss/train': 2.1318917274475098} -08/30/2021 16:08:00 - INFO - __main__ - Step 16011: {'lr': 0.0004890261389436424, 'samples': 3074112, 'steps': 16010, 'loss/train': 1.9940615892410278} -08/30/2021 16:08:01 - INFO - __main__ - Step 16012: {'lr': 0.0004890245838771557, 'samples': 3074304, 'steps': 16011, 'loss/train': 0.35355421900749207} -08/30/2021 16:08:01 - INFO - __main__ - Step 16013: {'lr': 0.0004890230287029681, 'samples': 3074496, 'steps': 16012, 'loss/train': 0.5573104023933411} -08/30/2021 16:08:01 - INFO - __main__ - Step 16014: {'lr': 0.0004890214734210805, 'samples': 3074688, 'steps': 16013, 'loss/train': 1.2571091651916504} -08/30/2021 16:08:02 - INFO - __main__ - Step 16015: {'lr': 0.0004890199180314935, 'samples': 3074880, 'steps': 16014, 'loss/train': 1.6820523738861084} -08/30/2021 16:08:02 - INFO - __main__ - Step 16016: {'lr': 0.0004890183625342078, 'samples': 3075072, 'steps': 16015, 'loss/train': 1.702893614768982} -08/30/2021 16:08:03 - INFO - __main__ - Step 16017: {'lr': 0.0004890168069292241, 'samples': 3075264, 'steps': 16016, 'loss/train': 1.690147876739502} -08/30/2021 16:08:04 - INFO - __main__ - Step 16018: {'lr': 0.000489015251216543, 'samples': 3075456, 'steps': 16017, 'loss/train': 1.5505287647247314} -08/30/2021 16:08:04 - INFO - __main__ - Step 16019: {'lr': 0.0004890136953961654, 'samples': 3075648, 'steps': 16018, 'loss/train': 1.1830521821975708} -08/30/2021 16:08:05 - INFO - __main__ - Step 16020: {'lr': 0.000489012139468092, 'samples': 3075840, 'steps': 16019, 'loss/train': 1.4839494228363037} -08/30/2021 16:08:05 - INFO - __main__ - Step 16021: {'lr': 0.0004890105834323233, 'samples': 3076032, 'steps': 16020, 'loss/train': 1.502497673034668} -08/30/2021 16:08:06 - INFO - __main__ - Step 16022: {'lr': 0.0004890090272888602, 'samples': 3076224, 'steps': 16021, 'loss/train': 1.6627182960510254} -08/30/2021 16:08:07 - INFO - __main__ - Step 16023: {'lr': 0.0004890074710377033, 'samples': 3076416, 'steps': 16022, 'loss/train': 1.9242879152297974} -08/30/2021 16:08:07 - INFO - __main__ - Step 16024: {'lr': 0.0004890059146788532, 'samples': 3076608, 'steps': 16023, 'loss/train': 1.4171985387802124} -08/30/2021 16:08:08 - INFO - __main__ - Step 16025: {'lr': 0.000489004358212311, 'samples': 3076800, 'steps': 16024, 'loss/train': 2.0105652809143066} -08/30/2021 16:08:08 - INFO - __main__ - Step 16026: {'lr': 0.0004890028016380769, 'samples': 3076992, 'steps': 16025, 'loss/train': 1.8932466506958008} -08/30/2021 16:08:10 - INFO - __main__ - Step 16027: {'lr': 0.0004890012449561518, 'samples': 3077184, 'steps': 16026, 'loss/train': 1.5929791927337646} -08/30/2021 16:08:10 - INFO - __main__ - Step 16028: {'lr': 0.0004889996881665366, 'samples': 3077376, 'steps': 16027, 'loss/train': 1.5297855138778687} -08/30/2021 16:08:10 - INFO - __main__ - Step 16029: {'lr': 0.0004889981312692317, 'samples': 3077568, 'steps': 16028, 'loss/train': 1.4741088151931763} -08/30/2021 16:08:11 - INFO - __main__ - Step 16030: {'lr': 0.000488996574264238, 'samples': 3077760, 'steps': 16029, 'loss/train': 0.3136903941631317} -08/30/2021 16:08:11 - INFO - __main__ - Step 16031: {'lr': 0.000488995017151556, 'samples': 3077952, 'steps': 16030, 'loss/train': 1.9275661706924438} -08/30/2021 16:08:13 - INFO - __main__ - Step 16032: {'lr': 0.0004889934599311867, 'samples': 3078144, 'steps': 16031, 'loss/train': 1.510998010635376} -08/30/2021 16:08:13 - INFO - __main__ - Step 16033: {'lr': 0.0004889919026031306, 'samples': 3078336, 'steps': 16032, 'loss/train': 1.4501458406448364} -08/30/2021 16:08:13 - INFO - __main__ - Step 16034: {'lr': 0.0004889903451673884, 'samples': 3078528, 'steps': 16033, 'loss/train': 1.6799242496490479} -08/30/2021 16:08:14 - INFO - __main__ - Step 16035: {'lr': 0.0004889887876239608, 'samples': 3078720, 'steps': 16034, 'loss/train': 1.4250009059906006} -08/30/2021 16:08:14 - INFO - __main__ - Step 16036: {'lr': 0.0004889872299728486, 'samples': 3078912, 'steps': 16035, 'loss/train': 1.598712682723999} -08/30/2021 16:08:15 - INFO - __main__ - Step 16037: {'lr': 0.0004889856722140525, 'samples': 3079104, 'steps': 16036, 'loss/train': 0.8378870487213135} -08/30/2021 16:08:16 - INFO - __main__ - Step 16038: {'lr': 0.000488984114347573, 'samples': 3079296, 'steps': 16037, 'loss/train': 1.6544798612594604} -08/30/2021 16:08:16 - INFO - __main__ - Step 16039: {'lr': 0.000488982556373411, 'samples': 3079488, 'steps': 16038, 'loss/train': 0.9884001612663269} -08/30/2021 16:08:17 - INFO - __main__ - Step 16040: {'lr': 0.0004889809982915672, 'samples': 3079680, 'steps': 16039, 'loss/train': 1.8656682968139648} -08/30/2021 16:08:17 - INFO - __main__ - Step 16041: {'lr': 0.0004889794401020422, 'samples': 3079872, 'steps': 16040, 'loss/train': 1.5121309757232666} -08/30/2021 16:08:18 - INFO - __main__ - Step 16042: {'lr': 0.0004889778818048368, 'samples': 3080064, 'steps': 16041, 'loss/train': 1.3341726064682007} -08/30/2021 16:08:19 - INFO - __main__ - Step 16043: {'lr': 0.0004889763233999516, 'samples': 3080256, 'steps': 16042, 'loss/train': 1.7305001020431519} -08/30/2021 16:08:19 - INFO - __main__ - Step 16044: {'lr': 0.0004889747648873874, 'samples': 3080448, 'steps': 16043, 'loss/train': 2.1049811840057373} -08/30/2021 16:08:19 - INFO - __main__ - Step 16045: {'lr': 0.0004889732062671448, 'samples': 3080640, 'steps': 16044, 'loss/train': 1.8849035501480103} -08/30/2021 16:08:20 - INFO - __main__ - Step 16046: {'lr': 0.0004889716475392247, 'samples': 3080832, 'steps': 16045, 'loss/train': 1.5957787036895752} -08/30/2021 16:08:21 - INFO - __main__ - Step 16047: {'lr': 0.0004889700887036275, 'samples': 3081024, 'steps': 16046, 'loss/train': 1.4747272729873657} -08/30/2021 16:08:22 - INFO - __main__ - Step 16048: {'lr': 0.0004889685297603541, 'samples': 3081216, 'steps': 16047, 'loss/train': 1.2768683433532715} -08/30/2021 16:08:22 - INFO - __main__ - Step 16049: {'lr': 0.0004889669707094052, 'samples': 3081408, 'steps': 16048, 'loss/train': 1.3526276350021362} -08/30/2021 16:08:23 - INFO - __main__ - Step 16050: {'lr': 0.0004889654115507815, 'samples': 3081600, 'steps': 16049, 'loss/train': 2.011629343032837} -08/30/2021 16:08:23 - INFO - __main__ - Step 16051: {'lr': 0.0004889638522844836, 'samples': 3081792, 'steps': 16050, 'loss/train': 1.3644627332687378} -08/30/2021 16:08:24 - INFO - __main__ - Step 16052: {'lr': 0.0004889622929105123, 'samples': 3081984, 'steps': 16051, 'loss/train': 1.5981725454330444} -08/30/2021 16:08:25 - INFO - __main__ - Step 16053: {'lr': 0.0004889607334288683, 'samples': 3082176, 'steps': 16052, 'loss/train': 1.5981335639953613} -08/30/2021 16:08:25 - INFO - __main__ - Step 16054: {'lr': 0.0004889591738395522, 'samples': 3082368, 'steps': 16053, 'loss/train': 1.9253791570663452} -08/30/2021 16:08:25 - INFO - __main__ - Step 16055: {'lr': 0.0004889576141425649, 'samples': 3082560, 'steps': 16054, 'loss/train': 1.7079644203186035} -08/30/2021 16:08:26 - INFO - __main__ - Step 16056: {'lr': 0.0004889560543379069, 'samples': 3082752, 'steps': 16055, 'loss/train': 1.6662176847457886} -08/30/2021 16:08:28 - INFO - __main__ - Step 16057: {'lr': 0.000488954494425579, 'samples': 3082944, 'steps': 16056, 'loss/train': 1.7057243585586548} -08/30/2021 16:08:28 - INFO - __main__ - Step 16058: {'lr': 0.000488952934405582, 'samples': 3083136, 'steps': 16057, 'loss/train': 2.2320845127105713} -08/30/2021 16:08:29 - INFO - __main__ - Step 16059: {'lr': 0.0004889513742779164, 'samples': 3083328, 'steps': 16058, 'loss/train': 1.759162425994873} -08/30/2021 16:08:29 - INFO - __main__ - Step 16060: {'lr': 0.0004889498140425829, 'samples': 3083520, 'steps': 16059, 'loss/train': 0.5264279246330261} -08/30/2021 16:08:29 - INFO - __main__ - Step 16061: {'lr': 0.0004889482536995825, 'samples': 3083712, 'steps': 16060, 'loss/train': 1.7540335655212402} -08/30/2021 16:08:30 - INFO - __main__ - Step 16062: {'lr': 0.0004889466932489157, 'samples': 3083904, 'steps': 16061, 'loss/train': 1.7482750415802002} -08/30/2021 16:08:31 - INFO - __main__ - Step 16063: {'lr': 0.0004889451326905831, 'samples': 3084096, 'steps': 16062, 'loss/train': 1.2973772287368774} -08/30/2021 16:08:32 - INFO - __main__ - Step 16064: {'lr': 0.0004889435720245855, 'samples': 3084288, 'steps': 16063, 'loss/train': 1.0407685041427612} -08/30/2021 16:08:32 - INFO - __main__ - Step 16065: {'lr': 0.0004889420112509237, 'samples': 3084480, 'steps': 16064, 'loss/train': 0.8719043135643005} -08/30/2021 16:08:33 - INFO - __main__ - Step 16066: {'lr': 0.0004889404503695983, 'samples': 3084672, 'steps': 16065, 'loss/train': 0.8405120372772217} -08/30/2021 16:08:33 - INFO - __main__ - Step 16067: {'lr': 0.0004889388893806099, 'samples': 3084864, 'steps': 16066, 'loss/train': 1.693964958190918} -08/30/2021 16:08:34 - INFO - __main__ - Step 16068: {'lr': 0.0004889373282839594, 'samples': 3085056, 'steps': 16067, 'loss/train': 1.8568710088729858} -08/30/2021 16:08:35 - INFO - __main__ - Step 16069: {'lr': 0.0004889357670796474, 'samples': 3085248, 'steps': 16068, 'loss/train': 2.2184221744537354} -08/30/2021 16:08:35 - INFO - __main__ - Step 16070: {'lr': 0.0004889342057676748, 'samples': 3085440, 'steps': 16069, 'loss/train': 1.2420254945755005} -08/30/2021 16:08:36 - INFO - __main__ - Step 16071: {'lr': 0.000488932644348042, 'samples': 3085632, 'steps': 16070, 'loss/train': 1.8536574840545654} -08/30/2021 16:08:36 - INFO - __main__ - Step 16072: {'lr': 0.0004889310828207498, 'samples': 3085824, 'steps': 16071, 'loss/train': 1.2023687362670898} -08/30/2021 16:08:37 - INFO - __main__ - Step 16073: {'lr': 0.000488929521185799, 'samples': 3086016, 'steps': 16072, 'loss/train': 1.577937126159668} -08/30/2021 16:08:38 - INFO - __main__ - Step 16074: {'lr': 0.0004889279594431903, 'samples': 3086208, 'steps': 16073, 'loss/train': 1.64153254032135} -08/30/2021 16:08:38 - INFO - __main__ - Step 16075: {'lr': 0.0004889263975929242, 'samples': 3086400, 'steps': 16074, 'loss/train': 1.453249454498291} -08/30/2021 16:08:39 - INFO - __main__ - Step 16076: {'lr': 0.0004889248356350016, 'samples': 3086592, 'steps': 16075, 'loss/train': 1.5572229623794556} -08/30/2021 16:08:39 - INFO - __main__ - Step 16077: {'lr': 0.0004889232735694232, 'samples': 3086784, 'steps': 16076, 'loss/train': 1.7651371955871582} -08/30/2021 16:08:41 - INFO - __main__ - Step 16078: {'lr': 0.0004889217113961896, 'samples': 3086976, 'steps': 16077, 'loss/train': 1.8475475311279297} -08/30/2021 16:08:41 - INFO - __main__ - Step 16079: {'lr': 0.0004889201491153016, 'samples': 3087168, 'steps': 16078, 'loss/train': 2.020800828933716} -08/30/2021 16:08:42 - INFO - __main__ - Step 16080: {'lr': 0.0004889185867267599, 'samples': 3087360, 'steps': 16079, 'loss/train': 2.3029513359069824} -08/30/2021 16:08:42 - INFO - __main__ - Step 16081: {'lr': 0.0004889170242305652, 'samples': 3087552, 'steps': 16080, 'loss/train': 0.11970590054988861} -08/30/2021 16:08:42 - INFO - __main__ - Step 16082: {'lr': 0.0004889154616267181, 'samples': 3087744, 'steps': 16081, 'loss/train': 1.6496000289916992} -08/30/2021 16:08:43 - INFO - __main__ - Step 16083: {'lr': 0.0004889138989152194, 'samples': 3087936, 'steps': 16082, 'loss/train': 1.455633282661438} -08/30/2021 16:08:44 - INFO - __main__ - Step 16084: {'lr': 0.0004889123360960698, 'samples': 3088128, 'steps': 16083, 'loss/train': 1.4459062814712524} -08/30/2021 16:08:45 - INFO - __main__ - Step 16085: {'lr': 0.0004889107731692699, 'samples': 3088320, 'steps': 16084, 'loss/train': 1.3344615697860718} -08/30/2021 16:08:45 - INFO - __main__ - Step 16086: {'lr': 0.0004889092101348206, 'samples': 3088512, 'steps': 16085, 'loss/train': 1.3583908081054688} -08/30/2021 16:08:45 - INFO - __main__ - Step 16087: {'lr': 0.0004889076469927225, 'samples': 3088704, 'steps': 16086, 'loss/train': 1.5506062507629395} -08/30/2021 16:08:46 - INFO - __main__ - Step 16088: {'lr': 0.0004889060837429762, 'samples': 3088896, 'steps': 16087, 'loss/train': 1.8411803245544434} -08/30/2021 16:08:47 - INFO - __main__ - Step 16089: {'lr': 0.0004889045203855826, 'samples': 3089088, 'steps': 16088, 'loss/train': 1.8212236166000366} -08/30/2021 16:08:48 - INFO - __main__ - Step 16090: {'lr': 0.0004889029569205423, 'samples': 3089280, 'steps': 16089, 'loss/train': 1.8571813106536865} -08/30/2021 16:08:48 - INFO - __main__ - Step 16091: {'lr': 0.0004889013933478559, 'samples': 3089472, 'steps': 16090, 'loss/train': 1.8308440446853638} -08/30/2021 16:08:48 - INFO - __main__ - Step 16092: {'lr': 0.0004888998296675243, 'samples': 3089664, 'steps': 16091, 'loss/train': 1.9102141857147217} -08/30/2021 16:08:49 - INFO - __main__ - Step 16093: {'lr': 0.0004888982658795482, 'samples': 3089856, 'steps': 16092, 'loss/train': 1.6870355606079102} -08/30/2021 16:08:49 - INFO - __main__ - Step 16094: {'lr': 0.0004888967019839282, 'samples': 3090048, 'steps': 16093, 'loss/train': 1.6751246452331543} -08/30/2021 16:08:51 - INFO - __main__ - Step 16095: {'lr': 0.000488895137980665, 'samples': 3090240, 'steps': 16094, 'loss/train': 1.1235871315002441} -08/30/2021 16:08:51 - INFO - __main__ - Step 16096: {'lr': 0.0004888935738697593, 'samples': 3090432, 'steps': 16095, 'loss/train': 0.3828321099281311} -08/30/2021 16:08:52 - INFO - __main__ - Step 16097: {'lr': 0.0004888920096512118, 'samples': 3090624, 'steps': 16096, 'loss/train': 1.1133627891540527} -08/30/2021 16:08:52 - INFO - __main__ - Step 16098: {'lr': 0.0004888904453250233, 'samples': 3090816, 'steps': 16097, 'loss/train': 1.6914875507354736} -08/30/2021 16:08:52 - INFO - __main__ - Step 16099: {'lr': 0.0004888888808911946, 'samples': 3091008, 'steps': 16098, 'loss/train': 1.1670382022857666} -08/30/2021 16:08:54 - INFO - __main__ - Step 16100: {'lr': 0.0004888873163497261, 'samples': 3091200, 'steps': 16099, 'loss/train': 2.175337076187134} -08/30/2021 16:08:54 - INFO - __main__ - Step 16101: {'lr': 0.0004888857517006186, 'samples': 3091392, 'steps': 16100, 'loss/train': 1.7574958801269531} -08/30/2021 16:08:55 - INFO - __main__ - Step 16102: {'lr': 0.000488884186943873, 'samples': 3091584, 'steps': 16101, 'loss/train': 1.4863200187683105} -08/30/2021 16:08:55 - INFO - __main__ - Step 16103: {'lr': 0.0004888826220794899, 'samples': 3091776, 'steps': 16102, 'loss/train': 1.8977420330047607} -08/30/2021 16:08:56 - INFO - __main__ - Step 16104: {'lr': 0.0004888810571074698, 'samples': 3091968, 'steps': 16103, 'loss/train': 1.5029984712600708} -08/30/2021 16:08:56 - INFO - __main__ - Step 16105: {'lr': 0.0004888794920278137, 'samples': 3092160, 'steps': 16104, 'loss/train': 1.0788410902023315} -08/30/2021 16:08:57 - INFO - __main__ - Step 16106: {'lr': 0.0004888779268405223, 'samples': 3092352, 'steps': 16105, 'loss/train': 2.3209078311920166} -08/30/2021 16:08:58 - INFO - __main__ - Step 16107: {'lr': 0.0004888763615455959, 'samples': 3092544, 'steps': 16106, 'loss/train': 0.9094582200050354} -08/30/2021 16:08:58 - INFO - __main__ - Step 16108: {'lr': 0.0004888747961430358, 'samples': 3092736, 'steps': 16107, 'loss/train': 2.0828287601470947} -08/30/2021 16:08:59 - INFO - __main__ - Step 16109: {'lr': 0.0004888732306328422, 'samples': 3092928, 'steps': 16108, 'loss/train': 1.569623589515686} -08/30/2021 16:08:59 - INFO - __main__ - Step 16110: {'lr': 0.000488871665015016, 'samples': 3093120, 'steps': 16109, 'loss/train': 1.9902257919311523} -08/30/2021 16:09:01 - INFO - __main__ - Step 16111: {'lr': 0.0004888700992895581, 'samples': 3093312, 'steps': 16110, 'loss/train': 1.6226801872253418} -08/30/2021 16:09:01 - INFO - __main__ - Step 16112: {'lr': 0.0004888685334564688, 'samples': 3093504, 'steps': 16111, 'loss/train': 1.4757969379425049} -08/30/2021 16:09:02 - INFO - __main__ - Step 16113: {'lr': 0.0004888669675157492, 'samples': 3093696, 'steps': 16112, 'loss/train': 1.684322476387024} -08/30/2021 16:09:02 - INFO - __main__ - Step 16114: {'lr': 0.0004888654014673998, 'samples': 3093888, 'steps': 16113, 'loss/train': 0.572607696056366} -08/30/2021 16:09:02 - INFO - __main__ - Step 16115: {'lr': 0.0004888638353114212, 'samples': 3094080, 'steps': 16114, 'loss/train': 3.351923704147339} -08/30/2021 16:09:04 - INFO - __main__ - Step 16116: {'lr': 0.0004888622690478144, 'samples': 3094272, 'steps': 16115, 'loss/train': 2.2719335556030273} -08/30/2021 16:09:05 - INFO - __main__ - Step 16117: {'lr': 0.0004888607026765799, 'samples': 3094464, 'steps': 16116, 'loss/train': 1.4435566663742065} -08/30/2021 16:09:05 - INFO - __main__ - Step 16118: {'lr': 0.0004888591361977184, 'samples': 3094656, 'steps': 16117, 'loss/train': 2.0642950534820557} -08/30/2021 16:09:05 - INFO - __main__ - Step 16119: {'lr': 0.0004888575696112308, 'samples': 3094848, 'steps': 16118, 'loss/train': 1.451029658317566} -08/30/2021 16:09:06 - INFO - __main__ - Step 16120: {'lr': 0.0004888560029171175, 'samples': 3095040, 'steps': 16119, 'loss/train': 0.7746983766555786} -08/30/2021 16:09:07 - INFO - __main__ - Step 16121: {'lr': 0.0004888544361153794, 'samples': 3095232, 'steps': 16120, 'loss/train': 2.073786973953247} -08/30/2021 16:09:08 - INFO - __main__ - Step 16122: {'lr': 0.0004888528692060173, 'samples': 3095424, 'steps': 16121, 'loss/train': 1.788468837738037} -08/30/2021 16:09:08 - INFO - __main__ - Step 16123: {'lr': 0.0004888513021890316, 'samples': 3095616, 'steps': 16122, 'loss/train': 1.5074615478515625} -08/30/2021 16:09:08 - INFO - __main__ - Step 16124: {'lr': 0.0004888497350644234, 'samples': 3095808, 'steps': 16123, 'loss/train': 1.744973063468933} -08/30/2021 16:09:09 - INFO - __main__ - Step 16125: {'lr': 0.000488848167832193, 'samples': 3096000, 'steps': 16124, 'loss/train': 1.935605764389038} -08/30/2021 16:09:09 - INFO - __main__ - Step 16126: {'lr': 0.0004888466004923413, 'samples': 3096192, 'steps': 16125, 'loss/train': 1.6238654851913452} -08/30/2021 16:09:10 - INFO - __main__ - Step 16127: {'lr': 0.0004888450330448692, 'samples': 3096384, 'steps': 16126, 'loss/train': 1.3200464248657227} -08/30/2021 16:09:11 - INFO - __main__ - Step 16128: {'lr': 0.000488843465489777, 'samples': 3096576, 'steps': 16127, 'loss/train': 2.069633960723877} -08/30/2021 16:09:11 - INFO - __main__ - Step 16129: {'lr': 0.0004888418978270658, 'samples': 3096768, 'steps': 16128, 'loss/train': 1.963121771812439} -08/30/2021 16:09:12 - INFO - __main__ - Step 16130: {'lr': 0.000488840330056736, 'samples': 3096960, 'steps': 16129, 'loss/train': 0.6227633953094482} -08/30/2021 16:09:12 - INFO - __main__ - Step 16131: {'lr': 0.0004888387621787885, 'samples': 3097152, 'steps': 16130, 'loss/train': 1.151824712753296} -08/30/2021 16:09:14 - INFO - __main__ - Step 16132: {'lr': 0.0004888371941932239, 'samples': 3097344, 'steps': 16131, 'loss/train': 1.8692610263824463} -08/30/2021 16:09:14 - INFO - __main__ - Step 16133: {'lr': 0.000488835626100043, 'samples': 3097536, 'steps': 16132, 'loss/train': 2.0648441314697266} -08/30/2021 16:09:15 - INFO - __main__ - Step 16134: {'lr': 0.0004888340578992464, 'samples': 3097728, 'steps': 16133, 'loss/train': 1.5093820095062256} -08/30/2021 16:09:15 - INFO - __main__ - Step 16135: {'lr': 0.0004888324895908349, 'samples': 3097920, 'steps': 16134, 'loss/train': 0.14670990407466888} -08/30/2021 16:09:15 - INFO - __main__ - Step 16136: {'lr': 0.0004888309211748091, 'samples': 3098112, 'steps': 16135, 'loss/train': 2.1670074462890625} -08/30/2021 16:09:17 - INFO - __main__ - Step 16137: {'lr': 0.0004888293526511697, 'samples': 3098304, 'steps': 16136, 'loss/train': 1.357384204864502} -08/30/2021 16:09:18 - INFO - __main__ - Step 16138: {'lr': 0.0004888277840199177, 'samples': 3098496, 'steps': 16137, 'loss/train': 2.0959296226501465} -08/30/2021 16:09:18 - INFO - __main__ - Step 16139: {'lr': 0.0004888262152810534, 'samples': 3098688, 'steps': 16138, 'loss/train': 1.4581689834594727} -08/30/2021 16:09:19 - INFO - __main__ - Step 16140: {'lr': 0.0004888246464345779, 'samples': 3098880, 'steps': 16139, 'loss/train': 1.218555212020874} -08/30/2021 16:09:19 - INFO - __main__ - Step 16141: {'lr': 0.0004888230774804915, 'samples': 3099072, 'steps': 16140, 'loss/train': 2.924306631088257} -08/30/2021 16:09:19 - INFO - __main__ - Step 16142: {'lr': 0.0004888215084187952, 'samples': 3099264, 'steps': 16141, 'loss/train': 1.1649971008300781} -08/30/2021 16:09:20 - INFO - __main__ - Step 16143: {'lr': 0.0004888199392494896, 'samples': 3099456, 'steps': 16142, 'loss/train': 1.8804823160171509} -08/30/2021 16:09:21 - INFO - __main__ - Step 16144: {'lr': 0.0004888183699725755, 'samples': 3099648, 'steps': 16143, 'loss/train': 1.9456937313079834} -08/30/2021 16:09:22 - INFO - __main__ - Step 16145: {'lr': 0.0004888168005880533, 'samples': 3099840, 'steps': 16144, 'loss/train': 1.3489423990249634} -08/30/2021 16:09:22 - INFO - __main__ - Step 16146: {'lr': 0.0004888152310959242, 'samples': 3100032, 'steps': 16145, 'loss/train': 2.2964887619018555} -08/30/2021 16:09:23 - INFO - __main__ - Step 16147: {'lr': 0.0004888136614961885, 'samples': 3100224, 'steps': 16146, 'loss/train': 1.5480968952178955} -08/30/2021 16:09:23 - INFO - __main__ - Step 16148: {'lr': 0.000488812091788847, 'samples': 3100416, 'steps': 16147, 'loss/train': 1.7133764028549194} -08/30/2021 16:09:23 - INFO - __main__ - Step 16149: {'lr': 0.0004888105219739005, 'samples': 3100608, 'steps': 16148, 'loss/train': 1.5252094268798828} -08/30/2021 16:09:25 - INFO - __main__ - Step 16150: {'lr': 0.0004888089520513497, 'samples': 3100800, 'steps': 16149, 'loss/train': 2.347001314163208} -08/30/2021 16:09:25 - INFO - __main__ - Step 16151: {'lr': 0.0004888073820211952, 'samples': 3100992, 'steps': 16150, 'loss/train': 1.6128660440444946} -08/30/2021 16:09:26 - INFO - __main__ - Step 16152: {'lr': 0.0004888058118834379, 'samples': 3101184, 'steps': 16151, 'loss/train': 1.2262918949127197} -08/30/2021 16:09:26 - INFO - __main__ - Step 16153: {'lr': 0.0004888042416380784, 'samples': 3101376, 'steps': 16152, 'loss/train': 1.3816686868667603} -08/30/2021 16:09:26 - INFO - __main__ - Step 16154: {'lr': 0.0004888026712851172, 'samples': 3101568, 'steps': 16153, 'loss/train': 1.3808690309524536} -08/30/2021 16:09:28 - INFO - __main__ - Step 16155: {'lr': 0.0004888011008245554, 'samples': 3101760, 'steps': 16154, 'loss/train': 2.342851400375366} -08/30/2021 16:09:28 - INFO - __main__ - Step 16156: {'lr': 0.0004887995302563934, 'samples': 3101952, 'steps': 16155, 'loss/train': 1.524072527885437} -08/30/2021 16:09:29 - INFO - __main__ - Step 16157: {'lr': 0.000488797959580632, 'samples': 3102144, 'steps': 16156, 'loss/train': 1.9407135248184204} -08/30/2021 16:09:29 - INFO - __main__ - Step 16158: {'lr': 0.000488796388797272, 'samples': 3102336, 'steps': 16157, 'loss/train': 1.8427869081497192} -08/30/2021 16:09:29 - INFO - __main__ - Step 16159: {'lr': 0.0004887948179063139, 'samples': 3102528, 'steps': 16158, 'loss/train': 1.2670528888702393} -08/30/2021 16:09:31 - INFO - __main__ - Step 16160: {'lr': 0.0004887932469077587, 'samples': 3102720, 'steps': 16159, 'loss/train': 1.7608425617218018} -08/30/2021 16:09:32 - INFO - __main__ - Step 16161: {'lr': 0.0004887916758016069, 'samples': 3102912, 'steps': 16160, 'loss/train': 1.6997241973876953} -08/30/2021 16:09:32 - INFO - __main__ - Step 16162: {'lr': 0.0004887901045878592, 'samples': 3103104, 'steps': 16161, 'loss/train': 1.8640961647033691} -08/30/2021 16:09:33 - INFO - __main__ - Step 16163: {'lr': 0.0004887885332665165, 'samples': 3103296, 'steps': 16162, 'loss/train': 1.8507424592971802} -08/30/2021 16:09:33 - INFO - __main__ - Step 16164: {'lr': 0.0004887869618375793, 'samples': 3103488, 'steps': 16163, 'loss/train': 1.8012827634811401} -08/30/2021 16:09:34 - INFO - __main__ - Step 16165: {'lr': 0.0004887853903010483, 'samples': 3103680, 'steps': 16164, 'loss/train': 1.77405846118927} -08/30/2021 16:09:35 - INFO - __main__ - Step 16166: {'lr': 0.0004887838186569244, 'samples': 3103872, 'steps': 16165, 'loss/train': 1.9588273763656616} -08/30/2021 16:09:35 - INFO - __main__ - Step 16167: {'lr': 0.0004887822469052081, 'samples': 3104064, 'steps': 16166, 'loss/train': 1.5669358968734741} -08/30/2021 16:09:35 - INFO - __main__ - Step 16168: {'lr': 0.0004887806750459002, 'samples': 3104256, 'steps': 16167, 'loss/train': 1.1243661642074585} -08/30/2021 16:09:36 - INFO - __main__ - Step 16169: {'lr': 0.0004887791030790016, 'samples': 3104448, 'steps': 16168, 'loss/train': 0.7587945461273193} -08/30/2021 16:09:37 - INFO - __main__ - Step 16170: {'lr': 0.0004887775310045126, 'samples': 3104640, 'steps': 16169, 'loss/train': 1.7444339990615845} -08/30/2021 16:09:38 - INFO - __main__ - Step 16171: {'lr': 0.0004887759588224342, 'samples': 3104832, 'steps': 16170, 'loss/train': 1.7415778636932373} -08/30/2021 16:09:38 - INFO - __main__ - Step 16172: {'lr': 0.000488774386532767, 'samples': 3105024, 'steps': 16171, 'loss/train': 1.9292267560958862} -08/30/2021 16:09:39 - INFO - __main__ - Step 16173: {'lr': 0.0004887728141355118, 'samples': 3105216, 'steps': 16172, 'loss/train': 1.68677818775177} -08/30/2021 16:09:39 - INFO - __main__ - Step 16174: {'lr': 0.0004887712416306693, 'samples': 3105408, 'steps': 16173, 'loss/train': 1.582221269607544} -08/30/2021 16:09:39 - INFO - __main__ - Step 16175: {'lr': 0.00048876966901824, 'samples': 3105600, 'steps': 16174, 'loss/train': 3.0712389945983887} -08/30/2021 16:09:41 - INFO - __main__ - Step 16176: {'lr': 0.0004887680962982249, 'samples': 3105792, 'steps': 16175, 'loss/train': 1.2103501558303833} -08/30/2021 16:09:41 - INFO - __main__ - Step 16177: {'lr': 0.0004887665234706247, 'samples': 3105984, 'steps': 16176, 'loss/train': 0.9753164052963257} -08/30/2021 16:09:42 - INFO - __main__ - Step 16178: {'lr': 0.0004887649505354398, 'samples': 3106176, 'steps': 16177, 'loss/train': 1.9455859661102295} -08/30/2021 16:09:42 - INFO - __main__ - Step 16179: {'lr': 0.000488763377492671, 'samples': 3106368, 'steps': 16178, 'loss/train': 2.0331685543060303} -08/30/2021 16:09:42 - INFO - __main__ - Step 16180: {'lr': 0.0004887618043423194, 'samples': 3106560, 'steps': 16179, 'loss/train': 1.3366820812225342} -08/30/2021 16:09:44 - INFO - __main__ - Step 16181: {'lr': 0.0004887602310843852, 'samples': 3106752, 'steps': 16180, 'loss/train': 1.2191157341003418} -08/30/2021 16:09:44 - INFO - __main__ - Step 16182: {'lr': 0.0004887586577188694, 'samples': 3106944, 'steps': 16181, 'loss/train': 1.6067984104156494} -08/30/2021 16:09:45 - INFO - __main__ - Step 16183: {'lr': 0.0004887570842457726, 'samples': 3107136, 'steps': 16182, 'loss/train': 1.8974665403366089} -08/30/2021 16:09:45 - INFO - __main__ - Step 16184: {'lr': 0.0004887555106650956, 'samples': 3107328, 'steps': 16183, 'loss/train': 1.5397377014160156} -08/30/2021 16:09:46 - INFO - __main__ - Step 16185: {'lr': 0.000488753936976839, 'samples': 3107520, 'steps': 16184, 'loss/train': 1.5278619527816772} -08/30/2021 16:09:47 - INFO - __main__ - Step 16186: {'lr': 0.0004887523631810036, 'samples': 3107712, 'steps': 16185, 'loss/train': 1.9503189325332642} -08/30/2021 16:09:48 - INFO - __main__ - Step 16187: {'lr': 0.00048875078927759, 'samples': 3107904, 'steps': 16186, 'loss/train': 1.579522967338562} -08/30/2021 16:09:48 - INFO - __main__ - Step 16188: {'lr': 0.000488749215266599, 'samples': 3108096, 'steps': 16187, 'loss/train': 1.55048406124115} -08/30/2021 16:09:48 - INFO - __main__ - Step 16189: {'lr': 0.0004887476411480314, 'samples': 3108288, 'steps': 16188, 'loss/train': 1.6580860614776611} -08/30/2021 16:09:49 - INFO - __main__ - Step 16190: {'lr': 0.0004887460669218877, 'samples': 3108480, 'steps': 16189, 'loss/train': 2.1892404556274414} -08/30/2021 16:09:49 - INFO - __main__ - Step 16191: {'lr': 0.0004887444925881688, 'samples': 3108672, 'steps': 16190, 'loss/train': 1.9593427181243896} -08/30/2021 16:09:50 - INFO - __main__ - Step 16192: {'lr': 0.0004887429181468752, 'samples': 3108864, 'steps': 16191, 'loss/train': 1.5536094903945923} -08/30/2021 16:09:51 - INFO - __main__ - Step 16193: {'lr': 0.0004887413435980077, 'samples': 3109056, 'steps': 16192, 'loss/train': 1.3946034908294678} -08/30/2021 16:09:51 - INFO - __main__ - Step 16194: {'lr': 0.0004887397689415672, 'samples': 3109248, 'steps': 16193, 'loss/train': 1.8941177129745483} -08/30/2021 16:09:52 - INFO - __main__ - Step 16195: {'lr': 0.0004887381941775541, 'samples': 3109440, 'steps': 16194, 'loss/train': 1.5038566589355469} -08/30/2021 16:09:52 - INFO - __main__ - Step 16196: {'lr': 0.0004887366193059693, 'samples': 3109632, 'steps': 16195, 'loss/train': 2.350515127182007} -08/30/2021 16:09:54 - INFO - __main__ - Step 16197: {'lr': 0.0004887350443268134, 'samples': 3109824, 'steps': 16196, 'loss/train': 2.0816149711608887} -08/30/2021 16:09:54 - INFO - __main__ - Step 16198: {'lr': 0.0004887334692400872, 'samples': 3110016, 'steps': 16197, 'loss/train': 2.001119375228882} -08/30/2021 16:09:54 - INFO - __main__ - Step 16199: {'lr': 0.0004887318940457915, 'samples': 3110208, 'steps': 16198, 'loss/train': 2.252450466156006} -08/30/2021 16:09:55 - INFO - __main__ - Step 16200: {'lr': 0.0004887303187439267, 'samples': 3110400, 'steps': 16199, 'loss/train': 1.8264209032058716} -08/30/2021 16:09:55 - INFO - __main__ - Step 16201: {'lr': 0.0004887287433344939, 'samples': 3110592, 'steps': 16200, 'loss/train': 2.057054281234741} -08/30/2021 16:09:57 - INFO - __main__ - Step 16202: {'lr': 0.0004887271678174935, 'samples': 3110784, 'steps': 16201, 'loss/train': 1.7432345151901245} -08/30/2021 16:09:57 - INFO - __main__ - Step 16203: {'lr': 0.0004887255921929264, 'samples': 3110976, 'steps': 16202, 'loss/train': 1.7855374813079834} -08/30/2021 16:09:57 - INFO - __main__ - Step 16204: {'lr': 0.0004887240164607931, 'samples': 3111168, 'steps': 16203, 'loss/train': 1.6861077547073364} -08/30/2021 16:09:58 - INFO - __main__ - Step 16205: {'lr': 0.0004887224406210945, 'samples': 3111360, 'steps': 16204, 'loss/train': 1.757550597190857} -08/30/2021 16:09:58 - INFO - __main__ - Step 16206: {'lr': 0.0004887208646738312, 'samples': 3111552, 'steps': 16205, 'loss/train': 1.7205955982208252} -08/30/2021 16:10:00 - INFO - __main__ - Step 16207: {'lr': 0.000488719288619004, 'samples': 3111744, 'steps': 16206, 'loss/train': 1.0609853267669678} -08/30/2021 16:10:00 - INFO - __main__ - Step 16208: {'lr': 0.0004887177124566136, 'samples': 3111936, 'steps': 16207, 'loss/train': 1.9943522214889526} -08/30/2021 16:10:01 - INFO - __main__ - Step 16209: {'lr': 0.0004887161361866607, 'samples': 3112128, 'steps': 16208, 'loss/train': 2.03987455368042} -08/30/2021 16:10:01 - INFO - __main__ - Step 16210: {'lr': 0.000488714559809146, 'samples': 3112320, 'steps': 16209, 'loss/train': 1.0090466737747192} -08/30/2021 16:10:01 - INFO - __main__ - Step 16211: {'lr': 0.0004887129833240703, 'samples': 3112512, 'steps': 16210, 'loss/train': 2.009734630584717} -08/30/2021 16:10:02 - INFO - __main__ - Step 16212: {'lr': 0.000488711406731434, 'samples': 3112704, 'steps': 16211, 'loss/train': 2.1733686923980713} -08/30/2021 16:10:04 - INFO - __main__ - Step 16213: {'lr': 0.0004887098300312381, 'samples': 3112896, 'steps': 16212, 'loss/train': 2.4037039279937744} -08/30/2021 16:10:04 - INFO - __main__ - Step 16214: {'lr': 0.0004887082532234832, 'samples': 3113088, 'steps': 16213, 'loss/train': 1.0594024658203125} -08/30/2021 16:10:05 - INFO - __main__ - Step 16215: {'lr': 0.0004887066763081702, 'samples': 3113280, 'steps': 16214, 'loss/train': 1.5682018995285034} -08/30/2021 16:10:05 - INFO - __main__ - Step 16216: {'lr': 0.0004887050992852995, 'samples': 3113472, 'steps': 16215, 'loss/train': 2.072334051132202} -08/30/2021 16:10:05 - INFO - __main__ - Step 16217: {'lr': 0.000488703522154872, 'samples': 3113664, 'steps': 16216, 'loss/train': 1.8428153991699219} -08/30/2021 16:10:07 - INFO - __main__ - Step 16218: {'lr': 0.0004887019449168884, 'samples': 3113856, 'steps': 16217, 'loss/train': 1.2231703996658325} -08/30/2021 16:10:08 - INFO - __main__ - Step 16219: {'lr': 0.0004887003675713493, 'samples': 3114048, 'steps': 16218, 'loss/train': 1.609653115272522} -08/30/2021 16:10:08 - INFO - __main__ - Step 16220: {'lr': 0.0004886987901182556, 'samples': 3114240, 'steps': 16219, 'loss/train': 0.17627251148223877} -08/30/2021 16:10:08 - INFO - __main__ - Step 16221: {'lr': 0.0004886972125576079, 'samples': 3114432, 'steps': 16220, 'loss/train': 0.09967661648988724} -08/30/2021 16:10:09 - INFO - __main__ - Step 16222: {'lr': 0.0004886956348894069, 'samples': 3114624, 'steps': 16221, 'loss/train': 1.9792263507843018} -08/30/2021 16:10:09 - INFO - __main__ - Step 16223: {'lr': 0.0004886940571136533, 'samples': 3114816, 'steps': 16222, 'loss/train': 1.4621689319610596} -08/30/2021 16:10:11 - INFO - __main__ - Step 16224: {'lr': 0.0004886924792303479, 'samples': 3115008, 'steps': 16223, 'loss/train': 1.6258628368377686} -08/30/2021 16:10:11 - INFO - __main__ - Step 16225: {'lr': 0.0004886909012394913, 'samples': 3115200, 'steps': 16224, 'loss/train': 1.3522077798843384} -08/30/2021 16:10:11 - INFO - __main__ - Step 16226: {'lr': 0.0004886893231410844, 'samples': 3115392, 'steps': 16225, 'loss/train': 2.247959613800049} -08/30/2021 16:10:12 - INFO - __main__ - Step 16227: {'lr': 0.0004886877449351276, 'samples': 3115584, 'steps': 16226, 'loss/train': 1.8723901510238647} -08/30/2021 16:10:12 - INFO - __main__ - Step 16228: {'lr': 0.0004886861666216219, 'samples': 3115776, 'steps': 16227, 'loss/train': 1.1099066734313965} -08/30/2021 16:10:14 - INFO - __main__ - Step 16229: {'lr': 0.0004886845882005679, 'samples': 3115968, 'steps': 16228, 'loss/train': 1.552213191986084} -08/30/2021 16:10:14 - INFO - __main__ - Step 16230: {'lr': 0.0004886830096719662, 'samples': 3116160, 'steps': 16229, 'loss/train': 1.9366902112960815} -08/30/2021 16:10:14 - INFO - __main__ - Step 16231: {'lr': 0.0004886814310358176, 'samples': 3116352, 'steps': 16230, 'loss/train': 1.5782767534255981} -08/30/2021 16:10:15 - INFO - __main__ - Step 16232: {'lr': 0.000488679852292123, 'samples': 3116544, 'steps': 16231, 'loss/train': 1.4731717109680176} -08/30/2021 16:10:15 - INFO - __main__ - Step 16233: {'lr': 0.0004886782734408828, 'samples': 3116736, 'steps': 16232, 'loss/train': 2.0903234481811523} -08/30/2021 16:10:17 - INFO - __main__ - Step 16234: {'lr': 0.0004886766944820979, 'samples': 3116928, 'steps': 16233, 'loss/train': 0.8610385060310364} -08/30/2021 16:10:17 - INFO - __main__ - Step 16235: {'lr': 0.0004886751154157689, 'samples': 3117120, 'steps': 16234, 'loss/train': 1.0175727605819702} -08/30/2021 16:10:17 - INFO - __main__ - Step 16236: {'lr': 0.0004886735362418967, 'samples': 3117312, 'steps': 16235, 'loss/train': 1.5067758560180664} -08/30/2021 16:10:18 - INFO - __main__ - Step 16237: {'lr': 0.0004886719569604818, 'samples': 3117504, 'steps': 16236, 'loss/train': 1.7044957876205444} -08/30/2021 16:10:18 - INFO - __main__ - Step 16238: {'lr': 0.000488670377571525, 'samples': 3117696, 'steps': 16237, 'loss/train': 3.1742258071899414} -08/30/2021 16:10:19 - INFO - __main__ - Step 16239: {'lr': 0.0004886687980750271, 'samples': 3117888, 'steps': 16238, 'loss/train': 2.278348684310913} -08/30/2021 16:10:20 - INFO - __main__ - Step 16240: {'lr': 0.0004886672184709886, 'samples': 3118080, 'steps': 16239, 'loss/train': 1.5339815616607666} -08/30/2021 16:10:20 - INFO - __main__ - Step 16241: {'lr': 0.0004886656387594104, 'samples': 3118272, 'steps': 16240, 'loss/train': 0.7528780698776245} -08/30/2021 16:10:21 - INFO - __main__ - Step 16242: {'lr': 0.0004886640589402932, 'samples': 3118464, 'steps': 16241, 'loss/train': 1.4154741764068604} -08/30/2021 16:10:21 - INFO - __main__ - Step 16243: {'lr': 0.0004886624790136375, 'samples': 3118656, 'steps': 16242, 'loss/train': 1.8899236917495728} -08/30/2021 16:10:22 - INFO - __main__ - Step 16244: {'lr': 0.0004886608989794443, 'samples': 3118848, 'steps': 16243, 'loss/train': 1.998671293258667} -08/30/2021 16:10:23 - INFO - __main__ - Step 16245: {'lr': 0.0004886593188377142, 'samples': 3119040, 'steps': 16244, 'loss/train': 1.9466640949249268} -08/30/2021 16:10:23 - INFO - __main__ - Step 16246: {'lr': 0.0004886577385884478, 'samples': 3119232, 'steps': 16245, 'loss/train': 1.231416940689087} -08/30/2021 16:10:24 - INFO - __main__ - Step 16247: {'lr': 0.0004886561582316458, 'samples': 3119424, 'steps': 16246, 'loss/train': 1.6249898672103882} -08/30/2021 16:10:24 - INFO - __main__ - Step 16248: {'lr': 0.0004886545777673093, 'samples': 3119616, 'steps': 16247, 'loss/train': 1.663931131362915} -08/30/2021 16:10:26 - INFO - __main__ - Step 16249: {'lr': 0.0004886529971954385, 'samples': 3119808, 'steps': 16248, 'loss/train': 1.503287672996521} -08/30/2021 16:10:26 - INFO - __main__ - Step 16250: {'lr': 0.0004886514165160345, 'samples': 3120000, 'steps': 16249, 'loss/train': 0.7937673330307007} -08/30/2021 16:10:26 - INFO - __main__ - Step 16251: {'lr': 0.0004886498357290979, 'samples': 3120192, 'steps': 16250, 'loss/train': 3.2912514209747314} -08/30/2021 16:10:27 - INFO - __main__ - Step 16252: {'lr': 0.0004886482548346291, 'samples': 3120384, 'steps': 16251, 'loss/train': 0.1299923211336136} -08/30/2021 16:10:27 - INFO - __main__ - Step 16253: {'lr': 0.0004886466738326293, 'samples': 3120576, 'steps': 16252, 'loss/train': 0.14120961725711823} -08/30/2021 16:10:27 - INFO - __main__ - Step 16254: {'lr': 0.000488645092723099, 'samples': 3120768, 'steps': 16253, 'loss/train': 1.906154990196228} -08/30/2021 16:10:29 - INFO - __main__ - Step 16255: {'lr': 0.0004886435115060388, 'samples': 3120960, 'steps': 16254, 'loss/train': 1.6424577236175537} -08/30/2021 16:10:29 - INFO - __main__ - Step 16256: {'lr': 0.0004886419301814495, 'samples': 3121152, 'steps': 16255, 'loss/train': 1.7797577381134033} -08/30/2021 16:10:30 - INFO - __main__ - Step 16257: {'lr': 0.0004886403487493319, 'samples': 3121344, 'steps': 16256, 'loss/train': 1.8279746770858765} -08/30/2021 16:10:30 - INFO - __main__ - Step 16258: {'lr': 0.0004886387672096866, 'samples': 3121536, 'steps': 16257, 'loss/train': 0.8470008969306946} -08/30/2021 16:10:30 - INFO - __main__ - Step 16259: {'lr': 0.0004886371855625143, 'samples': 3121728, 'steps': 16258, 'loss/train': 1.8683289289474487} -08/30/2021 16:10:32 - INFO - __main__ - Step 16260: {'lr': 0.0004886356038078159, 'samples': 3121920, 'steps': 16259, 'loss/train': 1.5578852891921997} -08/30/2021 16:10:32 - INFO - __main__ - Step 16261: {'lr': 0.0004886340219455919, 'samples': 3122112, 'steps': 16260, 'loss/train': 1.034650444984436} -08/30/2021 16:10:33 - INFO - __main__ - Step 16262: {'lr': 0.0004886324399758431, 'samples': 3122304, 'steps': 16261, 'loss/train': 1.6897884607315063} -08/30/2021 16:10:33 - INFO - __main__ - Step 16263: {'lr': 0.0004886308578985702, 'samples': 3122496, 'steps': 16262, 'loss/train': 1.7113878726959229} -08/30/2021 16:10:33 - INFO - __main__ - Step 16264: {'lr': 0.0004886292757137739, 'samples': 3122688, 'steps': 16263, 'loss/train': 2.0861010551452637} -08/30/2021 16:10:34 - INFO - __main__ - Step 16265: {'lr': 0.0004886276934214551, 'samples': 3122880, 'steps': 16264, 'loss/train': 1.7308111190795898} -08/30/2021 16:10:35 - INFO - __main__ - Step 16266: {'lr': 0.0004886261110216141, 'samples': 3123072, 'steps': 16265, 'loss/train': 1.7342652082443237} -08/30/2021 16:10:36 - INFO - __main__ - Step 16267: {'lr': 0.000488624528514252, 'samples': 3123264, 'steps': 16266, 'loss/train': 1.5815978050231934} -08/30/2021 16:10:36 - INFO - __main__ - Step 16268: {'lr': 0.0004886229458993693, 'samples': 3123456, 'steps': 16267, 'loss/train': 1.6773253679275513} -08/30/2021 16:10:36 - INFO - __main__ - Step 16269: {'lr': 0.0004886213631769669, 'samples': 3123648, 'steps': 16268, 'loss/train': 1.8577414751052856} -08/30/2021 16:10:37 - INFO - __main__ - Step 16270: {'lr': 0.0004886197803470453, 'samples': 3123840, 'steps': 16269, 'loss/train': 1.8149452209472656} -08/30/2021 16:10:39 - INFO - __main__ - Step 16271: {'lr': 0.0004886181974096052, 'samples': 3124032, 'steps': 16270, 'loss/train': 1.1607913970947266} -08/30/2021 16:10:39 - INFO - __main__ - Step 16272: {'lr': 0.0004886166143646476, 'samples': 3124224, 'steps': 16271, 'loss/train': 1.8695080280303955} -08/30/2021 16:10:40 - INFO - __main__ - Step 16273: {'lr': 0.000488615031212173, 'samples': 3124416, 'steps': 16272, 'loss/train': 1.834064245223999} -08/30/2021 16:10:40 - INFO - __main__ - Step 16274: {'lr': 0.0004886134479521821, 'samples': 3124608, 'steps': 16273, 'loss/train': 1.9997714757919312} -08/30/2021 16:10:40 - INFO - __main__ - Step 16275: {'lr': 0.0004886118645846757, 'samples': 3124800, 'steps': 16274, 'loss/train': 1.942400574684143} -08/30/2021 16:10:42 - INFO - __main__ - Step 16276: {'lr': 0.0004886102811096544, 'samples': 3124992, 'steps': 16275, 'loss/train': 1.6288559436798096} -08/30/2021 16:10:42 - INFO - __main__ - Step 16277: {'lr': 0.0004886086975271191, 'samples': 3125184, 'steps': 16276, 'loss/train': 1.7238287925720215} -08/30/2021 16:10:43 - INFO - __main__ - Step 16278: {'lr': 0.0004886071138370704, 'samples': 3125376, 'steps': 16277, 'loss/train': 1.8636168241500854} -08/30/2021 16:10:43 - INFO - __main__ - Step 16279: {'lr': 0.000488605530039509, 'samples': 3125568, 'steps': 16278, 'loss/train': 1.5248596668243408} -08/30/2021 16:10:43 - INFO - __main__ - Step 16280: {'lr': 0.0004886039461344356, 'samples': 3125760, 'steps': 16279, 'loss/train': 1.7116458415985107} -08/30/2021 16:10:45 - INFO - __main__ - Step 16281: {'lr': 0.0004886023621218509, 'samples': 3125952, 'steps': 16280, 'loss/train': 1.7959003448486328} -08/30/2021 16:10:45 - INFO - __main__ - Step 16282: {'lr': 0.0004886007780017557, 'samples': 3126144, 'steps': 16281, 'loss/train': 1.5302084684371948} -08/30/2021 16:10:46 - INFO - __main__ - Step 16283: {'lr': 0.0004885991937741506, 'samples': 3126336, 'steps': 16282, 'loss/train': 1.8500771522521973} -08/30/2021 16:10:46 - INFO - __main__ - Step 16284: {'lr': 0.0004885976094390366, 'samples': 3126528, 'steps': 16283, 'loss/train': 1.7807413339614868} -08/30/2021 16:10:46 - INFO - __main__ - Step 16285: {'lr': 0.000488596024996414, 'samples': 3126720, 'steps': 16284, 'loss/train': 1.6970168352127075} -08/30/2021 16:10:47 - INFO - __main__ - Step 16286: {'lr': 0.0004885944404462838, 'samples': 3126912, 'steps': 16285, 'loss/train': 1.7380517721176147} -08/30/2021 16:10:49 - INFO - __main__ - Step 16287: {'lr': 0.0004885928557886466, 'samples': 3127104, 'steps': 16286, 'loss/train': 1.9905680418014526} -08/30/2021 16:10:49 - INFO - __main__ - Step 16288: {'lr': 0.0004885912710235031, 'samples': 3127296, 'steps': 16287, 'loss/train': 1.461103916168213} -08/30/2021 16:10:49 - INFO - __main__ - Step 16289: {'lr': 0.0004885896861508541, 'samples': 3127488, 'steps': 16288, 'loss/train': 2.0694077014923096} -08/30/2021 16:10:50 - INFO - __main__ - Step 16290: {'lr': 0.0004885881011707003, 'samples': 3127680, 'steps': 16289, 'loss/train': 1.1995704174041748} -08/30/2021 16:10:50 - INFO - __main__ - Step 16291: {'lr': 0.0004885865160830422, 'samples': 3127872, 'steps': 16290, 'loss/train': 1.7522541284561157} -08/30/2021 16:10:51 - INFO - __main__ - Step 16292: {'lr': 0.0004885849308878809, 'samples': 3128064, 'steps': 16291, 'loss/train': 1.6052396297454834} -08/30/2021 16:10:52 - INFO - __main__ - Step 16293: {'lr': 0.0004885833455852169, 'samples': 3128256, 'steps': 16292, 'loss/train': 1.8246219158172607} -08/30/2021 16:10:52 - INFO - __main__ - Step 16294: {'lr': 0.0004885817601750509, 'samples': 3128448, 'steps': 16293, 'loss/train': 1.7759073972702026} -08/30/2021 16:10:53 - INFO - __main__ - Step 16295: {'lr': 0.0004885801746573836, 'samples': 3128640, 'steps': 16294, 'loss/train': 1.4780112504959106} -08/30/2021 16:10:53 - INFO - __main__ - Step 16296: {'lr': 0.0004885785890322158, 'samples': 3128832, 'steps': 16295, 'loss/train': 1.8578686714172363} -08/30/2021 16:10:54 - INFO - __main__ - Step 16297: {'lr': 0.0004885770032995482, 'samples': 3129024, 'steps': 16296, 'loss/train': 1.973870873451233} -08/30/2021 16:10:55 - INFO - __main__ - Step 16298: {'lr': 0.0004885754174593814, 'samples': 3129216, 'steps': 16297, 'loss/train': 1.013839602470398} -08/30/2021 16:10:55 - INFO - __main__ - Step 16299: {'lr': 0.0004885738315117162, 'samples': 3129408, 'steps': 16298, 'loss/train': 1.2680706977844238} -08/30/2021 16:10:56 - INFO - __main__ - Step 16300: {'lr': 0.0004885722454565534, 'samples': 3129600, 'steps': 16299, 'loss/train': 1.2194448709487915} -08/30/2021 16:10:56 - INFO - __main__ - Step 16301: {'lr': 0.0004885706592938936, 'samples': 3129792, 'steps': 16300, 'loss/train': 1.9567265510559082} -08/30/2021 16:10:58 - INFO - __main__ - Step 16302: {'lr': 0.0004885690730237375, 'samples': 3129984, 'steps': 16301, 'loss/train': 1.841776967048645} -08/30/2021 16:10:58 - INFO - __main__ - Step 16303: {'lr': 0.0004885674866460858, 'samples': 3130176, 'steps': 16302, 'loss/train': 2.2307300567626953} -08/30/2021 16:10:58 - INFO - __main__ - Step 16304: {'lr': 0.0004885659001609393, 'samples': 3130368, 'steps': 16303, 'loss/train': 1.4630793333053589} -08/30/2021 16:10:59 - INFO - __main__ - Step 16305: {'lr': 0.0004885643135682987, 'samples': 3130560, 'steps': 16304, 'loss/train': 1.1288224458694458} -08/30/2021 16:10:59 - INFO - __main__ - Step 16306: {'lr': 0.0004885627268681648, 'samples': 3130752, 'steps': 16305, 'loss/train': 5.890904903411865} -08/30/2021 16:10:59 - INFO - __main__ - Step 16307: {'lr': 0.0004885611400605381, 'samples': 3130944, 'steps': 16306, 'loss/train': 1.1502996683120728} -08/30/2021 16:11:01 - INFO - __main__ - Step 16308: {'lr': 0.0004885595531454195, 'samples': 3131136, 'steps': 16307, 'loss/train': 2.030357837677002} -08/30/2021 16:11:01 - INFO - __main__ - Step 16309: {'lr': 0.0004885579661228097, 'samples': 3131328, 'steps': 16308, 'loss/train': 2.012671947479248} -08/30/2021 16:11:02 - INFO - __main__ - Step 16310: {'lr': 0.0004885563789927092, 'samples': 3131520, 'steps': 16309, 'loss/train': 1.4014322757720947} -08/30/2021 16:11:02 - INFO - __main__ - Step 16311: {'lr': 0.0004885547917551189, 'samples': 3131712, 'steps': 16310, 'loss/train': 1.609916090965271} -08/30/2021 16:11:02 - INFO - __main__ - Step 16312: {'lr': 0.0004885532044100396, 'samples': 3131904, 'steps': 16311, 'loss/train': 1.7045129537582397} -08/30/2021 16:11:04 - INFO - __main__ - Step 16313: {'lr': 0.0004885516169574719, 'samples': 3132096, 'steps': 16312, 'loss/train': 1.6659396886825562} -08/30/2021 16:11:05 - INFO - __main__ - Step 16314: {'lr': 0.0004885500293974165, 'samples': 3132288, 'steps': 16313, 'loss/train': 1.6932291984558105} -08/30/2021 16:11:05 - INFO - __main__ - Step 16315: {'lr': 0.0004885484417298741, 'samples': 3132480, 'steps': 16314, 'loss/train': 1.825520396232605} -08/30/2021 16:11:05 - INFO - __main__ - Step 16316: {'lr': 0.0004885468539548455, 'samples': 3132672, 'steps': 16315, 'loss/train': 0.23717674612998962} -08/30/2021 16:11:06 - INFO - __main__ - Step 16317: {'lr': 0.0004885452660723313, 'samples': 3132864, 'steps': 16316, 'loss/train': 1.829975962638855} -08/30/2021 16:11:07 - INFO - __main__ - Step 16318: {'lr': 0.0004885436780823324, 'samples': 3133056, 'steps': 16317, 'loss/train': 1.3374109268188477} -08/30/2021 16:11:08 - INFO - __main__ - Step 16319: {'lr': 0.0004885420899848492, 'samples': 3133248, 'steps': 16318, 'loss/train': 0.565299928188324} -08/30/2021 16:11:08 - INFO - __main__ - Step 16320: {'lr': 0.0004885405017798828, 'samples': 3133440, 'steps': 16319, 'loss/train': 1.8940999507904053} -08/30/2021 16:11:08 - INFO - __main__ - Step 16321: {'lr': 0.0004885389134674337, 'samples': 3133632, 'steps': 16320, 'loss/train': 1.845708966255188} -08/30/2021 16:11:09 - INFO - __main__ - Step 16322: {'lr': 0.0004885373250475026, 'samples': 3133824, 'steps': 16321, 'loss/train': 1.7308459281921387} -08/30/2021 16:11:11 - INFO - __main__ - Step 16323: {'lr': 0.0004885357365200903, 'samples': 3134016, 'steps': 16322, 'loss/train': 1.538646936416626} -08/30/2021 16:11:11 - INFO - __main__ - Step 16324: {'lr': 0.0004885341478851975, 'samples': 3134208, 'steps': 16323, 'loss/train': 1.763047695159912} -08/30/2021 16:11:12 - INFO - __main__ - Step 16325: {'lr': 0.0004885325591428248, 'samples': 3134400, 'steps': 16324, 'loss/train': 1.3690780401229858} -08/30/2021 16:11:12 - INFO - __main__ - Step 16326: {'lr': 0.0004885309702929731, 'samples': 3134592, 'steps': 16325, 'loss/train': 1.5660958290100098} -08/30/2021 16:11:12 - INFO - __main__ - Step 16327: {'lr': 0.000488529381335643, 'samples': 3134784, 'steps': 16326, 'loss/train': 1.7297216653823853} -08/30/2021 16:11:14 - INFO - __main__ - Step 16328: {'lr': 0.0004885277922708352, 'samples': 3134976, 'steps': 16327, 'loss/train': 1.8478820323944092} -08/30/2021 16:11:14 - INFO - __main__ - Step 16329: {'lr': 0.0004885262030985504, 'samples': 3135168, 'steps': 16328, 'loss/train': 1.6181265115737915} -08/30/2021 16:11:15 - INFO - __main__ - Step 16330: {'lr': 0.0004885246138187896, 'samples': 3135360, 'steps': 16329, 'loss/train': 1.5884735584259033} -08/30/2021 16:11:15 - INFO - __main__ - Step 16331: {'lr': 0.0004885230244315531, 'samples': 3135552, 'steps': 16330, 'loss/train': 1.2228111028671265} -08/30/2021 16:11:15 - INFO - __main__ - Step 16332: {'lr': 0.0004885214349368419, 'samples': 3135744, 'steps': 16331, 'loss/train': 2.0802552700042725} -08/30/2021 16:11:16 - INFO - __main__ - Step 16333: {'lr': 0.0004885198453346565, 'samples': 3135936, 'steps': 16332, 'loss/train': 1.9758137464523315} -08/30/2021 16:11:18 - INFO - __main__ - Step 16334: {'lr': 0.0004885182556249978, 'samples': 3136128, 'steps': 16333, 'loss/train': 2.045431137084961} -08/30/2021 16:11:18 - INFO - __main__ - Step 16335: {'lr': 0.0004885166658078666, 'samples': 3136320, 'steps': 16334, 'loss/train': 1.4344342947006226} -08/30/2021 16:11:18 - INFO - __main__ - Step 16336: {'lr': 0.0004885150758832632, 'samples': 3136512, 'steps': 16335, 'loss/train': 1.4791133403778076} -08/30/2021 16:11:19 - INFO - __main__ - Step 16337: {'lr': 0.0004885134858511888, 'samples': 3136704, 'steps': 16336, 'loss/train': 1.6670126914978027} -08/30/2021 16:11:19 - INFO - __main__ - Step 16338: {'lr': 0.0004885118957116438, 'samples': 3136896, 'steps': 16337, 'loss/train': 1.0015093088150024} -08/30/2021 16:11:21 - INFO - __main__ - Step 16339: {'lr': 0.000488510305464629, 'samples': 3137088, 'steps': 16338, 'loss/train': 2.0380828380584717} -08/30/2021 16:11:21 - INFO - __main__ - Step 16340: {'lr': 0.0004885087151101453, 'samples': 3137280, 'steps': 16339, 'loss/train': 1.8990954160690308} -08/30/2021 16:11:21 - INFO - __main__ - Step 16341: {'lr': 0.0004885071246481931, 'samples': 3137472, 'steps': 16340, 'loss/train': 1.7942309379577637} -08/30/2021 16:11:22 - INFO - __main__ - Step 16342: {'lr': 0.0004885055340787733, 'samples': 3137664, 'steps': 16341, 'loss/train': 1.1840516328811646} -08/30/2021 16:11:22 - INFO - __main__ - Step 16343: {'lr': 0.0004885039434018866, 'samples': 3137856, 'steps': 16342, 'loss/train': 1.8106180429458618} -08/30/2021 16:11:24 - INFO - __main__ - Step 16344: {'lr': 0.0004885023526175337, 'samples': 3138048, 'steps': 16343, 'loss/train': 1.5840362310409546} -08/30/2021 16:11:24 - INFO - __main__ - Step 16345: {'lr': 0.0004885007617257154, 'samples': 3138240, 'steps': 16344, 'loss/train': 1.4874635934829712} -08/30/2021 16:11:25 - INFO - __main__ - Step 16346: {'lr': 0.0004884991707264322, 'samples': 3138432, 'steps': 16345, 'loss/train': 0.11009877920150757} -08/30/2021 16:11:25 - INFO - __main__ - Step 16347: {'lr': 0.000488497579619685, 'samples': 3138624, 'steps': 16346, 'loss/train': 1.738002061843872} -08/30/2021 16:11:25 - INFO - __main__ - Step 16348: {'lr': 0.0004884959884054745, 'samples': 3138816, 'steps': 16347, 'loss/train': 1.8687289953231812} -08/30/2021 16:11:26 - INFO - __main__ - Step 16349: {'lr': 0.0004884943970838014, 'samples': 3139008, 'steps': 16348, 'loss/train': 1.5455678701400757} -08/30/2021 16:11:27 - INFO - __main__ - Step 16350: {'lr': 0.0004884928056546663, 'samples': 3139200, 'steps': 16349, 'loss/train': 1.8006826639175415} -08/30/2021 16:11:28 - INFO - __main__ - Step 16351: {'lr': 0.0004884912141180701, 'samples': 3139392, 'steps': 16350, 'loss/train': 1.7931283712387085} -08/30/2021 16:11:28 - INFO - __main__ - Step 16352: {'lr': 0.0004884896224740136, 'samples': 3139584, 'steps': 16351, 'loss/train': 1.4437652826309204} -08/30/2021 16:11:28 - INFO - __main__ - Step 16353: {'lr': 0.0004884880307224972, 'samples': 3139776, 'steps': 16352, 'loss/train': 2.056745767593384} -08/30/2021 16:11:29 - INFO - __main__ - Step 16354: {'lr': 0.0004884864388635217, 'samples': 3139968, 'steps': 16353, 'loss/train': 1.7429823875427246} -08/30/2021 16:11:30 - INFO - __main__ - Step 16355: {'lr': 0.0004884848468970879, 'samples': 3140160, 'steps': 16354, 'loss/train': 1.7310128211975098} -08/30/2021 16:11:31 - INFO - __main__ - Step 16356: {'lr': 0.0004884832548231966, 'samples': 3140352, 'steps': 16355, 'loss/train': 1.6515498161315918} -08/30/2021 16:11:31 - INFO - __main__ - Step 16357: {'lr': 0.0004884816626418484, 'samples': 3140544, 'steps': 16356, 'loss/train': 1.6642929315567017} -08/30/2021 16:11:31 - INFO - __main__ - Step 16358: {'lr': 0.000488480070353044, 'samples': 3140736, 'steps': 16357, 'loss/train': 1.6606919765472412} -08/30/2021 16:11:32 - INFO - __main__ - Step 16359: {'lr': 0.0004884784779567843, 'samples': 3140928, 'steps': 16358, 'loss/train': 1.5081998109817505} -08/30/2021 16:11:34 - INFO - __main__ - Step 16360: {'lr': 0.0004884768854530696, 'samples': 3141120, 'steps': 16359, 'loss/train': 1.4753029346466064} -08/30/2021 16:11:34 - INFO - __main__ - Step 16361: {'lr': 0.0004884752928419012, 'samples': 3141312, 'steps': 16360, 'loss/train': 1.6934443712234497} -08/30/2021 16:11:35 - INFO - __main__ - Step 16362: {'lr': 0.0004884737001232793, 'samples': 3141504, 'steps': 16361, 'loss/train': 1.7826738357543945} -08/30/2021 16:11:35 - INFO - __main__ - Step 16363: {'lr': 0.000488472107297205, 'samples': 3141696, 'steps': 16362, 'loss/train': 0.815053403377533} -08/30/2021 16:11:35 - INFO - __main__ - Step 16364: {'lr': 0.0004884705143636788, 'samples': 3141888, 'steps': 16363, 'loss/train': 1.4334876537322998} -08/30/2021 16:11:36 - INFO - __main__ - Step 16365: {'lr': 0.0004884689213227013, 'samples': 3142080, 'steps': 16364, 'loss/train': 1.7051260471343994} -08/30/2021 16:11:36 - INFO - __main__ - Step 16366: {'lr': 0.0004884673281742736, 'samples': 3142272, 'steps': 16365, 'loss/train': 0.10288375616073608} -08/30/2021 16:11:38 - INFO - __main__ - Step 16367: {'lr': 0.0004884657349183961, 'samples': 3142464, 'steps': 16366, 'loss/train': 0.10311628878116608} -08/30/2021 16:11:38 - INFO - __main__ - Step 16368: {'lr': 0.0004884641415550696, 'samples': 3142656, 'steps': 16367, 'loss/train': 1.4080204963684082} -08/30/2021 16:11:38 - INFO - __main__ - Step 16369: {'lr': 0.0004884625480842949, 'samples': 3142848, 'steps': 16368, 'loss/train': 1.8912681341171265} -08/30/2021 16:11:39 - INFO - __main__ - Step 16370: {'lr': 0.0004884609545060726, 'samples': 3143040, 'steps': 16369, 'loss/train': 1.391222596168518} -08/30/2021 16:11:39 - INFO - __main__ - Step 16371: {'lr': 0.0004884593608204035, 'samples': 3143232, 'steps': 16370, 'loss/train': 1.6049600839614868} -08/30/2021 16:11:41 - INFO - __main__ - Step 16372: {'lr': 0.0004884577670272882, 'samples': 3143424, 'steps': 16371, 'loss/train': 1.399133563041687} -08/30/2021 16:11:41 - INFO - __main__ - Step 16373: {'lr': 0.0004884561731267278, 'samples': 3143616, 'steps': 16372, 'loss/train': 1.9584330320358276} -08/30/2021 16:11:41 - INFO - __main__ - Step 16374: {'lr': 0.0004884545791187224, 'samples': 3143808, 'steps': 16373, 'loss/train': 1.2325204610824585} -08/30/2021 16:11:42 - INFO - __main__ - Step 16375: {'lr': 0.0004884529850032732, 'samples': 3144000, 'steps': 16374, 'loss/train': 1.823428988456726} -08/30/2021 16:11:42 - INFO - __main__ - Step 16376: {'lr': 0.0004884513907803808, 'samples': 3144192, 'steps': 16375, 'loss/train': 2.0254604816436768} -08/30/2021 16:11:44 - INFO - __main__ - Step 16377: {'lr': 0.0004884497964500457, 'samples': 3144384, 'steps': 16376, 'loss/train': 1.838220238685608} -08/30/2021 16:11:44 - INFO - __main__ - Step 16378: {'lr': 0.000488448202012269, 'samples': 3144576, 'steps': 16377, 'loss/train': 1.714113473892212} -08/30/2021 16:11:45 - INFO - __main__ - Step 16379: {'lr': 0.0004884466074670512, 'samples': 3144768, 'steps': 16378, 'loss/train': 1.836683988571167} -08/30/2021 16:11:45 - INFO - __main__ - Step 16380: {'lr': 0.0004884450128143929, 'samples': 3144960, 'steps': 16379, 'loss/train': 1.4216639995574951} -08/30/2021 16:11:45 - INFO - __main__ - Step 16381: {'lr': 0.000488443418054295, 'samples': 3145152, 'steps': 16380, 'loss/train': 1.983205795288086} -08/30/2021 16:11:47 - INFO - __main__ - Step 16382: {'lr': 0.0004884418231867583, 'samples': 3145344, 'steps': 16381, 'loss/train': 1.8755842447280884} -08/30/2021 16:11:48 - INFO - __main__ - Step 16383: {'lr': 0.0004884402282117833, 'samples': 3145536, 'steps': 16382, 'loss/train': 1.6494497060775757} -08/30/2021 16:11:48 - INFO - __main__ - Step 16384: {'lr': 0.0004884386331293708, 'samples': 3145728, 'steps': 16383, 'loss/train': 0.07024643570184708} -08/30/2021 16:11:49 - INFO - __main__ - Step 16385: {'lr': 0.0004884370379395215, 'samples': 3145920, 'steps': 16384, 'loss/train': 1.9015545845031738} -08/30/2021 16:11:49 - INFO - __main__ - Step 16386: {'lr': 0.0004884354426422363, 'samples': 3146112, 'steps': 16385, 'loss/train': 0.16112719476222992} -08/30/2021 16:11:49 - INFO - __main__ - Step 16387: {'lr': 0.0004884338472375156, 'samples': 3146304, 'steps': 16386, 'loss/train': 1.2409710884094238} -08/30/2021 16:11:51 - INFO - __main__ - Step 16388: {'lr': 0.0004884322517253604, 'samples': 3146496, 'steps': 16387, 'loss/train': 1.0356227159500122} -08/30/2021 16:11:51 - INFO - __main__ - Step 16389: {'lr': 0.0004884306561057713, 'samples': 3146688, 'steps': 16388, 'loss/train': 1.4719094038009644} -08/30/2021 16:11:52 - INFO - __main__ - Step 16390: {'lr': 0.000488429060378749, 'samples': 3146880, 'steps': 16389, 'loss/train': 1.825208306312561} -08/30/2021 16:11:52 - INFO - __main__ - Step 16391: {'lr': 0.0004884274645442942, 'samples': 3147072, 'steps': 16390, 'loss/train': 1.7455666065216064} -08/30/2021 16:11:52 - INFO - __main__ - Step 16392: {'lr': 0.0004884258686024077, 'samples': 3147264, 'steps': 16391, 'loss/train': 1.788954734802246} -08/30/2021 16:11:54 - INFO - __main__ - Step 16393: {'lr': 0.0004884242725530902, 'samples': 3147456, 'steps': 16392, 'loss/train': 1.6024516820907593} -08/30/2021 16:11:54 - INFO - __main__ - Step 16394: {'lr': 0.0004884226763963423, 'samples': 3147648, 'steps': 16393, 'loss/train': 1.8891571760177612} -08/30/2021 16:11:55 - INFO - __main__ - Step 16395: {'lr': 0.000488421080132165, 'samples': 3147840, 'steps': 16394, 'loss/train': 1.7516354322433472} -08/30/2021 16:11:55 - INFO - __main__ - Step 16396: {'lr': 0.0004884194837605587, 'samples': 3148032, 'steps': 16395, 'loss/train': 1.6981509923934937} -08/30/2021 16:11:55 - INFO - __main__ - Step 16397: {'lr': 0.0004884178872815243, 'samples': 3148224, 'steps': 16396, 'loss/train': 1.2616357803344727} -08/30/2021 16:11:57 - INFO - __main__ - Step 16398: {'lr': 0.0004884162906950624, 'samples': 3148416, 'steps': 16397, 'loss/train': 0.14406365156173706} -08/30/2021 16:11:58 - INFO - __main__ - Step 16399: {'lr': 0.000488414694001174, 'samples': 3148608, 'steps': 16398, 'loss/train': 2.0568366050720215} -08/30/2021 16:11:58 - INFO - __main__ - Step 16400: {'lr': 0.0004884130971998595, 'samples': 3148800, 'steps': 16399, 'loss/train': 2.191758871078491} -08/30/2021 16:11:58 - INFO - __main__ - Step 16401: {'lr': 0.0004884115002911197, 'samples': 3148992, 'steps': 16400, 'loss/train': 1.3861243724822998} -08/30/2021 16:11:59 - INFO - __main__ - Step 16402: {'lr': 0.0004884099032749554, 'samples': 3149184, 'steps': 16401, 'loss/train': 0.0903669074177742} -08/30/2021 16:12:00 - INFO - __main__ - Step 16403: {'lr': 0.0004884083061513672, 'samples': 3149376, 'steps': 16402, 'loss/train': 2.5146679878234863} -08/30/2021 16:12:00 - INFO - __main__ - Step 16404: {'lr': 0.0004884067089203559, 'samples': 3149568, 'steps': 16403, 'loss/train': 1.8538411855697632} -08/30/2021 16:12:01 - INFO - __main__ - Step 16405: {'lr': 0.0004884051115819224, 'samples': 3149760, 'steps': 16404, 'loss/train': 2.032058000564575} -08/30/2021 16:12:01 - INFO - __main__ - Step 16406: {'lr': 0.000488403514136067, 'samples': 3149952, 'steps': 16405, 'loss/train': 1.4845865964889526} -08/30/2021 16:12:01 - INFO - __main__ - Step 16407: {'lr': 0.0004884019165827909, 'samples': 3150144, 'steps': 16406, 'loss/train': 1.7833247184753418} -08/30/2021 16:12:03 - INFO - __main__ - Step 16408: {'lr': 0.0004884003189220945, 'samples': 3150336, 'steps': 16407, 'loss/train': 1.4036445617675781} -08/30/2021 16:12:03 - INFO - __main__ - Step 16409: {'lr': 0.0004883987211539785, 'samples': 3150528, 'steps': 16408, 'loss/train': 2.021967649459839} -08/30/2021 16:12:04 - INFO - __main__ - Step 16410: {'lr': 0.0004883971232784438, 'samples': 3150720, 'steps': 16409, 'loss/train': 1.841018557548523} -08/30/2021 16:12:04 - INFO - __main__ - Step 16411: {'lr': 0.0004883955252954909, 'samples': 3150912, 'steps': 16410, 'loss/train': 2.0723958015441895} -08/30/2021 16:12:04 - INFO - __main__ - Step 16412: {'lr': 0.0004883939272051208, 'samples': 3151104, 'steps': 16411, 'loss/train': 1.7425384521484375} -08/30/2021 16:12:05 - INFO - __main__ - Step 16413: {'lr': 0.000488392329007334, 'samples': 3151296, 'steps': 16412, 'loss/train': 1.697700023651123} -08/30/2021 16:12:07 - INFO - __main__ - Step 16414: {'lr': 0.0004883907307021314, 'samples': 3151488, 'steps': 16413, 'loss/train': 2.5796310901641846} -08/30/2021 16:12:07 - INFO - __main__ - Step 16415: {'lr': 0.0004883891322895134, 'samples': 3151680, 'steps': 16414, 'loss/train': 2.1869726181030273} -08/30/2021 16:12:07 - INFO - __main__ - Step 16416: {'lr': 0.000488387533769481, 'samples': 3151872, 'steps': 16415, 'loss/train': 1.569940209388733} -08/30/2021 16:12:08 - INFO - __main__ - Step 16417: {'lr': 0.000488385935142035, 'samples': 3152064, 'steps': 16416, 'loss/train': 1.4833344221115112} -08/30/2021 16:12:08 - INFO - __main__ - Step 16418: {'lr': 0.0004883843364071759, 'samples': 3152256, 'steps': 16417, 'loss/train': 1.2835125923156738} -08/30/2021 16:12:09 - INFO - __main__ - Step 16419: {'lr': 0.0004883827375649045, 'samples': 3152448, 'steps': 16418, 'loss/train': 1.0750722885131836} -08/30/2021 16:12:10 - INFO - __main__ - Step 16420: {'lr': 0.0004883811386152216, 'samples': 3152640, 'steps': 16419, 'loss/train': 1.722716212272644} -08/30/2021 16:12:10 - INFO - __main__ - Step 16421: {'lr': 0.0004883795395581277, 'samples': 3152832, 'steps': 16420, 'loss/train': 0.47888919711112976} -08/30/2021 16:12:11 - INFO - __main__ - Step 16422: {'lr': 0.0004883779403936237, 'samples': 3153024, 'steps': 16421, 'loss/train': 1.4829291105270386} -08/30/2021 16:12:11 - INFO - __main__ - Step 16423: {'lr': 0.0004883763411217103, 'samples': 3153216, 'steps': 16422, 'loss/train': 1.7919137477874756} -08/30/2021 16:12:12 - INFO - __main__ - Step 16424: {'lr': 0.0004883747417423882, 'samples': 3153408, 'steps': 16423, 'loss/train': 1.6080315113067627} -08/30/2021 16:12:13 - INFO - __main__ - Step 16425: {'lr': 0.000488373142255658, 'samples': 3153600, 'steps': 16424, 'loss/train': 1.644591212272644} -08/30/2021 16:12:13 - INFO - __main__ - Step 16426: {'lr': 0.0004883715426615207, 'samples': 3153792, 'steps': 16425, 'loss/train': 1.6483370065689087} -08/30/2021 16:12:14 - INFO - __main__ - Step 16427: {'lr': 0.0004883699429599768, 'samples': 3153984, 'steps': 16426, 'loss/train': 1.8033820390701294} -08/30/2021 16:12:14 - INFO - __main__ - Step 16428: {'lr': 0.0004883683431510272, 'samples': 3154176, 'steps': 16427, 'loss/train': 1.4099290370941162} -08/30/2021 16:12:16 - INFO - __main__ - Step 16429: {'lr': 0.0004883667432346723, 'samples': 3154368, 'steps': 16428, 'loss/train': 0.9474764466285706} -08/30/2021 16:12:16 - INFO - __main__ - Step 16430: {'lr': 0.0004883651432109132, 'samples': 3154560, 'steps': 16429, 'loss/train': 2.8283019065856934} -08/30/2021 16:12:17 - INFO - __main__ - Step 16431: {'lr': 0.0004883635430797502, 'samples': 3154752, 'steps': 16430, 'loss/train': 2.3652114868164062} -08/30/2021 16:12:17 - INFO - __main__ - Step 16432: {'lr': 0.0004883619428411846, 'samples': 3154944, 'steps': 16431, 'loss/train': 1.80955171585083} -08/30/2021 16:12:17 - INFO - __main__ - Step 16433: {'lr': 0.0004883603424952165, 'samples': 3155136, 'steps': 16432, 'loss/train': 1.612752914428711} -08/30/2021 16:12:19 - INFO - __main__ - Step 16434: {'lr': 0.0004883587420418471, 'samples': 3155328, 'steps': 16433, 'loss/train': 1.9555912017822266} -08/30/2021 16:12:20 - INFO - __main__ - Step 16435: {'lr': 0.0004883571414810769, 'samples': 3155520, 'steps': 16434, 'loss/train': 1.5818567276000977} -08/30/2021 16:12:20 - INFO - __main__ - Step 16436: {'lr': 0.0004883555408129066, 'samples': 3155712, 'steps': 16435, 'loss/train': 1.2745782136917114} -08/30/2021 16:12:20 - INFO - __main__ - Step 16437: {'lr': 0.0004883539400373369, 'samples': 3155904, 'steps': 16436, 'loss/train': 1.8561028242111206} -08/30/2021 16:12:21 - INFO - __main__ - Step 16438: {'lr': 0.0004883523391543687, 'samples': 3156096, 'steps': 16437, 'loss/train': 1.5114132165908813} -08/30/2021 16:12:22 - INFO - __main__ - Step 16439: {'lr': 0.0004883507381640026, 'samples': 3156288, 'steps': 16438, 'loss/train': 1.323274850845337} -08/30/2021 16:12:23 - INFO - __main__ - Step 16440: {'lr': 0.0004883491370662393, 'samples': 3156480, 'steps': 16439, 'loss/train': 0.6661016941070557} -08/30/2021 16:12:23 - INFO - __main__ - Step 16441: {'lr': 0.0004883475358610794, 'samples': 3156672, 'steps': 16440, 'loss/train': 1.3470076322555542} -08/30/2021 16:12:24 - INFO - __main__ - Step 16442: {'lr': 0.000488345934548524, 'samples': 3156864, 'steps': 16441, 'loss/train': 1.2103748321533203} -08/30/2021 16:12:24 - INFO - __main__ - Step 16443: {'lr': 0.0004883443331285736, 'samples': 3157056, 'steps': 16442, 'loss/train': 1.5097126960754395} -08/30/2021 16:12:24 - INFO - __main__ - Step 16444: {'lr': 0.0004883427316012289, 'samples': 3157248, 'steps': 16443, 'loss/train': 1.5376880168914795} -08/30/2021 16:12:26 - INFO - __main__ - Step 16445: {'lr': 0.0004883411299664906, 'samples': 3157440, 'steps': 16444, 'loss/train': 3.0078248977661133} -08/30/2021 16:12:27 - INFO - __main__ - Step 16446: {'lr': 0.0004883395282243595, 'samples': 3157632, 'steps': 16445, 'loss/train': 0.14940780401229858} -08/30/2021 16:12:27 - INFO - __main__ - Step 16447: {'lr': 0.0004883379263748363, 'samples': 3157824, 'steps': 16446, 'loss/train': 2.0638163089752197} -08/30/2021 16:12:27 - INFO - __main__ - Step 16448: {'lr': 0.0004883363244179217, 'samples': 3158016, 'steps': 16447, 'loss/train': 1.5818711519241333} -08/30/2021 16:12:28 - INFO - __main__ - Step 16449: {'lr': 0.0004883347223536164, 'samples': 3158208, 'steps': 16448, 'loss/train': 1.8282077312469482} -08/30/2021 16:12:28 - INFO - __main__ - Step 16450: {'lr': 0.0004883331201819211, 'samples': 3158400, 'steps': 16449, 'loss/train': 0.11230821907520294} -08/30/2021 16:12:30 - INFO - __main__ - Step 16451: {'lr': 0.0004883315179028366, 'samples': 3158592, 'steps': 16450, 'loss/train': 0.17662116885185242} -08/30/2021 16:12:30 - INFO - __main__ - Step 16452: {'lr': 0.0004883299155163636, 'samples': 3158784, 'steps': 16451, 'loss/train': 1.5383926630020142} -08/30/2021 16:12:30 - INFO - __main__ - Step 16453: {'lr': 0.0004883283130225029, 'samples': 3158976, 'steps': 16452, 'loss/train': 2.2520840167999268} -08/30/2021 16:12:31 - INFO - __main__ - Step 16454: {'lr': 0.0004883267104212551, 'samples': 3159168, 'steps': 16453, 'loss/train': 0.7508336901664734} -08/30/2021 16:12:31 - INFO - __main__ - Step 16455: {'lr': 0.0004883251077126209, 'samples': 3159360, 'steps': 16454, 'loss/train': 2.7111029624938965} -08/30/2021 16:12:31 - INFO - __main__ - Step 16456: {'lr': 0.0004883235048966011, 'samples': 3159552, 'steps': 16455, 'loss/train': 1.7357203960418701} -08/30/2021 16:12:33 - INFO - __main__ - Step 16457: {'lr': 0.0004883219019731964, 'samples': 3159744, 'steps': 16456, 'loss/train': 2.1748054027557373} -08/30/2021 16:12:34 - INFO - __main__ - Step 16458: {'lr': 0.0004883202989424076, 'samples': 3159936, 'steps': 16457, 'loss/train': 1.9947377443313599} -08/30/2021 16:12:34 - INFO - __main__ - Step 16459: {'lr': 0.0004883186958042354, 'samples': 3160128, 'steps': 16458, 'loss/train': 0.9799297451972961} -08/30/2021 16:12:34 - INFO - __main__ - Step 16460: {'lr': 0.0004883170925586804, 'samples': 3160320, 'steps': 16459, 'loss/train': 1.2041651010513306} -08/30/2021 16:12:35 - INFO - __main__ - Step 16461: {'lr': 0.0004883154892057433, 'samples': 3160512, 'steps': 16460, 'loss/train': 1.4210397005081177} -08/30/2021 16:12:36 - INFO - __main__ - Step 16462: {'lr': 0.000488313885745425, 'samples': 3160704, 'steps': 16461, 'loss/train': 1.7475907802581787} -08/30/2021 16:12:37 - INFO - __main__ - Step 16463: {'lr': 0.0004883122821777261, 'samples': 3160896, 'steps': 16462, 'loss/train': 1.7158664464950562} -08/30/2021 16:12:37 - INFO - __main__ - Step 16464: {'lr': 0.0004883106785026475, 'samples': 3161088, 'steps': 16463, 'loss/train': 1.3037594556808472} -08/30/2021 16:12:37 - INFO - __main__ - Step 16465: {'lr': 0.0004883090747201897, 'samples': 3161280, 'steps': 16464, 'loss/train': 1.3759013414382935} -08/30/2021 16:12:38 - INFO - __main__ - Step 16466: {'lr': 0.0004883074708303534, 'samples': 3161472, 'steps': 16465, 'loss/train': 1.0900455713272095} -08/30/2021 16:12:39 - INFO - __main__ - Step 16467: {'lr': 0.0004883058668331396, 'samples': 3161664, 'steps': 16466, 'loss/train': 1.6898516416549683} -08/30/2021 16:12:40 - INFO - __main__ - Step 16468: {'lr': 0.0004883042627285488, 'samples': 3161856, 'steps': 16467, 'loss/train': 1.8191605806350708} -08/30/2021 16:12:40 - INFO - __main__ - Step 16469: {'lr': 0.0004883026585165817, 'samples': 3162048, 'steps': 16468, 'loss/train': 1.6544195413589478} -08/30/2021 16:12:41 - INFO - __main__ - Step 16470: {'lr': 0.0004883010541972392, 'samples': 3162240, 'steps': 16469, 'loss/train': 1.6518362760543823} -08/30/2021 16:12:41 - INFO - __main__ - Step 16471: {'lr': 0.0004882994497705219, 'samples': 3162432, 'steps': 16470, 'loss/train': 2.0174849033355713} -08/30/2021 16:12:42 - INFO - __main__ - Step 16472: {'lr': 0.0004882978452364305, 'samples': 3162624, 'steps': 16471, 'loss/train': 1.4940745830535889} -08/30/2021 16:12:43 - INFO - __main__ - Step 16473: {'lr': 0.0004882962405949658, 'samples': 3162816, 'steps': 16472, 'loss/train': 1.7469748258590698} -08/30/2021 16:12:43 - INFO - __main__ - Step 16474: {'lr': 0.0004882946358461285, 'samples': 3163008, 'steps': 16473, 'loss/train': 1.8230326175689697} -08/30/2021 16:12:44 - INFO - __main__ - Step 16475: {'lr': 0.0004882930309899192, 'samples': 3163200, 'steps': 16474, 'loss/train': 1.4943701028823853} -08/30/2021 16:12:44 - INFO - __main__ - Step 16476: {'lr': 0.000488291426026339, 'samples': 3163392, 'steps': 16475, 'loss/train': 1.4653288125991821} -08/30/2021 16:12:44 - INFO - __main__ - Step 16477: {'lr': 0.0004882898209553881, 'samples': 3163584, 'steps': 16476, 'loss/train': 1.550358533859253} -08/30/2021 16:12:46 - INFO - __main__ - Step 16478: {'lr': 0.0004882882157770676, 'samples': 3163776, 'steps': 16477, 'loss/train': 1.679360270500183} -08/30/2021 16:12:47 - INFO - __main__ - Step 16479: {'lr': 0.000488286610491378, 'samples': 3163968, 'steps': 16478, 'loss/train': 1.8442274332046509} -08/30/2021 16:12:47 - INFO - __main__ - Step 16480: {'lr': 0.0004882850050983203, 'samples': 3164160, 'steps': 16479, 'loss/train': 1.6017777919769287} -08/30/2021 16:12:47 - INFO - __main__ - Step 16481: {'lr': 0.0004882833995978949, 'samples': 3164352, 'steps': 16480, 'loss/train': 1.884262204170227} -08/30/2021 16:12:48 - INFO - __main__ - Step 16482: {'lr': 0.0004882817939901027, 'samples': 3164544, 'steps': 16481, 'loss/train': 0.0743497759103775} -08/30/2021 16:12:48 - INFO - __main__ - Step 16483: {'lr': 0.0004882801882749445, 'samples': 3164736, 'steps': 16482, 'loss/train': 0.18168054521083832} -08/30/2021 16:12:50 - INFO - __main__ - Step 16484: {'lr': 0.0004882785824524209, 'samples': 3164928, 'steps': 16483, 'loss/train': 1.5538021326065063} -08/30/2021 16:12:50 - INFO - __main__ - Step 16485: {'lr': 0.0004882769765225326, 'samples': 3165120, 'steps': 16484, 'loss/train': 2.0989391803741455} -08/30/2021 16:12:50 - INFO - __main__ - Step 16486: {'lr': 0.00048827537048528035, 'samples': 3165312, 'steps': 16485, 'loss/train': 1.651032567024231} -08/30/2021 16:12:51 - INFO - __main__ - Step 16487: {'lr': 0.00048827376434066493, 'samples': 3165504, 'steps': 16486, 'loss/train': 1.2024333477020264} -08/30/2021 16:12:51 - INFO - __main__ - Step 16488: {'lr': 0.0004882721580886871, 'samples': 3165696, 'steps': 16487, 'loss/train': 1.6652101278305054} -08/30/2021 16:12:53 - INFO - __main__ - Step 16489: {'lr': 0.00048827055172934744, 'samples': 3165888, 'steps': 16488, 'loss/train': 1.4172935485839844} -08/30/2021 16:12:54 - INFO - __main__ - Step 16490: {'lr': 0.0004882689452626468, 'samples': 3166080, 'steps': 16489, 'loss/train': 1.1986442804336548} -08/30/2021 16:12:54 - INFO - __main__ - Step 16491: {'lr': 0.00048826733868858577, 'samples': 3166272, 'steps': 16490, 'loss/train': 1.8039789199829102} -08/30/2021 16:12:55 - INFO - __main__ - Step 16492: {'lr': 0.00048826573200716516, 'samples': 3166464, 'steps': 16491, 'loss/train': 1.7548322677612305} -08/30/2021 16:12:55 - INFO - __main__ - Step 16493: {'lr': 0.0004882641252183857, 'samples': 3166656, 'steps': 16492, 'loss/train': 1.9020053148269653} -08/30/2021 16:12:55 - INFO - __main__ - Step 16494: {'lr': 0.0004882625183222481, 'samples': 3166848, 'steps': 16493, 'loss/train': 1.7261946201324463} -08/30/2021 16:12:57 - INFO - __main__ - Step 16495: {'lr': 0.00048826091131875317, 'samples': 3167040, 'steps': 16494, 'loss/train': 1.968366265296936} -08/30/2021 16:12:57 - INFO - __main__ - Step 16496: {'lr': 0.00048825930420790144, 'samples': 3167232, 'steps': 16495, 'loss/train': 1.53008234500885} -08/30/2021 16:12:58 - INFO - __main__ - Step 16497: {'lr': 0.0004882576969896938, 'samples': 3167424, 'steps': 16496, 'loss/train': 1.7781314849853516} -08/30/2021 16:12:58 - INFO - __main__ - Step 16498: {'lr': 0.00048825608966413095, 'samples': 3167616, 'steps': 16497, 'loss/train': 1.7661806344985962} -08/30/2021 16:12:58 - INFO - __main__ - Step 16499: {'lr': 0.0004882544822312135, 'samples': 3167808, 'steps': 16498, 'loss/train': 1.7144266366958618} -08/30/2021 16:13:00 - INFO - __main__ - Step 16500: {'lr': 0.00048825287469094224, 'samples': 3168000, 'steps': 16499, 'loss/train': 2.3831145763397217} -08/30/2021 16:13:00 - INFO - __main__ - Step 16501: {'lr': 0.000488251267043318, 'samples': 3168192, 'steps': 16500, 'loss/train': 1.950164794921875} -08/30/2021 16:13:01 - INFO - __main__ - Step 16502: {'lr': 0.00048824965928834143, 'samples': 3168384, 'steps': 16501, 'loss/train': 1.650948405265808} -08/30/2021 16:13:01 - INFO - __main__ - Step 16503: {'lr': 0.0004882480514260131, 'samples': 3168576, 'steps': 16502, 'loss/train': 1.506259560585022} -08/30/2021 16:13:01 - INFO - __main__ - Step 16504: {'lr': 0.000488246443456334, 'samples': 3168768, 'steps': 16503, 'loss/train': 0.11784862726926804} -08/30/2021 16:13:03 - INFO - __main__ - Step 16505: {'lr': 0.0004882448353793048, 'samples': 3168960, 'steps': 16504, 'loss/train': 2.259474039077759} -08/30/2021 16:13:03 - INFO - __main__ - Step 16506: {'lr': 0.000488243227194926, 'samples': 3169152, 'steps': 16505, 'loss/train': 1.8807767629623413} -08/30/2021 16:13:04 - INFO - __main__ - Step 16507: {'lr': 0.00048824161890319854, 'samples': 3169344, 'steps': 16506, 'loss/train': 1.8212604522705078} -08/30/2021 16:13:04 - INFO - __main__ - Step 16508: {'lr': 0.00048824001050412304, 'samples': 3169536, 'steps': 16507, 'loss/train': 1.6447376012802124} -08/30/2021 16:13:04 - INFO - __main__ - Step 16509: {'lr': 0.0004882384019977003, 'samples': 3169728, 'steps': 16508, 'loss/train': 1.7541759014129639} -08/30/2021 16:13:06 - INFO - __main__ - Step 16510: {'lr': 0.000488236793383931, 'samples': 3169920, 'steps': 16509, 'loss/train': 1.5085219144821167} -08/30/2021 16:13:07 - INFO - __main__ - Step 16511: {'lr': 0.00048823518466281586, 'samples': 3170112, 'steps': 16510, 'loss/train': 1.641247034072876} -08/30/2021 16:13:07 - INFO - __main__ - Step 16512: {'lr': 0.0004882335758343557, 'samples': 3170304, 'steps': 16511, 'loss/train': 1.3721646070480347} -08/30/2021 16:13:07 - INFO - __main__ - Step 16513: {'lr': 0.0004882319668985511, 'samples': 3170496, 'steps': 16512, 'loss/train': 0.09264480322599411} -08/30/2021 16:13:08 - INFO - __main__ - Step 16514: {'lr': 0.00048823035785540284, 'samples': 3170688, 'steps': 16513, 'loss/train': 1.4933146238327026} -08/30/2021 16:13:09 - INFO - __main__ - Step 16515: {'lr': 0.0004882287487049117, 'samples': 3170880, 'steps': 16514, 'loss/train': 2.5302674770355225} -08/30/2021 16:13:10 - INFO - __main__ - Step 16516: {'lr': 0.00048822713944707833, 'samples': 3171072, 'steps': 16515, 'loss/train': 1.7074077129364014} -08/30/2021 16:13:10 - INFO - __main__ - Step 16517: {'lr': 0.0004882255300819035, 'samples': 3171264, 'steps': 16516, 'loss/train': 2.1281604766845703} -08/30/2021 16:13:10 - INFO - __main__ - Step 16518: {'lr': 0.0004882239206093879, 'samples': 3171456, 'steps': 16517, 'loss/train': 0.7898990511894226} -08/30/2021 16:13:11 - INFO - __main__ - Step 16519: {'lr': 0.0004882223110295323, 'samples': 3171648, 'steps': 16518, 'loss/train': 1.6536293029785156} -08/30/2021 16:13:12 - INFO - __main__ - Step 16520: {'lr': 0.00048822070134233743, 'samples': 3171840, 'steps': 16519, 'loss/train': 2.1504950523376465} -08/30/2021 16:13:13 - INFO - __main__ - Step 16521: {'lr': 0.000488219091547804, 'samples': 3172032, 'steps': 16520, 'loss/train': 1.400365948677063} -08/30/2021 16:13:13 - INFO - __main__ - Step 16522: {'lr': 0.0004882174816459326, 'samples': 3172224, 'steps': 16521, 'loss/train': 2.339890480041504} -08/30/2021 16:13:13 - INFO - __main__ - Step 16523: {'lr': 0.0004882158716367242, 'samples': 3172416, 'steps': 16522, 'loss/train': 1.9823507070541382} -08/30/2021 16:13:14 - INFO - __main__ - Step 16524: {'lr': 0.0004882142615201793, 'samples': 3172608, 'steps': 16523, 'loss/train': 1.4485024213790894} -08/30/2021 16:13:14 - INFO - __main__ - Step 16525: {'lr': 0.00048821265129629887, 'samples': 3172800, 'steps': 16524, 'loss/train': 1.3576749563217163} -08/30/2021 16:13:16 - INFO - __main__ - Step 16526: {'lr': 0.0004882110409650834, 'samples': 3172992, 'steps': 16525, 'loss/train': 1.6916894912719727} -08/30/2021 16:13:16 - INFO - __main__ - Step 16527: {'lr': 0.0004882094305265338, 'samples': 3173184, 'steps': 16526, 'loss/train': 1.6859670877456665} -08/30/2021 16:13:16 - INFO - __main__ - Step 16528: {'lr': 0.00048820781998065054, 'samples': 3173376, 'steps': 16527, 'loss/train': 1.3498218059539795} -08/30/2021 16:13:17 - INFO - __main__ - Step 16529: {'lr': 0.00048820620932743465, 'samples': 3173568, 'steps': 16528, 'loss/train': 1.842890977859497} -08/30/2021 16:13:17 - INFO - __main__ - Step 16530: {'lr': 0.0004882045985668867, 'samples': 3173760, 'steps': 16529, 'loss/train': 1.518268346786499} -08/30/2021 16:13:18 - INFO - __main__ - Step 16531: {'lr': 0.0004882029876990074, 'samples': 3173952, 'steps': 16530, 'loss/train': 2.1686899662017822} -08/30/2021 16:13:19 - INFO - __main__ - Step 16532: {'lr': 0.0004882013767237975, 'samples': 3174144, 'steps': 16531, 'loss/train': 1.8740262985229492} -08/30/2021 16:13:19 - INFO - __main__ - Step 16533: {'lr': 0.0004881997656412578, 'samples': 3174336, 'steps': 16532, 'loss/train': 1.9127898216247559} -08/30/2021 16:13:20 - INFO - __main__ - Step 16534: {'lr': 0.0004881981544513889, 'samples': 3174528, 'steps': 16533, 'loss/train': 1.4909237623214722} -08/30/2021 16:13:20 - INFO - __main__ - Step 16535: {'lr': 0.0004881965431541916, 'samples': 3174720, 'steps': 16534, 'loss/train': 1.2026665210723877} -08/30/2021 16:13:21 - INFO - __main__ - Step 16536: {'lr': 0.0004881949317496667, 'samples': 3174912, 'steps': 16535, 'loss/train': 1.699640154838562} -08/30/2021 16:13:22 - INFO - __main__ - Step 16537: {'lr': 0.0004881933202378147, 'samples': 3175104, 'steps': 16536, 'loss/train': 1.465736746788025} -08/30/2021 16:13:22 - INFO - __main__ - Step 16538: {'lr': 0.0004881917086186365, 'samples': 3175296, 'steps': 16537, 'loss/train': 2.144170045852661} -08/30/2021 16:13:23 - INFO - __main__ - Step 16539: {'lr': 0.0004881900968921328, 'samples': 3175488, 'steps': 16538, 'loss/train': 1.691697597503662} -08/30/2021 16:13:23 - INFO - __main__ - Step 16540: {'lr': 0.00048818848505830436, 'samples': 3175680, 'steps': 16539, 'loss/train': 1.9390833377838135} -08/30/2021 16:13:24 - INFO - __main__ - Step 16541: {'lr': 0.0004881868731171518, 'samples': 3175872, 'steps': 16540, 'loss/train': 1.9974125623703003} -08/30/2021 16:13:25 - INFO - __main__ - Step 16542: {'lr': 0.000488185261068676, 'samples': 3176064, 'steps': 16541, 'loss/train': 2.561133623123169} -08/30/2021 16:13:25 - INFO - __main__ - Step 16543: {'lr': 0.0004881836489128776, 'samples': 3176256, 'steps': 16542, 'loss/train': 1.8090492486953735} -08/30/2021 16:13:26 - INFO - __main__ - Step 16544: {'lr': 0.00048818203664975727, 'samples': 3176448, 'steps': 16543, 'loss/train': 1.488569736480713} -08/30/2021 16:13:26 - INFO - __main__ - Step 16545: {'lr': 0.00048818042427931573, 'samples': 3176640, 'steps': 16544, 'loss/train': 1.1984081268310547} -08/30/2021 16:13:28 - INFO - __main__ - Step 16546: {'lr': 0.00048817881180155385, 'samples': 3176832, 'steps': 16545, 'loss/train': 1.8053693771362305} -08/30/2021 16:13:29 - INFO - __main__ - Step 16547: {'lr': 0.0004881771992164722, 'samples': 3177024, 'steps': 16546, 'loss/train': 1.8906036615371704} -08/30/2021 16:13:29 - INFO - __main__ - Step 16548: {'lr': 0.0004881755865240717, 'samples': 3177216, 'steps': 16547, 'loss/train': 1.862004280090332} -08/30/2021 16:13:29 - INFO - __main__ - Step 16549: {'lr': 0.0004881739737243528, 'samples': 3177408, 'steps': 16548, 'loss/train': 1.5678037405014038} -08/30/2021 16:13:30 - INFO - __main__ - Step 16550: {'lr': 0.00048817236081731655, 'samples': 3177600, 'steps': 16549, 'loss/train': 1.2787948846817017} -08/30/2021 16:13:30 - INFO - __main__ - Step 16551: {'lr': 0.0004881707478029634, 'samples': 3177792, 'steps': 16550, 'loss/train': 1.0139423608779907} -08/30/2021 16:13:32 - INFO - __main__ - Step 16552: {'lr': 0.0004881691346812942, 'samples': 3177984, 'steps': 16551, 'loss/train': 1.6228530406951904} -08/30/2021 16:13:32 - INFO - __main__ - Step 16553: {'lr': 0.0004881675214523097, 'samples': 3178176, 'steps': 16552, 'loss/train': 1.7885985374450684} -08/30/2021 16:13:33 - INFO - __main__ - Step 16554: {'lr': 0.00048816590811601054, 'samples': 3178368, 'steps': 16553, 'loss/train': 1.4082645177841187} -08/30/2021 16:13:33 - INFO - __main__ - Step 16555: {'lr': 0.0004881642946723975, 'samples': 3178560, 'steps': 16554, 'loss/train': 0.08122952282428741} -08/30/2021 16:13:33 - INFO - __main__ - Step 16556: {'lr': 0.00048816268112147134, 'samples': 3178752, 'steps': 16555, 'loss/train': 1.641249656677246} -08/30/2021 16:13:35 - INFO - __main__ - Step 16557: {'lr': 0.00048816106746323273, 'samples': 3178944, 'steps': 16556, 'loss/train': 1.8160207271575928} -08/30/2021 16:13:35 - INFO - __main__ - Step 16558: {'lr': 0.00048815945369768245, 'samples': 3179136, 'steps': 16557, 'loss/train': 1.1699459552764893} -08/30/2021 16:13:36 - INFO - __main__ - Step 16559: {'lr': 0.00048815783982482115, 'samples': 3179328, 'steps': 16558, 'loss/train': 1.8620539903640747} -08/30/2021 16:13:36 - INFO - __main__ - Step 16560: {'lr': 0.0004881562258446496, 'samples': 3179520, 'steps': 16559, 'loss/train': 1.6518065929412842} -08/30/2021 16:13:36 - INFO - __main__ - Step 16561: {'lr': 0.00048815461175716855, 'samples': 3179712, 'steps': 16560, 'loss/train': 1.3696002960205078} -08/30/2021 16:13:37 - INFO - __main__ - Step 16562: {'lr': 0.00048815299756237873, 'samples': 3179904, 'steps': 16561, 'loss/train': 1.7370407581329346} -08/30/2021 16:13:38 - INFO - __main__ - Step 16563: {'lr': 0.0004881513832602808, 'samples': 3180096, 'steps': 16562, 'loss/train': 1.635070562362671} -08/30/2021 16:13:38 - INFO - __main__ - Step 16564: {'lr': 0.0004881497688508756, 'samples': 3180288, 'steps': 16563, 'loss/train': 1.273830771446228} -08/30/2021 16:13:39 - INFO - __main__ - Step 16565: {'lr': 0.0004881481543341637, 'samples': 3180480, 'steps': 16564, 'loss/train': 1.7977510690689087} -08/30/2021 16:13:39 - INFO - __main__ - Step 16566: {'lr': 0.000488146539710146, 'samples': 3180672, 'steps': 16565, 'loss/train': 2.0253050327301025} -08/30/2021 16:13:40 - INFO - __main__ - Step 16567: {'lr': 0.00048814492497882306, 'samples': 3180864, 'steps': 16566, 'loss/train': 1.941239833831787} -08/30/2021 16:13:41 - INFO - __main__ - Step 16568: {'lr': 0.00048814331014019577, 'samples': 3181056, 'steps': 16567, 'loss/train': 1.6758822202682495} -08/30/2021 16:13:41 - INFO - __main__ - Step 16569: {'lr': 0.0004881416951942647, 'samples': 3181248, 'steps': 16568, 'loss/train': 2.201371431350708} -08/30/2021 16:13:42 - INFO - __main__ - Step 16570: {'lr': 0.0004881400801410307, 'samples': 3181440, 'steps': 16569, 'loss/train': 1.941340684890747} -08/30/2021 16:13:42 - INFO - __main__ - Step 16571: {'lr': 0.0004881384649804945, 'samples': 3181632, 'steps': 16570, 'loss/train': 2.0682497024536133} -08/30/2021 16:13:43 - INFO - __main__ - Step 16572: {'lr': 0.0004881368497126567, 'samples': 3181824, 'steps': 16571, 'loss/train': 1.958207368850708} -08/30/2021 16:13:44 - INFO - __main__ - Step 16573: {'lr': 0.00048813523433751814, 'samples': 3182016, 'steps': 16572, 'loss/train': 1.3708523511886597} -08/30/2021 16:13:45 - INFO - __main__ - Step 16574: {'lr': 0.00048813361885507956, 'samples': 3182208, 'steps': 16573, 'loss/train': 1.3560123443603516} -08/30/2021 16:13:45 - INFO - __main__ - Step 16575: {'lr': 0.00048813200326534156, 'samples': 3182400, 'steps': 16574, 'loss/train': 1.6077187061309814} -08/30/2021 16:13:45 - INFO - __main__ - Step 16576: {'lr': 0.00048813038756830506, 'samples': 3182592, 'steps': 16575, 'loss/train': 1.6748696565628052} -08/30/2021 16:13:46 - INFO - __main__ - Step 16577: {'lr': 0.00048812877176397066, 'samples': 3182784, 'steps': 16576, 'loss/train': 0.4968474507331848} -08/30/2021 16:13:47 - INFO - __main__ - Step 16578: {'lr': 0.00048812715585233905, 'samples': 3182976, 'steps': 16577, 'loss/train': 1.143213152885437} -08/30/2021 16:13:48 - INFO - __main__ - Step 16579: {'lr': 0.000488125539833411, 'samples': 3183168, 'steps': 16578, 'loss/train': 1.5067323446273804} -08/30/2021 16:13:48 - INFO - __main__ - Step 16580: {'lr': 0.0004881239237071873, 'samples': 3183360, 'steps': 16579, 'loss/train': 0.1325390636920929} -08/30/2021 16:13:49 - INFO - __main__ - Step 16581: {'lr': 0.0004881223074736687, 'samples': 3183552, 'steps': 16580, 'loss/train': 1.699009895324707} -08/30/2021 16:13:49 - INFO - __main__ - Step 16582: {'lr': 0.00048812069113285573, 'samples': 3183744, 'steps': 16581, 'loss/train': 0.08957020193338394} -08/30/2021 16:13:49 - INFO - __main__ - Step 16583: {'lr': 0.00048811907468474934, 'samples': 3183936, 'steps': 16582, 'loss/train': 1.3878061771392822} -08/30/2021 16:13:51 - INFO - __main__ - Step 16584: {'lr': 0.00048811745812935015, 'samples': 3184128, 'steps': 16583, 'loss/train': 0.20824885368347168} -08/30/2021 16:13:51 - INFO - __main__ - Step 16585: {'lr': 0.00048811584146665895, 'samples': 3184320, 'steps': 16584, 'loss/train': 1.6124420166015625} -08/30/2021 16:13:52 - INFO - __main__ - Step 16586: {'lr': 0.0004881142246966763, 'samples': 3184512, 'steps': 16585, 'loss/train': 1.8895361423492432} -08/30/2021 16:13:52 - INFO - __main__ - Step 16587: {'lr': 0.00048811260781940317, 'samples': 3184704, 'steps': 16586, 'loss/train': 1.4383306503295898} -08/30/2021 16:13:52 - INFO - __main__ - Step 16588: {'lr': 0.00048811099083484016, 'samples': 3184896, 'steps': 16587, 'loss/train': 1.6250507831573486} -08/30/2021 16:13:54 - INFO - __main__ - Step 16589: {'lr': 0.000488109373742988, 'samples': 3185088, 'steps': 16588, 'loss/train': 1.5738410949707031} -08/30/2021 16:13:54 - INFO - __main__ - Step 16590: {'lr': 0.0004881077565438474, 'samples': 3185280, 'steps': 16589, 'loss/train': 1.6363602876663208} -08/30/2021 16:13:55 - INFO - __main__ - Step 16591: {'lr': 0.0004881061392374192, 'samples': 3185472, 'steps': 16590, 'loss/train': 1.9625236988067627} -08/30/2021 16:13:55 - INFO - __main__ - Step 16592: {'lr': 0.000488104521823704, 'samples': 3185664, 'steps': 16591, 'loss/train': 1.8436386585235596} -08/30/2021 16:13:55 - INFO - __main__ - Step 16593: {'lr': 0.00048810290430270257, 'samples': 3185856, 'steps': 16592, 'loss/train': 2.055682420730591} -08/30/2021 16:13:56 - INFO - __main__ - Step 16594: {'lr': 0.0004881012866744156, 'samples': 3186048, 'steps': 16593, 'loss/train': 1.7000099420547485} -08/30/2021 16:13:57 - INFO - __main__ - Step 16595: {'lr': 0.00048809966893884396, 'samples': 3186240, 'steps': 16594, 'loss/train': 1.7137199640274048} -08/30/2021 16:13:58 - INFO - __main__ - Step 16596: {'lr': 0.00048809805109598813, 'samples': 3186432, 'steps': 16595, 'loss/train': 1.7170580625534058} -08/30/2021 16:13:58 - INFO - __main__ - Step 16597: {'lr': 0.0004880964331458492, 'samples': 3186624, 'steps': 16596, 'loss/train': 1.5858354568481445} -08/30/2021 16:13:59 - INFO - __main__ - Step 16598: {'lr': 0.0004880948150884276, 'samples': 3186816, 'steps': 16597, 'loss/train': 1.4752651453018188} -08/30/2021 16:13:59 - INFO - __main__ - Step 16599: {'lr': 0.00048809319692372406, 'samples': 3187008, 'steps': 16598, 'loss/train': 1.3279571533203125} -08/30/2021 16:14:01 - INFO - __main__ - Step 16600: {'lr': 0.0004880915786517395, 'samples': 3187200, 'steps': 16599, 'loss/train': 2.0533125400543213} -08/30/2021 16:14:01 - INFO - __main__ - Step 16601: {'lr': 0.00048808996027247453, 'samples': 3187392, 'steps': 16600, 'loss/train': 2.0156710147857666} -08/30/2021 16:14:02 - INFO - __main__ - Step 16602: {'lr': 0.0004880883417859299, 'samples': 3187584, 'steps': 16601, 'loss/train': 1.2864296436309814} -08/30/2021 16:14:02 - INFO - __main__ - Step 16603: {'lr': 0.0004880867231921063, 'samples': 3187776, 'steps': 16602, 'loss/train': 1.0905944108963013} -08/30/2021 16:14:03 - INFO - __main__ - Step 16604: {'lr': 0.0004880851044910045, 'samples': 3187968, 'steps': 16603, 'loss/train': 1.7267661094665527} -08/30/2021 16:14:04 - INFO - __main__ - Step 16605: {'lr': 0.0004880834856826253, 'samples': 3188160, 'steps': 16604, 'loss/train': 1.4709233045578003} -08/30/2021 16:14:04 - INFO - __main__ - Step 16606: {'lr': 0.0004880818667669693, 'samples': 3188352, 'steps': 16605, 'loss/train': 2.203814744949341} -08/30/2021 16:14:05 - INFO - __main__ - Step 16607: {'lr': 0.00048808024774403726, 'samples': 3188544, 'steps': 16606, 'loss/train': 1.5960253477096558} -08/30/2021 16:14:05 - INFO - __main__ - Step 16608: {'lr': 0.00048807862861382996, 'samples': 3188736, 'steps': 16607, 'loss/train': 1.7516332864761353} -08/30/2021 16:14:05 - INFO - __main__ - Step 16609: {'lr': 0.0004880770093763481, 'samples': 3188928, 'steps': 16608, 'loss/train': 2.1294281482696533} -08/30/2021 16:14:07 - INFO - __main__ - Step 16610: {'lr': 0.0004880753900315924, 'samples': 3189120, 'steps': 16609, 'loss/train': 1.4692928791046143} -08/30/2021 16:14:07 - INFO - __main__ - Step 16611: {'lr': 0.00048807377057956365, 'samples': 3189312, 'steps': 16610, 'loss/train': 1.856947422027588} -08/30/2021 16:14:08 - INFO - __main__ - Step 16612: {'lr': 0.00048807215102026247, 'samples': 3189504, 'steps': 16611, 'loss/train': 1.485852837562561} -08/30/2021 16:14:08 - INFO - __main__ - Step 16613: {'lr': 0.00048807053135368973, 'samples': 3189696, 'steps': 16612, 'loss/train': 2.0284597873687744} -08/30/2021 16:14:08 - INFO - __main__ - Step 16614: {'lr': 0.00048806891157984604, 'samples': 3189888, 'steps': 16613, 'loss/train': 1.6739753484725952} -08/30/2021 16:14:10 - INFO - __main__ - Step 16615: {'lr': 0.0004880672916987322, 'samples': 3190080, 'steps': 16614, 'loss/train': 0.4266573488712311} -08/30/2021 16:14:11 - INFO - __main__ - Step 16616: {'lr': 0.0004880656717103489, 'samples': 3190272, 'steps': 16615, 'loss/train': 1.585524320602417} -08/30/2021 16:14:11 - INFO - __main__ - Step 16617: {'lr': 0.0004880640516146968, 'samples': 3190464, 'steps': 16616, 'loss/train': 1.5404939651489258} -08/30/2021 16:14:11 - INFO - __main__ - Step 16618: {'lr': 0.0004880624314117768, 'samples': 3190656, 'steps': 16617, 'loss/train': 1.2139486074447632} -08/30/2021 16:14:12 - INFO - __main__ - Step 16619: {'lr': 0.0004880608111015895, 'samples': 3190848, 'steps': 16618, 'loss/train': 1.6645313501358032} -08/30/2021 16:14:13 - INFO - __main__ - Step 16620: {'lr': 0.00048805919068413574, 'samples': 3191040, 'steps': 16619, 'loss/train': 0.14072319865226746} -08/30/2021 16:14:14 - INFO - __main__ - Step 16621: {'lr': 0.0004880575701594161, 'samples': 3191232, 'steps': 16620, 'loss/train': 2.3166964054107666} -08/30/2021 16:14:14 - INFO - __main__ - Step 16622: {'lr': 0.0004880559495274315, 'samples': 3191424, 'steps': 16621, 'loss/train': 1.9499908685684204} -08/30/2021 16:14:15 - INFO - __main__ - Step 16623: {'lr': 0.00048805432878818247, 'samples': 3191616, 'steps': 16622, 'loss/train': 1.9381393194198608} -08/30/2021 16:14:15 - INFO - __main__ - Step 16624: {'lr': 0.0004880527079416698, 'samples': 3191808, 'steps': 16623, 'loss/train': 1.55039381980896} -08/30/2021 16:14:15 - INFO - __main__ - Step 16625: {'lr': 0.00048805108698789435, 'samples': 3192000, 'steps': 16624, 'loss/train': 1.7067677974700928} -08/30/2021 16:14:17 - INFO - __main__ - Step 16626: {'lr': 0.00048804946592685667, 'samples': 3192192, 'steps': 16625, 'loss/train': 0.2757457494735718} -08/30/2021 16:14:17 - INFO - __main__ - Step 16627: {'lr': 0.0004880478447585576, 'samples': 3192384, 'steps': 16626, 'loss/train': 0.9581832885742188} -08/30/2021 16:14:18 - INFO - __main__ - Step 16628: {'lr': 0.00048804622348299785, 'samples': 3192576, 'steps': 16627, 'loss/train': 1.693848729133606} -08/30/2021 16:14:18 - INFO - __main__ - Step 16629: {'lr': 0.0004880446021001782, 'samples': 3192768, 'steps': 16628, 'loss/train': 1.7661103010177612} -08/30/2021 16:14:18 - INFO - __main__ - Step 16630: {'lr': 0.00048804298061009925, 'samples': 3192960, 'steps': 16629, 'loss/train': 2.469510078430176} -08/30/2021 16:14:20 - INFO - __main__ - Step 16631: {'lr': 0.0004880413590127619, 'samples': 3193152, 'steps': 16630, 'loss/train': 1.0144615173339844} -08/30/2021 16:14:20 - INFO - __main__ - Step 16632: {'lr': 0.0004880397373081666, 'samples': 3193344, 'steps': 16631, 'loss/train': 1.9545166492462158} -08/30/2021 16:14:21 - INFO - __main__ - Step 16633: {'lr': 0.0004880381154963145, 'samples': 3193536, 'steps': 16632, 'loss/train': 1.8227757215499878} -08/30/2021 16:14:21 - INFO - __main__ - Step 16634: {'lr': 0.0004880364935772059, 'samples': 3193728, 'steps': 16633, 'loss/train': 1.6634933948516846} -08/30/2021 16:14:21 - INFO - __main__ - Step 16635: {'lr': 0.00048803487155084184, 'samples': 3193920, 'steps': 16634, 'loss/train': 1.8381518125534058} -08/30/2021 16:14:23 - INFO - __main__ - Step 16636: {'lr': 0.00048803324941722295, 'samples': 3194112, 'steps': 16635, 'loss/train': 1.544309377670288} -08/30/2021 16:14:23 - INFO - __main__ - Step 16637: {'lr': 0.0004880316271763499, 'samples': 3194304, 'steps': 16636, 'loss/train': 0.11979955434799194} -08/30/2021 16:14:24 - INFO - __main__ - Step 16638: {'lr': 0.0004880300048282235, 'samples': 3194496, 'steps': 16637, 'loss/train': 1.9168736934661865} -08/30/2021 16:14:24 - INFO - __main__ - Step 16639: {'lr': 0.00048802838237284443, 'samples': 3194688, 'steps': 16638, 'loss/train': 2.0347630977630615} -08/30/2021 16:14:24 - INFO - __main__ - Step 16640: {'lr': 0.0004880267598102135, 'samples': 3194880, 'steps': 16639, 'loss/train': 1.0156313180923462} -08/30/2021 16:14:25 - INFO - __main__ - Step 16641: {'lr': 0.0004880251371403313, 'samples': 3195072, 'steps': 16640, 'loss/train': 1.5347892045974731} -08/30/2021 16:14:26 - INFO - __main__ - Step 16642: {'lr': 0.0004880235143631987, 'samples': 3195264, 'steps': 16641, 'loss/train': 1.6933704614639282} -08/30/2021 16:14:27 - INFO - __main__ - Step 16643: {'lr': 0.0004880218914788164, 'samples': 3195456, 'steps': 16642, 'loss/train': 1.696418285369873} -08/30/2021 16:14:27 - INFO - __main__ - Step 16644: {'lr': 0.00048802026848718505, 'samples': 3195648, 'steps': 16643, 'loss/train': 1.2272576093673706} -08/30/2021 16:14:28 - INFO - __main__ - Step 16645: {'lr': 0.0004880186453883054, 'samples': 3195840, 'steps': 16644, 'loss/train': 1.1475294828414917} -08/30/2021 16:14:28 - INFO - __main__ - Step 16646: {'lr': 0.00048801702218217834, 'samples': 3196032, 'steps': 16645, 'loss/train': 1.7064080238342285} -08/30/2021 16:14:29 - INFO - __main__ - Step 16647: {'lr': 0.0004880153988688044, 'samples': 3196224, 'steps': 16646, 'loss/train': 0.5632283687591553} -08/30/2021 16:14:30 - INFO - __main__ - Step 16648: {'lr': 0.0004880137754481845, 'samples': 3196416, 'steps': 16647, 'loss/train': 1.7644410133361816} -08/30/2021 16:14:30 - INFO - __main__ - Step 16649: {'lr': 0.0004880121519203191, 'samples': 3196608, 'steps': 16648, 'loss/train': 1.4228501319885254} -08/30/2021 16:14:31 - INFO - __main__ - Step 16650: {'lr': 0.0004880105282852092, 'samples': 3196800, 'steps': 16649, 'loss/train': 1.9696342945098877} -08/30/2021 16:14:31 - INFO - __main__ - Step 16651: {'lr': 0.0004880089045428554, 'samples': 3196992, 'steps': 16650, 'loss/train': 1.603187918663025} -08/30/2021 16:14:33 - INFO - __main__ - Step 16652: {'lr': 0.0004880072806932585, 'samples': 3197184, 'steps': 16651, 'loss/train': 1.5181456804275513} -08/30/2021 16:14:33 - INFO - __main__ - Step 16653: {'lr': 0.00048800565673641917, 'samples': 3197376, 'steps': 16652, 'loss/train': 1.427760362625122} -08/30/2021 16:14:34 - INFO - __main__ - Step 16654: {'lr': 0.0004880040326723382, 'samples': 3197568, 'steps': 16653, 'loss/train': 1.944973349571228} -08/30/2021 16:14:34 - INFO - __main__ - Step 16655: {'lr': 0.0004880024085010162, 'samples': 3197760, 'steps': 16654, 'loss/train': 1.6088995933532715} -08/30/2021 16:14:34 - INFO - __main__ - Step 16656: {'lr': 0.00048800078422245406, 'samples': 3197952, 'steps': 16655, 'loss/train': 1.9604657888412476} -08/30/2021 16:14:36 - INFO - __main__ - Step 16657: {'lr': 0.0004879991598366524, 'samples': 3198144, 'steps': 16656, 'loss/train': 1.8557242155075073} -08/30/2021 16:14:37 - INFO - __main__ - Step 16658: {'lr': 0.000487997535343612, 'samples': 3198336, 'steps': 16657, 'loss/train': 2.594700336456299} -08/30/2021 16:14:37 - INFO - __main__ - Step 16659: {'lr': 0.0004879959107433336, 'samples': 3198528, 'steps': 16658, 'loss/train': 1.4913543462753296} -08/30/2021 16:14:37 - INFO - __main__ - Step 16660: {'lr': 0.00048799428603581786, 'samples': 3198720, 'steps': 16659, 'loss/train': 1.9455454349517822} -08/30/2021 16:14:38 - INFO - __main__ - Step 16661: {'lr': 0.0004879926612210656, 'samples': 3198912, 'steps': 16660, 'loss/train': 0.6294904947280884} -08/30/2021 16:14:38 - INFO - __main__ - Step 16662: {'lr': 0.0004879910362990775, 'samples': 3199104, 'steps': 16661, 'loss/train': 1.3812592029571533} -08/30/2021 16:14:38 - INFO - __main__ - Step 16663: {'lr': 0.0004879894112698544, 'samples': 3199296, 'steps': 16662, 'loss/train': 1.2141501903533936} -08/30/2021 16:14:40 - INFO - __main__ - Step 16664: {'lr': 0.0004879877861333969, 'samples': 3199488, 'steps': 16663, 'loss/train': 0.5333452224731445} -08/30/2021 16:14:40 - INFO - __main__ - Step 16665: {'lr': 0.00048798616088970573, 'samples': 3199680, 'steps': 16664, 'loss/train': 0.5689380168914795} -08/30/2021 16:14:41 - INFO - __main__ - Step 16666: {'lr': 0.0004879845355387817, 'samples': 3199872, 'steps': 16665, 'loss/train': 1.3376206159591675} -08/30/2021 16:14:41 - INFO - __main__ - Step 16667: {'lr': 0.00048798291008062553, 'samples': 3200064, 'steps': 16666, 'loss/train': 2.0341899394989014} -08/30/2021 16:14:41 - INFO - __main__ - Step 16668: {'lr': 0.0004879812845152379, 'samples': 3200256, 'steps': 16667, 'loss/train': 2.0121335983276367} -08/30/2021 16:14:43 - INFO - __main__ - Step 16669: {'lr': 0.0004879796588426195, 'samples': 3200448, 'steps': 16668, 'loss/train': 1.902250051498413} -08/30/2021 16:14:44 - INFO - __main__ - Step 16670: {'lr': 0.0004879780330627713, 'samples': 3200640, 'steps': 16669, 'loss/train': 1.7941910028457642} -08/30/2021 16:14:44 - INFO - __main__ - Step 16671: {'lr': 0.0004879764071756938, 'samples': 3200832, 'steps': 16670, 'loss/train': 0.3390023708343506} -08/30/2021 16:14:44 - INFO - __main__ - Step 16672: {'lr': 0.00048797478118138777, 'samples': 3201024, 'steps': 16671, 'loss/train': 1.7030514478683472} -08/30/2021 16:14:45 - INFO - __main__ - Step 16673: {'lr': 0.000487973155079854, 'samples': 3201216, 'steps': 16672, 'loss/train': 1.5212053060531616} -08/30/2021 16:14:46 - INFO - __main__ - Step 16674: {'lr': 0.0004879715288710932, 'samples': 3201408, 'steps': 16673, 'loss/train': 1.762177586555481} -08/30/2021 16:14:47 - INFO - __main__ - Step 16675: {'lr': 0.0004879699025551061, 'samples': 3201600, 'steps': 16674, 'loss/train': 1.2488783597946167} -08/30/2021 16:14:47 - INFO - __main__ - Step 16676: {'lr': 0.0004879682761318934, 'samples': 3201792, 'steps': 16675, 'loss/train': 1.6335327625274658} -08/30/2021 16:14:47 - INFO - __main__ - Step 16677: {'lr': 0.00048796664960145596, 'samples': 3201984, 'steps': 16676, 'loss/train': 0.05811972916126251} -08/30/2021 16:14:48 - INFO - __main__ - Step 16678: {'lr': 0.00048796502296379437, 'samples': 3202176, 'steps': 16677, 'loss/train': 1.8747398853302002} -08/30/2021 16:14:49 - INFO - __main__ - Step 16679: {'lr': 0.0004879633962189094, 'samples': 3202368, 'steps': 16678, 'loss/train': 1.61774742603302} -08/30/2021 16:14:50 - INFO - __main__ - Step 16680: {'lr': 0.0004879617693668018, 'samples': 3202560, 'steps': 16679, 'loss/train': 2.108137607574463} -08/30/2021 16:14:50 - INFO - __main__ - Step 16681: {'lr': 0.00048796014240747227, 'samples': 3202752, 'steps': 16680, 'loss/train': 1.5128915309906006} -08/30/2021 16:14:50 - INFO - __main__ - Step 16682: {'lr': 0.0004879585153409216, 'samples': 3202944, 'steps': 16681, 'loss/train': 1.926310420036316} -08/30/2021 16:14:51 - INFO - __main__ - Step 16683: {'lr': 0.0004879568881671505, 'samples': 3203136, 'steps': 16682, 'loss/train': 1.9453061819076538} -08/30/2021 16:14:52 - INFO - __main__ - Step 16684: {'lr': 0.0004879552608861597, 'samples': 3203328, 'steps': 16683, 'loss/train': 1.6820000410079956} -08/30/2021 16:14:53 - INFO - __main__ - Step 16685: {'lr': 0.00048795363349794996, 'samples': 3203520, 'steps': 16684, 'loss/train': 1.78916335105896} -08/30/2021 16:14:53 - INFO - __main__ - Step 16686: {'lr': 0.00048795200600252193, 'samples': 3203712, 'steps': 16685, 'loss/train': 1.3662347793579102} -08/30/2021 16:14:54 - INFO - __main__ - Step 16687: {'lr': 0.00048795037839987644, 'samples': 3203904, 'steps': 16686, 'loss/train': 1.3548601865768433} -08/30/2021 16:14:54 - INFO - __main__ - Step 16688: {'lr': 0.0004879487506900141, 'samples': 3204096, 'steps': 16687, 'loss/train': 1.7290133237838745} -08/30/2021 16:14:55 - INFO - __main__ - Step 16689: {'lr': 0.0004879471228729358, 'samples': 3204288, 'steps': 16688, 'loss/train': 0.3155171871185303} -08/30/2021 16:14:56 - INFO - __main__ - Step 16690: {'lr': 0.0004879454949486422, 'samples': 3204480, 'steps': 16689, 'loss/train': 1.1663745641708374} -08/30/2021 16:14:56 - INFO - __main__ - Step 16691: {'lr': 0.000487943866917134, 'samples': 3204672, 'steps': 16690, 'loss/train': 1.5553964376449585} -08/30/2021 16:14:57 - INFO - __main__ - Step 16692: {'lr': 0.00048794223877841197, 'samples': 3204864, 'steps': 16691, 'loss/train': 1.8806887865066528} -08/30/2021 16:14:57 - INFO - __main__ - Step 16693: {'lr': 0.00048794061053247686, 'samples': 3205056, 'steps': 16692, 'loss/train': 1.5888007879257202} -08/30/2021 16:14:58 - INFO - __main__ - Step 16694: {'lr': 0.0004879389821793294, 'samples': 3205248, 'steps': 16693, 'loss/train': 1.103945016860962} -08/30/2021 16:14:59 - INFO - __main__ - Step 16695: {'lr': 0.00048793735371897027, 'samples': 3205440, 'steps': 16694, 'loss/train': 1.3188711404800415} -08/30/2021 16:14:59 - INFO - __main__ - Step 16696: {'lr': 0.00048793572515140024, 'samples': 3205632, 'steps': 16695, 'loss/train': 1.5159010887145996} -08/30/2021 16:15:00 - INFO - __main__ - Step 16697: {'lr': 0.00048793409647662, 'samples': 3205824, 'steps': 16696, 'loss/train': 2.130124092102051} -08/30/2021 16:15:00 - INFO - __main__ - Step 16698: {'lr': 0.0004879324676946304, 'samples': 3206016, 'steps': 16697, 'loss/train': 1.5905779600143433} -08/30/2021 16:15:00 - INFO - __main__ - Step 16699: {'lr': 0.0004879308388054321, 'samples': 3206208, 'steps': 16698, 'loss/train': 1.96693754196167} -08/30/2021 16:15:03 - INFO - __main__ - Step 16700: {'lr': 0.0004879292098090258, 'samples': 3206400, 'steps': 16699, 'loss/train': 1.7866253852844238} -08/30/2021 16:15:03 - INFO - __main__ - Step 16701: {'lr': 0.00048792758070541234, 'samples': 3206592, 'steps': 16700, 'loss/train': 1.3016022443771362} -08/30/2021 16:15:04 - INFO - __main__ - Step 16702: {'lr': 0.00048792595149459226, 'samples': 3206784, 'steps': 16701, 'loss/train': 0.7525354623794556} -08/30/2021 16:15:04 - INFO - __main__ - Step 16703: {'lr': 0.0004879243221765665, 'samples': 3206976, 'steps': 16702, 'loss/train': 0.6439904570579529} -08/30/2021 16:15:04 - INFO - __main__ - Step 16704: {'lr': 0.00048792269275133574, 'samples': 3207168, 'steps': 16703, 'loss/train': 0.6069667935371399} -08/30/2021 16:15:05 - INFO - __main__ - Step 16705: {'lr': 0.0004879210632189006, 'samples': 3207360, 'steps': 16704, 'loss/train': 1.6717065572738647} -08/30/2021 16:15:06 - INFO - __main__ - Step 16706: {'lr': 0.0004879194335792619, 'samples': 3207552, 'steps': 16705, 'loss/train': 1.686883807182312} -08/30/2021 16:15:07 - INFO - __main__ - Step 16707: {'lr': 0.0004879178038324205, 'samples': 3207744, 'steps': 16706, 'loss/train': 0.46764278411865234} -08/30/2021 16:15:07 - INFO - __main__ - Step 16708: {'lr': 0.0004879161739783769, 'samples': 3207936, 'steps': 16707, 'loss/train': 1.4054722785949707} -08/30/2021 16:15:07 - INFO - __main__ - Step 16709: {'lr': 0.00048791454401713195, 'samples': 3208128, 'steps': 16708, 'loss/train': 1.715261697769165} -08/30/2021 16:15:08 - INFO - __main__ - Step 16710: {'lr': 0.00048791291394868644, 'samples': 3208320, 'steps': 16709, 'loss/train': 1.0365930795669556} -08/30/2021 16:15:10 - INFO - __main__ - Step 16711: {'lr': 0.000487911283773041, 'samples': 3208512, 'steps': 16710, 'loss/train': 0.22322697937488556} -08/30/2021 16:15:10 - INFO - __main__ - Step 16712: {'lr': 0.0004879096534901964, 'samples': 3208704, 'steps': 16711, 'loss/train': 1.6091737747192383} -08/30/2021 16:15:11 - INFO - __main__ - Step 16713: {'lr': 0.00048790802310015336, 'samples': 3208896, 'steps': 16712, 'loss/train': 1.3067803382873535} -08/30/2021 16:15:11 - INFO - __main__ - Step 16714: {'lr': 0.0004879063926029127, 'samples': 3209088, 'steps': 16713, 'loss/train': 0.07299730181694031} -08/30/2021 16:15:11 - INFO - __main__ - Step 16715: {'lr': 0.00048790476199847506, 'samples': 3209280, 'steps': 16714, 'loss/train': 1.7180428504943848} -08/30/2021 16:15:13 - INFO - __main__ - Step 16716: {'lr': 0.0004879031312868412, 'samples': 3209472, 'steps': 16715, 'loss/train': 1.3390231132507324} -08/30/2021 16:15:13 - INFO - __main__ - Step 16717: {'lr': 0.00048790150046801187, 'samples': 3209664, 'steps': 16716, 'loss/train': 1.1674901247024536} -08/30/2021 16:15:14 - INFO - __main__ - Step 16718: {'lr': 0.0004878998695419877, 'samples': 3209856, 'steps': 16717, 'loss/train': 1.949594259262085} -08/30/2021 16:15:14 - INFO - __main__ - Step 16719: {'lr': 0.0004878982385087697, 'samples': 3210048, 'steps': 16718, 'loss/train': 1.2132210731506348} -08/30/2021 16:15:15 - INFO - __main__ - Step 16720: {'lr': 0.0004878966073683583, 'samples': 3210240, 'steps': 16719, 'loss/train': 1.2069034576416016} -08/30/2021 16:15:15 - INFO - __main__ - Step 16721: {'lr': 0.0004878949761207544, 'samples': 3210432, 'steps': 16720, 'loss/train': 1.6156997680664062} -08/30/2021 16:15:16 - INFO - __main__ - Step 16722: {'lr': 0.0004878933447659587, 'samples': 3210624, 'steps': 16721, 'loss/train': 2.123835325241089} -08/30/2021 16:15:17 - INFO - __main__ - Step 16723: {'lr': 0.0004878917133039719, 'samples': 3210816, 'steps': 16722, 'loss/train': 1.9504806995391846} -08/30/2021 16:15:17 - INFO - __main__ - Step 16724: {'lr': 0.00048789008173479476, 'samples': 3211008, 'steps': 16723, 'loss/train': 1.1853959560394287} -08/30/2021 16:15:17 - INFO - __main__ - Step 16725: {'lr': 0.0004878884500584281, 'samples': 3211200, 'steps': 16724, 'loss/train': 1.256620168685913} -08/30/2021 16:15:18 - INFO - __main__ - Step 16726: {'lr': 0.0004878868182748725, 'samples': 3211392, 'steps': 16725, 'loss/train': 1.831167459487915} -08/30/2021 16:15:19 - INFO - __main__ - Step 16727: {'lr': 0.0004878851863841287, 'samples': 3211584, 'steps': 16726, 'loss/train': 1.5383081436157227} -08/30/2021 16:15:20 - INFO - __main__ - Step 16728: {'lr': 0.00048788355438619764, 'samples': 3211776, 'steps': 16727, 'loss/train': 1.5069228410720825} -08/30/2021 16:15:20 - INFO - __main__ - Step 16729: {'lr': 0.00048788192228107986, 'samples': 3211968, 'steps': 16728, 'loss/train': 1.9376816749572754} -08/30/2021 16:15:20 - INFO - __main__ - Step 16730: {'lr': 0.00048788029006877623, 'samples': 3212160, 'steps': 16729, 'loss/train': 1.933656096458435} -08/30/2021 16:15:21 - INFO - __main__ - Step 16731: {'lr': 0.0004878786577492873, 'samples': 3212352, 'steps': 16730, 'loss/train': 1.6945432424545288} -08/30/2021 16:15:22 - INFO - __main__ - Step 16732: {'lr': 0.00048787702532261396, 'samples': 3212544, 'steps': 16731, 'loss/train': 1.8733289241790771} -08/30/2021 16:15:23 - INFO - __main__ - Step 16733: {'lr': 0.0004878753927887569, 'samples': 3212736, 'steps': 16732, 'loss/train': 1.5571599006652832} -08/30/2021 16:15:23 - INFO - __main__ - Step 16734: {'lr': 0.0004878737601477169, 'samples': 3212928, 'steps': 16733, 'loss/train': 1.8006837368011475} -08/30/2021 16:15:23 - INFO - __main__ - Step 16735: {'lr': 0.0004878721273994946, 'samples': 3213120, 'steps': 16734, 'loss/train': 1.913068175315857} -08/30/2021 16:15:24 - INFO - __main__ - Step 16736: {'lr': 0.00048787049454409085, 'samples': 3213312, 'steps': 16735, 'loss/train': 1.6572901010513306} -08/30/2021 16:15:25 - INFO - __main__ - Step 16737: {'lr': 0.0004878688615815063, 'samples': 3213504, 'steps': 16736, 'loss/train': 1.5615729093551636} -08/30/2021 16:15:26 - INFO - __main__ - Step 16738: {'lr': 0.0004878672285117417, 'samples': 3213696, 'steps': 16737, 'loss/train': 1.1859101057052612} -08/30/2021 16:15:26 - INFO - __main__ - Step 16739: {'lr': 0.0004878655953347978, 'samples': 3213888, 'steps': 16738, 'loss/train': 1.5913857221603394} -08/30/2021 16:15:26 - INFO - __main__ - Step 16740: {'lr': 0.0004878639620506753, 'samples': 3214080, 'steps': 16739, 'loss/train': 1.3443471193313599} -08/30/2021 16:15:27 - INFO - __main__ - Step 16741: {'lr': 0.00048786232865937504, 'samples': 3214272, 'steps': 16740, 'loss/train': 0.7952996492385864} -08/30/2021 16:15:28 - INFO - __main__ - Step 16742: {'lr': 0.0004878606951608976, 'samples': 3214464, 'steps': 16741, 'loss/train': 1.502210021018982} -08/30/2021 16:15:29 - INFO - __main__ - Step 16743: {'lr': 0.00048785906155524386, 'samples': 3214656, 'steps': 16742, 'loss/train': 1.5023962259292603} -08/30/2021 16:15:29 - INFO - __main__ - Step 16744: {'lr': 0.0004878574278424145, 'samples': 3214848, 'steps': 16743, 'loss/train': 2.827465295791626} -08/30/2021 16:15:30 - INFO - __main__ - Step 16745: {'lr': 0.0004878557940224102, 'samples': 3215040, 'steps': 16744, 'loss/train': 1.257771611213684} -08/30/2021 16:15:30 - INFO - __main__ - Step 16746: {'lr': 0.0004878541600952318, 'samples': 3215232, 'steps': 16745, 'loss/train': 1.6157188415527344} -08/30/2021 16:15:30 - INFO - __main__ - Step 16747: {'lr': 0.00048785252606087996, 'samples': 3215424, 'steps': 16746, 'loss/train': 1.7678358554840088} -08/30/2021 16:15:32 - INFO - __main__ - Step 16748: {'lr': 0.0004878508919193555, 'samples': 3215616, 'steps': 16747, 'loss/train': 1.8955780267715454} -08/30/2021 16:15:33 - INFO - __main__ - Step 16749: {'lr': 0.000487849257670659, 'samples': 3215808, 'steps': 16748, 'loss/train': 1.434479832649231} -08/30/2021 16:15:33 - INFO - __main__ - Step 16750: {'lr': 0.0004878476233147914, 'samples': 3216000, 'steps': 16749, 'loss/train': 1.400259256362915} -08/30/2021 16:15:33 - INFO - __main__ - Step 16751: {'lr': 0.00048784598885175324, 'samples': 3216192, 'steps': 16750, 'loss/train': 1.5084441900253296} -08/30/2021 16:15:34 - INFO - __main__ - Step 16752: {'lr': 0.00048784435428154537, 'samples': 3216384, 'steps': 16751, 'loss/train': 1.7930991649627686} -08/30/2021 16:15:34 - INFO - __main__ - Step 16753: {'lr': 0.0004878427196041686, 'samples': 3216576, 'steps': 16752, 'loss/train': 1.52134370803833} -08/30/2021 16:15:35 - INFO - __main__ - Step 16754: {'lr': 0.00048784108481962347, 'samples': 3216768, 'steps': 16753, 'loss/train': 0.8323087096214294} -08/30/2021 16:15:36 - INFO - __main__ - Step 16755: {'lr': 0.00048783944992791085, 'samples': 3216960, 'steps': 16754, 'loss/train': 1.7217965126037598} -08/30/2021 16:15:36 - INFO - __main__ - Step 16756: {'lr': 0.00048783781492903145, 'samples': 3217152, 'steps': 16755, 'loss/train': 1.1818318367004395} -08/30/2021 16:15:36 - INFO - __main__ - Step 16757: {'lr': 0.00048783617982298594, 'samples': 3217344, 'steps': 16756, 'loss/train': 1.7665915489196777} -08/30/2021 16:15:37 - INFO - __main__ - Step 16758: {'lr': 0.00048783454460977517, 'samples': 3217536, 'steps': 16757, 'loss/train': 2.1646244525909424} -08/30/2021 16:15:38 - INFO - __main__ - Step 16759: {'lr': 0.00048783290928939985, 'samples': 3217728, 'steps': 16758, 'loss/train': 1.5340540409088135} -08/30/2021 16:15:39 - INFO - __main__ - Step 16760: {'lr': 0.00048783127386186064, 'samples': 3217920, 'steps': 16759, 'loss/train': 2.2429051399230957} -08/30/2021 16:15:39 - INFO - __main__ - Step 16761: {'lr': 0.00048782963832715834, 'samples': 3218112, 'steps': 16760, 'loss/train': 2.0270144939422607} -08/30/2021 16:15:39 - INFO - __main__ - Step 16762: {'lr': 0.0004878280026852937, 'samples': 3218304, 'steps': 16761, 'loss/train': 1.3143175840377808} -08/30/2021 16:15:40 - INFO - __main__ - Step 16763: {'lr': 0.00048782636693626736, 'samples': 3218496, 'steps': 16762, 'loss/train': 1.7576345205307007} -08/30/2021 16:15:42 - INFO - __main__ - Step 16764: {'lr': 0.0004878247310800802, 'samples': 3218688, 'steps': 16763, 'loss/train': 0.20639830827713013} -08/30/2021 16:15:43 - INFO - __main__ - Step 16765: {'lr': 0.0004878230951167328, 'samples': 3218880, 'steps': 16764, 'loss/train': 0.18535570800304413} -08/30/2021 16:15:43 - INFO - __main__ - Step 16766: {'lr': 0.0004878214590462261, 'samples': 3219072, 'steps': 16765, 'loss/train': 0.671101987361908} -08/30/2021 16:15:44 - INFO - __main__ - Step 16767: {'lr': 0.0004878198228685607, 'samples': 3219264, 'steps': 16766, 'loss/train': 1.7018426656723022} -08/30/2021 16:15:44 - INFO - __main__ - Step 16768: {'lr': 0.00048781818658373734, 'samples': 3219456, 'steps': 16767, 'loss/train': 1.3425238132476807} -08/30/2021 16:15:44 - INFO - __main__ - Step 16769: {'lr': 0.00048781655019175676, 'samples': 3219648, 'steps': 16768, 'loss/train': 1.5089943408966064} -08/30/2021 16:15:46 - INFO - __main__ - Step 16770: {'lr': 0.00048781491369261965, 'samples': 3219840, 'steps': 16769, 'loss/train': 1.4512887001037598} -08/30/2021 16:15:46 - INFO - __main__ - Step 16771: {'lr': 0.00048781327708632695, 'samples': 3220032, 'steps': 16770, 'loss/train': 0.9616290926933289} -08/30/2021 16:15:47 - INFO - __main__ - Step 16772: {'lr': 0.0004878116403728792, 'samples': 3220224, 'steps': 16771, 'loss/train': 1.8094511032104492} -08/30/2021 16:15:47 - INFO - __main__ - Step 16773: {'lr': 0.0004878100035522771, 'samples': 3220416, 'steps': 16772, 'loss/train': 1.944799542427063} -08/30/2021 16:15:47 - INFO - __main__ - Step 16774: {'lr': 0.00048780836662452154, 'samples': 3220608, 'steps': 16773, 'loss/train': 1.8739910125732422} -08/30/2021 16:15:49 - INFO - __main__ - Step 16775: {'lr': 0.00048780672958961325, 'samples': 3220800, 'steps': 16774, 'loss/train': 2.0597751140594482} -08/30/2021 16:15:49 - INFO - __main__ - Step 16776: {'lr': 0.0004878050924475529, 'samples': 3220992, 'steps': 16775, 'loss/train': 1.400397777557373} -08/30/2021 16:15:50 - INFO - __main__ - Step 16777: {'lr': 0.00048780345519834124, 'samples': 3221184, 'steps': 16776, 'loss/train': 1.1562952995300293} -08/30/2021 16:15:50 - INFO - __main__ - Step 16778: {'lr': 0.000487801817841979, 'samples': 3221376, 'steps': 16777, 'loss/train': 0.9177966117858887} -08/30/2021 16:15:50 - INFO - __main__ - Step 16779: {'lr': 0.0004878001803784669, 'samples': 3221568, 'steps': 16778, 'loss/train': 1.7204710245132446} -08/30/2021 16:15:51 - INFO - __main__ - Step 16780: {'lr': 0.00048779854280780576, 'samples': 3221760, 'steps': 16779, 'loss/train': 1.5911046266555786} -08/30/2021 16:15:52 - INFO - __main__ - Step 16781: {'lr': 0.00048779690512999627, 'samples': 3221952, 'steps': 16780, 'loss/train': 1.4506856203079224} -08/30/2021 16:15:53 - INFO - __main__ - Step 16782: {'lr': 0.0004877952673450391, 'samples': 3222144, 'steps': 16781, 'loss/train': 1.4995564222335815} -08/30/2021 16:15:53 - INFO - __main__ - Step 16783: {'lr': 0.0004877936294529351, 'samples': 3222336, 'steps': 16782, 'loss/train': 0.9332077503204346} -08/30/2021 16:15:53 - INFO - __main__ - Step 16784: {'lr': 0.00048779199145368494, 'samples': 3222528, 'steps': 16783, 'loss/train': 1.4664751291275024} -08/30/2021 16:15:54 - INFO - __main__ - Step 16785: {'lr': 0.0004877903533472894, 'samples': 3222720, 'steps': 16784, 'loss/train': 1.3890423774719238} -08/30/2021 16:15:55 - INFO - __main__ - Step 16786: {'lr': 0.0004877887151337492, 'samples': 3222912, 'steps': 16785, 'loss/train': 0.972080409526825} -08/30/2021 16:15:56 - INFO - __main__ - Step 16787: {'lr': 0.0004877870768130651, 'samples': 3223104, 'steps': 16786, 'loss/train': 1.5679256916046143} -08/30/2021 16:15:56 - INFO - __main__ - Step 16788: {'lr': 0.0004877854383852377, 'samples': 3223296, 'steps': 16787, 'loss/train': 1.64675772190094} -08/30/2021 16:15:57 - INFO - __main__ - Step 16789: {'lr': 0.000487783799850268, 'samples': 3223488, 'steps': 16788, 'loss/train': 1.936020016670227} -08/30/2021 16:15:57 - INFO - __main__ - Step 16790: {'lr': 0.00048778216120815644, 'samples': 3223680, 'steps': 16789, 'loss/train': 1.426086187362671} -08/30/2021 16:15:58 - INFO - __main__ - Step 16791: {'lr': 0.00048778052245890404, 'samples': 3223872, 'steps': 16790, 'loss/train': 1.7422831058502197} -08/30/2021 16:15:59 - INFO - __main__ - Step 16792: {'lr': 0.0004877788836025113, 'samples': 3224064, 'steps': 16791, 'loss/train': 1.311118245124817} -08/30/2021 16:15:59 - INFO - __main__ - Step 16793: {'lr': 0.0004877772446389791, 'samples': 3224256, 'steps': 16792, 'loss/train': 1.623799204826355} -08/30/2021 16:16:00 - INFO - __main__ - Step 16794: {'lr': 0.0004877756055683082, 'samples': 3224448, 'steps': 16793, 'loss/train': 2.0339138507843018} -08/30/2021 16:16:00 - INFO - __main__ - Step 16795: {'lr': 0.0004877739663904992, 'samples': 3224640, 'steps': 16794, 'loss/train': 1.47018301486969} -08/30/2021 16:16:02 - INFO - __main__ - Step 16796: {'lr': 0.00048777232710555296, 'samples': 3224832, 'steps': 16795, 'loss/train': 1.961258888244629} -08/30/2021 16:16:02 - INFO - __main__ - Step 16797: {'lr': 0.0004877706877134702, 'samples': 3225024, 'steps': 16796, 'loss/train': 1.7934300899505615} -08/30/2021 16:16:03 - INFO - __main__ - Step 16798: {'lr': 0.0004877690482142516, 'samples': 3225216, 'steps': 16797, 'loss/train': 1.6483789682388306} -08/30/2021 16:16:03 - INFO - __main__ - Step 16799: {'lr': 0.0004877674086078979, 'samples': 3225408, 'steps': 16798, 'loss/train': 1.7061437368392944} -08/30/2021 16:16:03 - INFO - __main__ - Step 16800: {'lr': 0.0004877657688944099, 'samples': 3225600, 'steps': 16799, 'loss/train': 1.4893561601638794} -08/30/2021 16:16:04 - INFO - __main__ - Step 16801: {'lr': 0.0004877641290737884, 'samples': 3225792, 'steps': 16800, 'loss/train': 1.5711534023284912} -08/30/2021 16:16:05 - INFO - __main__ - Step 16802: {'lr': 0.000487762489146034, 'samples': 3225984, 'steps': 16801, 'loss/train': 0.10147201269865036} -08/30/2021 16:16:06 - INFO - __main__ - Step 16803: {'lr': 0.0004877608491111475, 'samples': 3226176, 'steps': 16802, 'loss/train': 1.5733031034469604} -08/30/2021 16:16:06 - INFO - __main__ - Step 16804: {'lr': 0.0004877592089691296, 'samples': 3226368, 'steps': 16803, 'loss/train': 1.1071979999542236} -08/30/2021 16:16:06 - INFO - __main__ - Step 16805: {'lr': 0.00048775756871998106, 'samples': 3226560, 'steps': 16804, 'loss/train': 1.2677621841430664} -08/30/2021 16:16:07 - INFO - __main__ - Step 16806: {'lr': 0.0004877559283637026, 'samples': 3226752, 'steps': 16805, 'loss/train': 1.9323376417160034} -08/30/2021 16:16:08 - INFO - __main__ - Step 16807: {'lr': 0.0004877542879002951, 'samples': 3226944, 'steps': 16806, 'loss/train': 1.47136390209198} -08/30/2021 16:16:09 - INFO - __main__ - Step 16808: {'lr': 0.0004877526473297591, 'samples': 3227136, 'steps': 16807, 'loss/train': 1.6244699954986572} -08/30/2021 16:16:09 - INFO - __main__ - Step 16809: {'lr': 0.0004877510066520954, 'samples': 3227328, 'steps': 16808, 'loss/train': 1.7713903188705444} -08/30/2021 16:16:09 - INFO - __main__ - Step 16810: {'lr': 0.0004877493658673048, 'samples': 3227520, 'steps': 16809, 'loss/train': 2.050170660018921} -08/30/2021 16:16:10 - INFO - __main__ - Step 16811: {'lr': 0.00048774772497538806, 'samples': 3227712, 'steps': 16810, 'loss/train': 2.4477641582489014} -08/30/2021 16:16:11 - INFO - __main__ - Step 16812: {'lr': 0.0004877460839763458, 'samples': 3227904, 'steps': 16811, 'loss/train': 1.2472822666168213} -08/30/2021 16:16:12 - INFO - __main__ - Step 16813: {'lr': 0.0004877444428701788, 'samples': 3228096, 'steps': 16812, 'loss/train': 1.5294315814971924} -08/30/2021 16:16:12 - INFO - __main__ - Step 16814: {'lr': 0.0004877428016568879, 'samples': 3228288, 'steps': 16813, 'loss/train': 2.1093595027923584} -08/30/2021 16:16:13 - INFO - __main__ - Step 16815: {'lr': 0.00048774116033647373, 'samples': 3228480, 'steps': 16814, 'loss/train': 1.6045103073120117} -08/30/2021 16:16:13 - INFO - __main__ - Step 16816: {'lr': 0.0004877395189089371, 'samples': 3228672, 'steps': 16815, 'loss/train': 2.525740146636963} -08/30/2021 16:16:15 - INFO - __main__ - Step 16817: {'lr': 0.00048773787737427867, 'samples': 3228864, 'steps': 16816, 'loss/train': 1.4167840480804443} -08/30/2021 16:16:16 - INFO - __main__ - Step 16818: {'lr': 0.0004877362357324992, 'samples': 3229056, 'steps': 16817, 'loss/train': 2.2660722732543945} -08/30/2021 16:16:16 - INFO - __main__ - Step 16819: {'lr': 0.0004877345939835995, 'samples': 3229248, 'steps': 16818, 'loss/train': 1.4358583688735962} -08/30/2021 16:16:16 - INFO - __main__ - Step 16820: {'lr': 0.0004877329521275802, 'samples': 3229440, 'steps': 16819, 'loss/train': 1.6625192165374756} -08/30/2021 16:16:17 - INFO - __main__ - Step 16821: {'lr': 0.0004877313101644422, 'samples': 3229632, 'steps': 16820, 'loss/train': 1.6703619956970215} -08/30/2021 16:16:17 - INFO - __main__ - Step 16822: {'lr': 0.000487729668094186, 'samples': 3229824, 'steps': 16821, 'loss/train': 2.0354955196380615} -08/30/2021 16:16:18 - INFO - __main__ - Step 16823: {'lr': 0.0004877280259168125, 'samples': 3230016, 'steps': 16822, 'loss/train': 1.4470092058181763} -08/30/2021 16:16:19 - INFO - __main__ - Step 16824: {'lr': 0.0004877263836323226, 'samples': 3230208, 'steps': 16823, 'loss/train': 1.4930732250213623} -08/30/2021 16:16:19 - INFO - __main__ - Step 16825: {'lr': 0.00048772474124071663, 'samples': 3230400, 'steps': 16824, 'loss/train': 1.8102967739105225} -08/30/2021 16:16:20 - INFO - __main__ - Step 16826: {'lr': 0.0004877230987419957, 'samples': 3230592, 'steps': 16825, 'loss/train': 1.7201083898544312} -08/30/2021 16:16:20 - INFO - __main__ - Step 16827: {'lr': 0.00048772145613616035, 'samples': 3230784, 'steps': 16826, 'loss/train': 1.827391505241394} -08/30/2021 16:16:22 - INFO - __main__ - Step 16828: {'lr': 0.00048771981342321145, 'samples': 3230976, 'steps': 16827, 'loss/train': 1.4888100624084473} -08/30/2021 16:16:22 - INFO - __main__ - Step 16829: {'lr': 0.0004877181706031496, 'samples': 3231168, 'steps': 16828, 'loss/train': 1.685758352279663} -08/30/2021 16:16:23 - INFO - __main__ - Step 16830: {'lr': 0.00048771652767597563, 'samples': 3231360, 'steps': 16829, 'loss/train': 1.369916558265686} -08/30/2021 16:16:23 - INFO - __main__ - Step 16831: {'lr': 0.0004877148846416903, 'samples': 3231552, 'steps': 16830, 'loss/train': 1.7621418237686157} -08/30/2021 16:16:23 - INFO - __main__ - Step 16832: {'lr': 0.0004877132415002943, 'samples': 3231744, 'steps': 16831, 'loss/train': 1.6573519706726074} -08/30/2021 16:16:25 - INFO - __main__ - Step 16833: {'lr': 0.00048771159825178827, 'samples': 3231936, 'steps': 16832, 'loss/train': 1.4401060342788696} -08/30/2021 16:16:26 - INFO - __main__ - Step 16834: {'lr': 0.0004877099548961732, 'samples': 3232128, 'steps': 16833, 'loss/train': 1.8510234355926514} -08/30/2021 16:16:26 - INFO - __main__ - Step 16835: {'lr': 0.0004877083114334496, 'samples': 3232320, 'steps': 16834, 'loss/train': 1.7695484161376953} -08/30/2021 16:16:27 - INFO - __main__ - Step 16836: {'lr': 0.0004877066678636184, 'samples': 3232512, 'steps': 16835, 'loss/train': 1.2076002359390259} -08/30/2021 16:16:27 - INFO - __main__ - Step 16837: {'lr': 0.00048770502418668017, 'samples': 3232704, 'steps': 16836, 'loss/train': 1.9213272333145142} -08/30/2021 16:16:27 - INFO - __main__ - Step 16838: {'lr': 0.00048770338040263574, 'samples': 3232896, 'steps': 16837, 'loss/train': 1.7977879047393799} -08/30/2021 16:16:28 - INFO - __main__ - Step 16839: {'lr': 0.00048770173651148586, 'samples': 3233088, 'steps': 16838, 'loss/train': 1.4382543563842773} -08/30/2021 16:16:29 - INFO - __main__ - Step 16840: {'lr': 0.0004877000925132312, 'samples': 3233280, 'steps': 16839, 'loss/train': 1.8501614332199097} -08/30/2021 16:16:30 - INFO - __main__ - Step 16841: {'lr': 0.0004876984484078726, 'samples': 3233472, 'steps': 16840, 'loss/train': 2.0979394912719727} -08/30/2021 16:16:30 - INFO - __main__ - Step 16842: {'lr': 0.0004876968041954107, 'samples': 3233664, 'steps': 16841, 'loss/train': 1.6127644777297974} -08/30/2021 16:16:30 - INFO - __main__ - Step 16843: {'lr': 0.00048769515987584624, 'samples': 3233856, 'steps': 16842, 'loss/train': 1.70716392993927} -08/30/2021 16:16:31 - INFO - __main__ - Step 16844: {'lr': 0.0004876935154491801, 'samples': 3234048, 'steps': 16843, 'loss/train': 1.579373836517334} -08/30/2021 16:16:32 - INFO - __main__ - Step 16845: {'lr': 0.00048769187091541287, 'samples': 3234240, 'steps': 16844, 'loss/train': 2.0687344074249268} -08/30/2021 16:16:33 - INFO - __main__ - Step 16846: {'lr': 0.0004876902262745454, 'samples': 3234432, 'steps': 16845, 'loss/train': 1.246543288230896} -08/30/2021 16:16:33 - INFO - __main__ - Step 16847: {'lr': 0.00048768858152657837, 'samples': 3234624, 'steps': 16846, 'loss/train': 1.0815016031265259} -08/30/2021 16:16:33 - INFO - __main__ - Step 16848: {'lr': 0.0004876869366715125, 'samples': 3234816, 'steps': 16847, 'loss/train': 2.131363868713379} -08/30/2021 16:16:34 - INFO - __main__ - Step 16849: {'lr': 0.0004876852917093486, 'samples': 3235008, 'steps': 16848, 'loss/train': 1.6099157333374023} -08/30/2021 16:16:35 - INFO - __main__ - Step 16850: {'lr': 0.0004876836466400874, 'samples': 3235200, 'steps': 16849, 'loss/train': 1.794905185699463} -08/30/2021 16:16:36 - INFO - __main__ - Step 16851: {'lr': 0.00048768200146372955, 'samples': 3235392, 'steps': 16850, 'loss/train': 1.6487356424331665} -08/30/2021 16:16:36 - INFO - __main__ - Step 16852: {'lr': 0.00048768035618027597, 'samples': 3235584, 'steps': 16851, 'loss/train': 1.405745506286621} -08/30/2021 16:16:37 - INFO - __main__ - Step 16853: {'lr': 0.00048767871078972717, 'samples': 3235776, 'steps': 16852, 'loss/train': 0.655771791934967} -08/30/2021 16:16:37 - INFO - __main__ - Step 16854: {'lr': 0.000487677065292084, 'samples': 3235968, 'steps': 16853, 'loss/train': 0.8521744012832642} -08/30/2021 16:16:38 - INFO - __main__ - Step 16855: {'lr': 0.0004876754196873473, 'samples': 3236160, 'steps': 16854, 'loss/train': 1.6467833518981934} -08/30/2021 16:16:39 - INFO - __main__ - Step 16856: {'lr': 0.00048767377397551773, 'samples': 3236352, 'steps': 16855, 'loss/train': 1.3419854640960693} -08/30/2021 16:16:39 - INFO - __main__ - Step 16857: {'lr': 0.00048767212815659593, 'samples': 3236544, 'steps': 16856, 'loss/train': 1.296749234199524} -08/30/2021 16:16:39 - INFO - __main__ - Step 16858: {'lr': 0.0004876704822305828, 'samples': 3236736, 'steps': 16857, 'loss/train': 1.3770450353622437} -08/30/2021 16:16:40 - INFO - __main__ - Step 16859: {'lr': 0.00048766883619747906, 'samples': 3236928, 'steps': 16858, 'loss/train': 1.717189908027649} -08/30/2021 16:16:40 - INFO - __main__ - Step 16860: {'lr': 0.00048766719005728534, 'samples': 3237120, 'steps': 16859, 'loss/train': 1.4536820650100708} -08/30/2021 16:16:42 - INFO - __main__ - Step 16861: {'lr': 0.0004876655438100024, 'samples': 3237312, 'steps': 16860, 'loss/train': 1.5952472686767578} -08/30/2021 16:16:42 - INFO - __main__ - Step 16862: {'lr': 0.00048766389745563113, 'samples': 3237504, 'steps': 16861, 'loss/train': 1.6588070392608643} -08/30/2021 16:16:43 - INFO - __main__ - Step 16863: {'lr': 0.00048766225099417215, 'samples': 3237696, 'steps': 16862, 'loss/train': 2.1189510822296143} -08/30/2021 16:16:43 - INFO - __main__ - Step 16864: {'lr': 0.0004876606044256262, 'samples': 3237888, 'steps': 16863, 'loss/train': 1.515399694442749} -08/30/2021 16:16:43 - INFO - __main__ - Step 16865: {'lr': 0.0004876589577499941, 'samples': 3238080, 'steps': 16864, 'loss/train': 1.8756680488586426} -08/30/2021 16:16:45 - INFO - __main__ - Step 16866: {'lr': 0.0004876573109672765, 'samples': 3238272, 'steps': 16865, 'loss/train': 1.465890645980835} -08/30/2021 16:16:45 - INFO - __main__ - Step 16867: {'lr': 0.0004876556640774742, 'samples': 3238464, 'steps': 16866, 'loss/train': 0.9735254049301147} -08/30/2021 16:16:45 - INFO - __main__ - Step 16868: {'lr': 0.0004876540170805879, 'samples': 3238656, 'steps': 16867, 'loss/train': 1.6697684526443481} -08/30/2021 16:16:46 - INFO - __main__ - Step 16869: {'lr': 0.00048765236997661845, 'samples': 3238848, 'steps': 16868, 'loss/train': 1.7975212335586548} -08/30/2021 16:16:46 - INFO - __main__ - Step 16870: {'lr': 0.0004876507227655664, 'samples': 3239040, 'steps': 16869, 'loss/train': 2.108999252319336} -08/30/2021 16:16:48 - INFO - __main__ - Step 16871: {'lr': 0.00048764907544743264, 'samples': 3239232, 'steps': 16870, 'loss/train': 1.7371759414672852} -08/30/2021 16:16:49 - INFO - __main__ - Step 16872: {'lr': 0.0004876474280222179, 'samples': 3239424, 'steps': 16871, 'loss/train': 1.6256959438323975} -08/30/2021 16:16:49 - INFO - __main__ - Step 16873: {'lr': 0.00048764578048992284, 'samples': 3239616, 'steps': 16872, 'loss/train': 1.8462085723876953} -08/30/2021 16:16:49 - INFO - __main__ - Step 16874: {'lr': 0.0004876441328505483, 'samples': 3239808, 'steps': 16873, 'loss/train': 1.6450989246368408} -08/30/2021 16:16:50 - INFO - __main__ - Step 16875: {'lr': 0.000487642485104095, 'samples': 3240000, 'steps': 16874, 'loss/train': 1.564517617225647} -08/30/2021 16:16:50 - INFO - __main__ - Step 16876: {'lr': 0.00048764083725056365, 'samples': 3240192, 'steps': 16875, 'loss/train': 1.8679288625717163} -08/30/2021 16:16:52 - INFO - __main__ - Step 16877: {'lr': 0.00048763918928995496, 'samples': 3240384, 'steps': 16876, 'loss/train': 0.08533859252929688} -08/30/2021 16:16:53 - INFO - __main__ - Step 16878: {'lr': 0.00048763754122226977, 'samples': 3240576, 'steps': 16877, 'loss/train': 0.792040228843689} -08/30/2021 16:16:53 - INFO - __main__ - Step 16879: {'lr': 0.00048763589304750876, 'samples': 3240768, 'steps': 16878, 'loss/train': 1.5878849029541016} -08/30/2021 16:16:53 - INFO - __main__ - Step 16880: {'lr': 0.0004876342447656727, 'samples': 3240960, 'steps': 16879, 'loss/train': 1.5004578828811646} -08/30/2021 16:16:54 - INFO - __main__ - Step 16881: {'lr': 0.00048763259637676226, 'samples': 3241152, 'steps': 16880, 'loss/train': 0.9142868518829346} -08/30/2021 16:16:54 - INFO - __main__ - Step 16882: {'lr': 0.00048763094788077834, 'samples': 3241344, 'steps': 16881, 'loss/train': 2.1745200157165527} -08/30/2021 16:16:56 - INFO - __main__ - Step 16883: {'lr': 0.0004876292992777215, 'samples': 3241536, 'steps': 16882, 'loss/train': 0.9276759624481201} -08/30/2021 16:16:56 - INFO - __main__ - Step 16884: {'lr': 0.00048762765056759255, 'samples': 3241728, 'steps': 16883, 'loss/train': 1.70012366771698} -08/30/2021 16:16:56 - INFO - __main__ - Step 16885: {'lr': 0.00048762600175039227, 'samples': 3241920, 'steps': 16884, 'loss/train': 1.8063913583755493} -08/30/2021 16:16:57 - INFO - __main__ - Step 16886: {'lr': 0.0004876243528261214, 'samples': 3242112, 'steps': 16885, 'loss/train': 1.6086015701293945} -08/30/2021 16:16:57 - INFO - __main__ - Step 16887: {'lr': 0.0004876227037947807, 'samples': 3242304, 'steps': 16886, 'loss/train': 1.947364091873169} -08/30/2021 16:16:59 - INFO - __main__ - Step 16888: {'lr': 0.0004876210546563707, 'samples': 3242496, 'steps': 16887, 'loss/train': 1.076502799987793} -08/30/2021 16:16:59 - INFO - __main__ - Step 16889: {'lr': 0.0004876194054108926, 'samples': 3242688, 'steps': 16888, 'loss/train': 1.7061368227005005} -08/30/2021 16:16:59 - INFO - __main__ - Step 16890: {'lr': 0.0004876177560583466, 'samples': 3242880, 'steps': 16889, 'loss/train': 1.4884884357452393} -08/30/2021 16:17:00 - INFO - __main__ - Step 16891: {'lr': 0.00048761610659873387, 'samples': 3243072, 'steps': 16890, 'loss/train': 1.8173021078109741} -08/30/2021 16:17:00 - INFO - __main__ - Step 16892: {'lr': 0.0004876144570320549, 'samples': 3243264, 'steps': 16891, 'loss/train': 1.4878637790679932} -08/30/2021 16:17:01 - INFO - __main__ - Step 16893: {'lr': 0.0004876128073583106, 'samples': 3243456, 'steps': 16892, 'loss/train': 1.981358289718628} -08/30/2021 16:17:02 - INFO - __main__ - Step 16894: {'lr': 0.00048761115757750155, 'samples': 3243648, 'steps': 16893, 'loss/train': 1.865716814994812} -08/30/2021 16:17:02 - INFO - __main__ - Step 16895: {'lr': 0.00048760950768962863, 'samples': 3243840, 'steps': 16894, 'loss/train': 1.4976617097854614} -08/30/2021 16:17:03 - INFO - __main__ - Step 16896: {'lr': 0.00048760785769469254, 'samples': 3244032, 'steps': 16895, 'loss/train': 1.4995694160461426} -08/30/2021 16:17:03 - INFO - __main__ - Step 16897: {'lr': 0.00048760620759269403, 'samples': 3244224, 'steps': 16896, 'loss/train': 1.84534752368927} -08/30/2021 16:17:04 - INFO - __main__ - Step 16898: {'lr': 0.00048760455738363376, 'samples': 3244416, 'steps': 16897, 'loss/train': 1.0716979503631592} -08/30/2021 16:17:05 - INFO - __main__ - Step 16899: {'lr': 0.0004876029070675126, 'samples': 3244608, 'steps': 16898, 'loss/train': 1.7161740064620972} -08/30/2021 16:17:05 - INFO - __main__ - Step 16900: {'lr': 0.0004876012566443312, 'samples': 3244800, 'steps': 16899, 'loss/train': 1.3478282690048218} -08/30/2021 16:17:06 - INFO - __main__ - Step 16901: {'lr': 0.00048759960611409036, 'samples': 3244992, 'steps': 16900, 'loss/train': 1.9062011241912842} -08/30/2021 16:17:06 - INFO - __main__ - Step 16902: {'lr': 0.00048759795547679083, 'samples': 3245184, 'steps': 16901, 'loss/train': 2.2854104042053223} -08/30/2021 16:17:06 - INFO - __main__ - Step 16903: {'lr': 0.00048759630473243327, 'samples': 3245376, 'steps': 16902, 'loss/train': 1.3685877323150635} -08/30/2021 16:17:08 - INFO - __main__ - Step 16904: {'lr': 0.00048759465388101855, 'samples': 3245568, 'steps': 16903, 'loss/train': 1.9079225063323975} -08/30/2021 16:17:08 - INFO - __main__ - Step 16905: {'lr': 0.0004875930029225473, 'samples': 3245760, 'steps': 16904, 'loss/train': 0.7501497864723206} -08/30/2021 16:17:09 - INFO - __main__ - Step 16906: {'lr': 0.0004875913518570203, 'samples': 3245952, 'steps': 16905, 'loss/train': 1.463302493095398} -08/30/2021 16:17:09 - INFO - __main__ - Step 16907: {'lr': 0.0004875897006844383, 'samples': 3246144, 'steps': 16906, 'loss/train': 2.013986825942993} -08/30/2021 16:17:09 - INFO - __main__ - Step 16908: {'lr': 0.00048758804940480203, 'samples': 3246336, 'steps': 16907, 'loss/train': 1.6306395530700684} -08/30/2021 16:17:11 - INFO - __main__ - Step 16909: {'lr': 0.0004875863980181123, 'samples': 3246528, 'steps': 16908, 'loss/train': 0.6218293309211731} -08/30/2021 16:17:11 - INFO - __main__ - Step 16910: {'lr': 0.0004875847465243698, 'samples': 3246720, 'steps': 16909, 'loss/train': 2.3276655673980713} -08/30/2021 16:17:12 - INFO - __main__ - Step 16911: {'lr': 0.00048758309492357533, 'samples': 3246912, 'steps': 16910, 'loss/train': 3.1968994140625} -08/30/2021 16:17:12 - INFO - __main__ - Step 16912: {'lr': 0.0004875814432157295, 'samples': 3247104, 'steps': 16911, 'loss/train': 1.6495847702026367} -08/30/2021 16:17:12 - INFO - __main__ - Step 16913: {'lr': 0.0004875797914008332, 'samples': 3247296, 'steps': 16912, 'loss/train': 2.0352587699890137} -08/30/2021 16:17:14 - INFO - __main__ - Step 16914: {'lr': 0.00048757813947888706, 'samples': 3247488, 'steps': 16913, 'loss/train': 1.3868038654327393} -08/30/2021 16:17:14 - INFO - __main__ - Step 16915: {'lr': 0.0004875764874498919, 'samples': 3247680, 'steps': 16914, 'loss/train': 1.3998552560806274} -08/30/2021 16:17:15 - INFO - __main__ - Step 16916: {'lr': 0.00048757483531384837, 'samples': 3247872, 'steps': 16915, 'loss/train': 1.9597069025039673} -08/30/2021 16:17:15 - INFO - __main__ - Step 16917: {'lr': 0.0004875731830707574, 'samples': 3248064, 'steps': 16916, 'loss/train': 1.2749173641204834} -08/30/2021 16:17:15 - INFO - __main__ - Step 16918: {'lr': 0.00048757153072061954, 'samples': 3248256, 'steps': 16917, 'loss/train': 1.8954534530639648} -08/30/2021 16:17:17 - INFO - __main__ - Step 16919: {'lr': 0.0004875698782634357, 'samples': 3248448, 'steps': 16918, 'loss/train': 2.011024236679077} -08/30/2021 16:17:17 - INFO - __main__ - Step 16920: {'lr': 0.00048756822569920647, 'samples': 3248640, 'steps': 16919, 'loss/train': 1.3850997686386108} -08/30/2021 16:17:18 - INFO - __main__ - Step 16921: {'lr': 0.0004875665730279326, 'samples': 3248832, 'steps': 16920, 'loss/train': 1.5362807512283325} -08/30/2021 16:17:18 - INFO - __main__ - Step 16922: {'lr': 0.000487564920249615, 'samples': 3249024, 'steps': 16921, 'loss/train': 1.6729166507720947} -08/30/2021 16:17:18 - INFO - __main__ - Step 16923: {'lr': 0.00048756326736425427, 'samples': 3249216, 'steps': 16922, 'loss/train': 1.3989808559417725} -08/30/2021 16:17:20 - INFO - __main__ - Step 16924: {'lr': 0.00048756161437185126, 'samples': 3249408, 'steps': 16923, 'loss/train': 1.8012539148330688} -08/30/2021 16:17:20 - INFO - __main__ - Step 16925: {'lr': 0.0004875599612724066, 'samples': 3249600, 'steps': 16924, 'loss/train': 1.931175947189331} -08/30/2021 16:17:21 - INFO - __main__ - Step 16926: {'lr': 0.00048755830806592105, 'samples': 3249792, 'steps': 16925, 'loss/train': 1.0830150842666626} -08/30/2021 16:17:21 - INFO - __main__ - Step 16927: {'lr': 0.00048755665475239547, 'samples': 3249984, 'steps': 16926, 'loss/train': 1.3054875135421753} -08/30/2021 16:17:21 - INFO - __main__ - Step 16928: {'lr': 0.0004875550013318305, 'samples': 3250176, 'steps': 16927, 'loss/train': 1.578044056892395} -08/30/2021 16:17:22 - INFO - __main__ - Step 16929: {'lr': 0.0004875533478042269, 'samples': 3250368, 'steps': 16928, 'loss/train': 1.6108318567276} -08/30/2021 16:17:24 - INFO - __main__ - Step 16930: {'lr': 0.00048755169416958544, 'samples': 3250560, 'steps': 16929, 'loss/train': 1.500242829322815} -08/30/2021 16:17:24 - INFO - __main__ - Step 16931: {'lr': 0.00048755004042790685, 'samples': 3250752, 'steps': 16930, 'loss/train': 1.882196307182312} -08/30/2021 16:17:25 - INFO - __main__ - Step 16932: {'lr': 0.00048754838657919186, 'samples': 3250944, 'steps': 16931, 'loss/train': 1.561686635017395} -08/30/2021 16:17:25 - INFO - __main__ - Step 16933: {'lr': 0.00048754673262344124, 'samples': 3251136, 'steps': 16932, 'loss/train': 0.8742133975028992} -08/30/2021 16:17:25 - INFO - __main__ - Step 16934: {'lr': 0.00048754507856065574, 'samples': 3251328, 'steps': 16933, 'loss/train': 1.7597050666809082} -08/30/2021 16:17:27 - INFO - __main__ - Step 16935: {'lr': 0.0004875434243908361, 'samples': 3251520, 'steps': 16934, 'loss/train': 5.917540550231934} -08/30/2021 16:17:27 - INFO - __main__ - Step 16936: {'lr': 0.00048754177011398303, 'samples': 3251712, 'steps': 16935, 'loss/train': 1.3282630443572998} -08/30/2021 16:17:28 - INFO - __main__ - Step 16937: {'lr': 0.0004875401157300973, 'samples': 3251904, 'steps': 16936, 'loss/train': 1.3805826902389526} -08/30/2021 16:17:28 - INFO - __main__ - Step 16938: {'lr': 0.00048753846123917964, 'samples': 3252096, 'steps': 16937, 'loss/train': 1.926552414894104} -08/30/2021 16:17:28 - INFO - __main__ - Step 16939: {'lr': 0.0004875368066412309, 'samples': 3252288, 'steps': 16938, 'loss/train': 1.5819123983383179} -08/30/2021 16:17:30 - INFO - __main__ - Step 16940: {'lr': 0.00048753515193625165, 'samples': 3252480, 'steps': 16939, 'loss/train': 1.2893445491790771} -08/30/2021 16:17:30 - INFO - __main__ - Step 16941: {'lr': 0.00048753349712424277, 'samples': 3252672, 'steps': 16940, 'loss/train': 0.8502808809280396} -08/30/2021 16:17:31 - INFO - __main__ - Step 16942: {'lr': 0.00048753184220520497, 'samples': 3252864, 'steps': 16941, 'loss/train': 1.6763042211532593} -08/30/2021 16:17:31 - INFO - __main__ - Step 16943: {'lr': 0.000487530187179139, 'samples': 3253056, 'steps': 16942, 'loss/train': 0.5161139369010925} -08/30/2021 16:17:31 - INFO - __main__ - Step 16944: {'lr': 0.00048752853204604555, 'samples': 3253248, 'steps': 16943, 'loss/train': 1.5600448846817017} -08/30/2021 16:17:33 - INFO - __main__ - Step 16945: {'lr': 0.00048752687680592545, 'samples': 3253440, 'steps': 16944, 'loss/train': 1.602253794670105} -08/30/2021 16:17:33 - INFO - __main__ - Step 16946: {'lr': 0.00048752522145877937, 'samples': 3253632, 'steps': 16945, 'loss/train': 1.7223378419876099} -08/30/2021 16:17:34 - INFO - __main__ - Step 16947: {'lr': 0.0004875235660046081, 'samples': 3253824, 'steps': 16946, 'loss/train': 0.6119934320449829} -08/30/2021 16:17:34 - INFO - __main__ - Step 16948: {'lr': 0.0004875219104434124, 'samples': 3254016, 'steps': 16947, 'loss/train': 1.73008131980896} -08/30/2021 16:17:34 - INFO - __main__ - Step 16949: {'lr': 0.0004875202547751929, 'samples': 3254208, 'steps': 16948, 'loss/train': 1.3419551849365234} -08/30/2021 16:17:35 - INFO - __main__ - Step 16950: {'lr': 0.00048751859899995054, 'samples': 3254400, 'steps': 16949, 'loss/train': 1.8059403896331787} -08/30/2021 16:17:36 - INFO - __main__ - Step 16951: {'lr': 0.0004875169431176859, 'samples': 3254592, 'steps': 16950, 'loss/train': 2.4468488693237305} -08/30/2021 16:17:37 - INFO - __main__ - Step 16952: {'lr': 0.0004875152871283999, 'samples': 3254784, 'steps': 16951, 'loss/train': 1.3676382303237915} -08/30/2021 16:17:37 - INFO - __main__ - Step 16953: {'lr': 0.0004875136310320931, 'samples': 3254976, 'steps': 16952, 'loss/train': 0.8390756845474243} -08/30/2021 16:17:37 - INFO - __main__ - Step 16954: {'lr': 0.0004875119748287663, 'samples': 3255168, 'steps': 16953, 'loss/train': 1.3089519739151} -08/30/2021 16:17:38 - INFO - __main__ - Step 16955: {'lr': 0.0004875103185184203, 'samples': 3255360, 'steps': 16954, 'loss/train': 1.563284158706665} -08/30/2021 16:17:39 - INFO - __main__ - Step 16956: {'lr': 0.00048750866210105583, 'samples': 3255552, 'steps': 16955, 'loss/train': 1.4730861186981201} -08/30/2021 16:17:40 - INFO - __main__ - Step 16957: {'lr': 0.0004875070055766736, 'samples': 3255744, 'steps': 16956, 'loss/train': 1.0444947481155396} -08/30/2021 16:17:40 - INFO - __main__ - Step 16958: {'lr': 0.0004875053489452743, 'samples': 3255936, 'steps': 16957, 'loss/train': 1.472135066986084} -08/30/2021 16:17:40 - INFO - __main__ - Step 16959: {'lr': 0.00048750369220685886, 'samples': 3256128, 'steps': 16958, 'loss/train': 1.045244812965393} -08/30/2021 16:17:41 - INFO - __main__ - Step 16960: {'lr': 0.0004875020353614279, 'samples': 3256320, 'steps': 16959, 'loss/train': 2.2059497833251953} -08/30/2021 16:17:42 - INFO - __main__ - Step 16961: {'lr': 0.0004875003784089822, 'samples': 3256512, 'steps': 16960, 'loss/train': 1.6468404531478882} -08/30/2021 16:17:43 - INFO - __main__ - Step 16962: {'lr': 0.00048749872134952243, 'samples': 3256704, 'steps': 16961, 'loss/train': 1.4637099504470825} -08/30/2021 16:17:43 - INFO - __main__ - Step 16963: {'lr': 0.0004874970641830495, 'samples': 3256896, 'steps': 16962, 'loss/train': 1.3961182832717896} -08/30/2021 16:17:43 - INFO - __main__ - Step 16964: {'lr': 0.000487495406909564, 'samples': 3257088, 'steps': 16963, 'loss/train': 1.7496854066848755} -08/30/2021 16:17:44 - INFO - __main__ - Step 16965: {'lr': 0.00048749374952906677, 'samples': 3257280, 'steps': 16964, 'loss/train': 1.5075517892837524} -08/30/2021 16:17:46 - INFO - __main__ - Step 16966: {'lr': 0.0004874920920415584, 'samples': 3257472, 'steps': 16965, 'loss/train': 1.5595650672912598} -08/30/2021 16:17:46 - INFO - __main__ - Step 16967: {'lr': 0.0004874904344470399, 'samples': 3257664, 'steps': 16966, 'loss/train': 1.7632176876068115} -08/30/2021 16:17:46 - INFO - __main__ - Step 16968: {'lr': 0.00048748877674551183, 'samples': 3257856, 'steps': 16967, 'loss/train': 1.9016896486282349} -08/30/2021 16:17:47 - INFO - __main__ - Step 16969: {'lr': 0.00048748711893697495, 'samples': 3258048, 'steps': 16968, 'loss/train': 1.3011797666549683} -08/30/2021 16:17:47 - INFO - __main__ - Step 16970: {'lr': 0.0004874854610214301, 'samples': 3258240, 'steps': 16969, 'loss/train': 0.07831119745969772} -08/30/2021 16:17:48 - INFO - __main__ - Step 16971: {'lr': 0.00048748380299887793, 'samples': 3258432, 'steps': 16970, 'loss/train': 1.6787441968917847} -08/30/2021 16:17:48 - INFO - __main__ - Step 16972: {'lr': 0.0004874821448693192, 'samples': 3258624, 'steps': 16971, 'loss/train': 1.504599928855896} -08/30/2021 16:17:49 - INFO - __main__ - Step 16973: {'lr': 0.00048748048663275475, 'samples': 3258816, 'steps': 16972, 'loss/train': 1.9052436351776123} -08/30/2021 16:17:50 - INFO - __main__ - Step 16974: {'lr': 0.00048747882828918524, 'samples': 3259008, 'steps': 16973, 'loss/train': 1.4593864679336548} -08/30/2021 16:17:50 - INFO - __main__ - Step 16975: {'lr': 0.0004874771698386113, 'samples': 3259200, 'steps': 16974, 'loss/train': 1.39486563205719} -08/30/2021 16:17:51 - INFO - __main__ - Step 16976: {'lr': 0.00048747551128103397, 'samples': 3259392, 'steps': 16975, 'loss/train': 1.2716879844665527} -08/30/2021 16:17:51 - INFO - __main__ - Step 16977: {'lr': 0.00048747385261645377, 'samples': 3259584, 'steps': 16976, 'loss/train': 1.0684585571289062} -08/30/2021 16:17:52 - INFO - __main__ - Step 16978: {'lr': 0.0004874721938448715, 'samples': 3259776, 'steps': 16977, 'loss/train': 2.4069674015045166} -08/30/2021 16:17:53 - INFO - __main__ - Step 16979: {'lr': 0.000487470534966288, 'samples': 3259968, 'steps': 16978, 'loss/train': 1.359895944595337} -08/30/2021 16:17:53 - INFO - __main__ - Step 16980: {'lr': 0.0004874688759807039, 'samples': 3260160, 'steps': 16979, 'loss/train': 1.7185837030410767} -08/30/2021 16:17:53 - INFO - __main__ - Step 16981: {'lr': 0.00048746721688812004, 'samples': 3260352, 'steps': 16980, 'loss/train': 1.7675763368606567} -08/30/2021 16:17:54 - INFO - __main__ - Step 16982: {'lr': 0.00048746555768853703, 'samples': 3260544, 'steps': 16981, 'loss/train': 2.0602288246154785} -08/30/2021 16:17:56 - INFO - __main__ - Step 16983: {'lr': 0.00048746389838195573, 'samples': 3260736, 'steps': 16982, 'loss/train': 1.249222755432129} -08/30/2021 16:17:57 - INFO - __main__ - Step 16984: {'lr': 0.0004874622389683768, 'samples': 3260928, 'steps': 16983, 'loss/train': 1.7813916206359863} -08/30/2021 16:17:57 - INFO - __main__ - Step 16985: {'lr': 0.0004874605794478012, 'samples': 3261120, 'steps': 16984, 'loss/train': 1.7750695943832397} -08/30/2021 16:17:57 - INFO - __main__ - Step 16986: {'lr': 0.0004874589198202294, 'samples': 3261312, 'steps': 16985, 'loss/train': 2.1372036933898926} -08/30/2021 16:17:58 - INFO - __main__ - Step 16987: {'lr': 0.0004874572600856624, 'samples': 3261504, 'steps': 16986, 'loss/train': 1.801600456237793} -08/30/2021 16:17:59 - INFO - __main__ - Step 16988: {'lr': 0.0004874556002441007, 'samples': 3261696, 'steps': 16987, 'loss/train': 1.3790847063064575} -08/30/2021 16:18:00 - INFO - __main__ - Step 16989: {'lr': 0.0004874539402955452, 'samples': 3261888, 'steps': 16988, 'loss/train': 2.015305519104004} -08/30/2021 16:18:00 - INFO - __main__ - Step 16990: {'lr': 0.00048745228023999666, 'samples': 3262080, 'steps': 16989, 'loss/train': 1.1904144287109375} -08/30/2021 16:18:00 - INFO - __main__ - Step 16991: {'lr': 0.0004874506200774557, 'samples': 3262272, 'steps': 16990, 'loss/train': 1.6295344829559326} -08/30/2021 16:18:01 - INFO - __main__ - Step 16992: {'lr': 0.00048744895980792327, 'samples': 3262464, 'steps': 16991, 'loss/train': 1.7436455488204956} -08/30/2021 16:18:02 - INFO - __main__ - Step 16993: {'lr': 0.00048744729943139993, 'samples': 3262656, 'steps': 16992, 'loss/train': 1.2896414995193481} -08/30/2021 16:18:03 - INFO - __main__ - Step 16994: {'lr': 0.0004874456389478865, 'samples': 3262848, 'steps': 16993, 'loss/train': 1.5997600555419922} -08/30/2021 16:18:03 - INFO - __main__ - Step 16995: {'lr': 0.00048744397835738377, 'samples': 3263040, 'steps': 16994, 'loss/train': 1.8420839309692383} -08/30/2021 16:18:03 - INFO - __main__ - Step 16996: {'lr': 0.00048744231765989246, 'samples': 3263232, 'steps': 16995, 'loss/train': 1.8090988397598267} -08/30/2021 16:18:04 - INFO - __main__ - Step 16997: {'lr': 0.0004874406568554132, 'samples': 3263424, 'steps': 16996, 'loss/train': 1.8278638124465942} -08/30/2021 16:18:05 - INFO - __main__ - Step 16998: {'lr': 0.0004874389959439469, 'samples': 3263616, 'steps': 16997, 'loss/train': 1.401595950126648} -08/30/2021 16:18:06 - INFO - __main__ - Step 16999: {'lr': 0.0004874373349254943, 'samples': 3263808, 'steps': 16998, 'loss/train': 1.4432423114776611} -08/30/2021 16:18:06 - INFO - __main__ - Step 17000: {'lr': 0.00048743567380005604, 'samples': 3264000, 'steps': 16999, 'loss/train': 1.7033408880233765} -08/30/2021 16:18:06 - INFO - __main__ - Step 17001: {'lr': 0.000487434012567633, 'samples': 3264192, 'steps': 17000, 'loss/train': 0.7083486318588257} -08/30/2021 16:18:07 - INFO - __main__ - Step 17002: {'lr': 0.0004874323512282258, 'samples': 3264384, 'steps': 17001, 'loss/train': 1.2216070890426636} -08/30/2021 16:18:08 - INFO - __main__ - Step 17003: {'lr': 0.00048743068978183523, 'samples': 3264576, 'steps': 17002, 'loss/train': 1.9648942947387695} -08/30/2021 16:18:09 - INFO - __main__ - Step 17004: {'lr': 0.00048742902822846215, 'samples': 3264768, 'steps': 17003, 'loss/train': 1.9739830493927002} -08/30/2021 16:18:09 - INFO - __main__ - Step 17005: {'lr': 0.0004874273665681071, 'samples': 3264960, 'steps': 17004, 'loss/train': 1.4854813814163208} -08/30/2021 16:18:09 - INFO - __main__ - Step 17006: {'lr': 0.00048742570480077096, 'samples': 3265152, 'steps': 17005, 'loss/train': 1.954255223274231} -08/30/2021 16:18:10 - INFO - __main__ - Step 17007: {'lr': 0.0004874240429264545, 'samples': 3265344, 'steps': 17006, 'loss/train': 1.6127092838287354} -08/30/2021 16:18:10 - INFO - __main__ - Step 17008: {'lr': 0.00048742238094515844, 'samples': 3265536, 'steps': 17007, 'loss/train': 1.5501658916473389} -08/30/2021 16:18:11 - INFO - __main__ - Step 17009: {'lr': 0.00048742071885688354, 'samples': 3265728, 'steps': 17008, 'loss/train': 1.9240108728408813} -08/30/2021 16:18:12 - INFO - __main__ - Step 17010: {'lr': 0.00048741905666163047, 'samples': 3265920, 'steps': 17009, 'loss/train': 2.3126652240753174} -08/30/2021 16:18:12 - INFO - __main__ - Step 17011: {'lr': 0.00048741739435940003, 'samples': 3266112, 'steps': 17010, 'loss/train': 1.563551664352417} -08/30/2021 16:18:13 - INFO - __main__ - Step 17012: {'lr': 0.000487415731950193, 'samples': 3266304, 'steps': 17011, 'loss/train': 1.6391255855560303} -08/30/2021 16:18:13 - INFO - __main__ - Step 17013: {'lr': 0.0004874140694340101, 'samples': 3266496, 'steps': 17012, 'loss/train': 1.1839629411697388} -08/30/2021 16:18:15 - INFO - __main__ - Step 17014: {'lr': 0.0004874124068108521, 'samples': 3266688, 'steps': 17013, 'loss/train': 1.763357162475586} -08/30/2021 16:18:15 - INFO - __main__ - Step 17015: {'lr': 0.00048741074408071975, 'samples': 3266880, 'steps': 17014, 'loss/train': 1.1405329704284668} -08/30/2021 16:18:16 - INFO - __main__ - Step 17016: {'lr': 0.00048740908124361373, 'samples': 3267072, 'steps': 17015, 'loss/train': 1.4558064937591553} -08/30/2021 16:18:16 - INFO - __main__ - Step 17017: {'lr': 0.0004874074182995349, 'samples': 3267264, 'steps': 17016, 'loss/train': 0.0474298894405365} -08/30/2021 16:18:16 - INFO - __main__ - Step 17018: {'lr': 0.0004874057552484839, 'samples': 3267456, 'steps': 17017, 'loss/train': 1.5617492198944092} -08/30/2021 16:18:17 - INFO - __main__ - Step 17019: {'lr': 0.00048740409209046154, 'samples': 3267648, 'steps': 17018, 'loss/train': 1.7178077697753906} -08/30/2021 16:18:18 - INFO - __main__ - Step 17020: {'lr': 0.0004874024288254686, 'samples': 3267840, 'steps': 17019, 'loss/train': 1.9327551126480103} -08/30/2021 16:18:18 - INFO - __main__ - Step 17021: {'lr': 0.00048740076545350573, 'samples': 3268032, 'steps': 17020, 'loss/train': 1.848136067390442} -08/30/2021 16:18:19 - INFO - __main__ - Step 17022: {'lr': 0.00048739910197457376, 'samples': 3268224, 'steps': 17021, 'loss/train': 1.6528129577636719} -08/30/2021 16:18:19 - INFO - __main__ - Step 17023: {'lr': 0.00048739743838867344, 'samples': 3268416, 'steps': 17022, 'loss/train': 2.532574415206909} -08/30/2021 16:18:19 - INFO - __main__ - Step 17024: {'lr': 0.00048739577469580545, 'samples': 3268608, 'steps': 17023, 'loss/train': 1.4743624925613403} -08/30/2021 16:18:22 - INFO - __main__ - Step 17025: {'lr': 0.0004873941108959706, 'samples': 3268800, 'steps': 17024, 'loss/train': 1.819540023803711} -08/30/2021 16:18:22 - INFO - __main__ - Step 17026: {'lr': 0.0004873924469891697, 'samples': 3268992, 'steps': 17025, 'loss/train': 1.5908654928207397} -08/30/2021 16:18:23 - INFO - __main__ - Step 17027: {'lr': 0.00048739078297540335, 'samples': 3269184, 'steps': 17026, 'loss/train': 1.6285433769226074} -08/30/2021 16:18:23 - INFO - __main__ - Step 17028: {'lr': 0.00048738911885467243, 'samples': 3269376, 'steps': 17027, 'loss/train': 1.983981966972351} -08/30/2021 16:18:23 - INFO - __main__ - Step 17029: {'lr': 0.00048738745462697754, 'samples': 3269568, 'steps': 17028, 'loss/train': 1.3978523015975952} -08/30/2021 16:18:24 - INFO - __main__ - Step 17030: {'lr': 0.0004873857902923196, 'samples': 3269760, 'steps': 17029, 'loss/train': 1.835018515586853} -08/30/2021 16:18:24 - INFO - __main__ - Step 17031: {'lr': 0.00048738412585069927, 'samples': 3269952, 'steps': 17030, 'loss/train': 1.1982173919677734} -08/30/2021 16:18:26 - INFO - __main__ - Step 17032: {'lr': 0.00048738246130211734, 'samples': 3270144, 'steps': 17031, 'loss/train': 0.9439342617988586} -08/30/2021 16:18:26 - INFO - __main__ - Step 17033: {'lr': 0.00048738079664657454, 'samples': 3270336, 'steps': 17032, 'loss/train': 1.631165623664856} -08/30/2021 16:18:26 - INFO - __main__ - Step 17034: {'lr': 0.00048737913188407156, 'samples': 3270528, 'steps': 17033, 'loss/train': 1.7660175561904907} -08/30/2021 16:18:27 - INFO - __main__ - Step 17035: {'lr': 0.00048737746701460927, 'samples': 3270720, 'steps': 17034, 'loss/train': 2.2325189113616943} -08/30/2021 16:18:27 - INFO - __main__ - Step 17036: {'lr': 0.0004873758020381883, 'samples': 3270912, 'steps': 17035, 'loss/train': 2.220383882522583} -08/30/2021 16:18:29 - INFO - __main__ - Step 17037: {'lr': 0.00048737413695480947, 'samples': 3271104, 'steps': 17036, 'loss/train': 1.8013945817947388} -08/30/2021 16:18:30 - INFO - __main__ - Step 17038: {'lr': 0.00048737247176447354, 'samples': 3271296, 'steps': 17037, 'loss/train': 2.1499481201171875} -08/30/2021 16:18:30 - INFO - __main__ - Step 17039: {'lr': 0.0004873708064671812, 'samples': 3271488, 'steps': 17038, 'loss/train': 1.095421314239502} -08/30/2021 16:18:30 - INFO - __main__ - Step 17040: {'lr': 0.0004873691410629333, 'samples': 3271680, 'steps': 17039, 'loss/train': 1.4788717031478882} -08/30/2021 16:18:31 - INFO - __main__ - Step 17041: {'lr': 0.0004873674755517304, 'samples': 3271872, 'steps': 17040, 'loss/train': 1.1645203828811646} -08/30/2021 16:18:32 - INFO - __main__ - Step 17042: {'lr': 0.00048736580993357357, 'samples': 3272064, 'steps': 17041, 'loss/train': 0.893046498298645} -08/30/2021 16:18:33 - INFO - __main__ - Step 17043: {'lr': 0.0004873641442084632, 'samples': 3272256, 'steps': 17042, 'loss/train': 1.681810736656189} -08/30/2021 16:18:33 - INFO - __main__ - Step 17044: {'lr': 0.00048736247837640037, 'samples': 3272448, 'steps': 17043, 'loss/train': 1.2126652002334595} -08/30/2021 16:18:33 - INFO - __main__ - Step 17045: {'lr': 0.0004873608124373855, 'samples': 3272640, 'steps': 17044, 'loss/train': 1.578004240989685} -08/30/2021 16:18:34 - INFO - __main__ - Step 17046: {'lr': 0.00048735914639141964, 'samples': 3272832, 'steps': 17045, 'loss/train': 1.7768607139587402} -08/30/2021 16:18:35 - INFO - __main__ - Step 17047: {'lr': 0.00048735748023850337, 'samples': 3273024, 'steps': 17046, 'loss/train': 1.973023772239685} -08/30/2021 16:18:36 - INFO - __main__ - Step 17048: {'lr': 0.00048735581397863745, 'samples': 3273216, 'steps': 17047, 'loss/train': 1.459733247756958} -08/30/2021 16:18:36 - INFO - __main__ - Step 17049: {'lr': 0.0004873541476118227, 'samples': 3273408, 'steps': 17048, 'loss/train': 1.3695586919784546} -08/30/2021 16:18:37 - INFO - __main__ - Step 17050: {'lr': 0.00048735248113805976, 'samples': 3273600, 'steps': 17049, 'loss/train': 1.7251688241958618} -08/30/2021 16:18:37 - INFO - __main__ - Step 17051: {'lr': 0.0004873508145573495, 'samples': 3273792, 'steps': 17050, 'loss/train': 1.272658109664917} -08/30/2021 16:18:37 - INFO - __main__ - Step 17052: {'lr': 0.00048734914786969266, 'samples': 3273984, 'steps': 17051, 'loss/train': 1.9978035688400269} -08/30/2021 16:18:39 - INFO - __main__ - Step 17053: {'lr': 0.00048734748107509, 'samples': 3274176, 'steps': 17052, 'loss/train': 1.6371781826019287} -08/30/2021 16:18:39 - INFO - __main__ - Step 17054: {'lr': 0.0004873458141735421, 'samples': 3274368, 'steps': 17053, 'loss/train': 1.8606921434402466} -08/30/2021 16:18:39 - INFO - __main__ - Step 17055: {'lr': 0.0004873441471650499, 'samples': 3274560, 'steps': 17054, 'loss/train': 1.903680682182312} -08/30/2021 16:18:40 - INFO - __main__ - Step 17056: {'lr': 0.00048734248004961414, 'samples': 3274752, 'steps': 17055, 'loss/train': 1.8469626903533936} -08/30/2021 16:18:40 - INFO - __main__ - Step 17057: {'lr': 0.00048734081282723543, 'samples': 3274944, 'steps': 17056, 'loss/train': 1.2959022521972656} -08/30/2021 16:18:42 - INFO - __main__ - Step 17058: {'lr': 0.00048733914549791465, 'samples': 3275136, 'steps': 17057, 'loss/train': 0.8788344860076904} -08/30/2021 16:18:42 - INFO - __main__ - Step 17059: {'lr': 0.0004873374780616525, 'samples': 3275328, 'steps': 17058, 'loss/train': 1.9548438787460327} -08/30/2021 16:18:42 - INFO - __main__ - Step 17060: {'lr': 0.00048733581051844976, 'samples': 3275520, 'steps': 17059, 'loss/train': 1.576919674873352} -08/30/2021 16:18:43 - INFO - __main__ - Step 17061: {'lr': 0.00048733414286830716, 'samples': 3275712, 'steps': 17060, 'loss/train': 1.4760609865188599} -08/30/2021 16:18:43 - INFO - __main__ - Step 17062: {'lr': 0.00048733247511122547, 'samples': 3275904, 'steps': 17061, 'loss/train': 1.4664009809494019} -08/30/2021 16:18:45 - INFO - __main__ - Step 17063: {'lr': 0.00048733080724720545, 'samples': 3276096, 'steps': 17062, 'loss/train': 1.7509276866912842} -08/30/2021 16:18:46 - INFO - __main__ - Step 17064: {'lr': 0.00048732913927624776, 'samples': 3276288, 'steps': 17063, 'loss/train': 1.422742247581482} -08/30/2021 16:18:46 - INFO - __main__ - Step 17065: {'lr': 0.0004873274711983533, 'samples': 3276480, 'steps': 17064, 'loss/train': 1.491871953010559} -08/30/2021 16:18:47 - INFO - __main__ - Step 17066: {'lr': 0.0004873258030135227, 'samples': 3276672, 'steps': 17065, 'loss/train': 1.6416592597961426} -08/30/2021 16:18:47 - INFO - __main__ - Step 17067: {'lr': 0.0004873241347217567, 'samples': 3276864, 'steps': 17066, 'loss/train': 2.1945347785949707} -08/30/2021 16:18:47 - INFO - __main__ - Step 17068: {'lr': 0.0004873224663230562, 'samples': 3277056, 'steps': 17067, 'loss/train': 3.0288026332855225} -08/30/2021 16:18:49 - INFO - __main__ - Step 17069: {'lr': 0.0004873207978174219, 'samples': 3277248, 'steps': 17068, 'loss/train': 3.829235792160034} -08/30/2021 16:18:49 - INFO - __main__ - Step 17070: {'lr': 0.00048731912920485444, 'samples': 3277440, 'steps': 17069, 'loss/train': 2.0071985721588135} -08/30/2021 16:18:50 - INFO - __main__ - Step 17071: {'lr': 0.0004873174604853546, 'samples': 3277632, 'steps': 17070, 'loss/train': 1.8288429975509644} -08/30/2021 16:18:50 - INFO - __main__ - Step 17072: {'lr': 0.00048731579165892325, 'samples': 3277824, 'steps': 17071, 'loss/train': 1.354732871055603} -08/30/2021 16:18:50 - INFO - __main__ - Step 17073: {'lr': 0.000487314122725561, 'samples': 3278016, 'steps': 17072, 'loss/train': 1.5520434379577637} -08/30/2021 16:18:52 - INFO - __main__ - Step 17074: {'lr': 0.00048731245368526877, 'samples': 3278208, 'steps': 17073, 'loss/train': 1.3054972887039185} -08/30/2021 16:18:53 - INFO - __main__ - Step 17075: {'lr': 0.0004873107845380471, 'samples': 3278400, 'steps': 17074, 'loss/train': 2.0592572689056396} -08/30/2021 16:18:53 - INFO - __main__ - Step 17076: {'lr': 0.00048730911528389686, 'samples': 3278592, 'steps': 17075, 'loss/train': 2.3109729290008545} -08/30/2021 16:18:53 - INFO - __main__ - Step 17077: {'lr': 0.0004873074459228188, 'samples': 3278784, 'steps': 17076, 'loss/train': 1.7390919923782349} -08/30/2021 16:18:54 - INFO - __main__ - Step 17078: {'lr': 0.0004873057764548138, 'samples': 3278976, 'steps': 17077, 'loss/train': 1.2778682708740234} -08/30/2021 16:18:54 - INFO - __main__ - Step 17079: {'lr': 0.00048730410687988237, 'samples': 3279168, 'steps': 17078, 'loss/train': 1.43776535987854} -08/30/2021 16:18:55 - INFO - __main__ - Step 17080: {'lr': 0.00048730243719802535, 'samples': 3279360, 'steps': 17079, 'loss/train': 1.517069935798645} -08/30/2021 16:18:56 - INFO - __main__ - Step 17081: {'lr': 0.00048730076740924355, 'samples': 3279552, 'steps': 17080, 'loss/train': 1.8498196601867676} -08/30/2021 16:18:56 - INFO - __main__ - Step 17082: {'lr': 0.0004872990975135377, 'samples': 3279744, 'steps': 17081, 'loss/train': 1.755913496017456} -08/30/2021 16:18:57 - INFO - __main__ - Step 17083: {'lr': 0.0004872974275109085, 'samples': 3279936, 'steps': 17082, 'loss/train': 1.8197604417800903} -08/30/2021 16:18:57 - INFO - __main__ - Step 17084: {'lr': 0.00048729575740135675, 'samples': 3280128, 'steps': 17083, 'loss/train': 2.2922885417938232} -08/30/2021 16:18:59 - INFO - __main__ - Step 17085: {'lr': 0.0004872940871848832, 'samples': 3280320, 'steps': 17084, 'loss/train': 1.6462880373001099} -08/30/2021 16:18:59 - INFO - __main__ - Step 17086: {'lr': 0.00048729241686148864, 'samples': 3280512, 'steps': 17085, 'loss/train': 1.4661798477172852} -08/30/2021 16:18:59 - INFO - __main__ - Step 17087: {'lr': 0.0004872907464311737, 'samples': 3280704, 'steps': 17086, 'loss/train': 1.6990941762924194} -08/30/2021 16:19:00 - INFO - __main__ - Step 17088: {'lr': 0.0004872890758939392, 'samples': 3280896, 'steps': 17087, 'loss/train': 1.6704976558685303} -08/30/2021 16:19:00 - INFO - __main__ - Step 17089: {'lr': 0.00048728740524978597, 'samples': 3281088, 'steps': 17088, 'loss/train': 2.290745973587036} -08/30/2021 16:19:03 - INFO - __main__ - Step 17090: {'lr': 0.00048728573449871473, 'samples': 3281280, 'steps': 17089, 'loss/train': 1.4036996364593506} -08/30/2021 16:19:03 - INFO - __main__ - Step 17091: {'lr': 0.0004872840636407261, 'samples': 3281472, 'steps': 17090, 'loss/train': 1.581344723701477} -08/30/2021 16:19:03 - INFO - __main__ - Step 17092: {'lr': 0.00048728239267582096, 'samples': 3281664, 'steps': 17091, 'loss/train': 1.573412537574768} -08/30/2021 16:19:04 - INFO - __main__ - Step 17093: {'lr': 0.00048728072160400006, 'samples': 3281856, 'steps': 17092, 'loss/train': 0.24032923579216003} -08/30/2021 16:19:04 - INFO - __main__ - Step 17094: {'lr': 0.0004872790504252641, 'samples': 3282048, 'steps': 17093, 'loss/train': 0.16618132591247559} -08/30/2021 16:19:04 - INFO - __main__ - Step 17095: {'lr': 0.0004872773791396139, 'samples': 3282240, 'steps': 17094, 'loss/train': 1.9471571445465088} -08/30/2021 16:19:05 - INFO - __main__ - Step 17096: {'lr': 0.0004872757077470502, 'samples': 3282432, 'steps': 17095, 'loss/train': 0.5481041669845581} -08/30/2021 16:19:05 - INFO - __main__ - Step 17097: {'lr': 0.0004872740362475737, 'samples': 3282624, 'steps': 17096, 'loss/train': 0.5585260987281799} -08/30/2021 16:19:07 - INFO - __main__ - Step 17098: {'lr': 0.0004872723646411851, 'samples': 3282816, 'steps': 17097, 'loss/train': 1.5546623468399048} -08/30/2021 16:19:08 - INFO - __main__ - Step 17099: {'lr': 0.0004872706929278853, 'samples': 3283008, 'steps': 17098, 'loss/train': 1.0834232568740845} -08/30/2021 16:19:08 - INFO - __main__ - Step 17100: {'lr': 0.000487269021107675, 'samples': 3283200, 'steps': 17099, 'loss/train': 1.696337103843689} -08/30/2021 16:19:08 - INFO - __main__ - Step 17101: {'lr': 0.0004872673491805549, 'samples': 3283392, 'steps': 17100, 'loss/train': 1.5764994621276855} -08/30/2021 16:19:09 - INFO - __main__ - Step 17102: {'lr': 0.0004872656771465259, 'samples': 3283584, 'steps': 17101, 'loss/train': 1.586539387702942} -08/30/2021 16:19:10 - INFO - __main__ - Step 17103: {'lr': 0.00048726400500558856, 'samples': 3283776, 'steps': 17102, 'loss/train': 1.5957640409469604} -08/30/2021 16:19:11 - INFO - __main__ - Step 17104: {'lr': 0.0004872623327577437, 'samples': 3283968, 'steps': 17103, 'loss/train': 2.2525582313537598} -08/30/2021 16:19:11 - INFO - __main__ - Step 17105: {'lr': 0.0004872606604029921, 'samples': 3284160, 'steps': 17104, 'loss/train': 1.8458601236343384} -08/30/2021 16:19:11 - INFO - __main__ - Step 17106: {'lr': 0.00048725898794133455, 'samples': 3284352, 'steps': 17105, 'loss/train': 1.9900256395339966} -08/30/2021 16:19:12 - INFO - __main__ - Step 17107: {'lr': 0.00048725731537277173, 'samples': 3284544, 'steps': 17106, 'loss/train': 1.4694170951843262} -08/30/2021 16:19:13 - INFO - __main__ - Step 17108: {'lr': 0.0004872556426973044, 'samples': 3284736, 'steps': 17107, 'loss/train': 1.8389586210250854} -08/30/2021 16:19:14 - INFO - __main__ - Step 17109: {'lr': 0.0004872539699149334, 'samples': 3284928, 'steps': 17108, 'loss/train': 1.6983451843261719} -08/30/2021 16:19:14 - INFO - __main__ - Step 17110: {'lr': 0.0004872522970256594, 'samples': 3285120, 'steps': 17109, 'loss/train': 1.7530301809310913} -08/30/2021 16:19:15 - INFO - __main__ - Step 17111: {'lr': 0.00048725062402948314, 'samples': 3285312, 'steps': 17110, 'loss/train': 0.3163411319255829} -08/30/2021 16:19:15 - INFO - __main__ - Step 17112: {'lr': 0.00048724895092640546, 'samples': 3285504, 'steps': 17111, 'loss/train': 1.2892173528671265} -08/30/2021 16:19:17 - INFO - __main__ - Step 17113: {'lr': 0.00048724727771642706, 'samples': 3285696, 'steps': 17112, 'loss/train': 1.6487714052200317} -08/30/2021 16:19:17 - INFO - __main__ - Step 17114: {'lr': 0.00048724560439954867, 'samples': 3285888, 'steps': 17113, 'loss/train': 1.8985477685928345} -08/30/2021 16:19:18 - INFO - __main__ - Step 17115: {'lr': 0.00048724393097577113, 'samples': 3286080, 'steps': 17114, 'loss/train': 0.21476341784000397} -08/30/2021 16:19:18 - INFO - __main__ - Step 17116: {'lr': 0.0004872422574450951, 'samples': 3286272, 'steps': 17115, 'loss/train': 1.6858916282653809} -08/30/2021 16:19:18 - INFO - __main__ - Step 17117: {'lr': 0.0004872405838075213, 'samples': 3286464, 'steps': 17116, 'loss/train': 1.4407038688659668} -08/30/2021 16:19:20 - INFO - __main__ - Step 17118: {'lr': 0.00048723891006305066, 'samples': 3286656, 'steps': 17117, 'loss/train': 1.684228539466858} -08/30/2021 16:19:20 - INFO - __main__ - Step 17119: {'lr': 0.0004872372362116838, 'samples': 3286848, 'steps': 17118, 'loss/train': 1.4467246532440186} -08/30/2021 16:19:21 - INFO - __main__ - Step 17120: {'lr': 0.0004872355622534215, 'samples': 3287040, 'steps': 17119, 'loss/train': 1.9959315061569214} -08/30/2021 16:19:21 - INFO - __main__ - Step 17121: {'lr': 0.0004872338881882644, 'samples': 3287232, 'steps': 17120, 'loss/train': 1.707873821258545} -08/30/2021 16:19:21 - INFO - __main__ - Step 17122: {'lr': 0.00048723221401621354, 'samples': 3287424, 'steps': 17121, 'loss/train': 2.1110117435455322} -08/30/2021 16:19:23 - INFO - __main__ - Step 17123: {'lr': 0.0004872305397372694, 'samples': 3287616, 'steps': 17122, 'loss/train': 0.8126787543296814} -08/30/2021 16:19:23 - INFO - __main__ - Step 17124: {'lr': 0.0004872288653514329, 'samples': 3287808, 'steps': 17123, 'loss/train': 1.9742519855499268} -08/30/2021 16:19:24 - INFO - __main__ - Step 17125: {'lr': 0.0004872271908587047, 'samples': 3288000, 'steps': 17124, 'loss/train': 1.7569471597671509} -08/30/2021 16:19:24 - INFO - __main__ - Step 17126: {'lr': 0.0004872255162590856, 'samples': 3288192, 'steps': 17125, 'loss/train': 1.9443386793136597} -08/30/2021 16:19:25 - INFO - __main__ - Step 17127: {'lr': 0.0004872238415525764, 'samples': 3288384, 'steps': 17126, 'loss/train': 0.16956979036331177} -08/30/2021 16:19:25 - INFO - __main__ - Step 17128: {'lr': 0.0004872221667391777, 'samples': 3288576, 'steps': 17127, 'loss/train': 2.152531623840332} -08/30/2021 16:19:27 - INFO - __main__ - Step 17129: {'lr': 0.00048722049181889037, 'samples': 3288768, 'steps': 17128, 'loss/train': 1.5011897087097168} -08/30/2021 16:19:27 - INFO - __main__ - Step 17130: {'lr': 0.0004872188167917152, 'samples': 3288960, 'steps': 17129, 'loss/train': 1.6086961030960083} -08/30/2021 16:19:27 - INFO - __main__ - Step 17131: {'lr': 0.00048721714165765286, 'samples': 3289152, 'steps': 17130, 'loss/train': 1.6895132064819336} -08/30/2021 16:19:28 - INFO - __main__ - Step 17132: {'lr': 0.00048721546641670413, 'samples': 3289344, 'steps': 17131, 'loss/train': 1.262113332748413} -08/30/2021 16:19:28 - INFO - __main__ - Step 17133: {'lr': 0.00048721379106886976, 'samples': 3289536, 'steps': 17132, 'loss/train': 1.8208268880844116} -08/30/2021 16:19:29 - INFO - __main__ - Step 17134: {'lr': 0.0004872121156141506, 'samples': 3289728, 'steps': 17133, 'loss/train': 1.3156644105911255} -08/30/2021 16:19:30 - INFO - __main__ - Step 17135: {'lr': 0.0004872104400525472, 'samples': 3289920, 'steps': 17134, 'loss/train': 1.5294270515441895} -08/30/2021 16:19:30 - INFO - __main__ - Step 17136: {'lr': 0.0004872087643840605, 'samples': 3290112, 'steps': 17135, 'loss/train': 1.184144139289856} -08/30/2021 16:19:31 - INFO - __main__ - Step 17137: {'lr': 0.00048720708860869116, 'samples': 3290304, 'steps': 17136, 'loss/train': 1.7141838073730469} -08/30/2021 16:19:31 - INFO - __main__ - Step 17138: {'lr': 0.00048720541272644004, 'samples': 3290496, 'steps': 17137, 'loss/train': 0.6089520454406738} -08/30/2021 16:19:32 - INFO - __main__ - Step 17139: {'lr': 0.00048720373673730773, 'samples': 3290688, 'steps': 17138, 'loss/train': 1.5148826837539673} -08/30/2021 16:19:33 - INFO - __main__ - Step 17140: {'lr': 0.00048720206064129516, 'samples': 3290880, 'steps': 17139, 'loss/train': 1.9033597707748413} -08/30/2021 16:19:33 - INFO - __main__ - Step 17141: {'lr': 0.0004872003844384029, 'samples': 3291072, 'steps': 17140, 'loss/train': 1.4932576417922974} -08/30/2021 16:19:33 - INFO - __main__ - Step 17142: {'lr': 0.0004871987081286319, 'samples': 3291264, 'steps': 17141, 'loss/train': 0.6825220584869385} -08/30/2021 16:19:34 - INFO - __main__ - Step 17143: {'lr': 0.0004871970317119828, 'samples': 3291456, 'steps': 17142, 'loss/train': 1.1307752132415771} -08/30/2021 16:19:35 - INFO - __main__ - Step 17144: {'lr': 0.00048719535518845634, 'samples': 3291648, 'steps': 17143, 'loss/train': 1.6785632371902466} -08/30/2021 16:19:36 - INFO - __main__ - Step 17145: {'lr': 0.0004871936785580533, 'samples': 3291840, 'steps': 17144, 'loss/train': 1.5717003345489502} -08/30/2021 16:19:36 - INFO - __main__ - Step 17146: {'lr': 0.0004871920018207745, 'samples': 3292032, 'steps': 17145, 'loss/train': 1.947385549545288} -08/30/2021 16:19:37 - INFO - __main__ - Step 17147: {'lr': 0.0004871903249766206, 'samples': 3292224, 'steps': 17146, 'loss/train': 0.9774880409240723} -08/30/2021 16:19:37 - INFO - __main__ - Step 17148: {'lr': 0.0004871886480255925, 'samples': 3292416, 'steps': 17147, 'loss/train': 1.7427949905395508} -08/30/2021 16:19:39 - INFO - __main__ - Step 17149: {'lr': 0.0004871869709676907, 'samples': 3292608, 'steps': 17148, 'loss/train': 1.4562371969223022} -08/30/2021 16:19:39 - INFO - __main__ - Step 17150: {'lr': 0.0004871852938029162, 'samples': 3292800, 'steps': 17149, 'loss/train': 1.6578058004379272} -08/30/2021 16:19:40 - INFO - __main__ - Step 17151: {'lr': 0.00048718361653126975, 'samples': 3292992, 'steps': 17150, 'loss/train': 1.7739109992980957} -08/30/2021 16:19:40 - INFO - __main__ - Step 17152: {'lr': 0.0004871819391527519, 'samples': 3293184, 'steps': 17151, 'loss/train': 1.5501478910446167} -08/30/2021 16:19:40 - INFO - __main__ - Step 17153: {'lr': 0.0004871802616673636, 'samples': 3293376, 'steps': 17152, 'loss/train': 1.8780291080474854} -08/30/2021 16:19:41 - INFO - __main__ - Step 17154: {'lr': 0.00048717858407510545, 'samples': 3293568, 'steps': 17153, 'loss/train': 1.376879096031189} -08/30/2021 16:19:42 - INFO - __main__ - Step 17155: {'lr': 0.0004871769063759783, 'samples': 3293760, 'steps': 17154, 'loss/train': 1.3158879280090332} -08/30/2021 16:19:43 - INFO - __main__ - Step 17156: {'lr': 0.000487175228569983, 'samples': 3293952, 'steps': 17155, 'loss/train': 1.6738362312316895} -08/30/2021 16:19:43 - INFO - __main__ - Step 17157: {'lr': 0.0004871735506571201, 'samples': 3294144, 'steps': 17156, 'loss/train': 1.697090744972229} -08/30/2021 16:19:43 - INFO - __main__ - Step 17158: {'lr': 0.00048717187263739046, 'samples': 3294336, 'steps': 17157, 'loss/train': 1.677499532699585} -08/30/2021 16:19:44 - INFO - __main__ - Step 17159: {'lr': 0.00048717019451079493, 'samples': 3294528, 'steps': 17158, 'loss/train': 1.9471052885055542} -08/30/2021 16:19:45 - INFO - __main__ - Step 17160: {'lr': 0.00048716851627733404, 'samples': 3294720, 'steps': 17159, 'loss/train': 2.3192944526672363} -08/30/2021 16:19:46 - INFO - __main__ - Step 17161: {'lr': 0.00048716683793700876, 'samples': 3294912, 'steps': 17160, 'loss/train': 1.8594112396240234} -08/30/2021 16:19:46 - INFO - __main__ - Step 17162: {'lr': 0.00048716515948981975, 'samples': 3295104, 'steps': 17161, 'loss/train': 1.7230446338653564} -08/30/2021 16:19:46 - INFO - __main__ - Step 17163: {'lr': 0.0004871634809357678, 'samples': 3295296, 'steps': 17162, 'loss/train': 1.4229161739349365} -08/30/2021 16:19:47 - INFO - __main__ - Step 17164: {'lr': 0.00048716180227485365, 'samples': 3295488, 'steps': 17163, 'loss/train': 1.7989989519119263} -08/30/2021 16:19:48 - INFO - __main__ - Step 17165: {'lr': 0.000487160123507078, 'samples': 3295680, 'steps': 17164, 'loss/train': 1.8469843864440918} -08/30/2021 16:19:49 - INFO - __main__ - Step 17166: {'lr': 0.00048715844463244166, 'samples': 3295872, 'steps': 17165, 'loss/train': 1.6918755769729614} -08/30/2021 16:19:49 - INFO - __main__ - Step 17167: {'lr': 0.0004871567656509454, 'samples': 3296064, 'steps': 17166, 'loss/train': 1.916261076927185} -08/30/2021 16:19:49 - INFO - __main__ - Step 17168: {'lr': 0.00048715508656259, 'samples': 3296256, 'steps': 17167, 'loss/train': 1.7329760789871216} -08/30/2021 16:19:50 - INFO - __main__ - Step 17169: {'lr': 0.00048715340736737615, 'samples': 3296448, 'steps': 17168, 'loss/train': 1.7122958898544312} -08/30/2021 16:19:51 - INFO - __main__ - Step 17170: {'lr': 0.0004871517280653046, 'samples': 3296640, 'steps': 17169, 'loss/train': 2.1107749938964844} -08/30/2021 16:19:52 - INFO - __main__ - Step 17171: {'lr': 0.0004871500486563761, 'samples': 3296832, 'steps': 17170, 'loss/train': 1.417673945426941} -08/30/2021 16:19:52 - INFO - __main__ - Step 17172: {'lr': 0.0004871483691405916, 'samples': 3297024, 'steps': 17171, 'loss/train': 1.558638095855713} -08/30/2021 16:19:52 - INFO - __main__ - Step 17173: {'lr': 0.0004871466895179516, 'samples': 3297216, 'steps': 17172, 'loss/train': 1.9435893297195435} -08/30/2021 16:19:53 - INFO - __main__ - Step 17174: {'lr': 0.000487145009788457, 'samples': 3297408, 'steps': 17173, 'loss/train': 1.5993436574935913} -08/30/2021 16:19:55 - INFO - __main__ - Step 17175: {'lr': 0.0004871433299521085, 'samples': 3297600, 'steps': 17174, 'loss/train': 1.9466005563735962} -08/30/2021 16:19:55 - INFO - __main__ - Step 17176: {'lr': 0.00048714165000890685, 'samples': 3297792, 'steps': 17175, 'loss/train': 1.5319772958755493} -08/30/2021 16:19:55 - INFO - __main__ - Step 17177: {'lr': 0.00048713996995885286, 'samples': 3297984, 'steps': 17176, 'loss/train': 0.8693053722381592} -08/30/2021 16:19:56 - INFO - __main__ - Step 17178: {'lr': 0.0004871382898019472, 'samples': 3298176, 'steps': 17177, 'loss/train': 2.826000928878784} -08/30/2021 16:19:56 - INFO - __main__ - Step 17179: {'lr': 0.0004871366095381908, 'samples': 3298368, 'steps': 17178, 'loss/train': 1.463893175125122} -08/30/2021 16:19:56 - INFO - __main__ - Step 17180: {'lr': 0.00048713492916758425, 'samples': 3298560, 'steps': 17179, 'loss/train': 1.4658360481262207} -08/30/2021 16:19:58 - INFO - __main__ - Step 17181: {'lr': 0.00048713324869012833, 'samples': 3298752, 'steps': 17180, 'loss/train': 0.9056485891342163} -08/30/2021 16:19:59 - INFO - __main__ - Step 17182: {'lr': 0.0004871315681058238, 'samples': 3298944, 'steps': 17181, 'loss/train': 1.3314779996871948} -08/30/2021 16:19:59 - INFO - __main__ - Step 17183: {'lr': 0.0004871298874146716, 'samples': 3299136, 'steps': 17182, 'loss/train': 0.2603258192539215} -08/30/2021 16:19:59 - INFO - __main__ - Step 17184: {'lr': 0.00048712820661667215, 'samples': 3299328, 'steps': 17183, 'loss/train': 1.1811299324035645} -08/30/2021 16:20:00 - INFO - __main__ - Step 17185: {'lr': 0.0004871265257118265, 'samples': 3299520, 'steps': 17184, 'loss/train': 0.7493991255760193} -08/30/2021 16:20:01 - INFO - __main__ - Step 17186: {'lr': 0.0004871248447001352, 'samples': 3299712, 'steps': 17185, 'loss/train': 1.7395381927490234} -08/30/2021 16:20:02 - INFO - __main__ - Step 17187: {'lr': 0.0004871231635815992, 'samples': 3299904, 'steps': 17186, 'loss/train': 1.6505751609802246} -08/30/2021 16:20:02 - INFO - __main__ - Step 17188: {'lr': 0.0004871214823562191, 'samples': 3300096, 'steps': 17187, 'loss/train': 1.7045437097549438} -08/30/2021 16:20:02 - INFO - __main__ - Step 17189: {'lr': 0.0004871198010239958, 'samples': 3300288, 'steps': 17188, 'loss/train': 1.5755842924118042} -08/30/2021 16:20:03 - INFO - __main__ - Step 17190: {'lr': 0.0004871181195849299, 'samples': 3300480, 'steps': 17189, 'loss/train': 1.3983370065689087} -08/30/2021 16:20:04 - INFO - __main__ - Step 17191: {'lr': 0.00048711643803902227, 'samples': 3300672, 'steps': 17190, 'loss/train': 1.941197156906128} -08/30/2021 16:20:05 - INFO - __main__ - Step 17192: {'lr': 0.00048711475638627363, 'samples': 3300864, 'steps': 17191, 'loss/train': 1.90217125415802} -08/30/2021 16:20:05 - INFO - __main__ - Step 17193: {'lr': 0.0004871130746266847, 'samples': 3301056, 'steps': 17192, 'loss/train': 1.3400033712387085} -08/30/2021 16:20:05 - INFO - __main__ - Step 17194: {'lr': 0.00048711139276025626, 'samples': 3301248, 'steps': 17193, 'loss/train': 1.4913097620010376} -08/30/2021 16:20:06 - INFO - __main__ - Step 17195: {'lr': 0.00048710971078698916, 'samples': 3301440, 'steps': 17194, 'loss/train': 2.4068617820739746} -08/30/2021 16:20:07 - INFO - __main__ - Step 17196: {'lr': 0.0004871080287068841, 'samples': 3301632, 'steps': 17195, 'loss/train': 1.3379743099212646} -08/30/2021 16:20:08 - INFO - __main__ - Step 17197: {'lr': 0.00048710634651994176, 'samples': 3301824, 'steps': 17196, 'loss/train': 2.3184237480163574} -08/30/2021 16:20:08 - INFO - __main__ - Step 17198: {'lr': 0.0004871046642261629, 'samples': 3302016, 'steps': 17197, 'loss/train': 1.6905794143676758} -08/30/2021 16:20:09 - INFO - __main__ - Step 17199: {'lr': 0.0004871029818255485, 'samples': 3302208, 'steps': 17198, 'loss/train': 1.668904423713684} -08/30/2021 16:20:09 - INFO - __main__ - Step 17200: {'lr': 0.0004871012993180991, 'samples': 3302400, 'steps': 17199, 'loss/train': 1.8536714315414429} -08/30/2021 16:20:09 - INFO - __main__ - Step 17201: {'lr': 0.0004870996167038154, 'samples': 3302592, 'steps': 17200, 'loss/train': 0.12117816507816315} -08/30/2021 16:20:11 - INFO - __main__ - Step 17202: {'lr': 0.0004870979339826984, 'samples': 3302784, 'steps': 17201, 'loss/train': 1.790168285369873} -08/30/2021 16:20:11 - INFO - __main__ - Step 17203: {'lr': 0.00048709625115474865, 'samples': 3302976, 'steps': 17202, 'loss/train': 1.631544828414917} -08/30/2021 16:20:11 - INFO - __main__ - Step 17204: {'lr': 0.00048709456821996705, 'samples': 3303168, 'steps': 17203, 'loss/train': 1.6139225959777832} -08/30/2021 16:20:12 - INFO - __main__ - Step 17205: {'lr': 0.0004870928851783543, 'samples': 3303360, 'steps': 17204, 'loss/train': 1.7055037021636963} -08/30/2021 16:20:12 - INFO - __main__ - Step 17206: {'lr': 0.00048709120202991107, 'samples': 3303552, 'steps': 17205, 'loss/train': 1.8445712327957153} -08/30/2021 16:20:14 - INFO - __main__ - Step 17207: {'lr': 0.0004870895187746383, 'samples': 3303744, 'steps': 17206, 'loss/train': 1.7481948137283325} -08/30/2021 16:20:15 - INFO - __main__ - Step 17208: {'lr': 0.00048708783541253655, 'samples': 3303936, 'steps': 17207, 'loss/train': 1.8356598615646362} -08/30/2021 16:20:15 - INFO - __main__ - Step 17209: {'lr': 0.00048708615194360675, 'samples': 3304128, 'steps': 17208, 'loss/train': 1.4905062913894653} -08/30/2021 16:20:15 - INFO - __main__ - Step 17210: {'lr': 0.0004870844683678496, 'samples': 3304320, 'steps': 17209, 'loss/train': 2.038738965988159} -08/30/2021 16:20:16 - INFO - __main__ - Step 17211: {'lr': 0.0004870827846852658, 'samples': 3304512, 'steps': 17210, 'loss/train': 1.8041356801986694} -08/30/2021 16:20:17 - INFO - __main__ - Step 17212: {'lr': 0.00048708110089585617, 'samples': 3304704, 'steps': 17211, 'loss/train': 1.6887880563735962} -08/30/2021 16:20:18 - INFO - __main__ - Step 17213: {'lr': 0.00048707941699962143, 'samples': 3304896, 'steps': 17212, 'loss/train': 1.7832515239715576} -08/30/2021 16:20:18 - INFO - __main__ - Step 17214: {'lr': 0.0004870777329965624, 'samples': 3305088, 'steps': 17213, 'loss/train': 1.9115080833435059} -08/30/2021 16:20:18 - INFO - __main__ - Step 17215: {'lr': 0.00048707604888667983, 'samples': 3305280, 'steps': 17214, 'loss/train': 1.2715325355529785} -08/30/2021 16:20:19 - INFO - __main__ - Step 17216: {'lr': 0.0004870743646699744, 'samples': 3305472, 'steps': 17215, 'loss/train': 1.3081682920455933} -08/30/2021 16:20:20 - INFO - __main__ - Step 17217: {'lr': 0.0004870726803464469, 'samples': 3305664, 'steps': 17216, 'loss/train': 1.637826919555664} -08/30/2021 16:20:21 - INFO - __main__ - Step 17218: {'lr': 0.00048707099591609816, 'samples': 3305856, 'steps': 17217, 'loss/train': 1.9086990356445312} -08/30/2021 16:20:21 - INFO - __main__ - Step 17219: {'lr': 0.0004870693113789289, 'samples': 3306048, 'steps': 17218, 'loss/train': 1.7289403676986694} -08/30/2021 16:20:21 - INFO - __main__ - Step 17220: {'lr': 0.00048706762673493987, 'samples': 3306240, 'steps': 17219, 'loss/train': 1.3607165813446045} -08/30/2021 16:20:22 - INFO - __main__ - Step 17221: {'lr': 0.00048706594198413177, 'samples': 3306432, 'steps': 17220, 'loss/train': 1.6289743185043335} -08/30/2021 16:20:23 - INFO - __main__ - Step 17222: {'lr': 0.0004870642571265054, 'samples': 3306624, 'steps': 17221, 'loss/train': 1.3383699655532837} -08/30/2021 16:20:24 - INFO - __main__ - Step 17223: {'lr': 0.0004870625721620616, 'samples': 3306816, 'steps': 17222, 'loss/train': 1.5149602890014648} -08/30/2021 16:20:24 - INFO - __main__ - Step 17224: {'lr': 0.00048706088709080103, 'samples': 3307008, 'steps': 17223, 'loss/train': 2.0026845932006836} -08/30/2021 16:20:24 - INFO - __main__ - Step 17225: {'lr': 0.00048705920191272447, 'samples': 3307200, 'steps': 17224, 'loss/train': 1.5719797611236572} -08/30/2021 16:20:25 - INFO - __main__ - Step 17226: {'lr': 0.0004870575166278327, 'samples': 3307392, 'steps': 17225, 'loss/train': 1.1763685941696167} -08/30/2021 16:20:26 - INFO - __main__ - Step 17227: {'lr': 0.0004870558312361265, 'samples': 3307584, 'steps': 17226, 'loss/train': 1.4753894805908203} -08/30/2021 16:20:27 - INFO - __main__ - Step 17228: {'lr': 0.0004870541457376066, 'samples': 3307776, 'steps': 17227, 'loss/train': 1.3628004789352417} -08/30/2021 16:20:27 - INFO - __main__ - Step 17229: {'lr': 0.0004870524601322737, 'samples': 3307968, 'steps': 17228, 'loss/train': 1.4777752161026} -08/30/2021 16:20:27 - INFO - __main__ - Step 17230: {'lr': 0.00048705077442012866, 'samples': 3308160, 'steps': 17229, 'loss/train': 1.9251604080200195} -08/30/2021 16:20:28 - INFO - __main__ - Step 17231: {'lr': 0.0004870490886011723, 'samples': 3308352, 'steps': 17230, 'loss/train': 1.7312031984329224} -08/30/2021 16:20:29 - INFO - __main__ - Step 17232: {'lr': 0.0004870474026754051, 'samples': 3308544, 'steps': 17231, 'loss/train': 1.7540390491485596} -08/30/2021 16:20:30 - INFO - __main__ - Step 17233: {'lr': 0.00048704571664282806, 'samples': 3308736, 'steps': 17232, 'loss/train': 1.5850716829299927} -08/30/2021 16:20:30 - INFO - __main__ - Step 17234: {'lr': 0.0004870440305034419, 'samples': 3308928, 'steps': 17233, 'loss/train': 0.14398325979709625} -08/30/2021 16:20:30 - INFO - __main__ - Step 17235: {'lr': 0.00048704234425724736, 'samples': 3309120, 'steps': 17234, 'loss/train': 1.5970796346664429} -08/30/2021 16:20:31 - INFO - __main__ - Step 17236: {'lr': 0.0004870406579042452, 'samples': 3309312, 'steps': 17235, 'loss/train': 2.115356206893921} -08/30/2021 16:20:32 - INFO - __main__ - Step 17237: {'lr': 0.00048703897144443615, 'samples': 3309504, 'steps': 17236, 'loss/train': 1.9717119932174683} -08/30/2021 16:20:33 - INFO - __main__ - Step 17238: {'lr': 0.000487037284877821, 'samples': 3309696, 'steps': 17237, 'loss/train': 1.8846182823181152} -08/30/2021 16:20:33 - INFO - __main__ - Step 17239: {'lr': 0.00048703559820440054, 'samples': 3309888, 'steps': 17238, 'loss/train': 0.8971735239028931} -08/30/2021 16:20:34 - INFO - __main__ - Step 17240: {'lr': 0.0004870339114241755, 'samples': 3310080, 'steps': 17239, 'loss/train': 1.6554961204528809} -08/30/2021 16:20:34 - INFO - __main__ - Step 17241: {'lr': 0.00048703222453714656, 'samples': 3310272, 'steps': 17240, 'loss/train': 1.9984480142593384} -08/30/2021 16:20:35 - INFO - __main__ - Step 17242: {'lr': 0.0004870305375433146, 'samples': 3310464, 'steps': 17241, 'loss/train': 0.11705752462148666} -08/30/2021 16:20:36 - INFO - __main__ - Step 17243: {'lr': 0.0004870288504426804, 'samples': 3310656, 'steps': 17242, 'loss/train': 1.8031328916549683} -08/30/2021 16:20:36 - INFO - __main__ - Step 17244: {'lr': 0.0004870271632352446, 'samples': 3310848, 'steps': 17243, 'loss/train': 1.4639816284179688} -08/30/2021 16:20:37 - INFO - __main__ - Step 17245: {'lr': 0.000487025475921008, 'samples': 3311040, 'steps': 17244, 'loss/train': 1.7096904516220093} -08/30/2021 16:20:37 - INFO - __main__ - Step 17246: {'lr': 0.00048702378849997143, 'samples': 3311232, 'steps': 17245, 'loss/train': 1.751753330230713} -08/30/2021 16:20:38 - INFO - __main__ - Step 17247: {'lr': 0.0004870221009721356, 'samples': 3311424, 'steps': 17246, 'loss/train': 1.6622823476791382} -08/30/2021 16:20:39 - INFO - __main__ - Step 17248: {'lr': 0.00048702041333750117, 'samples': 3311616, 'steps': 17247, 'loss/train': 1.5522351264953613} -08/30/2021 16:20:39 - INFO - __main__ - Step 17249: {'lr': 0.0004870187255960691, 'samples': 3311808, 'steps': 17248, 'loss/train': 1.5034717321395874} -08/30/2021 16:20:39 - INFO - __main__ - Step 17250: {'lr': 0.00048701703774784, 'samples': 3312000, 'steps': 17249, 'loss/train': 1.4204462766647339} -08/30/2021 16:20:40 - INFO - __main__ - Step 17251: {'lr': 0.0004870153497928147, 'samples': 3312192, 'steps': 17250, 'loss/train': 1.531490683555603} -08/30/2021 16:20:41 - INFO - __main__ - Step 17252: {'lr': 0.00048701366173099396, 'samples': 3312384, 'steps': 17251, 'loss/train': 1.433632254600525} -08/30/2021 16:20:42 - INFO - __main__ - Step 17253: {'lr': 0.0004870119735623785, 'samples': 3312576, 'steps': 17252, 'loss/train': 1.6299384832382202} -08/30/2021 16:20:42 - INFO - __main__ - Step 17254: {'lr': 0.00048701028528696914, 'samples': 3312768, 'steps': 17253, 'loss/train': 1.7262139320373535} -08/30/2021 16:20:42 - INFO - __main__ - Step 17255: {'lr': 0.0004870085969047665, 'samples': 3312960, 'steps': 17254, 'loss/train': 1.7061408758163452} -08/30/2021 16:20:43 - INFO - __main__ - Step 17256: {'lr': 0.00048700690841577154, 'samples': 3313152, 'steps': 17255, 'loss/train': 0.7340334057807922} -08/30/2021 16:20:45 - INFO - __main__ - Step 17257: {'lr': 0.0004870052198199849, 'samples': 3313344, 'steps': 17256, 'loss/train': 1.5008362531661987} -08/30/2021 16:20:45 - INFO - __main__ - Step 17258: {'lr': 0.00048700353111740734, 'samples': 3313536, 'steps': 17257, 'loss/train': 0.9157738089561462} -08/30/2021 16:20:46 - INFO - __main__ - Step 17259: {'lr': 0.0004870018423080397, 'samples': 3313728, 'steps': 17258, 'loss/train': 1.6854766607284546} -08/30/2021 16:20:46 - INFO - __main__ - Step 17260: {'lr': 0.00048700015339188266, 'samples': 3313920, 'steps': 17259, 'loss/train': 1.5270642042160034} -08/30/2021 16:20:46 - INFO - __main__ - Step 17261: {'lr': 0.0004869984643689369, 'samples': 3314112, 'steps': 17260, 'loss/train': 1.520378589630127} -08/30/2021 16:20:47 - INFO - __main__ - Step 17262: {'lr': 0.00048699677523920346, 'samples': 3314304, 'steps': 17261, 'loss/train': 1.5046796798706055} -08/30/2021 16:20:48 - INFO - __main__ - Step 17263: {'lr': 0.00048699508600268284, 'samples': 3314496, 'steps': 17262, 'loss/train': 1.4834710359573364} -08/30/2021 16:20:49 - INFO - __main__ - Step 17264: {'lr': 0.00048699339665937594, 'samples': 3314688, 'steps': 17263, 'loss/train': 2.0987493991851807} -08/30/2021 16:20:49 - INFO - __main__ - Step 17265: {'lr': 0.0004869917072092834, 'samples': 3314880, 'steps': 17264, 'loss/train': 1.4187264442443848} -08/30/2021 16:20:49 - INFO - __main__ - Step 17266: {'lr': 0.00048699001765240615, 'samples': 3315072, 'steps': 17265, 'loss/train': 1.3038651943206787} -08/30/2021 16:20:50 - INFO - __main__ - Step 17267: {'lr': 0.00048698832798874477, 'samples': 3315264, 'steps': 17266, 'loss/train': 1.9730043411254883} -08/30/2021 16:20:51 - INFO - __main__ - Step 17268: {'lr': 0.0004869866382183001, 'samples': 3315456, 'steps': 17267, 'loss/train': 1.1494001150131226} -08/30/2021 16:20:52 - INFO - __main__ - Step 17269: {'lr': 0.00048698494834107297, 'samples': 3315648, 'steps': 17268, 'loss/train': 1.7524253129959106} -08/30/2021 16:20:52 - INFO - __main__ - Step 17270: {'lr': 0.000486983258357064, 'samples': 3315840, 'steps': 17269, 'loss/train': 1.5027101039886475} -08/30/2021 16:20:53 - INFO - __main__ - Step 17271: {'lr': 0.00048698156826627414, 'samples': 3316032, 'steps': 17270, 'loss/train': 1.9209132194519043} -08/30/2021 16:20:53 - INFO - __main__ - Step 17272: {'lr': 0.00048697987806870397, 'samples': 3316224, 'steps': 17271, 'loss/train': 1.8910088539123535} -08/30/2021 16:20:54 - INFO - __main__ - Step 17273: {'lr': 0.0004869781877643543, 'samples': 3316416, 'steps': 17272, 'loss/train': 1.5945838689804077} -08/30/2021 16:20:55 - INFO - __main__ - Step 17274: {'lr': 0.000486976497353226, 'samples': 3316608, 'steps': 17273, 'loss/train': 0.6928431987762451} -08/30/2021 16:20:55 - INFO - __main__ - Step 17275: {'lr': 0.0004869748068353197, 'samples': 3316800, 'steps': 17274, 'loss/train': 1.5734776258468628} -08/30/2021 16:20:56 - INFO - __main__ - Step 17276: {'lr': 0.00048697311621063625, 'samples': 3316992, 'steps': 17275, 'loss/train': 1.3791122436523438} -08/30/2021 16:20:56 - INFO - __main__ - Step 17277: {'lr': 0.0004869714254791763, 'samples': 3317184, 'steps': 17276, 'loss/train': 2.1521201133728027} -08/30/2021 16:20:58 - INFO - __main__ - Step 17278: {'lr': 0.00048696973464094076, 'samples': 3317376, 'steps': 17277, 'loss/train': 1.322631597518921} -08/30/2021 16:20:59 - INFO - __main__ - Step 17279: {'lr': 0.00048696804369593023, 'samples': 3317568, 'steps': 17278, 'loss/train': 1.4515596628189087} -08/30/2021 16:20:59 - INFO - __main__ - Step 17280: {'lr': 0.0004869663526441456, 'samples': 3317760, 'steps': 17279, 'loss/train': 1.5458523035049438} -08/30/2021 16:20:59 - INFO - __main__ - Step 17281: {'lr': 0.0004869646614855876, 'samples': 3317952, 'steps': 17280, 'loss/train': 0.6698225140571594} -08/30/2021 16:21:00 - INFO - __main__ - Step 17282: {'lr': 0.0004869629702202569, 'samples': 3318144, 'steps': 17281, 'loss/train': 0.613684892654419} -08/30/2021 16:21:00 - INFO - __main__ - Step 17283: {'lr': 0.0004869612788481544, 'samples': 3318336, 'steps': 17282, 'loss/train': 0.5401663184165955} -08/30/2021 16:21:01 - INFO - __main__ - Step 17284: {'lr': 0.00048695958736928084, 'samples': 3318528, 'steps': 17283, 'loss/train': 2.1009950637817383} -08/30/2021 16:21:02 - INFO - __main__ - Step 17285: {'lr': 0.00048695789578363693, 'samples': 3318720, 'steps': 17284, 'loss/train': 1.6466425657272339} -08/30/2021 16:21:02 - INFO - __main__ - Step 17286: {'lr': 0.00048695620409122345, 'samples': 3318912, 'steps': 17285, 'loss/train': 1.2270723581314087} -08/30/2021 16:21:03 - INFO - __main__ - Step 17287: {'lr': 0.00048695451229204115, 'samples': 3319104, 'steps': 17286, 'loss/train': 1.5756330490112305} -08/30/2021 16:21:03 - INFO - __main__ - Step 17288: {'lr': 0.0004869528203860908, 'samples': 3319296, 'steps': 17287, 'loss/train': 1.4684290885925293} -08/30/2021 16:21:04 - INFO - __main__ - Step 17289: {'lr': 0.0004869511283733732, 'samples': 3319488, 'steps': 17288, 'loss/train': 1.3921698331832886} -08/30/2021 16:21:05 - INFO - __main__ - Step 17290: {'lr': 0.000486949436253889, 'samples': 3319680, 'steps': 17289, 'loss/train': 1.5589308738708496} -08/30/2021 16:21:05 - INFO - __main__ - Step 17291: {'lr': 0.0004869477440276391, 'samples': 3319872, 'steps': 17290, 'loss/train': 1.8033311367034912} -08/30/2021 16:21:06 - INFO - __main__ - Step 17292: {'lr': 0.00048694605169462415, 'samples': 3320064, 'steps': 17291, 'loss/train': 1.333516001701355} -08/30/2021 16:21:06 - INFO - __main__ - Step 17293: {'lr': 0.00048694435925484506, 'samples': 3320256, 'steps': 17292, 'loss/train': 1.8079005479812622} -08/30/2021 16:21:08 - INFO - __main__ - Step 17294: {'lr': 0.0004869426667083024, 'samples': 3320448, 'steps': 17293, 'loss/train': 2.0321059226989746} -08/30/2021 16:21:08 - INFO - __main__ - Step 17295: {'lr': 0.00048694097405499703, 'samples': 3320640, 'steps': 17294, 'loss/train': 1.420762538909912} -08/30/2021 16:21:09 - INFO - __main__ - Step 17296: {'lr': 0.0004869392812949298, 'samples': 3320832, 'steps': 17295, 'loss/train': 0.06690653413534164} -08/30/2021 16:21:09 - INFO - __main__ - Step 17297: {'lr': 0.00048693758842810133, 'samples': 3321024, 'steps': 17296, 'loss/train': 1.6953409910202026} -08/30/2021 16:21:09 - INFO - __main__ - Step 17298: {'lr': 0.00048693589545451243, 'samples': 3321216, 'steps': 17297, 'loss/train': 1.5967339277267456} -08/30/2021 16:21:10 - INFO - __main__ - Step 17299: {'lr': 0.00048693420237416393, 'samples': 3321408, 'steps': 17298, 'loss/train': 1.582407832145691} -08/30/2021 16:21:11 - INFO - __main__ - Step 17300: {'lr': 0.00048693250918705643, 'samples': 3321600, 'steps': 17299, 'loss/train': 1.3376667499542236} -08/30/2021 16:21:12 - INFO - __main__ - Step 17301: {'lr': 0.0004869308158931909, 'samples': 3321792, 'steps': 17300, 'loss/train': 2.073134660720825} -08/30/2021 16:21:12 - INFO - __main__ - Step 17302: {'lr': 0.00048692912249256794, 'samples': 3321984, 'steps': 17301, 'loss/train': 1.2439717054367065} -08/30/2021 16:21:12 - INFO - __main__ - Step 17303: {'lr': 0.00048692742898518836, 'samples': 3322176, 'steps': 17302, 'loss/train': 1.4036697149276733} -08/30/2021 16:21:13 - INFO - __main__ - Step 17304: {'lr': 0.000486925735371053, 'samples': 3322368, 'steps': 17303, 'loss/train': 1.7767975330352783} -08/30/2021 16:21:14 - INFO - __main__ - Step 17305: {'lr': 0.00048692404165016256, 'samples': 3322560, 'steps': 17304, 'loss/train': 1.9546399116516113} -08/30/2021 16:21:15 - INFO - __main__ - Step 17306: {'lr': 0.0004869223478225178, 'samples': 3322752, 'steps': 17305, 'loss/train': 1.1804614067077637} -08/30/2021 16:21:15 - INFO - __main__ - Step 17307: {'lr': 0.00048692065388811944, 'samples': 3322944, 'steps': 17306, 'loss/train': 1.7170722484588623} -08/30/2021 16:21:15 - INFO - __main__ - Step 17308: {'lr': 0.0004869189598469683, 'samples': 3323136, 'steps': 17307, 'loss/train': 1.4930357933044434} -08/30/2021 16:21:16 - INFO - __main__ - Step 17309: {'lr': 0.00048691726569906514, 'samples': 3323328, 'steps': 17308, 'loss/train': 1.680724024772644} -08/30/2021 16:21:19 - INFO - __main__ - Step 17310: {'lr': 0.0004869155714444107, 'samples': 3323520, 'steps': 17309, 'loss/train': 1.571215271949768} -08/30/2021 16:21:19 - INFO - __main__ - Step 17311: {'lr': 0.00048691387708300584, 'samples': 3323712, 'steps': 17310, 'loss/train': 1.4766267538070679} -08/30/2021 16:21:19 - INFO - __main__ - Step 17312: {'lr': 0.00048691218261485113, 'samples': 3323904, 'steps': 17311, 'loss/train': 1.329664945602417} -08/30/2021 16:21:20 - INFO - __main__ - Step 17313: {'lr': 0.00048691048803994755, 'samples': 3324096, 'steps': 17312, 'loss/train': 1.7416303157806396} -08/30/2021 16:21:20 - INFO - __main__ - Step 17314: {'lr': 0.00048690879335829565, 'samples': 3324288, 'steps': 17313, 'loss/train': 1.323940634727478} -08/30/2021 16:21:20 - INFO - __main__ - Step 17315: {'lr': 0.00048690709856989635, 'samples': 3324480, 'steps': 17314, 'loss/train': 2.468637228012085} -08/30/2021 16:21:21 - INFO - __main__ - Step 17316: {'lr': 0.00048690540367475046, 'samples': 3324672, 'steps': 17315, 'loss/train': 0.28997504711151123} -08/30/2021 16:21:22 - INFO - __main__ - Step 17317: {'lr': 0.00048690370867285847, 'samples': 3324864, 'steps': 17316, 'loss/train': 0.3503378927707672} -08/30/2021 16:21:23 - INFO - __main__ - Step 17318: {'lr': 0.00048690201356422146, 'samples': 3325056, 'steps': 17317, 'loss/train': 1.3354766368865967} -08/30/2021 16:21:23 - INFO - __main__ - Step 17319: {'lr': 0.00048690031834884004, 'samples': 3325248, 'steps': 17318, 'loss/train': 0.25356781482696533} -08/30/2021 16:21:24 - INFO - __main__ - Step 17320: {'lr': 0.00048689862302671495, 'samples': 3325440, 'steps': 17319, 'loss/train': 1.2663406133651733} -08/30/2021 16:21:24 - INFO - __main__ - Step 17321: {'lr': 0.000486896927597847, 'samples': 3325632, 'steps': 17320, 'loss/train': 2.2433221340179443} -08/30/2021 16:21:25 - INFO - __main__ - Step 17322: {'lr': 0.00048689523206223693, 'samples': 3325824, 'steps': 17321, 'loss/train': 1.3755285739898682} -08/30/2021 16:21:26 - INFO - __main__ - Step 17323: {'lr': 0.00048689353641988563, 'samples': 3326016, 'steps': 17322, 'loss/train': 1.7116140127182007} -08/30/2021 16:21:26 - INFO - __main__ - Step 17324: {'lr': 0.0004868918406707937, 'samples': 3326208, 'steps': 17323, 'loss/train': 1.3808372020721436} -08/30/2021 16:21:27 - INFO - __main__ - Step 17325: {'lr': 0.00048689014481496197, 'samples': 3326400, 'steps': 17324, 'loss/train': 1.2138450145721436} -08/30/2021 16:21:27 - INFO - __main__ - Step 17326: {'lr': 0.0004868884488523911, 'samples': 3326592, 'steps': 17325, 'loss/train': 1.6475673913955688} -08/30/2021 16:21:29 - INFO - __main__ - Step 17327: {'lr': 0.0004868867527830821, 'samples': 3326784, 'steps': 17326, 'loss/train': 1.5045684576034546} -08/30/2021 16:21:29 - INFO - __main__ - Step 17328: {'lr': 0.0004868850566070355, 'samples': 3326976, 'steps': 17327, 'loss/train': 0.6110200881958008} -08/30/2021 16:21:29 - INFO - __main__ - Step 17329: {'lr': 0.00048688336032425217, 'samples': 3327168, 'steps': 17328, 'loss/train': 2.3573122024536133} -08/30/2021 16:21:30 - INFO - __main__ - Step 17330: {'lr': 0.0004868816639347328, 'samples': 3327360, 'steps': 17329, 'loss/train': 1.7974035739898682} -08/30/2021 16:21:30 - INFO - __main__ - Step 17331: {'lr': 0.0004868799674384783, 'samples': 3327552, 'steps': 17330, 'loss/train': 2.2172374725341797} -08/30/2021 16:21:30 - INFO - __main__ - Step 17332: {'lr': 0.0004868782708354893, 'samples': 3327744, 'steps': 17331, 'loss/train': 1.334261178970337} -08/30/2021 16:21:32 - INFO - __main__ - Step 17333: {'lr': 0.0004868765741257666, 'samples': 3327936, 'steps': 17332, 'loss/train': 1.588341236114502} -08/30/2021 16:21:32 - INFO - __main__ - Step 17334: {'lr': 0.00048687487730931096, 'samples': 3328128, 'steps': 17333, 'loss/train': 2.2034811973571777} -08/30/2021 16:21:33 - INFO - __main__ - Step 17335: {'lr': 0.00048687318038612317, 'samples': 3328320, 'steps': 17334, 'loss/train': 1.5304841995239258} -08/30/2021 16:21:33 - INFO - __main__ - Step 17336: {'lr': 0.000486871483356204, 'samples': 3328512, 'steps': 17335, 'loss/train': 1.9972132444381714} -08/30/2021 16:21:34 - INFO - __main__ - Step 17337: {'lr': 0.00048686978621955416, 'samples': 3328704, 'steps': 17336, 'loss/train': 1.6155893802642822} -08/30/2021 16:21:35 - INFO - __main__ - Step 17338: {'lr': 0.00048686808897617447, 'samples': 3328896, 'steps': 17337, 'loss/train': 2.1802656650543213} -08/30/2021 16:21:35 - INFO - __main__ - Step 17339: {'lr': 0.00048686639162606564, 'samples': 3329088, 'steps': 17338, 'loss/train': 1.9840431213378906} -08/30/2021 16:21:36 - INFO - __main__ - Step 17340: {'lr': 0.0004868646941692285, 'samples': 3329280, 'steps': 17339, 'loss/train': 1.7624295949935913} -08/30/2021 16:21:36 - INFO - __main__ - Step 17341: {'lr': 0.0004868629966056638, 'samples': 3329472, 'steps': 17340, 'loss/train': 1.2280787229537964} -08/30/2021 16:21:36 - INFO - __main__ - Step 17342: {'lr': 0.0004868612989353722, 'samples': 3329664, 'steps': 17341, 'loss/train': 1.5077310800552368} -08/30/2021 16:21:38 - INFO - __main__ - Step 17343: {'lr': 0.0004868596011583547, 'samples': 3329856, 'steps': 17342, 'loss/train': 0.6439254879951477} -08/30/2021 16:21:39 - INFO - __main__ - Step 17344: {'lr': 0.00048685790327461184, 'samples': 3330048, 'steps': 17343, 'loss/train': 1.9081764221191406} -08/30/2021 16:21:39 - INFO - __main__ - Step 17345: {'lr': 0.0004868562052841444, 'samples': 3330240, 'steps': 17344, 'loss/train': 1.3459018468856812} -08/30/2021 16:21:39 - INFO - __main__ - Step 17346: {'lr': 0.00048685450718695335, 'samples': 3330432, 'steps': 17345, 'loss/train': 0.2580951750278473} -08/30/2021 16:21:40 - INFO - __main__ - Step 17347: {'lr': 0.00048685280898303916, 'samples': 3330624, 'steps': 17346, 'loss/train': 1.4930943250656128} -08/30/2021 16:21:40 - INFO - __main__ - Step 17348: {'lr': 0.00048685111067240283, 'samples': 3330816, 'steps': 17347, 'loss/train': 1.3986310958862305} -08/30/2021 16:21:42 - INFO - __main__ - Step 17349: {'lr': 0.00048684941225504507, 'samples': 3331008, 'steps': 17348, 'loss/train': 1.661223292350769} -08/30/2021 16:21:42 - INFO - __main__ - Step 17350: {'lr': 0.0004868477137309666, 'samples': 3331200, 'steps': 17349, 'loss/train': 2.1348724365234375} -08/30/2021 16:21:43 - INFO - __main__ - Step 17351: {'lr': 0.00048684601510016817, 'samples': 3331392, 'steps': 17350, 'loss/train': 2.4937057495117188} -08/30/2021 16:21:43 - INFO - __main__ - Step 17352: {'lr': 0.00048684431636265065, 'samples': 3331584, 'steps': 17351, 'loss/train': 1.2339820861816406} -08/30/2021 16:21:43 - INFO - __main__ - Step 17353: {'lr': 0.00048684261751841463, 'samples': 3331776, 'steps': 17352, 'loss/train': 1.6313081979751587} -08/30/2021 16:21:45 - INFO - __main__ - Step 17354: {'lr': 0.000486840918567461, 'samples': 3331968, 'steps': 17353, 'loss/train': 1.693860411643982} -08/30/2021 16:21:45 - INFO - __main__ - Step 17355: {'lr': 0.0004868392195097906, 'samples': 3332160, 'steps': 17354, 'loss/train': 1.7639496326446533} -08/30/2021 16:21:46 - INFO - __main__ - Step 17356: {'lr': 0.0004868375203454041, 'samples': 3332352, 'steps': 17355, 'loss/train': 1.3028088808059692} -08/30/2021 16:21:46 - INFO - __main__ - Step 17357: {'lr': 0.00048683582107430227, 'samples': 3332544, 'steps': 17356, 'loss/train': 0.4325411319732666} -08/30/2021 16:21:46 - INFO - __main__ - Step 17358: {'lr': 0.0004868341216964858, 'samples': 3332736, 'steps': 17357, 'loss/train': 1.8419189453125} -08/30/2021 16:21:48 - INFO - __main__ - Step 17359: {'lr': 0.00048683242221195553, 'samples': 3332928, 'steps': 17358, 'loss/train': 1.6655195951461792} -08/30/2021 16:21:48 - INFO - __main__ - Step 17360: {'lr': 0.00048683072262071224, 'samples': 3333120, 'steps': 17359, 'loss/train': 0.29443657398223877} -08/30/2021 16:21:49 - INFO - __main__ - Step 17361: {'lr': 0.00048682902292275667, 'samples': 3333312, 'steps': 17360, 'loss/train': 1.6831555366516113} -08/30/2021 16:21:49 - INFO - __main__ - Step 17362: {'lr': 0.00048682732311808964, 'samples': 3333504, 'steps': 17361, 'loss/train': 1.497959017753601} -08/30/2021 16:21:49 - INFO - __main__ - Step 17363: {'lr': 0.00048682562320671185, 'samples': 3333696, 'steps': 17362, 'loss/train': 1.7417789697647095} -08/30/2021 16:21:51 - INFO - __main__ - Step 17364: {'lr': 0.00048682392318862407, 'samples': 3333888, 'steps': 17363, 'loss/train': 1.3795396089553833} -08/30/2021 16:21:52 - INFO - __main__ - Step 17365: {'lr': 0.00048682222306382705, 'samples': 3334080, 'steps': 17364, 'loss/train': 1.7262126207351685} -08/30/2021 16:21:52 - INFO - __main__ - Step 17366: {'lr': 0.0004868205228323217, 'samples': 3334272, 'steps': 17365, 'loss/train': 1.6140670776367188} -08/30/2021 16:21:53 - INFO - __main__ - Step 17367: {'lr': 0.0004868188224941086, 'samples': 3334464, 'steps': 17366, 'loss/train': 2.37587308883667} -08/30/2021 16:21:53 - INFO - __main__ - Step 17368: {'lr': 0.0004868171220491886, 'samples': 3334656, 'steps': 17367, 'loss/train': 2.0379302501678467} -08/30/2021 16:21:54 - INFO - __main__ - Step 17369: {'lr': 0.00048681542149756253, 'samples': 3334848, 'steps': 17368, 'loss/train': 1.8309261798858643} -08/30/2021 16:21:55 - INFO - __main__ - Step 17370: {'lr': 0.00048681372083923103, 'samples': 3335040, 'steps': 17369, 'loss/train': 1.9486777782440186} -08/30/2021 16:21:55 - INFO - __main__ - Step 17371: {'lr': 0.0004868120200741949, 'samples': 3335232, 'steps': 17370, 'loss/train': 2.133272886276245} -08/30/2021 16:21:56 - INFO - __main__ - Step 17372: {'lr': 0.0004868103192024549, 'samples': 3335424, 'steps': 17371, 'loss/train': 1.6345919370651245} -08/30/2021 16:21:56 - INFO - __main__ - Step 17373: {'lr': 0.0004868086182240119, 'samples': 3335616, 'steps': 17372, 'loss/train': 1.309005618095398} -08/30/2021 16:21:58 - INFO - __main__ - Step 17374: {'lr': 0.00048680691713886653, 'samples': 3335808, 'steps': 17373, 'loss/train': 1.9788750410079956} -08/30/2021 16:21:58 - INFO - __main__ - Step 17375: {'lr': 0.00048680521594701964, 'samples': 3336000, 'steps': 17374, 'loss/train': 1.8031384944915771} -08/30/2021 16:21:59 - INFO - __main__ - Step 17376: {'lr': 0.00048680351464847207, 'samples': 3336192, 'steps': 17375, 'loss/train': 1.7543350458145142} -08/30/2021 16:21:59 - INFO - __main__ - Step 17377: {'lr': 0.00048680181324322437, 'samples': 3336384, 'steps': 17376, 'loss/train': 1.9475842714309692} -08/30/2021 16:21:59 - INFO - __main__ - Step 17378: {'lr': 0.00048680011173127746, 'samples': 3336576, 'steps': 17377, 'loss/train': 1.0543763637542725} -08/30/2021 16:22:00 - INFO - __main__ - Step 17379: {'lr': 0.00048679841011263204, 'samples': 3336768, 'steps': 17378, 'loss/train': 3.990530252456665} -08/30/2021 16:22:01 - INFO - __main__ - Step 17380: {'lr': 0.00048679670838728894, 'samples': 3336960, 'steps': 17379, 'loss/train': 0.1678185611963272} -08/30/2021 16:22:02 - INFO - __main__ - Step 17381: {'lr': 0.0004867950065552489, 'samples': 3337152, 'steps': 17380, 'loss/train': 1.7439442873001099} -08/30/2021 16:22:02 - INFO - __main__ - Step 17382: {'lr': 0.00048679330461651275, 'samples': 3337344, 'steps': 17381, 'loss/train': 1.6377366781234741} -08/30/2021 16:22:03 - INFO - __main__ - Step 17383: {'lr': 0.00048679160257108107, 'samples': 3337536, 'steps': 17382, 'loss/train': 2.1917710304260254} -08/30/2021 16:22:03 - INFO - __main__ - Step 17384: {'lr': 0.00048678990041895484, 'samples': 3337728, 'steps': 17383, 'loss/train': 1.8279938697814941} -08/30/2021 16:22:05 - INFO - __main__ - Step 17385: {'lr': 0.00048678819816013467, 'samples': 3337920, 'steps': 17384, 'loss/train': 0.23291407525539398} -08/30/2021 16:22:05 - INFO - __main__ - Step 17386: {'lr': 0.0004867864957946214, 'samples': 3338112, 'steps': 17385, 'loss/train': 1.5302484035491943} -08/30/2021 16:22:05 - INFO - __main__ - Step 17387: {'lr': 0.0004867847933224158, 'samples': 3338304, 'steps': 17386, 'loss/train': 1.5825395584106445} -08/30/2021 16:22:06 - INFO - __main__ - Step 17388: {'lr': 0.0004867830907435187, 'samples': 3338496, 'steps': 17387, 'loss/train': 1.4746028184890747} -08/30/2021 16:22:06 - INFO - __main__ - Step 17389: {'lr': 0.0004867813880579307, 'samples': 3338688, 'steps': 17388, 'loss/train': 1.6257576942443848} -08/30/2021 16:22:06 - INFO - __main__ - Step 17390: {'lr': 0.0004867796852656527, 'samples': 3338880, 'steps': 17389, 'loss/train': 1.0585116147994995} -08/30/2021 16:22:08 - INFO - __main__ - Step 17391: {'lr': 0.00048677798236668537, 'samples': 3339072, 'steps': 17390, 'loss/train': 1.5680699348449707} -08/30/2021 16:22:08 - INFO - __main__ - Step 17392: {'lr': 0.00048677627936102966, 'samples': 3339264, 'steps': 17391, 'loss/train': 2.17177414894104} -08/30/2021 16:22:09 - INFO - __main__ - Step 17393: {'lr': 0.0004867745762486861, 'samples': 3339456, 'steps': 17392, 'loss/train': 2.0008177757263184} -08/30/2021 16:22:09 - INFO - __main__ - Step 17394: {'lr': 0.0004867728730296556, 'samples': 3339648, 'steps': 17393, 'loss/train': 1.4614367485046387} -08/30/2021 16:22:09 - INFO - __main__ - Step 17395: {'lr': 0.0004867711697039389, 'samples': 3339840, 'steps': 17394, 'loss/train': 1.858125925064087} -08/30/2021 16:22:11 - INFO - __main__ - Step 17396: {'lr': 0.00048676946627153675, 'samples': 3340032, 'steps': 17395, 'loss/train': 1.4392808675765991} -08/30/2021 16:22:11 - INFO - __main__ - Step 17397: {'lr': 0.00048676776273244994, 'samples': 3340224, 'steps': 17396, 'loss/train': 1.8327624797821045} -08/30/2021 16:22:12 - INFO - __main__ - Step 17398: {'lr': 0.00048676605908667926, 'samples': 3340416, 'steps': 17397, 'loss/train': 2.5532779693603516} -08/30/2021 16:22:12 - INFO - __main__ - Step 17399: {'lr': 0.00048676435533422536, 'samples': 3340608, 'steps': 17398, 'loss/train': 1.3023334741592407} -08/30/2021 16:22:12 - INFO - __main__ - Step 17400: {'lr': 0.00048676265147508917, 'samples': 3340800, 'steps': 17399, 'loss/train': 1.5067830085754395} -08/30/2021 16:22:14 - INFO - __main__ - Step 17401: {'lr': 0.00048676094750927144, 'samples': 3340992, 'steps': 17400, 'loss/train': 1.7027322053909302} -08/30/2021 16:22:14 - INFO - __main__ - Step 17402: {'lr': 0.0004867592434367728, 'samples': 3341184, 'steps': 17401, 'loss/train': 1.6238844394683838} -08/30/2021 16:22:15 - INFO - __main__ - Step 17403: {'lr': 0.0004867575392575941, 'samples': 3341376, 'steps': 17402, 'loss/train': 1.6029798984527588} -08/30/2021 16:22:15 - INFO - __main__ - Step 17404: {'lr': 0.0004867558349717361, 'samples': 3341568, 'steps': 17403, 'loss/train': 1.3958392143249512} -08/30/2021 16:22:15 - INFO - __main__ - Step 17405: {'lr': 0.0004867541305791996, 'samples': 3341760, 'steps': 17404, 'loss/train': 1.8233625888824463} -08/30/2021 16:22:17 - INFO - __main__ - Step 17406: {'lr': 0.00048675242607998533, 'samples': 3341952, 'steps': 17405, 'loss/train': 1.6665757894515991} -08/30/2021 16:22:17 - INFO - __main__ - Step 17407: {'lr': 0.00048675072147409405, 'samples': 3342144, 'steps': 17406, 'loss/train': 1.259602665901184} -08/30/2021 16:22:18 - INFO - __main__ - Step 17408: {'lr': 0.0004867490167615266, 'samples': 3342336, 'steps': 17407, 'loss/train': 2.2457082271575928} -08/30/2021 16:22:18 - INFO - __main__ - Step 17409: {'lr': 0.0004867473119422837, 'samples': 3342528, 'steps': 17408, 'loss/train': 1.7272624969482422} -08/30/2021 16:22:18 - INFO - __main__ - Step 17410: {'lr': 0.00048674560701636606, 'samples': 3342720, 'steps': 17409, 'loss/train': 1.9000693559646606} -08/30/2021 16:22:20 - INFO - __main__ - Step 17411: {'lr': 0.0004867439019837745, 'samples': 3342912, 'steps': 17410, 'loss/train': 2.7054336071014404} -08/30/2021 16:22:20 - INFO - __main__ - Step 17412: {'lr': 0.00048674219684450985, 'samples': 3343104, 'steps': 17411, 'loss/train': 1.8756489753723145} -08/30/2021 16:22:21 - INFO - __main__ - Step 17413: {'lr': 0.00048674049159857277, 'samples': 3343296, 'steps': 17412, 'loss/train': 0.689872682094574} -08/30/2021 16:22:21 - INFO - __main__ - Step 17414: {'lr': 0.0004867387862459641, 'samples': 3343488, 'steps': 17413, 'loss/train': 1.6381309032440186} -08/30/2021 16:22:21 - INFO - __main__ - Step 17415: {'lr': 0.0004867370807866845, 'samples': 3343680, 'steps': 17414, 'loss/train': 1.8539162874221802} -08/30/2021 16:22:24 - INFO - __main__ - Step 17416: {'lr': 0.000486735375220735, 'samples': 3343872, 'steps': 17415, 'loss/train': 2.4776206016540527} -08/30/2021 16:22:24 - INFO - __main__ - Step 17417: {'lr': 0.00048673366954811605, 'samples': 3344064, 'steps': 17416, 'loss/train': 1.5945243835449219} -08/30/2021 16:22:24 - INFO - __main__ - Step 17418: {'lr': 0.0004867319637688286, 'samples': 3344256, 'steps': 17417, 'loss/train': 1.1917868852615356} -08/30/2021 16:22:25 - INFO - __main__ - Step 17419: {'lr': 0.0004867302578828734, 'samples': 3344448, 'steps': 17418, 'loss/train': 1.623712182044983} -08/30/2021 16:22:25 - INFO - __main__ - Step 17420: {'lr': 0.0004867285518902512, 'samples': 3344640, 'steps': 17419, 'loss/train': 2.194242477416992} -08/30/2021 16:22:25 - INFO - __main__ - Step 17421: {'lr': 0.0004867268457909627, 'samples': 3344832, 'steps': 17420, 'loss/train': 1.349695086479187} -08/30/2021 16:22:28 - INFO - __main__ - Step 17422: {'lr': 0.0004867251395850088, 'samples': 3345024, 'steps': 17421, 'loss/train': 0.17078430950641632} -08/30/2021 16:22:29 - INFO - __main__ - Step 17423: {'lr': 0.00048672343327239024, 'samples': 3345216, 'steps': 17422, 'loss/train': 1.512771725654602} -08/30/2021 16:22:29 - INFO - __main__ - Step 17424: {'lr': 0.00048672172685310767, 'samples': 3345408, 'steps': 17423, 'loss/train': 1.4440419673919678} -08/30/2021 16:22:29 - INFO - __main__ - Step 17425: {'lr': 0.000486720020327162, 'samples': 3345600, 'steps': 17424, 'loss/train': 1.7390447854995728} -08/30/2021 16:22:30 - INFO - __main__ - Step 17426: {'lr': 0.00048671831369455386, 'samples': 3345792, 'steps': 17425, 'loss/train': 0.44793176651000977} -08/30/2021 16:22:30 - INFO - __main__ - Step 17427: {'lr': 0.0004867166069552842, 'samples': 3345984, 'steps': 17426, 'loss/train': 2.000828266143799} -08/30/2021 16:22:30 - INFO - __main__ - Step 17428: {'lr': 0.00048671490010935366, 'samples': 3346176, 'steps': 17427, 'loss/train': 1.1772760152816772} -08/30/2021 16:22:31 - INFO - __main__ - Step 17429: {'lr': 0.00048671319315676305, 'samples': 3346368, 'steps': 17428, 'loss/train': 2.734375} -08/30/2021 16:22:32 - INFO - __main__ - Step 17430: {'lr': 0.00048671148609751307, 'samples': 3346560, 'steps': 17429, 'loss/train': 1.5546437501907349} -08/30/2021 16:22:33 - INFO - __main__ - Step 17431: {'lr': 0.0004867097789316046, 'samples': 3346752, 'steps': 17430, 'loss/train': 2.1142067909240723} -08/30/2021 16:22:33 - INFO - __main__ - Step 17432: {'lr': 0.0004867080716590384, 'samples': 3346944, 'steps': 17431, 'loss/train': 1.9760955572128296} -08/30/2021 16:22:33 - INFO - __main__ - Step 17433: {'lr': 0.0004867063642798151, 'samples': 3347136, 'steps': 17432, 'loss/train': 1.793282389640808} -08/30/2021 16:22:34 - INFO - __main__ - Step 17434: {'lr': 0.0004867046567939356, 'samples': 3347328, 'steps': 17433, 'loss/train': 1.8897130489349365} -08/30/2021 16:22:35 - INFO - __main__ - Step 17435: {'lr': 0.00048670294920140063, 'samples': 3347520, 'steps': 17434, 'loss/train': 2.087878465652466} -08/30/2021 16:22:36 - INFO - __main__ - Step 17436: {'lr': 0.00048670124150221094, 'samples': 3347712, 'steps': 17435, 'loss/train': 1.708673357963562} -08/30/2021 16:22:36 - INFO - __main__ - Step 17437: {'lr': 0.00048669953369636737, 'samples': 3347904, 'steps': 17436, 'loss/train': 1.349056601524353} -08/30/2021 16:22:36 - INFO - __main__ - Step 17438: {'lr': 0.00048669782578387067, 'samples': 3348096, 'steps': 17437, 'loss/train': 0.8885194063186646} -08/30/2021 16:22:37 - INFO - __main__ - Step 17439: {'lr': 0.00048669611776472153, 'samples': 3348288, 'steps': 17438, 'loss/train': 1.7635525465011597} -08/30/2021 16:22:37 - INFO - __main__ - Step 17440: {'lr': 0.00048669440963892074, 'samples': 3348480, 'steps': 17439, 'loss/train': 2.1269845962524414} -08/30/2021 16:22:39 - INFO - __main__ - Step 17441: {'lr': 0.00048669270140646914, 'samples': 3348672, 'steps': 17440, 'loss/train': 1.8065775632858276} -08/30/2021 16:22:39 - INFO - __main__ - Step 17442: {'lr': 0.0004866909930673675, 'samples': 3348864, 'steps': 17441, 'loss/train': 2.5166263580322266} -08/30/2021 16:22:39 - INFO - __main__ - Step 17443: {'lr': 0.00048668928462161653, 'samples': 3349056, 'steps': 17442, 'loss/train': 2.0788023471832275} -08/30/2021 16:22:40 - INFO - __main__ - Step 17444: {'lr': 0.000486687576069217, 'samples': 3349248, 'steps': 17443, 'loss/train': 5.522563934326172} -08/30/2021 16:22:40 - INFO - __main__ - Step 17445: {'lr': 0.00048668586741016967, 'samples': 3349440, 'steps': 17444, 'loss/train': 2.367457866668701} -08/30/2021 16:22:42 - INFO - __main__ - Step 17446: {'lr': 0.0004866841586444754, 'samples': 3349632, 'steps': 17445, 'loss/train': 1.866705060005188} -08/30/2021 16:22:43 - INFO - __main__ - Step 17447: {'lr': 0.0004866824497721349, 'samples': 3349824, 'steps': 17446, 'loss/train': 1.8990633487701416} -08/30/2021 16:22:43 - INFO - __main__ - Step 17448: {'lr': 0.0004866807407931489, 'samples': 3350016, 'steps': 17447, 'loss/train': 1.7508528232574463} -08/30/2021 16:22:43 - INFO - __main__ - Step 17449: {'lr': 0.0004866790317075182, 'samples': 3350208, 'steps': 17448, 'loss/train': 1.650154709815979} -08/30/2021 16:22:44 - INFO - __main__ - Step 17450: {'lr': 0.00048667732251524365, 'samples': 3350400, 'steps': 17449, 'loss/train': 1.7136389017105103} -08/30/2021 16:22:44 - INFO - __main__ - Step 17451: {'lr': 0.0004866756132163259, 'samples': 3350592, 'steps': 17450, 'loss/train': 1.9944013357162476} -08/30/2021 16:22:45 - INFO - __main__ - Step 17452: {'lr': 0.0004866739038107658, 'samples': 3350784, 'steps': 17451, 'loss/train': 0.36397862434387207} -08/30/2021 16:22:46 - INFO - __main__ - Step 17453: {'lr': 0.000486672194298564, 'samples': 3350976, 'steps': 17452, 'loss/train': 1.371496558189392} -08/30/2021 16:22:46 - INFO - __main__ - Step 17454: {'lr': 0.00048667048467972146, 'samples': 3351168, 'steps': 17453, 'loss/train': 2.206498384475708} -08/30/2021 16:22:47 - INFO - __main__ - Step 17455: {'lr': 0.00048666877495423885, 'samples': 3351360, 'steps': 17454, 'loss/train': 2.2213566303253174} -08/30/2021 16:22:47 - INFO - __main__ - Step 17456: {'lr': 0.0004866670651221169, 'samples': 3351552, 'steps': 17455, 'loss/train': 1.8459641933441162} -08/30/2021 16:22:48 - INFO - __main__ - Step 17457: {'lr': 0.0004866653551833564, 'samples': 3351744, 'steps': 17456, 'loss/train': 2.0397403240203857} -08/30/2021 16:22:49 - INFO - __main__ - Step 17458: {'lr': 0.00048666364513795816, 'samples': 3351936, 'steps': 17457, 'loss/train': 1.4646025896072388} -08/30/2021 16:22:49 - INFO - __main__ - Step 17459: {'lr': 0.00048666193498592304, 'samples': 3352128, 'steps': 17458, 'loss/train': 1.1593598127365112} -08/30/2021 16:22:50 - INFO - __main__ - Step 17460: {'lr': 0.0004866602247272516, 'samples': 3352320, 'steps': 17459, 'loss/train': 0.906301736831665} -08/30/2021 16:22:50 - INFO - __main__ - Step 17461: {'lr': 0.0004866585143619447, 'samples': 3352512, 'steps': 17460, 'loss/train': 1.827962875366211} -08/30/2021 16:22:51 - INFO - __main__ - Step 17462: {'lr': 0.00048665680389000315, 'samples': 3352704, 'steps': 17461, 'loss/train': 2.0785582065582275} -08/30/2021 16:22:52 - INFO - __main__ - Step 17463: {'lr': 0.0004866550933114277, 'samples': 3352896, 'steps': 17462, 'loss/train': 1.6082682609558105} -08/30/2021 16:22:52 - INFO - __main__ - Step 17464: {'lr': 0.00048665338262621915, 'samples': 3353088, 'steps': 17463, 'loss/train': 1.9932937622070312} -08/30/2021 16:22:53 - INFO - __main__ - Step 17465: {'lr': 0.00048665167183437817, 'samples': 3353280, 'steps': 17464, 'loss/train': 1.7249715328216553} -08/30/2021 16:22:53 - INFO - __main__ - Step 17466: {'lr': 0.00048664996093590563, 'samples': 3353472, 'steps': 17465, 'loss/train': 2.252119302749634} -08/30/2021 16:22:54 - INFO - __main__ - Step 17467: {'lr': 0.0004866482499308023, 'samples': 3353664, 'steps': 17466, 'loss/train': 2.0502357482910156} -08/30/2021 16:22:55 - INFO - __main__ - Step 17468: {'lr': 0.0004866465388190689, 'samples': 3353856, 'steps': 17467, 'loss/train': 1.966733694076538} -08/30/2021 16:22:55 - INFO - __main__ - Step 17469: {'lr': 0.0004866448276007062, 'samples': 3354048, 'steps': 17468, 'loss/train': 1.647402048110962} -08/30/2021 16:22:55 - INFO - __main__ - Step 17470: {'lr': 0.000486643116275715, 'samples': 3354240, 'steps': 17469, 'loss/train': 3.549617290496826} -08/30/2021 16:22:56 - INFO - __main__ - Step 17471: {'lr': 0.00048664140484409613, 'samples': 3354432, 'steps': 17470, 'loss/train': 1.3118197917938232} -08/30/2021 16:22:57 - INFO - __main__ - Step 17472: {'lr': 0.0004866396933058502, 'samples': 3354624, 'steps': 17471, 'loss/train': 1.5544676780700684} -08/30/2021 16:22:58 - INFO - __main__ - Step 17473: {'lr': 0.00048663798166097814, 'samples': 3354816, 'steps': 17472, 'loss/train': 2.0812900066375732} -08/30/2021 16:22:58 - INFO - __main__ - Step 17474: {'lr': 0.0004866362699094806, 'samples': 3355008, 'steps': 17473, 'loss/train': 1.616500973701477} -08/30/2021 16:22:58 - INFO - __main__ - Step 17475: {'lr': 0.0004866345580513585, 'samples': 3355200, 'steps': 17474, 'loss/train': 1.8247954845428467} -08/30/2021 16:22:59 - INFO - __main__ - Step 17476: {'lr': 0.0004866328460866124, 'samples': 3355392, 'steps': 17475, 'loss/train': 1.255110740661621} -08/30/2021 16:22:59 - INFO - __main__ - Step 17477: {'lr': 0.0004866311340152433, 'samples': 3355584, 'steps': 17476, 'loss/train': 1.3190022706985474} -08/30/2021 16:23:01 - INFO - __main__ - Step 17478: {'lr': 0.0004866294218372518, 'samples': 3355776, 'steps': 17477, 'loss/train': 1.7746151685714722} -08/30/2021 16:23:02 - INFO - __main__ - Step 17479: {'lr': 0.0004866277095526387, 'samples': 3355968, 'steps': 17478, 'loss/train': 2.225783348083496} -08/30/2021 16:23:02 - INFO - __main__ - Step 17480: {'lr': 0.00048662599716140485, 'samples': 3356160, 'steps': 17479, 'loss/train': 1.618331789970398} -08/30/2021 16:23:03 - INFO - __main__ - Step 17481: {'lr': 0.00048662428466355104, 'samples': 3356352, 'steps': 17480, 'loss/train': 1.8510490655899048} -08/30/2021 16:23:03 - INFO - __main__ - Step 17482: {'lr': 0.0004866225720590779, 'samples': 3356544, 'steps': 17481, 'loss/train': 3.352268695831299} -08/30/2021 16:23:05 - INFO - __main__ - Step 17483: {'lr': 0.00048662085934798627, 'samples': 3356736, 'steps': 17482, 'loss/train': 1.5689951181411743} -08/30/2021 16:23:05 - INFO - __main__ - Step 17484: {'lr': 0.00048661914653027694, 'samples': 3356928, 'steps': 17483, 'loss/train': 1.9016592502593994} -08/30/2021 16:23:05 - INFO - __main__ - Step 17485: {'lr': 0.0004866174336059507, 'samples': 3357120, 'steps': 17484, 'loss/train': 0.360641211271286} -08/30/2021 16:23:06 - INFO - __main__ - Step 17486: {'lr': 0.00048661572057500833, 'samples': 3357312, 'steps': 17485, 'loss/train': 0.2026984840631485} -08/30/2021 16:23:06 - INFO - __main__ - Step 17487: {'lr': 0.00048661400743745057, 'samples': 3357504, 'steps': 17486, 'loss/train': 1.749847412109375} -08/30/2021 16:23:08 - INFO - __main__ - Step 17488: {'lr': 0.00048661229419327806, 'samples': 3357696, 'steps': 17487, 'loss/train': 1.402083158493042} -08/30/2021 16:23:08 - INFO - __main__ - Step 17489: {'lr': 0.0004866105808424918, 'samples': 3357888, 'steps': 17488, 'loss/train': 1.8154724836349487} -08/30/2021 16:23:09 - INFO - __main__ - Step 17490: {'lr': 0.0004866088673850925, 'samples': 3358080, 'steps': 17489, 'loss/train': 1.7261987924575806} -08/30/2021 16:23:09 - INFO - __main__ - Step 17491: {'lr': 0.0004866071538210808, 'samples': 3358272, 'steps': 17490, 'loss/train': 1.573549747467041} -08/30/2021 16:23:09 - INFO - __main__ - Step 17492: {'lr': 0.0004866054401504576, 'samples': 3358464, 'steps': 17491, 'loss/train': 2.3931453227996826} -08/30/2021 16:23:11 - INFO - __main__ - Step 17493: {'lr': 0.0004866037263732237, 'samples': 3358656, 'steps': 17492, 'loss/train': 1.9802180528640747} -08/30/2021 16:23:12 - INFO - __main__ - Step 17494: {'lr': 0.00048660201248937974, 'samples': 3358848, 'steps': 17493, 'loss/train': 1.6586722135543823} -08/30/2021 16:23:12 - INFO - __main__ - Step 17495: {'lr': 0.0004866002984989266, 'samples': 3359040, 'steps': 17494, 'loss/train': 1.571513056755066} -08/30/2021 16:23:12 - INFO - __main__ - Step 17496: {'lr': 0.000486598584401865, 'samples': 3359232, 'steps': 17495, 'loss/train': 2.110097646713257} -08/30/2021 16:23:13 - INFO - __main__ - Step 17497: {'lr': 0.0004865968701981958, 'samples': 3359424, 'steps': 17496, 'loss/train': 1.8144365549087524} -08/30/2021 16:23:13 - INFO - __main__ - Step 17498: {'lr': 0.0004865951558879196, 'samples': 3359616, 'steps': 17497, 'loss/train': 1.760158896446228} -08/30/2021 16:23:15 - INFO - __main__ - Step 17499: {'lr': 0.00048659344147103725, 'samples': 3359808, 'steps': 17498, 'loss/train': 0.44034385681152344} -08/30/2021 16:23:15 - INFO - __main__ - Step 17500: {'lr': 0.0004865917269475496, 'samples': 3360000, 'steps': 17499, 'loss/train': 1.6851074695587158} -08/30/2021 16:23:15 - INFO - __main__ - Step 17501: {'lr': 0.00048659001231745734, 'samples': 3360192, 'steps': 17500, 'loss/train': 1.7847763299942017} -08/30/2021 16:23:16 - INFO - __main__ - Step 17502: {'lr': 0.0004865882975807614, 'samples': 3360384, 'steps': 17501, 'loss/train': 1.5666096210479736} -08/30/2021 16:23:16 - INFO - __main__ - Step 17503: {'lr': 0.00048658658273746224, 'samples': 3360576, 'steps': 17502, 'loss/train': 1.6288776397705078} -08/30/2021 16:23:18 - INFO - __main__ - Step 17504: {'lr': 0.00048658486778756097, 'samples': 3360768, 'steps': 17503, 'loss/train': 1.1607974767684937} -08/30/2021 16:23:18 - INFO - __main__ - Step 17505: {'lr': 0.0004865831527310581, 'samples': 3360960, 'steps': 17504, 'loss/train': 1.639221429824829} -08/30/2021 16:23:18 - INFO - __main__ - Step 17506: {'lr': 0.00048658143756795456, 'samples': 3361152, 'steps': 17505, 'loss/train': 1.5825897455215454} -08/30/2021 16:23:19 - INFO - __main__ - Step 17507: {'lr': 0.0004865797222982511, 'samples': 3361344, 'steps': 17506, 'loss/train': 1.4309252500534058} -08/30/2021 16:23:19 - INFO - __main__ - Step 17508: {'lr': 0.0004865780069219484, 'samples': 3361536, 'steps': 17507, 'loss/train': 1.031682014465332} -08/30/2021 16:23:21 - INFO - __main__ - Step 17509: {'lr': 0.00048657629143904733, 'samples': 3361728, 'steps': 17508, 'loss/train': 1.5543208122253418} -08/30/2021 16:23:21 - INFO - __main__ - Step 17510: {'lr': 0.0004865745758495487, 'samples': 3361920, 'steps': 17509, 'loss/train': 2.160651206970215} -08/30/2021 16:23:22 - INFO - __main__ - Step 17511: {'lr': 0.00048657286015345313, 'samples': 3362112, 'steps': 17510, 'loss/train': 2.1131794452667236} -08/30/2021 16:23:22 - INFO - __main__ - Step 17512: {'lr': 0.00048657114435076153, 'samples': 3362304, 'steps': 17511, 'loss/train': 1.8827873468399048} -08/30/2021 16:23:22 - INFO - __main__ - Step 17513: {'lr': 0.00048656942844147464, 'samples': 3362496, 'steps': 17512, 'loss/train': 1.306170105934143} -08/30/2021 16:23:24 - INFO - __main__ - Step 17514: {'lr': 0.00048656771242559316, 'samples': 3362688, 'steps': 17513, 'loss/train': 1.6868219375610352} -08/30/2021 16:23:24 - INFO - __main__ - Step 17515: {'lr': 0.0004865659963031179, 'samples': 3362880, 'steps': 17514, 'loss/train': 1.9404577016830444} -08/30/2021 16:23:24 - INFO - __main__ - Step 17516: {'lr': 0.0004865642800740497, 'samples': 3363072, 'steps': 17515, 'loss/train': 1.8532264232635498} -08/30/2021 16:23:25 - INFO - __main__ - Step 17517: {'lr': 0.0004865625637383893, 'samples': 3363264, 'steps': 17516, 'loss/train': 1.0725972652435303} -08/30/2021 16:23:25 - INFO - __main__ - Step 17518: {'lr': 0.00048656084729613747, 'samples': 3363456, 'steps': 17517, 'loss/train': 1.7218142747879028} -08/30/2021 16:23:27 - INFO - __main__ - Step 17519: {'lr': 0.0004865591307472949, 'samples': 3363648, 'steps': 17518, 'loss/train': 1.6953128576278687} -08/30/2021 16:23:27 - INFO - __main__ - Step 17520: {'lr': 0.0004865574140918625, 'samples': 3363840, 'steps': 17519, 'loss/train': 1.5887824296951294} -08/30/2021 16:23:27 - INFO - __main__ - Step 17521: {'lr': 0.00048655569732984096, 'samples': 3364032, 'steps': 17520, 'loss/train': 1.7230455875396729} -08/30/2021 16:23:28 - INFO - __main__ - Step 17522: {'lr': 0.000486553980461231, 'samples': 3364224, 'steps': 17521, 'loss/train': 1.970909833908081} -08/30/2021 16:23:28 - INFO - __main__ - Step 17523: {'lr': 0.0004865522634860335, 'samples': 3364416, 'steps': 17522, 'loss/train': 1.807120442390442} -08/30/2021 16:23:30 - INFO - __main__ - Step 17524: {'lr': 0.00048655054640424936, 'samples': 3364608, 'steps': 17523, 'loss/train': 1.5671602487564087} -08/30/2021 16:23:30 - INFO - __main__ - Step 17525: {'lr': 0.00048654882921587907, 'samples': 3364800, 'steps': 17524, 'loss/train': 2.561570882797241} -08/30/2021 16:23:30 - INFO - __main__ - Step 17526: {'lr': 0.00048654711192092347, 'samples': 3364992, 'steps': 17525, 'loss/train': 0.830582857131958} -08/30/2021 16:23:31 - INFO - __main__ - Step 17527: {'lr': 0.0004865453945193835, 'samples': 3365184, 'steps': 17526, 'loss/train': 1.5798051357269287} -08/30/2021 16:23:31 - INFO - __main__ - Step 17528: {'lr': 0.00048654367701125975, 'samples': 3365376, 'steps': 17527, 'loss/train': 1.8259228467941284} -08/30/2021 16:23:33 - INFO - __main__ - Step 17529: {'lr': 0.0004865419593965531, 'samples': 3365568, 'steps': 17528, 'loss/train': 2.335393190383911} -08/30/2021 16:23:34 - INFO - __main__ - Step 17530: {'lr': 0.0004865402416752642, 'samples': 3365760, 'steps': 17529, 'loss/train': 1.5797656774520874} -08/30/2021 16:23:34 - INFO - __main__ - Step 17531: {'lr': 0.0004865385238473941, 'samples': 3365952, 'steps': 17530, 'loss/train': 1.0944950580596924} -08/30/2021 16:23:34 - INFO - __main__ - Step 17532: {'lr': 0.00048653680591294324, 'samples': 3366144, 'steps': 17531, 'loss/train': 1.232177972793579} -08/30/2021 16:23:35 - INFO - __main__ - Step 17533: {'lr': 0.00048653508787191256, 'samples': 3366336, 'steps': 17532, 'loss/train': 2.8243906497955322} -08/30/2021 16:23:37 - INFO - __main__ - Step 17534: {'lr': 0.00048653336972430297, 'samples': 3366528, 'steps': 17533, 'loss/train': 2.401196241378784} -08/30/2021 16:23:37 - INFO - __main__ - Step 17535: {'lr': 0.0004865316514701149, 'samples': 3366720, 'steps': 17534, 'loss/train': 1.4661340713500977} -08/30/2021 16:23:38 - INFO - __main__ - Step 17536: {'lr': 0.0004865299331093495, 'samples': 3366912, 'steps': 17535, 'loss/train': 1.7392544746398926} -08/30/2021 16:23:38 - INFO - __main__ - Step 17537: {'lr': 0.0004865282146420072, 'samples': 3367104, 'steps': 17536, 'loss/train': 1.827589988708496} -08/30/2021 16:23:38 - INFO - __main__ - Step 17538: {'lr': 0.000486526496068089, 'samples': 3367296, 'steps': 17537, 'loss/train': 1.1134750843048096} -08/30/2021 16:23:39 - INFO - __main__ - Step 17539: {'lr': 0.0004865247773875956, 'samples': 3367488, 'steps': 17538, 'loss/train': 1.734523892402649} -08/30/2021 16:23:39 - INFO - __main__ - Step 17540: {'lr': 0.0004865230586005278, 'samples': 3367680, 'steps': 17539, 'loss/train': 0.24024170637130737} -08/30/2021 16:23:41 - INFO - __main__ - Step 17541: {'lr': 0.00048652133970688633, 'samples': 3367872, 'steps': 17540, 'loss/train': 0.15640875697135925} -08/30/2021 16:23:41 - INFO - __main__ - Step 17542: {'lr': 0.00048651962070667197, 'samples': 3368064, 'steps': 17541, 'loss/train': 1.7502667903900146} -08/30/2021 16:23:41 - INFO - __main__ - Step 17543: {'lr': 0.00048651790159988563, 'samples': 3368256, 'steps': 17542, 'loss/train': 0.8552508354187012} -08/30/2021 16:23:42 - INFO - __main__ - Step 17544: {'lr': 0.0004865161823865279, 'samples': 3368448, 'steps': 17543, 'loss/train': 1.3909282684326172} -08/30/2021 16:23:42 - INFO - __main__ - Step 17545: {'lr': 0.0004865144630665996, 'samples': 3368640, 'steps': 17544, 'loss/train': 1.7435178756713867} -08/30/2021 16:23:44 - INFO - __main__ - Step 17546: {'lr': 0.0004865127436401016, 'samples': 3368832, 'steps': 17545, 'loss/train': 1.4475579261779785} -08/30/2021 16:23:44 - INFO - __main__ - Step 17547: {'lr': 0.00048651102410703464, 'samples': 3369024, 'steps': 17546, 'loss/train': 1.4390286207199097} -08/30/2021 16:23:44 - INFO - __main__ - Step 17548: {'lr': 0.00048650930446739936, 'samples': 3369216, 'steps': 17547, 'loss/train': 1.4975570440292358} -08/30/2021 16:23:45 - INFO - __main__ - Step 17549: {'lr': 0.00048650758472119666, 'samples': 3369408, 'steps': 17548, 'loss/train': 1.786547303199768} -08/30/2021 16:23:45 - INFO - __main__ - Step 17550: {'lr': 0.0004865058648684273, 'samples': 3369600, 'steps': 17549, 'loss/train': 1.720345139503479} -08/30/2021 16:23:46 - INFO - __main__ - Step 17551: {'lr': 0.00048650414490909207, 'samples': 3369792, 'steps': 17550, 'loss/train': 1.4965839385986328} -08/30/2021 16:23:47 - INFO - __main__ - Step 17552: {'lr': 0.00048650242484319175, 'samples': 3369984, 'steps': 17551, 'loss/train': 1.6356937885284424} -08/30/2021 16:23:47 - INFO - __main__ - Step 17553: {'lr': 0.000486500704670727, 'samples': 3370176, 'steps': 17552, 'loss/train': 1.6092661619186401} -08/30/2021 16:23:48 - INFO - __main__ - Step 17554: {'lr': 0.0004864989843916987, 'samples': 3370368, 'steps': 17553, 'loss/train': 1.1740132570266724} -08/30/2021 16:23:48 - INFO - __main__ - Step 17555: {'lr': 0.0004864972640061077, 'samples': 3370560, 'steps': 17554, 'loss/train': 1.7153794765472412} -08/30/2021 16:23:49 - INFO - __main__ - Step 17556: {'lr': 0.00048649554351395453, 'samples': 3370752, 'steps': 17555, 'loss/train': 2.135126829147339} -08/30/2021 16:23:50 - INFO - __main__ - Step 17557: {'lr': 0.00048649382291524024, 'samples': 3370944, 'steps': 17556, 'loss/train': 1.6388752460479736} -08/30/2021 16:23:50 - INFO - __main__ - Step 17558: {'lr': 0.0004864921022099654, 'samples': 3371136, 'steps': 17557, 'loss/train': 1.245361328125} -08/30/2021 16:23:51 - INFO - __main__ - Step 17559: {'lr': 0.00048649038139813097, 'samples': 3371328, 'steps': 17558, 'loss/train': 0.5165625214576721} -08/30/2021 16:23:51 - INFO - __main__ - Step 17560: {'lr': 0.00048648866047973756, 'samples': 3371520, 'steps': 17559, 'loss/train': 1.52119779586792} -08/30/2021 16:23:52 - INFO - __main__ - Step 17561: {'lr': 0.000486486939454786, 'samples': 3371712, 'steps': 17560, 'loss/train': 1.4700878858566284} -08/30/2021 16:23:53 - INFO - __main__ - Step 17562: {'lr': 0.0004864852183232771, 'samples': 3371904, 'steps': 17561, 'loss/train': 1.4670953750610352} -08/30/2021 16:23:53 - INFO - __main__ - Step 17563: {'lr': 0.0004864834970852116, 'samples': 3372096, 'steps': 17562, 'loss/train': 1.9046157598495483} -08/30/2021 16:23:54 - INFO - __main__ - Step 17564: {'lr': 0.0004864817757405903, 'samples': 3372288, 'steps': 17563, 'loss/train': 0.10192663967609406} -08/30/2021 16:23:54 - INFO - __main__ - Step 17565: {'lr': 0.0004864800542894139, 'samples': 3372480, 'steps': 17564, 'loss/train': 1.6360749006271362} -08/30/2021 16:23:56 - INFO - __main__ - Step 17566: {'lr': 0.0004864783327316833, 'samples': 3372672, 'steps': 17565, 'loss/train': 2.031972885131836} -08/30/2021 16:23:57 - INFO - __main__ - Step 17567: {'lr': 0.0004864766110673992, 'samples': 3372864, 'steps': 17566, 'loss/train': 1.7081667184829712} -08/30/2021 16:23:57 - INFO - __main__ - Step 17568: {'lr': 0.00048647488929656237, 'samples': 3373056, 'steps': 17567, 'loss/train': 1.829378604888916} -08/30/2021 16:23:57 - INFO - __main__ - Step 17569: {'lr': 0.00048647316741917365, 'samples': 3373248, 'steps': 17568, 'loss/train': 0.38812997937202454} -08/30/2021 16:23:58 - INFO - __main__ - Step 17570: {'lr': 0.0004864714454352337, 'samples': 3373440, 'steps': 17569, 'loss/train': 1.7490671873092651} -08/30/2021 16:23:59 - INFO - __main__ - Step 17571: {'lr': 0.00048646972334474343, 'samples': 3373632, 'steps': 17570, 'loss/train': 2.08906888961792} -08/30/2021 16:24:00 - INFO - __main__ - Step 17572: {'lr': 0.0004864680011477035, 'samples': 3373824, 'steps': 17571, 'loss/train': 1.4270910024642944} -08/30/2021 16:24:00 - INFO - __main__ - Step 17573: {'lr': 0.00048646627884411475, 'samples': 3374016, 'steps': 17572, 'loss/train': 1.5729337930679321} -08/30/2021 16:24:01 - INFO - __main__ - Step 17574: {'lr': 0.00048646455643397803, 'samples': 3374208, 'steps': 17573, 'loss/train': 1.4936065673828125} -08/30/2021 16:24:01 - INFO - __main__ - Step 17575: {'lr': 0.0004864628339172939, 'samples': 3374400, 'steps': 17574, 'loss/train': 2.0495150089263916} -08/30/2021 16:24:01 - INFO - __main__ - Step 17576: {'lr': 0.00048646111129406336, 'samples': 3374592, 'steps': 17575, 'loss/train': 1.1590380668640137} -08/30/2021 16:24:03 - INFO - __main__ - Step 17577: {'lr': 0.00048645938856428704, 'samples': 3374784, 'steps': 17576, 'loss/train': 1.0573232173919678} -08/30/2021 16:24:03 - INFO - __main__ - Step 17578: {'lr': 0.0004864576657279658, 'samples': 3374976, 'steps': 17577, 'loss/train': 1.2430789470672607} -08/30/2021 16:24:03 - INFO - __main__ - Step 17579: {'lr': 0.0004864559427851003, 'samples': 3375168, 'steps': 17578, 'loss/train': 1.875684142112732} -08/30/2021 16:24:04 - INFO - __main__ - Step 17580: {'lr': 0.0004864542197356915, 'samples': 3375360, 'steps': 17579, 'loss/train': 1.5721102952957153} -08/30/2021 16:24:04 - INFO - __main__ - Step 17581: {'lr': 0.00048645249657974007, 'samples': 3375552, 'steps': 17580, 'loss/train': 1.1137334108352661} -08/30/2021 16:24:06 - INFO - __main__ - Step 17582: {'lr': 0.00048645077331724675, 'samples': 3375744, 'steps': 17581, 'loss/train': 2.0492448806762695} -08/30/2021 16:24:06 - INFO - __main__ - Step 17583: {'lr': 0.00048644904994821236, 'samples': 3375936, 'steps': 17582, 'loss/train': 1.9140725135803223} -08/30/2021 16:24:06 - INFO - __main__ - Step 17584: {'lr': 0.0004864473264726377, 'samples': 3376128, 'steps': 17583, 'loss/train': 1.8759957551956177} -08/30/2021 16:24:07 - INFO - __main__ - Step 17585: {'lr': 0.00048644560289052354, 'samples': 3376320, 'steps': 17584, 'loss/train': 1.6567912101745605} -08/30/2021 16:24:07 - INFO - __main__ - Step 17586: {'lr': 0.0004864438792018706, 'samples': 3376512, 'steps': 17585, 'loss/train': 1.447975993156433} -08/30/2021 16:24:08 - INFO - __main__ - Step 17587: {'lr': 0.0004864421554066797, 'samples': 3376704, 'steps': 17586, 'loss/train': 1.0083297491073608} -08/30/2021 16:24:09 - INFO - __main__ - Step 17588: {'lr': 0.00048644043150495165, 'samples': 3376896, 'steps': 17587, 'loss/train': 1.7974839210510254} -08/30/2021 16:24:10 - INFO - __main__ - Step 17589: {'lr': 0.00048643870749668717, 'samples': 3377088, 'steps': 17588, 'loss/train': 1.3072870969772339} -08/30/2021 16:24:10 - INFO - __main__ - Step 17590: {'lr': 0.000486436983381887, 'samples': 3377280, 'steps': 17589, 'loss/train': 1.7835060358047485} -08/30/2021 16:24:11 - INFO - __main__ - Step 17591: {'lr': 0.0004864352591605521, 'samples': 3377472, 'steps': 17590, 'loss/train': 1.905362844467163} -08/30/2021 16:24:11 - INFO - __main__ - Step 17592: {'lr': 0.00048643353483268306, 'samples': 3377664, 'steps': 17591, 'loss/train': 1.7080096006393433} -08/30/2021 16:24:13 - INFO - __main__ - Step 17593: {'lr': 0.00048643181039828066, 'samples': 3377856, 'steps': 17592, 'loss/train': 1.9489187002182007} -08/30/2021 16:24:13 - INFO - __main__ - Step 17594: {'lr': 0.00048643008585734575, 'samples': 3378048, 'steps': 17593, 'loss/train': 0.11998263746500015} -08/30/2021 16:24:14 - INFO - __main__ - Step 17595: {'lr': 0.00048642836120987913, 'samples': 3378240, 'steps': 17594, 'loss/train': 2.023465156555176} -08/30/2021 16:24:14 - INFO - __main__ - Step 17596: {'lr': 0.0004864266364558816, 'samples': 3378432, 'steps': 17595, 'loss/train': 1.4682003259658813} -08/30/2021 16:24:14 - INFO - __main__ - Step 17597: {'lr': 0.00048642491159535373, 'samples': 3378624, 'steps': 17596, 'loss/train': 1.3541736602783203} -08/30/2021 16:24:15 - INFO - __main__ - Step 17598: {'lr': 0.0004864231866282965, 'samples': 3378816, 'steps': 17597, 'loss/train': 2.111245632171631} -08/30/2021 16:24:16 - INFO - __main__ - Step 17599: {'lr': 0.0004864214615547107, 'samples': 3379008, 'steps': 17598, 'loss/train': 1.268403172492981} -08/30/2021 16:24:16 - INFO - __main__ - Step 17600: {'lr': 0.000486419736374597, 'samples': 3379200, 'steps': 17599, 'loss/train': 1.5935360193252563} -08/30/2021 16:24:17 - INFO - __main__ - Step 17601: {'lr': 0.0004864180110879562, 'samples': 3379392, 'steps': 17600, 'loss/train': 1.3745697736740112} -08/30/2021 16:24:17 - INFO - __main__ - Step 17602: {'lr': 0.00048641628569478916, 'samples': 3379584, 'steps': 17601, 'loss/train': 1.301063895225525} -08/30/2021 16:24:18 - INFO - __main__ - Step 17603: {'lr': 0.00048641456019509643, 'samples': 3379776, 'steps': 17602, 'loss/train': 1.8030059337615967} -08/30/2021 16:24:19 - INFO - __main__ - Step 17604: {'lr': 0.0004864128345888791, 'samples': 3379968, 'steps': 17603, 'loss/train': 1.6895872354507446} -08/30/2021 16:24:20 - INFO - __main__ - Step 17605: {'lr': 0.0004864111088761377, 'samples': 3380160, 'steps': 17604, 'loss/train': 1.3598532676696777} -08/30/2021 16:24:20 - INFO - __main__ - Step 17606: {'lr': 0.00048640938305687315, 'samples': 3380352, 'steps': 17605, 'loss/train': 0.15379035472869873} -08/30/2021 16:24:21 - INFO - __main__ - Step 17607: {'lr': 0.00048640765713108615, 'samples': 3380544, 'steps': 17606, 'loss/train': 1.9393595457077026} -08/30/2021 16:24:21 - INFO - __main__ - Step 17608: {'lr': 0.00048640593109877754, 'samples': 3380736, 'steps': 17607, 'loss/train': 0.3218410015106201} -08/30/2021 16:24:21 - INFO - __main__ - Step 17609: {'lr': 0.00048640420495994806, 'samples': 3380928, 'steps': 17608, 'loss/train': 1.898372769355774} -08/30/2021 16:24:23 - INFO - __main__ - Step 17610: {'lr': 0.0004864024787145985, 'samples': 3381120, 'steps': 17609, 'loss/train': 1.7394880056381226} -08/30/2021 16:24:23 - INFO - __main__ - Step 17611: {'lr': 0.00048640075236272963, 'samples': 3381312, 'steps': 17610, 'loss/train': 1.656727910041809} -08/30/2021 16:24:24 - INFO - __main__ - Step 17612: {'lr': 0.00048639902590434214, 'samples': 3381504, 'steps': 17611, 'loss/train': 1.1785953044891357} -08/30/2021 16:24:24 - INFO - __main__ - Step 17613: {'lr': 0.000486397299339437, 'samples': 3381696, 'steps': 17612, 'loss/train': 1.621639609336853} -08/30/2021 16:24:24 - INFO - __main__ - Step 17614: {'lr': 0.0004863955726680149, 'samples': 3381888, 'steps': 17613, 'loss/train': 1.469756007194519} -08/30/2021 16:24:26 - INFO - __main__ - Step 17615: {'lr': 0.0004863938458900765, 'samples': 3382080, 'steps': 17614, 'loss/train': 1.897817611694336} -08/30/2021 16:24:27 - INFO - __main__ - Step 17616: {'lr': 0.0004863921190056227, 'samples': 3382272, 'steps': 17615, 'loss/train': 1.5590382814407349} -08/30/2021 16:24:27 - INFO - __main__ - Step 17617: {'lr': 0.0004863903920146544, 'samples': 3382464, 'steps': 17616, 'loss/train': 1.265742540359497} -08/30/2021 16:24:28 - INFO - __main__ - Step 17618: {'lr': 0.00048638866491717214, 'samples': 3382656, 'steps': 17617, 'loss/train': 2.574831247329712} -08/30/2021 16:24:28 - INFO - __main__ - Step 17619: {'lr': 0.00048638693771317675, 'samples': 3382848, 'steps': 17618, 'loss/train': 1.6485815048217773} -08/30/2021 16:24:28 - INFO - __main__ - Step 17620: {'lr': 0.0004863852104026691, 'samples': 3383040, 'steps': 17619, 'loss/train': 1.6006711721420288} -08/30/2021 16:24:30 - INFO - __main__ - Step 17621: {'lr': 0.00048638348298564996, 'samples': 3383232, 'steps': 17620, 'loss/train': 1.7198574542999268} -08/30/2021 16:24:31 - INFO - __main__ - Step 17622: {'lr': 0.00048638175546212, 'samples': 3383424, 'steps': 17621, 'loss/train': 2.257721424102783} -08/30/2021 16:24:31 - INFO - __main__ - Step 17623: {'lr': 0.00048638002783208013, 'samples': 3383616, 'steps': 17622, 'loss/train': 1.4844609498977661} -08/30/2021 16:24:31 - INFO - __main__ - Step 17624: {'lr': 0.000486378300095531, 'samples': 3383808, 'steps': 17623, 'loss/train': 1.7797285318374634} -08/30/2021 16:24:32 - INFO - __main__ - Step 17625: {'lr': 0.0004863765722524735, 'samples': 3384000, 'steps': 17624, 'loss/train': 1.936982274055481} -08/30/2021 16:24:33 - INFO - __main__ - Step 17626: {'lr': 0.0004863748443029083, 'samples': 3384192, 'steps': 17625, 'loss/train': 1.141573190689087} -08/30/2021 16:24:34 - INFO - __main__ - Step 17627: {'lr': 0.00048637311624683634, 'samples': 3384384, 'steps': 17626, 'loss/train': 1.7004591226577759} -08/30/2021 16:24:34 - INFO - __main__ - Step 17628: {'lr': 0.0004863713880842583, 'samples': 3384576, 'steps': 17627, 'loss/train': 1.8569802045822144} -08/30/2021 16:24:34 - INFO - __main__ - Step 17629: {'lr': 0.0004863696598151749, 'samples': 3384768, 'steps': 17628, 'loss/train': 1.8134541511535645} -08/30/2021 16:24:35 - INFO - __main__ - Step 17630: {'lr': 0.00048636793143958695, 'samples': 3384960, 'steps': 17629, 'loss/train': 1.7280523777008057} -08/30/2021 16:24:35 - INFO - __main__ - Step 17631: {'lr': 0.00048636620295749533, 'samples': 3385152, 'steps': 17630, 'loss/train': 1.4507464170455933} -08/30/2021 16:24:36 - INFO - __main__ - Step 17632: {'lr': 0.00048636447436890075, 'samples': 3385344, 'steps': 17631, 'loss/train': 1.9362410306930542} -08/30/2021 16:24:37 - INFO - __main__ - Step 17633: {'lr': 0.0004863627456738039, 'samples': 3385536, 'steps': 17632, 'loss/train': 2.50399112701416} -08/30/2021 16:24:37 - INFO - __main__ - Step 17634: {'lr': 0.00048636101687220566, 'samples': 3385728, 'steps': 17633, 'loss/train': 0.6674114465713501} -08/30/2021 16:24:38 - INFO - __main__ - Step 17635: {'lr': 0.0004863592879641069, 'samples': 3385920, 'steps': 17634, 'loss/train': 2.0079925060272217} -08/30/2021 16:24:38 - INFO - __main__ - Step 17636: {'lr': 0.0004863575589495082, 'samples': 3386112, 'steps': 17635, 'loss/train': 1.5300225019454956} -08/30/2021 16:24:40 - INFO - __main__ - Step 17637: {'lr': 0.00048635582982841047, 'samples': 3386304, 'steps': 17636, 'loss/train': 2.4551563262939453} -08/30/2021 16:24:41 - INFO - __main__ - Step 17638: {'lr': 0.0004863541006008144, 'samples': 3386496, 'steps': 17637, 'loss/train': 1.9068865776062012} -08/30/2021 16:24:41 - INFO - __main__ - Step 17639: {'lr': 0.0004863523712667209, 'samples': 3386688, 'steps': 17638, 'loss/train': 1.994493007659912} -08/30/2021 16:24:41 - INFO - __main__ - Step 17640: {'lr': 0.00048635064182613063, 'samples': 3386880, 'steps': 17639, 'loss/train': 1.995773196220398} -08/30/2021 16:24:42 - INFO - __main__ - Step 17641: {'lr': 0.00048634891227904435, 'samples': 3387072, 'steps': 17640, 'loss/train': 1.3929442167282104} -08/30/2021 16:24:43 - INFO - __main__ - Step 17642: {'lr': 0.00048634718262546297, 'samples': 3387264, 'steps': 17641, 'loss/train': 1.0950262546539307} -08/30/2021 16:24:44 - INFO - __main__ - Step 17643: {'lr': 0.0004863454528653872, 'samples': 3387456, 'steps': 17642, 'loss/train': 1.6616877317428589} -08/30/2021 16:24:44 - INFO - __main__ - Step 17644: {'lr': 0.0004863437229988178, 'samples': 3387648, 'steps': 17643, 'loss/train': 1.6589170694351196} -08/30/2021 16:24:44 - INFO - __main__ - Step 17645: {'lr': 0.00048634199302575554, 'samples': 3387840, 'steps': 17644, 'loss/train': 1.4650273323059082} -08/30/2021 16:24:45 - INFO - __main__ - Step 17646: {'lr': 0.00048634026294620125, 'samples': 3388032, 'steps': 17645, 'loss/train': 1.4868621826171875} -08/30/2021 16:24:46 - INFO - __main__ - Step 17647: {'lr': 0.00048633853276015566, 'samples': 3388224, 'steps': 17646, 'loss/train': 2.0076630115509033} -08/30/2021 16:24:47 - INFO - __main__ - Step 17648: {'lr': 0.00048633680246761956, 'samples': 3388416, 'steps': 17647, 'loss/train': 1.830798864364624} -08/30/2021 16:24:47 - INFO - __main__ - Step 17649: {'lr': 0.00048633507206859383, 'samples': 3388608, 'steps': 17648, 'loss/train': 2.4800283908843994} -08/30/2021 16:24:47 - INFO - __main__ - Step 17650: {'lr': 0.00048633334156307907, 'samples': 3388800, 'steps': 17649, 'loss/train': 1.6565618515014648} -08/30/2021 16:24:48 - INFO - __main__ - Step 17651: {'lr': 0.0004863316109510762, 'samples': 3388992, 'steps': 17650, 'loss/train': 1.6478811502456665} -08/30/2021 16:24:49 - INFO - __main__ - Step 17652: {'lr': 0.00048632988023258596, 'samples': 3389184, 'steps': 17651, 'loss/train': 1.6498517990112305} -08/30/2021 16:24:50 - INFO - __main__ - Step 17653: {'lr': 0.00048632814940760907, 'samples': 3389376, 'steps': 17652, 'loss/train': 1.7267106771469116} -08/30/2021 16:24:50 - INFO - __main__ - Step 17654: {'lr': 0.00048632641847614645, 'samples': 3389568, 'steps': 17653, 'loss/train': 1.8104838132858276} -08/30/2021 16:24:50 - INFO - __main__ - Step 17655: {'lr': 0.0004863246874381987, 'samples': 3389760, 'steps': 17654, 'loss/train': 0.7106810808181763} -08/30/2021 16:24:51 - INFO - __main__ - Step 17656: {'lr': 0.00048632295629376675, 'samples': 3389952, 'steps': 17655, 'loss/train': 1.741978406906128} -08/30/2021 16:24:52 - INFO - __main__ - Step 17657: {'lr': 0.00048632122504285133, 'samples': 3390144, 'steps': 17656, 'loss/train': 1.5844680070877075} -08/30/2021 16:24:53 - INFO - __main__ - Step 17658: {'lr': 0.0004863194936854531, 'samples': 3390336, 'steps': 17657, 'loss/train': 1.7016268968582153} -08/30/2021 16:24:53 - INFO - __main__ - Step 17659: {'lr': 0.0004863177622215731, 'samples': 3390528, 'steps': 17658, 'loss/train': 1.6292468309402466} -08/30/2021 16:24:54 - INFO - __main__ - Step 17660: {'lr': 0.00048631603065121186, 'samples': 3390720, 'steps': 17659, 'loss/train': 1.6936275959014893} -08/30/2021 16:24:54 - INFO - __main__ - Step 17661: {'lr': 0.00048631429897437033, 'samples': 3390912, 'steps': 17660, 'loss/train': 0.9331439733505249} -08/30/2021 16:24:54 - INFO - __main__ - Step 17662: {'lr': 0.0004863125671910492, 'samples': 3391104, 'steps': 17661, 'loss/train': 6.046341896057129} -08/30/2021 16:24:55 - INFO - __main__ - Step 17663: {'lr': 0.00048631083530124934, 'samples': 3391296, 'steps': 17662, 'loss/train': 1.7382398843765259} -08/30/2021 16:24:56 - INFO - __main__ - Step 17664: {'lr': 0.00048630910330497133, 'samples': 3391488, 'steps': 17663, 'loss/train': 1.9881970882415771} -08/30/2021 16:24:57 - INFO - __main__ - Step 17665: {'lr': 0.0004863073712022162, 'samples': 3391680, 'steps': 17664, 'loss/train': 1.7396708726882935} -08/30/2021 16:24:57 - INFO - __main__ - Step 17666: {'lr': 0.00048630563899298453, 'samples': 3391872, 'steps': 17665, 'loss/train': 1.8456741571426392} -08/30/2021 16:24:57 - INFO - __main__ - Step 17667: {'lr': 0.00048630390667727725, 'samples': 3392064, 'steps': 17666, 'loss/train': 1.488634467124939} -08/30/2021 16:24:58 - INFO - __main__ - Step 17668: {'lr': 0.00048630217425509503, 'samples': 3392256, 'steps': 17667, 'loss/train': 1.8691930770874023} -08/30/2021 16:24:59 - INFO - __main__ - Step 17669: {'lr': 0.00048630044172643874, 'samples': 3392448, 'steps': 17668, 'loss/train': 1.8067786693572998} -08/30/2021 16:25:00 - INFO - __main__ - Step 17670: {'lr': 0.0004862987090913091, 'samples': 3392640, 'steps': 17669, 'loss/train': 1.7889330387115479} -08/30/2021 16:25:00 - INFO - __main__ - Step 17671: {'lr': 0.0004862969763497069, 'samples': 3392832, 'steps': 17670, 'loss/train': 1.8399053812026978} -08/30/2021 16:25:01 - INFO - __main__ - Step 17672: {'lr': 0.0004862952435016329, 'samples': 3393024, 'steps': 17671, 'loss/train': 1.7011256217956543} -08/30/2021 16:25:01 - INFO - __main__ - Step 17673: {'lr': 0.00048629351054708795, 'samples': 3393216, 'steps': 17672, 'loss/train': 1.8765562772750854} -08/30/2021 16:25:02 - INFO - __main__ - Step 17674: {'lr': 0.0004862917774860728, 'samples': 3393408, 'steps': 17673, 'loss/train': 0.143140971660614} -08/30/2021 16:25:03 - INFO - __main__ - Step 17675: {'lr': 0.0004862900443185882, 'samples': 3393600, 'steps': 17674, 'loss/train': 0.4153665006160736} -08/30/2021 16:25:03 - INFO - __main__ - Step 17676: {'lr': 0.00048628831104463496, 'samples': 3393792, 'steps': 17675, 'loss/train': 1.7494155168533325} -08/30/2021 16:25:04 - INFO - __main__ - Step 17677: {'lr': 0.0004862865776642138, 'samples': 3393984, 'steps': 17676, 'loss/train': 1.814841389656067} -08/30/2021 16:25:04 - INFO - __main__ - Step 17678: {'lr': 0.00048628484417732567, 'samples': 3394176, 'steps': 17677, 'loss/train': 1.5618295669555664} -08/30/2021 16:25:06 - INFO - __main__ - Step 17679: {'lr': 0.00048628311058397113, 'samples': 3394368, 'steps': 17678, 'loss/train': 0.9141178727149963} -08/30/2021 16:25:06 - INFO - __main__ - Step 17680: {'lr': 0.0004862813768841511, 'samples': 3394560, 'steps': 17679, 'loss/train': 1.3781713247299194} -08/30/2021 16:25:06 - INFO - __main__ - Step 17681: {'lr': 0.0004862796430778663, 'samples': 3394752, 'steps': 17680, 'loss/train': 1.9683810472488403} -08/30/2021 16:25:07 - INFO - __main__ - Step 17682: {'lr': 0.0004862779091651176, 'samples': 3394944, 'steps': 17681, 'loss/train': 2.0991878509521484} -08/30/2021 16:25:07 - INFO - __main__ - Step 17683: {'lr': 0.0004862761751459057, 'samples': 3395136, 'steps': 17682, 'loss/train': 2.1489808559417725} -08/30/2021 16:25:09 - INFO - __main__ - Step 17684: {'lr': 0.0004862744410202314, 'samples': 3395328, 'steps': 17683, 'loss/train': 1.5708801746368408} -08/30/2021 16:25:09 - INFO - __main__ - Step 17685: {'lr': 0.00048627270678809544, 'samples': 3395520, 'steps': 17684, 'loss/train': 1.5949734449386597} -08/30/2021 16:25:09 - INFO - __main__ - Step 17686: {'lr': 0.0004862709724494987, 'samples': 3395712, 'steps': 17685, 'loss/train': 1.6808841228485107} -08/30/2021 16:25:10 - INFO - __main__ - Step 17687: {'lr': 0.0004862692380044419, 'samples': 3395904, 'steps': 17686, 'loss/train': 1.69366455078125} -08/30/2021 16:25:10 - INFO - __main__ - Step 17688: {'lr': 0.0004862675034529258, 'samples': 3396096, 'steps': 17687, 'loss/train': 1.183712124824524} -08/30/2021 16:25:12 - INFO - __main__ - Step 17689: {'lr': 0.0004862657687949512, 'samples': 3396288, 'steps': 17688, 'loss/train': 1.6497210264205933} -08/30/2021 16:25:12 - INFO - __main__ - Step 17690: {'lr': 0.00048626403403051894, 'samples': 3396480, 'steps': 17689, 'loss/train': 1.8684240579605103} -08/30/2021 16:25:13 - INFO - __main__ - Step 17691: {'lr': 0.00048626229915962974, 'samples': 3396672, 'steps': 17690, 'loss/train': 0.08506304025650024} -08/30/2021 16:25:13 - INFO - __main__ - Step 17692: {'lr': 0.00048626056418228436, 'samples': 3396864, 'steps': 17691, 'loss/train': 2.190805435180664} -08/30/2021 16:25:13 - INFO - __main__ - Step 17693: {'lr': 0.0004862588290984836, 'samples': 3397056, 'steps': 17692, 'loss/train': 1.9205013513565063} -08/30/2021 16:25:14 - INFO - __main__ - Step 17694: {'lr': 0.0004862570939082283, 'samples': 3397248, 'steps': 17693, 'loss/train': 1.5624686479568481} -08/30/2021 16:25:16 - INFO - __main__ - Step 17695: {'lr': 0.0004862553586115192, 'samples': 3397440, 'steps': 17694, 'loss/train': 1.7238426208496094} -08/30/2021 16:25:16 - INFO - __main__ - Step 17696: {'lr': 0.00048625362320835707, 'samples': 3397632, 'steps': 17695, 'loss/train': 1.9803744554519653} -08/30/2021 16:25:17 - INFO - __main__ - Step 17697: {'lr': 0.00048625188769874274, 'samples': 3397824, 'steps': 17696, 'loss/train': 1.5344154834747314} -08/30/2021 16:25:17 - INFO - __main__ - Step 17698: {'lr': 0.0004862501520826769, 'samples': 3398016, 'steps': 17697, 'loss/train': 0.9941984415054321} -08/30/2021 16:25:17 - INFO - __main__ - Step 17699: {'lr': 0.0004862484163601604, 'samples': 3398208, 'steps': 17698, 'loss/train': 0.08878421783447266} -08/30/2021 16:25:19 - INFO - __main__ - Step 17700: {'lr': 0.000486246680531194, 'samples': 3398400, 'steps': 17699, 'loss/train': 1.453533411026001} -08/30/2021 16:25:19 - INFO - __main__ - Step 17701: {'lr': 0.0004862449445957785, 'samples': 3398592, 'steps': 17700, 'loss/train': 1.675041913986206} -08/30/2021 16:25:20 - INFO - __main__ - Step 17702: {'lr': 0.00048624320855391467, 'samples': 3398784, 'steps': 17701, 'loss/train': 1.457558035850525} -08/30/2021 16:25:20 - INFO - __main__ - Step 17703: {'lr': 0.00048624147240560335, 'samples': 3398976, 'steps': 17702, 'loss/train': 1.555201530456543} -08/30/2021 16:25:20 - INFO - __main__ - Step 17704: {'lr': 0.00048623973615084516, 'samples': 3399168, 'steps': 17703, 'loss/train': 1.6829344034194946} -08/30/2021 16:25:22 - INFO - __main__ - Step 17705: {'lr': 0.0004862379997896411, 'samples': 3399360, 'steps': 17704, 'loss/train': 1.406872272491455} -08/30/2021 16:25:22 - INFO - __main__ - Step 17706: {'lr': 0.0004862362633219918, 'samples': 3399552, 'steps': 17705, 'loss/train': 1.8866908550262451} -08/30/2021 16:25:23 - INFO - __main__ - Step 17707: {'lr': 0.000486234526747898, 'samples': 3399744, 'steps': 17706, 'loss/train': 1.6731010675430298} -08/30/2021 16:25:23 - INFO - __main__ - Step 17708: {'lr': 0.0004862327900673607, 'samples': 3399936, 'steps': 17707, 'loss/train': 2.172962188720703} -08/30/2021 16:25:23 - INFO - __main__ - Step 17709: {'lr': 0.00048623105328038054, 'samples': 3400128, 'steps': 17708, 'loss/train': 1.1505485773086548} -08/30/2021 16:25:25 - INFO - __main__ - Step 17710: {'lr': 0.0004862293163869582, 'samples': 3400320, 'steps': 17709, 'loss/train': 1.3676457405090332} -08/30/2021 16:25:25 - INFO - __main__ - Step 17711: {'lr': 0.00048622757938709466, 'samples': 3400512, 'steps': 17710, 'loss/train': 0.37289196252822876} -08/30/2021 16:25:26 - INFO - __main__ - Step 17712: {'lr': 0.0004862258422807906, 'samples': 3400704, 'steps': 17711, 'loss/train': 1.7323291301727295} -08/30/2021 16:25:26 - INFO - __main__ - Step 17713: {'lr': 0.0004862241050680468, 'samples': 3400896, 'steps': 17712, 'loss/train': 2.248530864715576} -08/30/2021 16:25:26 - INFO - __main__ - Step 17714: {'lr': 0.00048622236774886415, 'samples': 3401088, 'steps': 17713, 'loss/train': 0.818747878074646} -08/30/2021 16:25:28 - INFO - __main__ - Step 17715: {'lr': 0.00048622063032324324, 'samples': 3401280, 'steps': 17714, 'loss/train': 1.9397470951080322} -08/30/2021 16:25:28 - INFO - __main__ - Step 17716: {'lr': 0.000486218892791185, 'samples': 3401472, 'steps': 17715, 'loss/train': 3.122344493865967} -08/30/2021 16:25:29 - INFO - __main__ - Step 17717: {'lr': 0.00048621715515269017, 'samples': 3401664, 'steps': 17716, 'loss/train': 1.2338253259658813} -08/30/2021 16:25:29 - INFO - __main__ - Step 17718: {'lr': 0.0004862154174077595, 'samples': 3401856, 'steps': 17717, 'loss/train': 1.7586365938186646} -08/30/2021 16:25:29 - INFO - __main__ - Step 17719: {'lr': 0.00048621367955639395, 'samples': 3402048, 'steps': 17718, 'loss/train': 1.6339696645736694} -08/30/2021 16:25:31 - INFO - __main__ - Step 17720: {'lr': 0.00048621194159859403, 'samples': 3402240, 'steps': 17719, 'loss/train': 1.7732384204864502} -08/30/2021 16:25:31 - INFO - __main__ - Step 17721: {'lr': 0.0004862102035343607, 'samples': 3402432, 'steps': 17720, 'loss/train': 2.0181620121002197} -08/30/2021 16:25:32 - INFO - __main__ - Step 17722: {'lr': 0.0004862084653636947, 'samples': 3402624, 'steps': 17721, 'loss/train': 2.088188886642456} -08/30/2021 16:25:32 - INFO - __main__ - Step 17723: {'lr': 0.00048620672708659675, 'samples': 3402816, 'steps': 17722, 'loss/train': 2.3807716369628906} -08/30/2021 16:25:32 - INFO - __main__ - Step 17724: {'lr': 0.0004862049887030677, 'samples': 3403008, 'steps': 17723, 'loss/train': 1.3474513292312622} -08/30/2021 16:25:34 - INFO - __main__ - Step 17725: {'lr': 0.0004862032502131084, 'samples': 3403200, 'steps': 17724, 'loss/train': 1.401879072189331} -08/30/2021 16:25:34 - INFO - __main__ - Step 17726: {'lr': 0.00048620151161671955, 'samples': 3403392, 'steps': 17725, 'loss/train': 1.8139903545379639} -08/30/2021 16:25:35 - INFO - __main__ - Step 17727: {'lr': 0.00048619977291390186, 'samples': 3403584, 'steps': 17726, 'loss/train': 2.8312020301818848} -08/30/2021 16:25:35 - INFO - __main__ - Step 17728: {'lr': 0.00048619803410465624, 'samples': 3403776, 'steps': 17727, 'loss/train': 1.4648650884628296} -08/30/2021 16:25:36 - INFO - __main__ - Step 17729: {'lr': 0.00048619629518898344, 'samples': 3403968, 'steps': 17728, 'loss/train': 2.1914825439453125} -08/30/2021 16:25:36 - INFO - __main__ - Step 17730: {'lr': 0.00048619455616688426, 'samples': 3404160, 'steps': 17729, 'loss/train': 1.0621435642242432} -08/30/2021 16:25:37 - INFO - __main__ - Step 17731: {'lr': 0.0004861928170383594, 'samples': 3404352, 'steps': 17730, 'loss/train': 1.7239242792129517} -08/30/2021 16:25:38 - INFO - __main__ - Step 17732: {'lr': 0.0004861910778034098, 'samples': 3404544, 'steps': 17731, 'loss/train': 1.5181375741958618} -08/30/2021 16:25:38 - INFO - __main__ - Step 17733: {'lr': 0.00048618933846203606, 'samples': 3404736, 'steps': 17732, 'loss/train': 1.8347440958023071} -08/30/2021 16:25:38 - INFO - __main__ - Step 17734: {'lr': 0.00048618759901423905, 'samples': 3404928, 'steps': 17733, 'loss/train': 1.5305198431015015} -08/30/2021 16:25:39 - INFO - __main__ - Step 17735: {'lr': 0.0004861858594600196, 'samples': 3405120, 'steps': 17734, 'loss/train': 1.7854728698730469} -08/30/2021 16:25:40 - INFO - __main__ - Step 17736: {'lr': 0.0004861841197993784, 'samples': 3405312, 'steps': 17735, 'loss/train': 1.6548168659210205} -08/30/2021 16:25:41 - INFO - __main__ - Step 17737: {'lr': 0.0004861823800323163, 'samples': 3405504, 'steps': 17736, 'loss/train': 1.2652748823165894} -08/30/2021 16:25:41 - INFO - __main__ - Step 17738: {'lr': 0.00048618064015883405, 'samples': 3405696, 'steps': 17737, 'loss/train': 1.4637962579727173} -08/30/2021 16:25:41 - INFO - __main__ - Step 17739: {'lr': 0.0004861789001789325, 'samples': 3405888, 'steps': 17738, 'loss/train': 1.7666879892349243} -08/30/2021 16:25:42 - INFO - __main__ - Step 17740: {'lr': 0.00048617716009261236, 'samples': 3406080, 'steps': 17739, 'loss/train': 1.6758126020431519} -08/30/2021 16:25:43 - INFO - __main__ - Step 17741: {'lr': 0.00048617541989987435, 'samples': 3406272, 'steps': 17740, 'loss/train': 1.4668971300125122} -08/30/2021 16:25:44 - INFO - __main__ - Step 17742: {'lr': 0.00048617367960071946, 'samples': 3406464, 'steps': 17741, 'loss/train': 1.4784157276153564} -08/30/2021 16:25:44 - INFO - __main__ - Step 17743: {'lr': 0.0004861719391951483, 'samples': 3406656, 'steps': 17742, 'loss/train': 1.6684218645095825} -08/30/2021 16:25:44 - INFO - __main__ - Step 17744: {'lr': 0.0004861701986831617, 'samples': 3406848, 'steps': 17743, 'loss/train': 1.5837866067886353} -08/30/2021 16:25:45 - INFO - __main__ - Step 17745: {'lr': 0.0004861684580647605, 'samples': 3407040, 'steps': 17744, 'loss/train': 1.8455150127410889} -08/30/2021 16:25:47 - INFO - __main__ - Step 17746: {'lr': 0.0004861667173399453, 'samples': 3407232, 'steps': 17745, 'loss/train': 1.2570794820785522} -08/30/2021 16:25:48 - INFO - __main__ - Step 17747: {'lr': 0.0004861649765087172, 'samples': 3407424, 'steps': 17746, 'loss/train': 2.085454225540161} -08/30/2021 16:25:48 - INFO - __main__ - Step 17748: {'lr': 0.0004861632355710767, 'samples': 3407616, 'steps': 17747, 'loss/train': 1.643376350402832} -08/30/2021 16:25:48 - INFO - __main__ - Step 17749: {'lr': 0.00048616149452702473, 'samples': 3407808, 'steps': 17748, 'loss/train': 2.5802743434906006} -08/30/2021 16:25:49 - INFO - __main__ - Step 17750: {'lr': 0.00048615975337656204, 'samples': 3408000, 'steps': 17749, 'loss/train': 1.4473512172698975} -08/30/2021 16:25:49 - INFO - __main__ - Step 17751: {'lr': 0.00048615801211968936, 'samples': 3408192, 'steps': 17750, 'loss/train': 1.7644591331481934} -08/30/2021 16:25:51 - INFO - __main__ - Step 17752: {'lr': 0.00048615627075640754, 'samples': 3408384, 'steps': 17751, 'loss/train': 1.8071231842041016} -08/30/2021 16:25:51 - INFO - __main__ - Step 17753: {'lr': 0.00048615452928671746, 'samples': 3408576, 'steps': 17752, 'loss/train': 2.0351507663726807} -08/30/2021 16:25:51 - INFO - __main__ - Step 17754: {'lr': 0.00048615278771061966, 'samples': 3408768, 'steps': 17753, 'loss/train': 0.9494560360908508} -08/30/2021 16:25:52 - INFO - __main__ - Step 17755: {'lr': 0.0004861510460281151, 'samples': 3408960, 'steps': 17754, 'loss/train': 6.22068977355957} -08/30/2021 16:25:52 - INFO - __main__ - Step 17756: {'lr': 0.0004861493042392045, 'samples': 3409152, 'steps': 17755, 'loss/train': 2.4171478748321533} -08/30/2021 16:25:54 - INFO - __main__ - Step 17757: {'lr': 0.00048614756234388866, 'samples': 3409344, 'steps': 17756, 'loss/train': 1.8834068775177002} -08/30/2021 16:25:54 - INFO - __main__ - Step 17758: {'lr': 0.00048614582034216844, 'samples': 3409536, 'steps': 17757, 'loss/train': 1.4243308305740356} -08/30/2021 16:25:54 - INFO - __main__ - Step 17759: {'lr': 0.0004861440782340445, 'samples': 3409728, 'steps': 17758, 'loss/train': 1.5687111616134644} -08/30/2021 16:25:55 - INFO - __main__ - Step 17760: {'lr': 0.0004861423360195177, 'samples': 3409920, 'steps': 17759, 'loss/train': 1.073167324066162} -08/30/2021 16:25:55 - INFO - __main__ - Step 17761: {'lr': 0.0004861405936985888, 'samples': 3410112, 'steps': 17760, 'loss/train': 1.616040587425232} -08/30/2021 16:25:57 - INFO - __main__ - Step 17762: {'lr': 0.0004861388512712586, 'samples': 3410304, 'steps': 17761, 'loss/train': 1.6898744106292725} -08/30/2021 16:25:57 - INFO - __main__ - Step 17763: {'lr': 0.0004861371087375279, 'samples': 3410496, 'steps': 17762, 'loss/train': 2.581831693649292} -08/30/2021 16:25:58 - INFO - __main__ - Step 17764: {'lr': 0.0004861353660973974, 'samples': 3410688, 'steps': 17763, 'loss/train': 1.838334560394287} -08/30/2021 16:25:58 - INFO - __main__ - Step 17765: {'lr': 0.00048613362335086797, 'samples': 3410880, 'steps': 17764, 'loss/train': 1.6511179208755493} -08/30/2021 16:25:58 - INFO - __main__ - Step 17766: {'lr': 0.00048613188049794045, 'samples': 3411072, 'steps': 17765, 'loss/train': 1.6235308647155762} -08/30/2021 16:25:59 - INFO - __main__ - Step 17767: {'lr': 0.00048613013753861546, 'samples': 3411264, 'steps': 17766, 'loss/train': 1.9086244106292725} -08/30/2021 16:26:00 - INFO - __main__ - Step 17768: {'lr': 0.0004861283944728939, 'samples': 3411456, 'steps': 17767, 'loss/train': 1.6346663236618042} -08/30/2021 16:26:00 - INFO - __main__ - Step 17769: {'lr': 0.0004861266513007765, 'samples': 3411648, 'steps': 17768, 'loss/train': 1.9003173112869263} -08/30/2021 16:26:01 - INFO - __main__ - Step 17770: {'lr': 0.00048612490802226415, 'samples': 3411840, 'steps': 17769, 'loss/train': 1.941716194152832} -08/30/2021 16:26:01 - INFO - __main__ - Step 17771: {'lr': 0.0004861231646373575, 'samples': 3412032, 'steps': 17770, 'loss/train': 2.2606074810028076} -08/30/2021 16:26:02 - INFO - __main__ - Step 17772: {'lr': 0.0004861214211460574, 'samples': 3412224, 'steps': 17771, 'loss/train': 1.241268515586853} -08/30/2021 16:26:03 - INFO - __main__ - Step 17773: {'lr': 0.00048611967754836466, 'samples': 3412416, 'steps': 17772, 'loss/train': 1.577620506286621} -08/30/2021 16:26:03 - INFO - __main__ - Step 17774: {'lr': 0.00048611793384428006, 'samples': 3412608, 'steps': 17773, 'loss/train': 1.2940549850463867} -08/30/2021 16:26:04 - INFO - __main__ - Step 17775: {'lr': 0.00048611619003380426, 'samples': 3412800, 'steps': 17774, 'loss/train': 1.457544207572937} -08/30/2021 16:26:04 - INFO - __main__ - Step 17776: {'lr': 0.0004861144461169382, 'samples': 3412992, 'steps': 17775, 'loss/train': 1.60025155544281} -08/30/2021 16:26:04 - INFO - __main__ - Step 17777: {'lr': 0.00048611270209368264, 'samples': 3413184, 'steps': 17776, 'loss/train': 1.5212907791137695} -08/30/2021 16:26:06 - INFO - __main__ - Step 17778: {'lr': 0.0004861109579640384, 'samples': 3413376, 'steps': 17777, 'loss/train': 1.9214051961898804} -08/30/2021 16:26:07 - INFO - __main__ - Step 17779: {'lr': 0.0004861092137280061, 'samples': 3413568, 'steps': 17778, 'loss/train': 1.3035353422164917} -08/30/2021 16:26:07 - INFO - __main__ - Step 17780: {'lr': 0.00048610746938558666, 'samples': 3413760, 'steps': 17779, 'loss/train': 1.7488807439804077} -08/30/2021 16:26:07 - INFO - __main__ - Step 17781: {'lr': 0.0004861057249367808, 'samples': 3413952, 'steps': 17780, 'loss/train': 0.3444135785102844} -08/30/2021 16:26:08 - INFO - __main__ - Step 17782: {'lr': 0.00048610398038158943, 'samples': 3414144, 'steps': 17781, 'loss/train': 0.3180020749568939} -08/30/2021 16:26:08 - INFO - __main__ - Step 17783: {'lr': 0.00048610223572001315, 'samples': 3414336, 'steps': 17782, 'loss/train': 1.867020606994629} -08/30/2021 16:26:09 - INFO - __main__ - Step 17784: {'lr': 0.0004861004909520529, 'samples': 3414528, 'steps': 17783, 'loss/train': 1.1937071084976196} -08/30/2021 16:26:10 - INFO - __main__ - Step 17785: {'lr': 0.00048609874607770945, 'samples': 3414720, 'steps': 17784, 'loss/train': 2.2578063011169434} -08/30/2021 16:26:10 - INFO - __main__ - Step 17786: {'lr': 0.0004860970010969835, 'samples': 3414912, 'steps': 17785, 'loss/train': 1.9325724840164185} -08/30/2021 16:26:11 - INFO - __main__ - Step 17787: {'lr': 0.0004860952560098759, 'samples': 3415104, 'steps': 17786, 'loss/train': 2.0252583026885986} -08/30/2021 16:26:11 - INFO - __main__ - Step 17788: {'lr': 0.0004860935108163874, 'samples': 3415296, 'steps': 17787, 'loss/train': 1.694702386856079} -08/30/2021 16:26:12 - INFO - __main__ - Step 17789: {'lr': 0.0004860917655165188, 'samples': 3415488, 'steps': 17788, 'loss/train': 1.336488962173462} -08/30/2021 16:26:13 - INFO - __main__ - Step 17790: {'lr': 0.00048609002011027093, 'samples': 3415680, 'steps': 17789, 'loss/train': 1.6751717329025269} -08/30/2021 16:26:13 - INFO - __main__ - Step 17791: {'lr': 0.0004860882745976445, 'samples': 3415872, 'steps': 17790, 'loss/train': 1.6190760135650635} -08/30/2021 16:26:14 - INFO - __main__ - Step 17792: {'lr': 0.00048608652897864034, 'samples': 3416064, 'steps': 17791, 'loss/train': 2.0488550662994385} -08/30/2021 16:26:14 - INFO - __main__ - Step 17793: {'lr': 0.0004860847832532593, 'samples': 3416256, 'steps': 17792, 'loss/train': 1.6386748552322388} -08/30/2021 16:26:15 - INFO - __main__ - Step 17794: {'lr': 0.00048608303742150204, 'samples': 3416448, 'steps': 17793, 'loss/train': 1.3178482055664062} -08/30/2021 16:26:16 - INFO - __main__ - Step 17795: {'lr': 0.0004860812914833694, 'samples': 3416640, 'steps': 17794, 'loss/train': 1.6896860599517822} -08/30/2021 16:26:16 - INFO - __main__ - Step 17796: {'lr': 0.00048607954543886225, 'samples': 3416832, 'steps': 17795, 'loss/train': 1.564070701599121} -08/30/2021 16:26:17 - INFO - __main__ - Step 17797: {'lr': 0.00048607779928798125, 'samples': 3417024, 'steps': 17796, 'loss/train': 1.4566324949264526} -08/30/2021 16:26:17 - INFO - __main__ - Step 17798: {'lr': 0.0004860760530307272, 'samples': 3417216, 'steps': 17797, 'loss/train': 2.0166878700256348} -08/30/2021 16:26:19 - INFO - __main__ - Step 17799: {'lr': 0.00048607430666710097, 'samples': 3417408, 'steps': 17798, 'loss/train': 2.282393217086792} -08/30/2021 16:26:19 - INFO - __main__ - Step 17800: {'lr': 0.00048607256019710327, 'samples': 3417600, 'steps': 17799, 'loss/train': 1.350229024887085} -08/30/2021 16:26:19 - INFO - __main__ - Step 17801: {'lr': 0.0004860708136207349, 'samples': 3417792, 'steps': 17800, 'loss/train': 1.3988617658615112} -08/30/2021 16:26:20 - INFO - __main__ - Step 17802: {'lr': 0.0004860690669379967, 'samples': 3417984, 'steps': 17801, 'loss/train': 1.5887693166732788} -08/30/2021 16:26:20 - INFO - __main__ - Step 17803: {'lr': 0.00048606732014888946, 'samples': 3418176, 'steps': 17802, 'loss/train': 0.10701005905866623} -08/30/2021 16:26:23 - INFO - __main__ - Step 17804: {'lr': 0.0004860655732534138, 'samples': 3418368, 'steps': 17803, 'loss/train': 1.9331892728805542} -08/30/2021 16:26:23 - INFO - __main__ - Step 17805: {'lr': 0.00048606382625157075, 'samples': 3418560, 'steps': 17804, 'loss/train': 1.2968308925628662} -08/30/2021 16:26:23 - INFO - __main__ - Step 17806: {'lr': 0.00048606207914336097, 'samples': 3418752, 'steps': 17805, 'loss/train': 0.0958833396434784} -08/30/2021 16:26:24 - INFO - __main__ - Step 17807: {'lr': 0.0004860603319287853, 'samples': 3418944, 'steps': 17806, 'loss/train': 1.3931435346603394} -08/30/2021 16:26:24 - INFO - __main__ - Step 17808: {'lr': 0.0004860585846078444, 'samples': 3419136, 'steps': 17807, 'loss/train': 2.507514238357544} -08/30/2021 16:26:24 - INFO - __main__ - Step 17809: {'lr': 0.00048605683718053915, 'samples': 3419328, 'steps': 17808, 'loss/train': 1.7126376628875732} -08/30/2021 16:26:25 - INFO - __main__ - Step 17810: {'lr': 0.0004860550896468704, 'samples': 3419520, 'steps': 17809, 'loss/train': 1.714233636856079} -08/30/2021 16:26:26 - INFO - __main__ - Step 17811: {'lr': 0.00048605334200683883, 'samples': 3419712, 'steps': 17810, 'loss/train': 1.740059733390808} -08/30/2021 16:26:27 - INFO - __main__ - Step 17812: {'lr': 0.0004860515942604452, 'samples': 3419904, 'steps': 17811, 'loss/train': 1.2822657823562622} -08/30/2021 16:26:27 - INFO - __main__ - Step 17813: {'lr': 0.00048604984640769047, 'samples': 3420096, 'steps': 17812, 'loss/train': 1.1805046796798706} -08/30/2021 16:26:27 - INFO - __main__ - Step 17814: {'lr': 0.00048604809844857524, 'samples': 3420288, 'steps': 17813, 'loss/train': 3.061659097671509} -08/30/2021 16:26:28 - INFO - __main__ - Step 17815: {'lr': 0.0004860463503831004, 'samples': 3420480, 'steps': 17814, 'loss/train': 1.9420151710510254} -08/30/2021 16:26:29 - INFO - __main__ - Step 17816: {'lr': 0.0004860446022112668, 'samples': 3420672, 'steps': 17815, 'loss/train': 1.388025164604187} -08/30/2021 16:26:30 - INFO - __main__ - Step 17817: {'lr': 0.00048604285393307503, 'samples': 3420864, 'steps': 17816, 'loss/train': 1.9964635372161865} -08/30/2021 16:26:30 - INFO - __main__ - Step 17818: {'lr': 0.000486041105548526, 'samples': 3421056, 'steps': 17817, 'loss/train': 0.955362856388092} -08/30/2021 16:26:30 - INFO - __main__ - Step 17819: {'lr': 0.00048603935705762057, 'samples': 3421248, 'steps': 17818, 'loss/train': 1.5427345037460327} -08/30/2021 16:26:31 - INFO - __main__ - Step 17820: {'lr': 0.0004860376084603594, 'samples': 3421440, 'steps': 17819, 'loss/train': 1.8449162244796753} -08/30/2021 16:26:32 - INFO - __main__ - Step 17821: {'lr': 0.00048603585975674334, 'samples': 3421632, 'steps': 17820, 'loss/train': 1.494202971458435} -08/30/2021 16:26:33 - INFO - __main__ - Step 17822: {'lr': 0.0004860341109467732, 'samples': 3421824, 'steps': 17821, 'loss/train': 1.6064958572387695} -08/30/2021 16:26:33 - INFO - __main__ - Step 17823: {'lr': 0.00048603236203044963, 'samples': 3422016, 'steps': 17822, 'loss/train': 1.8284484148025513} -08/30/2021 16:26:34 - INFO - __main__ - Step 17824: {'lr': 0.00048603061300777365, 'samples': 3422208, 'steps': 17823, 'loss/train': 1.8893921375274658} -08/30/2021 16:26:34 - INFO - __main__ - Step 17825: {'lr': 0.0004860288638787458, 'samples': 3422400, 'steps': 17824, 'loss/train': 1.239871621131897} -08/30/2021 16:26:34 - INFO - __main__ - Step 17826: {'lr': 0.000486027114643367, 'samples': 3422592, 'steps': 17825, 'loss/train': 1.517728328704834} -08/30/2021 16:26:36 - INFO - __main__ - Step 17827: {'lr': 0.0004860253653016381, 'samples': 3422784, 'steps': 17826, 'loss/train': 0.07044032216072083} -08/30/2021 16:26:36 - INFO - __main__ - Step 17828: {'lr': 0.00048602361585355975, 'samples': 3422976, 'steps': 17827, 'loss/train': 1.964586853981018} -08/30/2021 16:26:36 - INFO - __main__ - Step 17829: {'lr': 0.0004860218662991328, 'samples': 3423168, 'steps': 17828, 'loss/train': 1.9995909929275513} -08/30/2021 16:26:37 - INFO - __main__ - Step 17830: {'lr': 0.0004860201166383581, 'samples': 3423360, 'steps': 17829, 'loss/train': 1.5352898836135864} -08/30/2021 16:26:37 - INFO - __main__ - Step 17831: {'lr': 0.00048601836687123636, 'samples': 3423552, 'steps': 17830, 'loss/train': 1.1319940090179443} -08/30/2021 16:26:39 - INFO - __main__ - Step 17832: {'lr': 0.00048601661699776834, 'samples': 3423744, 'steps': 17831, 'loss/train': 1.645721197128296} -08/30/2021 16:26:39 - INFO - __main__ - Step 17833: {'lr': 0.0004860148670179549, 'samples': 3423936, 'steps': 17832, 'loss/train': 1.8793554306030273} -08/30/2021 16:26:40 - INFO - __main__ - Step 17834: {'lr': 0.0004860131169317968, 'samples': 3424128, 'steps': 17833, 'loss/train': 2.120166778564453} -08/30/2021 16:26:40 - INFO - __main__ - Step 17835: {'lr': 0.0004860113667392948, 'samples': 3424320, 'steps': 17834, 'loss/train': 0.14136287569999695} -08/30/2021 16:26:40 - INFO - __main__ - Step 17836: {'lr': 0.00048600961644044977, 'samples': 3424512, 'steps': 17835, 'loss/train': 1.4645096063613892} -08/30/2021 16:26:42 - INFO - __main__ - Step 17837: {'lr': 0.0004860078660352625, 'samples': 3424704, 'steps': 17836, 'loss/train': 0.9518241286277771} -08/30/2021 16:26:42 - INFO - __main__ - Step 17838: {'lr': 0.0004860061155237336, 'samples': 3424896, 'steps': 17837, 'loss/train': 1.8600260019302368} -08/30/2021 16:26:43 - INFO - __main__ - Step 17839: {'lr': 0.0004860043649058641, 'samples': 3425088, 'steps': 17838, 'loss/train': 1.0962424278259277} -08/30/2021 16:26:43 - INFO - __main__ - Step 17840: {'lr': 0.00048600261418165456, 'samples': 3425280, 'steps': 17839, 'loss/train': 1.6016703844070435} -08/30/2021 16:26:44 - INFO - __main__ - Step 17841: {'lr': 0.00048600086335110593, 'samples': 3425472, 'steps': 17840, 'loss/train': 1.4285876750946045} -08/30/2021 16:26:45 - INFO - __main__ - Step 17842: {'lr': 0.000485999112414219, 'samples': 3425664, 'steps': 17841, 'loss/train': 1.2479573488235474} -08/30/2021 16:26:46 - INFO - __main__ - Step 17843: {'lr': 0.0004859973613709945, 'samples': 3425856, 'steps': 17842, 'loss/train': 1.5413181781768799} -08/30/2021 16:26:46 - INFO - __main__ - Step 17844: {'lr': 0.0004859956102214332, 'samples': 3426048, 'steps': 17843, 'loss/train': 1.8095704317092896} -08/30/2021 16:26:46 - INFO - __main__ - Step 17845: {'lr': 0.00048599385896553595, 'samples': 3426240, 'steps': 17844, 'loss/train': 1.3200632333755493} -08/30/2021 16:26:47 - INFO - __main__ - Step 17846: {'lr': 0.0004859921076033034, 'samples': 3426432, 'steps': 17845, 'loss/train': 2.3370091915130615} -08/30/2021 16:26:48 - INFO - __main__ - Step 17847: {'lr': 0.00048599035613473656, 'samples': 3426624, 'steps': 17846, 'loss/train': 1.3648688793182373} -08/30/2021 16:26:49 - INFO - __main__ - Step 17848: {'lr': 0.0004859886045598361, 'samples': 3426816, 'steps': 17847, 'loss/train': 1.6096360683441162} -08/30/2021 16:26:49 - INFO - __main__ - Step 17849: {'lr': 0.0004859868528786028, 'samples': 3427008, 'steps': 17848, 'loss/train': 0.8248007297515869} -08/30/2021 16:26:50 - INFO - __main__ - Step 17850: {'lr': 0.0004859851010910374, 'samples': 3427200, 'steps': 17849, 'loss/train': 2.027937889099121} -08/30/2021 16:26:50 - INFO - __main__ - Step 17851: {'lr': 0.0004859833491971409, 'samples': 3427392, 'steps': 17850, 'loss/train': 2.022143602371216} -08/30/2021 16:26:50 - INFO - __main__ - Step 17852: {'lr': 0.0004859815971969138, 'samples': 3427584, 'steps': 17851, 'loss/train': 1.8337533473968506} -08/30/2021 16:26:52 - INFO - __main__ - Step 17853: {'lr': 0.0004859798450903571, 'samples': 3427776, 'steps': 17852, 'loss/train': 2.1065738201141357} -08/30/2021 16:26:52 - INFO - __main__ - Step 17854: {'lr': 0.00048597809287747153, 'samples': 3427968, 'steps': 17853, 'loss/train': 1.8997302055358887} -08/30/2021 16:26:53 - INFO - __main__ - Step 17855: {'lr': 0.0004859763405582579, 'samples': 3428160, 'steps': 17854, 'loss/train': 1.2824190855026245} -08/30/2021 16:26:53 - INFO - __main__ - Step 17856: {'lr': 0.00048597458813271686, 'samples': 3428352, 'steps': 17855, 'loss/train': 1.6876394748687744} -08/30/2021 16:26:53 - INFO - __main__ - Step 17857: {'lr': 0.0004859728356008494, 'samples': 3428544, 'steps': 17856, 'loss/train': 1.5995029211044312} -08/30/2021 16:26:55 - INFO - __main__ - Step 17858: {'lr': 0.00048597108296265625, 'samples': 3428736, 'steps': 17857, 'loss/train': 0.4544801414012909} -08/30/2021 16:26:56 - INFO - __main__ - Step 17859: {'lr': 0.00048596933021813815, 'samples': 3428928, 'steps': 17858, 'loss/train': 1.3313671350479126} -08/30/2021 16:26:56 - INFO - __main__ - Step 17860: {'lr': 0.0004859675773672959, 'samples': 3429120, 'steps': 17859, 'loss/train': 1.9243196249008179} -08/30/2021 16:26:57 - INFO - __main__ - Step 17861: {'lr': 0.00048596582441013026, 'samples': 3429312, 'steps': 17860, 'loss/train': 1.6134884357452393} -08/30/2021 16:26:57 - INFO - __main__ - Step 17862: {'lr': 0.0004859640713466421, 'samples': 3429504, 'steps': 17861, 'loss/train': 1.5414246320724487} -08/30/2021 16:26:59 - INFO - __main__ - Step 17863: {'lr': 0.0004859623181768321, 'samples': 3429696, 'steps': 17862, 'loss/train': 1.0997945070266724} -08/30/2021 16:26:59 - INFO - __main__ - Step 17864: {'lr': 0.0004859605649007012, 'samples': 3429888, 'steps': 17863, 'loss/train': 0.7047229409217834} -08/30/2021 16:26:59 - INFO - __main__ - Step 17865: {'lr': 0.00048595881151825015, 'samples': 3430080, 'steps': 17864, 'loss/train': 1.7464097738265991} -08/30/2021 16:27:00 - INFO - __main__ - Step 17866: {'lr': 0.00048595705802947963, 'samples': 3430272, 'steps': 17865, 'loss/train': 1.578861117362976} -08/30/2021 16:27:00 - INFO - __main__ - Step 17867: {'lr': 0.0004859553044343905, 'samples': 3430464, 'steps': 17866, 'loss/train': 1.4532793760299683} -08/30/2021 16:27:00 - INFO - __main__ - Step 17868: {'lr': 0.0004859535507329836, 'samples': 3430656, 'steps': 17867, 'loss/train': 2.017756938934326} -08/30/2021 16:27:02 - INFO - __main__ - Step 17869: {'lr': 0.0004859517969252596, 'samples': 3430848, 'steps': 17868, 'loss/train': 1.7452476024627686} -08/30/2021 16:27:02 - INFO - __main__ - Step 17870: {'lr': 0.0004859500430112194, 'samples': 3431040, 'steps': 17869, 'loss/train': 1.0578614473342896} -08/30/2021 16:27:03 - INFO - __main__ - Step 17871: {'lr': 0.0004859482889908637, 'samples': 3431232, 'steps': 17870, 'loss/train': 1.5763440132141113} -08/30/2021 16:27:03 - INFO - __main__ - Step 17872: {'lr': 0.0004859465348641934, 'samples': 3431424, 'steps': 17871, 'loss/train': 1.7885918617248535} -08/30/2021 16:27:03 - INFO - __main__ - Step 17873: {'lr': 0.0004859447806312093, 'samples': 3431616, 'steps': 17872, 'loss/train': 1.7694075107574463} -08/30/2021 16:27:05 - INFO - __main__ - Step 17874: {'lr': 0.000485943026291912, 'samples': 3431808, 'steps': 17873, 'loss/train': 1.6329407691955566} -08/30/2021 16:27:05 - INFO - __main__ - Step 17875: {'lr': 0.0004859412718463025, 'samples': 3432000, 'steps': 17874, 'loss/train': 0.8633098602294922} -08/30/2021 16:27:06 - INFO - __main__ - Step 17876: {'lr': 0.00048593951729438144, 'samples': 3432192, 'steps': 17875, 'loss/train': 1.3485416173934937} -08/30/2021 16:27:06 - INFO - __main__ - Step 17877: {'lr': 0.0004859377626361497, 'samples': 3432384, 'steps': 17876, 'loss/train': 1.8221259117126465} -08/30/2021 16:27:06 - INFO - __main__ - Step 17878: {'lr': 0.00048593600787160806, 'samples': 3432576, 'steps': 17877, 'loss/train': 0.9330003261566162} -08/30/2021 16:27:08 - INFO - __main__ - Step 17879: {'lr': 0.0004859342530007572, 'samples': 3432768, 'steps': 17878, 'loss/train': 1.376065969467163} -08/30/2021 16:27:08 - INFO - __main__ - Step 17880: {'lr': 0.0004859324980235982, 'samples': 3432960, 'steps': 17879, 'loss/train': 1.5842962265014648} -08/30/2021 16:27:09 - INFO - __main__ - Step 17881: {'lr': 0.0004859307429401315, 'samples': 3433152, 'steps': 17880, 'loss/train': 1.2794156074523926} -08/30/2021 16:27:09 - INFO - __main__ - Step 17882: {'lr': 0.0004859289877503581, 'samples': 3433344, 'steps': 17881, 'loss/train': 1.737648367881775} -08/30/2021 16:27:09 - INFO - __main__ - Step 17883: {'lr': 0.00048592723245427874, 'samples': 3433536, 'steps': 17882, 'loss/train': 0.8127500414848328} -08/30/2021 16:27:11 - INFO - __main__ - Step 17884: {'lr': 0.00048592547705189414, 'samples': 3433728, 'steps': 17883, 'loss/train': 1.9721065759658813} -08/30/2021 16:27:11 - INFO - __main__ - Step 17885: {'lr': 0.00048592372154320526, 'samples': 3433920, 'steps': 17884, 'loss/train': 1.3245036602020264} -08/30/2021 16:27:12 - INFO - __main__ - Step 17886: {'lr': 0.0004859219659282127, 'samples': 3434112, 'steps': 17885, 'loss/train': 2.183135986328125} -08/30/2021 16:27:12 - INFO - __main__ - Step 17887: {'lr': 0.00048592021020691745, 'samples': 3434304, 'steps': 17886, 'loss/train': 1.2190138101577759} -08/30/2021 16:27:12 - INFO - __main__ - Step 17888: {'lr': 0.00048591845437932014, 'samples': 3434496, 'steps': 17887, 'loss/train': 1.4049583673477173} -08/30/2021 16:27:14 - INFO - __main__ - Step 17889: {'lr': 0.0004859166984454216, 'samples': 3434688, 'steps': 17888, 'loss/train': 1.5307166576385498} -08/30/2021 16:27:14 - INFO - __main__ - Step 17890: {'lr': 0.0004859149424052226, 'samples': 3434880, 'steps': 17889, 'loss/train': 1.7316594123840332} -08/30/2021 16:27:15 - INFO - __main__ - Step 17891: {'lr': 0.00048591318625872403, 'samples': 3435072, 'steps': 17890, 'loss/train': 2.1398332118988037} -08/30/2021 16:27:15 - INFO - __main__ - Step 17892: {'lr': 0.00048591143000592665, 'samples': 3435264, 'steps': 17891, 'loss/train': 1.8469187021255493} -08/30/2021 16:27:15 - INFO - __main__ - Step 17893: {'lr': 0.00048590967364683116, 'samples': 3435456, 'steps': 17892, 'loss/train': 2.175302505493164} -08/30/2021 16:27:17 - INFO - __main__ - Step 17894: {'lr': 0.0004859079171814384, 'samples': 3435648, 'steps': 17893, 'loss/train': 1.7110624313354492} -08/30/2021 16:27:17 - INFO - __main__ - Step 17895: {'lr': 0.00048590616060974917, 'samples': 3435840, 'steps': 17894, 'loss/train': 0.8588742017745972} -08/30/2021 16:27:18 - INFO - __main__ - Step 17896: {'lr': 0.00048590440393176434, 'samples': 3436032, 'steps': 17895, 'loss/train': 1.4952541589736938} -08/30/2021 16:27:18 - INFO - __main__ - Step 17897: {'lr': 0.00048590264714748455, 'samples': 3436224, 'steps': 17896, 'loss/train': 1.6051567792892456} -08/30/2021 16:27:18 - INFO - __main__ - Step 17898: {'lr': 0.0004859008902569107, 'samples': 3436416, 'steps': 17897, 'loss/train': 1.8908735513687134} -08/30/2021 16:27:20 - INFO - __main__ - Step 17899: {'lr': 0.00048589913326004355, 'samples': 3436608, 'steps': 17898, 'loss/train': 1.6623704433441162} -08/30/2021 16:27:20 - INFO - __main__ - Step 17900: {'lr': 0.0004858973761568839, 'samples': 3436800, 'steps': 17899, 'loss/train': 1.1768349409103394} -08/30/2021 16:27:21 - INFO - __main__ - Step 17901: {'lr': 0.0004858956189474325, 'samples': 3436992, 'steps': 17900, 'loss/train': 1.343118667602539} -08/30/2021 16:27:21 - INFO - __main__ - Step 17902: {'lr': 0.0004858938616316902, 'samples': 3437184, 'steps': 17901, 'loss/train': 3.308218240737915} -08/30/2021 16:27:21 - INFO - __main__ - Step 17903: {'lr': 0.00048589210420965775, 'samples': 3437376, 'steps': 17902, 'loss/train': 1.6797643899917603} -08/30/2021 16:27:22 - INFO - __main__ - Step 17904: {'lr': 0.0004858903466813359, 'samples': 3437568, 'steps': 17903, 'loss/train': 1.4640237092971802} -08/30/2021 16:27:23 - INFO - __main__ - Step 17905: {'lr': 0.0004858885890467256, 'samples': 3437760, 'steps': 17904, 'loss/train': 0.6652421355247498} -08/30/2021 16:27:24 - INFO - __main__ - Step 17906: {'lr': 0.00048588683130582755, 'samples': 3437952, 'steps': 17905, 'loss/train': 1.5127453804016113} -08/30/2021 16:27:24 - INFO - __main__ - Step 17907: {'lr': 0.00048588507345864246, 'samples': 3438144, 'steps': 17906, 'loss/train': 1.1763780117034912} -08/30/2021 16:27:24 - INFO - __main__ - Step 17908: {'lr': 0.00048588331550517125, 'samples': 3438336, 'steps': 17907, 'loss/train': 1.3862305879592896} -08/30/2021 16:27:25 - INFO - __main__ - Step 17909: {'lr': 0.0004858815574454146, 'samples': 3438528, 'steps': 17908, 'loss/train': 1.5857625007629395} -08/30/2021 16:27:27 - INFO - __main__ - Step 17910: {'lr': 0.0004858797992793734, 'samples': 3438720, 'steps': 17909, 'loss/train': 1.6279613971710205} -08/30/2021 16:27:27 - INFO - __main__ - Step 17911: {'lr': 0.0004858780410070484, 'samples': 3438912, 'steps': 17910, 'loss/train': 2.0002217292785645} -08/30/2021 16:27:28 - INFO - __main__ - Step 17912: {'lr': 0.0004858762826284404, 'samples': 3439104, 'steps': 17911, 'loss/train': 1.3232227563858032} -08/30/2021 16:27:28 - INFO - __main__ - Step 17913: {'lr': 0.00048587452414355014, 'samples': 3439296, 'steps': 17912, 'loss/train': 1.5202692747116089} -08/30/2021 16:27:28 - INFO - __main__ - Step 17914: {'lr': 0.00048587276555237853, 'samples': 3439488, 'steps': 17913, 'loss/train': 1.5702459812164307} -08/30/2021 16:27:30 - INFO - __main__ - Step 17915: {'lr': 0.00048587100685492626, 'samples': 3439680, 'steps': 17914, 'loss/train': 1.5571792125701904} -08/30/2021 16:27:30 - INFO - __main__ - Step 17916: {'lr': 0.00048586924805119416, 'samples': 3439872, 'steps': 17915, 'loss/train': 1.0138022899627686} -08/30/2021 16:27:31 - INFO - __main__ - Step 17917: {'lr': 0.00048586748914118303, 'samples': 3440064, 'steps': 17916, 'loss/train': 1.2218353748321533} -08/30/2021 16:27:31 - INFO - __main__ - Step 17918: {'lr': 0.0004858657301248936, 'samples': 3440256, 'steps': 17917, 'loss/train': 1.5009742975234985} -08/30/2021 16:27:32 - INFO - __main__ - Step 17919: {'lr': 0.00048586397100232673, 'samples': 3440448, 'steps': 17918, 'loss/train': 1.6131455898284912} -08/30/2021 16:27:33 - INFO - __main__ - Step 17920: {'lr': 0.00048586221177348323, 'samples': 3440640, 'steps': 17919, 'loss/train': 1.9276503324508667} -08/30/2021 16:27:33 - INFO - __main__ - Step 17921: {'lr': 0.00048586045243836386, 'samples': 3440832, 'steps': 17920, 'loss/train': 1.802316427230835} -08/30/2021 16:27:34 - INFO - __main__ - Step 17922: {'lr': 0.0004858586929969693, 'samples': 3441024, 'steps': 17921, 'loss/train': 1.4100080728530884} -08/30/2021 16:27:34 - INFO - __main__ - Step 17923: {'lr': 0.0004858569334493006, 'samples': 3441216, 'steps': 17922, 'loss/train': 1.6916251182556152} -08/30/2021 16:27:34 - INFO - __main__ - Step 17924: {'lr': 0.0004858551737953583, 'samples': 3441408, 'steps': 17923, 'loss/train': 1.9449329376220703} -08/30/2021 16:27:36 - INFO - __main__ - Step 17925: {'lr': 0.00048585341403514337, 'samples': 3441600, 'steps': 17924, 'loss/train': 2.312624931335449} -08/30/2021 16:27:36 - INFO - __main__ - Step 17926: {'lr': 0.0004858516541686565, 'samples': 3441792, 'steps': 17925, 'loss/train': 1.7189046144485474} -08/30/2021 16:27:37 - INFO - __main__ - Step 17927: {'lr': 0.0004858498941958985, 'samples': 3441984, 'steps': 17926, 'loss/train': 1.7091323137283325} -08/30/2021 16:27:37 - INFO - __main__ - Step 17928: {'lr': 0.00048584813411687016, 'samples': 3442176, 'steps': 17927, 'loss/train': 1.7522549629211426} -08/30/2021 16:27:37 - INFO - __main__ - Step 17929: {'lr': 0.00048584637393157235, 'samples': 3442368, 'steps': 17928, 'loss/train': 2.142777442932129} -08/30/2021 16:27:39 - INFO - __main__ - Step 17930: {'lr': 0.00048584461364000576, 'samples': 3442560, 'steps': 17929, 'loss/train': 1.5607608556747437} -08/30/2021 16:27:40 - INFO - __main__ - Step 17931: {'lr': 0.00048584285324217125, 'samples': 3442752, 'steps': 17930, 'loss/train': 0.613991379737854} -08/30/2021 16:27:40 - INFO - __main__ - Step 17932: {'lr': 0.00048584109273806954, 'samples': 3442944, 'steps': 17931, 'loss/train': 1.3197829723358154} -08/30/2021 16:27:40 - INFO - __main__ - Step 17933: {'lr': 0.00048583933212770154, 'samples': 3443136, 'steps': 17932, 'loss/train': 1.585553765296936} -08/30/2021 16:27:41 - INFO - __main__ - Step 17934: {'lr': 0.00048583757141106796, 'samples': 3443328, 'steps': 17933, 'loss/train': 1.2175897359848022} -08/30/2021 16:27:42 - INFO - __main__ - Step 17935: {'lr': 0.00048583581058816956, 'samples': 3443520, 'steps': 17934, 'loss/train': 1.8148592710494995} -08/30/2021 16:27:42 - INFO - __main__ - Step 17936: {'lr': 0.00048583404965900725, 'samples': 3443712, 'steps': 17935, 'loss/train': 1.5685232877731323} -08/30/2021 16:27:43 - INFO - __main__ - Step 17937: {'lr': 0.0004858322886235817, 'samples': 3443904, 'steps': 17936, 'loss/train': 1.5733325481414795} -08/30/2021 16:27:43 - INFO - __main__ - Step 17938: {'lr': 0.0004858305274818938, 'samples': 3444096, 'steps': 17937, 'loss/train': 1.5058397054672241} -08/30/2021 16:27:44 - INFO - __main__ - Step 17939: {'lr': 0.0004858287662339443, 'samples': 3444288, 'steps': 17938, 'loss/train': 1.559350609779358} -08/30/2021 16:27:45 - INFO - __main__ - Step 17940: {'lr': 0.00048582700487973397, 'samples': 3444480, 'steps': 17939, 'loss/train': 1.7616230249404907} -08/30/2021 16:27:45 - INFO - __main__ - Step 17941: {'lr': 0.00048582524341926365, 'samples': 3444672, 'steps': 17940, 'loss/train': 1.6359294652938843} -08/30/2021 16:27:46 - INFO - __main__ - Step 17942: {'lr': 0.0004858234818525341, 'samples': 3444864, 'steps': 17941, 'loss/train': 1.1140216588974} -08/30/2021 16:27:46 - INFO - __main__ - Step 17943: {'lr': 0.0004858217201795462, 'samples': 3445056, 'steps': 17942, 'loss/train': 1.5846662521362305} -08/30/2021 16:27:46 - INFO - __main__ - Step 17944: {'lr': 0.0004858199584003006, 'samples': 3445248, 'steps': 17943, 'loss/train': 1.5004762411117554} -08/30/2021 16:27:47 - INFO - __main__ - Step 17945: {'lr': 0.00048581819651479814, 'samples': 3445440, 'steps': 17944, 'loss/train': 1.7346022129058838} -08/30/2021 16:27:48 - INFO - __main__ - Step 17946: {'lr': 0.0004858164345230397, 'samples': 3445632, 'steps': 17945, 'loss/train': 1.4551098346710205} -08/30/2021 16:27:49 - INFO - __main__ - Step 17947: {'lr': 0.000485814672425026, 'samples': 3445824, 'steps': 17946, 'loss/train': 1.748676061630249} -08/30/2021 16:27:49 - INFO - __main__ - Step 17948: {'lr': 0.0004858129102207578, 'samples': 3446016, 'steps': 17947, 'loss/train': 1.8068292140960693} -08/30/2021 16:27:50 - INFO - __main__ - Step 17949: {'lr': 0.0004858111479102359, 'samples': 3446208, 'steps': 17948, 'loss/train': 1.6488761901855469} -08/30/2021 16:27:50 - INFO - __main__ - Step 17950: {'lr': 0.00048580938549346134, 'samples': 3446400, 'steps': 17949, 'loss/train': 1.5202116966247559} -08/30/2021 16:27:51 - INFO - __main__ - Step 17951: {'lr': 0.00048580762297043456, 'samples': 3446592, 'steps': 17950, 'loss/train': 1.6269984245300293} -08/30/2021 16:27:52 - INFO - __main__ - Step 17952: {'lr': 0.00048580586034115646, 'samples': 3446784, 'steps': 17951, 'loss/train': 0.8832659125328064} -08/30/2021 16:27:52 - INFO - __main__ - Step 17953: {'lr': 0.000485804097605628, 'samples': 3446976, 'steps': 17952, 'loss/train': 0.5102223753929138} -08/30/2021 16:27:53 - INFO - __main__ - Step 17954: {'lr': 0.00048580233476384975, 'samples': 3447168, 'steps': 17953, 'loss/train': 1.293516993522644} -08/30/2021 16:27:53 - INFO - __main__ - Step 17955: {'lr': 0.0004858005718158227, 'samples': 3447360, 'steps': 17954, 'loss/train': 0.8091772794723511} -08/30/2021 16:27:55 - INFO - __main__ - Step 17956: {'lr': 0.0004857988087615475, 'samples': 3447552, 'steps': 17955, 'loss/train': 1.6286166906356812} -08/30/2021 16:27:55 - INFO - __main__ - Step 17957: {'lr': 0.000485797045601025, 'samples': 3447744, 'steps': 17956, 'loss/train': 1.5255802869796753} -08/30/2021 16:27:55 - INFO - __main__ - Step 17958: {'lr': 0.000485795282334256, 'samples': 3447936, 'steps': 17957, 'loss/train': 0.8993553519248962} -08/30/2021 16:27:56 - INFO - __main__ - Step 17959: {'lr': 0.00048579351896124127, 'samples': 3448128, 'steps': 17958, 'loss/train': 1.3962647914886475} -08/30/2021 16:27:56 - INFO - __main__ - Step 17960: {'lr': 0.0004857917554819816, 'samples': 3448320, 'steps': 17959, 'loss/train': 1.6764079332351685} -08/30/2021 16:27:58 - INFO - __main__ - Step 17961: {'lr': 0.00048578999189647786, 'samples': 3448512, 'steps': 17960, 'loss/train': 1.4923226833343506} -08/30/2021 16:27:59 - INFO - __main__ - Step 17962: {'lr': 0.00048578822820473074, 'samples': 3448704, 'steps': 17961, 'loss/train': 1.8143463134765625} -08/30/2021 16:27:59 - INFO - __main__ - Step 17963: {'lr': 0.00048578646440674113, 'samples': 3448896, 'steps': 17962, 'loss/train': 2.056778907775879} -08/30/2021 16:27:59 - INFO - __main__ - Step 17964: {'lr': 0.0004857847005025097, 'samples': 3449088, 'steps': 17963, 'loss/train': 1.4036874771118164} -08/30/2021 16:28:00 - INFO - __main__ - Step 17965: {'lr': 0.0004857829364920374, 'samples': 3449280, 'steps': 17964, 'loss/train': 1.3317981958389282} -08/30/2021 16:28:01 - INFO - __main__ - Step 17966: {'lr': 0.0004857811723753249, 'samples': 3449472, 'steps': 17965, 'loss/train': 1.7080540657043457} -08/30/2021 16:28:02 - INFO - __main__ - Step 17967: {'lr': 0.00048577940815237305, 'samples': 3449664, 'steps': 17966, 'loss/train': 1.4190630912780762} -08/30/2021 16:28:02 - INFO - __main__ - Step 17968: {'lr': 0.00048577764382318265, 'samples': 3449856, 'steps': 17967, 'loss/train': 1.4978206157684326} -08/30/2021 16:28:02 - INFO - __main__ - Step 17969: {'lr': 0.0004857758793877545, 'samples': 3450048, 'steps': 17968, 'loss/train': 1.8247748613357544} -08/30/2021 16:28:03 - INFO - __main__ - Step 17970: {'lr': 0.00048577411484608936, 'samples': 3450240, 'steps': 17969, 'loss/train': 1.8087624311447144} -08/30/2021 16:28:04 - INFO - __main__ - Step 17971: {'lr': 0.000485772350198188, 'samples': 3450432, 'steps': 17970, 'loss/train': 1.5536245107650757} -08/30/2021 16:28:05 - INFO - __main__ - Step 17972: {'lr': 0.00048577058544405126, 'samples': 3450624, 'steps': 17971, 'loss/train': 1.661061406135559} -08/30/2021 16:28:05 - INFO - __main__ - Step 17973: {'lr': 0.00048576882058368, 'samples': 3450816, 'steps': 17972, 'loss/train': 1.5742443799972534} -08/30/2021 16:28:05 - INFO - __main__ - Step 17974: {'lr': 0.0004857670556170749, 'samples': 3451008, 'steps': 17973, 'loss/train': 1.044863224029541} -08/30/2021 16:28:06 - INFO - __main__ - Step 17975: {'lr': 0.0004857652905442368, 'samples': 3451200, 'steps': 17974, 'loss/train': 2.287400484085083} -08/30/2021 16:28:07 - INFO - __main__ - Step 17976: {'lr': 0.0004857635253651665, 'samples': 3451392, 'steps': 17975, 'loss/train': 1.5925867557525635} -08/30/2021 16:28:08 - INFO - __main__ - Step 17977: {'lr': 0.00048576176007986485, 'samples': 3451584, 'steps': 17976, 'loss/train': 1.464400053024292} -08/30/2021 16:28:08 - INFO - __main__ - Step 17978: {'lr': 0.00048575999468833256, 'samples': 3451776, 'steps': 17977, 'loss/train': 1.465862512588501} -08/30/2021 16:28:08 - INFO - __main__ - Step 17979: {'lr': 0.0004857582291905704, 'samples': 3451968, 'steps': 17978, 'loss/train': 1.49838387966156} -08/30/2021 16:28:09 - INFO - __main__ - Step 17980: {'lr': 0.00048575646358657934, 'samples': 3452160, 'steps': 17979, 'loss/train': 1.0039933919906616} -08/30/2021 16:28:10 - INFO - __main__ - Step 17981: {'lr': 0.00048575469787635997, 'samples': 3452352, 'steps': 17980, 'loss/train': 1.6469841003417969} -08/30/2021 16:28:11 - INFO - __main__ - Step 17982: {'lr': 0.00048575293205991313, 'samples': 3452544, 'steps': 17981, 'loss/train': 1.6953777074813843} -08/30/2021 16:28:11 - INFO - __main__ - Step 17983: {'lr': 0.0004857511661372397, 'samples': 3452736, 'steps': 17982, 'loss/train': 1.6324660778045654} -08/30/2021 16:28:11 - INFO - __main__ - Step 17984: {'lr': 0.00048574940010834045, 'samples': 3452928, 'steps': 17983, 'loss/train': 1.3473966121673584} -08/30/2021 16:28:12 - INFO - __main__ - Step 17985: {'lr': 0.0004857476339732161, 'samples': 3453120, 'steps': 17984, 'loss/train': 1.9128919839859009} -08/30/2021 16:28:12 - INFO - __main__ - Step 17986: {'lr': 0.0004857458677318676, 'samples': 3453312, 'steps': 17985, 'loss/train': 1.7540589570999146} -08/30/2021 16:28:14 - INFO - __main__ - Step 17987: {'lr': 0.0004857441013842956, 'samples': 3453504, 'steps': 17986, 'loss/train': 1.6961069107055664} -08/30/2021 16:28:14 - INFO - __main__ - Step 17988: {'lr': 0.0004857423349305009, 'samples': 3453696, 'steps': 17987, 'loss/train': 1.6407495737075806} -08/30/2021 16:28:15 - INFO - __main__ - Step 17989: {'lr': 0.00048574056837048443, 'samples': 3453888, 'steps': 17988, 'loss/train': 1.7343302965164185} -08/30/2021 16:28:15 - INFO - __main__ - Step 17990: {'lr': 0.0004857388017042468, 'samples': 3454080, 'steps': 17989, 'loss/train': 0.266526997089386} -08/30/2021 16:28:15 - INFO - __main__ - Step 17991: {'lr': 0.000485737034931789, 'samples': 3454272, 'steps': 17990, 'loss/train': 1.5119613409042358} -08/30/2021 16:28:17 - INFO - __main__ - Step 17992: {'lr': 0.00048573526805311166, 'samples': 3454464, 'steps': 17991, 'loss/train': 1.3970911502838135} -08/30/2021 16:28:17 - INFO - __main__ - Step 17993: {'lr': 0.0004857335010682157, 'samples': 3454656, 'steps': 17992, 'loss/train': 2.1763477325439453} -08/30/2021 16:28:18 - INFO - __main__ - Step 17994: {'lr': 0.0004857317339771018, 'samples': 3454848, 'steps': 17993, 'loss/train': 5.6309027671813965} -08/30/2021 16:28:18 - INFO - __main__ - Step 17995: {'lr': 0.0004857299667797709, 'samples': 3455040, 'steps': 17994, 'loss/train': 1.6603909730911255} -08/30/2021 16:28:18 - INFO - __main__ - Step 17996: {'lr': 0.0004857281994762236, 'samples': 3455232, 'steps': 17995, 'loss/train': 1.3990861177444458} -08/30/2021 16:28:20 - INFO - __main__ - Step 17997: {'lr': 0.00048572643206646097, 'samples': 3455424, 'steps': 17996, 'loss/train': 1.095388412475586} -08/30/2021 16:28:21 - INFO - __main__ - Step 17998: {'lr': 0.0004857246645504835, 'samples': 3455616, 'steps': 17997, 'loss/train': 1.5710792541503906} -08/30/2021 16:28:21 - INFO - __main__ - Step 17999: {'lr': 0.00048572289692829217, 'samples': 3455808, 'steps': 17998, 'loss/train': 1.4027560949325562} -08/30/2021 16:28:21 - INFO - __main__ - Step 18000: {'lr': 0.00048572112919988776, 'samples': 3456000, 'steps': 17999, 'loss/train': 1.682323694229126} -08/30/2021 16:28:22 - INFO - __main__ - Step 18001: {'lr': 0.00048571936136527106, 'samples': 3456192, 'steps': 18000, 'loss/train': 1.7628370523452759} -08/30/2021 16:28:22 - INFO - __main__ - Step 18002: {'lr': 0.0004857175934244428, 'samples': 3456384, 'steps': 18001, 'loss/train': 1.5482879877090454} -08/30/2021 16:28:23 - INFO - __main__ - Step 18003: {'lr': 0.0004857158253774039, 'samples': 3456576, 'steps': 18002, 'loss/train': 0.09714821726083755} -08/30/2021 16:28:24 - INFO - __main__ - Step 18004: {'lr': 0.0004857140572241551, 'samples': 3456768, 'steps': 18003, 'loss/train': 0.06454353779554367} -08/30/2021 16:28:25 - INFO - __main__ - Step 18005: {'lr': 0.00048571228896469713, 'samples': 3456960, 'steps': 18004, 'loss/train': 1.6359314918518066} -08/30/2021 16:28:25 - INFO - __main__ - Step 18006: {'lr': 0.0004857105205990308, 'samples': 3457152, 'steps': 18005, 'loss/train': 1.7537561655044556} -08/30/2021 16:28:26 - INFO - __main__ - Step 18007: {'lr': 0.00048570875212715706, 'samples': 3457344, 'steps': 18006, 'loss/train': 1.392996907234192} -08/30/2021 16:28:26 - INFO - __main__ - Step 18008: {'lr': 0.0004857069835490765, 'samples': 3457536, 'steps': 18007, 'loss/train': 1.7586145401000977} -08/30/2021 16:28:26 - INFO - __main__ - Step 18009: {'lr': 0.00048570521486479004, 'samples': 3457728, 'steps': 18008, 'loss/train': 2.623910903930664} -08/30/2021 16:28:28 - INFO - __main__ - Step 18010: {'lr': 0.0004857034460742984, 'samples': 3457920, 'steps': 18009, 'loss/train': 1.8344008922576904} -08/30/2021 16:28:29 - INFO - __main__ - Step 18011: {'lr': 0.0004857016771776025, 'samples': 3458112, 'steps': 18010, 'loss/train': 2.376192092895508} -08/30/2021 16:28:29 - INFO - __main__ - Step 18012: {'lr': 0.000485699908174703, 'samples': 3458304, 'steps': 18011, 'loss/train': 2.1674773693084717} -08/30/2021 16:28:29 - INFO - __main__ - Step 18013: {'lr': 0.0004856981390656008, 'samples': 3458496, 'steps': 18012, 'loss/train': 1.5568349361419678} -08/30/2021 16:28:30 - INFO - __main__ - Step 18014: {'lr': 0.00048569636985029664, 'samples': 3458688, 'steps': 18013, 'loss/train': 2.163891077041626} -08/30/2021 16:28:31 - INFO - __main__ - Step 18015: {'lr': 0.00048569460052879136, 'samples': 3458880, 'steps': 18014, 'loss/train': 1.916684627532959} -08/30/2021 16:28:32 - INFO - __main__ - Step 18016: {'lr': 0.0004856928311010857, 'samples': 3459072, 'steps': 18015, 'loss/train': 1.7760971784591675} -08/30/2021 16:28:32 - INFO - __main__ - Step 18017: {'lr': 0.00048569106156718045, 'samples': 3459264, 'steps': 18016, 'loss/train': 1.3841313123703003} -08/30/2021 16:28:32 - INFO - __main__ - Step 18018: {'lr': 0.00048568929192707657, 'samples': 3459456, 'steps': 18017, 'loss/train': 1.5409024953842163} -08/30/2021 16:28:33 - INFO - __main__ - Step 18019: {'lr': 0.0004856875221807746, 'samples': 3459648, 'steps': 18018, 'loss/train': 1.7263318300247192} -08/30/2021 16:28:35 - INFO - __main__ - Step 18020: {'lr': 0.0004856857523282755, 'samples': 3459840, 'steps': 18019, 'loss/train': 0.9564329385757446} -08/30/2021 16:28:35 - INFO - __main__ - Step 18021: {'lr': 0.0004856839823695801, 'samples': 3460032, 'steps': 18020, 'loss/train': 1.9314879179000854} -08/30/2021 16:28:36 - INFO - __main__ - Step 18022: {'lr': 0.00048568221230468905, 'samples': 3460224, 'steps': 18021, 'loss/train': 1.7067102193832397} -08/30/2021 16:28:36 - INFO - __main__ - Step 18023: {'lr': 0.0004856804421336033, 'samples': 3460416, 'steps': 18022, 'loss/train': 2.0386927127838135} -08/30/2021 16:28:36 - INFO - __main__ - Step 18024: {'lr': 0.0004856786718563235, 'samples': 3460608, 'steps': 18023, 'loss/train': 1.5910874605178833} -08/30/2021 16:28:38 - INFO - __main__ - Step 18025: {'lr': 0.0004856769014728506, 'samples': 3460800, 'steps': 18024, 'loss/train': 1.4760442972183228} -08/30/2021 16:28:38 - INFO - __main__ - Step 18026: {'lr': 0.0004856751309831853, 'samples': 3460992, 'steps': 18025, 'loss/train': 1.577941656112671} -08/30/2021 16:28:38 - INFO - __main__ - Step 18027: {'lr': 0.00048567336038732843, 'samples': 3461184, 'steps': 18026, 'loss/train': 1.6862093210220337} -08/30/2021 16:28:39 - INFO - __main__ - Step 18028: {'lr': 0.0004856715896852808, 'samples': 3461376, 'steps': 18027, 'loss/train': 1.8757396936416626} -08/30/2021 16:28:39 - INFO - __main__ - Step 18029: {'lr': 0.0004856698188770432, 'samples': 3461568, 'steps': 18028, 'loss/train': 1.694564700126648} -08/30/2021 16:28:41 - INFO - __main__ - Step 18030: {'lr': 0.0004856680479626163, 'samples': 3461760, 'steps': 18029, 'loss/train': 1.5136922597885132} -08/30/2021 16:28:41 - INFO - __main__ - Step 18031: {'lr': 0.0004856662769420012, 'samples': 3461952, 'steps': 18030, 'loss/train': 1.7104381322860718} -08/30/2021 16:28:41 - INFO - __main__ - Step 18032: {'lr': 0.0004856645058151984, 'samples': 3462144, 'steps': 18031, 'loss/train': 0.833308219909668} -08/30/2021 16:28:42 - INFO - __main__ - Step 18033: {'lr': 0.0004856627345822088, 'samples': 3462336, 'steps': 18032, 'loss/train': 0.7060480117797852} -08/30/2021 16:28:42 - INFO - __main__ - Step 18034: {'lr': 0.0004856609632430332, 'samples': 3462528, 'steps': 18033, 'loss/train': 1.5961253643035889} -08/30/2021 16:28:42 - INFO - __main__ - Step 18035: {'lr': 0.00048565919179767246, 'samples': 3462720, 'steps': 18034, 'loss/train': 1.7715524435043335} -08/30/2021 16:28:44 - INFO - __main__ - Step 18036: {'lr': 0.0004856574202461273, 'samples': 3462912, 'steps': 18035, 'loss/train': 0.9656311273574829} -08/30/2021 16:28:45 - INFO - __main__ - Step 18037: {'lr': 0.0004856556485883985, 'samples': 3463104, 'steps': 18036, 'loss/train': 1.2984038591384888} -08/30/2021 16:28:45 - INFO - __main__ - Step 18038: {'lr': 0.000485653876824487, 'samples': 3463296, 'steps': 18037, 'loss/train': 2.0501441955566406} -08/30/2021 16:28:45 - INFO - __main__ - Step 18039: {'lr': 0.00048565210495439337, 'samples': 3463488, 'steps': 18038, 'loss/train': 1.552443265914917} -08/30/2021 16:28:46 - INFO - __main__ - Step 18040: {'lr': 0.00048565033297811867, 'samples': 3463680, 'steps': 18039, 'loss/train': 1.5536558628082275} -08/30/2021 16:28:47 - INFO - __main__ - Step 18041: {'lr': 0.0004856485608956635, 'samples': 3463872, 'steps': 18040, 'loss/train': 1.036659836769104} -08/30/2021 16:28:48 - INFO - __main__ - Step 18042: {'lr': 0.00048564678870702873, 'samples': 3464064, 'steps': 18041, 'loss/train': 1.7979850769042969} -08/30/2021 16:28:48 - INFO - __main__ - Step 18043: {'lr': 0.00048564501641221516, 'samples': 3464256, 'steps': 18042, 'loss/train': 1.3544678688049316} -08/30/2021 16:28:48 - INFO - __main__ - Step 18044: {'lr': 0.00048564324401122357, 'samples': 3464448, 'steps': 18043, 'loss/train': 1.6906307935714722} -08/30/2021 16:28:49 - INFO - __main__ - Step 18045: {'lr': 0.0004856414715040548, 'samples': 3464640, 'steps': 18044, 'loss/train': 1.0748234987258911} -08/30/2021 16:28:50 - INFO - __main__ - Step 18046: {'lr': 0.0004856396988907096, 'samples': 3464832, 'steps': 18045, 'loss/train': 1.5081632137298584} -08/30/2021 16:28:51 - INFO - __main__ - Step 18047: {'lr': 0.00048563792617118876, 'samples': 3465024, 'steps': 18046, 'loss/train': 1.872005820274353} -08/30/2021 16:28:51 - INFO - __main__ - Step 18048: {'lr': 0.00048563615334549316, 'samples': 3465216, 'steps': 18047, 'loss/train': 2.1396422386169434} -08/30/2021 16:28:51 - INFO - __main__ - Step 18049: {'lr': 0.0004856343804136235, 'samples': 3465408, 'steps': 18048, 'loss/train': 1.707249641418457} -08/30/2021 16:28:52 - INFO - __main__ - Step 18050: {'lr': 0.0004856326073755806, 'samples': 3465600, 'steps': 18049, 'loss/train': 1.3193695545196533} -08/30/2021 16:28:53 - INFO - __main__ - Step 18051: {'lr': 0.0004856308342313653, 'samples': 3465792, 'steps': 18050, 'loss/train': 0.984358549118042} -08/30/2021 16:28:54 - INFO - __main__ - Step 18052: {'lr': 0.00048562906098097847, 'samples': 3465984, 'steps': 18051, 'loss/train': 1.6047166585922241} -08/30/2021 16:28:54 - INFO - __main__ - Step 18053: {'lr': 0.0004856272876244208, 'samples': 3466176, 'steps': 18052, 'loss/train': 1.973154902458191} -08/30/2021 16:28:54 - INFO - __main__ - Step 18054: {'lr': 0.000485625514161693, 'samples': 3466368, 'steps': 18053, 'loss/train': 1.4109480381011963} -08/30/2021 16:28:55 - INFO - __main__ - Step 18055: {'lr': 0.00048562374059279604, 'samples': 3466560, 'steps': 18054, 'loss/train': 1.571926474571228} -08/30/2021 16:28:56 - INFO - __main__ - Step 18056: {'lr': 0.00048562196691773066, 'samples': 3466752, 'steps': 18055, 'loss/train': 1.6709606647491455} -08/30/2021 16:28:57 - INFO - __main__ - Step 18057: {'lr': 0.00048562019313649766, 'samples': 3466944, 'steps': 18056, 'loss/train': 0.5680364370346069} -08/30/2021 16:28:57 - INFO - __main__ - Step 18058: {'lr': 0.0004856184192490979, 'samples': 3467136, 'steps': 18057, 'loss/train': 1.7736974954605103} -08/30/2021 16:28:57 - INFO - __main__ - Step 18059: {'lr': 0.000485616645255532, 'samples': 3467328, 'steps': 18058, 'loss/train': 1.9981396198272705} -08/30/2021 16:28:58 - INFO - __main__ - Step 18060: {'lr': 0.0004856148711558009, 'samples': 3467520, 'steps': 18059, 'loss/train': 1.743849754333496} -08/30/2021 16:28:58 - INFO - __main__ - Step 18061: {'lr': 0.00048561309694990543, 'samples': 3467712, 'steps': 18060, 'loss/train': 1.9952452182769775} -08/30/2021 16:29:00 - INFO - __main__ - Step 18062: {'lr': 0.00048561132263784634, 'samples': 3467904, 'steps': 18061, 'loss/train': 1.6193169355392456} -08/30/2021 16:29:00 - INFO - __main__ - Step 18063: {'lr': 0.00048560954821962434, 'samples': 3468096, 'steps': 18062, 'loss/train': 1.4820996522903442} -08/30/2021 16:29:01 - INFO - __main__ - Step 18064: {'lr': 0.0004856077736952404, 'samples': 3468288, 'steps': 18063, 'loss/train': 0.35932403802871704} -08/30/2021 16:29:01 - INFO - __main__ - Step 18065: {'lr': 0.00048560599906469513, 'samples': 3468480, 'steps': 18064, 'loss/train': 0.5257107615470886} -08/30/2021 16:29:01 - INFO - __main__ - Step 18066: {'lr': 0.00048560422432798956, 'samples': 3468672, 'steps': 18065, 'loss/train': 2.516770124435425} -08/30/2021 16:29:02 - INFO - __main__ - Step 18067: {'lr': 0.0004856024494851243, 'samples': 3468864, 'steps': 18066, 'loss/train': 1.6919971704483032} -08/30/2021 16:29:03 - INFO - __main__ - Step 18068: {'lr': 0.00048560067453610025, 'samples': 3469056, 'steps': 18067, 'loss/train': 1.546239972114563} -08/30/2021 16:29:04 - INFO - __main__ - Step 18069: {'lr': 0.00048559889948091814, 'samples': 3469248, 'steps': 18068, 'loss/train': 1.52725088596344} -08/30/2021 16:29:04 - INFO - __main__ - Step 18070: {'lr': 0.0004855971243195788, 'samples': 3469440, 'steps': 18069, 'loss/train': 1.8115290403366089} -08/30/2021 16:29:04 - INFO - __main__ - Step 18071: {'lr': 0.00048559534905208304, 'samples': 3469632, 'steps': 18070, 'loss/train': 1.6920514106750488} -08/30/2021 16:29:05 - INFO - __main__ - Step 18072: {'lr': 0.0004855935736784316, 'samples': 3469824, 'steps': 18071, 'loss/train': 1.7712047100067139} -08/30/2021 16:29:07 - INFO - __main__ - Step 18073: {'lr': 0.00048559179819862537, 'samples': 3470016, 'steps': 18072, 'loss/train': 1.6060940027236938} -08/30/2021 16:29:07 - INFO - __main__ - Step 18074: {'lr': 0.0004855900226126651, 'samples': 3470208, 'steps': 18073, 'loss/train': 1.5529301166534424} -08/30/2021 16:29:08 - INFO - __main__ - Step 18075: {'lr': 0.00048558824692055156, 'samples': 3470400, 'steps': 18074, 'loss/train': 1.69679594039917} -08/30/2021 16:29:08 - INFO - __main__ - Step 18076: {'lr': 0.0004855864711222857, 'samples': 3470592, 'steps': 18075, 'loss/train': 1.4229506254196167} -08/30/2021 16:29:09 - INFO - __main__ - Step 18077: {'lr': 0.0004855846952178682, 'samples': 3470784, 'steps': 18076, 'loss/train': 1.3505346775054932} -08/30/2021 16:29:09 - INFO - __main__ - Step 18078: {'lr': 0.0004855829192072998, 'samples': 3470976, 'steps': 18077, 'loss/train': 1.947479009628296} -08/30/2021 16:29:10 - INFO - __main__ - Step 18079: {'lr': 0.00048558114309058144, 'samples': 3471168, 'steps': 18078, 'loss/train': 2.2514586448669434} -08/30/2021 16:29:11 - INFO - __main__ - Step 18080: {'lr': 0.00048557936686771376, 'samples': 3471360, 'steps': 18079, 'loss/train': 1.5654730796813965} -08/30/2021 16:29:11 - INFO - __main__ - Step 18081: {'lr': 0.0004855775905386977, 'samples': 3471552, 'steps': 18080, 'loss/train': 1.4146381616592407} -08/30/2021 16:29:11 - INFO - __main__ - Step 18082: {'lr': 0.000485575814103534, 'samples': 3471744, 'steps': 18081, 'loss/train': 1.4612665176391602} -08/30/2021 16:29:12 - INFO - __main__ - Step 18083: {'lr': 0.0004855740375622235, 'samples': 3471936, 'steps': 18082, 'loss/train': 1.6697293519973755} -08/30/2021 16:29:13 - INFO - __main__ - Step 18084: {'lr': 0.00048557226091476704, 'samples': 3472128, 'steps': 18083, 'loss/train': 1.5470685958862305} -08/30/2021 16:29:14 - INFO - __main__ - Step 18085: {'lr': 0.0004855704841611652, 'samples': 3472320, 'steps': 18084, 'loss/train': 1.0351128578186035} -08/30/2021 16:29:14 - INFO - __main__ - Step 18086: {'lr': 0.00048556870730141906, 'samples': 3472512, 'steps': 18085, 'loss/train': 1.4645930528640747} -08/30/2021 16:29:15 - INFO - __main__ - Step 18087: {'lr': 0.00048556693033552926, 'samples': 3472704, 'steps': 18086, 'loss/train': 1.5588650703430176} -08/30/2021 16:29:15 - INFO - __main__ - Step 18088: {'lr': 0.0004855651532634966, 'samples': 3472896, 'steps': 18087, 'loss/train': 1.4824671745300293} -08/30/2021 16:29:17 - INFO - __main__ - Step 18089: {'lr': 0.00048556337608532196, 'samples': 3473088, 'steps': 18088, 'loss/train': 1.5125601291656494} -08/30/2021 16:29:17 - INFO - __main__ - Step 18090: {'lr': 0.00048556159880100604, 'samples': 3473280, 'steps': 18089, 'loss/train': 1.5799002647399902} -08/30/2021 16:29:17 - INFO - __main__ - Step 18091: {'lr': 0.00048555982141054976, 'samples': 3473472, 'steps': 18090, 'loss/train': 1.3235498666763306} -08/30/2021 16:29:18 - INFO - __main__ - Step 18092: {'lr': 0.0004855580439139539, 'samples': 3473664, 'steps': 18091, 'loss/train': 1.2626641988754272} -08/30/2021 16:29:18 - INFO - __main__ - Step 18093: {'lr': 0.00048555626631121906, 'samples': 3473856, 'steps': 18092, 'loss/train': 1.4647942781448364} -08/30/2021 16:29:20 - INFO - __main__ - Step 18094: {'lr': 0.0004855544886023463, 'samples': 3474048, 'steps': 18093, 'loss/train': 1.4743677377700806} -08/30/2021 16:29:20 - INFO - __main__ - Step 18095: {'lr': 0.00048555271078733637, 'samples': 3474240, 'steps': 18094, 'loss/train': 1.375719666481018} -08/30/2021 16:29:20 - INFO - __main__ - Step 18096: {'lr': 0.00048555093286618996, 'samples': 3474432, 'steps': 18095, 'loss/train': 2.1218225955963135} -08/30/2021 16:29:21 - INFO - __main__ - Step 18097: {'lr': 0.0004855491548389079, 'samples': 3474624, 'steps': 18096, 'loss/train': 1.4977178573608398} -08/30/2021 16:29:21 - INFO - __main__ - Step 18098: {'lr': 0.0004855473767054911, 'samples': 3474816, 'steps': 18097, 'loss/train': 1.7799386978149414} -08/30/2021 16:29:23 - INFO - __main__ - Step 18099: {'lr': 0.00048554559846594026, 'samples': 3475008, 'steps': 18098, 'loss/train': 1.7905550003051758} -08/30/2021 16:29:23 - INFO - __main__ - Step 18100: {'lr': 0.0004855438201202562, 'samples': 3475200, 'steps': 18099, 'loss/train': 1.3962756395339966} -08/30/2021 16:29:23 - INFO - __main__ - Step 18101: {'lr': 0.0004855420416684398, 'samples': 3475392, 'steps': 18100, 'loss/train': 1.8041163682937622} -08/30/2021 16:29:24 - INFO - __main__ - Step 18102: {'lr': 0.0004855402631104917, 'samples': 3475584, 'steps': 18101, 'loss/train': 0.3637233376502991} -08/30/2021 16:29:24 - INFO - __main__ - Step 18103: {'lr': 0.0004855384844464128, 'samples': 3475776, 'steps': 18102, 'loss/train': 1.7341152429580688} -08/30/2021 16:29:24 - INFO - __main__ - Step 18104: {'lr': 0.00048553670567620395, 'samples': 3475968, 'steps': 18103, 'loss/train': 1.2765697240829468} -08/30/2021 16:29:26 - INFO - __main__ - Step 18105: {'lr': 0.0004855349267998659, 'samples': 3476160, 'steps': 18104, 'loss/train': 1.5414867401123047} -08/30/2021 16:29:26 - INFO - __main__ - Step 18106: {'lr': 0.0004855331478173994, 'samples': 3476352, 'steps': 18105, 'loss/train': 2.287764310836792} -08/30/2021 16:29:27 - INFO - __main__ - Step 18107: {'lr': 0.0004855313687288053, 'samples': 3476544, 'steps': 18106, 'loss/train': 1.6214512586593628} -08/30/2021 16:29:27 - INFO - __main__ - Step 18108: {'lr': 0.00048552958953408437, 'samples': 3476736, 'steps': 18107, 'loss/train': 1.9014850854873657} -08/30/2021 16:29:28 - INFO - __main__ - Step 18109: {'lr': 0.0004855278102332375, 'samples': 3476928, 'steps': 18108, 'loss/train': 1.979744791984558} -08/30/2021 16:29:29 - INFO - __main__ - Step 18110: {'lr': 0.0004855260308262654, 'samples': 3477120, 'steps': 18109, 'loss/train': 1.468855857849121} -08/30/2021 16:29:30 - INFO - __main__ - Step 18111: {'lr': 0.00048552425131316893, 'samples': 3477312, 'steps': 18110, 'loss/train': 2.183777093887329} -08/30/2021 16:29:30 - INFO - __main__ - Step 18112: {'lr': 0.0004855224716939488, 'samples': 3477504, 'steps': 18111, 'loss/train': 1.2424217462539673} -08/30/2021 16:29:30 - INFO - __main__ - Step 18113: {'lr': 0.0004855206919686059, 'samples': 3477696, 'steps': 18112, 'loss/train': 1.9680477380752563} -08/30/2021 16:29:31 - INFO - __main__ - Step 18114: {'lr': 0.0004855189121371411, 'samples': 3477888, 'steps': 18113, 'loss/train': 1.4735645055770874} -08/30/2021 16:29:32 - INFO - __main__ - Step 18115: {'lr': 0.00048551713219955505, 'samples': 3478080, 'steps': 18114, 'loss/train': 1.5061053037643433} -08/30/2021 16:29:32 - INFO - __main__ - Step 18116: {'lr': 0.00048551535215584865, 'samples': 3478272, 'steps': 18115, 'loss/train': 1.6229461431503296} -08/30/2021 16:29:33 - INFO - __main__ - Step 18117: {'lr': 0.00048551357200602265, 'samples': 3478464, 'steps': 18116, 'loss/train': 0.8685430288314819} -08/30/2021 16:29:33 - INFO - __main__ - Step 18118: {'lr': 0.0004855117917500778, 'samples': 3478656, 'steps': 18117, 'loss/train': 1.8633511066436768} -08/30/2021 16:29:34 - INFO - __main__ - Step 18119: {'lr': 0.000485510011388015, 'samples': 3478848, 'steps': 18118, 'loss/train': 1.6058130264282227} -08/30/2021 16:29:35 - INFO - __main__ - Step 18120: {'lr': 0.00048550823091983507, 'samples': 3479040, 'steps': 18119, 'loss/train': 0.5264639258384705} -08/30/2021 16:29:36 - INFO - __main__ - Step 18121: {'lr': 0.00048550645034553877, 'samples': 3479232, 'steps': 18120, 'loss/train': 1.413364052772522} -08/30/2021 16:29:36 - INFO - __main__ - Step 18122: {'lr': 0.00048550466966512684, 'samples': 3479424, 'steps': 18121, 'loss/train': 1.579680323600769} -08/30/2021 16:29:36 - INFO - __main__ - Step 18123: {'lr': 0.0004855028888786002, 'samples': 3479616, 'steps': 18122, 'loss/train': 1.9736636877059937} -08/30/2021 16:29:37 - INFO - __main__ - Step 18124: {'lr': 0.00048550110798595953, 'samples': 3479808, 'steps': 18123, 'loss/train': 1.5097899436950684} -08/30/2021 16:29:39 - INFO - __main__ - Step 18125: {'lr': 0.0004854993269872057, 'samples': 3480000, 'steps': 18124, 'loss/train': 1.5835509300231934} -08/30/2021 16:29:39 - INFO - __main__ - Step 18126: {'lr': 0.0004854975458823396, 'samples': 3480192, 'steps': 18125, 'loss/train': 2.423356056213379} -08/30/2021 16:29:39 - INFO - __main__ - Step 18127: {'lr': 0.0004854957646713618, 'samples': 3480384, 'steps': 18126, 'loss/train': 1.6631091833114624} -08/30/2021 16:29:40 - INFO - __main__ - Step 18128: {'lr': 0.00048549398335427337, 'samples': 3480576, 'steps': 18127, 'loss/train': 1.527232050895691} -08/30/2021 16:29:40 - INFO - __main__ - Step 18129: {'lr': 0.0004854922019310749, 'samples': 3480768, 'steps': 18128, 'loss/train': 1.6804276704788208} -08/30/2021 16:29:42 - INFO - __main__ - Step 18130: {'lr': 0.0004854904204017673, 'samples': 3480960, 'steps': 18129, 'loss/train': 1.1936918497085571} -08/30/2021 16:29:43 - INFO - __main__ - Step 18131: {'lr': 0.0004854886387663514, 'samples': 3481152, 'steps': 18130, 'loss/train': 2.179919481277466} -08/30/2021 16:29:43 - INFO - __main__ - Step 18132: {'lr': 0.0004854868570248279, 'samples': 3481344, 'steps': 18131, 'loss/train': 1.3007756471633911} -08/30/2021 16:29:43 - INFO - __main__ - Step 18133: {'lr': 0.00048548507517719766, 'samples': 3481536, 'steps': 18132, 'loss/train': 1.2625625133514404} -08/30/2021 16:29:44 - INFO - __main__ - Step 18134: {'lr': 0.0004854832932234615, 'samples': 3481728, 'steps': 18133, 'loss/train': 1.6213260889053345} -08/30/2021 16:29:44 - INFO - __main__ - Step 18135: {'lr': 0.0004854815111636202, 'samples': 3481920, 'steps': 18134, 'loss/train': 1.7813739776611328} -08/30/2021 16:29:45 - INFO - __main__ - Step 18136: {'lr': 0.00048547972899767454, 'samples': 3482112, 'steps': 18135, 'loss/train': 1.9012194871902466} -08/30/2021 16:29:46 - INFO - __main__ - Step 18137: {'lr': 0.0004854779467256254, 'samples': 3482304, 'steps': 18136, 'loss/train': 1.1619831323623657} -08/30/2021 16:29:46 - INFO - __main__ - Step 18138: {'lr': 0.00048547616434747344, 'samples': 3482496, 'steps': 18137, 'loss/train': 1.0694165229797363} -08/30/2021 16:29:47 - INFO - __main__ - Step 18139: {'lr': 0.0004854743818632196, 'samples': 3482688, 'steps': 18138, 'loss/train': 0.7140091061592102} -08/30/2021 16:29:47 - INFO - __main__ - Step 18140: {'lr': 0.0004854725992728647, 'samples': 3482880, 'steps': 18139, 'loss/train': 1.559740424156189} -08/30/2021 16:29:48 - INFO - __main__ - Step 18141: {'lr': 0.00048547081657640935, 'samples': 3483072, 'steps': 18140, 'loss/train': 1.8245887756347656} -08/30/2021 16:29:49 - INFO - __main__ - Step 18142: {'lr': 0.00048546903377385457, 'samples': 3483264, 'steps': 18141, 'loss/train': 0.4078364372253418} -08/30/2021 16:29:49 - INFO - __main__ - Step 18143: {'lr': 0.00048546725086520107, 'samples': 3483456, 'steps': 18142, 'loss/train': 2.0865206718444824} -08/30/2021 16:29:50 - INFO - __main__ - Step 18144: {'lr': 0.00048546546785044965, 'samples': 3483648, 'steps': 18143, 'loss/train': 1.1922963857650757} -08/30/2021 16:29:50 - INFO - __main__ - Step 18145: {'lr': 0.00048546368472960114, 'samples': 3483840, 'steps': 18144, 'loss/train': 1.7791651487350464} -08/30/2021 16:29:51 - INFO - __main__ - Step 18146: {'lr': 0.00048546190150265634, 'samples': 3484032, 'steps': 18145, 'loss/train': 1.6271249055862427} -08/30/2021 16:29:52 - INFO - __main__ - Step 18147: {'lr': 0.00048546011816961597, 'samples': 3484224, 'steps': 18146, 'loss/train': 1.6857608556747437} -08/30/2021 16:29:52 - INFO - __main__ - Step 18148: {'lr': 0.00048545833473048094, 'samples': 3484416, 'steps': 18147, 'loss/train': 1.4611496925354004} -08/30/2021 16:29:52 - INFO - __main__ - Step 18149: {'lr': 0.00048545655118525206, 'samples': 3484608, 'steps': 18148, 'loss/train': 1.7676684856414795} -08/30/2021 16:29:53 - INFO - __main__ - Step 18150: {'lr': 0.00048545476753393004, 'samples': 3484800, 'steps': 18149, 'loss/train': 1.7006365060806274} -08/30/2021 16:29:55 - INFO - __main__ - Step 18151: {'lr': 0.0004854529837765158, 'samples': 3484992, 'steps': 18150, 'loss/train': 2.1798832416534424} -08/30/2021 16:29:55 - INFO - __main__ - Step 18152: {'lr': 0.00048545119991301, 'samples': 3485184, 'steps': 18151, 'loss/train': 0.24442991614341736} -08/30/2021 16:29:55 - INFO - __main__ - Step 18153: {'lr': 0.0004854494159434135, 'samples': 3485376, 'steps': 18152, 'loss/train': 0.07093805074691772} -08/30/2021 16:29:56 - INFO - __main__ - Step 18154: {'lr': 0.0004854476318677272, 'samples': 3485568, 'steps': 18153, 'loss/train': 2.1398026943206787} -08/30/2021 16:29:56 - INFO - __main__ - Step 18155: {'lr': 0.00048544584768595185, 'samples': 3485760, 'steps': 18154, 'loss/train': 1.5284425020217896} -08/30/2021 16:29:56 - INFO - __main__ - Step 18156: {'lr': 0.00048544406339808823, 'samples': 3485952, 'steps': 18155, 'loss/train': 1.9047931432724} -08/30/2021 16:29:58 - INFO - __main__ - Step 18157: {'lr': 0.00048544227900413706, 'samples': 3486144, 'steps': 18156, 'loss/train': 1.0087835788726807} -08/30/2021 16:29:58 - INFO - __main__ - Step 18158: {'lr': 0.0004854404945040993, 'samples': 3486336, 'steps': 18157, 'loss/train': 1.7160950899124146} -08/30/2021 16:29:59 - INFO - __main__ - Step 18159: {'lr': 0.0004854387098979757, 'samples': 3486528, 'steps': 18158, 'loss/train': 2.1456117630004883} -08/30/2021 16:29:59 - INFO - __main__ - Step 18160: {'lr': 0.000485436925185767, 'samples': 3486720, 'steps': 18159, 'loss/train': 1.3853322267532349} -08/30/2021 16:29:59 - INFO - __main__ - Step 18161: {'lr': 0.00048543514036747404, 'samples': 3486912, 'steps': 18160, 'loss/train': 2.0687689781188965} -08/30/2021 16:30:01 - INFO - __main__ - Step 18162: {'lr': 0.00048543335544309776, 'samples': 3487104, 'steps': 18161, 'loss/train': 1.7371457815170288} -08/30/2021 16:30:02 - INFO - __main__ - Step 18163: {'lr': 0.00048543157041263876, 'samples': 3487296, 'steps': 18162, 'loss/train': 1.9401506185531616} -08/30/2021 16:30:02 - INFO - __main__ - Step 18164: {'lr': 0.0004854297852760979, 'samples': 3487488, 'steps': 18163, 'loss/train': 1.199976921081543} -08/30/2021 16:30:03 - INFO - __main__ - Step 18165: {'lr': 0.000485428000033476, 'samples': 3487680, 'steps': 18164, 'loss/train': 1.9119760990142822} -08/30/2021 16:30:03 - INFO - __main__ - Step 18166: {'lr': 0.00048542621468477393, 'samples': 3487872, 'steps': 18165, 'loss/train': 1.1560609340667725} -08/30/2021 16:30:03 - INFO - __main__ - Step 18167: {'lr': 0.0004854244292299924, 'samples': 3488064, 'steps': 18166, 'loss/train': 1.251025676727295} -08/30/2021 16:30:04 - INFO - __main__ - Step 18168: {'lr': 0.0004854226436691323, 'samples': 3488256, 'steps': 18167, 'loss/train': 0.1865871548652649} -08/30/2021 16:30:05 - INFO - __main__ - Step 18169: {'lr': 0.0004854208580021944, 'samples': 3488448, 'steps': 18168, 'loss/train': 0.15591633319854736} -08/30/2021 16:30:06 - INFO - __main__ - Step 18170: {'lr': 0.00048541907222917946, 'samples': 3488640, 'steps': 18169, 'loss/train': 2.0507378578186035} -08/30/2021 16:30:06 - INFO - __main__ - Step 18171: {'lr': 0.0004854172863500883, 'samples': 3488832, 'steps': 18170, 'loss/train': 1.788221001625061} -08/30/2021 16:30:06 - INFO - __main__ - Step 18172: {'lr': 0.00048541550036492175, 'samples': 3489024, 'steps': 18171, 'loss/train': 2.480135679244995} -08/30/2021 16:30:07 - INFO - __main__ - Step 18173: {'lr': 0.00048541371427368064, 'samples': 3489216, 'steps': 18172, 'loss/train': 2.4320027828216553} -08/30/2021 16:30:08 - INFO - __main__ - Step 18174: {'lr': 0.0004854119280763657, 'samples': 3489408, 'steps': 18173, 'loss/train': 1.6566660404205322} -08/30/2021 16:30:09 - INFO - __main__ - Step 18175: {'lr': 0.00048541014177297783, 'samples': 3489600, 'steps': 18174, 'loss/train': 1.9397094249725342} -08/30/2021 16:30:09 - INFO - __main__ - Step 18176: {'lr': 0.0004854083553635178, 'samples': 3489792, 'steps': 18175, 'loss/train': 1.500089406967163} -08/30/2021 16:30:10 - INFO - __main__ - Step 18177: {'lr': 0.00048540656884798626, 'samples': 3489984, 'steps': 18176, 'loss/train': 1.5683972835540771} -08/30/2021 16:30:10 - INFO - __main__ - Step 18178: {'lr': 0.0004854047822263843, 'samples': 3490176, 'steps': 18177, 'loss/train': 1.6979554891586304} -08/30/2021 16:30:10 - INFO - __main__ - Step 18179: {'lr': 0.00048540299549871256, 'samples': 3490368, 'steps': 18178, 'loss/train': 0.07497352361679077} -08/30/2021 16:30:11 - INFO - __main__ - Step 18180: {'lr': 0.0004854012086649718, 'samples': 3490560, 'steps': 18179, 'loss/train': 0.6716282367706299} -08/30/2021 16:30:12 - INFO - __main__ - Step 18181: {'lr': 0.00048539942172516295, 'samples': 3490752, 'steps': 18180, 'loss/train': 0.06318680942058563} -08/30/2021 16:30:13 - INFO - __main__ - Step 18182: {'lr': 0.00048539763467928665, 'samples': 3490944, 'steps': 18181, 'loss/train': 1.983986496925354} -08/30/2021 16:30:13 - INFO - __main__ - Step 18183: {'lr': 0.0004853958475273439, 'samples': 3491136, 'steps': 18182, 'loss/train': 1.9680562019348145} -08/30/2021 16:30:13 - INFO - __main__ - Step 18184: {'lr': 0.0004853940602693354, 'samples': 3491328, 'steps': 18183, 'loss/train': 1.910803198814392} -08/30/2021 16:30:14 - INFO - __main__ - Step 18185: {'lr': 0.00048539227290526194, 'samples': 3491520, 'steps': 18184, 'loss/train': 1.7229681015014648} -08/30/2021 16:30:16 - INFO - __main__ - Step 18186: {'lr': 0.00048539048543512443, 'samples': 3491712, 'steps': 18185, 'loss/train': 1.7122142314910889} -08/30/2021 16:30:17 - INFO - __main__ - Step 18187: {'lr': 0.0004853886978589235, 'samples': 3491904, 'steps': 18186, 'loss/train': 1.6136554479599} -08/30/2021 16:30:17 - INFO - __main__ - Step 18188: {'lr': 0.0004853869101766601, 'samples': 3492096, 'steps': 18187, 'loss/train': 1.744834303855896} -08/30/2021 16:30:17 - INFO - __main__ - Step 18189: {'lr': 0.000485385122388335, 'samples': 3492288, 'steps': 18188, 'loss/train': 1.8125004768371582} -08/30/2021 16:30:18 - INFO - __main__ - Step 18190: {'lr': 0.000485383334493949, 'samples': 3492480, 'steps': 18189, 'loss/train': 0.11176054179668427} -08/30/2021 16:30:19 - INFO - __main__ - Step 18191: {'lr': 0.00048538154649350286, 'samples': 3492672, 'steps': 18190, 'loss/train': 1.5933929681777954} -08/30/2021 16:30:20 - INFO - __main__ - Step 18192: {'lr': 0.00048537975838699744, 'samples': 3492864, 'steps': 18191, 'loss/train': 1.4787840843200684} -08/30/2021 16:30:20 - INFO - __main__ - Step 18193: {'lr': 0.0004853779701744335, 'samples': 3493056, 'steps': 18192, 'loss/train': 1.5653127431869507} -08/30/2021 16:30:20 - INFO - __main__ - Step 18194: {'lr': 0.000485376181855812, 'samples': 3493248, 'steps': 18193, 'loss/train': 1.5043683052062988} -08/30/2021 16:30:21 - INFO - __main__ - Step 18195: {'lr': 0.00048537439343113354, 'samples': 3493440, 'steps': 18194, 'loss/train': 1.4824970960617065} -08/30/2021 16:30:21 - INFO - __main__ - Step 18196: {'lr': 0.000485372604900399, 'samples': 3493632, 'steps': 18195, 'loss/train': 1.315542459487915} -08/30/2021 16:30:22 - INFO - __main__ - Step 18197: {'lr': 0.0004853708162636092, 'samples': 3493824, 'steps': 18196, 'loss/train': 1.5427913665771484} -08/30/2021 16:30:23 - INFO - __main__ - Step 18198: {'lr': 0.00048536902752076494, 'samples': 3494016, 'steps': 18197, 'loss/train': 1.4136998653411865} -08/30/2021 16:30:23 - INFO - __main__ - Step 18199: {'lr': 0.00048536723867186705, 'samples': 3494208, 'steps': 18198, 'loss/train': 2.3811869621276855} -08/30/2021 16:30:24 - INFO - __main__ - Step 18200: {'lr': 0.0004853654497169163, 'samples': 3494400, 'steps': 18199, 'loss/train': 1.7197117805480957} -08/30/2021 16:30:24 - INFO - __main__ - Step 18201: {'lr': 0.00048536366065591354, 'samples': 3494592, 'steps': 18200, 'loss/train': 1.966328740119934} -08/30/2021 16:30:25 - INFO - __main__ - Step 18202: {'lr': 0.00048536187148885956, 'samples': 3494784, 'steps': 18201, 'loss/train': 1.398764729499817} -08/30/2021 16:30:26 - INFO - __main__ - Step 18203: {'lr': 0.0004853600822157551, 'samples': 3494976, 'steps': 18202, 'loss/train': 1.0334347486495972} -08/30/2021 16:30:26 - INFO - __main__ - Step 18204: {'lr': 0.000485358292836601, 'samples': 3495168, 'steps': 18203, 'loss/train': 2.1281890869140625} -08/30/2021 16:30:27 - INFO - __main__ - Step 18205: {'lr': 0.0004853565033513982, 'samples': 3495360, 'steps': 18204, 'loss/train': 0.22665266692638397} -08/30/2021 16:30:27 - INFO - __main__ - Step 18206: {'lr': 0.0004853547137601473, 'samples': 3495552, 'steps': 18205, 'loss/train': 1.2151612043380737} -08/30/2021 16:30:29 - INFO - __main__ - Step 18207: {'lr': 0.0004853529240628493, 'samples': 3495744, 'steps': 18206, 'loss/train': 1.48349928855896} -08/30/2021 16:30:29 - INFO - __main__ - Step 18208: {'lr': 0.00048535113425950474, 'samples': 3495936, 'steps': 18207, 'loss/train': 1.808370590209961} -08/30/2021 16:30:29 - INFO - __main__ - Step 18209: {'lr': 0.0004853493443501147, 'samples': 3496128, 'steps': 18208, 'loss/train': 0.945346474647522} -08/30/2021 16:30:30 - INFO - __main__ - Step 18210: {'lr': 0.0004853475543346798, 'samples': 3496320, 'steps': 18209, 'loss/train': 1.5416520833969116} -08/30/2021 16:30:30 - INFO - __main__ - Step 18211: {'lr': 0.000485345764213201, 'samples': 3496512, 'steps': 18210, 'loss/train': 1.618773102760315} -08/30/2021 16:30:30 - INFO - __main__ - Step 18212: {'lr': 0.00048534397398567895, 'samples': 3496704, 'steps': 18211, 'loss/train': 1.5082675218582153} -08/30/2021 16:30:32 - INFO - __main__ - Step 18213: {'lr': 0.00048534218365211456, 'samples': 3496896, 'steps': 18212, 'loss/train': 0.14711081981658936} -08/30/2021 16:30:32 - INFO - __main__ - Step 18214: {'lr': 0.0004853403932125087, 'samples': 3497088, 'steps': 18213, 'loss/train': 1.564862608909607} -08/30/2021 16:30:33 - INFO - __main__ - Step 18215: {'lr': 0.00048533860266686203, 'samples': 3497280, 'steps': 18214, 'loss/train': 2.049409866333008} -08/30/2021 16:30:33 - INFO - __main__ - Step 18216: {'lr': 0.0004853368120151754, 'samples': 3497472, 'steps': 18215, 'loss/train': 1.8001041412353516} -08/30/2021 16:30:33 - INFO - __main__ - Step 18217: {'lr': 0.00048533502125744967, 'samples': 3497664, 'steps': 18216, 'loss/train': 1.8892565965652466} -08/30/2021 16:30:35 - INFO - __main__ - Step 18218: {'lr': 0.0004853332303936856, 'samples': 3497856, 'steps': 18217, 'loss/train': 1.4445117712020874} -08/30/2021 16:30:35 - INFO - __main__ - Step 18219: {'lr': 0.000485331439423884, 'samples': 3498048, 'steps': 18218, 'loss/train': 1.5056453943252563} -08/30/2021 16:30:36 - INFO - __main__ - Step 18220: {'lr': 0.00048532964834804566, 'samples': 3498240, 'steps': 18219, 'loss/train': 0.9864267706871033} -08/30/2021 16:30:36 - INFO - __main__ - Step 18221: {'lr': 0.00048532785716617145, 'samples': 3498432, 'steps': 18220, 'loss/train': 1.4905229806900024} -08/30/2021 16:30:37 - INFO - __main__ - Step 18222: {'lr': 0.0004853260658782621, 'samples': 3498624, 'steps': 18221, 'loss/train': 1.4205816984176636} -08/30/2021 16:30:38 - INFO - __main__ - Step 18223: {'lr': 0.0004853242744843185, 'samples': 3498816, 'steps': 18222, 'loss/train': 2.076859712600708} -08/30/2021 16:30:38 - INFO - __main__ - Step 18224: {'lr': 0.0004853224829843414, 'samples': 3499008, 'steps': 18223, 'loss/train': 2.2336368560791016} -08/30/2021 16:30:39 - INFO - __main__ - Step 18225: {'lr': 0.00048532069137833156, 'samples': 3499200, 'steps': 18224, 'loss/train': 1.8242483139038086} -08/30/2021 16:30:39 - INFO - __main__ - Step 18226: {'lr': 0.00048531889966628997, 'samples': 3499392, 'steps': 18225, 'loss/train': 1.3434109687805176} -08/30/2021 16:30:40 - INFO - __main__ - Step 18227: {'lr': 0.00048531710784821726, 'samples': 3499584, 'steps': 18226, 'loss/train': 1.7954832315444946} -08/30/2021 16:30:41 - INFO - __main__ - Step 18228: {'lr': 0.0004853153159241143, 'samples': 3499776, 'steps': 18227, 'loss/train': 1.3241018056869507} -08/30/2021 16:30:41 - INFO - __main__ - Step 18229: {'lr': 0.0004853135238939818, 'samples': 3499968, 'steps': 18228, 'loss/train': 1.6579416990280151} -08/30/2021 16:30:42 - INFO - __main__ - Step 18230: {'lr': 0.0004853117317578207, 'samples': 3500160, 'steps': 18229, 'loss/train': 2.469796657562256} -08/30/2021 16:30:42 - INFO - __main__ - Step 18231: {'lr': 0.00048530993951563186, 'samples': 3500352, 'steps': 18230, 'loss/train': 1.4420359134674072} -08/30/2021 16:30:42 - INFO - __main__ - Step 18232: {'lr': 0.0004853081471674159, 'samples': 3500544, 'steps': 18231, 'loss/train': 1.3792097568511963} -08/30/2021 16:30:43 - INFO - __main__ - Step 18233: {'lr': 0.00048530635471317373, 'samples': 3500736, 'steps': 18232, 'loss/train': 1.8431075811386108} -08/30/2021 16:30:45 - INFO - __main__ - Step 18234: {'lr': 0.0004853045621529062, 'samples': 3500928, 'steps': 18233, 'loss/train': 0.8953320980072021} -08/30/2021 16:30:45 - INFO - __main__ - Step 18235: {'lr': 0.000485302769486614, 'samples': 3501120, 'steps': 18234, 'loss/train': 1.5394054651260376} -08/30/2021 16:30:45 - INFO - __main__ - Step 18236: {'lr': 0.000485300976714298, 'samples': 3501312, 'steps': 18235, 'loss/train': 1.4558779001235962} -08/30/2021 16:30:46 - INFO - __main__ - Step 18237: {'lr': 0.00048529918383595906, 'samples': 3501504, 'steps': 18236, 'loss/train': 1.3067607879638672} -08/30/2021 16:30:46 - INFO - __main__ - Step 18238: {'lr': 0.0004852973908515979, 'samples': 3501696, 'steps': 18237, 'loss/train': 0.7174292802810669} -08/30/2021 16:30:48 - INFO - __main__ - Step 18239: {'lr': 0.0004852955977612154, 'samples': 3501888, 'steps': 18238, 'loss/train': 1.5812405347824097} -08/30/2021 16:30:49 - INFO - __main__ - Step 18240: {'lr': 0.0004852938045648123, 'samples': 3502080, 'steps': 18239, 'loss/train': 1.4285887479782104} -08/30/2021 16:30:49 - INFO - __main__ - Step 18241: {'lr': 0.0004852920112623895, 'samples': 3502272, 'steps': 18240, 'loss/train': 2.0259315967559814} -08/30/2021 16:30:49 - INFO - __main__ - Step 18242: {'lr': 0.00048529021785394765, 'samples': 3502464, 'steps': 18241, 'loss/train': 1.8416999578475952} -08/30/2021 16:30:50 - INFO - __main__ - Step 18243: {'lr': 0.00048528842433948776, 'samples': 3502656, 'steps': 18242, 'loss/train': 1.518181324005127} -08/30/2021 16:30:52 - INFO - __main__ - Step 18244: {'lr': 0.00048528663071901047, 'samples': 3502848, 'steps': 18243, 'loss/train': 1.5467149019241333} -08/30/2021 16:30:52 - INFO - __main__ - Step 18245: {'lr': 0.0004852848369925167, 'samples': 3503040, 'steps': 18244, 'loss/train': 2.726255416870117} -08/30/2021 16:30:53 - INFO - __main__ - Step 18246: {'lr': 0.00048528304316000723, 'samples': 3503232, 'steps': 18245, 'loss/train': 1.824460744857788} -08/30/2021 16:30:53 - INFO - __main__ - Step 18247: {'lr': 0.0004852812492214828, 'samples': 3503424, 'steps': 18246, 'loss/train': 1.953322172164917} -08/30/2021 16:30:53 - INFO - __main__ - Step 18248: {'lr': 0.0004852794551769443, 'samples': 3503616, 'steps': 18247, 'loss/train': 2.5393340587615967} -08/30/2021 16:30:54 - INFO - __main__ - Step 18249: {'lr': 0.0004852776610263925, 'samples': 3503808, 'steps': 18248, 'loss/train': 2.7364838123321533} -08/30/2021 16:30:54 - INFO - __main__ - Step 18250: {'lr': 0.0004852758667698282, 'samples': 3504000, 'steps': 18249, 'loss/train': 1.9968701601028442} -08/30/2021 16:30:56 - INFO - __main__ - Step 18251: {'lr': 0.00048527407240725223, 'samples': 3504192, 'steps': 18250, 'loss/train': 2.165238618850708} -08/30/2021 16:30:56 - INFO - __main__ - Step 18252: {'lr': 0.0004852722779386654, 'samples': 3504384, 'steps': 18251, 'loss/train': 2.3952183723449707} -08/30/2021 16:30:57 - INFO - __main__ - Step 18253: {'lr': 0.00048527048336406855, 'samples': 3504576, 'steps': 18252, 'loss/train': 2.9041616916656494} -08/30/2021 16:30:57 - INFO - __main__ - Step 18254: {'lr': 0.00048526868868346243, 'samples': 3504768, 'steps': 18253, 'loss/train': 2.2178878784179688} -08/30/2021 16:30:57 - INFO - __main__ - Step 18255: {'lr': 0.0004852668938968478, 'samples': 3504960, 'steps': 18254, 'loss/train': 2.0800187587738037} -08/30/2021 16:30:59 - INFO - __main__ - Step 18256: {'lr': 0.0004852650990042256, 'samples': 3505152, 'steps': 18255, 'loss/train': 1.8880712985992432} -08/30/2021 16:31:00 - INFO - __main__ - Step 18257: {'lr': 0.0004852633040055966, 'samples': 3505344, 'steps': 18256, 'loss/train': 2.0610196590423584} -08/30/2021 16:31:00 - INFO - __main__ - Step 18258: {'lr': 0.00048526150890096153, 'samples': 3505536, 'steps': 18257, 'loss/train': 1.6383503675460815} -08/30/2021 16:31:00 - INFO - __main__ - Step 18259: {'lr': 0.0004852597136903213, 'samples': 3505728, 'steps': 18258, 'loss/train': 0.2615097165107727} -08/30/2021 16:31:01 - INFO - __main__ - Step 18260: {'lr': 0.0004852579183736766, 'samples': 3505920, 'steps': 18259, 'loss/train': 1.326377511024475} -08/30/2021 16:31:01 - INFO - __main__ - Step 18261: {'lr': 0.00048525612295102836, 'samples': 3506112, 'steps': 18260, 'loss/train': 2.922910213470459} -08/30/2021 16:31:02 - INFO - __main__ - Step 18262: {'lr': 0.00048525432742237736, 'samples': 3506304, 'steps': 18261, 'loss/train': 0.17876708507537842} -08/30/2021 16:31:03 - INFO - __main__ - Step 18263: {'lr': 0.00048525253178772435, 'samples': 3506496, 'steps': 18262, 'loss/train': 1.77130925655365} -08/30/2021 16:31:03 - INFO - __main__ - Step 18264: {'lr': 0.0004852507360470702, 'samples': 3506688, 'steps': 18263, 'loss/train': 1.9590058326721191} -08/30/2021 16:31:04 - INFO - __main__ - Step 18265: {'lr': 0.0004852489402004157, 'samples': 3506880, 'steps': 18264, 'loss/train': 1.867340087890625} -08/30/2021 16:31:04 - INFO - __main__ - Step 18266: {'lr': 0.0004852471442477617, 'samples': 3507072, 'steps': 18265, 'loss/train': 1.7032133340835571} -08/30/2021 16:31:06 - INFO - __main__ - Step 18267: {'lr': 0.0004852453481891089, 'samples': 3507264, 'steps': 18266, 'loss/train': 1.5362731218338013} -08/30/2021 16:31:06 - INFO - __main__ - Step 18268: {'lr': 0.00048524355202445827, 'samples': 3507456, 'steps': 18267, 'loss/train': 2.047058343887329} -08/30/2021 16:31:06 - INFO - __main__ - Step 18269: {'lr': 0.0004852417557538104, 'samples': 3507648, 'steps': 18268, 'loss/train': 1.3270645141601562} -08/30/2021 16:31:07 - INFO - __main__ - Step 18270: {'lr': 0.00048523995937716625, 'samples': 3507840, 'steps': 18269, 'loss/train': 1.3608251810073853} -08/30/2021 16:31:07 - INFO - __main__ - Step 18271: {'lr': 0.0004852381628945267, 'samples': 3508032, 'steps': 18270, 'loss/train': 2.296241521835327} -08/30/2021 16:31:09 - INFO - __main__ - Step 18272: {'lr': 0.0004852363663058924, 'samples': 3508224, 'steps': 18271, 'loss/train': 1.6583689451217651} -08/30/2021 16:31:09 - INFO - __main__ - Step 18273: {'lr': 0.0004852345696112642, 'samples': 3508416, 'steps': 18272, 'loss/train': 1.4764230251312256} -08/30/2021 16:31:09 - INFO - __main__ - Step 18274: {'lr': 0.00048523277281064295, 'samples': 3508608, 'steps': 18273, 'loss/train': 1.6788078546524048} -08/30/2021 16:31:10 - INFO - __main__ - Step 18275: {'lr': 0.0004852309759040294, 'samples': 3508800, 'steps': 18274, 'loss/train': 1.5933668613433838} -08/30/2021 16:31:10 - INFO - __main__ - Step 18276: {'lr': 0.00048522917889142446, 'samples': 3508992, 'steps': 18275, 'loss/train': 1.636905550956726} -08/30/2021 16:31:10 - INFO - __main__ - Step 18277: {'lr': 0.00048522738177282887, 'samples': 3509184, 'steps': 18276, 'loss/train': 1.4415043592453003} -08/30/2021 16:31:12 - INFO - __main__ - Step 18278: {'lr': 0.0004852255845482435, 'samples': 3509376, 'steps': 18277, 'loss/train': 1.8900659084320068} -08/30/2021 16:31:13 - INFO - __main__ - Step 18279: {'lr': 0.0004852237872176691, 'samples': 3509568, 'steps': 18278, 'loss/train': 0.18102802336215973} -08/30/2021 16:31:13 - INFO - __main__ - Step 18280: {'lr': 0.00048522198978110645, 'samples': 3509760, 'steps': 18279, 'loss/train': 1.3858753442764282} -08/30/2021 16:31:13 - INFO - __main__ - Step 18281: {'lr': 0.0004852201922385564, 'samples': 3509952, 'steps': 18280, 'loss/train': 1.6936274766921997} -08/30/2021 16:31:14 - INFO - __main__ - Step 18282: {'lr': 0.00048521839459001977, 'samples': 3510144, 'steps': 18281, 'loss/train': 1.615212082862854} -08/30/2021 16:31:15 - INFO - __main__ - Step 18283: {'lr': 0.0004852165968354973, 'samples': 3510336, 'steps': 18282, 'loss/train': 1.8196706771850586} -08/30/2021 16:31:16 - INFO - __main__ - Step 18284: {'lr': 0.00048521479897499, 'samples': 3510528, 'steps': 18283, 'loss/train': 1.353030800819397} -08/30/2021 16:31:16 - INFO - __main__ - Step 18285: {'lr': 0.0004852130010084984, 'samples': 3510720, 'steps': 18284, 'loss/train': 1.5243914127349854} -08/30/2021 16:31:16 - INFO - __main__ - Step 18286: {'lr': 0.0004852112029360235, 'samples': 3510912, 'steps': 18285, 'loss/train': 1.9026896953582764} -08/30/2021 16:31:17 - INFO - __main__ - Step 18287: {'lr': 0.0004852094047575661, 'samples': 3511104, 'steps': 18286, 'loss/train': 2.0276737213134766} -08/30/2021 16:31:17 - INFO - __main__ - Step 18288: {'lr': 0.00048520760647312696, 'samples': 3511296, 'steps': 18287, 'loss/train': 1.7218397855758667} -08/30/2021 16:31:19 - INFO - __main__ - Step 18289: {'lr': 0.00048520580808270687, 'samples': 3511488, 'steps': 18288, 'loss/train': 1.6105717420578003} -08/30/2021 16:31:19 - INFO - __main__ - Step 18290: {'lr': 0.0004852040095863067, 'samples': 3511680, 'steps': 18289, 'loss/train': 1.9469579458236694} -08/30/2021 16:31:19 - INFO - __main__ - Step 18291: {'lr': 0.0004852022109839273, 'samples': 3511872, 'steps': 18290, 'loss/train': 0.3960586488246918} -08/30/2021 16:31:20 - INFO - __main__ - Step 18292: {'lr': 0.0004852004122755693, 'samples': 3512064, 'steps': 18291, 'loss/train': 2.3295421600341797} -08/30/2021 16:31:20 - INFO - __main__ - Step 18293: {'lr': 0.00048519861346123363, 'samples': 3512256, 'steps': 18292, 'loss/train': 1.4214847087860107} -08/30/2021 16:31:22 - INFO - __main__ - Step 18294: {'lr': 0.0004851968145409211, 'samples': 3512448, 'steps': 18293, 'loss/train': 1.611711025238037} -08/30/2021 16:31:22 - INFO - __main__ - Step 18295: {'lr': 0.00048519501551463255, 'samples': 3512640, 'steps': 18294, 'loss/train': 2.0002479553222656} -08/30/2021 16:31:22 - INFO - __main__ - Step 18296: {'lr': 0.0004851932163823688, 'samples': 3512832, 'steps': 18295, 'loss/train': 1.2055373191833496} -08/30/2021 16:31:23 - INFO - __main__ - Step 18297: {'lr': 0.0004851914171441305, 'samples': 3513024, 'steps': 18296, 'loss/train': 1.1820570230484009} -08/30/2021 16:31:23 - INFO - __main__ - Step 18298: {'lr': 0.00048518961779991866, 'samples': 3513216, 'steps': 18297, 'loss/train': 2.120363235473633} -08/30/2021 16:31:26 - INFO - __main__ - Step 18299: {'lr': 0.00048518781834973405, 'samples': 3513408, 'steps': 18298, 'loss/train': 1.4115668535232544} -08/30/2021 16:31:26 - INFO - __main__ - Step 18300: {'lr': 0.0004851860187935773, 'samples': 3513600, 'steps': 18299, 'loss/train': 1.4641038179397583} -08/30/2021 16:31:27 - INFO - __main__ - Step 18301: {'lr': 0.0004851842191314494, 'samples': 3513792, 'steps': 18300, 'loss/train': 2.2291409969329834} -08/30/2021 16:31:27 - INFO - __main__ - Step 18302: {'lr': 0.0004851824193633512, 'samples': 3513984, 'steps': 18301, 'loss/train': 1.5605565309524536} -08/30/2021 16:31:27 - INFO - __main__ - Step 18303: {'lr': 0.00048518061948928337, 'samples': 3514176, 'steps': 18302, 'loss/train': 1.9699370861053467} -08/30/2021 16:31:28 - INFO - __main__ - Step 18304: {'lr': 0.0004851788195092468, 'samples': 3514368, 'steps': 18303, 'loss/train': 0.10047666728496552} -08/30/2021 16:31:28 - INFO - __main__ - Step 18305: {'lr': 0.00048517701942324225, 'samples': 3514560, 'steps': 18304, 'loss/train': 1.6972315311431885} -08/30/2021 16:31:29 - INFO - __main__ - Step 18306: {'lr': 0.00048517521923127063, 'samples': 3514752, 'steps': 18305, 'loss/train': 1.4234768152236938} -08/30/2021 16:31:30 - INFO - __main__ - Step 18307: {'lr': 0.00048517341893333267, 'samples': 3514944, 'steps': 18306, 'loss/train': 1.5142172574996948} -08/30/2021 16:31:30 - INFO - __main__ - Step 18308: {'lr': 0.0004851716185294291, 'samples': 3515136, 'steps': 18307, 'loss/train': 2.0314602851867676} -08/30/2021 16:31:31 - INFO - __main__ - Step 18309: {'lr': 0.00048516981801956097, 'samples': 3515328, 'steps': 18308, 'loss/train': 1.5293121337890625} -08/30/2021 16:31:31 - INFO - __main__ - Step 18310: {'lr': 0.00048516801740372886, 'samples': 3515520, 'steps': 18309, 'loss/train': 1.6754064559936523} -08/30/2021 16:31:33 - INFO - __main__ - Step 18311: {'lr': 0.0004851662166819337, 'samples': 3515712, 'steps': 18310, 'loss/train': 1.343644618988037} -08/30/2021 16:31:33 - INFO - __main__ - Step 18312: {'lr': 0.00048516441585417624, 'samples': 3515904, 'steps': 18311, 'loss/train': 1.9953339099884033} -08/30/2021 16:31:33 - INFO - __main__ - Step 18313: {'lr': 0.0004851626149204573, 'samples': 3516096, 'steps': 18312, 'loss/train': 1.207190990447998} -08/30/2021 16:31:34 - INFO - __main__ - Step 18314: {'lr': 0.0004851608138807778, 'samples': 3516288, 'steps': 18313, 'loss/train': 1.730093002319336} -08/30/2021 16:31:34 - INFO - __main__ - Step 18315: {'lr': 0.0004851590127351384, 'samples': 3516480, 'steps': 18314, 'loss/train': 2.054384708404541} -08/30/2021 16:31:36 - INFO - __main__ - Step 18316: {'lr': 0.0004851572114835401, 'samples': 3516672, 'steps': 18315, 'loss/train': 2.286177158355713} -08/30/2021 16:31:36 - INFO - __main__ - Step 18317: {'lr': 0.0004851554101259834, 'samples': 3516864, 'steps': 18316, 'loss/train': 1.541135311126709} -08/30/2021 16:31:37 - INFO - __main__ - Step 18318: {'lr': 0.00048515360866246943, 'samples': 3517056, 'steps': 18317, 'loss/train': 1.7443363666534424} -08/30/2021 16:31:37 - INFO - __main__ - Step 18319: {'lr': 0.00048515180709299884, 'samples': 3517248, 'steps': 18318, 'loss/train': 3.8915019035339355} -08/30/2021 16:31:37 - INFO - __main__ - Step 18320: {'lr': 0.0004851500054175725, 'samples': 3517440, 'steps': 18319, 'loss/train': 1.7440677881240845} -08/30/2021 16:31:39 - INFO - __main__ - Step 18321: {'lr': 0.00048514820363619116, 'samples': 3517632, 'steps': 18320, 'loss/train': 0.1379471719264984} -08/30/2021 16:31:39 - INFO - __main__ - Step 18322: {'lr': 0.0004851464017488556, 'samples': 3517824, 'steps': 18321, 'loss/train': 0.9234429597854614} -08/30/2021 16:31:40 - INFO - __main__ - Step 18323: {'lr': 0.0004851445997555668, 'samples': 3518016, 'steps': 18322, 'loss/train': 2.0152969360351562} -08/30/2021 16:31:40 - INFO - __main__ - Step 18324: {'lr': 0.00048514279765632547, 'samples': 3518208, 'steps': 18323, 'loss/train': 1.6747567653656006} -08/30/2021 16:31:40 - INFO - __main__ - Step 18325: {'lr': 0.0004851409954511324, 'samples': 3518400, 'steps': 18324, 'loss/train': 1.8239686489105225} -08/30/2021 16:31:42 - INFO - __main__ - Step 18326: {'lr': 0.0004851391931399884, 'samples': 3518592, 'steps': 18325, 'loss/train': 1.2097152471542358} -08/30/2021 16:31:42 - INFO - __main__ - Step 18327: {'lr': 0.0004851373907228943, 'samples': 3518784, 'steps': 18326, 'loss/train': 1.3782691955566406} -08/30/2021 16:31:43 - INFO - __main__ - Step 18328: {'lr': 0.00048513558819985106, 'samples': 3518976, 'steps': 18327, 'loss/train': 1.735744595527649} -08/30/2021 16:31:43 - INFO - __main__ - Step 18329: {'lr': 0.0004851337855708592, 'samples': 3519168, 'steps': 18328, 'loss/train': 1.9939866065979004} -08/30/2021 16:31:43 - INFO - __main__ - Step 18330: {'lr': 0.0004851319828359198, 'samples': 3519360, 'steps': 18329, 'loss/train': 1.025618076324463} -08/30/2021 16:31:45 - INFO - __main__ - Step 18331: {'lr': 0.0004851301799950334, 'samples': 3519552, 'steps': 18330, 'loss/train': 2.0228524208068848} -08/30/2021 16:31:45 - INFO - __main__ - Step 18332: {'lr': 0.00048512837704820107, 'samples': 3519744, 'steps': 18331, 'loss/train': 1.407360315322876} -08/30/2021 16:31:46 - INFO - __main__ - Step 18333: {'lr': 0.00048512657399542346, 'samples': 3519936, 'steps': 18332, 'loss/train': 1.6591839790344238} -08/30/2021 16:31:46 - INFO - __main__ - Step 18334: {'lr': 0.0004851247708367015, 'samples': 3520128, 'steps': 18333, 'loss/train': 5.407085418701172} -08/30/2021 16:31:46 - INFO - __main__ - Step 18335: {'lr': 0.000485122967572036, 'samples': 3520320, 'steps': 18334, 'loss/train': 1.739969253540039} -08/30/2021 16:31:47 - INFO - __main__ - Step 18336: {'lr': 0.0004851211642014276, 'samples': 3520512, 'steps': 18335, 'loss/train': 1.5402262210845947} -08/30/2021 16:31:48 - INFO - __main__ - Step 18337: {'lr': 0.0004851193607248773, 'samples': 3520704, 'steps': 18336, 'loss/train': 2.23903489112854} -08/30/2021 16:31:49 - INFO - __main__ - Step 18338: {'lr': 0.00048511755714238585, 'samples': 3520896, 'steps': 18337, 'loss/train': 1.6420117616653442} -08/30/2021 16:31:49 - INFO - __main__ - Step 18339: {'lr': 0.0004851157534539541, 'samples': 3521088, 'steps': 18338, 'loss/train': 2.079241991043091} -08/30/2021 16:31:49 - INFO - __main__ - Step 18340: {'lr': 0.0004851139496595827, 'samples': 3521280, 'steps': 18339, 'loss/train': 1.5721169710159302} -08/30/2021 16:31:50 - INFO - __main__ - Step 18341: {'lr': 0.00048511214575927265, 'samples': 3521472, 'steps': 18340, 'loss/train': 2.0448737144470215} -08/30/2021 16:31:51 - INFO - __main__ - Step 18342: {'lr': 0.0004851103417530247, 'samples': 3521664, 'steps': 18341, 'loss/train': 1.964516282081604} -08/30/2021 16:31:52 - INFO - __main__ - Step 18343: {'lr': 0.0004851085376408396, 'samples': 3521856, 'steps': 18342, 'loss/train': 1.792725920677185} -08/30/2021 16:31:52 - INFO - __main__ - Step 18344: {'lr': 0.0004851067334227183, 'samples': 3522048, 'steps': 18343, 'loss/train': 1.1735317707061768} -08/30/2021 16:31:52 - INFO - __main__ - Step 18345: {'lr': 0.0004851049290986615, 'samples': 3522240, 'steps': 18344, 'loss/train': 2.0181925296783447} -08/30/2021 16:31:53 - INFO - __main__ - Step 18346: {'lr': 0.00048510312466867, 'samples': 3522432, 'steps': 18345, 'loss/train': 1.9342454671859741} -08/30/2021 16:31:54 - INFO - __main__ - Step 18347: {'lr': 0.0004851013201327448, 'samples': 3522624, 'steps': 18346, 'loss/train': 1.4876445531845093} -08/30/2021 16:31:55 - INFO - __main__ - Step 18348: {'lr': 0.0004850995154908864, 'samples': 3522816, 'steps': 18347, 'loss/train': 1.9688720703125} -08/30/2021 16:31:55 - INFO - __main__ - Step 18349: {'lr': 0.0004850977107430959, 'samples': 3523008, 'steps': 18348, 'loss/train': 1.1184128522872925} -08/30/2021 16:31:55 - INFO - __main__ - Step 18350: {'lr': 0.000485095905889374, 'samples': 3523200, 'steps': 18349, 'loss/train': 1.152635097503662} -08/30/2021 16:31:56 - INFO - __main__ - Step 18351: {'lr': 0.00048509410092972144, 'samples': 3523392, 'steps': 18350, 'loss/train': 1.8936458826065063} -08/30/2021 16:31:58 - INFO - __main__ - Step 18352: {'lr': 0.0004850922958641392, 'samples': 3523584, 'steps': 18351, 'loss/train': 1.6338152885437012} -08/30/2021 16:31:58 - INFO - __main__ - Step 18353: {'lr': 0.0004850904906926279, 'samples': 3523776, 'steps': 18352, 'loss/train': 1.175215721130371} -08/30/2021 16:31:58 - INFO - __main__ - Step 18354: {'lr': 0.0004850886854151885, 'samples': 3523968, 'steps': 18353, 'loss/train': 1.374414086341858} -08/30/2021 16:31:59 - INFO - __main__ - Step 18355: {'lr': 0.0004850868800318218, 'samples': 3524160, 'steps': 18354, 'loss/train': 1.856572151184082} -08/30/2021 16:31:59 - INFO - __main__ - Step 18356: {'lr': 0.00048508507454252846, 'samples': 3524352, 'steps': 18355, 'loss/train': 1.1230909824371338} -08/30/2021 16:31:59 - INFO - __main__ - Step 18357: {'lr': 0.00048508326894730955, 'samples': 3524544, 'steps': 18356, 'loss/train': 2.62599515914917} -08/30/2021 16:32:01 - INFO - __main__ - Step 18358: {'lr': 0.00048508146324616566, 'samples': 3524736, 'steps': 18357, 'loss/train': 1.2977162599563599} -08/30/2021 16:32:01 - INFO - __main__ - Step 18359: {'lr': 0.0004850796574390977, 'samples': 3524928, 'steps': 18358, 'loss/train': 1.9402198791503906} -08/30/2021 16:32:02 - INFO - __main__ - Step 18360: {'lr': 0.0004850778515261065, 'samples': 3525120, 'steps': 18359, 'loss/train': 1.5444425344467163} -08/30/2021 16:32:02 - INFO - __main__ - Step 18361: {'lr': 0.0004850760455071929, 'samples': 3525312, 'steps': 18360, 'loss/train': 1.594689965248108} -08/30/2021 16:32:02 - INFO - __main__ - Step 18362: {'lr': 0.0004850742393823576, 'samples': 3525504, 'steps': 18361, 'loss/train': 0.8999673128128052} -08/30/2021 16:32:04 - INFO - __main__ - Step 18363: {'lr': 0.0004850724331516014, 'samples': 3525696, 'steps': 18362, 'loss/train': 1.3309015035629272} -08/30/2021 16:32:04 - INFO - __main__ - Step 18364: {'lr': 0.0004850706268149253, 'samples': 3525888, 'steps': 18363, 'loss/train': 1.3089945316314697} -08/30/2021 16:32:05 - INFO - __main__ - Step 18365: {'lr': 0.00048506882037233, 'samples': 3526080, 'steps': 18364, 'loss/train': 1.3521586656570435} -08/30/2021 16:32:05 - INFO - __main__ - Step 18366: {'lr': 0.0004850670138238162, 'samples': 3526272, 'steps': 18365, 'loss/train': 1.974701166152954} -08/30/2021 16:32:06 - INFO - __main__ - Step 18367: {'lr': 0.00048506520716938496, 'samples': 3526464, 'steps': 18366, 'loss/train': 1.5892881155014038} -08/30/2021 16:32:07 - INFO - __main__ - Step 18368: {'lr': 0.00048506340040903697, 'samples': 3526656, 'steps': 18367, 'loss/train': 1.944163203239441} -08/30/2021 16:32:08 - INFO - __main__ - Step 18369: {'lr': 0.00048506159354277294, 'samples': 3526848, 'steps': 18368, 'loss/train': 2.3988265991210938} -08/30/2021 16:32:08 - INFO - __main__ - Step 18370: {'lr': 0.00048505978657059385, 'samples': 3527040, 'steps': 18369, 'loss/train': 1.93350350856781} -08/30/2021 16:32:08 - INFO - __main__ - Step 18371: {'lr': 0.0004850579794925004, 'samples': 3527232, 'steps': 18370, 'loss/train': 2.4299449920654297} -08/30/2021 16:32:09 - INFO - __main__ - Step 18372: {'lr': 0.0004850561723084935, 'samples': 3527424, 'steps': 18371, 'loss/train': 1.7484010457992554} -08/30/2021 16:32:10 - INFO - __main__ - Step 18373: {'lr': 0.0004850543650185739, 'samples': 3527616, 'steps': 18372, 'loss/train': 1.9789292812347412} -08/30/2021 16:32:11 - INFO - __main__ - Step 18374: {'lr': 0.0004850525576227425, 'samples': 3527808, 'steps': 18373, 'loss/train': 1.1833218336105347} -08/30/2021 16:32:11 - INFO - __main__ - Step 18375: {'lr': 0.000485050750121, 'samples': 3528000, 'steps': 18374, 'loss/train': 1.0919058322906494} -08/30/2021 16:32:11 - INFO - __main__ - Step 18376: {'lr': 0.0004850489425133472, 'samples': 3528192, 'steps': 18375, 'loss/train': 1.805298089981079} -08/30/2021 16:32:12 - INFO - __main__ - Step 18377: {'lr': 0.000485047134799785, 'samples': 3528384, 'steps': 18376, 'loss/train': 1.5543766021728516} -08/30/2021 16:32:14 - INFO - __main__ - Step 18378: {'lr': 0.00048504532698031416, 'samples': 3528576, 'steps': 18377, 'loss/train': 1.73404061794281} -08/30/2021 16:32:14 - INFO - __main__ - Step 18379: {'lr': 0.0004850435190549356, 'samples': 3528768, 'steps': 18378, 'loss/train': 1.9069091081619263} -08/30/2021 16:32:14 - INFO - __main__ - Step 18380: {'lr': 0.00048504171102365, 'samples': 3528960, 'steps': 18379, 'loss/train': 1.5401171445846558} -08/30/2021 16:32:15 - INFO - __main__ - Step 18381: {'lr': 0.0004850399028864583, 'samples': 3529152, 'steps': 18380, 'loss/train': 0.7602036595344543} -08/30/2021 16:32:15 - INFO - __main__ - Step 18382: {'lr': 0.0004850380946433611, 'samples': 3529344, 'steps': 18381, 'loss/train': 2.0335865020751953} -08/30/2021 16:32:15 - INFO - __main__ - Step 18383: {'lr': 0.00048503628629435947, 'samples': 3529536, 'steps': 18382, 'loss/train': 1.367948055267334} -08/30/2021 16:32:17 - INFO - __main__ - Step 18384: {'lr': 0.0004850344778394541, 'samples': 3529728, 'steps': 18383, 'loss/train': 1.0850682258605957} -08/30/2021 16:32:18 - INFO - __main__ - Step 18385: {'lr': 0.0004850326692786459, 'samples': 3529920, 'steps': 18384, 'loss/train': 2.2030513286590576} -08/30/2021 16:32:18 - INFO - __main__ - Step 18386: {'lr': 0.00048503086061193546, 'samples': 3530112, 'steps': 18385, 'loss/train': 2.3353638648986816} -08/30/2021 16:32:18 - INFO - __main__ - Step 18387: {'lr': 0.0004850290518393238, 'samples': 3530304, 'steps': 18386, 'loss/train': 1.7692161798477173} -08/30/2021 16:32:19 - INFO - __main__ - Step 18388: {'lr': 0.0004850272429608117, 'samples': 3530496, 'steps': 18387, 'loss/train': 1.059675693511963} -08/30/2021 16:32:20 - INFO - __main__ - Step 18389: {'lr': 0.0004850254339764, 'samples': 3530688, 'steps': 18388, 'loss/train': 1.7607570886611938} -08/30/2021 16:32:21 - INFO - __main__ - Step 18390: {'lr': 0.00048502362488608933, 'samples': 3530880, 'steps': 18389, 'loss/train': 1.701917290687561} -08/30/2021 16:32:21 - INFO - __main__ - Step 18391: {'lr': 0.0004850218156898807, 'samples': 3531072, 'steps': 18390, 'loss/train': 1.5931764841079712} -08/30/2021 16:32:21 - INFO - __main__ - Step 18392: {'lr': 0.00048502000638777487, 'samples': 3531264, 'steps': 18391, 'loss/train': 2.0616695880889893} -08/30/2021 16:32:22 - INFO - __main__ - Step 18393: {'lr': 0.0004850181969797727, 'samples': 3531456, 'steps': 18392, 'loss/train': 0.8655185103416443} -08/30/2021 16:32:23 - INFO - __main__ - Step 18394: {'lr': 0.00048501638746587493, 'samples': 3531648, 'steps': 18393, 'loss/train': 1.868634819984436} -08/30/2021 16:32:24 - INFO - __main__ - Step 18395: {'lr': 0.0004850145778460824, 'samples': 3531840, 'steps': 18394, 'loss/train': 1.9058949947357178} -08/30/2021 16:32:24 - INFO - __main__ - Step 18396: {'lr': 0.00048501276812039585, 'samples': 3532032, 'steps': 18395, 'loss/train': 1.474753737449646} -08/30/2021 16:32:24 - INFO - __main__ - Step 18397: {'lr': 0.00048501095828881627, 'samples': 3532224, 'steps': 18396, 'loss/train': 1.768510103225708} -08/30/2021 16:32:25 - INFO - __main__ - Step 18398: {'lr': 0.00048500914835134434, 'samples': 3532416, 'steps': 18397, 'loss/train': 1.8040025234222412} -08/30/2021 16:32:25 - INFO - __main__ - Step 18399: {'lr': 0.00048500733830798094, 'samples': 3532608, 'steps': 18398, 'loss/train': 1.8621283769607544} -08/30/2021 16:32:26 - INFO - __main__ - Step 18400: {'lr': 0.00048500552815872687, 'samples': 3532800, 'steps': 18399, 'loss/train': 1.68860924243927} -08/30/2021 16:32:27 - INFO - __main__ - Step 18401: {'lr': 0.0004850037179035829, 'samples': 3532992, 'steps': 18400, 'loss/train': 2.0445046424865723} -08/30/2021 16:32:27 - INFO - __main__ - Step 18402: {'lr': 0.00048500190754254994, 'samples': 3533184, 'steps': 18401, 'loss/train': 1.752744197845459} -08/30/2021 16:32:28 - INFO - __main__ - Step 18403: {'lr': 0.00048500009707562865, 'samples': 3533376, 'steps': 18402, 'loss/train': 1.315450668334961} -08/30/2021 16:32:28 - INFO - __main__ - Step 18404: {'lr': 0.00048499828650281994, 'samples': 3533568, 'steps': 18403, 'loss/train': 0.9854258894920349} -08/30/2021 16:32:30 - INFO - __main__ - Step 18405: {'lr': 0.00048499647582412475, 'samples': 3533760, 'steps': 18404, 'loss/train': 2.5694668292999268} -08/30/2021 16:32:30 - INFO - __main__ - Step 18406: {'lr': 0.0004849946650395437, 'samples': 3533952, 'steps': 18405, 'loss/train': 1.2151046991348267} -08/30/2021 16:32:30 - INFO - __main__ - Step 18407: {'lr': 0.0004849928541490777, 'samples': 3534144, 'steps': 18406, 'loss/train': 0.6300547122955322} -08/30/2021 16:32:31 - INFO - __main__ - Step 18408: {'lr': 0.0004849910431527275, 'samples': 3534336, 'steps': 18407, 'loss/train': 1.6237766742706299} -08/30/2021 16:32:31 - INFO - __main__ - Step 18409: {'lr': 0.000484989232050494, 'samples': 3534528, 'steps': 18408, 'loss/train': 1.6840767860412598} -08/30/2021 16:32:33 - INFO - __main__ - Step 18410: {'lr': 0.00048498742084237796, 'samples': 3534720, 'steps': 18409, 'loss/train': 1.428397536277771} -08/30/2021 16:32:34 - INFO - __main__ - Step 18411: {'lr': 0.00048498560952838025, 'samples': 3534912, 'steps': 18410, 'loss/train': 1.7967861890792847} -08/30/2021 16:32:34 - INFO - __main__ - Step 18412: {'lr': 0.00048498379810850157, 'samples': 3535104, 'steps': 18411, 'loss/train': 1.5502450466156006} -08/30/2021 16:32:34 - INFO - __main__ - Step 18413: {'lr': 0.0004849819865827429, 'samples': 3535296, 'steps': 18412, 'loss/train': 1.7416106462478638} -08/30/2021 16:32:35 - INFO - __main__ - Step 18414: {'lr': 0.0004849801749511049, 'samples': 3535488, 'steps': 18413, 'loss/train': 2.118992805480957} -08/30/2021 16:32:36 - INFO - __main__ - Step 18415: {'lr': 0.00048497836321358855, 'samples': 3535680, 'steps': 18414, 'loss/train': 1.533248782157898} -08/30/2021 16:32:37 - INFO - __main__ - Step 18416: {'lr': 0.00048497655137019454, 'samples': 3535872, 'steps': 18415, 'loss/train': 1.6962758302688599} -08/30/2021 16:32:37 - INFO - __main__ - Step 18417: {'lr': 0.0004849747394209237, 'samples': 3536064, 'steps': 18416, 'loss/train': 1.527657151222229} -08/30/2021 16:32:37 - INFO - __main__ - Step 18418: {'lr': 0.00048497292736577685, 'samples': 3536256, 'steps': 18417, 'loss/train': 1.5346958637237549} -08/30/2021 16:32:38 - INFO - __main__ - Step 18419: {'lr': 0.0004849711152047549, 'samples': 3536448, 'steps': 18418, 'loss/train': 1.7111904621124268} -08/30/2021 16:32:38 - INFO - __main__ - Step 18420: {'lr': 0.0004849693029378585, 'samples': 3536640, 'steps': 18419, 'loss/train': 1.6931809186935425} -08/30/2021 16:32:39 - INFO - __main__ - Step 18421: {'lr': 0.0004849674905650886, 'samples': 3536832, 'steps': 18420, 'loss/train': 1.9758563041687012} -08/30/2021 16:32:40 - INFO - __main__ - Step 18422: {'lr': 0.000484965678086446, 'samples': 3537024, 'steps': 18421, 'loss/train': 1.5684478282928467} -08/30/2021 16:32:40 - INFO - __main__ - Step 18423: {'lr': 0.0004849638655019315, 'samples': 3537216, 'steps': 18422, 'loss/train': 1.285486102104187} -08/30/2021 16:32:41 - INFO - __main__ - Step 18424: {'lr': 0.0004849620528115458, 'samples': 3537408, 'steps': 18423, 'loss/train': 1.4267280101776123} -08/30/2021 16:32:41 - INFO - __main__ - Step 18425: {'lr': 0.0004849602400152899, 'samples': 3537600, 'steps': 18424, 'loss/train': 1.044335126876831} -08/30/2021 16:32:42 - INFO - __main__ - Step 18426: {'lr': 0.0004849584271131646, 'samples': 3537792, 'steps': 18425, 'loss/train': 1.9281814098358154} -08/30/2021 16:32:43 - INFO - __main__ - Step 18427: {'lr': 0.00048495661410517056, 'samples': 3537984, 'steps': 18426, 'loss/train': 1.8135710954666138} -08/30/2021 16:32:43 - INFO - __main__ - Step 18428: {'lr': 0.0004849548009913087, 'samples': 3538176, 'steps': 18427, 'loss/train': 3.7530477046966553} -08/30/2021 16:32:44 - INFO - __main__ - Step 18429: {'lr': 0.00048495298777157994, 'samples': 3538368, 'steps': 18428, 'loss/train': 1.0768924951553345} -08/30/2021 16:32:44 - INFO - __main__ - Step 18430: {'lr': 0.0004849511744459849, 'samples': 3538560, 'steps': 18429, 'loss/train': 1.7873797416687012} -08/30/2021 16:32:45 - INFO - __main__ - Step 18431: {'lr': 0.00048494936101452446, 'samples': 3538752, 'steps': 18430, 'loss/train': 1.1974409818649292} -08/30/2021 16:32:46 - INFO - __main__ - Step 18432: {'lr': 0.00048494754747719954, 'samples': 3538944, 'steps': 18431, 'loss/train': 2.0334620475769043} -08/30/2021 16:32:46 - INFO - __main__ - Step 18433: {'lr': 0.00048494573383401084, 'samples': 3539136, 'steps': 18432, 'loss/train': 1.6517343521118164} -08/30/2021 16:32:47 - INFO - __main__ - Step 18434: {'lr': 0.0004849439200849592, 'samples': 3539328, 'steps': 18433, 'loss/train': 1.7558435201644897} -08/30/2021 16:32:47 - INFO - __main__ - Step 18435: {'lr': 0.0004849421062300455, 'samples': 3539520, 'steps': 18434, 'loss/train': 1.7587658166885376} -08/30/2021 16:32:48 - INFO - __main__ - Step 18436: {'lr': 0.0004849402922692705, 'samples': 3539712, 'steps': 18435, 'loss/train': 2.0340306758880615} -08/30/2021 16:32:49 - INFO - __main__ - Step 18437: {'lr': 0.000484938478202635, 'samples': 3539904, 'steps': 18436, 'loss/train': 1.9905076026916504} -08/30/2021 16:32:49 - INFO - __main__ - Step 18438: {'lr': 0.0004849366640301399, 'samples': 3540096, 'steps': 18437, 'loss/train': 1.4739770889282227} -08/30/2021 16:32:50 - INFO - __main__ - Step 18439: {'lr': 0.00048493484975178593, 'samples': 3540288, 'steps': 18438, 'loss/train': 1.9535123109817505} -08/30/2021 16:32:50 - INFO - __main__ - Step 18440: {'lr': 0.00048493303536757394, 'samples': 3540480, 'steps': 18439, 'loss/train': 1.733303427696228} -08/30/2021 16:32:52 - INFO - __main__ - Step 18441: {'lr': 0.00048493122087750473, 'samples': 3540672, 'steps': 18440, 'loss/train': 1.183138370513916} -08/30/2021 16:32:52 - INFO - __main__ - Step 18442: {'lr': 0.0004849294062815792, 'samples': 3540864, 'steps': 18441, 'loss/train': 1.2568312883377075} -08/30/2021 16:32:52 - INFO - __main__ - Step 18443: {'lr': 0.000484927591579798, 'samples': 3541056, 'steps': 18442, 'loss/train': 1.481009840965271} -08/30/2021 16:32:53 - INFO - __main__ - Step 18444: {'lr': 0.0004849257767721622, 'samples': 3541248, 'steps': 18443, 'loss/train': 1.2963892221450806} -08/30/2021 16:32:53 - INFO - __main__ - Step 18445: {'lr': 0.00048492396185867236, 'samples': 3541440, 'steps': 18444, 'loss/train': 1.720694899559021} -08/30/2021 16:32:53 - INFO - __main__ - Step 18446: {'lr': 0.0004849221468393294, 'samples': 3541632, 'steps': 18445, 'loss/train': 1.6941791772842407} -08/30/2021 16:32:55 - INFO - __main__ - Step 18447: {'lr': 0.00048492033171413425, 'samples': 3541824, 'steps': 18446, 'loss/train': 1.7716199159622192} -08/30/2021 16:32:55 - INFO - __main__ - Step 18448: {'lr': 0.00048491851648308756, 'samples': 3542016, 'steps': 18447, 'loss/train': 1.8997448682785034} -08/30/2021 16:32:56 - INFO - __main__ - Step 18449: {'lr': 0.00048491670114619026, 'samples': 3542208, 'steps': 18448, 'loss/train': 0.9838755130767822} -08/30/2021 16:32:56 - INFO - __main__ - Step 18450: {'lr': 0.000484914885703443, 'samples': 3542400, 'steps': 18449, 'loss/train': 1.8256545066833496} -08/30/2021 16:32:56 - INFO - __main__ - Step 18451: {'lr': 0.00048491307015484684, 'samples': 3542592, 'steps': 18450, 'loss/train': 2.717716693878174} -08/30/2021 16:32:58 - INFO - __main__ - Step 18452: {'lr': 0.0004849112545004024, 'samples': 3542784, 'steps': 18451, 'loss/train': 1.6457176208496094} -08/30/2021 16:32:59 - INFO - __main__ - Step 18453: {'lr': 0.00048490943874011054, 'samples': 3542976, 'steps': 18452, 'loss/train': 1.8555002212524414} -08/30/2021 16:32:59 - INFO - __main__ - Step 18454: {'lr': 0.00048490762287397215, 'samples': 3543168, 'steps': 18453, 'loss/train': 0.8818188309669495} -08/30/2021 16:32:59 - INFO - __main__ - Step 18455: {'lr': 0.00048490580690198804, 'samples': 3543360, 'steps': 18454, 'loss/train': 1.917466163635254} -08/30/2021 16:33:00 - INFO - __main__ - Step 18456: {'lr': 0.000484903990824159, 'samples': 3543552, 'steps': 18455, 'loss/train': 1.6682443618774414} -08/30/2021 16:33:01 - INFO - __main__ - Step 18457: {'lr': 0.0004849021746404859, 'samples': 3543744, 'steps': 18456, 'loss/train': 1.5969135761260986} -08/30/2021 16:33:02 - INFO - __main__ - Step 18458: {'lr': 0.00048490035835096936, 'samples': 3543936, 'steps': 18457, 'loss/train': 1.598833441734314} -08/30/2021 16:33:02 - INFO - __main__ - Step 18459: {'lr': 0.0004848985419556104, 'samples': 3544128, 'steps': 18458, 'loss/train': 1.4627039432525635} -08/30/2021 16:33:03 - INFO - __main__ - Step 18460: {'lr': 0.0004848967254544099, 'samples': 3544320, 'steps': 18459, 'loss/train': 1.282549500465393} -08/30/2021 16:33:03 - INFO - __main__ - Step 18461: {'lr': 0.00048489490884736844, 'samples': 3544512, 'steps': 18460, 'loss/train': 1.6859853267669678} -08/30/2021 16:33:03 - INFO - __main__ - Step 18462: {'lr': 0.00048489309213448696, 'samples': 3544704, 'steps': 18461, 'loss/train': 0.12266451865434647} -08/30/2021 16:33:05 - INFO - __main__ - Step 18463: {'lr': 0.00048489127531576627, 'samples': 3544896, 'steps': 18462, 'loss/train': 2.86110258102417} -08/30/2021 16:33:06 - INFO - __main__ - Step 18464: {'lr': 0.0004848894583912072, 'samples': 3545088, 'steps': 18463, 'loss/train': 1.9362525939941406} -08/30/2021 16:33:06 - INFO - __main__ - Step 18465: {'lr': 0.00048488764136081063, 'samples': 3545280, 'steps': 18464, 'loss/train': 1.3914740085601807} -08/30/2021 16:33:07 - INFO - __main__ - Step 18466: {'lr': 0.00048488582422457726, 'samples': 3545472, 'steps': 18465, 'loss/train': 1.8300514221191406} -08/30/2021 16:33:07 - INFO - __main__ - Step 18467: {'lr': 0.000484884006982508, 'samples': 3545664, 'steps': 18466, 'loss/train': 1.2591675519943237} -08/30/2021 16:33:09 - INFO - __main__ - Step 18468: {'lr': 0.0004848821896346036, 'samples': 3545856, 'steps': 18467, 'loss/train': 1.572219967842102} -08/30/2021 16:33:09 - INFO - __main__ - Step 18469: {'lr': 0.0004848803721808649, 'samples': 3546048, 'steps': 18468, 'loss/train': 1.520451307296753} -08/30/2021 16:33:10 - INFO - __main__ - Step 18470: {'lr': 0.0004848785546212927, 'samples': 3546240, 'steps': 18469, 'loss/train': 1.6013100147247314} -08/30/2021 16:33:10 - INFO - __main__ - Step 18471: {'lr': 0.00048487673695588794, 'samples': 3546432, 'steps': 18470, 'loss/train': 0.8847469091415405} -08/30/2021 16:33:10 - INFO - __main__ - Step 18472: {'lr': 0.00048487491918465135, 'samples': 3546624, 'steps': 18471, 'loss/train': 1.629996418952942} -08/30/2021 16:33:11 - INFO - __main__ - Step 18473: {'lr': 0.00048487310130758366, 'samples': 3546816, 'steps': 18472, 'loss/train': 1.4766883850097656} -08/30/2021 16:33:12 - INFO - __main__ - Step 18474: {'lr': 0.00048487128332468576, 'samples': 3547008, 'steps': 18473, 'loss/train': 1.941003680229187} -08/30/2021 16:33:13 - INFO - __main__ - Step 18475: {'lr': 0.00048486946523595856, 'samples': 3547200, 'steps': 18474, 'loss/train': 1.760926604270935} -08/30/2021 16:33:13 - INFO - __main__ - Step 18476: {'lr': 0.00048486764704140276, 'samples': 3547392, 'steps': 18475, 'loss/train': 1.8866465091705322} -08/30/2021 16:33:13 - INFO - __main__ - Step 18477: {'lr': 0.00048486582874101924, 'samples': 3547584, 'steps': 18476, 'loss/train': 1.8096379041671753} -08/30/2021 16:33:14 - INFO - __main__ - Step 18478: {'lr': 0.0004848640103348088, 'samples': 3547776, 'steps': 18477, 'loss/train': 1.8322175741195679} -08/30/2021 16:33:15 - INFO - __main__ - Step 18479: {'lr': 0.00048486219182277226, 'samples': 3547968, 'steps': 18478, 'loss/train': 1.4215279817581177} -08/30/2021 16:33:15 - INFO - __main__ - Step 18480: {'lr': 0.00048486037320491043, 'samples': 3548160, 'steps': 18479, 'loss/train': 2.114464044570923} -08/30/2021 16:33:16 - INFO - __main__ - Step 18481: {'lr': 0.0004848585544812242, 'samples': 3548352, 'steps': 18480, 'loss/train': 2.0277700424194336} -08/30/2021 16:33:16 - INFO - __main__ - Step 18482: {'lr': 0.0004848567356517143, 'samples': 3548544, 'steps': 18481, 'loss/train': 1.935502290725708} -08/30/2021 16:33:17 - INFO - __main__ - Step 18483: {'lr': 0.00048485491671638146, 'samples': 3548736, 'steps': 18482, 'loss/train': 1.707394003868103} -08/30/2021 16:33:18 - INFO - __main__ - Step 18484: {'lr': 0.0004848530976752268, 'samples': 3548928, 'steps': 18483, 'loss/train': 1.799896001815796} -08/30/2021 16:33:19 - INFO - __main__ - Step 18485: {'lr': 0.0004848512785282508, 'samples': 3549120, 'steps': 18484, 'loss/train': 2.754084348678589} -08/30/2021 16:33:19 - INFO - __main__ - Step 18486: {'lr': 0.00048484945927545456, 'samples': 3549312, 'steps': 18485, 'loss/train': 1.213364601135254} -08/30/2021 16:33:19 - INFO - __main__ - Step 18487: {'lr': 0.0004848476399168387, 'samples': 3549504, 'steps': 18486, 'loss/train': 1.6225429773330688} -08/30/2021 16:33:20 - INFO - __main__ - Step 18488: {'lr': 0.0004848458204524042, 'samples': 3549696, 'steps': 18487, 'loss/train': 2.1874027252197266} -08/30/2021 16:33:21 - INFO - __main__ - Step 18489: {'lr': 0.00048484400088215173, 'samples': 3549888, 'steps': 18488, 'loss/train': 1.7116848230361938} -08/30/2021 16:33:22 - INFO - __main__ - Step 18490: {'lr': 0.0004848421812060821, 'samples': 3550080, 'steps': 18489, 'loss/train': 1.7499696016311646} -08/30/2021 16:33:22 - INFO - __main__ - Step 18491: {'lr': 0.0004848403614241964, 'samples': 3550272, 'steps': 18490, 'loss/train': 0.8672402501106262} -08/30/2021 16:33:23 - INFO - __main__ - Step 18492: {'lr': 0.00048483854153649514, 'samples': 3550464, 'steps': 18491, 'loss/train': 1.9149320125579834} -08/30/2021 16:33:23 - INFO - __main__ - Step 18493: {'lr': 0.0004848367215429793, 'samples': 3550656, 'steps': 18492, 'loss/train': 1.3062007427215576} -08/30/2021 16:33:23 - INFO - __main__ - Step 18494: {'lr': 0.0004848349014436496, 'samples': 3550848, 'steps': 18493, 'loss/train': 1.0269335508346558} -08/30/2021 16:33:24 - INFO - __main__ - Step 18495: {'lr': 0.00048483308123850697, 'samples': 3551040, 'steps': 18494, 'loss/train': 0.1711260974407196} -08/30/2021 16:33:25 - INFO - __main__ - Step 18496: {'lr': 0.00048483126092755215, 'samples': 3551232, 'steps': 18495, 'loss/train': 0.07490824162960052} -08/30/2021 16:33:26 - INFO - __main__ - Step 18497: {'lr': 0.000484829440510786, 'samples': 3551424, 'steps': 18496, 'loss/train': 0.0846533253788948} -08/30/2021 16:33:26 - INFO - __main__ - Step 18498: {'lr': 0.0004848276199882093, 'samples': 3551616, 'steps': 18497, 'loss/train': 0.7802138328552246} -08/30/2021 16:33:27 - INFO - __main__ - Step 18499: {'lr': 0.0004848257993598229, 'samples': 3551808, 'steps': 18498, 'loss/train': 1.7126972675323486} -08/30/2021 16:33:27 - INFO - __main__ - Step 18500: {'lr': 0.00048482397862562764, 'samples': 3552000, 'steps': 18499, 'loss/train': 4.151735782623291} -08/30/2021 16:33:29 - INFO - __main__ - Step 18501: {'lr': 0.00048482215778562434, 'samples': 3552192, 'steps': 18500, 'loss/train': 1.5678753852844238} -08/30/2021 16:33:29 - INFO - __main__ - Step 18502: {'lr': 0.00048482033683981376, 'samples': 3552384, 'steps': 18501, 'loss/train': 0.20393653213977814} -08/30/2021 16:33:30 - INFO - __main__ - Step 18503: {'lr': 0.0004848185157881968, 'samples': 3552576, 'steps': 18502, 'loss/train': 1.5224156379699707} -08/30/2021 16:33:30 - INFO - __main__ - Step 18504: {'lr': 0.0004848166946307742, 'samples': 3552768, 'steps': 18503, 'loss/train': 1.5995322465896606} -08/30/2021 16:33:31 - INFO - __main__ - Step 18505: {'lr': 0.0004848148733675468, 'samples': 3552960, 'steps': 18504, 'loss/train': 1.0265933275222778} -08/30/2021 16:33:31 - INFO - __main__ - Step 18506: {'lr': 0.0004848130519985155, 'samples': 3553152, 'steps': 18505, 'loss/train': 1.430309534072876} -08/30/2021 16:33:31 - INFO - __main__ - Step 18507: {'lr': 0.000484811230523681, 'samples': 3553344, 'steps': 18506, 'loss/train': 1.8822970390319824} -08/30/2021 16:33:33 - INFO - __main__ - Step 18508: {'lr': 0.00048480940894304425, 'samples': 3553536, 'steps': 18507, 'loss/train': 1.445253610610962} -08/30/2021 16:33:33 - INFO - __main__ - Step 18509: {'lr': 0.000484807587256606, 'samples': 3553728, 'steps': 18508, 'loss/train': 1.4174604415893555} -08/30/2021 16:33:34 - INFO - __main__ - Step 18510: {'lr': 0.00048480576546436707, 'samples': 3553920, 'steps': 18509, 'loss/train': 1.7771098613739014} -08/30/2021 16:33:34 - INFO - __main__ - Step 18511: {'lr': 0.0004848039435663282, 'samples': 3554112, 'steps': 18510, 'loss/train': 1.7104212045669556} -08/30/2021 16:33:34 - INFO - __main__ - Step 18512: {'lr': 0.0004848021215624904, 'samples': 3554304, 'steps': 18511, 'loss/train': 1.7735743522644043} -08/30/2021 16:33:36 - INFO - __main__ - Step 18513: {'lr': 0.0004848002994528543, 'samples': 3554496, 'steps': 18512, 'loss/train': 2.0425238609313965} -08/30/2021 16:33:36 - INFO - __main__ - Step 18514: {'lr': 0.0004847984772374209, 'samples': 3554688, 'steps': 18513, 'loss/train': 0.3305189907550812} -08/30/2021 16:33:37 - INFO - __main__ - Step 18515: {'lr': 0.0004847966549161909, 'samples': 3554880, 'steps': 18514, 'loss/train': 1.1372885704040527} -08/30/2021 16:33:37 - INFO - __main__ - Step 18516: {'lr': 0.0004847948324891651, 'samples': 3555072, 'steps': 18515, 'loss/train': 1.6787761449813843} -08/30/2021 16:33:37 - INFO - __main__ - Step 18517: {'lr': 0.00048479300995634447, 'samples': 3555264, 'steps': 18516, 'loss/train': 1.302175521850586} -08/30/2021 16:33:39 - INFO - __main__ - Step 18518: {'lr': 0.0004847911873177296, 'samples': 3555456, 'steps': 18517, 'loss/train': 2.0490682125091553} -08/30/2021 16:33:40 - INFO - __main__ - Step 18519: {'lr': 0.0004847893645733216, 'samples': 3555648, 'steps': 18518, 'loss/train': 2.500790596008301} -08/30/2021 16:33:40 - INFO - __main__ - Step 18520: {'lr': 0.000484787541723121, 'samples': 3555840, 'steps': 18519, 'loss/train': 0.8049459457397461} -08/30/2021 16:33:40 - INFO - __main__ - Step 18521: {'lr': 0.0004847857187671288, 'samples': 3556032, 'steps': 18520, 'loss/train': 2.2276804447174072} -08/30/2021 16:33:41 - INFO - __main__ - Step 18522: {'lr': 0.00048478389570534575, 'samples': 3556224, 'steps': 18521, 'loss/train': 1.3165028095245361} -08/30/2021 16:33:42 - INFO - __main__ - Step 18523: {'lr': 0.0004847820725377728, 'samples': 3556416, 'steps': 18522, 'loss/train': 1.5506622791290283} -08/30/2021 16:33:43 - INFO - __main__ - Step 18524: {'lr': 0.0004847802492644106, 'samples': 3556608, 'steps': 18523, 'loss/train': 1.2318246364593506} -08/30/2021 16:33:43 - INFO - __main__ - Step 18525: {'lr': 0.00048477842588526, 'samples': 3556800, 'steps': 18524, 'loss/train': 1.4588223695755005} -08/30/2021 16:33:43 - INFO - __main__ - Step 18526: {'lr': 0.000484776602400322, 'samples': 3556992, 'steps': 18525, 'loss/train': 1.276929259300232} -08/30/2021 16:33:44 - INFO - __main__ - Step 18527: {'lr': 0.00048477477880959715, 'samples': 3557184, 'steps': 18526, 'loss/train': 1.384444236755371} -08/30/2021 16:33:45 - INFO - __main__ - Step 18528: {'lr': 0.00048477295511308645, 'samples': 3557376, 'steps': 18527, 'loss/train': 1.8755440711975098} -08/30/2021 16:33:46 - INFO - __main__ - Step 18529: {'lr': 0.0004847711313107907, 'samples': 3557568, 'steps': 18528, 'loss/train': 2.0067262649536133} -08/30/2021 16:33:46 - INFO - __main__ - Step 18530: {'lr': 0.0004847693074027106, 'samples': 3557760, 'steps': 18529, 'loss/train': 1.3764686584472656} -08/30/2021 16:33:46 - INFO - __main__ - Step 18531: {'lr': 0.0004847674833888472, 'samples': 3557952, 'steps': 18530, 'loss/train': 1.5434719324111938} -08/30/2021 16:33:47 - INFO - __main__ - Step 18532: {'lr': 0.0004847656592692012, 'samples': 3558144, 'steps': 18531, 'loss/train': 1.7961565256118774} -08/30/2021 16:33:47 - INFO - __main__ - Step 18533: {'lr': 0.00048476383504377337, 'samples': 3558336, 'steps': 18532, 'loss/train': 0.9700822234153748} -08/30/2021 16:33:49 - INFO - __main__ - Step 18534: {'lr': 0.00048476201071256453, 'samples': 3558528, 'steps': 18533, 'loss/train': 1.6476198434829712} -08/30/2021 16:33:49 - INFO - __main__ - Step 18535: {'lr': 0.0004847601862755756, 'samples': 3558720, 'steps': 18534, 'loss/train': 1.9694432020187378} -08/30/2021 16:33:49 - INFO - __main__ - Step 18536: {'lr': 0.0004847583617328074, 'samples': 3558912, 'steps': 18535, 'loss/train': 2.1525583267211914} -08/30/2021 16:33:50 - INFO - __main__ - Step 18537: {'lr': 0.00048475653708426067, 'samples': 3559104, 'steps': 18536, 'loss/train': 1.294746994972229} -08/30/2021 16:33:50 - INFO - __main__ - Step 18538: {'lr': 0.00048475471232993625, 'samples': 3559296, 'steps': 18537, 'loss/train': 1.3839820623397827} -08/30/2021 16:33:52 - INFO - __main__ - Step 18539: {'lr': 0.000484752887469835, 'samples': 3559488, 'steps': 18538, 'loss/train': 0.8167545795440674} -08/30/2021 16:33:52 - INFO - __main__ - Step 18540: {'lr': 0.0004847510625039577, 'samples': 3559680, 'steps': 18539, 'loss/train': 2.311332941055298} -08/30/2021 16:33:52 - INFO - __main__ - Step 18541: {'lr': 0.00048474923743230513, 'samples': 3559872, 'steps': 18540, 'loss/train': 1.7084465026855469} -08/30/2021 16:33:53 - INFO - __main__ - Step 18542: {'lr': 0.0004847474122548783, 'samples': 3560064, 'steps': 18541, 'loss/train': 1.2706105709075928} -08/30/2021 16:33:53 - INFO - __main__ - Step 18543: {'lr': 0.00048474558697167783, 'samples': 3560256, 'steps': 18542, 'loss/train': 1.7960759401321411} -08/30/2021 16:33:54 - INFO - __main__ - Step 18544: {'lr': 0.0004847437615827046, 'samples': 3560448, 'steps': 18543, 'loss/train': 1.3301351070404053} -08/30/2021 16:33:55 - INFO - __main__ - Step 18545: {'lr': 0.0004847419360879596, 'samples': 3560640, 'steps': 18544, 'loss/train': 1.4916123151779175} -08/30/2021 16:33:55 - INFO - __main__ - Step 18546: {'lr': 0.00048474011048744336, 'samples': 3560832, 'steps': 18545, 'loss/train': 1.7456555366516113} -08/30/2021 16:33:56 - INFO - __main__ - Step 18547: {'lr': 0.0004847382847811569, 'samples': 3561024, 'steps': 18546, 'loss/train': 1.4895341396331787} -08/30/2021 16:33:56 - INFO - __main__ - Step 18548: {'lr': 0.00048473645896910094, 'samples': 3561216, 'steps': 18547, 'loss/train': 2.0263867378234863} -08/30/2021 16:33:58 - INFO - __main__ - Step 18549: {'lr': 0.0004847346330512764, 'samples': 3561408, 'steps': 18548, 'loss/train': 1.640236496925354} -08/30/2021 16:33:58 - INFO - __main__ - Step 18550: {'lr': 0.0004847328070276841, 'samples': 3561600, 'steps': 18549, 'loss/train': 1.829225778579712} -08/30/2021 16:33:58 - INFO - __main__ - Step 18551: {'lr': 0.00048473098089832475, 'samples': 3561792, 'steps': 18550, 'loss/train': 1.2299416065216064} -08/30/2021 16:33:59 - INFO - __main__ - Step 18552: {'lr': 0.0004847291546631992, 'samples': 3561984, 'steps': 18551, 'loss/train': 0.17121967673301697} -08/30/2021 16:33:59 - INFO - __main__ - Step 18553: {'lr': 0.0004847273283223084, 'samples': 3562176, 'steps': 18552, 'loss/train': 1.252171277999878} -08/30/2021 16:34:01 - INFO - __main__ - Step 18554: {'lr': 0.0004847255018756531, 'samples': 3562368, 'steps': 18553, 'loss/train': 1.419908046722412} -08/30/2021 16:34:01 - INFO - __main__ - Step 18555: {'lr': 0.0004847236753232341, 'samples': 3562560, 'steps': 18554, 'loss/train': 1.4968973398208618} -08/30/2021 16:34:01 - INFO - __main__ - Step 18556: {'lr': 0.0004847218486650522, 'samples': 3562752, 'steps': 18555, 'loss/train': 2.253539562225342} -08/30/2021 16:34:02 - INFO - __main__ - Step 18557: {'lr': 0.00048472002190110827, 'samples': 3562944, 'steps': 18556, 'loss/train': 1.9014835357666016} -08/30/2021 16:34:02 - INFO - __main__ - Step 18558: {'lr': 0.0004847181950314031, 'samples': 3563136, 'steps': 18557, 'loss/train': 1.7548178434371948} -08/30/2021 16:34:04 - INFO - __main__ - Step 18559: {'lr': 0.00048471636805593756, 'samples': 3563328, 'steps': 18558, 'loss/train': 1.438714861869812} -08/30/2021 16:34:04 - INFO - __main__ - Step 18560: {'lr': 0.0004847145409747125, 'samples': 3563520, 'steps': 18559, 'loss/train': 1.4307847023010254} -08/30/2021 16:34:04 - INFO - __main__ - Step 18561: {'lr': 0.00048471271378772857, 'samples': 3563712, 'steps': 18560, 'loss/train': 1.4135974645614624} -08/30/2021 16:34:05 - INFO - __main__ - Step 18562: {'lr': 0.00048471088649498675, 'samples': 3563904, 'steps': 18561, 'loss/train': 1.8708280324935913} -08/30/2021 16:34:05 - INFO - __main__ - Step 18563: {'lr': 0.0004847090590964879, 'samples': 3564096, 'steps': 18562, 'loss/train': 2.121454954147339} -08/30/2021 16:34:07 - INFO - __main__ - Step 18564: {'lr': 0.00048470723159223266, 'samples': 3564288, 'steps': 18563, 'loss/train': 1.6470462083816528} -08/30/2021 16:34:07 - INFO - __main__ - Step 18565: {'lr': 0.00048470540398222207, 'samples': 3564480, 'steps': 18564, 'loss/train': 2.0197346210479736} -08/30/2021 16:34:07 - INFO - __main__ - Step 18566: {'lr': 0.00048470357626645676, 'samples': 3564672, 'steps': 18565, 'loss/train': 1.9334089756011963} -08/30/2021 16:34:08 - INFO - __main__ - Step 18567: {'lr': 0.0004847017484449377, 'samples': 3564864, 'steps': 18566, 'loss/train': 1.6592752933502197} -08/30/2021 16:34:08 - INFO - __main__ - Step 18568: {'lr': 0.0004846999205176657, 'samples': 3565056, 'steps': 18567, 'loss/train': 1.9945423603057861} -08/30/2021 16:34:10 - INFO - __main__ - Step 18569: {'lr': 0.00048469809248464135, 'samples': 3565248, 'steps': 18568, 'loss/train': 1.9166946411132812} -08/30/2021 16:34:11 - INFO - __main__ - Step 18570: {'lr': 0.0004846962643458658, 'samples': 3565440, 'steps': 18569, 'loss/train': 1.3833893537521362} -08/30/2021 16:34:11 - INFO - __main__ - Step 18571: {'lr': 0.00048469443610133975, 'samples': 3565632, 'steps': 18570, 'loss/train': 1.9449726343154907} -08/30/2021 16:34:12 - INFO - __main__ - Step 18572: {'lr': 0.00048469260775106394, 'samples': 3565824, 'steps': 18571, 'loss/train': 0.8559990525245667} -08/30/2021 16:34:12 - INFO - __main__ - Step 18573: {'lr': 0.0004846907792950393, 'samples': 3566016, 'steps': 18572, 'loss/train': 1.033095121383667} -08/30/2021 16:34:12 - INFO - __main__ - Step 18574: {'lr': 0.00048468895073326663, 'samples': 3566208, 'steps': 18573, 'loss/train': 1.4956058263778687} -08/30/2021 16:34:14 - INFO - __main__ - Step 18575: {'lr': 0.0004846871220657467, 'samples': 3566400, 'steps': 18574, 'loss/train': 1.2601957321166992} -08/30/2021 16:34:14 - INFO - __main__ - Step 18576: {'lr': 0.0004846852932924804, 'samples': 3566592, 'steps': 18575, 'loss/train': 1.1903382539749146} -08/30/2021 16:34:15 - INFO - __main__ - Step 18577: {'lr': 0.00048468346441346853, 'samples': 3566784, 'steps': 18576, 'loss/train': 1.7406201362609863} -08/30/2021 16:34:15 - INFO - __main__ - Step 18578: {'lr': 0.0004846816354287119, 'samples': 3566976, 'steps': 18577, 'loss/train': 1.6070871353149414} -08/30/2021 16:34:15 - INFO - __main__ - Step 18579: {'lr': 0.0004846798063382114, 'samples': 3567168, 'steps': 18578, 'loss/train': 1.9260528087615967} -08/30/2021 16:34:17 - INFO - __main__ - Step 18580: {'lr': 0.0004846779771419677, 'samples': 3567360, 'steps': 18579, 'loss/train': 1.7920345067977905} -08/30/2021 16:34:17 - INFO - __main__ - Step 18581: {'lr': 0.0004846761478399818, 'samples': 3567552, 'steps': 18580, 'loss/train': 1.483244776725769} -08/30/2021 16:34:18 - INFO - __main__ - Step 18582: {'lr': 0.0004846743184322544, 'samples': 3567744, 'steps': 18581, 'loss/train': 1.7939437627792358} -08/30/2021 16:34:18 - INFO - __main__ - Step 18583: {'lr': 0.00048467248891878644, 'samples': 3567936, 'steps': 18582, 'loss/train': 1.690280795097351} -08/30/2021 16:34:18 - INFO - __main__ - Step 18584: {'lr': 0.00048467065929957867, 'samples': 3568128, 'steps': 18583, 'loss/train': 1.767741084098816} -08/30/2021 16:34:20 - INFO - __main__ - Step 18585: {'lr': 0.00048466882957463186, 'samples': 3568320, 'steps': 18584, 'loss/train': 0.10865940153598785} -08/30/2021 16:34:21 - INFO - __main__ - Step 18586: {'lr': 0.0004846669997439469, 'samples': 3568512, 'steps': 18585, 'loss/train': 1.2697912454605103} -08/30/2021 16:34:21 - INFO - __main__ - Step 18587: {'lr': 0.0004846651698075246, 'samples': 3568704, 'steps': 18586, 'loss/train': 1.837859869003296} -08/30/2021 16:34:22 - INFO - __main__ - Step 18588: {'lr': 0.00048466333976536594, 'samples': 3568896, 'steps': 18587, 'loss/train': 1.3561391830444336} -08/30/2021 16:34:22 - INFO - __main__ - Step 18589: {'lr': 0.0004846615096174715, 'samples': 3569088, 'steps': 18588, 'loss/train': 1.76717209815979} -08/30/2021 16:34:22 - INFO - __main__ - Step 18590: {'lr': 0.00048465967936384217, 'samples': 3569280, 'steps': 18589, 'loss/train': 1.7219301462173462} -08/30/2021 16:34:23 - INFO - __main__ - Step 18591: {'lr': 0.00048465784900447885, 'samples': 3569472, 'steps': 18590, 'loss/train': 5.92577600479126} -08/30/2021 16:34:24 - INFO - __main__ - Step 18592: {'lr': 0.00048465601853938224, 'samples': 3569664, 'steps': 18591, 'loss/train': 5.849154472351074} -08/30/2021 16:34:25 - INFO - __main__ - Step 18593: {'lr': 0.0004846541879685533, 'samples': 3569856, 'steps': 18592, 'loss/train': 1.7809295654296875} -08/30/2021 16:34:25 - INFO - __main__ - Step 18594: {'lr': 0.0004846523572919929, 'samples': 3570048, 'steps': 18593, 'loss/train': 1.50161874294281} -08/30/2021 16:34:25 - INFO - __main__ - Step 18595: {'lr': 0.00048465052650970166, 'samples': 3570240, 'steps': 18594, 'loss/train': 1.2964003086090088} -08/30/2021 16:34:26 - INFO - __main__ - Step 18596: {'lr': 0.00048464869562168055, 'samples': 3570432, 'steps': 18595, 'loss/train': 1.6343309879302979} -08/30/2021 16:34:27 - INFO - __main__ - Step 18597: {'lr': 0.0004846468646279304, 'samples': 3570624, 'steps': 18596, 'loss/train': 1.6104968786239624} -08/30/2021 16:34:28 - INFO - __main__ - Step 18598: {'lr': 0.0004846450335284519, 'samples': 3570816, 'steps': 18597, 'loss/train': 0.6221204400062561} -08/30/2021 16:34:28 - INFO - __main__ - Step 18599: {'lr': 0.00048464320232324604, 'samples': 3571008, 'steps': 18598, 'loss/train': 2.2074191570281982} -08/30/2021 16:34:28 - INFO - __main__ - Step 18600: {'lr': 0.00048464137101231355, 'samples': 3571200, 'steps': 18599, 'loss/train': 1.2850799560546875} -08/30/2021 16:34:29 - INFO - __main__ - Step 18601: {'lr': 0.0004846395395956553, 'samples': 3571392, 'steps': 18600, 'loss/train': 1.0383111238479614} -08/30/2021 16:34:30 - INFO - __main__ - Step 18602: {'lr': 0.00048463770807327206, 'samples': 3571584, 'steps': 18601, 'loss/train': 1.3161869049072266} -08/30/2021 16:34:30 - INFO - __main__ - Step 18603: {'lr': 0.00048463587644516473, 'samples': 3571776, 'steps': 18602, 'loss/train': 1.3902069330215454} -08/30/2021 16:34:31 - INFO - __main__ - Step 18604: {'lr': 0.00048463404471133404, 'samples': 3571968, 'steps': 18603, 'loss/train': 1.687749981880188} -08/30/2021 16:34:31 - INFO - __main__ - Step 18605: {'lr': 0.00048463221287178094, 'samples': 3572160, 'steps': 18604, 'loss/train': 1.7741122245788574} -08/30/2021 16:34:32 - INFO - __main__ - Step 18606: {'lr': 0.0004846303809265061, 'samples': 3572352, 'steps': 18605, 'loss/train': 1.8821640014648438} -08/30/2021 16:34:33 - INFO - __main__ - Step 18607: {'lr': 0.00048462854887551044, 'samples': 3572544, 'steps': 18606, 'loss/train': 1.5964727401733398} -08/30/2021 16:34:33 - INFO - __main__ - Step 18608: {'lr': 0.0004846267167187949, 'samples': 3572736, 'steps': 18607, 'loss/train': 1.278092861175537} -08/30/2021 16:34:34 - INFO - __main__ - Step 18609: {'lr': 0.00048462488445636005, 'samples': 3572928, 'steps': 18608, 'loss/train': 1.5015875101089478} -08/30/2021 16:34:34 - INFO - __main__ - Step 18610: {'lr': 0.0004846230520882069, 'samples': 3573120, 'steps': 18609, 'loss/train': 1.857212781906128} -08/30/2021 16:34:34 - INFO - __main__ - Step 18611: {'lr': 0.00048462121961433623, 'samples': 3573312, 'steps': 18610, 'loss/train': 1.809973120689392} -08/30/2021 16:34:35 - INFO - __main__ - Step 18612: {'lr': 0.00048461938703474886, 'samples': 3573504, 'steps': 18611, 'loss/train': 1.3722333908081055} -08/30/2021 16:34:36 - INFO - __main__ - Step 18613: {'lr': 0.00048461755434944554, 'samples': 3573696, 'steps': 18612, 'loss/train': 1.4379137754440308} -08/30/2021 16:34:37 - INFO - __main__ - Step 18614: {'lr': 0.00048461572155842725, 'samples': 3573888, 'steps': 18613, 'loss/train': 2.0803561210632324} -08/30/2021 16:34:37 - INFO - __main__ - Step 18615: {'lr': 0.00048461388866169474, 'samples': 3574080, 'steps': 18614, 'loss/train': 2.1274871826171875} -08/30/2021 16:34:38 - INFO - __main__ - Step 18616: {'lr': 0.00048461205565924884, 'samples': 3574272, 'steps': 18615, 'loss/train': 1.253926396369934} -08/30/2021 16:34:38 - INFO - __main__ - Step 18617: {'lr': 0.0004846102225510903, 'samples': 3574464, 'steps': 18616, 'loss/train': 1.4275085926055908} -08/30/2021 16:34:39 - INFO - __main__ - Step 18618: {'lr': 0.00048460838933722005, 'samples': 3574656, 'steps': 18617, 'loss/train': 1.5730656385421753} -08/30/2021 16:34:40 - INFO - __main__ - Step 18619: {'lr': 0.0004846065560176389, 'samples': 3574848, 'steps': 18618, 'loss/train': 1.208412528038025} -08/30/2021 16:34:40 - INFO - __main__ - Step 18620: {'lr': 0.00048460472259234764, 'samples': 3575040, 'steps': 18619, 'loss/train': 1.4797141551971436} -08/30/2021 16:34:41 - INFO - __main__ - Step 18621: {'lr': 0.0004846028890613471, 'samples': 3575232, 'steps': 18620, 'loss/train': 1.6955381631851196} -08/30/2021 16:34:41 - INFO - __main__ - Step 18622: {'lr': 0.00048460105542463805, 'samples': 3575424, 'steps': 18621, 'loss/train': 1.2728599309921265} -08/30/2021 16:34:42 - INFO - __main__ - Step 18623: {'lr': 0.00048459922168222146, 'samples': 3575616, 'steps': 18622, 'loss/train': 1.4494702816009521} -08/30/2021 16:34:43 - INFO - __main__ - Step 18624: {'lr': 0.00048459738783409814, 'samples': 3575808, 'steps': 18623, 'loss/train': 1.8204737901687622} -08/30/2021 16:34:43 - INFO - __main__ - Step 18625: {'lr': 0.0004845955538802688, 'samples': 3576000, 'steps': 18624, 'loss/train': 1.6453754901885986} -08/30/2021 16:34:44 - INFO - __main__ - Step 18626: {'lr': 0.0004845937198207343, 'samples': 3576192, 'steps': 18625, 'loss/train': 1.7081118822097778} -08/30/2021 16:34:44 - INFO - __main__ - Step 18627: {'lr': 0.0004845918856554955, 'samples': 3576384, 'steps': 18626, 'loss/train': 1.1042102575302124} -08/30/2021 16:34:46 - INFO - __main__ - Step 18628: {'lr': 0.00048459005138455326, 'samples': 3576576, 'steps': 18627, 'loss/train': 1.6801420450210571} -08/30/2021 16:34:46 - INFO - __main__ - Step 18629: {'lr': 0.0004845882170079083, 'samples': 3576768, 'steps': 18628, 'loss/train': 2.0579943656921387} -08/30/2021 16:34:47 - INFO - __main__ - Step 18630: {'lr': 0.00048458638252556153, 'samples': 3576960, 'steps': 18629, 'loss/train': 1.502411127090454} -08/30/2021 16:34:47 - INFO - __main__ - Step 18631: {'lr': 0.0004845845479375138, 'samples': 3577152, 'steps': 18630, 'loss/train': 1.7819527387619019} -08/30/2021 16:34:47 - INFO - __main__ - Step 18632: {'lr': 0.00048458271324376586, 'samples': 3577344, 'steps': 18631, 'loss/train': 1.3876886367797852} -08/30/2021 16:34:49 - INFO - __main__ - Step 18633: {'lr': 0.0004845808784443185, 'samples': 3577536, 'steps': 18632, 'loss/train': 1.173553466796875} -08/30/2021 16:34:49 - INFO - __main__ - Step 18634: {'lr': 0.00048457904353917277, 'samples': 3577728, 'steps': 18633, 'loss/train': 2.2251369953155518} -08/30/2021 16:34:50 - INFO - __main__ - Step 18635: {'lr': 0.0004845772085283292, 'samples': 3577920, 'steps': 18634, 'loss/train': 1.0557796955108643} -08/30/2021 16:34:50 - INFO - __main__ - Step 18636: {'lr': 0.00048457537341178885, 'samples': 3578112, 'steps': 18635, 'loss/train': 1.8288823366165161} -08/30/2021 16:34:51 - INFO - __main__ - Step 18637: {'lr': 0.0004845735381895524, 'samples': 3578304, 'steps': 18636, 'loss/train': 1.7181144952774048} -08/30/2021 16:34:52 - INFO - __main__ - Step 18638: {'lr': 0.0004845717028616208, 'samples': 3578496, 'steps': 18637, 'loss/train': 0.7587200999259949} -08/30/2021 16:34:53 - INFO - __main__ - Step 18639: {'lr': 0.00048456986742799474, 'samples': 3578688, 'steps': 18638, 'loss/train': 1.7869253158569336} -08/30/2021 16:34:53 - INFO - __main__ - Step 18640: {'lr': 0.00048456803188867513, 'samples': 3578880, 'steps': 18639, 'loss/train': 1.3770478963851929} -08/30/2021 16:34:53 - INFO - __main__ - Step 18641: {'lr': 0.00048456619624366284, 'samples': 3579072, 'steps': 18640, 'loss/train': 1.5366994142532349} -08/30/2021 16:34:54 - INFO - __main__ - Step 18642: {'lr': 0.0004845643604929586, 'samples': 3579264, 'steps': 18641, 'loss/train': 1.6829020977020264} -08/30/2021 16:34:55 - INFO - __main__ - Step 18643: {'lr': 0.00048456252463656326, 'samples': 3579456, 'steps': 18642, 'loss/train': 1.63473379611969} -08/30/2021 16:34:56 - INFO - __main__ - Step 18644: {'lr': 0.00048456068867447767, 'samples': 3579648, 'steps': 18643, 'loss/train': 1.4576683044433594} -08/30/2021 16:34:56 - INFO - __main__ - Step 18645: {'lr': 0.0004845588526067027, 'samples': 3579840, 'steps': 18644, 'loss/train': 1.4982426166534424} -08/30/2021 16:34:56 - INFO - __main__ - Step 18646: {'lr': 0.00048455701643323914, 'samples': 3580032, 'steps': 18645, 'loss/train': 1.80778169631958} -08/30/2021 16:34:57 - INFO - __main__ - Step 18647: {'lr': 0.00048455518015408773, 'samples': 3580224, 'steps': 18646, 'loss/train': 1.5563485622406006} -08/30/2021 16:34:59 - INFO - __main__ - Step 18648: {'lr': 0.00048455334376924943, 'samples': 3580416, 'steps': 18647, 'loss/train': 1.4022586345672607} -08/30/2021 16:34:59 - INFO - __main__ - Step 18649: {'lr': 0.000484551507278725, 'samples': 3580608, 'steps': 18648, 'loss/train': 1.4820568561553955} -08/30/2021 16:35:00 - INFO - __main__ - Step 18650: {'lr': 0.0004845496706825152, 'samples': 3580800, 'steps': 18649, 'loss/train': 0.0739121288061142} -08/30/2021 16:35:00 - INFO - __main__ - Step 18651: {'lr': 0.0004845478339806211, 'samples': 3580992, 'steps': 18650, 'loss/train': 0.09882553666830063} -08/30/2021 16:35:00 - INFO - __main__ - Step 18652: {'lr': 0.00048454599717304327, 'samples': 3581184, 'steps': 18651, 'loss/train': 1.7683773040771484} -08/30/2021 16:35:01 - INFO - __main__ - Step 18653: {'lr': 0.0004845441602597826, 'samples': 3581376, 'steps': 18652, 'loss/train': 2.580165386199951} -08/30/2021 16:35:01 - INFO - __main__ - Step 18654: {'lr': 0.00048454232324084004, 'samples': 3581568, 'steps': 18653, 'loss/train': 2.1176917552948} -08/30/2021 16:35:03 - INFO - __main__ - Step 18655: {'lr': 0.0004845404861162163, 'samples': 3581760, 'steps': 18654, 'loss/train': 2.0859687328338623} -08/30/2021 16:35:03 - INFO - __main__ - Step 18656: {'lr': 0.00048453864888591214, 'samples': 3581952, 'steps': 18655, 'loss/train': 2.2482786178588867} -08/30/2021 16:35:04 - INFO - __main__ - Step 18657: {'lr': 0.0004845368115499286, 'samples': 3582144, 'steps': 18656, 'loss/train': 1.875685214996338} -08/30/2021 16:35:04 - INFO - __main__ - Step 18658: {'lr': 0.0004845349741082663, 'samples': 3582336, 'steps': 18657, 'loss/train': 1.0968303680419922} -08/30/2021 16:35:04 - INFO - __main__ - Step 18659: {'lr': 0.00048453313656092624, 'samples': 3582528, 'steps': 18658, 'loss/train': 1.6515830755233765} -08/30/2021 16:35:05 - INFO - __main__ - Step 18660: {'lr': 0.0004845312989079091, 'samples': 3582720, 'steps': 18659, 'loss/train': 1.2533869743347168} -08/30/2021 16:35:06 - INFO - __main__ - Step 18661: {'lr': 0.0004845294611492158, 'samples': 3582912, 'steps': 18660, 'loss/train': 0.9937903881072998} -08/30/2021 16:35:07 - INFO - __main__ - Step 18662: {'lr': 0.00048452762328484724, 'samples': 3583104, 'steps': 18661, 'loss/train': 0.3184073567390442} -08/30/2021 16:35:07 - INFO - __main__ - Step 18663: {'lr': 0.000484525785314804, 'samples': 3583296, 'steps': 18662, 'loss/train': 1.3504564762115479} -08/30/2021 16:35:07 - INFO - __main__ - Step 18664: {'lr': 0.0004845239472390872, 'samples': 3583488, 'steps': 18663, 'loss/train': 1.2113533020019531} -08/30/2021 16:35:08 - INFO - __main__ - Step 18665: {'lr': 0.0004845221090576974, 'samples': 3583680, 'steps': 18664, 'loss/train': 1.6577436923980713} -08/30/2021 16:35:09 - INFO - __main__ - Step 18666: {'lr': 0.0004845202707706356, 'samples': 3583872, 'steps': 18665, 'loss/train': 2.0766139030456543} -08/30/2021 16:35:09 - INFO - __main__ - Step 18667: {'lr': 0.0004845184323779026, 'samples': 3584064, 'steps': 18666, 'loss/train': 1.9564974308013916} -08/30/2021 16:35:10 - INFO - __main__ - Step 18668: {'lr': 0.0004845165938794992, 'samples': 3584256, 'steps': 18667, 'loss/train': 1.630800485610962} -08/30/2021 16:35:10 - INFO - __main__ - Step 18669: {'lr': 0.0004845147552754263, 'samples': 3584448, 'steps': 18668, 'loss/train': 1.7552801370620728} -08/30/2021 16:35:10 - INFO - __main__ - Step 18670: {'lr': 0.0004845129165656846, 'samples': 3584640, 'steps': 18669, 'loss/train': 1.6562836170196533} -08/30/2021 16:35:12 - INFO - __main__ - Step 18671: {'lr': 0.00048451107775027505, 'samples': 3584832, 'steps': 18670, 'loss/train': 1.9035931825637817} -08/30/2021 16:35:12 - INFO - __main__ - Step 18672: {'lr': 0.0004845092388291984, 'samples': 3585024, 'steps': 18671, 'loss/train': 1.4335185289382935} -08/30/2021 16:35:13 - INFO - __main__ - Step 18673: {'lr': 0.0004845073998024555, 'samples': 3585216, 'steps': 18672, 'loss/train': 1.2621657848358154} -08/30/2021 16:35:13 - INFO - __main__ - Step 18674: {'lr': 0.0004845055606700472, 'samples': 3585408, 'steps': 18673, 'loss/train': 1.5613656044006348} -08/30/2021 16:35:13 - INFO - __main__ - Step 18675: {'lr': 0.0004845037214319743, 'samples': 3585600, 'steps': 18674, 'loss/train': 1.5874727964401245} -08/30/2021 16:35:15 - INFO - __main__ - Step 18676: {'lr': 0.00048450188208823766, 'samples': 3585792, 'steps': 18675, 'loss/train': 0.40764713287353516} -08/30/2021 16:35:15 - INFO - __main__ - Step 18677: {'lr': 0.00048450004263883806, 'samples': 3585984, 'steps': 18676, 'loss/train': 1.5625742673873901} -08/30/2021 16:35:16 - INFO - __main__ - Step 18678: {'lr': 0.00048449820308377634, 'samples': 3586176, 'steps': 18677, 'loss/train': 1.9346193075180054} -08/30/2021 16:35:16 - INFO - __main__ - Step 18679: {'lr': 0.00048449636342305343, 'samples': 3586368, 'steps': 18678, 'loss/train': 1.4314703941345215} -08/30/2021 16:35:16 - INFO - __main__ - Step 18680: {'lr': 0.00048449452365667003, 'samples': 3586560, 'steps': 18679, 'loss/train': 1.5792099237442017} -08/30/2021 16:35:19 - INFO - __main__ - Step 18681: {'lr': 0.00048449268378462695, 'samples': 3586752, 'steps': 18680, 'loss/train': 1.8770092725753784} -08/30/2021 16:35:20 - INFO - __main__ - Step 18682: {'lr': 0.00048449084380692523, 'samples': 3586944, 'steps': 18681, 'loss/train': 1.610478162765503} -08/30/2021 16:35:20 - INFO - __main__ - Step 18683: {'lr': 0.0004844890037235654, 'samples': 3587136, 'steps': 18682, 'loss/train': 1.8821977376937866} -08/30/2021 16:35:20 - INFO - __main__ - Step 18684: {'lr': 0.00048448716353454856, 'samples': 3587328, 'steps': 18683, 'loss/train': 3.1390202045440674} -08/30/2021 16:35:21 - INFO - __main__ - Step 18685: {'lr': 0.0004844853232398754, 'samples': 3587520, 'steps': 18684, 'loss/train': 3.5587410926818848} -08/30/2021 16:35:21 - INFO - __main__ - Step 18686: {'lr': 0.00048448348283954674, 'samples': 3587712, 'steps': 18685, 'loss/train': 1.690757155418396} -08/30/2021 16:35:22 - INFO - __main__ - Step 18687: {'lr': 0.00048448164233356344, 'samples': 3587904, 'steps': 18686, 'loss/train': 2.143714427947998} -08/30/2021 16:35:23 - INFO - __main__ - Step 18688: {'lr': 0.0004844798017219264, 'samples': 3588096, 'steps': 18687, 'loss/train': 1.801722764968872} -08/30/2021 16:35:23 - INFO - __main__ - Step 18689: {'lr': 0.00048447796100463625, 'samples': 3588288, 'steps': 18688, 'loss/train': 2.230644941329956} -08/30/2021 16:35:24 - INFO - __main__ - Step 18690: {'lr': 0.0004844761201816941, 'samples': 3588480, 'steps': 18689, 'loss/train': 1.5586072206497192} -08/30/2021 16:35:24 - INFO - __main__ - Step 18691: {'lr': 0.0004844742792531005, 'samples': 3588672, 'steps': 18690, 'loss/train': 1.4849650859832764} -08/30/2021 16:35:24 - INFO - __main__ - Step 18692: {'lr': 0.00048447243821885644, 'samples': 3588864, 'steps': 18691, 'loss/train': 1.0598472356796265} -08/30/2021 16:35:26 - INFO - __main__ - Step 18693: {'lr': 0.0004844705970789628, 'samples': 3589056, 'steps': 18692, 'loss/train': 1.4825066328048706} -08/30/2021 16:35:26 - INFO - __main__ - Step 18694: {'lr': 0.0004844687558334202, 'samples': 3589248, 'steps': 18693, 'loss/train': 1.6356847286224365} -08/30/2021 16:35:27 - INFO - __main__ - Step 18695: {'lr': 0.0004844669144822297, 'samples': 3589440, 'steps': 18694, 'loss/train': 2.0778491497039795} -08/30/2021 16:35:27 - INFO - __main__ - Step 18696: {'lr': 0.000484465073025392, 'samples': 3589632, 'steps': 18695, 'loss/train': 1.254042148590088} -08/30/2021 16:35:27 - INFO - __main__ - Step 18697: {'lr': 0.00048446323146290795, 'samples': 3589824, 'steps': 18696, 'loss/train': 2.0559182167053223} -08/30/2021 16:35:29 - INFO - __main__ - Step 18698: {'lr': 0.0004844613897947784, 'samples': 3590016, 'steps': 18697, 'loss/train': 1.9842222929000854} -08/30/2021 16:35:29 - INFO - __main__ - Step 18699: {'lr': 0.00048445954802100414, 'samples': 3590208, 'steps': 18698, 'loss/train': 1.610824704170227} -08/30/2021 16:35:30 - INFO - __main__ - Step 18700: {'lr': 0.000484457706141586, 'samples': 3590400, 'steps': 18699, 'loss/train': 1.5430368185043335} -08/30/2021 16:35:30 - INFO - __main__ - Step 18701: {'lr': 0.0004844558641565249, 'samples': 3590592, 'steps': 18700, 'loss/train': 1.5543664693832397} -08/30/2021 16:35:30 - INFO - __main__ - Step 18702: {'lr': 0.00048445402206582155, 'samples': 3590784, 'steps': 18701, 'loss/train': 1.8709467649459839} -08/30/2021 16:35:32 - INFO - __main__ - Step 18703: {'lr': 0.0004844521798694768, 'samples': 3590976, 'steps': 18702, 'loss/train': 1.660312294960022} -08/30/2021 16:35:32 - INFO - __main__ - Step 18704: {'lr': 0.0004844503375674916, 'samples': 3591168, 'steps': 18703, 'loss/train': 1.8360676765441895} -08/30/2021 16:35:33 - INFO - __main__ - Step 18705: {'lr': 0.0004844484951598667, 'samples': 3591360, 'steps': 18704, 'loss/train': 1.815129280090332} -08/30/2021 16:35:33 - INFO - __main__ - Step 18706: {'lr': 0.00048444665264660286, 'samples': 3591552, 'steps': 18705, 'loss/train': 0.14327189326286316} -08/30/2021 16:35:33 - INFO - __main__ - Step 18707: {'lr': 0.000484444810027701, 'samples': 3591744, 'steps': 18706, 'loss/train': 1.789504051208496} -08/30/2021 16:35:35 - INFO - __main__ - Step 18708: {'lr': 0.00048444296730316196, 'samples': 3591936, 'steps': 18707, 'loss/train': 1.9275892972946167} -08/30/2021 16:35:35 - INFO - __main__ - Step 18709: {'lr': 0.0004844411244729865, 'samples': 3592128, 'steps': 18708, 'loss/train': 2.6028988361358643} -08/30/2021 16:35:36 - INFO - __main__ - Step 18710: {'lr': 0.00048443928153717555, 'samples': 3592320, 'steps': 18709, 'loss/train': 1.8521556854248047} -08/30/2021 16:35:36 - INFO - __main__ - Step 18711: {'lr': 0.00048443743849572974, 'samples': 3592512, 'steps': 18710, 'loss/train': 1.3215727806091309} -08/30/2021 16:35:36 - INFO - __main__ - Step 18712: {'lr': 0.00048443559534865017, 'samples': 3592704, 'steps': 18711, 'loss/train': 1.9808443784713745} -08/30/2021 16:35:37 - INFO - __main__ - Step 18713: {'lr': 0.0004844337520959375, 'samples': 3592896, 'steps': 18712, 'loss/train': 1.8047269582748413} -08/30/2021 16:35:39 - INFO - __main__ - Step 18714: {'lr': 0.00048443190873759256, 'samples': 3593088, 'steps': 18713, 'loss/train': 1.957062005996704} -08/30/2021 16:35:39 - INFO - __main__ - Step 18715: {'lr': 0.00048443006527361626, 'samples': 3593280, 'steps': 18714, 'loss/train': 1.7376261949539185} -08/30/2021 16:35:40 - INFO - __main__ - Step 18716: {'lr': 0.0004844282217040094, 'samples': 3593472, 'steps': 18715, 'loss/train': 1.8164899349212646} -08/30/2021 16:35:40 - INFO - __main__ - Step 18717: {'lr': 0.00048442637802877277, 'samples': 3593664, 'steps': 18716, 'loss/train': 0.22864291071891785} -08/30/2021 16:35:40 - INFO - __main__ - Step 18718: {'lr': 0.0004844245342479072, 'samples': 3593856, 'steps': 18717, 'loss/train': 1.6635072231292725} -08/30/2021 16:35:41 - INFO - __main__ - Step 18719: {'lr': 0.00048442269036141363, 'samples': 3594048, 'steps': 18718, 'loss/train': 1.2503526210784912} -08/30/2021 16:35:42 - INFO - __main__ - Step 18720: {'lr': 0.0004844208463692928, 'samples': 3594240, 'steps': 18719, 'loss/train': 0.14091970026493073} -08/30/2021 16:35:43 - INFO - __main__ - Step 18721: {'lr': 0.00048441900227154557, 'samples': 3594432, 'steps': 18720, 'loss/train': 1.1688940525054932} -08/30/2021 16:35:43 - INFO - __main__ - Step 18722: {'lr': 0.00048441715806817265, 'samples': 3594624, 'steps': 18721, 'loss/train': 1.5595972537994385} -08/30/2021 16:35:43 - INFO - __main__ - Step 18723: {'lr': 0.0004844153137591751, 'samples': 3594816, 'steps': 18722, 'loss/train': 2.0275187492370605} -08/30/2021 16:35:44 - INFO - __main__ - Step 18724: {'lr': 0.00048441346934455356, 'samples': 3595008, 'steps': 18723, 'loss/train': 1.7118854522705078} -08/30/2021 16:35:45 - INFO - __main__ - Step 18725: {'lr': 0.0004844116248243089, 'samples': 3595200, 'steps': 18724, 'loss/train': 1.8899564743041992} -08/30/2021 16:35:46 - INFO - __main__ - Step 18726: {'lr': 0.0004844097801984421, 'samples': 3595392, 'steps': 18725, 'loss/train': 1.701796054840088} -08/30/2021 16:35:46 - INFO - __main__ - Step 18727: {'lr': 0.0004844079354669537, 'samples': 3595584, 'steps': 18726, 'loss/train': 1.674830675125122} -08/30/2021 16:35:46 - INFO - __main__ - Step 18728: {'lr': 0.0004844060906298448, 'samples': 3595776, 'steps': 18727, 'loss/train': 2.0198514461517334} -08/30/2021 16:35:47 - INFO - __main__ - Step 18729: {'lr': 0.0004844042456871162, 'samples': 3595968, 'steps': 18728, 'loss/train': 1.8553674221038818} -08/30/2021 16:35:48 - INFO - __main__ - Step 18730: {'lr': 0.0004844024006387685, 'samples': 3596160, 'steps': 18729, 'loss/train': 1.6953486204147339} -08/30/2021 16:35:49 - INFO - __main__ - Step 18731: {'lr': 0.00048440055548480275, 'samples': 3596352, 'steps': 18730, 'loss/train': 1.5249199867248535} -08/30/2021 16:35:49 - INFO - __main__ - Step 18732: {'lr': 0.0004843987102252198, 'samples': 3596544, 'steps': 18731, 'loss/train': 1.6466822624206543} -08/30/2021 16:35:49 - INFO - __main__ - Step 18733: {'lr': 0.0004843968648600204, 'samples': 3596736, 'steps': 18732, 'loss/train': 1.4004868268966675} -08/30/2021 16:35:50 - INFO - __main__ - Step 18734: {'lr': 0.00048439501938920534, 'samples': 3596928, 'steps': 18733, 'loss/train': 1.815832495689392} -08/30/2021 16:35:51 - INFO - __main__ - Step 18735: {'lr': 0.0004843931738127755, 'samples': 3597120, 'steps': 18734, 'loss/train': 1.5569733381271362} -08/30/2021 16:35:52 - INFO - __main__ - Step 18736: {'lr': 0.0004843913281307317, 'samples': 3597312, 'steps': 18735, 'loss/train': 1.4122766256332397} -08/30/2021 16:35:52 - INFO - __main__ - Step 18737: {'lr': 0.0004843894823430749, 'samples': 3597504, 'steps': 18736, 'loss/train': 1.5067040920257568} -08/30/2021 16:35:52 - INFO - __main__ - Step 18738: {'lr': 0.00048438763644980564, 'samples': 3597696, 'steps': 18737, 'loss/train': 1.0526565313339233} -08/30/2021 16:35:53 - INFO - __main__ - Step 18739: {'lr': 0.0004843857904509251, 'samples': 3597888, 'steps': 18738, 'loss/train': 1.0327776670455933} -08/30/2021 16:35:55 - INFO - __main__ - Step 18740: {'lr': 0.00048438394434643386, 'samples': 3598080, 'steps': 18739, 'loss/train': 2.21777081489563} -08/30/2021 16:35:55 - INFO - __main__ - Step 18741: {'lr': 0.0004843820981363328, 'samples': 3598272, 'steps': 18740, 'loss/train': 1.4588394165039062} -08/30/2021 16:35:55 - INFO - __main__ - Step 18742: {'lr': 0.00048438025182062286, 'samples': 3598464, 'steps': 18741, 'loss/train': 1.724167823791504} -08/30/2021 16:35:56 - INFO - __main__ - Step 18743: {'lr': 0.00048437840539930466, 'samples': 3598656, 'steps': 18742, 'loss/train': 1.81268310546875} -08/30/2021 16:35:56 - INFO - __main__ - Step 18744: {'lr': 0.0004843765588723793, 'samples': 3598848, 'steps': 18743, 'loss/train': 1.3539683818817139} -08/30/2021 16:35:57 - INFO - __main__ - Step 18745: {'lr': 0.00048437471223984743, 'samples': 3599040, 'steps': 18744, 'loss/train': 2.382828712463379} -08/30/2021 16:35:58 - INFO - __main__ - Step 18746: {'lr': 0.00048437286550170996, 'samples': 3599232, 'steps': 18745, 'loss/train': 2.2191319465637207} -08/30/2021 16:35:58 - INFO - __main__ - Step 18747: {'lr': 0.00048437101865796763, 'samples': 3599424, 'steps': 18746, 'loss/train': 1.140054702758789} -08/30/2021 16:35:59 - INFO - __main__ - Step 18748: {'lr': 0.0004843691717086214, 'samples': 3599616, 'steps': 18747, 'loss/train': 1.7695509195327759} -08/30/2021 16:35:59 - INFO - __main__ - Step 18749: {'lr': 0.000484367324653672, 'samples': 3599808, 'steps': 18748, 'loss/train': 1.8163909912109375} -08/30/2021 16:36:00 - INFO - __main__ - Step 18750: {'lr': 0.0004843654774931203, 'samples': 3600000, 'steps': 18749, 'loss/train': 1.4683212041854858} -08/30/2021 16:36:01 - INFO - __main__ - Step 18751: {'lr': 0.00048436363022696715, 'samples': 3600192, 'steps': 18750, 'loss/train': 1.4695026874542236} -08/30/2021 16:36:01 - INFO - __main__ - Step 18752: {'lr': 0.0004843617828552134, 'samples': 3600384, 'steps': 18751, 'loss/train': 2.245600938796997} -08/30/2021 16:36:02 - INFO - __main__ - Step 18753: {'lr': 0.00048435993537785976, 'samples': 3600576, 'steps': 18752, 'loss/train': 2.03971266746521} -08/30/2021 16:36:02 - INFO - __main__ - Step 18754: {'lr': 0.0004843580877949072, 'samples': 3600768, 'steps': 18753, 'loss/train': 1.674576997756958} -08/30/2021 16:36:02 - INFO - __main__ - Step 18755: {'lr': 0.0004843562401063565, 'samples': 3600960, 'steps': 18754, 'loss/train': 1.3875715732574463} -08/30/2021 16:36:04 - INFO - __main__ - Step 18756: {'lr': 0.0004843543923122085, 'samples': 3601152, 'steps': 18755, 'loss/train': 1.7169502973556519} -08/30/2021 16:36:04 - INFO - __main__ - Step 18757: {'lr': 0.000484352544412464, 'samples': 3601344, 'steps': 18756, 'loss/train': 2.0435969829559326} -08/30/2021 16:36:05 - INFO - __main__ - Step 18758: {'lr': 0.0004843506964071239, 'samples': 3601536, 'steps': 18757, 'loss/train': 1.4638701677322388} -08/30/2021 16:36:05 - INFO - __main__ - Step 18759: {'lr': 0.000484348848296189, 'samples': 3601728, 'steps': 18758, 'loss/train': 1.5171616077423096} -08/30/2021 16:36:05 - INFO - __main__ - Step 18760: {'lr': 0.00048434700007966006, 'samples': 3601920, 'steps': 18759, 'loss/train': 1.8144410848617554} -08/30/2021 16:36:07 - INFO - __main__ - Step 18761: {'lr': 0.000484345151757538, 'samples': 3602112, 'steps': 18760, 'loss/train': 1.88290536403656} -08/30/2021 16:36:08 - INFO - __main__ - Step 18762: {'lr': 0.0004843433033298237, 'samples': 3602304, 'steps': 18761, 'loss/train': 1.8810815811157227} -08/30/2021 16:36:08 - INFO - __main__ - Step 18763: {'lr': 0.00048434145479651783, 'samples': 3602496, 'steps': 18762, 'loss/train': 1.4046201705932617} -08/30/2021 16:36:08 - INFO - __main__ - Step 18764: {'lr': 0.00048433960615762136, 'samples': 3602688, 'steps': 18763, 'loss/train': 1.8820677995681763} -08/30/2021 16:36:09 - INFO - __main__ - Step 18765: {'lr': 0.0004843377574131351, 'samples': 3602880, 'steps': 18764, 'loss/train': 1.4780255556106567} -08/30/2021 16:36:10 - INFO - __main__ - Step 18766: {'lr': 0.0004843359085630598, 'samples': 3603072, 'steps': 18765, 'loss/train': 1.659212350845337} -08/30/2021 16:36:11 - INFO - __main__ - Step 18767: {'lr': 0.0004843340596073964, 'samples': 3603264, 'steps': 18766, 'loss/train': 1.403775691986084} -08/30/2021 16:36:11 - INFO - __main__ - Step 18768: {'lr': 0.0004843322105461457, 'samples': 3603456, 'steps': 18767, 'loss/train': 1.7835924625396729} -08/30/2021 16:36:11 - INFO - __main__ - Step 18769: {'lr': 0.0004843303613793085, 'samples': 3603648, 'steps': 18768, 'loss/train': 1.0598496198654175} -08/30/2021 16:36:12 - INFO - __main__ - Step 18770: {'lr': 0.00048432851210688567, 'samples': 3603840, 'steps': 18769, 'loss/train': 1.6672589778900146} -08/30/2021 16:36:13 - INFO - __main__ - Step 18771: {'lr': 0.00048432666272887805, 'samples': 3604032, 'steps': 18770, 'loss/train': 2.340057849884033} -08/30/2021 16:36:13 - INFO - __main__ - Step 18772: {'lr': 0.0004843248132452864, 'samples': 3604224, 'steps': 18771, 'loss/train': 1.585218071937561} -08/30/2021 16:36:14 - INFO - __main__ - Step 18773: {'lr': 0.0004843229636561116, 'samples': 3604416, 'steps': 18772, 'loss/train': 1.4477012157440186} -08/30/2021 16:36:14 - INFO - __main__ - Step 18774: {'lr': 0.00048432111396135447, 'samples': 3604608, 'steps': 18773, 'loss/train': 1.6103549003601074} -08/30/2021 16:36:15 - INFO - __main__ - Step 18775: {'lr': 0.0004843192641610159, 'samples': 3604800, 'steps': 18774, 'loss/train': 1.2788995504379272} -08/30/2021 16:36:16 - INFO - __main__ - Step 18776: {'lr': 0.00048431741425509676, 'samples': 3604992, 'steps': 18775, 'loss/train': 1.5461417436599731} -08/30/2021 16:36:16 - INFO - __main__ - Step 18777: {'lr': 0.0004843155642435977, 'samples': 3605184, 'steps': 18776, 'loss/train': 2.0165276527404785} -08/30/2021 16:36:17 - INFO - __main__ - Step 18778: {'lr': 0.0004843137141265197, 'samples': 3605376, 'steps': 18777, 'loss/train': 1.8745001554489136} -08/30/2021 16:36:17 - INFO - __main__ - Step 18779: {'lr': 0.00048431186390386356, 'samples': 3605568, 'steps': 18778, 'loss/train': 1.5030087232589722} -08/30/2021 16:36:18 - INFO - __main__ - Step 18780: {'lr': 0.0004843100135756301, 'samples': 3605760, 'steps': 18779, 'loss/train': 2.11687970161438} -08/30/2021 16:36:18 - INFO - __main__ - Step 18781: {'lr': 0.0004843081631418202, 'samples': 3605952, 'steps': 18780, 'loss/train': 2.195359945297241} -08/30/2021 16:36:19 - INFO - __main__ - Step 18782: {'lr': 0.00048430631260243465, 'samples': 3606144, 'steps': 18781, 'loss/train': 1.9703930616378784} -08/30/2021 16:36:20 - INFO - __main__ - Step 18783: {'lr': 0.00048430446195747424, 'samples': 3606336, 'steps': 18782, 'loss/train': 1.436973214149475} -08/30/2021 16:36:20 - INFO - __main__ - Step 18784: {'lr': 0.00048430261120693986, 'samples': 3606528, 'steps': 18783, 'loss/train': 1.4219201803207397} -08/30/2021 16:36:21 - INFO - __main__ - Step 18785: {'lr': 0.0004843007603508324, 'samples': 3606720, 'steps': 18784, 'loss/train': 1.6902960538864136} -08/30/2021 16:36:21 - INFO - __main__ - Step 18786: {'lr': 0.00048429890938915255, 'samples': 3606912, 'steps': 18785, 'loss/train': 1.467069387435913} -08/30/2021 16:36:22 - INFO - __main__ - Step 18787: {'lr': 0.0004842970583219013, 'samples': 3607104, 'steps': 18786, 'loss/train': 1.503032922744751} -08/30/2021 16:36:23 - INFO - __main__ - Step 18788: {'lr': 0.0004842952071490794, 'samples': 3607296, 'steps': 18787, 'loss/train': 1.3325965404510498} -08/30/2021 16:36:23 - INFO - __main__ - Step 18789: {'lr': 0.0004842933558706877, 'samples': 3607488, 'steps': 18788, 'loss/train': 1.8448175191879272} -08/30/2021 16:36:24 - INFO - __main__ - Step 18790: {'lr': 0.000484291504486727, 'samples': 3607680, 'steps': 18789, 'loss/train': 1.696388602256775} -08/30/2021 16:36:24 - INFO - __main__ - Step 18791: {'lr': 0.0004842896529971982, 'samples': 3607872, 'steps': 18790, 'loss/train': 1.762611746788025} -08/30/2021 16:36:26 - INFO - __main__ - Step 18792: {'lr': 0.00048428780140210204, 'samples': 3608064, 'steps': 18791, 'loss/train': 1.8964207172393799} -08/30/2021 16:36:27 - INFO - __main__ - Step 18793: {'lr': 0.0004842859497014394, 'samples': 3608256, 'steps': 18792, 'loss/train': 1.6959890127182007} -08/30/2021 16:36:27 - INFO - __main__ - Step 18794: {'lr': 0.0004842840978952112, 'samples': 3608448, 'steps': 18793, 'loss/train': 0.7731893658638} -08/30/2021 16:36:27 - INFO - __main__ - Step 18795: {'lr': 0.00048428224598341815, 'samples': 3608640, 'steps': 18794, 'loss/train': 1.503921389579773} -08/30/2021 16:36:28 - INFO - __main__ - Step 18796: {'lr': 0.0004842803939660612, 'samples': 3608832, 'steps': 18795, 'loss/train': 1.7576403617858887} -08/30/2021 16:36:29 - INFO - __main__ - Step 18797: {'lr': 0.00048427854184314103, 'samples': 3609024, 'steps': 18796, 'loss/train': 1.324228286743164} -08/30/2021 16:36:30 - INFO - __main__ - Step 18798: {'lr': 0.0004842766896146586, 'samples': 3609216, 'steps': 18797, 'loss/train': 1.5051244497299194} -08/30/2021 16:36:30 - INFO - __main__ - Step 18799: {'lr': 0.0004842748372806147, 'samples': 3609408, 'steps': 18798, 'loss/train': 1.8872275352478027} -08/30/2021 16:36:30 - INFO - __main__ - Step 18800: {'lr': 0.00048427298484101023, 'samples': 3609600, 'steps': 18799, 'loss/train': 1.111180067062378} -08/30/2021 16:36:31 - INFO - __main__ - Step 18801: {'lr': 0.0004842711322958459, 'samples': 3609792, 'steps': 18800, 'loss/train': 1.7275948524475098} -08/30/2021 16:36:33 - INFO - __main__ - Step 18802: {'lr': 0.0004842692796451226, 'samples': 3609984, 'steps': 18801, 'loss/train': 1.684067726135254} -08/30/2021 16:36:33 - INFO - __main__ - Step 18803: {'lr': 0.0004842674268888413, 'samples': 3610176, 'steps': 18802, 'loss/train': 1.430519938468933} -08/30/2021 16:36:33 - INFO - __main__ - Step 18804: {'lr': 0.0004842655740270026, 'samples': 3610368, 'steps': 18803, 'loss/train': 1.34248948097229} -08/30/2021 16:36:34 - INFO - __main__ - Step 18805: {'lr': 0.0004842637210596075, 'samples': 3610560, 'steps': 18804, 'loss/train': 1.3173251152038574} -08/30/2021 16:36:34 - INFO - __main__ - Step 18806: {'lr': 0.0004842618679866567, 'samples': 3610752, 'steps': 18805, 'loss/train': 1.451834797859192} -08/30/2021 16:36:36 - INFO - __main__ - Step 18807: {'lr': 0.0004842600148081512, 'samples': 3610944, 'steps': 18806, 'loss/train': 1.028164029121399} -08/30/2021 16:36:36 - INFO - __main__ - Step 18808: {'lr': 0.00048425816152409173, 'samples': 3611136, 'steps': 18807, 'loss/train': 2.2420125007629395} -08/30/2021 16:36:36 - INFO - __main__ - Step 18809: {'lr': 0.00048425630813447916, 'samples': 3611328, 'steps': 18808, 'loss/train': 1.931848406791687} -08/30/2021 16:36:37 - INFO - __main__ - Step 18810: {'lr': 0.0004842544546393143, 'samples': 3611520, 'steps': 18809, 'loss/train': 1.5243005752563477} -08/30/2021 16:36:37 - INFO - __main__ - Step 18811: {'lr': 0.00048425260103859797, 'samples': 3611712, 'steps': 18810, 'loss/train': 2.062664270401001} -08/30/2021 16:36:39 - INFO - __main__ - Step 18812: {'lr': 0.0004842507473323311, 'samples': 3611904, 'steps': 18811, 'loss/train': 1.3754416704177856} -08/30/2021 16:36:39 - INFO - __main__ - Step 18813: {'lr': 0.00048424889352051436, 'samples': 3612096, 'steps': 18812, 'loss/train': 1.0482581853866577} -08/30/2021 16:36:39 - INFO - __main__ - Step 18814: {'lr': 0.00048424703960314876, 'samples': 3612288, 'steps': 18813, 'loss/train': 1.5366097688674927} -08/30/2021 16:36:40 - INFO - __main__ - Step 18815: {'lr': 0.00048424518558023505, 'samples': 3612480, 'steps': 18814, 'loss/train': 1.6471534967422485} -08/30/2021 16:36:40 - INFO - __main__ - Step 18816: {'lr': 0.00048424333145177405, 'samples': 3612672, 'steps': 18815, 'loss/train': 2.2628097534179688} -08/30/2021 16:36:40 - INFO - __main__ - Step 18817: {'lr': 0.00048424147721776666, 'samples': 3612864, 'steps': 18816, 'loss/train': 1.8539897203445435} -08/30/2021 16:36:42 - INFO - __main__ - Step 18818: {'lr': 0.00048423962287821366, 'samples': 3613056, 'steps': 18817, 'loss/train': 1.4543426036834717} -08/30/2021 16:36:43 - INFO - __main__ - Step 18819: {'lr': 0.00048423776843311585, 'samples': 3613248, 'steps': 18818, 'loss/train': 1.724756121635437} -08/30/2021 16:36:43 - INFO - __main__ - Step 18820: {'lr': 0.00048423591388247416, 'samples': 3613440, 'steps': 18819, 'loss/train': 1.831925392150879} -08/30/2021 16:36:44 - INFO - __main__ - Step 18821: {'lr': 0.0004842340592262894, 'samples': 3613632, 'steps': 18820, 'loss/train': 1.9668060541152954} -08/30/2021 16:36:44 - INFO - __main__ - Step 18822: {'lr': 0.00048423220446456233, 'samples': 3613824, 'steps': 18821, 'loss/train': 1.4850150346755981} -08/30/2021 16:36:44 - INFO - __main__ - Step 18823: {'lr': 0.0004842303495972939, 'samples': 3614016, 'steps': 18822, 'loss/train': 1.7642061710357666} -08/30/2021 16:36:46 - INFO - __main__ - Step 18824: {'lr': 0.00048422849462448483, 'samples': 3614208, 'steps': 18823, 'loss/train': 2.1004860401153564} -08/30/2021 16:36:47 - INFO - __main__ - Step 18825: {'lr': 0.0004842266395461361, 'samples': 3614400, 'steps': 18824, 'loss/train': 1.674424409866333} -08/30/2021 16:36:47 - INFO - __main__ - Step 18826: {'lr': 0.0004842247843622484, 'samples': 3614592, 'steps': 18825, 'loss/train': 1.7505078315734863} -08/30/2021 16:36:47 - INFO - __main__ - Step 18827: {'lr': 0.0004842229290728226, 'samples': 3614784, 'steps': 18826, 'loss/train': 1.1835781335830688} -08/30/2021 16:36:48 - INFO - __main__ - Step 18828: {'lr': 0.0004842210736778596, 'samples': 3614976, 'steps': 18827, 'loss/train': 2.0453503131866455} -08/30/2021 16:36:48 - INFO - __main__ - Step 18829: {'lr': 0.0004842192181773602, 'samples': 3615168, 'steps': 18828, 'loss/train': 1.901028037071228} -08/30/2021 16:36:48 - INFO - __main__ - Step 18830: {'lr': 0.0004842173625713252, 'samples': 3615360, 'steps': 18829, 'loss/train': 1.8921504020690918} -08/30/2021 16:36:50 - INFO - __main__ - Step 18831: {'lr': 0.0004842155068597556, 'samples': 3615552, 'steps': 18830, 'loss/train': 2.693031072616577} -08/30/2021 16:36:50 - INFO - __main__ - Step 18832: {'lr': 0.0004842136510426519, 'samples': 3615744, 'steps': 18831, 'loss/train': 1.7852935791015625} -08/30/2021 16:36:51 - INFO - __main__ - Step 18833: {'lr': 0.00048421179512001536, 'samples': 3615936, 'steps': 18832, 'loss/train': 1.0270863771438599} -08/30/2021 16:36:51 - INFO - __main__ - Step 18834: {'lr': 0.0004842099390918464, 'samples': 3616128, 'steps': 18833, 'loss/train': 1.476439356803894} -08/30/2021 16:36:51 - INFO - __main__ - Step 18835: {'lr': 0.00048420808295814624, 'samples': 3616320, 'steps': 18834, 'loss/train': 1.4553825855255127} -08/30/2021 16:36:53 - INFO - __main__ - Step 18836: {'lr': 0.00048420622671891533, 'samples': 3616512, 'steps': 18835, 'loss/train': 1.8982298374176025} -08/30/2021 16:36:53 - INFO - __main__ - Step 18837: {'lr': 0.00048420437037415486, 'samples': 3616704, 'steps': 18836, 'loss/train': 1.5830507278442383} -08/30/2021 16:36:54 - INFO - __main__ - Step 18838: {'lr': 0.00048420251392386547, 'samples': 3616896, 'steps': 18837, 'loss/train': 2.066307544708252} -08/30/2021 16:36:54 - INFO - __main__ - Step 18839: {'lr': 0.0004842006573680481, 'samples': 3617088, 'steps': 18838, 'loss/train': 1.865342617034912} -08/30/2021 16:36:54 - INFO - __main__ - Step 18840: {'lr': 0.0004841988007067034, 'samples': 3617280, 'steps': 18839, 'loss/train': 1.5887759923934937} -08/30/2021 16:36:56 - INFO - __main__ - Step 18841: {'lr': 0.00048419694393983244, 'samples': 3617472, 'steps': 18840, 'loss/train': 1.801106572151184} -08/30/2021 16:36:56 - INFO - __main__ - Step 18842: {'lr': 0.00048419508706743587, 'samples': 3617664, 'steps': 18841, 'loss/train': 1.5339930057525635} -08/30/2021 16:36:57 - INFO - __main__ - Step 18843: {'lr': 0.00048419323008951467, 'samples': 3617856, 'steps': 18842, 'loss/train': 1.4506832361221313} -08/30/2021 16:36:57 - INFO - __main__ - Step 18844: {'lr': 0.00048419137300606963, 'samples': 3618048, 'steps': 18843, 'loss/train': 1.8783767223358154} -08/30/2021 16:36:57 - INFO - __main__ - Step 18845: {'lr': 0.00048418951581710154, 'samples': 3618240, 'steps': 18844, 'loss/train': 1.9886521100997925} -08/30/2021 16:37:00 - INFO - __main__ - Step 18846: {'lr': 0.00048418765852261124, 'samples': 3618432, 'steps': 18845, 'loss/train': 1.754531979560852} -08/30/2021 16:37:00 - INFO - __main__ - Step 18847: {'lr': 0.0004841858011225996, 'samples': 3618624, 'steps': 18846, 'loss/train': 1.5919480323791504} -08/30/2021 16:37:00 - INFO - __main__ - Step 18848: {'lr': 0.0004841839436170675, 'samples': 3618816, 'steps': 18847, 'loss/train': 1.814907193183899} -08/30/2021 16:37:01 - INFO - __main__ - Step 18849: {'lr': 0.0004841820860060157, 'samples': 3619008, 'steps': 18848, 'loss/train': 1.5920826196670532} -08/30/2021 16:37:01 - INFO - __main__ - Step 18850: {'lr': 0.0004841802282894451, 'samples': 3619200, 'steps': 18849, 'loss/train': 2.005141496658325} -08/30/2021 16:37:01 - INFO - __main__ - Step 18851: {'lr': 0.0004841783704673565, 'samples': 3619392, 'steps': 18850, 'loss/train': 2.8705596923828125} -08/30/2021 16:37:03 - INFO - __main__ - Step 18852: {'lr': 0.00048417651253975067, 'samples': 3619584, 'steps': 18851, 'loss/train': 1.971785545349121} -08/30/2021 16:37:04 - INFO - __main__ - Step 18853: {'lr': 0.00048417465450662856, 'samples': 3619776, 'steps': 18852, 'loss/train': 1.8574641942977905} -08/30/2021 16:37:04 - INFO - __main__ - Step 18854: {'lr': 0.0004841727963679909, 'samples': 3619968, 'steps': 18853, 'loss/train': 1.6750909090042114} -08/30/2021 16:37:04 - INFO - __main__ - Step 18855: {'lr': 0.0004841709381238387, 'samples': 3620160, 'steps': 18854, 'loss/train': 1.5622586011886597} -08/30/2021 16:37:05 - INFO - __main__ - Step 18856: {'lr': 0.0004841690797741726, 'samples': 3620352, 'steps': 18855, 'loss/train': 1.5276461839675903} -08/30/2021 16:37:06 - INFO - __main__ - Step 18857: {'lr': 0.0004841672213189936, 'samples': 3620544, 'steps': 18856, 'loss/train': 1.2764571905136108} -08/30/2021 16:37:06 - INFO - __main__ - Step 18858: {'lr': 0.00048416536275830245, 'samples': 3620736, 'steps': 18857, 'loss/train': 1.8183342218399048} -08/30/2021 16:37:07 - INFO - __main__ - Step 18859: {'lr': 0.00048416350409209995, 'samples': 3620928, 'steps': 18858, 'loss/train': 1.6793569326400757} -08/30/2021 16:37:07 - INFO - __main__ - Step 18860: {'lr': 0.000484161645320387, 'samples': 3621120, 'steps': 18859, 'loss/train': 1.5738416910171509} -08/30/2021 16:37:08 - INFO - __main__ - Step 18861: {'lr': 0.0004841597864431645, 'samples': 3621312, 'steps': 18860, 'loss/train': 1.579481840133667} -08/30/2021 16:37:09 - INFO - __main__ - Step 18862: {'lr': 0.00048415792746043314, 'samples': 3621504, 'steps': 18861, 'loss/train': 1.9011242389678955} -08/30/2021 16:37:10 - INFO - __main__ - Step 18863: {'lr': 0.00048415606837219383, 'samples': 3621696, 'steps': 18862, 'loss/train': 2.1082510948181152} -08/30/2021 16:37:10 - INFO - __main__ - Step 18864: {'lr': 0.00048415420917844744, 'samples': 3621888, 'steps': 18863, 'loss/train': 2.0008208751678467} -08/30/2021 16:37:10 - INFO - __main__ - Step 18865: {'lr': 0.00048415234987919474, 'samples': 3622080, 'steps': 18864, 'loss/train': 0.12366552650928497} -08/30/2021 16:37:11 - INFO - __main__ - Step 18866: {'lr': 0.0004841504904744367, 'samples': 3622272, 'steps': 18865, 'loss/train': 1.6811604499816895} -08/30/2021 16:37:11 - INFO - __main__ - Step 18867: {'lr': 0.0004841486309641739, 'samples': 3622464, 'steps': 18866, 'loss/train': 1.8319847583770752} -08/30/2021 16:37:13 - INFO - __main__ - Step 18868: {'lr': 0.00048414677134840753, 'samples': 3622656, 'steps': 18867, 'loss/train': 1.8587208986282349} -08/30/2021 16:37:13 - INFO - __main__ - Step 18869: {'lr': 0.00048414491162713814, 'samples': 3622848, 'steps': 18868, 'loss/train': 1.55882728099823} -08/30/2021 16:37:13 - INFO - __main__ - Step 18870: {'lr': 0.00048414305180036665, 'samples': 3623040, 'steps': 18869, 'loss/train': 1.6058638095855713} -08/30/2021 16:37:14 - INFO - __main__ - Step 18871: {'lr': 0.0004841411918680939, 'samples': 3623232, 'steps': 18870, 'loss/train': 1.3894546031951904} -08/30/2021 16:37:14 - INFO - __main__ - Step 18872: {'lr': 0.0004841393318303208, 'samples': 3623424, 'steps': 18871, 'loss/train': 1.9317538738250732} -08/30/2021 16:37:16 - INFO - __main__ - Step 18873: {'lr': 0.0004841374716870481, 'samples': 3623616, 'steps': 18872, 'loss/train': 2.1624057292938232} -08/30/2021 16:37:16 - INFO - __main__ - Step 18874: {'lr': 0.00048413561143827665, 'samples': 3623808, 'steps': 18873, 'loss/train': 4.072031497955322} -08/30/2021 16:37:17 - INFO - __main__ - Step 18875: {'lr': 0.00048413375108400736, 'samples': 3624000, 'steps': 18874, 'loss/train': 1.3719980716705322} -08/30/2021 16:37:17 - INFO - __main__ - Step 18876: {'lr': 0.000484131890624241, 'samples': 3624192, 'steps': 18875, 'loss/train': 2.0993733406066895} -08/30/2021 16:37:17 - INFO - __main__ - Step 18877: {'lr': 0.00048413003005897835, 'samples': 3624384, 'steps': 18876, 'loss/train': 1.4373953342437744} -08/30/2021 16:37:19 - INFO - __main__ - Step 18878: {'lr': 0.0004841281693882204, 'samples': 3624576, 'steps': 18877, 'loss/train': 1.7812221050262451} -08/30/2021 16:37:19 - INFO - __main__ - Step 18879: {'lr': 0.0004841263086119679, 'samples': 3624768, 'steps': 18878, 'loss/train': 1.3264883756637573} -08/30/2021 16:37:20 - INFO - __main__ - Step 18880: {'lr': 0.00048412444773022166, 'samples': 3624960, 'steps': 18879, 'loss/train': 1.821436882019043} -08/30/2021 16:37:20 - INFO - __main__ - Step 18881: {'lr': 0.0004841225867429826, 'samples': 3625152, 'steps': 18880, 'loss/train': 0.1224297508597374} -08/30/2021 16:37:20 - INFO - __main__ - Step 18882: {'lr': 0.0004841207256502515, 'samples': 3625344, 'steps': 18881, 'loss/train': 1.7958325147628784} -08/30/2021 16:37:22 - INFO - __main__ - Step 18883: {'lr': 0.0004841188644520292, 'samples': 3625536, 'steps': 18882, 'loss/train': 1.6555604934692383} -08/30/2021 16:37:22 - INFO - __main__ - Step 18884: {'lr': 0.0004841170031483165, 'samples': 3625728, 'steps': 18883, 'loss/train': 1.895039439201355} -08/30/2021 16:37:23 - INFO - __main__ - Step 18885: {'lr': 0.0004841151417391144, 'samples': 3625920, 'steps': 18884, 'loss/train': 1.6589775085449219} -08/30/2021 16:37:23 - INFO - __main__ - Step 18886: {'lr': 0.00048411328022442357, 'samples': 3626112, 'steps': 18885, 'loss/train': 2.0037918090820312} -08/30/2021 16:37:23 - INFO - __main__ - Step 18887: {'lr': 0.000484111418604245, 'samples': 3626304, 'steps': 18886, 'loss/train': 0.38222405314445496} -08/30/2021 16:37:24 - INFO - __main__ - Step 18888: {'lr': 0.00048410955687857926, 'samples': 3626496, 'steps': 18887, 'loss/train': 0.8166512846946716} -08/30/2021 16:37:25 - INFO - __main__ - Step 18889: {'lr': 0.0004841076950474275, 'samples': 3626688, 'steps': 18888, 'loss/train': 1.5573936700820923} -08/30/2021 16:37:26 - INFO - __main__ - Step 18890: {'lr': 0.0004841058331107904, 'samples': 3626880, 'steps': 18889, 'loss/train': 1.5806729793548584} -08/30/2021 16:37:26 - INFO - __main__ - Step 18891: {'lr': 0.00048410397106866883, 'samples': 3627072, 'steps': 18890, 'loss/train': 1.5310070514678955} -08/30/2021 16:37:26 - INFO - __main__ - Step 18892: {'lr': 0.0004841021089210636, 'samples': 3627264, 'steps': 18891, 'loss/train': 1.0836338996887207} -08/30/2021 16:37:27 - INFO - __main__ - Step 18893: {'lr': 0.0004841002466679756, 'samples': 3627456, 'steps': 18892, 'loss/train': 1.0207998752593994} -08/30/2021 16:37:28 - INFO - __main__ - Step 18894: {'lr': 0.00048409838430940556, 'samples': 3627648, 'steps': 18893, 'loss/train': 1.770282506942749} -08/30/2021 16:37:29 - INFO - __main__ - Step 18895: {'lr': 0.00048409652184535447, 'samples': 3627840, 'steps': 18894, 'loss/train': 2.0498998165130615} -08/30/2021 16:37:29 - INFO - __main__ - Step 18896: {'lr': 0.0004840946592758231, 'samples': 3628032, 'steps': 18895, 'loss/train': 1.9854480028152466} -08/30/2021 16:37:29 - INFO - __main__ - Step 18897: {'lr': 0.00048409279660081226, 'samples': 3628224, 'steps': 18896, 'loss/train': 1.1680973768234253} -08/30/2021 16:37:30 - INFO - __main__ - Step 18898: {'lr': 0.0004840909338203229, 'samples': 3628416, 'steps': 18897, 'loss/train': 1.9105874300003052} -08/30/2021 16:37:31 - INFO - __main__ - Step 18899: {'lr': 0.0004840890709343557, 'samples': 3628608, 'steps': 18898, 'loss/train': 1.7854198217391968} -08/30/2021 16:37:32 - INFO - __main__ - Step 18900: {'lr': 0.0004840872079429116, 'samples': 3628800, 'steps': 18899, 'loss/train': 1.3159809112548828} -08/30/2021 16:37:32 - INFO - __main__ - Step 18901: {'lr': 0.00048408534484599143, 'samples': 3628992, 'steps': 18900, 'loss/train': 1.999829888343811} -08/30/2021 16:37:32 - INFO - __main__ - Step 18902: {'lr': 0.00048408348164359594, 'samples': 3629184, 'steps': 18901, 'loss/train': 1.5713098049163818} -08/30/2021 16:37:33 - INFO - __main__ - Step 18903: {'lr': 0.00048408161833572613, 'samples': 3629376, 'steps': 18902, 'loss/train': 1.4454656839370728} -08/30/2021 16:37:35 - INFO - __main__ - Step 18904: {'lr': 0.0004840797549223827, 'samples': 3629568, 'steps': 18903, 'loss/train': 1.9976674318313599} -08/30/2021 16:37:35 - INFO - __main__ - Step 18905: {'lr': 0.00048407789140356654, 'samples': 3629760, 'steps': 18904, 'loss/train': 1.8277145624160767} -08/30/2021 16:37:36 - INFO - __main__ - Step 18906: {'lr': 0.00048407602777927856, 'samples': 3629952, 'steps': 18905, 'loss/train': 1.0211728811264038} -08/30/2021 16:37:36 - INFO - __main__ - Step 18907: {'lr': 0.0004840741640495195, 'samples': 3630144, 'steps': 18906, 'loss/train': 1.4919006824493408} -08/30/2021 16:37:36 - INFO - __main__ - Step 18908: {'lr': 0.0004840723002142902, 'samples': 3630336, 'steps': 18907, 'loss/train': 1.4708335399627686} -08/30/2021 16:37:37 - INFO - __main__ - Step 18909: {'lr': 0.0004840704362735916, 'samples': 3630528, 'steps': 18908, 'loss/train': 1.542413592338562} -08/30/2021 16:37:39 - INFO - __main__ - Step 18910: {'lr': 0.0004840685722274244, 'samples': 3630720, 'steps': 18909, 'loss/train': 0.1078791692852974} -08/30/2021 16:37:39 - INFO - __main__ - Step 18911: {'lr': 0.0004840667080757896, 'samples': 3630912, 'steps': 18910, 'loss/train': 1.592965006828308} -08/30/2021 16:37:40 - INFO - __main__ - Step 18912: {'lr': 0.00048406484381868786, 'samples': 3631104, 'steps': 18911, 'loss/train': 0.6894677877426147} -08/30/2021 16:37:40 - INFO - __main__ - Step 18913: {'lr': 0.0004840629794561202, 'samples': 3631296, 'steps': 18912, 'loss/train': 0.5969001054763794} -08/30/2021 16:37:41 - INFO - __main__ - Step 18914: {'lr': 0.0004840611149880873, 'samples': 3631488, 'steps': 18913, 'loss/train': 0.5913561582565308} -08/30/2021 16:37:41 - INFO - __main__ - Step 18915: {'lr': 0.0004840592504145901, 'samples': 3631680, 'steps': 18914, 'loss/train': 1.8101297616958618} -08/30/2021 16:37:42 - INFO - __main__ - Step 18916: {'lr': 0.0004840573857356294, 'samples': 3631872, 'steps': 18915, 'loss/train': 0.9657647609710693} -08/30/2021 16:37:43 - INFO - __main__ - Step 18917: {'lr': 0.0004840555209512061, 'samples': 3632064, 'steps': 18916, 'loss/train': 1.3331830501556396} -08/30/2021 16:37:43 - INFO - __main__ - Step 18918: {'lr': 0.00048405365606132096, 'samples': 3632256, 'steps': 18917, 'loss/train': 1.512233018875122} -08/30/2021 16:37:43 - INFO - __main__ - Step 18919: {'lr': 0.00048405179106597487, 'samples': 3632448, 'steps': 18918, 'loss/train': 1.2156389951705933} -08/30/2021 16:37:44 - INFO - __main__ - Step 18920: {'lr': 0.0004840499259651686, 'samples': 3632640, 'steps': 18919, 'loss/train': 1.3688234090805054} -08/30/2021 16:37:45 - INFO - __main__ - Step 18921: {'lr': 0.0004840480607589031, 'samples': 3632832, 'steps': 18920, 'loss/train': 2.3019397258758545} -08/30/2021 16:37:46 - INFO - __main__ - Step 18922: {'lr': 0.0004840461954471792, 'samples': 3633024, 'steps': 18921, 'loss/train': 1.5780038833618164} -08/30/2021 16:37:46 - INFO - __main__ - Step 18923: {'lr': 0.00048404433002999757, 'samples': 3633216, 'steps': 18922, 'loss/train': 1.473617434501648} -08/30/2021 16:37:46 - INFO - __main__ - Step 18924: {'lr': 0.0004840424645073593, 'samples': 3633408, 'steps': 18923, 'loss/train': 1.555058479309082} -08/30/2021 16:37:47 - INFO - __main__ - Step 18925: {'lr': 0.000484040598879265, 'samples': 3633600, 'steps': 18924, 'loss/train': 1.5462207794189453} -08/30/2021 16:37:48 - INFO - __main__ - Step 18926: {'lr': 0.0004840387331457157, 'samples': 3633792, 'steps': 18925, 'loss/train': 1.7636566162109375} -08/30/2021 16:37:49 - INFO - __main__ - Step 18927: {'lr': 0.00048403686730671215, 'samples': 3633984, 'steps': 18926, 'loss/train': 1.7328298091888428} -08/30/2021 16:37:49 - INFO - __main__ - Step 18928: {'lr': 0.0004840350013622552, 'samples': 3634176, 'steps': 18927, 'loss/train': 1.6066393852233887} -08/30/2021 16:37:49 - INFO - __main__ - Step 18929: {'lr': 0.0004840331353123456, 'samples': 3634368, 'steps': 18928, 'loss/train': 1.3455466032028198} -08/30/2021 16:37:50 - INFO - __main__ - Step 18930: {'lr': 0.00048403126915698435, 'samples': 3634560, 'steps': 18929, 'loss/train': 1.7716022729873657} -08/30/2021 16:37:51 - INFO - __main__ - Step 18931: {'lr': 0.00048402940289617223, 'samples': 3634752, 'steps': 18930, 'loss/train': 1.5083965063095093} -08/30/2021 16:37:52 - INFO - __main__ - Step 18932: {'lr': 0.00048402753652991007, 'samples': 3634944, 'steps': 18931, 'loss/train': 1.6436960697174072} -08/30/2021 16:37:52 - INFO - __main__ - Step 18933: {'lr': 0.0004840256700581988, 'samples': 3635136, 'steps': 18932, 'loss/train': 1.7264306545257568} -08/30/2021 16:37:52 - INFO - __main__ - Step 18934: {'lr': 0.000484023803481039, 'samples': 3635328, 'steps': 18933, 'loss/train': 2.0844295024871826} -08/30/2021 16:37:53 - INFO - __main__ - Step 18935: {'lr': 0.00048402193679843175, 'samples': 3635520, 'steps': 18934, 'loss/train': 2.012082815170288} -08/30/2021 16:37:54 - INFO - __main__ - Step 18936: {'lr': 0.00048402007001037786, 'samples': 3635712, 'steps': 18935, 'loss/train': 1.2280157804489136} -08/30/2021 16:37:55 - INFO - __main__ - Step 18937: {'lr': 0.0004840182031168781, 'samples': 3635904, 'steps': 18936, 'loss/train': 1.131327509880066} -08/30/2021 16:37:55 - INFO - __main__ - Step 18938: {'lr': 0.0004840163361179334, 'samples': 3636096, 'steps': 18937, 'loss/train': 2.4972782135009766} -08/30/2021 16:37:56 - INFO - __main__ - Step 18939: {'lr': 0.00048401446901354453, 'samples': 3636288, 'steps': 18938, 'loss/train': 1.8392916917800903} -08/30/2021 16:37:56 - INFO - __main__ - Step 18940: {'lr': 0.0004840126018037123, 'samples': 3636480, 'steps': 18939, 'loss/train': 1.055567979812622} -08/30/2021 16:37:56 - INFO - __main__ - Step 18941: {'lr': 0.0004840107344884377, 'samples': 3636672, 'steps': 18940, 'loss/train': 1.5509389638900757} -08/30/2021 16:37:58 - INFO - __main__ - Step 18942: {'lr': 0.0004840088670677214, 'samples': 3636864, 'steps': 18941, 'loss/train': 1.7684361934661865} -08/30/2021 16:37:58 - INFO - __main__ - Step 18943: {'lr': 0.0004840069995415643, 'samples': 3637056, 'steps': 18942, 'loss/train': 1.6116442680358887} -08/30/2021 16:37:58 - INFO - __main__ - Step 18944: {'lr': 0.0004840051319099673, 'samples': 3637248, 'steps': 18943, 'loss/train': 1.3261322975158691} -08/30/2021 16:37:59 - INFO - __main__ - Step 18945: {'lr': 0.0004840032641729312, 'samples': 3637440, 'steps': 18944, 'loss/train': 1.5126307010650635} -08/30/2021 16:37:59 - INFO - __main__ - Step 18946: {'lr': 0.0004840013963304568, 'samples': 3637632, 'steps': 18945, 'loss/train': 1.330876350402832} -08/30/2021 16:38:01 - INFO - __main__ - Step 18947: {'lr': 0.000483999528382545, 'samples': 3637824, 'steps': 18946, 'loss/train': 1.518810510635376} -08/30/2021 16:38:01 - INFO - __main__ - Step 18948: {'lr': 0.00048399766032919666, 'samples': 3638016, 'steps': 18947, 'loss/train': 1.6638489961624146} -08/30/2021 16:38:02 - INFO - __main__ - Step 18949: {'lr': 0.0004839957921704126, 'samples': 3638208, 'steps': 18948, 'loss/train': 1.2972757816314697} -08/30/2021 16:38:02 - INFO - __main__ - Step 18950: {'lr': 0.0004839939239061936, 'samples': 3638400, 'steps': 18949, 'loss/train': 1.5717649459838867} -08/30/2021 16:38:02 - INFO - __main__ - Step 18951: {'lr': 0.00048399205553654046, 'samples': 3638592, 'steps': 18950, 'loss/train': 2.0166611671447754} -08/30/2021 16:38:04 - INFO - __main__ - Step 18952: {'lr': 0.0004839901870614543, 'samples': 3638784, 'steps': 18951, 'loss/train': 2.096992254257202} -08/30/2021 16:38:05 - INFO - __main__ - Step 18953: {'lr': 0.0004839883184809356, 'samples': 3638976, 'steps': 18952, 'loss/train': 1.51292884349823} -08/30/2021 16:38:05 - INFO - __main__ - Step 18954: {'lr': 0.00048398644979498543, 'samples': 3639168, 'steps': 18953, 'loss/train': 1.4720566272735596} -08/30/2021 16:38:05 - INFO - __main__ - Step 18955: {'lr': 0.0004839845810036047, 'samples': 3639360, 'steps': 18954, 'loss/train': 1.8984678983688354} -08/30/2021 16:38:06 - INFO - __main__ - Step 18956: {'lr': 0.00048398271210679393, 'samples': 3639552, 'steps': 18955, 'loss/train': 1.601037621498108} -08/30/2021 16:38:06 - INFO - __main__ - Step 18957: {'lr': 0.0004839808431045543, 'samples': 3639744, 'steps': 18956, 'loss/train': 2.0644285678863525} -08/30/2021 16:38:08 - INFO - __main__ - Step 18958: {'lr': 0.00048397897399688643, 'samples': 3639936, 'steps': 18957, 'loss/train': 0.19773952662944794} -08/30/2021 16:38:09 - INFO - __main__ - Step 18959: {'lr': 0.0004839771047837913, 'samples': 3640128, 'steps': 18958, 'loss/train': 2.199984550476074} -08/30/2021 16:38:09 - INFO - __main__ - Step 18960: {'lr': 0.00048397523546526966, 'samples': 3640320, 'steps': 18959, 'loss/train': 1.8648544549942017} -08/30/2021 16:38:10 - INFO - __main__ - Step 18961: {'lr': 0.0004839733660413224, 'samples': 3640512, 'steps': 18960, 'loss/train': 0.8826211094856262} -08/30/2021 16:38:10 - INFO - __main__ - Step 18962: {'lr': 0.0004839714965119504, 'samples': 3640704, 'steps': 18961, 'loss/train': 1.3562123775482178} -08/30/2021 16:38:11 - INFO - __main__ - Step 18963: {'lr': 0.0004839696268771544, 'samples': 3640896, 'steps': 18962, 'loss/train': 1.1805273294448853} -08/30/2021 16:38:12 - INFO - __main__ - Step 18964: {'lr': 0.0004839677571369353, 'samples': 3641088, 'steps': 18963, 'loss/train': 1.6383274793624878} -08/30/2021 16:38:12 - INFO - __main__ - Step 18965: {'lr': 0.000483965887291294, 'samples': 3641280, 'steps': 18964, 'loss/train': 1.8031878471374512} -08/30/2021 16:38:13 - INFO - __main__ - Step 18966: {'lr': 0.0004839640173402312, 'samples': 3641472, 'steps': 18965, 'loss/train': 1.878609538078308} -08/30/2021 16:38:13 - INFO - __main__ - Step 18967: {'lr': 0.00048396214728374786, 'samples': 3641664, 'steps': 18966, 'loss/train': 1.4588313102722168} -08/30/2021 16:38:15 - INFO - __main__ - Step 18968: {'lr': 0.00048396027712184475, 'samples': 3641856, 'steps': 18967, 'loss/train': 1.53431236743927} -08/30/2021 16:38:15 - INFO - __main__ - Step 18969: {'lr': 0.0004839584068545228, 'samples': 3642048, 'steps': 18968, 'loss/train': 1.6313693523406982} -08/30/2021 16:38:16 - INFO - __main__ - Step 18970: {'lr': 0.0004839565364817828, 'samples': 3642240, 'steps': 18969, 'loss/train': 2.1428191661834717} -08/30/2021 16:38:16 - INFO - __main__ - Step 18971: {'lr': 0.0004839546660036256, 'samples': 3642432, 'steps': 18970, 'loss/train': 1.717660903930664} -08/30/2021 16:38:16 - INFO - __main__ - Step 18972: {'lr': 0.000483952795420052, 'samples': 3642624, 'steps': 18971, 'loss/train': 2.3953351974487305} -08/30/2021 16:38:19 - INFO - __main__ - Step 18973: {'lr': 0.0004839509247310629, 'samples': 3642816, 'steps': 18972, 'loss/train': 2.4619195461273193} -08/30/2021 16:38:19 - INFO - __main__ - Step 18974: {'lr': 0.00048394905393665913, 'samples': 3643008, 'steps': 18973, 'loss/train': 1.441680908203125} -08/30/2021 16:38:19 - INFO - __main__ - Step 18975: {'lr': 0.00048394718303684147, 'samples': 3643200, 'steps': 18974, 'loss/train': 1.2632781267166138} -08/30/2021 16:38:20 - INFO - __main__ - Step 18976: {'lr': 0.00048394531203161084, 'samples': 3643392, 'steps': 18975, 'loss/train': 1.9469889402389526} -08/30/2021 16:38:20 - INFO - __main__ - Step 18977: {'lr': 0.00048394344092096816, 'samples': 3643584, 'steps': 18976, 'loss/train': 1.5366647243499756} -08/30/2021 16:38:21 - INFO - __main__ - Step 18978: {'lr': 0.0004839415697049141, 'samples': 3643776, 'steps': 18977, 'loss/train': 1.3638979196548462} -08/30/2021 16:38:21 - INFO - __main__ - Step 18979: {'lr': 0.00048393969838344956, 'samples': 3643968, 'steps': 18978, 'loss/train': 1.0342578887939453} -08/30/2021 16:38:22 - INFO - __main__ - Step 18980: {'lr': 0.0004839378269565754, 'samples': 3644160, 'steps': 18979, 'loss/train': 0.22066383063793182} -08/30/2021 16:38:23 - INFO - __main__ - Step 18981: {'lr': 0.00048393595542429253, 'samples': 3644352, 'steps': 18980, 'loss/train': 1.4377784729003906} -08/30/2021 16:38:23 - INFO - __main__ - Step 18982: {'lr': 0.0004839340837866016, 'samples': 3644544, 'steps': 18981, 'loss/train': 1.9067206382751465} -08/30/2021 16:38:24 - INFO - __main__ - Step 18983: {'lr': 0.00048393221204350376, 'samples': 3644736, 'steps': 18982, 'loss/train': 1.786861777305603} -08/30/2021 16:38:24 - INFO - __main__ - Step 18984: {'lr': 0.0004839303401949996, 'samples': 3644928, 'steps': 18983, 'loss/train': 2.1087722778320312} -08/30/2021 16:38:25 - INFO - __main__ - Step 18985: {'lr': 0.00048392846824109, 'samples': 3645120, 'steps': 18984, 'loss/train': 1.2350329160690308} -08/30/2021 16:38:26 - INFO - __main__ - Step 18986: {'lr': 0.00048392659618177585, 'samples': 3645312, 'steps': 18985, 'loss/train': 1.221070408821106} -08/30/2021 16:38:26 - INFO - __main__ - Step 18987: {'lr': 0.000483924724017058, 'samples': 3645504, 'steps': 18986, 'loss/train': 1.5440654754638672} -08/30/2021 16:38:27 - INFO - __main__ - Step 18988: {'lr': 0.00048392285174693727, 'samples': 3645696, 'steps': 18987, 'loss/train': 1.292403221130371} -08/30/2021 16:38:27 - INFO - __main__ - Step 18989: {'lr': 0.0004839209793714146, 'samples': 3645888, 'steps': 18988, 'loss/train': 1.4480961561203003} -08/30/2021 16:38:28 - INFO - __main__ - Step 18990: {'lr': 0.00048391910689049057, 'samples': 3646080, 'steps': 18989, 'loss/train': 1.1235562562942505} -08/30/2021 16:38:29 - INFO - __main__ - Step 18991: {'lr': 0.00048391723430416634, 'samples': 3646272, 'steps': 18990, 'loss/train': 1.2940679788589478} -08/30/2021 16:38:29 - INFO - __main__ - Step 18992: {'lr': 0.00048391536161244254, 'samples': 3646464, 'steps': 18991, 'loss/train': 1.7962981462478638} -08/30/2021 16:38:29 - INFO - __main__ - Step 18993: {'lr': 0.0004839134888153202, 'samples': 3646656, 'steps': 18992, 'loss/train': 1.6466200351715088} -08/30/2021 16:38:30 - INFO - __main__ - Step 18994: {'lr': 0.00048391161591279994, 'samples': 3646848, 'steps': 18993, 'loss/train': 1.578004240989685} -08/30/2021 16:38:32 - INFO - __main__ - Step 18995: {'lr': 0.0004839097429048827, 'samples': 3647040, 'steps': 18994, 'loss/train': 1.8380944728851318} -08/30/2021 16:38:32 - INFO - __main__ - Step 18996: {'lr': 0.00048390786979156944, 'samples': 3647232, 'steps': 18995, 'loss/train': 1.4364378452301025} -08/30/2021 16:38:32 - INFO - __main__ - Step 18997: {'lr': 0.0004839059965728608, 'samples': 3647424, 'steps': 18996, 'loss/train': 3.3598239421844482} -08/30/2021 16:38:33 - INFO - __main__ - Step 18998: {'lr': 0.0004839041232487578, 'samples': 3647616, 'steps': 18997, 'loss/train': 2.0735983848571777} -08/30/2021 16:38:33 - INFO - __main__ - Step 18999: {'lr': 0.0004839022498192612, 'samples': 3647808, 'steps': 18998, 'loss/train': 1.5744572877883911} -08/30/2021 16:38:33 - INFO - __main__ - Step 19000: {'lr': 0.0004839003762843718, 'samples': 3648000, 'steps': 18999, 'loss/train': 1.8879928588867188} -08/30/2021 16:38:35 - INFO - __main__ - Step 19001: {'lr': 0.00048389850264409054, 'samples': 3648192, 'steps': 19000, 'loss/train': 0.9014919996261597} -08/30/2021 16:38:35 - INFO - __main__ - Step 19002: {'lr': 0.00048389662889841825, 'samples': 3648384, 'steps': 19001, 'loss/train': 2.4000437259674072} -08/30/2021 16:38:36 - INFO - __main__ - Step 19003: {'lr': 0.0004838947550473557, 'samples': 3648576, 'steps': 19002, 'loss/train': 1.8039371967315674} -08/30/2021 16:38:36 - INFO - __main__ - Step 19004: {'lr': 0.00048389288109090383, 'samples': 3648768, 'steps': 19003, 'loss/train': 2.0567820072174072} -08/30/2021 16:38:36 - INFO - __main__ - Step 19005: {'lr': 0.0004838910070290634, 'samples': 3648960, 'steps': 19004, 'loss/train': 1.4886016845703125} -08/30/2021 16:38:38 - INFO - __main__ - Step 19006: {'lr': 0.00048388913286183535, 'samples': 3649152, 'steps': 19005, 'loss/train': 2.1133718490600586} -08/30/2021 16:38:39 - INFO - __main__ - Step 19007: {'lr': 0.0004838872585892204, 'samples': 3649344, 'steps': 19006, 'loss/train': 1.2090160846710205} -08/30/2021 16:38:39 - INFO - __main__ - Step 19008: {'lr': 0.00048388538421121946, 'samples': 3649536, 'steps': 19007, 'loss/train': 2.146662473678589} -08/30/2021 16:38:40 - INFO - __main__ - Step 19009: {'lr': 0.00048388350972783346, 'samples': 3649728, 'steps': 19008, 'loss/train': 2.1458070278167725} -08/30/2021 16:38:40 - INFO - __main__ - Step 19010: {'lr': 0.000483881635139063, 'samples': 3649920, 'steps': 19009, 'loss/train': 1.6581511497497559} -08/30/2021 16:38:40 - INFO - __main__ - Step 19011: {'lr': 0.00048387976044490924, 'samples': 3650112, 'steps': 19010, 'loss/train': 1.9609956741333008} -08/30/2021 16:38:41 - INFO - __main__ - Step 19012: {'lr': 0.0004838778856453728, 'samples': 3650304, 'steps': 19011, 'loss/train': 1.3583651781082153} -08/30/2021 16:38:43 - INFO - __main__ - Step 19013: {'lr': 0.00048387601074045464, 'samples': 3650496, 'steps': 19012, 'loss/train': 1.2468626499176025} -08/30/2021 16:38:43 - INFO - __main__ - Step 19014: {'lr': 0.0004838741357301555, 'samples': 3650688, 'steps': 19013, 'loss/train': 1.5498229265213013} -08/30/2021 16:38:44 - INFO - __main__ - Step 19015: {'lr': 0.00048387226061447633, 'samples': 3650880, 'steps': 19014, 'loss/train': 1.8786801099777222} -08/30/2021 16:38:44 - INFO - __main__ - Step 19016: {'lr': 0.0004838703853934179, 'samples': 3651072, 'steps': 19015, 'loss/train': 1.5610238313674927} -08/30/2021 16:38:44 - INFO - __main__ - Step 19017: {'lr': 0.0004838685100669811, 'samples': 3651264, 'steps': 19016, 'loss/train': 1.8917293548583984} -08/30/2021 16:38:46 - INFO - __main__ - Step 19018: {'lr': 0.0004838666346351667, 'samples': 3651456, 'steps': 19017, 'loss/train': 2.051845073699951} -08/30/2021 16:38:46 - INFO - __main__ - Step 19019: {'lr': 0.0004838647590979757, 'samples': 3651648, 'steps': 19018, 'loss/train': 1.5275967121124268} -08/30/2021 16:38:47 - INFO - __main__ - Step 19020: {'lr': 0.00048386288345540876, 'samples': 3651840, 'steps': 19019, 'loss/train': 2.161799907684326} -08/30/2021 16:38:47 - INFO - __main__ - Step 19021: {'lr': 0.00048386100770746686, 'samples': 3652032, 'steps': 19020, 'loss/train': 1.8600828647613525} -08/30/2021 16:38:47 - INFO - __main__ - Step 19022: {'lr': 0.00048385913185415076, 'samples': 3652224, 'steps': 19021, 'loss/train': 1.7161812782287598} -08/30/2021 16:38:49 - INFO - __main__ - Step 19023: {'lr': 0.00048385725589546137, 'samples': 3652416, 'steps': 19022, 'loss/train': 1.2950397729873657} -08/30/2021 16:38:50 - INFO - __main__ - Step 19024: {'lr': 0.0004838553798313995, 'samples': 3652608, 'steps': 19023, 'loss/train': 1.843496561050415} -08/30/2021 16:38:50 - INFO - __main__ - Step 19025: {'lr': 0.000483853503661966, 'samples': 3652800, 'steps': 19024, 'loss/train': 1.6987963914871216} -08/30/2021 16:38:50 - INFO - __main__ - Step 19026: {'lr': 0.00048385162738716174, 'samples': 3652992, 'steps': 19025, 'loss/train': 1.9262787103652954} -08/30/2021 16:38:51 - INFO - __main__ - Step 19027: {'lr': 0.00048384975100698756, 'samples': 3653184, 'steps': 19026, 'loss/train': 1.5370110273361206} -08/30/2021 16:38:51 - INFO - __main__ - Step 19028: {'lr': 0.0004838478745214443, 'samples': 3653376, 'steps': 19027, 'loss/train': 0.09243328869342804} -08/30/2021 16:38:53 - INFO - __main__ - Step 19029: {'lr': 0.00048384599793053275, 'samples': 3653568, 'steps': 19028, 'loss/train': 2.0480871200561523} -08/30/2021 16:38:53 - INFO - __main__ - Step 19030: {'lr': 0.0004838441212342538, 'samples': 3653760, 'steps': 19029, 'loss/train': 1.5750621557235718} -08/30/2021 16:38:54 - INFO - __main__ - Step 19031: {'lr': 0.0004838422444326084, 'samples': 3653952, 'steps': 19030, 'loss/train': 3.643911361694336} -08/30/2021 16:38:54 - INFO - __main__ - Step 19032: {'lr': 0.0004838403675255971, 'samples': 3654144, 'steps': 19031, 'loss/train': 1.4532514810562134} -08/30/2021 16:38:54 - INFO - __main__ - Step 19033: {'lr': 0.0004838384905132211, 'samples': 3654336, 'steps': 19032, 'loss/train': 1.6092004776000977} -08/30/2021 16:38:55 - INFO - __main__ - Step 19034: {'lr': 0.000483836613395481, 'samples': 3654528, 'steps': 19033, 'loss/train': 1.7530258893966675} -08/30/2021 16:38:56 - INFO - __main__ - Step 19035: {'lr': 0.0004838347361723778, 'samples': 3654720, 'steps': 19034, 'loss/train': 0.6507481932640076} -08/30/2021 16:38:57 - INFO - __main__ - Step 19036: {'lr': 0.0004838328588439123, 'samples': 3654912, 'steps': 19035, 'loss/train': 1.0046108961105347} -08/30/2021 16:38:57 - INFO - __main__ - Step 19037: {'lr': 0.0004838309814100852, 'samples': 3655104, 'steps': 19036, 'loss/train': 2.8187057971954346} -08/30/2021 16:38:57 - INFO - __main__ - Step 19038: {'lr': 0.0004838291038708975, 'samples': 3655296, 'steps': 19037, 'loss/train': 2.971289873123169} -08/30/2021 16:38:58 - INFO - __main__ - Step 19039: {'lr': 0.00048382722622635014, 'samples': 3655488, 'steps': 19038, 'loss/train': 1.3843629360198975} -08/30/2021 16:38:59 - INFO - __main__ - Step 19040: {'lr': 0.0004838253484764437, 'samples': 3655680, 'steps': 19039, 'loss/train': 1.6307727098464966} -08/30/2021 16:39:00 - INFO - __main__ - Step 19041: {'lr': 0.0004838234706211792, 'samples': 3655872, 'steps': 19040, 'loss/train': 1.6135318279266357} -08/30/2021 16:39:00 - INFO - __main__ - Step 19042: {'lr': 0.00048382159266055746, 'samples': 3656064, 'steps': 19041, 'loss/train': 0.16198968887329102} -08/30/2021 16:39:00 - INFO - __main__ - Step 19043: {'lr': 0.0004838197145945793, 'samples': 3656256, 'steps': 19042, 'loss/train': 1.6448854207992554} -08/30/2021 16:39:01 - INFO - __main__ - Step 19044: {'lr': 0.0004838178364232456, 'samples': 3656448, 'steps': 19043, 'loss/train': 2.0197489261627197} -08/30/2021 16:39:02 - INFO - __main__ - Step 19045: {'lr': 0.00048381595814655723, 'samples': 3656640, 'steps': 19044, 'loss/train': 1.3987911939620972} -08/30/2021 16:39:03 - INFO - __main__ - Step 19046: {'lr': 0.000483814079764515, 'samples': 3656832, 'steps': 19045, 'loss/train': 1.6451157331466675} -08/30/2021 16:39:03 - INFO - __main__ - Step 19047: {'lr': 0.00048381220127711967, 'samples': 3657024, 'steps': 19046, 'loss/train': 2.3354761600494385} -08/30/2021 16:39:03 - INFO - __main__ - Step 19048: {'lr': 0.0004838103226843722, 'samples': 3657216, 'steps': 19047, 'loss/train': 1.6441980600357056} -08/30/2021 16:39:04 - INFO - __main__ - Step 19049: {'lr': 0.00048380844398627343, 'samples': 3657408, 'steps': 19048, 'loss/train': 1.3039494752883911} -08/30/2021 16:39:04 - INFO - __main__ - Step 19050: {'lr': 0.0004838065651828242, 'samples': 3657600, 'steps': 19049, 'loss/train': 1.348453402519226} -08/30/2021 16:39:06 - INFO - __main__ - Step 19051: {'lr': 0.0004838046862740253, 'samples': 3657792, 'steps': 19050, 'loss/train': 1.6213575601577759} -08/30/2021 16:39:06 - INFO - __main__ - Step 19052: {'lr': 0.0004838028072598777, 'samples': 3657984, 'steps': 19051, 'loss/train': 1.3830773830413818} -08/30/2021 16:39:06 - INFO - __main__ - Step 19053: {'lr': 0.00048380092814038204, 'samples': 3658176, 'steps': 19052, 'loss/train': 1.631980299949646} -08/30/2021 16:39:07 - INFO - __main__ - Step 19054: {'lr': 0.0004837990489155394, 'samples': 3658368, 'steps': 19053, 'loss/train': 1.7626631259918213} -08/30/2021 16:39:07 - INFO - __main__ - Step 19055: {'lr': 0.00048379716958535043, 'samples': 3658560, 'steps': 19054, 'loss/train': 1.5269496440887451} -08/30/2021 16:39:09 - INFO - __main__ - Step 19056: {'lr': 0.00048379529014981604, 'samples': 3658752, 'steps': 19055, 'loss/train': 0.27664247155189514} -08/30/2021 16:39:09 - INFO - __main__ - Step 19057: {'lr': 0.0004837934106089372, 'samples': 3658944, 'steps': 19056, 'loss/train': 1.5194077491760254} -08/30/2021 16:39:09 - INFO - __main__ - Step 19058: {'lr': 0.0004837915309627146, 'samples': 3659136, 'steps': 19057, 'loss/train': 1.365946650505066} -08/30/2021 16:39:10 - INFO - __main__ - Step 19059: {'lr': 0.00048378965121114917, 'samples': 3659328, 'steps': 19058, 'loss/train': 1.3631266355514526} -08/30/2021 16:39:10 - INFO - __main__ - Step 19060: {'lr': 0.00048378777135424166, 'samples': 3659520, 'steps': 19059, 'loss/train': 1.2037910223007202} -08/30/2021 16:39:12 - INFO - __main__ - Step 19061: {'lr': 0.0004837858913919931, 'samples': 3659712, 'steps': 19060, 'loss/train': 1.6297072172164917} -08/30/2021 16:39:12 - INFO - __main__ - Step 19062: {'lr': 0.0004837840113244042, 'samples': 3659904, 'steps': 19061, 'loss/train': 1.5092374086380005} -08/30/2021 16:39:12 - INFO - __main__ - Step 19063: {'lr': 0.00048378213115147573, 'samples': 3660096, 'steps': 19062, 'loss/train': 1.9230157136917114} -08/30/2021 16:39:13 - INFO - __main__ - Step 19064: {'lr': 0.00048378025087320877, 'samples': 3660288, 'steps': 19063, 'loss/train': 1.9381505250930786} -08/30/2021 16:39:13 - INFO - __main__ - Step 19065: {'lr': 0.0004837783704896039, 'samples': 3660480, 'steps': 19064, 'loss/train': 0.7553221583366394} -08/30/2021 16:39:15 - INFO - __main__ - Step 19066: {'lr': 0.0004837764900006623, 'samples': 3660672, 'steps': 19065, 'loss/train': 1.3389997482299805} -08/30/2021 16:39:15 - INFO - __main__ - Step 19067: {'lr': 0.0004837746094063844, 'samples': 3660864, 'steps': 19066, 'loss/train': 1.5995224714279175} -08/30/2021 16:39:16 - INFO - __main__ - Step 19068: {'lr': 0.00048377272870677135, 'samples': 3661056, 'steps': 19067, 'loss/train': 1.7355479001998901} -08/30/2021 16:39:16 - INFO - __main__ - Step 19069: {'lr': 0.000483770847901824, 'samples': 3661248, 'steps': 19068, 'loss/train': 2.67655611038208} -08/30/2021 16:39:16 - INFO - __main__ - Step 19070: {'lr': 0.000483768966991543, 'samples': 3661440, 'steps': 19069, 'loss/train': 1.287881851196289} -08/30/2021 16:39:18 - INFO - __main__ - Step 19071: {'lr': 0.0004837670859759294, 'samples': 3661632, 'steps': 19070, 'loss/train': 1.5589580535888672} -08/30/2021 16:39:18 - INFO - __main__ - Step 19072: {'lr': 0.0004837652048549839, 'samples': 3661824, 'steps': 19071, 'loss/train': 1.855506181716919} -08/30/2021 16:39:19 - INFO - __main__ - Step 19073: {'lr': 0.00048376332362870745, 'samples': 3662016, 'steps': 19072, 'loss/train': 1.6589117050170898} -08/30/2021 16:39:19 - INFO - __main__ - Step 19074: {'lr': 0.00048376144229710083, 'samples': 3662208, 'steps': 19073, 'loss/train': 1.7377173900604248} -08/30/2021 16:39:19 - INFO - __main__ - Step 19075: {'lr': 0.00048375956086016495, 'samples': 3662400, 'steps': 19074, 'loss/train': 0.11043886095285416} -08/30/2021 16:39:21 - INFO - __main__ - Step 19076: {'lr': 0.0004837576793179005, 'samples': 3662592, 'steps': 19075, 'loss/train': 2.205615997314453} -08/30/2021 16:39:22 - INFO - __main__ - Step 19077: {'lr': 0.00048375579767030854, 'samples': 3662784, 'steps': 19076, 'loss/train': 1.613686203956604} -08/30/2021 16:39:22 - INFO - __main__ - Step 19078: {'lr': 0.0004837539159173898, 'samples': 3662976, 'steps': 19077, 'loss/train': 1.8518331050872803} -08/30/2021 16:39:22 - INFO - __main__ - Step 19079: {'lr': 0.00048375203405914515, 'samples': 3663168, 'steps': 19078, 'loss/train': 0.1458100527524948} -08/30/2021 16:39:23 - INFO - __main__ - Step 19080: {'lr': 0.00048375015209557547, 'samples': 3663360, 'steps': 19079, 'loss/train': 1.805875301361084} -08/30/2021 16:39:24 - INFO - __main__ - Step 19081: {'lr': 0.00048374827002668156, 'samples': 3663552, 'steps': 19080, 'loss/train': 1.8509334325790405} -08/30/2021 16:39:25 - INFO - __main__ - Step 19082: {'lr': 0.0004837463878524643, 'samples': 3663744, 'steps': 19081, 'loss/train': 1.6861164569854736} -08/30/2021 16:39:25 - INFO - __main__ - Step 19083: {'lr': 0.0004837445055729245, 'samples': 3663936, 'steps': 19082, 'loss/train': 1.4038214683532715} -08/30/2021 16:39:25 - INFO - __main__ - Step 19084: {'lr': 0.00048374262318806306, 'samples': 3664128, 'steps': 19083, 'loss/train': 1.2989164590835571} -08/30/2021 16:39:26 - INFO - __main__ - Step 19085: {'lr': 0.00048374074069788077, 'samples': 3664320, 'steps': 19084, 'loss/train': 0.9655818939208984} -08/30/2021 16:39:27 - INFO - __main__ - Step 19086: {'lr': 0.0004837388581023785, 'samples': 3664512, 'steps': 19085, 'loss/train': 1.4404168128967285} -08/30/2021 16:39:28 - INFO - __main__ - Step 19087: {'lr': 0.0004837369754015571, 'samples': 3664704, 'steps': 19086, 'loss/train': 1.8048416376113892} -08/30/2021 16:39:28 - INFO - __main__ - Step 19088: {'lr': 0.0004837350925954175, 'samples': 3664896, 'steps': 19087, 'loss/train': 2.047614336013794} -08/30/2021 16:39:28 - INFO - __main__ - Step 19089: {'lr': 0.00048373320968396043, 'samples': 3665088, 'steps': 19088, 'loss/train': 0.8277368545532227} -08/30/2021 16:39:29 - INFO - __main__ - Step 19090: {'lr': 0.0004837313266671868, 'samples': 3665280, 'steps': 19089, 'loss/train': 1.7643955945968628} -08/30/2021 16:39:29 - INFO - __main__ - Step 19091: {'lr': 0.0004837294435450974, 'samples': 3665472, 'steps': 19090, 'loss/train': 1.066404104232788} -08/30/2021 16:39:31 - INFO - __main__ - Step 19092: {'lr': 0.00048372756031769316, 'samples': 3665664, 'steps': 19091, 'loss/train': 0.10456026345491409} -08/30/2021 16:39:31 - INFO - __main__ - Step 19093: {'lr': 0.00048372567698497487, 'samples': 3665856, 'steps': 19092, 'loss/train': 1.5527896881103516} -08/30/2021 16:39:32 - INFO - __main__ - Step 19094: {'lr': 0.0004837237935469434, 'samples': 3666048, 'steps': 19093, 'loss/train': 1.5800169706344604} -08/30/2021 16:39:32 - INFO - __main__ - Step 19095: {'lr': 0.00048372191000359955, 'samples': 3666240, 'steps': 19094, 'loss/train': 1.4646916389465332} -08/30/2021 16:39:32 - INFO - __main__ - Step 19096: {'lr': 0.00048372002635494425, 'samples': 3666432, 'steps': 19095, 'loss/train': 1.577537178993225} -08/30/2021 16:39:34 - INFO - __main__ - Step 19097: {'lr': 0.00048371814260097834, 'samples': 3666624, 'steps': 19096, 'loss/train': 1.6097098588943481} -08/30/2021 16:39:34 - INFO - __main__ - Step 19098: {'lr': 0.0004837162587417027, 'samples': 3666816, 'steps': 19097, 'loss/train': 1.6733466386795044} -08/30/2021 16:39:35 - INFO - __main__ - Step 19099: {'lr': 0.000483714374777118, 'samples': 3667008, 'steps': 19098, 'loss/train': 1.3653650283813477} -08/30/2021 16:39:35 - INFO - __main__ - Step 19100: {'lr': 0.00048371249070722525, 'samples': 3667200, 'steps': 19099, 'loss/train': 1.6094400882720947} -08/30/2021 16:39:35 - INFO - __main__ - Step 19101: {'lr': 0.0004837106065320253, 'samples': 3667392, 'steps': 19100, 'loss/train': 1.5213968753814697} -08/30/2021 16:39:37 - INFO - __main__ - Step 19102: {'lr': 0.00048370872225151886, 'samples': 3667584, 'steps': 19101, 'loss/train': 1.5737665891647339} -08/30/2021 16:39:37 - INFO - __main__ - Step 19103: {'lr': 0.0004837068378657069, 'samples': 3667776, 'steps': 19102, 'loss/train': 0.6638611555099487} -08/30/2021 16:39:38 - INFO - __main__ - Step 19104: {'lr': 0.0004837049533745903, 'samples': 3667968, 'steps': 19103, 'loss/train': 1.7117505073547363} -08/30/2021 16:39:38 - INFO - __main__ - Step 19105: {'lr': 0.00048370306877816983, 'samples': 3668160, 'steps': 19104, 'loss/train': 2.4603612422943115} -08/30/2021 16:39:38 - INFO - __main__ - Step 19106: {'lr': 0.00048370118407644637, 'samples': 3668352, 'steps': 19105, 'loss/train': 1.5029852390289307} -08/30/2021 16:39:40 - INFO - __main__ - Step 19107: {'lr': 0.0004836992992694208, 'samples': 3668544, 'steps': 19106, 'loss/train': 1.1753807067871094} -08/30/2021 16:39:40 - INFO - __main__ - Step 19108: {'lr': 0.00048369741435709383, 'samples': 3668736, 'steps': 19107, 'loss/train': 1.6933237314224243} -08/30/2021 16:39:41 - INFO - __main__ - Step 19109: {'lr': 0.0004836955293394665, 'samples': 3668928, 'steps': 19108, 'loss/train': 1.3555686473846436} -08/30/2021 16:39:41 - INFO - __main__ - Step 19110: {'lr': 0.00048369364421653953, 'samples': 3669120, 'steps': 19109, 'loss/train': 1.6328330039978027} -08/30/2021 16:39:41 - INFO - __main__ - Step 19111: {'lr': 0.00048369175898831384, 'samples': 3669312, 'steps': 19110, 'loss/train': 1.8126920461654663} -08/30/2021 16:39:43 - INFO - __main__ - Step 19112: {'lr': 0.0004836898736547902, 'samples': 3669504, 'steps': 19111, 'loss/train': 1.669182538986206} -08/30/2021 16:39:44 - INFO - __main__ - Step 19113: {'lr': 0.0004836879882159696, 'samples': 3669696, 'steps': 19112, 'loss/train': 1.6478606462478638} -08/30/2021 16:39:44 - INFO - __main__ - Step 19114: {'lr': 0.0004836861026718527, 'samples': 3669888, 'steps': 19113, 'loss/train': 2.1226742267608643} -08/30/2021 16:39:44 - INFO - __main__ - Step 19115: {'lr': 0.00048368421702244045, 'samples': 3670080, 'steps': 19114, 'loss/train': 1.5584373474121094} -08/30/2021 16:39:45 - INFO - __main__ - Step 19116: {'lr': 0.00048368233126773377, 'samples': 3670272, 'steps': 19115, 'loss/train': 1.6307731866836548} -08/30/2021 16:39:45 - INFO - __main__ - Step 19117: {'lr': 0.0004836804454077334, 'samples': 3670464, 'steps': 19116, 'loss/train': 1.074960470199585} -08/30/2021 16:39:47 - INFO - __main__ - Step 19118: {'lr': 0.0004836785594424402, 'samples': 3670656, 'steps': 19117, 'loss/train': 1.7020268440246582} -08/30/2021 16:39:47 - INFO - __main__ - Step 19119: {'lr': 0.0004836766733718551, 'samples': 3670848, 'steps': 19118, 'loss/train': 1.8478784561157227} -08/30/2021 16:39:48 - INFO - __main__ - Step 19120: {'lr': 0.0004836747871959789, 'samples': 3671040, 'steps': 19119, 'loss/train': 1.623666763305664} -08/30/2021 16:39:48 - INFO - __main__ - Step 19121: {'lr': 0.0004836729009148124, 'samples': 3671232, 'steps': 19120, 'loss/train': 1.8176316022872925} -08/30/2021 16:39:48 - INFO - __main__ - Step 19122: {'lr': 0.0004836710145283565, 'samples': 3671424, 'steps': 19121, 'loss/train': 4.032705783843994} -08/30/2021 16:39:50 - INFO - __main__ - Step 19123: {'lr': 0.0004836691280366121, 'samples': 3671616, 'steps': 19122, 'loss/train': 1.6686691045761108} -08/30/2021 16:39:51 - INFO - __main__ - Step 19124: {'lr': 0.00048366724143958, 'samples': 3671808, 'steps': 19123, 'loss/train': 1.7045818567276} -08/30/2021 16:39:51 - INFO - __main__ - Step 19125: {'lr': 0.0004836653547372609, 'samples': 3672000, 'steps': 19124, 'loss/train': 1.033792495727539} -08/30/2021 16:39:52 - INFO - __main__ - Step 19126: {'lr': 0.00048366346792965597, 'samples': 3672192, 'steps': 19125, 'loss/train': 1.7519725561141968} -08/30/2021 16:39:52 - INFO - __main__ - Step 19127: {'lr': 0.0004836615810167658, 'samples': 3672384, 'steps': 19126, 'loss/train': 1.4983408451080322} -08/30/2021 16:39:52 - INFO - __main__ - Step 19128: {'lr': 0.00048365969399859134, 'samples': 3672576, 'steps': 19127, 'loss/train': 1.1733825206756592} -08/30/2021 16:39:54 - INFO - __main__ - Step 19129: {'lr': 0.00048365780687513346, 'samples': 3672768, 'steps': 19128, 'loss/train': 0.09725673496723175} -08/30/2021 16:39:54 - INFO - __main__ - Step 19130: {'lr': 0.00048365591964639294, 'samples': 3672960, 'steps': 19129, 'loss/train': 1.7708055973052979} -08/30/2021 16:39:54 - INFO - __main__ - Step 19131: {'lr': 0.0004836540323123707, 'samples': 3673152, 'steps': 19130, 'loss/train': 1.1902272701263428} -08/30/2021 16:39:55 - INFO - __main__ - Step 19132: {'lr': 0.00048365214487306753, 'samples': 3673344, 'steps': 19131, 'loss/train': 1.6898306608200073} -08/30/2021 16:39:55 - INFO - __main__ - Step 19133: {'lr': 0.00048365025732848433, 'samples': 3673536, 'steps': 19132, 'loss/train': 1.5089027881622314} -08/30/2021 16:39:57 - INFO - __main__ - Step 19134: {'lr': 0.0004836483696786219, 'samples': 3673728, 'steps': 19133, 'loss/train': 1.7575311660766602} -08/30/2021 16:39:57 - INFO - __main__ - Step 19135: {'lr': 0.00048364648192348117, 'samples': 3673920, 'steps': 19134, 'loss/train': 2.394428253173828} -08/30/2021 16:39:58 - INFO - __main__ - Step 19136: {'lr': 0.0004836445940630629, 'samples': 3674112, 'steps': 19135, 'loss/train': 1.6285349130630493} -08/30/2021 16:39:58 - INFO - __main__ - Step 19137: {'lr': 0.0004836427060973679, 'samples': 3674304, 'steps': 19136, 'loss/train': 1.4491521120071411} -08/30/2021 16:39:58 - INFO - __main__ - Step 19138: {'lr': 0.00048364081802639724, 'samples': 3674496, 'steps': 19137, 'loss/train': 1.5877060890197754} -08/30/2021 16:40:00 - INFO - __main__ - Step 19139: {'lr': 0.00048363892985015157, 'samples': 3674688, 'steps': 19138, 'loss/train': 1.4455280303955078} -08/30/2021 16:40:00 - INFO - __main__ - Step 19140: {'lr': 0.00048363704156863187, 'samples': 3674880, 'steps': 19139, 'loss/train': 1.3501614332199097} -08/30/2021 16:40:01 - INFO - __main__ - Step 19141: {'lr': 0.0004836351531818388, 'samples': 3675072, 'steps': 19140, 'loss/train': 1.4317426681518555} -08/30/2021 16:40:01 - INFO - __main__ - Step 19142: {'lr': 0.00048363326468977343, 'samples': 3675264, 'steps': 19141, 'loss/train': 1.8610998392105103} -08/30/2021 16:40:01 - INFO - __main__ - Step 19143: {'lr': 0.00048363137609243654, 'samples': 3675456, 'steps': 19142, 'loss/train': 1.4787158966064453} -08/30/2021 16:40:03 - INFO - __main__ - Step 19144: {'lr': 0.0004836294873898289, 'samples': 3675648, 'steps': 19143, 'loss/train': 1.950890064239502} -08/30/2021 16:40:03 - INFO - __main__ - Step 19145: {'lr': 0.00048362759858195146, 'samples': 3675840, 'steps': 19144, 'loss/train': 1.7649948596954346} -08/30/2021 16:40:04 - INFO - __main__ - Step 19146: {'lr': 0.0004836257096688049, 'samples': 3676032, 'steps': 19145, 'loss/train': 1.7138363122940063} -08/30/2021 16:40:04 - INFO - __main__ - Step 19147: {'lr': 0.00048362382065039034, 'samples': 3676224, 'steps': 19146, 'loss/train': 1.4875048398971558} -08/30/2021 16:40:04 - INFO - __main__ - Step 19148: {'lr': 0.00048362193152670847, 'samples': 3676416, 'steps': 19147, 'loss/train': 1.2919530868530273} -08/30/2021 16:40:06 - INFO - __main__ - Step 19149: {'lr': 0.0004836200422977601, 'samples': 3676608, 'steps': 19148, 'loss/train': 1.6786713600158691} -08/30/2021 16:40:06 - INFO - __main__ - Step 19150: {'lr': 0.00048361815296354624, 'samples': 3676800, 'steps': 19149, 'loss/train': 1.4627530574798584} -08/30/2021 16:40:07 - INFO - __main__ - Step 19151: {'lr': 0.00048361626352406756, 'samples': 3676992, 'steps': 19150, 'loss/train': 1.4496657848358154} -08/30/2021 16:40:07 - INFO - __main__ - Step 19152: {'lr': 0.00048361437397932504, 'samples': 3677184, 'steps': 19151, 'loss/train': 1.9575152397155762} -08/30/2021 16:40:07 - INFO - __main__ - Step 19153: {'lr': 0.0004836124843293195, 'samples': 3677376, 'steps': 19152, 'loss/train': 1.3367133140563965} -08/30/2021 16:40:08 - INFO - __main__ - Step 19154: {'lr': 0.00048361059457405176, 'samples': 3677568, 'steps': 19153, 'loss/train': 1.7624095678329468} -08/30/2021 16:40:09 - INFO - __main__ - Step 19155: {'lr': 0.0004836087047135227, 'samples': 3677760, 'steps': 19154, 'loss/train': 1.8370709419250488} -08/30/2021 16:40:10 - INFO - __main__ - Step 19156: {'lr': 0.0004836068147477331, 'samples': 3677952, 'steps': 19155, 'loss/train': 1.474143385887146} -08/30/2021 16:40:10 - INFO - __main__ - Step 19157: {'lr': 0.0004836049246766839, 'samples': 3678144, 'steps': 19156, 'loss/train': 0.8988378643989563} -08/30/2021 16:40:10 - INFO - __main__ - Step 19158: {'lr': 0.000483603034500376, 'samples': 3678336, 'steps': 19157, 'loss/train': 1.754389762878418} -08/30/2021 16:40:11 - INFO - __main__ - Step 19159: {'lr': 0.0004836011442188101, 'samples': 3678528, 'steps': 19158, 'loss/train': 0.9265342950820923} -08/30/2021 16:40:12 - INFO - __main__ - Step 19160: {'lr': 0.00048359925383198714, 'samples': 3678720, 'steps': 19159, 'loss/train': 1.2509101629257202} -08/30/2021 16:40:13 - INFO - __main__ - Step 19161: {'lr': 0.000483597363339908, 'samples': 3678912, 'steps': 19160, 'loss/train': 1.1521157026290894} -08/30/2021 16:40:13 - INFO - __main__ - Step 19162: {'lr': 0.0004835954727425734, 'samples': 3679104, 'steps': 19161, 'loss/train': 2.0359926223754883} -08/30/2021 16:40:13 - INFO - __main__ - Step 19163: {'lr': 0.0004835935820399844, 'samples': 3679296, 'steps': 19162, 'loss/train': 1.5492124557495117} -08/30/2021 16:40:14 - INFO - __main__ - Step 19164: {'lr': 0.0004835916912321417, 'samples': 3679488, 'steps': 19163, 'loss/train': 1.642147421836853} -08/30/2021 16:40:15 - INFO - __main__ - Step 19165: {'lr': 0.0004835898003190462, 'samples': 3679680, 'steps': 19164, 'loss/train': 1.559041142463684} -08/30/2021 16:40:16 - INFO - __main__ - Step 19166: {'lr': 0.00048358790930069876, 'samples': 3679872, 'steps': 19165, 'loss/train': 1.1350476741790771} -08/30/2021 16:40:16 - INFO - __main__ - Step 19167: {'lr': 0.0004835860181771001, 'samples': 3680064, 'steps': 19166, 'loss/train': 1.5662000179290771} -08/30/2021 16:40:17 - INFO - __main__ - Step 19168: {'lr': 0.0004835841269482513, 'samples': 3680256, 'steps': 19167, 'loss/train': 0.23353731632232666} -08/30/2021 16:40:17 - INFO - __main__ - Step 19169: {'lr': 0.00048358223561415306, 'samples': 3680448, 'steps': 19168, 'loss/train': 2.1290228366851807} -08/30/2021 16:40:18 - INFO - __main__ - Step 19170: {'lr': 0.0004835803441748062, 'samples': 3680640, 'steps': 19169, 'loss/train': 2.134377956390381} -08/30/2021 16:40:19 - INFO - __main__ - Step 19171: {'lr': 0.0004835784526302117, 'samples': 3680832, 'steps': 19170, 'loss/train': 1.7741402387619019} -08/30/2021 16:40:19 - INFO - __main__ - Step 19172: {'lr': 0.0004835765609803704, 'samples': 3681024, 'steps': 19171, 'loss/train': 1.4562523365020752} -08/30/2021 16:40:20 - INFO - __main__ - Step 19173: {'lr': 0.00048357466922528306, 'samples': 3681216, 'steps': 19172, 'loss/train': 1.050406813621521} -08/30/2021 16:40:20 - INFO - __main__ - Step 19174: {'lr': 0.00048357277736495055, 'samples': 3681408, 'steps': 19173, 'loss/train': 1.797304391860962} -08/30/2021 16:40:22 - INFO - __main__ - Step 19175: {'lr': 0.0004835708853993738, 'samples': 3681600, 'steps': 19174, 'loss/train': 1.1651562452316284} -08/30/2021 16:40:22 - INFO - __main__ - Step 19176: {'lr': 0.0004835689933285536, 'samples': 3681792, 'steps': 19175, 'loss/train': 1.6475266218185425} -08/30/2021 16:40:22 - INFO - __main__ - Step 19177: {'lr': 0.0004835671011524908, 'samples': 3681984, 'steps': 19176, 'loss/train': 1.2482472658157349} -08/30/2021 16:40:23 - INFO - __main__ - Step 19178: {'lr': 0.0004835652088711863, 'samples': 3682176, 'steps': 19177, 'loss/train': 1.5967295169830322} -08/30/2021 16:40:23 - INFO - __main__ - Step 19179: {'lr': 0.0004835633164846409, 'samples': 3682368, 'steps': 19178, 'loss/train': 1.1644779443740845} -08/30/2021 16:40:23 - INFO - __main__ - Step 19180: {'lr': 0.00048356142399285545, 'samples': 3682560, 'steps': 19179, 'loss/train': 0.6553381085395813} -08/30/2021 16:40:25 - INFO - __main__ - Step 19181: {'lr': 0.00048355953139583087, 'samples': 3682752, 'steps': 19180, 'loss/train': 2.0194222927093506} -08/30/2021 16:40:26 - INFO - __main__ - Step 19182: {'lr': 0.00048355763869356794, 'samples': 3682944, 'steps': 19181, 'loss/train': 1.7708877325057983} -08/30/2021 16:40:26 - INFO - __main__ - Step 19183: {'lr': 0.0004835557458860675, 'samples': 3683136, 'steps': 19182, 'loss/train': 2.164074659347534} -08/30/2021 16:40:27 - INFO - __main__ - Step 19184: {'lr': 0.00048355385297333054, 'samples': 3683328, 'steps': 19183, 'loss/train': 2.01297926902771} -08/30/2021 16:40:27 - INFO - __main__ - Step 19185: {'lr': 0.0004835519599553578, 'samples': 3683520, 'steps': 19184, 'loss/train': 0.9082038402557373} -08/30/2021 16:40:28 - INFO - __main__ - Step 19186: {'lr': 0.0004835500668321501, 'samples': 3683712, 'steps': 19185, 'loss/train': 1.8561290502548218} -08/30/2021 16:40:29 - INFO - __main__ - Step 19187: {'lr': 0.0004835481736037084, 'samples': 3683904, 'steps': 19186, 'loss/train': 1.6833256483078003} -08/30/2021 16:40:29 - INFO - __main__ - Step 19188: {'lr': 0.0004835462802700334, 'samples': 3684096, 'steps': 19187, 'loss/train': 0.865152895450592} -08/30/2021 16:40:30 - INFO - __main__ - Step 19189: {'lr': 0.00048354438683112614, 'samples': 3684288, 'steps': 19188, 'loss/train': 1.5439050197601318} -08/30/2021 16:40:30 - INFO - __main__ - Step 19190: {'lr': 0.00048354249328698743, 'samples': 3684480, 'steps': 19189, 'loss/train': 1.1552523374557495} -08/30/2021 16:40:32 - INFO - __main__ - Step 19191: {'lr': 0.000483540599637618, 'samples': 3684672, 'steps': 19190, 'loss/train': 1.3549734354019165} -08/30/2021 16:40:32 - INFO - __main__ - Step 19192: {'lr': 0.00048353870588301875, 'samples': 3684864, 'steps': 19191, 'loss/train': 1.8058332204818726} -08/30/2021 16:40:32 - INFO - __main__ - Step 19193: {'lr': 0.00048353681202319056, 'samples': 3685056, 'steps': 19192, 'loss/train': 1.5506209135055542} -08/30/2021 16:40:33 - INFO - __main__ - Step 19194: {'lr': 0.0004835349180581343, 'samples': 3685248, 'steps': 19193, 'loss/train': 1.9190616607666016} -08/30/2021 16:40:33 - INFO - __main__ - Step 19195: {'lr': 0.0004835330239878509, 'samples': 3685440, 'steps': 19194, 'loss/train': 1.884497880935669} -08/30/2021 16:40:34 - INFO - __main__ - Step 19196: {'lr': 0.00048353112981234104, 'samples': 3685632, 'steps': 19195, 'loss/train': 2.119391441345215} -08/30/2021 16:40:35 - INFO - __main__ - Step 19197: {'lr': 0.0004835292355316057, 'samples': 3685824, 'steps': 19196, 'loss/train': 1.1468201875686646} -08/30/2021 16:40:35 - INFO - __main__ - Step 19198: {'lr': 0.0004835273411456456, 'samples': 3686016, 'steps': 19197, 'loss/train': 1.3540319204330444} -08/30/2021 16:40:36 - INFO - __main__ - Step 19199: {'lr': 0.00048352544665446174, 'samples': 3686208, 'steps': 19198, 'loss/train': 1.6521283388137817} -08/30/2021 16:40:36 - INFO - __main__ - Step 19200: {'lr': 0.000483523552058055, 'samples': 3686400, 'steps': 19199, 'loss/train': 1.589746117591858} -08/30/2021 16:40:37 - INFO - __main__ - Step 19201: {'lr': 0.00048352165735642607, 'samples': 3686592, 'steps': 19200, 'loss/train': 1.7299714088439941} -08/30/2021 16:40:38 - INFO - __main__ - Step 19202: {'lr': 0.00048351976254957585, 'samples': 3686784, 'steps': 19201, 'loss/train': 1.8458266258239746} -08/30/2021 16:40:38 - INFO - __main__ - Step 19203: {'lr': 0.0004835178676375053, 'samples': 3686976, 'steps': 19202, 'loss/train': 1.3130806684494019} -08/30/2021 16:40:39 - INFO - __main__ - Step 19204: {'lr': 0.0004835159726202151, 'samples': 3687168, 'steps': 19203, 'loss/train': 0.9123445153236389} -08/30/2021 16:40:39 - INFO - __main__ - Step 19205: {'lr': 0.0004835140774977063, 'samples': 3687360, 'steps': 19204, 'loss/train': 2.004091739654541} -08/30/2021 16:40:41 - INFO - __main__ - Step 19206: {'lr': 0.0004835121822699796, 'samples': 3687552, 'steps': 19205, 'loss/train': 1.6181484460830688} -08/30/2021 16:40:41 - INFO - __main__ - Step 19207: {'lr': 0.000483510286937036, 'samples': 3687744, 'steps': 19206, 'loss/train': 1.237630844116211} -08/30/2021 16:40:42 - INFO - __main__ - Step 19208: {'lr': 0.0004835083914988762, 'samples': 3687936, 'steps': 19207, 'loss/train': 1.074430227279663} -08/30/2021 16:40:42 - INFO - __main__ - Step 19209: {'lr': 0.0004835064959555011, 'samples': 3688128, 'steps': 19208, 'loss/train': 1.427473783493042} -08/30/2021 16:40:42 - INFO - __main__ - Step 19210: {'lr': 0.00048350460030691165, 'samples': 3688320, 'steps': 19209, 'loss/train': 1.7300118207931519} -08/30/2021 16:40:43 - INFO - __main__ - Step 19211: {'lr': 0.00048350270455310864, 'samples': 3688512, 'steps': 19210, 'loss/train': 1.803452730178833} -08/30/2021 16:40:44 - INFO - __main__ - Step 19212: {'lr': 0.00048350080869409285, 'samples': 3688704, 'steps': 19211, 'loss/train': 1.4562078714370728} -08/30/2021 16:40:45 - INFO - __main__ - Step 19213: {'lr': 0.0004834989127298652, 'samples': 3688896, 'steps': 19212, 'loss/train': 1.6275389194488525} -08/30/2021 16:40:45 - INFO - __main__ - Step 19214: {'lr': 0.00048349701666042656, 'samples': 3689088, 'steps': 19213, 'loss/train': 2.423234462738037} -08/30/2021 16:40:45 - INFO - __main__ - Step 19215: {'lr': 0.00048349512048577784, 'samples': 3689280, 'steps': 19214, 'loss/train': 0.1250191479921341} -08/30/2021 16:40:46 - INFO - __main__ - Step 19216: {'lr': 0.00048349322420591966, 'samples': 3689472, 'steps': 19215, 'loss/train': 1.613912582397461} -08/30/2021 16:40:47 - INFO - __main__ - Step 19217: {'lr': 0.00048349132782085316, 'samples': 3689664, 'steps': 19216, 'loss/train': 1.6297813653945923} -08/30/2021 16:40:48 - INFO - __main__ - Step 19218: {'lr': 0.00048348943133057903, 'samples': 3689856, 'steps': 19217, 'loss/train': 1.4121403694152832} -08/30/2021 16:40:48 - INFO - __main__ - Step 19219: {'lr': 0.0004834875347350982, 'samples': 3690048, 'steps': 19218, 'loss/train': 1.678435206413269} -08/30/2021 16:40:48 - INFO - __main__ - Step 19220: {'lr': 0.00048348563803441146, 'samples': 3690240, 'steps': 19219, 'loss/train': 1.1719179153442383} -08/30/2021 16:40:49 - INFO - __main__ - Step 19221: {'lr': 0.0004834837412285197, 'samples': 3690432, 'steps': 19220, 'loss/train': 1.373894453048706} -08/30/2021 16:40:50 - INFO - __main__ - Step 19222: {'lr': 0.00048348184431742377, 'samples': 3690624, 'steps': 19221, 'loss/train': 1.4711549282073975} -08/30/2021 16:40:51 - INFO - __main__ - Step 19223: {'lr': 0.00048347994730112457, 'samples': 3690816, 'steps': 19222, 'loss/train': 1.4518851041793823} -08/30/2021 16:40:51 - INFO - __main__ - Step 19224: {'lr': 0.00048347805017962274, 'samples': 3691008, 'steps': 19223, 'loss/train': 1.7468440532684326} -08/30/2021 16:40:51 - INFO - __main__ - Step 19225: {'lr': 0.00048347615295291947, 'samples': 3691200, 'steps': 19224, 'loss/train': 1.2006101608276367} -08/30/2021 16:40:52 - INFO - __main__ - Step 19226: {'lr': 0.0004834742556210154, 'samples': 3691392, 'steps': 19225, 'loss/train': 1.5260684490203857} -08/30/2021 16:40:53 - INFO - __main__ - Step 19227: {'lr': 0.00048347235818391144, 'samples': 3691584, 'steps': 19226, 'loss/train': 1.6461853981018066} -08/30/2021 16:40:54 - INFO - __main__ - Step 19228: {'lr': 0.0004834704606416084, 'samples': 3691776, 'steps': 19227, 'loss/train': 1.7791305780410767} -08/30/2021 16:40:54 - INFO - __main__ - Step 19229: {'lr': 0.00048346856299410725, 'samples': 3691968, 'steps': 19228, 'loss/train': 1.5573664903640747} -08/30/2021 16:40:54 - INFO - __main__ - Step 19230: {'lr': 0.0004834666652414087, 'samples': 3692160, 'steps': 19229, 'loss/train': 1.4086616039276123} -08/30/2021 16:40:55 - INFO - __main__ - Step 19231: {'lr': 0.0004834647673835137, 'samples': 3692352, 'steps': 19230, 'loss/train': 1.5888431072235107} -08/30/2021 16:40:57 - INFO - __main__ - Step 19232: {'lr': 0.00048346286942042307, 'samples': 3692544, 'steps': 19231, 'loss/train': 1.8565961122512817} -08/30/2021 16:40:57 - INFO - __main__ - Step 19233: {'lr': 0.0004834609713521377, 'samples': 3692736, 'steps': 19232, 'loss/train': 1.3755172491073608} -08/30/2021 16:40:58 - INFO - __main__ - Step 19234: {'lr': 0.0004834590731786584, 'samples': 3692928, 'steps': 19233, 'loss/train': 2.0674779415130615} -08/30/2021 16:40:58 - INFO - __main__ - Step 19235: {'lr': 0.000483457174899986, 'samples': 3693120, 'steps': 19234, 'loss/train': 1.592346429824829} -08/30/2021 16:40:58 - INFO - __main__ - Step 19236: {'lr': 0.00048345527651612145, 'samples': 3693312, 'steps': 19235, 'loss/train': 1.53139066696167} -08/30/2021 16:41:00 - INFO - __main__ - Step 19237: {'lr': 0.00048345337802706555, 'samples': 3693504, 'steps': 19236, 'loss/train': 1.984649419784546} -08/30/2021 16:41:00 - INFO - __main__ - Step 19238: {'lr': 0.0004834514794328192, 'samples': 3693696, 'steps': 19237, 'loss/train': 1.4567769765853882} -08/30/2021 16:41:01 - INFO - __main__ - Step 19239: {'lr': 0.00048344958073338315, 'samples': 3693888, 'steps': 19238, 'loss/train': 1.2409563064575195} -08/30/2021 16:41:01 - INFO - __main__ - Step 19240: {'lr': 0.00048344768192875833, 'samples': 3694080, 'steps': 19239, 'loss/train': 1.451059341430664} -08/30/2021 16:41:01 - INFO - __main__ - Step 19241: {'lr': 0.00048344578301894557, 'samples': 3694272, 'steps': 19240, 'loss/train': 1.528473973274231} -08/30/2021 16:41:03 - INFO - __main__ - Step 19242: {'lr': 0.0004834438840039458, 'samples': 3694464, 'steps': 19241, 'loss/train': 1.8752729892730713} -08/30/2021 16:41:03 - INFO - __main__ - Step 19243: {'lr': 0.0004834419848837598, 'samples': 3694656, 'steps': 19242, 'loss/train': 1.4833667278289795} -08/30/2021 16:41:03 - INFO - __main__ - Step 19244: {'lr': 0.00048344008565838844, 'samples': 3694848, 'steps': 19243, 'loss/train': 1.3282593488693237} -08/30/2021 16:41:04 - INFO - __main__ - Step 19245: {'lr': 0.00048343818632783255, 'samples': 3695040, 'steps': 19244, 'loss/train': 1.71040678024292} -08/30/2021 16:41:04 - INFO - __main__ - Step 19246: {'lr': 0.00048343628689209305, 'samples': 3695232, 'steps': 19245, 'loss/train': 1.2799099683761597} -08/30/2021 16:41:06 - INFO - __main__ - Step 19247: {'lr': 0.00048343438735117076, 'samples': 3695424, 'steps': 19246, 'loss/train': 1.4637094736099243} -08/30/2021 16:41:06 - INFO - __main__ - Step 19248: {'lr': 0.00048343248770506655, 'samples': 3695616, 'steps': 19247, 'loss/train': 1.267026424407959} -08/30/2021 16:41:06 - INFO - __main__ - Step 19249: {'lr': 0.0004834305879537812, 'samples': 3695808, 'steps': 19248, 'loss/train': 1.6086654663085938} -08/30/2021 16:41:07 - INFO - __main__ - Step 19250: {'lr': 0.00048342868809731567, 'samples': 3696000, 'steps': 19249, 'loss/train': 1.593589425086975} -08/30/2021 16:41:07 - INFO - __main__ - Step 19251: {'lr': 0.0004834267881356708, 'samples': 3696192, 'steps': 19250, 'loss/train': 2.4772422313690186} -08/30/2021 16:41:09 - INFO - __main__ - Step 19252: {'lr': 0.0004834248880688474, 'samples': 3696384, 'steps': 19251, 'loss/train': 1.9250917434692383} -08/30/2021 16:41:09 - INFO - __main__ - Step 19253: {'lr': 0.00048342298789684637, 'samples': 3696576, 'steps': 19252, 'loss/train': 0.587297797203064} -08/30/2021 16:41:10 - INFO - __main__ - Step 19254: {'lr': 0.0004834210876196685, 'samples': 3696768, 'steps': 19253, 'loss/train': 0.7421675324440002} -08/30/2021 16:41:10 - INFO - __main__ - Step 19255: {'lr': 0.0004834191872373147, 'samples': 3696960, 'steps': 19254, 'loss/train': 1.430770993232727} -08/30/2021 16:41:10 - INFO - __main__ - Step 19256: {'lr': 0.0004834172867497858, 'samples': 3697152, 'steps': 19255, 'loss/train': 1.7474435567855835} -08/30/2021 16:41:11 - INFO - __main__ - Step 19257: {'lr': 0.0004834153861570827, 'samples': 3697344, 'steps': 19256, 'loss/train': 1.3884469270706177} -08/30/2021 16:41:12 - INFO - __main__ - Step 19258: {'lr': 0.00048341348545920623, 'samples': 3697536, 'steps': 19257, 'loss/train': 1.7233219146728516} -08/30/2021 16:41:13 - INFO - __main__ - Step 19259: {'lr': 0.0004834115846561572, 'samples': 3697728, 'steps': 19258, 'loss/train': 1.4816497564315796} -08/30/2021 16:41:13 - INFO - __main__ - Step 19260: {'lr': 0.0004834096837479366, 'samples': 3697920, 'steps': 19259, 'loss/train': 1.445310115814209} -08/30/2021 16:41:13 - INFO - __main__ - Step 19261: {'lr': 0.00048340778273454514, 'samples': 3698112, 'steps': 19260, 'loss/train': 1.3448522090911865} -08/30/2021 16:41:14 - INFO - __main__ - Step 19262: {'lr': 0.00048340588161598373, 'samples': 3698304, 'steps': 19261, 'loss/train': 1.6510472297668457} -08/30/2021 16:41:15 - INFO - __main__ - Step 19263: {'lr': 0.00048340398039225325, 'samples': 3698496, 'steps': 19262, 'loss/train': 1.1248397827148438} -08/30/2021 16:41:16 - INFO - __main__ - Step 19264: {'lr': 0.0004834020790633545, 'samples': 3698688, 'steps': 19263, 'loss/train': 1.4149553775787354} -08/30/2021 16:41:16 - INFO - __main__ - Step 19265: {'lr': 0.00048340017762928843, 'samples': 3698880, 'steps': 19264, 'loss/train': 1.1894426345825195} -08/30/2021 16:41:16 - INFO - __main__ - Step 19266: {'lr': 0.00048339827609005583, 'samples': 3699072, 'steps': 19265, 'loss/train': 1.9458779096603394} -08/30/2021 16:41:17 - INFO - __main__ - Step 19267: {'lr': 0.00048339637444565756, 'samples': 3699264, 'steps': 19266, 'loss/train': 1.5638084411621094} -08/30/2021 16:41:18 - INFO - __main__ - Step 19268: {'lr': 0.0004833944726960945, 'samples': 3699456, 'steps': 19267, 'loss/train': 1.2100439071655273} -08/30/2021 16:41:19 - INFO - __main__ - Step 19269: {'lr': 0.00048339257084136747, 'samples': 3699648, 'steps': 19268, 'loss/train': 1.7518751621246338} -08/30/2021 16:41:19 - INFO - __main__ - Step 19270: {'lr': 0.0004833906688814774, 'samples': 3699840, 'steps': 19269, 'loss/train': 1.656874179840088} -08/30/2021 16:41:19 - INFO - __main__ - Step 19271: {'lr': 0.00048338876681642504, 'samples': 3700032, 'steps': 19270, 'loss/train': 1.2396714687347412} -08/30/2021 16:41:20 - INFO - __main__ - Step 19272: {'lr': 0.0004833868646462113, 'samples': 3700224, 'steps': 19271, 'loss/train': 1.0070147514343262} -08/30/2021 16:41:21 - INFO - __main__ - Step 19273: {'lr': 0.00048338496237083705, 'samples': 3700416, 'steps': 19272, 'loss/train': 1.6314671039581299} -08/30/2021 16:41:22 - INFO - __main__ - Step 19274: {'lr': 0.00048338305999030313, 'samples': 3700608, 'steps': 19273, 'loss/train': 1.4817777872085571} -08/30/2021 16:41:22 - INFO - __main__ - Step 19275: {'lr': 0.00048338115750461044, 'samples': 3700800, 'steps': 19274, 'loss/train': 1.095033049583435} -08/30/2021 16:41:22 - INFO - __main__ - Step 19276: {'lr': 0.0004833792549137598, 'samples': 3700992, 'steps': 19275, 'loss/train': 1.7891143560409546} -08/30/2021 16:41:23 - INFO - __main__ - Step 19277: {'lr': 0.00048337735221775204, 'samples': 3701184, 'steps': 19276, 'loss/train': 1.3591951131820679} -08/30/2021 16:41:23 - INFO - __main__ - Step 19278: {'lr': 0.000483375449416588, 'samples': 3701376, 'steps': 19277, 'loss/train': 1.4019490480422974} -08/30/2021 16:41:25 - INFO - __main__ - Step 19279: {'lr': 0.0004833735465102687, 'samples': 3701568, 'steps': 19278, 'loss/train': 2.0010457038879395} -08/30/2021 16:41:25 - INFO - __main__ - Step 19280: {'lr': 0.0004833716434987948, 'samples': 3701760, 'steps': 19279, 'loss/train': 1.1725772619247437} -08/30/2021 16:41:25 - INFO - __main__ - Step 19281: {'lr': 0.0004833697403821672, 'samples': 3701952, 'steps': 19280, 'loss/train': 1.2886343002319336} -08/30/2021 16:41:26 - INFO - __main__ - Step 19282: {'lr': 0.0004833678371603869, 'samples': 3702144, 'steps': 19281, 'loss/train': 1.4475995302200317} -08/30/2021 16:41:26 - INFO - __main__ - Step 19283: {'lr': 0.0004833659338334546, 'samples': 3702336, 'steps': 19282, 'loss/train': 1.569151520729065} -08/30/2021 16:41:28 - INFO - __main__ - Step 19284: {'lr': 0.0004833640304013712, 'samples': 3702528, 'steps': 19283, 'loss/train': 1.0333819389343262} -08/30/2021 16:41:28 - INFO - __main__ - Step 19285: {'lr': 0.0004833621268641376, 'samples': 3702720, 'steps': 19284, 'loss/train': 1.674288272857666} -08/30/2021 16:41:28 - INFO - __main__ - Step 19286: {'lr': 0.0004833602232217546, 'samples': 3702912, 'steps': 19285, 'loss/train': 1.4194025993347168} -08/30/2021 16:41:29 - INFO - __main__ - Step 19287: {'lr': 0.0004833583194742231, 'samples': 3703104, 'steps': 19286, 'loss/train': 1.5545814037322998} -08/30/2021 16:41:29 - INFO - __main__ - Step 19288: {'lr': 0.00048335641562154396, 'samples': 3703296, 'steps': 19287, 'loss/train': 1.0568838119506836} -08/30/2021 16:41:31 - INFO - __main__ - Step 19289: {'lr': 0.00048335451166371803, 'samples': 3703488, 'steps': 19288, 'loss/train': 2.0425543785095215} -08/30/2021 16:41:32 - INFO - __main__ - Step 19290: {'lr': 0.0004833526076007461, 'samples': 3703680, 'steps': 19289, 'loss/train': 1.287030816078186} -08/30/2021 16:41:32 - INFO - __main__ - Step 19291: {'lr': 0.0004833507034326291, 'samples': 3703872, 'steps': 19290, 'loss/train': 1.7177244424819946} -08/30/2021 16:41:32 - INFO - __main__ - Step 19292: {'lr': 0.0004833487991593679, 'samples': 3704064, 'steps': 19291, 'loss/train': 1.2387974262237549} -08/30/2021 16:41:33 - INFO - __main__ - Step 19293: {'lr': 0.0004833468947809633, 'samples': 3704256, 'steps': 19292, 'loss/train': 1.8201804161071777} -08/30/2021 16:41:34 - INFO - __main__ - Step 19294: {'lr': 0.0004833449902974162, 'samples': 3704448, 'steps': 19293, 'loss/train': 1.149401068687439} -08/30/2021 16:41:35 - INFO - __main__ - Step 19295: {'lr': 0.00048334308570872745, 'samples': 3704640, 'steps': 19294, 'loss/train': 2.3005709648132324} -08/30/2021 16:41:35 - INFO - __main__ - Step 19296: {'lr': 0.00048334118101489793, 'samples': 3704832, 'steps': 19295, 'loss/train': 1.070224642753601} -08/30/2021 16:41:35 - INFO - __main__ - Step 19297: {'lr': 0.00048333927621592844, 'samples': 3705024, 'steps': 19296, 'loss/train': 1.6150513887405396} -08/30/2021 16:41:36 - INFO - __main__ - Step 19298: {'lr': 0.00048333737131181986, 'samples': 3705216, 'steps': 19297, 'loss/train': 1.8145430088043213} -08/30/2021 16:41:36 - INFO - __main__ - Step 19299: {'lr': 0.00048333546630257315, 'samples': 3705408, 'steps': 19298, 'loss/train': 1.3970966339111328} -08/30/2021 16:41:38 - INFO - __main__ - Step 19300: {'lr': 0.000483333561188189, 'samples': 3705600, 'steps': 19299, 'loss/train': 0.6124410033226013} -08/30/2021 16:41:38 - INFO - __main__ - Step 19301: {'lr': 0.00048333165596866837, 'samples': 3705792, 'steps': 19300, 'loss/train': 1.4383171796798706} -08/30/2021 16:41:38 - INFO - __main__ - Step 19302: {'lr': 0.00048332975064401207, 'samples': 3705984, 'steps': 19301, 'loss/train': 1.7804783582687378} -08/30/2021 16:41:39 - INFO - __main__ - Step 19303: {'lr': 0.000483327845214221, 'samples': 3706176, 'steps': 19302, 'loss/train': 1.6774909496307373} -08/30/2021 16:41:39 - INFO - __main__ - Step 19304: {'lr': 0.00048332593967929607, 'samples': 3706368, 'steps': 19303, 'loss/train': 2.2327358722686768} -08/30/2021 16:41:40 - INFO - __main__ - Step 19305: {'lr': 0.000483324034039238, 'samples': 3706560, 'steps': 19304, 'loss/train': 1.806740403175354} -08/30/2021 16:41:41 - INFO - __main__ - Step 19306: {'lr': 0.00048332212829404775, 'samples': 3706752, 'steps': 19305, 'loss/train': 1.667768120765686} -08/30/2021 16:41:41 - INFO - __main__ - Step 19307: {'lr': 0.0004833202224437261, 'samples': 3706944, 'steps': 19306, 'loss/train': 1.2210687398910522} -08/30/2021 16:41:42 - INFO - __main__ - Step 19308: {'lr': 0.000483318316488274, 'samples': 3707136, 'steps': 19307, 'loss/train': 2.147545337677002} -08/30/2021 16:41:42 - INFO - __main__ - Step 19309: {'lr': 0.00048331641042769223, 'samples': 3707328, 'steps': 19308, 'loss/train': 1.5021699666976929} -08/30/2021 16:41:43 - INFO - __main__ - Step 19310: {'lr': 0.00048331450426198177, 'samples': 3707520, 'steps': 19309, 'loss/train': 1.634742259979248} -08/30/2021 16:41:44 - INFO - __main__ - Step 19311: {'lr': 0.0004833125979911434, 'samples': 3707712, 'steps': 19310, 'loss/train': 1.7047052383422852} -08/30/2021 16:41:44 - INFO - __main__ - Step 19312: {'lr': 0.0004833106916151778, 'samples': 3707904, 'steps': 19311, 'loss/train': 1.4949703216552734} -08/30/2021 16:41:45 - INFO - __main__ - Step 19313: {'lr': 0.00048330878513408616, 'samples': 3708096, 'steps': 19312, 'loss/train': 1.2732231616973877} -08/30/2021 16:41:45 - INFO - __main__ - Step 19314: {'lr': 0.00048330687854786914, 'samples': 3708288, 'steps': 19313, 'loss/train': 1.2981466054916382} -08/30/2021 16:41:47 - INFO - __main__ - Step 19315: {'lr': 0.00048330497185652765, 'samples': 3708480, 'steps': 19314, 'loss/train': 1.2048128843307495} -08/30/2021 16:41:47 - INFO - __main__ - Step 19316: {'lr': 0.00048330306506006257, 'samples': 3708672, 'steps': 19315, 'loss/train': 1.9277514219284058} -08/30/2021 16:41:48 - INFO - __main__ - Step 19317: {'lr': 0.00048330115815847465, 'samples': 3708864, 'steps': 19316, 'loss/train': 1.4384599924087524} -08/30/2021 16:41:48 - INFO - __main__ - Step 19318: {'lr': 0.0004832992511517649, 'samples': 3709056, 'steps': 19317, 'loss/train': 0.2641623318195343} -08/30/2021 16:41:48 - INFO - __main__ - Step 19319: {'lr': 0.00048329734403993406, 'samples': 3709248, 'steps': 19318, 'loss/train': 1.6658275127410889} -08/30/2021 16:41:49 - INFO - __main__ - Step 19320: {'lr': 0.00048329543682298307, 'samples': 3709440, 'steps': 19319, 'loss/train': 1.0207011699676514} -08/30/2021 16:41:50 - INFO - __main__ - Step 19321: {'lr': 0.0004832935295009127, 'samples': 3709632, 'steps': 19320, 'loss/train': 0.1176118329167366} -08/30/2021 16:41:51 - INFO - __main__ - Step 19322: {'lr': 0.0004832916220737239, 'samples': 3709824, 'steps': 19321, 'loss/train': 1.34175443649292} -08/30/2021 16:41:51 - INFO - __main__ - Step 19323: {'lr': 0.0004832897145414175, 'samples': 3710016, 'steps': 19322, 'loss/train': 1.9319572448730469} -08/30/2021 16:41:52 - INFO - __main__ - Step 19324: {'lr': 0.0004832878069039943, 'samples': 3710208, 'steps': 19323, 'loss/train': 1.999365210533142} -08/30/2021 16:41:52 - INFO - __main__ - Step 19325: {'lr': 0.0004832858991614553, 'samples': 3710400, 'steps': 19324, 'loss/train': 1.1017085313796997} -08/30/2021 16:41:53 - INFO - __main__ - Step 19326: {'lr': 0.00048328399131380127, 'samples': 3710592, 'steps': 19325, 'loss/train': 0.11377518624067307} -08/30/2021 16:41:54 - INFO - __main__ - Step 19327: {'lr': 0.00048328208336103305, 'samples': 3710784, 'steps': 19326, 'loss/train': 1.020818829536438} -08/30/2021 16:41:54 - INFO - __main__ - Step 19328: {'lr': 0.0004832801753031515, 'samples': 3710976, 'steps': 19327, 'loss/train': 0.6918624639511108} -08/30/2021 16:41:55 - INFO - __main__ - Step 19329: {'lr': 0.00048327826714015756, 'samples': 3711168, 'steps': 19328, 'loss/train': 1.8891956806182861} -08/30/2021 16:41:55 - INFO - __main__ - Step 19330: {'lr': 0.00048327635887205196, 'samples': 3711360, 'steps': 19329, 'loss/train': 1.7779945135116577} -08/30/2021 16:41:56 - INFO - __main__ - Step 19331: {'lr': 0.00048327445049883567, 'samples': 3711552, 'steps': 19330, 'loss/train': 1.7812371253967285} -08/30/2021 16:41:57 - INFO - __main__ - Step 19332: {'lr': 0.0004832725420205095, 'samples': 3711744, 'steps': 19331, 'loss/train': 2.511662006378174} -08/30/2021 16:41:57 - INFO - __main__ - Step 19333: {'lr': 0.00048327063343707433, 'samples': 3711936, 'steps': 19332, 'loss/train': 1.664101004600525} -08/30/2021 16:41:57 - INFO - __main__ - Step 19334: {'lr': 0.000483268724748531, 'samples': 3712128, 'steps': 19333, 'loss/train': 1.742770791053772} -08/30/2021 16:41:58 - INFO - __main__ - Step 19335: {'lr': 0.0004832668159548804, 'samples': 3712320, 'steps': 19334, 'loss/train': 1.5348186492919922} -08/30/2021 16:41:59 - INFO - __main__ - Step 19336: {'lr': 0.00048326490705612337, 'samples': 3712512, 'steps': 19335, 'loss/train': 1.2737853527069092} -08/30/2021 16:42:00 - INFO - __main__ - Step 19337: {'lr': 0.0004832629980522608, 'samples': 3712704, 'steps': 19336, 'loss/train': 1.415540099143982} -08/30/2021 16:42:00 - INFO - __main__ - Step 19338: {'lr': 0.00048326108894329345, 'samples': 3712896, 'steps': 19337, 'loss/train': 1.4279959201812744} -08/30/2021 16:42:00 - INFO - __main__ - Step 19339: {'lr': 0.00048325917972922227, 'samples': 3713088, 'steps': 19338, 'loss/train': 1.3825029134750366} -08/30/2021 16:42:01 - INFO - __main__ - Step 19340: {'lr': 0.00048325727041004815, 'samples': 3713280, 'steps': 19339, 'loss/train': 2.0216457843780518} -08/30/2021 16:42:01 - INFO - __main__ - Step 19341: {'lr': 0.0004832553609857719, 'samples': 3713472, 'steps': 19340, 'loss/train': 0.8572243452072144} -08/30/2021 16:42:03 - INFO - __main__ - Step 19342: {'lr': 0.0004832534514563943, 'samples': 3713664, 'steps': 19341, 'loss/train': 1.5212790966033936} -08/30/2021 16:42:04 - INFO - __main__ - Step 19343: {'lr': 0.0004832515418219164, 'samples': 3713856, 'steps': 19342, 'loss/train': 3.0543317794799805} -08/30/2021 16:42:04 - INFO - __main__ - Step 19344: {'lr': 0.0004832496320823389, 'samples': 3714048, 'steps': 19343, 'loss/train': 1.8511292934417725} -08/30/2021 16:42:05 - INFO - __main__ - Step 19345: {'lr': 0.0004832477222376627, 'samples': 3714240, 'steps': 19344, 'loss/train': 1.4760186672210693} -08/30/2021 16:42:05 - INFO - __main__ - Step 19346: {'lr': 0.0004832458122878888, 'samples': 3714432, 'steps': 19345, 'loss/train': 1.3504347801208496} -08/30/2021 16:42:05 - INFO - __main__ - Step 19347: {'lr': 0.0004832439022330178, 'samples': 3714624, 'steps': 19346, 'loss/train': 1.0208516120910645} -08/30/2021 16:42:07 - INFO - __main__ - Step 19348: {'lr': 0.00048324199207305075, 'samples': 3714816, 'steps': 19347, 'loss/train': 1.5862152576446533} -08/30/2021 16:42:07 - INFO - __main__ - Step 19349: {'lr': 0.0004832400818079884, 'samples': 3715008, 'steps': 19348, 'loss/train': 0.6771523952484131} -08/30/2021 16:42:07 - INFO - __main__ - Step 19350: {'lr': 0.00048323817143783174, 'samples': 3715200, 'steps': 19349, 'loss/train': 1.9784314632415771} -08/30/2021 16:42:08 - INFO - __main__ - Step 19351: {'lr': 0.0004832362609625815, 'samples': 3715392, 'steps': 19350, 'loss/train': 1.5952527523040771} -08/30/2021 16:42:08 - INFO - __main__ - Step 19352: {'lr': 0.0004832343503822386, 'samples': 3715584, 'steps': 19351, 'loss/train': 1.8875341415405273} -08/30/2021 16:42:10 - INFO - __main__ - Step 19353: {'lr': 0.000483232439696804, 'samples': 3715776, 'steps': 19352, 'loss/train': 1.3885711431503296} -08/30/2021 16:42:10 - INFO - __main__ - Step 19354: {'lr': 0.0004832305289062784, 'samples': 3715968, 'steps': 19353, 'loss/train': 0.8795766830444336} -08/30/2021 16:42:10 - INFO - __main__ - Step 19355: {'lr': 0.00048322861801066265, 'samples': 3716160, 'steps': 19354, 'loss/train': 1.794315218925476} -08/30/2021 16:42:11 - INFO - __main__ - Step 19356: {'lr': 0.00048322670700995775, 'samples': 3716352, 'steps': 19355, 'loss/train': 2.2336206436157227} -08/30/2021 16:42:11 - INFO - __main__ - Step 19357: {'lr': 0.0004832247959041645, 'samples': 3716544, 'steps': 19356, 'loss/train': 1.6674057245254517} -08/30/2021 16:42:13 - INFO - __main__ - Step 19358: {'lr': 0.0004832228846932838, 'samples': 3716736, 'steps': 19357, 'loss/train': 1.828009843826294} -08/30/2021 16:42:13 - INFO - __main__ - Step 19359: {'lr': 0.0004832209733773164, 'samples': 3716928, 'steps': 19358, 'loss/train': 2.1200366020202637} -08/30/2021 16:42:13 - INFO - __main__ - Step 19360: {'lr': 0.0004832190619562632, 'samples': 3717120, 'steps': 19359, 'loss/train': 2.2332732677459717} -08/30/2021 16:42:14 - INFO - __main__ - Step 19361: {'lr': 0.00048321715043012515, 'samples': 3717312, 'steps': 19360, 'loss/train': 1.1754701137542725} -08/30/2021 16:42:14 - INFO - __main__ - Step 19362: {'lr': 0.00048321523879890307, 'samples': 3717504, 'steps': 19361, 'loss/train': 1.480566143989563} -08/30/2021 16:42:16 - INFO - __main__ - Step 19363: {'lr': 0.00048321332706259773, 'samples': 3717696, 'steps': 19362, 'loss/train': 0.8196985125541687} -08/30/2021 16:42:16 - INFO - __main__ - Step 19364: {'lr': 0.0004832114152212101, 'samples': 3717888, 'steps': 19363, 'loss/train': 1.7934433221817017} -08/30/2021 16:42:16 - INFO - __main__ - Step 19365: {'lr': 0.000483209503274741, 'samples': 3718080, 'steps': 19364, 'loss/train': 1.9399924278259277} -08/30/2021 16:42:17 - INFO - __main__ - Step 19366: {'lr': 0.0004832075912231913, 'samples': 3718272, 'steps': 19365, 'loss/train': 1.6247559785842896} -08/30/2021 16:42:17 - INFO - __main__ - Step 19367: {'lr': 0.0004832056790665619, 'samples': 3718464, 'steps': 19366, 'loss/train': 1.808705449104309} -08/30/2021 16:42:19 - INFO - __main__ - Step 19368: {'lr': 0.0004832037668048536, 'samples': 3718656, 'steps': 19367, 'loss/train': 0.978150486946106} -08/30/2021 16:42:19 - INFO - __main__ - Step 19369: {'lr': 0.00048320185443806717, 'samples': 3718848, 'steps': 19368, 'loss/train': 1.0606640577316284} -08/30/2021 16:42:19 - INFO - __main__ - Step 19370: {'lr': 0.0004831999419662037, 'samples': 3719040, 'steps': 19369, 'loss/train': 1.6687099933624268} -08/30/2021 16:42:20 - INFO - __main__ - Step 19371: {'lr': 0.0004831980293892639, 'samples': 3719232, 'steps': 19370, 'loss/train': 1.8510860204696655} -08/30/2021 16:42:20 - INFO - __main__ - Step 19372: {'lr': 0.0004831961167072487, 'samples': 3719424, 'steps': 19371, 'loss/train': 1.5339409112930298} -08/30/2021 16:42:22 - INFO - __main__ - Step 19373: {'lr': 0.0004831942039201589, 'samples': 3719616, 'steps': 19372, 'loss/train': 1.3339210748672485} -08/30/2021 16:42:22 - INFO - __main__ - Step 19374: {'lr': 0.0004831922910279954, 'samples': 3719808, 'steps': 19373, 'loss/train': 1.6575361490249634} -08/30/2021 16:42:23 - INFO - __main__ - Step 19375: {'lr': 0.000483190378030759, 'samples': 3720000, 'steps': 19374, 'loss/train': 0.06456669420003891} -08/30/2021 16:42:23 - INFO - __main__ - Step 19376: {'lr': 0.0004831884649284507, 'samples': 3720192, 'steps': 19375, 'loss/train': 0.7960783839225769} -08/30/2021 16:42:23 - INFO - __main__ - Step 19377: {'lr': 0.00048318655172107126, 'samples': 3720384, 'steps': 19376, 'loss/train': 4.159504413604736} -08/30/2021 16:42:25 - INFO - __main__ - Step 19378: {'lr': 0.0004831846384086215, 'samples': 3720576, 'steps': 19377, 'loss/train': 1.4446724653244019} -08/30/2021 16:42:25 - INFO - __main__ - Step 19379: {'lr': 0.0004831827249911024, 'samples': 3720768, 'steps': 19378, 'loss/train': 1.2134758234024048} -08/30/2021 16:42:26 - INFO - __main__ - Step 19380: {'lr': 0.0004831808114685147, 'samples': 3720960, 'steps': 19379, 'loss/train': 1.2609055042266846} -08/30/2021 16:42:26 - INFO - __main__ - Step 19381: {'lr': 0.00048317889784085935, 'samples': 3721152, 'steps': 19380, 'loss/train': 0.6011592149734497} -08/30/2021 16:42:26 - INFO - __main__ - Step 19382: {'lr': 0.0004831769841081372, 'samples': 3721344, 'steps': 19381, 'loss/train': 2.1070375442504883} -08/30/2021 16:42:27 - INFO - __main__ - Step 19383: {'lr': 0.00048317507027034913, 'samples': 3721536, 'steps': 19382, 'loss/train': 1.7769204378128052} -08/30/2021 16:42:28 - INFO - __main__ - Step 19384: {'lr': 0.0004831731563274959, 'samples': 3721728, 'steps': 19383, 'loss/train': 1.5864990949630737} -08/30/2021 16:42:29 - INFO - __main__ - Step 19385: {'lr': 0.0004831712422795785, 'samples': 3721920, 'steps': 19384, 'loss/train': 1.2622509002685547} -08/30/2021 16:42:29 - INFO - __main__ - Step 19386: {'lr': 0.00048316932812659776, 'samples': 3722112, 'steps': 19385, 'loss/train': 1.7974189519882202} -08/30/2021 16:42:30 - INFO - __main__ - Step 19387: {'lr': 0.00048316741386855445, 'samples': 3722304, 'steps': 19386, 'loss/train': 0.48866257071495056} -08/30/2021 16:42:30 - INFO - __main__ - Step 19388: {'lr': 0.0004831654995054495, 'samples': 3722496, 'steps': 19387, 'loss/train': 1.4563623666763306} -08/30/2021 16:42:32 - INFO - __main__ - Step 19389: {'lr': 0.0004831635850372838, 'samples': 3722688, 'steps': 19388, 'loss/train': 1.7257275581359863} -08/30/2021 16:42:32 - INFO - __main__ - Step 19390: {'lr': 0.00048316167046405826, 'samples': 3722880, 'steps': 19389, 'loss/train': 0.7319338917732239} -08/30/2021 16:42:32 - INFO - __main__ - Step 19391: {'lr': 0.0004831597557857735, 'samples': 3723072, 'steps': 19390, 'loss/train': 1.5165249109268188} -08/30/2021 16:42:33 - INFO - __main__ - Step 19392: {'lr': 0.00048315784100243063, 'samples': 3723264, 'steps': 19391, 'loss/train': 1.9773688316345215} -08/30/2021 16:42:33 - INFO - __main__ - Step 19393: {'lr': 0.0004831559261140305, 'samples': 3723456, 'steps': 19392, 'loss/train': 1.6093653440475464} -08/30/2021 16:42:35 - INFO - __main__ - Step 19394: {'lr': 0.0004831540111205739, 'samples': 3723648, 'steps': 19393, 'loss/train': 1.6279922723770142} -08/30/2021 16:42:35 - INFO - __main__ - Step 19395: {'lr': 0.00048315209602206165, 'samples': 3723840, 'steps': 19394, 'loss/train': 1.7154209613800049} -08/30/2021 16:42:36 - INFO - __main__ - Step 19396: {'lr': 0.0004831501808184947, 'samples': 3724032, 'steps': 19395, 'loss/train': 1.2043235301971436} -08/30/2021 16:42:36 - INFO - __main__ - Step 19397: {'lr': 0.0004831482655098738, 'samples': 3724224, 'steps': 19396, 'loss/train': 1.9871405363082886} -08/30/2021 16:42:36 - INFO - __main__ - Step 19398: {'lr': 0.00048314635009619997, 'samples': 3724416, 'steps': 19397, 'loss/train': 1.6793252229690552} -08/30/2021 16:42:37 - INFO - __main__ - Step 19399: {'lr': 0.0004831444345774739, 'samples': 3724608, 'steps': 19398, 'loss/train': 0.517352283000946} -08/30/2021 16:42:39 - INFO - __main__ - Step 19400: {'lr': 0.00048314251895369663, 'samples': 3724800, 'steps': 19399, 'loss/train': 1.0613000392913818} -08/30/2021 16:42:39 - INFO - __main__ - Step 19401: {'lr': 0.000483140603224869, 'samples': 3724992, 'steps': 19400, 'loss/train': 1.8209928274154663} -08/30/2021 16:42:40 - INFO - __main__ - Step 19402: {'lr': 0.00048313868739099166, 'samples': 3725184, 'steps': 19401, 'loss/train': 1.1783801317214966} -08/30/2021 16:42:40 - INFO - __main__ - Step 19403: {'lr': 0.0004831367714520657, 'samples': 3725376, 'steps': 19402, 'loss/train': 1.5873388051986694} -08/30/2021 16:42:40 - INFO - __main__ - Step 19404: {'lr': 0.0004831348554080919, 'samples': 3725568, 'steps': 19403, 'loss/train': 2.2661373615264893} -08/30/2021 16:42:42 - INFO - __main__ - Step 19405: {'lr': 0.0004831329392590711, 'samples': 3725760, 'steps': 19404, 'loss/train': 0.8620322346687317} -08/30/2021 16:42:42 - INFO - __main__ - Step 19406: {'lr': 0.00048313102300500424, 'samples': 3725952, 'steps': 19405, 'loss/train': 1.3002861738204956} -08/30/2021 16:42:42 - INFO - __main__ - Step 19407: {'lr': 0.00048312910664589215, 'samples': 3726144, 'steps': 19406, 'loss/train': 1.7104800939559937} -08/30/2021 16:42:43 - INFO - __main__ - Step 19408: {'lr': 0.0004831271901817357, 'samples': 3726336, 'steps': 19407, 'loss/train': 1.7206051349639893} -08/30/2021 16:42:43 - INFO - __main__ - Step 19409: {'lr': 0.00048312527361253567, 'samples': 3726528, 'steps': 19408, 'loss/train': 0.7446151971817017} -08/30/2021 16:42:45 - INFO - __main__ - Step 19410: {'lr': 0.000483123356938293, 'samples': 3726720, 'steps': 19409, 'loss/train': 1.662960410118103} -08/30/2021 16:42:45 - INFO - __main__ - Step 19411: {'lr': 0.00048312144015900856, 'samples': 3726912, 'steps': 19410, 'loss/train': 2.022324323654175} -08/30/2021 16:42:46 - INFO - __main__ - Step 19412: {'lr': 0.00048311952327468325, 'samples': 3727104, 'steps': 19411, 'loss/train': 1.5919524431228638} -08/30/2021 16:42:46 - INFO - __main__ - Step 19413: {'lr': 0.00048311760628531777, 'samples': 3727296, 'steps': 19412, 'loss/train': 0.9535502195358276} -08/30/2021 16:42:46 - INFO - __main__ - Step 19414: {'lr': 0.00048311568919091316, 'samples': 3727488, 'steps': 19413, 'loss/train': 1.7854655981063843} -08/30/2021 16:42:48 - INFO - __main__ - Step 19415: {'lr': 0.00048311377199147023, 'samples': 3727680, 'steps': 19414, 'loss/train': 1.4093464612960815} -08/30/2021 16:42:48 - INFO - __main__ - Step 19416: {'lr': 0.00048311185468698974, 'samples': 3727872, 'steps': 19415, 'loss/train': 1.5233309268951416} -08/30/2021 16:42:49 - INFO - __main__ - Step 19417: {'lr': 0.00048310993727747277, 'samples': 3728064, 'steps': 19416, 'loss/train': 1.3573007583618164} -08/30/2021 16:42:49 - INFO - __main__ - Step 19418: {'lr': 0.00048310801976292, 'samples': 3728256, 'steps': 19417, 'loss/train': 0.570035994052887} -08/30/2021 16:42:49 - INFO - __main__ - Step 19419: {'lr': 0.0004831061021433323, 'samples': 3728448, 'steps': 19418, 'loss/train': 0.9198406338691711} -08/30/2021 16:42:51 - INFO - __main__ - Step 19420: {'lr': 0.00048310418441871065, 'samples': 3728640, 'steps': 19419, 'loss/train': 1.227281928062439} -08/30/2021 16:42:51 - INFO - __main__ - Step 19421: {'lr': 0.00048310226658905585, 'samples': 3728832, 'steps': 19420, 'loss/train': 1.704697608947754} -08/30/2021 16:42:52 - INFO - __main__ - Step 19422: {'lr': 0.00048310034865436876, 'samples': 3729024, 'steps': 19421, 'loss/train': 1.689162254333496} -08/30/2021 16:42:52 - INFO - __main__ - Step 19423: {'lr': 0.0004830984306146503, 'samples': 3729216, 'steps': 19422, 'loss/train': 1.5913020372390747} -08/30/2021 16:42:52 - INFO - __main__ - Step 19424: {'lr': 0.0004830965124699012, 'samples': 3729408, 'steps': 19423, 'loss/train': 2.141072988510132} -08/30/2021 16:42:53 - INFO - __main__ - Step 19425: {'lr': 0.00048309459422012243, 'samples': 3729600, 'steps': 19424, 'loss/train': 1.4321925640106201} -08/30/2021 16:42:54 - INFO - __main__ - Step 19426: {'lr': 0.0004830926758653148, 'samples': 3729792, 'steps': 19425, 'loss/train': 1.5611809492111206} -08/30/2021 16:42:55 - INFO - __main__ - Step 19427: {'lr': 0.00048309075740547925, 'samples': 3729984, 'steps': 19426, 'loss/train': 0.10041192173957825} -08/30/2021 16:42:55 - INFO - __main__ - Step 19428: {'lr': 0.0004830888388406166, 'samples': 3730176, 'steps': 19427, 'loss/train': 1.552420973777771} -08/30/2021 16:42:56 - INFO - __main__ - Step 19429: {'lr': 0.00048308692017072773, 'samples': 3730368, 'steps': 19428, 'loss/train': 2.0706841945648193} -08/30/2021 16:42:56 - INFO - __main__ - Step 19430: {'lr': 0.00048308500139581344, 'samples': 3730560, 'steps': 19429, 'loss/train': 1.984182596206665} -08/30/2021 16:42:57 - INFO - __main__ - Step 19431: {'lr': 0.00048308308251587476, 'samples': 3730752, 'steps': 19430, 'loss/train': 1.6536108255386353} -08/30/2021 16:42:58 - INFO - __main__ - Step 19432: {'lr': 0.00048308116353091234, 'samples': 3730944, 'steps': 19431, 'loss/train': 1.4992344379425049} -08/30/2021 16:42:58 - INFO - __main__ - Step 19433: {'lr': 0.00048307924444092716, 'samples': 3731136, 'steps': 19432, 'loss/train': 1.4667798280715942} -08/30/2021 16:42:58 - INFO - __main__ - Step 19434: {'lr': 0.0004830773252459201, 'samples': 3731328, 'steps': 19433, 'loss/train': 1.0226434469223022} -08/30/2021 16:42:59 - INFO - __main__ - Step 19435: {'lr': 0.00048307540594589194, 'samples': 3731520, 'steps': 19434, 'loss/train': 1.4328798055648804} -08/30/2021 16:43:00 - INFO - __main__ - Step 19436: {'lr': 0.0004830734865408437, 'samples': 3731712, 'steps': 19435, 'loss/train': 1.447022795677185} -08/30/2021 16:43:01 - INFO - __main__ - Step 19437: {'lr': 0.000483071567030776, 'samples': 3731904, 'steps': 19436, 'loss/train': 1.696250557899475} -08/30/2021 16:43:01 - INFO - __main__ - Step 19438: {'lr': 0.00048306964741568994, 'samples': 3732096, 'steps': 19437, 'loss/train': 1.3995155096054077} -08/30/2021 16:43:01 - INFO - __main__ - Step 19439: {'lr': 0.00048306772769558624, 'samples': 3732288, 'steps': 19438, 'loss/train': 1.395381212234497} -08/30/2021 16:43:02 - INFO - __main__ - Step 19440: {'lr': 0.0004830658078704659, 'samples': 3732480, 'steps': 19439, 'loss/train': 1.5541294813156128} -08/30/2021 16:43:04 - INFO - __main__ - Step 19441: {'lr': 0.0004830638879403296, 'samples': 3732672, 'steps': 19440, 'loss/train': 1.2075867652893066} -08/30/2021 16:43:04 - INFO - __main__ - Step 19442: {'lr': 0.00048306196790517844, 'samples': 3732864, 'steps': 19441, 'loss/train': 1.0280719995498657} -08/30/2021 16:43:04 - INFO - __main__ - Step 19443: {'lr': 0.0004830600477650131, 'samples': 3733056, 'steps': 19442, 'loss/train': 0.19573047757148743} -08/30/2021 16:43:05 - INFO - __main__ - Step 19444: {'lr': 0.0004830581275198344, 'samples': 3733248, 'steps': 19443, 'loss/train': 0.19728131592273712} -08/30/2021 16:43:05 - INFO - __main__ - Step 19445: {'lr': 0.00048305620716964336, 'samples': 3733440, 'steps': 19444, 'loss/train': 1.397684931755066} -08/30/2021 16:43:05 - INFO - __main__ - Step 19446: {'lr': 0.00048305428671444083, 'samples': 3733632, 'steps': 19445, 'loss/train': 1.491231083869934} -08/30/2021 16:43:07 - INFO - __main__ - Step 19447: {'lr': 0.00048305236615422763, 'samples': 3733824, 'steps': 19446, 'loss/train': 1.369369387626648} -08/30/2021 16:43:08 - INFO - __main__ - Step 19448: {'lr': 0.00048305044548900463, 'samples': 3734016, 'steps': 19447, 'loss/train': 1.5268791913986206} -08/30/2021 16:43:08 - INFO - __main__ - Step 19449: {'lr': 0.0004830485247187727, 'samples': 3734208, 'steps': 19448, 'loss/train': 1.5801888704299927} -08/30/2021 16:43:08 - INFO - __main__ - Step 19450: {'lr': 0.0004830466038435327, 'samples': 3734400, 'steps': 19449, 'loss/train': 1.4094716310501099} -08/30/2021 16:43:09 - INFO - __main__ - Step 19451: {'lr': 0.0004830446828632854, 'samples': 3734592, 'steps': 19450, 'loss/train': 0.9922022223472595} -08/30/2021 16:43:09 - INFO - __main__ - Step 19452: {'lr': 0.00048304276177803186, 'samples': 3734784, 'steps': 19451, 'loss/train': 1.7343542575836182} -08/30/2021 16:43:11 - INFO - __main__ - Step 19453: {'lr': 0.00048304084058777285, 'samples': 3734976, 'steps': 19452, 'loss/train': 1.4883506298065186} -08/30/2021 16:43:11 - INFO - __main__ - Step 19454: {'lr': 0.00048303891929250923, 'samples': 3735168, 'steps': 19453, 'loss/train': 2.03281831741333} -08/30/2021 16:43:12 - INFO - __main__ - Step 19455: {'lr': 0.0004830369978922418, 'samples': 3735360, 'steps': 19454, 'loss/train': 1.4497188329696655} -08/30/2021 16:43:12 - INFO - __main__ - Step 19456: {'lr': 0.00048303507638697155, 'samples': 3735552, 'steps': 19455, 'loss/train': 1.403900384902954} -08/30/2021 16:43:12 - INFO - __main__ - Step 19457: {'lr': 0.0004830331547766993, 'samples': 3735744, 'steps': 19456, 'loss/train': 1.4013632535934448} -08/30/2021 16:43:14 - INFO - __main__ - Step 19458: {'lr': 0.0004830312330614259, 'samples': 3735936, 'steps': 19457, 'loss/train': 1.2117112874984741} -08/30/2021 16:43:15 - INFO - __main__ - Step 19459: {'lr': 0.00048302931124115226, 'samples': 3736128, 'steps': 19458, 'loss/train': 0.4895917773246765} -08/30/2021 16:43:15 - INFO - __main__ - Step 19460: {'lr': 0.0004830273893158791, 'samples': 3736320, 'steps': 19459, 'loss/train': 1.79667329788208} -08/30/2021 16:43:15 - INFO - __main__ - Step 19461: {'lr': 0.0004830254672856075, 'samples': 3736512, 'steps': 19460, 'loss/train': 1.1802961826324463} -08/30/2021 16:43:16 - INFO - __main__ - Step 19462: {'lr': 0.00048302354515033813, 'samples': 3736704, 'steps': 19461, 'loss/train': 1.596136212348938} -08/30/2021 16:43:16 - INFO - __main__ - Step 19463: {'lr': 0.00048302162291007203, 'samples': 3736896, 'steps': 19462, 'loss/train': 1.3673269748687744} -08/30/2021 16:43:17 - INFO - __main__ - Step 19464: {'lr': 0.00048301970056480994, 'samples': 3737088, 'steps': 19463, 'loss/train': 1.8032881021499634} -08/30/2021 16:43:18 - INFO - __main__ - Step 19465: {'lr': 0.00048301777811455274, 'samples': 3737280, 'steps': 19464, 'loss/train': 1.113150954246521} -08/30/2021 16:43:18 - INFO - __main__ - Step 19466: {'lr': 0.0004830158555593014, 'samples': 3737472, 'steps': 19465, 'loss/train': 1.349056601524353} -08/30/2021 16:43:19 - INFO - __main__ - Step 19467: {'lr': 0.00048301393289905663, 'samples': 3737664, 'steps': 19466, 'loss/train': 1.4769805669784546} -08/30/2021 16:43:19 - INFO - __main__ - Step 19468: {'lr': 0.00048301201013381946, 'samples': 3737856, 'steps': 19467, 'loss/train': 1.7169746160507202} -08/30/2021 16:43:20 - INFO - __main__ - Step 19469: {'lr': 0.00048301008726359064, 'samples': 3738048, 'steps': 19468, 'loss/train': 1.3549416065216064} -08/30/2021 16:43:21 - INFO - __main__ - Step 19470: {'lr': 0.00048300816428837104, 'samples': 3738240, 'steps': 19469, 'loss/train': 1.4819215536117554} -08/30/2021 16:43:21 - INFO - __main__ - Step 19471: {'lr': 0.00048300624120816153, 'samples': 3738432, 'steps': 19470, 'loss/train': 1.624529242515564} -08/30/2021 16:43:22 - INFO - __main__ - Step 19472: {'lr': 0.0004830043180229631, 'samples': 3738624, 'steps': 19471, 'loss/train': 1.4806876182556152} -08/30/2021 16:43:22 - INFO - __main__ - Step 19473: {'lr': 0.0004830023947327764, 'samples': 3738816, 'steps': 19472, 'loss/train': 1.8842469453811646} -08/30/2021 16:43:24 - INFO - __main__ - Step 19474: {'lr': 0.0004830004713376025, 'samples': 3739008, 'steps': 19473, 'loss/train': 0.922451913356781} -08/30/2021 16:43:24 - INFO - __main__ - Step 19475: {'lr': 0.00048299854783744224, 'samples': 3739200, 'steps': 19474, 'loss/train': 1.7893987894058228} -08/30/2021 16:43:24 - INFO - __main__ - Step 19476: {'lr': 0.0004829966242322963, 'samples': 3739392, 'steps': 19475, 'loss/train': 1.2062294483184814} -08/30/2021 16:43:25 - INFO - __main__ - Step 19477: {'lr': 0.00048299470052216576, 'samples': 3739584, 'steps': 19476, 'loss/train': 1.5458911657333374} -08/30/2021 16:43:25 - INFO - __main__ - Step 19478: {'lr': 0.0004829927767070514, 'samples': 3739776, 'steps': 19477, 'loss/train': 1.5041776895523071} -08/30/2021 16:43:27 - INFO - __main__ - Step 19479: {'lr': 0.0004829908527869541, 'samples': 3739968, 'steps': 19478, 'loss/train': 2.5316600799560547} -08/30/2021 16:43:27 - INFO - __main__ - Step 19480: {'lr': 0.0004829889287618746, 'samples': 3740160, 'steps': 19479, 'loss/train': 1.558606743812561} -08/30/2021 16:43:27 - INFO - __main__ - Step 19481: {'lr': 0.000482987004631814, 'samples': 3740352, 'steps': 19480, 'loss/train': 1.1558796167373657} -08/30/2021 16:43:28 - INFO - __main__ - Step 19482: {'lr': 0.000482985080396773, 'samples': 3740544, 'steps': 19481, 'loss/train': 1.0911834239959717} -08/30/2021 16:43:28 - INFO - __main__ - Step 19483: {'lr': 0.00048298315605675257, 'samples': 3740736, 'steps': 19482, 'loss/train': 2.164764404296875} -08/30/2021 16:43:28 - INFO - __main__ - Step 19484: {'lr': 0.0004829812316117535, 'samples': 3740928, 'steps': 19483, 'loss/train': 1.5163272619247437} -08/30/2021 16:43:30 - INFO - __main__ - Step 19485: {'lr': 0.0004829793070617767, 'samples': 3741120, 'steps': 19484, 'loss/train': 0.15662556886672974} -08/30/2021 16:43:31 - INFO - __main__ - Step 19486: {'lr': 0.000482977382406823, 'samples': 3741312, 'steps': 19485, 'loss/train': 2.4153854846954346} -08/30/2021 16:43:31 - INFO - __main__ - Step 19487: {'lr': 0.00048297545764689327, 'samples': 3741504, 'steps': 19486, 'loss/train': 1.7778544425964355} -08/30/2021 16:43:31 - INFO - __main__ - Step 19488: {'lr': 0.00048297353278198843, 'samples': 3741696, 'steps': 19487, 'loss/train': 2.195345640182495} -08/30/2021 16:43:32 - INFO - __main__ - Step 19489: {'lr': 0.00048297160781210925, 'samples': 3741888, 'steps': 19488, 'loss/train': 1.1673959493637085} -08/30/2021 16:43:33 - INFO - __main__ - Step 19490: {'lr': 0.00048296968273725673, 'samples': 3742080, 'steps': 19489, 'loss/train': 1.3847583532333374} -08/30/2021 16:43:33 - INFO - __main__ - Step 19491: {'lr': 0.0004829677575574316, 'samples': 3742272, 'steps': 19490, 'loss/train': 1.5721217393875122} -08/30/2021 16:43:34 - INFO - __main__ - Step 19492: {'lr': 0.0004829658322726348, 'samples': 3742464, 'steps': 19491, 'loss/train': 2.139817476272583} -08/30/2021 16:43:34 - INFO - __main__ - Step 19493: {'lr': 0.00048296390688286724, 'samples': 3742656, 'steps': 19492, 'loss/train': 1.1478424072265625} -08/30/2021 16:43:35 - INFO - __main__ - Step 19494: {'lr': 0.00048296198138812974, 'samples': 3742848, 'steps': 19493, 'loss/train': 1.6474329233169556} -08/30/2021 16:43:36 - INFO - __main__ - Step 19495: {'lr': 0.00048296005578842314, 'samples': 3743040, 'steps': 19494, 'loss/train': 1.5222991704940796} -08/30/2021 16:43:37 - INFO - __main__ - Step 19496: {'lr': 0.0004829581300837483, 'samples': 3743232, 'steps': 19495, 'loss/train': 1.2511401176452637} -08/30/2021 16:43:37 - INFO - __main__ - Step 19497: {'lr': 0.00048295620427410614, 'samples': 3743424, 'steps': 19496, 'loss/train': 2.0683276653289795} -08/30/2021 16:43:38 - INFO - __main__ - Step 19498: {'lr': 0.00048295427835949757, 'samples': 3743616, 'steps': 19497, 'loss/train': 0.14382371306419373} -08/30/2021 16:43:38 - INFO - __main__ - Step 19499: {'lr': 0.0004829523523399233, 'samples': 3743808, 'steps': 19498, 'loss/train': 1.646743655204773} -08/30/2021 16:43:39 - INFO - __main__ - Step 19500: {'lr': 0.0004829504262153844, 'samples': 3744000, 'steps': 19499, 'loss/train': 1.6095962524414062} -08/30/2021 16:43:40 - INFO - __main__ - Step 19501: {'lr': 0.00048294849998588155, 'samples': 3744192, 'steps': 19500, 'loss/train': 1.597055196762085} -08/30/2021 16:43:40 - INFO - __main__ - Step 19502: {'lr': 0.0004829465736514157, 'samples': 3744384, 'steps': 19501, 'loss/train': 1.6863080263137817} -08/30/2021 16:43:40 - INFO - __main__ - Step 19503: {'lr': 0.0004829446472119878, 'samples': 3744576, 'steps': 19502, 'loss/train': 1.519710659980774} -08/30/2021 16:43:41 - INFO - __main__ - Step 19504: {'lr': 0.0004829427206675986, 'samples': 3744768, 'steps': 19503, 'loss/train': 1.3485311269760132} -08/30/2021 16:43:43 - INFO - __main__ - Step 19505: {'lr': 0.000482940794018249, 'samples': 3744960, 'steps': 19504, 'loss/train': 1.680020809173584} -08/30/2021 16:43:44 - INFO - __main__ - Step 19506: {'lr': 0.00048293886726393984, 'samples': 3745152, 'steps': 19505, 'loss/train': 1.2845860719680786} -08/30/2021 16:43:44 - INFO - __main__ - Step 19507: {'lr': 0.00048293694040467205, 'samples': 3745344, 'steps': 19506, 'loss/train': 1.7753819227218628} -08/30/2021 16:43:44 - INFO - __main__ - Step 19508: {'lr': 0.00048293501344044644, 'samples': 3745536, 'steps': 19507, 'loss/train': 1.3423000574111938} -08/30/2021 16:43:45 - INFO - __main__ - Step 19509: {'lr': 0.00048293308637126393, 'samples': 3745728, 'steps': 19508, 'loss/train': 0.06995130330324173} -08/30/2021 16:43:45 - INFO - __main__ - Step 19510: {'lr': 0.0004829311591971254, 'samples': 3745920, 'steps': 19509, 'loss/train': 1.3867766857147217} -08/30/2021 16:43:46 - INFO - __main__ - Step 19511: {'lr': 0.0004829292319180316, 'samples': 3746112, 'steps': 19510, 'loss/train': 1.5491560697555542} -08/30/2021 16:43:47 - INFO - __main__ - Step 19512: {'lr': 0.00048292730453398355, 'samples': 3746304, 'steps': 19511, 'loss/train': 2.0232818126678467} -08/30/2021 16:43:47 - INFO - __main__ - Step 19513: {'lr': 0.00048292537704498203, 'samples': 3746496, 'steps': 19512, 'loss/train': 0.7678455114364624} -08/30/2021 16:43:48 - INFO - __main__ - Step 19514: {'lr': 0.00048292344945102795, 'samples': 3746688, 'steps': 19513, 'loss/train': 1.5709292888641357} -08/30/2021 16:43:48 - INFO - __main__ - Step 19515: {'lr': 0.0004829215217521221, 'samples': 3746880, 'steps': 19514, 'loss/train': 1.579296350479126} -08/30/2021 16:43:49 - INFO - __main__ - Step 19516: {'lr': 0.00048291959394826546, 'samples': 3747072, 'steps': 19515, 'loss/train': 1.4513450860977173} -08/30/2021 16:43:50 - INFO - __main__ - Step 19517: {'lr': 0.00048291766603945885, 'samples': 3747264, 'steps': 19516, 'loss/train': 1.569222331047058} -08/30/2021 16:43:50 - INFO - __main__ - Step 19518: {'lr': 0.0004829157380257031, 'samples': 3747456, 'steps': 19517, 'loss/train': 0.45005112886428833} -08/30/2021 16:43:51 - INFO - __main__ - Step 19519: {'lr': 0.0004829138099069991, 'samples': 3747648, 'steps': 19518, 'loss/train': 2.1218044757843018} -08/30/2021 16:43:51 - INFO - __main__ - Step 19520: {'lr': 0.0004829118816833478, 'samples': 3747840, 'steps': 19519, 'loss/train': 1.4196314811706543} -08/30/2021 16:43:51 - INFO - __main__ - Step 19521: {'lr': 0.00048290995335474997, 'samples': 3748032, 'steps': 19520, 'loss/train': 1.3461363315582275} -08/30/2021 16:43:53 - INFO - __main__ - Step 19522: {'lr': 0.0004829080249212064, 'samples': 3748224, 'steps': 19521, 'loss/train': 1.23183012008667} -08/30/2021 16:43:53 - INFO - __main__ - Step 19523: {'lr': 0.00048290609638271823, 'samples': 3748416, 'steps': 19522, 'loss/train': 0.9542306661605835} -08/30/2021 16:43:54 - INFO - __main__ - Step 19524: {'lr': 0.00048290416773928615, 'samples': 3748608, 'steps': 19523, 'loss/train': 1.4460543394088745} -08/30/2021 16:43:54 - INFO - __main__ - Step 19525: {'lr': 0.00048290223899091094, 'samples': 3748800, 'steps': 19524, 'loss/train': 1.4835989475250244} -08/30/2021 16:43:54 - INFO - __main__ - Step 19526: {'lr': 0.0004829003101375937, 'samples': 3748992, 'steps': 19525, 'loss/train': 1.1736853122711182} -08/30/2021 16:43:56 - INFO - __main__ - Step 19527: {'lr': 0.00048289838117933505, 'samples': 3749184, 'steps': 19526, 'loss/train': 1.1716976165771484} -08/30/2021 16:43:56 - INFO - __main__ - Step 19528: {'lr': 0.0004828964521161361, 'samples': 3749376, 'steps': 19527, 'loss/train': 1.5114786624908447} -08/30/2021 16:43:57 - INFO - __main__ - Step 19529: {'lr': 0.0004828945229479975, 'samples': 3749568, 'steps': 19528, 'loss/train': 1.2109297513961792} -08/30/2021 16:43:57 - INFO - __main__ - Step 19530: {'lr': 0.0004828925936749202, 'samples': 3749760, 'steps': 19529, 'loss/train': 1.4926478862762451} -08/30/2021 16:43:57 - INFO - __main__ - Step 19531: {'lr': 0.0004828906642969052, 'samples': 3749952, 'steps': 19530, 'loss/train': 1.70020592212677} -08/30/2021 16:43:59 - INFO - __main__ - Step 19532: {'lr': 0.00048288873481395323, 'samples': 3750144, 'steps': 19531, 'loss/train': 2.006854295730591} -08/30/2021 16:43:59 - INFO - __main__ - Step 19533: {'lr': 0.0004828868052260652, 'samples': 3750336, 'steps': 19532, 'loss/train': 1.75969398021698} -08/30/2021 16:44:00 - INFO - __main__ - Step 19534: {'lr': 0.0004828848755332419, 'samples': 3750528, 'steps': 19533, 'loss/train': 1.984788179397583} -08/30/2021 16:44:00 - INFO - __main__ - Step 19535: {'lr': 0.0004828829457354843, 'samples': 3750720, 'steps': 19534, 'loss/train': 1.0613036155700684} -08/30/2021 16:44:01 - INFO - __main__ - Step 19536: {'lr': 0.0004828810158327933, 'samples': 3750912, 'steps': 19535, 'loss/train': 1.3652853965759277} -08/30/2021 16:44:01 - INFO - __main__ - Step 19537: {'lr': 0.00048287908582516964, 'samples': 3751104, 'steps': 19536, 'loss/train': 1.3489757776260376} -08/30/2021 16:44:02 - INFO - __main__ - Step 19538: {'lr': 0.00048287715571261424, 'samples': 3751296, 'steps': 19537, 'loss/train': 1.5740211009979248} -08/30/2021 16:44:03 - INFO - __main__ - Step 19539: {'lr': 0.00048287522549512806, 'samples': 3751488, 'steps': 19538, 'loss/train': 1.7897087335586548} -08/30/2021 16:44:03 - INFO - __main__ - Step 19540: {'lr': 0.0004828732951727119, 'samples': 3751680, 'steps': 19539, 'loss/train': 1.388185977935791} -08/30/2021 16:44:04 - INFO - __main__ - Step 19541: {'lr': 0.00048287136474536657, 'samples': 3751872, 'steps': 19540, 'loss/train': 1.5125842094421387} -08/30/2021 16:44:04 - INFO - __main__ - Step 19542: {'lr': 0.000482869434213093, 'samples': 3752064, 'steps': 19541, 'loss/train': 1.222025990486145} -08/30/2021 16:44:05 - INFO - __main__ - Step 19543: {'lr': 0.0004828675035758921, 'samples': 3752256, 'steps': 19542, 'loss/train': 0.8148073554039001} -08/30/2021 16:44:06 - INFO - __main__ - Step 19544: {'lr': 0.00048286557283376465, 'samples': 3752448, 'steps': 19543, 'loss/train': 1.2790478467941284} -08/30/2021 16:44:06 - INFO - __main__ - Step 19545: {'lr': 0.0004828636419867116, 'samples': 3752640, 'steps': 19544, 'loss/train': 0.9558858871459961} -08/30/2021 16:44:07 - INFO - __main__ - Step 19546: {'lr': 0.00048286171103473376, 'samples': 3752832, 'steps': 19545, 'loss/train': 1.670215368270874} -08/30/2021 16:44:07 - INFO - __main__ - Step 19547: {'lr': 0.00048285977997783203, 'samples': 3753024, 'steps': 19546, 'loss/train': 2.879312515258789} -08/30/2021 16:44:09 - INFO - __main__ - Step 19548: {'lr': 0.0004828578488160073, 'samples': 3753216, 'steps': 19547, 'loss/train': 1.5151432752609253} -08/30/2021 16:44:09 - INFO - __main__ - Step 19549: {'lr': 0.0004828559175492604, 'samples': 3753408, 'steps': 19548, 'loss/train': 1.454259991645813} -08/30/2021 16:44:09 - INFO - __main__ - Step 19550: {'lr': 0.0004828539861775922, 'samples': 3753600, 'steps': 19549, 'loss/train': 1.4162417650222778} -08/30/2021 16:44:10 - INFO - __main__ - Step 19551: {'lr': 0.0004828520547010036, 'samples': 3753792, 'steps': 19550, 'loss/train': 2.0042665004730225} -08/30/2021 16:44:10 - INFO - __main__ - Step 19552: {'lr': 0.0004828501231194955, 'samples': 3753984, 'steps': 19551, 'loss/train': 1.8019202947616577} -08/30/2021 16:44:10 - INFO - __main__ - Step 19553: {'lr': 0.0004828481914330687, 'samples': 3754176, 'steps': 19552, 'loss/train': 1.7917029857635498} -08/30/2021 16:44:13 - INFO - __main__ - Step 19554: {'lr': 0.000482846259641724, 'samples': 3754368, 'steps': 19553, 'loss/train': 0.7208302617073059} -08/30/2021 16:44:13 - INFO - __main__ - Step 19555: {'lr': 0.0004828443277454625, 'samples': 3754560, 'steps': 19554, 'loss/train': 1.9223098754882812} -08/30/2021 16:44:13 - INFO - __main__ - Step 19556: {'lr': 0.0004828423957442849, 'samples': 3754752, 'steps': 19555, 'loss/train': 1.1059141159057617} -08/30/2021 16:44:14 - INFO - __main__ - Step 19557: {'lr': 0.00048284046363819213, 'samples': 3754944, 'steps': 19556, 'loss/train': 1.0503833293914795} -08/30/2021 16:44:14 - INFO - __main__ - Step 19558: {'lr': 0.000482838531427185, 'samples': 3755136, 'steps': 19557, 'loss/train': 0.42678242921829224} -08/30/2021 16:44:14 - INFO - __main__ - Step 19559: {'lr': 0.00048283659911126445, 'samples': 3755328, 'steps': 19558, 'loss/train': 1.0968704223632812} -08/30/2021 16:44:17 - INFO - __main__ - Step 19560: {'lr': 0.0004828346666904313, 'samples': 3755520, 'steps': 19559, 'loss/train': 1.1777867078781128} -08/30/2021 16:44:18 - INFO - __main__ - Step 19561: {'lr': 0.00048283273416468644, 'samples': 3755712, 'steps': 19560, 'loss/train': 1.7494573593139648} -08/30/2021 16:44:18 - INFO - __main__ - Step 19562: {'lr': 0.0004828308015340307, 'samples': 3755904, 'steps': 19561, 'loss/train': 1.6501796245574951} -08/30/2021 16:44:18 - INFO - __main__ - Step 19563: {'lr': 0.0004828288687984651, 'samples': 3756096, 'steps': 19562, 'loss/train': 1.9800878763198853} -08/30/2021 16:44:19 - INFO - __main__ - Step 19564: {'lr': 0.0004828269359579903, 'samples': 3756288, 'steps': 19563, 'loss/train': 1.352666974067688} -08/30/2021 16:44:19 - INFO - __main__ - Step 19565: {'lr': 0.00048282500301260735, 'samples': 3756480, 'steps': 19564, 'loss/train': 1.8031508922576904} -08/30/2021 16:44:21 - INFO - __main__ - Step 19566: {'lr': 0.000482823069962317, 'samples': 3756672, 'steps': 19565, 'loss/train': 1.3478760719299316} -08/30/2021 16:44:21 - INFO - __main__ - Step 19567: {'lr': 0.0004828211368071202, 'samples': 3756864, 'steps': 19566, 'loss/train': 1.795411229133606} -08/30/2021 16:44:21 - INFO - __main__ - Step 19568: {'lr': 0.0004828192035470178, 'samples': 3757056, 'steps': 19567, 'loss/train': 1.5540285110473633} -08/30/2021 16:44:22 - INFO - __main__ - Step 19569: {'lr': 0.00048281727018201063, 'samples': 3757248, 'steps': 19568, 'loss/train': 0.5638701915740967} -08/30/2021 16:44:22 - INFO - __main__ - Step 19570: {'lr': 0.00048281533671209955, 'samples': 3757440, 'steps': 19569, 'loss/train': 1.6570943593978882} -08/30/2021 16:44:24 - INFO - __main__ - Step 19571: {'lr': 0.0004828134031372855, 'samples': 3757632, 'steps': 19570, 'loss/train': 1.484034538269043} -08/30/2021 16:44:24 - INFO - __main__ - Step 19572: {'lr': 0.00048281146945756937, 'samples': 3757824, 'steps': 19571, 'loss/train': 2.0269041061401367} -08/30/2021 16:44:25 - INFO - __main__ - Step 19573: {'lr': 0.00048280953567295196, 'samples': 3758016, 'steps': 19572, 'loss/train': 1.5945733785629272} -08/30/2021 16:44:25 - INFO - __main__ - Step 19574: {'lr': 0.0004828076017834342, 'samples': 3758208, 'steps': 19573, 'loss/train': 1.7511272430419922} -08/30/2021 16:44:25 - INFO - __main__ - Step 19575: {'lr': 0.00048280566778901684, 'samples': 3758400, 'steps': 19574, 'loss/train': 1.7083972692489624} -08/30/2021 16:44:26 - INFO - __main__ - Step 19576: {'lr': 0.00048280373368970086, 'samples': 3758592, 'steps': 19575, 'loss/train': 0.8600512742996216} -08/30/2021 16:44:27 - INFO - __main__ - Step 19577: {'lr': 0.0004828017994854872, 'samples': 3758784, 'steps': 19576, 'loss/train': 5.872617244720459} -08/30/2021 16:44:28 - INFO - __main__ - Step 19578: {'lr': 0.0004827998651763765, 'samples': 3758976, 'steps': 19577, 'loss/train': 1.3304845094680786} -08/30/2021 16:44:28 - INFO - __main__ - Step 19579: {'lr': 0.0004827979307623699, 'samples': 3759168, 'steps': 19578, 'loss/train': 1.8319852352142334} -08/30/2021 16:44:29 - INFO - __main__ - Step 19580: {'lr': 0.0004827959962434681, 'samples': 3759360, 'steps': 19579, 'loss/train': 1.463954210281372} -08/30/2021 16:44:29 - INFO - __main__ - Step 19581: {'lr': 0.00048279406161967197, 'samples': 3759552, 'steps': 19580, 'loss/train': 1.9977972507476807} -08/30/2021 16:44:29 - INFO - __main__ - Step 19582: {'lr': 0.0004827921268909825, 'samples': 3759744, 'steps': 19581, 'loss/train': 1.2031890153884888} -08/30/2021 16:44:31 - INFO - __main__ - Step 19583: {'lr': 0.0004827901920574005, 'samples': 3759936, 'steps': 19582, 'loss/train': 4.179448127746582} -08/30/2021 16:44:31 - INFO - __main__ - Step 19584: {'lr': 0.0004827882571189268, 'samples': 3760128, 'steps': 19583, 'loss/train': 1.2608264684677124} -08/30/2021 16:44:32 - INFO - __main__ - Step 19585: {'lr': 0.00048278632207556226, 'samples': 3760320, 'steps': 19584, 'loss/train': 1.7685452699661255} -08/30/2021 16:44:32 - INFO - __main__ - Step 19586: {'lr': 0.00048278438692730784, 'samples': 3760512, 'steps': 19585, 'loss/train': 1.4851990938186646} -08/30/2021 16:44:32 - INFO - __main__ - Step 19587: {'lr': 0.00048278245167416434, 'samples': 3760704, 'steps': 19586, 'loss/train': 1.9291446208953857} -08/30/2021 16:44:34 - INFO - __main__ - Step 19588: {'lr': 0.0004827805163161327, 'samples': 3760896, 'steps': 19587, 'loss/train': 1.251665472984314} -08/30/2021 16:44:34 - INFO - __main__ - Step 19589: {'lr': 0.0004827785808532137, 'samples': 3761088, 'steps': 19588, 'loss/train': 1.1816458702087402} -08/30/2021 16:44:35 - INFO - __main__ - Step 19590: {'lr': 0.0004827766452854083, 'samples': 3761280, 'steps': 19589, 'loss/train': 1.5434032678604126} -08/30/2021 16:44:35 - INFO - __main__ - Step 19591: {'lr': 0.0004827747096127173, 'samples': 3761472, 'steps': 19590, 'loss/train': 1.9463564157485962} -08/30/2021 16:44:35 - INFO - __main__ - Step 19592: {'lr': 0.00048277277383514165, 'samples': 3761664, 'steps': 19591, 'loss/train': 1.7181123495101929} -08/30/2021 16:44:37 - INFO - __main__ - Step 19593: {'lr': 0.00048277083795268216, 'samples': 3761856, 'steps': 19592, 'loss/train': 1.314265251159668} -08/30/2021 16:44:37 - INFO - __main__ - Step 19594: {'lr': 0.0004827689019653397, 'samples': 3762048, 'steps': 19593, 'loss/train': 2.241570234298706} -08/30/2021 16:44:38 - INFO - __main__ - Step 19595: {'lr': 0.00048276696587311525, 'samples': 3762240, 'steps': 19594, 'loss/train': 2.594907283782959} -08/30/2021 16:44:38 - INFO - __main__ - Step 19596: {'lr': 0.00048276502967600955, 'samples': 3762432, 'steps': 19595, 'loss/train': 1.2087441682815552} -08/30/2021 16:44:38 - INFO - __main__ - Step 19597: {'lr': 0.00048276309337402345, 'samples': 3762624, 'steps': 19596, 'loss/train': 1.221699833869934} -08/30/2021 16:44:40 - INFO - __main__ - Step 19598: {'lr': 0.000482761156967158, 'samples': 3762816, 'steps': 19597, 'loss/train': 0.21570028364658356} -08/30/2021 16:44:40 - INFO - __main__ - Step 19599: {'lr': 0.0004827592204554139, 'samples': 3763008, 'steps': 19598, 'loss/train': 1.727426290512085} -08/30/2021 16:44:41 - INFO - __main__ - Step 19600: {'lr': 0.00048275728383879215, 'samples': 3763200, 'steps': 19599, 'loss/train': 2.093048572540283} -08/30/2021 16:44:41 - INFO - __main__ - Step 19601: {'lr': 0.0004827553471172935, 'samples': 3763392, 'steps': 19600, 'loss/train': 1.3071701526641846} -08/30/2021 16:44:41 - INFO - __main__ - Step 19602: {'lr': 0.00048275341029091885, 'samples': 3763584, 'steps': 19601, 'loss/train': 1.304287075996399} -08/30/2021 16:44:42 - INFO - __main__ - Step 19603: {'lr': 0.0004827514733596692, 'samples': 3763776, 'steps': 19602, 'loss/train': 1.56734037399292} -08/30/2021 16:44:43 - INFO - __main__ - Step 19604: {'lr': 0.00048274953632354524, 'samples': 3763968, 'steps': 19603, 'loss/train': 1.830305814743042} -08/30/2021 16:44:44 - INFO - __main__ - Step 19605: {'lr': 0.000482747599182548, 'samples': 3764160, 'steps': 19604, 'loss/train': 1.419538140296936} -08/30/2021 16:44:44 - INFO - __main__ - Step 19606: {'lr': 0.00048274566193667824, 'samples': 3764352, 'steps': 19605, 'loss/train': 1.2372103929519653} -08/30/2021 16:44:45 - INFO - __main__ - Step 19607: {'lr': 0.0004827437245859369, 'samples': 3764544, 'steps': 19606, 'loss/train': 1.2850303649902344} -08/30/2021 16:44:45 - INFO - __main__ - Step 19608: {'lr': 0.0004827417871303248, 'samples': 3764736, 'steps': 19607, 'loss/train': 0.9325003027915955} -08/30/2021 16:44:47 - INFO - __main__ - Step 19609: {'lr': 0.00048273984956984285, 'samples': 3764928, 'steps': 19608, 'loss/train': 1.6945222616195679} -08/30/2021 16:44:47 - INFO - __main__ - Step 19610: {'lr': 0.0004827379119044919, 'samples': 3765120, 'steps': 19609, 'loss/train': 2.009012460708618} -08/30/2021 16:44:47 - INFO - __main__ - Step 19611: {'lr': 0.00048273597413427284, 'samples': 3765312, 'steps': 19610, 'loss/train': 0.20731039345264435} -08/30/2021 16:44:48 - INFO - __main__ - Step 19612: {'lr': 0.00048273403625918653, 'samples': 3765504, 'steps': 19611, 'loss/train': 1.801841139793396} -08/30/2021 16:44:48 - INFO - __main__ - Step 19613: {'lr': 0.0004827320982792339, 'samples': 3765696, 'steps': 19612, 'loss/train': 1.930281639099121} -08/30/2021 16:44:50 - INFO - __main__ - Step 19614: {'lr': 0.00048273016019441585, 'samples': 3765888, 'steps': 19613, 'loss/train': 2.790879487991333} -08/30/2021 16:44:50 - INFO - __main__ - Step 19615: {'lr': 0.00048272822200473304, 'samples': 3766080, 'steps': 19614, 'loss/train': 0.7464519739151001} -08/30/2021 16:44:51 - INFO - __main__ - Step 19616: {'lr': 0.0004827262837101866, 'samples': 3766272, 'steps': 19615, 'loss/train': 1.577192783355713} -08/30/2021 16:44:51 - INFO - __main__ - Step 19617: {'lr': 0.0004827243453107772, 'samples': 3766464, 'steps': 19616, 'loss/train': 1.2627135515213013} -08/30/2021 16:44:51 - INFO - __main__ - Step 19618: {'lr': 0.0004827224068065058, 'samples': 3766656, 'steps': 19617, 'loss/train': 2.4496021270751953} -08/30/2021 16:44:53 - INFO - __main__ - Step 19619: {'lr': 0.0004827204681973733, 'samples': 3766848, 'steps': 19618, 'loss/train': 1.3852035999298096} -08/30/2021 16:44:54 - INFO - __main__ - Step 19620: {'lr': 0.00048271852948338057, 'samples': 3767040, 'steps': 19619, 'loss/train': 2.0666980743408203} -08/30/2021 16:44:54 - INFO - __main__ - Step 19621: {'lr': 0.00048271659066452847, 'samples': 3767232, 'steps': 19620, 'loss/train': 6.3381547927856445} -08/30/2021 16:44:55 - INFO - __main__ - Step 19622: {'lr': 0.0004827146517408178, 'samples': 3767424, 'steps': 19621, 'loss/train': 1.6556847095489502} -08/30/2021 16:44:55 - INFO - __main__ - Step 19623: {'lr': 0.0004827127127122495, 'samples': 3767616, 'steps': 19622, 'loss/train': 1.4426981210708618} -08/30/2021 16:44:55 - INFO - __main__ - Step 19624: {'lr': 0.00048271077357882455, 'samples': 3767808, 'steps': 19623, 'loss/train': 0.5524057745933533} -08/30/2021 16:44:57 - INFO - __main__ - Step 19625: {'lr': 0.00048270883434054364, 'samples': 3768000, 'steps': 19624, 'loss/train': 1.514841914176941} -08/30/2021 16:44:57 - INFO - __main__ - Step 19626: {'lr': 0.00048270689499740774, 'samples': 3768192, 'steps': 19625, 'loss/train': 1.9654330015182495} -08/30/2021 16:44:58 - INFO - __main__ - Step 19627: {'lr': 0.0004827049555494176, 'samples': 3768384, 'steps': 19626, 'loss/train': 1.2500262260437012} -08/30/2021 16:44:58 - INFO - __main__ - Step 19628: {'lr': 0.00048270301599657436, 'samples': 3768576, 'steps': 19627, 'loss/train': 1.5800343751907349} -08/30/2021 16:44:58 - INFO - __main__ - Step 19629: {'lr': 0.0004827010763388786, 'samples': 3768768, 'steps': 19628, 'loss/train': 1.7905545234680176} -08/30/2021 16:44:59 - INFO - __main__ - Step 19630: {'lr': 0.00048269913657633147, 'samples': 3768960, 'steps': 19629, 'loss/train': 1.5206153392791748} -08/30/2021 16:45:00 - INFO - __main__ - Step 19631: {'lr': 0.00048269719670893357, 'samples': 3769152, 'steps': 19630, 'loss/train': 1.2802495956420898} -08/30/2021 16:45:01 - INFO - __main__ - Step 19632: {'lr': 0.00048269525673668595, 'samples': 3769344, 'steps': 19631, 'loss/train': 1.1612682342529297} -08/30/2021 16:45:01 - INFO - __main__ - Step 19633: {'lr': 0.00048269331665958947, 'samples': 3769536, 'steps': 19632, 'loss/train': 1.210286021232605} -08/30/2021 16:45:02 - INFO - __main__ - Step 19634: {'lr': 0.00048269137647764495, 'samples': 3769728, 'steps': 19633, 'loss/train': 1.4296683073043823} -08/30/2021 16:45:02 - INFO - __main__ - Step 19635: {'lr': 0.00048268943619085325, 'samples': 3769920, 'steps': 19634, 'loss/train': 2.321168899536133} -08/30/2021 16:45:04 - INFO - __main__ - Step 19636: {'lr': 0.00048268749579921536, 'samples': 3770112, 'steps': 19635, 'loss/train': 1.4415132999420166} -08/30/2021 16:45:04 - INFO - __main__ - Step 19637: {'lr': 0.00048268555530273197, 'samples': 3770304, 'steps': 19636, 'loss/train': 0.2824762761592865} -08/30/2021 16:45:04 - INFO - __main__ - Step 19638: {'lr': 0.0004826836147014041, 'samples': 3770496, 'steps': 19637, 'loss/train': 1.977523922920227} -08/30/2021 16:45:05 - INFO - __main__ - Step 19639: {'lr': 0.0004826816739952326, 'samples': 3770688, 'steps': 19638, 'loss/train': 1.6820950508117676} -08/30/2021 16:45:05 - INFO - __main__ - Step 19640: {'lr': 0.0004826797331842183, 'samples': 3770880, 'steps': 19639, 'loss/train': 2.1210596561431885} -08/30/2021 16:45:07 - INFO - __main__ - Step 19641: {'lr': 0.0004826777922683622, 'samples': 3771072, 'steps': 19640, 'loss/train': 1.9992430210113525} -08/30/2021 16:45:07 - INFO - __main__ - Step 19642: {'lr': 0.0004826758512476649, 'samples': 3771264, 'steps': 19641, 'loss/train': 2.0058212280273438} -08/30/2021 16:45:08 - INFO - __main__ - Step 19643: {'lr': 0.0004826739101221276, 'samples': 3771456, 'steps': 19642, 'loss/train': 1.8318320512771606} -08/30/2021 16:45:08 - INFO - __main__ - Step 19644: {'lr': 0.000482671968891751, 'samples': 3771648, 'steps': 19643, 'loss/train': 1.7951756715774536} -08/30/2021 16:45:08 - INFO - __main__ - Step 19645: {'lr': 0.000482670027556536, 'samples': 3771840, 'steps': 19644, 'loss/train': 1.7677150964736938} -08/30/2021 16:45:09 - INFO - __main__ - Step 19646: {'lr': 0.0004826680861164834, 'samples': 3772032, 'steps': 19645, 'loss/train': 1.8392150402069092} -08/30/2021 16:45:10 - INFO - __main__ - Step 19647: {'lr': 0.00048266614457159426, 'samples': 3772224, 'steps': 19646, 'loss/train': 1.3000612258911133} -08/30/2021 16:45:11 - INFO - __main__ - Step 19648: {'lr': 0.0004826642029218693, 'samples': 3772416, 'steps': 19647, 'loss/train': 1.3055709600448608} -08/30/2021 16:45:11 - INFO - __main__ - Step 19649: {'lr': 0.00048266226116730937, 'samples': 3772608, 'steps': 19648, 'loss/train': 1.7779978513717651} -08/30/2021 16:45:11 - INFO - __main__ - Step 19650: {'lr': 0.00048266031930791555, 'samples': 3772800, 'steps': 19649, 'loss/train': 1.8078025579452515} -08/30/2021 16:45:12 - INFO - __main__ - Step 19651: {'lr': 0.0004826583773436884, 'samples': 3772992, 'steps': 19650, 'loss/train': 1.2400726079940796} -08/30/2021 16:45:13 - INFO - __main__ - Step 19652: {'lr': 0.00048265643527462915, 'samples': 3773184, 'steps': 19651, 'loss/train': 1.1456602811813354} -08/30/2021 16:45:14 - INFO - __main__ - Step 19653: {'lr': 0.00048265449310073847, 'samples': 3773376, 'steps': 19652, 'loss/train': 1.620891809463501} -08/30/2021 16:45:14 - INFO - __main__ - Step 19654: {'lr': 0.0004826525508220172, 'samples': 3773568, 'steps': 19653, 'loss/train': 1.7850602865219116} -08/30/2021 16:45:15 - INFO - __main__ - Step 19655: {'lr': 0.0004826506084384663, 'samples': 3773760, 'steps': 19654, 'loss/train': 0.13912451267242432} -08/30/2021 16:45:15 - INFO - __main__ - Step 19656: {'lr': 0.00048264866595008665, 'samples': 3773952, 'steps': 19655, 'loss/train': 1.826074481010437} -08/30/2021 16:45:17 - INFO - __main__ - Step 19657: {'lr': 0.0004826467233568791, 'samples': 3774144, 'steps': 19656, 'loss/train': 1.2786715030670166} -08/30/2021 16:45:17 - INFO - __main__ - Step 19658: {'lr': 0.00048264478065884454, 'samples': 3774336, 'steps': 19657, 'loss/train': 1.6209207773208618} -08/30/2021 16:45:18 - INFO - __main__ - Step 19659: {'lr': 0.0004826428378559838, 'samples': 3774528, 'steps': 19658, 'loss/train': 1.7213256359100342} -08/30/2021 16:45:18 - INFO - __main__ - Step 19660: {'lr': 0.00048264089494829776, 'samples': 3774720, 'steps': 19659, 'loss/train': 0.07078750431537628} -08/30/2021 16:45:18 - INFO - __main__ - Step 19661: {'lr': 0.0004826389519357874, 'samples': 3774912, 'steps': 19660, 'loss/train': 1.532974362373352} -08/30/2021 16:45:19 - INFO - __main__ - Step 19662: {'lr': 0.00048263700881845346, 'samples': 3775104, 'steps': 19661, 'loss/train': 1.3122813701629639} -08/30/2021 16:45:20 - INFO - __main__ - Step 19663: {'lr': 0.00048263506559629687, 'samples': 3775296, 'steps': 19662, 'loss/train': 1.125578761100769} -08/30/2021 16:45:21 - INFO - __main__ - Step 19664: {'lr': 0.00048263312226931853, 'samples': 3775488, 'steps': 19663, 'loss/train': 2.198880434036255} -08/30/2021 16:45:21 - INFO - __main__ - Step 19665: {'lr': 0.0004826311788375193, 'samples': 3775680, 'steps': 19664, 'loss/train': 1.7454428672790527} -08/30/2021 16:45:21 - INFO - __main__ - Step 19666: {'lr': 0.00048262923530090007, 'samples': 3775872, 'steps': 19665, 'loss/train': 1.5772764682769775} -08/30/2021 16:45:22 - INFO - __main__ - Step 19667: {'lr': 0.0004826272916594616, 'samples': 3776064, 'steps': 19666, 'loss/train': 1.87223482131958} -08/30/2021 16:45:23 - INFO - __main__ - Step 19668: {'lr': 0.000482625347913205, 'samples': 3776256, 'steps': 19667, 'loss/train': 1.2227168083190918} -08/30/2021 16:45:23 - INFO - __main__ - Step 19669: {'lr': 0.0004826234040621309, 'samples': 3776448, 'steps': 19668, 'loss/train': 0.7310164570808411} -08/30/2021 16:45:24 - INFO - __main__ - Step 19670: {'lr': 0.00048262146010624035, 'samples': 3776640, 'steps': 19669, 'loss/train': 0.8155099749565125} -08/30/2021 16:45:24 - INFO - __main__ - Step 19671: {'lr': 0.0004826195160455341, 'samples': 3776832, 'steps': 19670, 'loss/train': 1.195999264717102} -08/30/2021 16:45:25 - INFO - __main__ - Step 19672: {'lr': 0.00048261757188001314, 'samples': 3777024, 'steps': 19671, 'loss/train': 1.8243367671966553} -08/30/2021 16:45:25 - INFO - __main__ - Step 19673: {'lr': 0.00048261562760967824, 'samples': 3777216, 'steps': 19672, 'loss/train': 1.3731988668441772} -08/30/2021 16:45:27 - INFO - __main__ - Step 19674: {'lr': 0.0004826136832345304, 'samples': 3777408, 'steps': 19673, 'loss/train': 1.8078889846801758} -08/30/2021 16:45:27 - INFO - __main__ - Step 19675: {'lr': 0.00048261173875457035, 'samples': 3777600, 'steps': 19674, 'loss/train': 1.550720453262329} -08/30/2021 16:45:28 - INFO - __main__ - Step 19676: {'lr': 0.0004826097941697991, 'samples': 3777792, 'steps': 19675, 'loss/train': 1.763080358505249} -08/30/2021 16:45:28 - INFO - __main__ - Step 19677: {'lr': 0.0004826078494802174, 'samples': 3777984, 'steps': 19676, 'loss/train': 0.2705342173576355} -08/30/2021 16:45:28 - INFO - __main__ - Step 19678: {'lr': 0.00048260590468582624, 'samples': 3778176, 'steps': 19677, 'loss/train': 1.0702122449874878} -08/30/2021 16:45:30 - INFO - __main__ - Step 19679: {'lr': 0.0004826039597866265, 'samples': 3778368, 'steps': 19678, 'loss/train': 1.5734738111495972} -08/30/2021 16:45:31 - INFO - __main__ - Step 19680: {'lr': 0.00048260201478261887, 'samples': 3778560, 'steps': 19679, 'loss/train': 1.3631218671798706} -08/30/2021 16:45:31 - INFO - __main__ - Step 19681: {'lr': 0.0004826000696738045, 'samples': 3778752, 'steps': 19680, 'loss/train': 1.1993298530578613} -08/30/2021 16:45:31 - INFO - __main__ - Step 19682: {'lr': 0.000482598124460184, 'samples': 3778944, 'steps': 19681, 'loss/train': 1.9589277505874634} -08/30/2021 16:45:32 - INFO - __main__ - Step 19683: {'lr': 0.00048259617914175846, 'samples': 3779136, 'steps': 19682, 'loss/train': 1.520262360572815} -08/30/2021 16:45:33 - INFO - __main__ - Step 19684: {'lr': 0.00048259423371852867, 'samples': 3779328, 'steps': 19683, 'loss/train': 1.4517934322357178} -08/30/2021 16:45:34 - INFO - __main__ - Step 19685: {'lr': 0.0004825922881904955, 'samples': 3779520, 'steps': 19684, 'loss/train': 1.9209898710250854} -08/30/2021 16:45:34 - INFO - __main__ - Step 19686: {'lr': 0.00048259034255765984, 'samples': 3779712, 'steps': 19685, 'loss/train': 1.4244006872177124} -08/30/2021 16:45:34 - INFO - __main__ - Step 19687: {'lr': 0.00048258839682002253, 'samples': 3779904, 'steps': 19686, 'loss/train': 1.7588123083114624} -08/30/2021 16:45:35 - INFO - __main__ - Step 19688: {'lr': 0.00048258645097758445, 'samples': 3780096, 'steps': 19687, 'loss/train': 1.736598014831543} -08/30/2021 16:45:36 - INFO - __main__ - Step 19689: {'lr': 0.0004825845050303466, 'samples': 3780288, 'steps': 19688, 'loss/train': 1.4805346727371216} -08/30/2021 16:45:37 - INFO - __main__ - Step 19690: {'lr': 0.00048258255897830967, 'samples': 3780480, 'steps': 19689, 'loss/train': 1.5934196710586548} -08/30/2021 16:45:37 - INFO - __main__ - Step 19691: {'lr': 0.0004825806128214747, 'samples': 3780672, 'steps': 19690, 'loss/train': 1.61527419090271} -08/30/2021 16:45:37 - INFO - __main__ - Step 19692: {'lr': 0.00048257866655984237, 'samples': 3780864, 'steps': 19691, 'loss/train': 1.6771128177642822} -08/30/2021 16:45:38 - INFO - __main__ - Step 19693: {'lr': 0.0004825767201934138, 'samples': 3781056, 'steps': 19692, 'loss/train': 1.5107687711715698} -08/30/2021 16:45:39 - INFO - __main__ - Step 19694: {'lr': 0.0004825747737221897, 'samples': 3781248, 'steps': 19693, 'loss/train': 1.7452632188796997} -08/30/2021 16:45:40 - INFO - __main__ - Step 19695: {'lr': 0.000482572827146171, 'samples': 3781440, 'steps': 19694, 'loss/train': 1.260412335395813} -08/30/2021 16:45:40 - INFO - __main__ - Step 19696: {'lr': 0.00048257088046535864, 'samples': 3781632, 'steps': 19695, 'loss/train': 1.8159458637237549} -08/30/2021 16:45:41 - INFO - __main__ - Step 19697: {'lr': 0.0004825689336797534, 'samples': 3781824, 'steps': 19696, 'loss/train': 1.7496967315673828} -08/30/2021 16:45:41 - INFO - __main__ - Step 19698: {'lr': 0.00048256698678935615, 'samples': 3782016, 'steps': 19697, 'loss/train': 6.348109245300293} -08/30/2021 16:45:41 - INFO - __main__ - Step 19699: {'lr': 0.00048256503979416776, 'samples': 3782208, 'steps': 19698, 'loss/train': 2.1363143920898438} -08/30/2021 16:45:43 - INFO - __main__ - Step 19700: {'lr': 0.0004825630926941892, 'samples': 3782400, 'steps': 19699, 'loss/train': 0.06274674832820892} -08/30/2021 16:45:43 - INFO - __main__ - Step 19701: {'lr': 0.0004825611454894213, 'samples': 3782592, 'steps': 19700, 'loss/train': 1.3938616514205933} -08/30/2021 16:45:44 - INFO - __main__ - Step 19702: {'lr': 0.000482559198179865, 'samples': 3782784, 'steps': 19701, 'loss/train': 1.8158903121948242} -08/30/2021 16:45:44 - INFO - __main__ - Step 19703: {'lr': 0.00048255725076552103, 'samples': 3782976, 'steps': 19702, 'loss/train': 1.9675157070159912} -08/30/2021 16:45:44 - INFO - __main__ - Step 19704: {'lr': 0.0004825553032463904, 'samples': 3783168, 'steps': 19703, 'loss/train': 1.5207316875457764} -08/30/2021 16:45:45 - INFO - __main__ - Step 19705: {'lr': 0.00048255335562247395, 'samples': 3783360, 'steps': 19704, 'loss/train': 1.7516065835952759} -08/30/2021 16:45:46 - INFO - __main__ - Step 19706: {'lr': 0.0004825514078937725, 'samples': 3783552, 'steps': 19705, 'loss/train': 1.459518313407898} -08/30/2021 16:45:47 - INFO - __main__ - Step 19707: {'lr': 0.000482549460060287, 'samples': 3783744, 'steps': 19706, 'loss/train': 1.0809588432312012} -08/30/2021 16:45:47 - INFO - __main__ - Step 19708: {'lr': 0.0004825475121220183, 'samples': 3783936, 'steps': 19707, 'loss/train': 1.7737821340560913} -08/30/2021 16:45:47 - INFO - __main__ - Step 19709: {'lr': 0.0004825455640789672, 'samples': 3784128, 'steps': 19708, 'loss/train': 1.630860447883606} -08/30/2021 16:45:48 - INFO - __main__ - Step 19710: {'lr': 0.00048254361593113475, 'samples': 3784320, 'steps': 19709, 'loss/train': 1.9221594333648682} -08/30/2021 16:45:49 - INFO - __main__ - Step 19711: {'lr': 0.0004825416676785217, 'samples': 3784512, 'steps': 19710, 'loss/train': 2.125366687774658} -08/30/2021 16:45:50 - INFO - __main__ - Step 19712: {'lr': 0.000482539719321129, 'samples': 3784704, 'steps': 19711, 'loss/train': 1.2897369861602783} -08/30/2021 16:45:50 - INFO - __main__ - Step 19713: {'lr': 0.00048253777085895745, 'samples': 3784896, 'steps': 19712, 'loss/train': 1.3967864513397217} -08/30/2021 16:45:50 - INFO - __main__ - Step 19714: {'lr': 0.000482535822292008, 'samples': 3785088, 'steps': 19713, 'loss/train': 1.3750593662261963} -08/30/2021 16:45:51 - INFO - __main__ - Step 19715: {'lr': 0.0004825338736202815, 'samples': 3785280, 'steps': 19714, 'loss/train': 1.3700599670410156} -08/30/2021 16:45:52 - INFO - __main__ - Step 19716: {'lr': 0.00048253192484377884, 'samples': 3785472, 'steps': 19715, 'loss/train': 1.6668800115585327} -08/30/2021 16:45:53 - INFO - __main__ - Step 19717: {'lr': 0.0004825299759625008, 'samples': 3785664, 'steps': 19716, 'loss/train': 1.5117876529693604} -08/30/2021 16:45:53 - INFO - __main__ - Step 19718: {'lr': 0.0004825280269764484, 'samples': 3785856, 'steps': 19717, 'loss/train': 1.9901987314224243} -08/30/2021 16:45:53 - INFO - __main__ - Step 19719: {'lr': 0.0004825260778856224, 'samples': 3786048, 'steps': 19718, 'loss/train': 1.9022563695907593} -08/30/2021 16:45:54 - INFO - __main__ - Step 19720: {'lr': 0.0004825241286900238, 'samples': 3786240, 'steps': 19719, 'loss/train': 1.249380111694336} -08/30/2021 16:45:55 - INFO - __main__ - Step 19721: {'lr': 0.0004825221793896535, 'samples': 3786432, 'steps': 19720, 'loss/train': 2.0074994564056396} -08/30/2021 16:45:56 - INFO - __main__ - Step 19722: {'lr': 0.0004825202299845122, 'samples': 3786624, 'steps': 19721, 'loss/train': 2.1659655570983887} -08/30/2021 16:45:56 - INFO - __main__ - Step 19723: {'lr': 0.00048251828047460077, 'samples': 3786816, 'steps': 19722, 'loss/train': 1.6186447143554688} -08/30/2021 16:45:56 - INFO - __main__ - Step 19724: {'lr': 0.0004825163308599203, 'samples': 3787008, 'steps': 19723, 'loss/train': 1.5282928943634033} -08/30/2021 16:45:57 - INFO - __main__ - Step 19725: {'lr': 0.0004825143811404716, 'samples': 3787200, 'steps': 19724, 'loss/train': 1.08818519115448} -08/30/2021 16:45:59 - INFO - __main__ - Step 19726: {'lr': 0.00048251243131625543, 'samples': 3787392, 'steps': 19725, 'loss/train': 1.213646411895752} -08/30/2021 16:45:59 - INFO - __main__ - Step 19727: {'lr': 0.0004825104813872728, 'samples': 3787584, 'steps': 19726, 'loss/train': 1.608264446258545} -08/30/2021 16:46:00 - INFO - __main__ - Step 19728: {'lr': 0.0004825085313535245, 'samples': 3787776, 'steps': 19727, 'loss/train': 1.5605945587158203} -08/30/2021 16:46:00 - INFO - __main__ - Step 19729: {'lr': 0.00048250658121501145, 'samples': 3787968, 'steps': 19728, 'loss/train': 2.1500375270843506} -08/30/2021 16:46:00 - INFO - __main__ - Step 19730: {'lr': 0.00048250463097173447, 'samples': 3788160, 'steps': 19729, 'loss/train': 1.2001900672912598} -08/30/2021 16:46:02 - INFO - __main__ - Step 19731: {'lr': 0.0004825026806236946, 'samples': 3788352, 'steps': 19730, 'loss/train': 1.7775330543518066} -08/30/2021 16:46:02 - INFO - __main__ - Step 19732: {'lr': 0.00048250073017089257, 'samples': 3788544, 'steps': 19731, 'loss/train': 1.0759825706481934} -08/30/2021 16:46:03 - INFO - __main__ - Step 19733: {'lr': 0.00048249877961332923, 'samples': 3788736, 'steps': 19732, 'loss/train': 2.6747982501983643} -08/30/2021 16:46:03 - INFO - __main__ - Step 19734: {'lr': 0.0004824968289510056, 'samples': 3788928, 'steps': 19733, 'loss/train': 1.3608564138412476} -08/30/2021 16:46:03 - INFO - __main__ - Step 19735: {'lr': 0.0004824948781839225, 'samples': 3789120, 'steps': 19734, 'loss/train': 1.852820873260498} -08/30/2021 16:46:05 - INFO - __main__ - Step 19736: {'lr': 0.0004824929273120807, 'samples': 3789312, 'steps': 19735, 'loss/train': 1.777243971824646} -08/30/2021 16:46:05 - INFO - __main__ - Step 19737: {'lr': 0.0004824909763354813, 'samples': 3789504, 'steps': 19736, 'loss/train': 1.8846819400787354} -08/30/2021 16:46:06 - INFO - __main__ - Step 19738: {'lr': 0.00048248902525412497, 'samples': 3789696, 'steps': 19737, 'loss/train': 1.4429880380630493} -08/30/2021 16:46:06 - INFO - __main__ - Step 19739: {'lr': 0.0004824870740680127, 'samples': 3789888, 'steps': 19738, 'loss/train': 1.995111107826233} -08/30/2021 16:46:07 - INFO - __main__ - Step 19740: {'lr': 0.0004824851227771453, 'samples': 3790080, 'steps': 19739, 'loss/train': 1.3590061664581299} -08/30/2021 16:46:07 - INFO - __main__ - Step 19741: {'lr': 0.00048248317138152374, 'samples': 3790272, 'steps': 19740, 'loss/train': 1.6957652568817139} -08/30/2021 16:46:08 - INFO - __main__ - Step 19742: {'lr': 0.00048248121988114887, 'samples': 3790464, 'steps': 19741, 'loss/train': 2.3059370517730713} -08/30/2021 16:46:09 - INFO - __main__ - Step 19743: {'lr': 0.00048247926827602153, 'samples': 3790656, 'steps': 19742, 'loss/train': 1.349485158920288} -08/30/2021 16:46:09 - INFO - __main__ - Step 19744: {'lr': 0.0004824773165661426, 'samples': 3790848, 'steps': 19743, 'loss/train': 1.3163179159164429} -08/30/2021 16:46:10 - INFO - __main__ - Step 19745: {'lr': 0.000482475364751513, 'samples': 3791040, 'steps': 19744, 'loss/train': 1.5471094846725464} -08/30/2021 16:46:10 - INFO - __main__ - Step 19746: {'lr': 0.0004824734128321335, 'samples': 3791232, 'steps': 19745, 'loss/train': 1.1037479639053345} -08/30/2021 16:46:11 - INFO - __main__ - Step 19747: {'lr': 0.0004824714608080052, 'samples': 3791424, 'steps': 19746, 'loss/train': 1.6759765148162842} -08/30/2021 16:46:12 - INFO - __main__ - Step 19748: {'lr': 0.00048246950867912873, 'samples': 3791616, 'steps': 19747, 'loss/train': 1.7748245000839233} -08/30/2021 16:46:12 - INFO - __main__ - Step 19749: {'lr': 0.0004824675564455052, 'samples': 3791808, 'steps': 19748, 'loss/train': 1.7343673706054688} -08/30/2021 16:46:13 - INFO - __main__ - Step 19750: {'lr': 0.0004824656041071353, 'samples': 3792000, 'steps': 19749, 'loss/train': 1.4536768198013306} -08/30/2021 16:46:13 - INFO - __main__ - Step 19751: {'lr': 0.00048246365166402003, 'samples': 3792192, 'steps': 19750, 'loss/train': 1.4853363037109375} -08/30/2021 16:46:14 - INFO - __main__ - Step 19752: {'lr': 0.00048246169911616015, 'samples': 3792384, 'steps': 19751, 'loss/train': 2.1229076385498047} -08/30/2021 16:46:15 - INFO - __main__ - Step 19753: {'lr': 0.00048245974646355673, 'samples': 3792576, 'steps': 19752, 'loss/train': 1.5881577730178833} -08/30/2021 16:46:15 - INFO - __main__ - Step 19754: {'lr': 0.00048245779370621045, 'samples': 3792768, 'steps': 19753, 'loss/train': 0.0828220397233963} -08/30/2021 16:46:16 - INFO - __main__ - Step 19755: {'lr': 0.0004824558408441223, 'samples': 3792960, 'steps': 19754, 'loss/train': 1.7623757123947144} -08/30/2021 16:46:16 - INFO - __main__ - Step 19756: {'lr': 0.00048245388787729316, 'samples': 3793152, 'steps': 19755, 'loss/train': 1.5343509912490845} -08/30/2021 16:46:18 - INFO - __main__ - Step 19757: {'lr': 0.00048245193480572383, 'samples': 3793344, 'steps': 19756, 'loss/train': 1.145225167274475} -08/30/2021 16:46:18 - INFO - __main__ - Step 19758: {'lr': 0.0004824499816294152, 'samples': 3793536, 'steps': 19757, 'loss/train': 1.65183424949646} -08/30/2021 16:46:18 - INFO - __main__ - Step 19759: {'lr': 0.0004824480283483683, 'samples': 3793728, 'steps': 19758, 'loss/train': 1.3957730531692505} -08/30/2021 16:46:19 - INFO - __main__ - Step 19760: {'lr': 0.0004824460749625839, 'samples': 3793920, 'steps': 19759, 'loss/train': 0.8056812286376953} -08/30/2021 16:46:19 - INFO - __main__ - Step 19761: {'lr': 0.00048244412147206283, 'samples': 3794112, 'steps': 19760, 'loss/train': 1.4695429801940918} -08/30/2021 16:46:21 - INFO - __main__ - Step 19762: {'lr': 0.00048244216787680607, 'samples': 3794304, 'steps': 19761, 'loss/train': 1.407184362411499} -08/30/2021 16:46:21 - INFO - __main__ - Step 19763: {'lr': 0.0004824402141768145, 'samples': 3794496, 'steps': 19762, 'loss/train': 1.706057071685791} -08/30/2021 16:46:21 - INFO - __main__ - Step 19764: {'lr': 0.0004824382603720888, 'samples': 3794688, 'steps': 19763, 'loss/train': 1.8974753618240356} -08/30/2021 16:46:22 - INFO - __main__ - Step 19765: {'lr': 0.00048243630646263016, 'samples': 3794880, 'steps': 19764, 'loss/train': 1.7434874773025513} -08/30/2021 16:46:22 - INFO - __main__ - Step 19766: {'lr': 0.00048243435244843926, 'samples': 3795072, 'steps': 19765, 'loss/train': 1.6711057424545288} -08/30/2021 16:46:22 - INFO - __main__ - Step 19767: {'lr': 0.000482432398329517, 'samples': 3795264, 'steps': 19766, 'loss/train': 1.4974653720855713} -08/30/2021 16:46:24 - INFO - __main__ - Step 19768: {'lr': 0.00048243044410586433, 'samples': 3795456, 'steps': 19767, 'loss/train': 1.5653835535049438} -08/30/2021 16:46:24 - INFO - __main__ - Step 19769: {'lr': 0.00048242848977748205, 'samples': 3795648, 'steps': 19768, 'loss/train': 0.8201896548271179} -08/30/2021 16:46:25 - INFO - __main__ - Step 19770: {'lr': 0.0004824265353443711, 'samples': 3795840, 'steps': 19769, 'loss/train': 1.5632750988006592} -08/30/2021 16:46:25 - INFO - __main__ - Step 19771: {'lr': 0.00048242458080653233, 'samples': 3796032, 'steps': 19770, 'loss/train': 1.306421160697937} -08/30/2021 16:46:26 - INFO - __main__ - Step 19772: {'lr': 0.0004824226261639666, 'samples': 3796224, 'steps': 19771, 'loss/train': 1.869511604309082} -08/30/2021 16:46:27 - INFO - __main__ - Step 19773: {'lr': 0.00048242067141667487, 'samples': 3796416, 'steps': 19772, 'loss/train': 1.3827139139175415} -08/30/2021 16:46:28 - INFO - __main__ - Step 19774: {'lr': 0.00048241871656465795, 'samples': 3796608, 'steps': 19773, 'loss/train': 0.756730854511261} -08/30/2021 16:46:28 - INFO - __main__ - Step 19775: {'lr': 0.0004824167616079168, 'samples': 3796800, 'steps': 19774, 'loss/train': 1.6832746267318726} -08/30/2021 16:46:28 - INFO - __main__ - Step 19776: {'lr': 0.0004824148065464522, 'samples': 3796992, 'steps': 19775, 'loss/train': 1.5018789768218994} -08/30/2021 16:46:29 - INFO - __main__ - Step 19777: {'lr': 0.00048241285138026505, 'samples': 3797184, 'steps': 19776, 'loss/train': 1.9354379177093506} -08/30/2021 16:46:30 - INFO - __main__ - Step 19778: {'lr': 0.00048241089610935627, 'samples': 3797376, 'steps': 19777, 'loss/train': 1.5387619733810425} -08/30/2021 16:46:31 - INFO - __main__ - Step 19779: {'lr': 0.0004824089407337267, 'samples': 3797568, 'steps': 19778, 'loss/train': 1.7963557243347168} -08/30/2021 16:46:31 - INFO - __main__ - Step 19780: {'lr': 0.00048240698525337726, 'samples': 3797760, 'steps': 19779, 'loss/train': 1.811444878578186} -08/30/2021 16:46:31 - INFO - __main__ - Step 19781: {'lr': 0.0004824050296683089, 'samples': 3797952, 'steps': 19780, 'loss/train': 1.7149640321731567} -08/30/2021 16:46:32 - INFO - __main__ - Step 19782: {'lr': 0.0004824030739785223, 'samples': 3798144, 'steps': 19781, 'loss/train': 1.2311028242111206} -08/30/2021 16:46:32 - INFO - __main__ - Step 19783: {'lr': 0.00048240111818401854, 'samples': 3798336, 'steps': 19782, 'loss/train': 1.7671340703964233} -08/30/2021 16:46:34 - INFO - __main__ - Step 19784: {'lr': 0.0004823991622847984, 'samples': 3798528, 'steps': 19783, 'loss/train': 1.5080082416534424} -08/30/2021 16:46:35 - INFO - __main__ - Step 19785: {'lr': 0.0004823972062808628, 'samples': 3798720, 'steps': 19784, 'loss/train': 1.4996699094772339} -08/30/2021 16:46:35 - INFO - __main__ - Step 19786: {'lr': 0.0004823952501722126, 'samples': 3798912, 'steps': 19785, 'loss/train': 1.8464879989624023} -08/30/2021 16:46:35 - INFO - __main__ - Step 19787: {'lr': 0.00048239329395884865, 'samples': 3799104, 'steps': 19786, 'loss/train': 1.6811447143554688} -08/30/2021 16:46:36 - INFO - __main__ - Step 19788: {'lr': 0.00048239133764077193, 'samples': 3799296, 'steps': 19787, 'loss/train': 1.9512839317321777} -08/30/2021 16:46:37 - INFO - __main__ - Step 19789: {'lr': 0.00048238938121798313, 'samples': 3799488, 'steps': 19788, 'loss/train': 1.5324562788009644} -08/30/2021 16:46:38 - INFO - __main__ - Step 19790: {'lr': 0.00048238742469048344, 'samples': 3799680, 'steps': 19789, 'loss/train': 1.4485249519348145} -08/30/2021 16:46:38 - INFO - __main__ - Step 19791: {'lr': 0.00048238546805827345, 'samples': 3799872, 'steps': 19790, 'loss/train': 1.9327707290649414} -08/30/2021 16:46:39 - INFO - __main__ - Step 19792: {'lr': 0.00048238351132135415, 'samples': 3800064, 'steps': 19791, 'loss/train': 1.6438424587249756} -08/30/2021 16:46:39 - INFO - __main__ - Step 19793: {'lr': 0.0004823815544797265, 'samples': 3800256, 'steps': 19792, 'loss/train': 1.512700080871582} -08/30/2021 16:46:40 - INFO - __main__ - Step 19794: {'lr': 0.0004823795975333912, 'samples': 3800448, 'steps': 19793, 'loss/train': 1.6888874769210815} -08/30/2021 16:46:41 - INFO - __main__ - Step 19795: {'lr': 0.0004823776404823493, 'samples': 3800640, 'steps': 19794, 'loss/train': 1.5916376113891602} -08/30/2021 16:46:41 - INFO - __main__ - Step 19796: {'lr': 0.00048237568332660163, 'samples': 3800832, 'steps': 19795, 'loss/train': 2.0096867084503174} -08/30/2021 16:46:41 - INFO - __main__ - Step 19797: {'lr': 0.0004823737260661491, 'samples': 3801024, 'steps': 19796, 'loss/train': 1.7896571159362793} -08/30/2021 16:46:42 - INFO - __main__ - Step 19798: {'lr': 0.00048237176870099256, 'samples': 3801216, 'steps': 19797, 'loss/train': 1.7274136543273926} -08/30/2021 16:46:43 - INFO - __main__ - Step 19799: {'lr': 0.0004823698112311328, 'samples': 3801408, 'steps': 19798, 'loss/train': 1.4035961627960205} -08/30/2021 16:46:44 - INFO - __main__ - Step 19800: {'lr': 0.00048236785365657076, 'samples': 3801600, 'steps': 19799, 'loss/train': 0.17131058871746063} -08/30/2021 16:46:44 - INFO - __main__ - Step 19801: {'lr': 0.00048236589597730744, 'samples': 3801792, 'steps': 19800, 'loss/train': 1.7156814336776733} -08/30/2021 16:46:45 - INFO - __main__ - Step 19802: {'lr': 0.00048236393819334363, 'samples': 3801984, 'steps': 19801, 'loss/train': 1.3876007795333862} -08/30/2021 16:46:45 - INFO - __main__ - Step 19803: {'lr': 0.0004823619803046802, 'samples': 3802176, 'steps': 19802, 'loss/train': 0.6160278916358948} -08/30/2021 16:46:47 - INFO - __main__ - Step 19804: {'lr': 0.00048236002231131803, 'samples': 3802368, 'steps': 19803, 'loss/train': 1.3296622037887573} -08/30/2021 16:46:47 - INFO - __main__ - Step 19805: {'lr': 0.00048235806421325803, 'samples': 3802560, 'steps': 19804, 'loss/train': 1.531077265739441} -08/30/2021 16:46:47 - INFO - __main__ - Step 19806: {'lr': 0.0004823561060105011, 'samples': 3802752, 'steps': 19805, 'loss/train': 1.6807235479354858} -08/30/2021 16:46:48 - INFO - __main__ - Step 19807: {'lr': 0.00048235414770304803, 'samples': 3802944, 'steps': 19806, 'loss/train': 1.673302173614502} -08/30/2021 16:46:48 - INFO - __main__ - Step 19808: {'lr': 0.00048235218929089987, 'samples': 3803136, 'steps': 19807, 'loss/train': 1.5240333080291748} -08/30/2021 16:46:49 - INFO - __main__ - Step 19809: {'lr': 0.00048235023077405724, 'samples': 3803328, 'steps': 19808, 'loss/train': 1.59073805809021} -08/30/2021 16:46:50 - INFO - __main__ - Step 19810: {'lr': 0.0004823482721525213, 'samples': 3803520, 'steps': 19809, 'loss/train': 1.7584518194198608} -08/30/2021 16:46:50 - INFO - __main__ - Step 19811: {'lr': 0.0004823463134262928, 'samples': 3803712, 'steps': 19810, 'loss/train': 1.5256023406982422} -08/30/2021 16:46:51 - INFO - __main__ - Step 19812: {'lr': 0.00048234435459537265, 'samples': 3803904, 'steps': 19811, 'loss/train': 1.4290350675582886} -08/30/2021 16:46:51 - INFO - __main__ - Step 19813: {'lr': 0.0004823423956597617, 'samples': 3804096, 'steps': 19812, 'loss/train': 1.2690590620040894} -08/30/2021 16:46:52 - INFO - __main__ - Step 19814: {'lr': 0.0004823404366194608, 'samples': 3804288, 'steps': 19813, 'loss/train': 1.546666145324707} -08/30/2021 16:46:53 - INFO - __main__ - Step 19815: {'lr': 0.0004823384774744709, 'samples': 3804480, 'steps': 19814, 'loss/train': 1.6375718116760254} -08/30/2021 16:46:53 - INFO - __main__ - Step 19816: {'lr': 0.000482336518224793, 'samples': 3804672, 'steps': 19815, 'loss/train': 0.07490232586860657} -08/30/2021 16:46:54 - INFO - __main__ - Step 19817: {'lr': 0.00048233455887042764, 'samples': 3804864, 'steps': 19816, 'loss/train': 1.213105320930481} -08/30/2021 16:46:54 - INFO - __main__ - Step 19818: {'lr': 0.0004823325994113761, 'samples': 3805056, 'steps': 19817, 'loss/train': 1.383909821510315} -08/30/2021 16:46:56 - INFO - __main__ - Step 19819: {'lr': 0.00048233063984763895, 'samples': 3805248, 'steps': 19818, 'loss/train': 1.2611336708068848} -08/30/2021 16:46:56 - INFO - __main__ - Step 19820: {'lr': 0.0004823286801792173, 'samples': 3805440, 'steps': 19819, 'loss/train': 1.7871754169464111} -08/30/2021 16:46:56 - INFO - __main__ - Step 19821: {'lr': 0.0004823267204061118, 'samples': 3805632, 'steps': 19820, 'loss/train': 2.1539313793182373} -08/30/2021 16:46:57 - INFO - __main__ - Step 19822: {'lr': 0.0004823247605283236, 'samples': 3805824, 'steps': 19821, 'loss/train': 0.15021799504756927} -08/30/2021 16:46:57 - INFO - __main__ - Step 19823: {'lr': 0.0004823228005458534, 'samples': 3806016, 'steps': 19822, 'loss/train': 1.92867112159729} -08/30/2021 16:46:59 - INFO - __main__ - Step 19824: {'lr': 0.00048232084045870204, 'samples': 3806208, 'steps': 19823, 'loss/train': 0.8178573250770569} -08/30/2021 16:46:59 - INFO - __main__ - Step 19825: {'lr': 0.00048231888026687065, 'samples': 3806400, 'steps': 19824, 'loss/train': 1.4814424514770508} -08/30/2021 16:46:59 - INFO - __main__ - Step 19826: {'lr': 0.00048231691997035987, 'samples': 3806592, 'steps': 19825, 'loss/train': 1.6040164232254028} -08/30/2021 16:47:00 - INFO - __main__ - Step 19827: {'lr': 0.00048231495956917067, 'samples': 3806784, 'steps': 19826, 'loss/train': 1.462829351425171} -08/30/2021 16:47:00 - INFO - __main__ - Step 19828: {'lr': 0.00048231299906330397, 'samples': 3806976, 'steps': 19827, 'loss/train': 1.1462972164154053} -08/30/2021 16:47:02 - INFO - __main__ - Step 19829: {'lr': 0.0004823110384527606, 'samples': 3807168, 'steps': 19828, 'loss/train': 1.4257042407989502} -08/30/2021 16:47:02 - INFO - __main__ - Step 19830: {'lr': 0.0004823090777375414, 'samples': 3807360, 'steps': 19829, 'loss/train': 1.8113360404968262} -08/30/2021 16:47:02 - INFO - __main__ - Step 19831: {'lr': 0.0004823071169176474, 'samples': 3807552, 'steps': 19830, 'loss/train': 2.2109315395355225} -08/30/2021 16:47:03 - INFO - __main__ - Step 19832: {'lr': 0.00048230515599307933, 'samples': 3807744, 'steps': 19831, 'loss/train': 1.2028950452804565} -08/30/2021 16:47:03 - INFO - __main__ - Step 19833: {'lr': 0.0004823031949638382, 'samples': 3807936, 'steps': 19832, 'loss/train': 1.6282076835632324} -08/30/2021 16:47:03 - INFO - __main__ - Step 19834: {'lr': 0.0004823012338299248, 'samples': 3808128, 'steps': 19833, 'loss/train': 1.61159348487854} -08/30/2021 16:47:06 - INFO - __main__ - Step 19835: {'lr': 0.0004822992725913401, 'samples': 3808320, 'steps': 19834, 'loss/train': 1.688277244567871} -08/30/2021 16:47:06 - INFO - __main__ - Step 19836: {'lr': 0.00048229731124808484, 'samples': 3808512, 'steps': 19835, 'loss/train': 1.5510793924331665} -08/30/2021 16:47:07 - INFO - __main__ - Step 19837: {'lr': 0.00048229534980016007, 'samples': 3808704, 'steps': 19836, 'loss/train': 1.5770598649978638} -08/30/2021 16:47:07 - INFO - __main__ - Step 19838: {'lr': 0.0004822933882475666, 'samples': 3808896, 'steps': 19837, 'loss/train': 1.6042286157608032} -08/30/2021 16:47:07 - INFO - __main__ - Step 19839: {'lr': 0.00048229142659030527, 'samples': 3809088, 'steps': 19838, 'loss/train': 1.6330395936965942} -08/30/2021 16:47:08 - INFO - __main__ - Step 19840: {'lr': 0.000482289464828377, 'samples': 3809280, 'steps': 19839, 'loss/train': 0.057610705494880676} -08/30/2021 16:47:09 - INFO - __main__ - Step 19841: {'lr': 0.00048228750296178276, 'samples': 3809472, 'steps': 19840, 'loss/train': 1.5284667015075684} -08/30/2021 16:47:10 - INFO - __main__ - Step 19842: {'lr': 0.0004822855409905233, 'samples': 3809664, 'steps': 19841, 'loss/train': 1.4956417083740234} -08/30/2021 16:47:10 - INFO - __main__ - Step 19843: {'lr': 0.00048228357891459954, 'samples': 3809856, 'steps': 19842, 'loss/train': 2.1752610206604004} -08/30/2021 16:47:11 - INFO - __main__ - Step 19844: {'lr': 0.0004822816167340124, 'samples': 3810048, 'steps': 19843, 'loss/train': 0.914184033870697} -08/30/2021 16:47:11 - INFO - __main__ - Step 19845: {'lr': 0.00048227965444876277, 'samples': 3810240, 'steps': 19844, 'loss/train': 2.04819655418396} -08/30/2021 16:47:12 - INFO - __main__ - Step 19846: {'lr': 0.0004822776920588515, 'samples': 3810432, 'steps': 19845, 'loss/train': 1.589402437210083} -08/30/2021 16:47:13 - INFO - __main__ - Step 19847: {'lr': 0.0004822757295642795, 'samples': 3810624, 'steps': 19846, 'loss/train': 1.5684795379638672} -08/30/2021 16:47:13 - INFO - __main__ - Step 19848: {'lr': 0.00048227376696504765, 'samples': 3810816, 'steps': 19847, 'loss/train': 1.812343955039978} -08/30/2021 16:47:14 - INFO - __main__ - Step 19849: {'lr': 0.0004822718042611568, 'samples': 3811008, 'steps': 19848, 'loss/train': 1.5832816362380981} -08/30/2021 16:47:14 - INFO - __main__ - Step 19850: {'lr': 0.0004822698414526079, 'samples': 3811200, 'steps': 19849, 'loss/train': 1.8289332389831543} -08/30/2021 16:47:16 - INFO - __main__ - Step 19851: {'lr': 0.0004822678785394017, 'samples': 3811392, 'steps': 19850, 'loss/train': 1.7046853303909302} -08/30/2021 16:47:16 - INFO - __main__ - Step 19852: {'lr': 0.0004822659155215393, 'samples': 3811584, 'steps': 19851, 'loss/train': 0.8314381837844849} -08/30/2021 16:47:17 - INFO - __main__ - Step 19853: {'lr': 0.00048226395239902133, 'samples': 3811776, 'steps': 19852, 'loss/train': 1.683605670928955} -08/30/2021 16:47:17 - INFO - __main__ - Step 19854: {'lr': 0.00048226198917184886, 'samples': 3811968, 'steps': 19853, 'loss/train': 1.5703904628753662} -08/30/2021 16:47:17 - INFO - __main__ - Step 19855: {'lr': 0.00048226002584002276, 'samples': 3812160, 'steps': 19854, 'loss/train': 0.059553273022174835} -08/30/2021 16:47:18 - INFO - __main__ - Step 19856: {'lr': 0.00048225806240354387, 'samples': 3812352, 'steps': 19855, 'loss/train': 0.06528206169605255} -08/30/2021 16:47:19 - INFO - __main__ - Step 19857: {'lr': 0.0004822560988624131, 'samples': 3812544, 'steps': 19856, 'loss/train': 2.0399603843688965} -08/30/2021 16:47:20 - INFO - __main__ - Step 19858: {'lr': 0.0004822541352166312, 'samples': 3812736, 'steps': 19857, 'loss/train': 1.376532793045044} -08/30/2021 16:47:20 - INFO - __main__ - Step 19859: {'lr': 0.0004822521714661993, 'samples': 3812928, 'steps': 19858, 'loss/train': 1.4827698469161987} -08/30/2021 16:47:20 - INFO - __main__ - Step 19860: {'lr': 0.0004822502076111181, 'samples': 3813120, 'steps': 19859, 'loss/train': 1.3917800188064575} -08/30/2021 16:47:21 - INFO - __main__ - Step 19861: {'lr': 0.0004822482436513885, 'samples': 3813312, 'steps': 19860, 'loss/train': 0.8752621412277222} -08/30/2021 16:47:21 - INFO - __main__ - Step 19862: {'lr': 0.0004822462795870115, 'samples': 3813504, 'steps': 19861, 'loss/train': 0.5461375713348389} -08/30/2021 16:47:23 - INFO - __main__ - Step 19863: {'lr': 0.00048224431541798784, 'samples': 3813696, 'steps': 19862, 'loss/train': 1.2158832550048828} -08/30/2021 16:47:23 - INFO - __main__ - Step 19864: {'lr': 0.00048224235114431856, 'samples': 3813888, 'steps': 19863, 'loss/train': 2.0124335289001465} -08/30/2021 16:47:23 - INFO - __main__ - Step 19865: {'lr': 0.0004822403867660044, 'samples': 3814080, 'steps': 19864, 'loss/train': 1.2959673404693604} -08/30/2021 16:47:24 - INFO - __main__ - Step 19866: {'lr': 0.0004822384222830463, 'samples': 3814272, 'steps': 19865, 'loss/train': 2.120906352996826} -08/30/2021 16:47:24 - INFO - __main__ - Step 19867: {'lr': 0.0004822364576954452, 'samples': 3814464, 'steps': 19866, 'loss/train': 1.5623080730438232} -08/30/2021 16:47:26 - INFO - __main__ - Step 19868: {'lr': 0.0004822344930032019, 'samples': 3814656, 'steps': 19867, 'loss/train': 1.6022862195968628} -08/30/2021 16:47:26 - INFO - __main__ - Step 19869: {'lr': 0.00048223252820631736, 'samples': 3814848, 'steps': 19868, 'loss/train': 1.5811340808868408} -08/30/2021 16:47:26 - INFO - __main__ - Step 19870: {'lr': 0.00048223056330479235, 'samples': 3815040, 'steps': 19869, 'loss/train': 0.598106324672699} -08/30/2021 16:47:27 - INFO - __main__ - Step 19871: {'lr': 0.00048222859829862784, 'samples': 3815232, 'steps': 19870, 'loss/train': 1.6351191997528076} -08/30/2021 16:47:27 - INFO - __main__ - Step 19872: {'lr': 0.0004822266331878248, 'samples': 3815424, 'steps': 19871, 'loss/train': 1.4950696229934692} -08/30/2021 16:47:29 - INFO - __main__ - Step 19873: {'lr': 0.00048222466797238396, 'samples': 3815616, 'steps': 19872, 'loss/train': 1.8534035682678223} -08/30/2021 16:47:29 - INFO - __main__ - Step 19874: {'lr': 0.00048222270265230627, 'samples': 3815808, 'steps': 19873, 'loss/train': 2.3191308975219727} -08/30/2021 16:47:30 - INFO - __main__ - Step 19875: {'lr': 0.0004822207372275926, 'samples': 3816000, 'steps': 19874, 'loss/train': 0.8441720008850098} -08/30/2021 16:47:30 - INFO - __main__ - Step 19876: {'lr': 0.0004822187716982439, 'samples': 3816192, 'steps': 19875, 'loss/train': 1.893140435218811} -08/30/2021 16:47:30 - INFO - __main__ - Step 19877: {'lr': 0.000482216806064261, 'samples': 3816384, 'steps': 19876, 'loss/train': 1.9657264947891235} -08/30/2021 16:47:32 - INFO - __main__ - Step 19878: {'lr': 0.0004822148403256447, 'samples': 3816576, 'steps': 19877, 'loss/train': 1.5532938241958618} -08/30/2021 16:47:33 - INFO - __main__ - Step 19879: {'lr': 0.00048221287448239604, 'samples': 3816768, 'steps': 19878, 'loss/train': 2.102879047393799} -08/30/2021 16:47:33 - INFO - __main__ - Step 19880: {'lr': 0.00048221090853451586, 'samples': 3816960, 'steps': 19879, 'loss/train': 1.3816614151000977} -08/30/2021 16:47:33 - INFO - __main__ - Step 19881: {'lr': 0.000482208942482005, 'samples': 3817152, 'steps': 19880, 'loss/train': 1.6331406831741333} -08/30/2021 16:47:34 - INFO - __main__ - Step 19882: {'lr': 0.00048220697632486443, 'samples': 3817344, 'steps': 19881, 'loss/train': 1.5460662841796875} -08/30/2021 16:47:35 - INFO - __main__ - Step 19883: {'lr': 0.0004822050100630949, 'samples': 3817536, 'steps': 19882, 'loss/train': 1.1174434423446655} -08/30/2021 16:47:36 - INFO - __main__ - Step 19884: {'lr': 0.0004822030436966974, 'samples': 3817728, 'steps': 19883, 'loss/train': 1.226914644241333} -08/30/2021 16:47:36 - INFO - __main__ - Step 19885: {'lr': 0.0004822010772256728, 'samples': 3817920, 'steps': 19884, 'loss/train': 1.0844295024871826} -08/30/2021 16:47:37 - INFO - __main__ - Step 19886: {'lr': 0.00048219911065002196, 'samples': 3818112, 'steps': 19885, 'loss/train': 0.13883930444717407} -08/30/2021 16:47:37 - INFO - __main__ - Step 19887: {'lr': 0.00048219714396974587, 'samples': 3818304, 'steps': 19886, 'loss/train': 0.388445645570755} -08/30/2021 16:47:37 - INFO - __main__ - Step 19888: {'lr': 0.0004821951771848452, 'samples': 3818496, 'steps': 19887, 'loss/train': 1.543168544769287} -08/30/2021 16:47:39 - INFO - __main__ - Step 19889: {'lr': 0.00048219321029532104, 'samples': 3818688, 'steps': 19888, 'loss/train': 1.3442749977111816} -08/30/2021 16:47:39 - INFO - __main__ - Step 19890: {'lr': 0.0004821912433011742, 'samples': 3818880, 'steps': 19889, 'loss/train': 2.1364612579345703} -08/30/2021 16:47:39 - INFO - __main__ - Step 19891: {'lr': 0.00048218927620240557, 'samples': 3819072, 'steps': 19890, 'loss/train': 1.3614708185195923} -08/30/2021 16:47:40 - INFO - __main__ - Step 19892: {'lr': 0.00048218730899901596, 'samples': 3819264, 'steps': 19891, 'loss/train': 1.7762341499328613} -08/30/2021 16:47:40 - INFO - __main__ - Step 19893: {'lr': 0.0004821853416910065, 'samples': 3819456, 'steps': 19892, 'loss/train': 2.399401903152466} -08/30/2021 16:47:42 - INFO - __main__ - Step 19894: {'lr': 0.0004821833742783778, 'samples': 3819648, 'steps': 19893, 'loss/train': 1.5506436824798584} -08/30/2021 16:47:43 - INFO - __main__ - Step 19895: {'lr': 0.0004821814067611308, 'samples': 3819840, 'steps': 19894, 'loss/train': 1.3862872123718262} -08/30/2021 16:47:43 - INFO - __main__ - Step 19896: {'lr': 0.00048217943913926646, 'samples': 3820032, 'steps': 19895, 'loss/train': 1.5992727279663086} -08/30/2021 16:47:43 - INFO - __main__ - Step 19897: {'lr': 0.00048217747141278574, 'samples': 3820224, 'steps': 19896, 'loss/train': 1.7001378536224365} -08/30/2021 16:47:44 - INFO - __main__ - Step 19898: {'lr': 0.00048217550358168937, 'samples': 3820416, 'steps': 19897, 'loss/train': 1.771938443183899} -08/30/2021 16:47:44 - INFO - __main__ - Step 19899: {'lr': 0.00048217353564597833, 'samples': 3820608, 'steps': 19898, 'loss/train': 0.980220377445221} -08/30/2021 16:47:46 - INFO - __main__ - Step 19900: {'lr': 0.0004821715676056534, 'samples': 3820800, 'steps': 19899, 'loss/train': 1.2470473051071167} -08/30/2021 16:47:46 - INFO - __main__ - Step 19901: {'lr': 0.0004821695994607156, 'samples': 3820992, 'steps': 19900, 'loss/train': 1.54640793800354} -08/30/2021 16:47:46 - INFO - __main__ - Step 19902: {'lr': 0.0004821676312111658, 'samples': 3821184, 'steps': 19901, 'loss/train': 1.4011132717132568} -08/30/2021 16:47:47 - INFO - __main__ - Step 19903: {'lr': 0.0004821656628570048, 'samples': 3821376, 'steps': 19902, 'loss/train': 1.692028522491455} -08/30/2021 16:47:47 - INFO - __main__ - Step 19904: {'lr': 0.00048216369439823355, 'samples': 3821568, 'steps': 19903, 'loss/train': 1.0948528051376343} -08/30/2021 16:47:49 - INFO - __main__ - Step 19905: {'lr': 0.0004821617258348529, 'samples': 3821760, 'steps': 19904, 'loss/train': 1.3367528915405273} -08/30/2021 16:47:49 - INFO - __main__ - Step 19906: {'lr': 0.0004821597571668638, 'samples': 3821952, 'steps': 19905, 'loss/train': 1.7913727760314941} -08/30/2021 16:47:50 - INFO - __main__ - Step 19907: {'lr': 0.00048215778839426706, 'samples': 3822144, 'steps': 19906, 'loss/train': 1.740395426750183} -08/30/2021 16:47:50 - INFO - __main__ - Step 19908: {'lr': 0.0004821558195170636, 'samples': 3822336, 'steps': 19907, 'loss/train': 1.95854651927948} -08/30/2021 16:47:51 - INFO - __main__ - Step 19909: {'lr': 0.00048215385053525434, 'samples': 3822528, 'steps': 19908, 'loss/train': 1.7856106758117676} -08/30/2021 16:47:52 - INFO - __main__ - Step 19910: {'lr': 0.00048215188144884013, 'samples': 3822720, 'steps': 19909, 'loss/train': 1.7378044128417969} -08/30/2021 16:47:52 - INFO - __main__ - Step 19911: {'lr': 0.0004821499122578218, 'samples': 3822912, 'steps': 19910, 'loss/train': 1.4063925743103027} -08/30/2021 16:47:53 - INFO - __main__ - Step 19912: {'lr': 0.00048214794296220045, 'samples': 3823104, 'steps': 19911, 'loss/train': 2.181438684463501} -08/30/2021 16:47:53 - INFO - __main__ - Step 19913: {'lr': 0.00048214597356197665, 'samples': 3823296, 'steps': 19912, 'loss/train': 1.8075560331344604} -08/30/2021 16:47:53 - INFO - __main__ - Step 19914: {'lr': 0.00048214400405715153, 'samples': 3823488, 'steps': 19913, 'loss/train': 1.2732000350952148} -08/30/2021 16:47:55 - INFO - __main__ - Step 19915: {'lr': 0.000482142034447726, 'samples': 3823680, 'steps': 19914, 'loss/train': 2.2317516803741455} -08/30/2021 16:47:55 - INFO - __main__ - Step 19916: {'lr': 0.0004821400647337007, 'samples': 3823872, 'steps': 19915, 'loss/train': 1.7764110565185547} -08/30/2021 16:47:56 - INFO - __main__ - Step 19917: {'lr': 0.0004821380949150768, 'samples': 3824064, 'steps': 19916, 'loss/train': 1.7857691049575806} -08/30/2021 16:47:56 - INFO - __main__ - Step 19918: {'lr': 0.0004821361249918549, 'samples': 3824256, 'steps': 19917, 'loss/train': 2.807133197784424} -08/30/2021 16:47:56 - INFO - __main__ - Step 19919: {'lr': 0.0004821341549640361, 'samples': 3824448, 'steps': 19918, 'loss/train': 1.948252558708191} -08/30/2021 16:47:57 - INFO - __main__ - Step 19920: {'lr': 0.00048213218483162133, 'samples': 3824640, 'steps': 19919, 'loss/train': 1.578928828239441} -08/30/2021 16:47:58 - INFO - __main__ - Step 19921: {'lr': 0.0004821302145946113, 'samples': 3824832, 'steps': 19920, 'loss/train': 1.0670801401138306} -08/30/2021 16:47:59 - INFO - __main__ - Step 19922: {'lr': 0.00048212824425300694, 'samples': 3825024, 'steps': 19921, 'loss/train': 1.6731804609298706} -08/30/2021 16:47:59 - INFO - __main__ - Step 19923: {'lr': 0.0004821262738068093, 'samples': 3825216, 'steps': 19922, 'loss/train': 0.26068222522735596} -08/30/2021 16:48:00 - INFO - __main__ - Step 19924: {'lr': 0.00048212430325601905, 'samples': 3825408, 'steps': 19923, 'loss/train': 1.7669562101364136} -08/30/2021 16:48:00 - INFO - __main__ - Step 19925: {'lr': 0.0004821223326006372, 'samples': 3825600, 'steps': 19924, 'loss/train': 1.3206557035446167} -08/30/2021 16:48:01 - INFO - __main__ - Step 19926: {'lr': 0.0004821203618406645, 'samples': 3825792, 'steps': 19925, 'loss/train': 1.6502186059951782} -08/30/2021 16:48:02 - INFO - __main__ - Step 19927: {'lr': 0.0004821183909761021, 'samples': 3825984, 'steps': 19926, 'loss/train': 1.5708249807357788} -08/30/2021 16:48:02 - INFO - __main__ - Step 19928: {'lr': 0.00048211642000695065, 'samples': 3826176, 'steps': 19927, 'loss/train': 1.6866652965545654} -08/30/2021 16:48:03 - INFO - __main__ - Step 19929: {'lr': 0.0004821144489332112, 'samples': 3826368, 'steps': 19928, 'loss/train': 1.0631749629974365} -08/30/2021 16:48:03 - INFO - __main__ - Step 19930: {'lr': 0.0004821124777548845, 'samples': 3826560, 'steps': 19929, 'loss/train': 1.2046526670455933} -08/30/2021 16:48:05 - INFO - __main__ - Step 19931: {'lr': 0.0004821105064719715, 'samples': 3826752, 'steps': 19930, 'loss/train': 1.9138237237930298} -08/30/2021 16:48:05 - INFO - __main__ - Step 19932: {'lr': 0.0004821085350844731, 'samples': 3826944, 'steps': 19931, 'loss/train': 0.1442057490348816} -08/30/2021 16:48:05 - INFO - __main__ - Step 19933: {'lr': 0.0004821065635923902, 'samples': 3827136, 'steps': 19932, 'loss/train': 1.5246555805206299} -08/30/2021 16:48:06 - INFO - __main__ - Step 19934: {'lr': 0.0004821045919957237, 'samples': 3827328, 'steps': 19933, 'loss/train': 1.7617788314819336} -08/30/2021 16:48:06 - INFO - __main__ - Step 19935: {'lr': 0.00048210262029447425, 'samples': 3827520, 'steps': 19934, 'loss/train': 1.624178409576416} -08/30/2021 16:48:08 - INFO - __main__ - Step 19936: {'lr': 0.0004821006484886431, 'samples': 3827712, 'steps': 19935, 'loss/train': 1.6159640550613403} -08/30/2021 16:48:08 - INFO - __main__ - Step 19937: {'lr': 0.000482098676578231, 'samples': 3827904, 'steps': 19936, 'loss/train': 1.2737667560577393} -08/30/2021 16:48:09 - INFO - __main__ - Step 19938: {'lr': 0.0004820967045632388, 'samples': 3828096, 'steps': 19937, 'loss/train': 1.4769971370697021} -08/30/2021 16:48:09 - INFO - __main__ - Step 19939: {'lr': 0.00048209473244366737, 'samples': 3828288, 'steps': 19938, 'loss/train': 0.9654390811920166} -08/30/2021 16:48:09 - INFO - __main__ - Step 19940: {'lr': 0.00048209276021951765, 'samples': 3828480, 'steps': 19939, 'loss/train': 1.6610724925994873} -08/30/2021 16:48:11 - INFO - __main__ - Step 19941: {'lr': 0.00048209078789079055, 'samples': 3828672, 'steps': 19940, 'loss/train': 1.4529668092727661} -08/30/2021 16:48:11 - INFO - __main__ - Step 19942: {'lr': 0.00048208881545748684, 'samples': 3828864, 'steps': 19941, 'loss/train': 2.073242664337158} -08/30/2021 16:48:12 - INFO - __main__ - Step 19943: {'lr': 0.00048208684291960755, 'samples': 3829056, 'steps': 19942, 'loss/train': 1.3615379333496094} -08/30/2021 16:48:12 - INFO - __main__ - Step 19944: {'lr': 0.0004820848702771535, 'samples': 3829248, 'steps': 19943, 'loss/train': 1.5603870153427124} -08/30/2021 16:48:12 - INFO - __main__ - Step 19945: {'lr': 0.0004820828975301256, 'samples': 3829440, 'steps': 19944, 'loss/train': 1.638757348060608} -08/30/2021 16:48:14 - INFO - __main__ - Step 19946: {'lr': 0.0004820809246785247, 'samples': 3829632, 'steps': 19945, 'loss/train': 1.8357417583465576} -08/30/2021 16:48:15 - INFO - __main__ - Step 19947: {'lr': 0.00048207895172235174, 'samples': 3829824, 'steps': 19946, 'loss/train': 0.8339240550994873} -08/30/2021 16:48:15 - INFO - __main__ - Step 19948: {'lr': 0.00048207697866160755, 'samples': 3830016, 'steps': 19947, 'loss/train': 0.9164642691612244} -08/30/2021 16:48:15 - INFO - __main__ - Step 19949: {'lr': 0.0004820750054962931, 'samples': 3830208, 'steps': 19948, 'loss/train': 1.6671268939971924} -08/30/2021 16:48:16 - INFO - __main__ - Step 19950: {'lr': 0.00048207303222640917, 'samples': 3830400, 'steps': 19949, 'loss/train': 1.640650749206543} -08/30/2021 16:48:17 - INFO - __main__ - Step 19951: {'lr': 0.00048207105885195677, 'samples': 3830592, 'steps': 19950, 'loss/train': 1.5497727394104004} -08/30/2021 16:48:18 - INFO - __main__ - Step 19952: {'lr': 0.0004820690853729367, 'samples': 3830784, 'steps': 19951, 'loss/train': 0.19414319097995758} -08/30/2021 16:48:18 - INFO - __main__ - Step 19953: {'lr': 0.00048206711178934994, 'samples': 3830976, 'steps': 19952, 'loss/train': 1.789297342300415} -08/30/2021 16:48:19 - INFO - __main__ - Step 19954: {'lr': 0.00048206513810119725, 'samples': 3831168, 'steps': 19953, 'loss/train': 1.8761667013168335} -08/30/2021 16:48:19 - INFO - __main__ - Step 19955: {'lr': 0.0004820631643084796, 'samples': 3831360, 'steps': 19954, 'loss/train': 1.4396812915802002} -08/30/2021 16:48:19 - INFO - __main__ - Step 19956: {'lr': 0.00048206119041119787, 'samples': 3831552, 'steps': 19955, 'loss/train': 1.5129131078720093} -08/30/2021 16:48:21 - INFO - __main__ - Step 19957: {'lr': 0.000482059216409353, 'samples': 3831744, 'steps': 19956, 'loss/train': 1.8082789182662964} -08/30/2021 16:48:22 - INFO - __main__ - Step 19958: {'lr': 0.0004820572423029458, 'samples': 3831936, 'steps': 19957, 'loss/train': 1.9943994283676147} -08/30/2021 16:48:22 - INFO - __main__ - Step 19959: {'lr': 0.00048205526809197717, 'samples': 3832128, 'steps': 19958, 'loss/train': 1.5847307443618774} -08/30/2021 16:48:22 - INFO - __main__ - Step 19960: {'lr': 0.000482053293776448, 'samples': 3832320, 'steps': 19959, 'loss/train': 1.7793534994125366} -08/30/2021 16:48:23 - INFO - __main__ - Step 19961: {'lr': 0.0004820513193563593, 'samples': 3832512, 'steps': 19960, 'loss/train': 0.25694942474365234} -08/30/2021 16:48:24 - INFO - __main__ - Step 19962: {'lr': 0.00048204934483171176, 'samples': 3832704, 'steps': 19961, 'loss/train': 1.4777239561080933} -08/30/2021 16:48:25 - INFO - __main__ - Step 19963: {'lr': 0.0004820473702025064, 'samples': 3832896, 'steps': 19962, 'loss/train': 1.6857661008834839} -08/30/2021 16:48:25 - INFO - __main__ - Step 19964: {'lr': 0.000482045395468744, 'samples': 3833088, 'steps': 19963, 'loss/train': 0.335319459438324} -08/30/2021 16:48:26 - INFO - __main__ - Step 19965: {'lr': 0.0004820434206304256, 'samples': 3833280, 'steps': 19964, 'loss/train': 1.5853749513626099} -08/30/2021 16:48:26 - INFO - __main__ - Step 19966: {'lr': 0.000482041445687552, 'samples': 3833472, 'steps': 19965, 'loss/train': 2.2551088333129883} -08/30/2021 16:48:27 - INFO - __main__ - Step 19967: {'lr': 0.0004820394706401242, 'samples': 3833664, 'steps': 19966, 'loss/train': 0.075727179646492} -08/30/2021 16:48:28 - INFO - __main__ - Step 19968: {'lr': 0.0004820374954881429, 'samples': 3833856, 'steps': 19967, 'loss/train': 1.5370581150054932} -08/30/2021 16:48:28 - INFO - __main__ - Step 19969: {'lr': 0.000482035520231609, 'samples': 3834048, 'steps': 19968, 'loss/train': 1.8862011432647705} -08/30/2021 16:48:29 - INFO - __main__ - Step 19970: {'lr': 0.00048203354487052363, 'samples': 3834240, 'steps': 19969, 'loss/train': 1.4049559831619263} -08/30/2021 16:48:29 - INFO - __main__ - Step 19971: {'lr': 0.00048203156940488745, 'samples': 3834432, 'steps': 19970, 'loss/train': 1.6679749488830566} -08/30/2021 16:48:29 - INFO - __main__ - Step 19972: {'lr': 0.00048202959383470144, 'samples': 3834624, 'steps': 19971, 'loss/train': 0.8248991966247559} -08/30/2021 16:48:31 - INFO - __main__ - Step 19973: {'lr': 0.00048202761815996646, 'samples': 3834816, 'steps': 19972, 'loss/train': 1.5690691471099854} -08/30/2021 16:48:31 - INFO - __main__ - Step 19974: {'lr': 0.0004820256423806835, 'samples': 3835008, 'steps': 19973, 'loss/train': 1.0361708402633667} -08/30/2021 16:48:32 - INFO - __main__ - Step 19975: {'lr': 0.00048202366649685325, 'samples': 3835200, 'steps': 19974, 'loss/train': 1.9095230102539062} -08/30/2021 16:48:32 - INFO - __main__ - Step 19976: {'lr': 0.0004820216905084768, 'samples': 3835392, 'steps': 19975, 'loss/train': 2.128371238708496} -08/30/2021 16:48:32 - INFO - __main__ - Step 19977: {'lr': 0.00048201971441555485, 'samples': 3835584, 'steps': 19976, 'loss/train': 1.6646312475204468} -08/30/2021 16:48:34 - INFO - __main__ - Step 19978: {'lr': 0.0004820177382180885, 'samples': 3835776, 'steps': 19977, 'loss/train': 1.3691110610961914} -08/30/2021 16:48:34 - INFO - __main__ - Step 19979: {'lr': 0.00048201576191607843, 'samples': 3835968, 'steps': 19978, 'loss/train': 0.21969597041606903} -08/30/2021 16:48:35 - INFO - __main__ - Step 19980: {'lr': 0.00048201378550952575, 'samples': 3836160, 'steps': 19979, 'loss/train': 1.217984914779663} -08/30/2021 16:48:35 - INFO - __main__ - Step 19981: {'lr': 0.0004820118089984312, 'samples': 3836352, 'steps': 19980, 'loss/train': 1.7248014211654663} -08/30/2021 16:48:35 - INFO - __main__ - Step 19982: {'lr': 0.0004820098323827957, 'samples': 3836544, 'steps': 19981, 'loss/train': 1.9163602590560913} -08/30/2021 16:48:37 - INFO - __main__ - Step 19983: {'lr': 0.0004820078556626202, 'samples': 3836736, 'steps': 19982, 'loss/train': 1.093578815460205} -08/30/2021 16:48:37 - INFO - __main__ - Step 19984: {'lr': 0.0004820058788379055, 'samples': 3836928, 'steps': 19983, 'loss/train': 1.651665449142456} -08/30/2021 16:48:38 - INFO - __main__ - Step 19985: {'lr': 0.0004820039019086525, 'samples': 3837120, 'steps': 19984, 'loss/train': 1.1406774520874023} -08/30/2021 16:48:38 - INFO - __main__ - Step 19986: {'lr': 0.00048200192487486216, 'samples': 3837312, 'steps': 19985, 'loss/train': 1.5559415817260742} -08/30/2021 16:48:38 - INFO - __main__ - Step 19987: {'lr': 0.00048199994773653535, 'samples': 3837504, 'steps': 19986, 'loss/train': 1.3614102602005005} -08/30/2021 16:48:40 - INFO - __main__ - Step 19988: {'lr': 0.0004819979704936729, 'samples': 3837696, 'steps': 19987, 'loss/train': 1.2424564361572266} -08/30/2021 16:48:40 - INFO - __main__ - Step 19989: {'lr': 0.00048199599314627576, 'samples': 3837888, 'steps': 19988, 'loss/train': 1.5290501117706299} -08/30/2021 16:48:41 - INFO - __main__ - Step 19990: {'lr': 0.00048199401569434477, 'samples': 3838080, 'steps': 19989, 'loss/train': 2.1153290271759033} -08/30/2021 16:48:41 - INFO - __main__ - Step 19991: {'lr': 0.00048199203813788086, 'samples': 3838272, 'steps': 19990, 'loss/train': 1.7672927379608154} -08/30/2021 16:48:42 - INFO - __main__ - Step 19992: {'lr': 0.00048199006047688496, 'samples': 3838464, 'steps': 19991, 'loss/train': 1.7383555173873901} -08/30/2021 16:48:43 - INFO - __main__ - Step 19993: {'lr': 0.0004819880827113579, 'samples': 3838656, 'steps': 19992, 'loss/train': 1.8264869451522827} -08/30/2021 16:48:44 - INFO - __main__ - Step 19994: {'lr': 0.0004819861048413006, 'samples': 3838848, 'steps': 19993, 'loss/train': 1.6042386293411255} -08/30/2021 16:48:44 - INFO - __main__ - Step 19995: {'lr': 0.00048198412686671394, 'samples': 3839040, 'steps': 19994, 'loss/train': 0.16026639938354492} -08/30/2021 16:48:45 - INFO - __main__ - Step 19996: {'lr': 0.0004819821487875988, 'samples': 3839232, 'steps': 19995, 'loss/train': 0.062003571540117264} -08/30/2021 16:48:45 - INFO - __main__ - Step 19997: {'lr': 0.0004819801706039561, 'samples': 3839424, 'steps': 19996, 'loss/train': 1.302549123764038} -08/30/2021 16:48:45 - INFO - __main__ - Step 19998: {'lr': 0.0004819781923157867, 'samples': 3839616, 'steps': 19997, 'loss/train': 1.3895676136016846} -08/30/2021 16:48:47 - INFO - __main__ - Step 19999: {'lr': 0.00048197621392309154, 'samples': 3839808, 'steps': 19998, 'loss/train': 1.644120454788208} -08/30/2021 16:48:47 - INFO - __main__ - Step 20000: {'lr': 0.00048197423542587143, 'samples': 3840000, 'steps': 19999, 'loss/train': 1.5134613513946533} -08/30/2021 16:48:48 - INFO - __main__ - Step 20001: {'lr': 0.0004819722568241274, 'samples': 3840192, 'steps': 20000, 'loss/train': 0.9177433848381042} -08/30/2021 16:48:48 - INFO - __main__ - Step 20002: {'lr': 0.0004819702781178601, 'samples': 3840384, 'steps': 20001, 'loss/train': 1.7758409976959229} -08/30/2021 16:48:48 - INFO - __main__ - Step 20003: {'lr': 0.00048196829930707066, 'samples': 3840576, 'steps': 20002, 'loss/train': 1.3711930513381958} -08/30/2021 16:48:50 - INFO - __main__ - Step 20004: {'lr': 0.0004819663203917599, 'samples': 3840768, 'steps': 20003, 'loss/train': 1.7435840368270874} -08/30/2021 16:48:51 - INFO - __main__ - Step 20005: {'lr': 0.0004819643413719287, 'samples': 3840960, 'steps': 20004, 'loss/train': 1.8693407773971558} -08/30/2021 16:48:51 - INFO - __main__ - Step 20006: {'lr': 0.0004819623622475779, 'samples': 3841152, 'steps': 20005, 'loss/train': 1.7306019067764282} -08/30/2021 16:48:51 - INFO - __main__ - Step 20007: {'lr': 0.00048196038301870847, 'samples': 3841344, 'steps': 20006, 'loss/train': 1.9947823286056519} -08/30/2021 16:48:52 - INFO - __main__ - Step 20008: {'lr': 0.0004819584036853212, 'samples': 3841536, 'steps': 20007, 'loss/train': 1.286116123199463} -08/30/2021 16:48:52 - INFO - __main__ - Step 20009: {'lr': 0.00048195642424741716, 'samples': 3841728, 'steps': 20008, 'loss/train': 1.6496145725250244} -08/30/2021 16:48:54 - INFO - __main__ - Step 20010: {'lr': 0.00048195444470499704, 'samples': 3841920, 'steps': 20009, 'loss/train': 1.3488520383834839} -08/30/2021 16:48:54 - INFO - __main__ - Step 20011: {'lr': 0.0004819524650580619, 'samples': 3842112, 'steps': 20010, 'loss/train': 1.5523463487625122} -08/30/2021 16:48:54 - INFO - __main__ - Step 20012: {'lr': 0.0004819504853066126, 'samples': 3842304, 'steps': 20011, 'loss/train': 2.034449577331543} -08/30/2021 16:48:55 - INFO - __main__ - Step 20013: {'lr': 0.0004819485054506498, 'samples': 3842496, 'steps': 20012, 'loss/train': 1.734606146812439} -08/30/2021 16:48:55 - INFO - __main__ - Step 20014: {'lr': 0.00048194652549017484, 'samples': 3842688, 'steps': 20013, 'loss/train': 1.9898678064346313} -08/30/2021 16:48:57 - INFO - __main__ - Step 20015: {'lr': 0.0004819445454251882, 'samples': 3842880, 'steps': 20014, 'loss/train': 0.9438971877098083} -08/30/2021 16:48:57 - INFO - __main__ - Step 20016: {'lr': 0.0004819425652556909, 'samples': 3843072, 'steps': 20015, 'loss/train': 2.579280376434326} -08/30/2021 16:48:58 - INFO - __main__ - Step 20017: {'lr': 0.0004819405849816839, 'samples': 3843264, 'steps': 20016, 'loss/train': 1.5702136754989624} -08/30/2021 16:48:58 - INFO - __main__ - Step 20018: {'lr': 0.00048193860460316805, 'samples': 3843456, 'steps': 20017, 'loss/train': 0.5301432609558105} -08/30/2021 16:48:58 - INFO - __main__ - Step 20019: {'lr': 0.00048193662412014427, 'samples': 3843648, 'steps': 20018, 'loss/train': 1.7974170446395874} -08/30/2021 16:49:00 - INFO - __main__ - Step 20020: {'lr': 0.0004819346435326134, 'samples': 3843840, 'steps': 20019, 'loss/train': 1.2705624103546143} -08/30/2021 16:49:00 - INFO - __main__ - Step 20021: {'lr': 0.00048193266284057634, 'samples': 3844032, 'steps': 20020, 'loss/train': 1.3145122528076172} -08/30/2021 16:49:01 - INFO - __main__ - Step 20022: {'lr': 0.0004819306820440341, 'samples': 3844224, 'steps': 20021, 'loss/train': 1.5394717454910278} -08/30/2021 16:49:01 - INFO - __main__ - Step 20023: {'lr': 0.0004819287011429874, 'samples': 3844416, 'steps': 20022, 'loss/train': 1.6912767887115479} -08/30/2021 16:49:01 - INFO - __main__ - Step 20024: {'lr': 0.0004819267201374372, 'samples': 3844608, 'steps': 20023, 'loss/train': 1.8691939115524292} -08/30/2021 16:49:03 - INFO - __main__ - Step 20025: {'lr': 0.0004819247390273844, 'samples': 3844800, 'steps': 20024, 'loss/train': 1.7553164958953857} -08/30/2021 16:49:03 - INFO - __main__ - Step 20026: {'lr': 0.00048192275781282993, 'samples': 3844992, 'steps': 20025, 'loss/train': 1.6538194417953491} -08/30/2021 16:49:04 - INFO - __main__ - Step 20027: {'lr': 0.00048192077649377455, 'samples': 3845184, 'steps': 20026, 'loss/train': 2.2352724075317383} -08/30/2021 16:49:04 - INFO - __main__ - Step 20028: {'lr': 0.0004819187950702193, 'samples': 3845376, 'steps': 20027, 'loss/train': 1.1791073083877563} -08/30/2021 16:49:04 - INFO - __main__ - Step 20029: {'lr': 0.00048191681354216504, 'samples': 3845568, 'steps': 20028, 'loss/train': 1.2517369985580444} -08/30/2021 16:49:06 - INFO - __main__ - Step 20030: {'lr': 0.0004819148319096126, 'samples': 3845760, 'steps': 20029, 'loss/train': 1.0241451263427734} -08/30/2021 16:49:06 - INFO - __main__ - Step 20031: {'lr': 0.00048191285017256297, 'samples': 3845952, 'steps': 20030, 'loss/train': 1.7977837324142456} -08/30/2021 16:49:07 - INFO - __main__ - Step 20032: {'lr': 0.00048191086833101695, 'samples': 3846144, 'steps': 20031, 'loss/train': 1.4658101797103882} -08/30/2021 16:49:07 - INFO - __main__ - Step 20033: {'lr': 0.00048190888638497553, 'samples': 3846336, 'steps': 20032, 'loss/train': 1.695029616355896} -08/30/2021 16:49:07 - INFO - __main__ - Step 20034: {'lr': 0.00048190690433443946, 'samples': 3846528, 'steps': 20033, 'loss/train': 1.1877739429473877} -08/30/2021 16:49:08 - INFO - __main__ - Step 20035: {'lr': 0.0004819049221794097, 'samples': 3846720, 'steps': 20034, 'loss/train': 0.08224710822105408} -08/30/2021 16:49:09 - INFO - __main__ - Step 20036: {'lr': 0.0004819029399198873, 'samples': 3846912, 'steps': 20035, 'loss/train': 1.4298524856567383} -08/30/2021 16:49:10 - INFO - __main__ - Step 20037: {'lr': 0.0004819009575558729, 'samples': 3847104, 'steps': 20036, 'loss/train': 1.6943835020065308} -08/30/2021 16:49:10 - INFO - __main__ - Step 20038: {'lr': 0.0004818989750873676, 'samples': 3847296, 'steps': 20037, 'loss/train': 0.03754433989524841} -08/30/2021 16:49:11 - INFO - __main__ - Step 20039: {'lr': 0.00048189699251437206, 'samples': 3847488, 'steps': 20038, 'loss/train': 1.9434560537338257} -08/30/2021 16:49:11 - INFO - __main__ - Step 20040: {'lr': 0.0004818950098368874, 'samples': 3847680, 'steps': 20039, 'loss/train': 1.8073323965072632} -08/30/2021 16:49:11 - INFO - __main__ - Step 20041: {'lr': 0.00048189302705491446, 'samples': 3847872, 'steps': 20040, 'loss/train': 1.7424969673156738} -08/30/2021 16:49:13 - INFO - __main__ - Step 20042: {'lr': 0.000481891044168454, 'samples': 3848064, 'steps': 20041, 'loss/train': 1.8437080383300781} -08/30/2021 16:49:13 - INFO - __main__ - Step 20043: {'lr': 0.00048188906117750706, 'samples': 3848256, 'steps': 20042, 'loss/train': 0.10665156692266464} -08/30/2021 16:49:14 - INFO - __main__ - Step 20044: {'lr': 0.00048188707808207457, 'samples': 3848448, 'steps': 20043, 'loss/train': 1.8833436965942383} -08/30/2021 16:49:14 - INFO - __main__ - Step 20045: {'lr': 0.00048188509488215724, 'samples': 3848640, 'steps': 20044, 'loss/train': 1.396911859512329} -08/30/2021 16:49:14 - INFO - __main__ - Step 20046: {'lr': 0.0004818831115777561, 'samples': 3848832, 'steps': 20045, 'loss/train': 1.676553726196289} -08/30/2021 16:49:16 - INFO - __main__ - Step 20047: {'lr': 0.00048188112816887203, 'samples': 3849024, 'steps': 20046, 'loss/train': 1.7872953414916992} -08/30/2021 16:49:16 - INFO - __main__ - Step 20048: {'lr': 0.0004818791446555059, 'samples': 3849216, 'steps': 20047, 'loss/train': 1.4919394254684448} -08/30/2021 16:49:17 - INFO - __main__ - Step 20049: {'lr': 0.00048187716103765854, 'samples': 3849408, 'steps': 20048, 'loss/train': 0.8091785311698914} -08/30/2021 16:49:17 - INFO - __main__ - Step 20050: {'lr': 0.0004818751773153309, 'samples': 3849600, 'steps': 20049, 'loss/train': 0.6129899621009827} -08/30/2021 16:49:17 - INFO - __main__ - Step 20051: {'lr': 0.000481873193488524, 'samples': 3849792, 'steps': 20050, 'loss/train': 1.6006039381027222} -08/30/2021 16:49:19 - INFO - __main__ - Step 20052: {'lr': 0.0004818712095572385, 'samples': 3849984, 'steps': 20051, 'loss/train': 1.1631252765655518} -08/30/2021 16:49:19 - INFO - __main__ - Step 20053: {'lr': 0.0004818692255214755, 'samples': 3850176, 'steps': 20052, 'loss/train': 1.6821677684783936} -08/30/2021 16:49:20 - INFO - __main__ - Step 20054: {'lr': 0.00048186724138123577, 'samples': 3850368, 'steps': 20053, 'loss/train': 1.827529788017273} -08/30/2021 16:49:20 - INFO - __main__ - Step 20055: {'lr': 0.00048186525713652024, 'samples': 3850560, 'steps': 20054, 'loss/train': 1.3900905847549438} -08/30/2021 16:49:20 - INFO - __main__ - Step 20056: {'lr': 0.0004818632727873298, 'samples': 3850752, 'steps': 20055, 'loss/train': 1.4969857931137085} -08/30/2021 16:49:22 - INFO - __main__ - Step 20057: {'lr': 0.00048186128833366536, 'samples': 3850944, 'steps': 20056, 'loss/train': 1.184066653251648} -08/30/2021 16:49:23 - INFO - __main__ - Step 20058: {'lr': 0.0004818593037755278, 'samples': 3851136, 'steps': 20057, 'loss/train': 1.6948479413986206} -08/30/2021 16:49:23 - INFO - __main__ - Step 20059: {'lr': 0.000481857319112918, 'samples': 3851328, 'steps': 20058, 'loss/train': 1.9170730113983154} -08/30/2021 16:49:23 - INFO - __main__ - Step 20060: {'lr': 0.0004818553343458368, 'samples': 3851520, 'steps': 20059, 'loss/train': 1.23885178565979} -08/30/2021 16:49:24 - INFO - __main__ - Step 20061: {'lr': 0.00048185334947428525, 'samples': 3851712, 'steps': 20060, 'loss/train': 2.0625462532043457} -08/30/2021 16:49:24 - INFO - __main__ - Step 20062: {'lr': 0.0004818513644982642, 'samples': 3851904, 'steps': 20061, 'loss/train': 1.9079039096832275} -08/30/2021 16:49:26 - INFO - __main__ - Step 20063: {'lr': 0.0004818493794177744, 'samples': 3852096, 'steps': 20062, 'loss/train': 1.435896635055542} -08/30/2021 16:49:26 - INFO - __main__ - Step 20064: {'lr': 0.00048184739423281695, 'samples': 3852288, 'steps': 20063, 'loss/train': 1.9172650575637817} -08/30/2021 16:49:27 - INFO - __main__ - Step 20065: {'lr': 0.00048184540894339256, 'samples': 3852480, 'steps': 20064, 'loss/train': 0.9635215401649475} -08/30/2021 16:49:27 - INFO - __main__ - Step 20066: {'lr': 0.00048184342354950225, 'samples': 3852672, 'steps': 20065, 'loss/train': 1.7241082191467285} -08/30/2021 16:49:27 - INFO - __main__ - Step 20067: {'lr': 0.00048184143805114684, 'samples': 3852864, 'steps': 20066, 'loss/train': 1.6395256519317627} -08/30/2021 16:49:29 - INFO - __main__ - Step 20068: {'lr': 0.00048183945244832725, 'samples': 3853056, 'steps': 20067, 'loss/train': 1.6814159154891968} -08/30/2021 16:49:29 - INFO - __main__ - Step 20069: {'lr': 0.00048183746674104446, 'samples': 3853248, 'steps': 20068, 'loss/train': 1.5684231519699097} -08/30/2021 16:49:29 - INFO - __main__ - Step 20070: {'lr': 0.00048183548092929916, 'samples': 3853440, 'steps': 20069, 'loss/train': 1.3256232738494873} -08/30/2021 16:49:30 - INFO - __main__ - Step 20071: {'lr': 0.0004818334950130925, 'samples': 3853632, 'steps': 20070, 'loss/train': 1.4391560554504395} -08/30/2021 16:49:30 - INFO - __main__ - Step 20072: {'lr': 0.00048183150899242514, 'samples': 3853824, 'steps': 20071, 'loss/train': 1.5120980739593506} -08/30/2021 16:49:32 - INFO - __main__ - Step 20073: {'lr': 0.0004818295228672981, 'samples': 3854016, 'steps': 20072, 'loss/train': 1.8095577955245972} -08/30/2021 16:49:32 - INFO - __main__ - Step 20074: {'lr': 0.0004818275366377123, 'samples': 3854208, 'steps': 20073, 'loss/train': 1.1560922861099243} -08/30/2021 16:49:32 - INFO - __main__ - Step 20075: {'lr': 0.00048182555030366854, 'samples': 3854400, 'steps': 20074, 'loss/train': 1.2336541414260864} -08/30/2021 16:49:33 - INFO - __main__ - Step 20076: {'lr': 0.0004818235638651678, 'samples': 3854592, 'steps': 20075, 'loss/train': 1.116799235343933} -08/30/2021 16:49:33 - INFO - __main__ - Step 20077: {'lr': 0.0004818215773222109, 'samples': 3854784, 'steps': 20076, 'loss/train': 0.4001154601573944} -08/30/2021 16:49:35 - INFO - __main__ - Step 20078: {'lr': 0.0004818195906747988, 'samples': 3854976, 'steps': 20077, 'loss/train': 2.4976325035095215} -08/30/2021 16:49:35 - INFO - __main__ - Step 20079: {'lr': 0.0004818176039229324, 'samples': 3855168, 'steps': 20078, 'loss/train': 1.6350609064102173} -08/30/2021 16:49:35 - INFO - __main__ - Step 20080: {'lr': 0.0004818156170666125, 'samples': 3855360, 'steps': 20079, 'loss/train': 1.3892173767089844} -08/30/2021 16:49:36 - INFO - __main__ - Step 20081: {'lr': 0.0004818136301058401, 'samples': 3855552, 'steps': 20080, 'loss/train': 1.1264094114303589} -08/30/2021 16:49:36 - INFO - __main__ - Step 20082: {'lr': 0.0004818116430406161, 'samples': 3855744, 'steps': 20081, 'loss/train': 2.3538107872009277} -08/30/2021 16:49:36 - INFO - __main__ - Step 20083: {'lr': 0.00048180965587094125, 'samples': 3855936, 'steps': 20082, 'loss/train': 1.9352130889892578} -08/30/2021 16:49:38 - INFO - __main__ - Step 20084: {'lr': 0.00048180766859681664, 'samples': 3856128, 'steps': 20083, 'loss/train': 1.302859902381897} -08/30/2021 16:49:39 - INFO - __main__ - Step 20085: {'lr': 0.000481805681218243, 'samples': 3856320, 'steps': 20084, 'loss/train': 1.5741057395935059} -08/30/2021 16:49:39 - INFO - __main__ - Step 20086: {'lr': 0.0004818036937352214, 'samples': 3856512, 'steps': 20085, 'loss/train': 2.0826728343963623} -08/30/2021 16:49:39 - INFO - __main__ - Step 20087: {'lr': 0.0004818017061477525, 'samples': 3856704, 'steps': 20086, 'loss/train': 1.552943468093872} -08/30/2021 16:49:40 - INFO - __main__ - Step 20088: {'lr': 0.00048179971845583734, 'samples': 3856896, 'steps': 20087, 'loss/train': 1.6637585163116455} -08/30/2021 16:49:42 - INFO - __main__ - Step 20089: {'lr': 0.00048179773065947683, 'samples': 3857088, 'steps': 20088, 'loss/train': 1.3537242412567139} -08/30/2021 16:49:42 - INFO - __main__ - Step 20090: {'lr': 0.0004817957427586719, 'samples': 3857280, 'steps': 20089, 'loss/train': 0.22368521988391876} -08/30/2021 16:49:42 - INFO - __main__ - Step 20091: {'lr': 0.00048179375475342333, 'samples': 3857472, 'steps': 20090, 'loss/train': 0.22531534731388092} -08/30/2021 16:49:43 - INFO - __main__ - Step 20092: {'lr': 0.00048179176664373214, 'samples': 3857664, 'steps': 20091, 'loss/train': 1.5876214504241943} -08/30/2021 16:49:43 - INFO - __main__ - Step 20093: {'lr': 0.0004817897784295991, 'samples': 3857856, 'steps': 20092, 'loss/train': 1.9929802417755127} -08/30/2021 16:49:43 - INFO - __main__ - Step 20094: {'lr': 0.0004817877901110251, 'samples': 3858048, 'steps': 20093, 'loss/train': 1.6999971866607666} -08/30/2021 16:49:45 - INFO - __main__ - Step 20095: {'lr': 0.0004817858016880112, 'samples': 3858240, 'steps': 20094, 'loss/train': 1.4086908102035522} -08/30/2021 16:49:45 - INFO - __main__ - Step 20096: {'lr': 0.0004817838131605582, 'samples': 3858432, 'steps': 20095, 'loss/train': 1.7002785205841064} -08/30/2021 16:49:46 - INFO - __main__ - Step 20097: {'lr': 0.00048178182452866694, 'samples': 3858624, 'steps': 20096, 'loss/train': 0.9283069968223572} -08/30/2021 16:49:46 - INFO - __main__ - Step 20098: {'lr': 0.0004817798357923384, 'samples': 3858816, 'steps': 20097, 'loss/train': 1.4377996921539307} -08/30/2021 16:49:46 - INFO - __main__ - Step 20099: {'lr': 0.00048177784695157335, 'samples': 3859008, 'steps': 20098, 'loss/train': 1.0285416841506958} -08/30/2021 16:49:48 - INFO - __main__ - Step 20100: {'lr': 0.00048177585800637286, 'samples': 3859200, 'steps': 20099, 'loss/train': 0.9273505210876465} -08/30/2021 16:49:48 - INFO - __main__ - Step 20101: {'lr': 0.00048177386895673774, 'samples': 3859392, 'steps': 20100, 'loss/train': 1.3331303596496582} -08/30/2021 16:49:49 - INFO - __main__ - Step 20102: {'lr': 0.0004817718798026689, 'samples': 3859584, 'steps': 20101, 'loss/train': 1.147251844406128} -08/30/2021 16:49:49 - INFO - __main__ - Step 20103: {'lr': 0.0004817698905441672, 'samples': 3859776, 'steps': 20102, 'loss/train': 1.8079439401626587} -08/30/2021 16:49:50 - INFO - __main__ - Step 20104: {'lr': 0.0004817679011812336, 'samples': 3859968, 'steps': 20103, 'loss/train': 2.1963179111480713} -08/30/2021 16:49:50 - INFO - __main__ - Step 20105: {'lr': 0.00048176591171386884, 'samples': 3860160, 'steps': 20104, 'loss/train': 1.6470838785171509} -08/30/2021 16:49:51 - INFO - __main__ - Step 20106: {'lr': 0.0004817639221420741, 'samples': 3860352, 'steps': 20105, 'loss/train': 1.1575138568878174} -08/30/2021 16:49:52 - INFO - __main__ - Step 20107: {'lr': 0.00048176193246585, 'samples': 3860544, 'steps': 20106, 'loss/train': 1.32097327709198} -08/30/2021 16:49:52 - INFO - __main__ - Step 20108: {'lr': 0.00048175994268519765, 'samples': 3860736, 'steps': 20107, 'loss/train': 1.5724048614501953} -08/30/2021 16:49:52 - INFO - __main__ - Step 20109: {'lr': 0.00048175795280011775, 'samples': 3860928, 'steps': 20108, 'loss/train': 2.2219698429107666} -08/30/2021 16:49:53 - INFO - __main__ - Step 20110: {'lr': 0.00048175596281061135, 'samples': 3861120, 'steps': 20109, 'loss/train': 1.98557448387146} -08/30/2021 16:49:55 - INFO - __main__ - Step 20111: {'lr': 0.00048175397271667925, 'samples': 3861312, 'steps': 20110, 'loss/train': 1.6294634342193604} -08/30/2021 16:49:55 - INFO - __main__ - Step 20112: {'lr': 0.00048175198251832244, 'samples': 3861504, 'steps': 20111, 'loss/train': 1.6430479288101196} -08/30/2021 16:49:56 - INFO - __main__ - Step 20113: {'lr': 0.00048174999221554173, 'samples': 3861696, 'steps': 20112, 'loss/train': 1.6404865980148315} -08/30/2021 16:49:56 - INFO - __main__ - Step 20114: {'lr': 0.000481748001808338, 'samples': 3861888, 'steps': 20113, 'loss/train': 1.6970770359039307} -08/30/2021 16:49:56 - INFO - __main__ - Step 20115: {'lr': 0.00048174601129671223, 'samples': 3862080, 'steps': 20114, 'loss/train': 1.7774577140808105} -08/30/2021 16:49:58 - INFO - __main__ - Step 20116: {'lr': 0.00048174402068066534, 'samples': 3862272, 'steps': 20115, 'loss/train': 1.4758708477020264} -08/30/2021 16:49:58 - INFO - __main__ - Step 20117: {'lr': 0.0004817420299601981, 'samples': 3862464, 'steps': 20116, 'loss/train': 1.9957894086837769} -08/30/2021 16:49:59 - INFO - __main__ - Step 20118: {'lr': 0.0004817400391353115, 'samples': 3862656, 'steps': 20117, 'loss/train': 1.3740090131759644} -08/30/2021 16:49:59 - INFO - __main__ - Step 20119: {'lr': 0.00048173804820600646, 'samples': 3862848, 'steps': 20118, 'loss/train': 2.055910110473633} -08/30/2021 16:49:59 - INFO - __main__ - Step 20120: {'lr': 0.0004817360571722838, 'samples': 3863040, 'steps': 20119, 'loss/train': 1.3270663022994995} -08/30/2021 16:50:01 - INFO - __main__ - Step 20121: {'lr': 0.00048173406603414445, 'samples': 3863232, 'steps': 20120, 'loss/train': 1.580013632774353} -08/30/2021 16:50:01 - INFO - __main__ - Step 20122: {'lr': 0.00048173207479158933, 'samples': 3863424, 'steps': 20121, 'loss/train': 1.3592381477355957} -08/30/2021 16:50:02 - INFO - __main__ - Step 20123: {'lr': 0.0004817300834446192, 'samples': 3863616, 'steps': 20122, 'loss/train': 1.9252469539642334} -08/30/2021 16:50:02 - INFO - __main__ - Step 20124: {'lr': 0.0004817280919932352, 'samples': 3863808, 'steps': 20123, 'loss/train': 1.3935565948486328} -08/30/2021 16:50:02 - INFO - __main__ - Step 20125: {'lr': 0.000481726100437438, 'samples': 3864000, 'steps': 20124, 'loss/train': 1.8088167905807495} -08/30/2021 16:50:04 - INFO - __main__ - Step 20126: {'lr': 0.00048172410877722865, 'samples': 3864192, 'steps': 20125, 'loss/train': 1.7946019172668457} -08/30/2021 16:50:04 - INFO - __main__ - Step 20127: {'lr': 0.00048172211701260807, 'samples': 3864384, 'steps': 20126, 'loss/train': 0.818877100944519} -08/30/2021 16:50:05 - INFO - __main__ - Step 20128: {'lr': 0.0004817201251435769, 'samples': 3864576, 'steps': 20127, 'loss/train': 1.384813666343689} -08/30/2021 16:50:05 - INFO - __main__ - Step 20129: {'lr': 0.00048171813317013633, 'samples': 3864768, 'steps': 20128, 'loss/train': 1.5953658819198608} -08/30/2021 16:50:05 - INFO - __main__ - Step 20130: {'lr': 0.00048171614109228714, 'samples': 3864960, 'steps': 20129, 'loss/train': 1.6424446105957031} -08/30/2021 16:50:07 - INFO - __main__ - Step 20131: {'lr': 0.0004817141489100302, 'samples': 3865152, 'steps': 20130, 'loss/train': 1.778563141822815} -08/30/2021 16:50:07 - INFO - __main__ - Step 20132: {'lr': 0.0004817121566233665, 'samples': 3865344, 'steps': 20131, 'loss/train': 1.9810020923614502} -08/30/2021 16:50:08 - INFO - __main__ - Step 20133: {'lr': 0.0004817101642322968, 'samples': 3865536, 'steps': 20132, 'loss/train': 0.08221045136451721} -08/30/2021 16:50:08 - INFO - __main__ - Step 20134: {'lr': 0.00048170817173682215, 'samples': 3865728, 'steps': 20133, 'loss/train': 1.5096927881240845} -08/30/2021 16:50:08 - INFO - __main__ - Step 20135: {'lr': 0.00048170617913694333, 'samples': 3865920, 'steps': 20134, 'loss/train': 2.2990646362304688} -08/30/2021 16:50:10 - INFO - __main__ - Step 20136: {'lr': 0.00048170418643266125, 'samples': 3866112, 'steps': 20135, 'loss/train': 1.6849663257598877} -08/30/2021 16:50:10 - INFO - __main__ - Step 20137: {'lr': 0.00048170219362397685, 'samples': 3866304, 'steps': 20136, 'loss/train': 1.553839921951294} -08/30/2021 16:50:11 - INFO - __main__ - Step 20138: {'lr': 0.00048170020071089105, 'samples': 3866496, 'steps': 20137, 'loss/train': 1.7705405950546265} -08/30/2021 16:50:11 - INFO - __main__ - Step 20139: {'lr': 0.00048169820769340476, 'samples': 3866688, 'steps': 20138, 'loss/train': 0.19859115779399872} -08/30/2021 16:50:11 - INFO - __main__ - Step 20140: {'lr': 0.0004816962145715188, 'samples': 3866880, 'steps': 20139, 'loss/train': 1.2331286668777466} -08/30/2021 16:50:13 - INFO - __main__ - Step 20141: {'lr': 0.00048169422134523404, 'samples': 3867072, 'steps': 20140, 'loss/train': 1.1087123155593872} -08/30/2021 16:50:13 - INFO - __main__ - Step 20142: {'lr': 0.0004816922280145515, 'samples': 3867264, 'steps': 20141, 'loss/train': 1.4092648029327393} -08/30/2021 16:50:14 - INFO - __main__ - Step 20143: {'lr': 0.00048169023457947195, 'samples': 3867456, 'steps': 20142, 'loss/train': 1.1133297681808472} -08/30/2021 16:50:14 - INFO - __main__ - Step 20144: {'lr': 0.0004816882410399964, 'samples': 3867648, 'steps': 20143, 'loss/train': 1.3509678840637207} -08/30/2021 16:50:14 - INFO - __main__ - Step 20145: {'lr': 0.00048168624739612577, 'samples': 3867840, 'steps': 20144, 'loss/train': 1.8391437530517578} -08/30/2021 16:50:16 - INFO - __main__ - Step 20146: {'lr': 0.0004816842536478608, 'samples': 3868032, 'steps': 20145, 'loss/train': 3.161020517349243} -08/30/2021 16:50:16 - INFO - __main__ - Step 20147: {'lr': 0.00048168225979520254, 'samples': 3868224, 'steps': 20146, 'loss/train': 2.0961363315582275} -08/30/2021 16:50:17 - INFO - __main__ - Step 20148: {'lr': 0.0004816802658381518, 'samples': 3868416, 'steps': 20147, 'loss/train': 1.7573124170303345} -08/30/2021 16:50:17 - INFO - __main__ - Step 20149: {'lr': 0.00048167827177670946, 'samples': 3868608, 'steps': 20148, 'loss/train': 1.8705545663833618} -08/30/2021 16:50:18 - INFO - __main__ - Step 20150: {'lr': 0.0004816762776108765, 'samples': 3868800, 'steps': 20149, 'loss/train': 1.470387578010559} -08/30/2021 16:50:18 - INFO - __main__ - Step 20151: {'lr': 0.0004816742833406538, 'samples': 3868992, 'steps': 20150, 'loss/train': 2.1693620681762695} -08/30/2021 16:50:19 - INFO - __main__ - Step 20152: {'lr': 0.0004816722889660423, 'samples': 3869184, 'steps': 20151, 'loss/train': 1.0245689153671265} -08/30/2021 16:50:20 - INFO - __main__ - Step 20153: {'lr': 0.00048167029448704273, 'samples': 3869376, 'steps': 20152, 'loss/train': 1.4094831943511963} -08/30/2021 16:50:20 - INFO - __main__ - Step 20154: {'lr': 0.00048166829990365615, 'samples': 3869568, 'steps': 20153, 'loss/train': 1.484419822692871} -08/30/2021 16:50:20 - INFO - __main__ - Step 20155: {'lr': 0.0004816663052158834, 'samples': 3869760, 'steps': 20154, 'loss/train': 1.6280980110168457} -08/30/2021 16:50:21 - INFO - __main__ - Step 20156: {'lr': 0.0004816643104237254, 'samples': 3869952, 'steps': 20155, 'loss/train': 1.244726538658142} -08/30/2021 16:50:22 - INFO - __main__ - Step 20157: {'lr': 0.00048166231552718305, 'samples': 3870144, 'steps': 20156, 'loss/train': 1.5656678676605225} -08/30/2021 16:50:23 - INFO - __main__ - Step 20158: {'lr': 0.0004816603205262572, 'samples': 3870336, 'steps': 20157, 'loss/train': 1.7199552059173584} -08/30/2021 16:50:23 - INFO - __main__ - Step 20159: {'lr': 0.0004816583254209488, 'samples': 3870528, 'steps': 20158, 'loss/train': 1.8591266870498657} -08/30/2021 16:50:23 - INFO - __main__ - Step 20160: {'lr': 0.00048165633021125874, 'samples': 3870720, 'steps': 20159, 'loss/train': 1.7345173358917236} -08/30/2021 16:50:24 - INFO - __main__ - Step 20161: {'lr': 0.0004816543348971879, 'samples': 3870912, 'steps': 20160, 'loss/train': 1.5919828414916992} -08/30/2021 16:50:25 - INFO - __main__ - Step 20162: {'lr': 0.0004816523394787372, 'samples': 3871104, 'steps': 20161, 'loss/train': 1.9427335262298584} -08/30/2021 16:50:26 - INFO - __main__ - Step 20163: {'lr': 0.00048165034395590756, 'samples': 3871296, 'steps': 20162, 'loss/train': 2.0290613174438477} -08/30/2021 16:50:26 - INFO - __main__ - Step 20164: {'lr': 0.0004816483483286998, 'samples': 3871488, 'steps': 20163, 'loss/train': 0.8475186228752136} -08/30/2021 16:50:26 - INFO - __main__ - Step 20165: {'lr': 0.0004816463525971149, 'samples': 3871680, 'steps': 20164, 'loss/train': 1.5292781591415405} -08/30/2021 16:50:27 - INFO - __main__ - Step 20166: {'lr': 0.0004816443567611537, 'samples': 3871872, 'steps': 20165, 'loss/train': 1.7337758541107178} -08/30/2021 16:50:29 - INFO - __main__ - Step 20167: {'lr': 0.00048164236082081713, 'samples': 3872064, 'steps': 20166, 'loss/train': 1.8352793455123901} -08/30/2021 16:50:29 - INFO - __main__ - Step 20168: {'lr': 0.00048164036477610616, 'samples': 3872256, 'steps': 20167, 'loss/train': 1.8482677936553955} -08/30/2021 16:50:30 - INFO - __main__ - Step 20169: {'lr': 0.00048163836862702154, 'samples': 3872448, 'steps': 20168, 'loss/train': 0.8686457276344299} -08/30/2021 16:50:30 - INFO - __main__ - Step 20170: {'lr': 0.0004816363723735643, 'samples': 3872640, 'steps': 20169, 'loss/train': 1.7034279108047485} -08/30/2021 16:50:30 - INFO - __main__ - Step 20171: {'lr': 0.00048163437601573525, 'samples': 3872832, 'steps': 20170, 'loss/train': 0.10003358125686646} -08/30/2021 16:50:32 - INFO - __main__ - Step 20172: {'lr': 0.00048163237955353526, 'samples': 3873024, 'steps': 20171, 'loss/train': 1.6900075674057007} -08/30/2021 16:50:32 - INFO - __main__ - Step 20173: {'lr': 0.00048163038298696537, 'samples': 3873216, 'steps': 20172, 'loss/train': 1.5002872943878174} -08/30/2021 16:50:33 - INFO - __main__ - Step 20174: {'lr': 0.00048162838631602643, 'samples': 3873408, 'steps': 20173, 'loss/train': 1.8476632833480835} -08/30/2021 16:50:33 - INFO - __main__ - Step 20175: {'lr': 0.00048162638954071926, 'samples': 3873600, 'steps': 20174, 'loss/train': 1.378610372543335} -08/30/2021 16:50:33 - INFO - __main__ - Step 20176: {'lr': 0.0004816243926610448, 'samples': 3873792, 'steps': 20175, 'loss/train': 1.5293242931365967} -08/30/2021 16:50:35 - INFO - __main__ - Step 20177: {'lr': 0.000481622395677004, 'samples': 3873984, 'steps': 20176, 'loss/train': 1.675130844116211} -08/30/2021 16:50:35 - INFO - __main__ - Step 20178: {'lr': 0.0004816203985885977, 'samples': 3874176, 'steps': 20177, 'loss/train': 1.2655019760131836} -08/30/2021 16:50:36 - INFO - __main__ - Step 20179: {'lr': 0.0004816184013958268, 'samples': 3874368, 'steps': 20178, 'loss/train': 0.8092939257621765} -08/30/2021 16:50:36 - INFO - __main__ - Step 20180: {'lr': 0.0004816164040986923, 'samples': 3874560, 'steps': 20179, 'loss/train': 1.2360841035842896} -08/30/2021 16:50:36 - INFO - __main__ - Step 20181: {'lr': 0.00048161440669719496, 'samples': 3874752, 'steps': 20180, 'loss/train': 1.3704040050506592} -08/30/2021 16:50:37 - INFO - __main__ - Step 20182: {'lr': 0.00048161240919133573, 'samples': 3874944, 'steps': 20181, 'loss/train': 1.7986598014831543} -08/30/2021 16:50:39 - INFO - __main__ - Step 20183: {'lr': 0.00048161041158111564, 'samples': 3875136, 'steps': 20182, 'loss/train': 1.7684286832809448} -08/30/2021 16:50:39 - INFO - __main__ - Step 20184: {'lr': 0.0004816084138665353, 'samples': 3875328, 'steps': 20183, 'loss/train': 2.0559840202331543} -08/30/2021 16:50:40 - INFO - __main__ - Step 20185: {'lr': 0.00048160641604759593, 'samples': 3875520, 'steps': 20184, 'loss/train': 1.800355315208435} -08/30/2021 16:50:40 - INFO - __main__ - Step 20186: {'lr': 0.0004816044181242982, 'samples': 3875712, 'steps': 20185, 'loss/train': 1.0849143266677856} -08/30/2021 16:50:40 - INFO - __main__ - Step 20187: {'lr': 0.0004816024200966431, 'samples': 3875904, 'steps': 20186, 'loss/train': 1.4484061002731323} -08/30/2021 16:50:41 - INFO - __main__ - Step 20188: {'lr': 0.00048160042196463153, 'samples': 3876096, 'steps': 20187, 'loss/train': 1.6775819063186646} -08/30/2021 16:50:43 - INFO - __main__ - Step 20189: {'lr': 0.00048159842372826446, 'samples': 3876288, 'steps': 20188, 'loss/train': 0.43652939796447754} -08/30/2021 16:50:43 - INFO - __main__ - Step 20190: {'lr': 0.0004815964253875426, 'samples': 3876480, 'steps': 20189, 'loss/train': 1.82103431224823} -08/30/2021 16:50:44 - INFO - __main__ - Step 20191: {'lr': 0.000481594426942467, 'samples': 3876672, 'steps': 20190, 'loss/train': 1.695461630821228} -08/30/2021 16:50:44 - INFO - __main__ - Step 20192: {'lr': 0.0004815924283930385, 'samples': 3876864, 'steps': 20191, 'loss/train': 0.7486909031867981} -08/30/2021 16:50:45 - INFO - __main__ - Step 20193: {'lr': 0.0004815904297392582, 'samples': 3877056, 'steps': 20192, 'loss/train': 1.5004451274871826} -08/30/2021 16:50:45 - INFO - __main__ - Step 20194: {'lr': 0.00048158843098112657, 'samples': 3877248, 'steps': 20193, 'loss/train': 0.9767536520957947} -08/30/2021 16:50:45 - INFO - __main__ - Step 20195: {'lr': 0.00048158643211864495, 'samples': 3877440, 'steps': 20194, 'loss/train': 0.047608163207769394} -08/30/2021 16:50:47 - INFO - __main__ - Step 20196: {'lr': 0.000481584433151814, 'samples': 3877632, 'steps': 20195, 'loss/train': 0.05013556405901909} -08/30/2021 16:50:47 - INFO - __main__ - Step 20197: {'lr': 0.00048158243408063465, 'samples': 3877824, 'steps': 20196, 'loss/train': 1.9597336053848267} -08/30/2021 16:50:47 - INFO - __main__ - Step 20198: {'lr': 0.0004815804349051078, 'samples': 3878016, 'steps': 20197, 'loss/train': 1.4055026769638062} -08/30/2021 16:50:48 - INFO - __main__ - Step 20199: {'lr': 0.0004815784356252344, 'samples': 3878208, 'steps': 20198, 'loss/train': 1.3472555875778198} -08/30/2021 16:50:48 - INFO - __main__ - Step 20200: {'lr': 0.0004815764362410154, 'samples': 3878400, 'steps': 20199, 'loss/train': 2.0765771865844727} -08/30/2021 16:50:50 - INFO - __main__ - Step 20201: {'lr': 0.0004815744367524516, 'samples': 3878592, 'steps': 20200, 'loss/train': 1.5773504972457886} -08/30/2021 16:50:50 - INFO - __main__ - Step 20202: {'lr': 0.0004815724371595439, 'samples': 3878784, 'steps': 20201, 'loss/train': 2.0365428924560547} -08/30/2021 16:50:51 - INFO - __main__ - Step 20203: {'lr': 0.00048157043746229324, 'samples': 3878976, 'steps': 20202, 'loss/train': 1.6232331991195679} -08/30/2021 16:50:51 - INFO - __main__ - Step 20204: {'lr': 0.0004815684376607006, 'samples': 3879168, 'steps': 20203, 'loss/train': 1.6831016540527344} -08/30/2021 16:50:52 - INFO - __main__ - Step 20205: {'lr': 0.0004815664377547667, 'samples': 3879360, 'steps': 20204, 'loss/train': 1.1959266662597656} -08/30/2021 16:50:52 - INFO - __main__ - Step 20206: {'lr': 0.00048156443774449254, 'samples': 3879552, 'steps': 20205, 'loss/train': 1.4080724716186523} -08/30/2021 16:50:53 - INFO - __main__ - Step 20207: {'lr': 0.00048156243762987905, 'samples': 3879744, 'steps': 20206, 'loss/train': 0.19121168553829193} -08/30/2021 16:50:54 - INFO - __main__ - Step 20208: {'lr': 0.00048156043741092705, 'samples': 3879936, 'steps': 20207, 'loss/train': 1.7060894966125488} -08/30/2021 16:50:54 - INFO - __main__ - Step 20209: {'lr': 0.00048155843708763755, 'samples': 3880128, 'steps': 20208, 'loss/train': 1.4156874418258667} -08/30/2021 16:50:54 - INFO - __main__ - Step 20210: {'lr': 0.0004815564366600114, 'samples': 3880320, 'steps': 20209, 'loss/train': 1.5062568187713623} -08/30/2021 16:50:55 - INFO - __main__ - Step 20211: {'lr': 0.0004815544361280494, 'samples': 3880512, 'steps': 20210, 'loss/train': 1.4830186367034912} -08/30/2021 16:50:56 - INFO - __main__ - Step 20212: {'lr': 0.00048155243549175263, 'samples': 3880704, 'steps': 20211, 'loss/train': 1.079834222793579} -08/30/2021 16:50:57 - INFO - __main__ - Step 20213: {'lr': 0.00048155043475112184, 'samples': 3880896, 'steps': 20212, 'loss/train': 2.0521597862243652} -08/30/2021 16:50:57 - INFO - __main__ - Step 20214: {'lr': 0.0004815484339061581, 'samples': 3881088, 'steps': 20213, 'loss/train': 1.731704831123352} -08/30/2021 16:50:58 - INFO - __main__ - Step 20215: {'lr': 0.0004815464329568621, 'samples': 3881280, 'steps': 20214, 'loss/train': 1.4401785135269165} -08/30/2021 16:50:58 - INFO - __main__ - Step 20216: {'lr': 0.00048154443190323495, 'samples': 3881472, 'steps': 20215, 'loss/train': 1.3341749906539917} -08/30/2021 16:51:00 - INFO - __main__ - Step 20217: {'lr': 0.0004815424307452774, 'samples': 3881664, 'steps': 20216, 'loss/train': 1.637634515762329} -08/30/2021 16:51:00 - INFO - __main__ - Step 20218: {'lr': 0.0004815404294829904, 'samples': 3881856, 'steps': 20217, 'loss/train': 1.7783867120742798} -08/30/2021 16:51:01 - INFO - __main__ - Step 20219: {'lr': 0.0004815384281163748, 'samples': 3882048, 'steps': 20218, 'loss/train': 1.814454436302185} -08/30/2021 16:51:01 - INFO - __main__ - Step 20220: {'lr': 0.0004815364266454316, 'samples': 3882240, 'steps': 20219, 'loss/train': 1.4207069873809814} -08/30/2021 16:51:01 - INFO - __main__ - Step 20221: {'lr': 0.00048153442507016173, 'samples': 3882432, 'steps': 20220, 'loss/train': 1.6495163440704346} -08/30/2021 16:51:03 - INFO - __main__ - Step 20222: {'lr': 0.00048153242339056594, 'samples': 3882624, 'steps': 20221, 'loss/train': 1.6814595460891724} -08/30/2021 16:51:04 - INFO - __main__ - Step 20223: {'lr': 0.0004815304216066453, 'samples': 3882816, 'steps': 20222, 'loss/train': 0.20040147006511688} -08/30/2021 16:51:04 - INFO - __main__ - Step 20224: {'lr': 0.0004815284197184005, 'samples': 3883008, 'steps': 20223, 'loss/train': 1.9685205221176147} -08/30/2021 16:51:04 - INFO - __main__ - Step 20225: {'lr': 0.0004815264177258326, 'samples': 3883200, 'steps': 20224, 'loss/train': 1.3303196430206299} -08/30/2021 16:51:05 - INFO - __main__ - Step 20226: {'lr': 0.00048152441562894255, 'samples': 3883392, 'steps': 20225, 'loss/train': 1.6731454133987427} -08/30/2021 16:51:06 - INFO - __main__ - Step 20227: {'lr': 0.0004815224134277311, 'samples': 3883584, 'steps': 20226, 'loss/train': 1.7326157093048096} -08/30/2021 16:51:07 - INFO - __main__ - Step 20228: {'lr': 0.00048152041112219926, 'samples': 3883776, 'steps': 20227, 'loss/train': 1.5589109659194946} -08/30/2021 16:51:07 - INFO - __main__ - Step 20229: {'lr': 0.0004815184087123479, 'samples': 3883968, 'steps': 20228, 'loss/train': 0.0714040994644165} -08/30/2021 16:51:07 - INFO - __main__ - Step 20230: {'lr': 0.0004815164061981778, 'samples': 3884160, 'steps': 20229, 'loss/train': 1.3627091646194458} -08/30/2021 16:51:08 - INFO - __main__ - Step 20231: {'lr': 0.0004815144035796901, 'samples': 3884352, 'steps': 20230, 'loss/train': 1.625974178314209} -08/30/2021 16:51:09 - INFO - __main__ - Step 20232: {'lr': 0.0004815124008568856, 'samples': 3884544, 'steps': 20231, 'loss/train': 1.6093692779541016} -08/30/2021 16:51:10 - INFO - __main__ - Step 20233: {'lr': 0.00048151039802976517, 'samples': 3884736, 'steps': 20232, 'loss/train': 1.4500622749328613} -08/30/2021 16:51:10 - INFO - __main__ - Step 20234: {'lr': 0.00048150839509832966, 'samples': 3884928, 'steps': 20233, 'loss/train': 1.9628890752792358} -08/30/2021 16:51:10 - INFO - __main__ - Step 20235: {'lr': 0.0004815063920625801, 'samples': 3885120, 'steps': 20234, 'loss/train': 1.5627418756484985} -08/30/2021 16:51:11 - INFO - __main__ - Step 20236: {'lr': 0.00048150438892251724, 'samples': 3885312, 'steps': 20235, 'loss/train': 1.7016435861587524} -08/30/2021 16:51:11 - INFO - __main__ - Step 20237: {'lr': 0.00048150238567814217, 'samples': 3885504, 'steps': 20236, 'loss/train': 2.050870418548584} -08/30/2021 16:51:13 - INFO - __main__ - Step 20238: {'lr': 0.0004815003823294557, 'samples': 3885696, 'steps': 20237, 'loss/train': 1.4891928434371948} -08/30/2021 16:51:13 - INFO - __main__ - Step 20239: {'lr': 0.0004814983788764587, 'samples': 3885888, 'steps': 20238, 'loss/train': 1.7690858840942383} -08/30/2021 16:51:13 - INFO - __main__ - Step 20240: {'lr': 0.00048149637531915215, 'samples': 3886080, 'steps': 20239, 'loss/train': 1.8192404508590698} -08/30/2021 16:51:14 - INFO - __main__ - Step 20241: {'lr': 0.00048149437165753684, 'samples': 3886272, 'steps': 20240, 'loss/train': 1.5038063526153564} -08/30/2021 16:51:14 - INFO - __main__ - Step 20242: {'lr': 0.00048149236789161374, 'samples': 3886464, 'steps': 20241, 'loss/train': 1.7118151187896729} -08/30/2021 16:51:16 - INFO - __main__ - Step 20243: {'lr': 0.0004814903640213838, 'samples': 3886656, 'steps': 20242, 'loss/train': 1.7593092918395996} -08/30/2021 16:51:16 - INFO - __main__ - Step 20244: {'lr': 0.0004814883600468478, 'samples': 3886848, 'steps': 20243, 'loss/train': 1.4841561317443848} -08/30/2021 16:51:16 - INFO - __main__ - Step 20245: {'lr': 0.0004814863559680068, 'samples': 3887040, 'steps': 20244, 'loss/train': 1.5900686979293823} -08/30/2021 16:51:17 - INFO - __main__ - Step 20246: {'lr': 0.00048148435178486156, 'samples': 3887232, 'steps': 20245, 'loss/train': 1.7600446939468384} -08/30/2021 16:51:17 - INFO - __main__ - Step 20247: {'lr': 0.00048148234749741304, 'samples': 3887424, 'steps': 20246, 'loss/train': 1.2677690982818604} -08/30/2021 16:51:19 - INFO - __main__ - Step 20248: {'lr': 0.0004814803431056622, 'samples': 3887616, 'steps': 20247, 'loss/train': 0.11285198479890823} -08/30/2021 16:51:19 - INFO - __main__ - Step 20249: {'lr': 0.0004814783386096099, 'samples': 3887808, 'steps': 20248, 'loss/train': 1.5451240539550781} -08/30/2021 16:51:19 - INFO - __main__ - Step 20250: {'lr': 0.00048147633400925693, 'samples': 3888000, 'steps': 20249, 'loss/train': 1.4259566068649292} -08/30/2021 16:51:20 - INFO - __main__ - Step 20251: {'lr': 0.00048147432930460433, 'samples': 3888192, 'steps': 20250, 'loss/train': 1.0979019403457642} -08/30/2021 16:51:20 - INFO - __main__ - Step 20252: {'lr': 0.00048147232449565305, 'samples': 3888384, 'steps': 20251, 'loss/train': 1.3598960638046265} -08/30/2021 16:51:22 - INFO - __main__ - Step 20253: {'lr': 0.00048147031958240384, 'samples': 3888576, 'steps': 20252, 'loss/train': 1.4012603759765625} -08/30/2021 16:51:22 - INFO - __main__ - Step 20254: {'lr': 0.00048146831456485776, 'samples': 3888768, 'steps': 20253, 'loss/train': 1.9264036417007446} -08/30/2021 16:51:22 - INFO - __main__ - Step 20255: {'lr': 0.0004814663094430155, 'samples': 3888960, 'steps': 20254, 'loss/train': 1.0462913513183594} -08/30/2021 16:51:23 - INFO - __main__ - Step 20256: {'lr': 0.00048146430421687817, 'samples': 3889152, 'steps': 20255, 'loss/train': 2.1124379634857178} -08/30/2021 16:51:23 - INFO - __main__ - Step 20257: {'lr': 0.00048146229888644656, 'samples': 3889344, 'steps': 20256, 'loss/train': 1.7220581769943237} -08/30/2021 16:51:24 - INFO - __main__ - Step 20258: {'lr': 0.00048146029345172165, 'samples': 3889536, 'steps': 20257, 'loss/train': 2.0938880443573} -08/30/2021 16:51:25 - INFO - __main__ - Step 20259: {'lr': 0.0004814582879127043, 'samples': 3889728, 'steps': 20258, 'loss/train': 1.6154398918151855} -08/30/2021 16:51:25 - INFO - __main__ - Step 20260: {'lr': 0.0004814562822693954, 'samples': 3889920, 'steps': 20259, 'loss/train': 1.5098820924758911} -08/30/2021 16:51:26 - INFO - __main__ - Step 20261: {'lr': 0.00048145427652179583, 'samples': 3890112, 'steps': 20260, 'loss/train': 1.702278733253479} -08/30/2021 16:51:26 - INFO - __main__ - Step 20262: {'lr': 0.0004814522706699066, 'samples': 3890304, 'steps': 20261, 'loss/train': 2.050403356552124} -08/30/2021 16:51:27 - INFO - __main__ - Step 20263: {'lr': 0.00048145026471372855, 'samples': 3890496, 'steps': 20262, 'loss/train': 1.369707703590393} -08/30/2021 16:51:28 - INFO - __main__ - Step 20264: {'lr': 0.0004814482586532626, 'samples': 3890688, 'steps': 20263, 'loss/train': 1.726524829864502} -08/30/2021 16:51:28 - INFO - __main__ - Step 20265: {'lr': 0.00048144625248850955, 'samples': 3890880, 'steps': 20264, 'loss/train': 1.3683204650878906} -08/30/2021 16:51:29 - INFO - __main__ - Step 20266: {'lr': 0.0004814442462194704, 'samples': 3891072, 'steps': 20265, 'loss/train': 1.4735925197601318} -08/30/2021 16:51:29 - INFO - __main__ - Step 20267: {'lr': 0.0004814422398461461, 'samples': 3891264, 'steps': 20266, 'loss/train': 1.1498258113861084} -08/30/2021 16:51:29 - INFO - __main__ - Step 20268: {'lr': 0.00048144023336853746, 'samples': 3891456, 'steps': 20267, 'loss/train': 1.1298660039901733} -08/30/2021 16:51:31 - INFO - __main__ - Step 20269: {'lr': 0.00048143822678664545, 'samples': 3891648, 'steps': 20268, 'loss/train': 1.6574901342391968} -08/30/2021 16:51:31 - INFO - __main__ - Step 20270: {'lr': 0.00048143622010047096, 'samples': 3891840, 'steps': 20269, 'loss/train': 1.2668615579605103} -08/30/2021 16:51:32 - INFO - __main__ - Step 20271: {'lr': 0.0004814342133100149, 'samples': 3892032, 'steps': 20270, 'loss/train': 1.652359962463379} -08/30/2021 16:51:32 - INFO - __main__ - Step 20272: {'lr': 0.00048143220641527805, 'samples': 3892224, 'steps': 20271, 'loss/train': 0.955489456653595} -08/30/2021 16:51:32 - INFO - __main__ - Step 20273: {'lr': 0.0004814301994162615, 'samples': 3892416, 'steps': 20272, 'loss/train': 1.2216873168945312} -08/30/2021 16:51:34 - INFO - __main__ - Step 20274: {'lr': 0.000481428192312966, 'samples': 3892608, 'steps': 20273, 'loss/train': 0.6006215214729309} -08/30/2021 16:51:35 - INFO - __main__ - Step 20275: {'lr': 0.0004814261851053926, 'samples': 3892800, 'steps': 20274, 'loss/train': 2.2969014644622803} -08/30/2021 16:51:35 - INFO - __main__ - Step 20276: {'lr': 0.00048142417779354214, 'samples': 3892992, 'steps': 20275, 'loss/train': 1.3134269714355469} -08/30/2021 16:51:35 - INFO - __main__ - Step 20277: {'lr': 0.0004814221703774155, 'samples': 3893184, 'steps': 20276, 'loss/train': 1.9949308633804321} -08/30/2021 16:51:36 - INFO - __main__ - Step 20278: {'lr': 0.00048142016285701356, 'samples': 3893376, 'steps': 20277, 'loss/train': 0.6431128978729248} -08/30/2021 16:51:37 - INFO - __main__ - Step 20279: {'lr': 0.00048141815523233735, 'samples': 3893568, 'steps': 20278, 'loss/train': 1.374727487564087} -08/30/2021 16:51:38 - INFO - __main__ - Step 20280: {'lr': 0.00048141614750338757, 'samples': 3893760, 'steps': 20279, 'loss/train': 1.5767276287078857} -08/30/2021 16:51:38 - INFO - __main__ - Step 20281: {'lr': 0.00048141413967016535, 'samples': 3893952, 'steps': 20280, 'loss/train': 2.1855556964874268} -08/30/2021 16:51:38 - INFO - __main__ - Step 20282: {'lr': 0.00048141213173267145, 'samples': 3894144, 'steps': 20281, 'loss/train': 1.0905746221542358} -08/30/2021 16:51:39 - INFO - __main__ - Step 20283: {'lr': 0.0004814101236909068, 'samples': 3894336, 'steps': 20282, 'loss/train': 1.8638893365859985} -08/30/2021 16:51:40 - INFO - __main__ - Step 20284: {'lr': 0.00048140811554487234, 'samples': 3894528, 'steps': 20283, 'loss/train': 1.758457064628601} -08/30/2021 16:51:41 - INFO - __main__ - Step 20285: {'lr': 0.000481406107294569, 'samples': 3894720, 'steps': 20284, 'loss/train': 1.4025347232818604} -08/30/2021 16:51:41 - INFO - __main__ - Step 20286: {'lr': 0.0004814040989399975, 'samples': 3894912, 'steps': 20285, 'loss/train': 1.8196550607681274} -08/30/2021 16:51:41 - INFO - __main__ - Step 20287: {'lr': 0.000481402090481159, 'samples': 3895104, 'steps': 20286, 'loss/train': 1.3624060153961182} -08/30/2021 16:51:42 - INFO - __main__ - Step 20288: {'lr': 0.0004814000819180543, 'samples': 3895296, 'steps': 20287, 'loss/train': 0.644443929195404} -08/30/2021 16:51:42 - INFO - __main__ - Step 20289: {'lr': 0.00048139807325068423, 'samples': 3895488, 'steps': 20288, 'loss/train': 1.156691074371338} -08/30/2021 16:51:44 - INFO - __main__ - Step 20290: {'lr': 0.0004813960644790498, 'samples': 3895680, 'steps': 20289, 'loss/train': 1.8000234365463257} -08/30/2021 16:51:44 - INFO - __main__ - Step 20291: {'lr': 0.00048139405560315186, 'samples': 3895872, 'steps': 20290, 'loss/train': 1.5448402166366577} -08/30/2021 16:51:44 - INFO - __main__ - Step 20292: {'lr': 0.0004813920466229913, 'samples': 3896064, 'steps': 20291, 'loss/train': 2.0204708576202393} -08/30/2021 16:51:45 - INFO - __main__ - Step 20293: {'lr': 0.0004813900375385691, 'samples': 3896256, 'steps': 20292, 'loss/train': 1.535262107849121} -08/30/2021 16:51:45 - INFO - __main__ - Step 20294: {'lr': 0.0004813880283498861, 'samples': 3896448, 'steps': 20293, 'loss/train': 1.7797614336013794} -08/30/2021 16:51:47 - INFO - __main__ - Step 20295: {'lr': 0.00048138601905694324, 'samples': 3896640, 'steps': 20294, 'loss/train': 1.4918376207351685} -08/30/2021 16:51:47 - INFO - __main__ - Step 20296: {'lr': 0.0004813840096597414, 'samples': 3896832, 'steps': 20295, 'loss/train': 1.7750217914581299} -08/30/2021 16:51:47 - INFO - __main__ - Step 20297: {'lr': 0.00048138200015828146, 'samples': 3897024, 'steps': 20296, 'loss/train': 0.6045969724655151} -08/30/2021 16:51:48 - INFO - __main__ - Step 20298: {'lr': 0.00048137999055256444, 'samples': 3897216, 'steps': 20297, 'loss/train': 1.321756362915039} -08/30/2021 16:51:48 - INFO - __main__ - Step 20299: {'lr': 0.0004813779808425911, 'samples': 3897408, 'steps': 20298, 'loss/train': 2.277691125869751} -08/30/2021 16:51:50 - INFO - __main__ - Step 20300: {'lr': 0.0004813759710283624, 'samples': 3897600, 'steps': 20299, 'loss/train': 1.074888825416565} -08/30/2021 16:51:51 - INFO - __main__ - Step 20301: {'lr': 0.0004813739611098793, 'samples': 3897792, 'steps': 20300, 'loss/train': 1.1064374446868896} -08/30/2021 16:51:51 - INFO - __main__ - Step 20302: {'lr': 0.00048137195108714266, 'samples': 3897984, 'steps': 20301, 'loss/train': 1.246031641960144} -08/30/2021 16:51:51 - INFO - __main__ - Step 20303: {'lr': 0.00048136994096015343, 'samples': 3898176, 'steps': 20302, 'loss/train': 2.2300167083740234} -08/30/2021 16:51:52 - INFO - __main__ - Step 20304: {'lr': 0.00048136793072891236, 'samples': 3898368, 'steps': 20303, 'loss/train': 0.9699680805206299} -08/30/2021 16:51:52 - INFO - __main__ - Step 20305: {'lr': 0.00048136592039342053, 'samples': 3898560, 'steps': 20304, 'loss/train': 0.25588709115982056} -08/30/2021 16:51:54 - INFO - __main__ - Step 20306: {'lr': 0.0004813639099536789, 'samples': 3898752, 'steps': 20305, 'loss/train': 0.08922585099935532} -08/30/2021 16:51:54 - INFO - __main__ - Step 20307: {'lr': 0.0004813618994096881, 'samples': 3898944, 'steps': 20306, 'loss/train': 1.9414191246032715} -08/30/2021 16:51:54 - INFO - __main__ - Step 20308: {'lr': 0.0004813598887614492, 'samples': 3899136, 'steps': 20307, 'loss/train': 2.3342318534851074} -08/30/2021 16:51:55 - INFO - __main__ - Step 20309: {'lr': 0.0004813578780089632, 'samples': 3899328, 'steps': 20308, 'loss/train': 1.780541181564331} -08/30/2021 16:51:55 - INFO - __main__ - Step 20310: {'lr': 0.00048135586715223087, 'samples': 3899520, 'steps': 20309, 'loss/train': 1.5144213438034058} -08/30/2021 16:51:56 - INFO - __main__ - Step 20311: {'lr': 0.00048135385619125316, 'samples': 3899712, 'steps': 20310, 'loss/train': 1.6306337118148804} -08/30/2021 16:51:57 - INFO - __main__ - Step 20312: {'lr': 0.00048135184512603093, 'samples': 3899904, 'steps': 20311, 'loss/train': 1.8974195718765259} -08/30/2021 16:51:57 - INFO - __main__ - Step 20313: {'lr': 0.00048134983395656516, 'samples': 3900096, 'steps': 20312, 'loss/train': 1.349603533744812} -08/30/2021 16:51:58 - INFO - __main__ - Step 20314: {'lr': 0.00048134782268285676, 'samples': 3900288, 'steps': 20313, 'loss/train': 1.4073094129562378} -08/30/2021 16:51:58 - INFO - __main__ - Step 20315: {'lr': 0.00048134581130490655, 'samples': 3900480, 'steps': 20314, 'loss/train': 0.14571332931518555} -08/30/2021 16:51:59 - INFO - __main__ - Step 20316: {'lr': 0.0004813437998227155, 'samples': 3900672, 'steps': 20315, 'loss/train': 1.4282830953598022} -08/30/2021 16:52:00 - INFO - __main__ - Step 20317: {'lr': 0.00048134178823628455, 'samples': 3900864, 'steps': 20316, 'loss/train': 0.07498446106910706} -08/30/2021 16:52:00 - INFO - __main__ - Step 20318: {'lr': 0.0004813397765456145, 'samples': 3901056, 'steps': 20317, 'loss/train': 1.475098729133606} -08/30/2021 16:52:01 - INFO - __main__ - Step 20319: {'lr': 0.00048133776475070637, 'samples': 3901248, 'steps': 20318, 'loss/train': 1.4537569284439087} -08/30/2021 16:52:01 - INFO - __main__ - Step 20320: {'lr': 0.00048133575285156093, 'samples': 3901440, 'steps': 20319, 'loss/train': 1.7889646291732788} -08/30/2021 16:52:03 - INFO - __main__ - Step 20321: {'lr': 0.00048133374084817927, 'samples': 3901632, 'steps': 20320, 'loss/train': 1.2979167699813843} -08/30/2021 16:52:03 - INFO - __main__ - Step 20322: {'lr': 0.00048133172874056213, 'samples': 3901824, 'steps': 20321, 'loss/train': 1.4164572954177856} -08/30/2021 16:52:04 - INFO - __main__ - Step 20323: {'lr': 0.0004813297165287105, 'samples': 3902016, 'steps': 20322, 'loss/train': 0.38410359621047974} -08/30/2021 16:52:04 - INFO - __main__ - Step 20324: {'lr': 0.00048132770421262526, 'samples': 3902208, 'steps': 20323, 'loss/train': 1.6559373140335083} -08/30/2021 16:52:04 - INFO - __main__ - Step 20325: {'lr': 0.00048132569179230736, 'samples': 3902400, 'steps': 20324, 'loss/train': 1.012794852256775} -08/30/2021 16:52:06 - INFO - __main__ - Step 20326: {'lr': 0.0004813236792677577, 'samples': 3902592, 'steps': 20325, 'loss/train': 1.9623057842254639} -08/30/2021 16:52:07 - INFO - __main__ - Step 20327: {'lr': 0.00048132166663897703, 'samples': 3902784, 'steps': 20326, 'loss/train': 1.7337126731872559} -08/30/2021 16:52:07 - INFO - __main__ - Step 20328: {'lr': 0.0004813196539059665, 'samples': 3902976, 'steps': 20327, 'loss/train': 1.6525582075119019} -08/30/2021 16:52:08 - INFO - __main__ - Step 20329: {'lr': 0.0004813176410687269, 'samples': 3903168, 'steps': 20328, 'loss/train': 1.8098485469818115} -08/30/2021 16:52:08 - INFO - __main__ - Step 20330: {'lr': 0.00048131562812725904, 'samples': 3903360, 'steps': 20329, 'loss/train': 1.4743527173995972} -08/30/2021 16:52:09 - INFO - __main__ - Step 20331: {'lr': 0.000481313615081564, 'samples': 3903552, 'steps': 20330, 'loss/train': 0.7975194454193115} -08/30/2021 16:52:10 - INFO - __main__ - Step 20332: {'lr': 0.00048131160193164266, 'samples': 3903744, 'steps': 20331, 'loss/train': 1.6436889171600342} -08/30/2021 16:52:10 - INFO - __main__ - Step 20333: {'lr': 0.0004813095886774958, 'samples': 3903936, 'steps': 20332, 'loss/train': 1.3344805240631104} -08/30/2021 16:52:11 - INFO - __main__ - Step 20334: {'lr': 0.00048130757531912447, 'samples': 3904128, 'steps': 20333, 'loss/train': 1.0350271463394165} -08/30/2021 16:52:11 - INFO - __main__ - Step 20335: {'lr': 0.00048130556185652947, 'samples': 3904320, 'steps': 20334, 'loss/train': 1.1588261127471924} -08/30/2021 16:52:13 - INFO - __main__ - Step 20336: {'lr': 0.0004813035482897118, 'samples': 3904512, 'steps': 20335, 'loss/train': 0.1003037616610527} -08/30/2021 16:52:13 - INFO - __main__ - Step 20337: {'lr': 0.00048130153461867225, 'samples': 3904704, 'steps': 20336, 'loss/train': 1.3650394678115845} -08/30/2021 16:52:13 - INFO - __main__ - Step 20338: {'lr': 0.0004812995208434119, 'samples': 3904896, 'steps': 20337, 'loss/train': 1.2996113300323486} -08/30/2021 16:52:14 - INFO - __main__ - Step 20339: {'lr': 0.00048129750696393144, 'samples': 3905088, 'steps': 20338, 'loss/train': 0.38042551279067993} -08/30/2021 16:52:14 - INFO - __main__ - Step 20340: {'lr': 0.00048129549298023196, 'samples': 3905280, 'steps': 20339, 'loss/train': 2.639559745788574} -08/30/2021 16:52:16 - INFO - __main__ - Step 20341: {'lr': 0.0004812934788923143, 'samples': 3905472, 'steps': 20340, 'loss/train': 2.066987991333008} -08/30/2021 16:52:16 - INFO - __main__ - Step 20342: {'lr': 0.00048129146470017933, 'samples': 3905664, 'steps': 20341, 'loss/train': 1.4800901412963867} -08/30/2021 16:52:16 - INFO - __main__ - Step 20343: {'lr': 0.000481289450403828, 'samples': 3905856, 'steps': 20342, 'loss/train': 1.8806313276290894} -08/30/2021 16:52:17 - INFO - __main__ - Step 20344: {'lr': 0.0004812874360032613, 'samples': 3906048, 'steps': 20343, 'loss/train': 0.0669122040271759} -08/30/2021 16:52:17 - INFO - __main__ - Step 20345: {'lr': 0.0004812854214984799, 'samples': 3906240, 'steps': 20344, 'loss/train': 1.2670842409133911} -08/30/2021 16:52:19 - INFO - __main__ - Step 20346: {'lr': 0.000481283406889485, 'samples': 3906432, 'steps': 20345, 'loss/train': 1.4036363363265991} -08/30/2021 16:52:19 - INFO - __main__ - Step 20347: {'lr': 0.00048128139217627725, 'samples': 3906624, 'steps': 20346, 'loss/train': 1.4741283655166626} -08/30/2021 16:52:20 - INFO - __main__ - Step 20348: {'lr': 0.00048127937735885774, 'samples': 3906816, 'steps': 20347, 'loss/train': 1.190222978591919} -08/30/2021 16:52:20 - INFO - __main__ - Step 20349: {'lr': 0.0004812773624372273, 'samples': 3907008, 'steps': 20348, 'loss/train': 1.4741625785827637} -08/30/2021 16:52:20 - INFO - __main__ - Step 20350: {'lr': 0.0004812753474113869, 'samples': 3907200, 'steps': 20349, 'loss/train': 0.13493667542934418} -08/30/2021 16:52:21 - INFO - __main__ - Step 20351: {'lr': 0.0004812733322813373, 'samples': 3907392, 'steps': 20350, 'loss/train': 1.3247870206832886} -08/30/2021 16:52:22 - INFO - __main__ - Step 20352: {'lr': 0.00048127131704707953, 'samples': 3907584, 'steps': 20351, 'loss/train': 1.2110882997512817} -08/30/2021 16:52:23 - INFO - __main__ - Step 20353: {'lr': 0.0004812693017086145, 'samples': 3907776, 'steps': 20352, 'loss/train': 1.2169265747070312} -08/30/2021 16:52:23 - INFO - __main__ - Step 20354: {'lr': 0.00048126728626594315, 'samples': 3907968, 'steps': 20353, 'loss/train': 1.8783468008041382} -08/30/2021 16:52:24 - INFO - __main__ - Step 20355: {'lr': 0.00048126527071906623, 'samples': 3908160, 'steps': 20354, 'loss/train': 1.3172804117202759} -08/30/2021 16:52:24 - INFO - __main__ - Step 20356: {'lr': 0.0004812632550679848, 'samples': 3908352, 'steps': 20355, 'loss/train': 1.304091215133667} -08/30/2021 16:52:25 - INFO - __main__ - Step 20357: {'lr': 0.00048126123931269973, 'samples': 3908544, 'steps': 20356, 'loss/train': 2.1128251552581787} -08/30/2021 16:52:26 - INFO - __main__ - Step 20358: {'lr': 0.0004812592234532118, 'samples': 3908736, 'steps': 20357, 'loss/train': 1.362840175628662} -08/30/2021 16:52:26 - INFO - __main__ - Step 20359: {'lr': 0.00048125720748952216, 'samples': 3908928, 'steps': 20358, 'loss/train': 1.3950108289718628} -08/30/2021 16:52:27 - INFO - __main__ - Step 20360: {'lr': 0.00048125519142163157, 'samples': 3909120, 'steps': 20359, 'loss/train': 1.794309139251709} -08/30/2021 16:52:27 - INFO - __main__ - Step 20361: {'lr': 0.0004812531752495409, 'samples': 3909312, 'steps': 20360, 'loss/train': 1.2508519887924194} -08/30/2021 16:52:28 - INFO - __main__ - Step 20362: {'lr': 0.00048125115897325115, 'samples': 3909504, 'steps': 20361, 'loss/train': 1.7729012966156006} -08/30/2021 16:52:29 - INFO - __main__ - Step 20363: {'lr': 0.0004812491425927632, 'samples': 3909696, 'steps': 20362, 'loss/train': 1.9157298803329468} -08/30/2021 16:52:29 - INFO - __main__ - Step 20364: {'lr': 0.000481247126108078, 'samples': 3909888, 'steps': 20363, 'loss/train': 0.7351324558258057} -08/30/2021 16:52:29 - INFO - __main__ - Step 20365: {'lr': 0.00048124510951919633, 'samples': 3910080, 'steps': 20364, 'loss/train': 1.759158968925476} -08/30/2021 16:52:30 - INFO - __main__ - Step 20366: {'lr': 0.0004812430928261192, 'samples': 3910272, 'steps': 20365, 'loss/train': 1.376376748085022} -08/30/2021 16:52:30 - INFO - __main__ - Step 20367: {'lr': 0.00048124107602884753, 'samples': 3910464, 'steps': 20366, 'loss/train': 0.8080965876579285} -08/30/2021 16:52:32 - INFO - __main__ - Step 20368: {'lr': 0.0004812390591273822, 'samples': 3910656, 'steps': 20367, 'loss/train': 2.2293286323547363} -08/30/2021 16:52:32 - INFO - __main__ - Step 20369: {'lr': 0.00048123704212172416, 'samples': 3910848, 'steps': 20368, 'loss/train': 1.5028109550476074} -08/30/2021 16:52:32 - INFO - __main__ - Step 20370: {'lr': 0.0004812350250118742, 'samples': 3911040, 'steps': 20369, 'loss/train': 1.318708896636963} -08/30/2021 16:52:33 - INFO - __main__ - Step 20371: {'lr': 0.0004812330077978333, 'samples': 3911232, 'steps': 20370, 'loss/train': 1.5189670324325562} -08/30/2021 16:52:33 - INFO - __main__ - Step 20372: {'lr': 0.0004812309904796024, 'samples': 3911424, 'steps': 20371, 'loss/train': 2.112004518508911} -08/30/2021 16:52:35 - INFO - __main__ - Step 20373: {'lr': 0.0004812289730571824, 'samples': 3911616, 'steps': 20372, 'loss/train': 1.28286612033844} -08/30/2021 16:52:35 - INFO - __main__ - Step 20374: {'lr': 0.00048122695553057417, 'samples': 3911808, 'steps': 20373, 'loss/train': 0.4064999222755432} -08/30/2021 16:52:35 - INFO - __main__ - Step 20375: {'lr': 0.00048122493789977866, 'samples': 3912000, 'steps': 20374, 'loss/train': 0.8093968033790588} -08/30/2021 16:52:36 - INFO - __main__ - Step 20376: {'lr': 0.00048122292016479674, 'samples': 3912192, 'steps': 20375, 'loss/train': 1.5330499410629272} -08/30/2021 16:52:36 - INFO - __main__ - Step 20377: {'lr': 0.0004812209023256294, 'samples': 3912384, 'steps': 20376, 'loss/train': 1.7736256122589111} -08/30/2021 16:52:38 - INFO - __main__ - Step 20378: {'lr': 0.0004812188843822775, 'samples': 3912576, 'steps': 20377, 'loss/train': 1.1705150604248047} -08/30/2021 16:52:38 - INFO - __main__ - Step 20379: {'lr': 0.0004812168663347418, 'samples': 3912768, 'steps': 20378, 'loss/train': 1.4795498847961426} -08/30/2021 16:52:38 - INFO - __main__ - Step 20380: {'lr': 0.00048121484818302343, 'samples': 3912960, 'steps': 20379, 'loss/train': 1.5681957006454468} -08/30/2021 16:52:39 - INFO - __main__ - Step 20381: {'lr': 0.00048121282992712324, 'samples': 3913152, 'steps': 20380, 'loss/train': 1.891641616821289} -08/30/2021 16:52:39 - INFO - __main__ - Step 20382: {'lr': 0.00048121081156704207, 'samples': 3913344, 'steps': 20381, 'loss/train': 1.8444931507110596} -08/30/2021 16:52:39 - INFO - __main__ - Step 20383: {'lr': 0.00048120879310278094, 'samples': 3913536, 'steps': 20382, 'loss/train': 1.2242088317871094} -08/30/2021 16:52:41 - INFO - __main__ - Step 20384: {'lr': 0.00048120677453434066, 'samples': 3913728, 'steps': 20383, 'loss/train': 1.4907710552215576} -08/30/2021 16:52:42 - INFO - __main__ - Step 20385: {'lr': 0.00048120475586172217, 'samples': 3913920, 'steps': 20384, 'loss/train': 2.6739895343780518} -08/30/2021 16:52:42 - INFO - __main__ - Step 20386: {'lr': 0.00048120273708492637, 'samples': 3914112, 'steps': 20385, 'loss/train': 1.0332735776901245} -08/30/2021 16:52:43 - INFO - __main__ - Step 20387: {'lr': 0.0004812007182039542, 'samples': 3914304, 'steps': 20386, 'loss/train': 1.4726247787475586} -08/30/2021 16:52:43 - INFO - __main__ - Step 20388: {'lr': 0.00048119869921880656, 'samples': 3914496, 'steps': 20387, 'loss/train': 2.6740262508392334} -08/30/2021 16:52:44 - INFO - __main__ - Step 20389: {'lr': 0.00048119668012948434, 'samples': 3914688, 'steps': 20388, 'loss/train': 1.3015917539596558} -08/30/2021 16:52:45 - INFO - __main__ - Step 20390: {'lr': 0.0004811946609359885, 'samples': 3914880, 'steps': 20389, 'loss/train': 1.6949397325515747} -08/30/2021 16:52:45 - INFO - __main__ - Step 20391: {'lr': 0.00048119264163831987, 'samples': 3915072, 'steps': 20390, 'loss/train': 1.654359221458435} -08/30/2021 16:52:46 - INFO - __main__ - Step 20392: {'lr': 0.0004811906222364794, 'samples': 3915264, 'steps': 20391, 'loss/train': 2.69132924079895} -08/30/2021 16:52:46 - INFO - __main__ - Step 20393: {'lr': 0.00048118860273046804, 'samples': 3915456, 'steps': 20392, 'loss/train': 1.7485592365264893} -08/30/2021 16:52:47 - INFO - __main__ - Step 20394: {'lr': 0.00048118658312028663, 'samples': 3915648, 'steps': 20393, 'loss/train': 1.83722984790802} -08/30/2021 16:52:48 - INFO - __main__ - Step 20395: {'lr': 0.0004811845634059361, 'samples': 3915840, 'steps': 20394, 'loss/train': 1.4899861812591553} -08/30/2021 16:52:48 - INFO - __main__ - Step 20396: {'lr': 0.0004811825435874174, 'samples': 3916032, 'steps': 20395, 'loss/train': 1.6030021905899048} -08/30/2021 16:52:49 - INFO - __main__ - Step 20397: {'lr': 0.0004811805236647314, 'samples': 3916224, 'steps': 20396, 'loss/train': 1.620742917060852} -08/30/2021 16:52:49 - INFO - __main__ - Step 20398: {'lr': 0.0004811785036378791, 'samples': 3916416, 'steps': 20397, 'loss/train': 1.9796329736709595} -08/30/2021 16:52:50 - INFO - __main__ - Step 20399: {'lr': 0.0004811764835068613, 'samples': 3916608, 'steps': 20398, 'loss/train': 1.9112696647644043} -08/30/2021 16:52:51 - INFO - __main__ - Step 20400: {'lr': 0.0004811744632716789, 'samples': 3916800, 'steps': 20399, 'loss/train': 2.097015142440796} -08/30/2021 16:52:51 - INFO - __main__ - Step 20401: {'lr': 0.0004811724429323329, 'samples': 3916992, 'steps': 20400, 'loss/train': 1.3521363735198975} -08/30/2021 16:52:52 - INFO - __main__ - Step 20402: {'lr': 0.0004811704224888241, 'samples': 3917184, 'steps': 20401, 'loss/train': 0.9783707857131958} -08/30/2021 16:52:52 - INFO - __main__ - Step 20403: {'lr': 0.0004811684019411535, 'samples': 3917376, 'steps': 20402, 'loss/train': 1.3182331323623657} -08/30/2021 16:52:54 - INFO - __main__ - Step 20404: {'lr': 0.000481166381289322, 'samples': 3917568, 'steps': 20403, 'loss/train': 1.7120299339294434} -08/30/2021 16:52:54 - INFO - __main__ - Step 20405: {'lr': 0.0004811643605333305, 'samples': 3917760, 'steps': 20404, 'loss/train': 1.4472341537475586} -08/30/2021 16:52:55 - INFO - __main__ - Step 20406: {'lr': 0.0004811623396731799, 'samples': 3917952, 'steps': 20405, 'loss/train': 1.9274582862854004} -08/30/2021 16:52:55 - INFO - __main__ - Step 20407: {'lr': 0.0004811603187088711, 'samples': 3918144, 'steps': 20406, 'loss/train': 2.011478900909424} -08/30/2021 16:52:55 - INFO - __main__ - Step 20408: {'lr': 0.00048115829764040503, 'samples': 3918336, 'steps': 20407, 'loss/train': 1.7389706373214722} -08/30/2021 16:52:56 - INFO - __main__ - Step 20409: {'lr': 0.0004811562764677826, 'samples': 3918528, 'steps': 20408, 'loss/train': 1.454147219657898} -08/30/2021 16:52:57 - INFO - __main__ - Step 20410: {'lr': 0.00048115425519100474, 'samples': 3918720, 'steps': 20409, 'loss/train': 0.04675471782684326} -08/30/2021 16:52:58 - INFO - __main__ - Step 20411: {'lr': 0.0004811522338100723, 'samples': 3918912, 'steps': 20410, 'loss/train': 1.6382688283920288} -08/30/2021 16:52:58 - INFO - __main__ - Step 20412: {'lr': 0.0004811502123249862, 'samples': 3919104, 'steps': 20411, 'loss/train': 0.9834139347076416} -08/30/2021 16:52:58 - INFO - __main__ - Step 20413: {'lr': 0.0004811481907357475, 'samples': 3919296, 'steps': 20412, 'loss/train': 1.166786789894104} -08/30/2021 16:52:59 - INFO - __main__ - Step 20414: {'lr': 0.000481146169042357, 'samples': 3919488, 'steps': 20413, 'loss/train': 1.9236106872558594} -08/30/2021 16:53:00 - INFO - __main__ - Step 20415: {'lr': 0.0004811441472448155, 'samples': 3919680, 'steps': 20414, 'loss/train': 1.2484660148620605} -08/30/2021 16:53:01 - INFO - __main__ - Step 20416: {'lr': 0.000481142125343124, 'samples': 3919872, 'steps': 20415, 'loss/train': 0.8506363034248352} -08/30/2021 16:53:01 - INFO - __main__ - Step 20417: {'lr': 0.0004811401033372835, 'samples': 3920064, 'steps': 20416, 'loss/train': 1.2502920627593994} -08/30/2021 16:53:01 - INFO - __main__ - Step 20418: {'lr': 0.0004811380812272948, 'samples': 3920256, 'steps': 20417, 'loss/train': 1.8344799280166626} -08/30/2021 16:53:02 - INFO - __main__ - Step 20419: {'lr': 0.0004811360590131589, 'samples': 3920448, 'steps': 20418, 'loss/train': 1.6395113468170166} -08/30/2021 16:53:02 - INFO - __main__ - Step 20420: {'lr': 0.00048113403669487655, 'samples': 3920640, 'steps': 20419, 'loss/train': 1.2615171670913696} -08/30/2021 16:53:04 - INFO - __main__ - Step 20421: {'lr': 0.0004811320142724489, 'samples': 3920832, 'steps': 20420, 'loss/train': 1.563582181930542} -08/30/2021 16:53:04 - INFO - __main__ - Step 20422: {'lr': 0.0004811299917458766, 'samples': 3921024, 'steps': 20421, 'loss/train': 1.7724220752716064} -08/30/2021 16:53:04 - INFO - __main__ - Step 20423: {'lr': 0.00048112796911516076, 'samples': 3921216, 'steps': 20422, 'loss/train': 1.7514982223510742} -08/30/2021 16:53:05 - INFO - __main__ - Step 20424: {'lr': 0.00048112594638030225, 'samples': 3921408, 'steps': 20423, 'loss/train': 1.2668033838272095} -08/30/2021 16:53:05 - INFO - __main__ - Step 20425: {'lr': 0.00048112392354130194, 'samples': 3921600, 'steps': 20424, 'loss/train': 1.2459012269973755} -08/30/2021 16:53:07 - INFO - __main__ - Step 20426: {'lr': 0.00048112190059816076, 'samples': 3921792, 'steps': 20425, 'loss/train': 1.2621666193008423} -08/30/2021 16:53:07 - INFO - __main__ - Step 20427: {'lr': 0.0004811198775508796, 'samples': 3921984, 'steps': 20426, 'loss/train': 1.5181001424789429} -08/30/2021 16:53:07 - INFO - __main__ - Step 20428: {'lr': 0.0004811178543994593, 'samples': 3922176, 'steps': 20427, 'loss/train': 1.673447847366333} -08/30/2021 16:53:08 - INFO - __main__ - Step 20429: {'lr': 0.000481115831143901, 'samples': 3922368, 'steps': 20428, 'loss/train': 1.9533108472824097} -08/30/2021 16:53:08 - INFO - __main__ - Step 20430: {'lr': 0.00048111380778420544, 'samples': 3922560, 'steps': 20429, 'loss/train': 1.0703402757644653} -08/30/2021 16:53:10 - INFO - __main__ - Step 20431: {'lr': 0.0004811117843203735, 'samples': 3922752, 'steps': 20430, 'loss/train': 1.6772987842559814} -08/30/2021 16:53:10 - INFO - __main__ - Step 20432: {'lr': 0.00048110976075240624, 'samples': 3922944, 'steps': 20431, 'loss/train': 1.4068084955215454} -08/30/2021 16:53:11 - INFO - __main__ - Step 20433: {'lr': 0.00048110773708030444, 'samples': 3923136, 'steps': 20432, 'loss/train': 0.09284914284944534} -08/30/2021 16:53:11 - INFO - __main__ - Step 20434: {'lr': 0.00048110571330406903, 'samples': 3923328, 'steps': 20433, 'loss/train': 2.2277603149414062} -08/30/2021 16:53:11 - INFO - __main__ - Step 20435: {'lr': 0.0004811036894237011, 'samples': 3923520, 'steps': 20434, 'loss/train': 1.6527063846588135} -08/30/2021 16:53:13 - INFO - __main__ - Step 20436: {'lr': 0.00048110166543920125, 'samples': 3923712, 'steps': 20435, 'loss/train': 0.29340869188308716} -08/30/2021 16:53:14 - INFO - __main__ - Step 20437: {'lr': 0.0004810996413505706, 'samples': 3923904, 'steps': 20436, 'loss/train': 1.0672272443771362} -08/30/2021 16:53:14 - INFO - __main__ - Step 20438: {'lr': 0.0004810976171578101, 'samples': 3924096, 'steps': 20437, 'loss/train': 1.6259253025054932} -08/30/2021 16:53:15 - INFO - __main__ - Step 20439: {'lr': 0.00048109559286092047, 'samples': 3924288, 'steps': 20438, 'loss/train': 1.3832546472549438} -08/30/2021 16:53:15 - INFO - __main__ - Step 20440: {'lr': 0.0004810935684599028, 'samples': 3924480, 'steps': 20439, 'loss/train': 0.8807126879692078} -08/30/2021 16:53:16 - INFO - __main__ - Step 20441: {'lr': 0.00048109154395475787, 'samples': 3924672, 'steps': 20440, 'loss/train': 1.526767373085022} -08/30/2021 16:53:17 - INFO - __main__ - Step 20442: {'lr': 0.00048108951934548673, 'samples': 3924864, 'steps': 20441, 'loss/train': 1.0425728559494019} -08/30/2021 16:53:17 - INFO - __main__ - Step 20443: {'lr': 0.0004810874946320901, 'samples': 3925056, 'steps': 20442, 'loss/train': 1.772262692451477} -08/30/2021 16:53:18 - INFO - __main__ - Step 20444: {'lr': 0.00048108546981456916, 'samples': 3925248, 'steps': 20443, 'loss/train': 1.2528482675552368} -08/30/2021 16:53:18 - INFO - __main__ - Step 20445: {'lr': 0.0004810834448929246, 'samples': 3925440, 'steps': 20444, 'loss/train': 2.1821045875549316} -08/30/2021 16:53:18 - INFO - __main__ - Step 20446: {'lr': 0.0004810814198671574, 'samples': 3925632, 'steps': 20445, 'loss/train': 1.8502366542816162} -08/30/2021 16:53:20 - INFO - __main__ - Step 20447: {'lr': 0.00048107939473726846, 'samples': 3925824, 'steps': 20446, 'loss/train': 1.2826957702636719} -08/30/2021 16:53:20 - INFO - __main__ - Step 20448: {'lr': 0.0004810773695032588, 'samples': 3926016, 'steps': 20447, 'loss/train': 2.0178780555725098} -08/30/2021 16:53:21 - INFO - __main__ - Step 20449: {'lr': 0.00048107534416512915, 'samples': 3926208, 'steps': 20448, 'loss/train': 0.7107794880867004} -08/30/2021 16:53:21 - INFO - __main__ - Step 20450: {'lr': 0.00048107331872288055, 'samples': 3926400, 'steps': 20449, 'loss/train': 1.8956117630004883} -08/30/2021 16:53:21 - INFO - __main__ - Step 20451: {'lr': 0.0004810712931765139, 'samples': 3926592, 'steps': 20450, 'loss/train': 1.7767422199249268} -08/30/2021 16:53:23 - INFO - __main__ - Step 20452: {'lr': 0.00048106926752603007, 'samples': 3926784, 'steps': 20451, 'loss/train': 1.5847138166427612} -08/30/2021 16:53:23 - INFO - __main__ - Step 20453: {'lr': 0.00048106724177143, 'samples': 3926976, 'steps': 20452, 'loss/train': 1.5756040811538696} -08/30/2021 16:53:24 - INFO - __main__ - Step 20454: {'lr': 0.00048106521591271455, 'samples': 3927168, 'steps': 20453, 'loss/train': 1.307875633239746} -08/30/2021 16:53:24 - INFO - __main__ - Step 20455: {'lr': 0.00048106318994988476, 'samples': 3927360, 'steps': 20454, 'loss/train': 1.1496918201446533} -08/30/2021 16:53:24 - INFO - __main__ - Step 20456: {'lr': 0.0004810611638829414, 'samples': 3927552, 'steps': 20455, 'loss/train': 1.597902536392212} -08/30/2021 16:53:26 - INFO - __main__ - Step 20457: {'lr': 0.00048105913771188545, 'samples': 3927744, 'steps': 20456, 'loss/train': 1.5206817388534546} -08/30/2021 16:53:26 - INFO - __main__ - Step 20458: {'lr': 0.00048105711143671783, 'samples': 3927936, 'steps': 20457, 'loss/train': 1.676174283027649} -08/30/2021 16:53:27 - INFO - __main__ - Step 20459: {'lr': 0.0004810550850574394, 'samples': 3928128, 'steps': 20458, 'loss/train': 0.932281494140625} -08/30/2021 16:53:27 - INFO - __main__ - Step 20460: {'lr': 0.0004810530585740512, 'samples': 3928320, 'steps': 20459, 'loss/train': 1.3992466926574707} -08/30/2021 16:53:27 - INFO - __main__ - Step 20461: {'lr': 0.00048105103198655406, 'samples': 3928512, 'steps': 20460, 'loss/train': 1.2533982992172241} -08/30/2021 16:53:29 - INFO - __main__ - Step 20462: {'lr': 0.0004810490052949488, 'samples': 3928704, 'steps': 20461, 'loss/train': 1.4120899438858032} -08/30/2021 16:53:29 - INFO - __main__ - Step 20463: {'lr': 0.0004810469784992365, 'samples': 3928896, 'steps': 20462, 'loss/train': 1.0651419162750244} -08/30/2021 16:53:30 - INFO - __main__ - Step 20464: {'lr': 0.00048104495159941794, 'samples': 3929088, 'steps': 20463, 'loss/train': 1.827168583869934} -08/30/2021 16:53:30 - INFO - __main__ - Step 20465: {'lr': 0.00048104292459549413, 'samples': 3929280, 'steps': 20464, 'loss/train': 1.2470966577529907} -08/30/2021 16:53:30 - INFO - __main__ - Step 20466: {'lr': 0.0004810408974874659, 'samples': 3929472, 'steps': 20465, 'loss/train': 1.5338815450668335} -08/30/2021 16:53:32 - INFO - __main__ - Step 20467: {'lr': 0.0004810388702753342, 'samples': 3929664, 'steps': 20466, 'loss/train': 1.6177653074264526} -08/30/2021 16:53:32 - INFO - __main__ - Step 20468: {'lr': 0.0004810368429591, 'samples': 3929856, 'steps': 20467, 'loss/train': 1.5753872394561768} -08/30/2021 16:53:33 - INFO - __main__ - Step 20469: {'lr': 0.00048103481553876415, 'samples': 3930048, 'steps': 20468, 'loss/train': 1.6142983436584473} -08/30/2021 16:53:33 - INFO - __main__ - Step 20470: {'lr': 0.0004810327880143276, 'samples': 3930240, 'steps': 20469, 'loss/train': 1.7200350761413574} -08/30/2021 16:53:33 - INFO - __main__ - Step 20471: {'lr': 0.00048103076038579125, 'samples': 3930432, 'steps': 20470, 'loss/train': 1.4600830078125} -08/30/2021 16:53:35 - INFO - __main__ - Step 20472: {'lr': 0.00048102873265315596, 'samples': 3930624, 'steps': 20471, 'loss/train': 1.7758893966674805} -08/30/2021 16:53:36 - INFO - __main__ - Step 20473: {'lr': 0.0004810267048164227, 'samples': 3930816, 'steps': 20472, 'loss/train': 1.8201944828033447} -08/30/2021 16:53:36 - INFO - __main__ - Step 20474: {'lr': 0.0004810246768755924, 'samples': 3931008, 'steps': 20473, 'loss/train': 1.5521976947784424} -08/30/2021 16:53:37 - INFO - __main__ - Step 20475: {'lr': 0.0004810226488306659, 'samples': 3931200, 'steps': 20474, 'loss/train': 1.2664735317230225} -08/30/2021 16:53:37 - INFO - __main__ - Step 20476: {'lr': 0.00048102062068164413, 'samples': 3931392, 'steps': 20475, 'loss/train': 1.3742451667785645} -08/30/2021 16:53:38 - INFO - __main__ - Step 20477: {'lr': 0.0004810185924285281, 'samples': 3931584, 'steps': 20476, 'loss/train': 0.20455193519592285} -08/30/2021 16:53:39 - INFO - __main__ - Step 20478: {'lr': 0.00048101656407131864, 'samples': 3931776, 'steps': 20477, 'loss/train': 1.7805805206298828} -08/30/2021 16:53:39 - INFO - __main__ - Step 20479: {'lr': 0.00048101453561001667, 'samples': 3931968, 'steps': 20478, 'loss/train': 1.5799874067306519} -08/30/2021 16:53:40 - INFO - __main__ - Step 20480: {'lr': 0.00048101250704462315, 'samples': 3932160, 'steps': 20479, 'loss/train': 1.4885618686676025} -08/30/2021 16:53:40 - INFO - __main__ - Step 20481: {'lr': 0.0004810104783751389, 'samples': 3932352, 'steps': 20480, 'loss/train': 1.9872725009918213} -08/30/2021 16:53:40 - INFO - __main__ - Step 20482: {'lr': 0.00048100844960156496, 'samples': 3932544, 'steps': 20481, 'loss/train': 0.8941634893417358} -08/30/2021 16:53:42 - INFO - __main__ - Step 20483: {'lr': 0.0004810064207239021, 'samples': 3932736, 'steps': 20482, 'loss/train': 1.4970029592514038} -08/30/2021 16:53:42 - INFO - __main__ - Step 20484: {'lr': 0.0004810043917421514, 'samples': 3932928, 'steps': 20483, 'loss/train': 1.6084808111190796} -08/30/2021 16:53:43 - INFO - __main__ - Step 20485: {'lr': 0.0004810023626563136, 'samples': 3933120, 'steps': 20484, 'loss/train': 1.541935682296753} -08/30/2021 16:53:43 - INFO - __main__ - Step 20486: {'lr': 0.0004810003334663898, 'samples': 3933312, 'steps': 20485, 'loss/train': 1.511197566986084} -08/30/2021 16:53:43 - INFO - __main__ - Step 20487: {'lr': 0.0004809983041723807, 'samples': 3933504, 'steps': 20486, 'loss/train': 1.2819828987121582} -08/30/2021 16:53:46 - INFO - __main__ - Step 20488: {'lr': 0.00048099627477428744, 'samples': 3933696, 'steps': 20487, 'loss/train': 1.2189552783966064} -08/30/2021 16:53:47 - INFO - __main__ - Step 20489: {'lr': 0.0004809942452721107, 'samples': 3933888, 'steps': 20488, 'loss/train': 1.914501667022705} -08/30/2021 16:53:47 - INFO - __main__ - Step 20490: {'lr': 0.0004809922156658516, 'samples': 3934080, 'steps': 20489, 'loss/train': 1.2167168855667114} -08/30/2021 16:53:48 - INFO - __main__ - Step 20491: {'lr': 0.00048099018595551096, 'samples': 3934272, 'steps': 20490, 'loss/train': 1.6059019565582275} -08/30/2021 16:53:48 - INFO - __main__ - Step 20492: {'lr': 0.0004809881561410897, 'samples': 3934464, 'steps': 20491, 'loss/train': 1.2520502805709839} -08/30/2021 16:53:48 - INFO - __main__ - Step 20493: {'lr': 0.00048098612622258873, 'samples': 3934656, 'steps': 20492, 'loss/train': 5.677497863769531} -08/30/2021 16:53:49 - INFO - __main__ - Step 20494: {'lr': 0.00048098409620000906, 'samples': 3934848, 'steps': 20493, 'loss/train': 5.572636127471924} -08/30/2021 16:53:50 - INFO - __main__ - Step 20495: {'lr': 0.00048098206607335135, 'samples': 3935040, 'steps': 20494, 'loss/train': 5.476930141448975} -08/30/2021 16:53:51 - INFO - __main__ - Step 20496: {'lr': 0.00048098003584261684, 'samples': 3935232, 'steps': 20495, 'loss/train': 1.538805365562439} -08/30/2021 16:53:51 - INFO - __main__ - Step 20497: {'lr': 0.00048097800550780625, 'samples': 3935424, 'steps': 20496, 'loss/train': 0.8303343057632446} -08/30/2021 16:53:52 - INFO - __main__ - Step 20498: {'lr': 0.0004809759750689205, 'samples': 3935616, 'steps': 20497, 'loss/train': 1.6164000034332275} -08/30/2021 16:53:52 - INFO - __main__ - Step 20499: {'lr': 0.00048097394452596053, 'samples': 3935808, 'steps': 20498, 'loss/train': 1.4405229091644287} -08/30/2021 16:53:52 - INFO - __main__ - Step 20500: {'lr': 0.0004809719138789273, 'samples': 3936000, 'steps': 20499, 'loss/train': 1.1235699653625488} -08/30/2021 16:53:54 - INFO - __main__ - Step 20501: {'lr': 0.0004809698831278217, 'samples': 3936192, 'steps': 20500, 'loss/train': 1.742831826210022} -08/30/2021 16:53:54 - INFO - __main__ - Step 20502: {'lr': 0.0004809678522726446, 'samples': 3936384, 'steps': 20501, 'loss/train': 1.0082358121871948} -08/30/2021 16:53:55 - INFO - __main__ - Step 20503: {'lr': 0.000480965821313397, 'samples': 3936576, 'steps': 20502, 'loss/train': 1.5180387496948242} -08/30/2021 16:53:55 - INFO - __main__ - Step 20504: {'lr': 0.0004809637902500797, 'samples': 3936768, 'steps': 20503, 'loss/train': 1.0592870712280273} -08/30/2021 16:53:55 - INFO - __main__ - Step 20505: {'lr': 0.00048096175908269375, 'samples': 3936960, 'steps': 20504, 'loss/train': 1.5597378015518188} -08/30/2021 16:53:57 - INFO - __main__ - Step 20506: {'lr': 0.00048095972781124, 'samples': 3937152, 'steps': 20505, 'loss/train': 1.4473786354064941} -08/30/2021 16:53:58 - INFO - __main__ - Step 20507: {'lr': 0.00048095769643571927, 'samples': 3937344, 'steps': 20506, 'loss/train': 1.6616387367248535} -08/30/2021 16:53:58 - INFO - __main__ - Step 20508: {'lr': 0.0004809556649561326, 'samples': 3937536, 'steps': 20507, 'loss/train': 1.440677285194397} -08/30/2021 16:53:58 - INFO - __main__ - Step 20509: {'lr': 0.0004809536333724809, 'samples': 3937728, 'steps': 20508, 'loss/train': 1.7490971088409424} -08/30/2021 16:53:59 - INFO - __main__ - Step 20510: {'lr': 0.000480951601684765, 'samples': 3937920, 'steps': 20509, 'loss/train': 0.3238224983215332} -08/30/2021 16:54:00 - INFO - __main__ - Step 20511: {'lr': 0.00048094956989298593, 'samples': 3938112, 'steps': 20510, 'loss/train': 0.40685346722602844} -08/30/2021 16:54:00 - INFO - __main__ - Step 20512: {'lr': 0.0004809475379971445, 'samples': 3938304, 'steps': 20511, 'loss/train': 1.6993385553359985} -08/30/2021 16:54:01 - INFO - __main__ - Step 20513: {'lr': 0.00048094550599724176, 'samples': 3938496, 'steps': 20512, 'loss/train': 0.4886229634284973} -08/30/2021 16:54:01 - INFO - __main__ - Step 20514: {'lr': 0.0004809434738932785, 'samples': 3938688, 'steps': 20513, 'loss/train': 2.4234566688537598} -08/30/2021 16:54:01 - INFO - __main__ - Step 20515: {'lr': 0.0004809414416852557, 'samples': 3938880, 'steps': 20514, 'loss/train': 1.7882490158081055} -08/30/2021 16:54:03 - INFO - __main__ - Step 20516: {'lr': 0.00048093940937317414, 'samples': 3939072, 'steps': 20515, 'loss/train': 1.388883352279663} -08/30/2021 16:54:03 - INFO - __main__ - Step 20517: {'lr': 0.00048093737695703494, 'samples': 3939264, 'steps': 20516, 'loss/train': 1.4843791723251343} -08/30/2021 16:54:04 - INFO - __main__ - Step 20518: {'lr': 0.0004809353444368389, 'samples': 3939456, 'steps': 20517, 'loss/train': 1.5473222732543945} -08/30/2021 16:54:04 - INFO - __main__ - Step 20519: {'lr': 0.00048093331181258694, 'samples': 3939648, 'steps': 20518, 'loss/train': 1.5043143033981323} -08/30/2021 16:54:04 - INFO - __main__ - Step 20520: {'lr': 0.00048093127908428, 'samples': 3939840, 'steps': 20519, 'loss/train': 0.6837820410728455} -08/30/2021 16:54:06 - INFO - __main__ - Step 20521: {'lr': 0.00048092924625191903, 'samples': 3940032, 'steps': 20520, 'loss/train': 1.4310814142227173} -08/30/2021 16:54:06 - INFO - __main__ - Step 20522: {'lr': 0.0004809272133155048, 'samples': 3940224, 'steps': 20521, 'loss/train': 1.9825042486190796} -08/30/2021 16:54:07 - INFO - __main__ - Step 20523: {'lr': 0.00048092518027503844, 'samples': 3940416, 'steps': 20522, 'loss/train': 1.2254289388656616} -08/30/2021 16:54:07 - INFO - __main__ - Step 20524: {'lr': 0.0004809231471305208, 'samples': 3940608, 'steps': 20523, 'loss/train': 1.680452585220337} -08/30/2021 16:54:07 - INFO - __main__ - Step 20525: {'lr': 0.0004809211138819526, 'samples': 3940800, 'steps': 20524, 'loss/train': 1.5076162815093994} -08/30/2021 16:54:09 - INFO - __main__ - Step 20526: {'lr': 0.000480919080529335, 'samples': 3940992, 'steps': 20525, 'loss/train': 0.3464648127555847} -08/30/2021 16:54:09 - INFO - __main__ - Step 20527: {'lr': 0.0004809170470726688, 'samples': 3941184, 'steps': 20526, 'loss/train': 1.5762031078338623} -08/30/2021 16:54:10 - INFO - __main__ - Step 20528: {'lr': 0.00048091501351195495, 'samples': 3941376, 'steps': 20527, 'loss/train': 1.6600455045700073} -08/30/2021 16:54:10 - INFO - __main__ - Step 20529: {'lr': 0.00048091297984719433, 'samples': 3941568, 'steps': 20528, 'loss/train': 1.404067873954773} -08/30/2021 16:54:10 - INFO - __main__ - Step 20530: {'lr': 0.0004809109460783879, 'samples': 3941760, 'steps': 20529, 'loss/train': 0.9669828414916992} -08/30/2021 16:54:11 - INFO - __main__ - Step 20531: {'lr': 0.0004809089122055366, 'samples': 3941952, 'steps': 20530, 'loss/train': 1.045242190361023} -08/30/2021 16:54:12 - INFO - __main__ - Step 20532: {'lr': 0.00048090687822864125, 'samples': 3942144, 'steps': 20531, 'loss/train': 1.9114315509796143} -08/30/2021 16:54:13 - INFO - __main__ - Step 20533: {'lr': 0.00048090484414770284, 'samples': 3942336, 'steps': 20532, 'loss/train': 1.3316726684570312} -08/30/2021 16:54:13 - INFO - __main__ - Step 20534: {'lr': 0.00048090280996272234, 'samples': 3942528, 'steps': 20533, 'loss/train': 0.9302244782447815} -08/30/2021 16:54:13 - INFO - __main__ - Step 20535: {'lr': 0.0004809007756737005, 'samples': 3942720, 'steps': 20534, 'loss/train': 1.5411350727081299} -08/30/2021 16:54:14 - INFO - __main__ - Step 20536: {'lr': 0.0004808987412806384, 'samples': 3942912, 'steps': 20535, 'loss/train': 1.745179533958435} -08/30/2021 16:54:15 - INFO - __main__ - Step 20537: {'lr': 0.0004808967067835369, 'samples': 3943104, 'steps': 20536, 'loss/train': 1.4986993074417114} -08/30/2021 16:54:16 - INFO - __main__ - Step 20538: {'lr': 0.00048089467218239687, 'samples': 3943296, 'steps': 20537, 'loss/train': 1.336204171180725} -08/30/2021 16:54:16 - INFO - __main__ - Step 20539: {'lr': 0.00048089263747721925, 'samples': 3943488, 'steps': 20538, 'loss/train': 1.4198871850967407} -08/30/2021 16:54:17 - INFO - __main__ - Step 20540: {'lr': 0.000480890602668005, 'samples': 3943680, 'steps': 20539, 'loss/train': 1.5905554294586182} -08/30/2021 16:54:17 - INFO - __main__ - Step 20541: {'lr': 0.000480888567754755, 'samples': 3943872, 'steps': 20540, 'loss/train': 0.6319172382354736} -08/30/2021 16:54:19 - INFO - __main__ - Step 20542: {'lr': 0.0004808865327374701, 'samples': 3944064, 'steps': 20541, 'loss/train': 1.8303757905960083} -08/30/2021 16:54:19 - INFO - __main__ - Step 20543: {'lr': 0.0004808844976161514, 'samples': 3944256, 'steps': 20542, 'loss/train': 1.858598232269287} -08/30/2021 16:54:19 - INFO - __main__ - Step 20544: {'lr': 0.0004808824623907997, 'samples': 3944448, 'steps': 20543, 'loss/train': 1.625712275505066} -08/30/2021 16:54:20 - INFO - __main__ - Step 20545: {'lr': 0.0004808804270614159, 'samples': 3944640, 'steps': 20544, 'loss/train': 1.5935778617858887} -08/30/2021 16:54:20 - INFO - __main__ - Step 20546: {'lr': 0.0004808783916280008, 'samples': 3944832, 'steps': 20545, 'loss/train': 1.4860432147979736} -08/30/2021 16:54:22 - INFO - __main__ - Step 20547: {'lr': 0.0004808763560905557, 'samples': 3945024, 'steps': 20546, 'loss/train': 1.3092674016952515} -08/30/2021 16:54:22 - INFO - __main__ - Step 20548: {'lr': 0.0004808743204490811, 'samples': 3945216, 'steps': 20547, 'loss/train': 1.6856248378753662} -08/30/2021 16:54:23 - INFO - __main__ - Step 20549: {'lr': 0.00048087228470357823, 'samples': 3945408, 'steps': 20548, 'loss/train': 1.1017231941223145} -08/30/2021 16:54:23 - INFO - __main__ - Step 20550: {'lr': 0.00048087024885404777, 'samples': 3945600, 'steps': 20549, 'loss/train': 1.039155125617981} -08/30/2021 16:54:24 - INFO - __main__ - Step 20551: {'lr': 0.00048086821290049077, 'samples': 3945792, 'steps': 20550, 'loss/train': 1.5275973081588745} -08/30/2021 16:54:25 - INFO - __main__ - Step 20552: {'lr': 0.00048086617684290814, 'samples': 3945984, 'steps': 20551, 'loss/train': 1.4478583335876465} -08/30/2021 16:54:25 - INFO - __main__ - Step 20553: {'lr': 0.00048086414068130077, 'samples': 3946176, 'steps': 20552, 'loss/train': 1.6303349733352661} -08/30/2021 16:54:26 - INFO - __main__ - Step 20554: {'lr': 0.00048086210441566956, 'samples': 3946368, 'steps': 20553, 'loss/train': 1.3500038385391235} -08/30/2021 16:54:26 - INFO - __main__ - Step 20555: {'lr': 0.00048086006804601544, 'samples': 3946560, 'steps': 20554, 'loss/train': 1.5991129875183105} -08/30/2021 16:54:26 - INFO - __main__ - Step 20556: {'lr': 0.00048085803157233933, 'samples': 3946752, 'steps': 20555, 'loss/train': 1.458549976348877} -08/30/2021 16:54:28 - INFO - __main__ - Step 20557: {'lr': 0.00048085599499464216, 'samples': 3946944, 'steps': 20556, 'loss/train': 1.3403385877609253} -08/30/2021 16:54:28 - INFO - __main__ - Step 20558: {'lr': 0.0004808539583129249, 'samples': 3947136, 'steps': 20557, 'loss/train': 0.9676722288131714} -08/30/2021 16:54:29 - INFO - __main__ - Step 20559: {'lr': 0.0004808519215271884, 'samples': 3947328, 'steps': 20558, 'loss/train': 1.908630609512329} -08/30/2021 16:54:29 - INFO - __main__ - Step 20560: {'lr': 0.0004808498846374335, 'samples': 3947520, 'steps': 20559, 'loss/train': 1.5557866096496582} -08/30/2021 16:54:29 - INFO - __main__ - Step 20561: {'lr': 0.0004808478476436612, 'samples': 3947712, 'steps': 20560, 'loss/train': 1.6522068977355957} -08/30/2021 16:54:30 - INFO - __main__ - Step 20562: {'lr': 0.00048084581054587253, 'samples': 3947904, 'steps': 20561, 'loss/train': 1.812275767326355} -08/30/2021 16:54:31 - INFO - __main__ - Step 20563: {'lr': 0.0004808437733440682, 'samples': 3948096, 'steps': 20562, 'loss/train': 1.1599609851837158} -08/30/2021 16:54:32 - INFO - __main__ - Step 20564: {'lr': 0.0004808417360382493, 'samples': 3948288, 'steps': 20563, 'loss/train': 1.241487979888916} -08/30/2021 16:54:32 - INFO - __main__ - Step 20565: {'lr': 0.00048083969862841667, 'samples': 3948480, 'steps': 20564, 'loss/train': 1.663413405418396} -08/30/2021 16:54:32 - INFO - __main__ - Step 20566: {'lr': 0.00048083766111457115, 'samples': 3948672, 'steps': 20565, 'loss/train': 1.9653089046478271} -08/30/2021 16:54:33 - INFO - __main__ - Step 20567: {'lr': 0.0004808356234967138, 'samples': 3948864, 'steps': 20566, 'loss/train': 1.7561421394348145} -08/30/2021 16:54:34 - INFO - __main__ - Step 20568: {'lr': 0.00048083358577484547, 'samples': 3949056, 'steps': 20567, 'loss/train': 2.359469175338745} -08/30/2021 16:54:35 - INFO - __main__ - Step 20569: {'lr': 0.0004808315479489671, 'samples': 3949248, 'steps': 20568, 'loss/train': 1.3442726135253906} -08/30/2021 16:54:35 - INFO - __main__ - Step 20570: {'lr': 0.00048082951001907965, 'samples': 3949440, 'steps': 20569, 'loss/train': 1.7343682050704956} -08/30/2021 16:54:35 - INFO - __main__ - Step 20571: {'lr': 0.0004808274719851839, 'samples': 3949632, 'steps': 20570, 'loss/train': 1.5264581441879272} -08/30/2021 16:54:36 - INFO - __main__ - Step 20572: {'lr': 0.0004808254338472809, 'samples': 3949824, 'steps': 20571, 'loss/train': 1.246448278427124} -08/30/2021 16:54:36 - INFO - __main__ - Step 20573: {'lr': 0.00048082339560537145, 'samples': 3950016, 'steps': 20572, 'loss/train': 1.5132750272750854} -08/30/2021 16:54:38 - INFO - __main__ - Step 20574: {'lr': 0.00048082135725945665, 'samples': 3950208, 'steps': 20573, 'loss/train': 1.9364030361175537} -08/30/2021 16:54:38 - INFO - __main__ - Step 20575: {'lr': 0.0004808193188095372, 'samples': 3950400, 'steps': 20574, 'loss/train': 1.4878729581832886} -08/30/2021 16:54:38 - INFO - __main__ - Step 20576: {'lr': 0.0004808172802556142, 'samples': 3950592, 'steps': 20575, 'loss/train': 1.508954644203186} -08/30/2021 16:54:39 - INFO - __main__ - Step 20577: {'lr': 0.0004808152415976885, 'samples': 3950784, 'steps': 20576, 'loss/train': 1.4431802034378052} -08/30/2021 16:54:39 - INFO - __main__ - Step 20578: {'lr': 0.000480813202835761, 'samples': 3950976, 'steps': 20577, 'loss/train': 1.0431770086288452} -08/30/2021 16:54:41 - INFO - __main__ - Step 20579: {'lr': 0.0004808111639698326, 'samples': 3951168, 'steps': 20578, 'loss/train': 1.4277130365371704} -08/30/2021 16:54:41 - INFO - __main__ - Step 20580: {'lr': 0.0004808091249999043, 'samples': 3951360, 'steps': 20579, 'loss/train': 1.4637948274612427} -08/30/2021 16:54:41 - INFO - __main__ - Step 20581: {'lr': 0.0004808070859259769, 'samples': 3951552, 'steps': 20580, 'loss/train': 2.0352847576141357} -08/30/2021 16:54:42 - INFO - __main__ - Step 20582: {'lr': 0.0004808050467480515, 'samples': 3951744, 'steps': 20581, 'loss/train': 1.7960317134857178} -08/30/2021 16:54:42 - INFO - __main__ - Step 20583: {'lr': 0.0004808030074661288, 'samples': 3951936, 'steps': 20582, 'loss/train': 1.302974820137024} -08/30/2021 16:54:44 - INFO - __main__ - Step 20584: {'lr': 0.0004808009680802099, 'samples': 3952128, 'steps': 20583, 'loss/train': 1.623962640762329} -08/30/2021 16:54:44 - INFO - __main__ - Step 20585: {'lr': 0.00048079892859029564, 'samples': 3952320, 'steps': 20584, 'loss/train': 1.8166264295578003} -08/30/2021 16:54:45 - INFO - __main__ - Step 20586: {'lr': 0.00048079688899638684, 'samples': 3952512, 'steps': 20585, 'loss/train': 2.028949022293091} -08/30/2021 16:54:45 - INFO - __main__ - Step 20587: {'lr': 0.0004807948492984846, 'samples': 3952704, 'steps': 20586, 'loss/train': 2.6005401611328125} -08/30/2021 16:54:45 - INFO - __main__ - Step 20588: {'lr': 0.0004807928094965898, 'samples': 3952896, 'steps': 20587, 'loss/train': 1.4047460556030273} -08/30/2021 16:54:47 - INFO - __main__ - Step 20589: {'lr': 0.0004807907695907032, 'samples': 3953088, 'steps': 20588, 'loss/train': 1.6047488451004028} -08/30/2021 16:54:48 - INFO - __main__ - Step 20590: {'lr': 0.000480788729580826, 'samples': 3953280, 'steps': 20589, 'loss/train': 1.1475815773010254} -08/30/2021 16:54:48 - INFO - __main__ - Step 20591: {'lr': 0.00048078668946695887, 'samples': 3953472, 'steps': 20590, 'loss/train': 1.7670137882232666} -08/30/2021 16:54:49 - INFO - __main__ - Step 20592: {'lr': 0.0004807846492491028, 'samples': 3953664, 'steps': 20591, 'loss/train': 2.0738556385040283} -08/30/2021 16:54:49 - INFO - __main__ - Step 20593: {'lr': 0.0004807826089272588, 'samples': 3953856, 'steps': 20592, 'loss/train': 0.7206501960754395} -08/30/2021 16:54:50 - INFO - __main__ - Step 20594: {'lr': 0.0004807805685014277, 'samples': 3954048, 'steps': 20593, 'loss/train': 1.4145188331604004} -08/30/2021 16:54:51 - INFO - __main__ - Step 20595: {'lr': 0.00048077852797161034, 'samples': 3954240, 'steps': 20594, 'loss/train': 1.3185465335845947} -08/30/2021 16:54:51 - INFO - __main__ - Step 20596: {'lr': 0.0004807764873378079, 'samples': 3954432, 'steps': 20595, 'loss/train': 1.6892168521881104} -08/30/2021 16:54:52 - INFO - __main__ - Step 20597: {'lr': 0.000480774446600021, 'samples': 3954624, 'steps': 20596, 'loss/train': 0.9227716326713562} -08/30/2021 16:54:52 - INFO - __main__ - Step 20598: {'lr': 0.00048077240575825075, 'samples': 3954816, 'steps': 20597, 'loss/train': 1.5762578248977661} -08/30/2021 16:54:54 - INFO - __main__ - Step 20599: {'lr': 0.000480770364812498, 'samples': 3955008, 'steps': 20598, 'loss/train': 1.6765204668045044} -08/30/2021 16:54:55 - INFO - __main__ - Step 20600: {'lr': 0.0004807683237627637, 'samples': 3955200, 'steps': 20599, 'loss/train': 1.3946428298950195} -08/30/2021 16:54:55 - INFO - __main__ - Step 20601: {'lr': 0.0004807662826090488, 'samples': 3955392, 'steps': 20600, 'loss/train': 1.2109757661819458} -08/30/2021 16:54:55 - INFO - __main__ - Step 20602: {'lr': 0.00048076424135135406, 'samples': 3955584, 'steps': 20601, 'loss/train': 1.6038706302642822} -08/30/2021 16:54:56 - INFO - __main__ - Step 20603: {'lr': 0.00048076219998968055, 'samples': 3955776, 'steps': 20602, 'loss/train': 0.7600698471069336} -08/30/2021 16:54:56 - INFO - __main__ - Step 20604: {'lr': 0.0004807601585240292, 'samples': 3955968, 'steps': 20603, 'loss/train': 1.781967282295227} -08/30/2021 16:54:58 - INFO - __main__ - Step 20605: {'lr': 0.0004807581169544009, 'samples': 3956160, 'steps': 20604, 'loss/train': 0.2823835611343384} -08/30/2021 16:54:58 - INFO - __main__ - Step 20606: {'lr': 0.00048075607528079645, 'samples': 3956352, 'steps': 20605, 'loss/train': 1.9294631481170654} -08/30/2021 16:54:58 - INFO - __main__ - Step 20607: {'lr': 0.0004807540335032169, 'samples': 3956544, 'steps': 20606, 'loss/train': 1.2828264236450195} -08/30/2021 16:54:59 - INFO - __main__ - Step 20608: {'lr': 0.0004807519916216633, 'samples': 3956736, 'steps': 20607, 'loss/train': 0.6966751217842102} -08/30/2021 16:54:59 - INFO - __main__ - Step 20609: {'lr': 0.0004807499496361362, 'samples': 3956928, 'steps': 20608, 'loss/train': 1.4355417490005493} -08/30/2021 16:55:00 - INFO - __main__ - Step 20610: {'lr': 0.00048074790754663686, 'samples': 3957120, 'steps': 20609, 'loss/train': 1.3458967208862305} -08/30/2021 16:55:01 - INFO - __main__ - Step 20611: {'lr': 0.000480745865353166, 'samples': 3957312, 'steps': 20610, 'loss/train': 1.2405227422714233} -08/30/2021 16:55:01 - INFO - __main__ - Step 20612: {'lr': 0.0004807438230557247, 'samples': 3957504, 'steps': 20611, 'loss/train': 1.2547762393951416} -08/30/2021 16:55:02 - INFO - __main__ - Step 20613: {'lr': 0.00048074178065431373, 'samples': 3957696, 'steps': 20612, 'loss/train': 1.6068294048309326} -08/30/2021 16:55:02 - INFO - __main__ - Step 20614: {'lr': 0.0004807397381489341, 'samples': 3957888, 'steps': 20613, 'loss/train': 1.6361725330352783} -08/30/2021 16:55:04 - INFO - __main__ - Step 20615: {'lr': 0.00048073769553958666, 'samples': 3958080, 'steps': 20614, 'loss/train': 1.3007580041885376} -08/30/2021 16:55:04 - INFO - __main__ - Step 20616: {'lr': 0.00048073565282627246, 'samples': 3958272, 'steps': 20615, 'loss/train': 1.7681808471679688} -08/30/2021 16:55:05 - INFO - __main__ - Step 20617: {'lr': 0.0004807336100089923, 'samples': 3958464, 'steps': 20616, 'loss/train': 2.222637414932251} -08/30/2021 16:55:05 - INFO - __main__ - Step 20618: {'lr': 0.0004807315670877471, 'samples': 3958656, 'steps': 20617, 'loss/train': 1.2972687482833862} -08/30/2021 16:55:05 - INFO - __main__ - Step 20619: {'lr': 0.00048072952406253783, 'samples': 3958848, 'steps': 20618, 'loss/train': 1.7866398096084595} -08/30/2021 16:55:06 - INFO - __main__ - Step 20620: {'lr': 0.00048072748093336536, 'samples': 3959040, 'steps': 20619, 'loss/train': 1.496514081954956} -08/30/2021 16:55:07 - INFO - __main__ - Step 20621: {'lr': 0.00048072543770023076, 'samples': 3959232, 'steps': 20620, 'loss/train': 0.11282919347286224} -08/30/2021 16:55:08 - INFO - __main__ - Step 20622: {'lr': 0.0004807233943631347, 'samples': 3959424, 'steps': 20621, 'loss/train': 1.8915866613388062} -08/30/2021 16:55:08 - INFO - __main__ - Step 20623: {'lr': 0.0004807213509220784, 'samples': 3959616, 'steps': 20622, 'loss/train': 1.8186583518981934} -08/30/2021 16:55:09 - INFO - __main__ - Step 20624: {'lr': 0.0004807193073770625, 'samples': 3959808, 'steps': 20623, 'loss/train': 1.4623253345489502} -08/30/2021 16:55:09 - INFO - __main__ - Step 20625: {'lr': 0.0004807172637280881, 'samples': 3960000, 'steps': 20624, 'loss/train': 2.0191798210144043} -08/30/2021 16:55:09 - INFO - __main__ - Step 20626: {'lr': 0.000480715219975156, 'samples': 3960192, 'steps': 20625, 'loss/train': 1.9373518228530884} -08/30/2021 16:55:11 - INFO - __main__ - Step 20627: {'lr': 0.0004807131761182672, 'samples': 3960384, 'steps': 20626, 'loss/train': 0.041183751076459885} -08/30/2021 16:55:12 - INFO - __main__ - Step 20628: {'lr': 0.00048071113215742263, 'samples': 3960576, 'steps': 20627, 'loss/train': 1.5153496265411377} -08/30/2021 16:55:12 - INFO - __main__ - Step 20629: {'lr': 0.00048070908809262316, 'samples': 3960768, 'steps': 20628, 'loss/train': 1.4794275760650635} -08/30/2021 16:55:12 - INFO - __main__ - Step 20630: {'lr': 0.0004807070439238698, 'samples': 3960960, 'steps': 20629, 'loss/train': 1.4660319089889526} -08/30/2021 16:55:13 - INFO - __main__ - Step 20631: {'lr': 0.0004807049996511633, 'samples': 3961152, 'steps': 20630, 'loss/train': 1.8759181499481201} -08/30/2021 16:55:13 - INFO - __main__ - Step 20632: {'lr': 0.00048070295527450474, 'samples': 3961344, 'steps': 20631, 'loss/train': 0.585408091545105} -08/30/2021 16:55:14 - INFO - __main__ - Step 20633: {'lr': 0.000480700910793895, 'samples': 3961536, 'steps': 20632, 'loss/train': 1.9259815216064453} -08/30/2021 16:55:15 - INFO - __main__ - Step 20634: {'lr': 0.000480698866209335, 'samples': 3961728, 'steps': 20633, 'loss/train': 1.8975882530212402} -08/30/2021 16:55:15 - INFO - __main__ - Step 20635: {'lr': 0.0004806968215208256, 'samples': 3961920, 'steps': 20634, 'loss/train': 1.6896079778671265} -08/30/2021 16:55:16 - INFO - __main__ - Step 20636: {'lr': 0.0004806947767283678, 'samples': 3962112, 'steps': 20635, 'loss/train': 1.4961246252059937} -08/30/2021 16:55:16 - INFO - __main__ - Step 20637: {'lr': 0.0004806927318319625, 'samples': 3962304, 'steps': 20636, 'loss/train': 1.7835643291473389} -08/30/2021 16:55:18 - INFO - __main__ - Step 20638: {'lr': 0.0004806906868316106, 'samples': 3962496, 'steps': 20637, 'loss/train': 1.540489673614502} -08/30/2021 16:55:18 - INFO - __main__ - Step 20639: {'lr': 0.000480688641727313, 'samples': 3962688, 'steps': 20638, 'loss/train': 1.471384048461914} -08/30/2021 16:55:19 - INFO - __main__ - Step 20640: {'lr': 0.00048068659651907076, 'samples': 3962880, 'steps': 20639, 'loss/train': 2.1339805126190186} -08/30/2021 16:55:19 - INFO - __main__ - Step 20641: {'lr': 0.0004806845512068846, 'samples': 3963072, 'steps': 20640, 'loss/train': 1.4799166917800903} -08/30/2021 16:55:19 - INFO - __main__ - Step 20642: {'lr': 0.00048068250579075554, 'samples': 3963264, 'steps': 20641, 'loss/train': 1.211970329284668} -08/30/2021 16:55:21 - INFO - __main__ - Step 20643: {'lr': 0.00048068046027068456, 'samples': 3963456, 'steps': 20642, 'loss/train': 1.1890201568603516} -08/30/2021 16:55:22 - INFO - __main__ - Step 20644: {'lr': 0.0004806784146466726, 'samples': 3963648, 'steps': 20643, 'loss/train': 1.6303956508636475} -08/30/2021 16:55:22 - INFO - __main__ - Step 20645: {'lr': 0.00048067636891872036, 'samples': 3963840, 'steps': 20644, 'loss/train': 2.086669921875} -08/30/2021 16:55:22 - INFO - __main__ - Step 20646: {'lr': 0.00048067432308682894, 'samples': 3964032, 'steps': 20645, 'loss/train': 1.1525413990020752} -08/30/2021 16:55:23 - INFO - __main__ - Step 20647: {'lr': 0.0004806722771509993, 'samples': 3964224, 'steps': 20646, 'loss/train': 1.4894037246704102} -08/30/2021 16:55:24 - INFO - __main__ - Step 20648: {'lr': 0.0004806702311112322, 'samples': 3964416, 'steps': 20647, 'loss/train': 1.3572239875793457} -08/30/2021 16:55:25 - INFO - __main__ - Step 20649: {'lr': 0.0004806681849675287, 'samples': 3964608, 'steps': 20648, 'loss/train': 1.565950632095337} -08/30/2021 16:55:25 - INFO - __main__ - Step 20650: {'lr': 0.00048066613871988967, 'samples': 3964800, 'steps': 20649, 'loss/train': 1.4098584651947021} -08/30/2021 16:55:25 - INFO - __main__ - Step 20651: {'lr': 0.00048066409236831607, 'samples': 3964992, 'steps': 20650, 'loss/train': 1.4266493320465088} -08/30/2021 16:55:26 - INFO - __main__ - Step 20652: {'lr': 0.0004806620459128087, 'samples': 3965184, 'steps': 20651, 'loss/train': 1.2918858528137207} -08/30/2021 16:55:26 - INFO - __main__ - Step 20653: {'lr': 0.0004806599993533687, 'samples': 3965376, 'steps': 20652, 'loss/train': 1.5336929559707642} -08/30/2021 16:55:28 - INFO - __main__ - Step 20654: {'lr': 0.00048065795268999677, 'samples': 3965568, 'steps': 20653, 'loss/train': 1.3345450162887573} -08/30/2021 16:55:28 - INFO - __main__ - Step 20655: {'lr': 0.00048065590592269393, 'samples': 3965760, 'steps': 20654, 'loss/train': 2.247145652770996} -08/30/2021 16:55:28 - INFO - __main__ - Step 20656: {'lr': 0.00048065385905146114, 'samples': 3965952, 'steps': 20655, 'loss/train': 1.7187037467956543} -08/30/2021 16:55:29 - INFO - __main__ - Step 20657: {'lr': 0.0004806518120762993, 'samples': 3966144, 'steps': 20656, 'loss/train': 1.3709335327148438} -08/30/2021 16:55:29 - INFO - __main__ - Step 20658: {'lr': 0.00048064976499720923, 'samples': 3966336, 'steps': 20657, 'loss/train': 2.0189366340637207} -08/30/2021 16:55:31 - INFO - __main__ - Step 20659: {'lr': 0.000480647717814192, 'samples': 3966528, 'steps': 20658, 'loss/train': 1.8227946758270264} -08/30/2021 16:55:31 - INFO - __main__ - Step 20660: {'lr': 0.0004806456705272484, 'samples': 3966720, 'steps': 20659, 'loss/train': 1.3422613143920898} -08/30/2021 16:55:31 - INFO - __main__ - Step 20661: {'lr': 0.0004806436231363795, 'samples': 3966912, 'steps': 20660, 'loss/train': 1.457248568534851} -08/30/2021 16:55:32 - INFO - __main__ - Step 20662: {'lr': 0.00048064157564158607, 'samples': 3967104, 'steps': 20661, 'loss/train': 1.3451411724090576} -08/30/2021 16:55:32 - INFO - __main__ - Step 20663: {'lr': 0.00048063952804286913, 'samples': 3967296, 'steps': 20662, 'loss/train': 2.052534341812134} -08/30/2021 16:55:34 - INFO - __main__ - Step 20664: {'lr': 0.0004806374803402296, 'samples': 3967488, 'steps': 20663, 'loss/train': 0.9287270307540894} -08/30/2021 16:55:35 - INFO - __main__ - Step 20665: {'lr': 0.00048063543253366837, 'samples': 3967680, 'steps': 20664, 'loss/train': 1.0546422004699707} -08/30/2021 16:55:35 - INFO - __main__ - Step 20666: {'lr': 0.0004806333846231864, 'samples': 3967872, 'steps': 20665, 'loss/train': 0.13127905130386353} -08/30/2021 16:55:35 - INFO - __main__ - Step 20667: {'lr': 0.00048063133660878455, 'samples': 3968064, 'steps': 20666, 'loss/train': 1.5059527158737183} -08/30/2021 16:55:36 - INFO - __main__ - Step 20668: {'lr': 0.00048062928849046377, 'samples': 3968256, 'steps': 20667, 'loss/train': 1.7320287227630615} -08/30/2021 16:55:36 - INFO - __main__ - Step 20669: {'lr': 0.00048062724026822504, 'samples': 3968448, 'steps': 20668, 'loss/train': 0.11046398431062698} -08/30/2021 16:55:38 - INFO - __main__ - Step 20670: {'lr': 0.00048062519194206916, 'samples': 3968640, 'steps': 20669, 'loss/train': 0.32149767875671387} -08/30/2021 16:55:38 - INFO - __main__ - Step 20671: {'lr': 0.0004806231435119972, 'samples': 3968832, 'steps': 20670, 'loss/train': 1.7202013731002808} -08/30/2021 16:55:38 - INFO - __main__ - Step 20672: {'lr': 0.00048062109497800997, 'samples': 3969024, 'steps': 20671, 'loss/train': 1.3532297611236572} -08/30/2021 16:55:39 - INFO - __main__ - Step 20673: {'lr': 0.00048061904634010845, 'samples': 3969216, 'steps': 20672, 'loss/train': 1.7341771125793457} -08/30/2021 16:55:39 - INFO - __main__ - Step 20674: {'lr': 0.0004806169975982935, 'samples': 3969408, 'steps': 20673, 'loss/train': 1.6083941459655762} -08/30/2021 16:55:41 - INFO - __main__ - Step 20675: {'lr': 0.0004806149487525662, 'samples': 3969600, 'steps': 20674, 'loss/train': 1.7800225019454956} -08/30/2021 16:55:41 - INFO - __main__ - Step 20676: {'lr': 0.0004806128998029272, 'samples': 3969792, 'steps': 20675, 'loss/train': 2.0995993614196777} -08/30/2021 16:55:41 - INFO - __main__ - Step 20677: {'lr': 0.0004806108507493777, 'samples': 3969984, 'steps': 20676, 'loss/train': 1.972775936126709} -08/30/2021 16:55:42 - INFO - __main__ - Step 20678: {'lr': 0.0004806088015919185, 'samples': 3970176, 'steps': 20677, 'loss/train': 5.629034996032715} -08/30/2021 16:55:42 - INFO - __main__ - Step 20679: {'lr': 0.0004806067523305505, 'samples': 3970368, 'steps': 20678, 'loss/train': 2.0154056549072266} -08/30/2021 16:55:43 - INFO - __main__ - Step 20680: {'lr': 0.0004806047029652747, 'samples': 3970560, 'steps': 20679, 'loss/train': 1.756956696510315} -08/30/2021 16:55:44 - INFO - __main__ - Step 20681: {'lr': 0.00048060265349609193, 'samples': 3970752, 'steps': 20680, 'loss/train': 1.3318066596984863} -08/30/2021 16:55:44 - INFO - __main__ - Step 20682: {'lr': 0.0004806006039230032, 'samples': 3970944, 'steps': 20681, 'loss/train': 1.3747334480285645} -08/30/2021 16:55:45 - INFO - __main__ - Step 20683: {'lr': 0.0004805985542460094, 'samples': 3971136, 'steps': 20682, 'loss/train': 1.322189450263977} -08/30/2021 16:55:45 - INFO - __main__ - Step 20684: {'lr': 0.00048059650446511136, 'samples': 3971328, 'steps': 20683, 'loss/train': 0.8517647981643677} -08/30/2021 16:55:46 - INFO - __main__ - Step 20685: {'lr': 0.00048059445458031023, 'samples': 3971520, 'steps': 20684, 'loss/train': 1.3851511478424072} -08/30/2021 16:55:47 - INFO - __main__ - Step 20686: {'lr': 0.0004805924045916067, 'samples': 3971712, 'steps': 20685, 'loss/train': 1.5475938320159912} -08/30/2021 16:55:48 - INFO - __main__ - Step 20687: {'lr': 0.00048059035449900185, 'samples': 3971904, 'steps': 20686, 'loss/train': 1.7559659481048584} -08/30/2021 16:55:48 - INFO - __main__ - Step 20688: {'lr': 0.0004805883043024965, 'samples': 3972096, 'steps': 20687, 'loss/train': 0.40264657139778137} -08/30/2021 16:55:48 - INFO - __main__ - Step 20689: {'lr': 0.0004805862540020917, 'samples': 3972288, 'steps': 20688, 'loss/train': 0.4182220697402954} -08/30/2021 16:55:49 - INFO - __main__ - Step 20690: {'lr': 0.0004805842035977882, 'samples': 3972480, 'steps': 20689, 'loss/train': 1.4698597192764282} -08/30/2021 16:55:49 - INFO - __main__ - Step 20691: {'lr': 0.00048058215308958703, 'samples': 3972672, 'steps': 20690, 'loss/train': 1.8014353513717651} -08/30/2021 16:55:51 - INFO - __main__ - Step 20692: {'lr': 0.00048058010247748904, 'samples': 3972864, 'steps': 20691, 'loss/train': 0.4119693338871002} -08/30/2021 16:55:51 - INFO - __main__ - Step 20693: {'lr': 0.0004805780517614954, 'samples': 3973056, 'steps': 20692, 'loss/train': 1.5545519590377808} -08/30/2021 16:55:52 - INFO - __main__ - Step 20694: {'lr': 0.0004805760009416067, 'samples': 3973248, 'steps': 20693, 'loss/train': 2.980133056640625} -08/30/2021 16:55:52 - INFO - __main__ - Step 20695: {'lr': 0.000480573950017824, 'samples': 3973440, 'steps': 20694, 'loss/train': 0.15593315660953522} -08/30/2021 16:55:52 - INFO - __main__ - Step 20696: {'lr': 0.0004805718989901483, 'samples': 3973632, 'steps': 20695, 'loss/train': 1.651999592781067} -08/30/2021 16:55:54 - INFO - __main__ - Step 20697: {'lr': 0.00048056984785858046, 'samples': 3973824, 'steps': 20696, 'loss/train': 0.1327599734067917} -08/30/2021 16:55:55 - INFO - __main__ - Step 20698: {'lr': 0.0004805677966231214, 'samples': 3974016, 'steps': 20697, 'loss/train': 1.5303266048431396} -08/30/2021 16:55:55 - INFO - __main__ - Step 20699: {'lr': 0.00048056574528377205, 'samples': 3974208, 'steps': 20698, 'loss/train': 1.2969508171081543} -08/30/2021 16:55:55 - INFO - __main__ - Step 20700: {'lr': 0.00048056369384053335, 'samples': 3974400, 'steps': 20699, 'loss/train': 1.381152629852295} -08/30/2021 16:55:56 - INFO - __main__ - Step 20701: {'lr': 0.00048056164229340613, 'samples': 3974592, 'steps': 20700, 'loss/train': 1.2419464588165283} -08/30/2021 16:55:57 - INFO - __main__ - Step 20702: {'lr': 0.0004805595906423914, 'samples': 3974784, 'steps': 20701, 'loss/train': 1.3216350078582764} -08/30/2021 16:55:58 - INFO - __main__ - Step 20703: {'lr': 0.00048055753888749013, 'samples': 3974976, 'steps': 20702, 'loss/train': 2.056077480316162} -08/30/2021 16:55:58 - INFO - __main__ - Step 20704: {'lr': 0.0004805554870287032, 'samples': 3975168, 'steps': 20703, 'loss/train': 1.2361171245574951} -08/30/2021 16:55:58 - INFO - __main__ - Step 20705: {'lr': 0.0004805534350660315, 'samples': 3975360, 'steps': 20704, 'loss/train': 1.7923864126205444} -08/30/2021 16:55:59 - INFO - __main__ - Step 20706: {'lr': 0.000480551382999476, 'samples': 3975552, 'steps': 20705, 'loss/train': 1.4378912448883057} -08/30/2021 16:56:00 - INFO - __main__ - Step 20707: {'lr': 0.00048054933082903754, 'samples': 3975744, 'steps': 20706, 'loss/train': 1.7227957248687744} -08/30/2021 16:56:01 - INFO - __main__ - Step 20708: {'lr': 0.00048054727855471717, 'samples': 3975936, 'steps': 20707, 'loss/train': 1.7430933713912964} -08/30/2021 16:56:01 - INFO - __main__ - Step 20709: {'lr': 0.00048054522617651575, 'samples': 3976128, 'steps': 20708, 'loss/train': 1.4573649168014526} -08/30/2021 16:56:01 - INFO - __main__ - Step 20710: {'lr': 0.0004805431736944342, 'samples': 3976320, 'steps': 20709, 'loss/train': 1.2537758350372314} -08/30/2021 16:56:02 - INFO - __main__ - Step 20711: {'lr': 0.0004805411211084735, 'samples': 3976512, 'steps': 20710, 'loss/train': 0.9819672703742981} -08/30/2021 16:56:03 - INFO - __main__ - Step 20712: {'lr': 0.0004805390684186344, 'samples': 3976704, 'steps': 20711, 'loss/train': 2.3263676166534424} -08/30/2021 16:56:04 - INFO - __main__ - Step 20713: {'lr': 0.00048053701562491804, 'samples': 3976896, 'steps': 20712, 'loss/train': 1.2889982461929321} -08/30/2021 16:56:04 - INFO - __main__ - Step 20714: {'lr': 0.0004805349627273253, 'samples': 3977088, 'steps': 20713, 'loss/train': 1.423947811126709} -08/30/2021 16:56:05 - INFO - __main__ - Step 20715: {'lr': 0.00048053290972585697, 'samples': 3977280, 'steps': 20714, 'loss/train': 1.1521159410476685} -08/30/2021 16:56:05 - INFO - __main__ - Step 20716: {'lr': 0.0004805308566205141, 'samples': 3977472, 'steps': 20715, 'loss/train': 1.5645651817321777} -08/30/2021 16:56:05 - INFO - __main__ - Step 20717: {'lr': 0.00048052880341129764, 'samples': 3977664, 'steps': 20716, 'loss/train': 0.8094602823257446} -08/30/2021 16:56:07 - INFO - __main__ - Step 20718: {'lr': 0.00048052675009820837, 'samples': 3977856, 'steps': 20717, 'loss/train': 1.7630436420440674} -08/30/2021 16:56:07 - INFO - __main__ - Step 20719: {'lr': 0.0004805246966812474, 'samples': 3978048, 'steps': 20718, 'loss/train': 2.433021068572998} -08/30/2021 16:56:07 - INFO - __main__ - Step 20720: {'lr': 0.0004805226431604155, 'samples': 3978240, 'steps': 20719, 'loss/train': 1.4015146493911743} -08/30/2021 16:56:08 - INFO - __main__ - Step 20721: {'lr': 0.00048052058953571366, 'samples': 3978432, 'steps': 20720, 'loss/train': 1.4894248247146606} -08/30/2021 16:56:08 - INFO - __main__ - Step 20722: {'lr': 0.0004805185358071428, 'samples': 3978624, 'steps': 20721, 'loss/train': 1.6452594995498657} -08/30/2021 16:56:10 - INFO - __main__ - Step 20723: {'lr': 0.0004805164819747038, 'samples': 3978816, 'steps': 20722, 'loss/train': 1.3686636686325073} -08/30/2021 16:56:10 - INFO - __main__ - Step 20724: {'lr': 0.0004805144280383977, 'samples': 3979008, 'steps': 20723, 'loss/train': 1.8824739456176758} -08/30/2021 16:56:11 - INFO - __main__ - Step 20725: {'lr': 0.00048051237399822534, 'samples': 3979200, 'steps': 20724, 'loss/train': 1.6183282136917114} -08/30/2021 16:56:11 - INFO - __main__ - Step 20726: {'lr': 0.00048051031985418764, 'samples': 3979392, 'steps': 20725, 'loss/train': 1.4658023118972778} -08/30/2021 16:56:11 - INFO - __main__ - Step 20727: {'lr': 0.0004805082656062856, 'samples': 3979584, 'steps': 20726, 'loss/train': 1.5528312921524048} -08/30/2021 16:56:13 - INFO - __main__ - Step 20728: {'lr': 0.00048050621125451996, 'samples': 3979776, 'steps': 20727, 'loss/train': 1.1035397052764893} -08/30/2021 16:56:13 - INFO - __main__ - Step 20729: {'lr': 0.00048050415679889194, 'samples': 3979968, 'steps': 20728, 'loss/train': 2.0017354488372803} -08/30/2021 16:56:14 - INFO - __main__ - Step 20730: {'lr': 0.0004805021022394022, 'samples': 3980160, 'steps': 20729, 'loss/train': 1.5923737287521362} -08/30/2021 16:56:14 - INFO - __main__ - Step 20731: {'lr': 0.0004805000475760518, 'samples': 3980352, 'steps': 20730, 'loss/train': 1.7138861417770386} -08/30/2021 16:56:14 - INFO - __main__ - Step 20732: {'lr': 0.0004804979928088417, 'samples': 3980544, 'steps': 20731, 'loss/train': 1.8164052963256836} -08/30/2021 16:56:16 - INFO - __main__ - Step 20733: {'lr': 0.0004804959379377727, 'samples': 3980736, 'steps': 20732, 'loss/train': 1.570721983909607} -08/30/2021 16:56:16 - INFO - __main__ - Step 20734: {'lr': 0.00048049388296284576, 'samples': 3980928, 'steps': 20733, 'loss/train': 0.9652804136276245} -08/30/2021 16:56:17 - INFO - __main__ - Step 20735: {'lr': 0.00048049182788406186, 'samples': 3981120, 'steps': 20734, 'loss/train': 1.8427886962890625} -08/30/2021 16:56:17 - INFO - __main__ - Step 20736: {'lr': 0.0004804897727014219, 'samples': 3981312, 'steps': 20735, 'loss/train': 2.443028688430786} -08/30/2021 16:56:17 - INFO - __main__ - Step 20737: {'lr': 0.0004804877174149268, 'samples': 3981504, 'steps': 20736, 'loss/train': 0.9933156967163086} -08/30/2021 16:56:18 - INFO - __main__ - Step 20738: {'lr': 0.00048048566202457747, 'samples': 3981696, 'steps': 20737, 'loss/train': 1.6103301048278809} -08/30/2021 16:56:19 - INFO - __main__ - Step 20739: {'lr': 0.00048048360653037494, 'samples': 3981888, 'steps': 20738, 'loss/train': 1.3910224437713623} -08/30/2021 16:56:20 - INFO - __main__ - Step 20740: {'lr': 0.00048048155093231994, 'samples': 3982080, 'steps': 20739, 'loss/train': 1.2703614234924316} -08/30/2021 16:56:20 - INFO - __main__ - Step 20741: {'lr': 0.00048047949523041355, 'samples': 3982272, 'steps': 20740, 'loss/train': 0.5967580676078796} -08/30/2021 16:56:21 - INFO - __main__ - Step 20742: {'lr': 0.0004804774394246567, 'samples': 3982464, 'steps': 20741, 'loss/train': 1.376112461090088} -08/30/2021 16:56:21 - INFO - __main__ - Step 20743: {'lr': 0.0004804753835150503, 'samples': 3982656, 'steps': 20742, 'loss/train': 1.4000831842422485} -08/30/2021 16:56:23 - INFO - __main__ - Step 20744: {'lr': 0.0004804733275015951, 'samples': 3982848, 'steps': 20743, 'loss/train': 1.4413738250732422} -08/30/2021 16:56:24 - INFO - __main__ - Step 20745: {'lr': 0.0004804712713842923, 'samples': 3983040, 'steps': 20744, 'loss/train': 1.568382740020752} -08/30/2021 16:56:24 - INFO - __main__ - Step 20746: {'lr': 0.0004804692151631427, 'samples': 3983232, 'steps': 20745, 'loss/train': 1.5668437480926514} -08/30/2021 16:56:24 - INFO - __main__ - Step 20747: {'lr': 0.00048046715883814716, 'samples': 3983424, 'steps': 20746, 'loss/train': 1.9023722410202026} -08/30/2021 16:56:25 - INFO - __main__ - Step 20748: {'lr': 0.00048046510240930674, 'samples': 3983616, 'steps': 20747, 'loss/train': 0.3020634055137634} -08/30/2021 16:56:27 - INFO - __main__ - Step 20749: {'lr': 0.00048046304587662225, 'samples': 3983808, 'steps': 20748, 'loss/train': 1.6442160606384277} -08/30/2021 16:56:27 - INFO - __main__ - Step 20750: {'lr': 0.00048046098924009467, 'samples': 3984000, 'steps': 20749, 'loss/train': 1.6216952800750732} -08/30/2021 16:56:27 - INFO - __main__ - Step 20751: {'lr': 0.00048045893249972497, 'samples': 3984192, 'steps': 20750, 'loss/train': 1.441290259361267} -08/30/2021 16:56:28 - INFO - __main__ - Step 20752: {'lr': 0.000480456875655514, 'samples': 3984384, 'steps': 20751, 'loss/train': 1.5465011596679688} -08/30/2021 16:56:28 - INFO - __main__ - Step 20753: {'lr': 0.0004804548187074628, 'samples': 3984576, 'steps': 20752, 'loss/train': 1.6776716709136963} -08/30/2021 16:56:28 - INFO - __main__ - Step 20754: {'lr': 0.0004804527616555721, 'samples': 3984768, 'steps': 20753, 'loss/train': 1.7566523551940918} -08/30/2021 16:56:30 - INFO - __main__ - Step 20755: {'lr': 0.00048045070449984295, 'samples': 3984960, 'steps': 20754, 'loss/train': 1.4441533088684082} -08/30/2021 16:56:30 - INFO - __main__ - Step 20756: {'lr': 0.0004804486472402763, 'samples': 3985152, 'steps': 20755, 'loss/train': 1.2981563806533813} -08/30/2021 16:56:31 - INFO - __main__ - Step 20757: {'lr': 0.0004804465898768731, 'samples': 3985344, 'steps': 20756, 'loss/train': 2.227184772491455} -08/30/2021 16:56:31 - INFO - __main__ - Step 20758: {'lr': 0.00048044453240963413, 'samples': 3985536, 'steps': 20757, 'loss/train': 2.007504463195801} -08/30/2021 16:56:31 - INFO - __main__ - Step 20759: {'lr': 0.00048044247483856043, 'samples': 3985728, 'steps': 20758, 'loss/train': 2.0310137271881104} -08/30/2021 16:56:33 - INFO - __main__ - Step 20760: {'lr': 0.00048044041716365296, 'samples': 3985920, 'steps': 20759, 'loss/train': 0.8354974985122681} -08/30/2021 16:56:33 - INFO - __main__ - Step 20761: {'lr': 0.00048043835938491253, 'samples': 3986112, 'steps': 20760, 'loss/train': 1.1922798156738281} -08/30/2021 16:56:34 - INFO - __main__ - Step 20762: {'lr': 0.0004804363015023402, 'samples': 3986304, 'steps': 20761, 'loss/train': 1.7823498249053955} -08/30/2021 16:56:34 - INFO - __main__ - Step 20763: {'lr': 0.00048043424351593676, 'samples': 3986496, 'steps': 20762, 'loss/train': 2.0763256549835205} -08/30/2021 16:56:34 - INFO - __main__ - Step 20764: {'lr': 0.0004804321854257032, 'samples': 3986688, 'steps': 20763, 'loss/train': 1.223707914352417} -08/30/2021 16:56:36 - INFO - __main__ - Step 20765: {'lr': 0.0004804301272316405, 'samples': 3986880, 'steps': 20764, 'loss/train': 0.4089663326740265} -08/30/2021 16:56:36 - INFO - __main__ - Step 20766: {'lr': 0.0004804280689337496, 'samples': 3987072, 'steps': 20765, 'loss/train': 1.802085280418396} -08/30/2021 16:56:37 - INFO - __main__ - Step 20767: {'lr': 0.00048042601053203125, 'samples': 3987264, 'steps': 20766, 'loss/train': 1.5809887647628784} -08/30/2021 16:56:37 - INFO - __main__ - Step 20768: {'lr': 0.00048042395202648646, 'samples': 3987456, 'steps': 20767, 'loss/train': 1.6898623704910278} -08/30/2021 16:56:37 - INFO - __main__ - Step 20769: {'lr': 0.00048042189341711636, 'samples': 3987648, 'steps': 20768, 'loss/train': 1.701935052871704} -08/30/2021 16:56:38 - INFO - __main__ - Step 20770: {'lr': 0.0004804198347039216, 'samples': 3987840, 'steps': 20769, 'loss/train': 2.0882790088653564} -08/30/2021 16:56:39 - INFO - __main__ - Step 20771: {'lr': 0.0004804177758869032, 'samples': 3988032, 'steps': 20770, 'loss/train': 1.356032133102417} -08/30/2021 16:56:40 - INFO - __main__ - Step 20772: {'lr': 0.0004804157169660622, 'samples': 3988224, 'steps': 20771, 'loss/train': 2.3334457874298096} -08/30/2021 16:56:40 - INFO - __main__ - Step 20773: {'lr': 0.00048041365794139934, 'samples': 3988416, 'steps': 20772, 'loss/train': 0.2663647532463074} -08/30/2021 16:56:41 - INFO - __main__ - Step 20774: {'lr': 0.00048041159881291574, 'samples': 3988608, 'steps': 20773, 'loss/train': 1.5477395057678223} -08/30/2021 16:56:41 - INFO - __main__ - Step 20775: {'lr': 0.0004804095395806122, 'samples': 3988800, 'steps': 20774, 'loss/train': 1.612539529800415} -08/30/2021 16:56:43 - INFO - __main__ - Step 20776: {'lr': 0.00048040748024448954, 'samples': 3988992, 'steps': 20775, 'loss/train': 1.688582420349121} -08/30/2021 16:56:43 - INFO - __main__ - Step 20777: {'lr': 0.00048040542080454897, 'samples': 3989184, 'steps': 20776, 'loss/train': 1.3352688550949097} -08/30/2021 16:56:44 - INFO - __main__ - Step 20778: {'lr': 0.0004804033612607912, 'samples': 3989376, 'steps': 20777, 'loss/train': 1.4921340942382812} -08/30/2021 16:56:44 - INFO - __main__ - Step 20779: {'lr': 0.00048040130161321724, 'samples': 3989568, 'steps': 20778, 'loss/train': 1.7791802883148193} -08/30/2021 16:56:44 - INFO - __main__ - Step 20780: {'lr': 0.0004803992418618281, 'samples': 3989760, 'steps': 20779, 'loss/train': 1.817274808883667} -08/30/2021 16:56:46 - INFO - __main__ - Step 20781: {'lr': 0.00048039718200662454, 'samples': 3989952, 'steps': 20780, 'loss/train': 0.6666374206542969} -08/30/2021 16:56:47 - INFO - __main__ - Step 20782: {'lr': 0.0004803951220476076, 'samples': 3990144, 'steps': 20781, 'loss/train': 2.2849414348602295} -08/30/2021 16:56:47 - INFO - __main__ - Step 20783: {'lr': 0.00048039306198477817, 'samples': 3990336, 'steps': 20782, 'loss/train': 1.2788106203079224} -08/30/2021 16:56:47 - INFO - __main__ - Step 20784: {'lr': 0.0004803910018181371, 'samples': 3990528, 'steps': 20783, 'loss/train': 1.457331895828247} -08/30/2021 16:56:48 - INFO - __main__ - Step 20785: {'lr': 0.0004803889415476855, 'samples': 3990720, 'steps': 20784, 'loss/train': 1.5049031972885132} -08/30/2021 16:56:50 - INFO - __main__ - Step 20786: {'lr': 0.0004803868811734242, 'samples': 3990912, 'steps': 20785, 'loss/train': 0.9126980304718018} -08/30/2021 16:56:50 - INFO - __main__ - Step 20787: {'lr': 0.00048038482069535406, 'samples': 3991104, 'steps': 20786, 'loss/train': 0.9489515423774719} -08/30/2021 16:56:50 - INFO - __main__ - Step 20788: {'lr': 0.000480382760113476, 'samples': 3991296, 'steps': 20787, 'loss/train': 1.571537733078003} -08/30/2021 16:56:51 - INFO - __main__ - Step 20789: {'lr': 0.00048038069942779116, 'samples': 3991488, 'steps': 20788, 'loss/train': 1.521704912185669} -08/30/2021 16:56:51 - INFO - __main__ - Step 20790: {'lr': 0.00048037863863830034, 'samples': 3991680, 'steps': 20789, 'loss/train': 1.4000773429870605} -08/30/2021 16:56:51 - INFO - __main__ - Step 20791: {'lr': 0.0004803765777450044, 'samples': 3991872, 'steps': 20790, 'loss/train': 1.6413817405700684} -08/30/2021 16:56:53 - INFO - __main__ - Step 20792: {'lr': 0.00048037451674790433, 'samples': 3992064, 'steps': 20791, 'loss/train': 0.200750470161438} -08/30/2021 16:56:53 - INFO - __main__ - Step 20793: {'lr': 0.0004803724556470011, 'samples': 3992256, 'steps': 20792, 'loss/train': 1.843687653541565} -08/30/2021 16:56:54 - INFO - __main__ - Step 20794: {'lr': 0.0004803703944422956, 'samples': 3992448, 'steps': 20793, 'loss/train': 1.8204582929611206} -08/30/2021 16:56:54 - INFO - __main__ - Step 20795: {'lr': 0.0004803683331337887, 'samples': 3992640, 'steps': 20794, 'loss/train': 1.6987535953521729} -08/30/2021 16:56:54 - INFO - __main__ - Step 20796: {'lr': 0.0004803662717214814, 'samples': 3992832, 'steps': 20795, 'loss/train': 1.7447631359100342} -08/30/2021 16:56:56 - INFO - __main__ - Step 20797: {'lr': 0.00048036421020537464, 'samples': 3993024, 'steps': 20796, 'loss/train': 1.2406423091888428} -08/30/2021 16:56:56 - INFO - __main__ - Step 20798: {'lr': 0.0004803621485854693, 'samples': 3993216, 'steps': 20797, 'loss/train': 1.7606385946273804} -08/30/2021 16:56:57 - INFO - __main__ - Step 20799: {'lr': 0.00048036008686176636, 'samples': 3993408, 'steps': 20798, 'loss/train': 2.0389721393585205} -08/30/2021 16:56:57 - INFO - __main__ - Step 20800: {'lr': 0.0004803580250342666, 'samples': 3993600, 'steps': 20799, 'loss/train': 0.8765015006065369} -08/30/2021 16:56:57 - INFO - __main__ - Step 20801: {'lr': 0.00048035596310297125, 'samples': 3993792, 'steps': 20800, 'loss/train': 1.6353588104248047} -08/30/2021 16:56:58 - INFO - __main__ - Step 20802: {'lr': 0.0004803539010678809, 'samples': 3993984, 'steps': 20801, 'loss/train': 1.1891461610794067} -08/30/2021 16:57:00 - INFO - __main__ - Step 20803: {'lr': 0.00048035183892899676, 'samples': 3994176, 'steps': 20802, 'loss/train': 1.509429931640625} -08/30/2021 16:57:00 - INFO - __main__ - Step 20804: {'lr': 0.0004803497766863195, 'samples': 3994368, 'steps': 20803, 'loss/train': 1.8290326595306396} -08/30/2021 16:57:01 - INFO - __main__ - Step 20805: {'lr': 0.00048034771433985035, 'samples': 3994560, 'steps': 20804, 'loss/train': 1.8175963163375854} -08/30/2021 16:57:01 - INFO - __main__ - Step 20806: {'lr': 0.00048034565188959, 'samples': 3994752, 'steps': 20805, 'loss/train': 1.915069341659546} -08/30/2021 16:57:01 - INFO - __main__ - Step 20807: {'lr': 0.0004803435893355394, 'samples': 3994944, 'steps': 20806, 'loss/train': 1.5590801239013672} -08/30/2021 16:57:03 - INFO - __main__ - Step 20808: {'lr': 0.00048034152667769957, 'samples': 3995136, 'steps': 20807, 'loss/train': 1.4858994483947754} -08/30/2021 16:57:03 - INFO - __main__ - Step 20809: {'lr': 0.0004803394639160714, 'samples': 3995328, 'steps': 20808, 'loss/train': 1.0625766515731812} -08/30/2021 16:57:04 - INFO - __main__ - Step 20810: {'lr': 0.00048033740105065585, 'samples': 3995520, 'steps': 20809, 'loss/train': 0.7241296768188477} -08/30/2021 16:57:04 - INFO - __main__ - Step 20811: {'lr': 0.0004803353380814538, 'samples': 3995712, 'steps': 20810, 'loss/train': 1.686326503753662} -08/30/2021 16:57:04 - INFO - __main__ - Step 20812: {'lr': 0.00048033327500846625, 'samples': 3995904, 'steps': 20811, 'loss/train': 1.425820231437683} -08/30/2021 16:57:06 - INFO - __main__ - Step 20813: {'lr': 0.000480331211831694, 'samples': 3996096, 'steps': 20812, 'loss/train': 0.8603524565696716} -08/30/2021 16:57:06 - INFO - __main__ - Step 20814: {'lr': 0.00048032914855113807, 'samples': 3996288, 'steps': 20813, 'loss/train': 1.022192120552063} -08/30/2021 16:57:06 - INFO - __main__ - Step 20815: {'lr': 0.00048032708516679946, 'samples': 3996480, 'steps': 20814, 'loss/train': 0.7716886401176453} -08/30/2021 16:57:07 - INFO - __main__ - Step 20816: {'lr': 0.00048032502167867896, 'samples': 3996672, 'steps': 20815, 'loss/train': 1.5297855138778687} -08/30/2021 16:57:07 - INFO - __main__ - Step 20817: {'lr': 0.0004803229580867775, 'samples': 3996864, 'steps': 20816, 'loss/train': 1.4987337589263916} -08/30/2021 16:57:09 - INFO - __main__ - Step 20818: {'lr': 0.0004803208943910962, 'samples': 3997056, 'steps': 20817, 'loss/train': 1.2595634460449219} -08/30/2021 16:57:09 - INFO - __main__ - Step 20819: {'lr': 0.00048031883059163576, 'samples': 3997248, 'steps': 20818, 'loss/train': 1.42384934425354} -08/30/2021 16:57:09 - INFO - __main__ - Step 20820: {'lr': 0.00048031676668839723, 'samples': 3997440, 'steps': 20819, 'loss/train': 1.623425006866455} -08/30/2021 16:57:10 - INFO - __main__ - Step 20821: {'lr': 0.00048031470268138153, 'samples': 3997632, 'steps': 20820, 'loss/train': 1.529524564743042} -08/30/2021 16:57:10 - INFO - __main__ - Step 20822: {'lr': 0.00048031263857058957, 'samples': 3997824, 'steps': 20821, 'loss/train': 1.398085355758667} -08/30/2021 16:57:12 - INFO - __main__ - Step 20823: {'lr': 0.00048031057435602234, 'samples': 3998016, 'steps': 20822, 'loss/train': 0.6544572710990906} -08/30/2021 16:57:12 - INFO - __main__ - Step 20824: {'lr': 0.0004803085100376807, 'samples': 3998208, 'steps': 20823, 'loss/train': 1.5054800510406494} -08/30/2021 16:57:12 - INFO - __main__ - Step 20825: {'lr': 0.00048030644561556556, 'samples': 3998400, 'steps': 20824, 'loss/train': 2.384716749191284} -08/30/2021 16:57:13 - INFO - __main__ - Step 20826: {'lr': 0.0004803043810896779, 'samples': 3998592, 'steps': 20825, 'loss/train': 1.834130883216858} -08/30/2021 16:57:13 - INFO - __main__ - Step 20827: {'lr': 0.00048030231646001867, 'samples': 3998784, 'steps': 20826, 'loss/train': 1.5747114419937134} -08/30/2021 16:57:15 - INFO - __main__ - Step 20828: {'lr': 0.0004803002517265887, 'samples': 3998976, 'steps': 20827, 'loss/train': 1.1097772121429443} -08/30/2021 16:57:15 - INFO - __main__ - Step 20829: {'lr': 0.0004802981868893891, 'samples': 3999168, 'steps': 20828, 'loss/train': 1.3051564693450928} -08/30/2021 16:57:16 - INFO - __main__ - Step 20830: {'lr': 0.00048029612194842056, 'samples': 3999360, 'steps': 20829, 'loss/train': 1.3877121210098267} -08/30/2021 16:57:16 - INFO - __main__ - Step 20831: {'lr': 0.0004802940569036842, 'samples': 3999552, 'steps': 20830, 'loss/train': 1.4898688793182373} -08/30/2021 16:57:16 - INFO - __main__ - Step 20832: {'lr': 0.0004802919917551809, 'samples': 3999744, 'steps': 20831, 'loss/train': 1.796456217765808} -08/30/2021 16:57:18 - INFO - __main__ - Step 20833: {'lr': 0.00048028992650291156, 'samples': 3999936, 'steps': 20832, 'loss/train': 1.4047584533691406} -08/30/2021 16:57:18 - INFO - __main__ - Step 20834: {'lr': 0.00048028786114687715, 'samples': 4000128, 'steps': 20833, 'loss/train': 0.3299529552459717} -08/30/2021 16:57:18 - INFO - __main__ - Step 20835: {'lr': 0.0004802857956870786, 'samples': 4000320, 'steps': 20834, 'loss/train': 1.3085787296295166} -08/30/2021 16:57:19 - INFO - __main__ - Step 20836: {'lr': 0.00048028373012351684, 'samples': 4000512, 'steps': 20835, 'loss/train': 1.2915829420089722} -08/30/2021 16:57:19 - INFO - __main__ - Step 20837: {'lr': 0.00048028166445619275, 'samples': 4000704, 'steps': 20836, 'loss/train': 1.332929015159607} -08/30/2021 16:57:21 - INFO - __main__ - Step 20838: {'lr': 0.0004802795986851073, 'samples': 4000896, 'steps': 20837, 'loss/train': 1.5033856630325317} -08/30/2021 16:57:21 - INFO - __main__ - Step 20839: {'lr': 0.00048027753281026144, 'samples': 4001088, 'steps': 20838, 'loss/train': 1.496140956878662} -08/30/2021 16:57:21 - INFO - __main__ - Step 20840: {'lr': 0.000480275466831656, 'samples': 4001280, 'steps': 20839, 'loss/train': 1.7681258916854858} -08/30/2021 16:57:22 - INFO - __main__ - Step 20841: {'lr': 0.00048027340074929207, 'samples': 4001472, 'steps': 20840, 'loss/train': 1.8449194431304932} -08/30/2021 16:57:22 - INFO - __main__ - Step 20842: {'lr': 0.0004802713345631705, 'samples': 4001664, 'steps': 20841, 'loss/train': 1.9577341079711914} -08/30/2021 16:57:23 - INFO - __main__ - Step 20843: {'lr': 0.0004802692682732922, 'samples': 4001856, 'steps': 20842, 'loss/train': 1.7500014305114746} -08/30/2021 16:57:24 - INFO - __main__ - Step 20844: {'lr': 0.0004802672018796581, 'samples': 4002048, 'steps': 20843, 'loss/train': 0.7694911360740662} -08/30/2021 16:57:25 - INFO - __main__ - Step 20845: {'lr': 0.0004802651353822691, 'samples': 4002240, 'steps': 20844, 'loss/train': 1.3434566259384155} -08/30/2021 16:57:25 - INFO - __main__ - Step 20846: {'lr': 0.0004802630687811263, 'samples': 4002432, 'steps': 20845, 'loss/train': 0.157589390873909} -08/30/2021 16:57:25 - INFO - __main__ - Step 20847: {'lr': 0.00048026100207623047, 'samples': 4002624, 'steps': 20846, 'loss/train': 1.613234281539917} -08/30/2021 16:57:26 - INFO - __main__ - Step 20848: {'lr': 0.0004802589352675826, 'samples': 4002816, 'steps': 20847, 'loss/train': 5.843477725982666} -08/30/2021 16:57:27 - INFO - __main__ - Step 20849: {'lr': 0.0004802568683551836, 'samples': 4003008, 'steps': 20848, 'loss/train': 1.3360764980316162} -08/30/2021 16:57:28 - INFO - __main__ - Step 20850: {'lr': 0.0004802548013390343, 'samples': 4003200, 'steps': 20849, 'loss/train': 1.213433027267456} -08/30/2021 16:57:28 - INFO - __main__ - Step 20851: {'lr': 0.00048025273421913587, 'samples': 4003392, 'steps': 20850, 'loss/train': 1.7084523439407349} -08/30/2021 16:57:28 - INFO - __main__ - Step 20852: {'lr': 0.0004802506669954891, 'samples': 4003584, 'steps': 20851, 'loss/train': 1.7778393030166626} -08/30/2021 16:57:29 - INFO - __main__ - Step 20853: {'lr': 0.00048024859966809487, 'samples': 4003776, 'steps': 20852, 'loss/train': 2.043734550476074} -08/30/2021 16:57:30 - INFO - __main__ - Step 20854: {'lr': 0.00048024653223695425, 'samples': 4003968, 'steps': 20853, 'loss/train': 1.2937445640563965} -08/30/2021 16:57:31 - INFO - __main__ - Step 20855: {'lr': 0.00048024446470206806, 'samples': 4004160, 'steps': 20854, 'loss/train': 0.8848605155944824} -08/30/2021 16:57:31 - INFO - __main__ - Step 20856: {'lr': 0.0004802423970634373, 'samples': 4004352, 'steps': 20855, 'loss/train': 1.7068744897842407} -08/30/2021 16:57:31 - INFO - __main__ - Step 20857: {'lr': 0.00048024032932106277, 'samples': 4004544, 'steps': 20856, 'loss/train': 1.936099648475647} -08/30/2021 16:57:32 - INFO - __main__ - Step 20858: {'lr': 0.00048023826147494556, 'samples': 4004736, 'steps': 20857, 'loss/train': 1.530527949333191} -08/30/2021 16:57:32 - INFO - __main__ - Step 20859: {'lr': 0.0004802361935250865, 'samples': 4004928, 'steps': 20858, 'loss/train': 1.242943525314331} -08/30/2021 16:57:34 - INFO - __main__ - Step 20860: {'lr': 0.0004802341254714867, 'samples': 4005120, 'steps': 20859, 'loss/train': 1.5698579549789429} -08/30/2021 16:57:35 - INFO - __main__ - Step 20861: {'lr': 0.00048023205731414684, 'samples': 4005312, 'steps': 20860, 'loss/train': 1.8995860815048218} -08/30/2021 16:57:35 - INFO - __main__ - Step 20862: {'lr': 0.00048022998905306795, 'samples': 4005504, 'steps': 20861, 'loss/train': 0.5663987994194031} -08/30/2021 16:57:35 - INFO - __main__ - Step 20863: {'lr': 0.00048022792068825107, 'samples': 4005696, 'steps': 20862, 'loss/train': 1.5970838069915771} -08/30/2021 16:57:36 - INFO - __main__ - Step 20864: {'lr': 0.00048022585221969697, 'samples': 4005888, 'steps': 20863, 'loss/train': 0.8861684799194336} -08/30/2021 16:57:38 - INFO - __main__ - Step 20865: {'lr': 0.00048022378364740673, 'samples': 4006080, 'steps': 20864, 'loss/train': 1.7130883932113647} -08/30/2021 16:57:38 - INFO - __main__ - Step 20866: {'lr': 0.0004802217149713811, 'samples': 4006272, 'steps': 20865, 'loss/train': 1.4740095138549805} -08/30/2021 16:57:39 - INFO - __main__ - Step 20867: {'lr': 0.0004802196461916212, 'samples': 4006464, 'steps': 20866, 'loss/train': 1.6010992527008057} -08/30/2021 16:57:39 - INFO - __main__ - Step 20868: {'lr': 0.0004802175773081278, 'samples': 4006656, 'steps': 20867, 'loss/train': 1.6782881021499634} -08/30/2021 16:57:39 - INFO - __main__ - Step 20869: {'lr': 0.000480215508320902, 'samples': 4006848, 'steps': 20868, 'loss/train': 0.167189359664917} -08/30/2021 16:57:41 - INFO - __main__ - Step 20870: {'lr': 0.0004802134392299446, 'samples': 4007040, 'steps': 20869, 'loss/train': 1.6451122760772705} -08/30/2021 16:57:41 - INFO - __main__ - Step 20871: {'lr': 0.0004802113700352566, 'samples': 4007232, 'steps': 20870, 'loss/train': 1.909308910369873} -08/30/2021 16:57:42 - INFO - __main__ - Step 20872: {'lr': 0.00048020930073683886, 'samples': 4007424, 'steps': 20871, 'loss/train': 1.7468796968460083} -08/30/2021 16:57:42 - INFO - __main__ - Step 20873: {'lr': 0.0004802072313346924, 'samples': 4007616, 'steps': 20872, 'loss/train': 1.462784767150879} -08/30/2021 16:57:42 - INFO - __main__ - Step 20874: {'lr': 0.00048020516182881813, 'samples': 4007808, 'steps': 20873, 'loss/train': 1.947792410850525} -08/30/2021 16:57:44 - INFO - __main__ - Step 20875: {'lr': 0.00048020309221921686, 'samples': 4008000, 'steps': 20874, 'loss/train': 1.4549416303634644} -08/30/2021 16:57:44 - INFO - __main__ - Step 20876: {'lr': 0.00048020102250588976, 'samples': 4008192, 'steps': 20875, 'loss/train': 1.3103128671646118} -08/30/2021 16:57:45 - INFO - __main__ - Step 20877: {'lr': 0.00048019895268883764, 'samples': 4008384, 'steps': 20876, 'loss/train': 1.1322263479232788} -08/30/2021 16:57:45 - INFO - __main__ - Step 20878: {'lr': 0.0004801968827680613, 'samples': 4008576, 'steps': 20877, 'loss/train': 1.3397971391677856} -08/30/2021 16:57:45 - INFO - __main__ - Step 20879: {'lr': 0.00048019481274356194, 'samples': 4008768, 'steps': 20878, 'loss/train': 1.1345170736312866} -08/30/2021 16:57:47 - INFO - __main__ - Step 20880: {'lr': 0.0004801927426153402, 'samples': 4008960, 'steps': 20879, 'loss/train': 1.5402135848999023} -08/30/2021 16:57:48 - INFO - __main__ - Step 20881: {'lr': 0.00048019067238339725, 'samples': 4009152, 'steps': 20880, 'loss/train': 1.3619599342346191} -08/30/2021 16:57:48 - INFO - __main__ - Step 20882: {'lr': 0.000480188602047734, 'samples': 4009344, 'steps': 20881, 'loss/train': 1.7267178297042847} -08/30/2021 16:57:49 - INFO - __main__ - Step 20883: {'lr': 0.0004801865316083512, 'samples': 4009536, 'steps': 20882, 'loss/train': 2.110841989517212} -08/30/2021 16:57:49 - INFO - __main__ - Step 20884: {'lr': 0.0004801844610652499, 'samples': 4009728, 'steps': 20883, 'loss/train': 1.598005771636963} -08/30/2021 16:57:49 - INFO - __main__ - Step 20885: {'lr': 0.0004801823904184311, 'samples': 4009920, 'steps': 20884, 'loss/train': 1.4082896709442139} -08/30/2021 16:57:51 - INFO - __main__ - Step 20886: {'lr': 0.00048018031966789564, 'samples': 4010112, 'steps': 20885, 'loss/train': 0.14600832760334015} -08/30/2021 16:57:52 - INFO - __main__ - Step 20887: {'lr': 0.0004801782488136445, 'samples': 4010304, 'steps': 20886, 'loss/train': 1.7309308052062988} -08/30/2021 16:57:52 - INFO - __main__ - Step 20888: {'lr': 0.00048017617785567855, 'samples': 4010496, 'steps': 20887, 'loss/train': 0.1437617540359497} -08/30/2021 16:57:52 - INFO - __main__ - Step 20889: {'lr': 0.00048017410679399876, 'samples': 4010688, 'steps': 20888, 'loss/train': 1.4162567853927612} -08/30/2021 16:57:53 - INFO - __main__ - Step 20890: {'lr': 0.00048017203562860614, 'samples': 4010880, 'steps': 20889, 'loss/train': 2.313275098800659} -08/30/2021 16:57:53 - INFO - __main__ - Step 20891: {'lr': 0.0004801699643595015, 'samples': 4011072, 'steps': 20890, 'loss/train': 1.5743414163589478} -08/30/2021 16:57:54 - INFO - __main__ - Step 20892: {'lr': 0.00048016789298668583, 'samples': 4011264, 'steps': 20891, 'loss/train': 0.7836162447929382} -08/30/2021 16:57:55 - INFO - __main__ - Step 20893: {'lr': 0.0004801658215101601, 'samples': 4011456, 'steps': 20892, 'loss/train': 1.8106706142425537} -08/30/2021 16:57:55 - INFO - __main__ - Step 20894: {'lr': 0.00048016374992992516, 'samples': 4011648, 'steps': 20893, 'loss/train': 1.6870431900024414} -08/30/2021 16:57:56 - INFO - __main__ - Step 20895: {'lr': 0.000480161678245982, 'samples': 4011840, 'steps': 20894, 'loss/train': 1.6460051536560059} -08/30/2021 16:57:57 - INFO - __main__ - Step 20896: {'lr': 0.0004801596064583315, 'samples': 4012032, 'steps': 20895, 'loss/train': 1.2648009061813354} -08/30/2021 16:57:58 - INFO - __main__ - Step 20897: {'lr': 0.00048015753456697466, 'samples': 4012224, 'steps': 20896, 'loss/train': 1.7518366575241089} -08/30/2021 16:57:58 - INFO - __main__ - Step 20898: {'lr': 0.00048015546257191243, 'samples': 4012416, 'steps': 20897, 'loss/train': 1.0268855094909668} -08/30/2021 16:57:58 - INFO - __main__ - Step 20899: {'lr': 0.00048015339047314566, 'samples': 4012608, 'steps': 20898, 'loss/train': 1.3595432043075562} -08/30/2021 16:57:59 - INFO - __main__ - Step 20900: {'lr': 0.00048015131827067534, 'samples': 4012800, 'steps': 20899, 'loss/train': 0.8023666739463806} -08/30/2021 16:57:59 - INFO - __main__ - Step 20901: {'lr': 0.0004801492459645024, 'samples': 4012992, 'steps': 20900, 'loss/train': 1.5363144874572754} -08/30/2021 16:58:00 - INFO - __main__ - Step 20902: {'lr': 0.0004801471735546277, 'samples': 4013184, 'steps': 20901, 'loss/train': 1.5872712135314941} -08/30/2021 16:58:01 - INFO - __main__ - Step 20903: {'lr': 0.0004801451010410522, 'samples': 4013376, 'steps': 20902, 'loss/train': 1.7590477466583252} -08/30/2021 16:58:01 - INFO - __main__ - Step 20904: {'lr': 0.000480143028423777, 'samples': 4013568, 'steps': 20903, 'loss/train': 1.8734040260314941} -08/30/2021 16:58:02 - INFO - __main__ - Step 20905: {'lr': 0.0004801409557028028, 'samples': 4013760, 'steps': 20904, 'loss/train': 1.6589394807815552} -08/30/2021 16:58:02 - INFO - __main__ - Step 20906: {'lr': 0.0004801388828781307, 'samples': 4013952, 'steps': 20905, 'loss/train': 1.5599116086959839} -08/30/2021 16:58:04 - INFO - __main__ - Step 20907: {'lr': 0.00048013680994976154, 'samples': 4014144, 'steps': 20906, 'loss/train': 1.3931597471237183} -08/30/2021 16:58:05 - INFO - __main__ - Step 20908: {'lr': 0.0004801347369176963, 'samples': 4014336, 'steps': 20907, 'loss/train': 1.6757256984710693} -08/30/2021 16:58:05 - INFO - __main__ - Step 20909: {'lr': 0.00048013266378193586, 'samples': 4014528, 'steps': 20908, 'loss/train': 1.1520507335662842} -08/30/2021 16:58:05 - INFO - __main__ - Step 20910: {'lr': 0.00048013059054248134, 'samples': 4014720, 'steps': 20909, 'loss/train': 1.6782448291778564} -08/30/2021 16:58:06 - INFO - __main__ - Step 20911: {'lr': 0.00048012851719933335, 'samples': 4014912, 'steps': 20910, 'loss/train': 1.9210513830184937} -08/30/2021 16:58:06 - INFO - __main__ - Step 20912: {'lr': 0.000480126443752493, 'samples': 4015104, 'steps': 20911, 'loss/train': 5.031146049499512} -08/30/2021 16:58:08 - INFO - __main__ - Step 20913: {'lr': 0.0004801243702019614, 'samples': 4015296, 'steps': 20912, 'loss/train': 1.5334185361862183} -08/30/2021 16:58:08 - INFO - __main__ - Step 20914: {'lr': 0.00048012229654773915, 'samples': 4015488, 'steps': 20913, 'loss/train': 1.430576205253601} -08/30/2021 16:58:08 - INFO - __main__ - Step 20915: {'lr': 0.0004801202227898274, 'samples': 4015680, 'steps': 20914, 'loss/train': 1.8230525255203247} -08/30/2021 16:58:09 - INFO - __main__ - Step 20916: {'lr': 0.00048011814892822704, 'samples': 4015872, 'steps': 20915, 'loss/train': 1.590773105621338} -08/30/2021 16:58:09 - INFO - __main__ - Step 20917: {'lr': 0.00048011607496293896, 'samples': 4016064, 'steps': 20916, 'loss/train': 1.8072232007980347} -08/30/2021 16:58:11 - INFO - __main__ - Step 20918: {'lr': 0.0004801140008939642, 'samples': 4016256, 'steps': 20917, 'loss/train': 1.6074912548065186} -08/30/2021 16:58:11 - INFO - __main__ - Step 20919: {'lr': 0.00048011192672130356, 'samples': 4016448, 'steps': 20918, 'loss/train': 1.6177542209625244} -08/30/2021 16:58:11 - INFO - __main__ - Step 20920: {'lr': 0.000480109852444958, 'samples': 4016640, 'steps': 20919, 'loss/train': 0.4326907992362976} -08/30/2021 16:58:12 - INFO - __main__ - Step 20921: {'lr': 0.0004801077780649286, 'samples': 4016832, 'steps': 20920, 'loss/train': 1.431039571762085} -08/30/2021 16:58:12 - INFO - __main__ - Step 20922: {'lr': 0.00048010570358121606, 'samples': 4017024, 'steps': 20921, 'loss/train': 1.421709418296814} -08/30/2021 16:58:14 - INFO - __main__ - Step 20923: {'lr': 0.0004801036289938215, 'samples': 4017216, 'steps': 20922, 'loss/train': 1.3588948249816895} -08/30/2021 16:58:14 - INFO - __main__ - Step 20924: {'lr': 0.0004801015543027458, 'samples': 4017408, 'steps': 20923, 'loss/train': 1.118821144104004} -08/30/2021 16:58:15 - INFO - __main__ - Step 20925: {'lr': 0.0004800994795079899, 'samples': 4017600, 'steps': 20924, 'loss/train': 1.0915248394012451} -08/30/2021 16:58:15 - INFO - __main__ - Step 20926: {'lr': 0.00048009740460955465, 'samples': 4017792, 'steps': 20925, 'loss/train': 1.7997756004333496} -08/30/2021 16:58:16 - INFO - __main__ - Step 20927: {'lr': 0.00048009532960744116, 'samples': 4017984, 'steps': 20926, 'loss/train': 1.7789839506149292} -08/30/2021 16:58:17 - INFO - __main__ - Step 20928: {'lr': 0.0004800932545016502, 'samples': 4018176, 'steps': 20927, 'loss/train': 2.1777122020721436} -08/30/2021 16:58:18 - INFO - __main__ - Step 20929: {'lr': 0.0004800911792921828, 'samples': 4018368, 'steps': 20928, 'loss/train': 0.8171807527542114} -08/30/2021 16:58:18 - INFO - __main__ - Step 20930: {'lr': 0.0004800891039790399, 'samples': 4018560, 'steps': 20929, 'loss/train': 2.5374791622161865} -08/30/2021 16:58:18 - INFO - __main__ - Step 20931: {'lr': 0.00048008702856222233, 'samples': 4018752, 'steps': 20930, 'loss/train': 0.07208096235990524} -08/30/2021 16:58:19 - INFO - __main__ - Step 20932: {'lr': 0.0004800849530417312, 'samples': 4018944, 'steps': 20931, 'loss/train': 0.8734824657440186} -08/30/2021 16:58:20 - INFO - __main__ - Step 20933: {'lr': 0.00048008287741756715, 'samples': 4019136, 'steps': 20932, 'loss/train': 1.5740123987197876} -08/30/2021 16:58:20 - INFO - __main__ - Step 20934: {'lr': 0.00048008080168973144, 'samples': 4019328, 'steps': 20933, 'loss/train': 1.2088955640792847} -08/30/2021 16:58:21 - INFO - __main__ - Step 20935: {'lr': 0.00048007872585822486, 'samples': 4019520, 'steps': 20934, 'loss/train': 2.1600000858306885} -08/30/2021 16:58:21 - INFO - __main__ - Step 20936: {'lr': 0.00048007664992304834, 'samples': 4019712, 'steps': 20935, 'loss/train': 1.962638020515442} -08/30/2021 16:58:22 - INFO - __main__ - Step 20937: {'lr': 0.0004800745738842029, 'samples': 4019904, 'steps': 20936, 'loss/train': 1.4366098642349243} -08/30/2021 16:58:23 - INFO - __main__ - Step 20938: {'lr': 0.0004800724977416894, 'samples': 4020096, 'steps': 20937, 'loss/train': 1.3570092916488647} -08/30/2021 16:58:23 - INFO - __main__ - Step 20939: {'lr': 0.00048007042149550866, 'samples': 4020288, 'steps': 20938, 'loss/train': 2.136103868484497} -08/30/2021 16:58:24 - INFO - __main__ - Step 20940: {'lr': 0.00048006834514566183, 'samples': 4020480, 'steps': 20939, 'loss/train': 1.2310088872909546} -08/30/2021 16:58:24 - INFO - __main__ - Step 20941: {'lr': 0.00048006626869214977, 'samples': 4020672, 'steps': 20940, 'loss/train': 1.283164620399475} -08/30/2021 16:58:24 - INFO - __main__ - Step 20942: {'lr': 0.00048006419213497334, 'samples': 4020864, 'steps': 20941, 'loss/train': 1.5024957656860352} -08/30/2021 16:58:25 - INFO - __main__ - Step 20943: {'lr': 0.0004800621154741335, 'samples': 4021056, 'steps': 20942, 'loss/train': 1.8647565841674805} -08/30/2021 16:58:27 - INFO - __main__ - Step 20944: {'lr': 0.00048006003870963135, 'samples': 4021248, 'steps': 20943, 'loss/train': 1.7144920825958252} -08/30/2021 16:58:28 - INFO - __main__ - Step 20945: {'lr': 0.0004800579618414676, 'samples': 4021440, 'steps': 20944, 'loss/train': 0.9009919762611389} -08/30/2021 16:58:28 - INFO - __main__ - Step 20946: {'lr': 0.0004800558848696433, 'samples': 4021632, 'steps': 20945, 'loss/train': 1.5119132995605469} -08/30/2021 16:58:28 - INFO - __main__ - Step 20947: {'lr': 0.0004800538077941594, 'samples': 4021824, 'steps': 20946, 'loss/train': 1.3563536405563354} -08/30/2021 16:58:29 - INFO - __main__ - Step 20948: {'lr': 0.00048005173061501673, 'samples': 4022016, 'steps': 20947, 'loss/train': 0.7356158494949341} -08/30/2021 16:58:29 - INFO - __main__ - Step 20949: {'lr': 0.0004800496533322164, 'samples': 4022208, 'steps': 20948, 'loss/train': 0.7174288034439087} -08/30/2021 16:58:31 - INFO - __main__ - Step 20950: {'lr': 0.00048004757594575923, 'samples': 4022400, 'steps': 20949, 'loss/train': 0.5843749046325684} -08/30/2021 16:58:31 - INFO - __main__ - Step 20951: {'lr': 0.0004800454984556461, 'samples': 4022592, 'steps': 20950, 'loss/train': 1.7752432823181152} -08/30/2021 16:58:31 - INFO - __main__ - Step 20952: {'lr': 0.00048004342086187805, 'samples': 4022784, 'steps': 20951, 'loss/train': 1.4212886095046997} -08/30/2021 16:58:32 - INFO - __main__ - Step 20953: {'lr': 0.000480041343164456, 'samples': 4022976, 'steps': 20952, 'loss/train': 1.3968759775161743} -08/30/2021 16:58:32 - INFO - __main__ - Step 20954: {'lr': 0.0004800392653633808, 'samples': 4023168, 'steps': 20953, 'loss/train': 1.6341660022735596} -08/30/2021 16:58:34 - INFO - __main__ - Step 20955: {'lr': 0.0004800371874586535, 'samples': 4023360, 'steps': 20954, 'loss/train': 0.8786346912384033} -08/30/2021 16:58:34 - INFO - __main__ - Step 20956: {'lr': 0.0004800351094502751, 'samples': 4023552, 'steps': 20955, 'loss/train': 1.3521685600280762} -08/30/2021 16:58:34 - INFO - __main__ - Step 20957: {'lr': 0.00048003303133824633, 'samples': 4023744, 'steps': 20956, 'loss/train': 1.648524522781372} -08/30/2021 16:58:35 - INFO - __main__ - Step 20958: {'lr': 0.0004800309531225683, 'samples': 4023936, 'steps': 20957, 'loss/train': 1.6984584331512451} -08/30/2021 16:58:35 - INFO - __main__ - Step 20959: {'lr': 0.00048002887480324175, 'samples': 4024128, 'steps': 20958, 'loss/train': 1.4897602796554565} -08/30/2021 16:58:37 - INFO - __main__ - Step 20960: {'lr': 0.0004800267963802678, 'samples': 4024320, 'steps': 20959, 'loss/train': 1.420543909072876} -08/30/2021 16:58:38 - INFO - __main__ - Step 20961: {'lr': 0.0004800247178536473, 'samples': 4024512, 'steps': 20960, 'loss/train': 1.5173707008361816} -08/30/2021 16:58:38 - INFO - __main__ - Step 20962: {'lr': 0.0004800226392233813, 'samples': 4024704, 'steps': 20961, 'loss/train': 1.550585389137268} -08/30/2021 16:58:38 - INFO - __main__ - Step 20963: {'lr': 0.00048002056048947054, 'samples': 4024896, 'steps': 20962, 'loss/train': 1.3969539403915405} -08/30/2021 16:58:39 - INFO - __main__ - Step 20964: {'lr': 0.0004800184816519161, 'samples': 4025088, 'steps': 20963, 'loss/train': 1.7827870845794678} -08/30/2021 16:58:39 - INFO - __main__ - Step 20965: {'lr': 0.0004800164027107189, 'samples': 4025280, 'steps': 20964, 'loss/train': 0.1982184797525406} -08/30/2021 16:58:41 - INFO - __main__ - Step 20966: {'lr': 0.0004800143236658798, 'samples': 4025472, 'steps': 20965, 'loss/train': 1.8056644201278687} -08/30/2021 16:58:41 - INFO - __main__ - Step 20967: {'lr': 0.0004800122445173999, 'samples': 4025664, 'steps': 20966, 'loss/train': 1.2438685894012451} -08/30/2021 16:58:42 - INFO - __main__ - Step 20968: {'lr': 0.00048001016526528, 'samples': 4025856, 'steps': 20967, 'loss/train': 1.4209654331207275} -08/30/2021 16:58:42 - INFO - __main__ - Step 20969: {'lr': 0.00048000808590952106, 'samples': 4026048, 'steps': 20968, 'loss/train': 1.1624550819396973} -08/30/2021 16:58:42 - INFO - __main__ - Step 20970: {'lr': 0.0004800060064501239, 'samples': 4026240, 'steps': 20969, 'loss/train': 1.373073935508728} -08/30/2021 16:58:44 - INFO - __main__ - Step 20971: {'lr': 0.00048000392688708976, 'samples': 4026432, 'steps': 20970, 'loss/train': 1.401117205619812} -08/30/2021 16:58:44 - INFO - __main__ - Step 20972: {'lr': 0.00048000184722041934, 'samples': 4026624, 'steps': 20971, 'loss/train': 1.7493475675582886} -08/30/2021 16:58:45 - INFO - __main__ - Step 20973: {'lr': 0.00047999976745011366, 'samples': 4026816, 'steps': 20972, 'loss/train': 1.0928475856781006} -08/30/2021 16:58:45 - INFO - __main__ - Step 20974: {'lr': 0.0004799976875761736, 'samples': 4027008, 'steps': 20973, 'loss/train': 2.1853578090667725} -08/30/2021 16:58:45 - INFO - __main__ - Step 20975: {'lr': 0.00047999560759860006, 'samples': 4027200, 'steps': 20974, 'loss/train': 2.230820894241333} -08/30/2021 16:58:47 - INFO - __main__ - Step 20976: {'lr': 0.00047999352751739414, 'samples': 4027392, 'steps': 20975, 'loss/train': 1.414308786392212} -08/30/2021 16:58:48 - INFO - __main__ - Step 20977: {'lr': 0.0004799914473325567, 'samples': 4027584, 'steps': 20976, 'loss/train': 1.6380691528320312} -08/30/2021 16:58:48 - INFO - __main__ - Step 20978: {'lr': 0.00047998936704408865, 'samples': 4027776, 'steps': 20977, 'loss/train': 1.5667731761932373} -08/30/2021 16:58:48 - INFO - __main__ - Step 20979: {'lr': 0.00047998728665199085, 'samples': 4027968, 'steps': 20978, 'loss/train': 0.7598178386688232} -08/30/2021 16:58:49 - INFO - __main__ - Step 20980: {'lr': 0.00047998520615626447, 'samples': 4028160, 'steps': 20979, 'loss/train': 0.548076331615448} -08/30/2021 16:58:49 - INFO - __main__ - Step 20981: {'lr': 0.0004799831255569102, 'samples': 4028352, 'steps': 20980, 'loss/train': 3.950775384902954} -08/30/2021 16:58:51 - INFO - __main__ - Step 20982: {'lr': 0.00047998104485392915, 'samples': 4028544, 'steps': 20981, 'loss/train': 1.2458995580673218} -08/30/2021 16:58:51 - INFO - __main__ - Step 20983: {'lr': 0.0004799789640473221, 'samples': 4028736, 'steps': 20982, 'loss/train': 3.2928640842437744} -08/30/2021 16:58:51 - INFO - __main__ - Step 20984: {'lr': 0.0004799768831370902, 'samples': 4028928, 'steps': 20983, 'loss/train': 1.4735898971557617} -08/30/2021 16:58:52 - INFO - __main__ - Step 20985: {'lr': 0.0004799748021232342, 'samples': 4029120, 'steps': 20984, 'loss/train': 1.8679158687591553} -08/30/2021 16:58:52 - INFO - __main__ - Step 20986: {'lr': 0.00047997272100575505, 'samples': 4029312, 'steps': 20985, 'loss/train': 2.7078568935394287} -08/30/2021 16:58:54 - INFO - __main__ - Step 20987: {'lr': 0.00047997063978465383, 'samples': 4029504, 'steps': 20986, 'loss/train': 1.5304360389709473} -08/30/2021 16:58:54 - INFO - __main__ - Step 20988: {'lr': 0.0004799685584599313, 'samples': 4029696, 'steps': 20987, 'loss/train': 1.5792006254196167} -08/30/2021 16:58:54 - INFO - __main__ - Step 20989: {'lr': 0.00047996647703158857, 'samples': 4029888, 'steps': 20988, 'loss/train': 2.113802433013916} -08/30/2021 16:58:55 - INFO - __main__ - Step 20990: {'lr': 0.00047996439549962647, 'samples': 4030080, 'steps': 20989, 'loss/train': 1.8476831912994385} -08/30/2021 16:58:55 - INFO - __main__ - Step 20991: {'lr': 0.00047996231386404593, 'samples': 4030272, 'steps': 20990, 'loss/train': 1.592795729637146} -08/30/2021 16:58:57 - INFO - __main__ - Step 20992: {'lr': 0.00047996023212484797, 'samples': 4030464, 'steps': 20991, 'loss/train': 1.5453822612762451} -08/30/2021 16:58:57 - INFO - __main__ - Step 20993: {'lr': 0.00047995815028203346, 'samples': 4030656, 'steps': 20992, 'loss/train': 2.155550003051758} -08/30/2021 16:58:58 - INFO - __main__ - Step 20994: {'lr': 0.00047995606833560337, 'samples': 4030848, 'steps': 20993, 'loss/train': 3.0335333347320557} -08/30/2021 16:58:58 - INFO - __main__ - Step 20995: {'lr': 0.0004799539862855585, 'samples': 4031040, 'steps': 20994, 'loss/train': 1.8598829507827759} -08/30/2021 16:58:58 - INFO - __main__ - Step 20996: {'lr': 0.00047995190413190004, 'samples': 4031232, 'steps': 20995, 'loss/train': 0.11773476749658585} -08/30/2021 16:58:59 - INFO - __main__ - Step 20997: {'lr': 0.00047994982187462876, 'samples': 4031424, 'steps': 20996, 'loss/train': 1.9217010736465454} -08/30/2021 16:59:00 - INFO - __main__ - Step 20998: {'lr': 0.0004799477395137457, 'samples': 4031616, 'steps': 20997, 'loss/train': 2.0599071979522705} -08/30/2021 16:59:01 - INFO - __main__ - Step 20999: {'lr': 0.00047994565704925166, 'samples': 4031808, 'steps': 20998, 'loss/train': 1.5909682512283325} -08/30/2021 16:59:01 - INFO - __main__ - Step 21000: {'lr': 0.0004799435744811477, 'samples': 4032000, 'steps': 20999, 'loss/train': 1.0935367345809937} -08/30/2021 16:59:01 - INFO - __main__ - Step 21001: {'lr': 0.0004799414918094347, 'samples': 4032192, 'steps': 21000, 'loss/train': 1.9355828762054443} -08/30/2021 16:59:02 - INFO - __main__ - Step 21002: {'lr': 0.0004799394090341136, 'samples': 4032384, 'steps': 21001, 'loss/train': 1.5669392347335815} -08/30/2021 16:59:03 - INFO - __main__ - Step 21003: {'lr': 0.0004799373261551854, 'samples': 4032576, 'steps': 21002, 'loss/train': 1.6707897186279297} -08/30/2021 16:59:04 - INFO - __main__ - Step 21004: {'lr': 0.0004799352431726509, 'samples': 4032768, 'steps': 21003, 'loss/train': 1.8671692609786987} -08/30/2021 16:59:04 - INFO - __main__ - Step 21005: {'lr': 0.0004799331600865112, 'samples': 4032960, 'steps': 21004, 'loss/train': 1.4355348348617554} -08/30/2021 16:59:04 - INFO - __main__ - Step 21006: {'lr': 0.0004799310768967671, 'samples': 4033152, 'steps': 21005, 'loss/train': 1.6290297508239746} -08/30/2021 16:59:05 - INFO - __main__ - Step 21007: {'lr': 0.00047992899360341966, 'samples': 4033344, 'steps': 21006, 'loss/train': 1.5777473449707031} -08/30/2021 16:59:06 - INFO - __main__ - Step 21008: {'lr': 0.0004799269102064698, 'samples': 4033536, 'steps': 21007, 'loss/train': 1.8052923679351807} -08/30/2021 16:59:06 - INFO - __main__ - Step 21009: {'lr': 0.0004799248267059183, 'samples': 4033728, 'steps': 21008, 'loss/train': 1.715876579284668} -08/30/2021 16:59:07 - INFO - __main__ - Step 21010: {'lr': 0.0004799227431017663, 'samples': 4033920, 'steps': 21009, 'loss/train': 1.5748149156570435} -08/30/2021 16:59:07 - INFO - __main__ - Step 21011: {'lr': 0.0004799206593940147, 'samples': 4034112, 'steps': 21010, 'loss/train': 1.6504967212677002} -08/30/2021 16:59:08 - INFO - __main__ - Step 21012: {'lr': 0.0004799185755826644, 'samples': 4034304, 'steps': 21011, 'loss/train': 1.7354111671447754} -08/30/2021 16:59:09 - INFO - __main__ - Step 21013: {'lr': 0.00047991649166771624, 'samples': 4034496, 'steps': 21012, 'loss/train': 1.6346644163131714} -08/30/2021 16:59:10 - INFO - __main__ - Step 21014: {'lr': 0.00047991440764917127, 'samples': 4034688, 'steps': 21013, 'loss/train': 2.4204812049865723} -08/30/2021 16:59:10 - INFO - __main__ - Step 21015: {'lr': 0.0004799123235270305, 'samples': 4034880, 'steps': 21014, 'loss/train': 1.6461856365203857} -08/30/2021 16:59:10 - INFO - __main__ - Step 21016: {'lr': 0.0004799102393012947, 'samples': 4035072, 'steps': 21015, 'loss/train': 1.6606346368789673} -08/30/2021 16:59:11 - INFO - __main__ - Step 21017: {'lr': 0.0004799081549719649, 'samples': 4035264, 'steps': 21016, 'loss/train': 1.1760226488113403} -08/30/2021 16:59:12 - INFO - __main__ - Step 21018: {'lr': 0.0004799060705390421, 'samples': 4035456, 'steps': 21017, 'loss/train': 2.0579817295074463} -08/30/2021 16:59:12 - INFO - __main__ - Step 21019: {'lr': 0.00047990398600252713, 'samples': 4035648, 'steps': 21018, 'loss/train': 1.7861557006835938} -08/30/2021 16:59:13 - INFO - __main__ - Step 21020: {'lr': 0.00047990190136242103, 'samples': 4035840, 'steps': 21019, 'loss/train': 1.7574015855789185} -08/30/2021 16:59:13 - INFO - __main__ - Step 21021: {'lr': 0.0004798998166187246, 'samples': 4036032, 'steps': 21020, 'loss/train': 1.1989426612854004} -08/30/2021 16:59:14 - INFO - __main__ - Step 21022: {'lr': 0.0004798977317714389, 'samples': 4036224, 'steps': 21021, 'loss/train': 1.8363909721374512} -08/30/2021 16:59:16 - INFO - __main__ - Step 21023: {'lr': 0.00047989564682056487, 'samples': 4036416, 'steps': 21022, 'loss/train': 1.7746086120605469} -08/30/2021 16:59:16 - INFO - __main__ - Step 21024: {'lr': 0.0004798935617661033, 'samples': 4036608, 'steps': 21023, 'loss/train': 1.5361837148666382} -08/30/2021 16:59:16 - INFO - __main__ - Step 21025: {'lr': 0.0004798914766080553, 'samples': 4036800, 'steps': 21024, 'loss/train': 2.529196262359619} -08/30/2021 16:59:17 - INFO - __main__ - Step 21026: {'lr': 0.00047988939134642174, 'samples': 4036992, 'steps': 21025, 'loss/train': 1.467066764831543} -08/30/2021 16:59:17 - INFO - __main__ - Step 21027: {'lr': 0.00047988730598120356, 'samples': 4037184, 'steps': 21026, 'loss/train': 1.8944923877716064} -08/30/2021 16:59:19 - INFO - __main__ - Step 21028: {'lr': 0.00047988522051240173, 'samples': 4037376, 'steps': 21027, 'loss/train': 0.8948488831520081} -08/30/2021 16:59:19 - INFO - __main__ - Step 21029: {'lr': 0.0004798831349400172, 'samples': 4037568, 'steps': 21028, 'loss/train': 2.0099880695343018} -08/30/2021 16:59:19 - INFO - __main__ - Step 21030: {'lr': 0.0004798810492640508, 'samples': 4037760, 'steps': 21029, 'loss/train': 1.7088042497634888} -08/30/2021 16:59:20 - INFO - __main__ - Step 21031: {'lr': 0.00047987896348450354, 'samples': 4037952, 'steps': 21030, 'loss/train': 1.5720404386520386} -08/30/2021 16:59:20 - INFO - __main__ - Step 21032: {'lr': 0.00047987687760137646, 'samples': 4038144, 'steps': 21031, 'loss/train': 1.5632773637771606} -08/30/2021 16:59:21 - INFO - __main__ - Step 21033: {'lr': 0.00047987479161467033, 'samples': 4038336, 'steps': 21032, 'loss/train': 1.9008517265319824} -08/30/2021 16:59:22 - INFO - __main__ - Step 21034: {'lr': 0.0004798727055243862, 'samples': 4038528, 'steps': 21033, 'loss/train': 1.5379389524459839} -08/30/2021 16:59:23 - INFO - __main__ - Step 21035: {'lr': 0.000479870619330525, 'samples': 4038720, 'steps': 21034, 'loss/train': 0.876471757888794} -08/30/2021 16:59:23 - INFO - __main__ - Step 21036: {'lr': 0.0004798685330330876, 'samples': 4038912, 'steps': 21035, 'loss/train': 1.7168902158737183} -08/30/2021 16:59:23 - INFO - __main__ - Step 21037: {'lr': 0.000479866446632075, 'samples': 4039104, 'steps': 21036, 'loss/train': 1.406392216682434} -08/30/2021 16:59:24 - INFO - __main__ - Step 21038: {'lr': 0.00047986436012748815, 'samples': 4039296, 'steps': 21037, 'loss/train': 1.267569661140442} -08/30/2021 16:59:25 - INFO - __main__ - Step 21039: {'lr': 0.00047986227351932785, 'samples': 4039488, 'steps': 21038, 'loss/train': 1.684775710105896} -08/30/2021 16:59:26 - INFO - __main__ - Step 21040: {'lr': 0.00047986018680759525, 'samples': 4039680, 'steps': 21039, 'loss/train': 1.8256009817123413} -08/30/2021 16:59:26 - INFO - __main__ - Step 21041: {'lr': 0.00047985809999229125, 'samples': 4039872, 'steps': 21040, 'loss/train': 1.766939640045166} -08/30/2021 16:59:26 - INFO - __main__ - Step 21042: {'lr': 0.00047985601307341667, 'samples': 4040064, 'steps': 21041, 'loss/train': 1.1235382556915283} -08/30/2021 16:59:27 - INFO - __main__ - Step 21043: {'lr': 0.0004798539260509725, 'samples': 4040256, 'steps': 21042, 'loss/train': 1.7099907398223877} -08/30/2021 16:59:28 - INFO - __main__ - Step 21044: {'lr': 0.00047985183892495977, 'samples': 4040448, 'steps': 21043, 'loss/train': 1.3469377756118774} -08/30/2021 16:59:29 - INFO - __main__ - Step 21045: {'lr': 0.00047984975169537925, 'samples': 4040640, 'steps': 21044, 'loss/train': 0.8599517941474915} -08/30/2021 16:59:29 - INFO - __main__ - Step 21046: {'lr': 0.00047984766436223205, 'samples': 4040832, 'steps': 21045, 'loss/train': 1.3645668029785156} -08/30/2021 16:59:29 - INFO - __main__ - Step 21047: {'lr': 0.000479845576925519, 'samples': 4041024, 'steps': 21046, 'loss/train': 1.9667969942092896} -08/30/2021 16:59:30 - INFO - __main__ - Step 21048: {'lr': 0.00047984348938524113, 'samples': 4041216, 'steps': 21047, 'loss/train': 1.1815723180770874} -08/30/2021 16:59:31 - INFO - __main__ - Step 21049: {'lr': 0.00047984140174139926, 'samples': 4041408, 'steps': 21048, 'loss/train': 1.5975016355514526} -08/30/2021 16:59:32 - INFO - __main__ - Step 21050: {'lr': 0.0004798393139939945, 'samples': 4041600, 'steps': 21049, 'loss/train': 1.9904526472091675} -08/30/2021 16:59:32 - INFO - __main__ - Step 21051: {'lr': 0.0004798372261430276, 'samples': 4041792, 'steps': 21050, 'loss/train': 2.2192118167877197} -08/30/2021 16:59:33 - INFO - __main__ - Step 21052: {'lr': 0.00047983513818849967, 'samples': 4041984, 'steps': 21051, 'loss/train': 1.5575976371765137} -08/30/2021 16:59:33 - INFO - __main__ - Step 21053: {'lr': 0.0004798330501304115, 'samples': 4042176, 'steps': 21052, 'loss/train': 1.6344659328460693} -08/30/2021 16:59:34 - INFO - __main__ - Step 21054: {'lr': 0.00047983096196876413, 'samples': 4042368, 'steps': 21053, 'loss/train': 1.3212599754333496} -08/30/2021 16:59:35 - INFO - __main__ - Step 21055: {'lr': 0.00047982887370355846, 'samples': 4042560, 'steps': 21054, 'loss/train': 1.4824053049087524} -08/30/2021 16:59:35 - INFO - __main__ - Step 21056: {'lr': 0.0004798267853347955, 'samples': 4042752, 'steps': 21055, 'loss/train': 1.472094178199768} -08/30/2021 16:59:36 - INFO - __main__ - Step 21057: {'lr': 0.0004798246968624761, 'samples': 4042944, 'steps': 21056, 'loss/train': 1.0333106517791748} -08/30/2021 16:59:36 - INFO - __main__ - Step 21058: {'lr': 0.00047982260828660124, 'samples': 4043136, 'steps': 21057, 'loss/train': 1.8350293636322021} -08/30/2021 16:59:37 - INFO - __main__ - Step 21059: {'lr': 0.0004798205196071719, 'samples': 4043328, 'steps': 21058, 'loss/train': 1.284170150756836} -08/30/2021 16:59:38 - INFO - __main__ - Step 21060: {'lr': 0.00047981843082418884, 'samples': 4043520, 'steps': 21059, 'loss/train': 1.7510058879852295} -08/30/2021 16:59:38 - INFO - __main__ - Step 21061: {'lr': 0.0004798163419376533, 'samples': 4043712, 'steps': 21060, 'loss/train': 1.8825178146362305} -08/30/2021 16:59:39 - INFO - __main__ - Step 21062: {'lr': 0.00047981425294756595, 'samples': 4043904, 'steps': 21061, 'loss/train': 1.579464316368103} -08/30/2021 16:59:39 - INFO - __main__ - Step 21063: {'lr': 0.00047981216385392796, 'samples': 4044096, 'steps': 21062, 'loss/train': 1.7650657892227173} -08/30/2021 16:59:39 - INFO - __main__ - Step 21064: {'lr': 0.0004798100746567401, 'samples': 4044288, 'steps': 21063, 'loss/train': 1.6939369440078735} -08/30/2021 16:59:41 - INFO - __main__ - Step 21065: {'lr': 0.00047980798535600334, 'samples': 4044480, 'steps': 21064, 'loss/train': 1.627752661705017} -08/30/2021 16:59:41 - INFO - __main__ - Step 21066: {'lr': 0.00047980589595171866, 'samples': 4044672, 'steps': 21065, 'loss/train': 1.8847434520721436} -08/30/2021 16:59:42 - INFO - __main__ - Step 21067: {'lr': 0.000479803806443887, 'samples': 4044864, 'steps': 21066, 'loss/train': 1.7405376434326172} -08/30/2021 16:59:42 - INFO - __main__ - Step 21068: {'lr': 0.0004798017168325093, 'samples': 4045056, 'steps': 21067, 'loss/train': 1.945316195487976} -08/30/2021 16:59:42 - INFO - __main__ - Step 21069: {'lr': 0.0004797996271175865, 'samples': 4045248, 'steps': 21068, 'loss/train': 2.127417802810669} -08/30/2021 16:59:44 - INFO - __main__ - Step 21070: {'lr': 0.00047979753729911944, 'samples': 4045440, 'steps': 21069, 'loss/train': 1.282895803451538} -08/30/2021 16:59:44 - INFO - __main__ - Step 21071: {'lr': 0.00047979544737710925, 'samples': 4045632, 'steps': 21070, 'loss/train': 1.419189691543579} -08/30/2021 16:59:45 - INFO - __main__ - Step 21072: {'lr': 0.00047979335735155677, 'samples': 4045824, 'steps': 21071, 'loss/train': 1.1895549297332764} -08/30/2021 16:59:45 - INFO - __main__ - Step 21073: {'lr': 0.00047979126722246294, 'samples': 4046016, 'steps': 21072, 'loss/train': 1.095531940460205} -08/30/2021 16:59:45 - INFO - __main__ - Step 21074: {'lr': 0.0004797891769898287, 'samples': 4046208, 'steps': 21073, 'loss/train': 1.6173202991485596} -08/30/2021 16:59:47 - INFO - __main__ - Step 21075: {'lr': 0.00047978708665365503, 'samples': 4046400, 'steps': 21074, 'loss/train': 0.8989821672439575} -08/30/2021 16:59:48 - INFO - __main__ - Step 21076: {'lr': 0.0004797849962139428, 'samples': 4046592, 'steps': 21075, 'loss/train': 1.6845216751098633} -08/30/2021 16:59:48 - INFO - __main__ - Step 21077: {'lr': 0.00047978290567069306, 'samples': 4046784, 'steps': 21076, 'loss/train': 1.3722569942474365} -08/30/2021 16:59:49 - INFO - __main__ - Step 21078: {'lr': 0.00047978081502390656, 'samples': 4046976, 'steps': 21077, 'loss/train': 1.6358416080474854} -08/30/2021 16:59:49 - INFO - __main__ - Step 21079: {'lr': 0.0004797787242735845, 'samples': 4047168, 'steps': 21078, 'loss/train': 0.790678083896637} -08/30/2021 16:59:49 - INFO - __main__ - Step 21080: {'lr': 0.00047977663341972765, 'samples': 4047360, 'steps': 21079, 'loss/train': 2.2479915618896484} -08/30/2021 16:59:51 - INFO - __main__ - Step 21081: {'lr': 0.00047977454246233696, 'samples': 4047552, 'steps': 21080, 'loss/train': 1.709816575050354} -08/30/2021 16:59:51 - INFO - __main__ - Step 21082: {'lr': 0.00047977245140141354, 'samples': 4047744, 'steps': 21081, 'loss/train': 1.2808079719543457} -08/30/2021 16:59:52 - INFO - __main__ - Step 21083: {'lr': 0.00047977036023695807, 'samples': 4047936, 'steps': 21082, 'loss/train': 1.2697173357009888} -08/30/2021 16:59:52 - INFO - __main__ - Step 21084: {'lr': 0.00047976826896897165, 'samples': 4048128, 'steps': 21083, 'loss/train': 1.6275309324264526} -08/30/2021 16:59:52 - INFO - __main__ - Step 21085: {'lr': 0.0004797661775974552, 'samples': 4048320, 'steps': 21084, 'loss/train': 1.8187636137008667} -08/30/2021 16:59:54 - INFO - __main__ - Step 21086: {'lr': 0.00047976408612240964, 'samples': 4048512, 'steps': 21085, 'loss/train': 1.1905463933944702} -08/30/2021 16:59:54 - INFO - __main__ - Step 21087: {'lr': 0.00047976199454383595, 'samples': 4048704, 'steps': 21086, 'loss/train': 2.2994184494018555} -08/30/2021 16:59:55 - INFO - __main__ - Step 21088: {'lr': 0.00047975990286173504, 'samples': 4048896, 'steps': 21087, 'loss/train': 1.679661512374878} -08/30/2021 16:59:55 - INFO - __main__ - Step 21089: {'lr': 0.00047975781107610784, 'samples': 4049088, 'steps': 21088, 'loss/train': 0.8422901034355164} -08/30/2021 16:59:56 - INFO - __main__ - Step 21090: {'lr': 0.0004797557191869554, 'samples': 4049280, 'steps': 21089, 'loss/train': 1.6706513166427612} -08/30/2021 16:59:57 - INFO - __main__ - Step 21091: {'lr': 0.0004797536271942785, 'samples': 4049472, 'steps': 21090, 'loss/train': 1.8182177543640137} -08/30/2021 16:59:57 - INFO - __main__ - Step 21092: {'lr': 0.00047975153509807815, 'samples': 4049664, 'steps': 21091, 'loss/train': 1.387774109840393} -08/30/2021 16:59:58 - INFO - __main__ - Step 21093: {'lr': 0.0004797494428983553, 'samples': 4049856, 'steps': 21092, 'loss/train': 1.8198074102401733} -08/30/2021 16:59:58 - INFO - __main__ - Step 21094: {'lr': 0.000479747350595111, 'samples': 4050048, 'steps': 21093, 'loss/train': 1.0651737451553345} -08/30/2021 16:59:58 - INFO - __main__ - Step 21095: {'lr': 0.00047974525818834604, 'samples': 4050240, 'steps': 21094, 'loss/train': 1.5520455837249756} -08/30/2021 17:00:00 - INFO - __main__ - Step 21096: {'lr': 0.0004797431656780613, 'samples': 4050432, 'steps': 21095, 'loss/train': 1.5461673736572266} -08/30/2021 17:00:00 - INFO - __main__ - Step 21097: {'lr': 0.000479741073064258, 'samples': 4050624, 'steps': 21096, 'loss/train': 1.611256718635559} -08/30/2021 17:00:01 - INFO - __main__ - Step 21098: {'lr': 0.0004797389803469369, 'samples': 4050816, 'steps': 21097, 'loss/train': 1.0551233291625977} -08/30/2021 17:00:01 - INFO - __main__ - Step 21099: {'lr': 0.0004797368875260988, 'samples': 4051008, 'steps': 21098, 'loss/train': 0.49395498633384705} -08/30/2021 17:00:01 - INFO - __main__ - Step 21100: {'lr': 0.00047973479460174497, 'samples': 4051200, 'steps': 21099, 'loss/train': 1.0994573831558228} -08/30/2021 17:00:03 - INFO - __main__ - Step 21101: {'lr': 0.00047973270157387605, 'samples': 4051392, 'steps': 21100, 'loss/train': 1.73939847946167} -08/30/2021 17:00:04 - INFO - __main__ - Step 21102: {'lr': 0.0004797306084424932, 'samples': 4051584, 'steps': 21101, 'loss/train': 1.246307611465454} -08/30/2021 17:00:04 - INFO - __main__ - Step 21103: {'lr': 0.0004797285152075973, 'samples': 4051776, 'steps': 21102, 'loss/train': 1.6441198587417603} -08/30/2021 17:00:04 - INFO - __main__ - Step 21104: {'lr': 0.00047972642186918925, 'samples': 4051968, 'steps': 21103, 'loss/train': 1.1580528020858765} -08/30/2021 17:00:05 - INFO - __main__ - Step 21105: {'lr': 0.00047972432842727003, 'samples': 4052160, 'steps': 21104, 'loss/train': 2.2623374462127686} -08/30/2021 17:00:06 - INFO - __main__ - Step 21106: {'lr': 0.0004797222348818405, 'samples': 4052352, 'steps': 21105, 'loss/train': 2.3679537773132324} -08/30/2021 17:00:07 - INFO - __main__ - Step 21107: {'lr': 0.00047972014123290183, 'samples': 4052544, 'steps': 21106, 'loss/train': 1.9266010522842407} -08/30/2021 17:00:07 - INFO - __main__ - Step 21108: {'lr': 0.00047971804748045464, 'samples': 4052736, 'steps': 21107, 'loss/train': 1.6839982271194458} -08/30/2021 17:00:07 - INFO - __main__ - Step 21109: {'lr': 0.00047971595362450014, 'samples': 4052928, 'steps': 21108, 'loss/train': 1.119568109512329} -08/30/2021 17:00:08 - INFO - __main__ - Step 21110: {'lr': 0.00047971385966503923, 'samples': 4053120, 'steps': 21109, 'loss/train': 1.3776720762252808} -08/30/2021 17:00:08 - INFO - __main__ - Step 21111: {'lr': 0.0004797117656020727, 'samples': 4053312, 'steps': 21110, 'loss/train': 2.06646728515625} -08/30/2021 17:00:09 - INFO - __main__ - Step 21112: {'lr': 0.0004797096714356016, 'samples': 4053504, 'steps': 21111, 'loss/train': 1.4350123405456543} -08/30/2021 17:00:10 - INFO - __main__ - Step 21113: {'lr': 0.0004797075771656269, 'samples': 4053696, 'steps': 21112, 'loss/train': 6.5142292976379395} -08/30/2021 17:00:10 - INFO - __main__ - Step 21114: {'lr': 0.0004797054827921495, 'samples': 4053888, 'steps': 21113, 'loss/train': 1.6243597269058228} -08/30/2021 17:00:11 - INFO - __main__ - Step 21115: {'lr': 0.0004797033883151703, 'samples': 4054080, 'steps': 21114, 'loss/train': 1.6746667623519897} -08/30/2021 17:00:11 - INFO - __main__ - Step 21116: {'lr': 0.0004797012937346904, 'samples': 4054272, 'steps': 21115, 'loss/train': 1.171312928199768} -08/30/2021 17:00:12 - INFO - __main__ - Step 21117: {'lr': 0.0004796991990507106, 'samples': 4054464, 'steps': 21116, 'loss/train': 1.5629198551177979} -08/30/2021 17:00:13 - INFO - __main__ - Step 21118: {'lr': 0.00047969710426323185, 'samples': 4054656, 'steps': 21117, 'loss/train': 1.9510616064071655} -08/30/2021 17:00:13 - INFO - __main__ - Step 21119: {'lr': 0.0004796950093722552, 'samples': 4054848, 'steps': 21118, 'loss/train': 1.6718730926513672} -08/30/2021 17:00:14 - INFO - __main__ - Step 21120: {'lr': 0.00047969291437778143, 'samples': 4055040, 'steps': 21119, 'loss/train': 1.4792535305023193} -08/30/2021 17:00:14 - INFO - __main__ - Step 21121: {'lr': 0.00047969081927981165, 'samples': 4055232, 'steps': 21120, 'loss/train': 1.7120091915130615} -08/30/2021 17:00:15 - INFO - __main__ - Step 21122: {'lr': 0.0004796887240783467, 'samples': 4055424, 'steps': 21121, 'loss/train': 1.5738706588745117} -08/30/2021 17:00:16 - INFO - __main__ - Step 21123: {'lr': 0.0004796866287733875, 'samples': 4055616, 'steps': 21122, 'loss/train': 1.5310466289520264} -08/30/2021 17:00:16 - INFO - __main__ - Step 21124: {'lr': 0.0004796845333649352, 'samples': 4055808, 'steps': 21123, 'loss/train': 1.5130800008773804} -08/30/2021 17:00:17 - INFO - __main__ - Step 21125: {'lr': 0.00047968243785299046, 'samples': 4056000, 'steps': 21124, 'loss/train': 1.5441941022872925} -08/30/2021 17:00:17 - INFO - __main__ - Step 21126: {'lr': 0.0004796803422375544, 'samples': 4056192, 'steps': 21125, 'loss/train': 1.8245644569396973} -08/30/2021 17:00:17 - INFO - __main__ - Step 21127: {'lr': 0.0004796782465186279, 'samples': 4056384, 'steps': 21126, 'loss/train': 1.6191391944885254} -08/30/2021 17:00:19 - INFO - __main__ - Step 21128: {'lr': 0.00047967615069621197, 'samples': 4056576, 'steps': 21127, 'loss/train': 1.7516992092132568} -08/30/2021 17:00:19 - INFO - __main__ - Step 21129: {'lr': 0.0004796740547703075, 'samples': 4056768, 'steps': 21128, 'loss/train': 1.7212977409362793} -08/30/2021 17:00:20 - INFO - __main__ - Step 21130: {'lr': 0.00047967195874091547, 'samples': 4056960, 'steps': 21129, 'loss/train': 1.614676833152771} -08/30/2021 17:00:20 - INFO - __main__ - Step 21131: {'lr': 0.00047966986260803676, 'samples': 4057152, 'steps': 21130, 'loss/train': 0.2862565517425537} -08/30/2021 17:00:20 - INFO - __main__ - Step 21132: {'lr': 0.0004796677663716723, 'samples': 4057344, 'steps': 21131, 'loss/train': 1.4826680421829224} -08/30/2021 17:00:22 - INFO - __main__ - Step 21133: {'lr': 0.00047966567003182315, 'samples': 4057536, 'steps': 21132, 'loss/train': 1.4634411334991455} -08/30/2021 17:00:23 - INFO - __main__ - Step 21134: {'lr': 0.0004796635735884902, 'samples': 4057728, 'steps': 21133, 'loss/train': 1.0680818557739258} -08/30/2021 17:00:23 - INFO - __main__ - Step 21135: {'lr': 0.0004796614770416744, 'samples': 4057920, 'steps': 21134, 'loss/train': 1.6191478967666626} -08/30/2021 17:00:23 - INFO - __main__ - Step 21136: {'lr': 0.00047965938039137666, 'samples': 4058112, 'steps': 21135, 'loss/train': 1.191550850868225} -08/30/2021 17:00:24 - INFO - __main__ - Step 21137: {'lr': 0.000479657283637598, 'samples': 4058304, 'steps': 21136, 'loss/train': 1.3693060874938965} -08/30/2021 17:00:25 - INFO - __main__ - Step 21138: {'lr': 0.00047965518678033924, 'samples': 4058496, 'steps': 21137, 'loss/train': 0.7484496235847473} -08/30/2021 17:00:26 - INFO - __main__ - Step 21139: {'lr': 0.00047965308981960143, 'samples': 4058688, 'steps': 21138, 'loss/train': 1.3798872232437134} -08/30/2021 17:00:26 - INFO - __main__ - Step 21140: {'lr': 0.0004796509927553854, 'samples': 4058880, 'steps': 21139, 'loss/train': 1.4580025672912598} -08/30/2021 17:00:26 - INFO - __main__ - Step 21141: {'lr': 0.00047964889558769233, 'samples': 4059072, 'steps': 21140, 'loss/train': 2.0219380855560303} -08/30/2021 17:00:27 - INFO - __main__ - Step 21142: {'lr': 0.00047964679831652294, 'samples': 4059264, 'steps': 21141, 'loss/train': 1.180588960647583} -08/30/2021 17:00:28 - INFO - __main__ - Step 21143: {'lr': 0.00047964470094187815, 'samples': 4059456, 'steps': 21142, 'loss/train': 1.8486741781234741} -08/30/2021 17:00:29 - INFO - __main__ - Step 21144: {'lr': 0.0004796426034637591, 'samples': 4059648, 'steps': 21143, 'loss/train': 2.0078158378601074} -08/30/2021 17:00:29 - INFO - __main__ - Step 21145: {'lr': 0.0004796405058821666, 'samples': 4059840, 'steps': 21144, 'loss/train': 1.6045961380004883} -08/30/2021 17:00:30 - INFO - __main__ - Step 21146: {'lr': 0.0004796384081971017, 'samples': 4060032, 'steps': 21145, 'loss/train': 1.570224404335022} -08/30/2021 17:00:30 - INFO - __main__ - Step 21147: {'lr': 0.0004796363104085652, 'samples': 4060224, 'steps': 21146, 'loss/train': 2.0301578044891357} -08/30/2021 17:00:31 - INFO - __main__ - Step 21148: {'lr': 0.00047963421251655817, 'samples': 4060416, 'steps': 21147, 'loss/train': 1.9047797918319702} -08/30/2021 17:00:32 - INFO - __main__ - Step 21149: {'lr': 0.00047963211452108144, 'samples': 4060608, 'steps': 21148, 'loss/train': 1.92880380153656} -08/30/2021 17:00:32 - INFO - __main__ - Step 21150: {'lr': 0.0004796300164221361, 'samples': 4060800, 'steps': 21149, 'loss/train': 1.8172188997268677} -08/30/2021 17:00:33 - INFO - __main__ - Step 21151: {'lr': 0.00047962791821972296, 'samples': 4060992, 'steps': 21150, 'loss/train': 2.119884967803955} -08/30/2021 17:00:33 - INFO - __main__ - Step 21152: {'lr': 0.00047962581991384305, 'samples': 4061184, 'steps': 21151, 'loss/train': 1.7036997079849243} -08/30/2021 17:00:33 - INFO - __main__ - Step 21153: {'lr': 0.0004796237215044973, 'samples': 4061376, 'steps': 21152, 'loss/train': 1.6930289268493652} -08/30/2021 17:00:35 - INFO - __main__ - Step 21154: {'lr': 0.0004796216229916867, 'samples': 4061568, 'steps': 21153, 'loss/train': 1.6659579277038574} -08/30/2021 17:00:35 - INFO - __main__ - Step 21155: {'lr': 0.000479619524375412, 'samples': 4061760, 'steps': 21154, 'loss/train': 1.9712690114974976} -08/30/2021 17:00:36 - INFO - __main__ - Step 21156: {'lr': 0.0004796174256556744, 'samples': 4061952, 'steps': 21155, 'loss/train': 1.701959252357483} -08/30/2021 17:00:36 - INFO - __main__ - Step 21157: {'lr': 0.0004796153268324747, 'samples': 4062144, 'steps': 21156, 'loss/train': 1.6595348119735718} -08/30/2021 17:00:36 - INFO - __main__ - Step 21158: {'lr': 0.00047961322790581384, 'samples': 4062336, 'steps': 21157, 'loss/train': 1.7811648845672607} -08/30/2021 17:00:38 - INFO - __main__ - Step 21159: {'lr': 0.00047961112887569285, 'samples': 4062528, 'steps': 21158, 'loss/train': 1.2896312475204468} -08/30/2021 17:00:38 - INFO - __main__ - Step 21160: {'lr': 0.0004796090297421126, 'samples': 4062720, 'steps': 21159, 'loss/train': 1.0237380266189575} -08/30/2021 17:00:39 - INFO - __main__ - Step 21161: {'lr': 0.0004796069305050741, 'samples': 4062912, 'steps': 21160, 'loss/train': 1.6675056219100952} -08/30/2021 17:00:39 - INFO - __main__ - Step 21162: {'lr': 0.0004796048311645782, 'samples': 4063104, 'steps': 21161, 'loss/train': 1.378087043762207} -08/30/2021 17:00:39 - INFO - __main__ - Step 21163: {'lr': 0.00047960273172062596, 'samples': 4063296, 'steps': 21162, 'loss/train': 1.5852527618408203} -08/30/2021 17:00:41 - INFO - __main__ - Step 21164: {'lr': 0.00047960063217321824, 'samples': 4063488, 'steps': 21163, 'loss/train': 1.6329618692398071} -08/30/2021 17:00:41 - INFO - __main__ - Step 21165: {'lr': 0.0004795985325223561, 'samples': 4063680, 'steps': 21164, 'loss/train': 6.379885673522949} -08/30/2021 17:00:41 - INFO - __main__ - Step 21166: {'lr': 0.00047959643276804026, 'samples': 4063872, 'steps': 21165, 'loss/train': 1.1205564737319946} -08/30/2021 17:00:42 - INFO - __main__ - Step 21167: {'lr': 0.0004795943329102719, 'samples': 4064064, 'steps': 21166, 'loss/train': 1.3630781173706055} -08/30/2021 17:00:42 - INFO - __main__ - Step 21168: {'lr': 0.00047959223294905185, 'samples': 4064256, 'steps': 21167, 'loss/train': 1.8570128679275513} -08/30/2021 17:00:44 - INFO - __main__ - Step 21169: {'lr': 0.00047959013288438113, 'samples': 4064448, 'steps': 21168, 'loss/train': 1.3203643560409546} -08/30/2021 17:00:45 - INFO - __main__ - Step 21170: {'lr': 0.0004795880327162606, 'samples': 4064640, 'steps': 21169, 'loss/train': 1.1915868520736694} -08/30/2021 17:00:45 - INFO - __main__ - Step 21171: {'lr': 0.0004795859324446912, 'samples': 4064832, 'steps': 21170, 'loss/train': 0.10693927109241486} -08/30/2021 17:00:45 - INFO - __main__ - Step 21172: {'lr': 0.000479583832069674, 'samples': 4065024, 'steps': 21171, 'loss/train': 0.39779266715049744} -08/30/2021 17:00:46 - INFO - __main__ - Step 21173: {'lr': 0.00047958173159120984, 'samples': 4065216, 'steps': 21172, 'loss/train': 1.258679986000061} -08/30/2021 17:00:47 - INFO - __main__ - Step 21174: {'lr': 0.0004795796310092997, 'samples': 4065408, 'steps': 21173, 'loss/train': 1.0735141038894653} -08/30/2021 17:00:48 - INFO - __main__ - Step 21175: {'lr': 0.00047957753032394445, 'samples': 4065600, 'steps': 21174, 'loss/train': 1.6297802925109863} -08/30/2021 17:00:48 - INFO - __main__ - Step 21176: {'lr': 0.00047957542953514523, 'samples': 4065792, 'steps': 21175, 'loss/train': 1.7633613348007202} -08/30/2021 17:00:48 - INFO - __main__ - Step 21177: {'lr': 0.00047957332864290283, 'samples': 4065984, 'steps': 21176, 'loss/train': 2.5928258895874023} -08/30/2021 17:00:49 - INFO - __main__ - Step 21178: {'lr': 0.00047957122764721817, 'samples': 4066176, 'steps': 21177, 'loss/train': 1.5828711986541748} -08/30/2021 17:00:50 - INFO - __main__ - Step 21179: {'lr': 0.00047956912654809227, 'samples': 4066368, 'steps': 21178, 'loss/train': 1.8395119905471802} -08/30/2021 17:00:51 - INFO - __main__ - Step 21180: {'lr': 0.0004795670253455261, 'samples': 4066560, 'steps': 21179, 'loss/train': 1.6991662979125977} -08/30/2021 17:00:51 - INFO - __main__ - Step 21181: {'lr': 0.00047956492403952055, 'samples': 4066752, 'steps': 21180, 'loss/train': 2.4299497604370117} -08/30/2021 17:00:51 - INFO - __main__ - Step 21182: {'lr': 0.00047956282263007663, 'samples': 4066944, 'steps': 21181, 'loss/train': 1.1073206663131714} -08/30/2021 17:00:52 - INFO - __main__ - Step 21183: {'lr': 0.00047956072111719517, 'samples': 4067136, 'steps': 21182, 'loss/train': 0.08222738653421402} -08/30/2021 17:00:52 - INFO - __main__ - Step 21184: {'lr': 0.00047955861950087724, 'samples': 4067328, 'steps': 21183, 'loss/train': 1.4232593774795532} -08/30/2021 17:00:54 - INFO - __main__ - Step 21185: {'lr': 0.00047955651778112376, 'samples': 4067520, 'steps': 21184, 'loss/train': 1.5396087169647217} -08/30/2021 17:00:55 - INFO - __main__ - Step 21186: {'lr': 0.00047955441595793556, 'samples': 4067712, 'steps': 21185, 'loss/train': 1.8421236276626587} -08/30/2021 17:00:55 - INFO - __main__ - Step 21187: {'lr': 0.0004795523140313138, 'samples': 4067904, 'steps': 21186, 'loss/train': 1.4485394954681396} -08/30/2021 17:00:56 - INFO - __main__ - Step 21188: {'lr': 0.00047955021200125924, 'samples': 4068096, 'steps': 21187, 'loss/train': 1.758474349975586} -08/30/2021 17:00:56 - INFO - __main__ - Step 21189: {'lr': 0.0004795481098677729, 'samples': 4068288, 'steps': 21188, 'loss/train': 1.2918554544448853} -08/30/2021 17:00:57 - INFO - __main__ - Step 21190: {'lr': 0.00047954600763085577, 'samples': 4068480, 'steps': 21189, 'loss/train': 3.0587217807769775} -08/30/2021 17:00:58 - INFO - __main__ - Step 21191: {'lr': 0.0004795439052905087, 'samples': 4068672, 'steps': 21190, 'loss/train': 1.4779027700424194} -08/30/2021 17:00:58 - INFO - __main__ - Step 21192: {'lr': 0.0004795418028467327, 'samples': 4068864, 'steps': 21191, 'loss/train': 1.567817211151123} -08/30/2021 17:00:59 - INFO - __main__ - Step 21193: {'lr': 0.0004795397002995288, 'samples': 4069056, 'steps': 21192, 'loss/train': 1.5164625644683838} -08/30/2021 17:00:59 - INFO - __main__ - Step 21194: {'lr': 0.0004795375976488977, 'samples': 4069248, 'steps': 21193, 'loss/train': 1.7314308881759644} -08/30/2021 17:01:00 - INFO - __main__ - Step 21195: {'lr': 0.00047953549489484056, 'samples': 4069440, 'steps': 21194, 'loss/train': 1.236986756324768} -08/30/2021 17:01:01 - INFO - __main__ - Step 21196: {'lr': 0.0004795333920373583, 'samples': 4069632, 'steps': 21195, 'loss/train': 1.9612573385238647} -08/30/2021 17:01:01 - INFO - __main__ - Step 21197: {'lr': 0.00047953128907645185, 'samples': 4069824, 'steps': 21196, 'loss/train': 1.5197736024856567} -08/30/2021 17:01:02 - INFO - __main__ - Step 21198: {'lr': 0.000479529186012122, 'samples': 4070016, 'steps': 21197, 'loss/train': 1.5771238803863525} -08/30/2021 17:01:02 - INFO - __main__ - Step 21199: {'lr': 0.00047952708284437, 'samples': 4070208, 'steps': 21198, 'loss/train': 1.7781250476837158} -08/30/2021 17:01:02 - INFO - __main__ - Step 21200: {'lr': 0.0004795249795731966, 'samples': 4070400, 'steps': 21199, 'loss/train': 2.0518839359283447} -08/30/2021 17:01:04 - INFO - __main__ - Step 21201: {'lr': 0.00047952287619860273, 'samples': 4070592, 'steps': 21200, 'loss/train': 1.9785789251327515} -08/30/2021 17:01:04 - INFO - __main__ - Step 21202: {'lr': 0.0004795207727205895, 'samples': 4070784, 'steps': 21201, 'loss/train': 2.0732979774475098} -08/30/2021 17:01:05 - INFO - __main__ - Step 21203: {'lr': 0.00047951866913915767, 'samples': 4070976, 'steps': 21202, 'loss/train': 1.606500506401062} -08/30/2021 17:01:05 - INFO - __main__ - Step 21204: {'lr': 0.0004795165654543082, 'samples': 4071168, 'steps': 21203, 'loss/train': 0.6346612572669983} -08/30/2021 17:01:05 - INFO - __main__ - Step 21205: {'lr': 0.0004795144616660422, 'samples': 4071360, 'steps': 21204, 'loss/train': 1.6594130992889404} -08/30/2021 17:01:07 - INFO - __main__ - Step 21206: {'lr': 0.0004795123577743605, 'samples': 4071552, 'steps': 21205, 'loss/train': 1.4455301761627197} -08/30/2021 17:01:07 - INFO - __main__ - Step 21207: {'lr': 0.0004795102537792641, 'samples': 4071744, 'steps': 21206, 'loss/train': 1.718607783317566} -08/30/2021 17:01:08 - INFO - __main__ - Step 21208: {'lr': 0.000479508149680754, 'samples': 4071936, 'steps': 21207, 'loss/train': 2.245089530944824} -08/30/2021 17:01:08 - INFO - __main__ - Step 21209: {'lr': 0.0004795060454788309, 'samples': 4072128, 'steps': 21208, 'loss/train': 1.3547050952911377} -08/30/2021 17:01:08 - INFO - __main__ - Step 21210: {'lr': 0.000479503941173496, 'samples': 4072320, 'steps': 21209, 'loss/train': 1.5988857746124268} -08/30/2021 17:01:10 - INFO - __main__ - Step 21211: {'lr': 0.0004795018367647501, 'samples': 4072512, 'steps': 21210, 'loss/train': 1.6448431015014648} -08/30/2021 17:01:11 - INFO - __main__ - Step 21212: {'lr': 0.0004794997322525944, 'samples': 4072704, 'steps': 21211, 'loss/train': 1.3287367820739746} -08/30/2021 17:01:11 - INFO - __main__ - Step 21213: {'lr': 0.0004794976276370295, 'samples': 4072896, 'steps': 21212, 'loss/train': 1.5425965785980225} -08/30/2021 17:01:11 - INFO - __main__ - Step 21214: {'lr': 0.00047949552291805654, 'samples': 4073088, 'steps': 21213, 'loss/train': 1.610379934310913} -08/30/2021 17:01:12 - INFO - __main__ - Step 21215: {'lr': 0.0004794934180956764, 'samples': 4073280, 'steps': 21214, 'loss/train': 1.6742967367172241} -08/30/2021 17:01:13 - INFO - __main__ - Step 21216: {'lr': 0.00047949131316989016, 'samples': 4073472, 'steps': 21215, 'loss/train': 1.3280588388442993} -08/30/2021 17:01:14 - INFO - __main__ - Step 21217: {'lr': 0.0004794892081406986, 'samples': 4073664, 'steps': 21216, 'loss/train': 1.492698073387146} -08/30/2021 17:01:14 - INFO - __main__ - Step 21218: {'lr': 0.00047948710300810276, 'samples': 4073856, 'steps': 21217, 'loss/train': 0.12345721572637558} -08/30/2021 17:01:14 - INFO - __main__ - Step 21219: {'lr': 0.0004794849977721036, 'samples': 4074048, 'steps': 21218, 'loss/train': 0.09284964948892593} -08/30/2021 17:01:15 - INFO - __main__ - Step 21220: {'lr': 0.00047948289243270205, 'samples': 4074240, 'steps': 21219, 'loss/train': 0.8473216891288757} -08/30/2021 17:01:16 - INFO - __main__ - Step 21221: {'lr': 0.000479480786989899, 'samples': 4074432, 'steps': 21220, 'loss/train': 0.8647047877311707} -08/30/2021 17:01:17 - INFO - __main__ - Step 21222: {'lr': 0.0004794786814436955, 'samples': 4074624, 'steps': 21221, 'loss/train': 1.4903291463851929} -08/30/2021 17:01:17 - INFO - __main__ - Step 21223: {'lr': 0.0004794765757940924, 'samples': 4074816, 'steps': 21222, 'loss/train': 1.6796345710754395} -08/30/2021 17:01:17 - INFO - __main__ - Step 21224: {'lr': 0.00047947447004109066, 'samples': 4075008, 'steps': 21223, 'loss/train': 1.7726914882659912} -08/30/2021 17:01:18 - INFO - __main__ - Step 21225: {'lr': 0.0004794723641846914, 'samples': 4075200, 'steps': 21224, 'loss/train': 1.5440503358840942} -08/30/2021 17:01:19 - INFO - __main__ - Step 21226: {'lr': 0.0004794702582248953, 'samples': 4075392, 'steps': 21225, 'loss/train': 1.757509708404541} -08/30/2021 17:01:20 - INFO - __main__ - Step 21227: {'lr': 0.0004794681521617035, 'samples': 4075584, 'steps': 21226, 'loss/train': 1.6705842018127441} -08/30/2021 17:01:20 - INFO - __main__ - Step 21228: {'lr': 0.0004794660459951169, 'samples': 4075776, 'steps': 21227, 'loss/train': 1.9040278196334839} -08/30/2021 17:01:20 - INFO - __main__ - Step 21229: {'lr': 0.0004794639397251365, 'samples': 4075968, 'steps': 21228, 'loss/train': 2.0275213718414307} -08/30/2021 17:01:21 - INFO - __main__ - Step 21230: {'lr': 0.00047946183335176307, 'samples': 4076160, 'steps': 21229, 'loss/train': 2.0773203372955322} -08/30/2021 17:01:22 - INFO - __main__ - Step 21231: {'lr': 0.00047945972687499775, 'samples': 4076352, 'steps': 21230, 'loss/train': 1.6731206178665161} -08/30/2021 17:01:23 - INFO - __main__ - Step 21232: {'lr': 0.0004794576202948414, 'samples': 4076544, 'steps': 21231, 'loss/train': 1.5735644102096558} -08/30/2021 17:01:23 - INFO - __main__ - Step 21233: {'lr': 0.000479455513611295, 'samples': 4076736, 'steps': 21232, 'loss/train': 1.4337577819824219} -08/30/2021 17:01:23 - INFO - __main__ - Step 21234: {'lr': 0.00047945340682435943, 'samples': 4076928, 'steps': 21233, 'loss/train': 1.6810390949249268} -08/30/2021 17:01:24 - INFO - __main__ - Step 21235: {'lr': 0.00047945129993403577, 'samples': 4077120, 'steps': 21234, 'loss/train': 1.6172901391983032} -08/30/2021 17:01:26 - INFO - __main__ - Step 21236: {'lr': 0.00047944919294032486, 'samples': 4077312, 'steps': 21235, 'loss/train': 1.9328231811523438} -08/30/2021 17:01:27 - INFO - __main__ - Step 21237: {'lr': 0.00047944708584322763, 'samples': 4077504, 'steps': 21236, 'loss/train': 1.6461139917373657} -08/30/2021 17:01:27 - INFO - __main__ - Step 21238: {'lr': 0.00047944497864274517, 'samples': 4077696, 'steps': 21237, 'loss/train': 1.55856192111969} -08/30/2021 17:01:27 - INFO - __main__ - Step 21239: {'lr': 0.00047944287133887834, 'samples': 4077888, 'steps': 21238, 'loss/train': 2.0300607681274414} -08/30/2021 17:01:28 - INFO - __main__ - Step 21240: {'lr': 0.00047944076393162806, 'samples': 4078080, 'steps': 21239, 'loss/train': 1.751529335975647} -08/30/2021 17:01:28 - INFO - __main__ - Step 21241: {'lr': 0.00047943865642099525, 'samples': 4078272, 'steps': 21240, 'loss/train': 4.960762977600098} -08/30/2021 17:01:30 - INFO - __main__ - Step 21242: {'lr': 0.00047943654880698106, 'samples': 4078464, 'steps': 21241, 'loss/train': 1.579373836517334} -08/30/2021 17:01:30 - INFO - __main__ - Step 21243: {'lr': 0.00047943444108958623, 'samples': 4078656, 'steps': 21242, 'loss/train': 1.9401285648345947} -08/30/2021 17:01:30 - INFO - __main__ - Step 21244: {'lr': 0.00047943233326881176, 'samples': 4078848, 'steps': 21243, 'loss/train': 1.4131957292556763} -08/30/2021 17:01:31 - INFO - __main__ - Step 21245: {'lr': 0.00047943022534465866, 'samples': 4079040, 'steps': 21244, 'loss/train': 1.450485348701477} -08/30/2021 17:01:31 - INFO - __main__ - Step 21246: {'lr': 0.00047942811731712775, 'samples': 4079232, 'steps': 21245, 'loss/train': 2.1429929733276367} -08/30/2021 17:01:33 - INFO - __main__ - Step 21247: {'lr': 0.0004794260091862202, 'samples': 4079424, 'steps': 21246, 'loss/train': 1.7352527379989624} -08/30/2021 17:01:34 - INFO - __main__ - Step 21248: {'lr': 0.0004794239009519368, 'samples': 4079616, 'steps': 21247, 'loss/train': 0.8411003351211548} -08/30/2021 17:01:34 - INFO - __main__ - Step 21249: {'lr': 0.00047942179261427847, 'samples': 4079808, 'steps': 21248, 'loss/train': 1.6848970651626587} -08/30/2021 17:01:34 - INFO - __main__ - Step 21250: {'lr': 0.0004794196841732463, 'samples': 4080000, 'steps': 21249, 'loss/train': 1.6532396078109741} -08/30/2021 17:01:35 - INFO - __main__ - Step 21251: {'lr': 0.0004794175756288411, 'samples': 4080192, 'steps': 21250, 'loss/train': 1.8748997449874878} -08/30/2021 17:01:35 - INFO - __main__ - Step 21252: {'lr': 0.00047941546698106386, 'samples': 4080384, 'steps': 21251, 'loss/train': 1.5357121229171753} -08/30/2021 17:01:36 - INFO - __main__ - Step 21253: {'lr': 0.0004794133582299156, 'samples': 4080576, 'steps': 21252, 'loss/train': 1.219651699066162} -08/30/2021 17:01:37 - INFO - __main__ - Step 21254: {'lr': 0.0004794112493753972, 'samples': 4080768, 'steps': 21253, 'loss/train': 0.07995536178350449} -08/30/2021 17:01:37 - INFO - __main__ - Step 21255: {'lr': 0.0004794091404175097, 'samples': 4080960, 'steps': 21254, 'loss/train': 1.646977424621582} -08/30/2021 17:01:38 - INFO - __main__ - Step 21256: {'lr': 0.00047940703135625386, 'samples': 4081152, 'steps': 21255, 'loss/train': 1.963430643081665} -08/30/2021 17:01:38 - INFO - __main__ - Step 21257: {'lr': 0.0004794049221916308, 'samples': 4081344, 'steps': 21256, 'loss/train': 1.7822097539901733} -08/30/2021 17:01:40 - INFO - __main__ - Step 21258: {'lr': 0.00047940281292364146, 'samples': 4081536, 'steps': 21257, 'loss/train': 1.6705876588821411} -08/30/2021 17:01:40 - INFO - __main__ - Step 21259: {'lr': 0.0004794007035522867, 'samples': 4081728, 'steps': 21258, 'loss/train': 1.3476759195327759} -08/30/2021 17:01:40 - INFO - __main__ - Step 21260: {'lr': 0.0004793985940775676, 'samples': 4081920, 'steps': 21259, 'loss/train': 1.230209469795227} -08/30/2021 17:01:41 - INFO - __main__ - Step 21261: {'lr': 0.0004793964844994849, 'samples': 4082112, 'steps': 21260, 'loss/train': 1.8870868682861328} -08/30/2021 17:01:41 - INFO - __main__ - Step 21262: {'lr': 0.00047939437481803984, 'samples': 4082304, 'steps': 21261, 'loss/train': 1.3441853523254395} -08/30/2021 17:01:43 - INFO - __main__ - Step 21263: {'lr': 0.00047939226503323313, 'samples': 4082496, 'steps': 21262, 'loss/train': 1.5473906993865967} -08/30/2021 17:01:43 - INFO - __main__ - Step 21264: {'lr': 0.0004793901551450658, 'samples': 4082688, 'steps': 21263, 'loss/train': 1.3980252742767334} -08/30/2021 17:01:43 - INFO - __main__ - Step 21265: {'lr': 0.00047938804515353887, 'samples': 4082880, 'steps': 21264, 'loss/train': 1.3707047700881958} -08/30/2021 17:01:44 - INFO - __main__ - Step 21266: {'lr': 0.00047938593505865315, 'samples': 4083072, 'steps': 21265, 'loss/train': 1.526796579360962} -08/30/2021 17:01:44 - INFO - __main__ - Step 21267: {'lr': 0.00047938382486040963, 'samples': 4083264, 'steps': 21266, 'loss/train': 1.7023826837539673} -08/30/2021 17:01:46 - INFO - __main__ - Step 21268: {'lr': 0.0004793817145588094, 'samples': 4083456, 'steps': 21267, 'loss/train': 1.8478944301605225} -08/30/2021 17:01:46 - INFO - __main__ - Step 21269: {'lr': 0.0004793796041538533, 'samples': 4083648, 'steps': 21268, 'loss/train': 1.783738136291504} -08/30/2021 17:01:46 - INFO - __main__ - Step 21270: {'lr': 0.00047937749364554226, 'samples': 4083840, 'steps': 21269, 'loss/train': 1.3065569400787354} -08/30/2021 17:01:47 - INFO - __main__ - Step 21271: {'lr': 0.0004793753830338773, 'samples': 4084032, 'steps': 21270, 'loss/train': 1.9068880081176758} -08/30/2021 17:01:47 - INFO - __main__ - Step 21272: {'lr': 0.00047937327231885925, 'samples': 4084224, 'steps': 21271, 'loss/train': 1.276872992515564} -08/30/2021 17:01:49 - INFO - __main__ - Step 21273: {'lr': 0.0004793711615004892, 'samples': 4084416, 'steps': 21272, 'loss/train': 1.3377857208251953} -08/30/2021 17:01:49 - INFO - __main__ - Step 21274: {'lr': 0.000479369050578768, 'samples': 4084608, 'steps': 21273, 'loss/train': 1.797074317932129} -08/30/2021 17:01:50 - INFO - __main__ - Step 21275: {'lr': 0.0004793669395536967, 'samples': 4084800, 'steps': 21274, 'loss/train': 1.3432343006134033} -08/30/2021 17:01:50 - INFO - __main__ - Step 21276: {'lr': 0.00047936482842527616, 'samples': 4084992, 'steps': 21275, 'loss/train': 0.7991041541099548} -08/30/2021 17:01:50 - INFO - __main__ - Step 21277: {'lr': 0.00047936271719350743, 'samples': 4085184, 'steps': 21276, 'loss/train': 1.4765595197677612} -08/30/2021 17:01:51 - INFO - __main__ - Step 21278: {'lr': 0.0004793606058583913, 'samples': 4085376, 'steps': 21277, 'loss/train': 1.7148023843765259} -08/30/2021 17:01:52 - INFO - __main__ - Step 21279: {'lr': 0.00047935849441992887, 'samples': 4085568, 'steps': 21278, 'loss/train': 1.9708300828933716} -08/30/2021 17:01:53 - INFO - __main__ - Step 21280: {'lr': 0.00047935638287812104, 'samples': 4085760, 'steps': 21279, 'loss/train': 1.4684146642684937} -08/30/2021 17:01:53 - INFO - __main__ - Step 21281: {'lr': 0.00047935427123296884, 'samples': 4085952, 'steps': 21280, 'loss/train': 1.9510747194290161} -08/30/2021 17:01:53 - INFO - __main__ - Step 21282: {'lr': 0.000479352159484473, 'samples': 4086144, 'steps': 21281, 'loss/train': 2.0200250148773193} -08/30/2021 17:01:54 - INFO - __main__ - Step 21283: {'lr': 0.0004793500476326347, 'samples': 4086336, 'steps': 21282, 'loss/train': 1.6954630613327026} -08/30/2021 17:01:56 - INFO - __main__ - Step 21284: {'lr': 0.0004793479356774548, 'samples': 4086528, 'steps': 21283, 'loss/train': 1.9972984790802002} -08/30/2021 17:01:56 - INFO - __main__ - Step 21285: {'lr': 0.00047934582361893423, 'samples': 4086720, 'steps': 21284, 'loss/train': 0.32936790585517883} -08/30/2021 17:01:56 - INFO - __main__ - Step 21286: {'lr': 0.000479343711457074, 'samples': 4086912, 'steps': 21285, 'loss/train': 1.0872018337249756} -08/30/2021 17:01:57 - INFO - __main__ - Step 21287: {'lr': 0.00047934159919187504, 'samples': 4087104, 'steps': 21286, 'loss/train': 2.5703048706054688} -08/30/2021 17:01:57 - INFO - __main__ - Step 21288: {'lr': 0.0004793394868233383, 'samples': 4087296, 'steps': 21287, 'loss/train': 2.1616835594177246} -08/30/2021 17:01:59 - INFO - __main__ - Step 21289: {'lr': 0.0004793373743514647, 'samples': 4087488, 'steps': 21288, 'loss/train': 1.4142788648605347} -08/30/2021 17:01:59 - INFO - __main__ - Step 21290: {'lr': 0.0004793352617762552, 'samples': 4087680, 'steps': 21289, 'loss/train': 1.209137201309204} -08/30/2021 17:02:00 - INFO - __main__ - Step 21291: {'lr': 0.0004793331490977108, 'samples': 4087872, 'steps': 21290, 'loss/train': 1.85906982421875} -08/30/2021 17:02:00 - INFO - __main__ - Step 21292: {'lr': 0.0004793310363158324, 'samples': 4088064, 'steps': 21291, 'loss/train': 1.5463615655899048} -08/30/2021 17:02:00 - INFO - __main__ - Step 21293: {'lr': 0.00047932892343062103, 'samples': 4088256, 'steps': 21292, 'loss/train': 1.8606971502304077} -08/30/2021 17:02:01 - INFO - __main__ - Step 21294: {'lr': 0.00047932681044207757, 'samples': 4088448, 'steps': 21293, 'loss/train': 1.606949806213379} -08/30/2021 17:02:03 - INFO - __main__ - Step 21295: {'lr': 0.0004793246973502029, 'samples': 4088640, 'steps': 21294, 'loss/train': 1.5698412656784058} -08/30/2021 17:02:03 - INFO - __main__ - Step 21296: {'lr': 0.0004793225841549982, 'samples': 4088832, 'steps': 21295, 'loss/train': 1.4163990020751953} -08/30/2021 17:02:04 - INFO - __main__ - Step 21297: {'lr': 0.00047932047085646416, 'samples': 4089024, 'steps': 21296, 'loss/train': 1.8476744890213013} -08/30/2021 17:02:04 - INFO - __main__ - Step 21298: {'lr': 0.0004793183574546019, 'samples': 4089216, 'steps': 21297, 'loss/train': 1.4494456052780151} -08/30/2021 17:02:04 - INFO - __main__ - Step 21299: {'lr': 0.0004793162439494123, 'samples': 4089408, 'steps': 21298, 'loss/train': 2.0465006828308105} -08/30/2021 17:02:06 - INFO - __main__ - Step 21300: {'lr': 0.00047931413034089644, 'samples': 4089600, 'steps': 21299, 'loss/train': 1.387484073638916} -08/30/2021 17:02:06 - INFO - __main__ - Step 21301: {'lr': 0.00047931201662905503, 'samples': 4089792, 'steps': 21300, 'loss/train': 1.4023079872131348} -08/30/2021 17:02:07 - INFO - __main__ - Step 21302: {'lr': 0.00047930990281388927, 'samples': 4089984, 'steps': 21301, 'loss/train': 0.8452826738357544} -08/30/2021 17:02:07 - INFO - __main__ - Step 21303: {'lr': 0.00047930778889539996, 'samples': 4090176, 'steps': 21302, 'loss/train': 1.6854580640792847} -08/30/2021 17:02:07 - INFO - __main__ - Step 21304: {'lr': 0.00047930567487358813, 'samples': 4090368, 'steps': 21303, 'loss/train': 1.1011916399002075} -08/30/2021 17:02:09 - INFO - __main__ - Step 21305: {'lr': 0.00047930356074845466, 'samples': 4090560, 'steps': 21304, 'loss/train': 1.9323705434799194} -08/30/2021 17:02:09 - INFO - __main__ - Step 21306: {'lr': 0.0004793014465200005, 'samples': 4090752, 'steps': 21305, 'loss/train': 2.0195205211639404} -08/30/2021 17:02:10 - INFO - __main__ - Step 21307: {'lr': 0.0004792993321882267, 'samples': 4090944, 'steps': 21306, 'loss/train': 1.7164374589920044} -08/30/2021 17:02:10 - INFO - __main__ - Step 21308: {'lr': 0.0004792972177531342, 'samples': 4091136, 'steps': 21307, 'loss/train': 1.4937433004379272} -08/30/2021 17:02:10 - INFO - __main__ - Step 21309: {'lr': 0.0004792951032147239, 'samples': 4091328, 'steps': 21308, 'loss/train': 2.822166681289673} -08/30/2021 17:02:12 - INFO - __main__ - Step 21310: {'lr': 0.00047929298857299677, 'samples': 4091520, 'steps': 21309, 'loss/train': 1.6812840700149536} -08/30/2021 17:02:13 - INFO - __main__ - Step 21311: {'lr': 0.00047929087382795374, 'samples': 4091712, 'steps': 21310, 'loss/train': 1.897234559059143} -08/30/2021 17:02:13 - INFO - __main__ - Step 21312: {'lr': 0.0004792887589795957, 'samples': 4091904, 'steps': 21311, 'loss/train': 1.7426352500915527} -08/30/2021 17:02:13 - INFO - __main__ - Step 21313: {'lr': 0.00047928664402792376, 'samples': 4092096, 'steps': 21312, 'loss/train': 0.15013180673122406} -08/30/2021 17:02:14 - INFO - __main__ - Step 21314: {'lr': 0.0004792845289729388, 'samples': 4092288, 'steps': 21313, 'loss/train': 1.1719199419021606} -08/30/2021 17:02:14 - INFO - __main__ - Step 21315: {'lr': 0.00047928241381464177, 'samples': 4092480, 'steps': 21314, 'loss/train': 1.3982666730880737} -08/30/2021 17:02:16 - INFO - __main__ - Step 21316: {'lr': 0.0004792802985530337, 'samples': 4092672, 'steps': 21315, 'loss/train': 1.6239895820617676} -08/30/2021 17:02:16 - INFO - __main__ - Step 21317: {'lr': 0.0004792781831881153, 'samples': 4092864, 'steps': 21316, 'loss/train': 1.5348361730575562} -08/30/2021 17:02:16 - INFO - __main__ - Step 21318: {'lr': 0.0004792760677198878, 'samples': 4093056, 'steps': 21317, 'loss/train': 1.8626474142074585} -08/30/2021 17:02:17 - INFO - __main__ - Step 21319: {'lr': 0.00047927395214835203, 'samples': 4093248, 'steps': 21318, 'loss/train': 0.3177369236946106} -08/30/2021 17:02:17 - INFO - __main__ - Step 21320: {'lr': 0.0004792718364735089, 'samples': 4093440, 'steps': 21319, 'loss/train': 1.8100190162658691} -08/30/2021 17:02:19 - INFO - __main__ - Step 21321: {'lr': 0.00047926972069535945, 'samples': 4093632, 'steps': 21320, 'loss/train': 1.7661763429641724} -08/30/2021 17:02:19 - INFO - __main__ - Step 21322: {'lr': 0.00047926760481390465, 'samples': 4093824, 'steps': 21321, 'loss/train': 1.6134295463562012} -08/30/2021 17:02:19 - INFO - __main__ - Step 21323: {'lr': 0.00047926548882914533, 'samples': 4094016, 'steps': 21322, 'loss/train': 1.5928452014923096} -08/30/2021 17:02:20 - INFO - __main__ - Step 21324: {'lr': 0.0004792633727410826, 'samples': 4094208, 'steps': 21323, 'loss/train': 2.4081175327301025} -08/30/2021 17:02:20 - INFO - __main__ - Step 21325: {'lr': 0.0004792612565497172, 'samples': 4094400, 'steps': 21324, 'loss/train': 1.9535518884658813} -08/30/2021 17:02:22 - INFO - __main__ - Step 21326: {'lr': 0.00047925914025505036, 'samples': 4094592, 'steps': 21325, 'loss/train': 1.9374675750732422} -08/30/2021 17:02:22 - INFO - __main__ - Step 21327: {'lr': 0.0004792570238570828, 'samples': 4094784, 'steps': 21326, 'loss/train': 1.8380175828933716} -08/30/2021 17:02:22 - INFO - __main__ - Step 21328: {'lr': 0.00047925490735581557, 'samples': 4094976, 'steps': 21327, 'loss/train': 1.7587676048278809} -08/30/2021 17:02:23 - INFO - __main__ - Step 21329: {'lr': 0.00047925279075124963, 'samples': 4095168, 'steps': 21328, 'loss/train': 1.9400763511657715} -08/30/2021 17:02:23 - INFO - __main__ - Step 21330: {'lr': 0.00047925067404338596, 'samples': 4095360, 'steps': 21329, 'loss/train': 1.9073177576065063} -08/30/2021 17:02:25 - INFO - __main__ - Step 21331: {'lr': 0.00047924855723222536, 'samples': 4095552, 'steps': 21330, 'loss/train': 2.1923956871032715} -08/30/2021 17:02:25 - INFO - __main__ - Step 21332: {'lr': 0.000479246440317769, 'samples': 4095744, 'steps': 21331, 'loss/train': 1.843536138534546} -08/30/2021 17:02:26 - INFO - __main__ - Step 21333: {'lr': 0.00047924432330001776, 'samples': 4095936, 'steps': 21332, 'loss/train': 0.8867649435997009} -08/30/2021 17:02:26 - INFO - __main__ - Step 21334: {'lr': 0.0004792422061789725, 'samples': 4096128, 'steps': 21333, 'loss/train': 1.6919630765914917} -08/30/2021 17:02:26 - INFO - __main__ - Step 21335: {'lr': 0.0004792400889546342, 'samples': 4096320, 'steps': 21334, 'loss/train': 1.719007134437561} -08/30/2021 17:02:27 - INFO - __main__ - Step 21336: {'lr': 0.00047923797162700393, 'samples': 4096512, 'steps': 21335, 'loss/train': 1.297482967376709} -08/30/2021 17:02:28 - INFO - __main__ - Step 21337: {'lr': 0.0004792358541960826, 'samples': 4096704, 'steps': 21336, 'loss/train': 1.2600412368774414} -08/30/2021 17:02:29 - INFO - __main__ - Step 21338: {'lr': 0.000479233736661871, 'samples': 4096896, 'steps': 21337, 'loss/train': 6.028919696807861} -08/30/2021 17:02:29 - INFO - __main__ - Step 21339: {'lr': 0.0004792316190243703, 'samples': 4097088, 'steps': 21338, 'loss/train': 1.9485559463500977} -08/30/2021 17:02:29 - INFO - __main__ - Step 21340: {'lr': 0.0004792295012835814, 'samples': 4097280, 'steps': 21339, 'loss/train': 1.1493204832077026} -08/30/2021 17:02:30 - INFO - __main__ - Step 21341: {'lr': 0.0004792273834395052, 'samples': 4097472, 'steps': 21340, 'loss/train': 1.0050369501113892} -08/30/2021 17:02:31 - INFO - __main__ - Step 21342: {'lr': 0.0004792252654921426, 'samples': 4097664, 'steps': 21341, 'loss/train': 0.5513942837715149} -08/30/2021 17:02:32 - INFO - __main__ - Step 21343: {'lr': 0.00047922314744149475, 'samples': 4097856, 'steps': 21342, 'loss/train': 0.792652428150177} -08/30/2021 17:02:32 - INFO - __main__ - Step 21344: {'lr': 0.0004792210292875624, 'samples': 4098048, 'steps': 21343, 'loss/train': 1.4035366773605347} -08/30/2021 17:02:32 - INFO - __main__ - Step 21345: {'lr': 0.00047921891103034665, 'samples': 4098240, 'steps': 21344, 'loss/train': 1.606066346168518} -08/30/2021 17:02:33 - INFO - __main__ - Step 21346: {'lr': 0.0004792167926698483, 'samples': 4098432, 'steps': 21345, 'loss/train': 1.0577651262283325} -08/30/2021 17:02:33 - INFO - __main__ - Step 21347: {'lr': 0.0004792146742060685, 'samples': 4098624, 'steps': 21346, 'loss/train': 1.8724123239517212} -08/30/2021 17:02:35 - INFO - __main__ - Step 21348: {'lr': 0.00047921255563900813, 'samples': 4098816, 'steps': 21347, 'loss/train': 0.8765449523925781} -08/30/2021 17:02:36 - INFO - __main__ - Step 21349: {'lr': 0.000479210436968668, 'samples': 4099008, 'steps': 21348, 'loss/train': 2.4227795600891113} -08/30/2021 17:02:36 - INFO - __main__ - Step 21350: {'lr': 0.0004792083181950493, 'samples': 4099200, 'steps': 21349, 'loss/train': 1.9457899332046509} -08/30/2021 17:02:37 - INFO - __main__ - Step 21351: {'lr': 0.0004792061993181528, 'samples': 4099392, 'steps': 21350, 'loss/train': 1.9755337238311768} -08/30/2021 17:02:37 - INFO - __main__ - Step 21352: {'lr': 0.00047920408033797954, 'samples': 4099584, 'steps': 21351, 'loss/train': 1.3816801309585571} -08/30/2021 17:02:37 - INFO - __main__ - Step 21353: {'lr': 0.0004792019612545304, 'samples': 4099776, 'steps': 21352, 'loss/train': 1.5029605627059937} -08/30/2021 17:02:39 - INFO - __main__ - Step 21354: {'lr': 0.00047919984206780647, 'samples': 4099968, 'steps': 21353, 'loss/train': 1.8080503940582275} -08/30/2021 17:02:39 - INFO - __main__ - Step 21355: {'lr': 0.0004791977227778086, 'samples': 4100160, 'steps': 21354, 'loss/train': 1.749057650566101} -08/30/2021 17:02:40 - INFO - __main__ - Step 21356: {'lr': 0.00047919560338453783, 'samples': 4100352, 'steps': 21355, 'loss/train': 1.466055989265442} -08/30/2021 17:02:40 - INFO - __main__ - Step 21357: {'lr': 0.000479193483887995, 'samples': 4100544, 'steps': 21356, 'loss/train': 1.9566959142684937} -08/30/2021 17:02:40 - INFO - __main__ - Step 21358: {'lr': 0.0004791913642881811, 'samples': 4100736, 'steps': 21357, 'loss/train': 1.5667201280593872} -08/30/2021 17:02:42 - INFO - __main__ - Step 21359: {'lr': 0.00047918924458509717, 'samples': 4100928, 'steps': 21358, 'loss/train': 1.3140431642532349} -08/30/2021 17:02:42 - INFO - __main__ - Step 21360: {'lr': 0.00047918712477874404, 'samples': 4101120, 'steps': 21359, 'loss/train': 1.1423887014389038} -08/30/2021 17:02:43 - INFO - __main__ - Step 21361: {'lr': 0.00047918500486912276, 'samples': 4101312, 'steps': 21360, 'loss/train': 1.8200029134750366} -08/30/2021 17:02:43 - INFO - __main__ - Step 21362: {'lr': 0.00047918288485623427, 'samples': 4101504, 'steps': 21361, 'loss/train': 1.862265706062317} -08/30/2021 17:02:43 - INFO - __main__ - Step 21363: {'lr': 0.0004791807647400795, 'samples': 4101696, 'steps': 21362, 'loss/train': 1.2375341653823853} -08/30/2021 17:02:44 - INFO - __main__ - Step 21364: {'lr': 0.0004791786445206594, 'samples': 4101888, 'steps': 21363, 'loss/train': 1.9139901399612427} -08/30/2021 17:02:46 - INFO - __main__ - Step 21365: {'lr': 0.00047917652419797495, 'samples': 4102080, 'steps': 21364, 'loss/train': 1.5732009410858154} -08/30/2021 17:02:46 - INFO - __main__ - Step 21366: {'lr': 0.0004791744037720271, 'samples': 4102272, 'steps': 21365, 'loss/train': 1.735299825668335} -08/30/2021 17:02:47 - INFO - __main__ - Step 21367: {'lr': 0.00047917228324281683, 'samples': 4102464, 'steps': 21366, 'loss/train': 0.15128643810749054} -08/30/2021 17:02:47 - INFO - __main__ - Step 21368: {'lr': 0.00047917016261034496, 'samples': 4102656, 'steps': 21367, 'loss/train': 2.277677297592163} -08/30/2021 17:02:47 - INFO - __main__ - Step 21369: {'lr': 0.0004791680418746126, 'samples': 4102848, 'steps': 21368, 'loss/train': 1.6648612022399902} -08/30/2021 17:02:49 - INFO - __main__ - Step 21370: {'lr': 0.00047916592103562075, 'samples': 4103040, 'steps': 21369, 'loss/train': 1.4361931085586548} -08/30/2021 17:02:49 - INFO - __main__ - Step 21371: {'lr': 0.00047916380009337014, 'samples': 4103232, 'steps': 21370, 'loss/train': 1.1085540056228638} -08/30/2021 17:02:50 - INFO - __main__ - Step 21372: {'lr': 0.0004791616790478619, 'samples': 4103424, 'steps': 21371, 'loss/train': 1.6016608476638794} -08/30/2021 17:02:50 - INFO - __main__ - Step 21373: {'lr': 0.000479159557899097, 'samples': 4103616, 'steps': 21372, 'loss/train': 1.678863525390625} -08/30/2021 17:02:50 - INFO - __main__ - Step 21374: {'lr': 0.00047915743664707626, 'samples': 4103808, 'steps': 21373, 'loss/train': 1.0617471933364868} -08/30/2021 17:02:52 - INFO - __main__ - Step 21375: {'lr': 0.0004791553152918008, 'samples': 4104000, 'steps': 21374, 'loss/train': 1.9959217309951782} -08/30/2021 17:02:52 - INFO - __main__ - Step 21376: {'lr': 0.0004791531938332714, 'samples': 4104192, 'steps': 21375, 'loss/train': 1.020253300666809} -08/30/2021 17:02:53 - INFO - __main__ - Step 21377: {'lr': 0.0004791510722714891, 'samples': 4104384, 'steps': 21376, 'loss/train': 1.9851142168045044} -08/30/2021 17:02:53 - INFO - __main__ - Step 21378: {'lr': 0.000479148950606455, 'samples': 4104576, 'steps': 21377, 'loss/train': 1.816135287284851} -08/30/2021 17:02:53 - INFO - __main__ - Step 21379: {'lr': 0.00047914682883816977, 'samples': 4104768, 'steps': 21378, 'loss/train': 1.3393754959106445} -08/30/2021 17:02:54 - INFO - __main__ - Step 21380: {'lr': 0.00047914470696663457, 'samples': 4104960, 'steps': 21379, 'loss/train': 1.6631602048873901} -08/30/2021 17:02:55 - INFO - __main__ - Step 21381: {'lr': 0.00047914258499185037, 'samples': 4105152, 'steps': 21380, 'loss/train': 2.0020618438720703} -08/30/2021 17:02:56 - INFO - __main__ - Step 21382: {'lr': 0.000479140462913818, 'samples': 4105344, 'steps': 21381, 'loss/train': 1.894571304321289} -08/30/2021 17:02:56 - INFO - __main__ - Step 21383: {'lr': 0.0004791383407325384, 'samples': 4105536, 'steps': 21382, 'loss/train': 1.5259020328521729} -08/30/2021 17:02:56 - INFO - __main__ - Step 21384: {'lr': 0.0004791362184480127, 'samples': 4105728, 'steps': 21383, 'loss/train': 1.774632215499878} -08/30/2021 17:02:57 - INFO - __main__ - Step 21385: {'lr': 0.0004791340960602417, 'samples': 4105920, 'steps': 21384, 'loss/train': 1.8958078622817993} -08/30/2021 17:02:58 - INFO - __main__ - Step 21386: {'lr': 0.0004791319735692264, 'samples': 4106112, 'steps': 21385, 'loss/train': 1.8974725008010864} -08/30/2021 17:02:59 - INFO - __main__ - Step 21387: {'lr': 0.00047912985097496786, 'samples': 4106304, 'steps': 21386, 'loss/train': 1.1539653539657593} -08/30/2021 17:02:59 - INFO - __main__ - Step 21388: {'lr': 0.00047912772827746685, 'samples': 4106496, 'steps': 21387, 'loss/train': 1.3914194107055664} -08/30/2021 17:02:59 - INFO - __main__ - Step 21389: {'lr': 0.00047912560547672453, 'samples': 4106688, 'steps': 21388, 'loss/train': 0.16680869460105896} -08/30/2021 17:03:00 - INFO - __main__ - Step 21390: {'lr': 0.0004791234825727416, 'samples': 4106880, 'steps': 21389, 'loss/train': 1.2506459951400757} -08/30/2021 17:03:02 - INFO - __main__ - Step 21391: {'lr': 0.0004791213595655193, 'samples': 4107072, 'steps': 21390, 'loss/train': 1.9134588241577148} -08/30/2021 17:03:02 - INFO - __main__ - Step 21392: {'lr': 0.0004791192364550584, 'samples': 4107264, 'steps': 21391, 'loss/train': 1.4890049695968628} -08/30/2021 17:03:03 - INFO - __main__ - Step 21393: {'lr': 0.00047911711324135985, 'samples': 4107456, 'steps': 21392, 'loss/train': 1.4686373472213745} -08/30/2021 17:03:03 - INFO - __main__ - Step 21394: {'lr': 0.00047911498992442476, 'samples': 4107648, 'steps': 21393, 'loss/train': 1.9358030557632446} -08/30/2021 17:03:03 - INFO - __main__ - Step 21395: {'lr': 0.0004791128665042539, 'samples': 4107840, 'steps': 21394, 'loss/train': 1.6533355712890625} -08/30/2021 17:03:04 - INFO - __main__ - Step 21396: {'lr': 0.0004791107429808484, 'samples': 4108032, 'steps': 21395, 'loss/train': 1.1145198345184326} -08/30/2021 17:03:05 - INFO - __main__ - Step 21397: {'lr': 0.00047910861935420915, 'samples': 4108224, 'steps': 21396, 'loss/train': 3.0373291969299316} -08/30/2021 17:03:06 - INFO - __main__ - Step 21398: {'lr': 0.00047910649562433696, 'samples': 4108416, 'steps': 21397, 'loss/train': 1.8464752435684204} -08/30/2021 17:03:06 - INFO - __main__ - Step 21399: {'lr': 0.000479104371791233, 'samples': 4108608, 'steps': 21398, 'loss/train': 1.7620136737823486} -08/30/2021 17:03:06 - INFO - __main__ - Step 21400: {'lr': 0.0004791022478548982, 'samples': 4108800, 'steps': 21399, 'loss/train': 1.8300144672393799} -08/30/2021 17:03:07 - INFO - __main__ - Step 21401: {'lr': 0.0004791001238153334, 'samples': 4108992, 'steps': 21400, 'loss/train': 1.0013267993927002} -08/30/2021 17:03:09 - INFO - __main__ - Step 21402: {'lr': 0.00047909799967253957, 'samples': 4109184, 'steps': 21401, 'loss/train': 1.5706853866577148} -08/30/2021 17:03:09 - INFO - __main__ - Step 21403: {'lr': 0.00047909587542651776, 'samples': 4109376, 'steps': 21402, 'loss/train': 1.5404706001281738} -08/30/2021 17:03:10 - INFO - __main__ - Step 21404: {'lr': 0.00047909375107726894, 'samples': 4109568, 'steps': 21403, 'loss/train': 1.8566616773605347} -08/30/2021 17:03:10 - INFO - __main__ - Step 21405: {'lr': 0.000479091626624794, 'samples': 4109760, 'steps': 21404, 'loss/train': 5.978694915771484} -08/30/2021 17:03:10 - INFO - __main__ - Step 21406: {'lr': 0.00047908950206909385, 'samples': 4109952, 'steps': 21405, 'loss/train': 1.2774567604064941} -08/30/2021 17:03:11 - INFO - __main__ - Step 21407: {'lr': 0.0004790873774101695, 'samples': 4110144, 'steps': 21406, 'loss/train': 1.7675304412841797} -08/30/2021 17:03:12 - INFO - __main__ - Step 21408: {'lr': 0.00047908525264802194, 'samples': 4110336, 'steps': 21407, 'loss/train': 1.8614758253097534} -08/30/2021 17:03:13 - INFO - __main__ - Step 21409: {'lr': 0.00047908312778265213, 'samples': 4110528, 'steps': 21408, 'loss/train': 2.530635356903076} -08/30/2021 17:03:13 - INFO - __main__ - Step 21410: {'lr': 0.00047908100281406096, 'samples': 4110720, 'steps': 21409, 'loss/train': 0.6041358113288879} -08/30/2021 17:03:14 - INFO - __main__ - Step 21411: {'lr': 0.00047907887774224946, 'samples': 4110912, 'steps': 21410, 'loss/train': 1.3304941654205322} -08/30/2021 17:03:14 - INFO - __main__ - Step 21412: {'lr': 0.0004790767525672185, 'samples': 4111104, 'steps': 21411, 'loss/train': 1.4318076372146606} -08/30/2021 17:03:15 - INFO - __main__ - Step 21413: {'lr': 0.0004790746272889691, 'samples': 4111296, 'steps': 21412, 'loss/train': 1.6282638311386108} -08/30/2021 17:03:16 - INFO - __main__ - Step 21414: {'lr': 0.00047907250190750225, 'samples': 4111488, 'steps': 21413, 'loss/train': 1.9806156158447266} -08/30/2021 17:03:16 - INFO - __main__ - Step 21415: {'lr': 0.0004790703764228188, 'samples': 4111680, 'steps': 21414, 'loss/train': 1.3572484254837036} -08/30/2021 17:03:17 - INFO - __main__ - Step 21416: {'lr': 0.0004790682508349198, 'samples': 4111872, 'steps': 21415, 'loss/train': 1.2222541570663452} -08/30/2021 17:03:17 - INFO - __main__ - Step 21417: {'lr': 0.00047906612514380623, 'samples': 4112064, 'steps': 21416, 'loss/train': 1.5520838499069214} -08/30/2021 17:03:19 - INFO - __main__ - Step 21418: {'lr': 0.000479063999349479, 'samples': 4112256, 'steps': 21417, 'loss/train': 1.7586411237716675} -08/30/2021 17:03:20 - INFO - __main__ - Step 21419: {'lr': 0.00047906187345193895, 'samples': 4112448, 'steps': 21418, 'loss/train': 1.270230770111084} -08/30/2021 17:03:20 - INFO - __main__ - Step 21420: {'lr': 0.0004790597474511873, 'samples': 4112640, 'steps': 21419, 'loss/train': 1.4617196321487427} -08/30/2021 17:03:20 - INFO - __main__ - Step 21421: {'lr': 0.0004790576213472248, 'samples': 4112832, 'steps': 21420, 'loss/train': 1.1790966987609863} -08/30/2021 17:03:21 - INFO - __main__ - Step 21422: {'lr': 0.0004790554951400524, 'samples': 4113024, 'steps': 21421, 'loss/train': 1.1328461170196533} -08/30/2021 17:03:21 - INFO - __main__ - Step 21423: {'lr': 0.0004790533688296712, 'samples': 4113216, 'steps': 21422, 'loss/train': 1.5887815952301025} -08/30/2021 17:03:22 - INFO - __main__ - Step 21424: {'lr': 0.0004790512424160821, 'samples': 4113408, 'steps': 21423, 'loss/train': 1.9631133079528809} -08/30/2021 17:03:23 - INFO - __main__ - Step 21425: {'lr': 0.00047904911589928605, 'samples': 4113600, 'steps': 21424, 'loss/train': 1.9130054712295532} -08/30/2021 17:03:23 - INFO - __main__ - Step 21426: {'lr': 0.00047904698927928404, 'samples': 4113792, 'steps': 21425, 'loss/train': 1.599796175956726} -08/30/2021 17:03:23 - INFO - __main__ - Step 21427: {'lr': 0.0004790448625560769, 'samples': 4113984, 'steps': 21426, 'loss/train': 1.6329631805419922} -08/30/2021 17:03:24 - INFO - __main__ - Step 21428: {'lr': 0.0004790427357296657, 'samples': 4114176, 'steps': 21427, 'loss/train': 1.3552738428115845} -08/30/2021 17:03:26 - INFO - __main__ - Step 21429: {'lr': 0.0004790406088000514, 'samples': 4114368, 'steps': 21428, 'loss/train': 1.5520470142364502} -08/30/2021 17:03:26 - INFO - __main__ - Step 21430: {'lr': 0.00047903848176723493, 'samples': 4114560, 'steps': 21429, 'loss/train': 1.6015326976776123} -08/30/2021 17:03:27 - INFO - __main__ - Step 21431: {'lr': 0.0004790363546312172, 'samples': 4114752, 'steps': 21430, 'loss/train': 1.2645312547683716} -08/30/2021 17:03:27 - INFO - __main__ - Step 21432: {'lr': 0.0004790342273919993, 'samples': 4114944, 'steps': 21431, 'loss/train': 1.4015811681747437} -08/30/2021 17:03:27 - INFO - __main__ - Step 21433: {'lr': 0.00047903210004958207, 'samples': 4115136, 'steps': 21432, 'loss/train': 2.077160120010376} -08/30/2021 17:03:28 - INFO - __main__ - Step 21434: {'lr': 0.0004790299726039665, 'samples': 4115328, 'steps': 21433, 'loss/train': 1.6486338376998901} -08/30/2021 17:03:29 - INFO - __main__ - Step 21435: {'lr': 0.0004790278450551536, 'samples': 4115520, 'steps': 21434, 'loss/train': 0.08832631260156631} -08/30/2021 17:03:30 - INFO - __main__ - Step 21436: {'lr': 0.00047902571740314427, 'samples': 4115712, 'steps': 21435, 'loss/train': 2.3777639865875244} -08/30/2021 17:03:30 - INFO - __main__ - Step 21437: {'lr': 0.00047902358964793944, 'samples': 4115904, 'steps': 21436, 'loss/train': 1.1027485132217407} -08/30/2021 17:03:30 - INFO - __main__ - Step 21438: {'lr': 0.0004790214617895402, 'samples': 4116096, 'steps': 21437, 'loss/train': 2.061546564102173} -08/30/2021 17:03:31 - INFO - __main__ - Step 21439: {'lr': 0.0004790193338279474, 'samples': 4116288, 'steps': 21438, 'loss/train': 1.7133933305740356} -08/30/2021 17:03:32 - INFO - __main__ - Step 21440: {'lr': 0.000479017205763162, 'samples': 4116480, 'steps': 21439, 'loss/train': 1.7539247274398804} -08/30/2021 17:03:33 - INFO - __main__ - Step 21441: {'lr': 0.000479015077595185, 'samples': 4116672, 'steps': 21440, 'loss/train': 1.705939769744873} -08/30/2021 17:03:33 - INFO - __main__ - Step 21442: {'lr': 0.0004790129493240173, 'samples': 4116864, 'steps': 21441, 'loss/train': 1.0331511497497559} -08/30/2021 17:03:33 - INFO - __main__ - Step 21443: {'lr': 0.0004790108209496599, 'samples': 4117056, 'steps': 21442, 'loss/train': 4.733749866485596} -08/30/2021 17:03:34 - INFO - __main__ - Step 21444: {'lr': 0.00047900869247211384, 'samples': 4117248, 'steps': 21443, 'loss/train': 1.3099116086959839} -08/30/2021 17:03:36 - INFO - __main__ - Step 21445: {'lr': 0.0004790065638913799, 'samples': 4117440, 'steps': 21444, 'loss/train': 0.6812911033630371} -08/30/2021 17:03:36 - INFO - __main__ - Step 21446: {'lr': 0.00047900443520745915, 'samples': 4117632, 'steps': 21445, 'loss/train': 1.9747036695480347} -08/30/2021 17:03:36 - INFO - __main__ - Step 21447: {'lr': 0.0004790023064203526, 'samples': 4117824, 'steps': 21446, 'loss/train': 1.5440456867218018} -08/30/2021 17:03:37 - INFO - __main__ - Step 21448: {'lr': 0.00047900017753006106, 'samples': 4118016, 'steps': 21447, 'loss/train': 1.5677807331085205} -08/30/2021 17:03:37 - INFO - __main__ - Step 21449: {'lr': 0.0004789980485365857, 'samples': 4118208, 'steps': 21448, 'loss/train': 1.4878294467926025} -08/30/2021 17:03:38 - INFO - __main__ - Step 21450: {'lr': 0.00047899591943992726, 'samples': 4118400, 'steps': 21449, 'loss/train': 1.6379958391189575} -08/30/2021 17:03:39 - INFO - __main__ - Step 21451: {'lr': 0.0004789937902400868, 'samples': 4118592, 'steps': 21450, 'loss/train': 0.2603890299797058} -08/30/2021 17:03:39 - INFO - __main__ - Step 21452: {'lr': 0.00047899166093706523, 'samples': 4118784, 'steps': 21451, 'loss/train': 1.7019600868225098} -08/30/2021 17:03:40 - INFO - __main__ - Step 21453: {'lr': 0.0004789895315308636, 'samples': 4118976, 'steps': 21452, 'loss/train': 1.7137532234191895} -08/30/2021 17:03:40 - INFO - __main__ - Step 21454: {'lr': 0.00047898740202148284, 'samples': 4119168, 'steps': 21453, 'loss/train': 1.0620163679122925} -08/30/2021 17:03:41 - INFO - __main__ - Step 21455: {'lr': 0.0004789852724089239, 'samples': 4119360, 'steps': 21454, 'loss/train': 1.5766828060150146} -08/30/2021 17:03:42 - INFO - __main__ - Step 21456: {'lr': 0.00047898314269318766, 'samples': 4119552, 'steps': 21455, 'loss/train': 1.6099308729171753} -08/30/2021 17:03:43 - INFO - __main__ - Step 21457: {'lr': 0.00047898101287427523, 'samples': 4119744, 'steps': 21456, 'loss/train': 1.6593270301818848} -08/30/2021 17:03:43 - INFO - __main__ - Step 21458: {'lr': 0.0004789788829521874, 'samples': 4119936, 'steps': 21457, 'loss/train': 1.2930656671524048} -08/30/2021 17:03:44 - INFO - __main__ - Step 21459: {'lr': 0.0004789767529269253, 'samples': 4120128, 'steps': 21458, 'loss/train': 1.334293246269226} -08/30/2021 17:03:44 - INFO - __main__ - Step 21460: {'lr': 0.0004789746227984897, 'samples': 4120320, 'steps': 21459, 'loss/train': 1.5533400774002075} -08/30/2021 17:03:46 - INFO - __main__ - Step 21461: {'lr': 0.0004789724925668818, 'samples': 4120512, 'steps': 21460, 'loss/train': 1.022534728050232} -08/30/2021 17:03:46 - INFO - __main__ - Step 21462: {'lr': 0.00047897036223210234, 'samples': 4120704, 'steps': 21461, 'loss/train': 1.3876748085021973} -08/30/2021 17:03:46 - INFO - __main__ - Step 21463: {'lr': 0.00047896823179415237, 'samples': 4120896, 'steps': 21462, 'loss/train': 1.795861005783081} -08/30/2021 17:03:47 - INFO - __main__ - Step 21464: {'lr': 0.0004789661012530329, 'samples': 4121088, 'steps': 21463, 'loss/train': 1.9045308828353882} -08/30/2021 17:03:47 - INFO - __main__ - Step 21465: {'lr': 0.00047896397060874485, 'samples': 4121280, 'steps': 21464, 'loss/train': 1.2129464149475098} -08/30/2021 17:03:47 - INFO - __main__ - Step 21466: {'lr': 0.0004789618398612891, 'samples': 4121472, 'steps': 21465, 'loss/train': 1.1078848838806152} -08/30/2021 17:03:49 - INFO - __main__ - Step 21467: {'lr': 0.0004789597090106667, 'samples': 4121664, 'steps': 21466, 'loss/train': 1.749743103981018} -08/30/2021 17:03:50 - INFO - __main__ - Step 21468: {'lr': 0.00047895757805687864, 'samples': 4121856, 'steps': 21467, 'loss/train': 2.036487102508545} -08/30/2021 17:03:50 - INFO - __main__ - Step 21469: {'lr': 0.0004789554469999258, 'samples': 4122048, 'steps': 21468, 'loss/train': 1.7220492362976074} -08/30/2021 17:03:50 - INFO - __main__ - Step 21470: {'lr': 0.0004789533158398091, 'samples': 4122240, 'steps': 21469, 'loss/train': 1.6133811473846436} -08/30/2021 17:03:51 - INFO - __main__ - Step 21471: {'lr': 0.00047895118457652965, 'samples': 4122432, 'steps': 21470, 'loss/train': 1.4600428342819214} -08/30/2021 17:03:51 - INFO - __main__ - Step 21472: {'lr': 0.0004789490532100883, 'samples': 4122624, 'steps': 21471, 'loss/train': 0.05137605592608452} -08/30/2021 17:03:53 - INFO - __main__ - Step 21473: {'lr': 0.000478946921740486, 'samples': 4122816, 'steps': 21472, 'loss/train': 1.4794323444366455} -08/30/2021 17:03:53 - INFO - __main__ - Step 21474: {'lr': 0.0004789447901677238, 'samples': 4123008, 'steps': 21473, 'loss/train': 1.8282737731933594} -08/30/2021 17:03:53 - INFO - __main__ - Step 21475: {'lr': 0.00047894265849180264, 'samples': 4123200, 'steps': 21474, 'loss/train': 0.7590158581733704} -08/30/2021 17:03:54 - INFO - __main__ - Step 21476: {'lr': 0.00047894052671272337, 'samples': 4123392, 'steps': 21475, 'loss/train': 1.4974853992462158} -08/30/2021 17:03:54 - INFO - __main__ - Step 21477: {'lr': 0.0004789383948304871, 'samples': 4123584, 'steps': 21476, 'loss/train': 1.531650185585022} -08/30/2021 17:03:56 - INFO - __main__ - Step 21478: {'lr': 0.00047893626284509466, 'samples': 4123776, 'steps': 21477, 'loss/train': 1.5932615995407104} -08/30/2021 17:03:56 - INFO - __main__ - Step 21479: {'lr': 0.0004789341307565471, 'samples': 4123968, 'steps': 21478, 'loss/train': 1.7813539505004883} -08/30/2021 17:03:56 - INFO - __main__ - Step 21480: {'lr': 0.0004789319985648454, 'samples': 4124160, 'steps': 21479, 'loss/train': 1.3085589408874512} -08/30/2021 17:03:57 - INFO - __main__ - Step 21481: {'lr': 0.0004789298662699905, 'samples': 4124352, 'steps': 21480, 'loss/train': 1.8414041996002197} -08/30/2021 17:03:57 - INFO - __main__ - Step 21482: {'lr': 0.0004789277338719832, 'samples': 4124544, 'steps': 21481, 'loss/train': 0.3708147406578064} -08/30/2021 17:03:59 - INFO - __main__ - Step 21483: {'lr': 0.0004789256013708246, 'samples': 4124736, 'steps': 21482, 'loss/train': 1.0991530418395996} -08/30/2021 17:03:59 - INFO - __main__ - Step 21484: {'lr': 0.0004789234687665158, 'samples': 4124928, 'steps': 21483, 'loss/train': 1.7097718715667725} -08/30/2021 17:04:00 - INFO - __main__ - Step 21485: {'lr': 0.0004789213360590575, 'samples': 4125120, 'steps': 21484, 'loss/train': 1.0717169046401978} -08/30/2021 17:04:00 - INFO - __main__ - Step 21486: {'lr': 0.00047891920324845085, 'samples': 4125312, 'steps': 21485, 'loss/train': 1.573041558265686} -08/30/2021 17:04:00 - INFO - __main__ - Step 21487: {'lr': 0.00047891707033469665, 'samples': 4125504, 'steps': 21486, 'loss/train': 1.5038706064224243} -08/30/2021 17:04:01 - INFO - __main__ - Step 21488: {'lr': 0.00047891493731779607, 'samples': 4125696, 'steps': 21487, 'loss/train': 2.181943893432617} -08/30/2021 17:04:02 - INFO - __main__ - Step 21489: {'lr': 0.00047891280419774985, 'samples': 4125888, 'steps': 21488, 'loss/train': 1.6918127536773682} -08/30/2021 17:04:03 - INFO - __main__ - Step 21490: {'lr': 0.0004789106709745591, 'samples': 4126080, 'steps': 21489, 'loss/train': 1.6460556983947754} -08/30/2021 17:04:03 - INFO - __main__ - Step 21491: {'lr': 0.0004789085376482247, 'samples': 4126272, 'steps': 21490, 'loss/train': 1.7745941877365112} -08/30/2021 17:04:03 - INFO - __main__ - Step 21492: {'lr': 0.00047890640421874775, 'samples': 4126464, 'steps': 21491, 'loss/train': 1.7836967706680298} -08/30/2021 17:04:05 - INFO - __main__ - Step 21493: {'lr': 0.000478904270686129, 'samples': 4126656, 'steps': 21492, 'loss/train': 2.0360591411590576} -08/30/2021 17:04:06 - INFO - __main__ - Step 21494: {'lr': 0.00047890213705036955, 'samples': 4126848, 'steps': 21493, 'loss/train': 1.0421425104141235} -08/30/2021 17:04:06 - INFO - __main__ - Step 21495: {'lr': 0.00047890000331147033, 'samples': 4127040, 'steps': 21494, 'loss/train': 1.2720959186553955} -08/30/2021 17:04:07 - INFO - __main__ - Step 21496: {'lr': 0.0004788978694694323, 'samples': 4127232, 'steps': 21495, 'loss/train': 1.3424983024597168} -08/30/2021 17:04:07 - INFO - __main__ - Step 21497: {'lr': 0.0004788957355242564, 'samples': 4127424, 'steps': 21496, 'loss/train': 1.0823028087615967} -08/30/2021 17:04:07 - INFO - __main__ - Step 21498: {'lr': 0.00047889360147594363, 'samples': 4127616, 'steps': 21497, 'loss/train': 2.1946630477905273} -08/30/2021 17:04:09 - INFO - __main__ - Step 21499: {'lr': 0.00047889146732449497, 'samples': 4127808, 'steps': 21498, 'loss/train': 1.4539885520935059} -08/30/2021 17:04:09 - INFO - __main__ - Step 21500: {'lr': 0.00047888933306991136, 'samples': 4128000, 'steps': 21499, 'loss/train': 1.671066403388977} -08/30/2021 17:04:10 - INFO - __main__ - Step 21501: {'lr': 0.00047888719871219367, 'samples': 4128192, 'steps': 21500, 'loss/train': 2.1623952388763428} -08/30/2021 17:04:10 - INFO - __main__ - Step 21502: {'lr': 0.00047888506425134293, 'samples': 4128384, 'steps': 21501, 'loss/train': 1.7121566534042358} -08/30/2021 17:04:10 - INFO - __main__ - Step 21503: {'lr': 0.0004788829296873601, 'samples': 4128576, 'steps': 21502, 'loss/train': 0.30309751629829407} -08/30/2021 17:04:12 - INFO - __main__ - Step 21504: {'lr': 0.0004788807950202463, 'samples': 4128768, 'steps': 21503, 'loss/train': 1.3717628717422485} -08/30/2021 17:04:13 - INFO - __main__ - Step 21505: {'lr': 0.00047887866025000226, 'samples': 4128960, 'steps': 21504, 'loss/train': 1.7132471799850464} -08/30/2021 17:04:13 - INFO - __main__ - Step 21506: {'lr': 0.000478876525376629, 'samples': 4129152, 'steps': 21505, 'loss/train': 1.2056117057800293} -08/30/2021 17:04:13 - INFO - __main__ - Step 21507: {'lr': 0.00047887439040012755, 'samples': 4129344, 'steps': 21506, 'loss/train': 1.7914046049118042} -08/30/2021 17:04:14 - INFO - __main__ - Step 21508: {'lr': 0.0004788722553204988, 'samples': 4129536, 'steps': 21507, 'loss/train': 1.4132291078567505} -08/30/2021 17:04:14 - INFO - __main__ - Step 21509: {'lr': 0.0004788701201377438, 'samples': 4129728, 'steps': 21508, 'loss/train': 1.8986529111862183} -08/30/2021 17:04:15 - INFO - __main__ - Step 21510: {'lr': 0.0004788679848518633, 'samples': 4129920, 'steps': 21509, 'loss/train': 1.638746976852417} -08/30/2021 17:04:16 - INFO - __main__ - Step 21511: {'lr': 0.0004788658494628586, 'samples': 4130112, 'steps': 21510, 'loss/train': 1.896509051322937} -08/30/2021 17:04:16 - INFO - __main__ - Step 21512: {'lr': 0.0004788637139707304, 'samples': 4130304, 'steps': 21511, 'loss/train': 1.7294583320617676} -08/30/2021 17:04:16 - INFO - __main__ - Step 21513: {'lr': 0.00047886157837547975, 'samples': 4130496, 'steps': 21512, 'loss/train': 1.6490304470062256} -08/30/2021 17:04:17 - INFO - __main__ - Step 21514: {'lr': 0.0004788594426771076, 'samples': 4130688, 'steps': 21513, 'loss/train': 1.3523578643798828} -08/30/2021 17:04:20 - INFO - __main__ - Step 21515: {'lr': 0.0004788573068756149, 'samples': 4130880, 'steps': 21514, 'loss/train': 1.8092198371887207} -08/30/2021 17:04:20 - INFO - __main__ - Step 21516: {'lr': 0.0004788551709710027, 'samples': 4131072, 'steps': 21515, 'loss/train': 0.7204294204711914} -08/30/2021 17:04:21 - INFO - __main__ - Step 21517: {'lr': 0.0004788530349632718, 'samples': 4131264, 'steps': 21516, 'loss/train': 0.5451465845108032} -08/30/2021 17:04:21 - INFO - __main__ - Step 21518: {'lr': 0.00047885089885242333, 'samples': 4131456, 'steps': 21517, 'loss/train': 1.6412653923034668} -08/30/2021 17:04:21 - INFO - __main__ - Step 21519: {'lr': 0.0004788487626384581, 'samples': 4131648, 'steps': 21518, 'loss/train': 1.5881367921829224} -08/30/2021 17:04:22 - INFO - __main__ - Step 21520: {'lr': 0.0004788466263213772, 'samples': 4131840, 'steps': 21519, 'loss/train': 1.8423503637313843} -08/30/2021 17:04:23 - INFO - __main__ - Step 21521: {'lr': 0.00047884448990118155, 'samples': 4132032, 'steps': 21520, 'loss/train': 1.8779414892196655} -08/30/2021 17:04:24 - INFO - __main__ - Step 21522: {'lr': 0.0004788423533778721, 'samples': 4132224, 'steps': 21521, 'loss/train': 1.0586224794387817} -08/30/2021 17:04:24 - INFO - __main__ - Step 21523: {'lr': 0.00047884021675144987, 'samples': 4132416, 'steps': 21522, 'loss/train': 1.344202995300293} -08/30/2021 17:04:24 - INFO - __main__ - Step 21524: {'lr': 0.0004788380800219156, 'samples': 4132608, 'steps': 21523, 'loss/train': 1.41176176071167} -08/30/2021 17:04:25 - INFO - __main__ - Step 21525: {'lr': 0.0004788359431892706, 'samples': 4132800, 'steps': 21524, 'loss/train': 1.1432011127471924} -08/30/2021 17:04:26 - INFO - __main__ - Step 21526: {'lr': 0.00047883380625351557, 'samples': 4132992, 'steps': 21525, 'loss/train': 1.7957347631454468} -08/30/2021 17:04:27 - INFO - __main__ - Step 21527: {'lr': 0.00047883166921465156, 'samples': 4133184, 'steps': 21526, 'loss/train': 1.4472945928573608} -08/30/2021 17:04:27 - INFO - __main__ - Step 21528: {'lr': 0.00047882953207267954, 'samples': 4133376, 'steps': 21527, 'loss/train': 1.212437391281128} -08/30/2021 17:04:27 - INFO - __main__ - Step 21529: {'lr': 0.00047882739482760044, 'samples': 4133568, 'steps': 21528, 'loss/train': 1.0129021406173706} -08/30/2021 17:04:28 - INFO - __main__ - Step 21530: {'lr': 0.0004788252574794153, 'samples': 4133760, 'steps': 21529, 'loss/train': 1.4399173259735107} -08/30/2021 17:04:29 - INFO - __main__ - Step 21531: {'lr': 0.000478823120028125, 'samples': 4133952, 'steps': 21530, 'loss/train': 1.6369318962097168} -08/30/2021 17:04:30 - INFO - __main__ - Step 21532: {'lr': 0.0004788209824737305, 'samples': 4134144, 'steps': 21531, 'loss/train': 0.7602819204330444} -08/30/2021 17:04:30 - INFO - __main__ - Step 21533: {'lr': 0.00047881884481623286, 'samples': 4134336, 'steps': 21532, 'loss/train': 0.9776489734649658} -08/30/2021 17:04:30 - INFO - __main__ - Step 21534: {'lr': 0.000478816707055633, 'samples': 4134528, 'steps': 21533, 'loss/train': 1.3832441568374634} -08/30/2021 17:04:31 - INFO - __main__ - Step 21535: {'lr': 0.0004788145691919318, 'samples': 4134720, 'steps': 21534, 'loss/train': 1.7407586574554443} -08/30/2021 17:04:31 - INFO - __main__ - Step 21536: {'lr': 0.0004788124312251303, 'samples': 4134912, 'steps': 21535, 'loss/train': 1.6053481101989746} -08/30/2021 17:04:32 - INFO - __main__ - Step 21537: {'lr': 0.0004788102931552294, 'samples': 4135104, 'steps': 21536, 'loss/train': 1.5271402597427368} -08/30/2021 17:04:33 - INFO - __main__ - Step 21538: {'lr': 0.0004788081549822302, 'samples': 4135296, 'steps': 21537, 'loss/train': 1.834592580795288} -08/30/2021 17:04:33 - INFO - __main__ - Step 21539: {'lr': 0.0004788060167061335, 'samples': 4135488, 'steps': 21538, 'loss/train': 0.9684967994689941} -08/30/2021 17:04:34 - INFO - __main__ - Step 21540: {'lr': 0.0004788038783269404, 'samples': 4135680, 'steps': 21539, 'loss/train': 1.3103408813476562} -08/30/2021 17:04:34 - INFO - __main__ - Step 21541: {'lr': 0.00047880173984465174, 'samples': 4135872, 'steps': 21540, 'loss/train': 1.6949554681777954} -08/30/2021 17:04:36 - INFO - __main__ - Step 21542: {'lr': 0.0004787996012592686, 'samples': 4136064, 'steps': 21541, 'loss/train': 1.6658117771148682} -08/30/2021 17:04:36 - INFO - __main__ - Step 21543: {'lr': 0.0004787974625707919, 'samples': 4136256, 'steps': 21542, 'loss/train': 1.4745776653289795} -08/30/2021 17:04:36 - INFO - __main__ - Step 21544: {'lr': 0.0004787953237792225, 'samples': 4136448, 'steps': 21543, 'loss/train': 1.6299556493759155} -08/30/2021 17:04:37 - INFO - __main__ - Step 21545: {'lr': 0.0004787931848845616, 'samples': 4136640, 'steps': 21544, 'loss/train': 1.6548094749450684} -08/30/2021 17:04:37 - INFO - __main__ - Step 21546: {'lr': 0.00047879104588680987, 'samples': 4136832, 'steps': 21545, 'loss/train': 1.4136765003204346} -08/30/2021 17:04:38 - INFO - __main__ - Step 21547: {'lr': 0.00047878890678596854, 'samples': 4137024, 'steps': 21546, 'loss/train': 1.978952407836914} -08/30/2021 17:04:39 - INFO - __main__ - Step 21548: {'lr': 0.00047878676758203844, 'samples': 4137216, 'steps': 21547, 'loss/train': 2.357581377029419} -08/30/2021 17:04:39 - INFO - __main__ - Step 21549: {'lr': 0.00047878462827502055, 'samples': 4137408, 'steps': 21548, 'loss/train': 1.579661250114441} -08/30/2021 17:04:40 - INFO - __main__ - Step 21550: {'lr': 0.0004787824888649158, 'samples': 4137600, 'steps': 21549, 'loss/train': 1.5313758850097656} -08/30/2021 17:04:40 - INFO - __main__ - Step 21551: {'lr': 0.0004787803493517252, 'samples': 4137792, 'steps': 21550, 'loss/train': 1.173863172531128} -08/30/2021 17:04:42 - INFO - __main__ - Step 21552: {'lr': 0.0004787782097354497, 'samples': 4137984, 'steps': 21551, 'loss/train': 1.7947689294815063} -08/30/2021 17:04:42 - INFO - __main__ - Step 21553: {'lr': 0.00047877607001609035, 'samples': 4138176, 'steps': 21552, 'loss/train': 1.6152856349945068} -08/30/2021 17:04:42 - INFO - __main__ - Step 21554: {'lr': 0.00047877393019364796, 'samples': 4138368, 'steps': 21553, 'loss/train': 0.08391077816486359} -08/30/2021 17:04:43 - INFO - __main__ - Step 21555: {'lr': 0.0004787717902681236, 'samples': 4138560, 'steps': 21554, 'loss/train': 1.3522006273269653} -08/30/2021 17:04:43 - INFO - __main__ - Step 21556: {'lr': 0.00047876965023951814, 'samples': 4138752, 'steps': 21555, 'loss/train': 1.7337920665740967} -08/30/2021 17:04:45 - INFO - __main__ - Step 21557: {'lr': 0.00047876751010783266, 'samples': 4138944, 'steps': 21556, 'loss/train': 1.6510796546936035} -08/30/2021 17:04:45 - INFO - __main__ - Step 21558: {'lr': 0.0004787653698730681, 'samples': 4139136, 'steps': 21557, 'loss/train': 1.9008625745773315} -08/30/2021 17:04:46 - INFO - __main__ - Step 21559: {'lr': 0.00047876322953522535, 'samples': 4139328, 'steps': 21558, 'loss/train': 0.08120544999837875} -08/30/2021 17:04:46 - INFO - __main__ - Step 21560: {'lr': 0.00047876108909430536, 'samples': 4139520, 'steps': 21559, 'loss/train': 1.7383759021759033} -08/30/2021 17:04:46 - INFO - __main__ - Step 21561: {'lr': 0.00047875894855030923, 'samples': 4139712, 'steps': 21560, 'loss/train': 1.2564455270767212} -08/30/2021 17:04:47 - INFO - __main__ - Step 21562: {'lr': 0.00047875680790323785, 'samples': 4139904, 'steps': 21561, 'loss/train': 1.6330316066741943} -08/30/2021 17:04:48 - INFO - __main__ - Step 21563: {'lr': 0.0004787546671530921, 'samples': 4140096, 'steps': 21562, 'loss/train': 1.9583455324172974} -08/30/2021 17:04:48 - INFO - __main__ - Step 21564: {'lr': 0.0004787525262998731, 'samples': 4140288, 'steps': 21563, 'loss/train': 2.428619146347046} -08/30/2021 17:04:49 - INFO - __main__ - Step 21565: {'lr': 0.0004787503853435817, 'samples': 4140480, 'steps': 21564, 'loss/train': 1.3141828775405884} -08/30/2021 17:04:49 - INFO - __main__ - Step 21566: {'lr': 0.00047874824428421897, 'samples': 4140672, 'steps': 21565, 'loss/train': 1.6801226139068604} -08/30/2021 17:04:50 - INFO - __main__ - Step 21567: {'lr': 0.0004787461031217858, 'samples': 4140864, 'steps': 21566, 'loss/train': 1.6470086574554443} -08/30/2021 17:04:51 - INFO - __main__ - Step 21568: {'lr': 0.0004787439618562831, 'samples': 4141056, 'steps': 21567, 'loss/train': 2.1003711223602295} -08/30/2021 17:04:52 - INFO - __main__ - Step 21569: {'lr': 0.000478741820487712, 'samples': 4141248, 'steps': 21568, 'loss/train': 1.7431973218917847} -08/30/2021 17:04:52 - INFO - __main__ - Step 21570: {'lr': 0.0004787396790160733, 'samples': 4141440, 'steps': 21569, 'loss/train': 1.4745862483978271} -08/30/2021 17:04:52 - INFO - __main__ - Step 21571: {'lr': 0.00047873753744136807, 'samples': 4141632, 'steps': 21570, 'loss/train': 1.5483851432800293} -08/30/2021 17:04:53 - INFO - __main__ - Step 21572: {'lr': 0.0004787353957635971, 'samples': 4141824, 'steps': 21571, 'loss/train': 1.7145155668258667} -08/30/2021 17:04:55 - INFO - __main__ - Step 21573: {'lr': 0.0004787332539827617, 'samples': 4142016, 'steps': 21572, 'loss/train': 2.096367835998535} -08/30/2021 17:04:55 - INFO - __main__ - Step 21574: {'lr': 0.00047873111209886245, 'samples': 4142208, 'steps': 21573, 'loss/train': 1.3759455680847168} -08/30/2021 17:04:56 - INFO - __main__ - Step 21575: {'lr': 0.00047872897011190063, 'samples': 4142400, 'steps': 21574, 'loss/train': 1.3320780992507935} -08/30/2021 17:04:56 - INFO - __main__ - Step 21576: {'lr': 0.00047872682802187693, 'samples': 4142592, 'steps': 21575, 'loss/train': 1.7277063131332397} -08/30/2021 17:04:56 - INFO - __main__ - Step 21577: {'lr': 0.0004787246858287926, 'samples': 4142784, 'steps': 21576, 'loss/train': 1.3015682697296143} -08/30/2021 17:04:58 - INFO - __main__ - Step 21578: {'lr': 0.0004787225435326483, 'samples': 4142976, 'steps': 21577, 'loss/train': 1.412316083908081} -08/30/2021 17:04:58 - INFO - __main__ - Step 21579: {'lr': 0.0004787204011334453, 'samples': 4143168, 'steps': 21578, 'loss/train': 2.0656633377075195} -08/30/2021 17:04:59 - INFO - __main__ - Step 21580: {'lr': 0.0004787182586311843, 'samples': 4143360, 'steps': 21579, 'loss/train': 1.8539068698883057} -08/30/2021 17:04:59 - INFO - __main__ - Step 21581: {'lr': 0.0004787161160258664, 'samples': 4143552, 'steps': 21580, 'loss/train': 1.6576381921768188} -08/30/2021 17:04:59 - INFO - __main__ - Step 21582: {'lr': 0.00047871397331749254, 'samples': 4143744, 'steps': 21581, 'loss/train': 1.424061894416809} -08/30/2021 17:05:01 - INFO - __main__ - Step 21583: {'lr': 0.00047871183050606376, 'samples': 4143936, 'steps': 21582, 'loss/train': 1.6823989152908325} -08/30/2021 17:05:02 - INFO - __main__ - Step 21584: {'lr': 0.00047870968759158096, 'samples': 4144128, 'steps': 21583, 'loss/train': 1.2910590171813965} -08/30/2021 17:05:02 - INFO - __main__ - Step 21585: {'lr': 0.000478707544574045, 'samples': 4144320, 'steps': 21584, 'loss/train': 1.3867682218551636} -08/30/2021 17:05:02 - INFO - __main__ - Step 21586: {'lr': 0.000478705401453457, 'samples': 4144512, 'steps': 21585, 'loss/train': 1.9276567697525024} -08/30/2021 17:05:03 - INFO - __main__ - Step 21587: {'lr': 0.000478703258229818, 'samples': 4144704, 'steps': 21586, 'loss/train': 0.12375839799642563} -08/30/2021 17:05:03 - INFO - __main__ - Step 21588: {'lr': 0.0004787011149031287, 'samples': 4144896, 'steps': 21587, 'loss/train': 1.468145728111267} -08/30/2021 17:05:05 - INFO - __main__ - Step 21589: {'lr': 0.0004786989714733902, 'samples': 4145088, 'steps': 21588, 'loss/train': 1.724992036819458} -08/30/2021 17:05:05 - INFO - __main__ - Step 21590: {'lr': 0.0004786968279406035, 'samples': 4145280, 'steps': 21589, 'loss/train': 1.1805689334869385} -08/30/2021 17:05:05 - INFO - __main__ - Step 21591: {'lr': 0.0004786946843047696, 'samples': 4145472, 'steps': 21590, 'loss/train': 1.4405713081359863} -08/30/2021 17:05:06 - INFO - __main__ - Step 21592: {'lr': 0.00047869254056588927, 'samples': 4145664, 'steps': 21591, 'loss/train': 1.5672636032104492} -08/30/2021 17:05:06 - INFO - __main__ - Step 21593: {'lr': 0.0004786903967239637, 'samples': 4145856, 'steps': 21592, 'loss/train': 1.586122751235962} -08/30/2021 17:05:08 - INFO - __main__ - Step 21594: {'lr': 0.0004786882527789938, 'samples': 4146048, 'steps': 21593, 'loss/train': 1.1756656169891357} -08/30/2021 17:05:08 - INFO - __main__ - Step 21595: {'lr': 0.00047868610873098047, 'samples': 4146240, 'steps': 21594, 'loss/train': 2.0050926208496094} -08/30/2021 17:05:09 - INFO - __main__ - Step 21596: {'lr': 0.0004786839645799247, 'samples': 4146432, 'steps': 21595, 'loss/train': 1.450789213180542} -08/30/2021 17:05:09 - INFO - __main__ - Step 21597: {'lr': 0.00047868182032582746, 'samples': 4146624, 'steps': 21596, 'loss/train': 1.3242963552474976} -08/30/2021 17:05:09 - INFO - __main__ - Step 21598: {'lr': 0.00047867967596868974, 'samples': 4146816, 'steps': 21597, 'loss/train': 0.3487500250339508} -08/30/2021 17:05:11 - INFO - __main__ - Step 21599: {'lr': 0.00047867753150851244, 'samples': 4147008, 'steps': 21598, 'loss/train': 2.2175378799438477} -08/30/2021 17:05:11 - INFO - __main__ - Step 21600: {'lr': 0.0004786753869452966, 'samples': 4147200, 'steps': 21599, 'loss/train': 1.419573426246643} -08/30/2021 17:05:12 - INFO - __main__ - Step 21601: {'lr': 0.00047867324227904317, 'samples': 4147392, 'steps': 21600, 'loss/train': 1.3353098630905151} -08/30/2021 17:05:12 - INFO - __main__ - Step 21602: {'lr': 0.0004786710975097531, 'samples': 4147584, 'steps': 21601, 'loss/train': 1.6635923385620117} -08/30/2021 17:05:12 - INFO - __main__ - Step 21603: {'lr': 0.0004786689526374274, 'samples': 4147776, 'steps': 21602, 'loss/train': 1.8505805730819702} -08/30/2021 17:05:13 - INFO - __main__ - Step 21604: {'lr': 0.00047866680766206693, 'samples': 4147968, 'steps': 21603, 'loss/train': 1.4862685203552246} -08/30/2021 17:05:14 - INFO - __main__ - Step 21605: {'lr': 0.0004786646625836727, 'samples': 4148160, 'steps': 21604, 'loss/train': 1.943293809890747} -08/30/2021 17:05:15 - INFO - __main__ - Step 21606: {'lr': 0.0004786625174022458, 'samples': 4148352, 'steps': 21605, 'loss/train': 1.1202270984649658} -08/30/2021 17:05:15 - INFO - __main__ - Step 21607: {'lr': 0.00047866037211778705, 'samples': 4148544, 'steps': 21606, 'loss/train': 2.019742965698242} -08/30/2021 17:05:16 - INFO - __main__ - Step 21608: {'lr': 0.0004786582267302975, 'samples': 4148736, 'steps': 21607, 'loss/train': 1.2123949527740479} -08/30/2021 17:05:16 - INFO - __main__ - Step 21609: {'lr': 0.000478656081239778, 'samples': 4148928, 'steps': 21608, 'loss/train': 1.9415785074234009} -08/30/2021 17:05:17 - INFO - __main__ - Step 21610: {'lr': 0.0004786539356462297, 'samples': 4149120, 'steps': 21609, 'loss/train': 1.5333104133605957} -08/30/2021 17:05:18 - INFO - __main__ - Step 21611: {'lr': 0.0004786517899496534, 'samples': 4149312, 'steps': 21610, 'loss/train': 1.5422704219818115} -08/30/2021 17:05:18 - INFO - __main__ - Step 21612: {'lr': 0.0004786496441500502, 'samples': 4149504, 'steps': 21611, 'loss/train': 1.368769645690918} -08/30/2021 17:05:19 - INFO - __main__ - Step 21613: {'lr': 0.00047864749824742093, 'samples': 4149696, 'steps': 21612, 'loss/train': 1.8876041173934937} -08/30/2021 17:05:19 - INFO - __main__ - Step 21614: {'lr': 0.00047864535224176666, 'samples': 4149888, 'steps': 21613, 'loss/train': 1.2801645994186401} -08/30/2021 17:05:20 - INFO - __main__ - Step 21615: {'lr': 0.0004786432061330882, 'samples': 4150080, 'steps': 21614, 'loss/train': 1.3951793909072876} -08/30/2021 17:05:21 - INFO - __main__ - Step 21616: {'lr': 0.0004786410599213868, 'samples': 4150272, 'steps': 21615, 'loss/train': 1.6834088563919067} -08/30/2021 17:05:21 - INFO - __main__ - Step 21617: {'lr': 0.00047863891360666323, 'samples': 4150464, 'steps': 21616, 'loss/train': 1.1598668098449707} -08/30/2021 17:05:22 - INFO - __main__ - Step 21618: {'lr': 0.00047863676718891846, 'samples': 4150656, 'steps': 21617, 'loss/train': 1.665282130241394} -08/30/2021 17:05:22 - INFO - __main__ - Step 21619: {'lr': 0.0004786346206681535, 'samples': 4150848, 'steps': 21618, 'loss/train': 1.9712655544281006} -08/30/2021 17:05:24 - INFO - __main__ - Step 21620: {'lr': 0.0004786324740443693, 'samples': 4151040, 'steps': 21619, 'loss/train': 1.265072226524353} -08/30/2021 17:05:24 - INFO - __main__ - Step 21621: {'lr': 0.00047863032731756684, 'samples': 4151232, 'steps': 21620, 'loss/train': 0.20737281441688538} -08/30/2021 17:05:24 - INFO - __main__ - Step 21622: {'lr': 0.0004786281804877471, 'samples': 4151424, 'steps': 21621, 'loss/train': 1.6420605182647705} -08/30/2021 17:05:25 - INFO - __main__ - Step 21623: {'lr': 0.00047862603355491103, 'samples': 4151616, 'steps': 21622, 'loss/train': 2.252286434173584} -08/30/2021 17:05:25 - INFO - __main__ - Step 21624: {'lr': 0.0004786238865190595, 'samples': 4151808, 'steps': 21623, 'loss/train': 1.5345619916915894} -08/30/2021 17:05:27 - INFO - __main__ - Step 21625: {'lr': 0.0004786217393801937, 'samples': 4152000, 'steps': 21624, 'loss/train': 1.3157330751419067} -08/30/2021 17:05:27 - INFO - __main__ - Step 21626: {'lr': 0.00047861959213831446, 'samples': 4152192, 'steps': 21625, 'loss/train': 1.9387462139129639} -08/30/2021 17:05:28 - INFO - __main__ - Step 21627: {'lr': 0.0004786174447934227, 'samples': 4152384, 'steps': 21626, 'loss/train': 1.5936999320983887} -08/30/2021 17:05:28 - INFO - __main__ - Step 21628: {'lr': 0.0004786152973455195, 'samples': 4152576, 'steps': 21627, 'loss/train': 1.2677874565124512} -08/30/2021 17:05:28 - INFO - __main__ - Step 21629: {'lr': 0.0004786131497946058, 'samples': 4152768, 'steps': 21628, 'loss/train': 1.9037866592407227} -08/30/2021 17:05:30 - INFO - __main__ - Step 21630: {'lr': 0.0004786110021406824, 'samples': 4152960, 'steps': 21629, 'loss/train': 1.6569949388504028} -08/30/2021 17:05:30 - INFO - __main__ - Step 21631: {'lr': 0.0004786088543837506, 'samples': 4153152, 'steps': 21630, 'loss/train': 1.278141975402832} -08/30/2021 17:05:31 - INFO - __main__ - Step 21632: {'lr': 0.00047860670652381105, 'samples': 4153344, 'steps': 21631, 'loss/train': 1.80409574508667} -08/30/2021 17:05:31 - INFO - __main__ - Step 21633: {'lr': 0.00047860455856086487, 'samples': 4153536, 'steps': 21632, 'loss/train': 1.2285655736923218} -08/30/2021 17:05:31 - INFO - __main__ - Step 21634: {'lr': 0.00047860241049491303, 'samples': 4153728, 'steps': 21633, 'loss/train': 1.7540972232818604} -08/30/2021 17:05:34 - INFO - __main__ - Step 21635: {'lr': 0.00047860026232595645, 'samples': 4153920, 'steps': 21634, 'loss/train': 1.0764487981796265} -08/30/2021 17:05:34 - INFO - __main__ - Step 21636: {'lr': 0.0004785981140539961, 'samples': 4154112, 'steps': 21635, 'loss/train': 2.0278148651123047} -08/30/2021 17:05:34 - INFO - __main__ - Step 21637: {'lr': 0.000478595965679033, 'samples': 4154304, 'steps': 21636, 'loss/train': 1.2128251791000366} -08/30/2021 17:05:35 - INFO - __main__ - Step 21638: {'lr': 0.0004785938172010681, 'samples': 4154496, 'steps': 21637, 'loss/train': 1.9851192235946655} -08/30/2021 17:05:35 - INFO - __main__ - Step 21639: {'lr': 0.0004785916686201023, 'samples': 4154688, 'steps': 21638, 'loss/train': 2.2266154289245605} -08/30/2021 17:05:35 - INFO - __main__ - Step 21640: {'lr': 0.00047858951993613665, 'samples': 4154880, 'steps': 21639, 'loss/train': 1.9012534618377686} -08/30/2021 17:05:37 - INFO - __main__ - Step 21641: {'lr': 0.0004785873711491721, 'samples': 4155072, 'steps': 21640, 'loss/train': 1.3370827436447144} -08/30/2021 17:05:38 - INFO - __main__ - Step 21642: {'lr': 0.00047858522225920964, 'samples': 4155264, 'steps': 21641, 'loss/train': 1.211037039756775} -08/30/2021 17:05:38 - INFO - __main__ - Step 21643: {'lr': 0.00047858307326625014, 'samples': 4155456, 'steps': 21642, 'loss/train': 1.617024540901184} -08/30/2021 17:05:38 - INFO - __main__ - Step 21644: {'lr': 0.00047858092417029464, 'samples': 4155648, 'steps': 21643, 'loss/train': 1.245651125907898} -08/30/2021 17:05:39 - INFO - __main__ - Step 21645: {'lr': 0.00047857877497134416, 'samples': 4155840, 'steps': 21644, 'loss/train': 1.972427248954773} -08/30/2021 17:05:39 - INFO - __main__ - Step 21646: {'lr': 0.0004785766256693995, 'samples': 4156032, 'steps': 21645, 'loss/train': 1.904283881187439} -08/30/2021 17:05:41 - INFO - __main__ - Step 21647: {'lr': 0.0004785744762644619, 'samples': 4156224, 'steps': 21646, 'loss/train': 1.5063691139221191} -08/30/2021 17:05:41 - INFO - __main__ - Step 21648: {'lr': 0.00047857232675653207, 'samples': 4156416, 'steps': 21647, 'loss/train': 0.1265147179365158} -08/30/2021 17:05:42 - INFO - __main__ - Step 21649: {'lr': 0.00047857017714561105, 'samples': 4156608, 'steps': 21648, 'loss/train': 1.8977305889129639} -08/30/2021 17:05:42 - INFO - __main__ - Step 21650: {'lr': 0.00047856802743169994, 'samples': 4156800, 'steps': 21649, 'loss/train': 2.013026237487793} -08/30/2021 17:05:42 - INFO - __main__ - Step 21651: {'lr': 0.00047856587761479954, 'samples': 4156992, 'steps': 21650, 'loss/train': 2.245924711227417} -08/30/2021 17:05:44 - INFO - __main__ - Step 21652: {'lr': 0.00047856372769491083, 'samples': 4157184, 'steps': 21651, 'loss/train': 2.003310203552246} -08/30/2021 17:05:44 - INFO - __main__ - Step 21653: {'lr': 0.0004785615776720349, 'samples': 4157376, 'steps': 21652, 'loss/train': 1.499346375465393} -08/30/2021 17:05:45 - INFO - __main__ - Step 21654: {'lr': 0.0004785594275461726, 'samples': 4157568, 'steps': 21653, 'loss/train': 1.6132514476776123} -08/30/2021 17:05:45 - INFO - __main__ - Step 21655: {'lr': 0.00047855727731732503, 'samples': 4157760, 'steps': 21654, 'loss/train': 1.4317113161087036} -08/30/2021 17:05:45 - INFO - __main__ - Step 21656: {'lr': 0.00047855512698549295, 'samples': 4157952, 'steps': 21655, 'loss/train': 1.4344325065612793} -08/30/2021 17:05:47 - INFO - __main__ - Step 21657: {'lr': 0.00047855297655067754, 'samples': 4158144, 'steps': 21656, 'loss/train': 1.5683907270431519} -08/30/2021 17:05:47 - INFO - __main__ - Step 21658: {'lr': 0.0004785508260128797, 'samples': 4158336, 'steps': 21657, 'loss/train': 1.5640400648117065} -08/30/2021 17:05:48 - INFO - __main__ - Step 21659: {'lr': 0.00047854867537210034, 'samples': 4158528, 'steps': 21658, 'loss/train': 1.8587629795074463} -08/30/2021 17:05:48 - INFO - __main__ - Step 21660: {'lr': 0.00047854652462834055, 'samples': 4158720, 'steps': 21659, 'loss/train': 1.7621623277664185} -08/30/2021 17:05:48 - INFO - __main__ - Step 21661: {'lr': 0.0004785443737816012, 'samples': 4158912, 'steps': 21660, 'loss/train': 1.5130053758621216} -08/30/2021 17:05:50 - INFO - __main__ - Step 21662: {'lr': 0.0004785422228318832, 'samples': 4159104, 'steps': 21661, 'loss/train': 1.2033276557922363} -08/30/2021 17:05:50 - INFO - __main__ - Step 21663: {'lr': 0.0004785400717791877, 'samples': 4159296, 'steps': 21662, 'loss/train': 1.7768971920013428} -08/30/2021 17:05:51 - INFO - __main__ - Step 21664: {'lr': 0.0004785379206235155, 'samples': 4159488, 'steps': 21663, 'loss/train': 1.7159216403961182} -08/30/2021 17:05:51 - INFO - __main__ - Step 21665: {'lr': 0.00047853576936486764, 'samples': 4159680, 'steps': 21664, 'loss/train': 1.5477763414382935} -08/30/2021 17:05:51 - INFO - __main__ - Step 21666: {'lr': 0.00047853361800324516, 'samples': 4159872, 'steps': 21665, 'loss/train': 1.7746342420578003} -08/30/2021 17:05:53 - INFO - __main__ - Step 21667: {'lr': 0.0004785314665386489, 'samples': 4160064, 'steps': 21666, 'loss/train': 1.3123118877410889} -08/30/2021 17:05:53 - INFO - __main__ - Step 21668: {'lr': 0.00047852931497107987, 'samples': 4160256, 'steps': 21667, 'loss/train': 1.0089551210403442} -08/30/2021 17:05:54 - INFO - __main__ - Step 21669: {'lr': 0.0004785271633005391, 'samples': 4160448, 'steps': 21668, 'loss/train': 0.8854736089706421} -08/30/2021 17:05:54 - INFO - __main__ - Step 21670: {'lr': 0.0004785250115270275, 'samples': 4160640, 'steps': 21669, 'loss/train': 1.405593991279602} -08/30/2021 17:05:55 - INFO - __main__ - Step 21671: {'lr': 0.00047852285965054606, 'samples': 4160832, 'steps': 21670, 'loss/train': 1.7800955772399902} -08/30/2021 17:05:56 - INFO - __main__ - Step 21672: {'lr': 0.00047852070767109573, 'samples': 4161024, 'steps': 21671, 'loss/train': 0.6641238927841187} -08/30/2021 17:05:57 - INFO - __main__ - Step 21673: {'lr': 0.00047851855558867754, 'samples': 4161216, 'steps': 21672, 'loss/train': 1.8311665058135986} -08/30/2021 17:05:57 - INFO - __main__ - Step 21674: {'lr': 0.0004785164034032924, 'samples': 4161408, 'steps': 21673, 'loss/train': 1.4423707723617554} -08/30/2021 17:05:57 - INFO - __main__ - Step 21675: {'lr': 0.0004785142511149412, 'samples': 4161600, 'steps': 21674, 'loss/train': 1.4329500198364258} -08/30/2021 17:05:58 - INFO - __main__ - Step 21676: {'lr': 0.0004785120987236251, 'samples': 4161792, 'steps': 21675, 'loss/train': 1.7964509725570679} -08/30/2021 17:05:58 - INFO - __main__ - Step 21677: {'lr': 0.00047850994622934494, 'samples': 4161984, 'steps': 21676, 'loss/train': 2.149315357208252} -08/30/2021 17:06:00 - INFO - __main__ - Step 21678: {'lr': 0.0004785077936321018, 'samples': 4162176, 'steps': 21677, 'loss/train': 1.191805362701416} -08/30/2021 17:06:00 - INFO - __main__ - Step 21679: {'lr': 0.00047850564093189653, 'samples': 4162368, 'steps': 21678, 'loss/train': 1.8324463367462158} -08/30/2021 17:06:01 - INFO - __main__ - Step 21680: {'lr': 0.0004785034881287301, 'samples': 4162560, 'steps': 21679, 'loss/train': 1.6059406995773315} -08/30/2021 17:06:01 - INFO - __main__ - Step 21681: {'lr': 0.0004785013352226035, 'samples': 4162752, 'steps': 21680, 'loss/train': 1.2899469137191772} -08/30/2021 17:06:02 - INFO - __main__ - Step 21682: {'lr': 0.00047849918221351783, 'samples': 4162944, 'steps': 21681, 'loss/train': 1.5513609647750854} -08/30/2021 17:06:03 - INFO - __main__ - Step 21683: {'lr': 0.0004784970291014739, 'samples': 4163136, 'steps': 21682, 'loss/train': 1.4121525287628174} -08/30/2021 17:06:04 - INFO - __main__ - Step 21684: {'lr': 0.0004784948758864727, 'samples': 4163328, 'steps': 21683, 'loss/train': 1.5040241479873657} -08/30/2021 17:06:04 - INFO - __main__ - Step 21685: {'lr': 0.0004784927225685153, 'samples': 4163520, 'steps': 21684, 'loss/train': 1.7399235963821411} -08/30/2021 17:06:04 - INFO - __main__ - Step 21686: {'lr': 0.00047849056914760256, 'samples': 4163712, 'steps': 21685, 'loss/train': 1.5813474655151367} -08/30/2021 17:06:05 - INFO - __main__ - Step 21687: {'lr': 0.00047848841562373557, 'samples': 4163904, 'steps': 21686, 'loss/train': 1.3997126817703247} -08/30/2021 17:06:06 - INFO - __main__ - Step 21688: {'lr': 0.00047848626199691513, 'samples': 4164096, 'steps': 21687, 'loss/train': 0.8966947197914124} -08/30/2021 17:06:07 - INFO - __main__ - Step 21689: {'lr': 0.00047848410826714237, 'samples': 4164288, 'steps': 21688, 'loss/train': 2.055316209793091} -08/30/2021 17:06:07 - INFO - __main__ - Step 21690: {'lr': 0.00047848195443441817, 'samples': 4164480, 'steps': 21689, 'loss/train': 1.6565885543823242} -08/30/2021 17:06:07 - INFO - __main__ - Step 21691: {'lr': 0.0004784798004987435, 'samples': 4164672, 'steps': 21690, 'loss/train': 1.4507962465286255} -08/30/2021 17:06:08 - INFO - __main__ - Step 21692: {'lr': 0.00047847764646011937, 'samples': 4164864, 'steps': 21691, 'loss/train': 1.6128380298614502} -08/30/2021 17:06:09 - INFO - __main__ - Step 21693: {'lr': 0.0004784754923185468, 'samples': 4165056, 'steps': 21692, 'loss/train': 1.4008574485778809} -08/30/2021 17:06:10 - INFO - __main__ - Step 21694: {'lr': 0.00047847333807402666, 'samples': 4165248, 'steps': 21693, 'loss/train': 1.9528981447219849} -08/30/2021 17:06:10 - INFO - __main__ - Step 21695: {'lr': 0.00047847118372655996, 'samples': 4165440, 'steps': 21694, 'loss/train': 1.243920087814331} -08/30/2021 17:06:10 - INFO - __main__ - Step 21696: {'lr': 0.00047846902927614767, 'samples': 4165632, 'steps': 21695, 'loss/train': 1.3261280059814453} -08/30/2021 17:06:11 - INFO - __main__ - Step 21697: {'lr': 0.0004784668747227907, 'samples': 4165824, 'steps': 21696, 'loss/train': 1.3166300058364868} -08/30/2021 17:06:12 - INFO - __main__ - Step 21698: {'lr': 0.00047846472006649016, 'samples': 4166016, 'steps': 21697, 'loss/train': 1.4801424741744995} -08/30/2021 17:06:13 - INFO - __main__ - Step 21699: {'lr': 0.0004784625653072469, 'samples': 4166208, 'steps': 21698, 'loss/train': 1.820278286933899} -08/30/2021 17:06:13 - INFO - __main__ - Step 21700: {'lr': 0.00047846041044506194, 'samples': 4166400, 'steps': 21699, 'loss/train': 1.6920466423034668} -08/30/2021 17:06:13 - INFO - __main__ - Step 21701: {'lr': 0.00047845825547993627, 'samples': 4166592, 'steps': 21700, 'loss/train': 1.3065929412841797} -08/30/2021 17:06:14 - INFO - __main__ - Step 21702: {'lr': 0.0004784561004118708, 'samples': 4166784, 'steps': 21701, 'loss/train': 0.916358470916748} -08/30/2021 17:06:14 - INFO - __main__ - Step 21703: {'lr': 0.0004784539452408666, 'samples': 4166976, 'steps': 21702, 'loss/train': 1.397084355354309} -08/30/2021 17:06:16 - INFO - __main__ - Step 21704: {'lr': 0.0004784517899669245, 'samples': 4167168, 'steps': 21703, 'loss/train': 1.5995969772338867} -08/30/2021 17:06:16 - INFO - __main__ - Step 21705: {'lr': 0.00047844963459004565, 'samples': 4167360, 'steps': 21704, 'loss/train': 1.1845390796661377} -08/30/2021 17:06:16 - INFO - __main__ - Step 21706: {'lr': 0.00047844747911023077, 'samples': 4167552, 'steps': 21705, 'loss/train': 1.4429291486740112} -08/30/2021 17:06:17 - INFO - __main__ - Step 21707: {'lr': 0.00047844532352748115, 'samples': 4167744, 'steps': 21706, 'loss/train': 1.5198560953140259} -08/30/2021 17:06:18 - INFO - __main__ - Step 21708: {'lr': 0.0004784431678417975, 'samples': 4167936, 'steps': 21707, 'loss/train': 1.672396183013916} -08/30/2021 17:06:19 - INFO - __main__ - Step 21709: {'lr': 0.00047844101205318085, 'samples': 4168128, 'steps': 21708, 'loss/train': 1.552107334136963} -08/30/2021 17:06:19 - INFO - __main__ - Step 21710: {'lr': 0.0004784388561616323, 'samples': 4168320, 'steps': 21709, 'loss/train': 1.5733312368392944} -08/30/2021 17:06:20 - INFO - __main__ - Step 21711: {'lr': 0.0004784367001671526, 'samples': 4168512, 'steps': 21710, 'loss/train': 2.090911388397217} -08/30/2021 17:06:20 - INFO - __main__ - Step 21712: {'lr': 0.00047843454406974295, 'samples': 4168704, 'steps': 21711, 'loss/train': 0.10917995125055313} -08/30/2021 17:06:20 - INFO - __main__ - Step 21713: {'lr': 0.00047843238786940423, 'samples': 4168896, 'steps': 21712, 'loss/train': 1.238024115562439} -08/30/2021 17:06:22 - INFO - __main__ - Step 21714: {'lr': 0.0004784302315661373, 'samples': 4169088, 'steps': 21713, 'loss/train': 1.3346723318099976} -08/30/2021 17:06:22 - INFO - __main__ - Step 21715: {'lr': 0.00047842807515994335, 'samples': 4169280, 'steps': 21714, 'loss/train': 1.1240020990371704} -08/30/2021 17:06:22 - INFO - __main__ - Step 21716: {'lr': 0.00047842591865082315, 'samples': 4169472, 'steps': 21715, 'loss/train': 1.3416444063186646} -08/30/2021 17:06:23 - INFO - __main__ - Step 21717: {'lr': 0.0004784237620387778, 'samples': 4169664, 'steps': 21716, 'loss/train': 1.1611155271530151} -08/30/2021 17:06:23 - INFO - __main__ - Step 21718: {'lr': 0.0004784216053238082, 'samples': 4169856, 'steps': 21717, 'loss/train': 1.9573583602905273} -08/30/2021 17:06:25 - INFO - __main__ - Step 21719: {'lr': 0.00047841944850591535, 'samples': 4170048, 'steps': 21718, 'loss/train': 1.6516616344451904} -08/30/2021 17:06:25 - INFO - __main__ - Step 21720: {'lr': 0.0004784172915851003, 'samples': 4170240, 'steps': 21719, 'loss/train': 1.3609671592712402} -08/30/2021 17:06:26 - INFO - __main__ - Step 21721: {'lr': 0.00047841513456136383, 'samples': 4170432, 'steps': 21720, 'loss/train': 1.008778691291809} -08/30/2021 17:06:26 - INFO - __main__ - Step 21722: {'lr': 0.000478412977434707, 'samples': 4170624, 'steps': 21721, 'loss/train': 1.7178418636322021} -08/30/2021 17:06:26 - INFO - __main__ - Step 21723: {'lr': 0.00047841082020513094, 'samples': 4170816, 'steps': 21722, 'loss/train': 1.863709568977356} -08/30/2021 17:06:28 - INFO - __main__ - Step 21724: {'lr': 0.0004784086628726364, 'samples': 4171008, 'steps': 21723, 'loss/train': 3.1482386589050293} -08/30/2021 17:06:28 - INFO - __main__ - Step 21725: {'lr': 0.0004784065054372245, 'samples': 4171200, 'steps': 21724, 'loss/train': 1.9970582723617554} -08/30/2021 17:06:29 - INFO - __main__ - Step 21726: {'lr': 0.0004784043478988961, 'samples': 4171392, 'steps': 21725, 'loss/train': 1.3224568367004395} -08/30/2021 17:06:29 - INFO - __main__ - Step 21727: {'lr': 0.00047840219025765225, 'samples': 4171584, 'steps': 21726, 'loss/train': 2.3315300941467285} -08/30/2021 17:06:29 - INFO - __main__ - Step 21728: {'lr': 0.0004784000325134939, 'samples': 4171776, 'steps': 21727, 'loss/train': 0.11365387588739395} -08/30/2021 17:06:30 - INFO - __main__ - Step 21729: {'lr': 0.00047839787466642206, 'samples': 4171968, 'steps': 21728, 'loss/train': 1.4912441968917847} -08/30/2021 17:06:32 - INFO - __main__ - Step 21730: {'lr': 0.00047839571671643756, 'samples': 4172160, 'steps': 21729, 'loss/train': 1.7546395063400269} -08/30/2021 17:06:33 - INFO - __main__ - Step 21731: {'lr': 0.0004783935586635415, 'samples': 4172352, 'steps': 21730, 'loss/train': 2.2621519565582275} -08/30/2021 17:06:33 - INFO - __main__ - Step 21732: {'lr': 0.0004783914005077349, 'samples': 4172544, 'steps': 21731, 'loss/train': 1.6448993682861328} -08/30/2021 17:06:33 - INFO - __main__ - Step 21733: {'lr': 0.0004783892422490186, 'samples': 4172736, 'steps': 21732, 'loss/train': 1.3782418966293335} -08/30/2021 17:06:34 - INFO - __main__ - Step 21734: {'lr': 0.00047838708388739365, 'samples': 4172928, 'steps': 21733, 'loss/train': 1.9569100141525269} -08/30/2021 17:06:35 - INFO - __main__ - Step 21735: {'lr': 0.000478384925422861, 'samples': 4173120, 'steps': 21734, 'loss/train': 1.675588846206665} -08/30/2021 17:06:36 - INFO - __main__ - Step 21736: {'lr': 0.00047838276685542157, 'samples': 4173312, 'steps': 21735, 'loss/train': 1.4226258993148804} -08/30/2021 17:06:36 - INFO - __main__ - Step 21737: {'lr': 0.0004783806081850765, 'samples': 4173504, 'steps': 21736, 'loss/train': 1.2623894214630127} -08/30/2021 17:06:37 - INFO - __main__ - Step 21738: {'lr': 0.0004783784494118266, 'samples': 4173696, 'steps': 21737, 'loss/train': 1.5730348825454712} -08/30/2021 17:06:37 - INFO - __main__ - Step 21739: {'lr': 0.00047837629053567286, 'samples': 4173888, 'steps': 21738, 'loss/train': 1.30971360206604} -08/30/2021 17:06:39 - INFO - __main__ - Step 21740: {'lr': 0.00047837413155661635, 'samples': 4174080, 'steps': 21739, 'loss/train': 0.17382727563381195} -08/30/2021 17:06:39 - INFO - __main__ - Step 21741: {'lr': 0.000478371972474658, 'samples': 4174272, 'steps': 21740, 'loss/train': 1.891969084739685} -08/30/2021 17:06:39 - INFO - __main__ - Step 21742: {'lr': 0.00047836981328979865, 'samples': 4174464, 'steps': 21741, 'loss/train': 1.3879209756851196} -08/30/2021 17:06:40 - INFO - __main__ - Step 21743: {'lr': 0.00047836765400203953, 'samples': 4174656, 'steps': 21742, 'loss/train': 1.1069267988204956} -08/30/2021 17:06:40 - INFO - __main__ - Step 21744: {'lr': 0.00047836549461138133, 'samples': 4174848, 'steps': 21743, 'loss/train': 1.566767930984497} -08/30/2021 17:06:42 - INFO - __main__ - Step 21745: {'lr': 0.00047836333511782524, 'samples': 4175040, 'steps': 21744, 'loss/train': 1.494236707687378} -08/30/2021 17:06:43 - INFO - __main__ - Step 21746: {'lr': 0.00047836117552137213, 'samples': 4175232, 'steps': 21745, 'loss/train': 1.5211020708084106} -08/30/2021 17:06:43 - INFO - __main__ - Step 21747: {'lr': 0.00047835901582202303, 'samples': 4175424, 'steps': 21746, 'loss/train': 1.3371444940567017} -08/30/2021 17:06:43 - INFO - __main__ - Step 21748: {'lr': 0.00047835685601977886, 'samples': 4175616, 'steps': 21747, 'loss/train': 1.6107068061828613} -08/30/2021 17:06:44 - INFO - __main__ - Step 21749: {'lr': 0.00047835469611464055, 'samples': 4175808, 'steps': 21748, 'loss/train': 1.7145252227783203} -08/30/2021 17:06:44 - INFO - __main__ - Step 21750: {'lr': 0.0004783525361066092, 'samples': 4176000, 'steps': 21749, 'loss/train': 1.872490644454956} -08/30/2021 17:06:46 - INFO - __main__ - Step 21751: {'lr': 0.00047835037599568576, 'samples': 4176192, 'steps': 21750, 'loss/train': 1.7199158668518066} -08/30/2021 17:06:46 - INFO - __main__ - Step 21752: {'lr': 0.0004783482157818711, 'samples': 4176384, 'steps': 21751, 'loss/train': 1.058449149131775} -08/30/2021 17:06:46 - INFO - __main__ - Step 21753: {'lr': 0.0004783460554651663, 'samples': 4176576, 'steps': 21752, 'loss/train': 1.4700802564620972} -08/30/2021 17:06:47 - INFO - __main__ - Step 21754: {'lr': 0.0004783438950455723, 'samples': 4176768, 'steps': 21753, 'loss/train': 1.7727082967758179} -08/30/2021 17:06:47 - INFO - __main__ - Step 21755: {'lr': 0.00047834173452309005, 'samples': 4176960, 'steps': 21754, 'loss/train': 1.5789827108383179} -08/30/2021 17:06:48 - INFO - __main__ - Step 21756: {'lr': 0.00047833957389772046, 'samples': 4177152, 'steps': 21755, 'loss/train': 1.455665946006775} -08/30/2021 17:06:49 - INFO - __main__ - Step 21757: {'lr': 0.0004783374131694647, 'samples': 4177344, 'steps': 21756, 'loss/train': 1.679849624633789} -08/30/2021 17:06:50 - INFO - __main__ - Step 21758: {'lr': 0.00047833525233832356, 'samples': 4177536, 'steps': 21757, 'loss/train': 0.199010968208313} -08/30/2021 17:06:50 - INFO - __main__ - Step 21759: {'lr': 0.00047833309140429803, 'samples': 4177728, 'steps': 21758, 'loss/train': 1.6432427167892456} -08/30/2021 17:06:50 - INFO - __main__ - Step 21760: {'lr': 0.0004783309303673892, 'samples': 4177920, 'steps': 21759, 'loss/train': 1.7864922285079956} -08/30/2021 17:06:51 - INFO - __main__ - Step 21761: {'lr': 0.00047832876922759805, 'samples': 4178112, 'steps': 21760, 'loss/train': 1.6534661054611206} -08/30/2021 17:06:52 - INFO - __main__ - Step 21762: {'lr': 0.0004783266079849253, 'samples': 4178304, 'steps': 21761, 'loss/train': 1.9542009830474854} -08/30/2021 17:06:53 - INFO - __main__ - Step 21763: {'lr': 0.00047832444663937227, 'samples': 4178496, 'steps': 21762, 'loss/train': 1.3221291303634644} -08/30/2021 17:06:53 - INFO - __main__ - Step 21764: {'lr': 0.0004783222851909397, 'samples': 4178688, 'steps': 21763, 'loss/train': 5.238156795501709} -08/30/2021 17:06:53 - INFO - __main__ - Step 21765: {'lr': 0.0004783201236396286, 'samples': 4178880, 'steps': 21764, 'loss/train': 1.62040114402771} -08/30/2021 17:06:54 - INFO - __main__ - Step 21766: {'lr': 0.00047831796198544, 'samples': 4179072, 'steps': 21765, 'loss/train': 1.7173926830291748} -08/30/2021 17:06:54 - INFO - __main__ - Step 21767: {'lr': 0.0004783158002283749, 'samples': 4179264, 'steps': 21766, 'loss/train': 1.612707495689392} -08/30/2021 17:06:56 - INFO - __main__ - Step 21768: {'lr': 0.0004783136383684342, 'samples': 4179456, 'steps': 21767, 'loss/train': 1.9059386253356934} -08/30/2021 17:06:56 - INFO - __main__ - Step 21769: {'lr': 0.0004783114764056188, 'samples': 4179648, 'steps': 21768, 'loss/train': 1.3929764032363892} -08/30/2021 17:06:56 - INFO - __main__ - Step 21770: {'lr': 0.00047830931433992985, 'samples': 4179840, 'steps': 21769, 'loss/train': 0.8066627979278564} -08/30/2021 17:06:57 - INFO - __main__ - Step 21771: {'lr': 0.00047830715217136825, 'samples': 4180032, 'steps': 21770, 'loss/train': 2.010899305343628} -08/30/2021 17:06:57 - INFO - __main__ - Step 21772: {'lr': 0.000478304989899935, 'samples': 4180224, 'steps': 21771, 'loss/train': 0.7552194595336914} -08/30/2021 17:06:58 - INFO - __main__ - Step 21773: {'lr': 0.00047830282752563103, 'samples': 4180416, 'steps': 21772, 'loss/train': 1.7293847799301147} -08/30/2021 17:06:59 - INFO - __main__ - Step 21774: {'lr': 0.00047830066504845725, 'samples': 4180608, 'steps': 21773, 'loss/train': 1.309455394744873} -08/30/2021 17:06:59 - INFO - __main__ - Step 21775: {'lr': 0.0004782985024684148, 'samples': 4180800, 'steps': 21774, 'loss/train': 1.440053105354309} -08/30/2021 17:07:00 - INFO - __main__ - Step 21776: {'lr': 0.0004782963397855046, 'samples': 4180992, 'steps': 21775, 'loss/train': 1.169439673423767} -08/30/2021 17:07:00 - INFO - __main__ - Step 21777: {'lr': 0.00047829417699972747, 'samples': 4181184, 'steps': 21776, 'loss/train': 2.02445650100708} -08/30/2021 17:07:02 - INFO - __main__ - Step 21778: {'lr': 0.0004782920141110846, 'samples': 4181376, 'steps': 21777, 'loss/train': 1.6135485172271729} -08/30/2021 17:07:02 - INFO - __main__ - Step 21779: {'lr': 0.0004782898511195768, 'samples': 4181568, 'steps': 21778, 'loss/train': 0.9269253611564636} -08/30/2021 17:07:03 - INFO - __main__ - Step 21780: {'lr': 0.00047828768802520515, 'samples': 4181760, 'steps': 21779, 'loss/train': 1.4465060234069824} -08/30/2021 17:07:03 - INFO - __main__ - Step 21781: {'lr': 0.0004782855248279706, 'samples': 4181952, 'steps': 21780, 'loss/train': 1.769426703453064} -08/30/2021 17:07:03 - INFO - __main__ - Step 21782: {'lr': 0.0004782833615278741, 'samples': 4182144, 'steps': 21781, 'loss/train': 1.2966687679290771} -08/30/2021 17:07:05 - INFO - __main__ - Step 21783: {'lr': 0.00047828119812491664, 'samples': 4182336, 'steps': 21782, 'loss/train': 1.430395483970642} -08/30/2021 17:07:05 - INFO - __main__ - Step 21784: {'lr': 0.0004782790346190993, 'samples': 4182528, 'steps': 21783, 'loss/train': 1.4945639371871948} -08/30/2021 17:07:06 - INFO - __main__ - Step 21785: {'lr': 0.00047827687101042283, 'samples': 4182720, 'steps': 21784, 'loss/train': 2.0308988094329834} -08/30/2021 17:07:06 - INFO - __main__ - Step 21786: {'lr': 0.00047827470729888834, 'samples': 4182912, 'steps': 21785, 'loss/train': 1.586060643196106} -08/30/2021 17:07:06 - INFO - __main__ - Step 21787: {'lr': 0.0004782725434844968, 'samples': 4183104, 'steps': 21786, 'loss/train': 2.080684185028076} -08/30/2021 17:07:08 - INFO - __main__ - Step 21788: {'lr': 0.00047827037956724915, 'samples': 4183296, 'steps': 21787, 'loss/train': 0.839836835861206} -08/30/2021 17:07:09 - INFO - __main__ - Step 21789: {'lr': 0.00047826821554714644, 'samples': 4183488, 'steps': 21788, 'loss/train': 1.1939973831176758} -08/30/2021 17:07:09 - INFO - __main__ - Step 21790: {'lr': 0.00047826605142418954, 'samples': 4183680, 'steps': 21789, 'loss/train': 1.1964384317398071} -08/30/2021 17:07:10 - INFO - __main__ - Step 21791: {'lr': 0.0004782638871983795, 'samples': 4183872, 'steps': 21790, 'loss/train': 1.6358758211135864} -08/30/2021 17:07:10 - INFO - __main__ - Step 21792: {'lr': 0.0004782617228697173, 'samples': 4184064, 'steps': 21791, 'loss/train': 1.5515676736831665} -08/30/2021 17:07:11 - INFO - __main__ - Step 21793: {'lr': 0.0004782595584382039, 'samples': 4184256, 'steps': 21792, 'loss/train': 1.7221769094467163} -08/30/2021 17:07:12 - INFO - __main__ - Step 21794: {'lr': 0.0004782573939038402, 'samples': 4184448, 'steps': 21793, 'loss/train': 1.7550474405288696} -08/30/2021 17:07:12 - INFO - __main__ - Step 21795: {'lr': 0.0004782552292666273, 'samples': 4184640, 'steps': 21794, 'loss/train': 1.3632317781448364} -08/30/2021 17:07:13 - INFO - __main__ - Step 21796: {'lr': 0.0004782530645265661, 'samples': 4184832, 'steps': 21795, 'loss/train': 1.9573311805725098} -08/30/2021 17:07:13 - INFO - __main__ - Step 21797: {'lr': 0.0004782508996836576, 'samples': 4185024, 'steps': 21796, 'loss/train': 1.5223103761672974} -08/30/2021 17:07:13 - INFO - __main__ - Step 21798: {'lr': 0.00047824873473790275, 'samples': 4185216, 'steps': 21797, 'loss/train': 1.6803069114685059} -08/30/2021 17:07:15 - INFO - __main__ - Step 21799: {'lr': 0.0004782465696893025, 'samples': 4185408, 'steps': 21798, 'loss/train': 0.7478705644607544} -08/30/2021 17:07:15 - INFO - __main__ - Step 21800: {'lr': 0.0004782444045378579, 'samples': 4185600, 'steps': 21799, 'loss/train': 2.2432470321655273} -08/30/2021 17:07:16 - INFO - __main__ - Step 21801: {'lr': 0.00047824223928356993, 'samples': 4185792, 'steps': 21800, 'loss/train': 1.51249361038208} -08/30/2021 17:07:16 - INFO - __main__ - Step 21802: {'lr': 0.0004782400739264395, 'samples': 4185984, 'steps': 21801, 'loss/train': 1.9229987859725952} -08/30/2021 17:07:16 - INFO - __main__ - Step 21803: {'lr': 0.00047823790846646764, 'samples': 4186176, 'steps': 21802, 'loss/train': 1.9468880891799927} -08/30/2021 17:07:18 - INFO - __main__ - Step 21804: {'lr': 0.0004782357429036553, 'samples': 4186368, 'steps': 21803, 'loss/train': 1.4829293489456177} -08/30/2021 17:07:18 - INFO - __main__ - Step 21805: {'lr': 0.00047823357723800344, 'samples': 4186560, 'steps': 21804, 'loss/train': 1.7622202634811401} -08/30/2021 17:07:19 - INFO - __main__ - Step 21806: {'lr': 0.000478231411469513, 'samples': 4186752, 'steps': 21805, 'loss/train': 1.6974397897720337} -08/30/2021 17:07:19 - INFO - __main__ - Step 21807: {'lr': 0.000478229245598185, 'samples': 4186944, 'steps': 21806, 'loss/train': 0.7027131915092468} -08/30/2021 17:07:19 - INFO - __main__ - Step 21808: {'lr': 0.00047822707962402055, 'samples': 4187136, 'steps': 21807, 'loss/train': 1.691078543663025} -08/30/2021 17:07:21 - INFO - __main__ - Step 21809: {'lr': 0.00047822491354702044, 'samples': 4187328, 'steps': 21808, 'loss/train': 1.4254356622695923} -08/30/2021 17:07:21 - INFO - __main__ - Step 21810: {'lr': 0.0004782227473671857, 'samples': 4187520, 'steps': 21809, 'loss/train': 0.9605146646499634} -08/30/2021 17:07:22 - INFO - __main__ - Step 21811: {'lr': 0.00047822058108451727, 'samples': 4187712, 'steps': 21810, 'loss/train': 1.3175225257873535} -08/30/2021 17:07:22 - INFO - __main__ - Step 21812: {'lr': 0.0004782184146990162, 'samples': 4187904, 'steps': 21811, 'loss/train': 1.8008755445480347} -08/30/2021 17:07:22 - INFO - __main__ - Step 21813: {'lr': 0.00047821624821068346, 'samples': 4188096, 'steps': 21812, 'loss/train': 3.052218198776245} -08/30/2021 17:07:24 - INFO - __main__ - Step 21814: {'lr': 0.00047821408161952, 'samples': 4188288, 'steps': 21813, 'loss/train': 1.5098425149917603} -08/30/2021 17:07:24 - INFO - __main__ - Step 21815: {'lr': 0.00047821191492552676, 'samples': 4188480, 'steps': 21814, 'loss/train': 1.8102848529815674} -08/30/2021 17:07:25 - INFO - __main__ - Step 21816: {'lr': 0.00047820974812870477, 'samples': 4188672, 'steps': 21815, 'loss/train': 1.5876659154891968} -08/30/2021 17:07:25 - INFO - __main__ - Step 21817: {'lr': 0.00047820758122905493, 'samples': 4188864, 'steps': 21816, 'loss/train': 1.1264034509658813} -08/30/2021 17:07:25 - INFO - __main__ - Step 21818: {'lr': 0.0004782054142265784, 'samples': 4189056, 'steps': 21817, 'loss/train': 1.609885573387146} -08/30/2021 17:07:26 - INFO - __main__ - Step 21819: {'lr': 0.00047820324712127593, 'samples': 4189248, 'steps': 21818, 'loss/train': 1.475606083869934} -08/30/2021 17:07:27 - INFO - __main__ - Step 21820: {'lr': 0.0004782010799131487, 'samples': 4189440, 'steps': 21819, 'loss/train': 1.5146722793579102} -08/30/2021 17:07:28 - INFO - __main__ - Step 21821: {'lr': 0.0004781989126021975, 'samples': 4189632, 'steps': 21820, 'loss/train': 1.1020145416259766} -08/30/2021 17:07:28 - INFO - __main__ - Step 21822: {'lr': 0.00047819674518842335, 'samples': 4189824, 'steps': 21821, 'loss/train': 1.297472596168518} -08/30/2021 17:07:28 - INFO - __main__ - Step 21823: {'lr': 0.00047819457767182735, 'samples': 4190016, 'steps': 21822, 'loss/train': 1.6172099113464355} -08/30/2021 17:07:29 - INFO - __main__ - Step 21824: {'lr': 0.0004781924100524104, 'samples': 4190208, 'steps': 21823, 'loss/train': 1.5605764389038086} -08/30/2021 17:07:30 - INFO - __main__ - Step 21825: {'lr': 0.00047819024233017337, 'samples': 4190400, 'steps': 21824, 'loss/train': 1.5563044548034668} -08/30/2021 17:07:31 - INFO - __main__ - Step 21826: {'lr': 0.00047818807450511746, 'samples': 4190592, 'steps': 21825, 'loss/train': 1.235628366470337} -08/30/2021 17:07:31 - INFO - __main__ - Step 21827: {'lr': 0.00047818590657724345, 'samples': 4190784, 'steps': 21826, 'loss/train': 1.9041955471038818} -08/30/2021 17:07:31 - INFO - __main__ - Step 21828: {'lr': 0.0004781837385465524, 'samples': 4190976, 'steps': 21827, 'loss/train': 1.5375030040740967} -08/30/2021 17:07:32 - INFO - __main__ - Step 21829: {'lr': 0.00047818157041304535, 'samples': 4191168, 'steps': 21828, 'loss/train': 2.0281591415405273} -08/30/2021 17:07:33 - INFO - __main__ - Step 21830: {'lr': 0.00047817940217672315, 'samples': 4191360, 'steps': 21829, 'loss/train': 0.9340408444404602} -08/30/2021 17:07:34 - INFO - __main__ - Step 21831: {'lr': 0.0004781772338375868, 'samples': 4191552, 'steps': 21830, 'loss/train': 1.8971073627471924} -08/30/2021 17:07:34 - INFO - __main__ - Step 21832: {'lr': 0.0004781750653956374, 'samples': 4191744, 'steps': 21831, 'loss/train': 2.3435568809509277} -08/30/2021 17:07:34 - INFO - __main__ - Step 21833: {'lr': 0.00047817289685087575, 'samples': 4191936, 'steps': 21832, 'loss/train': 0.17955322563648224} -08/30/2021 17:07:35 - INFO - __main__ - Step 21834: {'lr': 0.00047817072820330287, 'samples': 4192128, 'steps': 21833, 'loss/train': 1.461944580078125} -08/30/2021 17:07:36 - INFO - __main__ - Step 21835: {'lr': 0.0004781685594529199, 'samples': 4192320, 'steps': 21834, 'loss/train': 1.583033800125122} -08/30/2021 17:07:36 - INFO - __main__ - Step 21836: {'lr': 0.00047816639059972767, 'samples': 4192512, 'steps': 21835, 'loss/train': 1.778618335723877} -08/30/2021 17:07:37 - INFO - __main__ - Step 21837: {'lr': 0.00047816422164372713, 'samples': 4192704, 'steps': 21836, 'loss/train': 0.9923926591873169} -08/30/2021 17:07:37 - INFO - __main__ - Step 21838: {'lr': 0.00047816205258491935, 'samples': 4192896, 'steps': 21837, 'loss/train': 1.445613145828247} -08/30/2021 17:07:38 - INFO - __main__ - Step 21839: {'lr': 0.0004781598834233053, 'samples': 4193088, 'steps': 21838, 'loss/train': 1.4672938585281372} -08/30/2021 17:07:40 - INFO - __main__ - Step 21840: {'lr': 0.0004781577141588859, 'samples': 4193280, 'steps': 21839, 'loss/train': 1.6474761962890625} -08/30/2021 17:07:40 - INFO - __main__ - Step 21841: {'lr': 0.0004781555447916621, 'samples': 4193472, 'steps': 21840, 'loss/train': 1.7598116397857666} -08/30/2021 17:07:40 - INFO - __main__ - Step 21842: {'lr': 0.000478153375321635, 'samples': 4193664, 'steps': 21841, 'loss/train': 0.5458323955535889} -08/30/2021 17:07:41 - INFO - __main__ - Step 21843: {'lr': 0.0004781512057488055, 'samples': 4193856, 'steps': 21842, 'loss/train': 1.0545837879180908} -08/30/2021 17:07:41 - INFO - __main__ - Step 21844: {'lr': 0.00047814903607317454, 'samples': 4194048, 'steps': 21843, 'loss/train': 1.4126092195510864} -08/30/2021 17:07:43 - INFO - __main__ - Step 21845: {'lr': 0.00047814686629474323, 'samples': 4194240, 'steps': 21844, 'loss/train': 1.4072014093399048} -08/30/2021 17:07:43 - INFO - __main__ - Step 21846: {'lr': 0.00047814469641351237, 'samples': 4194432, 'steps': 21845, 'loss/train': 1.3051915168762207} -08/30/2021 17:07:43 - INFO - __main__ - Step 21847: {'lr': 0.0004781425264294831, 'samples': 4194624, 'steps': 21846, 'loss/train': 1.7459301948547363} -08/30/2021 17:07:44 - INFO - __main__ - Step 21848: {'lr': 0.0004781403563426563, 'samples': 4194816, 'steps': 21847, 'loss/train': 1.3173969984054565} -08/30/2021 17:07:44 - INFO - __main__ - Step 21849: {'lr': 0.00047813818615303295, 'samples': 4195008, 'steps': 21848, 'loss/train': 1.407995343208313} -08/30/2021 17:07:46 - INFO - __main__ - Step 21850: {'lr': 0.00047813601586061414, 'samples': 4195200, 'steps': 21849, 'loss/train': 1.3913586139678955} -08/30/2021 17:07:46 - INFO - __main__ - Step 21851: {'lr': 0.0004781338454654007, 'samples': 4195392, 'steps': 21850, 'loss/train': 1.4758920669555664} -08/30/2021 17:07:46 - INFO - __main__ - Step 21852: {'lr': 0.00047813167496739363, 'samples': 4195584, 'steps': 21851, 'loss/train': 2.059255838394165} -08/30/2021 17:07:47 - INFO - __main__ - Step 21853: {'lr': 0.00047812950436659405, 'samples': 4195776, 'steps': 21852, 'loss/train': 1.5771533250808716} -08/30/2021 17:07:47 - INFO - __main__ - Step 21854: {'lr': 0.0004781273336630028, 'samples': 4195968, 'steps': 21853, 'loss/train': 2.0807173252105713} -08/30/2021 17:07:49 - INFO - __main__ - Step 21855: {'lr': 0.00047812516285662086, 'samples': 4196160, 'steps': 21854, 'loss/train': 1.947556972503662} -08/30/2021 17:07:50 - INFO - __main__ - Step 21856: {'lr': 0.00047812299194744924, 'samples': 4196352, 'steps': 21855, 'loss/train': 1.3786648511886597} -08/30/2021 17:07:50 - INFO - __main__ - Step 21857: {'lr': 0.0004781208209354889, 'samples': 4196544, 'steps': 21856, 'loss/train': 0.08374021202325821} -08/30/2021 17:07:50 - INFO - __main__ - Step 21858: {'lr': 0.00047811864982074087, 'samples': 4196736, 'steps': 21857, 'loss/train': 1.6885826587677002} -08/30/2021 17:07:51 - INFO - __main__ - Step 21859: {'lr': 0.0004781164786032061, 'samples': 4196928, 'steps': 21858, 'loss/train': 0.2487347275018692} -08/30/2021 17:07:51 - INFO - __main__ - Step 21860: {'lr': 0.0004781143072828856, 'samples': 4197120, 'steps': 21859, 'loss/train': 0.22958756983280182} -08/30/2021 17:07:51 - INFO - __main__ - Step 21861: {'lr': 0.00047811213585978023, 'samples': 4197312, 'steps': 21860, 'loss/train': 1.1175928115844727} -08/30/2021 17:07:53 - INFO - __main__ - Step 21862: {'lr': 0.0004781099643338911, 'samples': 4197504, 'steps': 21861, 'loss/train': 2.00122332572937} -08/30/2021 17:07:54 - INFO - __main__ - Step 21863: {'lr': 0.00047810779270521914, 'samples': 4197696, 'steps': 21862, 'loss/train': 1.7286481857299805} -08/30/2021 17:07:54 - INFO - __main__ - Step 21864: {'lr': 0.0004781056209737653, 'samples': 4197888, 'steps': 21863, 'loss/train': 0.907160222530365} -08/30/2021 17:07:54 - INFO - __main__ - Step 21865: {'lr': 0.00047810344913953065, 'samples': 4198080, 'steps': 21864, 'loss/train': 2.0779623985290527} -08/30/2021 17:07:55 - INFO - __main__ - Step 21866: {'lr': 0.0004781012772025161, 'samples': 4198272, 'steps': 21865, 'loss/train': 1.2352877855300903} -08/30/2021 17:07:56 - INFO - __main__ - Step 21867: {'lr': 0.0004780991051627226, 'samples': 4198464, 'steps': 21866, 'loss/train': 0.18139822781085968} -08/30/2021 17:07:57 - INFO - __main__ - Step 21868: {'lr': 0.0004780969330201511, 'samples': 4198656, 'steps': 21867, 'loss/train': 1.1665617227554321} -08/30/2021 17:07:57 - INFO - __main__ - Step 21869: {'lr': 0.0004780947607748027, 'samples': 4198848, 'steps': 21868, 'loss/train': 1.9979071617126465} -08/30/2021 17:07:57 - INFO - __main__ - Step 21870: {'lr': 0.00047809258842667837, 'samples': 4199040, 'steps': 21869, 'loss/train': 1.86331307888031} -08/30/2021 17:07:58 - INFO - __main__ - Step 21871: {'lr': 0.000478090415975779, 'samples': 4199232, 'steps': 21870, 'loss/train': 1.8044943809509277} -08/30/2021 17:07:58 - INFO - __main__ - Step 21872: {'lr': 0.00047808824342210565, 'samples': 4199424, 'steps': 21871, 'loss/train': 1.467484951019287} -08/30/2021 17:08:00 - INFO - __main__ - Step 21873: {'lr': 0.0004780860707656592, 'samples': 4199616, 'steps': 21872, 'loss/train': 1.7816983461380005} -08/30/2021 17:08:00 - INFO - __main__ - Step 21874: {'lr': 0.0004780838980064407, 'samples': 4199808, 'steps': 21873, 'loss/train': 1.5336304903030396} -08/30/2021 17:08:01 - INFO - __main__ - Step 21875: {'lr': 0.00047808172514445115, 'samples': 4200000, 'steps': 21874, 'loss/train': 0.0895189642906189} -08/30/2021 17:08:01 - INFO - __main__ - Step 21876: {'lr': 0.0004780795521796914, 'samples': 4200192, 'steps': 21875, 'loss/train': 1.2236469984054565} -08/30/2021 17:08:01 - INFO - __main__ - Step 21877: {'lr': 0.0004780773791121626, 'samples': 4200384, 'steps': 21876, 'loss/train': 1.1106677055358887} -08/30/2021 17:08:03 - INFO - __main__ - Step 21878: {'lr': 0.0004780752059418656, 'samples': 4200576, 'steps': 21877, 'loss/train': 1.9841495752334595} -08/30/2021 17:08:03 - INFO - __main__ - Step 21879: {'lr': 0.0004780730326688015, 'samples': 4200768, 'steps': 21878, 'loss/train': 1.4923685789108276} -08/30/2021 17:08:04 - INFO - __main__ - Step 21880: {'lr': 0.0004780708592929712, 'samples': 4200960, 'steps': 21879, 'loss/train': 1.6637871265411377} -08/30/2021 17:08:04 - INFO - __main__ - Step 21881: {'lr': 0.0004780686858143756, 'samples': 4201152, 'steps': 21880, 'loss/train': 1.4183932542800903} -08/30/2021 17:08:04 - INFO - __main__ - Step 21882: {'lr': 0.0004780665122330159, 'samples': 4201344, 'steps': 21881, 'loss/train': 1.4498711824417114} -08/30/2021 17:08:06 - INFO - __main__ - Step 21883: {'lr': 0.00047806433854889285, 'samples': 4201536, 'steps': 21882, 'loss/train': 1.8202253580093384} -08/30/2021 17:08:06 - INFO - __main__ - Step 21884: {'lr': 0.0004780621647620076, 'samples': 4201728, 'steps': 21883, 'loss/train': 1.8336007595062256} -08/30/2021 17:08:07 - INFO - __main__ - Step 21885: {'lr': 0.00047805999087236097, 'samples': 4201920, 'steps': 21884, 'loss/train': 1.5845669507980347} -08/30/2021 17:08:07 - INFO - __main__ - Step 21886: {'lr': 0.0004780578168799541, 'samples': 4202112, 'steps': 21885, 'loss/train': 2.684797763824463} -08/30/2021 17:08:07 - INFO - __main__ - Step 21887: {'lr': 0.00047805564278478787, 'samples': 4202304, 'steps': 21886, 'loss/train': 1.976189136505127} -08/30/2021 17:08:09 - INFO - __main__ - Step 21888: {'lr': 0.00047805346858686325, 'samples': 4202496, 'steps': 21887, 'loss/train': 0.3722270131111145} -08/30/2021 17:08:09 - INFO - __main__ - Step 21889: {'lr': 0.0004780512942861813, 'samples': 4202688, 'steps': 21888, 'loss/train': 1.7283111810684204} -08/30/2021 17:08:10 - INFO - __main__ - Step 21890: {'lr': 0.00047804911988274303, 'samples': 4202880, 'steps': 21889, 'loss/train': 1.2118431329727173} -08/30/2021 17:08:10 - INFO - __main__ - Step 21891: {'lr': 0.00047804694537654927, 'samples': 4203072, 'steps': 21890, 'loss/train': 1.284872055053711} -08/30/2021 17:08:11 - INFO - __main__ - Step 21892: {'lr': 0.00047804477076760106, 'samples': 4203264, 'steps': 21891, 'loss/train': 1.4628698825836182} -08/30/2021 17:08:12 - INFO - __main__ - Step 21893: {'lr': 0.0004780425960558994, 'samples': 4203456, 'steps': 21892, 'loss/train': 1.623253583908081} -08/30/2021 17:08:13 - INFO - __main__ - Step 21894: {'lr': 0.00047804042124144526, 'samples': 4203648, 'steps': 21893, 'loss/train': 1.5874764919281006} -08/30/2021 17:08:13 - INFO - __main__ - Step 21895: {'lr': 0.00047803824632423967, 'samples': 4203840, 'steps': 21894, 'loss/train': 2.083956480026245} -08/30/2021 17:08:13 - INFO - __main__ - Step 21896: {'lr': 0.0004780360713042835, 'samples': 4204032, 'steps': 21895, 'loss/train': 1.4926472902297974} -08/30/2021 17:08:14 - INFO - __main__ - Step 21897: {'lr': 0.0004780338961815779, 'samples': 4204224, 'steps': 21896, 'loss/train': 1.7445399761199951} -08/30/2021 17:08:16 - INFO - __main__ - Step 21898: {'lr': 0.00047803172095612365, 'samples': 4204416, 'steps': 21897, 'loss/train': 1.6326509714126587} -08/30/2021 17:08:16 - INFO - __main__ - Step 21899: {'lr': 0.00047802954562792185, 'samples': 4204608, 'steps': 21898, 'loss/train': 1.4807627201080322} -08/30/2021 17:08:16 - INFO - __main__ - Step 21900: {'lr': 0.0004780273701969734, 'samples': 4204800, 'steps': 21899, 'loss/train': 1.3924874067306519} -08/30/2021 17:08:17 - INFO - __main__ - Step 21901: {'lr': 0.00047802519466327945, 'samples': 4204992, 'steps': 21900, 'loss/train': 1.9246954917907715} -08/30/2021 17:08:17 - INFO - __main__ - Step 21902: {'lr': 0.00047802301902684076, 'samples': 4205184, 'steps': 21901, 'loss/train': 1.831890344619751} -08/30/2021 17:08:17 - INFO - __main__ - Step 21903: {'lr': 0.0004780208432876585, 'samples': 4205376, 'steps': 21902, 'loss/train': 1.668404221534729} -08/30/2021 17:08:19 - INFO - __main__ - Step 21904: {'lr': 0.00047801866744573353, 'samples': 4205568, 'steps': 21903, 'loss/train': 1.7075095176696777} -08/30/2021 17:08:20 - INFO - __main__ - Step 21905: {'lr': 0.00047801649150106684, 'samples': 4205760, 'steps': 21904, 'loss/train': 1.4642846584320068} -08/30/2021 17:08:20 - INFO - __main__ - Step 21906: {'lr': 0.00047801431545365947, 'samples': 4205952, 'steps': 21905, 'loss/train': 1.674008846282959} -08/30/2021 17:08:20 - INFO - __main__ - Step 21907: {'lr': 0.0004780121393035124, 'samples': 4206144, 'steps': 21906, 'loss/train': 1.1540557146072388} -08/30/2021 17:08:21 - INFO - __main__ - Step 21908: {'lr': 0.0004780099630506265, 'samples': 4206336, 'steps': 21907, 'loss/train': 1.779233694076538} -08/30/2021 17:08:22 - INFO - __main__ - Step 21909: {'lr': 0.0004780077866950029, 'samples': 4206528, 'steps': 21908, 'loss/train': 0.6303631067276001} -08/30/2021 17:08:23 - INFO - __main__ - Step 21910: {'lr': 0.00047800561023664246, 'samples': 4206720, 'steps': 21909, 'loss/train': 1.7209911346435547} -08/30/2021 17:08:23 - INFO - __main__ - Step 21911: {'lr': 0.0004780034336755462, 'samples': 4206912, 'steps': 21910, 'loss/train': 1.7233561277389526} -08/30/2021 17:08:23 - INFO - __main__ - Step 21912: {'lr': 0.00047800125701171517, 'samples': 4207104, 'steps': 21911, 'loss/train': 2.067147731781006} -08/30/2021 17:08:24 - INFO - __main__ - Step 21913: {'lr': 0.00047799908024515026, 'samples': 4207296, 'steps': 21912, 'loss/train': 1.0405805110931396} -08/30/2021 17:08:25 - INFO - __main__ - Step 21914: {'lr': 0.0004779969033758525, 'samples': 4207488, 'steps': 21913, 'loss/train': 1.331740379333496} -08/30/2021 17:08:26 - INFO - __main__ - Step 21915: {'lr': 0.00047799472640382287, 'samples': 4207680, 'steps': 21914, 'loss/train': 1.4365123510360718} -08/30/2021 17:08:26 - INFO - __main__ - Step 21916: {'lr': 0.0004779925493290623, 'samples': 4207872, 'steps': 21915, 'loss/train': 1.0958466529846191} -08/30/2021 17:08:27 - INFO - __main__ - Step 21917: {'lr': 0.00047799037215157184, 'samples': 4208064, 'steps': 21916, 'loss/train': 1.3608423471450806} -08/30/2021 17:08:27 - INFO - __main__ - Step 21918: {'lr': 0.0004779881948713524, 'samples': 4208256, 'steps': 21917, 'loss/train': 0.11266614496707916} -08/30/2021 17:08:28 - INFO - __main__ - Step 21919: {'lr': 0.000477986017488405, 'samples': 4208448, 'steps': 21918, 'loss/train': 1.7626110315322876} -08/30/2021 17:08:29 - INFO - __main__ - Step 21920: {'lr': 0.00047798384000273053, 'samples': 4208640, 'steps': 21919, 'loss/train': 0.45796090364456177} -08/30/2021 17:08:29 - INFO - __main__ - Step 21921: {'lr': 0.0004779816624143302, 'samples': 4208832, 'steps': 21920, 'loss/train': 1.6454553604125977} -08/30/2021 17:08:29 - INFO - __main__ - Step 21922: {'lr': 0.0004779794847232048, 'samples': 4209024, 'steps': 21921, 'loss/train': 2.0480148792266846} -08/30/2021 17:08:30 - INFO - __main__ - Step 21923: {'lr': 0.0004779773069293554, 'samples': 4209216, 'steps': 21922, 'loss/train': 1.4627642631530762} -08/30/2021 17:08:31 - INFO - __main__ - Step 21924: {'lr': 0.00047797512903278283, 'samples': 4209408, 'steps': 21923, 'loss/train': 1.6264673471450806} -08/30/2021 17:08:32 - INFO - __main__ - Step 21925: {'lr': 0.0004779729510334883, 'samples': 4209600, 'steps': 21924, 'loss/train': 1.714000940322876} -08/30/2021 17:08:32 - INFO - __main__ - Step 21926: {'lr': 0.0004779707729314726, 'samples': 4209792, 'steps': 21925, 'loss/train': 1.7017693519592285} -08/30/2021 17:08:33 - INFO - __main__ - Step 21927: {'lr': 0.0004779685947267369, 'samples': 4209984, 'steps': 21926, 'loss/train': 2.342733383178711} -08/30/2021 17:08:33 - INFO - __main__ - Step 21928: {'lr': 0.00047796641641928195, 'samples': 4210176, 'steps': 21927, 'loss/train': 1.6500569581985474} -08/30/2021 17:08:33 - INFO - __main__ - Step 21929: {'lr': 0.00047796423800910894, 'samples': 4210368, 'steps': 21928, 'loss/train': 1.351326823234558} -08/30/2021 17:08:35 - INFO - __main__ - Step 21930: {'lr': 0.00047796205949621873, 'samples': 4210560, 'steps': 21929, 'loss/train': 1.819567084312439} -08/30/2021 17:08:35 - INFO - __main__ - Step 21931: {'lr': 0.00047795988088061224, 'samples': 4210752, 'steps': 21930, 'loss/train': 2.0995278358459473} -08/30/2021 17:08:36 - INFO - __main__ - Step 21932: {'lr': 0.00047795770216229065, 'samples': 4210944, 'steps': 21931, 'loss/train': 1.5262372493743896} -08/30/2021 17:08:36 - INFO - __main__ - Step 21933: {'lr': 0.0004779555233412548, 'samples': 4211136, 'steps': 21932, 'loss/train': 1.0073091983795166} -08/30/2021 17:08:36 - INFO - __main__ - Step 21934: {'lr': 0.0004779533444175058, 'samples': 4211328, 'steps': 21933, 'loss/train': 1.5977104902267456} -08/30/2021 17:08:38 - INFO - __main__ - Step 21935: {'lr': 0.00047795116539104445, 'samples': 4211520, 'steps': 21934, 'loss/train': 1.2242472171783447} -08/30/2021 17:08:38 - INFO - __main__ - Step 21936: {'lr': 0.0004779489862618718, 'samples': 4211712, 'steps': 21935, 'loss/train': 1.6662166118621826} -08/30/2021 17:08:39 - INFO - __main__ - Step 21937: {'lr': 0.00047794680702998893, 'samples': 4211904, 'steps': 21936, 'loss/train': 0.9240788817405701} -08/30/2021 17:08:39 - INFO - __main__ - Step 21938: {'lr': 0.0004779446276953967, 'samples': 4212096, 'steps': 21937, 'loss/train': 0.2507948577404022} -08/30/2021 17:08:39 - INFO - __main__ - Step 21939: {'lr': 0.00047794244825809614, 'samples': 4212288, 'steps': 21938, 'loss/train': 1.4775242805480957} -08/30/2021 17:08:40 - INFO - __main__ - Step 21940: {'lr': 0.0004779402687180882, 'samples': 4212480, 'steps': 21939, 'loss/train': 1.4736164808273315} -08/30/2021 17:08:41 - INFO - __main__ - Step 21941: {'lr': 0.00047793808907537394, 'samples': 4212672, 'steps': 21940, 'loss/train': 1.6653746366500854} -08/30/2021 17:08:42 - INFO - __main__ - Step 21942: {'lr': 0.0004779359093299543, 'samples': 4212864, 'steps': 21941, 'loss/train': 1.8226401805877686} -08/30/2021 17:08:42 - INFO - __main__ - Step 21943: {'lr': 0.00047793372948183024, 'samples': 4213056, 'steps': 21942, 'loss/train': 1.7302875518798828} -08/30/2021 17:08:42 - INFO - __main__ - Step 21944: {'lr': 0.0004779315495310027, 'samples': 4213248, 'steps': 21943, 'loss/train': 1.924445629119873} -08/30/2021 17:08:43 - INFO - __main__ - Step 21945: {'lr': 0.00047792936947747285, 'samples': 4213440, 'steps': 21944, 'loss/train': 1.7569037675857544} -08/30/2021 17:08:44 - INFO - __main__ - Step 21946: {'lr': 0.00047792718932124147, 'samples': 4213632, 'steps': 21945, 'loss/train': 2.1364247798919678} -08/30/2021 17:08:45 - INFO - __main__ - Step 21947: {'lr': 0.00047792500906230963, 'samples': 4213824, 'steps': 21946, 'loss/train': 1.0786246061325073} -08/30/2021 17:08:45 - INFO - __main__ - Step 21948: {'lr': 0.00047792282870067827, 'samples': 4214016, 'steps': 21947, 'loss/train': 0.824955403804779} -08/30/2021 17:08:46 - INFO - __main__ - Step 21949: {'lr': 0.0004779206482363484, 'samples': 4214208, 'steps': 21948, 'loss/train': 2.175302267074585} -08/30/2021 17:08:46 - INFO - __main__ - Step 21950: {'lr': 0.000477918467669321, 'samples': 4214400, 'steps': 21949, 'loss/train': 1.7836651802062988} -08/30/2021 17:08:48 - INFO - __main__ - Step 21951: {'lr': 0.0004779162869995971, 'samples': 4214592, 'steps': 21950, 'loss/train': 1.2974724769592285} -08/30/2021 17:08:49 - INFO - __main__ - Step 21952: {'lr': 0.00047791410622717757, 'samples': 4214784, 'steps': 21951, 'loss/train': 1.5132735967636108} -08/30/2021 17:08:49 - INFO - __main__ - Step 21953: {'lr': 0.0004779119253520635, 'samples': 4214976, 'steps': 21952, 'loss/train': 1.8830792903900146} -08/30/2021 17:08:49 - INFO - __main__ - Step 21954: {'lr': 0.0004779097443742558, 'samples': 4215168, 'steps': 21953, 'loss/train': 1.4688997268676758} -08/30/2021 17:08:50 - INFO - __main__ - Step 21955: {'lr': 0.0004779075632937556, 'samples': 4215360, 'steps': 21954, 'loss/train': 1.3895879983901978} -08/30/2021 17:08:51 - INFO - __main__ - Step 21956: {'lr': 0.00047790538211056366, 'samples': 4215552, 'steps': 21955, 'loss/train': 1.9342215061187744} -08/30/2021 17:08:52 - INFO - __main__ - Step 21957: {'lr': 0.00047790320082468106, 'samples': 4215744, 'steps': 21956, 'loss/train': 1.418033242225647} -08/30/2021 17:08:52 - INFO - __main__ - Step 21958: {'lr': 0.00047790101943610884, 'samples': 4215936, 'steps': 21957, 'loss/train': 1.506151795387268} -08/30/2021 17:08:53 - INFO - __main__ - Step 21959: {'lr': 0.000477898837944848, 'samples': 4216128, 'steps': 21958, 'loss/train': 1.7700694799423218} -08/30/2021 17:08:53 - INFO - __main__ - Step 21960: {'lr': 0.0004778966563508994, 'samples': 4216320, 'steps': 21959, 'loss/train': 0.7527241110801697} -08/30/2021 17:08:53 - INFO - __main__ - Step 21961: {'lr': 0.00047789447465426406, 'samples': 4216512, 'steps': 21960, 'loss/train': 1.2421972751617432} -08/30/2021 17:08:55 - INFO - __main__ - Step 21962: {'lr': 0.000477892292854943, 'samples': 4216704, 'steps': 21961, 'loss/train': 2.6127634048461914} -08/30/2021 17:08:55 - INFO - __main__ - Step 21963: {'lr': 0.00047789011095293723, 'samples': 4216896, 'steps': 21962, 'loss/train': 1.4230536222457886} -08/30/2021 17:08:56 - INFO - __main__ - Step 21964: {'lr': 0.0004778879289482476, 'samples': 4217088, 'steps': 21963, 'loss/train': 1.4664710760116577} -08/30/2021 17:08:56 - INFO - __main__ - Step 21965: {'lr': 0.00047788574684087527, 'samples': 4217280, 'steps': 21964, 'loss/train': 0.14407892525196075} -08/30/2021 17:08:56 - INFO - __main__ - Step 21966: {'lr': 0.0004778835646308211, 'samples': 4217472, 'steps': 21965, 'loss/train': 1.5930671691894531} -08/30/2021 17:08:58 - INFO - __main__ - Step 21967: {'lr': 0.0004778813823180861, 'samples': 4217664, 'steps': 21966, 'loss/train': 1.876437783241272} -08/30/2021 17:08:58 - INFO - __main__ - Step 21968: {'lr': 0.0004778791999026713, 'samples': 4217856, 'steps': 21967, 'loss/train': 1.6596248149871826} -08/30/2021 17:08:59 - INFO - __main__ - Step 21969: {'lr': 0.0004778770173845777, 'samples': 4218048, 'steps': 21968, 'loss/train': 1.4142649173736572} -08/30/2021 17:08:59 - INFO - __main__ - Step 21970: {'lr': 0.00047787483476380613, 'samples': 4218240, 'steps': 21969, 'loss/train': 1.1690462827682495} -08/30/2021 17:08:59 - INFO - __main__ - Step 21971: {'lr': 0.0004778726520403577, 'samples': 4218432, 'steps': 21970, 'loss/train': 1.791285514831543} -08/30/2021 17:09:01 - INFO - __main__ - Step 21972: {'lr': 0.00047787046921423336, 'samples': 4218624, 'steps': 21971, 'loss/train': 1.278337836265564} -08/30/2021 17:09:01 - INFO - __main__ - Step 21973: {'lr': 0.00047786828628543416, 'samples': 4218816, 'steps': 21972, 'loss/train': 2.0375607013702393} -08/30/2021 17:09:02 - INFO - __main__ - Step 21974: {'lr': 0.00047786610325396096, 'samples': 4219008, 'steps': 21973, 'loss/train': 1.6423488855361938} -08/30/2021 17:09:02 - INFO - __main__ - Step 21975: {'lr': 0.0004778639201198149, 'samples': 4219200, 'steps': 21974, 'loss/train': 1.9463797807693481} -08/30/2021 17:09:03 - INFO - __main__ - Step 21976: {'lr': 0.00047786173688299684, 'samples': 4219392, 'steps': 21975, 'loss/train': 2.127964496612549} -08/30/2021 17:09:03 - INFO - __main__ - Step 21977: {'lr': 0.00047785955354350776, 'samples': 4219584, 'steps': 21976, 'loss/train': 1.3553804159164429} -08/30/2021 17:09:04 - INFO - __main__ - Step 21978: {'lr': 0.00047785737010134865, 'samples': 4219776, 'steps': 21977, 'loss/train': 1.9687639474868774} -08/30/2021 17:09:05 - INFO - __main__ - Step 21979: {'lr': 0.0004778551865565206, 'samples': 4219968, 'steps': 21978, 'loss/train': 0.9866222739219666} -08/30/2021 17:09:05 - INFO - __main__ - Step 21980: {'lr': 0.00047785300290902446, 'samples': 4220160, 'steps': 21979, 'loss/train': 1.6148606538772583} -08/30/2021 17:09:05 - INFO - __main__ - Step 21981: {'lr': 0.0004778508191588613, 'samples': 4220352, 'steps': 21980, 'loss/train': 1.819076657295227} -08/30/2021 17:09:06 - INFO - __main__ - Step 21982: {'lr': 0.00047784863530603213, 'samples': 4220544, 'steps': 21981, 'loss/train': 1.618833065032959} -08/30/2021 17:09:07 - INFO - __main__ - Step 21983: {'lr': 0.0004778464513505378, 'samples': 4220736, 'steps': 21982, 'loss/train': 1.7028850317001343} -08/30/2021 17:09:08 - INFO - __main__ - Step 21984: {'lr': 0.0004778442672923794, 'samples': 4220928, 'steps': 21983, 'loss/train': 1.8046437501907349} -08/30/2021 17:09:08 - INFO - __main__ - Step 21985: {'lr': 0.0004778420831315579, 'samples': 4221120, 'steps': 21984, 'loss/train': 1.4114447832107544} -08/30/2021 17:09:09 - INFO - __main__ - Step 21986: {'lr': 0.0004778398988680743, 'samples': 4221312, 'steps': 21985, 'loss/train': 1.4717018604278564} -08/30/2021 17:09:09 - INFO - __main__ - Step 21987: {'lr': 0.00047783771450192946, 'samples': 4221504, 'steps': 21986, 'loss/train': 1.534753441810608} -08/30/2021 17:09:10 - INFO - __main__ - Step 21988: {'lr': 0.00047783553003312456, 'samples': 4221696, 'steps': 21987, 'loss/train': 1.4537556171417236} -08/30/2021 17:09:11 - INFO - __main__ - Step 21989: {'lr': 0.00047783334546166046, 'samples': 4221888, 'steps': 21988, 'loss/train': 1.511865258216858} -08/30/2021 17:09:11 - INFO - __main__ - Step 21990: {'lr': 0.0004778311607875382, 'samples': 4222080, 'steps': 21989, 'loss/train': 1.6200644969940186} -08/30/2021 17:09:12 - INFO - __main__ - Step 21991: {'lr': 0.0004778289760107587, 'samples': 4222272, 'steps': 21990, 'loss/train': 1.7906439304351807} -08/30/2021 17:09:12 - INFO - __main__ - Step 21992: {'lr': 0.00047782679113132293, 'samples': 4222464, 'steps': 21991, 'loss/train': 0.6283571720123291} -08/30/2021 17:09:13 - INFO - __main__ - Step 21993: {'lr': 0.00047782460614923195, 'samples': 4222656, 'steps': 21992, 'loss/train': 1.5765588283538818} -08/30/2021 17:09:14 - INFO - __main__ - Step 21994: {'lr': 0.00047782242106448675, 'samples': 4222848, 'steps': 21993, 'loss/train': 2.792832851409912} -08/30/2021 17:09:14 - INFO - __main__ - Step 21995: {'lr': 0.00047782023587708826, 'samples': 4223040, 'steps': 21994, 'loss/train': 1.3331061601638794} -08/30/2021 17:09:15 - INFO - __main__ - Step 21996: {'lr': 0.0004778180505870375, 'samples': 4223232, 'steps': 21995, 'loss/train': 1.5808993577957153} -08/30/2021 17:09:15 - INFO - __main__ - Step 21997: {'lr': 0.0004778158651943355, 'samples': 4223424, 'steps': 21996, 'loss/train': 1.5907156467437744} -08/30/2021 17:09:16 - INFO - __main__ - Step 21998: {'lr': 0.0004778136796989831, 'samples': 4223616, 'steps': 21997, 'loss/train': 1.80043363571167} -08/30/2021 17:09:17 - INFO - __main__ - Step 21999: {'lr': 0.0004778114941009814, 'samples': 4223808, 'steps': 21998, 'loss/train': 1.2608749866485596} -08/30/2021 17:09:17 - INFO - __main__ - Step 22000: {'lr': 0.0004778093084003313, 'samples': 4224000, 'steps': 21999, 'loss/train': 0.8539326190948486} -08/30/2021 17:09:18 - INFO - __main__ - Step 22001: {'lr': 0.00047780712259703394, 'samples': 4224192, 'steps': 22000, 'loss/train': 1.4201937913894653} -08/30/2021 17:09:18 - INFO - __main__ - Step 22002: {'lr': 0.00047780493669109017, 'samples': 4224384, 'steps': 22001, 'loss/train': 1.4182732105255127} -08/30/2021 17:09:20 - INFO - __main__ - Step 22003: {'lr': 0.000477802750682501, 'samples': 4224576, 'steps': 22002, 'loss/train': 1.5219247341156006} -08/30/2021 17:09:20 - INFO - __main__ - Step 22004: {'lr': 0.0004778005645712674, 'samples': 4224768, 'steps': 22003, 'loss/train': 1.7167892456054688} -08/30/2021 17:09:20 - INFO - __main__ - Step 22005: {'lr': 0.00047779837835739043, 'samples': 4224960, 'steps': 22004, 'loss/train': 0.8052094578742981} -08/30/2021 17:09:21 - INFO - __main__ - Step 22006: {'lr': 0.000477796192040871, 'samples': 4225152, 'steps': 22005, 'loss/train': 1.5867869853973389} -08/30/2021 17:09:21 - INFO - __main__ - Step 22007: {'lr': 0.00047779400562171016, 'samples': 4225344, 'steps': 22006, 'loss/train': 1.7160247564315796} -08/30/2021 17:09:21 - INFO - __main__ - Step 22008: {'lr': 0.00047779181909990876, 'samples': 4225536, 'steps': 22007, 'loss/train': 1.509312391281128} -08/30/2021 17:09:23 - INFO - __main__ - Step 22009: {'lr': 0.000477789632475468, 'samples': 4225728, 'steps': 22008, 'loss/train': 1.5153206586837769} -08/30/2021 17:09:24 - INFO - __main__ - Step 22010: {'lr': 0.00047778744574838864, 'samples': 4225920, 'steps': 22009, 'loss/train': 2.194248676300049} -08/30/2021 17:09:24 - INFO - __main__ - Step 22011: {'lr': 0.00047778525891867187, 'samples': 4226112, 'steps': 22010, 'loss/train': 2.2969167232513428} -08/30/2021 17:09:25 - INFO - __main__ - Step 22012: {'lr': 0.00047778307198631856, 'samples': 4226304, 'steps': 22011, 'loss/train': 1.2941278219223022} -08/30/2021 17:09:25 - INFO - __main__ - Step 22013: {'lr': 0.00047778088495132963, 'samples': 4226496, 'steps': 22012, 'loss/train': 1.1696702241897583} -08/30/2021 17:09:26 - INFO - __main__ - Step 22014: {'lr': 0.0004777786978137062, 'samples': 4226688, 'steps': 22013, 'loss/train': 1.2197378873825073} -08/30/2021 17:09:27 - INFO - __main__ - Step 22015: {'lr': 0.00047777651057344915, 'samples': 4226880, 'steps': 22014, 'loss/train': 1.7497295141220093} -08/30/2021 17:09:27 - INFO - __main__ - Step 22016: {'lr': 0.0004777743232305596, 'samples': 4227072, 'steps': 22015, 'loss/train': 1.6060482263565063} -08/30/2021 17:09:28 - INFO - __main__ - Step 22017: {'lr': 0.00047777213578503844, 'samples': 4227264, 'steps': 22016, 'loss/train': 1.1682275533676147} -08/30/2021 17:09:28 - INFO - __main__ - Step 22018: {'lr': 0.0004777699482368867, 'samples': 4227456, 'steps': 22017, 'loss/train': 1.8457088470458984} -08/30/2021 17:09:29 - INFO - __main__ - Step 22019: {'lr': 0.00047776776058610525, 'samples': 4227648, 'steps': 22018, 'loss/train': 2.1102287769317627} -08/30/2021 17:09:30 - INFO - __main__ - Step 22020: {'lr': 0.0004777655728326952, 'samples': 4227840, 'steps': 22019, 'loss/train': 1.5147463083267212} -08/30/2021 17:09:30 - INFO - __main__ - Step 22021: {'lr': 0.0004777633849766575, 'samples': 4228032, 'steps': 22020, 'loss/train': 2.064711570739746} -08/30/2021 17:09:31 - INFO - __main__ - Step 22022: {'lr': 0.00047776119701799317, 'samples': 4228224, 'steps': 22021, 'loss/train': 1.7333000898361206} -08/30/2021 17:09:31 - INFO - __main__ - Step 22023: {'lr': 0.0004777590089567031, 'samples': 4228416, 'steps': 22022, 'loss/train': 1.8635295629501343} -08/30/2021 17:09:33 - INFO - __main__ - Step 22024: {'lr': 0.00047775682079278836, 'samples': 4228608, 'steps': 22023, 'loss/train': 1.6678019762039185} -08/30/2021 17:09:33 - INFO - __main__ - Step 22025: {'lr': 0.0004777546325262499, 'samples': 4228800, 'steps': 22024, 'loss/train': 1.0993646383285522} -08/30/2021 17:09:34 - INFO - __main__ - Step 22026: {'lr': 0.00047775244415708873, 'samples': 4228992, 'steps': 22025, 'loss/train': 1.463771104812622} -08/30/2021 17:09:34 - INFO - __main__ - Step 22027: {'lr': 0.0004777502556853058, 'samples': 4229184, 'steps': 22026, 'loss/train': 0.112718865275383} -08/30/2021 17:09:34 - INFO - __main__ - Step 22028: {'lr': 0.00047774806711090213, 'samples': 4229376, 'steps': 22027, 'loss/train': 1.41226065158844} -08/30/2021 17:09:36 - INFO - __main__ - Step 22029: {'lr': 0.0004777458784338787, 'samples': 4229568, 'steps': 22028, 'loss/train': 1.7554728984832764} -08/30/2021 17:09:36 - INFO - __main__ - Step 22030: {'lr': 0.00047774368965423653, 'samples': 4229760, 'steps': 22029, 'loss/train': 1.7022331953048706} -08/30/2021 17:09:36 - INFO - __main__ - Step 22031: {'lr': 0.0004777415007719765, 'samples': 4229952, 'steps': 22030, 'loss/train': 1.380596399307251} -08/30/2021 17:09:37 - INFO - __main__ - Step 22032: {'lr': 0.00047773931178709975, 'samples': 4230144, 'steps': 22031, 'loss/train': 1.567521333694458} -08/30/2021 17:09:37 - INFO - __main__ - Step 22033: {'lr': 0.00047773712269960714, 'samples': 4230336, 'steps': 22032, 'loss/train': 1.3691271543502808} -08/30/2021 17:09:39 - INFO - __main__ - Step 22034: {'lr': 0.00047773493350949963, 'samples': 4230528, 'steps': 22033, 'loss/train': 1.634064793586731} -08/30/2021 17:09:39 - INFO - __main__ - Step 22035: {'lr': 0.00047773274421677834, 'samples': 4230720, 'steps': 22034, 'loss/train': 0.20929567515850067} -08/30/2021 17:09:39 - INFO - __main__ - Step 22036: {'lr': 0.0004777305548214442, 'samples': 4230912, 'steps': 22035, 'loss/train': 1.8736116886138916} -08/30/2021 17:09:40 - INFO - __main__ - Step 22037: {'lr': 0.0004777283653234982, 'samples': 4231104, 'steps': 22036, 'loss/train': 1.4712235927581787} -08/30/2021 17:09:40 - INFO - __main__ - Step 22038: {'lr': 0.00047772617572294123, 'samples': 4231296, 'steps': 22037, 'loss/train': 1.524675726890564} -08/30/2021 17:09:41 - INFO - __main__ - Step 22039: {'lr': 0.0004777239860197744, 'samples': 4231488, 'steps': 22038, 'loss/train': 1.3708162307739258} -08/30/2021 17:09:42 - INFO - __main__ - Step 22040: {'lr': 0.0004777217962139987, 'samples': 4231680, 'steps': 22039, 'loss/train': 1.613618016242981} -08/30/2021 17:09:43 - INFO - __main__ - Step 22041: {'lr': 0.000477719606305615, 'samples': 4231872, 'steps': 22040, 'loss/train': 1.3604282140731812} -08/30/2021 17:09:43 - INFO - __main__ - Step 22042: {'lr': 0.0004777174162946244, 'samples': 4232064, 'steps': 22041, 'loss/train': 1.1682003736495972} -08/30/2021 17:09:43 - INFO - __main__ - Step 22043: {'lr': 0.0004777152261810279, 'samples': 4232256, 'steps': 22042, 'loss/train': 1.8293678760528564} -08/30/2021 17:09:44 - INFO - __main__ - Step 22044: {'lr': 0.0004777130359648263, 'samples': 4232448, 'steps': 22043, 'loss/train': 0.9608367681503296} -08/30/2021 17:09:45 - INFO - __main__ - Step 22045: {'lr': 0.0004777108456460208, 'samples': 4232640, 'steps': 22044, 'loss/train': 1.5555115938186646} -08/30/2021 17:09:46 - INFO - __main__ - Step 22046: {'lr': 0.00047770865522461233, 'samples': 4232832, 'steps': 22045, 'loss/train': 1.3933627605438232} -08/30/2021 17:09:46 - INFO - __main__ - Step 22047: {'lr': 0.0004777064647006018, 'samples': 4233024, 'steps': 22046, 'loss/train': 2.507596969604492} -08/30/2021 17:09:46 - INFO - __main__ - Step 22048: {'lr': 0.0004777042740739903, 'samples': 4233216, 'steps': 22047, 'loss/train': 1.6716880798339844} -08/30/2021 17:09:47 - INFO - __main__ - Step 22049: {'lr': 0.0004777020833447787, 'samples': 4233408, 'steps': 22048, 'loss/train': 0.8102055191993713} -08/30/2021 17:09:48 - INFO - __main__ - Step 22050: {'lr': 0.0004776998925129681, 'samples': 4233600, 'steps': 22049, 'loss/train': 1.6614139080047607} -08/30/2021 17:09:49 - INFO - __main__ - Step 22051: {'lr': 0.0004776977015785595, 'samples': 4233792, 'steps': 22050, 'loss/train': 1.5732864141464233} -08/30/2021 17:09:49 - INFO - __main__ - Step 22052: {'lr': 0.0004776955105415537, 'samples': 4233984, 'steps': 22051, 'loss/train': 1.7298601865768433} -08/30/2021 17:09:50 - INFO - __main__ - Step 22053: {'lr': 0.00047769331940195194, 'samples': 4234176, 'steps': 22052, 'loss/train': 1.2789348363876343} -08/30/2021 17:09:50 - INFO - __main__ - Step 22054: {'lr': 0.00047769112815975503, 'samples': 4234368, 'steps': 22053, 'loss/train': 2.008350133895874} -08/30/2021 17:09:50 - INFO - __main__ - Step 22055: {'lr': 0.00047768893681496397, 'samples': 4234560, 'steps': 22054, 'loss/train': 1.403056025505066} -08/30/2021 17:09:52 - INFO - __main__ - Step 22056: {'lr': 0.00047768674536757984, 'samples': 4234752, 'steps': 22055, 'loss/train': 1.2862383127212524} -08/30/2021 17:09:53 - INFO - __main__ - Step 22057: {'lr': 0.00047768455381760357, 'samples': 4234944, 'steps': 22056, 'loss/train': 2.275675058364868} -08/30/2021 17:09:53 - INFO - __main__ - Step 22058: {'lr': 0.00047768236216503613, 'samples': 4235136, 'steps': 22057, 'loss/train': 1.7179292440414429} -08/30/2021 17:09:53 - INFO - __main__ - Step 22059: {'lr': 0.00047768017040987856, 'samples': 4235328, 'steps': 22058, 'loss/train': 3.2524068355560303} -08/30/2021 17:09:54 - INFO - __main__ - Step 22060: {'lr': 0.0004776779785521318, 'samples': 4235520, 'steps': 22059, 'loss/train': 1.4430495500564575} -08/30/2021 17:09:56 - INFO - __main__ - Step 22061: {'lr': 0.0004776757865917969, 'samples': 4235712, 'steps': 22060, 'loss/train': 1.617902159690857} -08/30/2021 17:09:56 - INFO - __main__ - Step 22062: {'lr': 0.0004776735945288747, 'samples': 4235904, 'steps': 22061, 'loss/train': 1.906358242034912} -08/30/2021 17:09:56 - INFO - __main__ - Step 22063: {'lr': 0.00047767140236336635, 'samples': 4236096, 'steps': 22062, 'loss/train': 2.3241195678710938} -08/30/2021 17:09:57 - INFO - __main__ - Step 22064: {'lr': 0.00047766921009527284, 'samples': 4236288, 'steps': 22063, 'loss/train': 1.8307621479034424} -08/30/2021 17:09:57 - INFO - __main__ - Step 22065: {'lr': 0.00047766701772459505, 'samples': 4236480, 'steps': 22064, 'loss/train': 1.2524582147598267} -08/30/2021 17:09:57 - INFO - __main__ - Step 22066: {'lr': 0.00047766482525133405, 'samples': 4236672, 'steps': 22065, 'loss/train': 1.5745614767074585} -08/30/2021 17:09:59 - INFO - __main__ - Step 22067: {'lr': 0.00047766263267549073, 'samples': 4236864, 'steps': 22066, 'loss/train': 1.3962738513946533} -08/30/2021 17:09:59 - INFO - __main__ - Step 22068: {'lr': 0.0004776604399970661, 'samples': 4237056, 'steps': 22067, 'loss/train': 1.452945590019226} -08/30/2021 17:10:00 - INFO - __main__ - Step 22069: {'lr': 0.0004776582472160613, 'samples': 4237248, 'steps': 22068, 'loss/train': 1.9384219646453857} -08/30/2021 17:10:00 - INFO - __main__ - Step 22070: {'lr': 0.0004776560543324772, 'samples': 4237440, 'steps': 22069, 'loss/train': 1.5681068897247314} -08/30/2021 17:10:00 - INFO - __main__ - Step 22071: {'lr': 0.0004776538613463147, 'samples': 4237632, 'steps': 22070, 'loss/train': 2.144890069961548} -08/30/2021 17:10:02 - INFO - __main__ - Step 22072: {'lr': 0.00047765166825757487, 'samples': 4237824, 'steps': 22071, 'loss/train': 1.6291849613189697} -08/30/2021 17:10:03 - INFO - __main__ - Step 22073: {'lr': 0.00047764947506625887, 'samples': 4238016, 'steps': 22072, 'loss/train': 1.8141212463378906} -08/30/2021 17:10:03 - INFO - __main__ - Step 22074: {'lr': 0.00047764728177236736, 'samples': 4238208, 'steps': 22073, 'loss/train': 2.9622011184692383} -08/30/2021 17:10:03 - INFO - __main__ - Step 22075: {'lr': 0.0004776450883759016, 'samples': 4238400, 'steps': 22074, 'loss/train': 1.679767370223999} -08/30/2021 17:10:04 - INFO - __main__ - Step 22076: {'lr': 0.0004776428948768625, 'samples': 4238592, 'steps': 22075, 'loss/train': 0.6758951544761658} -08/30/2021 17:10:06 - INFO - __main__ - Step 22077: {'lr': 0.00047764070127525096, 'samples': 4238784, 'steps': 22076, 'loss/train': 1.738405704498291} -08/30/2021 17:10:07 - INFO - __main__ - Step 22078: {'lr': 0.00047763850757106803, 'samples': 4238976, 'steps': 22077, 'loss/train': 1.8547416925430298} -08/30/2021 17:10:07 - INFO - __main__ - Step 22079: {'lr': 0.0004776363137643147, 'samples': 4239168, 'steps': 22078, 'loss/train': 1.784899115562439} -08/30/2021 17:10:07 - INFO - __main__ - Step 22080: {'lr': 0.000477634119854992, 'samples': 4239360, 'steps': 22079, 'loss/train': 1.3763948678970337} -08/30/2021 17:10:08 - INFO - __main__ - Step 22081: {'lr': 0.00047763192584310087, 'samples': 4239552, 'steps': 22080, 'loss/train': 0.8035991787910461} -08/30/2021 17:10:08 - INFO - __main__ - Step 22082: {'lr': 0.0004776297317286423, 'samples': 4239744, 'steps': 22081, 'loss/train': 0.6462414264678955} -08/30/2021 17:10:09 - INFO - __main__ - Step 22083: {'lr': 0.00047762753751161725, 'samples': 4239936, 'steps': 22082, 'loss/train': 1.702309489250183} -08/30/2021 17:10:10 - INFO - __main__ - Step 22084: {'lr': 0.0004776253431920268, 'samples': 4240128, 'steps': 22083, 'loss/train': 1.4913526773452759} -08/30/2021 17:10:10 - INFO - __main__ - Step 22085: {'lr': 0.00047762314876987185, 'samples': 4240320, 'steps': 22084, 'loss/train': 0.9840775728225708} -08/30/2021 17:10:11 - INFO - __main__ - Step 22086: {'lr': 0.0004776209542451534, 'samples': 4240512, 'steps': 22085, 'loss/train': 1.5377213954925537} -08/30/2021 17:10:11 - INFO - __main__ - Step 22087: {'lr': 0.0004776187596178725, 'samples': 4240704, 'steps': 22086, 'loss/train': 2.0228564739227295} -08/30/2021 17:10:12 - INFO - __main__ - Step 22088: {'lr': 0.00047761656488803006, 'samples': 4240896, 'steps': 22087, 'loss/train': 1.4768586158752441} -08/30/2021 17:10:13 - INFO - __main__ - Step 22089: {'lr': 0.00047761437005562716, 'samples': 4241088, 'steps': 22088, 'loss/train': 1.665913462638855} -08/30/2021 17:10:13 - INFO - __main__ - Step 22090: {'lr': 0.00047761217512066475, 'samples': 4241280, 'steps': 22089, 'loss/train': 2.0579636096954346} -08/30/2021 17:10:14 - INFO - __main__ - Step 22091: {'lr': 0.0004776099800831437, 'samples': 4241472, 'steps': 22090, 'loss/train': 0.23284082114696503} -08/30/2021 17:10:14 - INFO - __main__ - Step 22092: {'lr': 0.0004776077849430652, 'samples': 4241664, 'steps': 22091, 'loss/train': 1.666582465171814} -08/30/2021 17:10:16 - INFO - __main__ - Step 22093: {'lr': 0.0004776055897004301, 'samples': 4241856, 'steps': 22092, 'loss/train': 1.771843433380127} -08/30/2021 17:10:16 - INFO - __main__ - Step 22094: {'lr': 0.0004776033943552395, 'samples': 4242048, 'steps': 22093, 'loss/train': 2.050999402999878} -08/30/2021 17:10:16 - INFO - __main__ - Step 22095: {'lr': 0.0004776011989074943, 'samples': 4242240, 'steps': 22094, 'loss/train': 2.2498724460601807} -08/30/2021 17:10:17 - INFO - __main__ - Step 22096: {'lr': 0.00047759900335719543, 'samples': 4242432, 'steps': 22095, 'loss/train': 1.6556576490402222} -08/30/2021 17:10:17 - INFO - __main__ - Step 22097: {'lr': 0.00047759680770434405, 'samples': 4242624, 'steps': 22096, 'loss/train': 1.60176420211792} -08/30/2021 17:10:18 - INFO - __main__ - Step 22098: {'lr': 0.00047759461194894103, 'samples': 4242816, 'steps': 22097, 'loss/train': 1.6094857454299927} -08/30/2021 17:10:19 - INFO - __main__ - Step 22099: {'lr': 0.00047759241609098734, 'samples': 4243008, 'steps': 22098, 'loss/train': 1.4421844482421875} -08/30/2021 17:10:19 - INFO - __main__ - Step 22100: {'lr': 0.00047759022013048417, 'samples': 4243200, 'steps': 22099, 'loss/train': 1.1010295152664185} -08/30/2021 17:10:20 - INFO - __main__ - Step 22101: {'lr': 0.00047758802406743217, 'samples': 4243392, 'steps': 22100, 'loss/train': 1.3330720663070679} -08/30/2021 17:10:20 - INFO - __main__ - Step 22102: {'lr': 0.0004775858279018326, 'samples': 4243584, 'steps': 22101, 'loss/train': 1.3838764429092407} -08/30/2021 17:10:21 - INFO - __main__ - Step 22103: {'lr': 0.0004775836316336864, 'samples': 4243776, 'steps': 22102, 'loss/train': 1.976652979850769} -08/30/2021 17:10:22 - INFO - __main__ - Step 22104: {'lr': 0.00047758143526299446, 'samples': 4243968, 'steps': 22103, 'loss/train': 1.4156880378723145} -08/30/2021 17:10:22 - INFO - __main__ - Step 22105: {'lr': 0.0004775792387897579, 'samples': 4244160, 'steps': 22104, 'loss/train': 2.0119359493255615} -08/30/2021 17:10:23 - INFO - __main__ - Step 22106: {'lr': 0.0004775770422139776, 'samples': 4244352, 'steps': 22105, 'loss/train': 1.8513189554214478} -08/30/2021 17:10:23 - INFO - __main__ - Step 22107: {'lr': 0.00047757484553565465, 'samples': 4244544, 'steps': 22106, 'loss/train': 1.8542102575302124} -08/30/2021 17:10:23 - INFO - __main__ - Step 22108: {'lr': 0.00047757264875478996, 'samples': 4244736, 'steps': 22107, 'loss/train': 2.1568729877471924} -08/30/2021 17:10:25 - INFO - __main__ - Step 22109: {'lr': 0.0004775704518713845, 'samples': 4244928, 'steps': 22108, 'loss/train': 1.6737103462219238} -08/30/2021 17:10:25 - INFO - __main__ - Step 22110: {'lr': 0.0004775682548854394, 'samples': 4245120, 'steps': 22109, 'loss/train': 2.2088537216186523} -08/30/2021 17:10:25 - INFO - __main__ - Step 22111: {'lr': 0.0004775660577969555, 'samples': 4245312, 'steps': 22110, 'loss/train': 1.5327880382537842} -08/30/2021 17:10:26 - INFO - __main__ - Step 22112: {'lr': 0.0004775638606059338, 'samples': 4245504, 'steps': 22111, 'loss/train': 3.1570706367492676} -08/30/2021 17:10:26 - INFO - __main__ - Step 22113: {'lr': 0.00047756166331237545, 'samples': 4245696, 'steps': 22112, 'loss/train': 1.7394119501113892} -08/30/2021 17:10:28 - INFO - __main__ - Step 22114: {'lr': 0.00047755946591628126, 'samples': 4245888, 'steps': 22113, 'loss/train': 1.5016783475875854} -08/30/2021 17:10:28 - INFO - __main__ - Step 22115: {'lr': 0.00047755726841765224, 'samples': 4246080, 'steps': 22114, 'loss/train': 1.730542540550232} -08/30/2021 17:10:28 - INFO - __main__ - Step 22116: {'lr': 0.0004775550708164895, 'samples': 4246272, 'steps': 22115, 'loss/train': 1.4529187679290771} -08/30/2021 17:10:29 - INFO - __main__ - Step 22117: {'lr': 0.00047755287311279394, 'samples': 4246464, 'steps': 22116, 'loss/train': 1.6635645627975464} -08/30/2021 17:10:29 - INFO - __main__ - Step 22118: {'lr': 0.00047755067530656656, 'samples': 4246656, 'steps': 22117, 'loss/train': 1.3346130847930908} -08/30/2021 17:10:31 - INFO - __main__ - Step 22119: {'lr': 0.00047754847739780835, 'samples': 4246848, 'steps': 22118, 'loss/train': 1.9994735717773438} -08/30/2021 17:10:32 - INFO - __main__ - Step 22120: {'lr': 0.0004775462793865203, 'samples': 4247040, 'steps': 22119, 'loss/train': 1.7999855279922485} -08/30/2021 17:10:32 - INFO - __main__ - Step 22121: {'lr': 0.00047754408127270346, 'samples': 4247232, 'steps': 22120, 'loss/train': 0.8281984925270081} -08/30/2021 17:10:32 - INFO - __main__ - Step 22122: {'lr': 0.0004775418830563587, 'samples': 4247424, 'steps': 22121, 'loss/train': 1.6985368728637695} -08/30/2021 17:10:33 - INFO - __main__ - Step 22123: {'lr': 0.0004775396847374871, 'samples': 4247616, 'steps': 22122, 'loss/train': 1.672114610671997} -08/30/2021 17:10:34 - INFO - __main__ - Step 22124: {'lr': 0.0004775374863160896, 'samples': 4247808, 'steps': 22123, 'loss/train': 1.8892408609390259} -08/30/2021 17:10:35 - INFO - __main__ - Step 22125: {'lr': 0.0004775352877921673, 'samples': 4248000, 'steps': 22124, 'loss/train': 1.277587652206421} -08/30/2021 17:10:35 - INFO - __main__ - Step 22126: {'lr': 0.000477533089165721, 'samples': 4248192, 'steps': 22125, 'loss/train': 1.4643505811691284} -08/30/2021 17:10:35 - INFO - __main__ - Step 22127: {'lr': 0.0004775308904367519, 'samples': 4248384, 'steps': 22126, 'loss/train': 4.364542007446289} -08/30/2021 17:10:36 - INFO - __main__ - Step 22128: {'lr': 0.0004775286916052609, 'samples': 4248576, 'steps': 22127, 'loss/train': 1.5798108577728271} -08/30/2021 17:10:38 - INFO - __main__ - Step 22129: {'lr': 0.00047752649267124894, 'samples': 4248768, 'steps': 22128, 'loss/train': 1.3072041273117065} -08/30/2021 17:10:38 - INFO - __main__ - Step 22130: {'lr': 0.0004775242936347171, 'samples': 4248960, 'steps': 22129, 'loss/train': 1.8408241271972656} -08/30/2021 17:10:39 - INFO - __main__ - Step 22131: {'lr': 0.0004775220944956662, 'samples': 4249152, 'steps': 22130, 'loss/train': 2.2044079303741455} -08/30/2021 17:10:39 - INFO - __main__ - Step 22132: {'lr': 0.00047751989525409745, 'samples': 4249344, 'steps': 22131, 'loss/train': 1.4526580572128296} -08/30/2021 17:10:39 - INFO - __main__ - Step 22133: {'lr': 0.0004775176959100117, 'samples': 4249536, 'steps': 22132, 'loss/train': 1.7001789808273315} -08/30/2021 17:10:41 - INFO - __main__ - Step 22134: {'lr': 0.00047751549646341007, 'samples': 4249728, 'steps': 22133, 'loss/train': 1.269938588142395} -08/30/2021 17:10:41 - INFO - __main__ - Step 22135: {'lr': 0.0004775132969142934, 'samples': 4249920, 'steps': 22134, 'loss/train': 1.303545355796814} -08/30/2021 17:10:42 - INFO - __main__ - Step 22136: {'lr': 0.00047751109726266273, 'samples': 4250112, 'steps': 22135, 'loss/train': 0.9846208095550537} -08/30/2021 17:10:42 - INFO - __main__ - Step 22137: {'lr': 0.00047750889750851913, 'samples': 4250304, 'steps': 22136, 'loss/train': 1.691420555114746} -08/30/2021 17:10:42 - INFO - __main__ - Step 22138: {'lr': 0.0004775066976518635, 'samples': 4250496, 'steps': 22137, 'loss/train': 1.7628076076507568} -08/30/2021 17:10:43 - INFO - __main__ - Step 22139: {'lr': 0.00047750449769269686, 'samples': 4250688, 'steps': 22138, 'loss/train': 1.920169711112976} -08/30/2021 17:10:44 - INFO - __main__ - Step 22140: {'lr': 0.0004775022976310203, 'samples': 4250880, 'steps': 22139, 'loss/train': 1.5844125747680664} -08/30/2021 17:10:45 - INFO - __main__ - Step 22141: {'lr': 0.0004775000974668345, 'samples': 4251072, 'steps': 22140, 'loss/train': 1.3784774541854858} -08/30/2021 17:10:45 - INFO - __main__ - Step 22142: {'lr': 0.00047749789720014085, 'samples': 4251264, 'steps': 22141, 'loss/train': 2.164243698120117} -08/30/2021 17:10:46 - INFO - __main__ - Step 22143: {'lr': 0.00047749569683094015, 'samples': 4251456, 'steps': 22142, 'loss/train': 1.156712293624878} -08/30/2021 17:10:46 - INFO - __main__ - Step 22144: {'lr': 0.00047749349635923334, 'samples': 4251648, 'steps': 22143, 'loss/train': 2.125542640686035} -08/30/2021 17:10:46 - INFO - __main__ - Step 22145: {'lr': 0.0004774912957850215, 'samples': 4251840, 'steps': 22144, 'loss/train': 0.0950431227684021} -08/30/2021 17:10:49 - INFO - __main__ - Step 22146: {'lr': 0.0004774890951083055, 'samples': 4252032, 'steps': 22145, 'loss/train': 1.0042872428894043} -08/30/2021 17:10:49 - INFO - __main__ - Step 22147: {'lr': 0.00047748689432908654, 'samples': 4252224, 'steps': 22146, 'loss/train': 1.9640812873840332} -08/30/2021 17:10:49 - INFO - __main__ - Step 22148: {'lr': 0.00047748469344736547, 'samples': 4252416, 'steps': 22147, 'loss/train': 1.8786741495132446} -08/30/2021 17:10:50 - INFO - __main__ - Step 22149: {'lr': 0.00047748249246314323, 'samples': 4252608, 'steps': 22148, 'loss/train': 1.8291820287704468} -08/30/2021 17:10:50 - INFO - __main__ - Step 22150: {'lr': 0.000477480291376421, 'samples': 4252800, 'steps': 22149, 'loss/train': 1.5574336051940918} -08/30/2021 17:10:50 - INFO - __main__ - Step 22151: {'lr': 0.0004774780901871996, 'samples': 4252992, 'steps': 22150, 'loss/train': 2.3067526817321777} -08/30/2021 17:10:52 - INFO - __main__ - Step 22152: {'lr': 0.0004774758888954801, 'samples': 4253184, 'steps': 22151, 'loss/train': 1.6837538480758667} -08/30/2021 17:10:52 - INFO - __main__ - Step 22153: {'lr': 0.00047747368750126345, 'samples': 4253376, 'steps': 22152, 'loss/train': 1.6451901197433472} -08/30/2021 17:10:53 - INFO - __main__ - Step 22154: {'lr': 0.0004774714860045507, 'samples': 4253568, 'steps': 22153, 'loss/train': 0.507257342338562} -08/30/2021 17:10:53 - INFO - __main__ - Step 22155: {'lr': 0.0004774692844053428, 'samples': 4253760, 'steps': 22154, 'loss/train': 1.1535602807998657} -08/30/2021 17:10:53 - INFO - __main__ - Step 22156: {'lr': 0.00047746708270364073, 'samples': 4253952, 'steps': 22155, 'loss/train': 1.8781384229660034} -08/30/2021 17:10:55 - INFO - __main__ - Step 22157: {'lr': 0.0004774648808994455, 'samples': 4254144, 'steps': 22156, 'loss/train': 1.3260270357131958} -08/30/2021 17:10:56 - INFO - __main__ - Step 22158: {'lr': 0.0004774626789927582, 'samples': 4254336, 'steps': 22157, 'loss/train': 1.7989898920059204} -08/30/2021 17:10:56 - INFO - __main__ - Step 22159: {'lr': 0.0004774604769835796, 'samples': 4254528, 'steps': 22158, 'loss/train': 0.3206104338169098} -08/30/2021 17:10:56 - INFO - __main__ - Step 22160: {'lr': 0.00047745827487191087, 'samples': 4254720, 'steps': 22159, 'loss/train': 1.4987117052078247} -08/30/2021 17:10:57 - INFO - __main__ - Step 22161: {'lr': 0.00047745607265775293, 'samples': 4254912, 'steps': 22160, 'loss/train': 2.027649164199829} -08/30/2021 17:10:57 - INFO - __main__ - Step 22162: {'lr': 0.0004774538703411069, 'samples': 4255104, 'steps': 22161, 'loss/train': 0.652060329914093} -08/30/2021 17:10:59 - INFO - __main__ - Step 22163: {'lr': 0.00047745166792197353, 'samples': 4255296, 'steps': 22162, 'loss/train': 1.7201666831970215} -08/30/2021 17:10:59 - INFO - __main__ - Step 22164: {'lr': 0.000477449465400354, 'samples': 4255488, 'steps': 22163, 'loss/train': 0.7782296538352966} -08/30/2021 17:10:59 - INFO - __main__ - Step 22165: {'lr': 0.00047744726277624926, 'samples': 4255680, 'steps': 22164, 'loss/train': 1.7708029747009277} -08/30/2021 17:11:00 - INFO - __main__ - Step 22166: {'lr': 0.00047744506004966024, 'samples': 4255872, 'steps': 22165, 'loss/train': 2.124933958053589} -08/30/2021 17:11:00 - INFO - __main__ - Step 22167: {'lr': 0.00047744285722058804, 'samples': 4256064, 'steps': 22166, 'loss/train': 1.7922090291976929} -08/30/2021 17:11:02 - INFO - __main__ - Step 22168: {'lr': 0.0004774406542890336, 'samples': 4256256, 'steps': 22167, 'loss/train': 1.4843497276306152} -08/30/2021 17:11:02 - INFO - __main__ - Step 22169: {'lr': 0.0004774384512549979, 'samples': 4256448, 'steps': 22168, 'loss/train': 1.8620972633361816} -08/30/2021 17:11:03 - INFO - __main__ - Step 22170: {'lr': 0.00047743624811848195, 'samples': 4256640, 'steps': 22169, 'loss/train': 1.7882907390594482} -08/30/2021 17:11:03 - INFO - __main__ - Step 22171: {'lr': 0.00047743404487948673, 'samples': 4256832, 'steps': 22170, 'loss/train': 1.7539762258529663} -08/30/2021 17:11:03 - INFO - __main__ - Step 22172: {'lr': 0.0004774318415380132, 'samples': 4257024, 'steps': 22171, 'loss/train': 1.9795050621032715} -08/30/2021 17:11:04 - INFO - __main__ - Step 22173: {'lr': 0.0004774296380940625, 'samples': 4257216, 'steps': 22172, 'loss/train': 1.0491347312927246} -08/30/2021 17:11:05 - INFO - __main__ - Step 22174: {'lr': 0.0004774274345476354, 'samples': 4257408, 'steps': 22173, 'loss/train': 2.025768280029297} -08/30/2021 17:11:06 - INFO - __main__ - Step 22175: {'lr': 0.00047742523089873304, 'samples': 4257600, 'steps': 22174, 'loss/train': 1.32821786403656} -08/30/2021 17:11:06 - INFO - __main__ - Step 22176: {'lr': 0.0004774230271473564, 'samples': 4257792, 'steps': 22175, 'loss/train': 1.7467927932739258} -08/30/2021 17:11:07 - INFO - __main__ - Step 22177: {'lr': 0.00047742082329350644, 'samples': 4257984, 'steps': 22176, 'loss/train': 1.1691381931304932} -08/30/2021 17:11:07 - INFO - __main__ - Step 22178: {'lr': 0.0004774186193371841, 'samples': 4258176, 'steps': 22177, 'loss/train': 2.0946285724639893} -08/30/2021 17:11:08 - INFO - __main__ - Step 22179: {'lr': 0.00047741641527839054, 'samples': 4258368, 'steps': 22178, 'loss/train': 1.907494306564331} -08/30/2021 17:11:09 - INFO - __main__ - Step 22180: {'lr': 0.00047741421111712666, 'samples': 4258560, 'steps': 22179, 'loss/train': 2.1550490856170654} -08/30/2021 17:11:09 - INFO - __main__ - Step 22181: {'lr': 0.00047741200685339337, 'samples': 4258752, 'steps': 22180, 'loss/train': 0.9798780679702759} -08/30/2021 17:11:10 - INFO - __main__ - Step 22182: {'lr': 0.0004774098024871918, 'samples': 4258944, 'steps': 22181, 'loss/train': 1.8367745876312256} -08/30/2021 17:11:10 - INFO - __main__ - Step 22183: {'lr': 0.00047740759801852284, 'samples': 4259136, 'steps': 22182, 'loss/train': 2.275071382522583} -08/30/2021 17:11:10 - INFO - __main__ - Step 22184: {'lr': 0.00047740539344738754, 'samples': 4259328, 'steps': 22183, 'loss/train': 1.5963722467422485} -08/30/2021 17:11:12 - INFO - __main__ - Step 22185: {'lr': 0.00047740318877378685, 'samples': 4259520, 'steps': 22184, 'loss/train': 5.944394111633301} -08/30/2021 17:11:13 - INFO - __main__ - Step 22186: {'lr': 0.00047740098399772185, 'samples': 4259712, 'steps': 22185, 'loss/train': 1.6890538930892944} -08/30/2021 17:11:13 - INFO - __main__ - Step 22187: {'lr': 0.0004773987791191935, 'samples': 4259904, 'steps': 22186, 'loss/train': 1.661117434501648} -08/30/2021 17:11:14 - INFO - __main__ - Step 22188: {'lr': 0.0004773965741382027, 'samples': 4260096, 'steps': 22187, 'loss/train': 1.3339636325836182} -08/30/2021 17:11:14 - INFO - __main__ - Step 22189: {'lr': 0.00047739436905475054, 'samples': 4260288, 'steps': 22188, 'loss/train': 1.8554155826568604} -08/30/2021 17:11:15 - INFO - __main__ - Step 22190: {'lr': 0.00047739216386883797, 'samples': 4260480, 'steps': 22189, 'loss/train': 2.088022470474243} -08/30/2021 17:11:16 - INFO - __main__ - Step 22191: {'lr': 0.000477389958580466, 'samples': 4260672, 'steps': 22190, 'loss/train': 1.8659831285476685} -08/30/2021 17:11:16 - INFO - __main__ - Step 22192: {'lr': 0.0004773877531896356, 'samples': 4260864, 'steps': 22191, 'loss/train': 1.602364182472229} -08/30/2021 17:11:16 - INFO - __main__ - Step 22193: {'lr': 0.00047738554769634784, 'samples': 4261056, 'steps': 22192, 'loss/train': 1.59539794921875} -08/30/2021 17:11:17 - INFO - __main__ - Step 22194: {'lr': 0.00047738334210060366, 'samples': 4261248, 'steps': 22193, 'loss/train': 2.3934431076049805} -08/30/2021 17:11:19 - INFO - __main__ - Step 22195: {'lr': 0.000477381136402404, 'samples': 4261440, 'steps': 22194, 'loss/train': 1.918354868888855} -08/30/2021 17:11:19 - INFO - __main__ - Step 22196: {'lr': 0.00047737893060175, 'samples': 4261632, 'steps': 22195, 'loss/train': 1.7233904600143433} -08/30/2021 17:11:19 - INFO - __main__ - Step 22197: {'lr': 0.00047737672469864246, 'samples': 4261824, 'steps': 22196, 'loss/train': 1.3757588863372803} -08/30/2021 17:11:20 - INFO - __main__ - Step 22198: {'lr': 0.0004773745186930825, 'samples': 4262016, 'steps': 22197, 'loss/train': 1.9363975524902344} -08/30/2021 17:11:20 - INFO - __main__ - Step 22199: {'lr': 0.00047737231258507116, 'samples': 4262208, 'steps': 22198, 'loss/train': 1.716389536857605} -08/30/2021 17:11:21 - INFO - __main__ - Step 22200: {'lr': 0.00047737010637460934, 'samples': 4262400, 'steps': 22199, 'loss/train': 1.666672706604004} -08/30/2021 17:11:21 - INFO - __main__ - Step 22201: {'lr': 0.00047736790006169794, 'samples': 4262592, 'steps': 22200, 'loss/train': 1.411740779876709} -08/30/2021 17:11:22 - INFO - __main__ - Step 22202: {'lr': 0.00047736569364633817, 'samples': 4262784, 'steps': 22201, 'loss/train': 1.2216259241104126} -08/30/2021 17:11:23 - INFO - __main__ - Step 22203: {'lr': 0.00047736348712853094, 'samples': 4262976, 'steps': 22202, 'loss/train': 2.133310556411743} -08/30/2021 17:11:23 - INFO - __main__ - Step 22204: {'lr': 0.0004773612805082772, 'samples': 4263168, 'steps': 22203, 'loss/train': 2.077293634414673} -08/30/2021 17:11:24 - INFO - __main__ - Step 22205: {'lr': 0.000477359073785578, 'samples': 4263360, 'steps': 22204, 'loss/train': 2.1532883644104004} -08/30/2021 17:11:24 - INFO - __main__ - Step 22206: {'lr': 0.00047735686696043434, 'samples': 4263552, 'steps': 22205, 'loss/train': 2.1496901512145996} -08/30/2021 17:11:25 - INFO - __main__ - Step 22207: {'lr': 0.0004773546600328471, 'samples': 4263744, 'steps': 22206, 'loss/train': 2.316821575164795} -08/30/2021 17:11:26 - INFO - __main__ - Step 22208: {'lr': 0.00047735245300281745, 'samples': 4263936, 'steps': 22207, 'loss/train': 1.21135413646698} -08/30/2021 17:11:26 - INFO - __main__ - Step 22209: {'lr': 0.00047735024587034625, 'samples': 4264128, 'steps': 22208, 'loss/train': 1.9529237747192383} -08/30/2021 17:11:27 - INFO - __main__ - Step 22210: {'lr': 0.00047734803863543453, 'samples': 4264320, 'steps': 22209, 'loss/train': 1.8628636598587036} -08/30/2021 17:11:27 - INFO - __main__ - Step 22211: {'lr': 0.00047734583129808327, 'samples': 4264512, 'steps': 22210, 'loss/train': 1.4725264310836792} -08/30/2021 17:11:27 - INFO - __main__ - Step 22212: {'lr': 0.00047734362385829356, 'samples': 4264704, 'steps': 22211, 'loss/train': 2.220416784286499} -08/30/2021 17:11:29 - INFO - __main__ - Step 22213: {'lr': 0.0004773414163160662, 'samples': 4264896, 'steps': 22212, 'loss/train': 1.9183039665222168} -08/30/2021 17:11:29 - INFO - __main__ - Step 22214: {'lr': 0.00047733920867140244, 'samples': 4265088, 'steps': 22213, 'loss/train': 1.4160573482513428} -08/30/2021 17:11:30 - INFO - __main__ - Step 22215: {'lr': 0.00047733700092430305, 'samples': 4265280, 'steps': 22214, 'loss/train': 1.6211538314819336} -08/30/2021 17:11:30 - INFO - __main__ - Step 22216: {'lr': 0.0004773347930747691, 'samples': 4265472, 'steps': 22215, 'loss/train': 3.273075819015503} -08/30/2021 17:11:30 - INFO - __main__ - Step 22217: {'lr': 0.0004773325851228017, 'samples': 4265664, 'steps': 22216, 'loss/train': 1.7557157278060913} -08/30/2021 17:11:32 - INFO - __main__ - Step 22218: {'lr': 0.00047733037706840166, 'samples': 4265856, 'steps': 22217, 'loss/train': 1.849313735961914} -08/30/2021 17:11:32 - INFO - __main__ - Step 22219: {'lr': 0.0004773281689115701, 'samples': 4266048, 'steps': 22218, 'loss/train': 2.089118480682373} -08/30/2021 17:11:32 - INFO - __main__ - Step 22220: {'lr': 0.000477325960652308, 'samples': 4266240, 'steps': 22219, 'loss/train': 1.6515716314315796} -08/30/2021 17:11:33 - INFO - __main__ - Step 22221: {'lr': 0.0004773237522906163, 'samples': 4266432, 'steps': 22220, 'loss/train': 2.2680416107177734} -08/30/2021 17:11:33 - INFO - __main__ - Step 22222: {'lr': 0.000477321543826496, 'samples': 4266624, 'steps': 22221, 'loss/train': 1.7360239028930664} -08/30/2021 17:11:35 - INFO - __main__ - Step 22223: {'lr': 0.00047731933525994814, 'samples': 4266816, 'steps': 22222, 'loss/train': 1.806036353111267} -08/30/2021 17:11:35 - INFO - __main__ - Step 22224: {'lr': 0.0004773171265909737, 'samples': 4267008, 'steps': 22223, 'loss/train': 1.579102873802185} -08/30/2021 17:11:36 - INFO - __main__ - Step 22225: {'lr': 0.00047731491781957366, 'samples': 4267200, 'steps': 22224, 'loss/train': 2.0978195667266846} -08/30/2021 17:11:36 - INFO - __main__ - Step 22226: {'lr': 0.0004773127089457491, 'samples': 4267392, 'steps': 22225, 'loss/train': 0.35885512828826904} -08/30/2021 17:11:36 - INFO - __main__ - Step 22227: {'lr': 0.0004773104999695008, 'samples': 4267584, 'steps': 22226, 'loss/train': 1.8843597173690796} -08/30/2021 17:11:38 - INFO - __main__ - Step 22228: {'lr': 0.00047730829089082994, 'samples': 4267776, 'steps': 22227, 'loss/train': 1.9311151504516602} -08/30/2021 17:11:39 - INFO - __main__ - Step 22229: {'lr': 0.00047730608170973754, 'samples': 4267968, 'steps': 22228, 'loss/train': 1.5460875034332275} -08/30/2021 17:11:39 - INFO - __main__ - Step 22230: {'lr': 0.00047730387242622446, 'samples': 4268160, 'steps': 22229, 'loss/train': 1.5039581060409546} -08/30/2021 17:11:39 - INFO - __main__ - Step 22231: {'lr': 0.00047730166304029185, 'samples': 4268352, 'steps': 22230, 'loss/train': 2.5621299743652344} -08/30/2021 17:11:40 - INFO - __main__ - Step 22232: {'lr': 0.0004772994535519405, 'samples': 4268544, 'steps': 22231, 'loss/train': 0.2551862299442291} -08/30/2021 17:11:41 - INFO - __main__ - Step 22233: {'lr': 0.0004772972439611716, 'samples': 4268736, 'steps': 22232, 'loss/train': 2.1080820560455322} -08/30/2021 17:11:41 - INFO - __main__ - Step 22234: {'lr': 0.00047729503426798605, 'samples': 4268928, 'steps': 22233, 'loss/train': 1.5359896421432495} -08/30/2021 17:11:42 - INFO - __main__ - Step 22235: {'lr': 0.0004772928244723849, 'samples': 4269120, 'steps': 22234, 'loss/train': 2.113858938217163} -08/30/2021 17:11:42 - INFO - __main__ - Step 22236: {'lr': 0.00047729061457436905, 'samples': 4269312, 'steps': 22235, 'loss/train': 1.3084994554519653} -08/30/2021 17:11:43 - INFO - __main__ - Step 22237: {'lr': 0.0004772884045739396, 'samples': 4269504, 'steps': 22236, 'loss/train': 1.6442188024520874} -08/30/2021 17:11:45 - INFO - __main__ - Step 22238: {'lr': 0.0004772861944710974, 'samples': 4269696, 'steps': 22237, 'loss/train': 1.5789165496826172} -08/30/2021 17:11:45 - INFO - __main__ - Step 22239: {'lr': 0.00047728398426584375, 'samples': 4269888, 'steps': 22238, 'loss/train': 1.1186904907226562} -08/30/2021 17:11:46 - INFO - __main__ - Step 22240: {'lr': 0.0004772817739581793, 'samples': 4270080, 'steps': 22239, 'loss/train': 1.960464358329773} -08/30/2021 17:11:46 - INFO - __main__ - Step 22241: {'lr': 0.0004772795635481052, 'samples': 4270272, 'steps': 22240, 'loss/train': 2.104534864425659} -08/30/2021 17:11:46 - INFO - __main__ - Step 22242: {'lr': 0.00047727735303562246, 'samples': 4270464, 'steps': 22241, 'loss/train': 1.1994812488555908} -08/30/2021 17:11:48 - INFO - __main__ - Step 22243: {'lr': 0.000477275142420732, 'samples': 4270656, 'steps': 22242, 'loss/train': 1.981293797492981} -08/30/2021 17:11:48 - INFO - __main__ - Step 22244: {'lr': 0.000477272931703435, 'samples': 4270848, 'steps': 22243, 'loss/train': 1.873092532157898} -08/30/2021 17:11:49 - INFO - __main__ - Step 22245: {'lr': 0.0004772707208837322, 'samples': 4271040, 'steps': 22244, 'loss/train': 2.0743179321289062} -08/30/2021 17:11:49 - INFO - __main__ - Step 22246: {'lr': 0.0004772685099616247, 'samples': 4271232, 'steps': 22245, 'loss/train': 1.9581387042999268} -08/30/2021 17:11:49 - INFO - __main__ - Step 22247: {'lr': 0.0004772662989371136, 'samples': 4271424, 'steps': 22246, 'loss/train': 1.8399993181228638} -08/30/2021 17:11:51 - INFO - __main__ - Step 22248: {'lr': 0.0004772640878101998, 'samples': 4271616, 'steps': 22247, 'loss/train': 0.4765205681324005} -08/30/2021 17:11:51 - INFO - __main__ - Step 22249: {'lr': 0.00047726187658088425, 'samples': 4271808, 'steps': 22248, 'loss/train': 0.857501208782196} -08/30/2021 17:11:52 - INFO - __main__ - Step 22250: {'lr': 0.0004772596652491681, 'samples': 4272000, 'steps': 22249, 'loss/train': 1.1813633441925049} -08/30/2021 17:11:52 - INFO - __main__ - Step 22251: {'lr': 0.0004772574538150522, 'samples': 4272192, 'steps': 22250, 'loss/train': 1.92146897315979} -08/30/2021 17:11:52 - INFO - __main__ - Step 22252: {'lr': 0.0004772552422785376, 'samples': 4272384, 'steps': 22251, 'loss/train': 1.3620665073394775} -08/30/2021 17:11:54 - INFO - __main__ - Step 22253: {'lr': 0.00047725303063962535, 'samples': 4272576, 'steps': 22252, 'loss/train': 1.442641019821167} -08/30/2021 17:11:54 - INFO - __main__ - Step 22254: {'lr': 0.00047725081889831626, 'samples': 4272768, 'steps': 22253, 'loss/train': 1.8525470495224} -08/30/2021 17:11:55 - INFO - __main__ - Step 22255: {'lr': 0.0004772486070546116, 'samples': 4272960, 'steps': 22254, 'loss/train': 1.4444137811660767} -08/30/2021 17:11:55 - INFO - __main__ - Step 22256: {'lr': 0.0004772463951085121, 'samples': 4273152, 'steps': 22255, 'loss/train': 1.7241592407226562} -08/30/2021 17:11:55 - INFO - __main__ - Step 22257: {'lr': 0.00047724418306001895, 'samples': 4273344, 'steps': 22256, 'loss/train': 1.6980116367340088} -08/30/2021 17:11:57 - INFO - __main__ - Step 22258: {'lr': 0.0004772419709091331, 'samples': 4273536, 'steps': 22257, 'loss/train': 1.1155540943145752} -08/30/2021 17:11:57 - INFO - __main__ - Step 22259: {'lr': 0.00047723975865585544, 'samples': 4273728, 'steps': 22258, 'loss/train': 0.32903313636779785} -08/30/2021 17:11:58 - INFO - __main__ - Step 22260: {'lr': 0.00047723754630018715, 'samples': 4273920, 'steps': 22259, 'loss/train': 2.0642480850219727} -08/30/2021 17:11:58 - INFO - __main__ - Step 22261: {'lr': 0.000477235333842129, 'samples': 4274112, 'steps': 22260, 'loss/train': 1.3852115869522095} -08/30/2021 17:11:58 - INFO - __main__ - Step 22262: {'lr': 0.00047723312128168226, 'samples': 4274304, 'steps': 22261, 'loss/train': 1.337482213973999} -08/30/2021 17:11:59 - INFO - __main__ - Step 22263: {'lr': 0.00047723090861884773, 'samples': 4274496, 'steps': 22262, 'loss/train': 2.026703357696533} -08/30/2021 17:12:00 - INFO - __main__ - Step 22264: {'lr': 0.00047722869585362646, 'samples': 4274688, 'steps': 22263, 'loss/train': 2.6244313716888428} -08/30/2021 17:12:01 - INFO - __main__ - Step 22265: {'lr': 0.0004772264829860194, 'samples': 4274880, 'steps': 22264, 'loss/train': 1.8513308763504028} -08/30/2021 17:12:01 - INFO - __main__ - Step 22266: {'lr': 0.00047722427001602765, 'samples': 4275072, 'steps': 22265, 'loss/train': 5.899032115936279} -08/30/2021 17:12:02 - INFO - __main__ - Step 22267: {'lr': 0.0004772220569436521, 'samples': 4275264, 'steps': 22266, 'loss/train': 1.5059112310409546} -08/30/2021 17:12:02 - INFO - __main__ - Step 22268: {'lr': 0.0004772198437688938, 'samples': 4275456, 'steps': 22267, 'loss/train': 1.5607255697250366} -08/30/2021 17:12:04 - INFO - __main__ - Step 22269: {'lr': 0.0004772176304917538, 'samples': 4275648, 'steps': 22268, 'loss/train': 1.8144924640655518} -08/30/2021 17:12:04 - INFO - __main__ - Step 22270: {'lr': 0.00047721541711223306, 'samples': 4275840, 'steps': 22269, 'loss/train': 1.739651083946228} -08/30/2021 17:12:04 - INFO - __main__ - Step 22271: {'lr': 0.00047721320363033247, 'samples': 4276032, 'steps': 22270, 'loss/train': 2.207659959793091} -08/30/2021 17:12:05 - INFO - __main__ - Step 22272: {'lr': 0.00047721099004605316, 'samples': 4276224, 'steps': 22271, 'loss/train': 1.5110259056091309} -08/30/2021 17:12:05 - INFO - __main__ - Step 22273: {'lr': 0.00047720877635939606, 'samples': 4276416, 'steps': 22272, 'loss/train': 1.3257867097854614} -08/30/2021 17:12:05 - INFO - __main__ - Step 22274: {'lr': 0.0004772065625703622, 'samples': 4276608, 'steps': 22273, 'loss/train': 1.6748912334442139} -08/30/2021 17:12:07 - INFO - __main__ - Step 22275: {'lr': 0.0004772043486789526, 'samples': 4276800, 'steps': 22274, 'loss/train': 1.8296105861663818} -08/30/2021 17:12:07 - INFO - __main__ - Step 22276: {'lr': 0.0004772021346851682, 'samples': 4276992, 'steps': 22275, 'loss/train': 1.589489221572876} -08/30/2021 17:12:08 - INFO - __main__ - Step 22277: {'lr': 0.00047719992058901006, 'samples': 4277184, 'steps': 22276, 'loss/train': 2.3670313358306885} -08/30/2021 17:12:08 - INFO - __main__ - Step 22278: {'lr': 0.0004771977063904791, 'samples': 4277376, 'steps': 22277, 'loss/train': 1.057492971420288} -08/30/2021 17:12:08 - INFO - __main__ - Step 22279: {'lr': 0.00047719549208957636, 'samples': 4277568, 'steps': 22278, 'loss/train': 1.414607048034668} -08/30/2021 17:12:10 - INFO - __main__ - Step 22280: {'lr': 0.0004771932776863028, 'samples': 4277760, 'steps': 22279, 'loss/train': 1.5459754467010498} -08/30/2021 17:12:10 - INFO - __main__ - Step 22281: {'lr': 0.0004771910631806595, 'samples': 4277952, 'steps': 22280, 'loss/train': 1.5766849517822266} -08/30/2021 17:12:11 - INFO - __main__ - Step 22282: {'lr': 0.00047718884857264745, 'samples': 4278144, 'steps': 22281, 'loss/train': 2.308119535446167} -08/30/2021 17:12:11 - INFO - __main__ - Step 22283: {'lr': 0.0004771866338622676, 'samples': 4278336, 'steps': 22282, 'loss/train': 1.3916943073272705} -08/30/2021 17:12:11 - INFO - __main__ - Step 22284: {'lr': 0.0004771844190495209, 'samples': 4278528, 'steps': 22283, 'loss/train': 1.7475589513778687} -08/30/2021 17:12:13 - INFO - __main__ - Step 22285: {'lr': 0.0004771822041344085, 'samples': 4278720, 'steps': 22284, 'loss/train': 1.9920268058776855} -08/30/2021 17:12:13 - INFO - __main__ - Step 22286: {'lr': 0.0004771799891169312, 'samples': 4278912, 'steps': 22285, 'loss/train': 1.6034091711044312} -08/30/2021 17:12:14 - INFO - __main__ - Step 22287: {'lr': 0.0004771777739970902, 'samples': 4279104, 'steps': 22286, 'loss/train': 1.5661957263946533} -08/30/2021 17:12:14 - INFO - __main__ - Step 22288: {'lr': 0.0004771755587748863, 'samples': 4279296, 'steps': 22287, 'loss/train': 1.2716710567474365} -08/30/2021 17:12:14 - INFO - __main__ - Step 22289: {'lr': 0.00047717334345032065, 'samples': 4279488, 'steps': 22288, 'loss/train': 1.3670454025268555} -08/30/2021 17:12:16 - INFO - __main__ - Step 22290: {'lr': 0.0004771711280233942, 'samples': 4279680, 'steps': 22289, 'loss/train': 2.0890448093414307} -08/30/2021 17:12:17 - INFO - __main__ - Step 22291: {'lr': 0.000477168912494108, 'samples': 4279872, 'steps': 22290, 'loss/train': 1.223692536354065} -08/30/2021 17:12:17 - INFO - __main__ - Step 22292: {'lr': 0.00047716669686246287, 'samples': 4280064, 'steps': 22291, 'loss/train': 2.1673696041107178} -08/30/2021 17:12:17 - INFO - __main__ - Step 22293: {'lr': 0.00047716448112846, 'samples': 4280256, 'steps': 22292, 'loss/train': 1.7638188600540161} -08/30/2021 17:12:18 - INFO - __main__ - Step 22294: {'lr': 0.00047716226529210035, 'samples': 4280448, 'steps': 22293, 'loss/train': 1.263674020767212} -08/30/2021 17:12:18 - INFO - __main__ - Step 22295: {'lr': 0.00047716004935338484, 'samples': 4280640, 'steps': 22294, 'loss/train': 2.0301637649536133} -08/30/2021 17:12:20 - INFO - __main__ - Step 22296: {'lr': 0.0004771578333123145, 'samples': 4280832, 'steps': 22295, 'loss/train': 0.1532074362039566} -08/30/2021 17:12:21 - INFO - __main__ - Step 22297: {'lr': 0.00047715561716889037, 'samples': 4281024, 'steps': 22296, 'loss/train': 1.6346476078033447} -08/30/2021 17:12:21 - INFO - __main__ - Step 22298: {'lr': 0.0004771534009231134, 'samples': 4281216, 'steps': 22297, 'loss/train': 1.932807445526123} -08/30/2021 17:12:22 - INFO - __main__ - Step 22299: {'lr': 0.00047715118457498473, 'samples': 4281408, 'steps': 22298, 'loss/train': 1.622165322303772} -08/30/2021 17:12:22 - INFO - __main__ - Step 22300: {'lr': 0.00047714896812450514, 'samples': 4281600, 'steps': 22299, 'loss/train': 1.7235090732574463} -08/30/2021 17:12:22 - INFO - __main__ - Step 22301: {'lr': 0.00047714675157167573, 'samples': 4281792, 'steps': 22300, 'loss/train': 1.7315394878387451} -08/30/2021 17:12:24 - INFO - __main__ - Step 22302: {'lr': 0.00047714453491649753, 'samples': 4281984, 'steps': 22301, 'loss/train': 1.458749532699585} -08/30/2021 17:12:24 - INFO - __main__ - Step 22303: {'lr': 0.00047714231815897145, 'samples': 4282176, 'steps': 22302, 'loss/train': 1.760093092918396} -08/30/2021 17:12:25 - INFO - __main__ - Step 22304: {'lr': 0.0004771401012990986, 'samples': 4282368, 'steps': 22303, 'loss/train': 1.0102078914642334} -08/30/2021 17:12:25 - INFO - __main__ - Step 22305: {'lr': 0.0004771378843368799, 'samples': 4282560, 'steps': 22304, 'loss/train': 0.8581253290176392} -08/30/2021 17:12:25 - INFO - __main__ - Step 22306: {'lr': 0.0004771356672723164, 'samples': 4282752, 'steps': 22305, 'loss/train': 1.1559330224990845} -08/30/2021 17:12:27 - INFO - __main__ - Step 22307: {'lr': 0.0004771334501054091, 'samples': 4282944, 'steps': 22306, 'loss/train': 1.6413648128509521} -08/30/2021 17:12:27 - INFO - __main__ - Step 22308: {'lr': 0.0004771312328361589, 'samples': 4283136, 'steps': 22307, 'loss/train': 1.3504822254180908} -08/30/2021 17:12:28 - INFO - __main__ - Step 22309: {'lr': 0.0004771290154645669, 'samples': 4283328, 'steps': 22308, 'loss/train': 1.6743515729904175} -08/30/2021 17:12:28 - INFO - __main__ - Step 22310: {'lr': 0.0004771267979906341, 'samples': 4283520, 'steps': 22309, 'loss/train': 1.1398613452911377} -08/30/2021 17:12:28 - INFO - __main__ - Step 22311: {'lr': 0.0004771245804143615, 'samples': 4283712, 'steps': 22310, 'loss/train': 1.9536066055297852} -08/30/2021 17:12:30 - INFO - __main__ - Step 22312: {'lr': 0.00047712236273574993, 'samples': 4283904, 'steps': 22311, 'loss/train': 1.4108941555023193} -08/30/2021 17:12:30 - INFO - __main__ - Step 22313: {'lr': 0.0004771201449548006, 'samples': 4284096, 'steps': 22312, 'loss/train': 2.030109167098999} -08/30/2021 17:12:31 - INFO - __main__ - Step 22314: {'lr': 0.0004771179270715145, 'samples': 4284288, 'steps': 22313, 'loss/train': 1.5843579769134521} -08/30/2021 17:12:31 - INFO - __main__ - Step 22315: {'lr': 0.0004771157090858925, 'samples': 4284480, 'steps': 22314, 'loss/train': 1.4762053489685059} -08/30/2021 17:12:31 - INFO - __main__ - Step 22316: {'lr': 0.00047711349099793565, 'samples': 4284672, 'steps': 22315, 'loss/train': 1.261612892150879} -08/30/2021 17:12:33 - INFO - __main__ - Step 22317: {'lr': 0.00047711127280764497, 'samples': 4284864, 'steps': 22316, 'loss/train': 1.734206199645996} -08/30/2021 17:12:34 - INFO - __main__ - Step 22318: {'lr': 0.0004771090545150215, 'samples': 4285056, 'steps': 22317, 'loss/train': 2.0448877811431885} -08/30/2021 17:12:34 - INFO - __main__ - Step 22319: {'lr': 0.00047710683612006623, 'samples': 4285248, 'steps': 22318, 'loss/train': 1.1970142126083374} -08/30/2021 17:12:34 - INFO - __main__ - Step 22320: {'lr': 0.00047710461762278, 'samples': 4285440, 'steps': 22319, 'loss/train': 1.1002840995788574} -08/30/2021 17:12:35 - INFO - __main__ - Step 22321: {'lr': 0.00047710239902316404, 'samples': 4285632, 'steps': 22320, 'loss/train': 1.3517085313796997} -08/30/2021 17:12:35 - INFO - __main__ - Step 22322: {'lr': 0.0004771001803212192, 'samples': 4285824, 'steps': 22321, 'loss/train': 0.12081053853034973} -08/30/2021 17:12:36 - INFO - __main__ - Step 22323: {'lr': 0.0004770979615169466, 'samples': 4286016, 'steps': 22322, 'loss/train': 1.2311862707138062} -08/30/2021 17:12:37 - INFO - __main__ - Step 22324: {'lr': 0.00047709574261034705, 'samples': 4286208, 'steps': 22323, 'loss/train': 1.5089372396469116} -08/30/2021 17:12:37 - INFO - __main__ - Step 22325: {'lr': 0.0004770935236014217, 'samples': 4286400, 'steps': 22324, 'loss/train': 1.385047435760498} -08/30/2021 17:12:38 - INFO - __main__ - Step 22326: {'lr': 0.00047709130449017154, 'samples': 4286592, 'steps': 22325, 'loss/train': 1.8321505784988403} -08/30/2021 17:12:38 - INFO - __main__ - Step 22327: {'lr': 0.0004770890852765975, 'samples': 4286784, 'steps': 22326, 'loss/train': 1.692516565322876} -08/30/2021 17:12:39 - INFO - __main__ - Step 22328: {'lr': 0.00047708686596070065, 'samples': 4286976, 'steps': 22327, 'loss/train': 1.6043461561203003} -08/30/2021 17:12:40 - INFO - __main__ - Step 22329: {'lr': 0.00047708464654248195, 'samples': 4287168, 'steps': 22328, 'loss/train': 3.0700507164001465} -08/30/2021 17:12:40 - INFO - __main__ - Step 22330: {'lr': 0.0004770824270219424, 'samples': 4287360, 'steps': 22329, 'loss/train': 1.9059228897094727} -08/30/2021 17:12:41 - INFO - __main__ - Step 22331: {'lr': 0.0004770802073990831, 'samples': 4287552, 'steps': 22330, 'loss/train': 1.1868107318878174} -08/30/2021 17:12:41 - INFO - __main__ - Step 22332: {'lr': 0.00047707798767390486, 'samples': 4287744, 'steps': 22331, 'loss/train': 1.798985481262207} -08/30/2021 17:12:41 - INFO - __main__ - Step 22333: {'lr': 0.00047707576784640883, 'samples': 4287936, 'steps': 22332, 'loss/train': 1.9564640522003174} -08/30/2021 17:12:43 - INFO - __main__ - Step 22334: {'lr': 0.00047707354791659594, 'samples': 4288128, 'steps': 22333, 'loss/train': 1.6558359861373901} -08/30/2021 17:12:44 - INFO - __main__ - Step 22335: {'lr': 0.0004770713278844672, 'samples': 4288320, 'steps': 22334, 'loss/train': 1.7436270713806152} -08/30/2021 17:12:44 - INFO - __main__ - Step 22336: {'lr': 0.00047706910775002363, 'samples': 4288512, 'steps': 22335, 'loss/train': 1.8189456462860107} -08/30/2021 17:12:44 - INFO - __main__ - Step 22337: {'lr': 0.0004770668875132663, 'samples': 4288704, 'steps': 22336, 'loss/train': 0.8251792192459106} -08/30/2021 17:12:45 - INFO - __main__ - Step 22338: {'lr': 0.00047706466717419607, 'samples': 4288896, 'steps': 22337, 'loss/train': 1.2290778160095215} -08/30/2021 17:12:46 - INFO - __main__ - Step 22339: {'lr': 0.000477062446732814, 'samples': 4289088, 'steps': 22338, 'loss/train': 1.2256410121917725} -08/30/2021 17:12:47 - INFO - __main__ - Step 22340: {'lr': 0.0004770602261891211, 'samples': 4289280, 'steps': 22339, 'loss/train': 1.7080248594284058} -08/30/2021 17:12:47 - INFO - __main__ - Step 22341: {'lr': 0.00047705800554311836, 'samples': 4289472, 'steps': 22340, 'loss/train': 2.1394202709198} -08/30/2021 17:12:47 - INFO - __main__ - Step 22342: {'lr': 0.0004770557847948068, 'samples': 4289664, 'steps': 22341, 'loss/train': 0.19599613547325134} -08/30/2021 17:12:48 - INFO - __main__ - Step 22343: {'lr': 0.0004770535639441874, 'samples': 4289856, 'steps': 22342, 'loss/train': 1.7449849843978882} -08/30/2021 17:12:50 - INFO - __main__ - Step 22344: {'lr': 0.0004770513429912612, 'samples': 4290048, 'steps': 22343, 'loss/train': 1.2627513408660889} -08/30/2021 17:12:50 - INFO - __main__ - Step 22345: {'lr': 0.0004770491219360291, 'samples': 4290240, 'steps': 22344, 'loss/train': 1.4885687828063965} -08/30/2021 17:12:50 - INFO - __main__ - Step 22346: {'lr': 0.00047704690077849223, 'samples': 4290432, 'steps': 22345, 'loss/train': 1.65871000289917} -08/30/2021 17:12:51 - INFO - __main__ - Step 22347: {'lr': 0.0004770446795186515, 'samples': 4290624, 'steps': 22346, 'loss/train': 1.5663443803787231} -08/30/2021 17:12:51 - INFO - __main__ - Step 22348: {'lr': 0.0004770424581565079, 'samples': 4290816, 'steps': 22347, 'loss/train': 1.3566665649414062} -08/30/2021 17:12:54 - INFO - __main__ - Step 22349: {'lr': 0.0004770402366920625, 'samples': 4291008, 'steps': 22348, 'loss/train': 0.32403233647346497} -08/30/2021 17:12:54 - INFO - __main__ - Step 22350: {'lr': 0.00047703801512531636, 'samples': 4291200, 'steps': 22349, 'loss/train': 1.629690170288086} -08/30/2021 17:12:55 - INFO - __main__ - Step 22351: {'lr': 0.00047703579345627036, 'samples': 4291392, 'steps': 22350, 'loss/train': 1.9505356550216675} -08/30/2021 17:12:55 - INFO - __main__ - Step 22352: {'lr': 0.00047703357168492544, 'samples': 4291584, 'steps': 22351, 'loss/train': 1.5575278997421265} -08/30/2021 17:12:55 - INFO - __main__ - Step 22353: {'lr': 0.0004770313498112828, 'samples': 4291776, 'steps': 22352, 'loss/train': 1.1776572465896606} -08/30/2021 17:12:56 - INFO - __main__ - Step 22354: {'lr': 0.0004770291278353433, 'samples': 4291968, 'steps': 22353, 'loss/train': 1.4709523916244507} -08/30/2021 17:12:56 - INFO - __main__ - Step 22355: {'lr': 0.00047702690575710796, 'samples': 4292160, 'steps': 22354, 'loss/train': 2.1087942123413086} -08/30/2021 17:12:58 - INFO - __main__ - Step 22356: {'lr': 0.0004770246835765778, 'samples': 4292352, 'steps': 22355, 'loss/train': 1.793090581893921} -08/30/2021 17:12:58 - INFO - __main__ - Step 22357: {'lr': 0.0004770224612937538, 'samples': 4292544, 'steps': 22356, 'loss/train': 1.7314915657043457} -08/30/2021 17:12:58 - INFO - __main__ - Step 22358: {'lr': 0.0004770202389086371, 'samples': 4292736, 'steps': 22357, 'loss/train': 1.6197714805603027} -08/30/2021 17:12:59 - INFO - __main__ - Step 22359: {'lr': 0.0004770180164212284, 'samples': 4292928, 'steps': 22358, 'loss/train': 2.251490831375122} -08/30/2021 17:12:59 - INFO - __main__ - Step 22360: {'lr': 0.00047701579383152906, 'samples': 4293120, 'steps': 22359, 'loss/train': 1.3303654193878174} -08/30/2021 17:13:01 - INFO - __main__ - Step 22361: {'lr': 0.0004770135711395398, 'samples': 4293312, 'steps': 22360, 'loss/train': 1.2282088994979858} -08/30/2021 17:13:01 - INFO - __main__ - Step 22362: {'lr': 0.0004770113483452618, 'samples': 4293504, 'steps': 22361, 'loss/train': 2.1275947093963623} -08/30/2021 17:13:02 - INFO - __main__ - Step 22363: {'lr': 0.00047700912544869595, 'samples': 4293696, 'steps': 22362, 'loss/train': 2.052558183670044} -08/30/2021 17:13:02 - INFO - __main__ - Step 22364: {'lr': 0.0004770069024498433, 'samples': 4293888, 'steps': 22363, 'loss/train': 1.709843635559082} -08/30/2021 17:13:02 - INFO - __main__ - Step 22365: {'lr': 0.00047700467934870484, 'samples': 4294080, 'steps': 22364, 'loss/train': 0.11012905836105347} -08/30/2021 17:13:05 - INFO - __main__ - Step 22366: {'lr': 0.0004770024561452816, 'samples': 4294272, 'steps': 22365, 'loss/train': 1.4906331300735474} -08/30/2021 17:13:05 - INFO - __main__ - Step 22367: {'lr': 0.0004770002328395745, 'samples': 4294464, 'steps': 22366, 'loss/train': 1.7107250690460205} -08/30/2021 17:13:05 - INFO - __main__ - Step 22368: {'lr': 0.00047699800943158454, 'samples': 4294656, 'steps': 22367, 'loss/train': 0.14216406643390656} -08/30/2021 17:13:06 - INFO - __main__ - Step 22369: {'lr': 0.0004769957859213129, 'samples': 4294848, 'steps': 22368, 'loss/train': 1.6559343338012695} -08/30/2021 17:13:06 - INFO - __main__ - Step 22370: {'lr': 0.00047699356230876047, 'samples': 4295040, 'steps': 22369, 'loss/train': 1.896594762802124} -08/30/2021 17:13:07 - INFO - __main__ - Step 22371: {'lr': 0.0004769913385939282, 'samples': 4295232, 'steps': 22370, 'loss/train': 1.1542118787765503} -08/30/2021 17:13:07 - INFO - __main__ - Step 22372: {'lr': 0.0004769891147768171, 'samples': 4295424, 'steps': 22371, 'loss/train': 2.6675169467926025} -08/30/2021 17:13:07 - INFO - __main__ - Step 22373: {'lr': 0.00047698689085742823, 'samples': 4295616, 'steps': 22372, 'loss/train': 1.9953951835632324} -08/30/2021 17:13:09 - INFO - __main__ - Step 22374: {'lr': 0.00047698466683576256, 'samples': 4295808, 'steps': 22373, 'loss/train': 1.745845913887024} -08/30/2021 17:13:09 - INFO - __main__ - Step 22375: {'lr': 0.0004769824427118211, 'samples': 4296000, 'steps': 22374, 'loss/train': 1.9689626693725586} -08/30/2021 17:13:09 - INFO - __main__ - Step 22376: {'lr': 0.00047698021848560494, 'samples': 4296192, 'steps': 22375, 'loss/train': 2.4756383895874023} -08/30/2021 17:13:10 - INFO - __main__ - Step 22377: {'lr': 0.0004769779941571149, 'samples': 4296384, 'steps': 22376, 'loss/train': 1.3743934631347656} -08/30/2021 17:13:10 - INFO - __main__ - Step 22378: {'lr': 0.00047697576972635213, 'samples': 4296576, 'steps': 22377, 'loss/train': 1.7336702346801758} -08/30/2021 17:13:12 - INFO - __main__ - Step 22379: {'lr': 0.0004769735451933176, 'samples': 4296768, 'steps': 22378, 'loss/train': 1.7430158853530884} -08/30/2021 17:13:12 - INFO - __main__ - Step 22380: {'lr': 0.0004769713205580122, 'samples': 4296960, 'steps': 22379, 'loss/train': 1.7553653717041016} -08/30/2021 17:13:12 - INFO - __main__ - Step 22381: {'lr': 0.0004769690958204371, 'samples': 4297152, 'steps': 22380, 'loss/train': 1.4760040044784546} -08/30/2021 17:13:13 - INFO - __main__ - Step 22382: {'lr': 0.0004769668709805932, 'samples': 4297344, 'steps': 22381, 'loss/train': 2.4359185695648193} -08/30/2021 17:13:13 - INFO - __main__ - Step 22383: {'lr': 0.0004769646460384816, 'samples': 4297536, 'steps': 22382, 'loss/train': 2.0891146659851074} -08/30/2021 17:13:15 - INFO - __main__ - Step 22384: {'lr': 0.00047696242099410307, 'samples': 4297728, 'steps': 22383, 'loss/train': 1.869328498840332} -08/30/2021 17:13:15 - INFO - __main__ - Step 22385: {'lr': 0.00047696019584745887, 'samples': 4297920, 'steps': 22384, 'loss/train': 1.9483591318130493} -08/30/2021 17:13:15 - INFO - __main__ - Step 22386: {'lr': 0.00047695797059854996, 'samples': 4298112, 'steps': 22385, 'loss/train': 1.746274471282959} -08/30/2021 17:13:16 - INFO - __main__ - Step 22387: {'lr': 0.0004769557452473772, 'samples': 4298304, 'steps': 22386, 'loss/train': 2.275529384613037} -08/30/2021 17:13:16 - INFO - __main__ - Step 22388: {'lr': 0.00047695351979394173, 'samples': 4298496, 'steps': 22387, 'loss/train': 1.8169291019439697} -08/30/2021 17:13:18 - INFO - __main__ - Step 22389: {'lr': 0.00047695129423824454, 'samples': 4298688, 'steps': 22388, 'loss/train': 2.1064412593841553} -08/30/2021 17:13:18 - INFO - __main__ - Step 22390: {'lr': 0.0004769490685802865, 'samples': 4298880, 'steps': 22389, 'loss/train': 1.5430718660354614} -08/30/2021 17:13:18 - INFO - __main__ - Step 22391: {'lr': 0.00047694684282006885, 'samples': 4299072, 'steps': 22390, 'loss/train': 1.8566498756408691} -08/30/2021 17:13:19 - INFO - __main__ - Step 22392: {'lr': 0.00047694461695759236, 'samples': 4299264, 'steps': 22391, 'loss/train': 1.4858124256134033} -08/30/2021 17:13:19 - INFO - __main__ - Step 22393: {'lr': 0.00047694239099285815, 'samples': 4299456, 'steps': 22392, 'loss/train': 1.1314911842346191} -08/30/2021 17:13:21 - INFO - __main__ - Step 22394: {'lr': 0.00047694016492586715, 'samples': 4299648, 'steps': 22393, 'loss/train': 1.2198786735534668} -08/30/2021 17:13:21 - INFO - __main__ - Step 22395: {'lr': 0.0004769379387566205, 'samples': 4299840, 'steps': 22394, 'loss/train': 2.0493226051330566} -08/30/2021 17:13:21 - INFO - __main__ - Step 22396: {'lr': 0.000476935712485119, 'samples': 4300032, 'steps': 22395, 'loss/train': 1.9728707075119019} -08/30/2021 17:13:22 - INFO - __main__ - Step 22397: {'lr': 0.0004769334861113639, 'samples': 4300224, 'steps': 22396, 'loss/train': 1.7758984565734863} -08/30/2021 17:13:22 - INFO - __main__ - Step 22398: {'lr': 0.000476931259635356, 'samples': 4300416, 'steps': 22397, 'loss/train': 1.9279731512069702} -08/30/2021 17:13:24 - INFO - __main__ - Step 22399: {'lr': 0.00047692903305709646, 'samples': 4300608, 'steps': 22398, 'loss/train': 1.7467641830444336} -08/30/2021 17:13:25 - INFO - __main__ - Step 22400: {'lr': 0.0004769268063765861, 'samples': 4300800, 'steps': 22399, 'loss/train': 1.9367769956588745} -08/30/2021 17:13:25 - INFO - __main__ - Step 22401: {'lr': 0.00047692457959382605, 'samples': 4300992, 'steps': 22400, 'loss/train': 2.1889874935150146} -08/30/2021 17:13:25 - INFO - __main__ - Step 22402: {'lr': 0.0004769223527088173, 'samples': 4301184, 'steps': 22401, 'loss/train': 3.266441583633423} -08/30/2021 17:13:26 - INFO - __main__ - Step 22403: {'lr': 0.00047692012572156086, 'samples': 4301376, 'steps': 22402, 'loss/train': 2.4790022373199463} -08/30/2021 17:13:26 - INFO - __main__ - Step 22404: {'lr': 0.00047691789863205764, 'samples': 4301568, 'steps': 22403, 'loss/train': 1.6065174341201782} -08/30/2021 17:13:26 - INFO - __main__ - Step 22405: {'lr': 0.0004769156714403088, 'samples': 4301760, 'steps': 22404, 'loss/train': 0.8410873413085938} -08/30/2021 17:13:28 - INFO - __main__ - Step 22406: {'lr': 0.0004769134441463152, 'samples': 4301952, 'steps': 22405, 'loss/train': 1.2901523113250732} -08/30/2021 17:13:29 - INFO - __main__ - Step 22407: {'lr': 0.0004769112167500779, 'samples': 4302144, 'steps': 22406, 'loss/train': 1.9885972738265991} -08/30/2021 17:13:29 - INFO - __main__ - Step 22408: {'lr': 0.00047690898925159796, 'samples': 4302336, 'steps': 22407, 'loss/train': 2.138716697692871} -08/30/2021 17:13:30 - INFO - __main__ - Step 22409: {'lr': 0.0004769067616508763, 'samples': 4302528, 'steps': 22408, 'loss/train': 1.79085111618042} -08/30/2021 17:13:30 - INFO - __main__ - Step 22410: {'lr': 0.00047690453394791393, 'samples': 4302720, 'steps': 22409, 'loss/train': 2.0332047939300537} -08/30/2021 17:13:30 - INFO - __main__ - Step 22411: {'lr': 0.0004769023061427119, 'samples': 4302912, 'steps': 22410, 'loss/train': 1.719641923904419} -08/30/2021 17:13:32 - INFO - __main__ - Step 22412: {'lr': 0.0004769000782352713, 'samples': 4303104, 'steps': 22411, 'loss/train': 2.0749473571777344} -08/30/2021 17:13:33 - INFO - __main__ - Step 22413: {'lr': 0.00047689785022559284, 'samples': 4303296, 'steps': 22412, 'loss/train': 2.0759830474853516} -08/30/2021 17:13:33 - INFO - __main__ - Step 22414: {'lr': 0.0004768956221136778, 'samples': 4303488, 'steps': 22413, 'loss/train': 1.7461432218551636} -08/30/2021 17:13:33 - INFO - __main__ - Step 22415: {'lr': 0.00047689339389952713, 'samples': 4303680, 'steps': 22414, 'loss/train': 1.7579646110534668} -08/30/2021 17:13:34 - INFO - __main__ - Step 22416: {'lr': 0.0004768911655831417, 'samples': 4303872, 'steps': 22415, 'loss/train': 2.2065553665161133} -08/30/2021 17:13:35 - INFO - __main__ - Step 22417: {'lr': 0.0004768889371645227, 'samples': 4304064, 'steps': 22416, 'loss/train': 1.7390761375427246} -08/30/2021 17:13:36 - INFO - __main__ - Step 22418: {'lr': 0.000476886708643671, 'samples': 4304256, 'steps': 22417, 'loss/train': 1.4862357378005981} -08/30/2021 17:13:36 - INFO - __main__ - Step 22419: {'lr': 0.0004768844800205877, 'samples': 4304448, 'steps': 22418, 'loss/train': 1.667893648147583} -08/30/2021 17:13:37 - INFO - __main__ - Step 22420: {'lr': 0.0004768822512952737, 'samples': 4304640, 'steps': 22419, 'loss/train': 1.1174753904342651} -08/30/2021 17:13:37 - INFO - __main__ - Step 22421: {'lr': 0.0004768800224677301, 'samples': 4304832, 'steps': 22420, 'loss/train': 1.2558841705322266} -08/30/2021 17:13:39 - INFO - __main__ - Step 22422: {'lr': 0.0004768777935379578, 'samples': 4305024, 'steps': 22421, 'loss/train': 1.9752498865127563} -08/30/2021 17:13:39 - INFO - __main__ - Step 22423: {'lr': 0.0004768755645059579, 'samples': 4305216, 'steps': 22422, 'loss/train': 1.7126777172088623} -08/30/2021 17:13:39 - INFO - __main__ - Step 22424: {'lr': 0.00047687333537173136, 'samples': 4305408, 'steps': 22423, 'loss/train': 1.5196870565414429} -08/30/2021 17:13:40 - INFO - __main__ - Step 22425: {'lr': 0.00047687110613527924, 'samples': 4305600, 'steps': 22424, 'loss/train': 2.162867307662964} -08/30/2021 17:13:40 - INFO - __main__ - Step 22426: {'lr': 0.00047686887679660253, 'samples': 4305792, 'steps': 22425, 'loss/train': 1.4038060903549194} -08/30/2021 17:13:42 - INFO - __main__ - Step 22427: {'lr': 0.0004768666473557021, 'samples': 4305984, 'steps': 22426, 'loss/train': 0.17870919406414032} -08/30/2021 17:13:42 - INFO - __main__ - Step 22428: {'lr': 0.0004768644178125791, 'samples': 4306176, 'steps': 22427, 'loss/train': 1.2794487476348877} -08/30/2021 17:13:43 - INFO - __main__ - Step 22429: {'lr': 0.0004768621881672345, 'samples': 4306368, 'steps': 22428, 'loss/train': 1.6502145528793335} -08/30/2021 17:13:43 - INFO - __main__ - Step 22430: {'lr': 0.00047685995841966936, 'samples': 4306560, 'steps': 22429, 'loss/train': 1.9061843156814575} -08/30/2021 17:13:43 - INFO - __main__ - Step 22431: {'lr': 0.0004768577285698845, 'samples': 4306752, 'steps': 22430, 'loss/train': 1.8811677694320679} -08/30/2021 17:13:45 - INFO - __main__ - Step 22432: {'lr': 0.00047685549861788113, 'samples': 4306944, 'steps': 22431, 'loss/train': 1.7884986400604248} -08/30/2021 17:13:45 - INFO - __main__ - Step 22433: {'lr': 0.0004768532685636602, 'samples': 4307136, 'steps': 22432, 'loss/train': 1.5401004552841187} -08/30/2021 17:13:46 - INFO - __main__ - Step 22434: {'lr': 0.0004768510384072226, 'samples': 4307328, 'steps': 22433, 'loss/train': 1.6148316860198975} -08/30/2021 17:13:46 - INFO - __main__ - Step 22435: {'lr': 0.0004768488081485695, 'samples': 4307520, 'steps': 22434, 'loss/train': 1.414378046989441} -08/30/2021 17:13:46 - INFO - __main__ - Step 22436: {'lr': 0.0004768465777877018, 'samples': 4307712, 'steps': 22435, 'loss/train': 1.9817149639129639} -08/30/2021 17:13:47 - INFO - __main__ - Step 22437: {'lr': 0.0004768443473246205, 'samples': 4307904, 'steps': 22436, 'loss/train': 1.8146398067474365} -08/30/2021 17:13:48 - INFO - __main__ - Step 22438: {'lr': 0.00047684211675932665, 'samples': 4308096, 'steps': 22437, 'loss/train': 1.8666608333587646} -08/30/2021 17:13:49 - INFO - __main__ - Step 22439: {'lr': 0.0004768398860918213, 'samples': 4308288, 'steps': 22438, 'loss/train': 2.1716370582580566} -08/30/2021 17:13:49 - INFO - __main__ - Step 22440: {'lr': 0.0004768376553221053, 'samples': 4308480, 'steps': 22439, 'loss/train': 1.9423466920852661} -08/30/2021 17:13:49 - INFO - __main__ - Step 22441: {'lr': 0.0004768354244501798, 'samples': 4308672, 'steps': 22440, 'loss/train': 1.6935824155807495} -08/30/2021 17:13:50 - INFO - __main__ - Step 22442: {'lr': 0.0004768331934760458, 'samples': 4308864, 'steps': 22441, 'loss/train': 1.7347948551177979} -08/30/2021 17:13:51 - INFO - __main__ - Step 22443: {'lr': 0.00047683096239970423, 'samples': 4309056, 'steps': 22442, 'loss/train': 1.7142823934555054} -08/30/2021 17:13:52 - INFO - __main__ - Step 22444: {'lr': 0.0004768287312211561, 'samples': 4309248, 'steps': 22443, 'loss/train': 0.21094796061515808} -08/30/2021 17:13:52 - INFO - __main__ - Step 22445: {'lr': 0.0004768264999404025, 'samples': 4309440, 'steps': 22444, 'loss/train': 1.8671423196792603} -08/30/2021 17:13:52 - INFO - __main__ - Step 22446: {'lr': 0.00047682426855744434, 'samples': 4309632, 'steps': 22445, 'loss/train': 1.7412782907485962} -08/30/2021 17:13:53 - INFO - __main__ - Step 22447: {'lr': 0.00047682203707228264, 'samples': 4309824, 'steps': 22446, 'loss/train': 1.6040568351745605} -08/30/2021 17:13:55 - INFO - __main__ - Step 22448: {'lr': 0.00047681980548491853, 'samples': 4310016, 'steps': 22447, 'loss/train': 1.5771088600158691} -08/30/2021 17:13:55 - INFO - __main__ - Step 22449: {'lr': 0.00047681757379535285, 'samples': 4310208, 'steps': 22448, 'loss/train': 1.3620716333389282} -08/30/2021 17:13:55 - INFO - __main__ - Step 22450: {'lr': 0.00047681534200358665, 'samples': 4310400, 'steps': 22449, 'loss/train': 1.7939502000808716} -08/30/2021 17:13:56 - INFO - __main__ - Step 22451: {'lr': 0.000476813110109621, 'samples': 4310592, 'steps': 22450, 'loss/train': 1.5142356157302856} -08/30/2021 17:13:56 - INFO - __main__ - Step 22452: {'lr': 0.0004768108781134568, 'samples': 4310784, 'steps': 22451, 'loss/train': 3.149855375289917} -08/30/2021 17:13:56 - INFO - __main__ - Step 22453: {'lr': 0.0004768086460150952, 'samples': 4310976, 'steps': 22452, 'loss/train': 1.7269551753997803} -08/30/2021 17:13:58 - INFO - __main__ - Step 22454: {'lr': 0.00047680641381453703, 'samples': 4311168, 'steps': 22453, 'loss/train': 0.6760121583938599} -08/30/2021 17:13:58 - INFO - __main__ - Step 22455: {'lr': 0.0004768041815117835, 'samples': 4311360, 'steps': 22454, 'loss/train': 1.962514042854309} -08/30/2021 17:13:59 - INFO - __main__ - Step 22456: {'lr': 0.00047680194910683545, 'samples': 4311552, 'steps': 22455, 'loss/train': 1.614229679107666} -08/30/2021 17:13:59 - INFO - __main__ - Step 22457: {'lr': 0.0004767997165996939, 'samples': 4311744, 'steps': 22456, 'loss/train': 1.7352981567382812} -08/30/2021 17:13:59 - INFO - __main__ - Step 22458: {'lr': 0.00047679748399035994, 'samples': 4311936, 'steps': 22457, 'loss/train': 1.9201675653457642} -08/30/2021 17:14:01 - INFO - __main__ - Step 22459: {'lr': 0.00047679525127883456, 'samples': 4312128, 'steps': 22458, 'loss/train': 2.225206136703491} -08/30/2021 17:14:01 - INFO - __main__ - Step 22460: {'lr': 0.0004767930184651187, 'samples': 4312320, 'steps': 22459, 'loss/train': 1.8964154720306396} -08/30/2021 17:14:02 - INFO - __main__ - Step 22461: {'lr': 0.0004767907855492134, 'samples': 4312512, 'steps': 22460, 'loss/train': 2.0226051807403564} -08/30/2021 17:14:02 - INFO - __main__ - Step 22462: {'lr': 0.0004767885525311197, 'samples': 4312704, 'steps': 22461, 'loss/train': 1.9483298063278198} -08/30/2021 17:14:02 - INFO - __main__ - Step 22463: {'lr': 0.0004767863194108386, 'samples': 4312896, 'steps': 22462, 'loss/train': 1.5516774654388428} -08/30/2021 17:14:04 - INFO - __main__ - Step 22464: {'lr': 0.000476784086188371, 'samples': 4313088, 'steps': 22463, 'loss/train': 2.108454465866089} -08/30/2021 17:14:05 - INFO - __main__ - Step 22465: {'lr': 0.00047678185286371803, 'samples': 4313280, 'steps': 22464, 'loss/train': 1.8621517419815063} -08/30/2021 17:14:05 - INFO - __main__ - Step 22466: {'lr': 0.0004767796194368807, 'samples': 4313472, 'steps': 22465, 'loss/train': 2.0400550365448} -08/30/2021 17:14:06 - INFO - __main__ - Step 22467: {'lr': 0.00047677738590786, 'samples': 4313664, 'steps': 22466, 'loss/train': 5.935624599456787} -08/30/2021 17:14:06 - INFO - __main__ - Step 22468: {'lr': 0.0004767751522766568, 'samples': 4313856, 'steps': 22467, 'loss/train': 1.3310096263885498} -08/30/2021 17:14:08 - INFO - __main__ - Step 22469: {'lr': 0.00047677291854327224, 'samples': 4314048, 'steps': 22468, 'loss/train': 1.2661097049713135} -08/30/2021 17:14:08 - INFO - __main__ - Step 22470: {'lr': 0.00047677068470770737, 'samples': 4314240, 'steps': 22469, 'loss/train': 1.8714877367019653} -08/30/2021 17:14:08 - INFO - __main__ - Step 22471: {'lr': 0.00047676845076996305, 'samples': 4314432, 'steps': 22470, 'loss/train': 1.7654696702957153} -08/30/2021 17:14:09 - INFO - __main__ - Step 22472: {'lr': 0.0004767662167300404, 'samples': 4314624, 'steps': 22471, 'loss/train': 0.48746439814567566} -08/30/2021 17:14:09 - INFO - __main__ - Step 22473: {'lr': 0.0004767639825879404, 'samples': 4314816, 'steps': 22472, 'loss/train': 1.8187942504882812} -08/30/2021 17:14:09 - INFO - __main__ - Step 22474: {'lr': 0.000476761748343664, 'samples': 4315008, 'steps': 22473, 'loss/train': 0.5924195647239685} -08/30/2021 17:14:11 - INFO - __main__ - Step 22475: {'lr': 0.00047675951399721235, 'samples': 4315200, 'steps': 22474, 'loss/train': 1.7742091417312622} -08/30/2021 17:14:11 - INFO - __main__ - Step 22476: {'lr': 0.0004767572795485863, 'samples': 4315392, 'steps': 22475, 'loss/train': 1.7919718027114868} -08/30/2021 17:14:12 - INFO - __main__ - Step 22477: {'lr': 0.00047675504499778695, 'samples': 4315584, 'steps': 22476, 'loss/train': 2.61266827583313} -08/30/2021 17:14:12 - INFO - __main__ - Step 22478: {'lr': 0.0004767528103448152, 'samples': 4315776, 'steps': 22477, 'loss/train': 1.3702067136764526} -08/30/2021 17:14:12 - INFO - __main__ - Step 22479: {'lr': 0.00047675057558967224, 'samples': 4315968, 'steps': 22478, 'loss/train': 1.984159231185913} -08/30/2021 17:14:14 - INFO - __main__ - Step 22480: {'lr': 0.0004767483407323589, 'samples': 4316160, 'steps': 22479, 'loss/train': 2.2095019817352295} -08/30/2021 17:14:14 - INFO - __main__ - Step 22481: {'lr': 0.00047674610577287625, 'samples': 4316352, 'steps': 22480, 'loss/train': 1.7467973232269287} -08/30/2021 17:14:15 - INFO - __main__ - Step 22482: {'lr': 0.00047674387071122536, 'samples': 4316544, 'steps': 22481, 'loss/train': 1.6091501712799072} -08/30/2021 17:14:15 - INFO - __main__ - Step 22483: {'lr': 0.0004767416355474071, 'samples': 4316736, 'steps': 22482, 'loss/train': 1.6895766258239746} -08/30/2021 17:14:15 - INFO - __main__ - Step 22484: {'lr': 0.00047673940028142265, 'samples': 4316928, 'steps': 22483, 'loss/train': 1.633849024772644} -08/30/2021 17:14:17 - INFO - __main__ - Step 22485: {'lr': 0.0004767371649132729, 'samples': 4317120, 'steps': 22484, 'loss/train': 1.660505771636963} -08/30/2021 17:14:17 - INFO - __main__ - Step 22486: {'lr': 0.00047673492944295883, 'samples': 4317312, 'steps': 22485, 'loss/train': 1.2509496212005615} -08/30/2021 17:14:18 - INFO - __main__ - Step 22487: {'lr': 0.0004767326938704816, 'samples': 4317504, 'steps': 22486, 'loss/train': 1.9188863039016724} -08/30/2021 17:14:18 - INFO - __main__ - Step 22488: {'lr': 0.00047673045819584197, 'samples': 4317696, 'steps': 22487, 'loss/train': 1.0761938095092773} -08/30/2021 17:14:18 - INFO - __main__ - Step 22489: {'lr': 0.0004767282224190412, 'samples': 4317888, 'steps': 22488, 'loss/train': 1.7531883716583252} -08/30/2021 17:14:20 - INFO - __main__ - Step 22490: {'lr': 0.00047672598654008015, 'samples': 4318080, 'steps': 22489, 'loss/train': 1.7927989959716797} -08/30/2021 17:14:20 - INFO - __main__ - Step 22491: {'lr': 0.0004767237505589599, 'samples': 4318272, 'steps': 22490, 'loss/train': 1.0618451833724976} -08/30/2021 17:14:21 - INFO - __main__ - Step 22492: {'lr': 0.0004767215144756814, 'samples': 4318464, 'steps': 22491, 'loss/train': 1.719399094581604} -08/30/2021 17:14:21 - INFO - __main__ - Step 22493: {'lr': 0.0004767192782902457, 'samples': 4318656, 'steps': 22492, 'loss/train': 1.0271601676940918} -08/30/2021 17:14:21 - INFO - __main__ - Step 22494: {'lr': 0.0004767170420026538, 'samples': 4318848, 'steps': 22493, 'loss/train': 0.9355188012123108} -08/30/2021 17:14:23 - INFO - __main__ - Step 22495: {'lr': 0.0004767148056129067, 'samples': 4319040, 'steps': 22494, 'loss/train': 2.2111897468566895} -08/30/2021 17:14:23 - INFO - __main__ - Step 22496: {'lr': 0.0004767125691210054, 'samples': 4319232, 'steps': 22495, 'loss/train': 1.777457356452942} -08/30/2021 17:14:24 - INFO - __main__ - Step 22497: {'lr': 0.00047671033252695083, 'samples': 4319424, 'steps': 22496, 'loss/train': 1.7731730937957764} -08/30/2021 17:14:24 - INFO - __main__ - Step 22498: {'lr': 0.0004767080958307442, 'samples': 4319616, 'steps': 22497, 'loss/train': 1.4276859760284424} -08/30/2021 17:14:24 - INFO - __main__ - Step 22499: {'lr': 0.0004767058590323864, 'samples': 4319808, 'steps': 22498, 'loss/train': 1.6239917278289795} -08/30/2021 17:14:26 - INFO - __main__ - Step 22500: {'lr': 0.00047670362213187833, 'samples': 4320000, 'steps': 22499, 'loss/train': 1.0119229555130005} -08/30/2021 17:14:27 - INFO - __main__ - Step 22501: {'lr': 0.0004767013851292212, 'samples': 4320192, 'steps': 22500, 'loss/train': 1.2648358345031738} -08/30/2021 17:14:27 - INFO - __main__ - Step 22502: {'lr': 0.0004766991480244159, 'samples': 4320384, 'steps': 22501, 'loss/train': 0.3033278286457062} -08/30/2021 17:14:28 - INFO - __main__ - Step 22503: {'lr': 0.0004766969108174635, 'samples': 4320576, 'steps': 22502, 'loss/train': 0.16322974860668182} -08/30/2021 17:14:28 - INFO - __main__ - Step 22504: {'lr': 0.0004766946735083649, 'samples': 4320768, 'steps': 22503, 'loss/train': 1.9770796298980713} -08/30/2021 17:14:30 - INFO - __main__ - Step 22505: {'lr': 0.0004766924360971212, 'samples': 4320960, 'steps': 22504, 'loss/train': 1.3510984182357788} -08/30/2021 17:14:30 - INFO - __main__ - Step 22506: {'lr': 0.00047669019858373343, 'samples': 4321152, 'steps': 22505, 'loss/train': 1.9653582572937012} -08/30/2021 17:14:30 - INFO - __main__ - Step 22507: {'lr': 0.00047668796096820247, 'samples': 4321344, 'steps': 22506, 'loss/train': 0.5082666277885437} -08/30/2021 17:14:31 - INFO - __main__ - Step 22508: {'lr': 0.00047668572325052953, 'samples': 4321536, 'steps': 22507, 'loss/train': 1.9479482173919678} -08/30/2021 17:14:31 - INFO - __main__ - Step 22509: {'lr': 0.00047668348543071536, 'samples': 4321728, 'steps': 22508, 'loss/train': 1.757729172706604} -08/30/2021 17:14:31 - INFO - __main__ - Step 22510: {'lr': 0.00047668124750876117, 'samples': 4321920, 'steps': 22509, 'loss/train': 3.3465144634246826} -08/30/2021 17:14:33 - INFO - __main__ - Step 22511: {'lr': 0.0004766790094846679, 'samples': 4322112, 'steps': 22510, 'loss/train': 2.3180856704711914} -08/30/2021 17:14:34 - INFO - __main__ - Step 22512: {'lr': 0.0004766767713584367, 'samples': 4322304, 'steps': 22511, 'loss/train': 1.4776660203933716} -08/30/2021 17:14:34 - INFO - __main__ - Step 22513: {'lr': 0.00047667453313006826, 'samples': 4322496, 'steps': 22512, 'loss/train': 1.8642196655273438} -08/30/2021 17:14:34 - INFO - __main__ - Step 22514: {'lr': 0.00047667229479956386, 'samples': 4322688, 'steps': 22513, 'loss/train': 1.3936805725097656} -08/30/2021 17:14:35 - INFO - __main__ - Step 22515: {'lr': 0.0004766700563669244, 'samples': 4322880, 'steps': 22514, 'loss/train': 1.9357175827026367} -08/30/2021 17:14:35 - INFO - __main__ - Step 22516: {'lr': 0.0004766678178321509, 'samples': 4323072, 'steps': 22515, 'loss/train': 0.9189608097076416} -08/30/2021 17:14:37 - INFO - __main__ - Step 22517: {'lr': 0.0004766655791952444, 'samples': 4323264, 'steps': 22516, 'loss/train': 1.9477885961532593} -08/30/2021 17:14:38 - INFO - __main__ - Step 22518: {'lr': 0.0004766633404562059, 'samples': 4323456, 'steps': 22517, 'loss/train': 0.5487386584281921} -08/30/2021 17:14:38 - INFO - __main__ - Step 22519: {'lr': 0.0004766611016150364, 'samples': 4323648, 'steps': 22518, 'loss/train': 1.230427861213684} -08/30/2021 17:14:38 - INFO - __main__ - Step 22520: {'lr': 0.00047665886267173686, 'samples': 4323840, 'steps': 22519, 'loss/train': 1.2861769199371338} -08/30/2021 17:14:39 - INFO - __main__ - Step 22521: {'lr': 0.00047665662362630836, 'samples': 4324032, 'steps': 22520, 'loss/train': 1.6450291872024536} -08/30/2021 17:14:40 - INFO - __main__ - Step 22522: {'lr': 0.00047665438447875186, 'samples': 4324224, 'steps': 22521, 'loss/train': 1.6257888078689575} -08/30/2021 17:14:41 - INFO - __main__ - Step 22523: {'lr': 0.0004766521452290684, 'samples': 4324416, 'steps': 22522, 'loss/train': 2.009296417236328} -08/30/2021 17:14:41 - INFO - __main__ - Step 22524: {'lr': 0.00047664990587725905, 'samples': 4324608, 'steps': 22523, 'loss/train': 1.138895034790039} -08/30/2021 17:14:41 - INFO - __main__ - Step 22525: {'lr': 0.0004766476664233247, 'samples': 4324800, 'steps': 22524, 'loss/train': 1.378551959991455} -08/30/2021 17:14:42 - INFO - __main__ - Step 22526: {'lr': 0.0004766454268672664, 'samples': 4324992, 'steps': 22525, 'loss/train': 1.2025744915008545} -08/30/2021 17:14:42 - INFO - __main__ - Step 22527: {'lr': 0.00047664318720908516, 'samples': 4325184, 'steps': 22526, 'loss/train': 2.2128894329071045} -08/30/2021 17:14:44 - INFO - __main__ - Step 22528: {'lr': 0.000476640947448782, 'samples': 4325376, 'steps': 22527, 'loss/train': 2.173571825027466} -08/30/2021 17:14:44 - INFO - __main__ - Step 22529: {'lr': 0.000476638707586358, 'samples': 4325568, 'steps': 22528, 'loss/train': 1.637187123298645} -08/30/2021 17:14:44 - INFO - __main__ - Step 22530: {'lr': 0.000476636467621814, 'samples': 4325760, 'steps': 22529, 'loss/train': 1.5273845195770264} -08/30/2021 17:14:45 - INFO - __main__ - Step 22531: {'lr': 0.00047663422755515113, 'samples': 4325952, 'steps': 22530, 'loss/train': 1.323721170425415} -08/30/2021 17:14:45 - INFO - __main__ - Step 22532: {'lr': 0.00047663198738637035, 'samples': 4326144, 'steps': 22531, 'loss/train': 1.6435048580169678} -08/30/2021 17:14:47 - INFO - __main__ - Step 22533: {'lr': 0.00047662974711547274, 'samples': 4326336, 'steps': 22532, 'loss/train': 1.8532849550247192} -08/30/2021 17:14:47 - INFO - __main__ - Step 22534: {'lr': 0.0004766275067424593, 'samples': 4326528, 'steps': 22533, 'loss/train': 1.458275318145752} -08/30/2021 17:14:47 - INFO - __main__ - Step 22535: {'lr': 0.0004766252662673309, 'samples': 4326720, 'steps': 22534, 'loss/train': 1.8849378824234009} -08/30/2021 17:14:48 - INFO - __main__ - Step 22536: {'lr': 0.0004766230256900887, 'samples': 4326912, 'steps': 22535, 'loss/train': 1.1653574705123901} -08/30/2021 17:14:48 - INFO - __main__ - Step 22537: {'lr': 0.0004766207850107337, 'samples': 4327104, 'steps': 22536, 'loss/train': 1.4604711532592773} -08/30/2021 17:14:50 - INFO - __main__ - Step 22538: {'lr': 0.00047661854422926674, 'samples': 4327296, 'steps': 22537, 'loss/train': 2.063953161239624} -08/30/2021 17:14:50 - INFO - __main__ - Step 22539: {'lr': 0.0004766163033456891, 'samples': 4327488, 'steps': 22538, 'loss/train': 1.9041965007781982} -08/30/2021 17:14:51 - INFO - __main__ - Step 22540: {'lr': 0.0004766140623600016, 'samples': 4327680, 'steps': 22539, 'loss/train': 1.9534395933151245} -08/30/2021 17:14:51 - INFO - __main__ - Step 22541: {'lr': 0.0004766118212722053, 'samples': 4327872, 'steps': 22540, 'loss/train': 0.12554432451725006} -08/30/2021 17:14:51 - INFO - __main__ - Step 22542: {'lr': 0.0004766095800823013, 'samples': 4328064, 'steps': 22541, 'loss/train': 2.0189404487609863} -08/30/2021 17:14:53 - INFO - __main__ - Step 22543: {'lr': 0.0004766073387902904, 'samples': 4328256, 'steps': 22542, 'loss/train': 0.27141886949539185} -08/30/2021 17:14:53 - INFO - __main__ - Step 22544: {'lr': 0.00047660509739617376, 'samples': 4328448, 'steps': 22543, 'loss/train': 1.2854547500610352} -08/30/2021 17:14:54 - INFO - __main__ - Step 22545: {'lr': 0.00047660285589995233, 'samples': 4328640, 'steps': 22544, 'loss/train': 1.238966703414917} -08/30/2021 17:14:54 - INFO - __main__ - Step 22546: {'lr': 0.0004766006143016272, 'samples': 4328832, 'steps': 22545, 'loss/train': 2.324779510498047} -08/30/2021 17:14:54 - INFO - __main__ - Step 22547: {'lr': 0.0004765983726011993, 'samples': 4329024, 'steps': 22546, 'loss/train': 1.4933652877807617} -08/30/2021 17:14:56 - INFO - __main__ - Step 22548: {'lr': 0.0004765961307986697, 'samples': 4329216, 'steps': 22547, 'loss/train': 1.3241190910339355} -08/30/2021 17:14:56 - INFO - __main__ - Step 22549: {'lr': 0.0004765938888940393, 'samples': 4329408, 'steps': 22548, 'loss/train': 1.0358211994171143} -08/30/2021 17:14:57 - INFO - __main__ - Step 22550: {'lr': 0.00047659164688730935, 'samples': 4329600, 'steps': 22549, 'loss/train': 1.617812156677246} -08/30/2021 17:14:57 - INFO - __main__ - Step 22551: {'lr': 0.00047658940477848056, 'samples': 4329792, 'steps': 22550, 'loss/train': 1.7339508533477783} -08/30/2021 17:14:57 - INFO - __main__ - Step 22552: {'lr': 0.00047658716256755414, 'samples': 4329984, 'steps': 22551, 'loss/train': 1.7117106914520264} -08/30/2021 17:14:58 - INFO - __main__ - Step 22553: {'lr': 0.00047658492025453106, 'samples': 4330176, 'steps': 22552, 'loss/train': 1.3234061002731323} -08/30/2021 17:14:59 - INFO - __main__ - Step 22554: {'lr': 0.00047658267783941223, 'samples': 4330368, 'steps': 22553, 'loss/train': 1.2777682542800903} -08/30/2021 17:14:59 - INFO - __main__ - Step 22555: {'lr': 0.0004765804353221988, 'samples': 4330560, 'steps': 22554, 'loss/train': 2.290679693222046} -08/30/2021 17:15:00 - INFO - __main__ - Step 22556: {'lr': 0.0004765781927028917, 'samples': 4330752, 'steps': 22555, 'loss/train': 1.369117259979248} -08/30/2021 17:15:00 - INFO - __main__ - Step 22557: {'lr': 0.000476575949981492, 'samples': 4330944, 'steps': 22556, 'loss/train': 1.2444427013397217} -08/30/2021 17:15:00 - INFO - __main__ - Step 22558: {'lr': 0.00047657370715800066, 'samples': 4331136, 'steps': 22557, 'loss/train': 2.076911687850952} -08/30/2021 17:15:02 - INFO - __main__ - Step 22559: {'lr': 0.0004765714642324187, 'samples': 4331328, 'steps': 22558, 'loss/train': 1.3288944959640503} -08/30/2021 17:15:02 - INFO - __main__ - Step 22560: {'lr': 0.0004765692212047471, 'samples': 4331520, 'steps': 22559, 'loss/train': 1.579010248184204} -08/30/2021 17:15:03 - INFO - __main__ - Step 22561: {'lr': 0.00047656697807498693, 'samples': 4331712, 'steps': 22560, 'loss/train': 1.5661537647247314} -08/30/2021 17:15:03 - INFO - __main__ - Step 22562: {'lr': 0.0004765647348431392, 'samples': 4331904, 'steps': 22561, 'loss/train': 1.6125584840774536} -08/30/2021 17:15:03 - INFO - __main__ - Step 22563: {'lr': 0.00047656249150920485, 'samples': 4332096, 'steps': 22562, 'loss/train': 2.1038525104522705} -08/30/2021 17:15:06 - INFO - __main__ - Step 22564: {'lr': 0.000476560248073185, 'samples': 4332288, 'steps': 22563, 'loss/train': 1.730812430381775} -08/30/2021 17:15:06 - INFO - __main__ - Step 22565: {'lr': 0.0004765580045350805, 'samples': 4332480, 'steps': 22564, 'loss/train': 1.7798317670822144} -08/30/2021 17:15:06 - INFO - __main__ - Step 22566: {'lr': 0.00047655576089489254, 'samples': 4332672, 'steps': 22565, 'loss/train': 1.7542918920516968} -08/30/2021 17:15:07 - INFO - __main__ - Step 22567: {'lr': 0.00047655351715262205, 'samples': 4332864, 'steps': 22566, 'loss/train': 1.4907829761505127} -08/30/2021 17:15:07 - INFO - __main__ - Step 22568: {'lr': 0.00047655127330827, 'samples': 4333056, 'steps': 22567, 'loss/train': 3.5989739894866943} -08/30/2021 17:15:07 - INFO - __main__ - Step 22569: {'lr': 0.00047654902936183745, 'samples': 4333248, 'steps': 22568, 'loss/train': 3.7340481281280518} -08/30/2021 17:15:08 - INFO - __main__ - Step 22570: {'lr': 0.00047654678531332544, 'samples': 4333440, 'steps': 22569, 'loss/train': 4.774858474731445} -08/30/2021 17:15:09 - INFO - __main__ - Step 22571: {'lr': 0.00047654454116273493, 'samples': 4333632, 'steps': 22570, 'loss/train': 1.9201209545135498} -08/30/2021 17:15:10 - INFO - __main__ - Step 22572: {'lr': 0.0004765422969100669, 'samples': 4333824, 'steps': 22571, 'loss/train': 1.6501644849777222} -08/30/2021 17:15:10 - INFO - __main__ - Step 22573: {'lr': 0.00047654005255532247, 'samples': 4334016, 'steps': 22572, 'loss/train': 1.9358325004577637} -08/30/2021 17:15:10 - INFO - __main__ - Step 22574: {'lr': 0.0004765378080985026, 'samples': 4334208, 'steps': 22573, 'loss/train': 1.5381373167037964} -08/30/2021 17:15:11 - INFO - __main__ - Step 22575: {'lr': 0.00047653556353960825, 'samples': 4334400, 'steps': 22574, 'loss/train': 1.7209357023239136} -08/30/2021 17:15:13 - INFO - __main__ - Step 22576: {'lr': 0.0004765333188786404, 'samples': 4334592, 'steps': 22575, 'loss/train': 1.5887960195541382} -08/30/2021 17:15:13 - INFO - __main__ - Step 22577: {'lr': 0.00047653107411560025, 'samples': 4334784, 'steps': 22576, 'loss/train': 2.440398931503296} -08/30/2021 17:15:14 - INFO - __main__ - Step 22578: {'lr': 0.00047652882925048863, 'samples': 4334976, 'steps': 22577, 'loss/train': 1.467909336090088} -08/30/2021 17:15:14 - INFO - __main__ - Step 22579: {'lr': 0.00047652658428330664, 'samples': 4335168, 'steps': 22578, 'loss/train': 1.7069509029388428} -08/30/2021 17:15:14 - INFO - __main__ - Step 22580: {'lr': 0.00047652433921405526, 'samples': 4335360, 'steps': 22579, 'loss/train': 1.4549226760864258} -08/30/2021 17:15:16 - INFO - __main__ - Step 22581: {'lr': 0.0004765220940427355, 'samples': 4335552, 'steps': 22580, 'loss/train': 1.1382648944854736} -08/30/2021 17:15:16 - INFO - __main__ - Step 22582: {'lr': 0.0004765198487693484, 'samples': 4335744, 'steps': 22581, 'loss/train': 1.7741187810897827} -08/30/2021 17:15:17 - INFO - __main__ - Step 22583: {'lr': 0.00047651760339389494, 'samples': 4335936, 'steps': 22582, 'loss/train': 3.3371052742004395} -08/30/2021 17:15:17 - INFO - __main__ - Step 22584: {'lr': 0.0004765153579163761, 'samples': 4336128, 'steps': 22583, 'loss/train': 0.11780780553817749} -08/30/2021 17:15:17 - INFO - __main__ - Step 22585: {'lr': 0.000476513112336793, 'samples': 4336320, 'steps': 22584, 'loss/train': 1.8284790515899658} -08/30/2021 17:15:18 - INFO - __main__ - Step 22586: {'lr': 0.00047651086665514655, 'samples': 4336512, 'steps': 22585, 'loss/train': 1.7586549520492554} -08/30/2021 17:15:19 - INFO - __main__ - Step 22587: {'lr': 0.00047650862087143787, 'samples': 4336704, 'steps': 22586, 'loss/train': 1.6524969339370728} -08/30/2021 17:15:20 - INFO - __main__ - Step 22588: {'lr': 0.0004765063749856678, 'samples': 4336896, 'steps': 22587, 'loss/train': 1.9591922760009766} -08/30/2021 17:15:20 - INFO - __main__ - Step 22589: {'lr': 0.00047650412899783747, 'samples': 4337088, 'steps': 22588, 'loss/train': 2.1798973083496094} -08/30/2021 17:15:21 - INFO - __main__ - Step 22590: {'lr': 0.0004765018829079479, 'samples': 4337280, 'steps': 22589, 'loss/train': 2.203218698501587} -08/30/2021 17:15:21 - INFO - __main__ - Step 22591: {'lr': 0.0004764996367160001, 'samples': 4337472, 'steps': 22590, 'loss/train': 1.7837680578231812} -08/30/2021 17:15:22 - INFO - __main__ - Step 22592: {'lr': 0.000476497390421995, 'samples': 4337664, 'steps': 22591, 'loss/train': 1.498328447341919} -08/30/2021 17:15:23 - INFO - __main__ - Step 22593: {'lr': 0.00047649514402593377, 'samples': 4337856, 'steps': 22592, 'loss/train': 1.4952605962753296} -08/30/2021 17:15:23 - INFO - __main__ - Step 22594: {'lr': 0.0004764928975278172, 'samples': 4338048, 'steps': 22593, 'loss/train': 1.6838277578353882} -08/30/2021 17:15:24 - INFO - __main__ - Step 22595: {'lr': 0.0004764906509276465, 'samples': 4338240, 'steps': 22594, 'loss/train': 2.1396031379699707} -08/30/2021 17:15:24 - INFO - __main__ - Step 22596: {'lr': 0.0004764884042254226, 'samples': 4338432, 'steps': 22595, 'loss/train': 1.8890920877456665} -08/30/2021 17:15:25 - INFO - __main__ - Step 22597: {'lr': 0.0004764861574211465, 'samples': 4338624, 'steps': 22596, 'loss/train': 1.6218863725662231} -08/30/2021 17:15:26 - INFO - __main__ - Step 22598: {'lr': 0.0004764839105148193, 'samples': 4338816, 'steps': 22597, 'loss/train': 1.2731597423553467} -08/30/2021 17:15:26 - INFO - __main__ - Step 22599: {'lr': 0.00047648166350644185, 'samples': 4339008, 'steps': 22598, 'loss/train': 1.2360286712646484} -08/30/2021 17:15:26 - INFO - __main__ - Step 22600: {'lr': 0.00047647941639601535, 'samples': 4339200, 'steps': 22599, 'loss/train': 1.8576124906539917} -08/30/2021 17:15:27 - INFO - __main__ - Step 22601: {'lr': 0.00047647716918354066, 'samples': 4339392, 'steps': 22600, 'loss/train': 2.1882736682891846} -08/30/2021 17:15:28 - INFO - __main__ - Step 22602: {'lr': 0.00047647492186901884, 'samples': 4339584, 'steps': 22601, 'loss/train': 2.1269142627716064} -08/30/2021 17:15:29 - INFO - __main__ - Step 22603: {'lr': 0.0004764726744524509, 'samples': 4339776, 'steps': 22602, 'loss/train': 1.6733989715576172} -08/30/2021 17:15:29 - INFO - __main__ - Step 22604: {'lr': 0.0004764704269338379, 'samples': 4339968, 'steps': 22603, 'loss/train': 1.9329251050949097} -08/30/2021 17:15:30 - INFO - __main__ - Step 22605: {'lr': 0.00047646817931318086, 'samples': 4340160, 'steps': 22604, 'loss/train': 1.058057427406311} -08/30/2021 17:15:30 - INFO - __main__ - Step 22606: {'lr': 0.0004764659315904807, 'samples': 4340352, 'steps': 22605, 'loss/train': 0.18052689731121063} -08/30/2021 17:15:32 - INFO - __main__ - Step 22607: {'lr': 0.0004764636837657385, 'samples': 4340544, 'steps': 22606, 'loss/train': 0.8237510919570923} -08/30/2021 17:15:32 - INFO - __main__ - Step 22608: {'lr': 0.0004764614358389553, 'samples': 4340736, 'steps': 22607, 'loss/train': 1.9010093212127686} -08/30/2021 17:15:33 - INFO - __main__ - Step 22609: {'lr': 0.00047645918781013196, 'samples': 4340928, 'steps': 22608, 'loss/train': 2.0348987579345703} -08/30/2021 17:15:33 - INFO - __main__ - Step 22610: {'lr': 0.0004764569396792697, 'samples': 4341120, 'steps': 22609, 'loss/train': 1.808739185333252} -08/30/2021 17:15:33 - INFO - __main__ - Step 22611: {'lr': 0.0004764546914463694, 'samples': 4341312, 'steps': 22610, 'loss/train': 0.1274918168783188} -08/30/2021 17:15:35 - INFO - __main__ - Step 22612: {'lr': 0.0004764524431114321, 'samples': 4341504, 'steps': 22611, 'loss/train': 1.0096627473831177} -08/30/2021 17:15:35 - INFO - __main__ - Step 22613: {'lr': 0.0004764501946744589, 'samples': 4341696, 'steps': 22612, 'loss/train': 1.1949007511138916} -08/30/2021 17:15:36 - INFO - __main__ - Step 22614: {'lr': 0.00047644794613545065, 'samples': 4341888, 'steps': 22613, 'loss/train': 1.3782620429992676} -08/30/2021 17:15:36 - INFO - __main__ - Step 22615: {'lr': 0.00047644569749440846, 'samples': 4342080, 'steps': 22614, 'loss/train': 1.6585488319396973} -08/30/2021 17:15:36 - INFO - __main__ - Step 22616: {'lr': 0.0004764434487513334, 'samples': 4342272, 'steps': 22615, 'loss/train': 1.5861353874206543} -08/30/2021 17:15:37 - INFO - __main__ - Step 22617: {'lr': 0.00047644119990622637, 'samples': 4342464, 'steps': 22616, 'loss/train': 2.112118721008301} -08/30/2021 17:15:38 - INFO - __main__ - Step 22618: {'lr': 0.0004764389509590884, 'samples': 4342656, 'steps': 22617, 'loss/train': 1.8465508222579956} -08/30/2021 17:15:39 - INFO - __main__ - Step 22619: {'lr': 0.0004764367019099206, 'samples': 4342848, 'steps': 22618, 'loss/train': 0.16180749237537384} -08/30/2021 17:15:39 - INFO - __main__ - Step 22620: {'lr': 0.0004764344527587239, 'samples': 4343040, 'steps': 22619, 'loss/train': 1.7559525966644287} -08/30/2021 17:15:39 - INFO - __main__ - Step 22621: {'lr': 0.00047643220350549934, 'samples': 4343232, 'steps': 22620, 'loss/train': 1.9561069011688232} -08/30/2021 17:15:40 - INFO - __main__ - Step 22622: {'lr': 0.0004764299541502478, 'samples': 4343424, 'steps': 22621, 'loss/train': 1.8269357681274414} -08/30/2021 17:15:41 - INFO - __main__ - Step 22623: {'lr': 0.0004764277046929706, 'samples': 4343616, 'steps': 22622, 'loss/train': 1.68116295337677} -08/30/2021 17:15:42 - INFO - __main__ - Step 22624: {'lr': 0.00047642545513366843, 'samples': 4343808, 'steps': 22623, 'loss/train': 0.982194185256958} -08/30/2021 17:15:42 - INFO - __main__ - Step 22625: {'lr': 0.0004764232054723425, 'samples': 4344000, 'steps': 22624, 'loss/train': 0.14288485050201416} -08/30/2021 17:15:43 - INFO - __main__ - Step 22626: {'lr': 0.0004764209557089938, 'samples': 4344192, 'steps': 22625, 'loss/train': 1.557816743850708} -08/30/2021 17:15:43 - INFO - __main__ - Step 22627: {'lr': 0.00047641870584362323, 'samples': 4344384, 'steps': 22626, 'loss/train': 1.734743595123291} -08/30/2021 17:15:45 - INFO - __main__ - Step 22628: {'lr': 0.00047641645587623196, 'samples': 4344576, 'steps': 22627, 'loss/train': 2.719785213470459} -08/30/2021 17:15:46 - INFO - __main__ - Step 22629: {'lr': 0.0004764142058068209, 'samples': 4344768, 'steps': 22628, 'loss/train': 1.2836214303970337} -08/30/2021 17:15:46 - INFO - __main__ - Step 22630: {'lr': 0.00047641195563539107, 'samples': 4344960, 'steps': 22629, 'loss/train': 1.551599383354187} -08/30/2021 17:15:47 - INFO - __main__ - Step 22631: {'lr': 0.0004764097053619435, 'samples': 4345152, 'steps': 22630, 'loss/train': 1.526296854019165} -08/30/2021 17:15:47 - INFO - __main__ - Step 22632: {'lr': 0.00047640745498647925, 'samples': 4345344, 'steps': 22631, 'loss/train': 3.1410653591156006} -08/30/2021 17:15:47 - INFO - __main__ - Step 22633: {'lr': 0.00047640520450899926, 'samples': 4345536, 'steps': 22632, 'loss/train': 3.2670083045959473} -08/30/2021 17:15:49 - INFO - __main__ - Step 22634: {'lr': 0.0004764029539295046, 'samples': 4345728, 'steps': 22633, 'loss/train': 1.6931003332138062} -08/30/2021 17:15:50 - INFO - __main__ - Step 22635: {'lr': 0.0004764007032479963, 'samples': 4345920, 'steps': 22634, 'loss/train': 1.7444283962249756} -08/30/2021 17:15:50 - INFO - __main__ - Step 22636: {'lr': 0.00047639845246447534, 'samples': 4346112, 'steps': 22635, 'loss/train': 1.6407912969589233} -08/30/2021 17:15:50 - INFO - __main__ - Step 22637: {'lr': 0.00047639620157894264, 'samples': 4346304, 'steps': 22636, 'loss/train': 1.3127738237380981} -08/30/2021 17:15:51 - INFO - __main__ - Step 22638: {'lr': 0.00047639395059139936, 'samples': 4346496, 'steps': 22637, 'loss/train': 1.869842767715454} -08/30/2021 17:15:51 - INFO - __main__ - Step 22639: {'lr': 0.0004763916995018465, 'samples': 4346688, 'steps': 22638, 'loss/train': 1.3320239782333374} -08/30/2021 17:15:53 - INFO - __main__ - Step 22640: {'lr': 0.00047638944831028497, 'samples': 4346880, 'steps': 22639, 'loss/train': 1.6166237592697144} -08/30/2021 17:15:53 - INFO - __main__ - Step 22641: {'lr': 0.00047638719701671587, 'samples': 4347072, 'steps': 22640, 'loss/train': 1.786665678024292} -08/30/2021 17:15:53 - INFO - __main__ - Step 22642: {'lr': 0.00047638494562114015, 'samples': 4347264, 'steps': 22641, 'loss/train': 1.4907608032226562} -08/30/2021 17:15:54 - INFO - __main__ - Step 22643: {'lr': 0.0004763826941235589, 'samples': 4347456, 'steps': 22642, 'loss/train': 1.1272971630096436} -08/30/2021 17:15:54 - INFO - __main__ - Step 22644: {'lr': 0.00047638044252397313, 'samples': 4347648, 'steps': 22643, 'loss/train': 1.7200355529785156} -08/30/2021 17:15:56 - INFO - __main__ - Step 22645: {'lr': 0.0004763781908223838, 'samples': 4347840, 'steps': 22644, 'loss/train': 1.3382102251052856} -08/30/2021 17:15:56 - INFO - __main__ - Step 22646: {'lr': 0.00047637593901879194, 'samples': 4348032, 'steps': 22645, 'loss/train': 1.9048612117767334} -08/30/2021 17:15:56 - INFO - __main__ - Step 22647: {'lr': 0.00047637368711319863, 'samples': 4348224, 'steps': 22646, 'loss/train': 1.7801023721694946} -08/30/2021 17:15:57 - INFO - __main__ - Step 22648: {'lr': 0.00047637143510560477, 'samples': 4348416, 'steps': 22647, 'loss/train': 1.4967598915100098} -08/30/2021 17:15:57 - INFO - __main__ - Step 22649: {'lr': 0.0004763691829960114, 'samples': 4348608, 'steps': 22648, 'loss/train': 1.8857465982437134} -08/30/2021 17:15:59 - INFO - __main__ - Step 22650: {'lr': 0.00047636693078441963, 'samples': 4348800, 'steps': 22649, 'loss/train': 1.1992545127868652} -08/30/2021 17:15:59 - INFO - __main__ - Step 22651: {'lr': 0.0004763646784708304, 'samples': 4348992, 'steps': 22650, 'loss/train': 0.19952024519443512} -08/30/2021 17:16:00 - INFO - __main__ - Step 22652: {'lr': 0.00047636242605524477, 'samples': 4349184, 'steps': 22651, 'loss/train': 1.5169461965560913} -08/30/2021 17:16:00 - INFO - __main__ - Step 22653: {'lr': 0.0004763601735376637, 'samples': 4349376, 'steps': 22652, 'loss/train': 1.5541881322860718} -08/30/2021 17:16:00 - INFO - __main__ - Step 22654: {'lr': 0.0004763579209180882, 'samples': 4349568, 'steps': 22653, 'loss/train': 1.364939570426941} -08/30/2021 17:16:02 - INFO - __main__ - Step 22655: {'lr': 0.00047635566819651936, 'samples': 4349760, 'steps': 22654, 'loss/train': 1.6734801530838013} -08/30/2021 17:16:03 - INFO - __main__ - Step 22656: {'lr': 0.00047635341537295814, 'samples': 4349952, 'steps': 22655, 'loss/train': 2.059765338897705} -08/30/2021 17:16:03 - INFO - __main__ - Step 22657: {'lr': 0.0004763511624474055, 'samples': 4350144, 'steps': 22656, 'loss/train': 2.098519802093506} -08/30/2021 17:16:03 - INFO - __main__ - Step 22658: {'lr': 0.00047634890941986263, 'samples': 4350336, 'steps': 22657, 'loss/train': 1.7504721879959106} -08/30/2021 17:16:04 - INFO - __main__ - Step 22659: {'lr': 0.00047634665629033035, 'samples': 4350528, 'steps': 22658, 'loss/train': 1.7271106243133545} -08/30/2021 17:16:05 - INFO - __main__ - Step 22660: {'lr': 0.00047634440305880976, 'samples': 4350720, 'steps': 22659, 'loss/train': 1.0989255905151367} -08/30/2021 17:16:05 - INFO - __main__ - Step 22661: {'lr': 0.0004763421497253019, 'samples': 4350912, 'steps': 22660, 'loss/train': 2.4688119888305664} -08/30/2021 17:16:06 - INFO - __main__ - Step 22662: {'lr': 0.0004763398962898078, 'samples': 4351104, 'steps': 22661, 'loss/train': 1.638301134109497} -08/30/2021 17:16:06 - INFO - __main__ - Step 22663: {'lr': 0.0004763376427523284, 'samples': 4351296, 'steps': 22662, 'loss/train': 1.5809268951416016} -08/30/2021 17:16:06 - INFO - __main__ - Step 22664: {'lr': 0.0004763353891128648, 'samples': 4351488, 'steps': 22663, 'loss/train': 1.5273466110229492} -08/30/2021 17:16:07 - INFO - __main__ - Step 22665: {'lr': 0.00047633313537141786, 'samples': 4351680, 'steps': 22664, 'loss/train': 1.8765552043914795} -08/30/2021 17:16:08 - INFO - __main__ - Step 22666: {'lr': 0.00047633088152798875, 'samples': 4351872, 'steps': 22665, 'loss/train': 1.879747748374939} -08/30/2021 17:16:09 - INFO - __main__ - Step 22667: {'lr': 0.00047632862758257845, 'samples': 4352064, 'steps': 22666, 'loss/train': 1.3156960010528564} -08/30/2021 17:16:09 - INFO - __main__ - Step 22668: {'lr': 0.0004763263735351879, 'samples': 4352256, 'steps': 22667, 'loss/train': 1.77305269241333} -08/30/2021 17:16:09 - INFO - __main__ - Step 22669: {'lr': 0.0004763241193858183, 'samples': 4352448, 'steps': 22668, 'loss/train': 2.2486209869384766} -08/30/2021 17:16:10 - INFO - __main__ - Step 22670: {'lr': 0.00047632186513447045, 'samples': 4352640, 'steps': 22669, 'loss/train': 1.4093332290649414} -08/30/2021 17:16:11 - INFO - __main__ - Step 22671: {'lr': 0.0004763196107811455, 'samples': 4352832, 'steps': 22670, 'loss/train': 1.8424217700958252} -08/30/2021 17:16:12 - INFO - __main__ - Step 22672: {'lr': 0.0004763173563258444, 'samples': 4353024, 'steps': 22671, 'loss/train': 1.6107220649719238} -08/30/2021 17:16:12 - INFO - __main__ - Step 22673: {'lr': 0.0004763151017685682, 'samples': 4353216, 'steps': 22672, 'loss/train': 1.0175189971923828} -08/30/2021 17:16:12 - INFO - __main__ - Step 22674: {'lr': 0.0004763128471093179, 'samples': 4353408, 'steps': 22673, 'loss/train': 1.0710530281066895} -08/30/2021 17:16:13 - INFO - __main__ - Step 22675: {'lr': 0.0004763105923480946, 'samples': 4353600, 'steps': 22674, 'loss/train': 1.3609719276428223} -08/30/2021 17:16:14 - INFO - __main__ - Step 22676: {'lr': 0.0004763083374848991, 'samples': 4353792, 'steps': 22675, 'loss/train': 1.3715710639953613} -08/30/2021 17:16:15 - INFO - __main__ - Step 22677: {'lr': 0.00047630608251973265, 'samples': 4353984, 'steps': 22676, 'loss/train': 2.1492466926574707} -08/30/2021 17:16:15 - INFO - __main__ - Step 22678: {'lr': 0.00047630382745259616, 'samples': 4354176, 'steps': 22677, 'loss/train': 1.9249857664108276} -08/30/2021 17:16:15 - INFO - __main__ - Step 22679: {'lr': 0.0004763015722834907, 'samples': 4354368, 'steps': 22678, 'loss/train': 1.978841781616211} -08/30/2021 17:16:16 - INFO - __main__ - Step 22680: {'lr': 0.00047629931701241715, 'samples': 4354560, 'steps': 22679, 'loss/train': 1.268255352973938} -08/30/2021 17:16:17 - INFO - __main__ - Step 22681: {'lr': 0.0004762970616393767, 'samples': 4354752, 'steps': 22680, 'loss/train': 1.7757965326309204} -08/30/2021 17:16:18 - INFO - __main__ - Step 22682: {'lr': 0.0004762948061643702, 'samples': 4354944, 'steps': 22681, 'loss/train': 0.6261685490608215} -08/30/2021 17:16:18 - INFO - __main__ - Step 22683: {'lr': 0.0004762925505873988, 'samples': 4355136, 'steps': 22682, 'loss/train': 2.0943148136138916} -08/30/2021 17:16:18 - INFO - __main__ - Step 22684: {'lr': 0.00047629029490846346, 'samples': 4355328, 'steps': 22683, 'loss/train': 0.6795475482940674} -08/30/2021 17:16:19 - INFO - __main__ - Step 22685: {'lr': 0.00047628803912756523, 'samples': 4355520, 'steps': 22684, 'loss/train': 1.8683626651763916} -08/30/2021 17:16:21 - INFO - __main__ - Step 22686: {'lr': 0.00047628578324470505, 'samples': 4355712, 'steps': 22685, 'loss/train': 1.8733292818069458} -08/30/2021 17:16:21 - INFO - __main__ - Step 22687: {'lr': 0.00047628352725988406, 'samples': 4355904, 'steps': 22686, 'loss/train': 1.759171724319458} -08/30/2021 17:16:21 - INFO - __main__ - Step 22688: {'lr': 0.0004762812711731032, 'samples': 4356096, 'steps': 22687, 'loss/train': 1.767892837524414} -08/30/2021 17:16:22 - INFO - __main__ - Step 22689: {'lr': 0.00047627901498436344, 'samples': 4356288, 'steps': 22688, 'loss/train': 1.8540290594100952} -08/30/2021 17:16:22 - INFO - __main__ - Step 22690: {'lr': 0.0004762767586936658, 'samples': 4356480, 'steps': 22689, 'loss/train': 1.75572669506073} -08/30/2021 17:16:24 - INFO - __main__ - Step 22691: {'lr': 0.00047627450230101144, 'samples': 4356672, 'steps': 22690, 'loss/train': 1.6989866495132446} -08/30/2021 17:16:24 - INFO - __main__ - Step 22692: {'lr': 0.0004762722458064013, 'samples': 4356864, 'steps': 22691, 'loss/train': 1.6670310497283936} -08/30/2021 17:16:24 - INFO - __main__ - Step 22693: {'lr': 0.0004762699892098363, 'samples': 4357056, 'steps': 22692, 'loss/train': 1.6908589601516724} -08/30/2021 17:16:25 - INFO - __main__ - Step 22694: {'lr': 0.0004762677325113176, 'samples': 4357248, 'steps': 22693, 'loss/train': 1.4345744848251343} -08/30/2021 17:16:25 - INFO - __main__ - Step 22695: {'lr': 0.0004762654757108461, 'samples': 4357440, 'steps': 22694, 'loss/train': 2.0730648040771484} -08/30/2021 17:16:26 - INFO - __main__ - Step 22696: {'lr': 0.00047626321880842287, 'samples': 4357632, 'steps': 22695, 'loss/train': 1.5803663730621338} -08/30/2021 17:16:27 - INFO - __main__ - Step 22697: {'lr': 0.00047626096180404895, 'samples': 4357824, 'steps': 22696, 'loss/train': 1.8902571201324463} -08/30/2021 17:16:27 - INFO - __main__ - Step 22698: {'lr': 0.0004762587046977253, 'samples': 4358016, 'steps': 22697, 'loss/train': 1.4248958826065063} -08/30/2021 17:16:28 - INFO - __main__ - Step 22699: {'lr': 0.000476256447489453, 'samples': 4358208, 'steps': 22698, 'loss/train': 1.7172247171401978} -08/30/2021 17:16:28 - INFO - __main__ - Step 22700: {'lr': 0.000476254190179233, 'samples': 4358400, 'steps': 22699, 'loss/train': 1.6442368030548096} -08/30/2021 17:16:30 - INFO - __main__ - Step 22701: {'lr': 0.0004762519327670664, 'samples': 4358592, 'steps': 22700, 'loss/train': 1.4775010347366333} -08/30/2021 17:16:30 - INFO - __main__ - Step 22702: {'lr': 0.0004762496752529541, 'samples': 4358784, 'steps': 22701, 'loss/train': 1.758837103843689} -08/30/2021 17:16:30 - INFO - __main__ - Step 22703: {'lr': 0.0004762474176368973, 'samples': 4358976, 'steps': 22702, 'loss/train': 1.3404951095581055} -08/30/2021 17:16:31 - INFO - __main__ - Step 22704: {'lr': 0.00047624515991889684, 'samples': 4359168, 'steps': 22703, 'loss/train': 2.242572546005249} -08/30/2021 17:16:31 - INFO - __main__ - Step 22705: {'lr': 0.00047624290209895384, 'samples': 4359360, 'steps': 22704, 'loss/train': 2.0615878105163574} -08/30/2021 17:16:33 - INFO - __main__ - Step 22706: {'lr': 0.00047624064417706917, 'samples': 4359552, 'steps': 22705, 'loss/train': 1.3389997482299805} -08/30/2021 17:16:34 - INFO - __main__ - Step 22707: {'lr': 0.00047623838615324407, 'samples': 4359744, 'steps': 22706, 'loss/train': 1.843644142150879} -08/30/2021 17:16:34 - INFO - __main__ - Step 22708: {'lr': 0.0004762361280274794, 'samples': 4359936, 'steps': 22707, 'loss/train': 1.8705817461013794} -08/30/2021 17:16:34 - INFO - __main__ - Step 22709: {'lr': 0.0004762338697997762, 'samples': 4360128, 'steps': 22708, 'loss/train': 1.4605693817138672} -08/30/2021 17:16:35 - INFO - __main__ - Step 22710: {'lr': 0.00047623161147013557, 'samples': 4360320, 'steps': 22709, 'loss/train': 1.4370949268341064} -08/30/2021 17:16:36 - INFO - __main__ - Step 22711: {'lr': 0.0004762293530385584, 'samples': 4360512, 'steps': 22710, 'loss/train': 0.1271795928478241} -08/30/2021 17:16:36 - INFO - __main__ - Step 22712: {'lr': 0.0004762270945050458, 'samples': 4360704, 'steps': 22711, 'loss/train': 2.282175064086914} -08/30/2021 17:16:37 - INFO - __main__ - Step 22713: {'lr': 0.00047622483586959877, 'samples': 4360896, 'steps': 22712, 'loss/train': 1.7745230197906494} -08/30/2021 17:16:37 - INFO - __main__ - Step 22714: {'lr': 0.00047622257713221826, 'samples': 4361088, 'steps': 22713, 'loss/train': 1.5097118616104126} -08/30/2021 17:16:38 - INFO - __main__ - Step 22715: {'lr': 0.00047622031829290545, 'samples': 4361280, 'steps': 22714, 'loss/train': 1.5611250400543213} -08/30/2021 17:16:39 - INFO - __main__ - Step 22716: {'lr': 0.0004762180593516612, 'samples': 4361472, 'steps': 22715, 'loss/train': 1.5972368717193604} -08/30/2021 17:16:40 - INFO - __main__ - Step 22717: {'lr': 0.0004762158003084867, 'samples': 4361664, 'steps': 22716, 'loss/train': 2.6648776531219482} -08/30/2021 17:16:40 - INFO - __main__ - Step 22718: {'lr': 0.0004762135411633827, 'samples': 4361856, 'steps': 22717, 'loss/train': 1.5549181699752808} -08/30/2021 17:16:40 - INFO - __main__ - Step 22719: {'lr': 0.0004762112819163504, 'samples': 4362048, 'steps': 22718, 'loss/train': 1.5840942859649658} -08/30/2021 17:16:41 - INFO - __main__ - Step 22720: {'lr': 0.0004762090225673908, 'samples': 4362240, 'steps': 22719, 'loss/train': 1.1802986860275269} -08/30/2021 17:16:41 - INFO - __main__ - Step 22721: {'lr': 0.0004762067631165049, 'samples': 4362432, 'steps': 22720, 'loss/train': 1.972393274307251} -08/30/2021 17:16:43 - INFO - __main__ - Step 22722: {'lr': 0.0004762045035636937, 'samples': 4362624, 'steps': 22721, 'loss/train': 0.8380379676818848} -08/30/2021 17:16:43 - INFO - __main__ - Step 22723: {'lr': 0.0004762022439089583, 'samples': 4362816, 'steps': 22722, 'loss/train': 1.7101861238479614} -08/30/2021 17:16:43 - INFO - __main__ - Step 22724: {'lr': 0.0004761999841522996, 'samples': 4363008, 'steps': 22723, 'loss/train': 2.1470186710357666} -08/30/2021 17:16:44 - INFO - __main__ - Step 22725: {'lr': 0.0004761977242937188, 'samples': 4363200, 'steps': 22724, 'loss/train': 1.7504310607910156} -08/30/2021 17:16:44 - INFO - __main__ - Step 22726: {'lr': 0.00047619546433321663, 'samples': 4363392, 'steps': 22725, 'loss/train': 1.112618327140808} -08/30/2021 17:16:46 - INFO - __main__ - Step 22727: {'lr': 0.00047619320427079437, 'samples': 4363584, 'steps': 22726, 'loss/train': 1.5926406383514404} -08/30/2021 17:16:46 - INFO - __main__ - Step 22728: {'lr': 0.00047619094410645293, 'samples': 4363776, 'steps': 22727, 'loss/train': 0.8259417414665222} -08/30/2021 17:16:47 - INFO - __main__ - Step 22729: {'lr': 0.0004761886838401933, 'samples': 4363968, 'steps': 22728, 'loss/train': 1.9355567693710327} -08/30/2021 17:16:47 - INFO - __main__ - Step 22730: {'lr': 0.0004761864234720166, 'samples': 4364160, 'steps': 22729, 'loss/train': 1.997549057006836} -08/30/2021 17:16:47 - INFO - __main__ - Step 22731: {'lr': 0.00047618416300192375, 'samples': 4364352, 'steps': 22730, 'loss/train': 1.2267361879348755} -08/30/2021 17:16:48 - INFO - __main__ - Step 22732: {'lr': 0.0004761819024299158, 'samples': 4364544, 'steps': 22731, 'loss/train': 1.8489607572555542} -08/30/2021 17:16:49 - INFO - __main__ - Step 22733: {'lr': 0.0004761796417559938, 'samples': 4364736, 'steps': 22732, 'loss/train': 1.7026993036270142} -08/30/2021 17:16:50 - INFO - __main__ - Step 22734: {'lr': 0.0004761773809801587, 'samples': 4364928, 'steps': 22733, 'loss/train': 1.4597245454788208} -08/30/2021 17:16:50 - INFO - __main__ - Step 22735: {'lr': 0.0004761751201024116, 'samples': 4365120, 'steps': 22734, 'loss/train': 1.5148273706436157} -08/30/2021 17:16:50 - INFO - __main__ - Step 22736: {'lr': 0.0004761728591227535, 'samples': 4365312, 'steps': 22735, 'loss/train': 1.2636899948120117} -08/30/2021 17:16:51 - INFO - __main__ - Step 22737: {'lr': 0.00047617059804118536, 'samples': 4365504, 'steps': 22736, 'loss/train': 1.7436262369155884} -08/30/2021 17:16:53 - INFO - __main__ - Step 22738: {'lr': 0.0004761683368577083, 'samples': 4365696, 'steps': 22737, 'loss/train': 1.5510469675064087} -08/30/2021 17:16:53 - INFO - __main__ - Step 22739: {'lr': 0.0004761660755723232, 'samples': 4365888, 'steps': 22738, 'loss/train': 1.2957271337509155} -08/30/2021 17:16:54 - INFO - __main__ - Step 22740: {'lr': 0.0004761638141850312, 'samples': 4366080, 'steps': 22739, 'loss/train': 1.8613446950912476} -08/30/2021 17:16:54 - INFO - __main__ - Step 22741: {'lr': 0.0004761615526958333, 'samples': 4366272, 'steps': 22740, 'loss/train': 1.8560149669647217} -08/30/2021 17:16:54 - INFO - __main__ - Step 22742: {'lr': 0.0004761592911047304, 'samples': 4366464, 'steps': 22741, 'loss/train': 1.860827922821045} -08/30/2021 17:16:56 - INFO - __main__ - Step 22743: {'lr': 0.00047615702941172366, 'samples': 4366656, 'steps': 22742, 'loss/train': 1.5457545518875122} -08/30/2021 17:16:56 - INFO - __main__ - Step 22744: {'lr': 0.0004761547676168141, 'samples': 4366848, 'steps': 22743, 'loss/train': 1.7188726663589478} -08/30/2021 17:16:57 - INFO - __main__ - Step 22745: {'lr': 0.0004761525057200027, 'samples': 4367040, 'steps': 22744, 'loss/train': 2.0277504920959473} -08/30/2021 17:16:57 - INFO - __main__ - Step 22746: {'lr': 0.00047615024372129033, 'samples': 4367232, 'steps': 22745, 'loss/train': 1.4906532764434814} -08/30/2021 17:16:57 - INFO - __main__ - Step 22747: {'lr': 0.0004761479816206783, 'samples': 4367424, 'steps': 22746, 'loss/train': 1.1546109914779663} -08/30/2021 17:16:59 - INFO - __main__ - Step 22748: {'lr': 0.00047614571941816743, 'samples': 4367616, 'steps': 22747, 'loss/train': 0.0923515036702156} -08/30/2021 17:16:59 - INFO - __main__ - Step 22749: {'lr': 0.00047614345711375874, 'samples': 4367808, 'steps': 22748, 'loss/train': 1.6979933977127075} -08/30/2021 17:17:00 - INFO - __main__ - Step 22750: {'lr': 0.0004761411947074533, 'samples': 4368000, 'steps': 22749, 'loss/train': 1.2950513362884521} -08/30/2021 17:17:00 - INFO - __main__ - Step 22751: {'lr': 0.00047613893219925217, 'samples': 4368192, 'steps': 22750, 'loss/train': 0.35021892189979553} -08/30/2021 17:17:00 - INFO - __main__ - Step 22752: {'lr': 0.00047613666958915636, 'samples': 4368384, 'steps': 22751, 'loss/train': 0.8060241937637329} -08/30/2021 17:17:02 - INFO - __main__ - Step 22753: {'lr': 0.0004761344068771668, 'samples': 4368576, 'steps': 22752, 'loss/train': 1.5739452838897705} -08/30/2021 17:17:02 - INFO - __main__ - Step 22754: {'lr': 0.0004761321440632846, 'samples': 4368768, 'steps': 22753, 'loss/train': 1.9471994638442993} -08/30/2021 17:17:03 - INFO - __main__ - Step 22755: {'lr': 0.00047612988114751074, 'samples': 4368960, 'steps': 22754, 'loss/train': 0.7910296320915222} -08/30/2021 17:17:03 - INFO - __main__ - Step 22756: {'lr': 0.00047612761812984626, 'samples': 4369152, 'steps': 22755, 'loss/train': 1.2983958721160889} -08/30/2021 17:17:03 - INFO - __main__ - Step 22757: {'lr': 0.00047612535501029215, 'samples': 4369344, 'steps': 22756, 'loss/train': 1.8251382112503052} -08/30/2021 17:17:04 - INFO - __main__ - Step 22758: {'lr': 0.0004761230917888494, 'samples': 4369536, 'steps': 22757, 'loss/train': 1.9290217161178589} -08/30/2021 17:17:05 - INFO - __main__ - Step 22759: {'lr': 0.00047612082846551913, 'samples': 4369728, 'steps': 22758, 'loss/train': 1.0281867980957031} -08/30/2021 17:17:06 - INFO - __main__ - Step 22760: {'lr': 0.0004761185650403023, 'samples': 4369920, 'steps': 22759, 'loss/train': 1.2882440090179443} -08/30/2021 17:17:06 - INFO - __main__ - Step 22761: {'lr': 0.0004761163015131999, 'samples': 4370112, 'steps': 22760, 'loss/train': 1.6148911714553833} -08/30/2021 17:17:07 - INFO - __main__ - Step 22762: {'lr': 0.00047611403788421305, 'samples': 4370304, 'steps': 22761, 'loss/train': 1.910568356513977} -08/30/2021 17:17:07 - INFO - __main__ - Step 22763: {'lr': 0.0004761117741533426, 'samples': 4370496, 'steps': 22762, 'loss/train': 1.8226226568222046} -08/30/2021 17:17:08 - INFO - __main__ - Step 22764: {'lr': 0.0004761095103205897, 'samples': 4370688, 'steps': 22763, 'loss/train': 1.7216705083847046} -08/30/2021 17:17:09 - INFO - __main__ - Step 22765: {'lr': 0.00047610724638595545, 'samples': 4370880, 'steps': 22764, 'loss/train': 0.06404563039541245} -08/30/2021 17:17:09 - INFO - __main__ - Step 22766: {'lr': 0.00047610498234944065, 'samples': 4371072, 'steps': 22765, 'loss/train': 1.3860447406768799} -08/30/2021 17:17:10 - INFO - __main__ - Step 22767: {'lr': 0.00047610271821104647, 'samples': 4371264, 'steps': 22766, 'loss/train': 1.1288124322891235} -08/30/2021 17:17:10 - INFO - __main__ - Step 22768: {'lr': 0.0004761004539707739, 'samples': 4371456, 'steps': 22767, 'loss/train': 1.9874215126037598} -08/30/2021 17:17:11 - INFO - __main__ - Step 22769: {'lr': 0.00047609818962862394, 'samples': 4371648, 'steps': 22768, 'loss/train': 1.9229989051818848} -08/30/2021 17:17:12 - INFO - __main__ - Step 22770: {'lr': 0.00047609592518459766, 'samples': 4371840, 'steps': 22769, 'loss/train': 1.4309335947036743} -08/30/2021 17:17:12 - INFO - __main__ - Step 22771: {'lr': 0.00047609366063869595, 'samples': 4372032, 'steps': 22770, 'loss/train': 1.706612467765808} -08/30/2021 17:17:13 - INFO - __main__ - Step 22772: {'lr': 0.00047609139599092006, 'samples': 4372224, 'steps': 22771, 'loss/train': 0.9627857208251953} -08/30/2021 17:17:13 - INFO - __main__ - Step 22773: {'lr': 0.0004760891312412708, 'samples': 4372416, 'steps': 22772, 'loss/train': 1.4608187675476074} -08/30/2021 17:17:14 - INFO - __main__ - Step 22774: {'lr': 0.0004760868663897493, 'samples': 4372608, 'steps': 22773, 'loss/train': 1.4157202243804932} -08/30/2021 17:17:15 - INFO - __main__ - Step 22775: {'lr': 0.0004760846014363565, 'samples': 4372800, 'steps': 22774, 'loss/train': 1.8349318504333496} -08/30/2021 17:17:15 - INFO - __main__ - Step 22776: {'lr': 0.0004760823363810935, 'samples': 4372992, 'steps': 22775, 'loss/train': 1.6829019784927368} -08/30/2021 17:17:16 - INFO - __main__ - Step 22777: {'lr': 0.0004760800712239612, 'samples': 4373184, 'steps': 22776, 'loss/train': 1.3641904592514038} -08/30/2021 17:17:16 - INFO - __main__ - Step 22778: {'lr': 0.0004760778059649609, 'samples': 4373376, 'steps': 22777, 'loss/train': 1.5136724710464478} -08/30/2021 17:17:17 - INFO - __main__ - Step 22779: {'lr': 0.0004760755406040933, 'samples': 4373568, 'steps': 22778, 'loss/train': 1.8314247131347656} -08/30/2021 17:17:18 - INFO - __main__ - Step 22780: {'lr': 0.00047607327514135955, 'samples': 4373760, 'steps': 22779, 'loss/train': 1.7004406452178955} -08/30/2021 17:17:18 - INFO - __main__ - Step 22781: {'lr': 0.00047607100957676067, 'samples': 4373952, 'steps': 22780, 'loss/train': 1.4628232717514038} -08/30/2021 17:17:19 - INFO - __main__ - Step 22782: {'lr': 0.0004760687439102977, 'samples': 4374144, 'steps': 22781, 'loss/train': 1.600130558013916} -08/30/2021 17:17:19 - INFO - __main__ - Step 22783: {'lr': 0.0004760664781419717, 'samples': 4374336, 'steps': 22782, 'loss/train': 1.2052366733551025} -08/30/2021 17:17:21 - INFO - __main__ - Step 22784: {'lr': 0.00047606421227178354, 'samples': 4374528, 'steps': 22783, 'loss/train': 1.670741081237793} -08/30/2021 17:17:21 - INFO - __main__ - Step 22785: {'lr': 0.0004760619462997343, 'samples': 4374720, 'steps': 22784, 'loss/train': 1.5195059776306152} -08/30/2021 17:17:22 - INFO - __main__ - Step 22786: {'lr': 0.00047605968022582513, 'samples': 4374912, 'steps': 22785, 'loss/train': 1.409189224243164} -08/30/2021 17:17:22 - INFO - __main__ - Step 22787: {'lr': 0.000476057414050057, 'samples': 4375104, 'steps': 22786, 'loss/train': 1.396681308746338} -08/30/2021 17:17:22 - INFO - __main__ - Step 22788: {'lr': 0.00047605514777243076, 'samples': 4375296, 'steps': 22787, 'loss/train': 1.1407527923583984} -08/30/2021 17:17:24 - INFO - __main__ - Step 22789: {'lr': 0.0004760528813929476, 'samples': 4375488, 'steps': 22788, 'loss/train': 0.10242465138435364} -08/30/2021 17:17:25 - INFO - __main__ - Step 22790: {'lr': 0.0004760506149116085, 'samples': 4375680, 'steps': 22789, 'loss/train': 1.7497690916061401} -08/30/2021 17:17:25 - INFO - __main__ - Step 22791: {'lr': 0.0004760483483284145, 'samples': 4375872, 'steps': 22790, 'loss/train': 2.0616135597229004} -08/30/2021 17:17:25 - INFO - __main__ - Step 22792: {'lr': 0.0004760460816433666, 'samples': 4376064, 'steps': 22791, 'loss/train': 1.7703133821487427} -08/30/2021 17:17:26 - INFO - __main__ - Step 22793: {'lr': 0.0004760438148564659, 'samples': 4376256, 'steps': 22792, 'loss/train': 1.3119556903839111} -08/30/2021 17:17:26 - INFO - __main__ - Step 22794: {'lr': 0.00047604154796771327, 'samples': 4376448, 'steps': 22793, 'loss/train': 1.9411065578460693} -08/30/2021 17:17:28 - INFO - __main__ - Step 22795: {'lr': 0.0004760392809771098, 'samples': 4376640, 'steps': 22794, 'loss/train': 1.8020325899124146} -08/30/2021 17:17:28 - INFO - __main__ - Step 22796: {'lr': 0.00047603701388465646, 'samples': 4376832, 'steps': 22795, 'loss/train': 2.1383056640625} -08/30/2021 17:17:28 - INFO - __main__ - Step 22797: {'lr': 0.0004760347466903544, 'samples': 4377024, 'steps': 22796, 'loss/train': 1.6379649639129639} -08/30/2021 17:17:29 - INFO - __main__ - Step 22798: {'lr': 0.0004760324793942046, 'samples': 4377216, 'steps': 22797, 'loss/train': 1.4360427856445312} -08/30/2021 17:17:29 - INFO - __main__ - Step 22799: {'lr': 0.000476030211996208, 'samples': 4377408, 'steps': 22798, 'loss/train': 0.5922221541404724} -08/30/2021 17:17:31 - INFO - __main__ - Step 22800: {'lr': 0.0004760279444963657, 'samples': 4377600, 'steps': 22799, 'loss/train': 1.4615356922149658} -08/30/2021 17:17:31 - INFO - __main__ - Step 22801: {'lr': 0.0004760256768946787, 'samples': 4377792, 'steps': 22800, 'loss/train': 1.6913899183273315} -08/30/2021 17:17:31 - INFO - __main__ - Step 22802: {'lr': 0.00047602340919114793, 'samples': 4377984, 'steps': 22801, 'loss/train': 1.722115159034729} -08/30/2021 17:17:32 - INFO - __main__ - Step 22803: {'lr': 0.00047602114138577464, 'samples': 4378176, 'steps': 22802, 'loss/train': 1.2216346263885498} -08/30/2021 17:17:32 - INFO - __main__ - Step 22804: {'lr': 0.00047601887347855965, 'samples': 4378368, 'steps': 22803, 'loss/train': 1.5958867073059082} -08/30/2021 17:17:34 - INFO - __main__ - Step 22805: {'lr': 0.00047601660546950396, 'samples': 4378560, 'steps': 22804, 'loss/train': 1.288720965385437} -08/30/2021 17:17:34 - INFO - __main__ - Step 22806: {'lr': 0.0004760143373586088, 'samples': 4378752, 'steps': 22805, 'loss/train': 1.337775707244873} -08/30/2021 17:17:35 - INFO - __main__ - Step 22807: {'lr': 0.000476012069145875, 'samples': 4378944, 'steps': 22806, 'loss/train': 1.4912784099578857} -08/30/2021 17:17:35 - INFO - __main__ - Step 22808: {'lr': 0.00047600980083130367, 'samples': 4379136, 'steps': 22807, 'loss/train': 0.16186995804309845} -08/30/2021 17:17:35 - INFO - __main__ - Step 22809: {'lr': 0.0004760075324148959, 'samples': 4379328, 'steps': 22808, 'loss/train': 2.0144107341766357} -08/30/2021 17:17:36 - INFO - __main__ - Step 22810: {'lr': 0.00047600526389665246, 'samples': 4379520, 'steps': 22809, 'loss/train': 1.2294877767562866} -08/30/2021 17:17:37 - INFO - __main__ - Step 22811: {'lr': 0.00047600299527657464, 'samples': 4379712, 'steps': 22810, 'loss/train': 1.824755072593689} -08/30/2021 17:17:38 - INFO - __main__ - Step 22812: {'lr': 0.0004760007265546633, 'samples': 4379904, 'steps': 22811, 'loss/train': 1.269286036491394} -08/30/2021 17:17:38 - INFO - __main__ - Step 22813: {'lr': 0.00047599845773091957, 'samples': 4380096, 'steps': 22812, 'loss/train': 1.4401121139526367} -08/30/2021 17:17:39 - INFO - __main__ - Step 22814: {'lr': 0.0004759961888053444, 'samples': 4380288, 'steps': 22813, 'loss/train': 2.1565186977386475} -08/30/2021 17:17:39 - INFO - __main__ - Step 22815: {'lr': 0.00047599391977793884, 'samples': 4380480, 'steps': 22814, 'loss/train': 1.5639879703521729} -08/30/2021 17:17:40 - INFO - __main__ - Step 22816: {'lr': 0.00047599165064870385, 'samples': 4380672, 'steps': 22815, 'loss/train': 3.1073622703552246} -08/30/2021 17:17:41 - INFO - __main__ - Step 22817: {'lr': 0.0004759893814176406, 'samples': 4380864, 'steps': 22816, 'loss/train': 0.3915186822414398} -08/30/2021 17:17:41 - INFO - __main__ - Step 22818: {'lr': 0.00047598711208475, 'samples': 4381056, 'steps': 22817, 'loss/train': 1.7690671682357788} -08/30/2021 17:17:41 - INFO - __main__ - Step 22819: {'lr': 0.00047598484265003307, 'samples': 4381248, 'steps': 22818, 'loss/train': 1.451126217842102} -08/30/2021 17:17:42 - INFO - __main__ - Step 22820: {'lr': 0.00047598257311349087, 'samples': 4381440, 'steps': 22819, 'loss/train': 1.9935786724090576} -08/30/2021 17:17:42 - INFO - __main__ - Step 22821: {'lr': 0.0004759803034751244, 'samples': 4381632, 'steps': 22820, 'loss/train': 1.9499880075454712} -08/30/2021 17:17:44 - INFO - __main__ - Step 22822: {'lr': 0.0004759780337349347, 'samples': 4381824, 'steps': 22821, 'loss/train': 1.7148023843765259} -08/30/2021 17:17:44 - INFO - __main__ - Step 22823: {'lr': 0.0004759757638929227, 'samples': 4382016, 'steps': 22822, 'loss/train': 5.891917705535889} -08/30/2021 17:17:44 - INFO - __main__ - Step 22824: {'lr': 0.00047597349394908967, 'samples': 4382208, 'steps': 22823, 'loss/train': 1.981136441230774} -08/30/2021 17:17:45 - INFO - __main__ - Step 22825: {'lr': 0.0004759712239034364, 'samples': 4382400, 'steps': 22824, 'loss/train': 1.6211497783660889} -08/30/2021 17:17:45 - INFO - __main__ - Step 22826: {'lr': 0.0004759689537559639, 'samples': 4382592, 'steps': 22825, 'loss/train': 1.9349123239517212} -08/30/2021 17:17:47 - INFO - __main__ - Step 22827: {'lr': 0.0004759666835066734, 'samples': 4382784, 'steps': 22826, 'loss/train': 1.3486504554748535} -08/30/2021 17:17:47 - INFO - __main__ - Step 22828: {'lr': 0.00047596441315556575, 'samples': 4382976, 'steps': 22827, 'loss/train': 2.139190196990967} -08/30/2021 17:17:48 - INFO - __main__ - Step 22829: {'lr': 0.00047596214270264204, 'samples': 4383168, 'steps': 22828, 'loss/train': 1.8058923482894897} -08/30/2021 17:17:48 - INFO - __main__ - Step 22830: {'lr': 0.00047595987214790324, 'samples': 4383360, 'steps': 22829, 'loss/train': 1.976863980293274} -08/30/2021 17:17:48 - INFO - __main__ - Step 22831: {'lr': 0.0004759576014913505, 'samples': 4383552, 'steps': 22830, 'loss/train': 0.43058809638023376} -08/30/2021 17:17:49 - INFO - __main__ - Step 22832: {'lr': 0.0004759553307329846, 'samples': 4383744, 'steps': 22831, 'loss/train': 2.1321988105773926} -08/30/2021 17:17:50 - INFO - __main__ - Step 22833: {'lr': 0.0004759530598728068, 'samples': 4383936, 'steps': 22832, 'loss/train': 1.539613962173462} -08/30/2021 17:17:51 - INFO - __main__ - Step 22834: {'lr': 0.000475950788910818, 'samples': 4384128, 'steps': 22833, 'loss/train': 1.6206520795822144} -08/30/2021 17:17:51 - INFO - __main__ - Step 22835: {'lr': 0.0004759485178470193, 'samples': 4384320, 'steps': 22834, 'loss/train': 1.404211401939392} -08/30/2021 17:17:51 - INFO - __main__ - Step 22836: {'lr': 0.0004759462466814117, 'samples': 4384512, 'steps': 22835, 'loss/train': 1.3100310564041138} -08/30/2021 17:17:52 - INFO - __main__ - Step 22837: {'lr': 0.0004759439754139962, 'samples': 4384704, 'steps': 22836, 'loss/train': 1.5406081676483154} -08/30/2021 17:17:53 - INFO - __main__ - Step 22838: {'lr': 0.0004759417040447738, 'samples': 4384896, 'steps': 22837, 'loss/train': 1.3121213912963867} -08/30/2021 17:17:54 - INFO - __main__ - Step 22839: {'lr': 0.00047593943257374563, 'samples': 4385088, 'steps': 22838, 'loss/train': 1.3830492496490479} -08/30/2021 17:17:54 - INFO - __main__ - Step 22840: {'lr': 0.00047593716100091253, 'samples': 4385280, 'steps': 22839, 'loss/train': 1.1399668455123901} -08/30/2021 17:17:55 - INFO - __main__ - Step 22841: {'lr': 0.00047593488932627567, 'samples': 4385472, 'steps': 22840, 'loss/train': 0.2697351276874542} -08/30/2021 17:17:55 - INFO - __main__ - Step 22842: {'lr': 0.00047593261754983607, 'samples': 4385664, 'steps': 22841, 'loss/train': 0.36397024989128113} -08/30/2021 17:17:55 - INFO - __main__ - Step 22843: {'lr': 0.00047593034567159465, 'samples': 4385856, 'steps': 22842, 'loss/train': 1.7801777124404907} -08/30/2021 17:17:57 - INFO - __main__ - Step 22844: {'lr': 0.00047592807369155256, 'samples': 4386048, 'steps': 22843, 'loss/train': 1.2506732940673828} -08/30/2021 17:17:57 - INFO - __main__ - Step 22845: {'lr': 0.0004759258016097108, 'samples': 4386240, 'steps': 22844, 'loss/train': 2.4678118228912354} -08/30/2021 17:17:58 - INFO - __main__ - Step 22846: {'lr': 0.0004759235294260703, 'samples': 4386432, 'steps': 22845, 'loss/train': 1.5825022459030151} -08/30/2021 17:17:58 - INFO - __main__ - Step 22847: {'lr': 0.0004759212571406321, 'samples': 4386624, 'steps': 22846, 'loss/train': 0.9864962697029114} -08/30/2021 17:17:58 - INFO - __main__ - Step 22848: {'lr': 0.00047591898475339735, 'samples': 4386816, 'steps': 22847, 'loss/train': 1.507699966430664} -08/30/2021 17:18:00 - INFO - __main__ - Step 22849: {'lr': 0.00047591671226436695, 'samples': 4387008, 'steps': 22848, 'loss/train': 1.8230257034301758} -08/30/2021 17:18:01 - INFO - __main__ - Step 22850: {'lr': 0.00047591443967354196, 'samples': 4387200, 'steps': 22849, 'loss/train': 1.8146308660507202} -08/30/2021 17:18:01 - INFO - __main__ - Step 22851: {'lr': 0.00047591216698092344, 'samples': 4387392, 'steps': 22850, 'loss/train': 1.4738590717315674} -08/30/2021 17:18:02 - INFO - __main__ - Step 22852: {'lr': 0.00047590989418651243, 'samples': 4387584, 'steps': 22851, 'loss/train': 1.4997490644454956} -08/30/2021 17:18:02 - INFO - __main__ - Step 22853: {'lr': 0.00047590762129030986, 'samples': 4387776, 'steps': 22852, 'loss/train': 2.373847723007202} -08/30/2021 17:18:04 - INFO - __main__ - Step 22854: {'lr': 0.00047590534829231675, 'samples': 4387968, 'steps': 22853, 'loss/train': 1.1073637008666992} -08/30/2021 17:18:04 - INFO - __main__ - Step 22855: {'lr': 0.00047590307519253423, 'samples': 4388160, 'steps': 22854, 'loss/train': 1.5946327447891235} -08/30/2021 17:18:05 - INFO - __main__ - Step 22856: {'lr': 0.00047590080199096324, 'samples': 4388352, 'steps': 22855, 'loss/train': 1.5366663932800293} -08/30/2021 17:18:05 - INFO - __main__ - Step 22857: {'lr': 0.00047589852868760486, 'samples': 4388544, 'steps': 22856, 'loss/train': 1.5052390098571777} -08/30/2021 17:18:05 - INFO - __main__ - Step 22858: {'lr': 0.00047589625528246006, 'samples': 4388736, 'steps': 22857, 'loss/train': 1.7839717864990234} -08/30/2021 17:18:07 - INFO - __main__ - Step 22859: {'lr': 0.0004758939817755299, 'samples': 4388928, 'steps': 22858, 'loss/train': 0.096491739153862} -08/30/2021 17:18:07 - INFO - __main__ - Step 22860: {'lr': 0.0004758917081668155, 'samples': 4389120, 'steps': 22859, 'loss/train': 1.6763114929199219} -08/30/2021 17:18:08 - INFO - __main__ - Step 22861: {'lr': 0.00047588943445631767, 'samples': 4389312, 'steps': 22860, 'loss/train': 1.6641391515731812} -08/30/2021 17:18:08 - INFO - __main__ - Step 22862: {'lr': 0.0004758871606440376, 'samples': 4389504, 'steps': 22861, 'loss/train': 2.582131862640381} -08/30/2021 17:18:08 - INFO - __main__ - Step 22863: {'lr': 0.0004758848867299762, 'samples': 4389696, 'steps': 22862, 'loss/train': 1.5989612340927124} -08/30/2021 17:18:10 - INFO - __main__ - Step 22864: {'lr': 0.0004758826127141346, 'samples': 4389888, 'steps': 22863, 'loss/train': 1.7373689413070679} -08/30/2021 17:18:10 - INFO - __main__ - Step 22865: {'lr': 0.00047588033859651376, 'samples': 4390080, 'steps': 22864, 'loss/train': 1.8764578104019165} -08/30/2021 17:18:11 - INFO - __main__ - Step 22866: {'lr': 0.00047587806437711475, 'samples': 4390272, 'steps': 22865, 'loss/train': 2.0728724002838135} -08/30/2021 17:18:11 - INFO - __main__ - Step 22867: {'lr': 0.0004758757900559385, 'samples': 4390464, 'steps': 22866, 'loss/train': 1.1344109773635864} -08/30/2021 17:18:11 - INFO - __main__ - Step 22868: {'lr': 0.0004758735156329862, 'samples': 4390656, 'steps': 22867, 'loss/train': 1.8590474128723145} -08/30/2021 17:18:12 - INFO - __main__ - Step 22869: {'lr': 0.00047587124110825874, 'samples': 4390848, 'steps': 22868, 'loss/train': 1.8620820045471191} -08/30/2021 17:18:13 - INFO - __main__ - Step 22870: {'lr': 0.00047586896648175715, 'samples': 4391040, 'steps': 22869, 'loss/train': 1.315921425819397} -08/30/2021 17:18:14 - INFO - __main__ - Step 22871: {'lr': 0.00047586669175348254, 'samples': 4391232, 'steps': 22870, 'loss/train': 1.1827940940856934} -08/30/2021 17:18:14 - INFO - __main__ - Step 22872: {'lr': 0.0004758644169234359, 'samples': 4391424, 'steps': 22871, 'loss/train': 1.5243394374847412} -08/30/2021 17:18:14 - INFO - __main__ - Step 22873: {'lr': 0.00047586214199161814, 'samples': 4391616, 'steps': 22872, 'loss/train': 1.2829667329788208} -08/30/2021 17:18:15 - INFO - __main__ - Step 22874: {'lr': 0.00047585986695803046, 'samples': 4391808, 'steps': 22873, 'loss/train': 1.6022831201553345} -08/30/2021 17:18:16 - INFO - __main__ - Step 22875: {'lr': 0.0004758575918226738, 'samples': 4392000, 'steps': 22874, 'loss/train': 2.4123387336730957} -08/30/2021 17:18:17 - INFO - __main__ - Step 22876: {'lr': 0.0004758553165855492, 'samples': 4392192, 'steps': 22875, 'loss/train': 1.2562882900238037} -08/30/2021 17:18:17 - INFO - __main__ - Step 22877: {'lr': 0.00047585304124665766, 'samples': 4392384, 'steps': 22876, 'loss/train': 2.1552555561065674} -08/30/2021 17:18:17 - INFO - __main__ - Step 22878: {'lr': 0.0004758507658060003, 'samples': 4392576, 'steps': 22877, 'loss/train': 1.7031769752502441} -08/30/2021 17:18:18 - INFO - __main__ - Step 22879: {'lr': 0.00047584849026357796, 'samples': 4392768, 'steps': 22878, 'loss/train': 1.3326934576034546} -08/30/2021 17:18:19 - INFO - __main__ - Step 22880: {'lr': 0.0004758462146193918, 'samples': 4392960, 'steps': 22879, 'loss/train': 1.129577875137329} -08/30/2021 17:18:20 - INFO - __main__ - Step 22881: {'lr': 0.00047584393887344285, 'samples': 4393152, 'steps': 22880, 'loss/train': 1.4693756103515625} -08/30/2021 17:18:20 - INFO - __main__ - Step 22882: {'lr': 0.00047584166302573204, 'samples': 4393344, 'steps': 22881, 'loss/train': 1.6039628982543945} -08/30/2021 17:18:20 - INFO - __main__ - Step 22883: {'lr': 0.0004758393870762606, 'samples': 4393536, 'steps': 22882, 'loss/train': 1.9116535186767578} -08/30/2021 17:18:21 - INFO - __main__ - Step 22884: {'lr': 0.00047583711102502934, 'samples': 4393728, 'steps': 22883, 'loss/train': 1.4598807096481323} -08/30/2021 17:18:22 - INFO - __main__ - Step 22885: {'lr': 0.0004758348348720393, 'samples': 4393920, 'steps': 22884, 'loss/train': 1.155315637588501} -08/30/2021 17:18:23 - INFO - __main__ - Step 22886: {'lr': 0.00047583255861729167, 'samples': 4394112, 'steps': 22885, 'loss/train': 1.7323552370071411} -08/30/2021 17:18:23 - INFO - __main__ - Step 22887: {'lr': 0.00047583028226078734, 'samples': 4394304, 'steps': 22886, 'loss/train': 1.7252373695373535} -08/30/2021 17:18:23 - INFO - __main__ - Step 22888: {'lr': 0.0004758280058025274, 'samples': 4394496, 'steps': 22887, 'loss/train': 1.758551836013794} -08/30/2021 17:18:24 - INFO - __main__ - Step 22889: {'lr': 0.00047582572924251276, 'samples': 4394688, 'steps': 22888, 'loss/train': 2.229707956314087} -08/30/2021 17:18:25 - INFO - __main__ - Step 22890: {'lr': 0.00047582345258074453, 'samples': 4394880, 'steps': 22889, 'loss/train': 1.6733328104019165} -08/30/2021 17:18:26 - INFO - __main__ - Step 22891: {'lr': 0.0004758211758172238, 'samples': 4395072, 'steps': 22890, 'loss/train': 1.8109558820724487} -08/30/2021 17:18:26 - INFO - __main__ - Step 22892: {'lr': 0.00047581889895195154, 'samples': 4395264, 'steps': 22891, 'loss/train': 2.3365039825439453} -08/30/2021 17:18:26 - INFO - __main__ - Step 22893: {'lr': 0.00047581662198492873, 'samples': 4395456, 'steps': 22892, 'loss/train': 1.775614619255066} -08/30/2021 17:18:27 - INFO - __main__ - Step 22894: {'lr': 0.0004758143449161565, 'samples': 4395648, 'steps': 22893, 'loss/train': 1.4363470077514648} -08/30/2021 17:18:27 - INFO - __main__ - Step 22895: {'lr': 0.00047581206774563575, 'samples': 4395840, 'steps': 22894, 'loss/train': 1.4303739070892334} -08/30/2021 17:18:28 - INFO - __main__ - Step 22896: {'lr': 0.0004758097904733676, 'samples': 4396032, 'steps': 22895, 'loss/train': 1.9553728103637695} -08/30/2021 17:18:29 - INFO - __main__ - Step 22897: {'lr': 0.000475807513099353, 'samples': 4396224, 'steps': 22896, 'loss/train': 1.7079744338989258} -08/30/2021 17:18:29 - INFO - __main__ - Step 22898: {'lr': 0.000475805235623593, 'samples': 4396416, 'steps': 22897, 'loss/train': 2.0140016078948975} -08/30/2021 17:18:30 - INFO - __main__ - Step 22899: {'lr': 0.0004758029580460887, 'samples': 4396608, 'steps': 22898, 'loss/train': 1.715692400932312} -08/30/2021 17:18:30 - INFO - __main__ - Step 22900: {'lr': 0.0004758006803668411, 'samples': 4396800, 'steps': 22899, 'loss/train': 1.5090689659118652} -08/30/2021 17:18:32 - INFO - __main__ - Step 22901: {'lr': 0.0004757984025858511, 'samples': 4396992, 'steps': 22900, 'loss/train': 1.0468246936798096} -08/30/2021 17:18:33 - INFO - __main__ - Step 22902: {'lr': 0.0004757961247031199, 'samples': 4397184, 'steps': 22901, 'loss/train': 0.2992228865623474} -08/30/2021 17:18:33 - INFO - __main__ - Step 22903: {'lr': 0.00047579384671864845, 'samples': 4397376, 'steps': 22902, 'loss/train': 1.5388532876968384} -08/30/2021 17:18:34 - INFO - __main__ - Step 22904: {'lr': 0.0004757915686324377, 'samples': 4397568, 'steps': 22903, 'loss/train': 1.5558629035949707} -08/30/2021 17:18:34 - INFO - __main__ - Step 22905: {'lr': 0.00047578929044448883, 'samples': 4397760, 'steps': 22904, 'loss/train': 1.2496048212051392} -08/30/2021 17:18:36 - INFO - __main__ - Step 22906: {'lr': 0.0004757870121548028, 'samples': 4397952, 'steps': 22905, 'loss/train': 2.200721263885498} -08/30/2021 17:18:36 - INFO - __main__ - Step 22907: {'lr': 0.0004757847337633806, 'samples': 4398144, 'steps': 22906, 'loss/train': 1.0412330627441406} -08/30/2021 17:18:36 - INFO - __main__ - Step 22908: {'lr': 0.0004757824552702232, 'samples': 4398336, 'steps': 22907, 'loss/train': 0.11058652400970459} -08/30/2021 17:18:37 - INFO - __main__ - Step 22909: {'lr': 0.0004757801766753318, 'samples': 4398528, 'steps': 22908, 'loss/train': 1.9616198539733887} -08/30/2021 17:18:37 - INFO - __main__ - Step 22910: {'lr': 0.00047577789797870743, 'samples': 4398720, 'steps': 22909, 'loss/train': 1.3215875625610352} -08/30/2021 17:18:37 - INFO - __main__ - Step 22911: {'lr': 0.0004757756191803508, 'samples': 4398912, 'steps': 22910, 'loss/train': 1.7832579612731934} -08/30/2021 17:18:39 - INFO - __main__ - Step 22912: {'lr': 0.0004757733402802633, 'samples': 4399104, 'steps': 22911, 'loss/train': 1.880214810371399} -08/30/2021 17:18:40 - INFO - __main__ - Step 22913: {'lr': 0.0004757710612784458, 'samples': 4399296, 'steps': 22912, 'loss/train': 0.1897026151418686} -08/30/2021 17:18:40 - INFO - __main__ - Step 22914: {'lr': 0.0004757687821748994, 'samples': 4399488, 'steps': 22913, 'loss/train': 1.9128143787384033} -08/30/2021 17:18:40 - INFO - __main__ - Step 22915: {'lr': 0.00047576650296962496, 'samples': 4399680, 'steps': 22914, 'loss/train': 1.9582329988479614} -08/30/2021 17:18:41 - INFO - __main__ - Step 22916: {'lr': 0.0004757642236626237, 'samples': 4399872, 'steps': 22915, 'loss/train': 1.375234842300415} -08/30/2021 17:18:42 - INFO - __main__ - Step 22917: {'lr': 0.00047576194425389654, 'samples': 4400064, 'steps': 22916, 'loss/train': 1.1546584367752075} -08/30/2021 17:18:43 - INFO - __main__ - Step 22918: {'lr': 0.00047575966474344445, 'samples': 4400256, 'steps': 22917, 'loss/train': 1.2885922193527222} -08/30/2021 17:18:43 - INFO - __main__ - Step 22919: {'lr': 0.00047575738513126867, 'samples': 4400448, 'steps': 22918, 'loss/train': 1.3296352624893188} -08/30/2021 17:18:43 - INFO - __main__ - Step 22920: {'lr': 0.00047575510541737, 'samples': 4400640, 'steps': 22919, 'loss/train': 1.962688684463501} -08/30/2021 17:18:44 - INFO - __main__ - Step 22921: {'lr': 0.0004757528256017496, 'samples': 4400832, 'steps': 22920, 'loss/train': 1.3125160932540894} -08/30/2021 17:18:45 - INFO - __main__ - Step 22922: {'lr': 0.00047575054568440846, 'samples': 4401024, 'steps': 22921, 'loss/train': 3.0557782649993896} -08/30/2021 17:18:46 - INFO - __main__ - Step 22923: {'lr': 0.00047574826566534764, 'samples': 4401216, 'steps': 22922, 'loss/train': 1.4462623596191406} -08/30/2021 17:18:46 - INFO - __main__ - Step 22924: {'lr': 0.0004757459855445681, 'samples': 4401408, 'steps': 22923, 'loss/train': 1.3010894060134888} -08/30/2021 17:18:46 - INFO - __main__ - Step 22925: {'lr': 0.0004757437053220709, 'samples': 4401600, 'steps': 22924, 'loss/train': 1.4071928262710571} -08/30/2021 17:18:47 - INFO - __main__ - Step 22926: {'lr': 0.0004757414249978571, 'samples': 4401792, 'steps': 22925, 'loss/train': 1.6209383010864258} -08/30/2021 17:18:47 - INFO - __main__ - Step 22927: {'lr': 0.0004757391445719277, 'samples': 4401984, 'steps': 22926, 'loss/train': 1.5751428604125977} -08/30/2021 17:18:49 - INFO - __main__ - Step 22928: {'lr': 0.00047573686404428365, 'samples': 4402176, 'steps': 22927, 'loss/train': 1.1744216680526733} -08/30/2021 17:18:49 - INFO - __main__ - Step 22929: {'lr': 0.0004757345834149261, 'samples': 4402368, 'steps': 22928, 'loss/train': 1.4119768142700195} -08/30/2021 17:18:50 - INFO - __main__ - Step 22930: {'lr': 0.00047573230268385604, 'samples': 4402560, 'steps': 22929, 'loss/train': 1.8124980926513672} -08/30/2021 17:18:50 - INFO - __main__ - Step 22931: {'lr': 0.0004757300218510745, 'samples': 4402752, 'steps': 22930, 'loss/train': 1.4101451635360718} -08/30/2021 17:18:50 - INFO - __main__ - Step 22932: {'lr': 0.00047572774091658243, 'samples': 4402944, 'steps': 22931, 'loss/train': 1.6242215633392334} -08/30/2021 17:18:52 - INFO - __main__ - Step 22933: {'lr': 0.000475725459880381, 'samples': 4403136, 'steps': 22932, 'loss/train': 1.5872819423675537} -08/30/2021 17:18:52 - INFO - __main__ - Step 22934: {'lr': 0.00047572317874247107, 'samples': 4403328, 'steps': 22933, 'loss/train': 1.8957769870758057} -08/30/2021 17:18:53 - INFO - __main__ - Step 22935: {'lr': 0.00047572089750285383, 'samples': 4403520, 'steps': 22934, 'loss/train': 1.7136831283569336} -08/30/2021 17:18:53 - INFO - __main__ - Step 22936: {'lr': 0.00047571861616153025, 'samples': 4403712, 'steps': 22935, 'loss/train': 1.3539509773254395} -08/30/2021 17:18:53 - INFO - __main__ - Step 22937: {'lr': 0.0004757163347185013, 'samples': 4403904, 'steps': 22936, 'loss/train': 1.2230592966079712} -08/30/2021 17:18:55 - INFO - __main__ - Step 22938: {'lr': 0.00047571405317376803, 'samples': 4404096, 'steps': 22937, 'loss/train': 2.0420732498168945} -08/30/2021 17:18:55 - INFO - __main__ - Step 22939: {'lr': 0.0004757117715273316, 'samples': 4404288, 'steps': 22938, 'loss/train': 1.3886237144470215} -08/30/2021 17:18:56 - INFO - __main__ - Step 22940: {'lr': 0.00047570948977919284, 'samples': 4404480, 'steps': 22939, 'loss/train': 1.8188010454177856} -08/30/2021 17:18:56 - INFO - __main__ - Step 22941: {'lr': 0.00047570720792935284, 'samples': 4404672, 'steps': 22940, 'loss/train': 1.5992809534072876} -08/30/2021 17:18:56 - INFO - __main__ - Step 22942: {'lr': 0.00047570492597781274, 'samples': 4404864, 'steps': 22941, 'loss/train': 1.5576814413070679} -08/30/2021 17:18:58 - INFO - __main__ - Step 22943: {'lr': 0.0004757026439245735, 'samples': 4405056, 'steps': 22942, 'loss/train': 1.3755614757537842} -08/30/2021 17:18:59 - INFO - __main__ - Step 22944: {'lr': 0.0004757003617696361, 'samples': 4405248, 'steps': 22943, 'loss/train': 1.7030465602874756} -08/30/2021 17:18:59 - INFO - __main__ - Step 22945: {'lr': 0.0004756980795130015, 'samples': 4405440, 'steps': 22944, 'loss/train': 1.8665271997451782} -08/30/2021 17:18:59 - INFO - __main__ - Step 22946: {'lr': 0.00047569579715467093, 'samples': 4405632, 'steps': 22945, 'loss/train': 1.5804766416549683} -08/30/2021 17:19:00 - INFO - __main__ - Step 22947: {'lr': 0.00047569351469464526, 'samples': 4405824, 'steps': 22946, 'loss/train': 1.5600886344909668} -08/30/2021 17:19:00 - INFO - __main__ - Step 22948: {'lr': 0.0004756912321329256, 'samples': 4406016, 'steps': 22947, 'loss/train': 0.07514391839504242} -08/30/2021 17:19:01 - INFO - __main__ - Step 22949: {'lr': 0.000475688949469513, 'samples': 4406208, 'steps': 22948, 'loss/train': 1.5531437397003174} -08/30/2021 17:19:02 - INFO - __main__ - Step 22950: {'lr': 0.0004756866667044084, 'samples': 4406400, 'steps': 22949, 'loss/train': 1.7941099405288696} -08/30/2021 17:19:02 - INFO - __main__ - Step 22951: {'lr': 0.0004756843838376128, 'samples': 4406592, 'steps': 22950, 'loss/train': 0.19485221803188324} -08/30/2021 17:19:03 - INFO - __main__ - Step 22952: {'lr': 0.0004756821008691274, 'samples': 4406784, 'steps': 22951, 'loss/train': 1.46951162815094} -08/30/2021 17:19:03 - INFO - __main__ - Step 22953: {'lr': 0.0004756798177989531, 'samples': 4406976, 'steps': 22952, 'loss/train': 1.5732104778289795} -08/30/2021 17:19:05 - INFO - __main__ - Step 22954: {'lr': 0.00047567753462709095, 'samples': 4407168, 'steps': 22953, 'loss/train': 1.7873196601867676} -08/30/2021 17:19:06 - INFO - __main__ - Step 22955: {'lr': 0.00047567525135354193, 'samples': 4407360, 'steps': 22954, 'loss/train': 1.5982166528701782} -08/30/2021 17:19:06 - INFO - __main__ - Step 22956: {'lr': 0.00047567296797830727, 'samples': 4407552, 'steps': 22955, 'loss/train': 1.9292433261871338} -08/30/2021 17:19:06 - INFO - __main__ - Step 22957: {'lr': 0.00047567068450138773, 'samples': 4407744, 'steps': 22956, 'loss/train': 1.453284740447998} -08/30/2021 17:19:07 - INFO - __main__ - Step 22958: {'lr': 0.0004756684009227845, 'samples': 4407936, 'steps': 22957, 'loss/train': 1.9705432653427124} -08/30/2021 17:19:08 - INFO - __main__ - Step 22959: {'lr': 0.0004756661172424986, 'samples': 4408128, 'steps': 22958, 'loss/train': 1.847352385520935} -08/30/2021 17:19:08 - INFO - __main__ - Step 22960: {'lr': 0.000475663833460531, 'samples': 4408320, 'steps': 22959, 'loss/train': 1.7003968954086304} -08/30/2021 17:19:09 - INFO - __main__ - Step 22961: {'lr': 0.00047566154957688275, 'samples': 4408512, 'steps': 22960, 'loss/train': 0.9619525671005249} -08/30/2021 17:19:09 - INFO - __main__ - Step 22962: {'lr': 0.0004756592655915549, 'samples': 4408704, 'steps': 22961, 'loss/train': 1.66960871219635} -08/30/2021 17:19:10 - INFO - __main__ - Step 22963: {'lr': 0.00047565698150454845, 'samples': 4408896, 'steps': 22962, 'loss/train': 1.9270974397659302} -08/30/2021 17:19:11 - INFO - __main__ - Step 22964: {'lr': 0.0004756546973158644, 'samples': 4409088, 'steps': 22963, 'loss/train': 1.7784135341644287} -08/30/2021 17:19:12 - INFO - __main__ - Step 22965: {'lr': 0.00047565241302550395, 'samples': 4409280, 'steps': 22964, 'loss/train': 1.859703540802002} -08/30/2021 17:19:12 - INFO - __main__ - Step 22966: {'lr': 0.0004756501286334679, 'samples': 4409472, 'steps': 22965, 'loss/train': 1.8214054107666016} -08/30/2021 17:19:13 - INFO - __main__ - Step 22967: {'lr': 0.0004756478441397575, 'samples': 4409664, 'steps': 22966, 'loss/train': 0.06283416599035263} -08/30/2021 17:19:13 - INFO - __main__ - Step 22968: {'lr': 0.0004756455595443735, 'samples': 4409856, 'steps': 22967, 'loss/train': 1.3767576217651367} -08/30/2021 17:19:13 - INFO - __main__ - Step 22969: {'lr': 0.00047564327484731725, 'samples': 4410048, 'steps': 22968, 'loss/train': 2.7831339836120605} -08/30/2021 17:19:15 - INFO - __main__ - Step 22970: {'lr': 0.0004756409900485895, 'samples': 4410240, 'steps': 22969, 'loss/train': 2.001856803894043} -08/30/2021 17:19:15 - INFO - __main__ - Step 22971: {'lr': 0.00047563870514819154, 'samples': 4410432, 'steps': 22970, 'loss/train': 1.5054091215133667} -08/30/2021 17:19:16 - INFO - __main__ - Step 22972: {'lr': 0.0004756364201461241, 'samples': 4410624, 'steps': 22971, 'loss/train': 2.18689227104187} -08/30/2021 17:19:16 - INFO - __main__ - Step 22973: {'lr': 0.00047563413504238847, 'samples': 4410816, 'steps': 22972, 'loss/train': 1.7257452011108398} -08/30/2021 17:19:16 - INFO - __main__ - Step 22974: {'lr': 0.0004756318498369855, 'samples': 4411008, 'steps': 22973, 'loss/train': 1.1092854738235474} -08/30/2021 17:19:18 - INFO - __main__ - Step 22975: {'lr': 0.0004756295645299164, 'samples': 4411200, 'steps': 22974, 'loss/train': 1.6956833600997925} -08/30/2021 17:19:18 - INFO - __main__ - Step 22976: {'lr': 0.00047562727912118206, 'samples': 4411392, 'steps': 22975, 'loss/train': 2.3967127799987793} -08/30/2021 17:19:19 - INFO - __main__ - Step 22977: {'lr': 0.00047562499361078356, 'samples': 4411584, 'steps': 22976, 'loss/train': 1.6982682943344116} -08/30/2021 17:19:19 - INFO - __main__ - Step 22978: {'lr': 0.00047562270799872186, 'samples': 4411776, 'steps': 22977, 'loss/train': 1.9491908550262451} -08/30/2021 17:19:19 - INFO - __main__ - Step 22979: {'lr': 0.00047562042228499815, 'samples': 4411968, 'steps': 22978, 'loss/train': 1.7589589357376099} -08/30/2021 17:19:21 - INFO - __main__ - Step 22980: {'lr': 0.00047561813646961325, 'samples': 4412160, 'steps': 22979, 'loss/train': 1.4948928356170654} -08/30/2021 17:19:21 - INFO - __main__ - Step 22981: {'lr': 0.0004756158505525684, 'samples': 4412352, 'steps': 22980, 'loss/train': 1.483370065689087} -08/30/2021 17:19:22 - INFO - __main__ - Step 22982: {'lr': 0.0004756135645338644, 'samples': 4412544, 'steps': 22981, 'loss/train': 1.978050708770752} -08/30/2021 17:19:22 - INFO - __main__ - Step 22983: {'lr': 0.00047561127841350256, 'samples': 4412736, 'steps': 22982, 'loss/train': 1.9036160707473755} -08/30/2021 17:19:22 - INFO - __main__ - Step 22984: {'lr': 0.0004756089921914837, 'samples': 4412928, 'steps': 22983, 'loss/train': 0.5567795038223267} -08/30/2021 17:19:23 - INFO - __main__ - Step 22985: {'lr': 0.00047560670586780886, 'samples': 4413120, 'steps': 22984, 'loss/train': 1.0332645177841187} -08/30/2021 17:19:24 - INFO - __main__ - Step 22986: {'lr': 0.0004756044194424792, 'samples': 4413312, 'steps': 22985, 'loss/train': 1.9853816032409668} -08/30/2021 17:19:25 - INFO - __main__ - Step 22987: {'lr': 0.0004756021329154956, 'samples': 4413504, 'steps': 22986, 'loss/train': 1.6890605688095093} -08/30/2021 17:19:25 - INFO - __main__ - Step 22988: {'lr': 0.0004755998462868592, 'samples': 4413696, 'steps': 22987, 'loss/train': 1.4336907863616943} -08/30/2021 17:19:25 - INFO - __main__ - Step 22989: {'lr': 0.00047559755955657097, 'samples': 4413888, 'steps': 22988, 'loss/train': 1.275169849395752} -08/30/2021 17:19:26 - INFO - __main__ - Step 22990: {'lr': 0.000475595272724632, 'samples': 4414080, 'steps': 22989, 'loss/train': 2.0036916732788086} -08/30/2021 17:19:27 - INFO - __main__ - Step 22991: {'lr': 0.00047559298579104325, 'samples': 4414272, 'steps': 22990, 'loss/train': 1.9356542825698853} -08/30/2021 17:19:27 - INFO - __main__ - Step 22992: {'lr': 0.00047559069875580573, 'samples': 4414464, 'steps': 22991, 'loss/train': 2.0371615886688232} -08/30/2021 17:19:28 - INFO - __main__ - Step 22993: {'lr': 0.00047558841161892063, 'samples': 4414656, 'steps': 22992, 'loss/train': 1.7100064754486084} -08/30/2021 17:19:28 - INFO - __main__ - Step 22994: {'lr': 0.00047558612438038887, 'samples': 4414848, 'steps': 22993, 'loss/train': 1.5306779146194458} -08/30/2021 17:19:29 - INFO - __main__ - Step 22995: {'lr': 0.00047558383704021136, 'samples': 4415040, 'steps': 22994, 'loss/train': 1.7773598432540894} -08/30/2021 17:19:30 - INFO - __main__ - Step 22996: {'lr': 0.00047558154959838935, 'samples': 4415232, 'steps': 22995, 'loss/train': 2.1924450397491455} -08/30/2021 17:19:31 - INFO - __main__ - Step 22997: {'lr': 0.0004755792620549237, 'samples': 4415424, 'steps': 22996, 'loss/train': 1.473719835281372} -08/30/2021 17:19:31 - INFO - __main__ - Step 22998: {'lr': 0.0004755769744098156, 'samples': 4415616, 'steps': 22997, 'loss/train': 1.3908065557479858} -08/30/2021 17:19:31 - INFO - __main__ - Step 22999: {'lr': 0.00047557468666306596, 'samples': 4415808, 'steps': 22998, 'loss/train': 1.2253528833389282} -08/30/2021 17:19:32 - INFO - __main__ - Step 23000: {'lr': 0.00047557239881467584, 'samples': 4416000, 'steps': 22999, 'loss/train': 1.6886320114135742} -08/30/2021 17:19:32 - INFO - __main__ - Step 23001: {'lr': 0.0004755701108646463, 'samples': 4416192, 'steps': 23000, 'loss/train': 5.877809524536133} -08/30/2021 17:19:33 - INFO - __main__ - Step 23002: {'lr': 0.0004755678228129784, 'samples': 4416384, 'steps': 23001, 'loss/train': 1.6232523918151855} -08/30/2021 17:19:34 - INFO - __main__ - Step 23003: {'lr': 0.000475565534659673, 'samples': 4416576, 'steps': 23002, 'loss/train': 0.8050466179847717} -08/30/2021 17:19:34 - INFO - __main__ - Step 23004: {'lr': 0.00047556324640473134, 'samples': 4416768, 'steps': 23003, 'loss/train': 1.570481300354004} -08/30/2021 17:19:35 - INFO - __main__ - Step 23005: {'lr': 0.0004755609580481543, 'samples': 4416960, 'steps': 23004, 'loss/train': 1.5985801219940186} -08/30/2021 17:19:35 - INFO - __main__ - Step 23006: {'lr': 0.00047555866958994296, 'samples': 4417152, 'steps': 23005, 'loss/train': 1.6451317071914673} -08/30/2021 17:19:36 - INFO - __main__ - Step 23007: {'lr': 0.00047555638103009845, 'samples': 4417344, 'steps': 23006, 'loss/train': 1.5482604503631592} -08/30/2021 17:19:37 - INFO - __main__ - Step 23008: {'lr': 0.0004755540923686217, 'samples': 4417536, 'steps': 23007, 'loss/train': 2.0507125854492188} -08/30/2021 17:19:37 - INFO - __main__ - Step 23009: {'lr': 0.0004755518036055137, 'samples': 4417728, 'steps': 23008, 'loss/train': 1.5620150566101074} -08/30/2021 17:19:38 - INFO - __main__ - Step 23010: {'lr': 0.0004755495147407756, 'samples': 4417920, 'steps': 23009, 'loss/train': 1.3272922039031982} -08/30/2021 17:19:38 - INFO - __main__ - Step 23011: {'lr': 0.00047554722577440833, 'samples': 4418112, 'steps': 23010, 'loss/train': 1.2647225856781006} -08/30/2021 17:19:40 - INFO - __main__ - Step 23012: {'lr': 0.00047554493670641296, 'samples': 4418304, 'steps': 23011, 'loss/train': 1.5204968452453613} -08/30/2021 17:19:40 - INFO - __main__ - Step 23013: {'lr': 0.0004755426475367905, 'samples': 4418496, 'steps': 23012, 'loss/train': 2.0286548137664795} -08/30/2021 17:19:41 - INFO - __main__ - Step 23014: {'lr': 0.00047554035826554206, 'samples': 4418688, 'steps': 23013, 'loss/train': 1.5546232461929321} -08/30/2021 17:19:41 - INFO - __main__ - Step 23015: {'lr': 0.0004755380688926686, 'samples': 4418880, 'steps': 23014, 'loss/train': 1.2495543956756592} -08/30/2021 17:19:42 - INFO - __main__ - Step 23016: {'lr': 0.00047553577941817114, 'samples': 4419072, 'steps': 23015, 'loss/train': 1.704040765762329} -08/30/2021 17:19:43 - INFO - __main__ - Step 23017: {'lr': 0.0004755334898420507, 'samples': 4419264, 'steps': 23016, 'loss/train': 1.5796982049942017} -08/30/2021 17:19:43 - INFO - __main__ - Step 23018: {'lr': 0.00047553120016430837, 'samples': 4419456, 'steps': 23017, 'loss/train': 2.387077808380127} -08/30/2021 17:19:44 - INFO - __main__ - Step 23019: {'lr': 0.0004755289103849453, 'samples': 4419648, 'steps': 23018, 'loss/train': 1.6557508707046509} -08/30/2021 17:19:44 - INFO - __main__ - Step 23020: {'lr': 0.0004755266205039622, 'samples': 4419840, 'steps': 23019, 'loss/train': 1.4642345905303955} -08/30/2021 17:19:44 - INFO - __main__ - Step 23021: {'lr': 0.00047552433052136034, 'samples': 4420032, 'steps': 23020, 'loss/train': 1.5368373394012451} -08/30/2021 17:19:46 - INFO - __main__ - Step 23022: {'lr': 0.00047552204043714076, 'samples': 4420224, 'steps': 23021, 'loss/train': 1.7309247255325317} -08/30/2021 17:19:46 - INFO - __main__ - Step 23023: {'lr': 0.0004755197502513043, 'samples': 4420416, 'steps': 23022, 'loss/train': 1.6309560537338257} -08/30/2021 17:19:47 - INFO - __main__ - Step 23024: {'lr': 0.00047551745996385233, 'samples': 4420608, 'steps': 23023, 'loss/train': 1.8825452327728271} -08/30/2021 17:19:47 - INFO - __main__ - Step 23025: {'lr': 0.00047551516957478545, 'samples': 4420800, 'steps': 23024, 'loss/train': 1.3205102682113647} -08/30/2021 17:19:47 - INFO - __main__ - Step 23026: {'lr': 0.0004755128790841051, 'samples': 4420992, 'steps': 23025, 'loss/train': 1.8629093170166016} -08/30/2021 17:19:48 - INFO - __main__ - Step 23027: {'lr': 0.000475510588491812, 'samples': 4421184, 'steps': 23026, 'loss/train': 1.561285138130188} -08/30/2021 17:19:49 - INFO - __main__ - Step 23028: {'lr': 0.00047550829779790735, 'samples': 4421376, 'steps': 23027, 'loss/train': 1.763322114944458} -08/30/2021 17:19:50 - INFO - __main__ - Step 23029: {'lr': 0.0004755060070023921, 'samples': 4421568, 'steps': 23028, 'loss/train': 1.6220554113388062} -08/30/2021 17:19:50 - INFO - __main__ - Step 23030: {'lr': 0.0004755037161052674, 'samples': 4421760, 'steps': 23029, 'loss/train': 1.757729172706604} -08/30/2021 17:19:50 - INFO - __main__ - Step 23031: {'lr': 0.00047550142510653415, 'samples': 4421952, 'steps': 23030, 'loss/train': 0.825249969959259} -08/30/2021 17:19:51 - INFO - __main__ - Step 23032: {'lr': 0.0004754991340061935, 'samples': 4422144, 'steps': 23031, 'loss/train': 1.0758825540542603} -08/30/2021 17:19:53 - INFO - __main__ - Step 23033: {'lr': 0.0004754968428042463, 'samples': 4422336, 'steps': 23032, 'loss/train': 1.6299127340316772} -08/30/2021 17:19:53 - INFO - __main__ - Step 23034: {'lr': 0.0004754945515006938, 'samples': 4422528, 'steps': 23033, 'loss/train': 1.7288877964019775} -08/30/2021 17:19:54 - INFO - __main__ - Step 23035: {'lr': 0.0004754922600955369, 'samples': 4422720, 'steps': 23034, 'loss/train': 1.4009493589401245} -08/30/2021 17:19:54 - INFO - __main__ - Step 23036: {'lr': 0.0004754899685887767, 'samples': 4422912, 'steps': 23035, 'loss/train': 1.2913403511047363} -08/30/2021 17:19:54 - INFO - __main__ - Step 23037: {'lr': 0.0004754876769804142, 'samples': 4423104, 'steps': 23036, 'loss/train': 1.4569898843765259} -08/30/2021 17:19:55 - INFO - __main__ - Step 23038: {'lr': 0.00047548538527045035, 'samples': 4423296, 'steps': 23037, 'loss/train': 0.17948797345161438} -08/30/2021 17:19:57 - INFO - __main__ - Step 23039: {'lr': 0.00047548309345888637, 'samples': 4423488, 'steps': 23038, 'loss/train': 0.34549573063850403} -08/30/2021 17:19:57 - INFO - __main__ - Step 23040: {'lr': 0.00047548080154572315, 'samples': 4423680, 'steps': 23039, 'loss/train': 1.16763436794281} -08/30/2021 17:19:58 - INFO - __main__ - Step 23041: {'lr': 0.00047547850953096174, 'samples': 4423872, 'steps': 23040, 'loss/train': 1.441243052482605} -08/30/2021 17:19:58 - INFO - __main__ - Step 23042: {'lr': 0.0004754762174146032, 'samples': 4424064, 'steps': 23041, 'loss/train': 1.9190456867218018} -08/30/2021 17:19:58 - INFO - __main__ - Step 23043: {'lr': 0.00047547392519664853, 'samples': 4424256, 'steps': 23042, 'loss/train': 2.913517713546753} -08/30/2021 17:19:59 - INFO - __main__ - Step 23044: {'lr': 0.0004754716328770988, 'samples': 4424448, 'steps': 23043, 'loss/train': 2.9844703674316406} -08/30/2021 17:20:00 - INFO - __main__ - Step 23045: {'lr': 0.00047546934045595516, 'samples': 4424640, 'steps': 23044, 'loss/train': 1.363848090171814} -08/30/2021 17:20:01 - INFO - __main__ - Step 23046: {'lr': 0.00047546704793321835, 'samples': 4424832, 'steps': 23045, 'loss/train': 1.8653638362884521} -08/30/2021 17:20:01 - INFO - __main__ - Step 23047: {'lr': 0.0004754647553088896, 'samples': 4425024, 'steps': 23046, 'loss/train': 1.5340021848678589} -08/30/2021 17:20:02 - INFO - __main__ - Step 23048: {'lr': 0.00047546246258297, 'samples': 4425216, 'steps': 23047, 'loss/train': 1.547456979751587} -08/30/2021 17:20:02 - INFO - __main__ - Step 23049: {'lr': 0.00047546016975546037, 'samples': 4425408, 'steps': 23048, 'loss/train': 0.10871273279190063} -08/30/2021 17:20:03 - INFO - __main__ - Step 23050: {'lr': 0.00047545787682636194, 'samples': 4425600, 'steps': 23049, 'loss/train': 1.824331283569336} -08/30/2021 17:20:04 - INFO - __main__ - Step 23051: {'lr': 0.00047545558379567565, 'samples': 4425792, 'steps': 23050, 'loss/train': 1.2129907608032227} -08/30/2021 17:20:04 - INFO - __main__ - Step 23052: {'lr': 0.00047545329066340256, 'samples': 4425984, 'steps': 23051, 'loss/train': 1.473488688468933} -08/30/2021 17:20:05 - INFO - __main__ - Step 23053: {'lr': 0.00047545099742954367, 'samples': 4426176, 'steps': 23052, 'loss/train': 1.6842970848083496} -08/30/2021 17:20:05 - INFO - __main__ - Step 23054: {'lr': 0.0004754487040941001, 'samples': 4426368, 'steps': 23053, 'loss/train': 1.7076953649520874} -08/30/2021 17:20:05 - INFO - __main__ - Step 23055: {'lr': 0.0004754464106570727, 'samples': 4426560, 'steps': 23054, 'loss/train': 1.6193013191223145} -08/30/2021 17:20:07 - INFO - __main__ - Step 23056: {'lr': 0.00047544411711846277, 'samples': 4426752, 'steps': 23055, 'loss/train': 1.618159294128418} -08/30/2021 17:20:07 - INFO - __main__ - Step 23057: {'lr': 0.00047544182347827114, 'samples': 4426944, 'steps': 23056, 'loss/train': 1.6489686965942383} -08/30/2021 17:20:08 - INFO - __main__ - Step 23058: {'lr': 0.0004754395297364989, 'samples': 4427136, 'steps': 23057, 'loss/train': 1.1632510423660278} -08/30/2021 17:20:08 - INFO - __main__ - Step 23059: {'lr': 0.0004754372358931471, 'samples': 4427328, 'steps': 23058, 'loss/train': 1.6978973150253296} -08/30/2021 17:20:08 - INFO - __main__ - Step 23060: {'lr': 0.00047543494194821675, 'samples': 4427520, 'steps': 23059, 'loss/train': 2.407747983932495} -08/30/2021 17:20:10 - INFO - __main__ - Step 23061: {'lr': 0.00047543264790170887, 'samples': 4427712, 'steps': 23060, 'loss/train': 1.26861572265625} -08/30/2021 17:20:10 - INFO - __main__ - Step 23062: {'lr': 0.00047543035375362453, 'samples': 4427904, 'steps': 23061, 'loss/train': 1.7939304113388062} -08/30/2021 17:20:11 - INFO - __main__ - Step 23063: {'lr': 0.00047542805950396476, 'samples': 4428096, 'steps': 23062, 'loss/train': 1.8011139631271362} -08/30/2021 17:20:11 - INFO - __main__ - Step 23064: {'lr': 0.00047542576515273064, 'samples': 4428288, 'steps': 23063, 'loss/train': 1.9798765182495117} -08/30/2021 17:20:11 - INFO - __main__ - Step 23065: {'lr': 0.0004754234706999231, 'samples': 4428480, 'steps': 23064, 'loss/train': 2.1380014419555664} -08/30/2021 17:20:13 - INFO - __main__ - Step 23066: {'lr': 0.0004754211761455432, 'samples': 4428672, 'steps': 23065, 'loss/train': 1.8568460941314697} -08/30/2021 17:20:14 - INFO - __main__ - Step 23067: {'lr': 0.000475418881489592, 'samples': 4428864, 'steps': 23066, 'loss/train': 2.2325549125671387} -08/30/2021 17:20:14 - INFO - __main__ - Step 23068: {'lr': 0.0004754165867320706, 'samples': 4429056, 'steps': 23067, 'loss/train': 1.2719651460647583} -08/30/2021 17:20:14 - INFO - __main__ - Step 23069: {'lr': 0.00047541429187297984, 'samples': 4429248, 'steps': 23068, 'loss/train': 0.6197928190231323} -08/30/2021 17:20:15 - INFO - __main__ - Step 23070: {'lr': 0.00047541199691232094, 'samples': 4429440, 'steps': 23069, 'loss/train': 1.4448164701461792} -08/30/2021 17:20:16 - INFO - __main__ - Step 23071: {'lr': 0.0004754097018500949, 'samples': 4429632, 'steps': 23070, 'loss/train': 1.665648102760315} -08/30/2021 17:20:17 - INFO - __main__ - Step 23072: {'lr': 0.0004754074066863027, 'samples': 4429824, 'steps': 23071, 'loss/train': 1.2831231355667114} -08/30/2021 17:20:17 - INFO - __main__ - Step 23073: {'lr': 0.0004754051114209454, 'samples': 4430016, 'steps': 23072, 'loss/train': 2.770606756210327} -08/30/2021 17:20:18 - INFO - __main__ - Step 23074: {'lr': 0.0004754028160540241, 'samples': 4430208, 'steps': 23073, 'loss/train': 1.4709585905075073} -08/30/2021 17:20:18 - INFO - __main__ - Step 23075: {'lr': 0.0004754005205855397, 'samples': 4430400, 'steps': 23074, 'loss/train': 1.0107523202896118} -08/30/2021 17:20:18 - INFO - __main__ - Step 23076: {'lr': 0.0004753982250154933, 'samples': 4430592, 'steps': 23075, 'loss/train': 1.0506287813186646} -08/30/2021 17:20:20 - INFO - __main__ - Step 23077: {'lr': 0.00047539592934388596, 'samples': 4430784, 'steps': 23076, 'loss/train': 1.9369217157363892} -08/30/2021 17:20:20 - INFO - __main__ - Step 23078: {'lr': 0.0004753936335707187, 'samples': 4430976, 'steps': 23077, 'loss/train': 1.4263718128204346} -08/30/2021 17:20:21 - INFO - __main__ - Step 23079: {'lr': 0.0004753913376959925, 'samples': 4431168, 'steps': 23078, 'loss/train': 1.7650058269500732} -08/30/2021 17:20:21 - INFO - __main__ - Step 23080: {'lr': 0.00047538904171970847, 'samples': 4431360, 'steps': 23079, 'loss/train': 0.5631402730941772} -08/30/2021 17:20:21 - INFO - __main__ - Step 23081: {'lr': 0.0004753867456418677, 'samples': 4431552, 'steps': 23080, 'loss/train': 1.8370333909988403} -08/30/2021 17:20:23 - INFO - __main__ - Step 23082: {'lr': 0.000475384449462471, 'samples': 4431744, 'steps': 23081, 'loss/train': 1.7785964012145996} -08/30/2021 17:20:24 - INFO - __main__ - Step 23083: {'lr': 0.00047538215318151955, 'samples': 4431936, 'steps': 23082, 'loss/train': 1.7811259031295776} -08/30/2021 17:20:24 - INFO - __main__ - Step 23084: {'lr': 0.0004753798567990145, 'samples': 4432128, 'steps': 23083, 'loss/train': 0.8969607949256897} -08/30/2021 17:20:24 - INFO - __main__ - Step 23085: {'lr': 0.00047537756031495673, 'samples': 4432320, 'steps': 23084, 'loss/train': 1.802507758140564} -08/30/2021 17:20:25 - INFO - __main__ - Step 23086: {'lr': 0.0004753752637293473, 'samples': 4432512, 'steps': 23085, 'loss/train': 1.6796890497207642} -08/30/2021 17:20:25 - INFO - __main__ - Step 23087: {'lr': 0.0004753729670421871, 'samples': 4432704, 'steps': 23086, 'loss/train': 1.564009428024292} -08/30/2021 17:20:27 - INFO - __main__ - Step 23088: {'lr': 0.0004753706702534775, 'samples': 4432896, 'steps': 23087, 'loss/train': 2.1037065982818604} -08/30/2021 17:20:27 - INFO - __main__ - Step 23089: {'lr': 0.0004753683733632193, 'samples': 4433088, 'steps': 23088, 'loss/train': 1.561545729637146} -08/30/2021 17:20:28 - INFO - __main__ - Step 23090: {'lr': 0.0004753660763714136, 'samples': 4433280, 'steps': 23089, 'loss/train': 1.6166492700576782} -08/30/2021 17:20:28 - INFO - __main__ - Step 23091: {'lr': 0.00047536377927806143, 'samples': 4433472, 'steps': 23090, 'loss/train': 1.104941487312317} -08/30/2021 17:20:28 - INFO - __main__ - Step 23092: {'lr': 0.0004753614820831638, 'samples': 4433664, 'steps': 23091, 'loss/train': 1.2165592908859253} -08/30/2021 17:20:29 - INFO - __main__ - Step 23093: {'lr': 0.0004753591847867218, 'samples': 4433856, 'steps': 23092, 'loss/train': 1.848177194595337} -08/30/2021 17:20:31 - INFO - __main__ - Step 23094: {'lr': 0.0004753568873887364, 'samples': 4434048, 'steps': 23093, 'loss/train': 1.8158068656921387} -08/30/2021 17:20:31 - INFO - __main__ - Step 23095: {'lr': 0.00047535458988920865, 'samples': 4434240, 'steps': 23094, 'loss/train': 0.7858121991157532} -08/30/2021 17:20:31 - INFO - __main__ - Step 23096: {'lr': 0.0004753522922881396, 'samples': 4434432, 'steps': 23095, 'loss/train': 0.13198018074035645} -08/30/2021 17:20:32 - INFO - __main__ - Step 23097: {'lr': 0.00047534999458553027, 'samples': 4434624, 'steps': 23096, 'loss/train': 1.726241111755371} -08/30/2021 17:20:32 - INFO - __main__ - Step 23098: {'lr': 0.00047534769678138177, 'samples': 4434816, 'steps': 23097, 'loss/train': 2.280733823776245} -08/30/2021 17:20:34 - INFO - __main__ - Step 23099: {'lr': 0.00047534539887569507, 'samples': 4435008, 'steps': 23098, 'loss/train': 1.5222843885421753} -08/30/2021 17:20:34 - INFO - __main__ - Step 23100: {'lr': 0.00047534310086847116, 'samples': 4435200, 'steps': 23099, 'loss/train': 2.4165260791778564} -08/30/2021 17:20:35 - INFO - __main__ - Step 23101: {'lr': 0.0004753408027597111, 'samples': 4435392, 'steps': 23100, 'loss/train': 1.8077912330627441} -08/30/2021 17:20:35 - INFO - __main__ - Step 23102: {'lr': 0.0004753385045494161, 'samples': 4435584, 'steps': 23101, 'loss/train': 1.6808812618255615} -08/30/2021 17:20:35 - INFO - __main__ - Step 23103: {'lr': 0.0004753362062375869, 'samples': 4435776, 'steps': 23102, 'loss/train': 1.5910356044769287} -08/30/2021 17:20:36 - INFO - __main__ - Step 23104: {'lr': 0.0004753339078242247, 'samples': 4435968, 'steps': 23103, 'loss/train': 1.5396397113800049} -08/30/2021 17:20:37 - INFO - __main__ - Step 23105: {'lr': 0.00047533160930933054, 'samples': 4436160, 'steps': 23104, 'loss/train': 1.3970762491226196} -08/30/2021 17:20:38 - INFO - __main__ - Step 23106: {'lr': 0.00047532931069290546, 'samples': 4436352, 'steps': 23105, 'loss/train': 2.041872978210449} -08/30/2021 17:20:38 - INFO - __main__ - Step 23107: {'lr': 0.00047532701197495043, 'samples': 4436544, 'steps': 23106, 'loss/train': 1.8742706775665283} -08/30/2021 17:20:39 - INFO - __main__ - Step 23108: {'lr': 0.00047532471315546654, 'samples': 4436736, 'steps': 23107, 'loss/train': 1.6420570611953735} -08/30/2021 17:20:39 - INFO - __main__ - Step 23109: {'lr': 0.00047532241423445487, 'samples': 4436928, 'steps': 23108, 'loss/train': 1.8693948984146118} -08/30/2021 17:20:40 - INFO - __main__ - Step 23110: {'lr': 0.00047532011521191634, 'samples': 4437120, 'steps': 23109, 'loss/train': 2.1753315925598145} -08/30/2021 17:20:41 - INFO - __main__ - Step 23111: {'lr': 0.00047531781608785203, 'samples': 4437312, 'steps': 23110, 'loss/train': 1.7467502355575562} -08/30/2021 17:20:41 - INFO - __main__ - Step 23112: {'lr': 0.00047531551686226303, 'samples': 4437504, 'steps': 23111, 'loss/train': 1.3459922075271606} -08/30/2021 17:20:42 - INFO - __main__ - Step 23113: {'lr': 0.00047531321753515026, 'samples': 4437696, 'steps': 23112, 'loss/train': 1.6046158075332642} -08/30/2021 17:20:42 - INFO - __main__ - Step 23114: {'lr': 0.0004753109181065149, 'samples': 4437888, 'steps': 23113, 'loss/train': 1.420710563659668} -08/30/2021 17:20:44 - INFO - __main__ - Step 23115: {'lr': 0.00047530861857635786, 'samples': 4438080, 'steps': 23114, 'loss/train': 2.168738603591919} -08/30/2021 17:20:44 - INFO - __main__ - Step 23116: {'lr': 0.00047530631894468034, 'samples': 4438272, 'steps': 23115, 'loss/train': 0.11286278069019318} -08/30/2021 17:20:44 - INFO - __main__ - Step 23117: {'lr': 0.0004753040192114831, 'samples': 4438464, 'steps': 23116, 'loss/train': 0.7792182564735413} -08/30/2021 17:20:45 - INFO - __main__ - Step 23118: {'lr': 0.00047530171937676754, 'samples': 4438656, 'steps': 23117, 'loss/train': 1.52216374874115} -08/30/2021 17:20:45 - INFO - __main__ - Step 23119: {'lr': 0.0004752994194405344, 'samples': 4438848, 'steps': 23118, 'loss/train': 1.2353326082229614} -08/30/2021 17:20:46 - INFO - __main__ - Step 23120: {'lr': 0.0004752971194027848, 'samples': 4439040, 'steps': 23119, 'loss/train': 1.8364794254302979} -08/30/2021 17:20:47 - INFO - __main__ - Step 23121: {'lr': 0.0004752948192635198, 'samples': 4439232, 'steps': 23120, 'loss/train': 1.6021615266799927} -08/30/2021 17:20:47 - INFO - __main__ - Step 23122: {'lr': 0.0004752925190227405, 'samples': 4439424, 'steps': 23121, 'loss/train': 1.5915093421936035} -08/30/2021 17:20:48 - INFO - __main__ - Step 23123: {'lr': 0.0004752902186804478, 'samples': 4439616, 'steps': 23122, 'loss/train': 1.4561430215835571} -08/30/2021 17:20:48 - INFO - __main__ - Step 23124: {'lr': 0.0004752879182366429, 'samples': 4439808, 'steps': 23123, 'loss/train': 2.071640968322754} -08/30/2021 17:20:50 - INFO - __main__ - Step 23125: {'lr': 0.0004752856176913266, 'samples': 4440000, 'steps': 23124, 'loss/train': 0.09368572384119034} -08/30/2021 17:20:50 - INFO - __main__ - Step 23126: {'lr': 0.0004752833170445001, 'samples': 4440192, 'steps': 23125, 'loss/train': 1.8942292928695679} -08/30/2021 17:20:51 - INFO - __main__ - Step 23127: {'lr': 0.0004752810162961645, 'samples': 4440384, 'steps': 23126, 'loss/train': 0.2813170254230499} -08/30/2021 17:20:51 - INFO - __main__ - Step 23128: {'lr': 0.0004752787154463207, 'samples': 4440576, 'steps': 23127, 'loss/train': 1.6915593147277832} -08/30/2021 17:20:51 - INFO - __main__ - Step 23129: {'lr': 0.0004752764144949698, 'samples': 4440768, 'steps': 23128, 'loss/train': 0.9356757402420044} -08/30/2021 17:20:53 - INFO - __main__ - Step 23130: {'lr': 0.0004752741134421128, 'samples': 4440960, 'steps': 23129, 'loss/train': 1.650490164756775} -08/30/2021 17:20:53 - INFO - __main__ - Step 23131: {'lr': 0.00047527181228775077, 'samples': 4441152, 'steps': 23130, 'loss/train': 1.3722552061080933} -08/30/2021 17:20:54 - INFO - __main__ - Step 23132: {'lr': 0.0004752695110318848, 'samples': 4441344, 'steps': 23131, 'loss/train': 1.715676188468933} -08/30/2021 17:20:54 - INFO - __main__ - Step 23133: {'lr': 0.00047526720967451573, 'samples': 4441536, 'steps': 23132, 'loss/train': 1.761802077293396} -08/30/2021 17:20:54 - INFO - __main__ - Step 23134: {'lr': 0.0004752649082156448, 'samples': 4441728, 'steps': 23133, 'loss/train': 1.4513990879058838} -08/30/2021 17:20:56 - INFO - __main__ - Step 23135: {'lr': 0.00047526260665527306, 'samples': 4441920, 'steps': 23134, 'loss/train': 1.4010471105575562} -08/30/2021 17:20:56 - INFO - __main__ - Step 23136: {'lr': 0.0004752603049934014, 'samples': 4442112, 'steps': 23135, 'loss/train': 1.3411589860916138} -08/30/2021 17:20:57 - INFO - __main__ - Step 23137: {'lr': 0.0004752580032300309, 'samples': 4442304, 'steps': 23136, 'loss/train': 1.944082498550415} -08/30/2021 17:20:57 - INFO - __main__ - Step 23138: {'lr': 0.0004752557013651626, 'samples': 4442496, 'steps': 23137, 'loss/train': 1.626043677330017} -08/30/2021 17:20:57 - INFO - __main__ - Step 23139: {'lr': 0.00047525339939879764, 'samples': 4442688, 'steps': 23138, 'loss/train': 1.9153451919555664} -08/30/2021 17:20:58 - INFO - __main__ - Step 23140: {'lr': 0.0004752510973309369, 'samples': 4442880, 'steps': 23139, 'loss/train': 1.190613031387329} -08/30/2021 17:20:59 - INFO - __main__ - Step 23141: {'lr': 0.00047524879516158155, 'samples': 4443072, 'steps': 23140, 'loss/train': 1.5332773923873901} -08/30/2021 17:21:00 - INFO - __main__ - Step 23142: {'lr': 0.00047524649289073254, 'samples': 4443264, 'steps': 23141, 'loss/train': 1.2286112308502197} -08/30/2021 17:21:00 - INFO - __main__ - Step 23143: {'lr': 0.00047524419051839093, 'samples': 4443456, 'steps': 23142, 'loss/train': 1.7234455347061157} -08/30/2021 17:21:00 - INFO - __main__ - Step 23144: {'lr': 0.00047524188804455776, 'samples': 4443648, 'steps': 23143, 'loss/train': 0.9118403196334839} -08/30/2021 17:21:01 - INFO - __main__ - Step 23145: {'lr': 0.0004752395854692341, 'samples': 4443840, 'steps': 23144, 'loss/train': 0.801737368106842} -08/30/2021 17:21:02 - INFO - __main__ - Step 23146: {'lr': 0.0004752372827924209, 'samples': 4444032, 'steps': 23145, 'loss/train': 1.4815832376480103} -08/30/2021 17:21:03 - INFO - __main__ - Step 23147: {'lr': 0.0004752349800141193, 'samples': 4444224, 'steps': 23146, 'loss/train': 0.1470886766910553} -08/30/2021 17:21:03 - INFO - __main__ - Step 23148: {'lr': 0.0004752326771343303, 'samples': 4444416, 'steps': 23147, 'loss/train': 1.0431610345840454} -08/30/2021 17:21:04 - INFO - __main__ - Step 23149: {'lr': 0.00047523037415305494, 'samples': 4444608, 'steps': 23148, 'loss/train': 1.5535979270935059} -08/30/2021 17:21:04 - INFO - __main__ - Step 23150: {'lr': 0.0004752280710702942, 'samples': 4444800, 'steps': 23149, 'loss/train': 1.115715742111206} -08/30/2021 17:21:04 - INFO - __main__ - Step 23151: {'lr': 0.0004752257678860492, 'samples': 4444992, 'steps': 23150, 'loss/train': 1.6098699569702148} -08/30/2021 17:21:06 - INFO - __main__ - Step 23152: {'lr': 0.00047522346460032093, 'samples': 4445184, 'steps': 23151, 'loss/train': 1.8715747594833374} -08/30/2021 17:21:07 - INFO - __main__ - Step 23153: {'lr': 0.0004752211612131104, 'samples': 4445376, 'steps': 23152, 'loss/train': 1.5347611904144287} -08/30/2021 17:21:07 - INFO - __main__ - Step 23154: {'lr': 0.00047521885772441874, 'samples': 4445568, 'steps': 23153, 'loss/train': 0.14605779945850372} -08/30/2021 17:21:07 - INFO - __main__ - Step 23155: {'lr': 0.00047521655413424705, 'samples': 4445760, 'steps': 23154, 'loss/train': 0.32538989186286926} -08/30/2021 17:21:08 - INFO - __main__ - Step 23156: {'lr': 0.0004752142504425961, 'samples': 4445952, 'steps': 23155, 'loss/train': 1.354323387145996} -08/30/2021 17:21:09 - INFO - __main__ - Step 23157: {'lr': 0.0004752119466494671, 'samples': 4446144, 'steps': 23156, 'loss/train': 1.461428165435791} -08/30/2021 17:21:09 - INFO - __main__ - Step 23158: {'lr': 0.0004752096427548611, 'samples': 4446336, 'steps': 23157, 'loss/train': 1.5017316341400146} -08/30/2021 17:21:10 - INFO - __main__ - Step 23159: {'lr': 0.00047520733875877906, 'samples': 4446528, 'steps': 23158, 'loss/train': 1.8959764242172241} -08/30/2021 17:21:10 - INFO - __main__ - Step 23160: {'lr': 0.00047520503466122216, 'samples': 4446720, 'steps': 23159, 'loss/train': 1.2578843832015991} -08/30/2021 17:21:11 - INFO - __main__ - Step 23161: {'lr': 0.0004752027304621913, 'samples': 4446912, 'steps': 23160, 'loss/train': 1.6839022636413574} -08/30/2021 17:21:12 - INFO - __main__ - Step 23162: {'lr': 0.0004752004261616876, 'samples': 4447104, 'steps': 23161, 'loss/train': 1.5024852752685547} -08/30/2021 17:21:12 - INFO - __main__ - Step 23163: {'lr': 0.000475198121759712, 'samples': 4447296, 'steps': 23162, 'loss/train': 1.121056079864502} -08/30/2021 17:21:13 - INFO - __main__ - Step 23164: {'lr': 0.0004751958172562656, 'samples': 4447488, 'steps': 23163, 'loss/train': 1.6009811162948608} -08/30/2021 17:21:13 - INFO - __main__ - Step 23165: {'lr': 0.00047519351265134954, 'samples': 4447680, 'steps': 23164, 'loss/train': 0.7221185564994812} -08/30/2021 17:21:14 - INFO - __main__ - Step 23166: {'lr': 0.00047519120794496466, 'samples': 4447872, 'steps': 23165, 'loss/train': 1.5631213188171387} -08/30/2021 17:21:15 - INFO - __main__ - Step 23167: {'lr': 0.00047518890313711217, 'samples': 4448064, 'steps': 23166, 'loss/train': 1.6122443675994873} -08/30/2021 17:21:16 - INFO - __main__ - Step 23168: {'lr': 0.000475186598227793, 'samples': 4448256, 'steps': 23167, 'loss/train': 1.6459945440292358} -08/30/2021 17:21:16 - INFO - __main__ - Step 23169: {'lr': 0.0004751842932170082, 'samples': 4448448, 'steps': 23168, 'loss/train': 2.0564258098602295} -08/30/2021 17:21:16 - INFO - __main__ - Step 23170: {'lr': 0.00047518198810475885, 'samples': 4448640, 'steps': 23169, 'loss/train': 1.6809388399124146} -08/30/2021 17:21:17 - INFO - __main__ - Step 23171: {'lr': 0.00047517968289104596, 'samples': 4448832, 'steps': 23170, 'loss/train': 1.9831767082214355} -08/30/2021 17:21:17 - INFO - __main__ - Step 23172: {'lr': 0.0004751773775758706, 'samples': 4449024, 'steps': 23171, 'loss/train': 3.460151195526123} -08/30/2021 17:21:19 - INFO - __main__ - Step 23173: {'lr': 0.00047517507215923376, 'samples': 4449216, 'steps': 23172, 'loss/train': 1.5345171689987183} -08/30/2021 17:21:19 - INFO - __main__ - Step 23174: {'lr': 0.00047517276664113653, 'samples': 4449408, 'steps': 23173, 'loss/train': 1.496776819229126} -08/30/2021 17:21:20 - INFO - __main__ - Step 23175: {'lr': 0.0004751704610215799, 'samples': 4449600, 'steps': 23174, 'loss/train': 2.006037950515747} -08/30/2021 17:21:20 - INFO - __main__ - Step 23176: {'lr': 0.000475168155300565, 'samples': 4449792, 'steps': 23175, 'loss/train': 1.4301276206970215} -08/30/2021 17:21:20 - INFO - __main__ - Step 23177: {'lr': 0.00047516584947809274, 'samples': 4449984, 'steps': 23176, 'loss/train': 1.7376550436019897} -08/30/2021 17:21:22 - INFO - __main__ - Step 23178: {'lr': 0.00047516354355416426, 'samples': 4450176, 'steps': 23177, 'loss/train': 1.3079065084457397} -08/30/2021 17:21:23 - INFO - __main__ - Step 23179: {'lr': 0.00047516123752878054, 'samples': 4450368, 'steps': 23178, 'loss/train': 2.0567970275878906} -08/30/2021 17:21:23 - INFO - __main__ - Step 23180: {'lr': 0.00047515893140194265, 'samples': 4450560, 'steps': 23179, 'loss/train': 1.5286344289779663} -08/30/2021 17:21:24 - INFO - __main__ - Step 23181: {'lr': 0.0004751566251736516, 'samples': 4450752, 'steps': 23180, 'loss/train': 1.5406385660171509} -08/30/2021 17:21:24 - INFO - __main__ - Step 23182: {'lr': 0.00047515431884390845, 'samples': 4450944, 'steps': 23181, 'loss/train': 0.1824532300233841} -08/30/2021 17:21:24 - INFO - __main__ - Step 23183: {'lr': 0.00047515201241271426, 'samples': 4451136, 'steps': 23182, 'loss/train': 1.3524411916732788} -08/30/2021 17:21:26 - INFO - __main__ - Step 23184: {'lr': 0.00047514970588007007, 'samples': 4451328, 'steps': 23183, 'loss/train': 1.7183396816253662} -08/30/2021 17:21:26 - INFO - __main__ - Step 23185: {'lr': 0.0004751473992459768, 'samples': 4451520, 'steps': 23184, 'loss/train': 1.3646972179412842} -08/30/2021 17:21:27 - INFO - __main__ - Step 23186: {'lr': 0.0004751450925104357, 'samples': 4451712, 'steps': 23185, 'loss/train': 2.6572694778442383} -08/30/2021 17:21:27 - INFO - __main__ - Step 23187: {'lr': 0.00047514278567344765, 'samples': 4451904, 'steps': 23186, 'loss/train': 1.613290786743164} -08/30/2021 17:21:27 - INFO - __main__ - Step 23188: {'lr': 0.00047514047873501374, 'samples': 4452096, 'steps': 23187, 'loss/train': 1.8051426410675049} -08/30/2021 17:21:29 - INFO - __main__ - Step 23189: {'lr': 0.000475138171695135, 'samples': 4452288, 'steps': 23188, 'loss/train': 1.572274088859558} -08/30/2021 17:21:29 - INFO - __main__ - Step 23190: {'lr': 0.00047513586455381245, 'samples': 4452480, 'steps': 23189, 'loss/train': 1.9939802885055542} -08/30/2021 17:21:30 - INFO - __main__ - Step 23191: {'lr': 0.00047513355731104717, 'samples': 4452672, 'steps': 23190, 'loss/train': 1.7568353414535522} -08/30/2021 17:21:30 - INFO - __main__ - Step 23192: {'lr': 0.0004751312499668402, 'samples': 4452864, 'steps': 23191, 'loss/train': 1.5489119291305542} -08/30/2021 17:21:30 - INFO - __main__ - Step 23193: {'lr': 0.00047512894252119256, 'samples': 4453056, 'steps': 23192, 'loss/train': 1.2617095708847046} -08/30/2021 17:21:32 - INFO - __main__ - Step 23194: {'lr': 0.0004751266349741053, 'samples': 4453248, 'steps': 23193, 'loss/train': 1.708428144454956} -08/30/2021 17:21:32 - INFO - __main__ - Step 23195: {'lr': 0.0004751243273255794, 'samples': 4453440, 'steps': 23194, 'loss/train': 0.8694499731063843} -08/30/2021 17:21:33 - INFO - __main__ - Step 23196: {'lr': 0.000475122019575616, 'samples': 4453632, 'steps': 23195, 'loss/train': 2.340193510055542} -08/30/2021 17:21:33 - INFO - __main__ - Step 23197: {'lr': 0.0004751197117242161, 'samples': 4453824, 'steps': 23196, 'loss/train': 1.6779906749725342} -08/30/2021 17:21:33 - INFO - __main__ - Step 23198: {'lr': 0.0004751174037713807, 'samples': 4454016, 'steps': 23197, 'loss/train': 1.6135693788528442} -08/30/2021 17:21:35 - INFO - __main__ - Step 23199: {'lr': 0.00047511509571711085, 'samples': 4454208, 'steps': 23198, 'loss/train': 1.5950708389282227} -08/30/2021 17:21:36 - INFO - __main__ - Step 23200: {'lr': 0.00047511278756140766, 'samples': 4454400, 'steps': 23199, 'loss/train': 1.4282525777816772} -08/30/2021 17:21:36 - INFO - __main__ - Step 23201: {'lr': 0.00047511047930427216, 'samples': 4454592, 'steps': 23200, 'loss/train': 1.557000994682312} -08/30/2021 17:21:36 - INFO - __main__ - Step 23202: {'lr': 0.00047510817094570526, 'samples': 4454784, 'steps': 23201, 'loss/train': 1.6131747961044312} -08/30/2021 17:21:37 - INFO - __main__ - Step 23203: {'lr': 0.00047510586248570815, 'samples': 4454976, 'steps': 23202, 'loss/train': 0.7795226573944092} -08/30/2021 17:21:38 - INFO - __main__ - Step 23204: {'lr': 0.00047510355392428176, 'samples': 4455168, 'steps': 23203, 'loss/train': 1.7070263624191284} -08/30/2021 17:21:39 - INFO - __main__ - Step 23205: {'lr': 0.00047510124526142723, 'samples': 4455360, 'steps': 23204, 'loss/train': 1.9022858142852783} -08/30/2021 17:21:39 - INFO - __main__ - Step 23206: {'lr': 0.00047509893649714554, 'samples': 4455552, 'steps': 23205, 'loss/train': 1.6807376146316528} -08/30/2021 17:21:39 - INFO - __main__ - Step 23207: {'lr': 0.00047509662763143775, 'samples': 4455744, 'steps': 23206, 'loss/train': 1.791644811630249} -08/30/2021 17:21:40 - INFO - __main__ - Step 23208: {'lr': 0.00047509431866430487, 'samples': 4455936, 'steps': 23207, 'loss/train': 1.6276882886886597} -08/30/2021 17:21:40 - INFO - __main__ - Step 23209: {'lr': 0.000475092009595748, 'samples': 4456128, 'steps': 23208, 'loss/train': 1.7554091215133667} -08/30/2021 17:21:41 - INFO - __main__ - Step 23210: {'lr': 0.0004750897004257681, 'samples': 4456320, 'steps': 23209, 'loss/train': 1.5933202505111694} -08/30/2021 17:21:42 - INFO - __main__ - Step 23211: {'lr': 0.0004750873911543663, 'samples': 4456512, 'steps': 23210, 'loss/train': 1.8493651151657104} -08/30/2021 17:21:42 - INFO - __main__ - Step 23212: {'lr': 0.00047508508178154354, 'samples': 4456704, 'steps': 23211, 'loss/train': 1.3049308061599731} -08/30/2021 17:21:43 - INFO - __main__ - Step 23213: {'lr': 0.00047508277230730095, 'samples': 4456896, 'steps': 23212, 'loss/train': 1.920776605606079} -08/30/2021 17:21:43 - INFO - __main__ - Step 23214: {'lr': 0.00047508046273163953, 'samples': 4457088, 'steps': 23213, 'loss/train': 1.2272385358810425} -08/30/2021 17:21:44 - INFO - __main__ - Step 23215: {'lr': 0.0004750781530545603, 'samples': 4457280, 'steps': 23214, 'loss/train': 1.6449463367462158} -08/30/2021 17:21:45 - INFO - __main__ - Step 23216: {'lr': 0.0004750758432760644, 'samples': 4457472, 'steps': 23215, 'loss/train': 1.731659173965454} -08/30/2021 17:21:45 - INFO - __main__ - Step 23217: {'lr': 0.0004750735333961527, 'samples': 4457664, 'steps': 23216, 'loss/train': 1.3513771295547485} -08/30/2021 17:21:45 - INFO - __main__ - Step 23218: {'lr': 0.00047507122341482644, 'samples': 4457856, 'steps': 23217, 'loss/train': 1.6106244325637817} -08/30/2021 17:21:46 - INFO - __main__ - Step 23219: {'lr': 0.00047506891333208654, 'samples': 4458048, 'steps': 23218, 'loss/train': 1.494199275970459} -08/30/2021 17:21:47 - INFO - __main__ - Step 23220: {'lr': 0.000475066603147934, 'samples': 4458240, 'steps': 23219, 'loss/train': 1.7515572309494019} -08/30/2021 17:21:48 - INFO - __main__ - Step 23221: {'lr': 0.00047506429286236997, 'samples': 4458432, 'steps': 23220, 'loss/train': 1.638920545578003} -08/30/2021 17:21:48 - INFO - __main__ - Step 23222: {'lr': 0.00047506198247539546, 'samples': 4458624, 'steps': 23221, 'loss/train': 1.7657824754714966} -08/30/2021 17:21:48 - INFO - __main__ - Step 23223: {'lr': 0.0004750596719870114, 'samples': 4458816, 'steps': 23222, 'loss/train': 1.6600230932235718} -08/30/2021 17:21:49 - INFO - __main__ - Step 23224: {'lr': 0.000475057361397219, 'samples': 4459008, 'steps': 23223, 'loss/train': 1.6566829681396484} -08/30/2021 17:21:50 - INFO - __main__ - Step 23225: {'lr': 0.0004750550507060192, 'samples': 4459200, 'steps': 23224, 'loss/train': 1.5358529090881348} -08/30/2021 17:21:51 - INFO - __main__ - Step 23226: {'lr': 0.0004750527399134131, 'samples': 4459392, 'steps': 23225, 'loss/train': 1.396316647529602} -08/30/2021 17:21:51 - INFO - __main__ - Step 23227: {'lr': 0.00047505042901940163, 'samples': 4459584, 'steps': 23226, 'loss/train': 1.651220679283142} -08/30/2021 17:21:51 - INFO - __main__ - Step 23228: {'lr': 0.00047504811802398603, 'samples': 4459776, 'steps': 23227, 'loss/train': 1.394845962524414} -08/30/2021 17:21:52 - INFO - __main__ - Step 23229: {'lr': 0.0004750458069271671, 'samples': 4459968, 'steps': 23228, 'loss/train': 0.3783375918865204} -08/30/2021 17:21:54 - INFO - __main__ - Step 23230: {'lr': 0.0004750434957289461, 'samples': 4460160, 'steps': 23229, 'loss/train': 1.5883769989013672} -08/30/2021 17:21:54 - INFO - __main__ - Step 23231: {'lr': 0.0004750411844293239, 'samples': 4460352, 'steps': 23230, 'loss/train': 1.9355220794677734} -08/30/2021 17:21:54 - INFO - __main__ - Step 23232: {'lr': 0.0004750388730283016, 'samples': 4460544, 'steps': 23231, 'loss/train': 1.310945749282837} -08/30/2021 17:21:55 - INFO - __main__ - Step 23233: {'lr': 0.0004750365615258804, 'samples': 4460736, 'steps': 23232, 'loss/train': 1.852506160736084} -08/30/2021 17:21:55 - INFO - __main__ - Step 23234: {'lr': 0.00047503424992206107, 'samples': 4460928, 'steps': 23233, 'loss/train': 1.3770300149917603} -08/30/2021 17:21:57 - INFO - __main__ - Step 23235: {'lr': 0.00047503193821684476, 'samples': 4461120, 'steps': 23234, 'loss/train': 1.3650484085083008} -08/30/2021 17:21:57 - INFO - __main__ - Step 23236: {'lr': 0.0004750296264102326, 'samples': 4461312, 'steps': 23235, 'loss/train': 1.575400710105896} -08/30/2021 17:21:57 - INFO - __main__ - Step 23237: {'lr': 0.0004750273145022256, 'samples': 4461504, 'steps': 23236, 'loss/train': 1.0140916109085083} -08/30/2021 17:21:58 - INFO - __main__ - Step 23238: {'lr': 0.00047502500249282464, 'samples': 4461696, 'steps': 23237, 'loss/train': 2.0177133083343506} -08/30/2021 17:21:58 - INFO - __main__ - Step 23239: {'lr': 0.000475022690382031, 'samples': 4461888, 'steps': 23238, 'loss/train': 1.9535596370697021} -08/30/2021 17:22:00 - INFO - __main__ - Step 23240: {'lr': 0.0004750203781698456, 'samples': 4462080, 'steps': 23239, 'loss/train': 1.9856034517288208} -08/30/2021 17:22:00 - INFO - __main__ - Step 23241: {'lr': 0.0004750180658562694, 'samples': 4462272, 'steps': 23240, 'loss/train': 0.20193614065647125} -08/30/2021 17:22:00 - INFO - __main__ - Step 23242: {'lr': 0.00047501575344130356, 'samples': 4462464, 'steps': 23241, 'loss/train': 1.469152808189392} -08/30/2021 17:22:01 - INFO - __main__ - Step 23243: {'lr': 0.00047501344092494915, 'samples': 4462656, 'steps': 23242, 'loss/train': 1.6817524433135986} -08/30/2021 17:22:01 - INFO - __main__ - Step 23244: {'lr': 0.0004750111283072071, 'samples': 4462848, 'steps': 23243, 'loss/train': 1.05733323097229} -08/30/2021 17:22:03 - INFO - __main__ - Step 23245: {'lr': 0.00047500881558807854, 'samples': 4463040, 'steps': 23244, 'loss/train': 1.526496410369873} -08/30/2021 17:22:04 - INFO - __main__ - Step 23246: {'lr': 0.00047500650276756455, 'samples': 4463232, 'steps': 23245, 'loss/train': 1.9825046062469482} -08/30/2021 17:22:04 - INFO - __main__ - Step 23247: {'lr': 0.00047500418984566594, 'samples': 4463424, 'steps': 23246, 'loss/train': 2.217878818511963} -08/30/2021 17:22:04 - INFO - __main__ - Step 23248: {'lr': 0.000475001876822384, 'samples': 4463616, 'steps': 23247, 'loss/train': 1.6152948141098022} -08/30/2021 17:22:05 - INFO - __main__ - Step 23249: {'lr': 0.00047499956369771967, 'samples': 4463808, 'steps': 23248, 'loss/train': 0.9902798533439636} -08/30/2021 17:22:05 - INFO - __main__ - Step 23250: {'lr': 0.00047499725047167406, 'samples': 4464000, 'steps': 23249, 'loss/train': 1.7276273965835571} -08/30/2021 17:22:05 - INFO - __main__ - Step 23251: {'lr': 0.0004749949371442481, 'samples': 4464192, 'steps': 23250, 'loss/train': 1.323229193687439} -08/30/2021 17:22:07 - INFO - __main__ - Step 23252: {'lr': 0.00047499262371544294, 'samples': 4464384, 'steps': 23251, 'loss/train': 2.0143301486968994} -08/30/2021 17:22:07 - INFO - __main__ - Step 23253: {'lr': 0.00047499031018525953, 'samples': 4464576, 'steps': 23252, 'loss/train': 1.3034156560897827} -08/30/2021 17:22:08 - INFO - __main__ - Step 23254: {'lr': 0.00047498799655369895, 'samples': 4464768, 'steps': 23253, 'loss/train': 1.3375436067581177} -08/30/2021 17:22:08 - INFO - __main__ - Step 23255: {'lr': 0.0004749856828207623, 'samples': 4464960, 'steps': 23254, 'loss/train': 2.0281713008880615} -08/30/2021 17:22:08 - INFO - __main__ - Step 23256: {'lr': 0.00047498336898645055, 'samples': 4465152, 'steps': 23255, 'loss/train': 1.6792418956756592} -08/30/2021 17:22:10 - INFO - __main__ - Step 23257: {'lr': 0.00047498105505076475, 'samples': 4465344, 'steps': 23256, 'loss/train': 0.7893033027648926} -08/30/2021 17:22:10 - INFO - __main__ - Step 23258: {'lr': 0.000474978741013706, 'samples': 4465536, 'steps': 23257, 'loss/train': 1.6571929454803467} -08/30/2021 17:22:11 - INFO - __main__ - Step 23259: {'lr': 0.0004749764268752753, 'samples': 4465728, 'steps': 23258, 'loss/train': 1.4134469032287598} -08/30/2021 17:22:11 - INFO - __main__ - Step 23260: {'lr': 0.0004749741126354736, 'samples': 4465920, 'steps': 23259, 'loss/train': 1.9693456888198853} -08/30/2021 17:22:11 - INFO - __main__ - Step 23261: {'lr': 0.00047497179829430217, 'samples': 4466112, 'steps': 23260, 'loss/train': 1.663743495941162} -08/30/2021 17:22:13 - INFO - __main__ - Step 23262: {'lr': 0.0004749694838517619, 'samples': 4466304, 'steps': 23261, 'loss/train': 1.4114000797271729} -08/30/2021 17:22:14 - INFO - __main__ - Step 23263: {'lr': 0.0004749671693078538, 'samples': 4466496, 'steps': 23262, 'loss/train': 1.3881969451904297} -08/30/2021 17:22:14 - INFO - __main__ - Step 23264: {'lr': 0.00047496485466257896, 'samples': 4466688, 'steps': 23263, 'loss/train': 0.1113017275929451} -08/30/2021 17:22:14 - INFO - __main__ - Step 23265: {'lr': 0.0004749625399159384, 'samples': 4466880, 'steps': 23264, 'loss/train': 1.3417302370071411} -08/30/2021 17:22:15 - INFO - __main__ - Step 23266: {'lr': 0.0004749602250679332, 'samples': 4467072, 'steps': 23265, 'loss/train': 0.23997275531291962} -08/30/2021 17:22:16 - INFO - __main__ - Step 23267: {'lr': 0.00047495791011856447, 'samples': 4467264, 'steps': 23266, 'loss/train': 0.29367148876190186} -08/30/2021 17:22:17 - INFO - __main__ - Step 23268: {'lr': 0.00047495559506783317, 'samples': 4467456, 'steps': 23267, 'loss/train': 1.3928866386413574} -08/30/2021 17:22:17 - INFO - __main__ - Step 23269: {'lr': 0.00047495327991574034, 'samples': 4467648, 'steps': 23268, 'loss/train': 1.7561638355255127} -08/30/2021 17:22:17 - INFO - __main__ - Step 23270: {'lr': 0.0004749509646622869, 'samples': 4467840, 'steps': 23269, 'loss/train': 1.2333191633224487} -08/30/2021 17:22:18 - INFO - __main__ - Step 23271: {'lr': 0.00047494864930747415, 'samples': 4468032, 'steps': 23270, 'loss/train': 1.8547008037567139} -08/30/2021 17:22:19 - INFO - __main__ - Step 23272: {'lr': 0.000474946333851303, 'samples': 4468224, 'steps': 23271, 'loss/train': 0.4618629515171051} -08/30/2021 17:22:20 - INFO - __main__ - Step 23273: {'lr': 0.0004749440182937745, 'samples': 4468416, 'steps': 23272, 'loss/train': 1.3728739023208618} -08/30/2021 17:22:20 - INFO - __main__ - Step 23274: {'lr': 0.0004749417026348897, 'samples': 4468608, 'steps': 23273, 'loss/train': 2.0360350608825684} -08/30/2021 17:22:20 - INFO - __main__ - Step 23275: {'lr': 0.0004749393868746497, 'samples': 4468800, 'steps': 23274, 'loss/train': 1.6930845975875854} -08/30/2021 17:22:21 - INFO - __main__ - Step 23276: {'lr': 0.0004749370710130554, 'samples': 4468992, 'steps': 23275, 'loss/train': 0.9200928211212158} -08/30/2021 17:22:22 - INFO - __main__ - Step 23277: {'lr': 0.00047493475505010793, 'samples': 4469184, 'steps': 23276, 'loss/train': 1.4903265237808228} -08/30/2021 17:22:23 - INFO - __main__ - Step 23278: {'lr': 0.0004749324389858083, 'samples': 4469376, 'steps': 23277, 'loss/train': 1.6839574575424194} -08/30/2021 17:22:23 - INFO - __main__ - Step 23279: {'lr': 0.00047493012282015767, 'samples': 4469568, 'steps': 23278, 'loss/train': 1.6174678802490234} -08/30/2021 17:22:23 - INFO - __main__ - Step 23280: {'lr': 0.00047492780655315693, 'samples': 4469760, 'steps': 23279, 'loss/train': 1.8059922456741333} -08/30/2021 17:22:24 - INFO - __main__ - Step 23281: {'lr': 0.00047492549018480725, 'samples': 4469952, 'steps': 23280, 'loss/train': 1.4149961471557617} -08/30/2021 17:22:25 - INFO - __main__ - Step 23282: {'lr': 0.00047492317371510955, 'samples': 4470144, 'steps': 23281, 'loss/train': 0.8420997858047485} -08/30/2021 17:22:26 - INFO - __main__ - Step 23283: {'lr': 0.00047492085714406497, 'samples': 4470336, 'steps': 23282, 'loss/train': 1.0607054233551025} -08/30/2021 17:22:26 - INFO - __main__ - Step 23284: {'lr': 0.00047491854047167453, 'samples': 4470528, 'steps': 23283, 'loss/train': 1.798923373222351} -08/30/2021 17:22:27 - INFO - __main__ - Step 23285: {'lr': 0.0004749162236979393, 'samples': 4470720, 'steps': 23284, 'loss/train': 1.8167866468429565} -08/30/2021 17:22:27 - INFO - __main__ - Step 23286: {'lr': 0.0004749139068228602, 'samples': 4470912, 'steps': 23285, 'loss/train': 1.3599193096160889} -08/30/2021 17:22:27 - INFO - __main__ - Step 23287: {'lr': 0.00047491158984643846, 'samples': 4471104, 'steps': 23286, 'loss/train': 2.153561592102051} -08/30/2021 17:22:30 - INFO - __main__ - Step 23288: {'lr': 0.0004749092727686749, 'samples': 4471296, 'steps': 23287, 'loss/train': 1.4420368671417236} -08/30/2021 17:22:30 - INFO - __main__ - Step 23289: {'lr': 0.00047490695558957083, 'samples': 4471488, 'steps': 23288, 'loss/train': 1.1183713674545288} -08/30/2021 17:22:31 - INFO - __main__ - Step 23290: {'lr': 0.00047490463830912713, 'samples': 4471680, 'steps': 23289, 'loss/train': 2.230461359024048} -08/30/2021 17:22:31 - INFO - __main__ - Step 23291: {'lr': 0.0004749023209273448, 'samples': 4471872, 'steps': 23290, 'loss/train': 2.1331839561462402} -08/30/2021 17:22:31 - INFO - __main__ - Step 23292: {'lr': 0.000474900003444225, 'samples': 4472064, 'steps': 23291, 'loss/train': 1.9077094793319702} -08/30/2021 17:22:33 - INFO - __main__ - Step 23293: {'lr': 0.0004748976858597687, 'samples': 4472256, 'steps': 23292, 'loss/train': 1.3912080526351929} -08/30/2021 17:22:33 - INFO - __main__ - Step 23294: {'lr': 0.00047489536817397706, 'samples': 4472448, 'steps': 23293, 'loss/train': 1.8662384748458862} -08/30/2021 17:22:34 - INFO - __main__ - Step 23295: {'lr': 0.00047489305038685094, 'samples': 4472640, 'steps': 23294, 'loss/train': 1.615684986114502} -08/30/2021 17:22:34 - INFO - __main__ - Step 23296: {'lr': 0.00047489073249839153, 'samples': 4472832, 'steps': 23295, 'loss/train': 1.5429795980453491} -08/30/2021 17:22:34 - INFO - __main__ - Step 23297: {'lr': 0.0004748884145085998, 'samples': 4473024, 'steps': 23296, 'loss/train': 1.2033603191375732} -08/30/2021 17:22:35 - INFO - __main__ - Step 23298: {'lr': 0.0004748860964174768, 'samples': 4473216, 'steps': 23297, 'loss/train': 1.162532925605774} -08/30/2021 17:22:36 - INFO - __main__ - Step 23299: {'lr': 0.00047488377822502365, 'samples': 4473408, 'steps': 23298, 'loss/train': 1.6472742557525635} -08/30/2021 17:22:37 - INFO - __main__ - Step 23300: {'lr': 0.00047488145993124134, 'samples': 4473600, 'steps': 23299, 'loss/train': 1.606379747390747} -08/30/2021 17:22:37 - INFO - __main__ - Step 23301: {'lr': 0.0004748791415361309, 'samples': 4473792, 'steps': 23300, 'loss/train': 1.5527448654174805} -08/30/2021 17:22:37 - INFO - __main__ - Step 23302: {'lr': 0.00047487682303969336, 'samples': 4473984, 'steps': 23301, 'loss/train': 1.3916690349578857} -08/30/2021 17:22:38 - INFO - __main__ - Step 23303: {'lr': 0.0004748745044419298, 'samples': 4474176, 'steps': 23302, 'loss/train': 0.8504519462585449} -08/30/2021 17:22:39 - INFO - __main__ - Step 23304: {'lr': 0.0004748721857428413, 'samples': 4474368, 'steps': 23303, 'loss/train': 2.007427215576172} -08/30/2021 17:22:40 - INFO - __main__ - Step 23305: {'lr': 0.00047486986694242887, 'samples': 4474560, 'steps': 23304, 'loss/train': 2.2359650135040283} -08/30/2021 17:22:40 - INFO - __main__ - Step 23306: {'lr': 0.0004748675480406934, 'samples': 4474752, 'steps': 23305, 'loss/train': 1.6426920890808105} -08/30/2021 17:22:40 - INFO - __main__ - Step 23307: {'lr': 0.0004748652290376363, 'samples': 4474944, 'steps': 23306, 'loss/train': 1.280753493309021} -08/30/2021 17:22:41 - INFO - __main__ - Step 23308: {'lr': 0.00047486290993325824, 'samples': 4475136, 'steps': 23307, 'loss/train': 1.0288336277008057} -08/30/2021 17:22:41 - INFO - __main__ - Step 23309: {'lr': 0.00047486059072756047, 'samples': 4475328, 'steps': 23308, 'loss/train': 1.8509293794631958} -08/30/2021 17:22:43 - INFO - __main__ - Step 23310: {'lr': 0.00047485827142054407, 'samples': 4475520, 'steps': 23309, 'loss/train': 1.7704225778579712} -08/30/2021 17:22:43 - INFO - __main__ - Step 23311: {'lr': 0.0004748559520122099, 'samples': 4475712, 'steps': 23310, 'loss/train': 1.6992249488830566} -08/30/2021 17:22:44 - INFO - __main__ - Step 23312: {'lr': 0.0004748536325025591, 'samples': 4475904, 'steps': 23311, 'loss/train': 1.788007378578186} -08/30/2021 17:22:44 - INFO - __main__ - Step 23313: {'lr': 0.0004748513128915928, 'samples': 4476096, 'steps': 23312, 'loss/train': 1.953972339630127} -08/30/2021 17:22:44 - INFO - __main__ - Step 23314: {'lr': 0.0004748489931793119, 'samples': 4476288, 'steps': 23313, 'loss/train': 1.7730237245559692} -08/30/2021 17:22:46 - INFO - __main__ - Step 23315: {'lr': 0.00047484667336571753, 'samples': 4476480, 'steps': 23314, 'loss/train': 1.0370426177978516} -08/30/2021 17:22:46 - INFO - __main__ - Step 23316: {'lr': 0.0004748443534508107, 'samples': 4476672, 'steps': 23315, 'loss/train': 2.3911044597625732} -08/30/2021 17:22:46 - INFO - __main__ - Step 23317: {'lr': 0.00047484203343459256, 'samples': 4476864, 'steps': 23316, 'loss/train': 1.7602030038833618} -08/30/2021 17:22:47 - INFO - __main__ - Step 23318: {'lr': 0.000474839713317064, 'samples': 4477056, 'steps': 23317, 'loss/train': 1.7041176557540894} -08/30/2021 17:22:47 - INFO - __main__ - Step 23319: {'lr': 0.00047483739309822615, 'samples': 4477248, 'steps': 23318, 'loss/train': 1.4947415590286255} -08/30/2021 17:22:49 - INFO - __main__ - Step 23320: {'lr': 0.00047483507277808, 'samples': 4477440, 'steps': 23319, 'loss/train': 1.7281042337417603} -08/30/2021 17:22:49 - INFO - __main__ - Step 23321: {'lr': 0.0004748327523566267, 'samples': 4477632, 'steps': 23320, 'loss/train': 1.1908296346664429} -08/30/2021 17:22:49 - INFO - __main__ - Step 23322: {'lr': 0.0004748304318338672, 'samples': 4477824, 'steps': 23321, 'loss/train': 0.6295861005783081} -08/30/2021 17:22:50 - INFO - __main__ - Step 23323: {'lr': 0.00047482811120980254, 'samples': 4478016, 'steps': 23322, 'loss/train': 1.4904004335403442} -08/30/2021 17:22:50 - INFO - __main__ - Step 23324: {'lr': 0.0004748257904844339, 'samples': 4478208, 'steps': 23323, 'loss/train': 0.9871253967285156} -08/30/2021 17:22:52 - INFO - __main__ - Step 23325: {'lr': 0.00047482346965776215, 'samples': 4478400, 'steps': 23324, 'loss/train': 1.551640510559082} -08/30/2021 17:22:52 - INFO - __main__ - Step 23326: {'lr': 0.0004748211487297884, 'samples': 4478592, 'steps': 23325, 'loss/train': 1.6661995649337769} -08/30/2021 17:22:52 - INFO - __main__ - Step 23327: {'lr': 0.00047481882770051377, 'samples': 4478784, 'steps': 23326, 'loss/train': 1.2789151668548584} -08/30/2021 17:22:53 - INFO - __main__ - Step 23328: {'lr': 0.00047481650656993924, 'samples': 4478976, 'steps': 23327, 'loss/train': 1.8919947147369385} -08/30/2021 17:22:53 - INFO - __main__ - Step 23329: {'lr': 0.00047481418533806586, 'samples': 4479168, 'steps': 23328, 'loss/train': 1.881327748298645} -08/30/2021 17:22:55 - INFO - __main__ - Step 23330: {'lr': 0.0004748118640048946, 'samples': 4479360, 'steps': 23329, 'loss/train': 1.0059058666229248} -08/30/2021 17:22:55 - INFO - __main__ - Step 23331: {'lr': 0.00047480954257042666, 'samples': 4479552, 'steps': 23330, 'loss/train': 1.5549612045288086} -08/30/2021 17:22:55 - INFO - __main__ - Step 23332: {'lr': 0.000474807221034663, 'samples': 4479744, 'steps': 23331, 'loss/train': 1.6566517353057861} -08/30/2021 17:22:56 - INFO - __main__ - Step 23333: {'lr': 0.0004748048993976046, 'samples': 4479936, 'steps': 23332, 'loss/train': 1.3243255615234375} -08/30/2021 17:22:56 - INFO - __main__ - Step 23334: {'lr': 0.0004748025776592527, 'samples': 4480128, 'steps': 23333, 'loss/train': 1.6638424396514893} -08/30/2021 17:22:58 - INFO - __main__ - Step 23335: {'lr': 0.00047480025581960817, 'samples': 4480320, 'steps': 23334, 'loss/train': 1.2825798988342285} -08/30/2021 17:22:58 - INFO - __main__ - Step 23336: {'lr': 0.0004747979338786721, 'samples': 4480512, 'steps': 23335, 'loss/train': 1.877795934677124} -08/30/2021 17:22:58 - INFO - __main__ - Step 23337: {'lr': 0.00047479561183644557, 'samples': 4480704, 'steps': 23336, 'loss/train': 1.6736769676208496} -08/30/2021 17:22:59 - INFO - __main__ - Step 23338: {'lr': 0.00047479328969292963, 'samples': 4480896, 'steps': 23337, 'loss/train': 1.8154802322387695} -08/30/2021 17:22:59 - INFO - __main__ - Step 23339: {'lr': 0.0004747909674481253, 'samples': 4481088, 'steps': 23338, 'loss/train': 1.9429608583450317} -08/30/2021 17:23:01 - INFO - __main__ - Step 23340: {'lr': 0.00047478864510203355, 'samples': 4481280, 'steps': 23339, 'loss/train': 1.302916169166565} -08/30/2021 17:23:01 - INFO - __main__ - Step 23341: {'lr': 0.0004747863226546556, 'samples': 4481472, 'steps': 23340, 'loss/train': 1.8804534673690796} -08/30/2021 17:23:02 - INFO - __main__ - Step 23342: {'lr': 0.0004747840001059923, 'samples': 4481664, 'steps': 23341, 'loss/train': 1.4982608556747437} -08/30/2021 17:23:02 - INFO - __main__ - Step 23343: {'lr': 0.00047478167745604495, 'samples': 4481856, 'steps': 23342, 'loss/train': 0.9054900407791138} -08/30/2021 17:23:02 - INFO - __main__ - Step 23344: {'lr': 0.00047477935470481434, 'samples': 4482048, 'steps': 23343, 'loss/train': 1.4744951725006104} -08/30/2021 17:23:04 - INFO - __main__ - Step 23345: {'lr': 0.00047477703185230157, 'samples': 4482240, 'steps': 23344, 'loss/train': 1.1306208372116089} -08/30/2021 17:23:04 - INFO - __main__ - Step 23346: {'lr': 0.00047477470889850784, 'samples': 4482432, 'steps': 23345, 'loss/train': 1.7451003789901733} -08/30/2021 17:23:05 - INFO - __main__ - Step 23347: {'lr': 0.00047477238584343407, 'samples': 4482624, 'steps': 23346, 'loss/train': 1.4920345544815063} -08/30/2021 17:23:05 - INFO - __main__ - Step 23348: {'lr': 0.00047477006268708134, 'samples': 4482816, 'steps': 23347, 'loss/train': 1.6318023204803467} -08/30/2021 17:23:05 - INFO - __main__ - Step 23349: {'lr': 0.00047476773942945063, 'samples': 4483008, 'steps': 23348, 'loss/train': 1.410489559173584} -08/30/2021 17:23:06 - INFO - __main__ - Step 23350: {'lr': 0.00047476541607054313, 'samples': 4483200, 'steps': 23349, 'loss/train': 1.4952244758605957} -08/30/2021 17:23:07 - INFO - __main__ - Step 23351: {'lr': 0.0004747630926103597, 'samples': 4483392, 'steps': 23350, 'loss/train': 1.6330492496490479} -08/30/2021 17:23:08 - INFO - __main__ - Step 23352: {'lr': 0.0004747607690489015, 'samples': 4483584, 'steps': 23351, 'loss/train': 1.2275327444076538} -08/30/2021 17:23:08 - INFO - __main__ - Step 23353: {'lr': 0.00047475844538616966, 'samples': 4483776, 'steps': 23352, 'loss/train': 1.9747304916381836} -08/30/2021 17:23:08 - INFO - __main__ - Step 23354: {'lr': 0.0004747561216221651, 'samples': 4483968, 'steps': 23353, 'loss/train': 1.918383240699768} -08/30/2021 17:23:09 - INFO - __main__ - Step 23355: {'lr': 0.0004747537977568889, 'samples': 4484160, 'steps': 23354, 'loss/train': 0.5475494265556335} -08/30/2021 17:23:11 - INFO - __main__ - Step 23356: {'lr': 0.00047475147379034206, 'samples': 4484352, 'steps': 23355, 'loss/train': 1.4513154029846191} -08/30/2021 17:23:11 - INFO - __main__ - Step 23357: {'lr': 0.0004747491497225257, 'samples': 4484544, 'steps': 23356, 'loss/train': 1.5879918336868286} -08/30/2021 17:23:12 - INFO - __main__ - Step 23358: {'lr': 0.00047474682555344083, 'samples': 4484736, 'steps': 23357, 'loss/train': 1.2888751029968262} -08/30/2021 17:23:12 - INFO - __main__ - Step 23359: {'lr': 0.00047474450128308853, 'samples': 4484928, 'steps': 23358, 'loss/train': 1.9676098823547363} -08/30/2021 17:23:13 - INFO - __main__ - Step 23360: {'lr': 0.0004747421769114698, 'samples': 4485120, 'steps': 23359, 'loss/train': 2.159215211868286} -08/30/2021 17:23:13 - INFO - __main__ - Step 23361: {'lr': 0.00047473985243858577, 'samples': 4485312, 'steps': 23360, 'loss/train': 1.4242740869522095} -08/30/2021 17:23:13 - INFO - __main__ - Step 23362: {'lr': 0.00047473752786443736, 'samples': 4485504, 'steps': 23361, 'loss/train': 1.536911129951477} -08/30/2021 17:23:15 - INFO - __main__ - Step 23363: {'lr': 0.0004747352031890257, 'samples': 4485696, 'steps': 23362, 'loss/train': 1.0240377187728882} -08/30/2021 17:23:15 - INFO - __main__ - Step 23364: {'lr': 0.0004747328784123519, 'samples': 4485888, 'steps': 23363, 'loss/train': 1.4924437999725342} -08/30/2021 17:23:16 - INFO - __main__ - Step 23365: {'lr': 0.00047473055353441685, 'samples': 4486080, 'steps': 23364, 'loss/train': 1.7939375638961792} -08/30/2021 17:23:16 - INFO - __main__ - Step 23366: {'lr': 0.0004747282285552217, 'samples': 4486272, 'steps': 23365, 'loss/train': 2.470353841781616} -08/30/2021 17:23:16 - INFO - __main__ - Step 23367: {'lr': 0.0004747259034747675, 'samples': 4486464, 'steps': 23366, 'loss/train': 2.460697889328003} -08/30/2021 17:23:18 - INFO - __main__ - Step 23368: {'lr': 0.00047472357829305524, 'samples': 4486656, 'steps': 23367, 'loss/train': 1.9643207788467407} -08/30/2021 17:23:18 - INFO - __main__ - Step 23369: {'lr': 0.0004747212530100861, 'samples': 4486848, 'steps': 23368, 'loss/train': 1.8857786655426025} -08/30/2021 17:23:19 - INFO - __main__ - Step 23370: {'lr': 0.0004747189276258609, 'samples': 4487040, 'steps': 23369, 'loss/train': 1.8279653787612915} -08/30/2021 17:23:19 - INFO - __main__ - Step 23371: {'lr': 0.0004747166021403809, 'samples': 4487232, 'steps': 23370, 'loss/train': 1.2541252374649048} -08/30/2021 17:23:19 - INFO - __main__ - Step 23372: {'lr': 0.000474714276553647, 'samples': 4487424, 'steps': 23371, 'loss/train': 1.3642388582229614} -08/30/2021 17:23:20 - INFO - __main__ - Step 23373: {'lr': 0.00047471195086566035, 'samples': 4487616, 'steps': 23372, 'loss/train': 1.1675230264663696} -08/30/2021 17:23:21 - INFO - __main__ - Step 23374: {'lr': 0.000474709625076422, 'samples': 4487808, 'steps': 23373, 'loss/train': 1.4698249101638794} -08/30/2021 17:23:22 - INFO - __main__ - Step 23375: {'lr': 0.0004747072991859329, 'samples': 4488000, 'steps': 23374, 'loss/train': 1.673593282699585} -08/30/2021 17:23:22 - INFO - __main__ - Step 23376: {'lr': 0.0004747049731941942, 'samples': 4488192, 'steps': 23375, 'loss/train': 1.6737829446792603} -08/30/2021 17:23:23 - INFO - __main__ - Step 23377: {'lr': 0.0004747026471012069, 'samples': 4488384, 'steps': 23376, 'loss/train': 1.8373947143554688} -08/30/2021 17:23:23 - INFO - __main__ - Step 23378: {'lr': 0.000474700320906972, 'samples': 4488576, 'steps': 23377, 'loss/train': 0.3915119171142578} -08/30/2021 17:23:25 - INFO - __main__ - Step 23379: {'lr': 0.0004746979946114907, 'samples': 4488768, 'steps': 23378, 'loss/train': 0.2655538320541382} -08/30/2021 17:23:25 - INFO - __main__ - Step 23380: {'lr': 0.000474695668214764, 'samples': 4488960, 'steps': 23379, 'loss/train': 2.253612995147705} -08/30/2021 17:23:25 - INFO - __main__ - Step 23381: {'lr': 0.00047469334171679266, 'samples': 4489152, 'steps': 23380, 'loss/train': 2.6099472045898438} -08/30/2021 17:23:26 - INFO - __main__ - Step 23382: {'lr': 0.00047469101511757815, 'samples': 4489344, 'steps': 23381, 'loss/train': 1.9087992906570435} -08/30/2021 17:23:26 - INFO - __main__ - Step 23383: {'lr': 0.00047468868841712134, 'samples': 4489536, 'steps': 23382, 'loss/train': 1.361952543258667} -08/30/2021 17:23:28 - INFO - __main__ - Step 23384: {'lr': 0.00047468636161542325, 'samples': 4489728, 'steps': 23383, 'loss/train': 1.7354804277420044} -08/30/2021 17:23:28 - INFO - __main__ - Step 23385: {'lr': 0.0004746840347124849, 'samples': 4489920, 'steps': 23384, 'loss/train': 1.5653932094573975} -08/30/2021 17:23:28 - INFO - __main__ - Step 23386: {'lr': 0.0004746817077083074, 'samples': 4490112, 'steps': 23385, 'loss/train': 2.235689163208008} -08/30/2021 17:23:29 - INFO - __main__ - Step 23387: {'lr': 0.00047467938060289185, 'samples': 4490304, 'steps': 23386, 'loss/train': 1.6533534526824951} -08/30/2021 17:23:29 - INFO - __main__ - Step 23388: {'lr': 0.0004746770533962391, 'samples': 4490496, 'steps': 23387, 'loss/train': 1.812745213508606} -08/30/2021 17:23:29 - INFO - __main__ - Step 23389: {'lr': 0.0004746747260883505, 'samples': 4490688, 'steps': 23388, 'loss/train': 1.734961748123169} -08/30/2021 17:23:31 - INFO - __main__ - Step 23390: {'lr': 0.0004746723986792268, 'samples': 4490880, 'steps': 23389, 'loss/train': 1.3688782453536987} -08/30/2021 17:23:31 - INFO - __main__ - Step 23391: {'lr': 0.0004746700711688693, 'samples': 4491072, 'steps': 23390, 'loss/train': 1.6471861600875854} -08/30/2021 17:23:32 - INFO - __main__ - Step 23392: {'lr': 0.0004746677435572789, 'samples': 4491264, 'steps': 23391, 'loss/train': 1.8662527799606323} -08/30/2021 17:23:32 - INFO - __main__ - Step 23393: {'lr': 0.00047466541584445667, 'samples': 4491456, 'steps': 23392, 'loss/train': 1.7130470275878906} -08/30/2021 17:23:32 - INFO - __main__ - Step 23394: {'lr': 0.0004746630880304037, 'samples': 4491648, 'steps': 23393, 'loss/train': 0.8440204858779907} -08/30/2021 17:23:34 - INFO - __main__ - Step 23395: {'lr': 0.0004746607601151209, 'samples': 4491840, 'steps': 23394, 'loss/train': 1.6433444023132324} -08/30/2021 17:23:35 - INFO - __main__ - Step 23396: {'lr': 0.0004746584320986096, 'samples': 4492032, 'steps': 23395, 'loss/train': 1.9183671474456787} -08/30/2021 17:23:35 - INFO - __main__ - Step 23397: {'lr': 0.0004746561039808706, 'samples': 4492224, 'steps': 23396, 'loss/train': 1.188535451889038} -08/30/2021 17:23:35 - INFO - __main__ - Step 23398: {'lr': 0.0004746537757619049, 'samples': 4492416, 'steps': 23397, 'loss/train': 1.4544490575790405} -08/30/2021 17:23:36 - INFO - __main__ - Step 23399: {'lr': 0.00047465144744171387, 'samples': 4492608, 'steps': 23398, 'loss/train': 1.52882719039917} -08/30/2021 17:23:37 - INFO - __main__ - Step 23400: {'lr': 0.0004746491190202983, 'samples': 4492800, 'steps': 23399, 'loss/train': 1.3295679092407227} -08/30/2021 17:23:38 - INFO - __main__ - Step 23401: {'lr': 0.00047464679049765926, 'samples': 4492992, 'steps': 23400, 'loss/train': 1.7973284721374512} -08/30/2021 17:23:38 - INFO - __main__ - Step 23402: {'lr': 0.00047464446187379787, 'samples': 4493184, 'steps': 23401, 'loss/train': 1.505181074142456} -08/30/2021 17:23:39 - INFO - __main__ - Step 23403: {'lr': 0.00047464213314871514, 'samples': 4493376, 'steps': 23402, 'loss/train': 1.8122906684875488} -08/30/2021 17:23:39 - INFO - __main__ - Step 23404: {'lr': 0.0004746398043224122, 'samples': 4493568, 'steps': 23403, 'loss/train': 1.5950868129730225} -08/30/2021 17:23:41 - INFO - __main__ - Step 23405: {'lr': 0.0004746374753948899, 'samples': 4493760, 'steps': 23404, 'loss/train': 1.5152009725570679} -08/30/2021 17:23:41 - INFO - __main__ - Step 23406: {'lr': 0.00047463514636614945, 'samples': 4493952, 'steps': 23405, 'loss/train': 1.8622397184371948} -08/30/2021 17:23:42 - INFO - __main__ - Step 23407: {'lr': 0.00047463281723619203, 'samples': 4494144, 'steps': 23406, 'loss/train': 0.7602947950363159} -08/30/2021 17:23:42 - INFO - __main__ - Step 23408: {'lr': 0.00047463048800501837, 'samples': 4494336, 'steps': 23407, 'loss/train': 1.307937741279602} -08/30/2021 17:23:42 - INFO - __main__ - Step 23409: {'lr': 0.00047462815867262967, 'samples': 4494528, 'steps': 23408, 'loss/train': 2.198789358139038} -08/30/2021 17:23:44 - INFO - __main__ - Step 23410: {'lr': 0.0004746258292390271, 'samples': 4494720, 'steps': 23409, 'loss/train': 1.6767184734344482} -08/30/2021 17:23:44 - INFO - __main__ - Step 23411: {'lr': 0.00047462349970421147, 'samples': 4494912, 'steps': 23410, 'loss/train': 1.3218573331832886} -08/30/2021 17:23:45 - INFO - __main__ - Step 23412: {'lr': 0.0004746211700681841, 'samples': 4495104, 'steps': 23411, 'loss/train': 1.3264437913894653} -08/30/2021 17:23:45 - INFO - __main__ - Step 23413: {'lr': 0.0004746188403309457, 'samples': 4495296, 'steps': 23412, 'loss/train': 1.8527815341949463} -08/30/2021 17:23:45 - INFO - __main__ - Step 23414: {'lr': 0.00047461651049249764, 'samples': 4495488, 'steps': 23413, 'loss/train': 1.2875312566757202} -08/30/2021 17:23:48 - INFO - __main__ - Step 23415: {'lr': 0.0004746141805528409, 'samples': 4495680, 'steps': 23414, 'loss/train': 1.7617915868759155} -08/30/2021 17:23:48 - INFO - __main__ - Step 23416: {'lr': 0.00047461185051197644, 'samples': 4495872, 'steps': 23415, 'loss/train': 1.4624656438827515} -08/30/2021 17:23:48 - INFO - __main__ - Step 23417: {'lr': 0.0004746095203699053, 'samples': 4496064, 'steps': 23416, 'loss/train': 5.8519086837768555} -08/30/2021 17:23:49 - INFO - __main__ - Step 23418: {'lr': 0.00047460719012662857, 'samples': 4496256, 'steps': 23417, 'loss/train': 4.7854485511779785} -08/30/2021 17:23:49 - INFO - __main__ - Step 23419: {'lr': 0.00047460485978214733, 'samples': 4496448, 'steps': 23418, 'loss/train': 5.4564738273620605} -08/30/2021 17:23:49 - INFO - __main__ - Step 23420: {'lr': 0.00047460252933646265, 'samples': 4496640, 'steps': 23419, 'loss/train': 4.870734691619873} -08/30/2021 17:23:50 - INFO - __main__ - Step 23421: {'lr': 0.0004746001987895755, 'samples': 4496832, 'steps': 23420, 'loss/train': 1.6050056219100952} -08/30/2021 17:23:51 - INFO - __main__ - Step 23422: {'lr': 0.00047459786814148697, 'samples': 4497024, 'steps': 23421, 'loss/train': 1.7520097494125366} -08/30/2021 17:23:52 - INFO - __main__ - Step 23423: {'lr': 0.0004745955373921981, 'samples': 4497216, 'steps': 23422, 'loss/train': 0.8850692510604858} -08/30/2021 17:23:52 - INFO - __main__ - Step 23424: {'lr': 0.0004745932065417099, 'samples': 4497408, 'steps': 23423, 'loss/train': 1.8354878425598145} -08/30/2021 17:23:52 - INFO - __main__ - Step 23425: {'lr': 0.00047459087559002355, 'samples': 4497600, 'steps': 23424, 'loss/train': 1.7539135217666626} -08/30/2021 17:23:53 - INFO - __main__ - Step 23426: {'lr': 0.00047458854453713995, 'samples': 4497792, 'steps': 23425, 'loss/train': 1.7263280153274536} -08/30/2021 17:23:54 - INFO - __main__ - Step 23427: {'lr': 0.0004745862133830603, 'samples': 4497984, 'steps': 23426, 'loss/train': 1.466227412223816} -08/30/2021 17:23:55 - INFO - __main__ - Step 23428: {'lr': 0.00047458388212778547, 'samples': 4498176, 'steps': 23427, 'loss/train': 1.9011969566345215} -08/30/2021 17:23:55 - INFO - __main__ - Step 23429: {'lr': 0.00047458155077131664, 'samples': 4498368, 'steps': 23428, 'loss/train': 0.665778636932373} -08/30/2021 17:23:56 - INFO - __main__ - Step 23430: {'lr': 0.0004745792193136549, 'samples': 4498560, 'steps': 23429, 'loss/train': 1.4582651853561401} -08/30/2021 17:23:56 - INFO - __main__ - Step 23431: {'lr': 0.00047457688775480114, 'samples': 4498752, 'steps': 23430, 'loss/train': 2.1060478687286377} -08/30/2021 17:23:56 - INFO - __main__ - Step 23432: {'lr': 0.0004745745560947565, 'samples': 4498944, 'steps': 23431, 'loss/train': 0.9793155789375305} -08/30/2021 17:23:58 - INFO - __main__ - Step 23433: {'lr': 0.0004745722243335221, 'samples': 4499136, 'steps': 23432, 'loss/train': 1.958113670349121} -08/30/2021 17:23:59 - INFO - __main__ - Step 23434: {'lr': 0.0004745698924710988, 'samples': 4499328, 'steps': 23433, 'loss/train': 1.1268386840820312} -08/30/2021 17:23:59 - INFO - __main__ - Step 23435: {'lr': 0.00047456756050748793, 'samples': 4499520, 'steps': 23434, 'loss/train': 2.3697609901428223} -08/30/2021 17:23:59 - INFO - __main__ - Step 23436: {'lr': 0.0004745652284426903, 'samples': 4499712, 'steps': 23435, 'loss/train': 2.8915159702301025} -08/30/2021 17:24:00 - INFO - __main__ - Step 23437: {'lr': 0.00047456289627670703, 'samples': 4499904, 'steps': 23436, 'loss/train': 1.2846698760986328} -08/30/2021 17:24:01 - INFO - __main__ - Step 23438: {'lr': 0.0004745605640095392, 'samples': 4500096, 'steps': 23437, 'loss/train': 1.5122549533843994} -08/30/2021 17:24:02 - INFO - __main__ - Step 23439: {'lr': 0.00047455823164118787, 'samples': 4500288, 'steps': 23438, 'loss/train': 2.0294601917266846} -08/30/2021 17:24:02 - INFO - __main__ - Step 23440: {'lr': 0.00047455589917165406, 'samples': 4500480, 'steps': 23439, 'loss/train': 1.3264708518981934} -08/30/2021 17:24:02 - INFO - __main__ - Step 23441: {'lr': 0.00047455356660093886, 'samples': 4500672, 'steps': 23440, 'loss/train': 1.8434523344039917} -08/30/2021 17:24:03 - INFO - __main__ - Step 23442: {'lr': 0.0004745512339290432, 'samples': 4500864, 'steps': 23441, 'loss/train': 1.5019114017486572} -08/30/2021 17:24:04 - INFO - __main__ - Step 23443: {'lr': 0.00047454890115596824, 'samples': 4501056, 'steps': 23442, 'loss/train': 1.7407407760620117} -08/30/2021 17:24:05 - INFO - __main__ - Step 23444: {'lr': 0.00047454656828171504, 'samples': 4501248, 'steps': 23443, 'loss/train': 1.4007312059402466} -08/30/2021 17:24:05 - INFO - __main__ - Step 23445: {'lr': 0.0004745442353062846, 'samples': 4501440, 'steps': 23444, 'loss/train': 1.9586397409439087} -08/30/2021 17:24:05 - INFO - __main__ - Step 23446: {'lr': 0.000474541902229678, 'samples': 4501632, 'steps': 23445, 'loss/train': 0.6901741623878479} -08/30/2021 17:24:06 - INFO - __main__ - Step 23447: {'lr': 0.0004745395690518963, 'samples': 4501824, 'steps': 23446, 'loss/train': 1.9121707677841187} -08/30/2021 17:24:07 - INFO - __main__ - Step 23448: {'lr': 0.0004745372357729405, 'samples': 4502016, 'steps': 23447, 'loss/train': 1.4843432903289795} -08/30/2021 17:24:08 - INFO - __main__ - Step 23449: {'lr': 0.0004745349023928117, 'samples': 4502208, 'steps': 23448, 'loss/train': 1.4363607168197632} -08/30/2021 17:24:08 - INFO - __main__ - Step 23450: {'lr': 0.000474532568911511, 'samples': 4502400, 'steps': 23449, 'loss/train': 3.3592400550842285} -08/30/2021 17:24:09 - INFO - __main__ - Step 23451: {'lr': 0.00047453023532903927, 'samples': 4502592, 'steps': 23450, 'loss/train': 0.9863831996917725} -08/30/2021 17:24:09 - INFO - __main__ - Step 23452: {'lr': 0.00047452790164539775, 'samples': 4502784, 'steps': 23451, 'loss/train': 1.3867384195327759} -08/30/2021 17:24:09 - INFO - __main__ - Step 23453: {'lr': 0.00047452556786058744, 'samples': 4502976, 'steps': 23452, 'loss/train': 2.2206199169158936} -08/30/2021 17:24:11 - INFO - __main__ - Step 23454: {'lr': 0.0004745232339746094, 'samples': 4503168, 'steps': 23453, 'loss/train': 1.588103175163269} -08/30/2021 17:24:12 - INFO - __main__ - Step 23455: {'lr': 0.00047452089998746463, 'samples': 4503360, 'steps': 23454, 'loss/train': 1.7924898862838745} -08/30/2021 17:24:12 - INFO - __main__ - Step 23456: {'lr': 0.0004745185658991541, 'samples': 4503552, 'steps': 23455, 'loss/train': 1.5315626859664917} -08/30/2021 17:24:12 - INFO - __main__ - Step 23457: {'lr': 0.0004745162317096791, 'samples': 4503744, 'steps': 23456, 'loss/train': 1.523364782333374} -08/30/2021 17:24:13 - INFO - __main__ - Step 23458: {'lr': 0.0004745138974190405, 'samples': 4503936, 'steps': 23457, 'loss/train': 1.3494212627410889} -08/30/2021 17:24:14 - INFO - __main__ - Step 23459: {'lr': 0.0004745115630272394, 'samples': 4504128, 'steps': 23458, 'loss/train': 1.3633402585983276} -08/30/2021 17:24:15 - INFO - __main__ - Step 23460: {'lr': 0.00047450922853427686, 'samples': 4504320, 'steps': 23459, 'loss/train': 0.2803743779659271} -08/30/2021 17:24:15 - INFO - __main__ - Step 23461: {'lr': 0.0004745068939401539, 'samples': 4504512, 'steps': 23460, 'loss/train': 1.6602718830108643} -08/30/2021 17:24:16 - INFO - __main__ - Step 23462: {'lr': 0.0004745045592448717, 'samples': 4504704, 'steps': 23461, 'loss/train': 1.833642840385437} -08/30/2021 17:24:16 - INFO - __main__ - Step 23463: {'lr': 0.00047450222444843105, 'samples': 4504896, 'steps': 23462, 'loss/train': 1.7407232522964478} -08/30/2021 17:24:18 - INFO - __main__ - Step 23464: {'lr': 0.0004744998895508333, 'samples': 4505088, 'steps': 23463, 'loss/train': 1.4313862323760986} -08/30/2021 17:24:18 - INFO - __main__ - Step 23465: {'lr': 0.0004744975545520793, 'samples': 4505280, 'steps': 23464, 'loss/train': 1.3955929279327393} -08/30/2021 17:24:18 - INFO - __main__ - Step 23466: {'lr': 0.00047449521945217016, 'samples': 4505472, 'steps': 23465, 'loss/train': 0.11742239445447922} -08/30/2021 17:24:19 - INFO - __main__ - Step 23467: {'lr': 0.00047449288425110693, 'samples': 4505664, 'steps': 23466, 'loss/train': 1.964247226715088} -08/30/2021 17:24:19 - INFO - __main__ - Step 23468: {'lr': 0.00047449054894889073, 'samples': 4505856, 'steps': 23467, 'loss/train': 1.281093716621399} -08/30/2021 17:24:21 - INFO - __main__ - Step 23469: {'lr': 0.00047448821354552253, 'samples': 4506048, 'steps': 23468, 'loss/train': 1.9166456460952759} -08/30/2021 17:24:21 - INFO - __main__ - Step 23470: {'lr': 0.0004744858780410034, 'samples': 4506240, 'steps': 23469, 'loss/train': 1.4999719858169556} -08/30/2021 17:24:22 - INFO - __main__ - Step 23471: {'lr': 0.0004744835424353344, 'samples': 4506432, 'steps': 23470, 'loss/train': 1.7396823167800903} -08/30/2021 17:24:22 - INFO - __main__ - Step 23472: {'lr': 0.00047448120672851653, 'samples': 4506624, 'steps': 23471, 'loss/train': 2.032892942428589} -08/30/2021 17:24:22 - INFO - __main__ - Step 23473: {'lr': 0.0004744788709205509, 'samples': 4506816, 'steps': 23472, 'loss/train': 1.2991772890090942} -08/30/2021 17:24:23 - INFO - __main__ - Step 23474: {'lr': 0.0004744765350114386, 'samples': 4507008, 'steps': 23473, 'loss/train': 1.8414204120635986} -08/30/2021 17:24:24 - INFO - __main__ - Step 23475: {'lr': 0.00047447419900118067, 'samples': 4507200, 'steps': 23474, 'loss/train': 2.0994033813476562} -08/30/2021 17:24:25 - INFO - __main__ - Step 23476: {'lr': 0.00047447186288977804, 'samples': 4507392, 'steps': 23475, 'loss/train': 1.974700689315796} -08/30/2021 17:24:25 - INFO - __main__ - Step 23477: {'lr': 0.0004744695266772319, 'samples': 4507584, 'steps': 23476, 'loss/train': 0.30462032556533813} -08/30/2021 17:24:26 - INFO - __main__ - Step 23478: {'lr': 0.00047446719036354324, 'samples': 4507776, 'steps': 23477, 'loss/train': 1.4962259531021118} -08/30/2021 17:24:26 - INFO - __main__ - Step 23479: {'lr': 0.0004744648539487132, 'samples': 4507968, 'steps': 23478, 'loss/train': 1.6455671787261963} -08/30/2021 17:24:28 - INFO - __main__ - Step 23480: {'lr': 0.00047446251743274263, 'samples': 4508160, 'steps': 23479, 'loss/train': 1.8071171045303345} -08/30/2021 17:24:28 - INFO - __main__ - Step 23481: {'lr': 0.0004744601808156328, 'samples': 4508352, 'steps': 23480, 'loss/train': 1.5873665809631348} -08/30/2021 17:24:29 - INFO - __main__ - Step 23482: {'lr': 0.00047445784409738467, 'samples': 4508544, 'steps': 23481, 'loss/train': 1.4687551259994507} -08/30/2021 17:24:29 - INFO - __main__ - Step 23483: {'lr': 0.0004744555072779993, 'samples': 4508736, 'steps': 23482, 'loss/train': 2.1719584465026855} -08/30/2021 17:24:30 - INFO - __main__ - Step 23484: {'lr': 0.0004744531703574777, 'samples': 4508928, 'steps': 23483, 'loss/train': 1.622030258178711} -08/30/2021 17:24:30 - INFO - __main__ - Step 23485: {'lr': 0.00047445083333582104, 'samples': 4509120, 'steps': 23484, 'loss/train': 0.7606672644615173} -08/30/2021 17:24:31 - INFO - __main__ - Step 23486: {'lr': 0.00047444849621303023, 'samples': 4509312, 'steps': 23485, 'loss/train': 0.7390870451927185} -08/30/2021 17:24:32 - INFO - __main__ - Step 23487: {'lr': 0.00047444615898910644, 'samples': 4509504, 'steps': 23486, 'loss/train': 1.55876624584198} -08/30/2021 17:24:32 - INFO - __main__ - Step 23488: {'lr': 0.00047444382166405067, 'samples': 4509696, 'steps': 23487, 'loss/train': 2.046896457672119} -08/30/2021 17:24:33 - INFO - __main__ - Step 23489: {'lr': 0.0004744414842378639, 'samples': 4509888, 'steps': 23488, 'loss/train': 1.255998134613037} -08/30/2021 17:24:33 - INFO - __main__ - Step 23490: {'lr': 0.0004744391467105473, 'samples': 4510080, 'steps': 23489, 'loss/train': 1.868764042854309} -08/30/2021 17:24:35 - INFO - __main__ - Step 23491: {'lr': 0.00047443680908210194, 'samples': 4510272, 'steps': 23490, 'loss/train': 2.182711362838745} -08/30/2021 17:24:36 - INFO - __main__ - Step 23492: {'lr': 0.00047443447135252876, 'samples': 4510464, 'steps': 23491, 'loss/train': 1.7871869802474976} -08/30/2021 17:24:36 - INFO - __main__ - Step 23493: {'lr': 0.0004744321335218289, 'samples': 4510656, 'steps': 23492, 'loss/train': 1.6534804105758667} -08/30/2021 17:24:36 - INFO - __main__ - Step 23494: {'lr': 0.0004744297955900034, 'samples': 4510848, 'steps': 23493, 'loss/train': 0.16427098214626312} -08/30/2021 17:24:37 - INFO - __main__ - Step 23495: {'lr': 0.00047442745755705326, 'samples': 4511040, 'steps': 23494, 'loss/train': 0.5807023048400879} -08/30/2021 17:24:38 - INFO - __main__ - Step 23496: {'lr': 0.00047442511942297953, 'samples': 4511232, 'steps': 23495, 'loss/train': 1.61563241481781} -08/30/2021 17:24:39 - INFO - __main__ - Step 23497: {'lr': 0.00047442278118778336, 'samples': 4511424, 'steps': 23496, 'loss/train': 1.7230396270751953} -08/30/2021 17:24:39 - INFO - __main__ - Step 23498: {'lr': 0.0004744204428514658, 'samples': 4511616, 'steps': 23497, 'loss/train': 1.6623622179031372} -08/30/2021 17:24:40 - INFO - __main__ - Step 23499: {'lr': 0.00047441810441402777, 'samples': 4511808, 'steps': 23498, 'loss/train': 0.14661931991577148} -08/30/2021 17:24:40 - INFO - __main__ - Step 23500: {'lr': 0.0004744157658754704, 'samples': 4512000, 'steps': 23499, 'loss/train': 1.5369865894317627} -08/30/2021 17:24:41 - INFO - __main__ - Step 23501: {'lr': 0.0004744134272357948, 'samples': 4512192, 'steps': 23500, 'loss/train': 1.2457892894744873} -08/30/2021 17:24:42 - INFO - __main__ - Step 23502: {'lr': 0.0004744110884950019, 'samples': 4512384, 'steps': 23501, 'loss/train': 1.8913642168045044} -08/30/2021 17:24:42 - INFO - __main__ - Step 23503: {'lr': 0.00047440874965309286, 'samples': 4512576, 'steps': 23502, 'loss/train': 1.378138542175293} -08/30/2021 17:24:42 - INFO - __main__ - Step 23504: {'lr': 0.00047440641071006874, 'samples': 4512768, 'steps': 23503, 'loss/train': 1.9634078741073608} -08/30/2021 17:24:43 - INFO - __main__ - Step 23505: {'lr': 0.00047440407166593056, 'samples': 4512960, 'steps': 23504, 'loss/train': 1.6665253639221191} -08/30/2021 17:24:45 - INFO - __main__ - Step 23506: {'lr': 0.0004744017325206793, 'samples': 4513152, 'steps': 23505, 'loss/train': 1.0028982162475586} -08/30/2021 17:24:45 - INFO - __main__ - Step 23507: {'lr': 0.00047439939327431613, 'samples': 4513344, 'steps': 23506, 'loss/train': 1.8394252061843872} -08/30/2021 17:24:46 - INFO - __main__ - Step 23508: {'lr': 0.0004743970539268421, 'samples': 4513536, 'steps': 23507, 'loss/train': 1.3555352687835693} -08/30/2021 17:24:46 - INFO - __main__ - Step 23509: {'lr': 0.00047439471447825813, 'samples': 4513728, 'steps': 23508, 'loss/train': 0.9830705523490906} -08/30/2021 17:24:46 - INFO - __main__ - Step 23510: {'lr': 0.00047439237492856543, 'samples': 4513920, 'steps': 23509, 'loss/train': 1.154396891593933} -08/30/2021 17:24:47 - INFO - __main__ - Step 23511: {'lr': 0.0004743900352777649, 'samples': 4514112, 'steps': 23510, 'loss/train': 1.7377116680145264} -08/30/2021 17:24:48 - INFO - __main__ - Step 23512: {'lr': 0.0004743876955258578, 'samples': 4514304, 'steps': 23511, 'loss/train': 1.7903070449829102} -08/30/2021 17:24:49 - INFO - __main__ - Step 23513: {'lr': 0.00047438535567284504, 'samples': 4514496, 'steps': 23512, 'loss/train': 2.2499351501464844} -08/30/2021 17:24:49 - INFO - __main__ - Step 23514: {'lr': 0.00047438301571872763, 'samples': 4514688, 'steps': 23513, 'loss/train': 1.4361882209777832} -08/30/2021 17:24:49 - INFO - __main__ - Step 23515: {'lr': 0.00047438067566350675, 'samples': 4514880, 'steps': 23514, 'loss/train': 1.3551257848739624} -08/30/2021 17:24:50 - INFO - __main__ - Step 23516: {'lr': 0.00047437833550718336, 'samples': 4515072, 'steps': 23515, 'loss/train': 1.4749128818511963} -08/30/2021 17:24:51 - INFO - __main__ - Step 23517: {'lr': 0.0004743759952497586, 'samples': 4515264, 'steps': 23516, 'loss/train': 1.697044849395752} -08/30/2021 17:24:52 - INFO - __main__ - Step 23518: {'lr': 0.0004743736548912334, 'samples': 4515456, 'steps': 23517, 'loss/train': 2.0789573192596436} -08/30/2021 17:24:52 - INFO - __main__ - Step 23519: {'lr': 0.00047437131443160897, 'samples': 4515648, 'steps': 23518, 'loss/train': 1.4848761558532715} -08/30/2021 17:24:52 - INFO - __main__ - Step 23520: {'lr': 0.0004743689738708863, 'samples': 4515840, 'steps': 23519, 'loss/train': 1.4723833799362183} -08/30/2021 17:24:53 - INFO - __main__ - Step 23521: {'lr': 0.0004743666332090664, 'samples': 4516032, 'steps': 23520, 'loss/train': 2.1788690090179443} -08/30/2021 17:24:54 - INFO - __main__ - Step 23522: {'lr': 0.00047436429244615037, 'samples': 4516224, 'steps': 23521, 'loss/train': 1.716915249824524} -08/30/2021 17:24:55 - INFO - __main__ - Step 23523: {'lr': 0.0004743619515821392, 'samples': 4516416, 'steps': 23522, 'loss/train': 1.7972381114959717} -08/30/2021 17:24:55 - INFO - __main__ - Step 23524: {'lr': 0.00047435961061703403, 'samples': 4516608, 'steps': 23523, 'loss/train': 1.5950313806533813} -08/30/2021 17:24:55 - INFO - __main__ - Step 23525: {'lr': 0.00047435726955083593, 'samples': 4516800, 'steps': 23524, 'loss/train': 1.8461427688598633} -08/30/2021 17:24:56 - INFO - __main__ - Step 23526: {'lr': 0.0004743549283835459, 'samples': 4516992, 'steps': 23525, 'loss/train': 1.5676671266555786} -08/30/2021 17:24:58 - INFO - __main__ - Step 23527: {'lr': 0.00047435258711516496, 'samples': 4517184, 'steps': 23526, 'loss/train': 1.7245956659317017} -08/30/2021 17:24:58 - INFO - __main__ - Step 23528: {'lr': 0.0004743502457456942, 'samples': 4517376, 'steps': 23527, 'loss/train': 1.6351948976516724} -08/30/2021 17:24:58 - INFO - __main__ - Step 23529: {'lr': 0.0004743479042751347, 'samples': 4517568, 'steps': 23528, 'loss/train': 1.687272310256958} -08/30/2021 17:24:59 - INFO - __main__ - Step 23530: {'lr': 0.0004743455627034875, 'samples': 4517760, 'steps': 23529, 'loss/train': 1.19921875} -08/30/2021 17:24:59 - INFO - __main__ - Step 23531: {'lr': 0.0004743432210307536, 'samples': 4517952, 'steps': 23530, 'loss/train': 0.26170551776885986} -08/30/2021 17:25:01 - INFO - __main__ - Step 23532: {'lr': 0.00047434087925693415, 'samples': 4518144, 'steps': 23531, 'loss/train': 1.4048240184783936} -08/30/2021 17:25:01 - INFO - __main__ - Step 23533: {'lr': 0.00047433853738203013, 'samples': 4518336, 'steps': 23532, 'loss/train': 0.34342679381370544} -08/30/2021 17:25:02 - INFO - __main__ - Step 23534: {'lr': 0.00047433619540604264, 'samples': 4518528, 'steps': 23533, 'loss/train': 0.4432034492492676} -08/30/2021 17:25:02 - INFO - __main__ - Step 23535: {'lr': 0.0004743338533289728, 'samples': 4518720, 'steps': 23534, 'loss/train': 1.9128985404968262} -08/30/2021 17:25:02 - INFO - __main__ - Step 23536: {'lr': 0.0004743315111508215, 'samples': 4518912, 'steps': 23535, 'loss/train': 1.51212477684021} -08/30/2021 17:25:03 - INFO - __main__ - Step 23537: {'lr': 0.00047432916887158995, 'samples': 4519104, 'steps': 23536, 'loss/train': 2.5439515113830566} -08/30/2021 17:25:05 - INFO - __main__ - Step 23538: {'lr': 0.00047432682649127913, 'samples': 4519296, 'steps': 23537, 'loss/train': 1.9498885869979858} -08/30/2021 17:25:05 - INFO - __main__ - Step 23539: {'lr': 0.00047432448400989004, 'samples': 4519488, 'steps': 23538, 'loss/train': 1.6660622358322144} -08/30/2021 17:25:05 - INFO - __main__ - Step 23540: {'lr': 0.0004743221414274238, 'samples': 4519680, 'steps': 23539, 'loss/train': 0.14143574237823486} -08/30/2021 17:25:06 - INFO - __main__ - Step 23541: {'lr': 0.00047431979874388154, 'samples': 4519872, 'steps': 23540, 'loss/train': 2.1670846939086914} -08/30/2021 17:25:06 - INFO - __main__ - Step 23542: {'lr': 0.0004743174559592642, 'samples': 4520064, 'steps': 23541, 'loss/train': 0.116717129945755} -08/30/2021 17:25:07 - INFO - __main__ - Step 23543: {'lr': 0.0004743151130735729, 'samples': 4520256, 'steps': 23542, 'loss/train': 0.14372417330741882} -08/30/2021 17:25:08 - INFO - __main__ - Step 23544: {'lr': 0.0004743127700868086, 'samples': 4520448, 'steps': 23543, 'loss/train': 0.09387094527482986} -08/30/2021 17:25:09 - INFO - __main__ - Step 23545: {'lr': 0.00047431042699897245, 'samples': 4520640, 'steps': 23544, 'loss/train': 1.1553503274917603} -08/30/2021 17:25:09 - INFO - __main__ - Step 23546: {'lr': 0.0004743080838100655, 'samples': 4520832, 'steps': 23545, 'loss/train': 1.2153754234313965} -08/30/2021 17:25:09 - INFO - __main__ - Step 23547: {'lr': 0.0004743057405200888, 'samples': 4521024, 'steps': 23546, 'loss/train': 2.096493721008301} -08/30/2021 17:25:10 - INFO - __main__ - Step 23548: {'lr': 0.0004743033971290434, 'samples': 4521216, 'steps': 23547, 'loss/train': 1.7743288278579712} -08/30/2021 17:25:11 - INFO - __main__ - Step 23549: {'lr': 0.00047430105363693034, 'samples': 4521408, 'steps': 23548, 'loss/train': 1.6424707174301147} -08/30/2021 17:25:12 - INFO - __main__ - Step 23550: {'lr': 0.0004742987100437507, 'samples': 4521600, 'steps': 23549, 'loss/train': 1.471112608909607} -08/30/2021 17:25:12 - INFO - __main__ - Step 23551: {'lr': 0.00047429636634950545, 'samples': 4521792, 'steps': 23550, 'loss/train': 1.3400425910949707} -08/30/2021 17:25:12 - INFO - __main__ - Step 23552: {'lr': 0.0004742940225541958, 'samples': 4521984, 'steps': 23551, 'loss/train': 1.497818112373352} -08/30/2021 17:25:13 - INFO - __main__ - Step 23553: {'lr': 0.0004742916786578227, 'samples': 4522176, 'steps': 23552, 'loss/train': 1.3833774328231812} -08/30/2021 17:25:14 - INFO - __main__ - Step 23554: {'lr': 0.00047428933466038726, 'samples': 4522368, 'steps': 23553, 'loss/train': 1.2099409103393555} -08/30/2021 17:25:15 - INFO - __main__ - Step 23555: {'lr': 0.00047428699056189047, 'samples': 4522560, 'steps': 23554, 'loss/train': 0.5132454633712769} -08/30/2021 17:25:15 - INFO - __main__ - Step 23556: {'lr': 0.0004742846463623334, 'samples': 4522752, 'steps': 23555, 'loss/train': 1.5360429286956787} -08/30/2021 17:25:15 - INFO - __main__ - Step 23557: {'lr': 0.0004742823020617172, 'samples': 4522944, 'steps': 23556, 'loss/train': 0.2798418700695038} -08/30/2021 17:25:16 - INFO - __main__ - Step 23558: {'lr': 0.0004742799576600427, 'samples': 4523136, 'steps': 23557, 'loss/train': 1.546321153640747} -08/30/2021 17:25:16 - INFO - __main__ - Step 23559: {'lr': 0.00047427761315731133, 'samples': 4523328, 'steps': 23558, 'loss/train': 1.2455106973648071} -08/30/2021 17:25:17 - INFO - __main__ - Step 23560: {'lr': 0.0004742752685535238, 'samples': 4523520, 'steps': 23559, 'loss/train': 1.5118094682693481} -08/30/2021 17:25:18 - INFO - __main__ - Step 23561: {'lr': 0.00047427292384868134, 'samples': 4523712, 'steps': 23560, 'loss/train': 1.2776174545288086} -08/30/2021 17:25:18 - INFO - __main__ - Step 23562: {'lr': 0.0004742705790427849, 'samples': 4523904, 'steps': 23561, 'loss/train': 1.1823251247406006} -08/30/2021 17:25:19 - INFO - __main__ - Step 23563: {'lr': 0.00047426823413583563, 'samples': 4524096, 'steps': 23562, 'loss/train': 1.9637054204940796} -08/30/2021 17:25:19 - INFO - __main__ - Step 23564: {'lr': 0.0004742658891278346, 'samples': 4524288, 'steps': 23563, 'loss/train': 1.7814786434173584} -08/30/2021 17:25:21 - INFO - __main__ - Step 23565: {'lr': 0.0004742635440187828, 'samples': 4524480, 'steps': 23564, 'loss/train': 1.6499422788619995} -08/30/2021 17:25:21 - INFO - __main__ - Step 23566: {'lr': 0.00047426119880868123, 'samples': 4524672, 'steps': 23565, 'loss/train': 1.9455660581588745} -08/30/2021 17:25:21 - INFO - __main__ - Step 23567: {'lr': 0.00047425885349753114, 'samples': 4524864, 'steps': 23566, 'loss/train': 1.504725456237793} -08/30/2021 17:25:22 - INFO - __main__ - Step 23568: {'lr': 0.0004742565080853334, 'samples': 4525056, 'steps': 23567, 'loss/train': 1.4364367723464966} -08/30/2021 17:25:22 - INFO - __main__ - Step 23569: {'lr': 0.00047425416257208916, 'samples': 4525248, 'steps': 23568, 'loss/train': 2.000889778137207} -08/30/2021 17:25:24 - INFO - __main__ - Step 23570: {'lr': 0.0004742518169577994, 'samples': 4525440, 'steps': 23569, 'loss/train': 0.8818508982658386} -08/30/2021 17:25:24 - INFO - __main__ - Step 23571: {'lr': 0.0004742494712424653, 'samples': 4525632, 'steps': 23570, 'loss/train': 1.1138865947723389} -08/30/2021 17:25:24 - INFO - __main__ - Step 23572: {'lr': 0.0004742471254260878, 'samples': 4525824, 'steps': 23571, 'loss/train': 2.152121067047119} -08/30/2021 17:25:25 - INFO - __main__ - Step 23573: {'lr': 0.0004742447795086681, 'samples': 4526016, 'steps': 23572, 'loss/train': 1.2545866966247559} -08/30/2021 17:25:25 - INFO - __main__ - Step 23574: {'lr': 0.00047424243349020705, 'samples': 4526208, 'steps': 23573, 'loss/train': 1.5952011346817017} -08/30/2021 17:25:27 - INFO - __main__ - Step 23575: {'lr': 0.0004742400873707059, 'samples': 4526400, 'steps': 23574, 'loss/train': 1.7012284994125366} -08/30/2021 17:25:28 - INFO - __main__ - Step 23576: {'lr': 0.0004742377411501656, 'samples': 4526592, 'steps': 23575, 'loss/train': 1.9678068161010742} -08/30/2021 17:25:28 - INFO - __main__ - Step 23577: {'lr': 0.00047423539482858724, 'samples': 4526784, 'steps': 23576, 'loss/train': 2.030181646347046} -08/30/2021 17:25:28 - INFO - __main__ - Step 23578: {'lr': 0.0004742330484059718, 'samples': 4526976, 'steps': 23577, 'loss/train': 1.1054855585098267} -08/30/2021 17:25:29 - INFO - __main__ - Step 23579: {'lr': 0.0004742307018823205, 'samples': 4527168, 'steps': 23578, 'loss/train': 1.9471453428268433} -08/30/2021 17:25:29 - INFO - __main__ - Step 23580: {'lr': 0.0004742283552576343, 'samples': 4527360, 'steps': 23579, 'loss/train': 1.2475463151931763} -08/30/2021 17:25:31 - INFO - __main__ - Step 23581: {'lr': 0.0004742260085319142, 'samples': 4527552, 'steps': 23580, 'loss/train': 1.7846564054489136} -08/30/2021 17:25:31 - INFO - __main__ - Step 23582: {'lr': 0.0004742236617051614, 'samples': 4527744, 'steps': 23581, 'loss/train': 1.6171941757202148} -08/30/2021 17:25:31 - INFO - __main__ - Step 23583: {'lr': 0.00047422131477737684, 'samples': 4527936, 'steps': 23582, 'loss/train': 1.8229527473449707} -08/30/2021 17:25:32 - INFO - __main__ - Step 23584: {'lr': 0.00047421896774856156, 'samples': 4528128, 'steps': 23583, 'loss/train': 1.7556407451629639} -08/30/2021 17:25:32 - INFO - __main__ - Step 23585: {'lr': 0.00047421662061871675, 'samples': 4528320, 'steps': 23584, 'loss/train': 1.4895778894424438} -08/30/2021 17:25:34 - INFO - __main__ - Step 23586: {'lr': 0.0004742142733878433, 'samples': 4528512, 'steps': 23585, 'loss/train': 2.789318561553955} -08/30/2021 17:25:34 - INFO - __main__ - Step 23587: {'lr': 0.0004742119260559424, 'samples': 4528704, 'steps': 23586, 'loss/train': 1.1185063123703003} -08/30/2021 17:25:35 - INFO - __main__ - Step 23588: {'lr': 0.0004742095786230152, 'samples': 4528896, 'steps': 23587, 'loss/train': 1.6517226696014404} -08/30/2021 17:25:35 - INFO - __main__ - Step 23589: {'lr': 0.00047420723108906247, 'samples': 4529088, 'steps': 23588, 'loss/train': 1.8413761854171753} -08/30/2021 17:25:35 - INFO - __main__ - Step 23590: {'lr': 0.0004742048834540855, 'samples': 4529280, 'steps': 23589, 'loss/train': 1.9400454759597778} -08/30/2021 17:25:36 - INFO - __main__ - Step 23591: {'lr': 0.0004742025357180852, 'samples': 4529472, 'steps': 23590, 'loss/train': 1.9612764120101929} -08/30/2021 17:25:37 - INFO - __main__ - Step 23592: {'lr': 0.00047420018788106274, 'samples': 4529664, 'steps': 23591, 'loss/train': 1.7768454551696777} -08/30/2021 17:25:38 - INFO - __main__ - Step 23593: {'lr': 0.00047419783994301915, 'samples': 4529856, 'steps': 23592, 'loss/train': 1.7378946542739868} -08/30/2021 17:25:38 - INFO - __main__ - Step 23594: {'lr': 0.0004741954919039554, 'samples': 4530048, 'steps': 23593, 'loss/train': 1.406349539756775} -08/30/2021 17:25:38 - INFO - __main__ - Step 23595: {'lr': 0.0004741931437638727, 'samples': 4530240, 'steps': 23594, 'loss/train': 1.4765241146087646} -08/30/2021 17:25:39 - INFO - __main__ - Step 23596: {'lr': 0.000474190795522772, 'samples': 4530432, 'steps': 23595, 'loss/train': 2.1187362670898438} -08/30/2021 17:25:40 - INFO - __main__ - Step 23597: {'lr': 0.00047418844718065433, 'samples': 4530624, 'steps': 23596, 'loss/train': 0.4812004864215851} -08/30/2021 17:25:41 - INFO - __main__ - Step 23598: {'lr': 0.0004741860987375209, 'samples': 4530816, 'steps': 23597, 'loss/train': 1.5386368036270142} -08/30/2021 17:25:41 - INFO - __main__ - Step 23599: {'lr': 0.00047418375019337263, 'samples': 4531008, 'steps': 23598, 'loss/train': 1.9456770420074463} -08/30/2021 17:25:41 - INFO - __main__ - Step 23600: {'lr': 0.00047418140154821065, 'samples': 4531200, 'steps': 23599, 'loss/train': 1.0276881456375122} -08/30/2021 17:25:42 - INFO - __main__ - Step 23601: {'lr': 0.00047417905280203594, 'samples': 4531392, 'steps': 23600, 'loss/train': 1.151970624923706} -08/30/2021 17:25:43 - INFO - __main__ - Step 23602: {'lr': 0.00047417670395484963, 'samples': 4531584, 'steps': 23601, 'loss/train': 1.806605339050293} -08/30/2021 17:25:44 - INFO - __main__ - Step 23603: {'lr': 0.0004741743550066527, 'samples': 4531776, 'steps': 23602, 'loss/train': 1.379116415977478} -08/30/2021 17:25:44 - INFO - __main__ - Step 23604: {'lr': 0.00047417200595744637, 'samples': 4531968, 'steps': 23603, 'loss/train': 1.7826013565063477} -08/30/2021 17:25:44 - INFO - __main__ - Step 23605: {'lr': 0.0004741696568072316, 'samples': 4532160, 'steps': 23604, 'loss/train': 1.6874490976333618} -08/30/2021 17:25:45 - INFO - __main__ - Step 23606: {'lr': 0.00047416730755600936, 'samples': 4532352, 'steps': 23605, 'loss/train': 1.602535605430603} -08/30/2021 17:25:46 - INFO - __main__ - Step 23607: {'lr': 0.0004741649582037808, 'samples': 4532544, 'steps': 23606, 'loss/train': 3.4111196994781494} -08/30/2021 17:25:47 - INFO - __main__ - Step 23608: {'lr': 0.000474162608750547, 'samples': 4532736, 'steps': 23607, 'loss/train': 1.413873314857483} -08/30/2021 17:25:47 - INFO - __main__ - Step 23609: {'lr': 0.000474160259196309, 'samples': 4532928, 'steps': 23608, 'loss/train': 1.287006139755249} -08/30/2021 17:25:48 - INFO - __main__ - Step 23610: {'lr': 0.0004741579095410678, 'samples': 4533120, 'steps': 23609, 'loss/train': 2.030071496963501} -08/30/2021 17:25:48 - INFO - __main__ - Step 23611: {'lr': 0.0004741555597848245, 'samples': 4533312, 'steps': 23610, 'loss/train': 2.079184055328369} -08/30/2021 17:25:50 - INFO - __main__ - Step 23612: {'lr': 0.00047415320992758025, 'samples': 4533504, 'steps': 23611, 'loss/train': 2.58381724357605} -08/30/2021 17:25:50 - INFO - __main__ - Step 23613: {'lr': 0.00047415085996933593, 'samples': 4533696, 'steps': 23612, 'loss/train': 1.6858973503112793} -08/30/2021 17:25:50 - INFO - __main__ - Step 23614: {'lr': 0.00047414850991009275, 'samples': 4533888, 'steps': 23613, 'loss/train': 1.6573758125305176} -08/30/2021 17:25:51 - INFO - __main__ - Step 23615: {'lr': 0.00047414615974985164, 'samples': 4534080, 'steps': 23614, 'loss/train': 1.5540821552276611} -08/30/2021 17:25:51 - INFO - __main__ - Step 23616: {'lr': 0.0004741438094886138, 'samples': 4534272, 'steps': 23615, 'loss/train': 1.774855375289917} -08/30/2021 17:25:51 - INFO - __main__ - Step 23617: {'lr': 0.00047414145912638017, 'samples': 4534464, 'steps': 23616, 'loss/train': 1.572225570678711} -08/30/2021 17:25:53 - INFO - __main__ - Step 23618: {'lr': 0.00047413910866315193, 'samples': 4534656, 'steps': 23617, 'loss/train': 1.414900541305542} -08/30/2021 17:25:53 - INFO - __main__ - Step 23619: {'lr': 0.00047413675809893, 'samples': 4534848, 'steps': 23618, 'loss/train': 1.2714629173278809} -08/30/2021 17:25:54 - INFO - __main__ - Step 23620: {'lr': 0.0004741344074337155, 'samples': 4535040, 'steps': 23619, 'loss/train': 1.5200704336166382} -08/30/2021 17:25:54 - INFO - __main__ - Step 23621: {'lr': 0.00047413205666750955, 'samples': 4535232, 'steps': 23620, 'loss/train': 1.6622098684310913} -08/30/2021 17:25:55 - INFO - __main__ - Step 23622: {'lr': 0.0004741297058003131, 'samples': 4535424, 'steps': 23621, 'loss/train': 2.0289008617401123} -08/30/2021 17:25:56 - INFO - __main__ - Step 23623: {'lr': 0.00047412735483212725, 'samples': 4535616, 'steps': 23622, 'loss/train': 1.5492668151855469} -08/30/2021 17:25:56 - INFO - __main__ - Step 23624: {'lr': 0.0004741250037629531, 'samples': 4535808, 'steps': 23623, 'loss/train': 1.347144603729248} -08/30/2021 17:25:57 - INFO - __main__ - Step 23625: {'lr': 0.00047412265259279176, 'samples': 4536000, 'steps': 23624, 'loss/train': 1.609100103378296} -08/30/2021 17:25:57 - INFO - __main__ - Step 23626: {'lr': 0.0004741203013216441, 'samples': 4536192, 'steps': 23625, 'loss/train': 1.5195554494857788} -08/30/2021 17:25:57 - INFO - __main__ - Step 23627: {'lr': 0.0004741179499495113, 'samples': 4536384, 'steps': 23626, 'loss/train': 1.8828595876693726} -08/30/2021 17:26:00 - INFO - __main__ - Step 23628: {'lr': 0.00047411559847639447, 'samples': 4536576, 'steps': 23627, 'loss/train': 1.3689078092575073} -08/30/2021 17:26:00 - INFO - __main__ - Step 23629: {'lr': 0.0004741132469022946, 'samples': 4536768, 'steps': 23628, 'loss/train': 6.122838973999023} -08/30/2021 17:26:01 - INFO - __main__ - Step 23630: {'lr': 0.00047411089522721275, 'samples': 4536960, 'steps': 23629, 'loss/train': 1.442733645439148} -08/30/2021 17:26:01 - INFO - __main__ - Step 23631: {'lr': 0.00047410854345114996, 'samples': 4537152, 'steps': 23630, 'loss/train': 1.2228111028671265} -08/30/2021 17:26:01 - INFO - __main__ - Step 23632: {'lr': 0.0004741061915741073, 'samples': 4537344, 'steps': 23631, 'loss/train': 2.2163054943084717} -08/30/2021 17:26:02 - INFO - __main__ - Step 23633: {'lr': 0.0004741038395960859, 'samples': 4537536, 'steps': 23632, 'loss/train': 0.09782514721155167} -08/30/2021 17:26:03 - INFO - __main__ - Step 23634: {'lr': 0.0004741014875170867, 'samples': 4537728, 'steps': 23633, 'loss/train': 2.023845672607422} -08/30/2021 17:26:04 - INFO - __main__ - Step 23635: {'lr': 0.0004740991353371109, 'samples': 4537920, 'steps': 23634, 'loss/train': 1.860496163368225} -08/30/2021 17:26:04 - INFO - __main__ - Step 23636: {'lr': 0.0004740967830561595, 'samples': 4538112, 'steps': 23635, 'loss/train': 1.764891505241394} -08/30/2021 17:26:04 - INFO - __main__ - Step 23637: {'lr': 0.0004740944306742335, 'samples': 4538304, 'steps': 23636, 'loss/train': 1.920194387435913} -08/30/2021 17:26:05 - INFO - __main__ - Step 23638: {'lr': 0.00047409207819133406, 'samples': 4538496, 'steps': 23637, 'loss/train': 1.4395520687103271} -08/30/2021 17:26:06 - INFO - __main__ - Step 23639: {'lr': 0.0004740897256074621, 'samples': 4538688, 'steps': 23638, 'loss/train': 1.7058806419372559} -08/30/2021 17:26:07 - INFO - __main__ - Step 23640: {'lr': 0.00047408737292261883, 'samples': 4538880, 'steps': 23639, 'loss/train': 1.8294278383255005} -08/30/2021 17:26:07 - INFO - __main__ - Step 23641: {'lr': 0.0004740850201368052, 'samples': 4539072, 'steps': 23640, 'loss/train': 1.08510160446167} -08/30/2021 17:26:07 - INFO - __main__ - Step 23642: {'lr': 0.00047408266725002234, 'samples': 4539264, 'steps': 23641, 'loss/train': 1.2237006425857544} -08/30/2021 17:26:08 - INFO - __main__ - Step 23643: {'lr': 0.00047408031426227136, 'samples': 4539456, 'steps': 23642, 'loss/train': 1.8229749202728271} -08/30/2021 17:26:09 - INFO - __main__ - Step 23644: {'lr': 0.0004740779611735532, 'samples': 4539648, 'steps': 23643, 'loss/train': 1.9241870641708374} -08/30/2021 17:26:10 - INFO - __main__ - Step 23645: {'lr': 0.00047407560798386894, 'samples': 4539840, 'steps': 23644, 'loss/train': 1.0174429416656494} -08/30/2021 17:26:10 - INFO - __main__ - Step 23646: {'lr': 0.00047407325469321973, 'samples': 4540032, 'steps': 23645, 'loss/train': 1.2745970487594604} -08/30/2021 17:26:10 - INFO - __main__ - Step 23647: {'lr': 0.0004740709013016065, 'samples': 4540224, 'steps': 23646, 'loss/train': 1.042733073234558} -08/30/2021 17:26:11 - INFO - __main__ - Step 23648: {'lr': 0.0004740685478090304, 'samples': 4540416, 'steps': 23647, 'loss/train': 1.7291159629821777} -08/30/2021 17:26:13 - INFO - __main__ - Step 23649: {'lr': 0.00047406619421549247, 'samples': 4540608, 'steps': 23648, 'loss/train': 1.4979697465896606} -08/30/2021 17:26:13 - INFO - __main__ - Step 23650: {'lr': 0.0004740638405209938, 'samples': 4540800, 'steps': 23649, 'loss/train': 1.1898342370986938} -08/30/2021 17:26:13 - INFO - __main__ - Step 23651: {'lr': 0.0004740614867255353, 'samples': 4540992, 'steps': 23650, 'loss/train': 0.5996770858764648} -08/30/2021 17:26:14 - INFO - __main__ - Step 23652: {'lr': 0.0004740591328291183, 'samples': 4541184, 'steps': 23651, 'loss/train': 1.409492015838623} -08/30/2021 17:26:14 - INFO - __main__ - Step 23653: {'lr': 0.0004740567788317437, 'samples': 4541376, 'steps': 23652, 'loss/train': 1.5661993026733398} -08/30/2021 17:26:14 - INFO - __main__ - Step 23654: {'lr': 0.00047405442473341246, 'samples': 4541568, 'steps': 23653, 'loss/train': 5.594666481018066} -08/30/2021 17:26:15 - INFO - __main__ - Step 23655: {'lr': 0.0004740520705341259, 'samples': 4541760, 'steps': 23654, 'loss/train': 6.806138515472412} -08/30/2021 17:26:16 - INFO - __main__ - Step 23656: {'lr': 0.0004740497162338848, 'samples': 4541952, 'steps': 23655, 'loss/train': 1.7770015001296997} -08/30/2021 17:26:17 - INFO - __main__ - Step 23657: {'lr': 0.00047404736183269045, 'samples': 4542144, 'steps': 23656, 'loss/train': 1.4531251192092896} -08/30/2021 17:26:17 - INFO - __main__ - Step 23658: {'lr': 0.0004740450073305438, 'samples': 4542336, 'steps': 23657, 'loss/train': 1.4769870042800903} -08/30/2021 17:26:17 - INFO - __main__ - Step 23659: {'lr': 0.00047404265272744586, 'samples': 4542528, 'steps': 23658, 'loss/train': 1.9212251901626587} -08/30/2021 17:26:18 - INFO - __main__ - Step 23660: {'lr': 0.0004740402980233978, 'samples': 4542720, 'steps': 23659, 'loss/train': 1.7518775463104248} -08/30/2021 17:26:19 - INFO - __main__ - Step 23661: {'lr': 0.00047403794321840064, 'samples': 4542912, 'steps': 23660, 'loss/train': 2.1008946895599365} -08/30/2021 17:26:20 - INFO - __main__ - Step 23662: {'lr': 0.0004740355883124555, 'samples': 4543104, 'steps': 23661, 'loss/train': 1.7716931104660034} -08/30/2021 17:26:20 - INFO - __main__ - Step 23663: {'lr': 0.0004740332333055633, 'samples': 4543296, 'steps': 23662, 'loss/train': 1.3145335912704468} -08/30/2021 17:26:20 - INFO - __main__ - Step 23664: {'lr': 0.00047403087819772517, 'samples': 4543488, 'steps': 23663, 'loss/train': 2.1947436332702637} -08/30/2021 17:26:21 - INFO - __main__ - Step 23665: {'lr': 0.0004740285229889423, 'samples': 4543680, 'steps': 23664, 'loss/train': 1.6230443716049194} -08/30/2021 17:26:22 - INFO - __main__ - Step 23666: {'lr': 0.0004740261676792155, 'samples': 4543872, 'steps': 23665, 'loss/train': 1.6724753379821777} -08/30/2021 17:26:23 - INFO - __main__ - Step 23667: {'lr': 0.00047402381226854606, 'samples': 4544064, 'steps': 23666, 'loss/train': 1.950594186782837} -08/30/2021 17:26:23 - INFO - __main__ - Step 23668: {'lr': 0.0004740214567569349, 'samples': 4544256, 'steps': 23667, 'loss/train': 1.1832435131072998} -08/30/2021 17:26:23 - INFO - __main__ - Step 23669: {'lr': 0.00047401910114438313, 'samples': 4544448, 'steps': 23668, 'loss/train': 0.7969381809234619} -08/30/2021 17:26:24 - INFO - __main__ - Step 23670: {'lr': 0.0004740167454308918, 'samples': 4544640, 'steps': 23669, 'loss/train': 1.410292148590088} -08/30/2021 17:26:25 - INFO - __main__ - Step 23671: {'lr': 0.00047401438961646206, 'samples': 4544832, 'steps': 23670, 'loss/train': 1.860082983970642} -08/30/2021 17:26:26 - INFO - __main__ - Step 23672: {'lr': 0.0004740120337010948, 'samples': 4545024, 'steps': 23671, 'loss/train': 1.6472742557525635} -08/30/2021 17:26:26 - INFO - __main__ - Step 23673: {'lr': 0.0004740096776847912, 'samples': 4545216, 'steps': 23672, 'loss/train': 0.9796372056007385} -08/30/2021 17:26:26 - INFO - __main__ - Step 23674: {'lr': 0.0004740073215675523, 'samples': 4545408, 'steps': 23673, 'loss/train': 1.9655559062957764} -08/30/2021 17:26:27 - INFO - __main__ - Step 23675: {'lr': 0.00047400496534937914, 'samples': 4545600, 'steps': 23674, 'loss/train': 1.719420075416565} -08/30/2021 17:26:27 - INFO - __main__ - Step 23676: {'lr': 0.00047400260903027283, 'samples': 4545792, 'steps': 23675, 'loss/train': 0.5504816770553589} -08/30/2021 17:26:29 - INFO - __main__ - Step 23677: {'lr': 0.0004740002526102344, 'samples': 4545984, 'steps': 23676, 'loss/train': 0.38618308305740356} -08/30/2021 17:26:29 - INFO - __main__ - Step 23678: {'lr': 0.0004739978960892649, 'samples': 4546176, 'steps': 23677, 'loss/train': 1.6172184944152832} -08/30/2021 17:26:30 - INFO - __main__ - Step 23679: {'lr': 0.0004739955394673654, 'samples': 4546368, 'steps': 23678, 'loss/train': 1.553303837776184} -08/30/2021 17:26:30 - INFO - __main__ - Step 23680: {'lr': 0.000473993182744537, 'samples': 4546560, 'steps': 23679, 'loss/train': 1.5233919620513916} -08/30/2021 17:26:30 - INFO - __main__ - Step 23681: {'lr': 0.0004739908259207807, 'samples': 4546752, 'steps': 23680, 'loss/train': 0.3007315993309021} -08/30/2021 17:26:32 - INFO - __main__ - Step 23682: {'lr': 0.00047398846899609755, 'samples': 4546944, 'steps': 23681, 'loss/train': 6.533685684204102} -08/30/2021 17:26:33 - INFO - __main__ - Step 23683: {'lr': 0.0004739861119704887, 'samples': 4547136, 'steps': 23682, 'loss/train': 1.275080919265747} -08/30/2021 17:26:33 - INFO - __main__ - Step 23684: {'lr': 0.00047398375484395517, 'samples': 4547328, 'steps': 23683, 'loss/train': 1.5425148010253906} -08/30/2021 17:26:33 - INFO - __main__ - Step 23685: {'lr': 0.00047398139761649794, 'samples': 4547520, 'steps': 23684, 'loss/train': 1.7344295978546143} -08/30/2021 17:26:34 - INFO - __main__ - Step 23686: {'lr': 0.00047397904028811824, 'samples': 4547712, 'steps': 23685, 'loss/train': 1.391536831855774} -08/30/2021 17:26:34 - INFO - __main__ - Step 23687: {'lr': 0.000473976682858817, 'samples': 4547904, 'steps': 23686, 'loss/train': 2.121718645095825} -08/30/2021 17:26:36 - INFO - __main__ - Step 23688: {'lr': 0.00047397432532859533, 'samples': 4548096, 'steps': 23687, 'loss/train': 1.1281750202178955} -08/30/2021 17:26:36 - INFO - __main__ - Step 23689: {'lr': 0.00047397196769745435, 'samples': 4548288, 'steps': 23688, 'loss/train': 1.6202231645584106} -08/30/2021 17:26:36 - INFO - __main__ - Step 23690: {'lr': 0.00047396960996539495, 'samples': 4548480, 'steps': 23689, 'loss/train': 1.5830765962600708} -08/30/2021 17:26:37 - INFO - __main__ - Step 23691: {'lr': 0.00047396725213241835, 'samples': 4548672, 'steps': 23690, 'loss/train': 1.1786617040634155} -08/30/2021 17:26:37 - INFO - __main__ - Step 23692: {'lr': 0.0004739648941985256, 'samples': 4548864, 'steps': 23691, 'loss/train': 1.6706563234329224} -08/30/2021 17:26:38 - INFO - __main__ - Step 23693: {'lr': 0.00047396253616371767, 'samples': 4549056, 'steps': 23692, 'loss/train': 1.6007726192474365} -08/30/2021 17:26:39 - INFO - __main__ - Step 23694: {'lr': 0.00047396017802799566, 'samples': 4549248, 'steps': 23693, 'loss/train': 1.8842920064926147} -08/30/2021 17:26:39 - INFO - __main__ - Step 23695: {'lr': 0.0004739578197913607, 'samples': 4549440, 'steps': 23694, 'loss/train': 1.7273802757263184} -08/30/2021 17:26:40 - INFO - __main__ - Step 23696: {'lr': 0.00047395546145381377, 'samples': 4549632, 'steps': 23695, 'loss/train': 1.6088329553604126} -08/30/2021 17:26:40 - INFO - __main__ - Step 23697: {'lr': 0.000473953103015356, 'samples': 4549824, 'steps': 23696, 'loss/train': 2.488471508026123} -08/30/2021 17:26:41 - INFO - __main__ - Step 23698: {'lr': 0.0004739507444759884, 'samples': 4550016, 'steps': 23697, 'loss/train': 1.784038782119751} -08/30/2021 17:26:42 - INFO - __main__ - Step 23699: {'lr': 0.0004739483858357121, 'samples': 4550208, 'steps': 23698, 'loss/train': 1.3716033697128296} -08/30/2021 17:26:42 - INFO - __main__ - Step 23700: {'lr': 0.00047394602709452806, 'samples': 4550400, 'steps': 23699, 'loss/train': 1.6060470342636108} -08/30/2021 17:26:43 - INFO - __main__ - Step 23701: {'lr': 0.0004739436682524373, 'samples': 4550592, 'steps': 23700, 'loss/train': 1.7302641868591309} -08/30/2021 17:26:43 - INFO - __main__ - Step 23702: {'lr': 0.00047394130930944115, 'samples': 4550784, 'steps': 23701, 'loss/train': 1.2669318914413452} -08/30/2021 17:26:45 - INFO - __main__ - Step 23703: {'lr': 0.0004739389502655404, 'samples': 4550976, 'steps': 23702, 'loss/train': 1.8177402019500732} -08/30/2021 17:26:45 - INFO - __main__ - Step 23704: {'lr': 0.0004739365911207363, 'samples': 4551168, 'steps': 23703, 'loss/train': 1.7356849908828735} -08/30/2021 17:26:45 - INFO - __main__ - Step 23705: {'lr': 0.0004739342318750297, 'samples': 4551360, 'steps': 23704, 'loss/train': 2.165408134460449} -08/30/2021 17:26:46 - INFO - __main__ - Step 23706: {'lr': 0.00047393187252842183, 'samples': 4551552, 'steps': 23705, 'loss/train': 1.984107255935669} -08/30/2021 17:26:46 - INFO - __main__ - Step 23707: {'lr': 0.0004739295130809138, 'samples': 4551744, 'steps': 23706, 'loss/train': 1.9873802661895752} -08/30/2021 17:26:47 - INFO - __main__ - Step 23708: {'lr': 0.0004739271535325065, 'samples': 4551936, 'steps': 23707, 'loss/train': 1.2757214307785034} -08/30/2021 17:26:48 - INFO - __main__ - Step 23709: {'lr': 0.00047392479388320106, 'samples': 4552128, 'steps': 23708, 'loss/train': 1.105953574180603} -08/30/2021 17:26:48 - INFO - __main__ - Step 23710: {'lr': 0.0004739224341329987, 'samples': 4552320, 'steps': 23709, 'loss/train': 1.5607233047485352} -08/30/2021 17:26:49 - INFO - __main__ - Step 23711: {'lr': 0.0004739200742819002, 'samples': 4552512, 'steps': 23710, 'loss/train': 2.1628360748291016} -08/30/2021 17:26:49 - INFO - __main__ - Step 23712: {'lr': 0.0004739177143299068, 'samples': 4552704, 'steps': 23711, 'loss/train': 1.4729646444320679} -08/30/2021 17:26:49 - INFO - __main__ - Step 23713: {'lr': 0.00047391535427701966, 'samples': 4552896, 'steps': 23712, 'loss/train': 1.4183703660964966} -08/30/2021 17:26:51 - INFO - __main__ - Step 23714: {'lr': 0.0004739129941232396, 'samples': 4553088, 'steps': 23713, 'loss/train': 1.4096698760986328} -08/30/2021 17:26:51 - INFO - __main__ - Step 23715: {'lr': 0.0004739106338685678, 'samples': 4553280, 'steps': 23714, 'loss/train': 1.3374930620193481} -08/30/2021 17:26:52 - INFO - __main__ - Step 23716: {'lr': 0.00047390827351300537, 'samples': 4553472, 'steps': 23715, 'loss/train': 1.6537529230117798} -08/30/2021 17:26:52 - INFO - __main__ - Step 23717: {'lr': 0.00047390591305655327, 'samples': 4553664, 'steps': 23716, 'loss/train': 1.4693373441696167} -08/30/2021 17:26:52 - INFO - __main__ - Step 23718: {'lr': 0.0004739035524992127, 'samples': 4553856, 'steps': 23717, 'loss/train': 1.6239254474639893} -08/30/2021 17:26:54 - INFO - __main__ - Step 23719: {'lr': 0.00047390119184098455, 'samples': 4554048, 'steps': 23718, 'loss/train': 1.8840086460113525} -08/30/2021 17:26:55 - INFO - __main__ - Step 23720: {'lr': 0.00047389883108187004, 'samples': 4554240, 'steps': 23719, 'loss/train': 0.38106250762939453} -08/30/2021 17:26:55 - INFO - __main__ - Step 23721: {'lr': 0.00047389647022187014, 'samples': 4554432, 'steps': 23720, 'loss/train': 1.8415324687957764} -08/30/2021 17:26:55 - INFO - __main__ - Step 23722: {'lr': 0.000473894109260986, 'samples': 4554624, 'steps': 23721, 'loss/train': 1.9239407777786255} -08/30/2021 17:26:56 - INFO - __main__ - Step 23723: {'lr': 0.00047389174819921856, 'samples': 4554816, 'steps': 23722, 'loss/train': 0.0727807879447937} -08/30/2021 17:26:56 - INFO - __main__ - Step 23724: {'lr': 0.000473889387036569, 'samples': 4555008, 'steps': 23723, 'loss/train': 1.2444167137145996} -08/30/2021 17:26:57 - INFO - __main__ - Step 23725: {'lr': 0.0004738870257730383, 'samples': 4555200, 'steps': 23724, 'loss/train': 1.8511418104171753} -08/30/2021 17:26:58 - INFO - __main__ - Step 23726: {'lr': 0.00047388466440862755, 'samples': 4555392, 'steps': 23725, 'loss/train': 1.8768689632415771} -08/30/2021 17:26:58 - INFO - __main__ - Step 23727: {'lr': 0.0004738823029433379, 'samples': 4555584, 'steps': 23726, 'loss/train': 1.9509973526000977} -08/30/2021 17:26:59 - INFO - __main__ - Step 23728: {'lr': 0.0004738799413771703, 'samples': 4555776, 'steps': 23727, 'loss/train': 1.3229200839996338} -08/30/2021 17:26:59 - INFO - __main__ - Step 23729: {'lr': 0.0004738775797101258, 'samples': 4555968, 'steps': 23728, 'loss/train': 1.505495548248291} -08/30/2021 17:27:01 - INFO - __main__ - Step 23730: {'lr': 0.0004738752179422056, 'samples': 4556160, 'steps': 23729, 'loss/train': 1.695680022239685} -08/30/2021 17:27:01 - INFO - __main__ - Step 23731: {'lr': 0.00047387285607341064, 'samples': 4556352, 'steps': 23730, 'loss/train': 1.7703814506530762} -08/30/2021 17:27:01 - INFO - __main__ - Step 23732: {'lr': 0.00047387049410374207, 'samples': 4556544, 'steps': 23731, 'loss/train': 1.450698971748352} -08/30/2021 17:27:02 - INFO - __main__ - Step 23733: {'lr': 0.00047386813203320084, 'samples': 4556736, 'steps': 23732, 'loss/train': 1.589904546737671} -08/30/2021 17:27:02 - INFO - __main__ - Step 23734: {'lr': 0.0004738657698617881, 'samples': 4556928, 'steps': 23733, 'loss/train': 1.4130483865737915} -08/30/2021 17:27:05 - INFO - __main__ - Step 23735: {'lr': 0.00047386340758950494, 'samples': 4557120, 'steps': 23734, 'loss/train': 1.88881254196167} -08/30/2021 17:27:05 - INFO - __main__ - Step 23736: {'lr': 0.0004738610452163523, 'samples': 4557312, 'steps': 23735, 'loss/train': 2.1662113666534424} -08/30/2021 17:27:05 - INFO - __main__ - Step 23737: {'lr': 0.00047385868274233144, 'samples': 4557504, 'steps': 23736, 'loss/train': 2.7109947204589844} -08/30/2021 17:27:06 - INFO - __main__ - Step 23738: {'lr': 0.0004738563201674432, 'samples': 4557696, 'steps': 23737, 'loss/train': 1.4272804260253906} -08/30/2021 17:27:06 - INFO - __main__ - Step 23739: {'lr': 0.00047385395749168885, 'samples': 4557888, 'steps': 23738, 'loss/train': 1.6467515230178833} -08/30/2021 17:27:06 - INFO - __main__ - Step 23740: {'lr': 0.00047385159471506936, 'samples': 4558080, 'steps': 23739, 'loss/train': 1.569273829460144} -08/30/2021 17:27:08 - INFO - __main__ - Step 23741: {'lr': 0.00047384923183758573, 'samples': 4558272, 'steps': 23740, 'loss/train': 0.1312096118927002} -08/30/2021 17:27:09 - INFO - __main__ - Step 23742: {'lr': 0.0004738468688592391, 'samples': 4558464, 'steps': 23741, 'loss/train': 1.763966679573059} -08/30/2021 17:27:09 - INFO - __main__ - Step 23743: {'lr': 0.00047384450578003055, 'samples': 4558656, 'steps': 23742, 'loss/train': 1.6272128820419312} -08/30/2021 17:27:09 - INFO - __main__ - Step 23744: {'lr': 0.00047384214259996117, 'samples': 4558848, 'steps': 23743, 'loss/train': 1.6774150133132935} -08/30/2021 17:27:10 - INFO - __main__ - Step 23745: {'lr': 0.0004738397793190319, 'samples': 4559040, 'steps': 23744, 'loss/train': 1.3481712341308594} -08/30/2021 17:27:11 - INFO - __main__ - Step 23746: {'lr': 0.00047383741593724386, 'samples': 4559232, 'steps': 23745, 'loss/train': 1.5829099416732788} -08/30/2021 17:27:12 - INFO - __main__ - Step 23747: {'lr': 0.0004738350524545982, 'samples': 4559424, 'steps': 23746, 'loss/train': 1.2665964365005493} -08/30/2021 17:27:12 - INFO - __main__ - Step 23748: {'lr': 0.0004738326888710959, 'samples': 4559616, 'steps': 23747, 'loss/train': 1.731207013130188} -08/30/2021 17:27:12 - INFO - __main__ - Step 23749: {'lr': 0.000473830325186738, 'samples': 4559808, 'steps': 23748, 'loss/train': 1.6543854475021362} -08/30/2021 17:27:13 - INFO - __main__ - Step 23750: {'lr': 0.0004738279614015257, 'samples': 4560000, 'steps': 23749, 'loss/train': 1.592079758644104} -08/30/2021 17:27:15 - INFO - __main__ - Step 23751: {'lr': 0.0004738255975154599, 'samples': 4560192, 'steps': 23750, 'loss/train': 1.4464178085327148} -08/30/2021 17:27:15 - INFO - __main__ - Step 23752: {'lr': 0.0004738232335285417, 'samples': 4560384, 'steps': 23751, 'loss/train': 1.5318843126296997} -08/30/2021 17:27:16 - INFO - __main__ - Step 23753: {'lr': 0.0004738208694407723, 'samples': 4560576, 'steps': 23752, 'loss/train': 1.4185625314712524} -08/30/2021 17:27:16 - INFO - __main__ - Step 23754: {'lr': 0.00047381850525215265, 'samples': 4560768, 'steps': 23753, 'loss/train': 0.732387363910675} -08/30/2021 17:27:16 - INFO - __main__ - Step 23755: {'lr': 0.0004738161409626838, 'samples': 4560960, 'steps': 23754, 'loss/train': 0.6555193066596985} -08/30/2021 17:27:18 - INFO - __main__ - Step 23756: {'lr': 0.0004738137765723669, 'samples': 4561152, 'steps': 23755, 'loss/train': 1.698353886604309} -08/30/2021 17:27:18 - INFO - __main__ - Step 23757: {'lr': 0.0004738114120812029, 'samples': 4561344, 'steps': 23756, 'loss/train': 1.4144833087921143} -08/30/2021 17:27:19 - INFO - __main__ - Step 23758: {'lr': 0.000473809047489193, 'samples': 4561536, 'steps': 23757, 'loss/train': 1.623138189315796} -08/30/2021 17:27:19 - INFO - __main__ - Step 23759: {'lr': 0.00047380668279633814, 'samples': 4561728, 'steps': 23758, 'loss/train': 1.5347778797149658} -08/30/2021 17:27:19 - INFO - __main__ - Step 23760: {'lr': 0.00047380431800263945, 'samples': 4561920, 'steps': 23759, 'loss/train': 1.3153525590896606} -08/30/2021 17:27:20 - INFO - __main__ - Step 23761: {'lr': 0.000473801953108098, 'samples': 4562112, 'steps': 23760, 'loss/train': 1.927691102027893} -08/30/2021 17:27:21 - INFO - __main__ - Step 23762: {'lr': 0.0004737995881127149, 'samples': 4562304, 'steps': 23761, 'loss/train': 1.7205820083618164} -08/30/2021 17:27:22 - INFO - __main__ - Step 23763: {'lr': 0.0004737972230164911, 'samples': 4562496, 'steps': 23762, 'loss/train': 1.9505927562713623} -08/30/2021 17:27:22 - INFO - __main__ - Step 23764: {'lr': 0.0004737948578194278, 'samples': 4562688, 'steps': 23763, 'loss/train': 1.2602747678756714} -08/30/2021 17:27:22 - INFO - __main__ - Step 23765: {'lr': 0.00047379249252152585, 'samples': 4562880, 'steps': 23764, 'loss/train': 1.6362367868423462} -08/30/2021 17:27:23 - INFO - __main__ - Step 23766: {'lr': 0.00047379012712278656, 'samples': 4563072, 'steps': 23765, 'loss/train': 1.6800568103790283} -08/30/2021 17:27:24 - INFO - __main__ - Step 23767: {'lr': 0.0004737877616232108, 'samples': 4563264, 'steps': 23766, 'loss/train': 0.21542313694953918} -08/30/2021 17:27:25 - INFO - __main__ - Step 23768: {'lr': 0.0004737853960227998, 'samples': 4563456, 'steps': 23767, 'loss/train': 1.5183273553848267} -08/30/2021 17:27:25 - INFO - __main__ - Step 23769: {'lr': 0.00047378303032155454, 'samples': 4563648, 'steps': 23768, 'loss/train': 0.9760209918022156} -08/30/2021 17:27:25 - INFO - __main__ - Step 23770: {'lr': 0.0004737806645194761, 'samples': 4563840, 'steps': 23769, 'loss/train': 1.4840788841247559} -08/30/2021 17:27:26 - INFO - __main__ - Step 23771: {'lr': 0.00047377829861656556, 'samples': 4564032, 'steps': 23770, 'loss/train': 1.7820886373519897} -08/30/2021 17:27:27 - INFO - __main__ - Step 23772: {'lr': 0.000473775932612824, 'samples': 4564224, 'steps': 23771, 'loss/train': 2.6842691898345947} -08/30/2021 17:27:28 - INFO - __main__ - Step 23773: {'lr': 0.00047377356650825245, 'samples': 4564416, 'steps': 23772, 'loss/train': 1.359667420387268} -08/30/2021 17:27:28 - INFO - __main__ - Step 23774: {'lr': 0.00047377120030285194, 'samples': 4564608, 'steps': 23773, 'loss/train': 1.8385834693908691} -08/30/2021 17:27:29 - INFO - __main__ - Step 23775: {'lr': 0.0004737688339966235, 'samples': 4564800, 'steps': 23774, 'loss/train': 2.1206347942352295} -08/30/2021 17:27:29 - INFO - __main__ - Step 23776: {'lr': 0.00047376646758956844, 'samples': 4564992, 'steps': 23775, 'loss/train': 2.2828104496002197} -08/30/2021 17:27:31 - INFO - __main__ - Step 23777: {'lr': 0.00047376410108168756, 'samples': 4565184, 'steps': 23776, 'loss/train': 1.7378520965576172} -08/30/2021 17:27:31 - INFO - __main__ - Step 23778: {'lr': 0.0004737617344729821, 'samples': 4565376, 'steps': 23777, 'loss/train': 1.6882611513137817} -08/30/2021 17:27:31 - INFO - __main__ - Step 23779: {'lr': 0.00047375936776345297, 'samples': 4565568, 'steps': 23778, 'loss/train': 1.908403754234314} -08/30/2021 17:27:32 - INFO - __main__ - Step 23780: {'lr': 0.00047375700095310136, 'samples': 4565760, 'steps': 23779, 'loss/train': 1.5699435472488403} -08/30/2021 17:27:32 - INFO - __main__ - Step 23781: {'lr': 0.0004737546340419283, 'samples': 4565952, 'steps': 23780, 'loss/train': 1.626193881034851} -08/30/2021 17:27:34 - INFO - __main__ - Step 23782: {'lr': 0.0004737522670299349, 'samples': 4566144, 'steps': 23781, 'loss/train': 1.1423419713974} -08/30/2021 17:27:34 - INFO - __main__ - Step 23783: {'lr': 0.00047374989991712214, 'samples': 4566336, 'steps': 23782, 'loss/train': 1.3004885911941528} -08/30/2021 17:27:34 - INFO - __main__ - Step 23784: {'lr': 0.00047374753270349113, 'samples': 4566528, 'steps': 23783, 'loss/train': 0.8821494579315186} -08/30/2021 17:27:35 - INFO - __main__ - Step 23785: {'lr': 0.00047374516538904287, 'samples': 4566720, 'steps': 23784, 'loss/train': 1.9171324968338013} -08/30/2021 17:27:35 - INFO - __main__ - Step 23786: {'lr': 0.0004737427979737786, 'samples': 4566912, 'steps': 23785, 'loss/train': 0.9794736504554749} -08/30/2021 17:27:35 - INFO - __main__ - Step 23787: {'lr': 0.0004737404304576992, 'samples': 4567104, 'steps': 23786, 'loss/train': 1.1728854179382324} -08/30/2021 17:27:37 - INFO - __main__ - Step 23788: {'lr': 0.0004737380628408059, 'samples': 4567296, 'steps': 23787, 'loss/train': 1.5640099048614502} -08/30/2021 17:27:37 - INFO - __main__ - Step 23789: {'lr': 0.00047373569512309963, 'samples': 4567488, 'steps': 23788, 'loss/train': 1.8454991579055786} -08/30/2021 17:27:38 - INFO - __main__ - Step 23790: {'lr': 0.0004737333273045815, 'samples': 4567680, 'steps': 23789, 'loss/train': 1.1946204900741577} -08/30/2021 17:27:38 - INFO - __main__ - Step 23791: {'lr': 0.00047373095938525256, 'samples': 4567872, 'steps': 23790, 'loss/train': 1.8148601055145264} -08/30/2021 17:27:38 - INFO - __main__ - Step 23792: {'lr': 0.0004737285913651139, 'samples': 4568064, 'steps': 23791, 'loss/train': 1.5275744199752808} -08/30/2021 17:27:40 - INFO - __main__ - Step 23793: {'lr': 0.0004737262232441667, 'samples': 4568256, 'steps': 23792, 'loss/train': 1.3972017765045166} -08/30/2021 17:27:41 - INFO - __main__ - Step 23794: {'lr': 0.00047372385502241176, 'samples': 4568448, 'steps': 23793, 'loss/train': 2.057589054107666} -08/30/2021 17:27:41 - INFO - __main__ - Step 23795: {'lr': 0.0004737214866998504, 'samples': 4568640, 'steps': 23794, 'loss/train': 1.5424411296844482} -08/30/2021 17:27:42 - INFO - __main__ - Step 23796: {'lr': 0.0004737191182764836, 'samples': 4568832, 'steps': 23795, 'loss/train': 0.7936122417449951} -08/30/2021 17:27:42 - INFO - __main__ - Step 23797: {'lr': 0.0004737167497523124, 'samples': 4569024, 'steps': 23796, 'loss/train': 1.339007019996643} -08/30/2021 17:27:44 - INFO - __main__ - Step 23798: {'lr': 0.0004737143811273379, 'samples': 4569216, 'steps': 23797, 'loss/train': 1.971666693687439} -08/30/2021 17:27:44 - INFO - __main__ - Step 23799: {'lr': 0.0004737120124015611, 'samples': 4569408, 'steps': 23798, 'loss/train': 1.2081353664398193} -08/30/2021 17:27:44 - INFO - __main__ - Step 23800: {'lr': 0.00047370964357498313, 'samples': 4569600, 'steps': 23799, 'loss/train': 1.5187081098556519} -08/30/2021 17:27:45 - INFO - __main__ - Step 23801: {'lr': 0.0004737072746476051, 'samples': 4569792, 'steps': 23800, 'loss/train': 2.2719743251800537} -08/30/2021 17:27:45 - INFO - __main__ - Step 23802: {'lr': 0.00047370490561942795, 'samples': 4569984, 'steps': 23801, 'loss/train': 1.1148394346237183} -08/30/2021 17:27:45 - INFO - __main__ - Step 23803: {'lr': 0.00047370253649045286, 'samples': 4570176, 'steps': 23802, 'loss/train': 0.7776064872741699} -08/30/2021 17:27:47 - INFO - __main__ - Step 23804: {'lr': 0.00047370016726068086, 'samples': 4570368, 'steps': 23803, 'loss/train': 1.7910127639770508} -08/30/2021 17:27:47 - INFO - __main__ - Step 23805: {'lr': 0.000473697797930113, 'samples': 4570560, 'steps': 23804, 'loss/train': 1.3740880489349365} -08/30/2021 17:27:48 - INFO - __main__ - Step 23806: {'lr': 0.00047369542849875037, 'samples': 4570752, 'steps': 23805, 'loss/train': 0.9818909764289856} -08/30/2021 17:27:48 - INFO - __main__ - Step 23807: {'lr': 0.0004736930589665941, 'samples': 4570944, 'steps': 23806, 'loss/train': 1.7987041473388672} -08/30/2021 17:27:48 - INFO - __main__ - Step 23808: {'lr': 0.0004736906893336451, 'samples': 4571136, 'steps': 23807, 'loss/train': 1.6192020177841187} -08/30/2021 17:27:50 - INFO - __main__ - Step 23809: {'lr': 0.00047368831959990453, 'samples': 4571328, 'steps': 23808, 'loss/train': 1.2590991258621216} -08/30/2021 17:27:51 - INFO - __main__ - Step 23810: {'lr': 0.0004736859497653735, 'samples': 4571520, 'steps': 23809, 'loss/train': 1.176614761352539} -08/30/2021 17:27:51 - INFO - __main__ - Step 23811: {'lr': 0.0004736835798300531, 'samples': 4571712, 'steps': 23810, 'loss/train': 1.0427967309951782} -08/30/2021 17:27:52 - INFO - __main__ - Step 23812: {'lr': 0.00047368120979394415, 'samples': 4571904, 'steps': 23811, 'loss/train': 1.492321252822876} -08/30/2021 17:27:52 - INFO - __main__ - Step 23813: {'lr': 0.000473678839657048, 'samples': 4572096, 'steps': 23812, 'loss/train': 1.3117263317108154} -08/30/2021 17:27:52 - INFO - __main__ - Step 23814: {'lr': 0.0004736764694193656, 'samples': 4572288, 'steps': 23813, 'loss/train': 0.9067861437797546} -08/30/2021 17:27:54 - INFO - __main__ - Step 23815: {'lr': 0.0004736740990808981, 'samples': 4572480, 'steps': 23814, 'loss/train': 2.07078218460083} -08/30/2021 17:27:54 - INFO - __main__ - Step 23816: {'lr': 0.0004736717286416464, 'samples': 4572672, 'steps': 23815, 'loss/train': 1.5327759981155396} -08/30/2021 17:27:54 - INFO - __main__ - Step 23817: {'lr': 0.0004736693581016117, 'samples': 4572864, 'steps': 23816, 'loss/train': 1.7998594045639038} -08/30/2021 17:27:55 - INFO - __main__ - Step 23818: {'lr': 0.00047366698746079507, 'samples': 4573056, 'steps': 23817, 'loss/train': 1.7322137355804443} -08/30/2021 17:27:55 - INFO - __main__ - Step 23819: {'lr': 0.0004736646167191975, 'samples': 4573248, 'steps': 23818, 'loss/train': 1.8632237911224365} -08/30/2021 17:27:57 - INFO - __main__ - Step 23820: {'lr': 0.00047366224587682017, 'samples': 4573440, 'steps': 23819, 'loss/train': 1.5942620038986206} -08/30/2021 17:27:57 - INFO - __main__ - Step 23821: {'lr': 0.000473659874933664, 'samples': 4573632, 'steps': 23820, 'loss/train': 1.4017938375473022} -08/30/2021 17:27:57 - INFO - __main__ - Step 23822: {'lr': 0.0004736575038897303, 'samples': 4573824, 'steps': 23821, 'loss/train': 1.2695995569229126} -08/30/2021 17:27:58 - INFO - __main__ - Step 23823: {'lr': 0.0004736551327450198, 'samples': 4574016, 'steps': 23822, 'loss/train': 1.5489740371704102} -08/30/2021 17:27:58 - INFO - __main__ - Step 23824: {'lr': 0.00047365276149953387, 'samples': 4574208, 'steps': 23823, 'loss/train': 1.4475749731063843} -08/30/2021 17:28:00 - INFO - __main__ - Step 23825: {'lr': 0.0004736503901532734, 'samples': 4574400, 'steps': 23824, 'loss/train': 1.526062250137329} -08/30/2021 17:28:00 - INFO - __main__ - Step 23826: {'lr': 0.00047364801870623954, 'samples': 4574592, 'steps': 23825, 'loss/train': 1.7532002925872803} -08/30/2021 17:28:00 - INFO - __main__ - Step 23827: {'lr': 0.00047364564715843326, 'samples': 4574784, 'steps': 23826, 'loss/train': 1.91557776927948} -08/30/2021 17:28:01 - INFO - __main__ - Step 23828: {'lr': 0.00047364327550985575, 'samples': 4574976, 'steps': 23827, 'loss/train': 2.0333333015441895} -08/30/2021 17:28:01 - INFO - __main__ - Step 23829: {'lr': 0.00047364090376050805, 'samples': 4575168, 'steps': 23828, 'loss/train': 1.6888744831085205} -08/30/2021 17:28:03 - INFO - __main__ - Step 23830: {'lr': 0.0004736385319103912, 'samples': 4575360, 'steps': 23829, 'loss/train': 1.4075181484222412} -08/30/2021 17:28:03 - INFO - __main__ - Step 23831: {'lr': 0.00047363615995950624, 'samples': 4575552, 'steps': 23830, 'loss/train': 1.7036877870559692} -08/30/2021 17:28:03 - INFO - __main__ - Step 23832: {'lr': 0.0004736337879078544, 'samples': 4575744, 'steps': 23831, 'loss/train': 1.2392202615737915} -08/30/2021 17:28:04 - INFO - __main__ - Step 23833: {'lr': 0.0004736314157554365, 'samples': 4575936, 'steps': 23832, 'loss/train': 1.7700579166412354} -08/30/2021 17:28:04 - INFO - __main__ - Step 23834: {'lr': 0.00047362904350225376, 'samples': 4576128, 'steps': 23833, 'loss/train': 0.9120385646820068} -08/30/2021 17:28:06 - INFO - __main__ - Step 23835: {'lr': 0.0004736266711483073, 'samples': 4576320, 'steps': 23834, 'loss/train': 0.18678513169288635} -08/30/2021 17:28:06 - INFO - __main__ - Step 23836: {'lr': 0.00047362429869359803, 'samples': 4576512, 'steps': 23835, 'loss/train': 1.412263035774231} -08/30/2021 17:28:07 - INFO - __main__ - Step 23837: {'lr': 0.0004736219261381271, 'samples': 4576704, 'steps': 23836, 'loss/train': 1.8080602884292603} -08/30/2021 17:28:07 - INFO - __main__ - Step 23838: {'lr': 0.0004736195534818956, 'samples': 4576896, 'steps': 23837, 'loss/train': 0.12009059637784958} -08/30/2021 17:28:07 - INFO - __main__ - Step 23839: {'lr': 0.00047361718072490457, 'samples': 4577088, 'steps': 23838, 'loss/train': 1.80378258228302} -08/30/2021 17:28:09 - INFO - __main__ - Step 23840: {'lr': 0.00047361480786715514, 'samples': 4577280, 'steps': 23839, 'loss/train': 1.8580217361450195} -08/30/2021 17:28:10 - INFO - __main__ - Step 23841: {'lr': 0.00047361243490864826, 'samples': 4577472, 'steps': 23840, 'loss/train': 1.0173853635787964} -08/30/2021 17:28:10 - INFO - __main__ - Step 23842: {'lr': 0.00047361006184938517, 'samples': 4577664, 'steps': 23841, 'loss/train': 1.4172651767730713} -08/30/2021 17:28:10 - INFO - __main__ - Step 23843: {'lr': 0.00047360768868936673, 'samples': 4577856, 'steps': 23842, 'loss/train': 0.18533694744110107} -08/30/2021 17:28:11 - INFO - __main__ - Step 23844: {'lr': 0.00047360531542859415, 'samples': 4578048, 'steps': 23843, 'loss/train': 2.061516046524048} -08/30/2021 17:28:11 - INFO - __main__ - Step 23845: {'lr': 0.00047360294206706845, 'samples': 4578240, 'steps': 23844, 'loss/train': 2.084402084350586} -08/30/2021 17:28:13 - INFO - __main__ - Step 23846: {'lr': 0.0004736005686047907, 'samples': 4578432, 'steps': 23845, 'loss/train': 1.6754575967788696} -08/30/2021 17:28:14 - INFO - __main__ - Step 23847: {'lr': 0.000473598195041762, 'samples': 4578624, 'steps': 23846, 'loss/train': 1.7514890432357788} -08/30/2021 17:28:14 - INFO - __main__ - Step 23848: {'lr': 0.0004735958213779835, 'samples': 4578816, 'steps': 23847, 'loss/train': 1.93454909324646} -08/30/2021 17:28:14 - INFO - __main__ - Step 23849: {'lr': 0.0004735934476134561, 'samples': 4579008, 'steps': 23848, 'loss/train': 1.8268200159072876} -08/30/2021 17:28:15 - INFO - __main__ - Step 23850: {'lr': 0.0004735910737481809, 'samples': 4579200, 'steps': 23849, 'loss/train': 1.6639269590377808} -08/30/2021 17:28:16 - INFO - __main__ - Step 23851: {'lr': 0.0004735886997821591, 'samples': 4579392, 'steps': 23850, 'loss/train': 1.5180392265319824} -08/30/2021 17:28:17 - INFO - __main__ - Step 23852: {'lr': 0.00047358632571539163, 'samples': 4579584, 'steps': 23851, 'loss/train': 1.6867505311965942} -08/30/2021 17:28:17 - INFO - __main__ - Step 23853: {'lr': 0.0004735839515478796, 'samples': 4579776, 'steps': 23852, 'loss/train': 1.8900582790374756} -08/30/2021 17:28:18 - INFO - __main__ - Step 23854: {'lr': 0.0004735815772796241, 'samples': 4579968, 'steps': 23853, 'loss/train': 1.4159471988677979} -08/30/2021 17:28:18 - INFO - __main__ - Step 23855: {'lr': 0.0004735792029106262, 'samples': 4580160, 'steps': 23854, 'loss/train': 1.7847771644592285} -08/30/2021 17:28:19 - INFO - __main__ - Step 23856: {'lr': 0.0004735768284408869, 'samples': 4580352, 'steps': 23855, 'loss/train': 1.3962061405181885} -08/30/2021 17:28:20 - INFO - __main__ - Step 23857: {'lr': 0.00047357445387040745, 'samples': 4580544, 'steps': 23856, 'loss/train': 1.7047101259231567} -08/30/2021 17:28:20 - INFO - __main__ - Step 23858: {'lr': 0.0004735720791991887, 'samples': 4580736, 'steps': 23857, 'loss/train': 1.3259724378585815} -08/30/2021 17:28:20 - INFO - __main__ - Step 23859: {'lr': 0.00047356970442723184, 'samples': 4580928, 'steps': 23858, 'loss/train': 1.4971916675567627} -08/30/2021 17:28:21 - INFO - __main__ - Step 23860: {'lr': 0.00047356732955453794, 'samples': 4581120, 'steps': 23859, 'loss/train': 1.8438758850097656} -08/30/2021 17:28:21 - INFO - __main__ - Step 23861: {'lr': 0.00047356495458110806, 'samples': 4581312, 'steps': 23860, 'loss/train': 1.6122157573699951} -08/30/2021 17:28:23 - INFO - __main__ - Step 23862: {'lr': 0.00047356257950694326, 'samples': 4581504, 'steps': 23861, 'loss/train': 1.2520089149475098} -08/30/2021 17:28:23 - INFO - __main__ - Step 23863: {'lr': 0.0004735602043320446, 'samples': 4581696, 'steps': 23862, 'loss/train': 0.912713885307312} -08/30/2021 17:28:24 - INFO - __main__ - Step 23864: {'lr': 0.0004735578290564132, 'samples': 4581888, 'steps': 23863, 'loss/train': 2.071293830871582} -08/30/2021 17:28:24 - INFO - __main__ - Step 23865: {'lr': 0.00047355545368005003, 'samples': 4582080, 'steps': 23864, 'loss/train': 0.1382804811000824} -08/30/2021 17:28:24 - INFO - __main__ - Step 23866: {'lr': 0.00047355307820295625, 'samples': 4582272, 'steps': 23865, 'loss/train': 0.18995091319084167} -08/30/2021 17:28:25 - INFO - __main__ - Step 23867: {'lr': 0.00047355070262513287, 'samples': 4582464, 'steps': 23866, 'loss/train': 0.23722438514232635} -08/30/2021 17:28:26 - INFO - __main__ - Step 23868: {'lr': 0.00047354832694658104, 'samples': 4582656, 'steps': 23867, 'loss/train': 1.927314043045044} -08/30/2021 17:28:27 - INFO - __main__ - Step 23869: {'lr': 0.0004735459511673018, 'samples': 4582848, 'steps': 23868, 'loss/train': 1.8384425640106201} -08/30/2021 17:28:27 - INFO - __main__ - Step 23870: {'lr': 0.0004735435752872962, 'samples': 4583040, 'steps': 23869, 'loss/train': 1.5113917589187622} -08/30/2021 17:28:27 - INFO - __main__ - Step 23871: {'lr': 0.00047354119930656524, 'samples': 4583232, 'steps': 23870, 'loss/train': 1.3223645687103271} -08/30/2021 17:28:28 - INFO - __main__ - Step 23872: {'lr': 0.0004735388232251101, 'samples': 4583424, 'steps': 23871, 'loss/train': 1.503225326538086} -08/30/2021 17:28:29 - INFO - __main__ - Step 23873: {'lr': 0.00047353644704293185, 'samples': 4583616, 'steps': 23872, 'loss/train': 1.4452446699142456} -08/30/2021 17:28:30 - INFO - __main__ - Step 23874: {'lr': 0.0004735340707600315, 'samples': 4583808, 'steps': 23873, 'loss/train': 1.406503438949585} -08/30/2021 17:28:30 - INFO - __main__ - Step 23875: {'lr': 0.0004735316943764102, 'samples': 4584000, 'steps': 23874, 'loss/train': 1.6812968254089355} -08/30/2021 17:28:30 - INFO - __main__ - Step 23876: {'lr': 0.0004735293178920689, 'samples': 4584192, 'steps': 23875, 'loss/train': 2.136699914932251} -08/30/2021 17:28:31 - INFO - __main__ - Step 23877: {'lr': 0.00047352694130700873, 'samples': 4584384, 'steps': 23876, 'loss/train': 0.8547267913818359} -08/30/2021 17:28:32 - INFO - __main__ - Step 23878: {'lr': 0.00047352456462123086, 'samples': 4584576, 'steps': 23877, 'loss/train': 1.6009595394134521} -08/30/2021 17:28:33 - INFO - __main__ - Step 23879: {'lr': 0.00047352218783473614, 'samples': 4584768, 'steps': 23878, 'loss/train': 0.06502050906419754} -08/30/2021 17:28:33 - INFO - __main__ - Step 23880: {'lr': 0.0004735198109475258, 'samples': 4584960, 'steps': 23879, 'loss/train': 2.0369484424591064} -08/30/2021 17:28:34 - INFO - __main__ - Step 23881: {'lr': 0.000473517433959601, 'samples': 4585152, 'steps': 23880, 'loss/train': 1.5942567586898804} -08/30/2021 17:28:34 - INFO - __main__ - Step 23882: {'lr': 0.00047351505687096257, 'samples': 4585344, 'steps': 23881, 'loss/train': 2.0245325565338135} -08/30/2021 17:28:36 - INFO - __main__ - Step 23883: {'lr': 0.00047351267968161176, 'samples': 4585536, 'steps': 23882, 'loss/train': 1.6382445096969604} -08/30/2021 17:28:36 - INFO - __main__ - Step 23884: {'lr': 0.0004735103023915496, 'samples': 4585728, 'steps': 23883, 'loss/train': 1.2688628435134888} -08/30/2021 17:28:37 - INFO - __main__ - Step 23885: {'lr': 0.0004735079250007771, 'samples': 4585920, 'steps': 23884, 'loss/train': 1.2023228406906128} -08/30/2021 17:28:37 - INFO - __main__ - Step 23886: {'lr': 0.00047350554750929543, 'samples': 4586112, 'steps': 23885, 'loss/train': 1.6293264627456665} -08/30/2021 17:28:37 - INFO - __main__ - Step 23887: {'lr': 0.0004735031699171055, 'samples': 4586304, 'steps': 23886, 'loss/train': 1.5460349321365356} -08/30/2021 17:28:39 - INFO - __main__ - Step 23888: {'lr': 0.0004735007922242086, 'samples': 4586496, 'steps': 23887, 'loss/train': 0.10107112675905228} -08/30/2021 17:28:39 - INFO - __main__ - Step 23889: {'lr': 0.0004734984144306057, 'samples': 4586688, 'steps': 23888, 'loss/train': 1.457375168800354} -08/30/2021 17:28:40 - INFO - __main__ - Step 23890: {'lr': 0.0004734960365362978, 'samples': 4586880, 'steps': 23889, 'loss/train': 1.3192206621170044} -08/30/2021 17:28:40 - INFO - __main__ - Step 23891: {'lr': 0.0004734936585412861, 'samples': 4587072, 'steps': 23890, 'loss/train': 1.0279250144958496} -08/30/2021 17:28:40 - INFO - __main__ - Step 23892: {'lr': 0.00047349128044557153, 'samples': 4587264, 'steps': 23891, 'loss/train': 1.7531778812408447} -08/30/2021 17:28:42 - INFO - __main__ - Step 23893: {'lr': 0.0004734889022491553, 'samples': 4587456, 'steps': 23892, 'loss/train': 1.7402050495147705} -08/30/2021 17:28:42 - INFO - __main__ - Step 23894: {'lr': 0.0004734865239520384, 'samples': 4587648, 'steps': 23893, 'loss/train': 1.4512770175933838} -08/30/2021 17:28:42 - INFO - __main__ - Step 23895: {'lr': 0.0004734841455542219, 'samples': 4587840, 'steps': 23894, 'loss/train': 1.7012555599212646} -08/30/2021 17:28:43 - INFO - __main__ - Step 23896: {'lr': 0.0004734817670557069, 'samples': 4588032, 'steps': 23895, 'loss/train': 0.9944023489952087} -08/30/2021 17:28:43 - INFO - __main__ - Step 23897: {'lr': 0.00047347938845649447, 'samples': 4588224, 'steps': 23896, 'loss/train': 1.2406022548675537} -08/30/2021 17:28:45 - INFO - __main__ - Step 23898: {'lr': 0.0004734770097565857, 'samples': 4588416, 'steps': 23897, 'loss/train': 1.8092373609542847} -08/30/2021 17:28:45 - INFO - __main__ - Step 23899: {'lr': 0.00047347463095598157, 'samples': 4588608, 'steps': 23898, 'loss/train': 2.0713953971862793} -08/30/2021 17:28:45 - INFO - __main__ - Step 23900: {'lr': 0.00047347225205468323, 'samples': 4588800, 'steps': 23899, 'loss/train': 1.4054807424545288} -08/30/2021 17:28:46 - INFO - __main__ - Step 23901: {'lr': 0.00047346987305269184, 'samples': 4588992, 'steps': 23900, 'loss/train': 1.2611148357391357} -08/30/2021 17:28:46 - INFO - __main__ - Step 23902: {'lr': 0.0004734674939500083, 'samples': 4589184, 'steps': 23901, 'loss/train': 1.083526372909546} -08/30/2021 17:28:46 - INFO - __main__ - Step 23903: {'lr': 0.0004734651147466338, 'samples': 4589376, 'steps': 23902, 'loss/train': 1.7088778018951416} -08/30/2021 17:28:48 - INFO - __main__ - Step 23904: {'lr': 0.00047346273544256927, 'samples': 4589568, 'steps': 23903, 'loss/train': 0.4893910884857178} -08/30/2021 17:28:49 - INFO - __main__ - Step 23905: {'lr': 0.00047346035603781597, 'samples': 4589760, 'steps': 23904, 'loss/train': 1.1126079559326172} -08/30/2021 17:28:49 - INFO - __main__ - Step 23906: {'lr': 0.00047345797653237486, 'samples': 4589952, 'steps': 23905, 'loss/train': 1.494066834449768} -08/30/2021 17:28:50 - INFO - __main__ - Step 23907: {'lr': 0.000473455596926247, 'samples': 4590144, 'steps': 23906, 'loss/train': 1.458207607269287} -08/30/2021 17:28:50 - INFO - __main__ - Step 23908: {'lr': 0.0004734532172194335, 'samples': 4590336, 'steps': 23907, 'loss/train': 1.5953456163406372} -08/30/2021 17:28:51 - INFO - __main__ - Step 23909: {'lr': 0.0004734508374119355, 'samples': 4590528, 'steps': 23908, 'loss/train': 1.9063292741775513} -08/30/2021 17:28:52 - INFO - __main__ - Step 23910: {'lr': 0.0004734484575037539, 'samples': 4590720, 'steps': 23909, 'loss/train': 1.5804921388626099} -08/30/2021 17:28:52 - INFO - __main__ - Step 23911: {'lr': 0.00047344607749489, 'samples': 4590912, 'steps': 23910, 'loss/train': 1.5822813510894775} -08/30/2021 17:28:53 - INFO - __main__ - Step 23912: {'lr': 0.00047344369738534466, 'samples': 4591104, 'steps': 23911, 'loss/train': 1.5705474615097046} -08/30/2021 17:28:53 - INFO - __main__ - Step 23913: {'lr': 0.000473441317175119, 'samples': 4591296, 'steps': 23912, 'loss/train': 2.1579926013946533} -08/30/2021 17:28:54 - INFO - __main__ - Step 23914: {'lr': 0.0004734389368642142, 'samples': 4591488, 'steps': 23913, 'loss/train': 1.5677502155303955} -08/30/2021 17:28:55 - INFO - __main__ - Step 23915: {'lr': 0.0004734365564526313, 'samples': 4591680, 'steps': 23914, 'loss/train': 1.2844774723052979} -08/30/2021 17:28:55 - INFO - __main__ - Step 23916: {'lr': 0.00047343417594037117, 'samples': 4591872, 'steps': 23915, 'loss/train': 1.2457770109176636} -08/30/2021 17:28:56 - INFO - __main__ - Step 23917: {'lr': 0.00047343179532743516, 'samples': 4592064, 'steps': 23916, 'loss/train': 1.7153592109680176} -08/30/2021 17:28:56 - INFO - __main__ - Step 23918: {'lr': 0.00047342941461382427, 'samples': 4592256, 'steps': 23917, 'loss/train': 1.7542444467544556} -08/30/2021 17:28:58 - INFO - __main__ - Step 23919: {'lr': 0.0004734270337995395, 'samples': 4592448, 'steps': 23918, 'loss/train': 1.5001026391983032} -08/30/2021 17:28:58 - INFO - __main__ - Step 23920: {'lr': 0.0004734246528845819, 'samples': 4592640, 'steps': 23919, 'loss/train': 1.0851719379425049} -08/30/2021 17:28:58 - INFO - __main__ - Step 23921: {'lr': 0.0004734222718689527, 'samples': 4592832, 'steps': 23920, 'loss/train': 1.639939308166504} -08/30/2021 17:28:59 - INFO - __main__ - Step 23922: {'lr': 0.0004734198907526528, 'samples': 4593024, 'steps': 23921, 'loss/train': 1.6189429759979248} -08/30/2021 17:28:59 - INFO - __main__ - Step 23923: {'lr': 0.00047341750953568335, 'samples': 4593216, 'steps': 23922, 'loss/train': 1.2667911052703857} -08/30/2021 17:29:01 - INFO - __main__ - Step 23924: {'lr': 0.0004734151282180454, 'samples': 4593408, 'steps': 23923, 'loss/train': 1.7822493314743042} -08/30/2021 17:29:01 - INFO - __main__ - Step 23925: {'lr': 0.0004734127467997401, 'samples': 4593600, 'steps': 23924, 'loss/train': 1.4168741703033447} -08/30/2021 17:29:01 - INFO - __main__ - Step 23926: {'lr': 0.0004734103652807684, 'samples': 4593792, 'steps': 23925, 'loss/train': 1.5136585235595703} -08/30/2021 17:29:02 - INFO - __main__ - Step 23927: {'lr': 0.0004734079836611315, 'samples': 4593984, 'steps': 23926, 'loss/train': 1.656827688217163} -08/30/2021 17:29:02 - INFO - __main__ - Step 23928: {'lr': 0.0004734056019408304, 'samples': 4594176, 'steps': 23927, 'loss/train': 1.1633803844451904} -08/30/2021 17:29:04 - INFO - __main__ - Step 23929: {'lr': 0.00047340322011986614, 'samples': 4594368, 'steps': 23928, 'loss/train': 1.5292781591415405} -08/30/2021 17:29:04 - INFO - __main__ - Step 23930: {'lr': 0.0004734008381982399, 'samples': 4594560, 'steps': 23929, 'loss/train': 1.594104290008545} -08/30/2021 17:29:05 - INFO - __main__ - Step 23931: {'lr': 0.0004733984561759527, 'samples': 4594752, 'steps': 23930, 'loss/train': 0.07521896809339523} -08/30/2021 17:29:05 - INFO - __main__ - Step 23932: {'lr': 0.0004733960740530055, 'samples': 4594944, 'steps': 23931, 'loss/train': 0.9714577198028564} -08/30/2021 17:29:05 - INFO - __main__ - Step 23933: {'lr': 0.0004733936918293995, 'samples': 4595136, 'steps': 23932, 'loss/train': 1.1091326475143433} -08/30/2021 17:29:06 - INFO - __main__ - Step 23934: {'lr': 0.0004733913095051358, 'samples': 4595328, 'steps': 23933, 'loss/train': 1.7921544313430786} -08/30/2021 17:29:07 - INFO - __main__ - Step 23935: {'lr': 0.0004733889270802154, 'samples': 4595520, 'steps': 23934, 'loss/train': 1.0680391788482666} -08/30/2021 17:29:08 - INFO - __main__ - Step 23936: {'lr': 0.00047338654455463935, 'samples': 4595712, 'steps': 23935, 'loss/train': 1.6875224113464355} -08/30/2021 17:29:08 - INFO - __main__ - Step 23937: {'lr': 0.00047338416192840887, 'samples': 4595904, 'steps': 23936, 'loss/train': 0.544355034828186} -08/30/2021 17:29:08 - INFO - __main__ - Step 23938: {'lr': 0.0004733817792015249, 'samples': 4596096, 'steps': 23937, 'loss/train': 1.8118723630905151} -08/30/2021 17:29:09 - INFO - __main__ - Step 23939: {'lr': 0.00047337939637398855, 'samples': 4596288, 'steps': 23938, 'loss/train': 0.7021389603614807} -08/30/2021 17:29:10 - INFO - __main__ - Step 23940: {'lr': 0.0004733770134458009, 'samples': 4596480, 'steps': 23939, 'loss/train': 1.6260449886322021} -08/30/2021 17:29:11 - INFO - __main__ - Step 23941: {'lr': 0.0004733746304169629, 'samples': 4596672, 'steps': 23940, 'loss/train': 1.067652702331543} -08/30/2021 17:29:11 - INFO - __main__ - Step 23942: {'lr': 0.0004733722472874759, 'samples': 4596864, 'steps': 23941, 'loss/train': 0.08660119771957397} -08/30/2021 17:29:12 - INFO - __main__ - Step 23943: {'lr': 0.0004733698640573407, 'samples': 4597056, 'steps': 23942, 'loss/train': 0.7692243456840515} -08/30/2021 17:29:12 - INFO - __main__ - Step 23944: {'lr': 0.0004733674807265585, 'samples': 4597248, 'steps': 23943, 'loss/train': 1.3763090372085571} -08/30/2021 17:29:14 - INFO - __main__ - Step 23945: {'lr': 0.0004733650972951304, 'samples': 4597440, 'steps': 23944, 'loss/train': 1.3232545852661133} -08/30/2021 17:29:14 - INFO - __main__ - Step 23946: {'lr': 0.0004733627137630574, 'samples': 4597632, 'steps': 23945, 'loss/train': 1.1721309423446655} -08/30/2021 17:29:14 - INFO - __main__ - Step 23947: {'lr': 0.00047336033013034063, 'samples': 4597824, 'steps': 23946, 'loss/train': 0.9328784346580505} -08/30/2021 17:29:15 - INFO - __main__ - Step 23948: {'lr': 0.00047335794639698117, 'samples': 4598016, 'steps': 23947, 'loss/train': 1.1213229894638062} -08/30/2021 17:29:15 - INFO - __main__ - Step 23949: {'lr': 0.00047335556256298, 'samples': 4598208, 'steps': 23948, 'loss/train': 1.6727445125579834} -08/30/2021 17:29:17 - INFO - __main__ - Step 23950: {'lr': 0.0004733531786283383, 'samples': 4598400, 'steps': 23949, 'loss/train': 1.4021284580230713} -08/30/2021 17:29:17 - INFO - __main__ - Step 23951: {'lr': 0.0004733507945930571, 'samples': 4598592, 'steps': 23950, 'loss/train': 1.8878673315048218} -08/30/2021 17:29:18 - INFO - __main__ - Step 23952: {'lr': 0.0004733484104571375, 'samples': 4598784, 'steps': 23951, 'loss/train': 1.5105644464492798} -08/30/2021 17:29:18 - INFO - __main__ - Step 23953: {'lr': 0.0004733460262205805, 'samples': 4598976, 'steps': 23952, 'loss/train': 2.0807597637176514} -08/30/2021 17:29:18 - INFO - __main__ - Step 23954: {'lr': 0.00047334364188338725, 'samples': 4599168, 'steps': 23953, 'loss/train': 1.6940207481384277} -08/30/2021 17:29:20 - INFO - __main__ - Step 23955: {'lr': 0.0004733412574455588, 'samples': 4599360, 'steps': 23954, 'loss/train': 1.5082449913024902} -08/30/2021 17:29:21 - INFO - __main__ - Step 23956: {'lr': 0.00047333887290709623, 'samples': 4599552, 'steps': 23955, 'loss/train': 1.1699519157409668} -08/30/2021 17:29:21 - INFO - __main__ - Step 23957: {'lr': 0.00047333648826800056, 'samples': 4599744, 'steps': 23956, 'loss/train': 1.5576560497283936} -08/30/2021 17:29:21 - INFO - __main__ - Step 23958: {'lr': 0.000473334103528273, 'samples': 4599936, 'steps': 23957, 'loss/train': 1.5029267072677612} -08/30/2021 17:29:22 - INFO - __main__ - Step 23959: {'lr': 0.00047333171868791453, 'samples': 4600128, 'steps': 23958, 'loss/train': 1.5009058713912964} -08/30/2021 17:29:23 - INFO - __main__ - Step 23960: {'lr': 0.00047332933374692623, 'samples': 4600320, 'steps': 23959, 'loss/train': 1.3994954824447632} -08/30/2021 17:29:24 - INFO - __main__ - Step 23961: {'lr': 0.0004733269487053091, 'samples': 4600512, 'steps': 23960, 'loss/train': 1.5259203910827637} -08/30/2021 17:29:24 - INFO - __main__ - Step 23962: {'lr': 0.0004733245635630644, 'samples': 4600704, 'steps': 23961, 'loss/train': 1.4005982875823975} -08/30/2021 17:29:24 - INFO - __main__ - Step 23963: {'lr': 0.000473322178320193, 'samples': 4600896, 'steps': 23962, 'loss/train': 1.6762452125549316} -08/30/2021 17:29:25 - INFO - __main__ - Step 23964: {'lr': 0.0004733197929766961, 'samples': 4601088, 'steps': 23963, 'loss/train': 1.6293858289718628} -08/30/2021 17:29:26 - INFO - __main__ - Step 23965: {'lr': 0.0004733174075325748, 'samples': 4601280, 'steps': 23964, 'loss/train': 1.3817896842956543} -08/30/2021 17:29:27 - INFO - __main__ - Step 23966: {'lr': 0.0004733150219878301, 'samples': 4601472, 'steps': 23965, 'loss/train': 1.376197099685669} -08/30/2021 17:29:27 - INFO - __main__ - Step 23967: {'lr': 0.00047331263634246314, 'samples': 4601664, 'steps': 23966, 'loss/train': 1.2290537357330322} -08/30/2021 17:29:27 - INFO - __main__ - Step 23968: {'lr': 0.0004733102505964749, 'samples': 4601856, 'steps': 23967, 'loss/train': 1.452670931816101} -08/30/2021 17:29:28 - INFO - __main__ - Step 23969: {'lr': 0.00047330786474986645, 'samples': 4602048, 'steps': 23968, 'loss/train': 1.2899892330169678} -08/30/2021 17:29:29 - INFO - __main__ - Step 23970: {'lr': 0.00047330547880263896, 'samples': 4602240, 'steps': 23969, 'loss/train': 1.491136908531189} -08/30/2021 17:29:30 - INFO - __main__ - Step 23971: {'lr': 0.00047330309275479354, 'samples': 4602432, 'steps': 23970, 'loss/train': 1.4215087890625} -08/30/2021 17:29:30 - INFO - __main__ - Step 23972: {'lr': 0.00047330070660633113, 'samples': 4602624, 'steps': 23971, 'loss/train': 1.8291187286376953} -08/30/2021 17:29:30 - INFO - __main__ - Step 23973: {'lr': 0.00047329832035725286, 'samples': 4602816, 'steps': 23972, 'loss/train': 1.5089482069015503} -08/30/2021 17:29:31 - INFO - __main__ - Step 23974: {'lr': 0.0004732959340075598, 'samples': 4603008, 'steps': 23973, 'loss/train': 1.8125065565109253} -08/30/2021 17:29:32 - INFO - __main__ - Step 23975: {'lr': 0.0004732935475572531, 'samples': 4603200, 'steps': 23974, 'loss/train': 1.5856719017028809} -08/30/2021 17:29:33 - INFO - __main__ - Step 23976: {'lr': 0.00047329116100633373, 'samples': 4603392, 'steps': 23975, 'loss/train': 2.2570695877075195} -08/30/2021 17:29:33 - INFO - __main__ - Step 23977: {'lr': 0.0004732887743548028, 'samples': 4603584, 'steps': 23976, 'loss/train': 1.0739967823028564} -08/30/2021 17:29:33 - INFO - __main__ - Step 23978: {'lr': 0.0004732863876026614, 'samples': 4603776, 'steps': 23977, 'loss/train': 1.5266087055206299} -08/30/2021 17:29:34 - INFO - __main__ - Step 23979: {'lr': 0.00047328400074991064, 'samples': 4603968, 'steps': 23978, 'loss/train': 0.9839372038841248} -08/30/2021 17:29:34 - INFO - __main__ - Step 23980: {'lr': 0.00047328161379655155, 'samples': 4604160, 'steps': 23979, 'loss/train': 0.6058788895606995} -08/30/2021 17:29:35 - INFO - __main__ - Step 23981: {'lr': 0.00047327922674258516, 'samples': 4604352, 'steps': 23980, 'loss/train': 1.6976488828659058} -08/30/2021 17:29:36 - INFO - __main__ - Step 23982: {'lr': 0.00047327683958801257, 'samples': 4604544, 'steps': 23981, 'loss/train': 1.3941693305969238} -08/30/2021 17:29:36 - INFO - __main__ - Step 23983: {'lr': 0.00047327445233283496, 'samples': 4604736, 'steps': 23982, 'loss/train': 1.415250539779663} -08/30/2021 17:29:37 - INFO - __main__ - Step 23984: {'lr': 0.0004732720649770533, 'samples': 4604928, 'steps': 23983, 'loss/train': 1.7057350873947144} -08/30/2021 17:29:37 - INFO - __main__ - Step 23985: {'lr': 0.00047326967752066876, 'samples': 4605120, 'steps': 23984, 'loss/train': 1.5120905637741089} -08/30/2021 17:29:39 - INFO - __main__ - Step 23986: {'lr': 0.0004732672899636822, 'samples': 4605312, 'steps': 23985, 'loss/train': 1.9327870607376099} -08/30/2021 17:29:40 - INFO - __main__ - Step 23987: {'lr': 0.00047326490230609495, 'samples': 4605504, 'steps': 23986, 'loss/train': 1.3406269550323486} -08/30/2021 17:29:40 - INFO - __main__ - Step 23988: {'lr': 0.000473262514547908, 'samples': 4605696, 'steps': 23987, 'loss/train': 0.6682289838790894} -08/30/2021 17:29:41 - INFO - __main__ - Step 23989: {'lr': 0.00047326012668912233, 'samples': 4605888, 'steps': 23988, 'loss/train': 0.570551335811615} -08/30/2021 17:29:41 - INFO - __main__ - Step 23990: {'lr': 0.0004732577387297391, 'samples': 4606080, 'steps': 23989, 'loss/train': 1.1935884952545166} -08/30/2021 17:29:41 - INFO - __main__ - Step 23991: {'lr': 0.00047325535066975946, 'samples': 4606272, 'steps': 23990, 'loss/train': 1.4759531021118164} -08/30/2021 17:29:43 - INFO - __main__ - Step 23992: {'lr': 0.0004732529625091843, 'samples': 4606464, 'steps': 23991, 'loss/train': 1.1583490371704102} -08/30/2021 17:29:43 - INFO - __main__ - Step 23993: {'lr': 0.0004732505742480149, 'samples': 4606656, 'steps': 23992, 'loss/train': 2.132206916809082} -08/30/2021 17:29:44 - INFO - __main__ - Step 23994: {'lr': 0.00047324818588625214, 'samples': 4606848, 'steps': 23993, 'loss/train': 1.8066595792770386} -08/30/2021 17:29:44 - INFO - __main__ - Step 23995: {'lr': 0.0004732457974238972, 'samples': 4607040, 'steps': 23994, 'loss/train': 2.031420946121216} -08/30/2021 17:29:44 - INFO - __main__ - Step 23996: {'lr': 0.0004732434088609512, 'samples': 4607232, 'steps': 23995, 'loss/train': 1.9712618589401245} -08/30/2021 17:29:46 - INFO - __main__ - Step 23997: {'lr': 0.00047324102019741514, 'samples': 4607424, 'steps': 23996, 'loss/train': 1.8564987182617188} -08/30/2021 17:29:46 - INFO - __main__ - Step 23998: {'lr': 0.00047323863143329016, 'samples': 4607616, 'steps': 23997, 'loss/train': 1.965773582458496} -08/30/2021 17:29:47 - INFO - __main__ - Step 23999: {'lr': 0.00047323624256857724, 'samples': 4607808, 'steps': 23998, 'loss/train': 1.5524145364761353} -08/30/2021 17:29:47 - INFO - __main__ - Step 24000: {'lr': 0.0004732338536032775, 'samples': 4608000, 'steps': 23999, 'loss/train': 1.7805531024932861} -08/30/2021 17:29:47 - INFO - __main__ - Step 24001: {'lr': 0.0004732314645373921, 'samples': 4608192, 'steps': 24000, 'loss/train': 1.941765308380127} -08/30/2021 17:29:49 - INFO - __main__ - Step 24002: {'lr': 0.0004732290753709221, 'samples': 4608384, 'steps': 24001, 'loss/train': 2.1082425117492676} -08/30/2021 17:29:49 - INFO - __main__ - Step 24003: {'lr': 0.0004732266861038684, 'samples': 4608576, 'steps': 24002, 'loss/train': 1.6280622482299805} -08/30/2021 17:29:50 - INFO - __main__ - Step 24004: {'lr': 0.0004732242967362322, 'samples': 4608768, 'steps': 24003, 'loss/train': 1.4950611591339111} -08/30/2021 17:29:50 - INFO - __main__ - Step 24005: {'lr': 0.00047322190726801464, 'samples': 4608960, 'steps': 24004, 'loss/train': 1.7071781158447266} -08/30/2021 17:29:50 - INFO - __main__ - Step 24006: {'lr': 0.0004732195176992167, 'samples': 4609152, 'steps': 24005, 'loss/train': 1.6114521026611328} -08/30/2021 17:29:52 - INFO - __main__ - Step 24007: {'lr': 0.0004732171280298395, 'samples': 4609344, 'steps': 24006, 'loss/train': 1.3769075870513916} -08/30/2021 17:29:52 - INFO - __main__ - Step 24008: {'lr': 0.0004732147382598842, 'samples': 4609536, 'steps': 24007, 'loss/train': 1.3611992597579956} -08/30/2021 17:29:53 - INFO - __main__ - Step 24009: {'lr': 0.00047321234838935164, 'samples': 4609728, 'steps': 24008, 'loss/train': 1.4643421173095703} -08/30/2021 17:29:53 - INFO - __main__ - Step 24010: {'lr': 0.0004732099584182431, 'samples': 4609920, 'steps': 24009, 'loss/train': 1.8271245956420898} -08/30/2021 17:29:53 - INFO - __main__ - Step 24011: {'lr': 0.00047320756834655955, 'samples': 4610112, 'steps': 24010, 'loss/train': 1.9192742109298706} -08/30/2021 17:29:56 - INFO - __main__ - Step 24012: {'lr': 0.0004732051781743022, 'samples': 4610304, 'steps': 24011, 'loss/train': 1.5685092210769653} -08/30/2021 17:29:56 - INFO - __main__ - Step 24013: {'lr': 0.00047320278790147197, 'samples': 4610496, 'steps': 24012, 'loss/train': 2.033869743347168} -08/30/2021 17:29:56 - INFO - __main__ - Step 24014: {'lr': 0.00047320039752807, 'samples': 4610688, 'steps': 24013, 'loss/train': 1.8639260530471802} -08/30/2021 17:29:57 - INFO - __main__ - Step 24015: {'lr': 0.0004731980070540974, 'samples': 4610880, 'steps': 24014, 'loss/train': 1.352035403251648} -08/30/2021 17:29:57 - INFO - __main__ - Step 24016: {'lr': 0.0004731956164795552, 'samples': 4611072, 'steps': 24015, 'loss/train': 1.722882628440857} -08/30/2021 17:29:57 - INFO - __main__ - Step 24017: {'lr': 0.0004731932258044446, 'samples': 4611264, 'steps': 24016, 'loss/train': 0.7408400177955627} -08/30/2021 17:29:59 - INFO - __main__ - Step 24018: {'lr': 0.00047319083502876647, 'samples': 4611456, 'steps': 24017, 'loss/train': 1.7358992099761963} -08/30/2021 17:29:59 - INFO - __main__ - Step 24019: {'lr': 0.00047318844415252204, 'samples': 4611648, 'steps': 24018, 'loss/train': 1.7989447116851807} -08/30/2021 17:30:00 - INFO - __main__ - Step 24020: {'lr': 0.00047318605317571227, 'samples': 4611840, 'steps': 24019, 'loss/train': 1.5153939723968506} -08/30/2021 17:30:00 - INFO - __main__ - Step 24021: {'lr': 0.0004731836620983384, 'samples': 4612032, 'steps': 24020, 'loss/train': 1.7799488306045532} -08/30/2021 17:30:00 - INFO - __main__ - Step 24022: {'lr': 0.00047318127092040144, 'samples': 4612224, 'steps': 24021, 'loss/train': 1.7262390851974487} -08/30/2021 17:30:02 - INFO - __main__ - Step 24023: {'lr': 0.00047317887964190233, 'samples': 4612416, 'steps': 24022, 'loss/train': 1.7322629690170288} -08/30/2021 17:30:02 - INFO - __main__ - Step 24024: {'lr': 0.00047317648826284233, 'samples': 4612608, 'steps': 24023, 'loss/train': 1.7015255689620972} -08/30/2021 17:30:03 - INFO - __main__ - Step 24025: {'lr': 0.0004731740967832224, 'samples': 4612800, 'steps': 24024, 'loss/train': 0.9546807408332825} -08/30/2021 17:30:03 - INFO - __main__ - Step 24026: {'lr': 0.00047317170520304373, 'samples': 4612992, 'steps': 24025, 'loss/train': 1.139951229095459} -08/30/2021 17:30:03 - INFO - __main__ - Step 24027: {'lr': 0.0004731693135223073, 'samples': 4613184, 'steps': 24026, 'loss/train': 1.8629801273345947} -08/30/2021 17:30:05 - INFO - __main__ - Step 24028: {'lr': 0.0004731669217410142, 'samples': 4613376, 'steps': 24027, 'loss/train': 1.068621039390564} -08/30/2021 17:30:05 - INFO - __main__ - Step 24029: {'lr': 0.0004731645298591656, 'samples': 4613568, 'steps': 24028, 'loss/train': 1.1456061601638794} -08/30/2021 17:30:06 - INFO - __main__ - Step 24030: {'lr': 0.0004731621378767624, 'samples': 4613760, 'steps': 24029, 'loss/train': 1.7382146120071411} -08/30/2021 17:30:06 - INFO - __main__ - Step 24031: {'lr': 0.0004731597457938059, 'samples': 4613952, 'steps': 24030, 'loss/train': 0.7456815242767334} -08/30/2021 17:30:06 - INFO - __main__ - Step 24032: {'lr': 0.000473157353610297, 'samples': 4614144, 'steps': 24031, 'loss/train': 1.714818000793457} -08/30/2021 17:30:08 - INFO - __main__ - Step 24033: {'lr': 0.0004731549613262368, 'samples': 4614336, 'steps': 24032, 'loss/train': 1.5012445449829102} -08/30/2021 17:30:09 - INFO - __main__ - Step 24034: {'lr': 0.0004731525689416265, 'samples': 4614528, 'steps': 24033, 'loss/train': 1.5666781663894653} -08/30/2021 17:30:09 - INFO - __main__ - Step 24035: {'lr': 0.0004731501764564671, 'samples': 4614720, 'steps': 24034, 'loss/train': 0.3431834876537323} -08/30/2021 17:30:10 - INFO - __main__ - Step 24036: {'lr': 0.00047314778387075963, 'samples': 4614912, 'steps': 24035, 'loss/train': 1.9771511554718018} -08/30/2021 17:30:10 - INFO - __main__ - Step 24037: {'lr': 0.00047314539118450516, 'samples': 4615104, 'steps': 24036, 'loss/train': 1.9900704622268677} -08/30/2021 17:30:12 - INFO - __main__ - Step 24038: {'lr': 0.0004731429983977049, 'samples': 4615296, 'steps': 24037, 'loss/train': 1.5211819410324097} -08/30/2021 17:30:12 - INFO - __main__ - Step 24039: {'lr': 0.00047314060551035983, 'samples': 4615488, 'steps': 24038, 'loss/train': 2.0710344314575195} -08/30/2021 17:30:12 - INFO - __main__ - Step 24040: {'lr': 0.00047313821252247104, 'samples': 4615680, 'steps': 24039, 'loss/train': 1.251976490020752} -08/30/2021 17:30:13 - INFO - __main__ - Step 24041: {'lr': 0.00047313581943403963, 'samples': 4615872, 'steps': 24040, 'loss/train': 0.08993315696716309} -08/30/2021 17:30:13 - INFO - __main__ - Step 24042: {'lr': 0.0004731334262450666, 'samples': 4616064, 'steps': 24041, 'loss/train': 2.274127244949341} -08/30/2021 17:30:15 - INFO - __main__ - Step 24043: {'lr': 0.00047313103295555317, 'samples': 4616256, 'steps': 24042, 'loss/train': 1.7268720865249634} -08/30/2021 17:30:15 - INFO - __main__ - Step 24044: {'lr': 0.0004731286395655003, 'samples': 4616448, 'steps': 24043, 'loss/train': 1.7036787271499634} -08/30/2021 17:30:15 - INFO - __main__ - Step 24045: {'lr': 0.00047312624607490913, 'samples': 4616640, 'steps': 24044, 'loss/train': 1.509076714515686} -08/30/2021 17:30:16 - INFO - __main__ - Step 24046: {'lr': 0.0004731238524837807, 'samples': 4616832, 'steps': 24045, 'loss/train': 0.5438427329063416} -08/30/2021 17:30:16 - INFO - __main__ - Step 24047: {'lr': 0.00047312145879211607, 'samples': 4617024, 'steps': 24046, 'loss/train': 1.9037859439849854} -08/30/2021 17:30:18 - INFO - __main__ - Step 24048: {'lr': 0.0004731190649999164, 'samples': 4617216, 'steps': 24047, 'loss/train': 1.426287293434143} -08/30/2021 17:30:18 - INFO - __main__ - Step 24049: {'lr': 0.0004731166711071827, 'samples': 4617408, 'steps': 24048, 'loss/train': 1.7205524444580078} -08/30/2021 17:30:18 - INFO - __main__ - Step 24050: {'lr': 0.0004731142771139161, 'samples': 4617600, 'steps': 24049, 'loss/train': 1.7110624313354492} -08/30/2021 17:30:19 - INFO - __main__ - Step 24051: {'lr': 0.00047311188302011766, 'samples': 4617792, 'steps': 24050, 'loss/train': 1.59541654586792} -08/30/2021 17:30:19 - INFO - __main__ - Step 24052: {'lr': 0.00047310948882578843, 'samples': 4617984, 'steps': 24051, 'loss/train': 1.8222190141677856} -08/30/2021 17:30:19 - INFO - __main__ - Step 24053: {'lr': 0.0004731070945309295, 'samples': 4618176, 'steps': 24052, 'loss/train': 1.5752980709075928} -08/30/2021 17:30:21 - INFO - __main__ - Step 24054: {'lr': 0.00047310470013554195, 'samples': 4618368, 'steps': 24053, 'loss/train': 1.4789464473724365} -08/30/2021 17:30:21 - INFO - __main__ - Step 24055: {'lr': 0.0004731023056396269, 'samples': 4618560, 'steps': 24054, 'loss/train': 1.7332782745361328} -08/30/2021 17:30:22 - INFO - __main__ - Step 24056: {'lr': 0.00047309991104318533, 'samples': 4618752, 'steps': 24055, 'loss/train': 1.697275161743164} -08/30/2021 17:30:22 - INFO - __main__ - Step 24057: {'lr': 0.00047309751634621845, 'samples': 4618944, 'steps': 24056, 'loss/train': 1.4491691589355469} -08/30/2021 17:30:22 - INFO - __main__ - Step 24058: {'lr': 0.0004730951215487272, 'samples': 4619136, 'steps': 24057, 'loss/train': 1.2856816053390503} -08/30/2021 17:30:24 - INFO - __main__ - Step 24059: {'lr': 0.0004730927266507128, 'samples': 4619328, 'steps': 24058, 'loss/train': 1.5663295984268188} -08/30/2021 17:30:24 - INFO - __main__ - Step 24060: {'lr': 0.00047309033165217617, 'samples': 4619520, 'steps': 24059, 'loss/train': 2.148709535598755} -08/30/2021 17:30:25 - INFO - __main__ - Step 24061: {'lr': 0.00047308793655311855, 'samples': 4619712, 'steps': 24060, 'loss/train': 1.327816128730774} -08/30/2021 17:30:25 - INFO - __main__ - Step 24062: {'lr': 0.000473085541353541, 'samples': 4619904, 'steps': 24061, 'loss/train': 1.5505187511444092} -08/30/2021 17:30:25 - INFO - __main__ - Step 24063: {'lr': 0.00047308314605344447, 'samples': 4620096, 'steps': 24062, 'loss/train': 1.7892699241638184} -08/30/2021 17:30:28 - INFO - __main__ - Step 24064: {'lr': 0.00047308075065283006, 'samples': 4620288, 'steps': 24063, 'loss/train': 0.2885242700576782} -08/30/2021 17:30:28 - INFO - __main__ - Step 24065: {'lr': 0.00047307835515169905, 'samples': 4620480, 'steps': 24064, 'loss/train': 1.5652493238449097} -08/30/2021 17:30:29 - INFO - __main__ - Step 24066: {'lr': 0.00047307595955005226, 'samples': 4620672, 'steps': 24065, 'loss/train': 1.5013893842697144} -08/30/2021 17:30:29 - INFO - __main__ - Step 24067: {'lr': 0.000473073563847891, 'samples': 4620864, 'steps': 24066, 'loss/train': 1.1477336883544922} -08/30/2021 17:30:29 - INFO - __main__ - Step 24068: {'lr': 0.0004730711680452161, 'samples': 4621056, 'steps': 24067, 'loss/train': 1.3155384063720703} -08/30/2021 17:30:30 - INFO - __main__ - Step 24069: {'lr': 0.00047306877214202885, 'samples': 4621248, 'steps': 24068, 'loss/train': 1.609187364578247} -08/30/2021 17:30:31 - INFO - __main__ - Step 24070: {'lr': 0.00047306637613833024, 'samples': 4621440, 'steps': 24069, 'loss/train': 0.14481352269649506} -08/30/2021 17:30:32 - INFO - __main__ - Step 24071: {'lr': 0.00047306398003412137, 'samples': 4621632, 'steps': 24070, 'loss/train': 1.548281192779541} -08/30/2021 17:30:32 - INFO - __main__ - Step 24072: {'lr': 0.00047306158382940327, 'samples': 4621824, 'steps': 24071, 'loss/train': 1.4533778429031372} -08/30/2021 17:30:32 - INFO - __main__ - Step 24073: {'lr': 0.0004730591875241771, 'samples': 4622016, 'steps': 24072, 'loss/train': 1.5265815258026123} -08/30/2021 17:30:33 - INFO - __main__ - Step 24074: {'lr': 0.0004730567911184439, 'samples': 4622208, 'steps': 24073, 'loss/train': 1.9236773252487183} -08/30/2021 17:30:34 - INFO - __main__ - Step 24075: {'lr': 0.00047305439461220477, 'samples': 4622400, 'steps': 24074, 'loss/train': 1.5820451974868774} -08/30/2021 17:30:35 - INFO - __main__ - Step 24076: {'lr': 0.00047305199800546077, 'samples': 4622592, 'steps': 24075, 'loss/train': 1.6401923894882202} -08/30/2021 17:30:35 - INFO - __main__ - Step 24077: {'lr': 0.00047304960129821295, 'samples': 4622784, 'steps': 24076, 'loss/train': 1.445767879486084} -08/30/2021 17:30:35 - INFO - __main__ - Step 24078: {'lr': 0.00047304720449046247, 'samples': 4622976, 'steps': 24077, 'loss/train': 1.603904366493225} -08/30/2021 17:30:36 - INFO - __main__ - Step 24079: {'lr': 0.0004730448075822103, 'samples': 4623168, 'steps': 24078, 'loss/train': 1.342221975326538} -08/30/2021 17:30:37 - INFO - __main__ - Step 24080: {'lr': 0.0004730424105734576, 'samples': 4623360, 'steps': 24079, 'loss/train': 1.8074901103973389} -08/30/2021 17:30:38 - INFO - __main__ - Step 24081: {'lr': 0.00047304001346420543, 'samples': 4623552, 'steps': 24080, 'loss/train': 1.4292932748794556} -08/30/2021 17:30:38 - INFO - __main__ - Step 24082: {'lr': 0.0004730376162544549, 'samples': 4623744, 'steps': 24081, 'loss/train': 1.706549048423767} -08/30/2021 17:30:38 - INFO - __main__ - Step 24083: {'lr': 0.00047303521894420707, 'samples': 4623936, 'steps': 24082, 'loss/train': 1.5007423162460327} -08/30/2021 17:30:39 - INFO - __main__ - Step 24084: {'lr': 0.00047303282153346297, 'samples': 4624128, 'steps': 24083, 'loss/train': 1.8951566219329834} -08/30/2021 17:30:40 - INFO - __main__ - Step 24085: {'lr': 0.00047303042402222373, 'samples': 4624320, 'steps': 24084, 'loss/train': 1.940564751625061} -08/30/2021 17:30:41 - INFO - __main__ - Step 24086: {'lr': 0.00047302802641049045, 'samples': 4624512, 'steps': 24085, 'loss/train': 1.6670588254928589} -08/30/2021 17:30:41 - INFO - __main__ - Step 24087: {'lr': 0.00047302562869826415, 'samples': 4624704, 'steps': 24086, 'loss/train': 1.5259641408920288} -08/30/2021 17:30:41 - INFO - __main__ - Step 24088: {'lr': 0.000473023230885546, 'samples': 4624896, 'steps': 24087, 'loss/train': 1.1554542779922485} -08/30/2021 17:30:42 - INFO - __main__ - Step 24089: {'lr': 0.00047302083297233693, 'samples': 4625088, 'steps': 24088, 'loss/train': 0.5441455245018005} -08/30/2021 17:30:43 - INFO - __main__ - Step 24090: {'lr': 0.0004730184349586382, 'samples': 4625280, 'steps': 24089, 'loss/train': 1.6687731742858887} -08/30/2021 17:30:44 - INFO - __main__ - Step 24091: {'lr': 0.0004730160368444507, 'samples': 4625472, 'steps': 24090, 'loss/train': 1.3922580480575562} -08/30/2021 17:30:44 - INFO - __main__ - Step 24092: {'lr': 0.00047301363862977574, 'samples': 4625664, 'steps': 24091, 'loss/train': 1.4776488542556763} -08/30/2021 17:30:44 - INFO - __main__ - Step 24093: {'lr': 0.00047301124031461425, 'samples': 4625856, 'steps': 24092, 'loss/train': 2.0109939575195312} -08/30/2021 17:30:45 - INFO - __main__ - Step 24094: {'lr': 0.00047300884189896734, 'samples': 4626048, 'steps': 24093, 'loss/train': 1.547519564628601} -08/30/2021 17:30:46 - INFO - __main__ - Step 24095: {'lr': 0.00047300644338283597, 'samples': 4626240, 'steps': 24094, 'loss/train': 1.7417045831680298} -08/30/2021 17:30:47 - INFO - __main__ - Step 24096: {'lr': 0.00047300404476622145, 'samples': 4626432, 'steps': 24095, 'loss/train': 1.456769585609436} -08/30/2021 17:30:47 - INFO - __main__ - Step 24097: {'lr': 0.0004730016460491247, 'samples': 4626624, 'steps': 24096, 'loss/train': 1.4040253162384033} -08/30/2021 17:30:47 - INFO - __main__ - Step 24098: {'lr': 0.00047299924723154686, 'samples': 4626816, 'steps': 24097, 'loss/train': 1.5261404514312744} -08/30/2021 17:30:48 - INFO - __main__ - Step 24099: {'lr': 0.000472996848313489, 'samples': 4627008, 'steps': 24098, 'loss/train': 1.7699613571166992} -08/30/2021 17:30:49 - INFO - __main__ - Step 24100: {'lr': 0.0004729944492949523, 'samples': 4627200, 'steps': 24099, 'loss/train': 1.2860987186431885} -08/30/2021 17:30:50 - INFO - __main__ - Step 24101: {'lr': 0.0004729920501759376, 'samples': 4627392, 'steps': 24100, 'loss/train': 1.514662742614746} -08/30/2021 17:30:50 - INFO - __main__ - Step 24102: {'lr': 0.0004729896509564462, 'samples': 4627584, 'steps': 24101, 'loss/train': 0.47807011008262634} -08/30/2021 17:30:50 - INFO - __main__ - Step 24103: {'lr': 0.00047298725163647903, 'samples': 4627776, 'steps': 24102, 'loss/train': 2.083526372909546} -08/30/2021 17:30:51 - INFO - __main__ - Step 24104: {'lr': 0.00047298485221603735, 'samples': 4627968, 'steps': 24103, 'loss/train': 1.6912801265716553} -08/30/2021 17:30:52 - INFO - __main__ - Step 24105: {'lr': 0.0004729824526951221, 'samples': 4628160, 'steps': 24104, 'loss/train': 1.7747036218643188} -08/30/2021 17:30:53 - INFO - __main__ - Step 24106: {'lr': 0.0004729800530737344, 'samples': 4628352, 'steps': 24105, 'loss/train': 1.7489311695098877} -08/30/2021 17:30:53 - INFO - __main__ - Step 24107: {'lr': 0.0004729776533518753, 'samples': 4628544, 'steps': 24106, 'loss/train': 1.7768486738204956} -08/30/2021 17:30:53 - INFO - __main__ - Step 24108: {'lr': 0.00047297525352954587, 'samples': 4628736, 'steps': 24107, 'loss/train': 0.32257765531539917} -08/30/2021 17:30:54 - INFO - __main__ - Step 24109: {'lr': 0.00047297285360674724, 'samples': 4628928, 'steps': 24108, 'loss/train': 1.5983144044876099} -08/30/2021 17:30:56 - INFO - __main__ - Step 24110: {'lr': 0.0004729704535834806, 'samples': 4629120, 'steps': 24109, 'loss/train': 0.20864179730415344} -08/30/2021 17:30:57 - INFO - __main__ - Step 24111: {'lr': 0.0004729680534597468, 'samples': 4629312, 'steps': 24110, 'loss/train': 1.459895372390747} -08/30/2021 17:30:57 - INFO - __main__ - Step 24112: {'lr': 0.0004729656532355471, 'samples': 4629504, 'steps': 24111, 'loss/train': 1.8617894649505615} -08/30/2021 17:30:57 - INFO - __main__ - Step 24113: {'lr': 0.00047296325291088247, 'samples': 4629696, 'steps': 24112, 'loss/train': 1.8113024234771729} -08/30/2021 17:30:58 - INFO - __main__ - Step 24114: {'lr': 0.00047296085248575405, 'samples': 4629888, 'steps': 24113, 'loss/train': 1.8138296604156494} -08/30/2021 17:30:58 - INFO - __main__ - Step 24115: {'lr': 0.000472958451960163, 'samples': 4630080, 'steps': 24114, 'loss/train': 1.3801623582839966} -08/30/2021 17:30:58 - INFO - __main__ - Step 24116: {'lr': 0.0004729560513341101, 'samples': 4630272, 'steps': 24115, 'loss/train': 0.46274125576019287} -08/30/2021 17:31:00 - INFO - __main__ - Step 24117: {'lr': 0.0004729536506075969, 'samples': 4630464, 'steps': 24116, 'loss/train': 1.6889135837554932} -08/30/2021 17:31:01 - INFO - __main__ - Step 24118: {'lr': 0.000472951249780624, 'samples': 4630656, 'steps': 24117, 'loss/train': 0.9251886010169983} -08/30/2021 17:31:01 - INFO - __main__ - Step 24119: {'lr': 0.0004729488488531928, 'samples': 4630848, 'steps': 24118, 'loss/train': 1.5236133337020874} -08/30/2021 17:31:01 - INFO - __main__ - Step 24120: {'lr': 0.00047294644782530437, 'samples': 4631040, 'steps': 24119, 'loss/train': 1.7088730335235596} -08/30/2021 17:31:02 - INFO - __main__ - Step 24121: {'lr': 0.0004729440466969596, 'samples': 4631232, 'steps': 24120, 'loss/train': 1.5327494144439697} -08/30/2021 17:31:03 - INFO - __main__ - Step 24122: {'lr': 0.00047294164546815977, 'samples': 4631424, 'steps': 24121, 'loss/train': 1.44022798538208} -08/30/2021 17:31:04 - INFO - __main__ - Step 24123: {'lr': 0.0004729392441389058, 'samples': 4631616, 'steps': 24122, 'loss/train': 1.5222587585449219} -08/30/2021 17:31:04 - INFO - __main__ - Step 24124: {'lr': 0.0004729368427091989, 'samples': 4631808, 'steps': 24123, 'loss/train': 1.7540864944458008} -08/30/2021 17:31:04 - INFO - __main__ - Step 24125: {'lr': 0.0004729344411790401, 'samples': 4632000, 'steps': 24124, 'loss/train': 1.841918706893921} -08/30/2021 17:31:05 - INFO - __main__ - Step 24126: {'lr': 0.00047293203954843036, 'samples': 4632192, 'steps': 24125, 'loss/train': 1.6288747787475586} -08/30/2021 17:31:05 - INFO - __main__ - Step 24127: {'lr': 0.000472929637817371, 'samples': 4632384, 'steps': 24126, 'loss/train': 2.0986011028289795} -08/30/2021 17:31:07 - INFO - __main__ - Step 24128: {'lr': 0.00047292723598586295, 'samples': 4632576, 'steps': 24127, 'loss/train': 1.5108201503753662} -08/30/2021 17:31:07 - INFO - __main__ - Step 24129: {'lr': 0.0004729248340539074, 'samples': 4632768, 'steps': 24128, 'loss/train': 2.7759737968444824} -08/30/2021 17:31:08 - INFO - __main__ - Step 24130: {'lr': 0.00047292243202150524, 'samples': 4632960, 'steps': 24129, 'loss/train': 1.0917391777038574} -08/30/2021 17:31:08 - INFO - __main__ - Step 24131: {'lr': 0.00047292002988865773, 'samples': 4633152, 'steps': 24130, 'loss/train': 1.4824484586715698} -08/30/2021 17:31:08 - INFO - __main__ - Step 24132: {'lr': 0.0004729176276553659, 'samples': 4633344, 'steps': 24131, 'loss/train': 2.507643938064575} -08/30/2021 17:31:10 - INFO - __main__ - Step 24133: {'lr': 0.00047291522532163084, 'samples': 4633536, 'steps': 24132, 'loss/train': 1.381656289100647} -08/30/2021 17:31:10 - INFO - __main__ - Step 24134: {'lr': 0.0004729128228874536, 'samples': 4633728, 'steps': 24133, 'loss/train': 1.7645857334136963} -08/30/2021 17:31:11 - INFO - __main__ - Step 24135: {'lr': 0.0004729104203528353, 'samples': 4633920, 'steps': 24134, 'loss/train': 1.740995168685913} -08/30/2021 17:31:11 - INFO - __main__ - Step 24136: {'lr': 0.0004729080177177769, 'samples': 4634112, 'steps': 24135, 'loss/train': 1.6431689262390137} -08/30/2021 17:31:11 - INFO - __main__ - Step 24137: {'lr': 0.0004729056149822797, 'samples': 4634304, 'steps': 24136, 'loss/train': 2.0831339359283447} -08/30/2021 17:31:13 - INFO - __main__ - Step 24138: {'lr': 0.0004729032121463447, 'samples': 4634496, 'steps': 24137, 'loss/train': 1.8646323680877686} -08/30/2021 17:31:13 - INFO - __main__ - Step 24139: {'lr': 0.00047290080920997285, 'samples': 4634688, 'steps': 24138, 'loss/train': 1.3936610221862793} -08/30/2021 17:31:14 - INFO - __main__ - Step 24140: {'lr': 0.0004728984061731654, 'samples': 4634880, 'steps': 24139, 'loss/train': 1.1847268342971802} -08/30/2021 17:31:14 - INFO - __main__ - Step 24141: {'lr': 0.00047289600303592334, 'samples': 4635072, 'steps': 24140, 'loss/train': 2.7018134593963623} -08/30/2021 17:31:14 - INFO - __main__ - Step 24142: {'lr': 0.00047289359979824774, 'samples': 4635264, 'steps': 24141, 'loss/train': 1.3059297800064087} -08/30/2021 17:31:15 - INFO - __main__ - Step 24143: {'lr': 0.0004728911964601398, 'samples': 4635456, 'steps': 24142, 'loss/train': 1.1995608806610107} -08/30/2021 17:31:16 - INFO - __main__ - Step 24144: {'lr': 0.00047288879302160046, 'samples': 4635648, 'steps': 24143, 'loss/train': 1.5299186706542969} -08/30/2021 17:31:17 - INFO - __main__ - Step 24145: {'lr': 0.000472886389482631, 'samples': 4635840, 'steps': 24144, 'loss/train': 1.3630061149597168} -08/30/2021 17:31:17 - INFO - __main__ - Step 24146: {'lr': 0.00047288398584323225, 'samples': 4636032, 'steps': 24145, 'loss/train': 1.2673616409301758} -08/30/2021 17:31:18 - INFO - __main__ - Step 24147: {'lr': 0.0004728815821034055, 'samples': 4636224, 'steps': 24146, 'loss/train': 1.2929073572158813} -08/30/2021 17:31:18 - INFO - __main__ - Step 24148: {'lr': 0.00047287917826315163, 'samples': 4636416, 'steps': 24147, 'loss/train': 1.5669113397598267} -08/30/2021 17:31:19 - INFO - __main__ - Step 24149: {'lr': 0.00047287677432247187, 'samples': 4636608, 'steps': 24148, 'loss/train': 1.558624267578125} -08/30/2021 17:31:20 - INFO - __main__ - Step 24150: {'lr': 0.0004728743702813674, 'samples': 4636800, 'steps': 24149, 'loss/train': 1.7655826807022095} -08/30/2021 17:31:20 - INFO - __main__ - Step 24151: {'lr': 0.00047287196613983906, 'samples': 4636992, 'steps': 24150, 'loss/train': 1.4004069566726685} -08/30/2021 17:31:21 - INFO - __main__ - Step 24152: {'lr': 0.00047286956189788803, 'samples': 4637184, 'steps': 24151, 'loss/train': 1.6315075159072876} -08/30/2021 17:31:21 - INFO - __main__ - Step 24153: {'lr': 0.0004728671575555155, 'samples': 4637376, 'steps': 24152, 'loss/train': 1.4012001752853394} -08/30/2021 17:31:23 - INFO - __main__ - Step 24154: {'lr': 0.00047286475311272244, 'samples': 4637568, 'steps': 24153, 'loss/train': 1.7974354028701782} -08/30/2021 17:31:23 - INFO - __main__ - Step 24155: {'lr': 0.00047286234856950995, 'samples': 4637760, 'steps': 24154, 'loss/train': 1.489810585975647} -08/30/2021 17:31:23 - INFO - __main__ - Step 24156: {'lr': 0.0004728599439258791, 'samples': 4637952, 'steps': 24155, 'loss/train': 0.9652630686759949} -08/30/2021 17:31:24 - INFO - __main__ - Step 24157: {'lr': 0.00047285753918183105, 'samples': 4638144, 'steps': 24156, 'loss/train': 1.7588778734207153} -08/30/2021 17:31:24 - INFO - __main__ - Step 24158: {'lr': 0.0004728551343373668, 'samples': 4638336, 'steps': 24157, 'loss/train': 1.049881935119629} -08/30/2021 17:31:26 - INFO - __main__ - Step 24159: {'lr': 0.0004728527293924875, 'samples': 4638528, 'steps': 24158, 'loss/train': 1.8188709020614624} -08/30/2021 17:31:26 - INFO - __main__ - Step 24160: {'lr': 0.0004728503243471941, 'samples': 4638720, 'steps': 24159, 'loss/train': 1.3873933553695679} -08/30/2021 17:31:26 - INFO - __main__ - Step 24161: {'lr': 0.00047284791920148786, 'samples': 4638912, 'steps': 24160, 'loss/train': 1.9750440120697021} -08/30/2021 17:31:27 - INFO - __main__ - Step 24162: {'lr': 0.0004728455139553698, 'samples': 4639104, 'steps': 24161, 'loss/train': 1.8615262508392334} -08/30/2021 17:31:27 - INFO - __main__ - Step 24163: {'lr': 0.00047284310860884097, 'samples': 4639296, 'steps': 24162, 'loss/train': 0.7791587114334106} -08/30/2021 17:31:27 - INFO - __main__ - Step 24164: {'lr': 0.0004728407031619025, 'samples': 4639488, 'steps': 24163, 'loss/train': 1.7196199893951416} -08/30/2021 17:31:29 - INFO - __main__ - Step 24165: {'lr': 0.00047283829761455545, 'samples': 4639680, 'steps': 24164, 'loss/train': 1.6915156841278076} -08/30/2021 17:31:29 - INFO - __main__ - Step 24166: {'lr': 0.00047283589196680083, 'samples': 4639872, 'steps': 24165, 'loss/train': 1.31031334400177} -08/30/2021 17:31:30 - INFO - __main__ - Step 24167: {'lr': 0.00047283348621863987, 'samples': 4640064, 'steps': 24166, 'loss/train': 2.1443991661071777} -08/30/2021 17:31:30 - INFO - __main__ - Step 24168: {'lr': 0.0004728310803700735, 'samples': 4640256, 'steps': 24167, 'loss/train': 1.0439376831054688} -08/30/2021 17:31:30 - INFO - __main__ - Step 24169: {'lr': 0.00047282867442110296, 'samples': 4640448, 'steps': 24168, 'loss/train': 1.2532795667648315} -08/30/2021 17:31:32 - INFO - __main__ - Step 24170: {'lr': 0.0004728262683717292, 'samples': 4640640, 'steps': 24169, 'loss/train': 1.6778916120529175} -08/30/2021 17:31:32 - INFO - __main__ - Step 24171: {'lr': 0.0004728238622219534, 'samples': 4640832, 'steps': 24170, 'loss/train': 0.9244217872619629} -08/30/2021 17:31:33 - INFO - __main__ - Step 24172: {'lr': 0.0004728214559717766, 'samples': 4641024, 'steps': 24171, 'loss/train': 1.2623051404953003} -08/30/2021 17:31:33 - INFO - __main__ - Step 24173: {'lr': 0.0004728190496211999, 'samples': 4641216, 'steps': 24172, 'loss/train': 0.8274864554405212} -08/30/2021 17:31:33 - INFO - __main__ - Step 24174: {'lr': 0.0004728166431702243, 'samples': 4641408, 'steps': 24173, 'loss/train': 0.09556277096271515} -08/30/2021 17:31:36 - INFO - __main__ - Step 24175: {'lr': 0.0004728142366188511, 'samples': 4641600, 'steps': 24174, 'loss/train': 1.373371958732605} -08/30/2021 17:31:36 - INFO - __main__ - Step 24176: {'lr': 0.0004728118299670812, 'samples': 4641792, 'steps': 24175, 'loss/train': 1.5632140636444092} -08/30/2021 17:31:36 - INFO - __main__ - Step 24177: {'lr': 0.0004728094232149156, 'samples': 4641984, 'steps': 24176, 'loss/train': 1.4556348323822021} -08/30/2021 17:31:37 - INFO - __main__ - Step 24178: {'lr': 0.0004728070163623557, 'samples': 4642176, 'steps': 24177, 'loss/train': 1.4671134948730469} -08/30/2021 17:31:37 - INFO - __main__ - Step 24179: {'lr': 0.00047280460940940224, 'samples': 4642368, 'steps': 24178, 'loss/train': 1.8795233964920044} -08/30/2021 17:31:39 - INFO - __main__ - Step 24180: {'lr': 0.00047280220235605653, 'samples': 4642560, 'steps': 24179, 'loss/train': 1.7222018241882324} -08/30/2021 17:31:39 - INFO - __main__ - Step 24181: {'lr': 0.00047279979520231956, 'samples': 4642752, 'steps': 24180, 'loss/train': 1.2071528434753418} -08/30/2021 17:31:40 - INFO - __main__ - Step 24182: {'lr': 0.0004727973879481925, 'samples': 4642944, 'steps': 24181, 'loss/train': 1.6211045980453491} -08/30/2021 17:31:40 - INFO - __main__ - Step 24183: {'lr': 0.0004727949805936763, 'samples': 4643136, 'steps': 24182, 'loss/train': 0.08287215232849121} -08/30/2021 17:31:40 - INFO - __main__ - Step 24184: {'lr': 0.00047279257313877216, 'samples': 4643328, 'steps': 24183, 'loss/train': 1.7023415565490723} -08/30/2021 17:31:42 - INFO - __main__ - Step 24185: {'lr': 0.00047279016558348107, 'samples': 4643520, 'steps': 24184, 'loss/train': 1.1026681661605835} -08/30/2021 17:31:42 - INFO - __main__ - Step 24186: {'lr': 0.00047278775792780424, 'samples': 4643712, 'steps': 24185, 'loss/train': 1.096640706062317} -08/30/2021 17:31:43 - INFO - __main__ - Step 24187: {'lr': 0.00047278535017174266, 'samples': 4643904, 'steps': 24186, 'loss/train': 1.5994592905044556} -08/30/2021 17:31:43 - INFO - __main__ - Step 24188: {'lr': 0.00047278294231529745, 'samples': 4644096, 'steps': 24187, 'loss/train': 1.5921953916549683} -08/30/2021 17:31:43 - INFO - __main__ - Step 24189: {'lr': 0.0004727805343584697, 'samples': 4644288, 'steps': 24188, 'loss/train': 2.005462646484375} -08/30/2021 17:31:44 - INFO - __main__ - Step 24190: {'lr': 0.00047277812630126044, 'samples': 4644480, 'steps': 24189, 'loss/train': 1.9981228113174438} -08/30/2021 17:31:45 - INFO - __main__ - Step 24191: {'lr': 0.0004727757181436708, 'samples': 4644672, 'steps': 24190, 'loss/train': 2.7588233947753906} -08/30/2021 17:31:46 - INFO - __main__ - Step 24192: {'lr': 0.0004727733098857019, 'samples': 4644864, 'steps': 24191, 'loss/train': 1.3896721601486206} -08/30/2021 17:31:46 - INFO - __main__ - Step 24193: {'lr': 0.0004727709015273547, 'samples': 4645056, 'steps': 24192, 'loss/train': 1.611689567565918} -08/30/2021 17:31:46 - INFO - __main__ - Step 24194: {'lr': 0.00047276849306863045, 'samples': 4645248, 'steps': 24193, 'loss/train': 1.6118241548538208} -08/30/2021 17:31:47 - INFO - __main__ - Step 24195: {'lr': 0.0004727660845095301, 'samples': 4645440, 'steps': 24194, 'loss/train': 1.285235047340393} -08/30/2021 17:31:48 - INFO - __main__ - Step 24196: {'lr': 0.0004727636758500548, 'samples': 4645632, 'steps': 24195, 'loss/train': 2.496720552444458} -08/30/2021 17:31:49 - INFO - __main__ - Step 24197: {'lr': 0.0004727612670902057, 'samples': 4645824, 'steps': 24196, 'loss/train': 1.511696457862854} -08/30/2021 17:31:49 - INFO - __main__ - Step 24198: {'lr': 0.0004727588582299837, 'samples': 4646016, 'steps': 24197, 'loss/train': 1.4814748764038086} -08/30/2021 17:31:50 - INFO - __main__ - Step 24199: {'lr': 0.00047275644926939004, 'samples': 4646208, 'steps': 24198, 'loss/train': 1.5196963548660278} -08/30/2021 17:31:50 - INFO - __main__ - Step 24200: {'lr': 0.0004727540402084258, 'samples': 4646400, 'steps': 24199, 'loss/train': 0.9592801332473755} -08/30/2021 17:31:52 - INFO - __main__ - Step 24201: {'lr': 0.00047275163104709196, 'samples': 4646592, 'steps': 24200, 'loss/train': 1.3029142618179321} -08/30/2021 17:31:52 - INFO - __main__ - Step 24202: {'lr': 0.0004727492217853897, 'samples': 4646784, 'steps': 24201, 'loss/train': 1.6478257179260254} -08/30/2021 17:31:53 - INFO - __main__ - Step 24203: {'lr': 0.0004727468124233201, 'samples': 4646976, 'steps': 24202, 'loss/train': 0.0755089670419693} -08/30/2021 17:31:53 - INFO - __main__ - Step 24204: {'lr': 0.0004727444029608842, 'samples': 4647168, 'steps': 24203, 'loss/train': 1.6308687925338745} -08/30/2021 17:31:53 - INFO - __main__ - Step 24205: {'lr': 0.0004727419933980831, 'samples': 4647360, 'steps': 24204, 'loss/train': 0.07464733719825745} -08/30/2021 17:31:54 - INFO - __main__ - Step 24206: {'lr': 0.00047273958373491795, 'samples': 4647552, 'steps': 24205, 'loss/train': 1.1177918910980225} -08/30/2021 17:31:55 - INFO - __main__ - Step 24207: {'lr': 0.0004727371739713897, 'samples': 4647744, 'steps': 24206, 'loss/train': 1.2107316255569458} -08/30/2021 17:31:56 - INFO - __main__ - Step 24208: {'lr': 0.0004727347641074996, 'samples': 4647936, 'steps': 24207, 'loss/train': 0.38301005959510803} -08/30/2021 17:31:56 - INFO - __main__ - Step 24209: {'lr': 0.0004727323541432486, 'samples': 4648128, 'steps': 24208, 'loss/train': 1.2750030755996704} -08/30/2021 17:31:56 - INFO - __main__ - Step 24210: {'lr': 0.0004727299440786378, 'samples': 4648320, 'steps': 24209, 'loss/train': 0.07609347999095917} -08/30/2021 17:31:57 - INFO - __main__ - Step 24211: {'lr': 0.0004727275339136684, 'samples': 4648512, 'steps': 24210, 'loss/train': 1.7404375076293945} -08/30/2021 17:31:58 - INFO - __main__ - Step 24212: {'lr': 0.0004727251236483414, 'samples': 4648704, 'steps': 24211, 'loss/train': 1.6821720600128174} -08/30/2021 17:31:59 - INFO - __main__ - Step 24213: {'lr': 0.0004727227132826579, 'samples': 4648896, 'steps': 24212, 'loss/train': 0.4785604774951935} -08/30/2021 17:31:59 - INFO - __main__ - Step 24214: {'lr': 0.00047272030281661894, 'samples': 4649088, 'steps': 24213, 'loss/train': 1.7701137065887451} -08/30/2021 17:31:59 - INFO - __main__ - Step 24215: {'lr': 0.0004727178922502257, 'samples': 4649280, 'steps': 24214, 'loss/train': 1.6530342102050781} -08/30/2021 17:32:00 - INFO - __main__ - Step 24216: {'lr': 0.00047271548158347917, 'samples': 4649472, 'steps': 24215, 'loss/train': 1.57979154586792} -08/30/2021 17:32:01 - INFO - __main__ - Step 24217: {'lr': 0.00047271307081638047, 'samples': 4649664, 'steps': 24216, 'loss/train': 1.8712079524993896} -08/30/2021 17:32:02 - INFO - __main__ - Step 24218: {'lr': 0.0004727106599489307, 'samples': 4649856, 'steps': 24217, 'loss/train': 1.3714122772216797} -08/30/2021 17:32:02 - INFO - __main__ - Step 24219: {'lr': 0.000472708248981131, 'samples': 4650048, 'steps': 24218, 'loss/train': 1.398590087890625} -08/30/2021 17:32:03 - INFO - __main__ - Step 24220: {'lr': 0.0004727058379129824, 'samples': 4650240, 'steps': 24219, 'loss/train': 2.153866767883301} -08/30/2021 17:32:03 - INFO - __main__ - Step 24221: {'lr': 0.00047270342674448593, 'samples': 4650432, 'steps': 24220, 'loss/train': 1.706506371498108} -08/30/2021 17:32:03 - INFO - __main__ - Step 24222: {'lr': 0.0004727010154756427, 'samples': 4650624, 'steps': 24221, 'loss/train': 1.6973432302474976} -08/30/2021 17:32:05 - INFO - __main__ - Step 24223: {'lr': 0.00047269860410645395, 'samples': 4650816, 'steps': 24222, 'loss/train': 0.9720464944839478} -08/30/2021 17:32:05 - INFO - __main__ - Step 24224: {'lr': 0.00047269619263692056, 'samples': 4651008, 'steps': 24223, 'loss/train': 1.3337974548339844} -08/30/2021 17:32:06 - INFO - __main__ - Step 24225: {'lr': 0.0004726937810670437, 'samples': 4651200, 'steps': 24224, 'loss/train': 1.5803866386413574} -08/30/2021 17:32:06 - INFO - __main__ - Step 24226: {'lr': 0.00047269136939682445, 'samples': 4651392, 'steps': 24225, 'loss/train': 2.019972801208496} -08/30/2021 17:32:06 - INFO - __main__ - Step 24227: {'lr': 0.00047268895762626396, 'samples': 4651584, 'steps': 24226, 'loss/train': 1.2218983173370361} -08/30/2021 17:32:08 - INFO - __main__ - Step 24228: {'lr': 0.00047268654575536326, 'samples': 4651776, 'steps': 24227, 'loss/train': 1.298556923866272} -08/30/2021 17:32:09 - INFO - __main__ - Step 24229: {'lr': 0.0004726841337841234, 'samples': 4651968, 'steps': 24228, 'loss/train': 1.2394062280654907} -08/30/2021 17:32:09 - INFO - __main__ - Step 24230: {'lr': 0.00047268172171254554, 'samples': 4652160, 'steps': 24229, 'loss/train': 0.9660944938659668} -08/30/2021 17:32:09 - INFO - __main__ - Step 24231: {'lr': 0.00047267930954063064, 'samples': 4652352, 'steps': 24230, 'loss/train': 1.059150218963623} -08/30/2021 17:32:10 - INFO - __main__ - Step 24232: {'lr': 0.00047267689726838004, 'samples': 4652544, 'steps': 24231, 'loss/train': 1.8086531162261963} -08/30/2021 17:32:12 - INFO - __main__ - Step 24233: {'lr': 0.00047267448489579455, 'samples': 4652736, 'steps': 24232, 'loss/train': 1.8478260040283203} -08/30/2021 17:32:12 - INFO - __main__ - Step 24234: {'lr': 0.00047267207242287536, 'samples': 4652928, 'steps': 24233, 'loss/train': 1.5857752561569214} -08/30/2021 17:32:12 - INFO - __main__ - Step 24235: {'lr': 0.0004726696598496236, 'samples': 4653120, 'steps': 24234, 'loss/train': 0.16051620244979858} -08/30/2021 17:32:13 - INFO - __main__ - Step 24236: {'lr': 0.0004726672471760404, 'samples': 4653312, 'steps': 24235, 'loss/train': 1.6289249658584595} -08/30/2021 17:32:13 - INFO - __main__ - Step 24237: {'lr': 0.0004726648344021267, 'samples': 4653504, 'steps': 24236, 'loss/train': 1.943662405014038} -08/30/2021 17:32:14 - INFO - __main__ - Step 24238: {'lr': 0.0004726624215278836, 'samples': 4653696, 'steps': 24237, 'loss/train': 1.3714585304260254} -08/30/2021 17:32:15 - INFO - __main__ - Step 24239: {'lr': 0.0004726600085533124, 'samples': 4653888, 'steps': 24238, 'loss/train': 0.8313621282577515} -08/30/2021 17:32:16 - INFO - __main__ - Step 24240: {'lr': 0.0004726575954784139, 'samples': 4654080, 'steps': 24239, 'loss/train': 1.6338189840316772} -08/30/2021 17:32:16 - INFO - __main__ - Step 24241: {'lr': 0.0004726551823031894, 'samples': 4654272, 'steps': 24240, 'loss/train': 0.32059958577156067} -08/30/2021 17:32:16 - INFO - __main__ - Step 24242: {'lr': 0.0004726527690276399, 'samples': 4654464, 'steps': 24241, 'loss/train': 1.0379594564437866} -08/30/2021 17:32:17 - INFO - __main__ - Step 24243: {'lr': 0.0004726503556517665, 'samples': 4654656, 'steps': 24242, 'loss/train': 0.9742986559867859} -08/30/2021 17:32:19 - INFO - __main__ - Step 24244: {'lr': 0.0004726479421755703, 'samples': 4654848, 'steps': 24243, 'loss/train': 1.7805272340774536} -08/30/2021 17:32:19 - INFO - __main__ - Step 24245: {'lr': 0.0004726455285990523, 'samples': 4655040, 'steps': 24244, 'loss/train': 1.415780782699585} -08/30/2021 17:32:20 - INFO - __main__ - Step 24246: {'lr': 0.00047264311492221375, 'samples': 4655232, 'steps': 24245, 'loss/train': 1.180909514427185} -08/30/2021 17:32:20 - INFO - __main__ - Step 24247: {'lr': 0.00047264070114505556, 'samples': 4655424, 'steps': 24246, 'loss/train': 1.2102290391921997} -08/30/2021 17:32:20 - INFO - __main__ - Step 24248: {'lr': 0.00047263828726757897, 'samples': 4655616, 'steps': 24247, 'loss/train': 1.481451153755188} -08/30/2021 17:32:21 - INFO - __main__ - Step 24249: {'lr': 0.00047263587328978495, 'samples': 4655808, 'steps': 24248, 'loss/train': 0.053167395293712616} -08/30/2021 17:32:22 - INFO - __main__ - Step 24250: {'lr': 0.00047263345921167473, 'samples': 4656000, 'steps': 24249, 'loss/train': 0.05923473462462425} -08/30/2021 17:32:23 - INFO - __main__ - Step 24251: {'lr': 0.00047263104503324926, 'samples': 4656192, 'steps': 24250, 'loss/train': 1.8162950277328491} -08/30/2021 17:32:23 - INFO - __main__ - Step 24252: {'lr': 0.00047262863075450966, 'samples': 4656384, 'steps': 24251, 'loss/train': 1.594192624092102} -08/30/2021 17:32:23 - INFO - __main__ - Step 24253: {'lr': 0.0004726262163754571, 'samples': 4656576, 'steps': 24252, 'loss/train': 1.113451361656189} -08/30/2021 17:32:24 - INFO - __main__ - Step 24254: {'lr': 0.00047262380189609253, 'samples': 4656768, 'steps': 24253, 'loss/train': 1.1306809186935425} -08/30/2021 17:32:25 - INFO - __main__ - Step 24255: {'lr': 0.0004726213873164171, 'samples': 4656960, 'steps': 24254, 'loss/train': 1.96120285987854} -08/30/2021 17:32:25 - INFO - __main__ - Step 24256: {'lr': 0.00047261897263643196, 'samples': 4657152, 'steps': 24255, 'loss/train': 1.1570863723754883} -08/30/2021 17:32:26 - INFO - __main__ - Step 24257: {'lr': 0.0004726165578561381, 'samples': 4657344, 'steps': 24256, 'loss/train': 1.8087940216064453} -08/30/2021 17:32:26 - INFO - __main__ - Step 24258: {'lr': 0.0004726141429755367, 'samples': 4657536, 'steps': 24257, 'loss/train': 1.9370120763778687} -08/30/2021 17:32:27 - INFO - __main__ - Step 24259: {'lr': 0.0004726117279946288, 'samples': 4657728, 'steps': 24258, 'loss/train': 1.0272470712661743} -08/30/2021 17:32:27 - INFO - __main__ - Step 24260: {'lr': 0.0004726093129134155, 'samples': 4657920, 'steps': 24259, 'loss/train': 1.2489008903503418} -08/30/2021 17:32:28 - INFO - __main__ - Step 24261: {'lr': 0.0004726068977318978, 'samples': 4658112, 'steps': 24260, 'loss/train': 1.3908486366271973} -08/30/2021 17:32:29 - INFO - __main__ - Step 24262: {'lr': 0.0004726044824500769, 'samples': 4658304, 'steps': 24261, 'loss/train': 1.5788671970367432} -08/30/2021 17:32:29 - INFO - __main__ - Step 24263: {'lr': 0.0004726020670679538, 'samples': 4658496, 'steps': 24262, 'loss/train': 1.5976192951202393} -08/30/2021 17:32:29 - INFO - __main__ - Step 24264: {'lr': 0.00047259965158552976, 'samples': 4658688, 'steps': 24263, 'loss/train': 1.7133711576461792} -08/30/2021 17:32:30 - INFO - __main__ - Step 24265: {'lr': 0.00047259723600280573, 'samples': 4658880, 'steps': 24264, 'loss/train': 1.972362756729126} -08/30/2021 17:32:31 - INFO - __main__ - Step 24266: {'lr': 0.0004725948203197828, 'samples': 4659072, 'steps': 24265, 'loss/train': 1.0435600280761719} -08/30/2021 17:32:32 - INFO - __main__ - Step 24267: {'lr': 0.0004725924045364621, 'samples': 4659264, 'steps': 24266, 'loss/train': 1.598348617553711} -08/30/2021 17:32:32 - INFO - __main__ - Step 24268: {'lr': 0.00047258998865284463, 'samples': 4659456, 'steps': 24267, 'loss/train': 1.8444726467132568} -08/30/2021 17:32:32 - INFO - __main__ - Step 24269: {'lr': 0.0004725875726689316, 'samples': 4659648, 'steps': 24268, 'loss/train': 1.5474190711975098} -08/30/2021 17:32:33 - INFO - __main__ - Step 24270: {'lr': 0.000472585156584724, 'samples': 4659840, 'steps': 24269, 'loss/train': 0.962842583656311} -08/30/2021 17:32:35 - INFO - __main__ - Step 24271: {'lr': 0.00047258274040022305, 'samples': 4660032, 'steps': 24270, 'loss/train': 1.7693638801574707} -08/30/2021 17:32:35 - INFO - __main__ - Step 24272: {'lr': 0.0004725803241154297, 'samples': 4660224, 'steps': 24271, 'loss/train': 1.7162286043167114} -08/30/2021 17:32:36 - INFO - __main__ - Step 24273: {'lr': 0.0004725779077303451, 'samples': 4660416, 'steps': 24272, 'loss/train': 1.45207679271698} -08/30/2021 17:32:36 - INFO - __main__ - Step 24274: {'lr': 0.0004725754912449703, 'samples': 4660608, 'steps': 24273, 'loss/train': 1.6680254936218262} -08/30/2021 17:32:36 - INFO - __main__ - Step 24275: {'lr': 0.0004725730746593064, 'samples': 4660800, 'steps': 24274, 'loss/train': 1.67513906955719} -08/30/2021 17:32:37 - INFO - __main__ - Step 24276: {'lr': 0.0004725706579733546, 'samples': 4660992, 'steps': 24275, 'loss/train': 0.5670360326766968} -08/30/2021 17:32:38 - INFO - __main__ - Step 24277: {'lr': 0.00047256824118711583, 'samples': 4661184, 'steps': 24276, 'loss/train': 0.58359295129776} -08/30/2021 17:32:39 - INFO - __main__ - Step 24278: {'lr': 0.00047256582430059126, 'samples': 4661376, 'steps': 24277, 'loss/train': 1.6768839359283447} -08/30/2021 17:32:39 - INFO - __main__ - Step 24279: {'lr': 0.00047256340731378194, 'samples': 4661568, 'steps': 24278, 'loss/train': 1.20183527469635} -08/30/2021 17:32:39 - INFO - __main__ - Step 24280: {'lr': 0.00047256099022668896, 'samples': 4661760, 'steps': 24279, 'loss/train': 1.9832605123519897} -08/30/2021 17:32:40 - INFO - __main__ - Step 24281: {'lr': 0.00047255857303931347, 'samples': 4661952, 'steps': 24280, 'loss/train': 1.5650697946548462} -08/30/2021 17:32:42 - INFO - __main__ - Step 24282: {'lr': 0.00047255615575165653, 'samples': 4662144, 'steps': 24281, 'loss/train': 1.5526493787765503} -08/30/2021 17:32:42 - INFO - __main__ - Step 24283: {'lr': 0.0004725537383637193, 'samples': 4662336, 'steps': 24282, 'loss/train': 1.8533439636230469} -08/30/2021 17:32:42 - INFO - __main__ - Step 24284: {'lr': 0.0004725513208755027, 'samples': 4662528, 'steps': 24283, 'loss/train': 1.8512705564498901} -08/30/2021 17:32:43 - INFO - __main__ - Step 24285: {'lr': 0.0004725489032870079, 'samples': 4662720, 'steps': 24284, 'loss/train': 1.6501190662384033} -08/30/2021 17:32:43 - INFO - __main__ - Step 24286: {'lr': 0.000472546485598236, 'samples': 4662912, 'steps': 24285, 'loss/train': 1.2825064659118652} -08/30/2021 17:32:45 - INFO - __main__ - Step 24287: {'lr': 0.0004725440678091881, 'samples': 4663104, 'steps': 24286, 'loss/train': 1.427514672279358} -08/30/2021 17:32:45 - INFO - __main__ - Step 24288: {'lr': 0.00047254164991986525, 'samples': 4663296, 'steps': 24287, 'loss/train': 1.4465891122817993} -08/30/2021 17:32:46 - INFO - __main__ - Step 24289: {'lr': 0.0004725392319302686, 'samples': 4663488, 'steps': 24288, 'loss/train': 1.5587409734725952} -08/30/2021 17:32:46 - INFO - __main__ - Step 24290: {'lr': 0.0004725368138403992, 'samples': 4663680, 'steps': 24289, 'loss/train': 2.178434371948242} -08/30/2021 17:32:46 - INFO - __main__ - Step 24291: {'lr': 0.00047253439565025815, 'samples': 4663872, 'steps': 24290, 'loss/train': 1.6974729299545288} -08/30/2021 17:32:47 - INFO - __main__ - Step 24292: {'lr': 0.00047253197735984653, 'samples': 4664064, 'steps': 24291, 'loss/train': 1.7663254737854004} -08/30/2021 17:32:48 - INFO - __main__ - Step 24293: {'lr': 0.00047252955896916546, 'samples': 4664256, 'steps': 24292, 'loss/train': 0.25294041633605957} -08/30/2021 17:32:49 - INFO - __main__ - Step 24294: {'lr': 0.000472527140478216, 'samples': 4664448, 'steps': 24293, 'loss/train': 1.2851003408432007} -08/30/2021 17:32:49 - INFO - __main__ - Step 24295: {'lr': 0.00047252472188699917, 'samples': 4664640, 'steps': 24294, 'loss/train': 1.701158046722412} -08/30/2021 17:32:49 - INFO - __main__ - Step 24296: {'lr': 0.0004725223031955162, 'samples': 4664832, 'steps': 24295, 'loss/train': 1.6793968677520752} -08/30/2021 17:32:50 - INFO - __main__ - Step 24297: {'lr': 0.0004725198844037681, 'samples': 4665024, 'steps': 24296, 'loss/train': 1.1335865259170532} -08/30/2021 17:32:51 - INFO - __main__ - Step 24298: {'lr': 0.00047251746551175603, 'samples': 4665216, 'steps': 24297, 'loss/train': 3.253445863723755} -08/30/2021 17:32:52 - INFO - __main__ - Step 24299: {'lr': 0.000472515046519481, 'samples': 4665408, 'steps': 24298, 'loss/train': 1.2532851696014404} -08/30/2021 17:32:52 - INFO - __main__ - Step 24300: {'lr': 0.000472512627426944, 'samples': 4665600, 'steps': 24299, 'loss/train': 1.5509803295135498} -08/30/2021 17:32:52 - INFO - __main__ - Step 24301: {'lr': 0.0004725102082341464, 'samples': 4665792, 'steps': 24300, 'loss/train': 1.648585319519043} -08/30/2021 17:32:53 - INFO - __main__ - Step 24302: {'lr': 0.00047250778894108905, 'samples': 4665984, 'steps': 24301, 'loss/train': 1.331283688545227} -08/30/2021 17:32:54 - INFO - __main__ - Step 24303: {'lr': 0.0004725053695477731, 'samples': 4666176, 'steps': 24302, 'loss/train': 1.0451349020004272} -08/30/2021 17:32:55 - INFO - __main__ - Step 24304: {'lr': 0.0004725029500541997, 'samples': 4666368, 'steps': 24303, 'loss/train': 2.3015499114990234} -08/30/2021 17:32:55 - INFO - __main__ - Step 24305: {'lr': 0.00047250053046036996, 'samples': 4666560, 'steps': 24304, 'loss/train': 1.9148674011230469} -08/30/2021 17:32:55 - INFO - __main__ - Step 24306: {'lr': 0.00047249811076628483, 'samples': 4666752, 'steps': 24305, 'loss/train': 1.507433533668518} -08/30/2021 17:32:56 - INFO - __main__ - Step 24307: {'lr': 0.00047249569097194554, 'samples': 4666944, 'steps': 24306, 'loss/train': 1.850820779800415} -08/30/2021 17:32:58 - INFO - __main__ - Step 24308: {'lr': 0.0004724932710773531, 'samples': 4667136, 'steps': 24307, 'loss/train': 1.5423920154571533} -08/30/2021 17:32:58 - INFO - __main__ - Step 24309: {'lr': 0.00047249085108250867, 'samples': 4667328, 'steps': 24308, 'loss/train': 1.714725375175476} -08/30/2021 17:32:59 - INFO - __main__ - Step 24310: {'lr': 0.0004724884309874132, 'samples': 4667520, 'steps': 24309, 'loss/train': 1.6923638582229614} -08/30/2021 17:32:59 - INFO - __main__ - Step 24311: {'lr': 0.00047248601079206797, 'samples': 4667712, 'steps': 24310, 'loss/train': 1.9769870042800903} -08/30/2021 17:32:59 - INFO - __main__ - Step 24312: {'lr': 0.0004724835904964739, 'samples': 4667904, 'steps': 24311, 'loss/train': 1.5941286087036133} -08/30/2021 17:33:00 - INFO - __main__ - Step 24313: {'lr': 0.0004724811701006322, 'samples': 4668096, 'steps': 24312, 'loss/train': 0.18794506788253784} -08/30/2021 17:33:01 - INFO - __main__ - Step 24314: {'lr': 0.00047247874960454394, 'samples': 4668288, 'steps': 24313, 'loss/train': 1.3424668312072754} -08/30/2021 17:33:02 - INFO - __main__ - Step 24315: {'lr': 0.0004724763290082102, 'samples': 4668480, 'steps': 24314, 'loss/train': 2.002727746963501} -08/30/2021 17:33:02 - INFO - __main__ - Step 24316: {'lr': 0.000472473908311632, 'samples': 4668672, 'steps': 24315, 'loss/train': 1.3826675415039062} -08/30/2021 17:33:02 - INFO - __main__ - Step 24317: {'lr': 0.0004724714875148105, 'samples': 4668864, 'steps': 24316, 'loss/train': 1.2146414518356323} -08/30/2021 17:33:03 - INFO - __main__ - Step 24318: {'lr': 0.0004724690666177468, 'samples': 4669056, 'steps': 24317, 'loss/train': 1.3559935092926025} -08/30/2021 17:33:04 - INFO - __main__ - Step 24319: {'lr': 0.00047246664562044193, 'samples': 4669248, 'steps': 24318, 'loss/train': 1.227448582649231} -08/30/2021 17:33:05 - INFO - __main__ - Step 24320: {'lr': 0.0004724642245228971, 'samples': 4669440, 'steps': 24319, 'loss/train': 1.6217232942581177} -08/30/2021 17:33:05 - INFO - __main__ - Step 24321: {'lr': 0.0004724618033251133, 'samples': 4669632, 'steps': 24320, 'loss/train': 2.008260726928711} -08/30/2021 17:33:05 - INFO - __main__ - Step 24322: {'lr': 0.0004724593820270916, 'samples': 4669824, 'steps': 24321, 'loss/train': 1.8731880187988281} -08/30/2021 17:33:06 - INFO - __main__ - Step 24323: {'lr': 0.00047245696062883316, 'samples': 4670016, 'steps': 24322, 'loss/train': 1.4362927675247192} -08/30/2021 17:33:07 - INFO - __main__ - Step 24324: {'lr': 0.0004724545391303391, 'samples': 4670208, 'steps': 24323, 'loss/train': 1.5768028497695923} -08/30/2021 17:33:08 - INFO - __main__ - Step 24325: {'lr': 0.0004724521175316103, 'samples': 4670400, 'steps': 24324, 'loss/train': 1.0141940116882324} -08/30/2021 17:33:08 - INFO - __main__ - Step 24326: {'lr': 0.0004724496958326482, 'samples': 4670592, 'steps': 24325, 'loss/train': 1.013269305229187} -08/30/2021 17:33:08 - INFO - __main__ - Step 24327: {'lr': 0.00047244727403345356, 'samples': 4670784, 'steps': 24326, 'loss/train': 1.1677967309951782} -08/30/2021 17:33:09 - INFO - __main__ - Step 24328: {'lr': 0.00047244485213402765, 'samples': 4670976, 'steps': 24327, 'loss/train': 1.6913164854049683} -08/30/2021 17:33:10 - INFO - __main__ - Step 24329: {'lr': 0.0004724424301343716, 'samples': 4671168, 'steps': 24328, 'loss/train': 1.6653810739517212} -08/30/2021 17:33:11 - INFO - __main__ - Step 24330: {'lr': 0.00047244000803448635, 'samples': 4671360, 'steps': 24329, 'loss/train': 0.9741966724395752} -08/30/2021 17:33:11 - INFO - __main__ - Step 24331: {'lr': 0.000472437585834373, 'samples': 4671552, 'steps': 24330, 'loss/train': 1.6117873191833496} -08/30/2021 17:33:12 - INFO - __main__ - Step 24332: {'lr': 0.00047243516353403283, 'samples': 4671744, 'steps': 24331, 'loss/train': 1.9478338956832886} -08/30/2021 17:33:12 - INFO - __main__ - Step 24333: {'lr': 0.0004724327411334668, 'samples': 4671936, 'steps': 24332, 'loss/train': 1.7630128860473633} -08/30/2021 17:33:12 - INFO - __main__ - Step 24334: {'lr': 0.00047243031863267594, 'samples': 4672128, 'steps': 24333, 'loss/train': 1.1125938892364502} -08/30/2021 17:33:14 - INFO - __main__ - Step 24335: {'lr': 0.0004724278960316615, 'samples': 4672320, 'steps': 24334, 'loss/train': 1.0044838190078735} -08/30/2021 17:33:14 - INFO - __main__ - Step 24336: {'lr': 0.00047242547333042434, 'samples': 4672512, 'steps': 24335, 'loss/train': 1.2330117225646973} -08/30/2021 17:33:15 - INFO - __main__ - Step 24337: {'lr': 0.0004724230505289658, 'samples': 4672704, 'steps': 24336, 'loss/train': 1.748183250427246} -08/30/2021 17:33:15 - INFO - __main__ - Step 24338: {'lr': 0.0004724206276272868, 'samples': 4672896, 'steps': 24337, 'loss/train': 1.4580626487731934} -08/30/2021 17:33:15 - INFO - __main__ - Step 24339: {'lr': 0.0004724182046253885, 'samples': 4673088, 'steps': 24338, 'loss/train': 0.9954025149345398} -08/30/2021 17:33:17 - INFO - __main__ - Step 24340: {'lr': 0.0004724157815232721, 'samples': 4673280, 'steps': 24339, 'loss/train': 1.7079565525054932} -08/30/2021 17:33:18 - INFO - __main__ - Step 24341: {'lr': 0.00047241335832093844, 'samples': 4673472, 'steps': 24340, 'loss/train': 1.7329707145690918} -08/30/2021 17:33:18 - INFO - __main__ - Step 24342: {'lr': 0.00047241093501838887, 'samples': 4673664, 'steps': 24341, 'loss/train': 1.664844274520874} -08/30/2021 17:33:19 - INFO - __main__ - Step 24343: {'lr': 0.00047240851161562433, 'samples': 4673856, 'steps': 24342, 'loss/train': 1.1673303842544556} -08/30/2021 17:33:19 - INFO - __main__ - Step 24344: {'lr': 0.00047240608811264595, 'samples': 4674048, 'steps': 24343, 'loss/train': 1.3469853401184082} -08/30/2021 17:33:21 - INFO - __main__ - Step 24345: {'lr': 0.0004724036645094548, 'samples': 4674240, 'steps': 24344, 'loss/train': 1.9298440217971802} -08/30/2021 17:33:21 - INFO - __main__ - Step 24346: {'lr': 0.00047240124080605197, 'samples': 4674432, 'steps': 24345, 'loss/train': 1.7860263586044312} -08/30/2021 17:33:21 - INFO - __main__ - Step 24347: {'lr': 0.0004723988170024386, 'samples': 4674624, 'steps': 24346, 'loss/train': 1.76042902469635} -08/30/2021 17:33:22 - INFO - __main__ - Step 24348: {'lr': 0.0004723963930986157, 'samples': 4674816, 'steps': 24347, 'loss/train': 1.1373618841171265} -08/30/2021 17:33:22 - INFO - __main__ - Step 24349: {'lr': 0.0004723939690945845, 'samples': 4675008, 'steps': 24348, 'loss/train': 0.9944627285003662} -08/30/2021 17:33:22 - INFO - __main__ - Step 24350: {'lr': 0.000472391544990346, 'samples': 4675200, 'steps': 24349, 'loss/train': 1.1673153638839722} -08/30/2021 17:33:24 - INFO - __main__ - Step 24351: {'lr': 0.0004723891207859012, 'samples': 4675392, 'steps': 24350, 'loss/train': 1.4055306911468506} -08/30/2021 17:33:24 - INFO - __main__ - Step 24352: {'lr': 0.00047238669648125146, 'samples': 4675584, 'steps': 24351, 'loss/train': 2.0462114810943604} -08/30/2021 17:33:25 - INFO - __main__ - Step 24353: {'lr': 0.00047238427207639755, 'samples': 4675776, 'steps': 24352, 'loss/train': 1.9095929861068726} -08/30/2021 17:33:25 - INFO - __main__ - Step 24354: {'lr': 0.0004723818475713408, 'samples': 4675968, 'steps': 24353, 'loss/train': 1.2838232517242432} -08/30/2021 17:33:25 - INFO - __main__ - Step 24355: {'lr': 0.00047237942296608223, 'samples': 4676160, 'steps': 24354, 'loss/train': 1.488679051399231} -08/30/2021 17:33:27 - INFO - __main__ - Step 24356: {'lr': 0.00047237699826062286, 'samples': 4676352, 'steps': 24355, 'loss/train': 1.953740119934082} -08/30/2021 17:33:27 - INFO - __main__ - Step 24357: {'lr': 0.0004723745734549639, 'samples': 4676544, 'steps': 24356, 'loss/train': 1.2457115650177002} -08/30/2021 17:33:28 - INFO - __main__ - Step 24358: {'lr': 0.0004723721485491064, 'samples': 4676736, 'steps': 24357, 'loss/train': 1.6974021196365356} -08/30/2021 17:33:28 - INFO - __main__ - Step 24359: {'lr': 0.0004723697235430514, 'samples': 4676928, 'steps': 24358, 'loss/train': 1.1630061864852905} -08/30/2021 17:33:29 - INFO - __main__ - Step 24360: {'lr': 0.0004723672984368, 'samples': 4677120, 'steps': 24359, 'loss/train': 2.0134353637695312} -08/30/2021 17:33:29 - INFO - __main__ - Step 24361: {'lr': 0.00047236487323035344, 'samples': 4677312, 'steps': 24360, 'loss/train': 1.538875699043274} -08/30/2021 17:33:30 - INFO - __main__ - Step 24362: {'lr': 0.00047236244792371265, 'samples': 4677504, 'steps': 24361, 'loss/train': 1.7127004861831665} -08/30/2021 17:33:31 - INFO - __main__ - Step 24363: {'lr': 0.0004723600225168787, 'samples': 4677696, 'steps': 24362, 'loss/train': 1.7155966758728027} -08/30/2021 17:33:31 - INFO - __main__ - Step 24364: {'lr': 0.0004723575970098528, 'samples': 4677888, 'steps': 24363, 'loss/train': 1.8337619304656982} -08/30/2021 17:33:31 - INFO - __main__ - Step 24365: {'lr': 0.00047235517140263605, 'samples': 4678080, 'steps': 24364, 'loss/train': 1.7331677675247192} -08/30/2021 17:33:32 - INFO - __main__ - Step 24366: {'lr': 0.00047235274569522946, 'samples': 4678272, 'steps': 24365, 'loss/train': 1.7484673261642456} -08/30/2021 17:33:33 - INFO - __main__ - Step 24367: {'lr': 0.0004723503198876341, 'samples': 4678464, 'steps': 24366, 'loss/train': 1.4265400171279907} -08/30/2021 17:33:34 - INFO - __main__ - Step 24368: {'lr': 0.0004723478939798512, 'samples': 4678656, 'steps': 24367, 'loss/train': 1.637850284576416} -08/30/2021 17:33:34 - INFO - __main__ - Step 24369: {'lr': 0.0004723454679718817, 'samples': 4678848, 'steps': 24368, 'loss/train': 1.5267797708511353} -08/30/2021 17:33:34 - INFO - __main__ - Step 24370: {'lr': 0.00047234304186372685, 'samples': 4679040, 'steps': 24369, 'loss/train': 1.452715277671814} -08/30/2021 17:33:35 - INFO - __main__ - Step 24371: {'lr': 0.00047234061565538753, 'samples': 4679232, 'steps': 24370, 'loss/train': 1.788153886795044} -08/30/2021 17:33:36 - INFO - __main__ - Step 24372: {'lr': 0.0004723381893468651, 'samples': 4679424, 'steps': 24371, 'loss/train': 1.638181209564209} -08/30/2021 17:33:37 - INFO - __main__ - Step 24373: {'lr': 0.00047233576293816045, 'samples': 4679616, 'steps': 24372, 'loss/train': 2.1719155311584473} -08/30/2021 17:33:37 - INFO - __main__ - Step 24374: {'lr': 0.00047233333642927465, 'samples': 4679808, 'steps': 24373, 'loss/train': 1.6320966482162476} -08/30/2021 17:33:37 - INFO - __main__ - Step 24375: {'lr': 0.000472330909820209, 'samples': 4680000, 'steps': 24374, 'loss/train': 2.1833300590515137} -08/30/2021 17:33:38 - INFO - __main__ - Step 24376: {'lr': 0.0004723284831109644, 'samples': 4680192, 'steps': 24375, 'loss/train': 1.494808554649353} -08/30/2021 17:33:39 - INFO - __main__ - Step 24377: {'lr': 0.0004723260563015421, 'samples': 4680384, 'steps': 24376, 'loss/train': 1.3499294519424438} -08/30/2021 17:33:40 - INFO - __main__ - Step 24378: {'lr': 0.00047232362939194305, 'samples': 4680576, 'steps': 24377, 'loss/train': 1.245821475982666} -08/30/2021 17:33:40 - INFO - __main__ - Step 24379: {'lr': 0.0004723212023821684, 'samples': 4680768, 'steps': 24378, 'loss/train': 1.4235199689865112} -08/30/2021 17:33:40 - INFO - __main__ - Step 24380: {'lr': 0.0004723187752722193, 'samples': 4680960, 'steps': 24379, 'loss/train': 1.8682743310928345} -08/30/2021 17:33:41 - INFO - __main__ - Step 24381: {'lr': 0.00047231634806209675, 'samples': 4681152, 'steps': 24380, 'loss/train': 1.592482328414917} -08/30/2021 17:33:42 - INFO - __main__ - Step 24382: {'lr': 0.0004723139207518019, 'samples': 4681344, 'steps': 24381, 'loss/train': 1.9671236276626587} -08/30/2021 17:33:43 - INFO - __main__ - Step 24383: {'lr': 0.00047231149334133577, 'samples': 4681536, 'steps': 24382, 'loss/train': 1.4625492095947266} -08/30/2021 17:33:43 - INFO - __main__ - Step 24384: {'lr': 0.00047230906583069953, 'samples': 4681728, 'steps': 24383, 'loss/train': 0.7411932945251465} -08/30/2021 17:33:44 - INFO - __main__ - Step 24385: {'lr': 0.0004723066382198943, 'samples': 4681920, 'steps': 24384, 'loss/train': 1.7482298612594604} -08/30/2021 17:33:44 - INFO - __main__ - Step 24386: {'lr': 0.00047230421050892116, 'samples': 4682112, 'steps': 24385, 'loss/train': 1.3088852167129517} -08/30/2021 17:33:46 - INFO - __main__ - Step 24387: {'lr': 0.00047230178269778105, 'samples': 4682304, 'steps': 24386, 'loss/train': 1.6270971298217773} -08/30/2021 17:33:46 - INFO - __main__ - Step 24388: {'lr': 0.00047229935478647524, 'samples': 4682496, 'steps': 24387, 'loss/train': 1.438279628753662} -08/30/2021 17:33:47 - INFO - __main__ - Step 24389: {'lr': 0.0004722969267750048, 'samples': 4682688, 'steps': 24388, 'loss/train': 0.08078933507204056} -08/30/2021 17:33:47 - INFO - __main__ - Step 24390: {'lr': 0.0004722944986633708, 'samples': 4682880, 'steps': 24389, 'loss/train': 1.1382778882980347} -08/30/2021 17:33:47 - INFO - __main__ - Step 24391: {'lr': 0.0004722920704515743, 'samples': 4683072, 'steps': 24390, 'loss/train': 1.44602370262146} -08/30/2021 17:33:48 - INFO - __main__ - Step 24392: {'lr': 0.00047228964213961647, 'samples': 4683264, 'steps': 24391, 'loss/train': 1.3812720775604248} -08/30/2021 17:33:48 - INFO - __main__ - Step 24393: {'lr': 0.00047228721372749826, 'samples': 4683456, 'steps': 24392, 'loss/train': 1.5855101346969604} -08/30/2021 17:33:50 - INFO - __main__ - Step 24394: {'lr': 0.000472284785215221, 'samples': 4683648, 'steps': 24393, 'loss/train': 1.642717957496643} -08/30/2021 17:33:51 - INFO - __main__ - Step 24395: {'lr': 0.0004722823566027855, 'samples': 4683840, 'steps': 24394, 'loss/train': 1.7613502740859985} -08/30/2021 17:33:51 - INFO - __main__ - Step 24396: {'lr': 0.00047227992789019316, 'samples': 4684032, 'steps': 24395, 'loss/train': 1.6548693180084229} -08/30/2021 17:33:51 - INFO - __main__ - Step 24397: {'lr': 0.0004722774990774448, 'samples': 4684224, 'steps': 24396, 'loss/train': 1.6467336416244507} -08/30/2021 17:33:52 - INFO - __main__ - Step 24398: {'lr': 0.00047227507016454163, 'samples': 4684416, 'steps': 24397, 'loss/train': 1.679891586303711} -08/30/2021 17:33:53 - INFO - __main__ - Step 24399: {'lr': 0.00047227264115148475, 'samples': 4684608, 'steps': 24398, 'loss/train': 1.6772023439407349} -08/30/2021 17:33:54 - INFO - __main__ - Step 24400: {'lr': 0.00047227021203827523, 'samples': 4684800, 'steps': 24399, 'loss/train': 1.7842049598693848} -08/30/2021 17:33:54 - INFO - __main__ - Step 24401: {'lr': 0.0004722677828249142, 'samples': 4684992, 'steps': 24400, 'loss/train': 1.0591225624084473} -08/30/2021 17:33:54 - INFO - __main__ - Step 24402: {'lr': 0.0004722653535114028, 'samples': 4685184, 'steps': 24401, 'loss/train': 1.6557775735855103} -08/30/2021 17:33:55 - INFO - __main__ - Step 24403: {'lr': 0.00047226292409774205, 'samples': 4685376, 'steps': 24402, 'loss/train': 0.9989805817604065} -08/30/2021 17:33:56 - INFO - __main__ - Step 24404: {'lr': 0.00047226049458393306, 'samples': 4685568, 'steps': 24403, 'loss/train': 1.0077651739120483} -08/30/2021 17:33:57 - INFO - __main__ - Step 24405: {'lr': 0.0004722580649699768, 'samples': 4685760, 'steps': 24404, 'loss/train': 1.518217921257019} -08/30/2021 17:33:57 - INFO - __main__ - Step 24406: {'lr': 0.00047225563525587463, 'samples': 4685952, 'steps': 24405, 'loss/train': 1.2954621315002441} -08/30/2021 17:33:57 - INFO - __main__ - Step 24407: {'lr': 0.0004722532054416274, 'samples': 4686144, 'steps': 24406, 'loss/train': 2.0343549251556396} -08/30/2021 17:33:58 - INFO - __main__ - Step 24408: {'lr': 0.0004722507755272364, 'samples': 4686336, 'steps': 24407, 'loss/train': 1.5305819511413574} -08/30/2021 17:33:58 - INFO - __main__ - Step 24409: {'lr': 0.0004722483455127026, 'samples': 4686528, 'steps': 24408, 'loss/train': 1.5015907287597656} -08/30/2021 17:34:00 - INFO - __main__ - Step 24410: {'lr': 0.000472245915398027, 'samples': 4686720, 'steps': 24409, 'loss/train': 0.2329707145690918} -08/30/2021 17:34:00 - INFO - __main__ - Step 24411: {'lr': 0.0004722434851832109, 'samples': 4686912, 'steps': 24410, 'loss/train': 0.9077503085136414} -08/30/2021 17:34:00 - INFO - __main__ - Step 24412: {'lr': 0.00047224105486825543, 'samples': 4687104, 'steps': 24411, 'loss/train': 1.0722583532333374} -08/30/2021 17:34:01 - INFO - __main__ - Step 24413: {'lr': 0.0004722386244531615, 'samples': 4687296, 'steps': 24412, 'loss/train': 1.7993780374526978} -08/30/2021 17:34:01 - INFO - __main__ - Step 24414: {'lr': 0.0004722361939379302, 'samples': 4687488, 'steps': 24413, 'loss/train': 0.5120288133621216} -08/30/2021 17:34:03 - INFO - __main__ - Step 24415: {'lr': 0.0004722337633225627, 'samples': 4687680, 'steps': 24414, 'loss/train': 1.5795621871948242} -08/30/2021 17:34:03 - INFO - __main__ - Step 24416: {'lr': 0.0004722313326070602, 'samples': 4687872, 'steps': 24415, 'loss/train': 1.7287003993988037} -08/30/2021 17:34:04 - INFO - __main__ - Step 24417: {'lr': 0.00047222890179142365, 'samples': 4688064, 'steps': 24416, 'loss/train': 1.6448042392730713} -08/30/2021 17:34:04 - INFO - __main__ - Step 24418: {'lr': 0.00047222647087565413, 'samples': 4688256, 'steps': 24417, 'loss/train': 1.8849087953567505} -08/30/2021 17:34:04 - INFO - __main__ - Step 24419: {'lr': 0.0004722240398597528, 'samples': 4688448, 'steps': 24418, 'loss/train': 1.5503348112106323} -08/30/2021 17:34:06 - INFO - __main__ - Step 24420: {'lr': 0.0004722216087437208, 'samples': 4688640, 'steps': 24419, 'loss/train': 1.3734948635101318} -08/30/2021 17:34:06 - INFO - __main__ - Step 24421: {'lr': 0.0004722191775275592, 'samples': 4688832, 'steps': 24420, 'loss/train': 1.6976292133331299} -08/30/2021 17:34:07 - INFO - __main__ - Step 24422: {'lr': 0.00047221674621126896, 'samples': 4689024, 'steps': 24421, 'loss/train': 1.557907223701477} -08/30/2021 17:34:07 - INFO - __main__ - Step 24423: {'lr': 0.0004722143147948513, 'samples': 4689216, 'steps': 24422, 'loss/train': 1.8630753755569458} -08/30/2021 17:34:07 - INFO - __main__ - Step 24424: {'lr': 0.0004722118832783074, 'samples': 4689408, 'steps': 24423, 'loss/train': 1.3790898323059082} -08/30/2021 17:34:09 - INFO - __main__ - Step 24425: {'lr': 0.0004722094516616382, 'samples': 4689600, 'steps': 24424, 'loss/train': 1.4910532236099243} -08/30/2021 17:34:09 - INFO - __main__ - Step 24426: {'lr': 0.0004722070199448448, 'samples': 4689792, 'steps': 24425, 'loss/train': 1.119583010673523} -08/30/2021 17:34:10 - INFO - __main__ - Step 24427: {'lr': 0.00047220458812792846, 'samples': 4689984, 'steps': 24426, 'loss/train': 1.6967073678970337} -08/30/2021 17:34:10 - INFO - __main__ - Step 24428: {'lr': 0.00047220215621089005, 'samples': 4690176, 'steps': 24427, 'loss/train': 1.7348392009735107} -08/30/2021 17:34:10 - INFO - __main__ - Step 24429: {'lr': 0.00047219972419373083, 'samples': 4690368, 'steps': 24428, 'loss/train': 2.005463123321533} -08/30/2021 17:34:11 - INFO - __main__ - Step 24430: {'lr': 0.00047219729207645183, 'samples': 4690560, 'steps': 24429, 'loss/train': 1.2426892518997192} -08/30/2021 17:34:12 - INFO - __main__ - Step 24431: {'lr': 0.0004721948598590542, 'samples': 4690752, 'steps': 24430, 'loss/train': 1.5733124017715454} -08/30/2021 17:34:12 - INFO - __main__ - Step 24432: {'lr': 0.0004721924275415389, 'samples': 4690944, 'steps': 24431, 'loss/train': 1.5471230745315552} -08/30/2021 17:34:13 - INFO - __main__ - Step 24433: {'lr': 0.0004721899951239072, 'samples': 4691136, 'steps': 24432, 'loss/train': 1.5222989320755005} -08/30/2021 17:34:13 - INFO - __main__ - Step 24434: {'lr': 0.0004721875626061601, 'samples': 4691328, 'steps': 24433, 'loss/train': 1.4067974090576172} -08/30/2021 17:34:14 - INFO - __main__ - Step 24435: {'lr': 0.00047218512998829874, 'samples': 4691520, 'steps': 24434, 'loss/train': 2.027573823928833} -08/30/2021 17:34:15 - INFO - __main__ - Step 24436: {'lr': 0.00047218269727032413, 'samples': 4691712, 'steps': 24435, 'loss/train': 0.8910576701164246} -08/30/2021 17:34:15 - INFO - __main__ - Step 24437: {'lr': 0.00047218026445223745, 'samples': 4691904, 'steps': 24436, 'loss/train': 1.7636796236038208} -08/30/2021 17:34:16 - INFO - __main__ - Step 24438: {'lr': 0.0004721778315340398, 'samples': 4692096, 'steps': 24437, 'loss/train': 2.344608783721924} -08/30/2021 17:34:16 - INFO - __main__ - Step 24439: {'lr': 0.0004721753985157322, 'samples': 4692288, 'steps': 24438, 'loss/train': 1.692981243133545} -08/30/2021 17:34:17 - INFO - __main__ - Step 24440: {'lr': 0.0004721729653973158, 'samples': 4692480, 'steps': 24439, 'loss/train': 1.5303928852081299} -08/30/2021 17:34:19 - INFO - __main__ - Step 24441: {'lr': 0.0004721705321787917, 'samples': 4692672, 'steps': 24440, 'loss/train': 1.9622113704681396} -08/30/2021 17:34:20 - INFO - __main__ - Step 24442: {'lr': 0.00047216809886016097, 'samples': 4692864, 'steps': 24441, 'loss/train': 1.4492759704589844} -08/30/2021 17:34:20 - INFO - __main__ - Step 24443: {'lr': 0.0004721656654414248, 'samples': 4693056, 'steps': 24442, 'loss/train': 2.025129795074463} -08/30/2021 17:34:20 - INFO - __main__ - Step 24444: {'lr': 0.00047216323192258416, 'samples': 4693248, 'steps': 24443, 'loss/train': 1.435434103012085} -08/30/2021 17:34:21 - INFO - __main__ - Step 24445: {'lr': 0.0004721607983036401, 'samples': 4693440, 'steps': 24444, 'loss/train': 1.6196428537368774} -08/30/2021 17:34:21 - INFO - __main__ - Step 24446: {'lr': 0.00047215836458459393, 'samples': 4693632, 'steps': 24445, 'loss/train': 1.436138391494751} -08/30/2021 17:34:23 - INFO - __main__ - Step 24447: {'lr': 0.00047215593076544663, 'samples': 4693824, 'steps': 24446, 'loss/train': 1.5719879865646362} -08/30/2021 17:34:23 - INFO - __main__ - Step 24448: {'lr': 0.0004721534968461992, 'samples': 4694016, 'steps': 24447, 'loss/train': 2.2825469970703125} -08/30/2021 17:34:24 - INFO - __main__ - Step 24449: {'lr': 0.00047215106282685296, 'samples': 4694208, 'steps': 24448, 'loss/train': 1.108061671257019} -08/30/2021 17:34:24 - INFO - __main__ - Step 24450: {'lr': 0.0004721486287074088, 'samples': 4694400, 'steps': 24449, 'loss/train': 1.4066286087036133} -08/30/2021 17:34:25 - INFO - __main__ - Step 24451: {'lr': 0.0004721461944878679, 'samples': 4694592, 'steps': 24450, 'loss/train': 1.2571030855178833} -08/30/2021 17:34:26 - INFO - __main__ - Step 24452: {'lr': 0.00047214376016823143, 'samples': 4694784, 'steps': 24451, 'loss/train': 1.665950894355774} -08/30/2021 17:34:27 - INFO - __main__ - Step 24453: {'lr': 0.0004721413257485003, 'samples': 4694976, 'steps': 24452, 'loss/train': 1.733527421951294} -08/30/2021 17:34:27 - INFO - __main__ - Step 24454: {'lr': 0.0004721388912286758, 'samples': 4695168, 'steps': 24453, 'loss/train': 2.084660768508911} -08/30/2021 17:34:27 - INFO - __main__ - Step 24455: {'lr': 0.0004721364566087589, 'samples': 4695360, 'steps': 24454, 'loss/train': 1.8475679159164429} -08/30/2021 17:34:28 - INFO - __main__ - Step 24456: {'lr': 0.00047213402188875077, 'samples': 4695552, 'steps': 24455, 'loss/train': 1.7513166666030884} -08/30/2021 17:34:29 - INFO - __main__ - Step 24457: {'lr': 0.00047213158706865246, 'samples': 4695744, 'steps': 24456, 'loss/train': 1.285531759262085} -08/30/2021 17:34:30 - INFO - __main__ - Step 24458: {'lr': 0.000472129152148465, 'samples': 4695936, 'steps': 24457, 'loss/train': 1.658231496810913} -08/30/2021 17:34:30 - INFO - __main__ - Step 24459: {'lr': 0.0004721267171281897, 'samples': 4696128, 'steps': 24458, 'loss/train': 0.07067694514989853} -08/30/2021 17:34:30 - INFO - __main__ - Step 24460: {'lr': 0.00047212428200782744, 'samples': 4696320, 'steps': 24459, 'loss/train': 1.6212053298950195} -08/30/2021 17:34:31 - INFO - __main__ - Step 24461: {'lr': 0.00047212184678737946, 'samples': 4696512, 'steps': 24460, 'loss/train': 1.081878423690796} -08/30/2021 17:34:31 - INFO - __main__ - Step 24462: {'lr': 0.00047211941146684677, 'samples': 4696704, 'steps': 24461, 'loss/train': 0.767326295375824} -08/30/2021 17:34:32 - INFO - __main__ - Step 24463: {'lr': 0.00047211697604623056, 'samples': 4696896, 'steps': 24462, 'loss/train': 1.8081620931625366} -08/30/2021 17:34:33 - INFO - __main__ - Step 24464: {'lr': 0.0004721145405255318, 'samples': 4697088, 'steps': 24463, 'loss/train': 1.461976408958435} -08/30/2021 17:34:33 - INFO - __main__ - Step 24465: {'lr': 0.00047211210490475167, 'samples': 4697280, 'steps': 24464, 'loss/train': 1.7162853479385376} -08/30/2021 17:34:34 - INFO - __main__ - Step 24466: {'lr': 0.0004721096691838913, 'samples': 4697472, 'steps': 24465, 'loss/train': 1.5274393558502197} -08/30/2021 17:34:34 - INFO - __main__ - Step 24467: {'lr': 0.00047210723336295167, 'samples': 4697664, 'steps': 24466, 'loss/train': 1.5892138481140137} -08/30/2021 17:34:36 - INFO - __main__ - Step 24468: {'lr': 0.00047210479744193404, 'samples': 4697856, 'steps': 24467, 'loss/train': 1.749915361404419} -08/30/2021 17:34:36 - INFO - __main__ - Step 24469: {'lr': 0.0004721023614208393, 'samples': 4698048, 'steps': 24468, 'loss/train': 1.882742166519165} -08/30/2021 17:34:36 - INFO - __main__ - Step 24470: {'lr': 0.0004720999252996687, 'samples': 4698240, 'steps': 24469, 'loss/train': 1.774699330329895} -08/30/2021 17:34:37 - INFO - __main__ - Step 24471: {'lr': 0.00047209748907842337, 'samples': 4698432, 'steps': 24470, 'loss/train': 1.6665769815444946} -08/30/2021 17:34:37 - INFO - __main__ - Step 24472: {'lr': 0.0004720950527571043, 'samples': 4698624, 'steps': 24471, 'loss/train': 1.5818909406661987} -08/30/2021 17:34:39 - INFO - __main__ - Step 24473: {'lr': 0.0004720926163357126, 'samples': 4698816, 'steps': 24472, 'loss/train': 1.6217882633209229} -08/30/2021 17:34:40 - INFO - __main__ - Step 24474: {'lr': 0.0004720901798142494, 'samples': 4699008, 'steps': 24473, 'loss/train': 1.221812129020691} -08/30/2021 17:34:40 - INFO - __main__ - Step 24475: {'lr': 0.00047208774319271586, 'samples': 4699200, 'steps': 24474, 'loss/train': 1.7934091091156006} -08/30/2021 17:34:40 - INFO - __main__ - Step 24476: {'lr': 0.00047208530647111294, 'samples': 4699392, 'steps': 24475, 'loss/train': 1.7955983877182007} -08/30/2021 17:34:41 - INFO - __main__ - Step 24477: {'lr': 0.0004720828696494418, 'samples': 4699584, 'steps': 24476, 'loss/train': 1.424503207206726} -08/30/2021 17:34:41 - INFO - __main__ - Step 24478: {'lr': 0.00047208043272770354, 'samples': 4699776, 'steps': 24477, 'loss/train': 0.26392412185668945} -08/30/2021 17:34:42 - INFO - __main__ - Step 24479: {'lr': 0.0004720779957058993, 'samples': 4699968, 'steps': 24478, 'loss/train': 1.5823725461959839} -08/30/2021 17:34:43 - INFO - __main__ - Step 24480: {'lr': 0.0004720755585840302, 'samples': 4700160, 'steps': 24479, 'loss/train': 1.8605295419692993} -08/30/2021 17:34:43 - INFO - __main__ - Step 24481: {'lr': 0.0004720731213620972, 'samples': 4700352, 'steps': 24480, 'loss/train': 1.994153618812561} -08/30/2021 17:34:44 - INFO - __main__ - Step 24482: {'lr': 0.00047207068404010147, 'samples': 4700544, 'steps': 24481, 'loss/train': 2.2493860721588135} -08/30/2021 17:34:44 - INFO - __main__ - Step 24483: {'lr': 0.00047206824661804415, 'samples': 4700736, 'steps': 24482, 'loss/train': 2.090334892272949} -08/30/2021 17:34:44 - INFO - __main__ - Step 24484: {'lr': 0.0004720658090959263, 'samples': 4700928, 'steps': 24483, 'loss/train': 1.520559310913086} -08/30/2021 17:34:46 - INFO - __main__ - Step 24485: {'lr': 0.000472063371473749, 'samples': 4701120, 'steps': 24484, 'loss/train': 1.8299134969711304} -08/30/2021 17:34:46 - INFO - __main__ - Step 24486: {'lr': 0.0004720609337515134, 'samples': 4701312, 'steps': 24485, 'loss/train': 1.7684216499328613} -08/30/2021 17:34:47 - INFO - __main__ - Step 24487: {'lr': 0.00047205849592922057, 'samples': 4701504, 'steps': 24486, 'loss/train': 1.4957983493804932} -08/30/2021 17:34:47 - INFO - __main__ - Step 24488: {'lr': 0.00047205605800687154, 'samples': 4701696, 'steps': 24487, 'loss/train': 1.4721304178237915} -08/30/2021 17:34:47 - INFO - __main__ - Step 24489: {'lr': 0.0004720536199844676, 'samples': 4701888, 'steps': 24488, 'loss/train': 1.8148545026779175} -08/30/2021 17:34:49 - INFO - __main__ - Step 24490: {'lr': 0.00047205118186200963, 'samples': 4702080, 'steps': 24489, 'loss/train': 1.6523698568344116} -08/30/2021 17:34:49 - INFO - __main__ - Step 24491: {'lr': 0.00047204874363949886, 'samples': 4702272, 'steps': 24490, 'loss/train': 1.5222666263580322} -08/30/2021 17:34:50 - INFO - __main__ - Step 24492: {'lr': 0.00047204630531693634, 'samples': 4702464, 'steps': 24491, 'loss/train': 1.5540434122085571} -08/30/2021 17:34:50 - INFO - __main__ - Step 24493: {'lr': 0.0004720438668943232, 'samples': 4702656, 'steps': 24492, 'loss/train': 1.5921696424484253} -08/30/2021 17:34:50 - INFO - __main__ - Step 24494: {'lr': 0.0004720414283716605, 'samples': 4702848, 'steps': 24493, 'loss/train': 1.4510645866394043} -08/30/2021 17:34:52 - INFO - __main__ - Step 24495: {'lr': 0.00047203898974894934, 'samples': 4703040, 'steps': 24494, 'loss/train': 1.844099998474121} -08/30/2021 17:34:52 - INFO - __main__ - Step 24496: {'lr': 0.0004720365510261909, 'samples': 4703232, 'steps': 24495, 'loss/train': 1.3378582000732422} -08/30/2021 17:34:53 - INFO - __main__ - Step 24497: {'lr': 0.00047203411220338615, 'samples': 4703424, 'steps': 24496, 'loss/train': 1.5024641752243042} -08/30/2021 17:34:53 - INFO - __main__ - Step 24498: {'lr': 0.00047203167328053634, 'samples': 4703616, 'steps': 24497, 'loss/train': 1.207093358039856} -08/30/2021 17:34:53 - INFO - __main__ - Step 24499: {'lr': 0.0004720292342576423, 'samples': 4703808, 'steps': 24498, 'loss/train': 1.2374742031097412} -08/30/2021 17:34:55 - INFO - __main__ - Step 24500: {'lr': 0.0004720267951347055, 'samples': 4704000, 'steps': 24499, 'loss/train': 1.4379520416259766} -08/30/2021 17:34:55 - INFO - __main__ - Step 24501: {'lr': 0.00047202435591172677, 'samples': 4704192, 'steps': 24500, 'loss/train': 1.6501487493515015} -08/30/2021 17:34:56 - INFO - __main__ - Step 24502: {'lr': 0.00047202191658870737, 'samples': 4704384, 'steps': 24501, 'loss/train': 1.4039591550827026} -08/30/2021 17:34:56 - INFO - __main__ - Step 24503: {'lr': 0.00047201947716564826, 'samples': 4704576, 'steps': 24502, 'loss/train': 1.4813679456710815} -08/30/2021 17:34:56 - INFO - __main__ - Step 24504: {'lr': 0.00047201703764255057, 'samples': 4704768, 'steps': 24503, 'loss/train': 1.0740585327148438} -08/30/2021 17:34:58 - INFO - __main__ - Step 24505: {'lr': 0.0004720145980194155, 'samples': 4704960, 'steps': 24504, 'loss/train': 1.3868985176086426} -08/30/2021 17:34:59 - INFO - __main__ - Step 24506: {'lr': 0.000472012158296244, 'samples': 4705152, 'steps': 24505, 'loss/train': 1.3370076417922974} -08/30/2021 17:34:59 - INFO - __main__ - Step 24507: {'lr': 0.0004720097184730373, 'samples': 4705344, 'steps': 24506, 'loss/train': 1.75924551486969} -08/30/2021 17:34:59 - INFO - __main__ - Step 24508: {'lr': 0.00047200727854979644, 'samples': 4705536, 'steps': 24507, 'loss/train': 1.5830689668655396} -08/30/2021 17:35:00 - INFO - __main__ - Step 24509: {'lr': 0.00047200483852652257, 'samples': 4705728, 'steps': 24508, 'loss/train': 1.1779227256774902} -08/30/2021 17:35:01 - INFO - __main__ - Step 24510: {'lr': 0.0004720023984032167, 'samples': 4705920, 'steps': 24509, 'loss/train': 0.502585768699646} -08/30/2021 17:35:02 - INFO - __main__ - Step 24511: {'lr': 0.00047199995817987997, 'samples': 4706112, 'steps': 24510, 'loss/train': 0.9358653426170349} -08/30/2021 17:35:02 - INFO - __main__ - Step 24512: {'lr': 0.00047199751785651346, 'samples': 4706304, 'steps': 24511, 'loss/train': 1.063664436340332} -08/30/2021 17:35:02 - INFO - __main__ - Step 24513: {'lr': 0.0004719950774331183, 'samples': 4706496, 'steps': 24512, 'loss/train': 2.2083916664123535} -08/30/2021 17:35:03 - INFO - __main__ - Step 24514: {'lr': 0.00047199263690969563, 'samples': 4706688, 'steps': 24513, 'loss/train': 1.5452370643615723} -08/30/2021 17:35:04 - INFO - __main__ - Step 24515: {'lr': 0.00047199019628624647, 'samples': 4706880, 'steps': 24514, 'loss/train': 1.8068499565124512} -08/30/2021 17:35:05 - INFO - __main__ - Step 24516: {'lr': 0.00047198775556277195, 'samples': 4707072, 'steps': 24515, 'loss/train': 1.927861213684082} -08/30/2021 17:35:05 - INFO - __main__ - Step 24517: {'lr': 0.0004719853147392732, 'samples': 4707264, 'steps': 24516, 'loss/train': 1.4510259628295898} -08/30/2021 17:35:05 - INFO - __main__ - Step 24518: {'lr': 0.0004719828738157512, 'samples': 4707456, 'steps': 24517, 'loss/train': 1.6395998001098633} -08/30/2021 17:35:06 - INFO - __main__ - Step 24519: {'lr': 0.0004719804327922073, 'samples': 4707648, 'steps': 24518, 'loss/train': 1.6449280977249146} -08/30/2021 17:35:07 - INFO - __main__ - Step 24520: {'lr': 0.00047197799166864233, 'samples': 4707840, 'steps': 24519, 'loss/train': 1.774253249168396} -08/30/2021 17:35:08 - INFO - __main__ - Step 24521: {'lr': 0.00047197555044505756, 'samples': 4708032, 'steps': 24520, 'loss/train': 1.4616219997406006} -08/30/2021 17:35:08 - INFO - __main__ - Step 24522: {'lr': 0.000471973109121454, 'samples': 4708224, 'steps': 24521, 'loss/train': 1.4657056331634521} -08/30/2021 17:35:08 - INFO - __main__ - Step 24523: {'lr': 0.00047197066769783284, 'samples': 4708416, 'steps': 24522, 'loss/train': 1.2063186168670654} -08/30/2021 17:35:09 - INFO - __main__ - Step 24524: {'lr': 0.000471968226174195, 'samples': 4708608, 'steps': 24523, 'loss/train': 0.091896653175354} -08/30/2021 17:35:10 - INFO - __main__ - Step 24525: {'lr': 0.00047196578455054175, 'samples': 4708800, 'steps': 24524, 'loss/train': 0.9957613348960876} -08/30/2021 17:35:11 - INFO - __main__ - Step 24526: {'lr': 0.00047196334282687414, 'samples': 4708992, 'steps': 24525, 'loss/train': 1.7564043998718262} -08/30/2021 17:35:11 - INFO - __main__ - Step 24527: {'lr': 0.00047196090100319333, 'samples': 4709184, 'steps': 24526, 'loss/train': 1.4603902101516724} -08/30/2021 17:35:12 - INFO - __main__ - Step 24528: {'lr': 0.00047195845907950035, 'samples': 4709376, 'steps': 24527, 'loss/train': 1.472461223602295} -08/30/2021 17:35:12 - INFO - __main__ - Step 24529: {'lr': 0.0004719560170557963, 'samples': 4709568, 'steps': 24528, 'loss/train': 1.436963677406311} -08/30/2021 17:35:13 - INFO - __main__ - Step 24530: {'lr': 0.0004719535749320823, 'samples': 4709760, 'steps': 24529, 'loss/train': 0.232659712433815} -08/30/2021 17:35:14 - INFO - __main__ - Step 24531: {'lr': 0.0004719511327083594, 'samples': 4709952, 'steps': 24530, 'loss/train': 0.26898905634880066} -08/30/2021 17:35:14 - INFO - __main__ - Step 24532: {'lr': 0.0004719486903846288, 'samples': 4710144, 'steps': 24531, 'loss/train': 1.497463583946228} -08/30/2021 17:35:15 - INFO - __main__ - Step 24533: {'lr': 0.0004719462479608915, 'samples': 4710336, 'steps': 24532, 'loss/train': 1.2646433115005493} -08/30/2021 17:35:15 - INFO - __main__ - Step 24534: {'lr': 0.0004719438054371487, 'samples': 4710528, 'steps': 24533, 'loss/train': 1.1970287561416626} -08/30/2021 17:35:15 - INFO - __main__ - Step 24535: {'lr': 0.00047194136281340137, 'samples': 4710720, 'steps': 24534, 'loss/train': 1.7726329565048218} -08/30/2021 17:35:17 - INFO - __main__ - Step 24536: {'lr': 0.00047193892008965077, 'samples': 4710912, 'steps': 24535, 'loss/train': 1.4720901250839233} -08/30/2021 17:35:17 - INFO - __main__ - Step 24537: {'lr': 0.0004719364772658978, 'samples': 4711104, 'steps': 24536, 'loss/train': 1.4312533140182495} -08/30/2021 17:35:18 - INFO - __main__ - Step 24538: {'lr': 0.00047193403434214385, 'samples': 4711296, 'steps': 24537, 'loss/train': 1.2726963758468628} -08/30/2021 17:35:18 - INFO - __main__ - Step 24539: {'lr': 0.0004719315913183897, 'samples': 4711488, 'steps': 24538, 'loss/train': 1.411854863166809} -08/30/2021 17:35:18 - INFO - __main__ - Step 24540: {'lr': 0.0004719291481946367, 'samples': 4711680, 'steps': 24539, 'loss/train': 1.7104921340942383} -08/30/2021 17:35:20 - INFO - __main__ - Step 24541: {'lr': 0.00047192670497088577, 'samples': 4711872, 'steps': 24540, 'loss/train': 1.3718091249465942} -08/30/2021 17:35:20 - INFO - __main__ - Step 24542: {'lr': 0.0004719242616471381, 'samples': 4712064, 'steps': 24541, 'loss/train': 1.6246330738067627} -08/30/2021 17:35:21 - INFO - __main__ - Step 24543: {'lr': 0.00047192181822339484, 'samples': 4712256, 'steps': 24542, 'loss/train': 1.1429835557937622} -08/30/2021 17:35:21 - INFO - __main__ - Step 24544: {'lr': 0.000471919374699657, 'samples': 4712448, 'steps': 24543, 'loss/train': 1.4758931398391724} -08/30/2021 17:35:21 - INFO - __main__ - Step 24545: {'lr': 0.0004719169310759257, 'samples': 4712640, 'steps': 24544, 'loss/train': 5.920523166656494} -08/30/2021 17:35:23 - INFO - __main__ - Step 24546: {'lr': 0.0004719144873522021, 'samples': 4712832, 'steps': 24545, 'loss/train': 1.7054550647735596} -08/30/2021 17:35:23 - INFO - __main__ - Step 24547: {'lr': 0.0004719120435284872, 'samples': 4713024, 'steps': 24546, 'loss/train': 1.2541141510009766} -08/30/2021 17:35:24 - INFO - __main__ - Step 24548: {'lr': 0.0004719095996047822, 'samples': 4713216, 'steps': 24547, 'loss/train': 1.8921313285827637} -08/30/2021 17:35:24 - INFO - __main__ - Step 24549: {'lr': 0.0004719071555810881, 'samples': 4713408, 'steps': 24548, 'loss/train': 1.8774735927581787} -08/30/2021 17:35:25 - INFO - __main__ - Step 24550: {'lr': 0.00047190471145740616, 'samples': 4713600, 'steps': 24549, 'loss/train': 0.6641445159912109} -08/30/2021 17:35:25 - INFO - __main__ - Step 24551: {'lr': 0.0004719022672337373, 'samples': 4713792, 'steps': 24550, 'loss/train': 0.7229032516479492} -08/30/2021 17:35:26 - INFO - __main__ - Step 24552: {'lr': 0.0004718998229100827, 'samples': 4713984, 'steps': 24551, 'loss/train': 1.1109299659729004} -08/30/2021 17:35:27 - INFO - __main__ - Step 24553: {'lr': 0.00047189737848644356, 'samples': 4714176, 'steps': 24552, 'loss/train': 1.7704217433929443} -08/30/2021 17:35:27 - INFO - __main__ - Step 24554: {'lr': 0.0004718949339628208, 'samples': 4714368, 'steps': 24553, 'loss/train': 1.3112504482269287} -08/30/2021 17:35:28 - INFO - __main__ - Step 24555: {'lr': 0.0004718924893392156, 'samples': 4714560, 'steps': 24554, 'loss/train': 1.695735216140747} -08/30/2021 17:35:28 - INFO - __main__ - Step 24556: {'lr': 0.0004718900446156291, 'samples': 4714752, 'steps': 24555, 'loss/train': 1.3627787828445435} -08/30/2021 17:35:30 - INFO - __main__ - Step 24557: {'lr': 0.00047188759979206236, 'samples': 4714944, 'steps': 24556, 'loss/train': 1.5065007209777832} -08/30/2021 17:35:30 - INFO - __main__ - Step 24558: {'lr': 0.00047188515486851646, 'samples': 4715136, 'steps': 24557, 'loss/train': 1.5328236818313599} -08/30/2021 17:35:31 - INFO - __main__ - Step 24559: {'lr': 0.0004718827098449926, 'samples': 4715328, 'steps': 24558, 'loss/train': 1.2341324090957642} -08/30/2021 17:35:31 - INFO - __main__ - Step 24560: {'lr': 0.00047188026472149184, 'samples': 4715520, 'steps': 24559, 'loss/train': 2.171665906906128} -08/30/2021 17:35:31 - INFO - __main__ - Step 24561: {'lr': 0.0004718778194980151, 'samples': 4715712, 'steps': 24560, 'loss/train': 1.7486183643341064} -08/30/2021 17:35:33 - INFO - __main__ - Step 24562: {'lr': 0.00047187537417456375, 'samples': 4715904, 'steps': 24561, 'loss/train': 1.7060445547103882} -08/30/2021 17:35:33 - INFO - __main__ - Step 24563: {'lr': 0.00047187292875113874, 'samples': 4716096, 'steps': 24562, 'loss/train': 2.457808017730713} -08/30/2021 17:35:34 - INFO - __main__ - Step 24564: {'lr': 0.0004718704832277413, 'samples': 4716288, 'steps': 24563, 'loss/train': 1.622470736503601} -08/30/2021 17:35:34 - INFO - __main__ - Step 24565: {'lr': 0.0004718680376043724, 'samples': 4716480, 'steps': 24564, 'loss/train': 1.4234267473220825} -08/30/2021 17:35:34 - INFO - __main__ - Step 24566: {'lr': 0.00047186559188103314, 'samples': 4716672, 'steps': 24565, 'loss/train': 1.6230226755142212} -08/30/2021 17:35:36 - INFO - __main__ - Step 24567: {'lr': 0.00047186314605772466, 'samples': 4716864, 'steps': 24566, 'loss/train': 1.4558249711990356} -08/30/2021 17:35:36 - INFO - __main__ - Step 24568: {'lr': 0.00047186070013444814, 'samples': 4717056, 'steps': 24567, 'loss/train': 1.0605478286743164} -08/30/2021 17:35:37 - INFO - __main__ - Step 24569: {'lr': 0.00047185825411120454, 'samples': 4717248, 'steps': 24568, 'loss/train': 1.3696558475494385} -08/30/2021 17:35:37 - INFO - __main__ - Step 24570: {'lr': 0.0004718558079879951, 'samples': 4717440, 'steps': 24569, 'loss/train': 1.3347958326339722} -08/30/2021 17:35:37 - INFO - __main__ - Step 24571: {'lr': 0.00047185336176482084, 'samples': 4717632, 'steps': 24570, 'loss/train': 1.8632763624191284} -08/30/2021 17:35:39 - INFO - __main__ - Step 24572: {'lr': 0.00047185091544168286, 'samples': 4717824, 'steps': 24571, 'loss/train': 1.8458465337753296} -08/30/2021 17:35:39 - INFO - __main__ - Step 24573: {'lr': 0.00047184846901858225, 'samples': 4718016, 'steps': 24572, 'loss/train': 0.7646589279174805} -08/30/2021 17:35:40 - INFO - __main__ - Step 24574: {'lr': 0.0004718460224955202, 'samples': 4718208, 'steps': 24573, 'loss/train': 1.0524741411209106} -08/30/2021 17:35:40 - INFO - __main__ - Step 24575: {'lr': 0.0004718435758724977, 'samples': 4718400, 'steps': 24574, 'loss/train': 1.3564406633377075} -08/30/2021 17:35:40 - INFO - __main__ - Step 24576: {'lr': 0.000471841129149516, 'samples': 4718592, 'steps': 24575, 'loss/train': 1.1782338619232178} -08/30/2021 17:35:41 - INFO - __main__ - Step 24577: {'lr': 0.000471838682326576, 'samples': 4718784, 'steps': 24576, 'loss/train': 1.1804299354553223} -08/30/2021 17:35:42 - INFO - __main__ - Step 24578: {'lr': 0.000471836235403679, 'samples': 4718976, 'steps': 24577, 'loss/train': 1.9783321619033813} -08/30/2021 17:35:43 - INFO - __main__ - Step 24579: {'lr': 0.000471833788380826, 'samples': 4719168, 'steps': 24578, 'loss/train': 1.8166775703430176} -08/30/2021 17:35:43 - INFO - __main__ - Step 24580: {'lr': 0.0004718313412580181, 'samples': 4719360, 'steps': 24579, 'loss/train': 1.8016951084136963} -08/30/2021 17:35:43 - INFO - __main__ - Step 24581: {'lr': 0.0004718288940352564, 'samples': 4719552, 'steps': 24580, 'loss/train': 1.562361717224121} -08/30/2021 17:35:44 - INFO - __main__ - Step 24582: {'lr': 0.00047182644671254207, 'samples': 4719744, 'steps': 24581, 'loss/train': 3.886920213699341} -08/30/2021 17:35:45 - INFO - __main__ - Step 24583: {'lr': 0.0004718239992898761, 'samples': 4719936, 'steps': 24582, 'loss/train': 1.9974838495254517} -08/30/2021 17:35:46 - INFO - __main__ - Step 24584: {'lr': 0.00047182155176725974, 'samples': 4720128, 'steps': 24583, 'loss/train': 1.6186575889587402} -08/30/2021 17:35:46 - INFO - __main__ - Step 24585: {'lr': 0.00047181910414469396, 'samples': 4720320, 'steps': 24584, 'loss/train': 1.5206100940704346} -08/30/2021 17:35:46 - INFO - __main__ - Step 24586: {'lr': 0.0004718166564221799, 'samples': 4720512, 'steps': 24585, 'loss/train': 1.3282649517059326} -08/30/2021 17:35:47 - INFO - __main__ - Step 24587: {'lr': 0.0004718142085997187, 'samples': 4720704, 'steps': 24586, 'loss/train': 1.8367680311203003} -08/30/2021 17:35:48 - INFO - __main__ - Step 24588: {'lr': 0.0004718117606773115, 'samples': 4720896, 'steps': 24587, 'loss/train': 1.4244365692138672} -08/30/2021 17:35:49 - INFO - __main__ - Step 24589: {'lr': 0.0004718093126549592, 'samples': 4721088, 'steps': 24588, 'loss/train': 3.3588130474090576} -08/30/2021 17:35:49 - INFO - __main__ - Step 24590: {'lr': 0.0004718068645326632, 'samples': 4721280, 'steps': 24589, 'loss/train': 2.0005922317504883} -08/30/2021 17:35:50 - INFO - __main__ - Step 24591: {'lr': 0.0004718044163104244, 'samples': 4721472, 'steps': 24590, 'loss/train': 1.963279366493225} -08/30/2021 17:35:50 - INFO - __main__ - Step 24592: {'lr': 0.0004718019679882439, 'samples': 4721664, 'steps': 24591, 'loss/train': 1.429451584815979} -08/30/2021 17:35:51 - INFO - __main__ - Step 24593: {'lr': 0.0004717995195661229, 'samples': 4721856, 'steps': 24592, 'loss/train': 1.9033617973327637} -08/30/2021 17:35:52 - INFO - __main__ - Step 24594: {'lr': 0.00047179707104406243, 'samples': 4722048, 'steps': 24593, 'loss/train': 1.8315582275390625} -08/30/2021 17:35:52 - INFO - __main__ - Step 24595: {'lr': 0.0004717946224220637, 'samples': 4722240, 'steps': 24594, 'loss/train': 1.625569224357605} -08/30/2021 17:35:53 - INFO - __main__ - Step 24596: {'lr': 0.0004717921737001276, 'samples': 4722432, 'steps': 24595, 'loss/train': 1.7163532972335815} -08/30/2021 17:35:53 - INFO - __main__ - Step 24597: {'lr': 0.0004717897248782555, 'samples': 4722624, 'steps': 24596, 'loss/train': 1.384665846824646} -08/30/2021 17:35:55 - INFO - __main__ - Step 24598: {'lr': 0.0004717872759564483, 'samples': 4722816, 'steps': 24597, 'loss/train': 1.6244404315948486} -08/30/2021 17:35:55 - INFO - __main__ - Step 24599: {'lr': 0.00047178482693470723, 'samples': 4723008, 'steps': 24598, 'loss/train': 1.0666124820709229} -08/30/2021 17:35:56 - INFO - __main__ - Step 24600: {'lr': 0.0004717823778130333, 'samples': 4723200, 'steps': 24599, 'loss/train': 1.7034012079238892} -08/30/2021 17:35:56 - INFO - __main__ - Step 24601: {'lr': 0.0004717799285914276, 'samples': 4723392, 'steps': 24600, 'loss/train': 0.16433797776699066} -08/30/2021 17:35:56 - INFO - __main__ - Step 24602: {'lr': 0.00047177747926989134, 'samples': 4723584, 'steps': 24601, 'loss/train': 2.712157726287842} -08/30/2021 17:35:57 - INFO - __main__ - Step 24603: {'lr': 0.00047177502984842556, 'samples': 4723776, 'steps': 24602, 'loss/train': 1.598645806312561} -08/30/2021 17:35:58 - INFO - __main__ - Step 24604: {'lr': 0.0004717725803270314, 'samples': 4723968, 'steps': 24603, 'loss/train': 1.755679965019226} -08/30/2021 17:35:59 - INFO - __main__ - Step 24605: {'lr': 0.00047177013070570997, 'samples': 4724160, 'steps': 24604, 'loss/train': 1.4169636964797974} -08/30/2021 17:35:59 - INFO - __main__ - Step 24606: {'lr': 0.00047176768098446234, 'samples': 4724352, 'steps': 24605, 'loss/train': 1.1529072523117065} -08/30/2021 17:36:00 - INFO - __main__ - Step 24607: {'lr': 0.0004717652311632895, 'samples': 4724544, 'steps': 24606, 'loss/train': 1.3863716125488281} -08/30/2021 17:36:00 - INFO - __main__ - Step 24608: {'lr': 0.00047176278124219276, 'samples': 4724736, 'steps': 24607, 'loss/train': 1.675790786743164} -08/30/2021 17:36:02 - INFO - __main__ - Step 24609: {'lr': 0.0004717603312211731, 'samples': 4724928, 'steps': 24608, 'loss/train': 0.26380455493927} -08/30/2021 17:36:02 - INFO - __main__ - Step 24610: {'lr': 0.0004717578811002317, 'samples': 4725120, 'steps': 24609, 'loss/train': 1.3129373788833618} -08/30/2021 17:36:02 - INFO - __main__ - Step 24611: {'lr': 0.00047175543087936954, 'samples': 4725312, 'steps': 24610, 'loss/train': 1.8768680095672607} -08/30/2021 17:36:03 - INFO - __main__ - Step 24612: {'lr': 0.0004717529805585879, 'samples': 4725504, 'steps': 24611, 'loss/train': 1.6882539987564087} -08/30/2021 17:36:03 - INFO - __main__ - Step 24613: {'lr': 0.0004717505301378877, 'samples': 4725696, 'steps': 24612, 'loss/train': 1.4596537351608276} -08/30/2021 17:36:05 - INFO - __main__ - Step 24614: {'lr': 0.0004717480796172702, 'samples': 4725888, 'steps': 24613, 'loss/train': 1.701680064201355} -08/30/2021 17:36:06 - INFO - __main__ - Step 24615: {'lr': 0.00047174562899673645, 'samples': 4726080, 'steps': 24614, 'loss/train': 1.0368670225143433} -08/30/2021 17:36:06 - INFO - __main__ - Step 24616: {'lr': 0.0004717431782762875, 'samples': 4726272, 'steps': 24615, 'loss/train': 1.6600544452667236} -08/30/2021 17:36:06 - INFO - __main__ - Step 24617: {'lr': 0.0004717407274559245, 'samples': 4726464, 'steps': 24616, 'loss/train': 1.3087135553359985} -08/30/2021 17:36:07 - INFO - __main__ - Step 24618: {'lr': 0.0004717382765356485, 'samples': 4726656, 'steps': 24617, 'loss/train': 1.6702946424484253} -08/30/2021 17:36:09 - INFO - __main__ - Step 24619: {'lr': 0.0004717358255154607, 'samples': 4726848, 'steps': 24618, 'loss/train': 1.688079595565796} -08/30/2021 17:36:09 - INFO - __main__ - Step 24620: {'lr': 0.0004717333743953622, 'samples': 4727040, 'steps': 24619, 'loss/train': 1.955341100692749} -08/30/2021 17:36:10 - INFO - __main__ - Step 24621: {'lr': 0.00047173092317535404, 'samples': 4727232, 'steps': 24620, 'loss/train': 8.874281883239746} -08/30/2021 17:36:10 - INFO - __main__ - Step 24622: {'lr': 0.0004717284718554373, 'samples': 4727424, 'steps': 24621, 'loss/train': 2.65262508392334} -08/30/2021 17:36:10 - INFO - __main__ - Step 24623: {'lr': 0.00047172602043561317, 'samples': 4727616, 'steps': 24622, 'loss/train': 2.1952600479125977} -08/30/2021 17:36:11 - INFO - __main__ - Step 24624: {'lr': 0.00047172356891588273, 'samples': 4727808, 'steps': 24623, 'loss/train': 2.558573007583618} -08/30/2021 17:36:12 - INFO - __main__ - Step 24625: {'lr': 0.0004717211172962471, 'samples': 4728000, 'steps': 24624, 'loss/train': 2.1402010917663574} -08/30/2021 17:36:13 - INFO - __main__ - Step 24626: {'lr': 0.0004717186655767073, 'samples': 4728192, 'steps': 24625, 'loss/train': 2.7358956336975098} -08/30/2021 17:36:13 - INFO - __main__ - Step 24627: {'lr': 0.0004717162137572645, 'samples': 4728384, 'steps': 24626, 'loss/train': 2.4930129051208496} -08/30/2021 17:36:13 - INFO - __main__ - Step 24628: {'lr': 0.0004717137618379198, 'samples': 4728576, 'steps': 24627, 'loss/train': 1.7966632843017578} -08/30/2021 17:36:14 - INFO - __main__ - Step 24629: {'lr': 0.0004717113098186743, 'samples': 4728768, 'steps': 24628, 'loss/train': 1.99289870262146} -08/30/2021 17:36:15 - INFO - __main__ - Step 24630: {'lr': 0.00047170885769952907, 'samples': 4728960, 'steps': 24629, 'loss/train': 1.6715341806411743} -08/30/2021 17:36:15 - INFO - __main__ - Step 24631: {'lr': 0.00047170640548048525, 'samples': 4729152, 'steps': 24630, 'loss/train': 1.4821505546569824} -08/30/2021 17:36:16 - INFO - __main__ - Step 24632: {'lr': 0.000471703953161544, 'samples': 4729344, 'steps': 24631, 'loss/train': 1.797239065170288} -08/30/2021 17:36:16 - INFO - __main__ - Step 24633: {'lr': 0.00047170150074270635, 'samples': 4729536, 'steps': 24632, 'loss/train': 1.791114091873169} -08/30/2021 17:36:17 - INFO - __main__ - Step 24634: {'lr': 0.0004716990482239735, 'samples': 4729728, 'steps': 24633, 'loss/train': 1.8352652788162231} -08/30/2021 17:36:18 - INFO - __main__ - Step 24635: {'lr': 0.0004716965956053463, 'samples': 4729920, 'steps': 24634, 'loss/train': 2.2326345443725586} -08/30/2021 17:36:19 - INFO - __main__ - Step 24636: {'lr': 0.00047169414288682616, 'samples': 4730112, 'steps': 24635, 'loss/train': 2.186173677444458} -08/30/2021 17:36:19 - INFO - __main__ - Step 24637: {'lr': 0.0004716916900684141, 'samples': 4730304, 'steps': 24636, 'loss/train': 1.9529016017913818} -08/30/2021 17:36:19 - INFO - __main__ - Step 24638: {'lr': 0.00047168923715011103, 'samples': 4730496, 'steps': 24637, 'loss/train': 2.344886064529419} -08/30/2021 17:36:20 - INFO - __main__ - Step 24639: {'lr': 0.00047168678413191833, 'samples': 4730688, 'steps': 24638, 'loss/train': 1.982452630996704} -08/30/2021 17:36:21 - INFO - __main__ - Step 24640: {'lr': 0.00047168433101383694, 'samples': 4730880, 'steps': 24639, 'loss/train': 1.9556173086166382} -08/30/2021 17:36:22 - INFO - __main__ - Step 24641: {'lr': 0.000471681877795868, 'samples': 4731072, 'steps': 24640, 'loss/train': 1.4128801822662354} -08/30/2021 17:36:22 - INFO - __main__ - Step 24642: {'lr': 0.0004716794244780127, 'samples': 4731264, 'steps': 24641, 'loss/train': 2.0736827850341797} -08/30/2021 17:36:22 - INFO - __main__ - Step 24643: {'lr': 0.0004716769710602721, 'samples': 4731456, 'steps': 24642, 'loss/train': 2.4431746006011963} -08/30/2021 17:36:23 - INFO - __main__ - Step 24644: {'lr': 0.00047167451754264714, 'samples': 4731648, 'steps': 24643, 'loss/train': 1.5567020177841187} -08/30/2021 17:36:23 - INFO - __main__ - Step 24645: {'lr': 0.0004716720639251392, 'samples': 4731840, 'steps': 24644, 'loss/train': 2.360151767730713} -08/30/2021 17:36:24 - INFO - __main__ - Step 24646: {'lr': 0.0004716696102077491, 'samples': 4732032, 'steps': 24645, 'loss/train': 1.8170424699783325} -08/30/2021 17:36:25 - INFO - __main__ - Step 24647: {'lr': 0.0004716671563904782, 'samples': 4732224, 'steps': 24646, 'loss/train': 2.0453975200653076} -08/30/2021 17:36:25 - INFO - __main__ - Step 24648: {'lr': 0.0004716647024733275, 'samples': 4732416, 'steps': 24647, 'loss/train': 1.7449759244918823} -08/30/2021 17:36:26 - INFO - __main__ - Step 24649: {'lr': 0.00047166224845629804, 'samples': 4732608, 'steps': 24648, 'loss/train': 1.9197039604187012} -08/30/2021 17:36:26 - INFO - __main__ - Step 24650: {'lr': 0.000471659794339391, 'samples': 4732800, 'steps': 24649, 'loss/train': 1.9616122245788574} -08/30/2021 17:36:28 - INFO - __main__ - Step 24651: {'lr': 0.00047165734012260754, 'samples': 4732992, 'steps': 24650, 'loss/train': 2.1116483211517334} -08/30/2021 17:36:28 - INFO - __main__ - Step 24652: {'lr': 0.0004716548858059486, 'samples': 4733184, 'steps': 24651, 'loss/train': 1.3150659799575806} -08/30/2021 17:36:28 - INFO - __main__ - Step 24653: {'lr': 0.0004716524313894155, 'samples': 4733376, 'steps': 24652, 'loss/train': 1.4902786016464233} -08/30/2021 17:36:29 - INFO - __main__ - Step 24654: {'lr': 0.0004716499768730092, 'samples': 4733568, 'steps': 24653, 'loss/train': 1.7323554754257202} -08/30/2021 17:36:29 - INFO - __main__ - Step 24655: {'lr': 0.0004716475222567308, 'samples': 4733760, 'steps': 24654, 'loss/train': 1.4266170263290405} -08/30/2021 17:36:31 - INFO - __main__ - Step 24656: {'lr': 0.0004716450675405815, 'samples': 4733952, 'steps': 24655, 'loss/train': 2.019360303878784} -08/30/2021 17:36:31 - INFO - __main__ - Step 24657: {'lr': 0.0004716426127245623, 'samples': 4734144, 'steps': 24656, 'loss/train': 1.9479265213012695} -08/30/2021 17:36:31 - INFO - __main__ - Step 24658: {'lr': 0.00047164015780867444, 'samples': 4734336, 'steps': 24657, 'loss/train': 1.0647599697113037} -08/30/2021 17:36:32 - INFO - __main__ - Step 24659: {'lr': 0.0004716377027929189, 'samples': 4734528, 'steps': 24658, 'loss/train': 1.8619252443313599} -08/30/2021 17:36:32 - INFO - __main__ - Step 24660: {'lr': 0.00047163524767729684, 'samples': 4734720, 'steps': 24659, 'loss/train': 1.6403992176055908} -08/30/2021 17:36:32 - INFO - __main__ - Step 24661: {'lr': 0.0004716327924618093, 'samples': 4734912, 'steps': 24660, 'loss/train': 0.9954274296760559} -08/30/2021 17:36:35 - INFO - __main__ - Step 24662: {'lr': 0.0004716303371464575, 'samples': 4735104, 'steps': 24661, 'loss/train': 1.2608269453048706} -08/30/2021 17:36:35 - INFO - __main__ - Step 24663: {'lr': 0.0004716278817312425, 'samples': 4735296, 'steps': 24662, 'loss/train': 1.1998200416564941} -08/30/2021 17:36:35 - INFO - __main__ - Step 24664: {'lr': 0.0004716254262161653, 'samples': 4735488, 'steps': 24663, 'loss/train': 3.4208500385284424} -08/30/2021 17:36:36 - INFO - __main__ - Step 24665: {'lr': 0.00047162297060122726, 'samples': 4735680, 'steps': 24664, 'loss/train': 1.499505639076233} -08/30/2021 17:36:36 - INFO - __main__ - Step 24666: {'lr': 0.0004716205148864292, 'samples': 4735872, 'steps': 24665, 'loss/train': 1.7700446844100952} -08/30/2021 17:36:38 - INFO - __main__ - Step 24667: {'lr': 0.0004716180590717724, 'samples': 4736064, 'steps': 24666, 'loss/train': 2.8480496406555176} -08/30/2021 17:36:38 - INFO - __main__ - Step 24668: {'lr': 0.0004716156031572579, 'samples': 4736256, 'steps': 24667, 'loss/train': 1.711680293083191} -08/30/2021 17:36:38 - INFO - __main__ - Step 24669: {'lr': 0.00047161314714288697, 'samples': 4736448, 'steps': 24668, 'loss/train': 1.791342854499817} -08/30/2021 17:36:39 - INFO - __main__ - Step 24670: {'lr': 0.00047161069102866037, 'samples': 4736640, 'steps': 24669, 'loss/train': 2.0235402584075928} -08/30/2021 17:36:39 - INFO - __main__ - Step 24671: {'lr': 0.00047160823481457955, 'samples': 4736832, 'steps': 24670, 'loss/train': 1.6442534923553467} -08/30/2021 17:36:41 - INFO - __main__ - Step 24672: {'lr': 0.0004716057785006454, 'samples': 4737024, 'steps': 24671, 'loss/train': 2.016108274459839} -08/30/2021 17:36:41 - INFO - __main__ - Step 24673: {'lr': 0.00047160332208685915, 'samples': 4737216, 'steps': 24672, 'loss/train': 1.0705252885818481} -08/30/2021 17:36:42 - INFO - __main__ - Step 24674: {'lr': 0.00047160086557322185, 'samples': 4737408, 'steps': 24673, 'loss/train': 1.2105544805526733} -08/30/2021 17:36:42 - INFO - __main__ - Step 24675: {'lr': 0.0004715984089597346, 'samples': 4737600, 'steps': 24674, 'loss/train': 1.826501727104187} -08/30/2021 17:36:42 - INFO - __main__ - Step 24676: {'lr': 0.00047159595224639854, 'samples': 4737792, 'steps': 24675, 'loss/train': 0.3165826201438904} -08/30/2021 17:36:44 - INFO - __main__ - Step 24677: {'lr': 0.00047159349543321477, 'samples': 4737984, 'steps': 24676, 'loss/train': 2.6708781719207764} -08/30/2021 17:36:44 - INFO - __main__ - Step 24678: {'lr': 0.00047159103852018443, 'samples': 4738176, 'steps': 24677, 'loss/train': 2.4192936420440674} -08/30/2021 17:36:45 - INFO - __main__ - Step 24679: {'lr': 0.00047158858150730856, 'samples': 4738368, 'steps': 24678, 'loss/train': 1.0226179361343384} -08/30/2021 17:36:45 - INFO - __main__ - Step 24680: {'lr': 0.00047158612439458824, 'samples': 4738560, 'steps': 24679, 'loss/train': 1.7899672985076904} -08/30/2021 17:36:45 - INFO - __main__ - Step 24681: {'lr': 0.00047158366718202466, 'samples': 4738752, 'steps': 24680, 'loss/train': 1.428963541984558} -08/30/2021 17:36:47 - INFO - __main__ - Step 24682: {'lr': 0.00047158120986961897, 'samples': 4738944, 'steps': 24681, 'loss/train': 3.1310064792633057} -08/30/2021 17:36:47 - INFO - __main__ - Step 24683: {'lr': 0.00047157875245737213, 'samples': 4739136, 'steps': 24682, 'loss/train': 1.679357886314392} -08/30/2021 17:36:48 - INFO - __main__ - Step 24684: {'lr': 0.0004715762949452853, 'samples': 4739328, 'steps': 24683, 'loss/train': 1.8991272449493408} -08/30/2021 17:36:48 - INFO - __main__ - Step 24685: {'lr': 0.0004715738373333597, 'samples': 4739520, 'steps': 24684, 'loss/train': 2.5505757331848145} -08/30/2021 17:36:48 - INFO - __main__ - Step 24686: {'lr': 0.00047157137962159626, 'samples': 4739712, 'steps': 24685, 'loss/train': 1.6282877922058105} -08/30/2021 17:36:50 - INFO - __main__ - Step 24687: {'lr': 0.00047156892180999624, 'samples': 4739904, 'steps': 24686, 'loss/train': 1.6711379289627075} -08/30/2021 17:36:50 - INFO - __main__ - Step 24688: {'lr': 0.0004715664638985606, 'samples': 4740096, 'steps': 24687, 'loss/train': 1.3490301370620728} -08/30/2021 17:36:51 - INFO - __main__ - Step 24689: {'lr': 0.00047156400588729066, 'samples': 4740288, 'steps': 24688, 'loss/train': 1.1491557359695435} -08/30/2021 17:36:51 - INFO - __main__ - Step 24690: {'lr': 0.0004715615477761873, 'samples': 4740480, 'steps': 24689, 'loss/train': 1.516879677772522} -08/30/2021 17:36:51 - INFO - __main__ - Step 24691: {'lr': 0.00047155908956525173, 'samples': 4740672, 'steps': 24690, 'loss/train': 1.952373743057251} -08/30/2021 17:36:53 - INFO - __main__ - Step 24692: {'lr': 0.00047155663125448514, 'samples': 4740864, 'steps': 24691, 'loss/train': 1.933780550956726} -08/30/2021 17:36:53 - INFO - __main__ - Step 24693: {'lr': 0.00047155417284388846, 'samples': 4741056, 'steps': 24692, 'loss/train': 1.5821880102157593} -08/30/2021 17:36:54 - INFO - __main__ - Step 24694: {'lr': 0.0004715517143334629, 'samples': 4741248, 'steps': 24693, 'loss/train': 1.258436918258667} -08/30/2021 17:36:54 - INFO - __main__ - Step 24695: {'lr': 0.00047154925572320957, 'samples': 4741440, 'steps': 24694, 'loss/train': 1.8043732643127441} -08/30/2021 17:36:54 - INFO - __main__ - Step 24696: {'lr': 0.00047154679701312953, 'samples': 4741632, 'steps': 24695, 'loss/train': 1.8346304893493652} -08/30/2021 17:36:56 - INFO - __main__ - Step 24697: {'lr': 0.00047154433820322395, 'samples': 4741824, 'steps': 24696, 'loss/train': 1.851894736289978} -08/30/2021 17:36:57 - INFO - __main__ - Step 24698: {'lr': 0.0004715418792934939, 'samples': 4742016, 'steps': 24697, 'loss/train': 0.8953798413276672} -08/30/2021 17:36:57 - INFO - __main__ - Step 24699: {'lr': 0.00047153942028394056, 'samples': 4742208, 'steps': 24698, 'loss/train': 1.6787607669830322} -08/30/2021 17:36:57 - INFO - __main__ - Step 24700: {'lr': 0.0004715369611745649, 'samples': 4742400, 'steps': 24699, 'loss/train': 0.9864576458930969} -08/30/2021 17:36:58 - INFO - __main__ - Step 24701: {'lr': 0.00047153450196536816, 'samples': 4742592, 'steps': 24700, 'loss/train': 1.7255611419677734} -08/30/2021 17:36:58 - INFO - __main__ - Step 24702: {'lr': 0.00047153204265635136, 'samples': 4742784, 'steps': 24701, 'loss/train': 1.9156755208969116} -08/30/2021 17:37:00 - INFO - __main__ - Step 24703: {'lr': 0.0004715295832475156, 'samples': 4742976, 'steps': 24702, 'loss/train': 0.8458746075630188} -08/30/2021 17:37:00 - INFO - __main__ - Step 24704: {'lr': 0.0004715271237388621, 'samples': 4743168, 'steps': 24703, 'loss/train': 2.1463427543640137} -08/30/2021 17:37:01 - INFO - __main__ - Step 24705: {'lr': 0.00047152466413039187, 'samples': 4743360, 'steps': 24704, 'loss/train': 1.0671817064285278} -08/30/2021 17:37:01 - INFO - __main__ - Step 24706: {'lr': 0.000471522204422106, 'samples': 4743552, 'steps': 24705, 'loss/train': 1.732177972793579} -08/30/2021 17:37:01 - INFO - __main__ - Step 24707: {'lr': 0.0004715197446140057, 'samples': 4743744, 'steps': 24706, 'loss/train': 1.5347830057144165} -08/30/2021 17:37:03 - INFO - __main__ - Step 24708: {'lr': 0.000471517284706092, 'samples': 4743936, 'steps': 24707, 'loss/train': 0.5448461174964905} -08/30/2021 17:37:04 - INFO - __main__ - Step 24709: {'lr': 0.0004715148246983661, 'samples': 4744128, 'steps': 24708, 'loss/train': 1.5225915908813477} -08/30/2021 17:37:04 - INFO - __main__ - Step 24710: {'lr': 0.000471512364590829, 'samples': 4744320, 'steps': 24709, 'loss/train': 2.057853937149048} -08/30/2021 17:37:05 - INFO - __main__ - Step 24711: {'lr': 0.0004715099043834818, 'samples': 4744512, 'steps': 24710, 'loss/train': 1.7252074480056763} -08/30/2021 17:37:05 - INFO - __main__ - Step 24712: {'lr': 0.00047150744407632565, 'samples': 4744704, 'steps': 24711, 'loss/train': 1.6189361810684204} -08/30/2021 17:37:05 - INFO - __main__ - Step 24713: {'lr': 0.00047150498366936165, 'samples': 4744896, 'steps': 24712, 'loss/train': 1.311771035194397} -08/30/2021 17:37:07 - INFO - __main__ - Step 24714: {'lr': 0.000471502523162591, 'samples': 4745088, 'steps': 24713, 'loss/train': 0.9976238012313843} -08/30/2021 17:37:07 - INFO - __main__ - Step 24715: {'lr': 0.00047150006255601475, 'samples': 4745280, 'steps': 24714, 'loss/train': 1.0881123542785645} -08/30/2021 17:37:08 - INFO - __main__ - Step 24716: {'lr': 0.00047149760184963385, 'samples': 4745472, 'steps': 24715, 'loss/train': 1.610553503036499} -08/30/2021 17:37:08 - INFO - __main__ - Step 24717: {'lr': 0.0004714951410434497, 'samples': 4745664, 'steps': 24716, 'loss/train': 1.5979219675064087} -08/30/2021 17:37:08 - INFO - __main__ - Step 24718: {'lr': 0.00047149268013746317, 'samples': 4745856, 'steps': 24717, 'loss/train': 1.687117576599121} -08/30/2021 17:37:09 - INFO - __main__ - Step 24719: {'lr': 0.00047149021913167545, 'samples': 4746048, 'steps': 24718, 'loss/train': 1.535128116607666} -08/30/2021 17:37:11 - INFO - __main__ - Step 24720: {'lr': 0.0004714877580260877, 'samples': 4746240, 'steps': 24719, 'loss/train': 0.8547623157501221} -08/30/2021 17:37:11 - INFO - __main__ - Step 24721: {'lr': 0.00047148529682070094, 'samples': 4746432, 'steps': 24720, 'loss/train': 1.5548758506774902} -08/30/2021 17:37:12 - INFO - __main__ - Step 24722: {'lr': 0.00047148283551551643, 'samples': 4746624, 'steps': 24721, 'loss/train': 1.661041021347046} -08/30/2021 17:37:12 - INFO - __main__ - Step 24723: {'lr': 0.000471480374110535, 'samples': 4746816, 'steps': 24722, 'loss/train': 1.4511311054229736} -08/30/2021 17:37:12 - INFO - __main__ - Step 24724: {'lr': 0.00047147791260575804, 'samples': 4747008, 'steps': 24723, 'loss/train': 2.2207934856414795} -08/30/2021 17:37:14 - INFO - __main__ - Step 24725: {'lr': 0.0004714754510011866, 'samples': 4747200, 'steps': 24724, 'loss/train': 1.2171140909194946} -08/30/2021 17:37:14 - INFO - __main__ - Step 24726: {'lr': 0.0004714729892968216, 'samples': 4747392, 'steps': 24725, 'loss/train': 1.4494720697402954} -08/30/2021 17:37:15 - INFO - __main__ - Step 24727: {'lr': 0.0004714705274926644, 'samples': 4747584, 'steps': 24726, 'loss/train': 1.689841389656067} -08/30/2021 17:37:15 - INFO - __main__ - Step 24728: {'lr': 0.00047146806558871594, 'samples': 4747776, 'steps': 24727, 'loss/train': 2.315096139907837} -08/30/2021 17:37:15 - INFO - __main__ - Step 24729: {'lr': 0.0004714656035849774, 'samples': 4747968, 'steps': 24728, 'loss/train': 2.113011598587036} -08/30/2021 17:37:17 - INFO - __main__ - Step 24730: {'lr': 0.00047146314148144986, 'samples': 4748160, 'steps': 24729, 'loss/train': 1.8264377117156982} -08/30/2021 17:37:17 - INFO - __main__ - Step 24731: {'lr': 0.00047146067927813454, 'samples': 4748352, 'steps': 24730, 'loss/train': 1.8549612760543823} -08/30/2021 17:37:18 - INFO - __main__ - Step 24732: {'lr': 0.00047145821697503235, 'samples': 4748544, 'steps': 24731, 'loss/train': 1.5308011770248413} -08/30/2021 17:37:18 - INFO - __main__ - Step 24733: {'lr': 0.00047145575457214453, 'samples': 4748736, 'steps': 24732, 'loss/train': 2.0067386627197266} -08/30/2021 17:37:18 - INFO - __main__ - Step 24734: {'lr': 0.00047145329206947216, 'samples': 4748928, 'steps': 24733, 'loss/train': 2.21530818939209} -08/30/2021 17:37:20 - INFO - __main__ - Step 24735: {'lr': 0.0004714508294670164, 'samples': 4749120, 'steps': 24734, 'loss/train': 1.8082433938980103} -08/30/2021 17:37:21 - INFO - __main__ - Step 24736: {'lr': 0.00047144836676477823, 'samples': 4749312, 'steps': 24735, 'loss/train': 1.5817692279815674} -08/30/2021 17:37:21 - INFO - __main__ - Step 24737: {'lr': 0.00047144590396275895, 'samples': 4749504, 'steps': 24736, 'loss/train': 1.4714477062225342} -08/30/2021 17:37:21 - INFO - __main__ - Step 24738: {'lr': 0.0004714434410609595, 'samples': 4749696, 'steps': 24737, 'loss/train': 1.575246810913086} -08/30/2021 17:37:22 - INFO - __main__ - Step 24739: {'lr': 0.00047144097805938104, 'samples': 4749888, 'steps': 24738, 'loss/train': 2.1753039360046387} -08/30/2021 17:37:23 - INFO - __main__ - Step 24740: {'lr': 0.0004714385149580247, 'samples': 4750080, 'steps': 24739, 'loss/train': 1.9992939233779907} -08/30/2021 17:37:24 - INFO - __main__ - Step 24741: {'lr': 0.0004714360517568916, 'samples': 4750272, 'steps': 24740, 'loss/train': 1.570160984992981} -08/30/2021 17:37:24 - INFO - __main__ - Step 24742: {'lr': 0.00047143358845598283, 'samples': 4750464, 'steps': 24741, 'loss/train': 1.3570243120193481} -08/30/2021 17:37:25 - INFO - __main__ - Step 24743: {'lr': 0.0004714311250552995, 'samples': 4750656, 'steps': 24742, 'loss/train': 1.7493219375610352} -08/30/2021 17:37:25 - INFO - __main__ - Step 24744: {'lr': 0.0004714286615548427, 'samples': 4750848, 'steps': 24743, 'loss/train': 1.5323597192764282} -08/30/2021 17:37:25 - INFO - __main__ - Step 24745: {'lr': 0.00047142619795461363, 'samples': 4751040, 'steps': 24744, 'loss/train': 1.1970270872116089} -08/30/2021 17:37:27 - INFO - __main__ - Step 24746: {'lr': 0.0004714237342546133, 'samples': 4751232, 'steps': 24745, 'loss/train': 0.1257409304380417} -08/30/2021 17:37:27 - INFO - __main__ - Step 24747: {'lr': 0.0004714212704548428, 'samples': 4751424, 'steps': 24746, 'loss/train': 1.4161252975463867} -08/30/2021 17:37:28 - INFO - __main__ - Step 24748: {'lr': 0.0004714188065553033, 'samples': 4751616, 'steps': 24747, 'loss/train': 1.1785532236099243} -08/30/2021 17:37:28 - INFO - __main__ - Step 24749: {'lr': 0.000471416342555996, 'samples': 4751808, 'steps': 24748, 'loss/train': 1.6573036909103394} -08/30/2021 17:37:28 - INFO - __main__ - Step 24750: {'lr': 0.00047141387845692174, 'samples': 4752000, 'steps': 24749, 'loss/train': 1.5083427429199219} -08/30/2021 17:37:30 - INFO - __main__ - Step 24751: {'lr': 0.0004714114142580819, 'samples': 4752192, 'steps': 24750, 'loss/train': 1.8364665508270264} -08/30/2021 17:37:30 - INFO - __main__ - Step 24752: {'lr': 0.00047140894995947755, 'samples': 4752384, 'steps': 24751, 'loss/train': 1.4609259366989136} -08/30/2021 17:37:31 - INFO - __main__ - Step 24753: {'lr': 0.00047140648556110966, 'samples': 4752576, 'steps': 24752, 'loss/train': 0.3895515501499176} -08/30/2021 17:37:31 - INFO - __main__ - Step 24754: {'lr': 0.00047140402106297946, 'samples': 4752768, 'steps': 24753, 'loss/train': 0.6205389499664307} -08/30/2021 17:37:31 - INFO - __main__ - Step 24755: {'lr': 0.000471401556465088, 'samples': 4752960, 'steps': 24754, 'loss/train': 1.293762445449829} -08/30/2021 17:37:33 - INFO - __main__ - Step 24756: {'lr': 0.00047139909176743643, 'samples': 4753152, 'steps': 24755, 'loss/train': 2.1234817504882812} -08/30/2021 17:37:33 - INFO - __main__ - Step 24757: {'lr': 0.0004713966269700259, 'samples': 4753344, 'steps': 24756, 'loss/train': 1.7344706058502197} -08/30/2021 17:37:34 - INFO - __main__ - Step 24758: {'lr': 0.0004713941620728574, 'samples': 4753536, 'steps': 24757, 'loss/train': 1.5988022089004517} -08/30/2021 17:37:34 - INFO - __main__ - Step 24759: {'lr': 0.0004713916970759321, 'samples': 4753728, 'steps': 24758, 'loss/train': 1.777037262916565} -08/30/2021 17:37:34 - INFO - __main__ - Step 24760: {'lr': 0.0004713892319792512, 'samples': 4753920, 'steps': 24759, 'loss/train': 2.254842758178711} -08/30/2021 17:37:35 - INFO - __main__ - Step 24761: {'lr': 0.00047138676678281564, 'samples': 4754112, 'steps': 24760, 'loss/train': 1.8314911127090454} -08/30/2021 17:37:36 - INFO - __main__ - Step 24762: {'lr': 0.00047138430148662666, 'samples': 4754304, 'steps': 24761, 'loss/train': 1.539853572845459} -08/30/2021 17:37:37 - INFO - __main__ - Step 24763: {'lr': 0.0004713818360906853, 'samples': 4754496, 'steps': 24762, 'loss/train': 1.1455368995666504} -08/30/2021 17:37:37 - INFO - __main__ - Step 24764: {'lr': 0.0004713793705949927, 'samples': 4754688, 'steps': 24763, 'loss/train': 1.1345278024673462} -08/30/2021 17:37:37 - INFO - __main__ - Step 24765: {'lr': 0.00047137690499955, 'samples': 4754880, 'steps': 24764, 'loss/train': 1.9125782251358032} -08/30/2021 17:37:38 - INFO - __main__ - Step 24766: {'lr': 0.0004713744393043583, 'samples': 4755072, 'steps': 24765, 'loss/train': 1.405653715133667} -08/30/2021 17:37:39 - INFO - __main__ - Step 24767: {'lr': 0.00047137197350941864, 'samples': 4755264, 'steps': 24766, 'loss/train': 2.287050485610962} -08/30/2021 17:37:40 - INFO - __main__ - Step 24768: {'lr': 0.0004713695076147322, 'samples': 4755456, 'steps': 24767, 'loss/train': 1.530613899230957} -08/30/2021 17:37:40 - INFO - __main__ - Step 24769: {'lr': 0.0004713670416203001, 'samples': 4755648, 'steps': 24768, 'loss/train': 1.371817708015442} -08/30/2021 17:37:40 - INFO - __main__ - Step 24770: {'lr': 0.00047136457552612344, 'samples': 4755840, 'steps': 24769, 'loss/train': 1.6049026250839233} -08/30/2021 17:37:41 - INFO - __main__ - Step 24771: {'lr': 0.00047136210933220325, 'samples': 4756032, 'steps': 24770, 'loss/train': 1.4269808530807495} -08/30/2021 17:37:43 - INFO - __main__ - Step 24772: {'lr': 0.0004713596430385408, 'samples': 4756224, 'steps': 24771, 'loss/train': 1.1746535301208496} -08/30/2021 17:37:43 - INFO - __main__ - Step 24773: {'lr': 0.00047135717664513704, 'samples': 4756416, 'steps': 24772, 'loss/train': 1.168184518814087} -08/30/2021 17:37:43 - INFO - __main__ - Step 24774: {'lr': 0.00047135471015199315, 'samples': 4756608, 'steps': 24773, 'loss/train': 2.0779831409454346} -08/30/2021 17:37:44 - INFO - __main__ - Step 24775: {'lr': 0.00047135224355911035, 'samples': 4756800, 'steps': 24774, 'loss/train': 1.5183665752410889} -08/30/2021 17:37:44 - INFO - __main__ - Step 24776: {'lr': 0.0004713497768664895, 'samples': 4756992, 'steps': 24775, 'loss/train': 1.5069047212600708} -08/30/2021 17:37:45 - INFO - __main__ - Step 24777: {'lr': 0.00047134731007413195, 'samples': 4757184, 'steps': 24776, 'loss/train': 1.4242967367172241} -08/30/2021 17:37:46 - INFO - __main__ - Step 24778: {'lr': 0.0004713448431820387, 'samples': 4757376, 'steps': 24777, 'loss/train': 1.7829294204711914} -08/30/2021 17:37:46 - INFO - __main__ - Step 24779: {'lr': 0.00047134237619021085, 'samples': 4757568, 'steps': 24778, 'loss/train': 1.5085433721542358} -08/30/2021 17:37:47 - INFO - __main__ - Step 24780: {'lr': 0.00047133990909864953, 'samples': 4757760, 'steps': 24779, 'loss/train': 1.993310809135437} -08/30/2021 17:37:47 - INFO - __main__ - Step 24781: {'lr': 0.0004713374419073559, 'samples': 4757952, 'steps': 24780, 'loss/train': 0.9177327156066895} -08/30/2021 17:37:49 - INFO - __main__ - Step 24782: {'lr': 0.000471334974616331, 'samples': 4758144, 'steps': 24781, 'loss/train': 1.706955075263977} -08/30/2021 17:37:49 - INFO - __main__ - Step 24783: {'lr': 0.0004713325072255761, 'samples': 4758336, 'steps': 24782, 'loss/train': 0.8460226655006409} -08/30/2021 17:37:49 - INFO - __main__ - Step 24784: {'lr': 0.000471330039735092, 'samples': 4758528, 'steps': 24783, 'loss/train': 2.2417311668395996} -08/30/2021 17:37:50 - INFO - __main__ - Step 24785: {'lr': 0.0004713275721448801, 'samples': 4758720, 'steps': 24784, 'loss/train': 1.4460208415985107} -08/30/2021 17:37:50 - INFO - __main__ - Step 24786: {'lr': 0.0004713251044549414, 'samples': 4758912, 'steps': 24785, 'loss/train': 1.573750376701355} -08/30/2021 17:37:52 - INFO - __main__ - Step 24787: {'lr': 0.000471322636665277, 'samples': 4759104, 'steps': 24786, 'loss/train': 1.1347050666809082} -08/30/2021 17:37:52 - INFO - __main__ - Step 24788: {'lr': 0.0004713201687758881, 'samples': 4759296, 'steps': 24787, 'loss/train': 1.8069311380386353} -08/30/2021 17:37:53 - INFO - __main__ - Step 24789: {'lr': 0.00047131770078677574, 'samples': 4759488, 'steps': 24788, 'loss/train': 1.2345600128173828} -08/30/2021 17:37:53 - INFO - __main__ - Step 24790: {'lr': 0.000471315232697941, 'samples': 4759680, 'steps': 24789, 'loss/train': 1.3568607568740845} -08/30/2021 17:37:53 - INFO - __main__ - Step 24791: {'lr': 0.000471312764509385, 'samples': 4759872, 'steps': 24790, 'loss/train': 1.601361870765686} -08/30/2021 17:37:55 - INFO - __main__ - Step 24792: {'lr': 0.0004713102962211089, 'samples': 4760064, 'steps': 24791, 'loss/train': 1.5752657651901245} -08/30/2021 17:37:55 - INFO - __main__ - Step 24793: {'lr': 0.0004713078278331138, 'samples': 4760256, 'steps': 24792, 'loss/train': 1.6407828330993652} -08/30/2021 17:37:55 - INFO - __main__ - Step 24794: {'lr': 0.00047130535934540086, 'samples': 4760448, 'steps': 24793, 'loss/train': 1.9434902667999268} -08/30/2021 17:37:56 - INFO - __main__ - Step 24795: {'lr': 0.00047130289075797107, 'samples': 4760640, 'steps': 24794, 'loss/train': 1.1096513271331787} -08/30/2021 17:37:56 - INFO - __main__ - Step 24796: {'lr': 0.0004713004220708257, 'samples': 4760832, 'steps': 24795, 'loss/train': 1.5200589895248413} -08/30/2021 17:37:56 - INFO - __main__ - Step 24797: {'lr': 0.0004712979532839656, 'samples': 4761024, 'steps': 24796, 'loss/train': 1.271109700202942} -08/30/2021 17:37:58 - INFO - __main__ - Step 24798: {'lr': 0.00047129548439739225, 'samples': 4761216, 'steps': 24797, 'loss/train': 1.5104845762252808} -08/30/2021 17:37:58 - INFO - __main__ - Step 24799: {'lr': 0.0004712930154111065, 'samples': 4761408, 'steps': 24798, 'loss/train': 1.9404298067092896} -08/30/2021 17:37:59 - INFO - __main__ - Step 24800: {'lr': 0.00047129054632510947, 'samples': 4761600, 'steps': 24799, 'loss/train': 1.883735179901123} -08/30/2021 17:37:59 - INFO - __main__ - Step 24801: {'lr': 0.00047128807713940244, 'samples': 4761792, 'steps': 24800, 'loss/train': 1.948649287223816} -08/30/2021 17:38:00 - INFO - __main__ - Step 24802: {'lr': 0.00047128560785398633, 'samples': 4761984, 'steps': 24801, 'loss/train': 1.259140968322754} -08/30/2021 17:38:01 - INFO - __main__ - Step 24803: {'lr': 0.0004712831384688624, 'samples': 4762176, 'steps': 24802, 'loss/train': 1.251665472984314} -08/30/2021 17:38:01 - INFO - __main__ - Step 24804: {'lr': 0.00047128066898403166, 'samples': 4762368, 'steps': 24803, 'loss/train': 1.5575450658798218} -08/30/2021 17:38:02 - INFO - __main__ - Step 24805: {'lr': 0.00047127819939949534, 'samples': 4762560, 'steps': 24804, 'loss/train': 1.2906776666641235} -08/30/2021 17:38:02 - INFO - __main__ - Step 24806: {'lr': 0.00047127572971525437, 'samples': 4762752, 'steps': 24805, 'loss/train': 1.4693801403045654} -08/30/2021 17:38:02 - INFO - __main__ - Step 24807: {'lr': 0.00047127325993131006, 'samples': 4762944, 'steps': 24806, 'loss/train': 1.3121047019958496} -08/30/2021 17:38:04 - INFO - __main__ - Step 24808: {'lr': 0.0004712707900476634, 'samples': 4763136, 'steps': 24807, 'loss/train': 1.6688311100006104} -08/30/2021 17:38:04 - INFO - __main__ - Step 24809: {'lr': 0.00047126832006431555, 'samples': 4763328, 'steps': 24808, 'loss/train': 1.9442788362503052} -08/30/2021 17:38:05 - INFO - __main__ - Step 24810: {'lr': 0.00047126584998126756, 'samples': 4763520, 'steps': 24809, 'loss/train': 1.3375706672668457} -08/30/2021 17:38:05 - INFO - __main__ - Step 24811: {'lr': 0.0004712633797985206, 'samples': 4763712, 'steps': 24810, 'loss/train': 1.653232216835022} -08/30/2021 17:38:05 - INFO - __main__ - Step 24812: {'lr': 0.0004712609095160758, 'samples': 4763904, 'steps': 24811, 'loss/train': 1.692129373550415} -08/30/2021 17:38:07 - INFO - __main__ - Step 24813: {'lr': 0.0004712584391339343, 'samples': 4764096, 'steps': 24812, 'loss/train': 1.700097680091858} -08/30/2021 17:38:07 - INFO - __main__ - Step 24814: {'lr': 0.0004712559686520971, 'samples': 4764288, 'steps': 24813, 'loss/train': 1.7158104181289673} -08/30/2021 17:38:08 - INFO - __main__ - Step 24815: {'lr': 0.0004712534980705654, 'samples': 4764480, 'steps': 24814, 'loss/train': 2.4246253967285156} -08/30/2021 17:38:08 - INFO - __main__ - Step 24816: {'lr': 0.0004712510273893402, 'samples': 4764672, 'steps': 24815, 'loss/train': 1.4810903072357178} -08/30/2021 17:38:08 - INFO - __main__ - Step 24817: {'lr': 0.00047124855660842283, 'samples': 4764864, 'steps': 24816, 'loss/train': 0.9266908168792725} -08/30/2021 17:38:10 - INFO - __main__ - Step 24818: {'lr': 0.00047124608572781426, 'samples': 4765056, 'steps': 24817, 'loss/train': 1.8865001201629639} -08/30/2021 17:38:10 - INFO - __main__ - Step 24819: {'lr': 0.0004712436147475155, 'samples': 4765248, 'steps': 24818, 'loss/train': 1.4311137199401855} -08/30/2021 17:38:11 - INFO - __main__ - Step 24820: {'lr': 0.0004712411436675279, 'samples': 4765440, 'steps': 24819, 'loss/train': 0.7995826601982117} -08/30/2021 17:38:11 - INFO - __main__ - Step 24821: {'lr': 0.0004712386724878524, 'samples': 4765632, 'steps': 24820, 'loss/train': 0.9235925674438477} -08/30/2021 17:38:11 - INFO - __main__ - Step 24822: {'lr': 0.0004712362012084902, 'samples': 4765824, 'steps': 24821, 'loss/train': 1.8593734502792358} -08/30/2021 17:38:13 - INFO - __main__ - Step 24823: {'lr': 0.00047123372982944237, 'samples': 4766016, 'steps': 24822, 'loss/train': 1.6541578769683838} -08/30/2021 17:38:14 - INFO - __main__ - Step 24824: {'lr': 0.00047123125835071004, 'samples': 4766208, 'steps': 24823, 'loss/train': 1.3145304918289185} -08/30/2021 17:38:14 - INFO - __main__ - Step 24825: {'lr': 0.00047122878677229426, 'samples': 4766400, 'steps': 24824, 'loss/train': 2.6243112087249756} -08/30/2021 17:38:15 - INFO - __main__ - Step 24826: {'lr': 0.0004712263150941962, 'samples': 4766592, 'steps': 24825, 'loss/train': 1.3207083940505981} -08/30/2021 17:38:15 - INFO - __main__ - Step 24827: {'lr': 0.0004712238433164171, 'samples': 4766784, 'steps': 24826, 'loss/train': 0.24122515320777893} -08/30/2021 17:38:15 - INFO - __main__ - Step 24828: {'lr': 0.00047122137143895785, 'samples': 4766976, 'steps': 24827, 'loss/train': 2.5779922008514404} -08/30/2021 17:38:18 - INFO - __main__ - Step 24829: {'lr': 0.0004712188994618197, 'samples': 4767168, 'steps': 24828, 'loss/train': 1.5170645713806152} -08/30/2021 17:38:18 - INFO - __main__ - Step 24830: {'lr': 0.0004712164273850037, 'samples': 4767360, 'steps': 24829, 'loss/train': 1.8882523775100708} -08/30/2021 17:38:19 - INFO - __main__ - Step 24831: {'lr': 0.00047121395520851103, 'samples': 4767552, 'steps': 24830, 'loss/train': 1.510980248451233} -08/30/2021 17:38:19 - INFO - __main__ - Step 24832: {'lr': 0.00047121148293234274, 'samples': 4767744, 'steps': 24831, 'loss/train': 1.9384924173355103} -08/30/2021 17:38:19 - INFO - __main__ - Step 24833: {'lr': 0.00047120901055649995, 'samples': 4767936, 'steps': 24832, 'loss/train': 1.7600089311599731} -08/30/2021 17:38:20 - INFO - __main__ - Step 24834: {'lr': 0.0004712065380809838, 'samples': 4768128, 'steps': 24833, 'loss/train': 1.4324185848236084} -08/30/2021 17:38:21 - INFO - __main__ - Step 24835: {'lr': 0.0004712040655057954, 'samples': 4768320, 'steps': 24834, 'loss/train': 0.06933899223804474} -08/30/2021 17:38:22 - INFO - __main__ - Step 24836: {'lr': 0.0004712015928309359, 'samples': 4768512, 'steps': 24835, 'loss/train': 1.336204171180725} -08/30/2021 17:38:22 - INFO - __main__ - Step 24837: {'lr': 0.0004711991200564064, 'samples': 4768704, 'steps': 24836, 'loss/train': 2.059105157852173} -08/30/2021 17:38:22 - INFO - __main__ - Step 24838: {'lr': 0.0004711966471822079, 'samples': 4768896, 'steps': 24837, 'loss/train': 1.3179295063018799} -08/30/2021 17:38:23 - INFO - __main__ - Step 24839: {'lr': 0.00047119417420834163, 'samples': 4769088, 'steps': 24838, 'loss/train': 1.1504651308059692} -08/30/2021 17:38:24 - INFO - __main__ - Step 24840: {'lr': 0.00047119170113480867, 'samples': 4769280, 'steps': 24839, 'loss/train': 2.1416375637054443} -08/30/2021 17:38:25 - INFO - __main__ - Step 24841: {'lr': 0.00047118922796161026, 'samples': 4769472, 'steps': 24840, 'loss/train': 1.8710228204727173} -08/30/2021 17:38:25 - INFO - __main__ - Step 24842: {'lr': 0.00047118675468874727, 'samples': 4769664, 'steps': 24841, 'loss/train': 1.23186194896698} -08/30/2021 17:38:25 - INFO - __main__ - Step 24843: {'lr': 0.00047118428131622095, 'samples': 4769856, 'steps': 24842, 'loss/train': 1.758584976196289} -08/30/2021 17:38:26 - INFO - __main__ - Step 24844: {'lr': 0.00047118180784403243, 'samples': 4770048, 'steps': 24843, 'loss/train': 2.0206093788146973} -08/30/2021 17:38:26 - INFO - __main__ - Step 24845: {'lr': 0.0004711793342721828, 'samples': 4770240, 'steps': 24844, 'loss/train': 1.0911056995391846} -08/30/2021 17:38:28 - INFO - __main__ - Step 24846: {'lr': 0.00047117686060067315, 'samples': 4770432, 'steps': 24845, 'loss/train': 2.045301675796509} -08/30/2021 17:38:28 - INFO - __main__ - Step 24847: {'lr': 0.00047117438682950467, 'samples': 4770624, 'steps': 24846, 'loss/train': 0.5238175988197327} -08/30/2021 17:38:29 - INFO - __main__ - Step 24848: {'lr': 0.0004711719129586784, 'samples': 4770816, 'steps': 24847, 'loss/train': 1.743025302886963} -08/30/2021 17:38:29 - INFO - __main__ - Step 24849: {'lr': 0.0004711694389881955, 'samples': 4771008, 'steps': 24848, 'loss/train': 1.199263334274292} -08/30/2021 17:38:29 - INFO - __main__ - Step 24850: {'lr': 0.000471166964918057, 'samples': 4771200, 'steps': 24849, 'loss/train': 1.631496787071228} -08/30/2021 17:38:31 - INFO - __main__ - Step 24851: {'lr': 0.0004711644907482641, 'samples': 4771392, 'steps': 24850, 'loss/train': 1.8362065553665161} -08/30/2021 17:38:31 - INFO - __main__ - Step 24852: {'lr': 0.00047116201647881794, 'samples': 4771584, 'steps': 24851, 'loss/train': 1.4992926120758057} -08/30/2021 17:38:32 - INFO - __main__ - Step 24853: {'lr': 0.00047115954210971955, 'samples': 4771776, 'steps': 24852, 'loss/train': 1.4682295322418213} -08/30/2021 17:38:32 - INFO - __main__ - Step 24854: {'lr': 0.0004711570676409701, 'samples': 4771968, 'steps': 24853, 'loss/train': 1.775540828704834} -08/30/2021 17:38:32 - INFO - __main__ - Step 24855: {'lr': 0.0004711545930725707, 'samples': 4772160, 'steps': 24854, 'loss/train': 1.4458611011505127} -08/30/2021 17:38:34 - INFO - __main__ - Step 24856: {'lr': 0.0004711521184045224, 'samples': 4772352, 'steps': 24855, 'loss/train': 1.4048656225204468} -08/30/2021 17:38:34 - INFO - __main__ - Step 24857: {'lr': 0.0004711496436368264, 'samples': 4772544, 'steps': 24856, 'loss/train': 2.022448778152466} -08/30/2021 17:38:35 - INFO - __main__ - Step 24858: {'lr': 0.00047114716876948384, 'samples': 4772736, 'steps': 24857, 'loss/train': 1.2480905055999756} -08/30/2021 17:38:35 - INFO - __main__ - Step 24859: {'lr': 0.0004711446938024957, 'samples': 4772928, 'steps': 24858, 'loss/train': 0.9936212301254272} -08/30/2021 17:38:35 - INFO - __main__ - Step 24860: {'lr': 0.00047114221873586316, 'samples': 4773120, 'steps': 24859, 'loss/train': 1.71892249584198} -08/30/2021 17:38:37 - INFO - __main__ - Step 24861: {'lr': 0.00047113974356958744, 'samples': 4773312, 'steps': 24860, 'loss/train': 1.7533053159713745} -08/30/2021 17:38:37 - INFO - __main__ - Step 24862: {'lr': 0.0004711372683036695, 'samples': 4773504, 'steps': 24861, 'loss/train': 2.017672538757324} -08/30/2021 17:38:38 - INFO - __main__ - Step 24863: {'lr': 0.0004711347929381105, 'samples': 4773696, 'steps': 24862, 'loss/train': 1.5883532762527466} -08/30/2021 17:38:38 - INFO - __main__ - Step 24864: {'lr': 0.00047113231747291165, 'samples': 4773888, 'steps': 24863, 'loss/train': 1.5586352348327637} -08/30/2021 17:38:38 - INFO - __main__ - Step 24865: {'lr': 0.0004711298419080739, 'samples': 4774080, 'steps': 24864, 'loss/train': 1.341946005821228} -08/30/2021 17:38:40 - INFO - __main__ - Step 24866: {'lr': 0.00047112736624359855, 'samples': 4774272, 'steps': 24865, 'loss/train': 1.8073546886444092} -08/30/2021 17:38:40 - INFO - __main__ - Step 24867: {'lr': 0.00047112489047948655, 'samples': 4774464, 'steps': 24866, 'loss/train': 1.7532434463500977} -08/30/2021 17:38:41 - INFO - __main__ - Step 24868: {'lr': 0.00047112241461573913, 'samples': 4774656, 'steps': 24867, 'loss/train': 1.4599817991256714} -08/30/2021 17:38:41 - INFO - __main__ - Step 24869: {'lr': 0.0004711199386523573, 'samples': 4774848, 'steps': 24868, 'loss/train': 1.343593716621399} -08/30/2021 17:38:41 - INFO - __main__ - Step 24870: {'lr': 0.0004711174625893423, 'samples': 4775040, 'steps': 24869, 'loss/train': 1.7296785116195679} -08/30/2021 17:38:43 - INFO - __main__ - Step 24871: {'lr': 0.00047111498642669517, 'samples': 4775232, 'steps': 24870, 'loss/train': 1.6996002197265625} -08/30/2021 17:38:43 - INFO - __main__ - Step 24872: {'lr': 0.00047111251016441704, 'samples': 4775424, 'steps': 24871, 'loss/train': 2.030810832977295} -08/30/2021 17:38:44 - INFO - __main__ - Step 24873: {'lr': 0.0004711100338025089, 'samples': 4775616, 'steps': 24872, 'loss/train': 0.7744000554084778} -08/30/2021 17:38:44 - INFO - __main__ - Step 24874: {'lr': 0.00047110755734097216, 'samples': 4775808, 'steps': 24873, 'loss/train': 1.6111209392547607} -08/30/2021 17:38:44 - INFO - __main__ - Step 24875: {'lr': 0.00047110508077980774, 'samples': 4776000, 'steps': 24874, 'loss/train': 1.3004311323165894} -08/30/2021 17:38:46 - INFO - __main__ - Step 24876: {'lr': 0.00047110260411901674, 'samples': 4776192, 'steps': 24875, 'loss/train': 1.915921926498413} -08/30/2021 17:38:46 - INFO - __main__ - Step 24877: {'lr': 0.0004711001273586003, 'samples': 4776384, 'steps': 24876, 'loss/train': 1.6893506050109863} -08/30/2021 17:38:47 - INFO - __main__ - Step 24878: {'lr': 0.0004710976504985596, 'samples': 4776576, 'steps': 24877, 'loss/train': 2.1351051330566406} -08/30/2021 17:38:47 - INFO - __main__ - Step 24879: {'lr': 0.00047109517353889575, 'samples': 4776768, 'steps': 24878, 'loss/train': 1.200385332107544} -08/30/2021 17:38:47 - INFO - __main__ - Step 24880: {'lr': 0.0004710926964796097, 'samples': 4776960, 'steps': 24879, 'loss/train': 1.736669898033142} -08/30/2021 17:38:50 - INFO - __main__ - Step 24881: {'lr': 0.00047109021932070284, 'samples': 4777152, 'steps': 24880, 'loss/train': 1.8226144313812256} -08/30/2021 17:38:50 - INFO - __main__ - Step 24882: {'lr': 0.00047108774206217605, 'samples': 4777344, 'steps': 24881, 'loss/train': 1.485541582107544} -08/30/2021 17:38:50 - INFO - __main__ - Step 24883: {'lr': 0.00047108526470403055, 'samples': 4777536, 'steps': 24882, 'loss/train': 1.3955153226852417} -08/30/2021 17:38:51 - INFO - __main__ - Step 24884: {'lr': 0.0004710827872462674, 'samples': 4777728, 'steps': 24883, 'loss/train': 1.0091819763183594} -08/30/2021 17:38:51 - INFO - __main__ - Step 24885: {'lr': 0.00047108030968888784, 'samples': 4777920, 'steps': 24884, 'loss/train': 1.0975103378295898} -08/30/2021 17:38:51 - INFO - __main__ - Step 24886: {'lr': 0.00047107783203189285, 'samples': 4778112, 'steps': 24885, 'loss/train': 2.1459314823150635} -08/30/2021 17:38:53 - INFO - __main__ - Step 24887: {'lr': 0.0004710753542752836, 'samples': 4778304, 'steps': 24886, 'loss/train': 1.6431077718734741} -08/30/2021 17:38:53 - INFO - __main__ - Step 24888: {'lr': 0.0004710728764190612, 'samples': 4778496, 'steps': 24887, 'loss/train': 1.7486584186553955} -08/30/2021 17:38:54 - INFO - __main__ - Step 24889: {'lr': 0.0004710703984632268, 'samples': 4778688, 'steps': 24888, 'loss/train': 1.5060125589370728} -08/30/2021 17:38:54 - INFO - __main__ - Step 24890: {'lr': 0.0004710679204077815, 'samples': 4778880, 'steps': 24889, 'loss/train': 1.759198546409607} -08/30/2021 17:38:55 - INFO - __main__ - Step 24891: {'lr': 0.0004710654422527264, 'samples': 4779072, 'steps': 24890, 'loss/train': 1.566688060760498} -08/30/2021 17:38:56 - INFO - __main__ - Step 24892: {'lr': 0.0004710629639980626, 'samples': 4779264, 'steps': 24891, 'loss/train': 1.099583387374878} -08/30/2021 17:38:57 - INFO - __main__ - Step 24893: {'lr': 0.0004710604856437912, 'samples': 4779456, 'steps': 24892, 'loss/train': 1.08847975730896} -08/30/2021 17:38:57 - INFO - __main__ - Step 24894: {'lr': 0.00047105800718991343, 'samples': 4779648, 'steps': 24893, 'loss/train': 1.5162407159805298} -08/30/2021 17:38:57 - INFO - __main__ - Step 24895: {'lr': 0.0004710555286364303, 'samples': 4779840, 'steps': 24894, 'loss/train': 1.71968412399292} -08/30/2021 17:38:58 - INFO - __main__ - Step 24896: {'lr': 0.000471053049983343, 'samples': 4780032, 'steps': 24895, 'loss/train': 1.7614107131958008} -08/30/2021 17:39:00 - INFO - __main__ - Step 24897: {'lr': 0.0004710505712306526, 'samples': 4780224, 'steps': 24896, 'loss/train': 0.6114704608917236} -08/30/2021 17:39:00 - INFO - __main__ - Step 24898: {'lr': 0.00047104809237836023, 'samples': 4780416, 'steps': 24897, 'loss/train': 1.1677278280258179} -08/30/2021 17:39:00 - INFO - __main__ - Step 24899: {'lr': 0.0004710456134264669, 'samples': 4780608, 'steps': 24898, 'loss/train': 2.2039995193481445} -08/30/2021 17:39:01 - INFO - __main__ - Step 24900: {'lr': 0.0004710431343749739, 'samples': 4780800, 'steps': 24899, 'loss/train': 1.7204174995422363} -08/30/2021 17:39:01 - INFO - __main__ - Step 24901: {'lr': 0.0004710406552238823, 'samples': 4780992, 'steps': 24900, 'loss/train': 1.0888166427612305} -08/30/2021 17:39:02 - INFO - __main__ - Step 24902: {'lr': 0.0004710381759731932, 'samples': 4781184, 'steps': 24901, 'loss/train': 1.6266021728515625} -08/30/2021 17:39:03 - INFO - __main__ - Step 24903: {'lr': 0.0004710356966229077, 'samples': 4781376, 'steps': 24902, 'loss/train': 1.5151076316833496} -08/30/2021 17:39:03 - INFO - __main__ - Step 24904: {'lr': 0.00047103321717302684, 'samples': 4781568, 'steps': 24903, 'loss/train': 0.9552773833274841} -08/30/2021 17:39:04 - INFO - __main__ - Step 24905: {'lr': 0.00047103073762355186, 'samples': 4781760, 'steps': 24904, 'loss/train': 1.417817234992981} -08/30/2021 17:39:04 - INFO - __main__ - Step 24906: {'lr': 0.0004710282579744839, 'samples': 4781952, 'steps': 24905, 'loss/train': 1.8440959453582764} -08/30/2021 17:39:06 - INFO - __main__ - Step 24907: {'lr': 0.000471025778225824, 'samples': 4782144, 'steps': 24906, 'loss/train': 1.4775582551956177} -08/30/2021 17:39:06 - INFO - __main__ - Step 24908: {'lr': 0.0004710232983775733, 'samples': 4782336, 'steps': 24907, 'loss/train': 1.6019210815429688} -08/30/2021 17:39:06 - INFO - __main__ - Step 24909: {'lr': 0.0004710208184297329, 'samples': 4782528, 'steps': 24908, 'loss/train': 0.8739994168281555} -08/30/2021 17:39:07 - INFO - __main__ - Step 24910: {'lr': 0.0004710183383823039, 'samples': 4782720, 'steps': 24909, 'loss/train': 1.1203923225402832} -08/30/2021 17:39:07 - INFO - __main__ - Step 24911: {'lr': 0.00047101585823528745, 'samples': 4782912, 'steps': 24910, 'loss/train': 1.5857607126235962} -08/30/2021 17:39:08 - INFO - __main__ - Step 24912: {'lr': 0.0004710133779886847, 'samples': 4783104, 'steps': 24911, 'loss/train': 1.714115023612976} -08/30/2021 17:39:09 - INFO - __main__ - Step 24913: {'lr': 0.00047101089764249674, 'samples': 4783296, 'steps': 24912, 'loss/train': 1.8911681175231934} -08/30/2021 17:39:10 - INFO - __main__ - Step 24914: {'lr': 0.0004710084171967246, 'samples': 4783488, 'steps': 24913, 'loss/train': 2.1133487224578857} -08/30/2021 17:39:10 - INFO - __main__ - Step 24915: {'lr': 0.00047100593665136946, 'samples': 4783680, 'steps': 24914, 'loss/train': 2.4652905464172363} -08/30/2021 17:39:10 - INFO - __main__ - Step 24916: {'lr': 0.0004710034560064326, 'samples': 4783872, 'steps': 24915, 'loss/train': 1.652906060218811} -08/30/2021 17:39:11 - INFO - __main__ - Step 24917: {'lr': 0.00047100097526191486, 'samples': 4784064, 'steps': 24916, 'loss/train': 1.570051908493042} -08/30/2021 17:39:12 - INFO - __main__ - Step 24918: {'lr': 0.0004709984944178176, 'samples': 4784256, 'steps': 24917, 'loss/train': 0.9035937190055847} -08/30/2021 17:39:12 - INFO - __main__ - Step 24919: {'lr': 0.0004709960134741418, 'samples': 4784448, 'steps': 24918, 'loss/train': 1.7699795961380005} -08/30/2021 17:39:13 - INFO - __main__ - Step 24920: {'lr': 0.00047099353243088856, 'samples': 4784640, 'steps': 24919, 'loss/train': 1.5828999280929565} -08/30/2021 17:39:13 - INFO - __main__ - Step 24921: {'lr': 0.00047099105128805906, 'samples': 4784832, 'steps': 24920, 'loss/train': 1.346340537071228} -08/30/2021 17:39:14 - INFO - __main__ - Step 24922: {'lr': 0.00047098857004565444, 'samples': 4785024, 'steps': 24921, 'loss/train': 1.6656728982925415} -08/30/2021 17:39:15 - INFO - __main__ - Step 24923: {'lr': 0.00047098608870367576, 'samples': 4785216, 'steps': 24922, 'loss/train': 1.6750472784042358} -08/30/2021 17:39:15 - INFO - __main__ - Step 24924: {'lr': 0.00047098360726212406, 'samples': 4785408, 'steps': 24923, 'loss/train': 1.434363603591919} -08/30/2021 17:39:16 - INFO - __main__ - Step 24925: {'lr': 0.0004709811257210007, 'samples': 4785600, 'steps': 24924, 'loss/train': 1.6387243270874023} -08/30/2021 17:39:16 - INFO - __main__ - Step 24926: {'lr': 0.0004709786440803066, 'samples': 4785792, 'steps': 24925, 'loss/train': 1.2350859642028809} -08/30/2021 17:39:16 - INFO - __main__ - Step 24927: {'lr': 0.00047097616234004295, 'samples': 4785984, 'steps': 24926, 'loss/train': 1.7146450281143188} -08/30/2021 17:39:18 - INFO - __main__ - Step 24928: {'lr': 0.00047097368050021083, 'samples': 4786176, 'steps': 24927, 'loss/train': 1.990890383720398} -08/30/2021 17:39:18 - INFO - __main__ - Step 24929: {'lr': 0.0004709711985608114, 'samples': 4786368, 'steps': 24928, 'loss/train': 1.1382001638412476} -08/30/2021 17:39:19 - INFO - __main__ - Step 24930: {'lr': 0.0004709687165218457, 'samples': 4786560, 'steps': 24929, 'loss/train': 1.7983508110046387} -08/30/2021 17:39:19 - INFO - __main__ - Step 24931: {'lr': 0.00047096623438331497, 'samples': 4786752, 'steps': 24930, 'loss/train': 1.7613146305084229} -08/30/2021 17:39:19 - INFO - __main__ - Step 24932: {'lr': 0.00047096375214522026, 'samples': 4786944, 'steps': 24931, 'loss/train': 1.2897993326187134} -08/30/2021 17:39:21 - INFO - __main__ - Step 24933: {'lr': 0.0004709612698075627, 'samples': 4787136, 'steps': 24932, 'loss/train': 1.6820757389068604} -08/30/2021 17:39:21 - INFO - __main__ - Step 24934: {'lr': 0.00047095878737034335, 'samples': 4787328, 'steps': 24933, 'loss/train': 1.4690594673156738} -08/30/2021 17:39:22 - INFO - __main__ - Step 24935: {'lr': 0.00047095630483356336, 'samples': 4787520, 'steps': 24934, 'loss/train': 1.6006884574890137} -08/30/2021 17:39:22 - INFO - __main__ - Step 24936: {'lr': 0.00047095382219722396, 'samples': 4787712, 'steps': 24935, 'loss/train': 2.2609922885894775} -08/30/2021 17:39:22 - INFO - __main__ - Step 24937: {'lr': 0.0004709513394613261, 'samples': 4787904, 'steps': 24936, 'loss/train': 0.47464871406555176} -08/30/2021 17:39:25 - INFO - __main__ - Step 24938: {'lr': 0.00047094885662587104, 'samples': 4788096, 'steps': 24937, 'loss/train': 1.642889142036438} -08/30/2021 17:39:25 - INFO - __main__ - Step 24939: {'lr': 0.0004709463736908598, 'samples': 4788288, 'steps': 24938, 'loss/train': 1.1965306997299194} -08/30/2021 17:39:26 - INFO - __main__ - Step 24940: {'lr': 0.0004709438906562935, 'samples': 4788480, 'steps': 24939, 'loss/train': 1.2444170713424683} -08/30/2021 17:39:26 - INFO - __main__ - Step 24941: {'lr': 0.0004709414075221734, 'samples': 4788672, 'steps': 24940, 'loss/train': 1.7122747898101807} -08/30/2021 17:39:26 - INFO - __main__ - Step 24942: {'lr': 0.0004709389242885004, 'samples': 4788864, 'steps': 24941, 'loss/train': 1.6825224161148071} -08/30/2021 17:39:27 - INFO - __main__ - Step 24943: {'lr': 0.00047093644095527574, 'samples': 4789056, 'steps': 24942, 'loss/train': 1.1214473247528076} -08/30/2021 17:39:28 - INFO - __main__ - Step 24944: {'lr': 0.00047093395752250056, 'samples': 4789248, 'steps': 24943, 'loss/train': 4.759702205657959} -08/30/2021 17:39:28 - INFO - __main__ - Step 24945: {'lr': 0.000470931473990176, 'samples': 4789440, 'steps': 24944, 'loss/train': 1.3784898519515991} -08/30/2021 17:39:29 - INFO - __main__ - Step 24946: {'lr': 0.00047092899035830303, 'samples': 4789632, 'steps': 24945, 'loss/train': 1.405518651008606} -08/30/2021 17:39:29 - INFO - __main__ - Step 24947: {'lr': 0.00047092650662688295, 'samples': 4789824, 'steps': 24946, 'loss/train': 2.6035568714141846} -08/30/2021 17:39:30 - INFO - __main__ - Step 24948: {'lr': 0.00047092402279591674, 'samples': 4790016, 'steps': 24947, 'loss/train': 1.7906999588012695} -08/30/2021 17:39:31 - INFO - __main__ - Step 24949: {'lr': 0.00047092153886540554, 'samples': 4790208, 'steps': 24948, 'loss/train': 1.128928303718567} -08/30/2021 17:39:32 - INFO - __main__ - Step 24950: {'lr': 0.0004709190548353506, 'samples': 4790400, 'steps': 24949, 'loss/train': 1.5134373903274536} -08/30/2021 17:39:32 - INFO - __main__ - Step 24951: {'lr': 0.0004709165707057529, 'samples': 4790592, 'steps': 24950, 'loss/train': 0.7753484845161438} -08/30/2021 17:39:33 - INFO - __main__ - Step 24952: {'lr': 0.0004709140864766136, 'samples': 4790784, 'steps': 24951, 'loss/train': 1.4935215711593628} -08/30/2021 17:39:33 - INFO - __main__ - Step 24953: {'lr': 0.0004709116021479338, 'samples': 4790976, 'steps': 24952, 'loss/train': 1.3633826971054077} -08/30/2021 17:39:34 - INFO - __main__ - Step 24954: {'lr': 0.00047090911771971466, 'samples': 4791168, 'steps': 24953, 'loss/train': 1.789441466331482} -08/30/2021 17:39:35 - INFO - __main__ - Step 24955: {'lr': 0.0004709066331919573, 'samples': 4791360, 'steps': 24954, 'loss/train': 0.17537353932857513} -08/30/2021 17:39:36 - INFO - __main__ - Step 24956: {'lr': 0.0004709041485646628, 'samples': 4791552, 'steps': 24955, 'loss/train': 0.8306893110275269} -08/30/2021 17:39:36 - INFO - __main__ - Step 24957: {'lr': 0.0004709016638378323, 'samples': 4791744, 'steps': 24956, 'loss/train': 1.2651863098144531} -08/30/2021 17:39:36 - INFO - __main__ - Step 24958: {'lr': 0.00047089917901146694, 'samples': 4791936, 'steps': 24957, 'loss/train': 1.9289519786834717} -08/30/2021 17:39:37 - INFO - __main__ - Step 24959: {'lr': 0.0004708966940855678, 'samples': 4792128, 'steps': 24958, 'loss/train': 1.972502589225769} -08/30/2021 17:39:38 - INFO - __main__ - Step 24960: {'lr': 0.00047089420906013603, 'samples': 4792320, 'steps': 24959, 'loss/train': 1.3213255405426025} -08/30/2021 17:39:38 - INFO - __main__ - Step 24961: {'lr': 0.0004708917239351727, 'samples': 4792512, 'steps': 24960, 'loss/train': 2.070970058441162} -08/30/2021 17:39:39 - INFO - __main__ - Step 24962: {'lr': 0.000470889238710679, 'samples': 4792704, 'steps': 24961, 'loss/train': 1.6014602184295654} -08/30/2021 17:39:39 - INFO - __main__ - Step 24963: {'lr': 0.00047088675338665596, 'samples': 4792896, 'steps': 24962, 'loss/train': 1.116607666015625} -08/30/2021 17:39:40 - INFO - __main__ - Step 24964: {'lr': 0.00047088426796310486, 'samples': 4793088, 'steps': 24963, 'loss/train': 1.4058283567428589} -08/30/2021 17:39:41 - INFO - __main__ - Step 24965: {'lr': 0.00047088178244002665, 'samples': 4793280, 'steps': 24964, 'loss/train': 1.330124855041504} -08/30/2021 17:39:41 - INFO - __main__ - Step 24966: {'lr': 0.00047087929681742253, 'samples': 4793472, 'steps': 24965, 'loss/train': 1.7067776918411255} -08/30/2021 17:39:42 - INFO - __main__ - Step 24967: {'lr': 0.00047087681109529364, 'samples': 4793664, 'steps': 24966, 'loss/train': 1.6116641759872437} -08/30/2021 17:39:42 - INFO - __main__ - Step 24968: {'lr': 0.00047087432527364106, 'samples': 4793856, 'steps': 24967, 'loss/train': 1.295219898223877} -08/30/2021 17:39:43 - INFO - __main__ - Step 24969: {'lr': 0.0004708718393524659, 'samples': 4794048, 'steps': 24968, 'loss/train': 1.5851590633392334} -08/30/2021 17:39:44 - INFO - __main__ - Step 24970: {'lr': 0.0004708693533317693, 'samples': 4794240, 'steps': 24969, 'loss/train': 0.9088825583457947} -08/30/2021 17:39:44 - INFO - __main__ - Step 24971: {'lr': 0.00047086686721155237, 'samples': 4794432, 'steps': 24970, 'loss/train': 1.8053698539733887} -08/30/2021 17:39:45 - INFO - __main__ - Step 24972: {'lr': 0.00047086438099181615, 'samples': 4794624, 'steps': 24971, 'loss/train': 1.4603807926177979} -08/30/2021 17:39:45 - INFO - __main__ - Step 24973: {'lr': 0.00047086189467256194, 'samples': 4794816, 'steps': 24972, 'loss/train': 1.676476001739502} -08/30/2021 17:39:46 - INFO - __main__ - Step 24974: {'lr': 0.0004708594082537908, 'samples': 4795008, 'steps': 24973, 'loss/train': 1.2030974626541138} -08/30/2021 17:39:46 - INFO - __main__ - Step 24975: {'lr': 0.00047085692173550375, 'samples': 4795200, 'steps': 24974, 'loss/train': 1.249074101448059} -08/30/2021 17:39:47 - INFO - __main__ - Step 24976: {'lr': 0.00047085443511770206, 'samples': 4795392, 'steps': 24975, 'loss/train': 1.3432697057724} -08/30/2021 17:39:48 - INFO - __main__ - Step 24977: {'lr': 0.0004708519484003867, 'samples': 4795584, 'steps': 24976, 'loss/train': 1.0533641576766968} -08/30/2021 17:39:48 - INFO - __main__ - Step 24978: {'lr': 0.0004708494615835589, 'samples': 4795776, 'steps': 24977, 'loss/train': 1.8369439840316772} -08/30/2021 17:39:49 - INFO - __main__ - Step 24979: {'lr': 0.00047084697466721973, 'samples': 4795968, 'steps': 24978, 'loss/train': 1.2232842445373535} -08/30/2021 17:39:49 - INFO - __main__ - Step 24980: {'lr': 0.0004708444876513703, 'samples': 4796160, 'steps': 24979, 'loss/train': 1.6410752534866333} -08/30/2021 17:39:50 - INFO - __main__ - Step 24981: {'lr': 0.0004708420005360118, 'samples': 4796352, 'steps': 24980, 'loss/train': 0.9991140365600586} -08/30/2021 17:39:51 - INFO - __main__ - Step 24982: {'lr': 0.0004708395133211452, 'samples': 4796544, 'steps': 24981, 'loss/train': 1.582206130027771} -08/30/2021 17:39:51 - INFO - __main__ - Step 24983: {'lr': 0.0004708370260067718, 'samples': 4796736, 'steps': 24982, 'loss/train': 1.5868440866470337} -08/30/2021 17:39:51 - INFO - __main__ - Step 24984: {'lr': 0.00047083453859289267, 'samples': 4796928, 'steps': 24983, 'loss/train': 1.836672067642212} -08/30/2021 17:39:52 - INFO - __main__ - Step 24985: {'lr': 0.00047083205107950886, 'samples': 4797120, 'steps': 24984, 'loss/train': 1.5847891569137573} -08/30/2021 17:39:53 - INFO - __main__ - Step 24986: {'lr': 0.00047082956346662153, 'samples': 4797312, 'steps': 24985, 'loss/train': 0.21408843994140625} -08/30/2021 17:39:54 - INFO - __main__ - Step 24987: {'lr': 0.00047082707575423177, 'samples': 4797504, 'steps': 24986, 'loss/train': 1.650818943977356} -08/30/2021 17:39:54 - INFO - __main__ - Step 24988: {'lr': 0.00047082458794234087, 'samples': 4797696, 'steps': 24987, 'loss/train': 1.6033084392547607} -08/30/2021 17:39:54 - INFO - __main__ - Step 24989: {'lr': 0.0004708221000309497, 'samples': 4797888, 'steps': 24988, 'loss/train': 1.9122878313064575} -08/30/2021 17:39:55 - INFO - __main__ - Step 24990: {'lr': 0.0004708196120200595, 'samples': 4798080, 'steps': 24989, 'loss/train': 1.5654484033584595} -08/30/2021 17:39:56 - INFO - __main__ - Step 24991: {'lr': 0.0004708171239096715, 'samples': 4798272, 'steps': 24990, 'loss/train': 1.3105615377426147} -08/30/2021 17:39:57 - INFO - __main__ - Step 24992: {'lr': 0.00047081463569978655, 'samples': 4798464, 'steps': 24991, 'loss/train': 1.3675084114074707} -08/30/2021 17:39:57 - INFO - __main__ - Step 24993: {'lr': 0.00047081214739040606, 'samples': 4798656, 'steps': 24992, 'loss/train': 1.4760974645614624} -08/30/2021 17:39:58 - INFO - __main__ - Step 24994: {'lr': 0.000470809658981531, 'samples': 4798848, 'steps': 24993, 'loss/train': 2.2376883029937744} -08/30/2021 17:39:58 - INFO - __main__ - Step 24995: {'lr': 0.00047080717047316245, 'samples': 4799040, 'steps': 24994, 'loss/train': 1.4054299592971802} -08/30/2021 17:39:59 - INFO - __main__ - Step 24996: {'lr': 0.0004708046818653017, 'samples': 4799232, 'steps': 24995, 'loss/train': 1.6642056703567505} -08/30/2021 17:40:00 - INFO - __main__ - Step 24997: {'lr': 0.0004708021931579497, 'samples': 4799424, 'steps': 24996, 'loss/train': 1.3085339069366455} -08/30/2021 17:40:00 - INFO - __main__ - Step 24998: {'lr': 0.00047079970435110765, 'samples': 4799616, 'steps': 24997, 'loss/train': 1.699511170387268} -08/30/2021 17:40:01 - INFO - __main__ - Step 24999: {'lr': 0.0004707972154447766, 'samples': 4799808, 'steps': 24998, 'loss/train': 4.631608963012695} -08/30/2021 17:40:01 - INFO - __main__ - Step 25000: {'lr': 0.00047079472643895784, 'samples': 4800000, 'steps': 24999, 'loss/train': 1.5615689754486084} -08/30/2021 17:40:01 - INFO - __main__ - Step 25001: {'lr': 0.00047079223733365234, 'samples': 4800192, 'steps': 25000, 'loss/train': 1.6584721803665161} -08/30/2021 17:40:03 - INFO - __main__ - Step 25002: {'lr': 0.0004707897481288612, 'samples': 4800384, 'steps': 25001, 'loss/train': 1.011987328529358} -08/30/2021 17:40:03 - INFO - __main__ - Step 25003: {'lr': 0.00047078725882458575, 'samples': 4800576, 'steps': 25002, 'loss/train': 1.2912969589233398} -08/30/2021 17:40:04 - INFO - __main__ - Step 25004: {'lr': 0.0004707847694208269, 'samples': 4800768, 'steps': 25003, 'loss/train': 1.742913007736206} -08/30/2021 17:40:04 - INFO - __main__ - Step 25005: {'lr': 0.0004707822799175858, 'samples': 4800960, 'steps': 25004, 'loss/train': 1.720575213432312} -08/30/2021 17:40:04 - INFO - __main__ - Step 25006: {'lr': 0.00047077979031486363, 'samples': 4801152, 'steps': 25005, 'loss/train': 1.5674479007720947} -08/30/2021 17:40:06 - INFO - __main__ - Step 25007: {'lr': 0.0004707773006126615, 'samples': 4801344, 'steps': 25006, 'loss/train': 1.6338114738464355} -08/30/2021 17:40:07 - INFO - __main__ - Step 25008: {'lr': 0.0004707748108109805, 'samples': 4801536, 'steps': 25007, 'loss/train': 1.4947255849838257} -08/30/2021 17:40:07 - INFO - __main__ - Step 25009: {'lr': 0.0004707723209098218, 'samples': 4801728, 'steps': 25008, 'loss/train': 1.4501467943191528} -08/30/2021 17:40:08 - INFO - __main__ - Step 25010: {'lr': 0.0004707698309091865, 'samples': 4801920, 'steps': 25009, 'loss/train': 1.4030537605285645} -08/30/2021 17:40:08 - INFO - __main__ - Step 25011: {'lr': 0.00047076734080907576, 'samples': 4802112, 'steps': 25010, 'loss/train': 1.7794524431228638} -08/30/2021 17:40:09 - INFO - __main__ - Step 25012: {'lr': 0.0004707648506094906, 'samples': 4802304, 'steps': 25011, 'loss/train': 1.6770697832107544} -08/30/2021 17:40:10 - INFO - __main__ - Step 25013: {'lr': 0.0004707623603104322, 'samples': 4802496, 'steps': 25012, 'loss/train': 1.873600721359253} -08/30/2021 17:40:10 - INFO - __main__ - Step 25014: {'lr': 0.0004707598699119018, 'samples': 4802688, 'steps': 25013, 'loss/train': 1.5718786716461182} -08/30/2021 17:40:11 - INFO - __main__ - Step 25015: {'lr': 0.0004707573794139003, 'samples': 4802880, 'steps': 25014, 'loss/train': 1.6327112913131714} -08/30/2021 17:40:11 - INFO - __main__ - Step 25016: {'lr': 0.0004707548888164289, 'samples': 4803072, 'steps': 25015, 'loss/train': 1.7203716039657593} -08/30/2021 17:40:12 - INFO - __main__ - Step 25017: {'lr': 0.0004707523981194889, 'samples': 4803264, 'steps': 25016, 'loss/train': 1.2609792947769165} -08/30/2021 17:40:13 - INFO - __main__ - Step 25018: {'lr': 0.00047074990732308116, 'samples': 4803456, 'steps': 25017, 'loss/train': 1.330159068107605} -08/30/2021 17:40:13 - INFO - __main__ - Step 25019: {'lr': 0.00047074741642720694, 'samples': 4803648, 'steps': 25018, 'loss/train': 1.607756495475769} -08/30/2021 17:40:14 - INFO - __main__ - Step 25020: {'lr': 0.0004707449254318673, 'samples': 4803840, 'steps': 25019, 'loss/train': 1.688234567642212} -08/30/2021 17:40:14 - INFO - __main__ - Step 25021: {'lr': 0.0004707424343370635, 'samples': 4804032, 'steps': 25020, 'loss/train': 1.5290659666061401} -08/30/2021 17:40:16 - INFO - __main__ - Step 25022: {'lr': 0.00047073994314279647, 'samples': 4804224, 'steps': 25021, 'loss/train': 1.3709489107131958} -08/30/2021 17:40:16 - INFO - __main__ - Step 25023: {'lr': 0.0004707374518490675, 'samples': 4804416, 'steps': 25022, 'loss/train': 1.2842025756835938} -08/30/2021 17:40:16 - INFO - __main__ - Step 25024: {'lr': 0.0004707349604558776, 'samples': 4804608, 'steps': 25023, 'loss/train': 1.225508451461792} -08/30/2021 17:40:17 - INFO - __main__ - Step 25025: {'lr': 0.00047073246896322797, 'samples': 4804800, 'steps': 25024, 'loss/train': 2.0839381217956543} -08/30/2021 17:40:17 - INFO - __main__ - Step 25026: {'lr': 0.00047072997737111966, 'samples': 4804992, 'steps': 25025, 'loss/train': 1.4561882019042969} -08/30/2021 17:40:17 - INFO - __main__ - Step 25027: {'lr': 0.0004707274856795538, 'samples': 4805184, 'steps': 25026, 'loss/train': 1.6024748086929321} -08/30/2021 17:40:19 - INFO - __main__ - Step 25028: {'lr': 0.00047072499388853164, 'samples': 4805376, 'steps': 25027, 'loss/train': 1.900529146194458} -08/30/2021 17:40:19 - INFO - __main__ - Step 25029: {'lr': 0.0004707225019980541, 'samples': 4805568, 'steps': 25028, 'loss/train': 1.4839271306991577} -08/30/2021 17:40:20 - INFO - __main__ - Step 25030: {'lr': 0.00047072001000812247, 'samples': 4805760, 'steps': 25029, 'loss/train': 1.487958312034607} -08/30/2021 17:40:20 - INFO - __main__ - Step 25031: {'lr': 0.00047071751791873774, 'samples': 4805952, 'steps': 25030, 'loss/train': 1.3906569480895996} -08/30/2021 17:40:20 - INFO - __main__ - Step 25032: {'lr': 0.0004707150257299012, 'samples': 4806144, 'steps': 25031, 'loss/train': 1.6489684581756592} -08/30/2021 17:40:22 - INFO - __main__ - Step 25033: {'lr': 0.0004707125334416138, 'samples': 4806336, 'steps': 25032, 'loss/train': 1.3826849460601807} -08/30/2021 17:40:23 - INFO - __main__ - Step 25034: {'lr': 0.00047071004105387677, 'samples': 4806528, 'steps': 25033, 'loss/train': 1.9108388423919678} -08/30/2021 17:40:23 - INFO - __main__ - Step 25035: {'lr': 0.00047070754856669115, 'samples': 4806720, 'steps': 25034, 'loss/train': 1.31353759765625} -08/30/2021 17:40:24 - INFO - __main__ - Step 25036: {'lr': 0.0004707050559800582, 'samples': 4806912, 'steps': 25035, 'loss/train': 1.1166515350341797} -08/30/2021 17:40:24 - INFO - __main__ - Step 25037: {'lr': 0.00047070256329397893, 'samples': 4807104, 'steps': 25036, 'loss/train': 0.8583371639251709} -08/30/2021 17:40:24 - INFO - __main__ - Step 25038: {'lr': 0.0004707000705084545, 'samples': 4807296, 'steps': 25037, 'loss/train': 0.057708073407411575} -08/30/2021 17:40:26 - INFO - __main__ - Step 25039: {'lr': 0.000470697577623486, 'samples': 4807488, 'steps': 25038, 'loss/train': 1.9112403392791748} -08/30/2021 17:40:26 - INFO - __main__ - Step 25040: {'lr': 0.0004706950846390746, 'samples': 4807680, 'steps': 25039, 'loss/train': 1.9506802558898926} -08/30/2021 17:40:27 - INFO - __main__ - Step 25041: {'lr': 0.00047069259155522135, 'samples': 4807872, 'steps': 25040, 'loss/train': 1.3299362659454346} -08/30/2021 17:40:27 - INFO - __main__ - Step 25042: {'lr': 0.0004706900983719274, 'samples': 4808064, 'steps': 25041, 'loss/train': 2.207509756088257} -08/30/2021 17:40:27 - INFO - __main__ - Step 25043: {'lr': 0.000470687605089194, 'samples': 4808256, 'steps': 25042, 'loss/train': 1.5854017734527588} -08/30/2021 17:40:29 - INFO - __main__ - Step 25044: {'lr': 0.0004706851117070221, 'samples': 4808448, 'steps': 25043, 'loss/train': 1.9118982553482056} -08/30/2021 17:40:29 - INFO - __main__ - Step 25045: {'lr': 0.0004706826182254129, 'samples': 4808640, 'steps': 25044, 'loss/train': 1.6057268381118774} -08/30/2021 17:40:30 - INFO - __main__ - Step 25046: {'lr': 0.0004706801246443676, 'samples': 4808832, 'steps': 25045, 'loss/train': 1.7143179178237915} -08/30/2021 17:40:30 - INFO - __main__ - Step 25047: {'lr': 0.00047067763096388717, 'samples': 4809024, 'steps': 25046, 'loss/train': 1.1472886800765991} -08/30/2021 17:40:30 - INFO - __main__ - Step 25048: {'lr': 0.00047067513718397283, 'samples': 4809216, 'steps': 25047, 'loss/train': 1.8607536554336548} -08/30/2021 17:40:32 - INFO - __main__ - Step 25049: {'lr': 0.0004706726433046256, 'samples': 4809408, 'steps': 25048, 'loss/train': 1.89994478225708} -08/30/2021 17:40:32 - INFO - __main__ - Step 25050: {'lr': 0.00047067014932584674, 'samples': 4809600, 'steps': 25049, 'loss/train': 1.3649753332138062} -08/30/2021 17:40:33 - INFO - __main__ - Step 25051: {'lr': 0.0004706676552476373, 'samples': 4809792, 'steps': 25050, 'loss/train': 1.4867832660675049} -08/30/2021 17:40:33 - INFO - __main__ - Step 25052: {'lr': 0.0004706651610699985, 'samples': 4809984, 'steps': 25051, 'loss/train': 1.2261881828308105} -08/30/2021 17:40:33 - INFO - __main__ - Step 25053: {'lr': 0.00047066266679293125, 'samples': 4810176, 'steps': 25052, 'loss/train': 0.8619534969329834} -08/30/2021 17:40:34 - INFO - __main__ - Step 25054: {'lr': 0.0004706601724164369, 'samples': 4810368, 'steps': 25053, 'loss/train': 2.069847583770752} -08/30/2021 17:40:35 - INFO - __main__ - Step 25055: {'lr': 0.0004706576779405165, 'samples': 4810560, 'steps': 25054, 'loss/train': 1.9539846181869507} -08/30/2021 17:40:36 - INFO - __main__ - Step 25056: {'lr': 0.0004706551833651711, 'samples': 4810752, 'steps': 25055, 'loss/train': 0.2109277993440628} -08/30/2021 17:40:36 - INFO - __main__ - Step 25057: {'lr': 0.0004706526886904019, 'samples': 4810944, 'steps': 25056, 'loss/train': 1.317997694015503} -08/30/2021 17:40:37 - INFO - __main__ - Step 25058: {'lr': 0.00047065019391621, 'samples': 4811136, 'steps': 25057, 'loss/train': 1.2071038484573364} -08/30/2021 17:40:37 - INFO - __main__ - Step 25059: {'lr': 0.0004706476990425965, 'samples': 4811328, 'steps': 25058, 'loss/train': 1.1856105327606201} -08/30/2021 17:40:38 - INFO - __main__ - Step 25060: {'lr': 0.0004706452040695626, 'samples': 4811520, 'steps': 25059, 'loss/train': 1.4010510444641113} -08/30/2021 17:40:39 - INFO - __main__ - Step 25061: {'lr': 0.0004706427089971093, 'samples': 4811712, 'steps': 25060, 'loss/train': 1.15224027633667} -08/30/2021 17:40:39 - INFO - __main__ - Step 25062: {'lr': 0.0004706402138252379, 'samples': 4811904, 'steps': 25061, 'loss/train': 1.3296509981155396} -08/30/2021 17:40:39 - INFO - __main__ - Step 25063: {'lr': 0.00047063771855394935, 'samples': 4812096, 'steps': 25062, 'loss/train': 2.1697821617126465} -08/30/2021 17:40:40 - INFO - __main__ - Step 25064: {'lr': 0.00047063522318324484, 'samples': 4812288, 'steps': 25063, 'loss/train': 1.5971816778182983} -08/30/2021 17:40:42 - INFO - __main__ - Step 25065: {'lr': 0.00047063272771312556, 'samples': 4812480, 'steps': 25064, 'loss/train': 1.9891161918640137} -08/30/2021 17:40:43 - INFO - __main__ - Step 25066: {'lr': 0.0004706302321435926, 'samples': 4812672, 'steps': 25065, 'loss/train': 1.7171852588653564} -08/30/2021 17:40:43 - INFO - __main__ - Step 25067: {'lr': 0.00047062773647464694, 'samples': 4812864, 'steps': 25066, 'loss/train': 1.5297914743423462} -08/30/2021 17:40:43 - INFO - __main__ - Step 25068: {'lr': 0.00047062524070628993, 'samples': 4813056, 'steps': 25067, 'loss/train': 1.6285282373428345} -08/30/2021 17:40:44 - INFO - __main__ - Step 25069: {'lr': 0.00047062274483852253, 'samples': 4813248, 'steps': 25068, 'loss/train': 1.307554841041565} -08/30/2021 17:40:45 - INFO - __main__ - Step 25070: {'lr': 0.000470620248871346, 'samples': 4813440, 'steps': 25069, 'loss/train': 0.15752136707305908} -08/30/2021 17:40:46 - INFO - __main__ - Step 25071: {'lr': 0.00047061775280476134, 'samples': 4813632, 'steps': 25070, 'loss/train': 0.3412875831127167} -08/30/2021 17:40:46 - INFO - __main__ - Step 25072: {'lr': 0.0004706152566387697, 'samples': 4813824, 'steps': 25071, 'loss/train': 2.12052583694458} -08/30/2021 17:40:46 - INFO - __main__ - Step 25073: {'lr': 0.0004706127603733723, 'samples': 4814016, 'steps': 25072, 'loss/train': 0.8742642402648926} -08/30/2021 17:40:47 - INFO - __main__ - Step 25074: {'lr': 0.00047061026400857015, 'samples': 4814208, 'steps': 25073, 'loss/train': 0.27285999059677124} -08/30/2021 17:40:49 - INFO - __main__ - Step 25075: {'lr': 0.0004706077675443644, 'samples': 4814400, 'steps': 25074, 'loss/train': 1.3892403841018677} -08/30/2021 17:40:49 - INFO - __main__ - Step 25076: {'lr': 0.00047060527098075625, 'samples': 4814592, 'steps': 25075, 'loss/train': 1.2786834239959717} -08/30/2021 17:40:50 - INFO - __main__ - Step 25077: {'lr': 0.0004706027743177467, 'samples': 4814784, 'steps': 25076, 'loss/train': 1.3125505447387695} -08/30/2021 17:40:50 - INFO - __main__ - Step 25078: {'lr': 0.000470600277555337, 'samples': 4814976, 'steps': 25077, 'loss/train': 1.3752082586288452} -08/30/2021 17:40:50 - INFO - __main__ - Step 25079: {'lr': 0.0004705977806935282, 'samples': 4815168, 'steps': 25078, 'loss/train': 1.3756707906723022} -08/30/2021 17:40:51 - INFO - __main__ - Step 25080: {'lr': 0.00047059528373232147, 'samples': 4815360, 'steps': 25079, 'loss/train': 2.5226731300354004} -08/30/2021 17:40:52 - INFO - __main__ - Step 25081: {'lr': 0.0004705927866717179, 'samples': 4815552, 'steps': 25080, 'loss/train': 1.7651067972183228} -08/30/2021 17:40:53 - INFO - __main__ - Step 25082: {'lr': 0.0004705902895117186, 'samples': 4815744, 'steps': 25081, 'loss/train': 1.9038233757019043} -08/30/2021 17:40:53 - INFO - __main__ - Step 25083: {'lr': 0.00047058779225232474, 'samples': 4815936, 'steps': 25082, 'loss/train': 1.8142799139022827} -08/30/2021 17:40:53 - INFO - __main__ - Step 25084: {'lr': 0.0004705852948935374, 'samples': 4816128, 'steps': 25083, 'loss/train': 1.6670634746551514} -08/30/2021 17:40:54 - INFO - __main__ - Step 25085: {'lr': 0.00047058279743535775, 'samples': 4816320, 'steps': 25084, 'loss/train': 1.678105115890503} -08/30/2021 17:40:55 - INFO - __main__ - Step 25086: {'lr': 0.0004705802998777869, 'samples': 4816512, 'steps': 25085, 'loss/train': 1.5790992975234985} -08/30/2021 17:40:56 - INFO - __main__ - Step 25087: {'lr': 0.0004705778022208259, 'samples': 4816704, 'steps': 25086, 'loss/train': 1.2291311025619507} -08/30/2021 17:40:56 - INFO - __main__ - Step 25088: {'lr': 0.000470575304464476, 'samples': 4816896, 'steps': 25087, 'loss/train': 1.6294530630111694} -08/30/2021 17:40:57 - INFO - __main__ - Step 25089: {'lr': 0.00047057280660873835, 'samples': 4817088, 'steps': 25088, 'loss/train': 1.641780972480774} -08/30/2021 17:40:57 - INFO - __main__ - Step 25090: {'lr': 0.00047057030865361397, 'samples': 4817280, 'steps': 25089, 'loss/train': 1.677525520324707} -08/30/2021 17:40:59 - INFO - __main__ - Step 25091: {'lr': 0.0004705678105991039, 'samples': 4817472, 'steps': 25090, 'loss/train': 0.21901018917560577} -08/30/2021 17:40:59 - INFO - __main__ - Step 25092: {'lr': 0.00047056531244520945, 'samples': 4817664, 'steps': 25091, 'loss/train': 0.9002791047096252} -08/30/2021 17:41:00 - INFO - __main__ - Step 25093: {'lr': 0.0004705628141919317, 'samples': 4817856, 'steps': 25092, 'loss/train': 0.9649285674095154} -08/30/2021 17:41:00 - INFO - __main__ - Step 25094: {'lr': 0.00047056031583927175, 'samples': 4818048, 'steps': 25093, 'loss/train': 1.1545499563217163} -08/30/2021 17:41:00 - INFO - __main__ - Step 25095: {'lr': 0.00047055781738723063, 'samples': 4818240, 'steps': 25094, 'loss/train': 1.1860684156417847} -08/30/2021 17:41:02 - INFO - __main__ - Step 25096: {'lr': 0.0004705553188358096, 'samples': 4818432, 'steps': 25095, 'loss/train': 1.0877487659454346} -08/30/2021 17:41:02 - INFO - __main__ - Step 25097: {'lr': 0.00047055282018500976, 'samples': 4818624, 'steps': 25096, 'loss/train': 1.5303350687026978} -08/30/2021 17:41:03 - INFO - __main__ - Step 25098: {'lr': 0.0004705503214348323, 'samples': 4818816, 'steps': 25097, 'loss/train': 1.5555001497268677} -08/30/2021 17:41:03 - INFO - __main__ - Step 25099: {'lr': 0.0004705478225852782, 'samples': 4819008, 'steps': 25098, 'loss/train': 1.4041889905929565} -08/30/2021 17:41:03 - INFO - __main__ - Step 25100: {'lr': 0.0004705453236363486, 'samples': 4819200, 'steps': 25099, 'loss/train': 2.064286947250366} -08/30/2021 17:41:04 - INFO - __main__ - Step 25101: {'lr': 0.00047054282458804477, 'samples': 4819392, 'steps': 25100, 'loss/train': 1.1360825300216675} -08/30/2021 17:41:05 - INFO - __main__ - Step 25102: {'lr': 0.0004705403254403677, 'samples': 4819584, 'steps': 25101, 'loss/train': 1.521355152130127} -08/30/2021 17:41:06 - INFO - __main__ - Step 25103: {'lr': 0.0004705378261933186, 'samples': 4819776, 'steps': 25102, 'loss/train': 0.9425626993179321} -08/30/2021 17:41:06 - INFO - __main__ - Step 25104: {'lr': 0.0004705353268468985, 'samples': 4819968, 'steps': 25103, 'loss/train': 1.4939793348312378} -08/30/2021 17:41:06 - INFO - __main__ - Step 25105: {'lr': 0.00047053282740110863, 'samples': 4820160, 'steps': 25104, 'loss/train': 1.3788909912109375} -08/30/2021 17:41:07 - INFO - __main__ - Step 25106: {'lr': 0.00047053032785595005, 'samples': 4820352, 'steps': 25105, 'loss/train': 1.9078004360198975} -08/30/2021 17:41:09 - INFO - __main__ - Step 25107: {'lr': 0.0004705278282114239, 'samples': 4820544, 'steps': 25106, 'loss/train': 1.6420369148254395} -08/30/2021 17:41:09 - INFO - __main__ - Step 25108: {'lr': 0.0004705253284675314, 'samples': 4820736, 'steps': 25107, 'loss/train': 1.7942553758621216} -08/30/2021 17:41:09 - INFO - __main__ - Step 25109: {'lr': 0.00047052282862427355, 'samples': 4820928, 'steps': 25108, 'loss/train': 1.8953509330749512} -08/30/2021 17:41:10 - INFO - __main__ - Step 25110: {'lr': 0.0004705203286816514, 'samples': 4821120, 'steps': 25109, 'loss/train': 1.2782175540924072} -08/30/2021 17:41:10 - INFO - __main__ - Step 25111: {'lr': 0.0004705178286396663, 'samples': 4821312, 'steps': 25110, 'loss/train': 1.3305717706680298} -08/30/2021 17:41:10 - INFO - __main__ - Step 25112: {'lr': 0.0004705153284983192, 'samples': 4821504, 'steps': 25111, 'loss/train': 0.05513116344809532} -08/30/2021 17:41:12 - INFO - __main__ - Step 25113: {'lr': 0.00047051282825761145, 'samples': 4821696, 'steps': 25112, 'loss/train': 1.161117672920227} -08/30/2021 17:41:12 - INFO - __main__ - Step 25114: {'lr': 0.0004705103279175439, 'samples': 4821888, 'steps': 25113, 'loss/train': 1.6258196830749512} -08/30/2021 17:41:13 - INFO - __main__ - Step 25115: {'lr': 0.0004705078274781178, 'samples': 4822080, 'steps': 25114, 'loss/train': 1.7940661907196045} -08/30/2021 17:41:13 - INFO - __main__ - Step 25116: {'lr': 0.0004705053269393343, 'samples': 4822272, 'steps': 25115, 'loss/train': 0.8398537635803223} -08/30/2021 17:41:13 - INFO - __main__ - Step 25117: {'lr': 0.00047050282630119444, 'samples': 4822464, 'steps': 25116, 'loss/train': 1.5013272762298584} -08/30/2021 17:41:15 - INFO - __main__ - Step 25118: {'lr': 0.0004705003255636995, 'samples': 4822656, 'steps': 25117, 'loss/train': 1.9050203561782837} -08/30/2021 17:41:16 - INFO - __main__ - Step 25119: {'lr': 0.0004704978247268505, 'samples': 4822848, 'steps': 25118, 'loss/train': 0.638746440410614} -08/30/2021 17:41:16 - INFO - __main__ - Step 25120: {'lr': 0.0004704953237906485, 'samples': 4823040, 'steps': 25119, 'loss/train': 1.5404378175735474} -08/30/2021 17:41:17 - INFO - __main__ - Step 25121: {'lr': 0.0004704928227550949, 'samples': 4823232, 'steps': 25120, 'loss/train': 1.76178777217865} -08/30/2021 17:41:17 - INFO - __main__ - Step 25122: {'lr': 0.00047049032162019044, 'samples': 4823424, 'steps': 25121, 'loss/train': 1.4631903171539307} -08/30/2021 17:41:19 - INFO - __main__ - Step 25123: {'lr': 0.0004704878203859365, 'samples': 4823616, 'steps': 25122, 'loss/train': 0.8127224445343018} -08/30/2021 17:41:19 - INFO - __main__ - Step 25124: {'lr': 0.0004704853190523342, 'samples': 4823808, 'steps': 25123, 'loss/train': 1.4740229845046997} -08/30/2021 17:41:19 - INFO - __main__ - Step 25125: {'lr': 0.00047048281761938456, 'samples': 4824000, 'steps': 25124, 'loss/train': 1.1336865425109863} -08/30/2021 17:41:20 - INFO - __main__ - Step 25126: {'lr': 0.00047048031608708875, 'samples': 4824192, 'steps': 25125, 'loss/train': 1.0112028121948242} -08/30/2021 17:41:20 - INFO - __main__ - Step 25127: {'lr': 0.000470477814455448, 'samples': 4824384, 'steps': 25126, 'loss/train': 1.4916080236434937} -08/30/2021 17:41:22 - INFO - __main__ - Step 25128: {'lr': 0.0004704753127244633, 'samples': 4824576, 'steps': 25127, 'loss/train': 0.8901615142822266} -08/30/2021 17:41:22 - INFO - __main__ - Step 25129: {'lr': 0.0004704728108941358, 'samples': 4824768, 'steps': 25128, 'loss/train': 1.0653492212295532} -08/30/2021 17:41:22 - INFO - __main__ - Step 25130: {'lr': 0.00047047030896446665, 'samples': 4824960, 'steps': 25129, 'loss/train': 1.1029903888702393} -08/30/2021 17:41:23 - INFO - __main__ - Step 25131: {'lr': 0.000470467806935457, 'samples': 4825152, 'steps': 25130, 'loss/train': 1.9126156568527222} -08/30/2021 17:41:23 - INFO - __main__ - Step 25132: {'lr': 0.000470465304807108, 'samples': 4825344, 'steps': 25131, 'loss/train': 1.6000009775161743} -08/30/2021 17:41:25 - INFO - __main__ - Step 25133: {'lr': 0.00047046280257942067, 'samples': 4825536, 'steps': 25132, 'loss/train': 1.7084357738494873} -08/30/2021 17:41:25 - INFO - __main__ - Step 25134: {'lr': 0.0004704603002523962, 'samples': 4825728, 'steps': 25133, 'loss/train': 1.66991126537323} -08/30/2021 17:41:25 - INFO - __main__ - Step 25135: {'lr': 0.00047045779782603584, 'samples': 4825920, 'steps': 25134, 'loss/train': 1.288764476776123} -08/30/2021 17:41:26 - INFO - __main__ - Step 25136: {'lr': 0.0004704552953003405, 'samples': 4826112, 'steps': 25135, 'loss/train': 1.651648759841919} -08/30/2021 17:41:26 - INFO - __main__ - Step 25137: {'lr': 0.0004704527926753114, 'samples': 4826304, 'steps': 25136, 'loss/train': 2.0784590244293213} -08/30/2021 17:41:28 - INFO - __main__ - Step 25138: {'lr': 0.00047045028995094967, 'samples': 4826496, 'steps': 25137, 'loss/train': 1.7070115804672241} -08/30/2021 17:41:28 - INFO - __main__ - Step 25139: {'lr': 0.0004704477871272564, 'samples': 4826688, 'steps': 25138, 'loss/train': 1.3351141214370728} -08/30/2021 17:41:28 - INFO - __main__ - Step 25140: {'lr': 0.0004704452842042329, 'samples': 4826880, 'steps': 25139, 'loss/train': 1.4742670059204102} -08/30/2021 17:41:29 - INFO - __main__ - Step 25141: {'lr': 0.00047044278118188004, 'samples': 4827072, 'steps': 25140, 'loss/train': 1.3778868913650513} -08/30/2021 17:41:29 - INFO - __main__ - Step 25142: {'lr': 0.00047044027806019914, 'samples': 4827264, 'steps': 25141, 'loss/train': 1.4661959409713745} -08/30/2021 17:41:31 - INFO - __main__ - Step 25143: {'lr': 0.0004704377748391912, 'samples': 4827456, 'steps': 25142, 'loss/train': 2.056394577026367} -08/30/2021 17:41:31 - INFO - __main__ - Step 25144: {'lr': 0.0004704352715188574, 'samples': 4827648, 'steps': 25143, 'loss/train': 1.6076358556747437} -08/30/2021 17:41:31 - INFO - __main__ - Step 25145: {'lr': 0.0004704327680991989, 'samples': 4827840, 'steps': 25144, 'loss/train': 1.732292890548706} -08/30/2021 17:41:32 - INFO - __main__ - Step 25146: {'lr': 0.00047043026458021677, 'samples': 4828032, 'steps': 25145, 'loss/train': 1.7129887342453003} -08/30/2021 17:41:32 - INFO - __main__ - Step 25147: {'lr': 0.0004704277609619122, 'samples': 4828224, 'steps': 25146, 'loss/train': 1.8288956880569458} -08/30/2021 17:41:34 - INFO - __main__ - Step 25148: {'lr': 0.0004704252572442862, 'samples': 4828416, 'steps': 25147, 'loss/train': 0.5143375992774963} -08/30/2021 17:41:34 - INFO - __main__ - Step 25149: {'lr': 0.00047042275342734006, 'samples': 4828608, 'steps': 25148, 'loss/train': 1.0501458644866943} -08/30/2021 17:41:35 - INFO - __main__ - Step 25150: {'lr': 0.0004704202495110748, 'samples': 4828800, 'steps': 25149, 'loss/train': 0.18096794188022614} -08/30/2021 17:41:35 - INFO - __main__ - Step 25151: {'lr': 0.00047041774549549156, 'samples': 4828992, 'steps': 25150, 'loss/train': 0.6156520843505859} -08/30/2021 17:41:35 - INFO - __main__ - Step 25152: {'lr': 0.00047041524138059153, 'samples': 4829184, 'steps': 25151, 'loss/train': 1.241715908050537} -08/30/2021 17:41:36 - INFO - __main__ - Step 25153: {'lr': 0.00047041273716637576, 'samples': 4829376, 'steps': 25152, 'loss/train': 1.6219685077667236} -08/30/2021 17:41:37 - INFO - __main__ - Step 25154: {'lr': 0.00047041023285284545, 'samples': 4829568, 'steps': 25153, 'loss/train': 1.4883368015289307} -08/30/2021 17:41:37 - INFO - __main__ - Step 25155: {'lr': 0.0004704077284400017, 'samples': 4829760, 'steps': 25154, 'loss/train': 1.6693414449691772} -08/30/2021 17:41:38 - INFO - __main__ - Step 25156: {'lr': 0.0004704052239278456, 'samples': 4829952, 'steps': 25155, 'loss/train': 1.5799920558929443} -08/30/2021 17:41:38 - INFO - __main__ - Step 25157: {'lr': 0.00047040271931637824, 'samples': 4830144, 'steps': 25156, 'loss/train': 1.7024641036987305} -08/30/2021 17:41:38 - INFO - __main__ - Step 25158: {'lr': 0.0004704002146056009, 'samples': 4830336, 'steps': 25157, 'loss/train': 1.5750199556350708} -08/30/2021 17:41:40 - INFO - __main__ - Step 25159: {'lr': 0.0004703977097955146, 'samples': 4830528, 'steps': 25158, 'loss/train': 1.4540636539459229} -08/30/2021 17:41:41 - INFO - __main__ - Step 25160: {'lr': 0.0004703952048861204, 'samples': 4830720, 'steps': 25159, 'loss/train': 1.2269320487976074} -08/30/2021 17:41:41 - INFO - __main__ - Step 25161: {'lr': 0.00047039269987741967, 'samples': 4830912, 'steps': 25160, 'loss/train': 1.3916511535644531} -08/30/2021 17:41:41 - INFO - __main__ - Step 25162: {'lr': 0.0004703901947694134, 'samples': 4831104, 'steps': 25161, 'loss/train': 1.8600291013717651} -08/30/2021 17:41:42 - INFO - __main__ - Step 25163: {'lr': 0.0004703876895621025, 'samples': 4831296, 'steps': 25162, 'loss/train': 1.2141042947769165} -08/30/2021 17:41:43 - INFO - __main__ - Step 25164: {'lr': 0.0004703851842554885, 'samples': 4831488, 'steps': 25163, 'loss/train': 1.958831787109375} -08/30/2021 17:41:44 - INFO - __main__ - Step 25165: {'lr': 0.0004703826788495723, 'samples': 4831680, 'steps': 25164, 'loss/train': 1.3399730920791626} -08/30/2021 17:41:44 - INFO - __main__ - Step 25166: {'lr': 0.00047038017334435504, 'samples': 4831872, 'steps': 25165, 'loss/train': 0.9132199883460999} -08/30/2021 17:41:44 - INFO - __main__ - Step 25167: {'lr': 0.00047037766773983794, 'samples': 4832064, 'steps': 25166, 'loss/train': 1.8331776857376099} -08/30/2021 17:41:45 - INFO - __main__ - Step 25168: {'lr': 0.00047037516203602195, 'samples': 4832256, 'steps': 25167, 'loss/train': 1.5712714195251465} -08/30/2021 17:41:46 - INFO - __main__ - Step 25169: {'lr': 0.0004703726562329084, 'samples': 4832448, 'steps': 25168, 'loss/train': 1.8494906425476074} -08/30/2021 17:41:47 - INFO - __main__ - Step 25170: {'lr': 0.0004703701503304983, 'samples': 4832640, 'steps': 25169, 'loss/train': 0.22215215861797333} -08/30/2021 17:41:47 - INFO - __main__ - Step 25171: {'lr': 0.0004703676443287928, 'samples': 4832832, 'steps': 25170, 'loss/train': 1.6323357820510864} -08/30/2021 17:41:47 - INFO - __main__ - Step 25172: {'lr': 0.000470365138227793, 'samples': 4833024, 'steps': 25171, 'loss/train': 0.9610714912414551} -08/30/2021 17:41:48 - INFO - __main__ - Step 25173: {'lr': 0.0004703626320275002, 'samples': 4833216, 'steps': 25172, 'loss/train': 1.2970154285430908} -08/30/2021 17:41:48 - INFO - __main__ - Step 25174: {'lr': 0.0004703601257279153, 'samples': 4833408, 'steps': 25173, 'loss/train': 2.189345598220825} -08/30/2021 17:41:50 - INFO - __main__ - Step 25175: {'lr': 0.0004703576193290395, 'samples': 4833600, 'steps': 25174, 'loss/train': 1.9523824453353882} -08/30/2021 17:41:51 - INFO - __main__ - Step 25176: {'lr': 0.0004703551128308741, 'samples': 4833792, 'steps': 25175, 'loss/train': 1.7613623142242432} -08/30/2021 17:41:51 - INFO - __main__ - Step 25177: {'lr': 0.00047035260623341996, 'samples': 4833984, 'steps': 25176, 'loss/train': 1.345569133758545} -08/30/2021 17:41:51 - INFO - __main__ - Step 25178: {'lr': 0.0004703500995366784, 'samples': 4834176, 'steps': 25177, 'loss/train': 1.8932678699493408} -08/30/2021 17:41:52 - INFO - __main__ - Step 25179: {'lr': 0.00047034759274065043, 'samples': 4834368, 'steps': 25178, 'loss/train': 1.2226879596710205} -08/30/2021 17:41:53 - INFO - __main__ - Step 25180: {'lr': 0.00047034508584533724, 'samples': 4834560, 'steps': 25179, 'loss/train': 1.2147520780563354} -08/30/2021 17:41:53 - INFO - __main__ - Step 25181: {'lr': 0.00047034257885074, 'samples': 4834752, 'steps': 25180, 'loss/train': 1.4377487897872925} -08/30/2021 17:41:54 - INFO - __main__ - Step 25182: {'lr': 0.00047034007175685976, 'samples': 4834944, 'steps': 25181, 'loss/train': 1.7231919765472412} -08/30/2021 17:41:54 - INFO - __main__ - Step 25183: {'lr': 0.0004703375645636977, 'samples': 4835136, 'steps': 25182, 'loss/train': 1.3159558773040771} -08/30/2021 17:41:54 - INFO - __main__ - Step 25184: {'lr': 0.0004703350572712549, 'samples': 4835328, 'steps': 25183, 'loss/train': 1.1757681369781494} -08/30/2021 17:41:56 - INFO - __main__ - Step 25185: {'lr': 0.00047033254987953254, 'samples': 4835520, 'steps': 25184, 'loss/train': 1.2443501949310303} -08/30/2021 17:41:57 - INFO - __main__ - Step 25186: {'lr': 0.0004703300423885318, 'samples': 4835712, 'steps': 25185, 'loss/train': 1.4792664051055908} -08/30/2021 17:41:57 - INFO - __main__ - Step 25187: {'lr': 0.0004703275347982536, 'samples': 4835904, 'steps': 25186, 'loss/train': 1.8373013734817505} -08/30/2021 17:41:57 - INFO - __main__ - Step 25188: {'lr': 0.00047032502710869935, 'samples': 4836096, 'steps': 25187, 'loss/train': 1.3806008100509644} -08/30/2021 17:41:58 - INFO - __main__ - Step 25189: {'lr': 0.00047032251931987, 'samples': 4836288, 'steps': 25188, 'loss/train': 1.3953410387039185} -08/30/2021 17:42:00 - INFO - __main__ - Step 25190: {'lr': 0.0004703200114317667, 'samples': 4836480, 'steps': 25189, 'loss/train': 1.228415608406067} -08/30/2021 17:42:00 - INFO - __main__ - Step 25191: {'lr': 0.0004703175034443906, 'samples': 4836672, 'steps': 25190, 'loss/train': 1.8546063899993896} -08/30/2021 17:42:00 - INFO - __main__ - Step 25192: {'lr': 0.00047031499535774284, 'samples': 4836864, 'steps': 25191, 'loss/train': 1.718413233757019} -08/30/2021 17:42:01 - INFO - __main__ - Step 25193: {'lr': 0.00047031248717182455, 'samples': 4837056, 'steps': 25192, 'loss/train': 1.4340121746063232} -08/30/2021 17:42:01 - INFO - __main__ - Step 25194: {'lr': 0.00047030997888663687, 'samples': 4837248, 'steps': 25193, 'loss/train': 0.7193629145622253} -08/30/2021 17:42:01 - INFO - __main__ - Step 25195: {'lr': 0.00047030747050218094, 'samples': 4837440, 'steps': 25194, 'loss/train': 1.7720571756362915} -08/30/2021 17:42:02 - INFO - __main__ - Step 25196: {'lr': 0.0004703049620184578, 'samples': 4837632, 'steps': 25195, 'loss/train': 1.7892900705337524} -08/30/2021 17:42:03 - INFO - __main__ - Step 25197: {'lr': 0.0004703024534354686, 'samples': 4837824, 'steps': 25196, 'loss/train': 2.4770662784576416} -08/30/2021 17:42:04 - INFO - __main__ - Step 25198: {'lr': 0.0004702999447532146, 'samples': 4838016, 'steps': 25197, 'loss/train': 1.5416127443313599} -08/30/2021 17:42:04 - INFO - __main__ - Step 25199: {'lr': 0.00047029743597169684, 'samples': 4838208, 'steps': 25198, 'loss/train': 1.4073939323425293} -08/30/2021 17:42:04 - INFO - __main__ - Step 25200: {'lr': 0.0004702949270909164, 'samples': 4838400, 'steps': 25199, 'loss/train': 1.692219614982605} -08/30/2021 17:42:05 - INFO - __main__ - Step 25201: {'lr': 0.0004702924181108745, 'samples': 4838592, 'steps': 25200, 'loss/train': 1.675784945487976} -08/30/2021 17:42:06 - INFO - __main__ - Step 25202: {'lr': 0.00047028990903157233, 'samples': 4838784, 'steps': 25201, 'loss/train': 1.6392043828964233} -08/30/2021 17:42:07 - INFO - __main__ - Step 25203: {'lr': 0.0004702873998530108, 'samples': 4838976, 'steps': 25202, 'loss/train': 1.324642300605774} -08/30/2021 17:42:07 - INFO - __main__ - Step 25204: {'lr': 0.0004702848905751912, 'samples': 4839168, 'steps': 25203, 'loss/train': 1.2755097150802612} -08/30/2021 17:42:08 - INFO - __main__ - Step 25205: {'lr': 0.0004702823811981146, 'samples': 4839360, 'steps': 25204, 'loss/train': 0.1903872936964035} -08/30/2021 17:42:08 - INFO - __main__ - Step 25206: {'lr': 0.0004702798717217822, 'samples': 4839552, 'steps': 25205, 'loss/train': 1.8723169565200806} -08/30/2021 17:42:09 - INFO - __main__ - Step 25207: {'lr': 0.0004702773621461951, 'samples': 4839744, 'steps': 25206, 'loss/train': 1.4872665405273438} -08/30/2021 17:42:10 - INFO - __main__ - Step 25208: {'lr': 0.0004702748524713544, 'samples': 4839936, 'steps': 25207, 'loss/train': 1.4404301643371582} -08/30/2021 17:42:10 - INFO - __main__ - Step 25209: {'lr': 0.00047027234269726123, 'samples': 4840128, 'steps': 25208, 'loss/train': 1.5485769510269165} -08/30/2021 17:42:11 - INFO - __main__ - Step 25210: {'lr': 0.0004702698328239167, 'samples': 4840320, 'steps': 25209, 'loss/train': 1.690459132194519} -08/30/2021 17:42:11 - INFO - __main__ - Step 25211: {'lr': 0.0004702673228513221, 'samples': 4840512, 'steps': 25210, 'loss/train': 1.505952000617981} -08/30/2021 17:42:12 - INFO - __main__ - Step 25212: {'lr': 0.00047026481277947835, 'samples': 4840704, 'steps': 25211, 'loss/train': 1.7400099039077759} -08/30/2021 17:42:13 - INFO - __main__ - Step 25213: {'lr': 0.0004702623026083867, 'samples': 4840896, 'steps': 25212, 'loss/train': 1.3989006280899048} -08/30/2021 17:42:13 - INFO - __main__ - Step 25214: {'lr': 0.00047025979233804825, 'samples': 4841088, 'steps': 25213, 'loss/train': 1.509686827659607} -08/30/2021 17:42:14 - INFO - __main__ - Step 25215: {'lr': 0.00047025728196846417, 'samples': 4841280, 'steps': 25214, 'loss/train': 1.5531995296478271} -08/30/2021 17:42:14 - INFO - __main__ - Step 25216: {'lr': 0.0004702547714996355, 'samples': 4841472, 'steps': 25215, 'loss/train': 1.4401838779449463} -08/30/2021 17:42:15 - INFO - __main__ - Step 25217: {'lr': 0.00047025226093156346, 'samples': 4841664, 'steps': 25216, 'loss/train': 1.3402336835861206} -08/30/2021 17:42:16 - INFO - __main__ - Step 25218: {'lr': 0.0004702497502642492, 'samples': 4841856, 'steps': 25217, 'loss/train': 1.020683765411377} -08/30/2021 17:42:16 - INFO - __main__ - Step 25219: {'lr': 0.0004702472394976938, 'samples': 4842048, 'steps': 25218, 'loss/train': 1.6742174625396729} -08/30/2021 17:42:17 - INFO - __main__ - Step 25220: {'lr': 0.0004702447286318983, 'samples': 4842240, 'steps': 25219, 'loss/train': 1.570212721824646} -08/30/2021 17:42:17 - INFO - __main__ - Step 25221: {'lr': 0.0004702422176668639, 'samples': 4842432, 'steps': 25220, 'loss/train': 1.4703494310379028} -08/30/2021 17:42:18 - INFO - __main__ - Step 25222: {'lr': 0.00047023970660259193, 'samples': 4842624, 'steps': 25221, 'loss/train': 1.8031941652297974} -08/30/2021 17:42:19 - INFO - __main__ - Step 25223: {'lr': 0.0004702371954390832, 'samples': 4842816, 'steps': 25222, 'loss/train': 1.4215047359466553} -08/30/2021 17:42:19 - INFO - __main__ - Step 25224: {'lr': 0.00047023468417633905, 'samples': 4843008, 'steps': 25223, 'loss/train': 0.1384240835905075} -08/30/2021 17:42:20 - INFO - __main__ - Step 25225: {'lr': 0.0004702321728143605, 'samples': 4843200, 'steps': 25224, 'loss/train': 1.4457356929779053} -08/30/2021 17:42:20 - INFO - __main__ - Step 25226: {'lr': 0.0004702296613531488, 'samples': 4843392, 'steps': 25225, 'loss/train': 1.6307753324508667} -08/30/2021 17:42:20 - INFO - __main__ - Step 25227: {'lr': 0.00047022714979270497, 'samples': 4843584, 'steps': 25226, 'loss/train': 1.2742396593093872} -08/30/2021 17:42:22 - INFO - __main__ - Step 25228: {'lr': 0.0004702246381330302, 'samples': 4843776, 'steps': 25227, 'loss/train': 1.5508121252059937} -08/30/2021 17:42:23 - INFO - __main__ - Step 25229: {'lr': 0.00047022212637412553, 'samples': 4843968, 'steps': 25228, 'loss/train': 1.4460803270339966} -08/30/2021 17:42:23 - INFO - __main__ - Step 25230: {'lr': 0.00047021961451599226, 'samples': 4844160, 'steps': 25229, 'loss/train': 1.8290355205535889} -08/30/2021 17:42:24 - INFO - __main__ - Step 25231: {'lr': 0.00047021710255863144, 'samples': 4844352, 'steps': 25230, 'loss/train': 1.8114560842514038} -08/30/2021 17:42:24 - INFO - __main__ - Step 25232: {'lr': 0.0004702145905020442, 'samples': 4844544, 'steps': 25231, 'loss/train': 1.5833290815353394} -08/30/2021 17:42:26 - INFO - __main__ - Step 25233: {'lr': 0.0004702120783462316, 'samples': 4844736, 'steps': 25232, 'loss/train': 1.5759029388427734} -08/30/2021 17:42:26 - INFO - __main__ - Step 25234: {'lr': 0.00047020956609119483, 'samples': 4844928, 'steps': 25233, 'loss/train': 1.5939463376998901} -08/30/2021 17:42:27 - INFO - __main__ - Step 25235: {'lr': 0.0004702070537369351, 'samples': 4845120, 'steps': 25234, 'loss/train': 1.4793111085891724} -08/30/2021 17:42:27 - INFO - __main__ - Step 25236: {'lr': 0.00047020454128345333, 'samples': 4845312, 'steps': 25235, 'loss/train': 1.8605574369430542} -08/30/2021 17:42:27 - INFO - __main__ - Step 25237: {'lr': 0.00047020202873075093, 'samples': 4845504, 'steps': 25236, 'loss/train': 1.7368876934051514} -08/30/2021 17:42:29 - INFO - __main__ - Step 25238: {'lr': 0.00047019951607882884, 'samples': 4845696, 'steps': 25237, 'loss/train': 1.234832525253296} -08/30/2021 17:42:29 - INFO - __main__ - Step 25239: {'lr': 0.0004701970033276882, 'samples': 4845888, 'steps': 25238, 'loss/train': 1.7299489974975586} -08/30/2021 17:42:30 - INFO - __main__ - Step 25240: {'lr': 0.0004701944904773303, 'samples': 4846080, 'steps': 25239, 'loss/train': 1.5737006664276123} -08/30/2021 17:42:30 - INFO - __main__ - Step 25241: {'lr': 0.0004701919775277561, 'samples': 4846272, 'steps': 25240, 'loss/train': 1.537653923034668} -08/30/2021 17:42:30 - INFO - __main__ - Step 25242: {'lr': 0.0004701894644789668, 'samples': 4846464, 'steps': 25241, 'loss/train': 1.1209821701049805} -08/30/2021 17:42:31 - INFO - __main__ - Step 25243: {'lr': 0.0004701869513309635, 'samples': 4846656, 'steps': 25242, 'loss/train': 2.0428268909454346} -08/30/2021 17:42:32 - INFO - __main__ - Step 25244: {'lr': 0.0004701844380837474, 'samples': 4846848, 'steps': 25243, 'loss/train': 1.5601223707199097} -08/30/2021 17:42:33 - INFO - __main__ - Step 25245: {'lr': 0.00047018192473731956, 'samples': 4847040, 'steps': 25244, 'loss/train': 1.5865105390548706} -08/30/2021 17:42:33 - INFO - __main__ - Step 25246: {'lr': 0.0004701794112916812, 'samples': 4847232, 'steps': 25245, 'loss/train': 1.503543496131897} -08/30/2021 17:42:34 - INFO - __main__ - Step 25247: {'lr': 0.00047017689774683325, 'samples': 4847424, 'steps': 25246, 'loss/train': 0.28209388256073} -08/30/2021 17:42:34 - INFO - __main__ - Step 25248: {'lr': 0.0004701743841027771, 'samples': 4847616, 'steps': 25247, 'loss/train': 0.06271487474441528} -08/30/2021 17:42:34 - INFO - __main__ - Step 25249: {'lr': 0.0004701718703595138, 'samples': 4847808, 'steps': 25248, 'loss/train': 2.7639365196228027} -08/30/2021 17:42:36 - INFO - __main__ - Step 25250: {'lr': 0.0004701693565170444, 'samples': 4848000, 'steps': 25249, 'loss/train': 1.5656744241714478} -08/30/2021 17:42:36 - INFO - __main__ - Step 25251: {'lr': 0.0004701668425753701, 'samples': 4848192, 'steps': 25250, 'loss/train': 1.3499870300292969} -08/30/2021 17:42:37 - INFO - __main__ - Step 25252: {'lr': 0.000470164328534492, 'samples': 4848384, 'steps': 25251, 'loss/train': 1.202694296836853} -08/30/2021 17:42:37 - INFO - __main__ - Step 25253: {'lr': 0.00047016181439441126, 'samples': 4848576, 'steps': 25252, 'loss/train': 1.1313468217849731} -08/30/2021 17:42:37 - INFO - __main__ - Step 25254: {'lr': 0.000470159300155129, 'samples': 4848768, 'steps': 25253, 'loss/train': 1.4647761583328247} -08/30/2021 17:42:39 - INFO - __main__ - Step 25255: {'lr': 0.00047015678581664635, 'samples': 4848960, 'steps': 25254, 'loss/train': 1.358678936958313} -08/30/2021 17:42:39 - INFO - __main__ - Step 25256: {'lr': 0.00047015427137896446, 'samples': 4849152, 'steps': 25255, 'loss/train': 1.532971978187561} -08/30/2021 17:42:40 - INFO - __main__ - Step 25257: {'lr': 0.0004701517568420844, 'samples': 4849344, 'steps': 25256, 'loss/train': 1.8707044124603271} -08/30/2021 17:42:40 - INFO - __main__ - Step 25258: {'lr': 0.0004701492422060074, 'samples': 4849536, 'steps': 25257, 'loss/train': 1.8581136465072632} -08/30/2021 17:42:40 - INFO - __main__ - Step 25259: {'lr': 0.0004701467274707346, 'samples': 4849728, 'steps': 25258, 'loss/train': 1.7593551874160767} -08/30/2021 17:42:42 - INFO - __main__ - Step 25260: {'lr': 0.0004701442126362671, 'samples': 4849920, 'steps': 25259, 'loss/train': 1.5137451887130737} -08/30/2021 17:42:42 - INFO - __main__ - Step 25261: {'lr': 0.0004701416977026059, 'samples': 4850112, 'steps': 25260, 'loss/train': 1.8200294971466064} -08/30/2021 17:42:43 - INFO - __main__ - Step 25262: {'lr': 0.0004701391826697523, 'samples': 4850304, 'steps': 25261, 'loss/train': 1.3076450824737549} -08/30/2021 17:42:43 - INFO - __main__ - Step 25263: {'lr': 0.00047013666753770736, 'samples': 4850496, 'steps': 25262, 'loss/train': 1.9197431802749634} -08/30/2021 17:42:43 - INFO - __main__ - Step 25264: {'lr': 0.00047013415230647227, 'samples': 4850688, 'steps': 25263, 'loss/train': 1.3357831239700317} -08/30/2021 17:42:44 - INFO - __main__ - Step 25265: {'lr': 0.0004701316369760481, 'samples': 4850880, 'steps': 25264, 'loss/train': 1.7137293815612793} -08/30/2021 17:42:45 - INFO - __main__ - Step 25266: {'lr': 0.00047012912154643607, 'samples': 4851072, 'steps': 25265, 'loss/train': 1.2234370708465576} -08/30/2021 17:42:46 - INFO - __main__ - Step 25267: {'lr': 0.0004701266060176372, 'samples': 4851264, 'steps': 25266, 'loss/train': 1.6347157955169678} -08/30/2021 17:42:46 - INFO - __main__ - Step 25268: {'lr': 0.00047012409038965267, 'samples': 4851456, 'steps': 25267, 'loss/train': 0.9743822813034058} -08/30/2021 17:42:47 - INFO - __main__ - Step 25269: {'lr': 0.0004701215746624836, 'samples': 4851648, 'steps': 25268, 'loss/train': 1.2258555889129639} -08/30/2021 17:42:47 - INFO - __main__ - Step 25270: {'lr': 0.0004701190588361312, 'samples': 4851840, 'steps': 25269, 'loss/train': 1.1441996097564697} -08/30/2021 17:42:48 - INFO - __main__ - Step 25271: {'lr': 0.0004701165429105966, 'samples': 4852032, 'steps': 25270, 'loss/train': 1.479071021080017} -08/30/2021 17:42:49 - INFO - __main__ - Step 25272: {'lr': 0.0004701140268858808, 'samples': 4852224, 'steps': 25271, 'loss/train': 1.2729097604751587} -08/30/2021 17:42:49 - INFO - __main__ - Step 25273: {'lr': 0.000470111510761985, 'samples': 4852416, 'steps': 25272, 'loss/train': 1.414404273033142} -08/30/2021 17:42:49 - INFO - __main__ - Step 25274: {'lr': 0.0004701089945389104, 'samples': 4852608, 'steps': 25273, 'loss/train': 1.2719674110412598} -08/30/2021 17:42:50 - INFO - __main__ - Step 25275: {'lr': 0.00047010647821665803, 'samples': 4852800, 'steps': 25274, 'loss/train': 1.6211355924606323} -08/30/2021 17:42:52 - INFO - __main__ - Step 25276: {'lr': 0.0004701039617952291, 'samples': 4852992, 'steps': 25275, 'loss/train': 1.2120165824890137} -08/30/2021 17:42:52 - INFO - __main__ - Step 25277: {'lr': 0.00047010144527462474, 'samples': 4853184, 'steps': 25276, 'loss/train': 1.619185209274292} -08/30/2021 17:42:53 - INFO - __main__ - Step 25278: {'lr': 0.00047009892865484607, 'samples': 4853376, 'steps': 25277, 'loss/train': 1.2005964517593384} -08/30/2021 17:42:53 - INFO - __main__ - Step 25279: {'lr': 0.00047009641193589423, 'samples': 4853568, 'steps': 25278, 'loss/train': 1.9050300121307373} -08/30/2021 17:42:53 - INFO - __main__ - Step 25280: {'lr': 0.00047009389511777036, 'samples': 4853760, 'steps': 25279, 'loss/train': 1.250523328781128} -08/30/2021 17:42:54 - INFO - __main__ - Step 25281: {'lr': 0.0004700913782004755, 'samples': 4853952, 'steps': 25280, 'loss/train': 0.06701329350471497} -08/30/2021 17:42:56 - INFO - __main__ - Step 25282: {'lr': 0.00047008886118401084, 'samples': 4854144, 'steps': 25281, 'loss/train': 0.11463990062475204} -08/30/2021 17:42:57 - INFO - __main__ - Step 25283: {'lr': 0.0004700863440683776, 'samples': 4854336, 'steps': 25282, 'loss/train': 1.488193392753601} -08/30/2021 17:42:57 - INFO - __main__ - Step 25284: {'lr': 0.00047008382685357686, 'samples': 4854528, 'steps': 25283, 'loss/train': 1.741093635559082} -08/30/2021 17:42:58 - INFO - __main__ - Step 25285: {'lr': 0.0004700813095396098, 'samples': 4854720, 'steps': 25284, 'loss/train': 0.9684827327728271} -08/30/2021 17:42:58 - INFO - __main__ - Step 25286: {'lr': 0.00047007879212647744, 'samples': 4854912, 'steps': 25285, 'loss/train': 2.1591384410858154} -08/30/2021 17:42:58 - INFO - __main__ - Step 25287: {'lr': 0.0004700762746141809, 'samples': 4855104, 'steps': 25286, 'loss/train': 0.5560943484306335} -08/30/2021 17:42:59 - INFO - __main__ - Step 25288: {'lr': 0.0004700737570027214, 'samples': 4855296, 'steps': 25287, 'loss/train': 0.5318044424057007} -08/30/2021 17:43:00 - INFO - __main__ - Step 25289: {'lr': 0.00047007123929210015, 'samples': 4855488, 'steps': 25288, 'loss/train': 1.8834632635116577} -08/30/2021 17:43:01 - INFO - __main__ - Step 25290: {'lr': 0.00047006872148231814, 'samples': 4855680, 'steps': 25289, 'loss/train': 1.5034270286560059} -08/30/2021 17:43:01 - INFO - __main__ - Step 25291: {'lr': 0.0004700662035733766, 'samples': 4855872, 'steps': 25290, 'loss/train': 1.0896543264389038} -08/30/2021 17:43:01 - INFO - __main__ - Step 25292: {'lr': 0.0004700636855652766, 'samples': 4856064, 'steps': 25291, 'loss/train': 1.7092068195343018} -08/30/2021 17:43:02 - INFO - __main__ - Step 25293: {'lr': 0.0004700611674580193, 'samples': 4856256, 'steps': 25292, 'loss/train': 1.38180410861969} -08/30/2021 17:43:03 - INFO - __main__ - Step 25294: {'lr': 0.0004700586492516058, 'samples': 4856448, 'steps': 25293, 'loss/train': 1.4817906618118286} -08/30/2021 17:43:04 - INFO - __main__ - Step 25295: {'lr': 0.00047005613094603727, 'samples': 4856640, 'steps': 25294, 'loss/train': 1.761993169784546} -08/30/2021 17:43:04 - INFO - __main__ - Step 25296: {'lr': 0.0004700536125413149, 'samples': 4856832, 'steps': 25295, 'loss/train': 1.5468003749847412} -08/30/2021 17:43:04 - INFO - __main__ - Step 25297: {'lr': 0.00047005109403743976, 'samples': 4857024, 'steps': 25296, 'loss/train': 1.3205429315567017} -08/30/2021 17:43:05 - INFO - __main__ - Step 25298: {'lr': 0.00047004857543441294, 'samples': 4857216, 'steps': 25297, 'loss/train': 1.649469256401062} -08/30/2021 17:43:06 - INFO - __main__ - Step 25299: {'lr': 0.00047004605673223567, 'samples': 4857408, 'steps': 25298, 'loss/train': 1.7398124933242798} -08/30/2021 17:43:07 - INFO - __main__ - Step 25300: {'lr': 0.00047004353793090903, 'samples': 4857600, 'steps': 25299, 'loss/train': 1.5071388483047485} -08/30/2021 17:43:07 - INFO - __main__ - Step 25301: {'lr': 0.00047004101903043416, 'samples': 4857792, 'steps': 25300, 'loss/train': 2.0160562992095947} -08/30/2021 17:43:07 - INFO - __main__ - Step 25302: {'lr': 0.00047003850003081215, 'samples': 4857984, 'steps': 25301, 'loss/train': 1.5995603799819946} -08/30/2021 17:43:08 - INFO - __main__ - Step 25303: {'lr': 0.0004700359809320443, 'samples': 4858176, 'steps': 25302, 'loss/train': 1.3620502948760986} -08/30/2021 17:43:09 - INFO - __main__ - Step 25304: {'lr': 0.0004700334617341316, 'samples': 4858368, 'steps': 25303, 'loss/train': 1.541378378868103} -08/30/2021 17:43:10 - INFO - __main__ - Step 25305: {'lr': 0.0004700309424370752, 'samples': 4858560, 'steps': 25304, 'loss/train': 1.3634676933288574} -08/30/2021 17:43:10 - INFO - __main__ - Step 25306: {'lr': 0.00047002842304087625, 'samples': 4858752, 'steps': 25305, 'loss/train': 1.8207916021347046} -08/30/2021 17:43:10 - INFO - __main__ - Step 25307: {'lr': 0.00047002590354553586, 'samples': 4858944, 'steps': 25306, 'loss/train': 1.3307744264602661} -08/30/2021 17:43:11 - INFO - __main__ - Step 25308: {'lr': 0.00047002338395105527, 'samples': 4859136, 'steps': 25307, 'loss/train': 1.7076677083969116} -08/30/2021 17:43:12 - INFO - __main__ - Step 25309: {'lr': 0.00047002086425743545, 'samples': 4859328, 'steps': 25308, 'loss/train': 1.6849370002746582} -08/30/2021 17:43:13 - INFO - __main__ - Step 25310: {'lr': 0.0004700183444646776, 'samples': 4859520, 'steps': 25309, 'loss/train': 1.9664829969406128} -08/30/2021 17:43:13 - INFO - __main__ - Step 25311: {'lr': 0.000470015824572783, 'samples': 4859712, 'steps': 25310, 'loss/train': 1.1894611120224} -08/30/2021 17:43:13 - INFO - __main__ - Step 25312: {'lr': 0.00047001330458175264, 'samples': 4859904, 'steps': 25311, 'loss/train': 1.2179572582244873} -08/30/2021 17:43:14 - INFO - __main__ - Step 25313: {'lr': 0.0004700107844915876, 'samples': 4860096, 'steps': 25312, 'loss/train': 1.4157882928848267} -08/30/2021 17:43:15 - INFO - __main__ - Step 25314: {'lr': 0.00047000826430228915, 'samples': 4860288, 'steps': 25313, 'loss/train': 1.395578145980835} -08/30/2021 17:43:16 - INFO - __main__ - Step 25315: {'lr': 0.00047000574401385835, 'samples': 4860480, 'steps': 25314, 'loss/train': 1.1564863920211792} -08/30/2021 17:43:16 - INFO - __main__ - Step 25316: {'lr': 0.0004700032236262964, 'samples': 4860672, 'steps': 25315, 'loss/train': 1.2295942306518555} -08/30/2021 17:43:16 - INFO - __main__ - Step 25317: {'lr': 0.00047000070313960436, 'samples': 4860864, 'steps': 25316, 'loss/train': 1.541870355606079} -08/30/2021 17:43:17 - INFO - __main__ - Step 25318: {'lr': 0.00046999818255378335, 'samples': 4861056, 'steps': 25317, 'loss/train': 1.2594361305236816} -08/30/2021 17:43:17 - INFO - __main__ - Step 25319: {'lr': 0.00046999566186883466, 'samples': 4861248, 'steps': 25318, 'loss/train': 1.2627118825912476} -08/30/2021 17:43:19 - INFO - __main__ - Step 25320: {'lr': 0.0004699931410847592, 'samples': 4861440, 'steps': 25319, 'loss/train': 2.373678684234619} -08/30/2021 17:43:19 - INFO - __main__ - Step 25321: {'lr': 0.00046999062020155834, 'samples': 4861632, 'steps': 25320, 'loss/train': 1.7835915088653564} -08/30/2021 17:43:19 - INFO - __main__ - Step 25322: {'lr': 0.00046998809921923305, 'samples': 4861824, 'steps': 25321, 'loss/train': 1.5494893789291382} -08/30/2021 17:43:20 - INFO - __main__ - Step 25323: {'lr': 0.0004699855781377845, 'samples': 4862016, 'steps': 25322, 'loss/train': 1.909134030342102} -08/30/2021 17:43:20 - INFO - __main__ - Step 25324: {'lr': 0.0004699830569572139, 'samples': 4862208, 'steps': 25323, 'loss/train': 1.4210063219070435} -08/30/2021 17:43:22 - INFO - __main__ - Step 25325: {'lr': 0.00046998053567752225, 'samples': 4862400, 'steps': 25324, 'loss/train': 1.3654412031173706} -08/30/2021 17:43:22 - INFO - __main__ - Step 25326: {'lr': 0.0004699780142987108, 'samples': 4862592, 'steps': 25325, 'loss/train': 1.767876386642456} -08/30/2021 17:43:23 - INFO - __main__ - Step 25327: {'lr': 0.0004699754928207807, 'samples': 4862784, 'steps': 25326, 'loss/train': 1.529049038887024} -08/30/2021 17:43:23 - INFO - __main__ - Step 25328: {'lr': 0.00046997297124373293, 'samples': 4862976, 'steps': 25327, 'loss/train': 1.7410838603973389} -08/30/2021 17:43:23 - INFO - __main__ - Step 25329: {'lr': 0.00046997044956756883, 'samples': 4863168, 'steps': 25328, 'loss/train': 2.0541467666625977} -08/30/2021 17:43:25 - INFO - __main__ - Step 25330: {'lr': 0.00046996792779228935, 'samples': 4863360, 'steps': 25329, 'loss/train': 1.0298115015029907} -08/30/2021 17:43:25 - INFO - __main__ - Step 25331: {'lr': 0.00046996540591789584, 'samples': 4863552, 'steps': 25330, 'loss/train': 1.5683554410934448} -08/30/2021 17:43:26 - INFO - __main__ - Step 25332: {'lr': 0.00046996288394438924, 'samples': 4863744, 'steps': 25331, 'loss/train': 1.9218753576278687} -08/30/2021 17:43:26 - INFO - __main__ - Step 25333: {'lr': 0.00046996036187177073, 'samples': 4863936, 'steps': 25332, 'loss/train': 1.5016952753067017} -08/30/2021 17:43:26 - INFO - __main__ - Step 25334: {'lr': 0.0004699578397000415, 'samples': 4864128, 'steps': 25333, 'loss/train': 1.7984638214111328} -08/30/2021 17:43:27 - INFO - __main__ - Step 25335: {'lr': 0.00046995531742920264, 'samples': 4864320, 'steps': 25334, 'loss/train': 1.4689041376113892} -08/30/2021 17:43:28 - INFO - __main__ - Step 25336: {'lr': 0.00046995279505925535, 'samples': 4864512, 'steps': 25335, 'loss/train': 2.0290894508361816} -08/30/2021 17:43:29 - INFO - __main__ - Step 25337: {'lr': 0.00046995027259020075, 'samples': 4864704, 'steps': 25336, 'loss/train': 0.7744262218475342} -08/30/2021 17:43:29 - INFO - __main__ - Step 25338: {'lr': 0.00046994775002203994, 'samples': 4864896, 'steps': 25337, 'loss/train': 1.737314224243164} -08/30/2021 17:43:29 - INFO - __main__ - Step 25339: {'lr': 0.000469945227354774, 'samples': 4865088, 'steps': 25338, 'loss/train': 1.1786948442459106} -08/30/2021 17:43:30 - INFO - __main__ - Step 25340: {'lr': 0.00046994270458840416, 'samples': 4865280, 'steps': 25339, 'loss/train': 1.2766237258911133} -08/30/2021 17:43:32 - INFO - __main__ - Step 25341: {'lr': 0.0004699401817229316, 'samples': 4865472, 'steps': 25340, 'loss/train': 5.965412139892578} -08/30/2021 17:43:32 - INFO - __main__ - Step 25342: {'lr': 0.0004699376587583573, 'samples': 4865664, 'steps': 25341, 'loss/train': 1.4611304998397827} -08/30/2021 17:43:33 - INFO - __main__ - Step 25343: {'lr': 0.0004699351356946825, 'samples': 4865856, 'steps': 25342, 'loss/train': 1.7490977048873901} -08/30/2021 17:43:33 - INFO - __main__ - Step 25344: {'lr': 0.00046993261253190833, 'samples': 4866048, 'steps': 25343, 'loss/train': 0.5217673182487488} -08/30/2021 17:43:33 - INFO - __main__ - Step 25345: {'lr': 0.000469930089270036, 'samples': 4866240, 'steps': 25344, 'loss/train': 1.523060917854309} -08/30/2021 17:43:35 - INFO - __main__ - Step 25346: {'lr': 0.0004699275659090665, 'samples': 4866432, 'steps': 25345, 'loss/train': 1.999556064605713} -08/30/2021 17:43:35 - INFO - __main__ - Step 25347: {'lr': 0.000469925042449001, 'samples': 4866624, 'steps': 25346, 'loss/train': 1.2873411178588867} -08/30/2021 17:43:35 - INFO - __main__ - Step 25348: {'lr': 0.0004699225188898407, 'samples': 4866816, 'steps': 25347, 'loss/train': 1.5357632637023926} -08/30/2021 17:43:36 - INFO - __main__ - Step 25349: {'lr': 0.00046991999523158666, 'samples': 4867008, 'steps': 25348, 'loss/train': 2.1388795375823975} -08/30/2021 17:43:36 - INFO - __main__ - Step 25350: {'lr': 0.0004699174714742401, 'samples': 4867200, 'steps': 25349, 'loss/train': 1.9474326372146606} -08/30/2021 17:43:38 - INFO - __main__ - Step 25351: {'lr': 0.0004699149476178022, 'samples': 4867392, 'steps': 25350, 'loss/train': 1.4059033393859863} -08/30/2021 17:43:38 - INFO - __main__ - Step 25352: {'lr': 0.00046991242366227395, 'samples': 4867584, 'steps': 25351, 'loss/train': 1.1270959377288818} -08/30/2021 17:43:39 - INFO - __main__ - Step 25353: {'lr': 0.0004699098996076565, 'samples': 4867776, 'steps': 25352, 'loss/train': 1.432145595550537} -08/30/2021 17:43:39 - INFO - __main__ - Step 25354: {'lr': 0.0004699073754539511, 'samples': 4867968, 'steps': 25353, 'loss/train': 3.1782290935516357} -08/30/2021 17:43:39 - INFO - __main__ - Step 25355: {'lr': 0.0004699048512011588, 'samples': 4868160, 'steps': 25354, 'loss/train': 1.304602026939392} -08/30/2021 17:43:40 - INFO - __main__ - Step 25356: {'lr': 0.0004699023268492808, 'samples': 4868352, 'steps': 25355, 'loss/train': 1.4980871677398682} -08/30/2021 17:43:41 - INFO - __main__ - Step 25357: {'lr': 0.0004698998023983182, 'samples': 4868544, 'steps': 25356, 'loss/train': 1.8318673372268677} -08/30/2021 17:43:42 - INFO - __main__ - Step 25358: {'lr': 0.0004698972778482722, 'samples': 4868736, 'steps': 25357, 'loss/train': 0.9058358073234558} -08/30/2021 17:43:42 - INFO - __main__ - Step 25359: {'lr': 0.0004698947531991438, 'samples': 4868928, 'steps': 25358, 'loss/train': 2.269063711166382} -08/30/2021 17:43:42 - INFO - __main__ - Step 25360: {'lr': 0.0004698922284509342, 'samples': 4869120, 'steps': 25359, 'loss/train': 1.332290768623352} -08/30/2021 17:43:43 - INFO - __main__ - Step 25361: {'lr': 0.00046988970360364456, 'samples': 4869312, 'steps': 25360, 'loss/train': 0.07109788060188293} -08/30/2021 17:43:44 - INFO - __main__ - Step 25362: {'lr': 0.0004698871786572761, 'samples': 4869504, 'steps': 25361, 'loss/train': 1.6190969944000244} -08/30/2021 17:43:45 - INFO - __main__ - Step 25363: {'lr': 0.0004698846536118298, 'samples': 4869696, 'steps': 25362, 'loss/train': 1.6887255907058716} -08/30/2021 17:43:45 - INFO - __main__ - Step 25364: {'lr': 0.00046988212846730686, 'samples': 4869888, 'steps': 25363, 'loss/train': 0.9800006747245789} -08/30/2021 17:43:46 - INFO - __main__ - Step 25365: {'lr': 0.0004698796032237085, 'samples': 4870080, 'steps': 25364, 'loss/train': 1.5346888303756714} -08/30/2021 17:43:46 - INFO - __main__ - Step 25366: {'lr': 0.0004698770778810357, 'samples': 4870272, 'steps': 25365, 'loss/train': 1.5946332216262817} -08/30/2021 17:43:47 - INFO - __main__ - Step 25367: {'lr': 0.00046987455243928974, 'samples': 4870464, 'steps': 25366, 'loss/train': 0.903740644454956} -08/30/2021 17:43:48 - INFO - __main__ - Step 25368: {'lr': 0.00046987202689847165, 'samples': 4870656, 'steps': 25367, 'loss/train': 1.2486778497695923} -08/30/2021 17:43:48 - INFO - __main__ - Step 25369: {'lr': 0.00046986950125858264, 'samples': 4870848, 'steps': 25368, 'loss/train': 0.8976453542709351} -08/30/2021 17:43:48 - INFO - __main__ - Step 25370: {'lr': 0.0004698669755196239, 'samples': 4871040, 'steps': 25369, 'loss/train': 0.5826310515403748} -08/30/2021 17:43:49 - INFO - __main__ - Step 25371: {'lr': 0.0004698644496815964, 'samples': 4871232, 'steps': 25370, 'loss/train': 1.3482331037521362} -08/30/2021 17:43:49 - INFO - __main__ - Step 25372: {'lr': 0.0004698619237445013, 'samples': 4871424, 'steps': 25371, 'loss/train': 1.227567195892334} -08/30/2021 17:43:51 - INFO - __main__ - Step 25373: {'lr': 0.00046985939770834, 'samples': 4871616, 'steps': 25372, 'loss/train': 1.7992637157440186} -08/30/2021 17:43:51 - INFO - __main__ - Step 25374: {'lr': 0.0004698568715731133, 'samples': 4871808, 'steps': 25373, 'loss/train': 1.4941823482513428} -08/30/2021 17:43:51 - INFO - __main__ - Step 25375: {'lr': 0.00046985434533882255, 'samples': 4872000, 'steps': 25374, 'loss/train': 1.5480879545211792} -08/30/2021 17:43:52 - INFO - __main__ - Step 25376: {'lr': 0.00046985181900546883, 'samples': 4872192, 'steps': 25375, 'loss/train': 1.8641072511672974} -08/30/2021 17:43:52 - INFO - __main__ - Step 25377: {'lr': 0.0004698492925730532, 'samples': 4872384, 'steps': 25376, 'loss/train': 0.9216536283493042} -08/30/2021 17:43:54 - INFO - __main__ - Step 25378: {'lr': 0.00046984676604157696, 'samples': 4872576, 'steps': 25377, 'loss/train': 1.636277198791504} -08/30/2021 17:43:54 - INFO - __main__ - Step 25379: {'lr': 0.0004698442394110411, 'samples': 4872768, 'steps': 25378, 'loss/train': 1.1136679649353027} -08/30/2021 17:43:54 - INFO - __main__ - Step 25380: {'lr': 0.0004698417126814468, 'samples': 4872960, 'steps': 25379, 'loss/train': 1.6927865743637085} -08/30/2021 17:43:55 - INFO - __main__ - Step 25381: {'lr': 0.0004698391858527953, 'samples': 4873152, 'steps': 25380, 'loss/train': 1.4523926973342896} -08/30/2021 17:43:55 - INFO - __main__ - Step 25382: {'lr': 0.0004698366589250876, 'samples': 4873344, 'steps': 25381, 'loss/train': 0.926530122756958} -08/30/2021 17:43:57 - INFO - __main__ - Step 25383: {'lr': 0.0004698341318983249, 'samples': 4873536, 'steps': 25382, 'loss/train': 1.1641733646392822} -08/30/2021 17:43:57 - INFO - __main__ - Step 25384: {'lr': 0.00046983160477250837, 'samples': 4873728, 'steps': 25383, 'loss/train': 1.6348788738250732} -08/30/2021 17:43:57 - INFO - __main__ - Step 25385: {'lr': 0.00046982907754763905, 'samples': 4873920, 'steps': 25384, 'loss/train': 1.8218257427215576} -08/30/2021 17:43:58 - INFO - __main__ - Step 25386: {'lr': 0.0004698265502237182, 'samples': 4874112, 'steps': 25385, 'loss/train': 1.2216225862503052} -08/30/2021 17:43:58 - INFO - __main__ - Step 25387: {'lr': 0.0004698240228007469, 'samples': 4874304, 'steps': 25386, 'loss/train': 1.2502230405807495} -08/30/2021 17:44:00 - INFO - __main__ - Step 25388: {'lr': 0.0004698214952787262, 'samples': 4874496, 'steps': 25387, 'loss/train': 1.3003475666046143} -08/30/2021 17:44:00 - INFO - __main__ - Step 25389: {'lr': 0.0004698189676576574, 'samples': 4874688, 'steps': 25388, 'loss/train': 1.8169384002685547} -08/30/2021 17:44:00 - INFO - __main__ - Step 25390: {'lr': 0.00046981643993754155, 'samples': 4874880, 'steps': 25389, 'loss/train': 1.12261962890625} -08/30/2021 17:44:01 - INFO - __main__ - Step 25391: {'lr': 0.0004698139121183798, 'samples': 4875072, 'steps': 25390, 'loss/train': 0.12249408662319183} -08/30/2021 17:44:01 - INFO - __main__ - Step 25392: {'lr': 0.00046981138420017335, 'samples': 4875264, 'steps': 25391, 'loss/train': 1.4036651849746704} -08/30/2021 17:44:03 - INFO - __main__ - Step 25393: {'lr': 0.00046980885618292317, 'samples': 4875456, 'steps': 25392, 'loss/train': 1.4431445598602295} -08/30/2021 17:44:04 - INFO - __main__ - Step 25394: {'lr': 0.0004698063280666306, 'samples': 4875648, 'steps': 25393, 'loss/train': 1.2885441780090332} -08/30/2021 17:44:04 - INFO - __main__ - Step 25395: {'lr': 0.0004698037998512966, 'samples': 4875840, 'steps': 25394, 'loss/train': 1.0415525436401367} -08/30/2021 17:44:04 - INFO - __main__ - Step 25396: {'lr': 0.00046980127153692256, 'samples': 4876032, 'steps': 25395, 'loss/train': 0.9374186992645264} -08/30/2021 17:44:05 - INFO - __main__ - Step 25397: {'lr': 0.00046979874312350935, 'samples': 4876224, 'steps': 25396, 'loss/train': 1.3083512783050537} -08/30/2021 17:44:06 - INFO - __main__ - Step 25398: {'lr': 0.00046979621461105817, 'samples': 4876416, 'steps': 25397, 'loss/train': 2.505147933959961} -08/30/2021 17:44:07 - INFO - __main__ - Step 25399: {'lr': 0.0004697936859995703, 'samples': 4876608, 'steps': 25398, 'loss/train': 1.09427809715271} -08/30/2021 17:44:07 - INFO - __main__ - Step 25400: {'lr': 0.00046979115728904675, 'samples': 4876800, 'steps': 25399, 'loss/train': 1.5842044353485107} -08/30/2021 17:44:07 - INFO - __main__ - Step 25401: {'lr': 0.0004697886284794887, 'samples': 4876992, 'steps': 25400, 'loss/train': 1.6713145971298218} -08/30/2021 17:44:08 - INFO - __main__ - Step 25402: {'lr': 0.00046978609957089724, 'samples': 4877184, 'steps': 25401, 'loss/train': 1.7712210416793823} -08/30/2021 17:44:09 - INFO - __main__ - Step 25403: {'lr': 0.0004697835705632736, 'samples': 4877376, 'steps': 25402, 'loss/train': 1.5067243576049805} -08/30/2021 17:44:10 - INFO - __main__ - Step 25404: {'lr': 0.00046978104145661885, 'samples': 4877568, 'steps': 25403, 'loss/train': 1.6991065740585327} -08/30/2021 17:44:10 - INFO - __main__ - Step 25405: {'lr': 0.00046977851225093423, 'samples': 4877760, 'steps': 25404, 'loss/train': 1.6329655647277832} -08/30/2021 17:44:10 - INFO - __main__ - Step 25406: {'lr': 0.0004697759829462207, 'samples': 4877952, 'steps': 25405, 'loss/train': 0.882095217704773} -08/30/2021 17:44:11 - INFO - __main__ - Step 25407: {'lr': 0.0004697734535424796, 'samples': 4878144, 'steps': 25406, 'loss/train': 1.3212653398513794} -08/30/2021 17:44:12 - INFO - __main__ - Step 25408: {'lr': 0.0004697709240397119, 'samples': 4878336, 'steps': 25407, 'loss/train': 1.644166111946106} -08/30/2021 17:44:13 - INFO - __main__ - Step 25409: {'lr': 0.00046976839443791887, 'samples': 4878528, 'steps': 25408, 'loss/train': 1.7067017555236816} -08/30/2021 17:44:13 - INFO - __main__ - Step 25410: {'lr': 0.00046976586473710156, 'samples': 4878720, 'steps': 25409, 'loss/train': 1.8410892486572266} -08/30/2021 17:44:13 - INFO - __main__ - Step 25411: {'lr': 0.0004697633349372611, 'samples': 4878912, 'steps': 25410, 'loss/train': 1.5275639295578003} -08/30/2021 17:44:14 - INFO - __main__ - Step 25412: {'lr': 0.00046976080503839874, 'samples': 4879104, 'steps': 25411, 'loss/train': 1.1855192184448242} -08/30/2021 17:44:14 - INFO - __main__ - Step 25413: {'lr': 0.0004697582750405155, 'samples': 4879296, 'steps': 25412, 'loss/train': 1.9466181993484497} -08/30/2021 17:44:15 - INFO - __main__ - Step 25414: {'lr': 0.00046975574494361263, 'samples': 4879488, 'steps': 25413, 'loss/train': 1.5716698169708252} -08/30/2021 17:44:16 - INFO - __main__ - Step 25415: {'lr': 0.00046975321474769115, 'samples': 4879680, 'steps': 25414, 'loss/train': 1.5435230731964111} -08/30/2021 17:44:16 - INFO - __main__ - Step 25416: {'lr': 0.0004697506844527523, 'samples': 4879872, 'steps': 25415, 'loss/train': 1.956175446510315} -08/30/2021 17:44:17 - INFO - __main__ - Step 25417: {'lr': 0.0004697481540587972, 'samples': 4880064, 'steps': 25416, 'loss/train': 1.6351418495178223} -08/30/2021 17:44:18 - INFO - __main__ - Step 25418: {'lr': 0.00046974562356582694, 'samples': 4880256, 'steps': 25417, 'loss/train': 1.8114688396453857} -08/30/2021 17:44:19 - INFO - __main__ - Step 25419: {'lr': 0.0004697430929738427, 'samples': 4880448, 'steps': 25418, 'loss/train': 1.5406980514526367} -08/30/2021 17:44:19 - INFO - __main__ - Step 25420: {'lr': 0.0004697405622828456, 'samples': 4880640, 'steps': 25419, 'loss/train': 1.1471892595291138} -08/30/2021 17:44:19 - INFO - __main__ - Step 25421: {'lr': 0.00046973803149283686, 'samples': 4880832, 'steps': 25420, 'loss/train': 1.5557366609573364} -08/30/2021 17:44:20 - INFO - __main__ - Step 25422: {'lr': 0.0004697355006038175, 'samples': 4881024, 'steps': 25421, 'loss/train': 1.213868498802185} -08/30/2021 17:44:20 - INFO - __main__ - Step 25423: {'lr': 0.0004697329696157887, 'samples': 4881216, 'steps': 25422, 'loss/train': 1.227020502090454} -08/30/2021 17:44:22 - INFO - __main__ - Step 25424: {'lr': 0.00046973043852875163, 'samples': 4881408, 'steps': 25423, 'loss/train': 1.4905178546905518} -08/30/2021 17:44:22 - INFO - __main__ - Step 25425: {'lr': 0.00046972790734270745, 'samples': 4881600, 'steps': 25424, 'loss/train': 1.2755528688430786} -08/30/2021 17:44:23 - INFO - __main__ - Step 25426: {'lr': 0.0004697253760576572, 'samples': 4881792, 'steps': 25425, 'loss/train': 0.5819177627563477} -08/30/2021 17:44:23 - INFO - __main__ - Step 25427: {'lr': 0.00046972284467360217, 'samples': 4881984, 'steps': 25426, 'loss/train': 2.251990795135498} -08/30/2021 17:44:23 - INFO - __main__ - Step 25428: {'lr': 0.0004697203131905433, 'samples': 4882176, 'steps': 25427, 'loss/train': 1.4739199876785278} -08/30/2021 17:44:25 - INFO - __main__ - Step 25429: {'lr': 0.00046971778160848196, 'samples': 4882368, 'steps': 25428, 'loss/train': 1.7662568092346191} -08/30/2021 17:44:25 - INFO - __main__ - Step 25430: {'lr': 0.0004697152499274191, 'samples': 4882560, 'steps': 25429, 'loss/train': 1.4754798412322998} -08/30/2021 17:44:26 - INFO - __main__ - Step 25431: {'lr': 0.00046971271814735593, 'samples': 4882752, 'steps': 25430, 'loss/train': 1.8401789665222168} -08/30/2021 17:44:26 - INFO - __main__ - Step 25432: {'lr': 0.0004697101862682936, 'samples': 4882944, 'steps': 25431, 'loss/train': 1.6103200912475586} -08/30/2021 17:44:26 - INFO - __main__ - Step 25433: {'lr': 0.00046970765429023336, 'samples': 4883136, 'steps': 25432, 'loss/train': 1.4708747863769531} -08/30/2021 17:44:27 - INFO - __main__ - Step 25434: {'lr': 0.00046970512221317616, 'samples': 4883328, 'steps': 25433, 'loss/train': 2.0800564289093018} -08/30/2021 17:44:28 - INFO - __main__ - Step 25435: {'lr': 0.00046970259003712323, 'samples': 4883520, 'steps': 25434, 'loss/train': 1.524448275566101} -08/30/2021 17:44:29 - INFO - __main__ - Step 25436: {'lr': 0.00046970005776207575, 'samples': 4883712, 'steps': 25435, 'loss/train': 1.4247024059295654} -08/30/2021 17:44:29 - INFO - __main__ - Step 25437: {'lr': 0.00046969752538803477, 'samples': 4883904, 'steps': 25436, 'loss/train': 1.6538536548614502} -08/30/2021 17:44:29 - INFO - __main__ - Step 25438: {'lr': 0.0004696949929150015, 'samples': 4884096, 'steps': 25437, 'loss/train': 1.7013219594955444} -08/30/2021 17:44:30 - INFO - __main__ - Step 25439: {'lr': 0.00046969246034297697, 'samples': 4884288, 'steps': 25438, 'loss/train': 1.6243163347244263} -08/30/2021 17:44:32 - INFO - __main__ - Step 25440: {'lr': 0.0004696899276719625, 'samples': 4884480, 'steps': 25439, 'loss/train': 1.6684882640838623} -08/30/2021 17:44:32 - INFO - __main__ - Step 25441: {'lr': 0.0004696873949019591, 'samples': 4884672, 'steps': 25440, 'loss/train': 1.020603895187378} -08/30/2021 17:44:32 - INFO - __main__ - Step 25442: {'lr': 0.000469684862032968, 'samples': 4884864, 'steps': 25441, 'loss/train': 1.7380231618881226} -08/30/2021 17:44:33 - INFO - __main__ - Step 25443: {'lr': 0.0004696823290649902, 'samples': 4885056, 'steps': 25442, 'loss/train': 1.3856931924819946} -08/30/2021 17:44:33 - INFO - __main__ - Step 25444: {'lr': 0.000469679795998027, 'samples': 4885248, 'steps': 25443, 'loss/train': 1.4510107040405273} -08/30/2021 17:44:35 - INFO - __main__ - Step 25445: {'lr': 0.00046967726283207945, 'samples': 4885440, 'steps': 25444, 'loss/train': 0.13812634348869324} -08/30/2021 17:44:36 - INFO - __main__ - Step 25446: {'lr': 0.0004696747295671487, 'samples': 4885632, 'steps': 25445, 'loss/train': 2.291543960571289} -08/30/2021 17:44:36 - INFO - __main__ - Step 25447: {'lr': 0.000469672196203236, 'samples': 4885824, 'steps': 25446, 'loss/train': 1.3286209106445312} -08/30/2021 17:44:36 - INFO - __main__ - Step 25448: {'lr': 0.0004696696627403423, 'samples': 4886016, 'steps': 25447, 'loss/train': 1.4469770193099976} -08/30/2021 17:44:37 - INFO - __main__ - Step 25449: {'lr': 0.00046966712917846887, 'samples': 4886208, 'steps': 25448, 'loss/train': 1.811905860900879} -08/30/2021 17:44:38 - INFO - __main__ - Step 25450: {'lr': 0.00046966459551761684, 'samples': 4886400, 'steps': 25449, 'loss/train': 1.3242791891098022} -08/30/2021 17:44:39 - INFO - __main__ - Step 25451: {'lr': 0.00046966206175778723, 'samples': 4886592, 'steps': 25450, 'loss/train': 1.4418113231658936} -08/30/2021 17:44:39 - INFO - __main__ - Step 25452: {'lr': 0.0004696595278989814, 'samples': 4886784, 'steps': 25451, 'loss/train': 0.7630012035369873} -08/30/2021 17:44:39 - INFO - __main__ - Step 25453: {'lr': 0.00046965699394120033, 'samples': 4886976, 'steps': 25452, 'loss/train': 1.5333282947540283} -08/30/2021 17:44:40 - INFO - __main__ - Step 25454: {'lr': 0.0004696544598844452, 'samples': 4887168, 'steps': 25453, 'loss/train': 1.9732431173324585} -08/30/2021 17:44:40 - INFO - __main__ - Step 25455: {'lr': 0.00046965192572871723, 'samples': 4887360, 'steps': 25454, 'loss/train': 2.340667486190796} -08/30/2021 17:44:42 - INFO - __main__ - Step 25456: {'lr': 0.0004696493914740174, 'samples': 4887552, 'steps': 25455, 'loss/train': 1.558553695678711} -08/30/2021 17:44:42 - INFO - __main__ - Step 25457: {'lr': 0.00046964685712034697, 'samples': 4887744, 'steps': 25456, 'loss/train': 1.2132066488265991} -08/30/2021 17:44:42 - INFO - __main__ - Step 25458: {'lr': 0.00046964432266770713, 'samples': 4887936, 'steps': 25457, 'loss/train': 1.4271546602249146} -08/30/2021 17:44:43 - INFO - __main__ - Step 25459: {'lr': 0.0004696417881160989, 'samples': 4888128, 'steps': 25458, 'loss/train': 1.5363397598266602} -08/30/2021 17:44:43 - INFO - __main__ - Step 25460: {'lr': 0.0004696392534655234, 'samples': 4888320, 'steps': 25459, 'loss/train': 1.0493687391281128} -08/30/2021 17:44:45 - INFO - __main__ - Step 25461: {'lr': 0.0004696367187159819, 'samples': 4888512, 'steps': 25460, 'loss/train': 1.2178057432174683} -08/30/2021 17:44:45 - INFO - __main__ - Step 25462: {'lr': 0.00046963418386747547, 'samples': 4888704, 'steps': 25461, 'loss/train': 1.4813568592071533} -08/30/2021 17:44:46 - INFO - __main__ - Step 25463: {'lr': 0.0004696316489200053, 'samples': 4888896, 'steps': 25462, 'loss/train': 1.36184823513031} -08/30/2021 17:44:46 - INFO - __main__ - Step 25464: {'lr': 0.00046962911387357246, 'samples': 4889088, 'steps': 25463, 'loss/train': 1.0938376188278198} -08/30/2021 17:44:46 - INFO - __main__ - Step 25465: {'lr': 0.0004696265787281782, 'samples': 4889280, 'steps': 25464, 'loss/train': 1.818878412246704} -08/30/2021 17:44:48 - INFO - __main__ - Step 25466: {'lr': 0.0004696240434838235, 'samples': 4889472, 'steps': 25465, 'loss/train': 1.3407108783721924} -08/30/2021 17:44:48 - INFO - __main__ - Step 25467: {'lr': 0.00046962150814050963, 'samples': 4889664, 'steps': 25466, 'loss/train': 0.990451455116272} -08/30/2021 17:44:49 - INFO - __main__ - Step 25468: {'lr': 0.0004696189726982377, 'samples': 4889856, 'steps': 25467, 'loss/train': 1.6361366510391235} -08/30/2021 17:44:49 - INFO - __main__ - Step 25469: {'lr': 0.00046961643715700885, 'samples': 4890048, 'steps': 25468, 'loss/train': 1.463179111480713} -08/30/2021 17:44:49 - INFO - __main__ - Step 25470: {'lr': 0.00046961390151682426, 'samples': 4890240, 'steps': 25469, 'loss/train': 2.0250563621520996} -08/30/2021 17:44:51 - INFO - __main__ - Step 25471: {'lr': 0.000469611365777685, 'samples': 4890432, 'steps': 25470, 'loss/train': 1.1111315488815308} -08/30/2021 17:44:51 - INFO - __main__ - Step 25472: {'lr': 0.0004696088299395922, 'samples': 4890624, 'steps': 25471, 'loss/train': 1.9752123355865479} -08/30/2021 17:44:52 - INFO - __main__ - Step 25473: {'lr': 0.0004696062940025471, 'samples': 4890816, 'steps': 25472, 'loss/train': 1.439778447151184} -08/30/2021 17:44:52 - INFO - __main__ - Step 25474: {'lr': 0.0004696037579665509, 'samples': 4891008, 'steps': 25473, 'loss/train': 1.630651593208313} -08/30/2021 17:44:52 - INFO - __main__ - Step 25475: {'lr': 0.00046960122183160446, 'samples': 4891200, 'steps': 25474, 'loss/train': 1.4994152784347534} -08/30/2021 17:44:54 - INFO - __main__ - Step 25476: {'lr': 0.00046959868559770914, 'samples': 4891392, 'steps': 25475, 'loss/train': 0.9759613871574402} -08/30/2021 17:44:54 - INFO - __main__ - Step 25477: {'lr': 0.00046959614926486606, 'samples': 4891584, 'steps': 25476, 'loss/train': 0.8181150555610657} -08/30/2021 17:44:55 - INFO - __main__ - Step 25478: {'lr': 0.00046959361283307636, 'samples': 4891776, 'steps': 25477, 'loss/train': 2.7366108894348145} -08/30/2021 17:44:55 - INFO - __main__ - Step 25479: {'lr': 0.0004695910763023412, 'samples': 4891968, 'steps': 25478, 'loss/train': 1.9911137819290161} -08/30/2021 17:44:55 - INFO - __main__ - Step 25480: {'lr': 0.0004695885396726616, 'samples': 4892160, 'steps': 25479, 'loss/train': 1.0219414234161377} -08/30/2021 17:44:56 - INFO - __main__ - Step 25481: {'lr': 0.00046958600294403887, 'samples': 4892352, 'steps': 25480, 'loss/train': 1.419118046760559} -08/30/2021 17:44:57 - INFO - __main__ - Step 25482: {'lr': 0.000469583466116474, 'samples': 4892544, 'steps': 25481, 'loss/train': 1.3893498182296753} -08/30/2021 17:44:58 - INFO - __main__ - Step 25483: {'lr': 0.00046958092918996823, 'samples': 4892736, 'steps': 25482, 'loss/train': 0.8322604298591614} -08/30/2021 17:44:58 - INFO - __main__ - Step 25484: {'lr': 0.0004695783921645227, 'samples': 4892928, 'steps': 25483, 'loss/train': 2.1924386024475098} -08/30/2021 17:44:59 - INFO - __main__ - Step 25485: {'lr': 0.00046957585504013853, 'samples': 4893120, 'steps': 25484, 'loss/train': 1.9128268957138062} -08/30/2021 17:44:59 - INFO - __main__ - Step 25486: {'lr': 0.0004695733178168169, 'samples': 4893312, 'steps': 25485, 'loss/train': 1.4193248748779297} -08/30/2021 17:45:00 - INFO - __main__ - Step 25487: {'lr': 0.00046957078049455895, 'samples': 4893504, 'steps': 25486, 'loss/train': 0.7644988894462585} -08/30/2021 17:45:01 - INFO - __main__ - Step 25488: {'lr': 0.00046956824307336565, 'samples': 4893696, 'steps': 25487, 'loss/train': 1.4632740020751953} -08/30/2021 17:45:01 - INFO - __main__ - Step 25489: {'lr': 0.0004695657055532384, 'samples': 4893888, 'steps': 25488, 'loss/train': 1.8015514612197876} -08/30/2021 17:45:02 - INFO - __main__ - Step 25490: {'lr': 0.0004695631679341782, 'samples': 4894080, 'steps': 25489, 'loss/train': 1.416368842124939} -08/30/2021 17:45:02 - INFO - __main__ - Step 25491: {'lr': 0.0004695606302161862, 'samples': 4894272, 'steps': 25490, 'loss/train': 1.3531547784805298} -08/30/2021 17:45:04 - INFO - __main__ - Step 25492: {'lr': 0.0004695580923992636, 'samples': 4894464, 'steps': 25491, 'loss/train': 1.4158116579055786} -08/30/2021 17:45:04 - INFO - __main__ - Step 25493: {'lr': 0.0004695555544834116, 'samples': 4894656, 'steps': 25492, 'loss/train': 1.2660306692123413} -08/30/2021 17:45:04 - INFO - __main__ - Step 25494: {'lr': 0.00046955301646863114, 'samples': 4894848, 'steps': 25493, 'loss/train': 1.0336216688156128} -08/30/2021 17:45:05 - INFO - __main__ - Step 25495: {'lr': 0.0004695504783549235, 'samples': 4895040, 'steps': 25494, 'loss/train': 1.3519583940505981} -08/30/2021 17:45:05 - INFO - __main__ - Step 25496: {'lr': 0.0004695479401422898, 'samples': 4895232, 'steps': 25495, 'loss/train': 1.8910647630691528} -08/30/2021 17:45:07 - INFO - __main__ - Step 25497: {'lr': 0.0004695454018307312, 'samples': 4895424, 'steps': 25496, 'loss/train': 1.2742998600006104} -08/30/2021 17:45:08 - INFO - __main__ - Step 25498: {'lr': 0.0004695428634202488, 'samples': 4895616, 'steps': 25497, 'loss/train': 1.496669888496399} -08/30/2021 17:45:08 - INFO - __main__ - Step 25499: {'lr': 0.0004695403249108438, 'samples': 4895808, 'steps': 25498, 'loss/train': 1.51729416847229} -08/30/2021 17:45:08 - INFO - __main__ - Step 25500: {'lr': 0.0004695377863025173, 'samples': 4896000, 'steps': 25499, 'loss/train': 0.8094951510429382} -08/30/2021 17:45:09 - INFO - __main__ - Step 25501: {'lr': 0.00046953524759527055, 'samples': 4896192, 'steps': 25500, 'loss/train': 1.338602900505066} -08/30/2021 17:45:10 - INFO - __main__ - Step 25502: {'lr': 0.0004695327087891045, 'samples': 4896384, 'steps': 25501, 'loss/train': 0.6852303147315979} -08/30/2021 17:45:11 - INFO - __main__ - Step 25503: {'lr': 0.00046953016988402044, 'samples': 4896576, 'steps': 25502, 'loss/train': 1.0759178400039673} -08/30/2021 17:45:11 - INFO - __main__ - Step 25504: {'lr': 0.0004695276308800194, 'samples': 4896768, 'steps': 25503, 'loss/train': 1.9079062938690186} -08/30/2021 17:45:11 - INFO - __main__ - Step 25505: {'lr': 0.00046952509177710267, 'samples': 4896960, 'steps': 25504, 'loss/train': 1.7435216903686523} -08/30/2021 17:45:12 - INFO - __main__ - Step 25506: {'lr': 0.00046952255257527134, 'samples': 4897152, 'steps': 25505, 'loss/train': 1.421472430229187} -08/30/2021 17:45:12 - INFO - __main__ - Step 25507: {'lr': 0.0004695200132745265, 'samples': 4897344, 'steps': 25506, 'loss/train': 0.0785176008939743} -08/30/2021 17:45:14 - INFO - __main__ - Step 25508: {'lr': 0.00046951747387486933, 'samples': 4897536, 'steps': 25507, 'loss/train': 1.4423470497131348} -08/30/2021 17:45:14 - INFO - __main__ - Step 25509: {'lr': 0.00046951493437630097, 'samples': 4897728, 'steps': 25508, 'loss/train': 1.6386562585830688} -08/30/2021 17:45:15 - INFO - __main__ - Step 25510: {'lr': 0.0004695123947788226, 'samples': 4897920, 'steps': 25509, 'loss/train': 1.7119576930999756} -08/30/2021 17:45:15 - INFO - __main__ - Step 25511: {'lr': 0.0004695098550824353, 'samples': 4898112, 'steps': 25510, 'loss/train': 1.0653730630874634} -08/30/2021 17:45:15 - INFO - __main__ - Step 25512: {'lr': 0.0004695073152871403, 'samples': 4898304, 'steps': 25511, 'loss/train': 1.4548927545547485} -08/30/2021 17:45:17 - INFO - __main__ - Step 25513: {'lr': 0.00046950477539293864, 'samples': 4898496, 'steps': 25512, 'loss/train': 1.291247844696045} -08/30/2021 17:45:17 - INFO - __main__ - Step 25514: {'lr': 0.0004695022353998315, 'samples': 4898688, 'steps': 25513, 'loss/train': 0.42855507135391235} -08/30/2021 17:45:18 - INFO - __main__ - Step 25515: {'lr': 0.0004694996953078201, 'samples': 4898880, 'steps': 25514, 'loss/train': 1.4016495943069458} -08/30/2021 17:45:18 - INFO - __main__ - Step 25516: {'lr': 0.0004694971551169055, 'samples': 4899072, 'steps': 25515, 'loss/train': 2.0857272148132324} -08/30/2021 17:45:18 - INFO - __main__ - Step 25517: {'lr': 0.00046949461482708875, 'samples': 4899264, 'steps': 25516, 'loss/train': 1.2822951078414917} -08/30/2021 17:45:20 - INFO - __main__ - Step 25518: {'lr': 0.0004694920744383713, 'samples': 4899456, 'steps': 25517, 'loss/train': 2.0646729469299316} -08/30/2021 17:45:20 - INFO - __main__ - Step 25519: {'lr': 0.000469489533950754, 'samples': 4899648, 'steps': 25518, 'loss/train': 1.6781165599822998} -08/30/2021 17:45:21 - INFO - __main__ - Step 25520: {'lr': 0.00046948699336423817, 'samples': 4899840, 'steps': 25519, 'loss/train': 2.136193037033081} -08/30/2021 17:45:21 - INFO - __main__ - Step 25521: {'lr': 0.0004694844526788248, 'samples': 4900032, 'steps': 25520, 'loss/train': 1.3668781518936157} -08/30/2021 17:45:21 - INFO - __main__ - Step 25522: {'lr': 0.0004694819118945152, 'samples': 4900224, 'steps': 25521, 'loss/train': 1.7951041460037231} -08/30/2021 17:45:22 - INFO - __main__ - Step 25523: {'lr': 0.00046947937101131046, 'samples': 4900416, 'steps': 25522, 'loss/train': 1.076138973236084} -08/30/2021 17:45:23 - INFO - __main__ - Step 25524: {'lr': 0.0004694768300292116, 'samples': 4900608, 'steps': 25523, 'loss/train': 0.799167811870575} -08/30/2021 17:45:24 - INFO - __main__ - Step 25525: {'lr': 0.0004694742889482199, 'samples': 4900800, 'steps': 25524, 'loss/train': 1.3842781782150269} -08/30/2021 17:45:24 - INFO - __main__ - Step 25526: {'lr': 0.0004694717477683365, 'samples': 4900992, 'steps': 25525, 'loss/train': 1.9871892929077148} -08/30/2021 17:45:25 - INFO - __main__ - Step 25527: {'lr': 0.0004694692064895625, 'samples': 4901184, 'steps': 25526, 'loss/train': 1.5205962657928467} -08/30/2021 17:45:25 - INFO - __main__ - Step 25528: {'lr': 0.0004694666651118991, 'samples': 4901376, 'steps': 25527, 'loss/train': 0.9289355278015137} -08/30/2021 17:45:27 - INFO - __main__ - Step 25529: {'lr': 0.00046946412363534735, 'samples': 4901568, 'steps': 25528, 'loss/train': 1.7455404996871948} -08/30/2021 17:45:28 - INFO - __main__ - Step 25530: {'lr': 0.0004694615820599085, 'samples': 4901760, 'steps': 25529, 'loss/train': 0.96571284532547} -08/30/2021 17:45:28 - INFO - __main__ - Step 25531: {'lr': 0.00046945904038558364, 'samples': 4901952, 'steps': 25530, 'loss/train': 1.6810768842697144} -08/30/2021 17:45:28 - INFO - __main__ - Step 25532: {'lr': 0.00046945649861237387, 'samples': 4902144, 'steps': 25531, 'loss/train': 2.0984668731689453} -08/30/2021 17:45:29 - INFO - __main__ - Step 25533: {'lr': 0.00046945395674028047, 'samples': 4902336, 'steps': 25532, 'loss/train': 1.5089911222457886} -08/30/2021 17:45:29 - INFO - __main__ - Step 25534: {'lr': 0.0004694514147693044, 'samples': 4902528, 'steps': 25533, 'loss/train': 1.3756768703460693} -08/30/2021 17:45:31 - INFO - __main__ - Step 25535: {'lr': 0.000469448872699447, 'samples': 4902720, 'steps': 25534, 'loss/train': 0.13290277123451233} -08/30/2021 17:45:31 - INFO - __main__ - Step 25536: {'lr': 0.0004694463305307093, 'samples': 4902912, 'steps': 25535, 'loss/train': 1.2443565130233765} -08/30/2021 17:45:31 - INFO - __main__ - Step 25537: {'lr': 0.00046944378826309244, 'samples': 4903104, 'steps': 25536, 'loss/train': 1.7121107578277588} -08/30/2021 17:45:32 - INFO - __main__ - Step 25538: {'lr': 0.00046944124589659765, 'samples': 4903296, 'steps': 25537, 'loss/train': 1.3854635953903198} -08/30/2021 17:45:32 - INFO - __main__ - Step 25539: {'lr': 0.00046943870343122595, 'samples': 4903488, 'steps': 25538, 'loss/train': 1.3788626194000244} -08/30/2021 17:45:34 - INFO - __main__ - Step 25540: {'lr': 0.0004694361608669786, 'samples': 4903680, 'steps': 25539, 'loss/train': 1.0962517261505127} -08/30/2021 17:45:34 - INFO - __main__ - Step 25541: {'lr': 0.0004694336182038567, 'samples': 4903872, 'steps': 25540, 'loss/train': 1.5978034734725952} -08/30/2021 17:45:34 - INFO - __main__ - Step 25542: {'lr': 0.00046943107544186144, 'samples': 4904064, 'steps': 25541, 'loss/train': 1.7243266105651855} -08/30/2021 17:45:35 - INFO - __main__ - Step 25543: {'lr': 0.0004694285325809938, 'samples': 4904256, 'steps': 25542, 'loss/train': 1.7463313341140747} -08/30/2021 17:45:35 - INFO - __main__ - Step 25544: {'lr': 0.00046942598962125515, 'samples': 4904448, 'steps': 25543, 'loss/train': 1.8773432970046997} -08/30/2021 17:45:37 - INFO - __main__ - Step 25545: {'lr': 0.00046942344656264657, 'samples': 4904640, 'steps': 25544, 'loss/train': 1.6174808740615845} -08/30/2021 17:45:38 - INFO - __main__ - Step 25546: {'lr': 0.0004694209034051691, 'samples': 4904832, 'steps': 25545, 'loss/train': 1.2789280414581299} -08/30/2021 17:45:38 - INFO - __main__ - Step 25547: {'lr': 0.00046941836014882394, 'samples': 4905024, 'steps': 25546, 'loss/train': 0.8335281610488892} -08/30/2021 17:45:38 - INFO - __main__ - Step 25548: {'lr': 0.00046941581679361234, 'samples': 4905216, 'steps': 25547, 'loss/train': 0.897831380367279} -08/30/2021 17:45:39 - INFO - __main__ - Step 25549: {'lr': 0.00046941327333953526, 'samples': 4905408, 'steps': 25548, 'loss/train': 1.5635565519332886} -08/30/2021 17:45:39 - INFO - __main__ - Step 25550: {'lr': 0.00046941072978659397, 'samples': 4905600, 'steps': 25549, 'loss/train': 1.523878574371338} -08/30/2021 17:45:40 - INFO - __main__ - Step 25551: {'lr': 0.00046940818613478964, 'samples': 4905792, 'steps': 25550, 'loss/train': 0.07167031615972519} -08/30/2021 17:45:41 - INFO - __main__ - Step 25552: {'lr': 0.0004694056423841233, 'samples': 4905984, 'steps': 25551, 'loss/train': 1.5276508331298828} -08/30/2021 17:45:41 - INFO - __main__ - Step 25553: {'lr': 0.00046940309853459625, 'samples': 4906176, 'steps': 25552, 'loss/train': 1.7026442289352417} -08/30/2021 17:45:42 - INFO - __main__ - Step 25554: {'lr': 0.00046940055458620945, 'samples': 4906368, 'steps': 25553, 'loss/train': 1.2607771158218384} -08/30/2021 17:45:42 - INFO - __main__ - Step 25555: {'lr': 0.0004693980105389642, 'samples': 4906560, 'steps': 25554, 'loss/train': 1.650815725326538} -08/30/2021 17:45:44 - INFO - __main__ - Step 25556: {'lr': 0.00046939546639286156, 'samples': 4906752, 'steps': 25555, 'loss/train': 1.2766176462173462} -08/30/2021 17:45:44 - INFO - __main__ - Step 25557: {'lr': 0.00046939292214790275, 'samples': 4906944, 'steps': 25556, 'loss/train': 1.824107050895691} -08/30/2021 17:45:45 - INFO - __main__ - Step 25558: {'lr': 0.0004693903778040889, 'samples': 4907136, 'steps': 25557, 'loss/train': 1.6804702281951904} -08/30/2021 17:45:45 - INFO - __main__ - Step 25559: {'lr': 0.0004693878333614211, 'samples': 4907328, 'steps': 25558, 'loss/train': 0.14626309275627136} -08/30/2021 17:45:45 - INFO - __main__ - Step 25560: {'lr': 0.0004693852888199005, 'samples': 4907520, 'steps': 25559, 'loss/train': 1.5664700269699097} -08/30/2021 17:45:47 - INFO - __main__ - Step 25561: {'lr': 0.0004693827441795283, 'samples': 4907712, 'steps': 25560, 'loss/train': 1.2916374206542969} -08/30/2021 17:45:47 - INFO - __main__ - Step 25562: {'lr': 0.00046938019944030556, 'samples': 4907904, 'steps': 25561, 'loss/train': 1.253320574760437} -08/30/2021 17:45:48 - INFO - __main__ - Step 25563: {'lr': 0.00046937765460223357, 'samples': 4908096, 'steps': 25562, 'loss/train': 1.8996003866195679} -08/30/2021 17:45:48 - INFO - __main__ - Step 25564: {'lr': 0.0004693751096653134, 'samples': 4908288, 'steps': 25563, 'loss/train': 1.5907924175262451} -08/30/2021 17:45:48 - INFO - __main__ - Step 25565: {'lr': 0.00046937256462954615, 'samples': 4908480, 'steps': 25564, 'loss/train': 1.7696524858474731} -08/30/2021 17:45:50 - INFO - __main__ - Step 25566: {'lr': 0.00046937001949493294, 'samples': 4908672, 'steps': 25565, 'loss/train': 1.5918571949005127} -08/30/2021 17:45:50 - INFO - __main__ - Step 25567: {'lr': 0.0004693674742614751, 'samples': 4908864, 'steps': 25566, 'loss/train': 1.2720521688461304} -08/30/2021 17:45:51 - INFO - __main__ - Step 25568: {'lr': 0.0004693649289291736, 'samples': 4909056, 'steps': 25567, 'loss/train': 1.2477308511734009} -08/30/2021 17:45:51 - INFO - __main__ - Step 25569: {'lr': 0.0004693623834980297, 'samples': 4909248, 'steps': 25568, 'loss/train': 0.08667182177305222} -08/30/2021 17:45:52 - INFO - __main__ - Step 25570: {'lr': 0.00046935983796804443, 'samples': 4909440, 'steps': 25569, 'loss/train': 1.7546091079711914} -08/30/2021 17:45:52 - INFO - __main__ - Step 25571: {'lr': 0.000469357292339219, 'samples': 4909632, 'steps': 25570, 'loss/train': 2.3846867084503174} -08/30/2021 17:45:54 - INFO - __main__ - Step 25572: {'lr': 0.00046935474661155465, 'samples': 4909824, 'steps': 25571, 'loss/train': 1.219957947731018} -08/30/2021 17:45:54 - INFO - __main__ - Step 25573: {'lr': 0.00046935220078505235, 'samples': 4910016, 'steps': 25572, 'loss/train': 2.4779434204101562} -08/30/2021 17:45:54 - INFO - __main__ - Step 25574: {'lr': 0.00046934965485971337, 'samples': 4910208, 'steps': 25573, 'loss/train': 1.1145262718200684} -08/30/2021 17:45:55 - INFO - __main__ - Step 25575: {'lr': 0.00046934710883553884, 'samples': 4910400, 'steps': 25574, 'loss/train': 0.08766800910234451} -08/30/2021 17:45:55 - INFO - __main__ - Step 25576: {'lr': 0.00046934456271252985, 'samples': 4910592, 'steps': 25575, 'loss/train': 1.6031591892242432} -08/30/2021 17:45:57 - INFO - __main__ - Step 25577: {'lr': 0.0004693420164906876, 'samples': 4910784, 'steps': 25576, 'loss/train': 1.3525570631027222} -08/30/2021 17:45:57 - INFO - __main__ - Step 25578: {'lr': 0.0004693394701700132, 'samples': 4910976, 'steps': 25577, 'loss/train': 1.410264015197754} -08/30/2021 17:45:58 - INFO - __main__ - Step 25579: {'lr': 0.00046933692375050783, 'samples': 4911168, 'steps': 25578, 'loss/train': 1.3000317811965942} -08/30/2021 17:45:58 - INFO - __main__ - Step 25580: {'lr': 0.00046933437723217265, 'samples': 4911360, 'steps': 25579, 'loss/train': 1.3320658206939697} -08/30/2021 17:45:58 - INFO - __main__ - Step 25581: {'lr': 0.0004693318306150087, 'samples': 4911552, 'steps': 25580, 'loss/train': 0.5477054119110107} -08/30/2021 17:46:00 - INFO - __main__ - Step 25582: {'lr': 0.0004693292838990173, 'samples': 4911744, 'steps': 25581, 'loss/train': 1.3790009021759033} -08/30/2021 17:46:01 - INFO - __main__ - Step 25583: {'lr': 0.0004693267370841995, 'samples': 4911936, 'steps': 25582, 'loss/train': 1.1315293312072754} -08/30/2021 17:46:01 - INFO - __main__ - Step 25584: {'lr': 0.00046932419017055646, 'samples': 4912128, 'steps': 25583, 'loss/train': 1.6476805210113525} -08/30/2021 17:46:01 - INFO - __main__ - Step 25585: {'lr': 0.0004693216431580893, 'samples': 4912320, 'steps': 25584, 'loss/train': 1.3029710054397583} -08/30/2021 17:46:02 - INFO - __main__ - Step 25586: {'lr': 0.00046931909604679925, 'samples': 4912512, 'steps': 25585, 'loss/train': 1.1572575569152832} -08/30/2021 17:46:03 - INFO - __main__ - Step 25587: {'lr': 0.0004693165488366873, 'samples': 4912704, 'steps': 25586, 'loss/train': 1.7142897844314575} -08/30/2021 17:46:04 - INFO - __main__ - Step 25588: {'lr': 0.00046931400152775473, 'samples': 4912896, 'steps': 25587, 'loss/train': 1.4758199453353882} -08/30/2021 17:46:04 - INFO - __main__ - Step 25589: {'lr': 0.00046931145412000265, 'samples': 4913088, 'steps': 25588, 'loss/train': 1.551531434059143} -08/30/2021 17:46:04 - INFO - __main__ - Step 25590: {'lr': 0.00046930890661343226, 'samples': 4913280, 'steps': 25589, 'loss/train': 1.546036720275879} -08/30/2021 17:46:05 - INFO - __main__ - Step 25591: {'lr': 0.00046930635900804466, 'samples': 4913472, 'steps': 25590, 'loss/train': 1.1229722499847412} -08/30/2021 17:46:06 - INFO - __main__ - Step 25592: {'lr': 0.0004693038113038409, 'samples': 4913664, 'steps': 25591, 'loss/train': 1.2015138864517212} -08/30/2021 17:46:07 - INFO - __main__ - Step 25593: {'lr': 0.0004693012635008224, 'samples': 4913856, 'steps': 25592, 'loss/train': 1.4687280654907227} -08/30/2021 17:46:07 - INFO - __main__ - Step 25594: {'lr': 0.00046929871559898994, 'samples': 4914048, 'steps': 25593, 'loss/train': 1.2752095460891724} -08/30/2021 17:46:07 - INFO - __main__ - Step 25595: {'lr': 0.00046929616759834505, 'samples': 4914240, 'steps': 25594, 'loss/train': 1.6353528499603271} -08/30/2021 17:46:08 - INFO - __main__ - Step 25596: {'lr': 0.00046929361949888857, 'samples': 4914432, 'steps': 25595, 'loss/train': 1.7392250299453735} -08/30/2021 17:46:09 - INFO - __main__ - Step 25597: {'lr': 0.00046929107130062176, 'samples': 4914624, 'steps': 25596, 'loss/train': 1.8298649787902832} -08/30/2021 17:46:10 - INFO - __main__ - Step 25598: {'lr': 0.00046928852300354585, 'samples': 4914816, 'steps': 25597, 'loss/train': 1.7110896110534668} -08/30/2021 17:46:10 - INFO - __main__ - Step 25599: {'lr': 0.0004692859746076619, 'samples': 4915008, 'steps': 25598, 'loss/train': 1.1671812534332275} -08/30/2021 17:46:11 - INFO - __main__ - Step 25600: {'lr': 0.00046928342611297105, 'samples': 4915200, 'steps': 25599, 'loss/train': 1.6852355003356934} -08/30/2021 17:46:11 - INFO - __main__ - Step 25601: {'lr': 0.00046928087751947444, 'samples': 4915392, 'steps': 25600, 'loss/train': 0.975641131401062} -08/30/2021 17:46:12 - INFO - __main__ - Step 25602: {'lr': 0.00046927832882717323, 'samples': 4915584, 'steps': 25601, 'loss/train': 1.9378066062927246} -08/30/2021 17:46:13 - INFO - __main__ - Step 25603: {'lr': 0.0004692757800360687, 'samples': 4915776, 'steps': 25602, 'loss/train': 1.595958948135376} -08/30/2021 17:46:13 - INFO - __main__ - Step 25604: {'lr': 0.0004692732311461618, 'samples': 4915968, 'steps': 25603, 'loss/train': 1.5733797550201416} -08/30/2021 17:46:13 - INFO - __main__ - Step 25605: {'lr': 0.0004692706821574538, 'samples': 4916160, 'steps': 25604, 'loss/train': 1.6840075254440308} -08/30/2021 17:46:14 - INFO - __main__ - Step 25606: {'lr': 0.00046926813306994586, 'samples': 4916352, 'steps': 25605, 'loss/train': 1.3816670179367065} -08/30/2021 17:46:15 - INFO - __main__ - Step 25607: {'lr': 0.00046926558388363904, 'samples': 4916544, 'steps': 25606, 'loss/train': 1.2792718410491943} -08/30/2021 17:46:16 - INFO - __main__ - Step 25608: {'lr': 0.00046926303459853447, 'samples': 4916736, 'steps': 25607, 'loss/train': 1.5633635520935059} -08/30/2021 17:46:16 - INFO - __main__ - Step 25609: {'lr': 0.00046926048521463344, 'samples': 4916928, 'steps': 25608, 'loss/train': 1.4930192232131958} -08/30/2021 17:46:16 - INFO - __main__ - Step 25610: {'lr': 0.000469257935731937, 'samples': 4917120, 'steps': 25609, 'loss/train': 1.3920789957046509} -08/30/2021 17:46:17 - INFO - __main__ - Step 25611: {'lr': 0.0004692553861504463, 'samples': 4917312, 'steps': 25610, 'loss/train': 1.2099542617797852} -08/30/2021 17:46:17 - INFO - __main__ - Step 25612: {'lr': 0.00046925283647016253, 'samples': 4917504, 'steps': 25611, 'loss/train': 0.5829740762710571} -08/30/2021 17:46:19 - INFO - __main__ - Step 25613: {'lr': 0.0004692502866910868, 'samples': 4917696, 'steps': 25612, 'loss/train': 1.332496166229248} -08/30/2021 17:46:20 - INFO - __main__ - Step 25614: {'lr': 0.0004692477368132203, 'samples': 4917888, 'steps': 25613, 'loss/train': 2.0153746604919434} -08/30/2021 17:46:20 - INFO - __main__ - Step 25615: {'lr': 0.0004692451868365641, 'samples': 4918080, 'steps': 25614, 'loss/train': 1.5743674039840698} -08/30/2021 17:46:21 - INFO - __main__ - Step 25616: {'lr': 0.00046924263676111945, 'samples': 4918272, 'steps': 25615, 'loss/train': 1.4915242195129395} -08/30/2021 17:46:21 - INFO - __main__ - Step 25617: {'lr': 0.00046924008658688745, 'samples': 4918464, 'steps': 25616, 'loss/train': 1.3996468782424927} -08/30/2021 17:46:22 - INFO - __main__ - Step 25618: {'lr': 0.00046923753631386924, 'samples': 4918656, 'steps': 25617, 'loss/train': 2.0151290893554688} -08/30/2021 17:46:23 - INFO - __main__ - Step 25619: {'lr': 0.0004692349859420659, 'samples': 4918848, 'steps': 25618, 'loss/train': 1.116296648979187} -08/30/2021 17:46:23 - INFO - __main__ - Step 25620: {'lr': 0.00046923243547147874, 'samples': 4919040, 'steps': 25619, 'loss/train': 1.6149743795394897} -08/30/2021 17:46:24 - INFO - __main__ - Step 25621: {'lr': 0.0004692298849021088, 'samples': 4919232, 'steps': 25620, 'loss/train': 1.7254117727279663} -08/30/2021 17:46:24 - INFO - __main__ - Step 25622: {'lr': 0.00046922733423395736, 'samples': 4919424, 'steps': 25621, 'loss/train': 0.910541296005249} -08/30/2021 17:46:25 - INFO - __main__ - Step 25623: {'lr': 0.0004692247834670253, 'samples': 4919616, 'steps': 25622, 'loss/train': 1.3471633195877075} -08/30/2021 17:46:26 - INFO - __main__ - Step 25624: {'lr': 0.000469222232601314, 'samples': 4919808, 'steps': 25623, 'loss/train': 1.6275146007537842} -08/30/2021 17:46:26 - INFO - __main__ - Step 25625: {'lr': 0.0004692196816368246, 'samples': 4920000, 'steps': 25624, 'loss/train': 0.9021770358085632} -08/30/2021 17:46:27 - INFO - __main__ - Step 25626: {'lr': 0.00046921713057355817, 'samples': 4920192, 'steps': 25625, 'loss/train': 1.6000720262527466} -08/30/2021 17:46:27 - INFO - __main__ - Step 25627: {'lr': 0.0004692145794115159, 'samples': 4920384, 'steps': 25626, 'loss/train': 2.384751081466675} -08/30/2021 17:46:29 - INFO - __main__ - Step 25628: {'lr': 0.00046921202815069883, 'samples': 4920576, 'steps': 25627, 'loss/train': 0.963126003742218} -08/30/2021 17:46:29 - INFO - __main__ - Step 25629: {'lr': 0.00046920947679110833, 'samples': 4920768, 'steps': 25628, 'loss/train': 1.5333893299102783} -08/30/2021 17:46:30 - INFO - __main__ - Step 25630: {'lr': 0.00046920692533274533, 'samples': 4920960, 'steps': 25629, 'loss/train': 5.969575881958008} -08/30/2021 17:46:30 - INFO - __main__ - Step 25631: {'lr': 0.0004692043737756111, 'samples': 4921152, 'steps': 25630, 'loss/train': 5.858996391296387} -08/30/2021 17:46:30 - INFO - __main__ - Step 25632: {'lr': 0.00046920182211970677, 'samples': 4921344, 'steps': 25631, 'loss/train': 1.7322770357131958} -08/30/2021 17:46:31 - INFO - __main__ - Step 25633: {'lr': 0.00046919927036503353, 'samples': 4921536, 'steps': 25632, 'loss/train': 1.5119572877883911} -08/30/2021 17:46:31 - INFO - __main__ - Step 25634: {'lr': 0.0004691967185115924, 'samples': 4921728, 'steps': 25633, 'loss/train': 1.7821234464645386} -08/30/2021 17:46:33 - INFO - __main__ - Step 25635: {'lr': 0.00046919416655938465, 'samples': 4921920, 'steps': 25634, 'loss/train': 1.7719392776489258} -08/30/2021 17:46:33 - INFO - __main__ - Step 25636: {'lr': 0.0004691916145084113, 'samples': 4922112, 'steps': 25635, 'loss/train': 1.672731876373291} -08/30/2021 17:46:34 - INFO - __main__ - Step 25637: {'lr': 0.0004691890623586737, 'samples': 4922304, 'steps': 25636, 'loss/train': 1.2098770141601562} -08/30/2021 17:46:34 - INFO - __main__ - Step 25638: {'lr': 0.00046918651011017287, 'samples': 4922496, 'steps': 25637, 'loss/train': 1.5956040620803833} -08/30/2021 17:46:34 - INFO - __main__ - Step 25639: {'lr': 0.00046918395776290997, 'samples': 4922688, 'steps': 25638, 'loss/train': 1.457015037536621} -08/30/2021 17:46:36 - INFO - __main__ - Step 25640: {'lr': 0.0004691814053168861, 'samples': 4922880, 'steps': 25639, 'loss/train': 1.3072255849838257} -08/30/2021 17:46:36 - INFO - __main__ - Step 25641: {'lr': 0.0004691788527721026, 'samples': 4923072, 'steps': 25640, 'loss/train': 1.556615948677063} -08/30/2021 17:46:37 - INFO - __main__ - Step 25642: {'lr': 0.0004691763001285604, 'samples': 4923264, 'steps': 25641, 'loss/train': 1.2920417785644531} -08/30/2021 17:46:37 - INFO - __main__ - Step 25643: {'lr': 0.0004691737473862607, 'samples': 4923456, 'steps': 25642, 'loss/train': 1.911281704902649} -08/30/2021 17:46:37 - INFO - __main__ - Step 25644: {'lr': 0.00046917119454520487, 'samples': 4923648, 'steps': 25643, 'loss/train': 1.6087640523910522} -08/30/2021 17:46:39 - INFO - __main__ - Step 25645: {'lr': 0.00046916864160539376, 'samples': 4923840, 'steps': 25644, 'loss/train': 1.8666285276412964} -08/30/2021 17:46:39 - INFO - __main__ - Step 25646: {'lr': 0.00046916608856682865, 'samples': 4924032, 'steps': 25645, 'loss/train': 1.5911983251571655} -08/30/2021 17:46:40 - INFO - __main__ - Step 25647: {'lr': 0.0004691635354295106, 'samples': 4924224, 'steps': 25646, 'loss/train': 1.169861912727356} -08/30/2021 17:46:40 - INFO - __main__ - Step 25648: {'lr': 0.00046916098219344093, 'samples': 4924416, 'steps': 25647, 'loss/train': 1.3354626893997192} -08/30/2021 17:46:40 - INFO - __main__ - Step 25649: {'lr': 0.0004691584288586207, 'samples': 4924608, 'steps': 25648, 'loss/train': 1.26406729221344} -08/30/2021 17:46:42 - INFO - __main__ - Step 25650: {'lr': 0.0004691558754250511, 'samples': 4924800, 'steps': 25649, 'loss/train': 1.3049681186676025} -08/30/2021 17:46:42 - INFO - __main__ - Step 25651: {'lr': 0.0004691533218927332, 'samples': 4924992, 'steps': 25650, 'loss/train': 1.289215326309204} -08/30/2021 17:46:43 - INFO - __main__ - Step 25652: {'lr': 0.00046915076826166814, 'samples': 4925184, 'steps': 25651, 'loss/train': 1.2583330869674683} -08/30/2021 17:46:43 - INFO - __main__ - Step 25653: {'lr': 0.0004691482145318572, 'samples': 4925376, 'steps': 25652, 'loss/train': 1.0070675611495972} -08/30/2021 17:46:43 - INFO - __main__ - Step 25654: {'lr': 0.00046914566070330144, 'samples': 4925568, 'steps': 25653, 'loss/train': 1.2272132635116577} -08/30/2021 17:46:44 - INFO - __main__ - Step 25655: {'lr': 0.00046914310677600204, 'samples': 4925760, 'steps': 25654, 'loss/train': 1.4363913536071777} -08/30/2021 17:46:45 - INFO - __main__ - Step 25656: {'lr': 0.00046914055274996017, 'samples': 4925952, 'steps': 25655, 'loss/train': 1.8204822540283203} -08/30/2021 17:46:46 - INFO - __main__ - Step 25657: {'lr': 0.00046913799862517686, 'samples': 4926144, 'steps': 25656, 'loss/train': 1.3860546350479126} -08/30/2021 17:46:46 - INFO - __main__ - Step 25658: {'lr': 0.0004691354444016534, 'samples': 4926336, 'steps': 25657, 'loss/train': 1.6931554079055786} -08/30/2021 17:46:46 - INFO - __main__ - Step 25659: {'lr': 0.00046913289007939087, 'samples': 4926528, 'steps': 25658, 'loss/train': 1.4370806217193604} -08/30/2021 17:46:47 - INFO - __main__ - Step 25660: {'lr': 0.00046913033565839046, 'samples': 4926720, 'steps': 25659, 'loss/train': 1.4942413568496704} -08/30/2021 17:46:49 - INFO - __main__ - Step 25661: {'lr': 0.0004691277811386533, 'samples': 4926912, 'steps': 25660, 'loss/train': 1.5427632331848145} -08/30/2021 17:46:49 - INFO - __main__ - Step 25662: {'lr': 0.0004691252265201805, 'samples': 4927104, 'steps': 25661, 'loss/train': 1.3137925863265991} -08/30/2021 17:46:50 - INFO - __main__ - Step 25663: {'lr': 0.00046912267180297337, 'samples': 4927296, 'steps': 25662, 'loss/train': 0.063136987388134} -08/30/2021 17:46:50 - INFO - __main__ - Step 25664: {'lr': 0.0004691201169870328, 'samples': 4927488, 'steps': 25663, 'loss/train': 2.225656509399414} -08/30/2021 17:46:50 - INFO - __main__ - Step 25665: {'lr': 0.00046911756207236024, 'samples': 4927680, 'steps': 25664, 'loss/train': 1.6347001791000366} -08/30/2021 17:46:51 - INFO - __main__ - Step 25666: {'lr': 0.0004691150070589566, 'samples': 4927872, 'steps': 25665, 'loss/train': 1.7294188737869263} -08/30/2021 17:46:53 - INFO - __main__ - Step 25667: {'lr': 0.00046911245194682306, 'samples': 4928064, 'steps': 25666, 'loss/train': 1.6906583309173584} -08/30/2021 17:46:53 - INFO - __main__ - Step 25668: {'lr': 0.00046910989673596093, 'samples': 4928256, 'steps': 25667, 'loss/train': 1.4899779558181763} -08/30/2021 17:46:53 - INFO - __main__ - Step 25669: {'lr': 0.00046910734142637124, 'samples': 4928448, 'steps': 25668, 'loss/train': 1.5659645795822144} -08/30/2021 17:46:54 - INFO - __main__ - Step 25670: {'lr': 0.00046910478601805514, 'samples': 4928640, 'steps': 25669, 'loss/train': 1.0884144306182861} -08/30/2021 17:46:54 - INFO - __main__ - Step 25671: {'lr': 0.0004691022305110138, 'samples': 4928832, 'steps': 25670, 'loss/train': 1.4707077741622925} -08/30/2021 17:46:56 - INFO - __main__ - Step 25672: {'lr': 0.0004690996749052484, 'samples': 4929024, 'steps': 25671, 'loss/train': 1.7564407587051392} -08/30/2021 17:46:56 - INFO - __main__ - Step 25673: {'lr': 0.00046909711920076, 'samples': 4929216, 'steps': 25672, 'loss/train': 2.032792091369629} -08/30/2021 17:46:56 - INFO - __main__ - Step 25674: {'lr': 0.0004690945633975499, 'samples': 4929408, 'steps': 25673, 'loss/train': 1.2514983415603638} -08/30/2021 17:46:57 - INFO - __main__ - Step 25675: {'lr': 0.00046909200749561914, 'samples': 4929600, 'steps': 25674, 'loss/train': 1.769295334815979} -08/30/2021 17:46:57 - INFO - __main__ - Step 25676: {'lr': 0.00046908945149496897, 'samples': 4929792, 'steps': 25675, 'loss/train': 1.2579846382141113} -08/30/2021 17:46:59 - INFO - __main__ - Step 25677: {'lr': 0.00046908689539560034, 'samples': 4929984, 'steps': 25676, 'loss/train': 1.221014380455017} -08/30/2021 17:46:59 - INFO - __main__ - Step 25678: {'lr': 0.0004690843391975146, 'samples': 4930176, 'steps': 25677, 'loss/train': 1.0823017358779907} -08/30/2021 17:47:00 - INFO - __main__ - Step 25679: {'lr': 0.0004690817829007129, 'samples': 4930368, 'steps': 25678, 'loss/train': 1.5751724243164062} -08/30/2021 17:47:00 - INFO - __main__ - Step 25680: {'lr': 0.00046907922650519623, 'samples': 4930560, 'steps': 25679, 'loss/train': 0.8998758792877197} -08/30/2021 17:47:00 - INFO - __main__ - Step 25681: {'lr': 0.0004690766700109659, 'samples': 4930752, 'steps': 25680, 'loss/train': 1.2231260538101196} -08/30/2021 17:47:02 - INFO - __main__ - Step 25682: {'lr': 0.00046907411341802295, 'samples': 4930944, 'steps': 25681, 'loss/train': 1.7166142463684082} -08/30/2021 17:47:02 - INFO - __main__ - Step 25683: {'lr': 0.0004690715567263687, 'samples': 4931136, 'steps': 25682, 'loss/train': 1.4265334606170654} -08/30/2021 17:47:03 - INFO - __main__ - Step 25684: {'lr': 0.00046906899993600406, 'samples': 4931328, 'steps': 25683, 'loss/train': 0.09770724177360535} -08/30/2021 17:47:03 - INFO - __main__ - Step 25685: {'lr': 0.00046906644304693033, 'samples': 4931520, 'steps': 25684, 'loss/train': 1.1788661479949951} -08/30/2021 17:47:03 - INFO - __main__ - Step 25686: {'lr': 0.0004690638860591487, 'samples': 4931712, 'steps': 25685, 'loss/train': 1.6538797616958618} -08/30/2021 17:47:04 - INFO - __main__ - Step 25687: {'lr': 0.00046906132897266026, 'samples': 4931904, 'steps': 25686, 'loss/train': 1.9894604682922363} -08/30/2021 17:47:05 - INFO - __main__ - Step 25688: {'lr': 0.00046905877178746614, 'samples': 4932096, 'steps': 25687, 'loss/train': 1.5378966331481934} -08/30/2021 17:47:06 - INFO - __main__ - Step 25689: {'lr': 0.0004690562145035675, 'samples': 4932288, 'steps': 25688, 'loss/train': 1.540313720703125} -08/30/2021 17:47:06 - INFO - __main__ - Step 25690: {'lr': 0.00046905365712096553, 'samples': 4932480, 'steps': 25689, 'loss/train': 1.1325825452804565} -08/30/2021 17:47:06 - INFO - __main__ - Step 25691: {'lr': 0.0004690510996396614, 'samples': 4932672, 'steps': 25690, 'loss/train': 1.6712768077850342} -08/30/2021 17:47:07 - INFO - __main__ - Step 25692: {'lr': 0.0004690485420596561, 'samples': 4932864, 'steps': 25691, 'loss/train': 1.5641427040100098} -08/30/2021 17:47:08 - INFO - __main__ - Step 25693: {'lr': 0.000469045984380951, 'samples': 4933056, 'steps': 25692, 'loss/train': 1.4656329154968262} -08/30/2021 17:47:09 - INFO - __main__ - Step 25694: {'lr': 0.0004690434266035471, 'samples': 4933248, 'steps': 25693, 'loss/train': 1.7872800827026367} -08/30/2021 17:47:09 - INFO - __main__ - Step 25695: {'lr': 0.00046904086872744577, 'samples': 4933440, 'steps': 25694, 'loss/train': 1.1971526145935059} -08/30/2021 17:47:10 - INFO - __main__ - Step 25696: {'lr': 0.0004690383107526479, 'samples': 4933632, 'steps': 25695, 'loss/train': 1.3781235218048096} -08/30/2021 17:47:10 - INFO - __main__ - Step 25697: {'lr': 0.0004690357526791547, 'samples': 4933824, 'steps': 25696, 'loss/train': 0.2671090066432953} -08/30/2021 17:47:11 - INFO - __main__ - Step 25698: {'lr': 0.00046903319450696744, 'samples': 4934016, 'steps': 25697, 'loss/train': 1.2729966640472412} -08/30/2021 17:47:12 - INFO - __main__ - Step 25699: {'lr': 0.00046903063623608714, 'samples': 4934208, 'steps': 25698, 'loss/train': 1.397875189781189} -08/30/2021 17:47:12 - INFO - __main__ - Step 25700: {'lr': 0.00046902807786651507, 'samples': 4934400, 'steps': 25699, 'loss/train': 1.6402528285980225} -08/30/2021 17:47:13 - INFO - __main__ - Step 25701: {'lr': 0.00046902551939825236, 'samples': 4934592, 'steps': 25700, 'loss/train': 1.5903586149215698} -08/30/2021 17:47:13 - INFO - __main__ - Step 25702: {'lr': 0.00046902296083130003, 'samples': 4934784, 'steps': 25701, 'loss/train': 1.797283411026001} -08/30/2021 17:47:14 - INFO - __main__ - Step 25703: {'lr': 0.00046902040216565945, 'samples': 4934976, 'steps': 25702, 'loss/train': 1.37621009349823} -08/30/2021 17:47:15 - INFO - __main__ - Step 25704: {'lr': 0.0004690178434013316, 'samples': 4935168, 'steps': 25703, 'loss/train': 1.568002700805664} -08/30/2021 17:47:15 - INFO - __main__ - Step 25705: {'lr': 0.00046901528453831764, 'samples': 4935360, 'steps': 25704, 'loss/train': 2.126760482788086} -08/30/2021 17:47:16 - INFO - __main__ - Step 25706: {'lr': 0.0004690127255766188, 'samples': 4935552, 'steps': 25705, 'loss/train': 1.5658352375030518} -08/30/2021 17:47:16 - INFO - __main__ - Step 25707: {'lr': 0.0004690101665162362, 'samples': 4935744, 'steps': 25706, 'loss/train': 1.1048375368118286} -08/30/2021 17:47:17 - INFO - __main__ - Step 25708: {'lr': 0.00046900760735717103, 'samples': 4935936, 'steps': 25707, 'loss/train': 1.774127721786499} -08/30/2021 17:47:18 - INFO - __main__ - Step 25709: {'lr': 0.00046900504809942433, 'samples': 4936128, 'steps': 25708, 'loss/train': 1.4984357357025146} -08/30/2021 17:47:18 - INFO - __main__ - Step 25710: {'lr': 0.00046900248874299746, 'samples': 4936320, 'steps': 25709, 'loss/train': 1.3653550148010254} -08/30/2021 17:47:18 - INFO - __main__ - Step 25711: {'lr': 0.0004689999292878914, 'samples': 4936512, 'steps': 25710, 'loss/train': 1.5078903436660767} -08/30/2021 17:47:19 - INFO - __main__ - Step 25712: {'lr': 0.00046899736973410734, 'samples': 4936704, 'steps': 25711, 'loss/train': 3.89837384223938} -08/30/2021 17:47:19 - INFO - __main__ - Step 25713: {'lr': 0.0004689948100816465, 'samples': 4936896, 'steps': 25712, 'loss/train': 1.0883709192276} -08/30/2021 17:47:21 - INFO - __main__ - Step 25714: {'lr': 0.00046899225033050985, 'samples': 4937088, 'steps': 25713, 'loss/train': 1.235689401626587} -08/30/2021 17:47:21 - INFO - __main__ - Step 25715: {'lr': 0.0004689896904806987, 'samples': 4937280, 'steps': 25714, 'loss/train': 0.9609364867210388} -08/30/2021 17:47:22 - INFO - __main__ - Step 25716: {'lr': 0.0004689871305322143, 'samples': 4937472, 'steps': 25715, 'loss/train': 0.1189139187335968} -08/30/2021 17:47:22 - INFO - __main__ - Step 25717: {'lr': 0.0004689845704850576, 'samples': 4937664, 'steps': 25716, 'loss/train': 1.5079913139343262} -08/30/2021 17:47:22 - INFO - __main__ - Step 25718: {'lr': 0.0004689820103392298, 'samples': 4937856, 'steps': 25717, 'loss/train': 0.09478290379047394} -08/30/2021 17:47:24 - INFO - __main__ - Step 25719: {'lr': 0.0004689794500947321, 'samples': 4938048, 'steps': 25718, 'loss/train': 1.803954839706421} -08/30/2021 17:47:25 - INFO - __main__ - Step 25720: {'lr': 0.0004689768897515657, 'samples': 4938240, 'steps': 25719, 'loss/train': 1.8638983964920044} -08/30/2021 17:47:25 - INFO - __main__ - Step 25721: {'lr': 0.0004689743293097316, 'samples': 4938432, 'steps': 25720, 'loss/train': 0.07366359978914261} -08/30/2021 17:47:26 - INFO - __main__ - Step 25722: {'lr': 0.0004689717687692311, 'samples': 4938624, 'steps': 25721, 'loss/train': 0.05595998093485832} -08/30/2021 17:47:26 - INFO - __main__ - Step 25723: {'lr': 0.0004689692081300653, 'samples': 4938816, 'steps': 25722, 'loss/train': 1.9962135553359985} -08/30/2021 17:47:28 - INFO - __main__ - Step 25724: {'lr': 0.0004689666473922354, 'samples': 4939008, 'steps': 25723, 'loss/train': 1.1417449712753296} -08/30/2021 17:47:28 - INFO - __main__ - Step 25725: {'lr': 0.0004689640865557424, 'samples': 4939200, 'steps': 25724, 'loss/train': 2.1349759101867676} -08/30/2021 17:47:28 - INFO - __main__ - Step 25726: {'lr': 0.0004689615256205876, 'samples': 4939392, 'steps': 25725, 'loss/train': 1.6161985397338867} -08/30/2021 17:47:29 - INFO - __main__ - Step 25727: {'lr': 0.0004689589645867721, 'samples': 4939584, 'steps': 25726, 'loss/train': 1.3147382736206055} -08/30/2021 17:47:29 - INFO - __main__ - Step 25728: {'lr': 0.0004689564034542971, 'samples': 4939776, 'steps': 25727, 'loss/train': 1.0522000789642334} -08/30/2021 17:47:31 - INFO - __main__ - Step 25729: {'lr': 0.00046895384222316375, 'samples': 4939968, 'steps': 25728, 'loss/train': 0.741268515586853} -08/30/2021 17:47:31 - INFO - __main__ - Step 25730: {'lr': 0.0004689512808933731, 'samples': 4940160, 'steps': 25729, 'loss/train': 1.3964345455169678} -08/30/2021 17:47:31 - INFO - __main__ - Step 25731: {'lr': 0.0004689487194649265, 'samples': 4940352, 'steps': 25730, 'loss/train': 1.5941787958145142} -08/30/2021 17:47:32 - INFO - __main__ - Step 25732: {'lr': 0.0004689461579378249, 'samples': 4940544, 'steps': 25731, 'loss/train': 0.07148110121488571} -08/30/2021 17:47:32 - INFO - __main__ - Step 25733: {'lr': 0.0004689435963120696, 'samples': 4940736, 'steps': 25732, 'loss/train': 1.2390637397766113} -08/30/2021 17:47:34 - INFO - __main__ - Step 25734: {'lr': 0.00046894103458766163, 'samples': 4940928, 'steps': 25733, 'loss/train': 1.6882007122039795} -08/30/2021 17:47:34 - INFO - __main__ - Step 25735: {'lr': 0.0004689384727646022, 'samples': 4941120, 'steps': 25734, 'loss/train': 1.6453152894973755} -08/30/2021 17:47:34 - INFO - __main__ - Step 25736: {'lr': 0.00046893591084289256, 'samples': 4941312, 'steps': 25735, 'loss/train': 1.415347933769226} -08/30/2021 17:47:35 - INFO - __main__ - Step 25737: {'lr': 0.0004689333488225337, 'samples': 4941504, 'steps': 25736, 'loss/train': 2.184805393218994} -08/30/2021 17:47:35 - INFO - __main__ - Step 25738: {'lr': 0.00046893078670352686, 'samples': 4941696, 'steps': 25737, 'loss/train': 1.5168434381484985} -08/30/2021 17:47:37 - INFO - __main__ - Step 25739: {'lr': 0.0004689282244858732, 'samples': 4941888, 'steps': 25738, 'loss/train': 1.8757611513137817} -08/30/2021 17:47:37 - INFO - __main__ - Step 25740: {'lr': 0.00046892566216957387, 'samples': 4942080, 'steps': 25739, 'loss/train': 0.890189528465271} -08/30/2021 17:47:37 - INFO - __main__ - Step 25741: {'lr': 0.00046892309975463, 'samples': 4942272, 'steps': 25740, 'loss/train': 0.6732057332992554} -08/30/2021 17:47:38 - INFO - __main__ - Step 25742: {'lr': 0.0004689205372410427, 'samples': 4942464, 'steps': 25741, 'loss/train': 1.7113462686538696} -08/30/2021 17:47:38 - INFO - __main__ - Step 25743: {'lr': 0.00046891797462881327, 'samples': 4942656, 'steps': 25742, 'loss/train': 1.5250897407531738} -08/30/2021 17:47:40 - INFO - __main__ - Step 25744: {'lr': 0.0004689154119179427, 'samples': 4942848, 'steps': 25743, 'loss/train': 0.9668641090393066} -08/30/2021 17:47:40 - INFO - __main__ - Step 25745: {'lr': 0.00046891284910843237, 'samples': 4943040, 'steps': 25744, 'loss/train': 1.6589901447296143} -08/30/2021 17:47:40 - INFO - __main__ - Step 25746: {'lr': 0.0004689102862002832, 'samples': 4943232, 'steps': 25745, 'loss/train': 1.1028515100479126} -08/30/2021 17:47:41 - INFO - __main__ - Step 25747: {'lr': 0.00046890772319349637, 'samples': 4943424, 'steps': 25746, 'loss/train': 0.047654375433921814} -08/30/2021 17:47:41 - INFO - __main__ - Step 25748: {'lr': 0.00046890516008807315, 'samples': 4943616, 'steps': 25747, 'loss/train': 1.8506273031234741} -08/30/2021 17:47:43 - INFO - __main__ - Step 25749: {'lr': 0.0004689025968840147, 'samples': 4943808, 'steps': 25748, 'loss/train': 1.621748447418213} -08/30/2021 17:47:43 - INFO - __main__ - Step 25750: {'lr': 0.00046890003358132204, 'samples': 4944000, 'steps': 25749, 'loss/train': 0.8986481428146362} -08/30/2021 17:47:43 - INFO - __main__ - Step 25751: {'lr': 0.0004688974701799964, 'samples': 4944192, 'steps': 25750, 'loss/train': 1.985831379890442} -08/30/2021 17:47:44 - INFO - __main__ - Step 25752: {'lr': 0.00046889490668003896, 'samples': 4944384, 'steps': 25751, 'loss/train': 1.158137321472168} -08/30/2021 17:47:44 - INFO - __main__ - Step 25753: {'lr': 0.0004688923430814509, 'samples': 4944576, 'steps': 25752, 'loss/train': 2.002857208251953} -08/30/2021 17:47:44 - INFO - __main__ - Step 25754: {'lr': 0.00046888977938423326, 'samples': 4944768, 'steps': 25753, 'loss/train': 1.1062910556793213} -08/30/2021 17:47:46 - INFO - __main__ - Step 25755: {'lr': 0.00046888721558838734, 'samples': 4944960, 'steps': 25754, 'loss/train': 1.763000249862671} -08/30/2021 17:47:46 - INFO - __main__ - Step 25756: {'lr': 0.00046888465169391414, 'samples': 4945152, 'steps': 25755, 'loss/train': 1.028965711593628} -08/30/2021 17:47:47 - INFO - __main__ - Step 25757: {'lr': 0.00046888208770081493, 'samples': 4945344, 'steps': 25756, 'loss/train': 1.6193593740463257} -08/30/2021 17:47:47 - INFO - __main__ - Step 25758: {'lr': 0.0004688795236090908, 'samples': 4945536, 'steps': 25757, 'loss/train': 1.2246124744415283} -08/30/2021 17:47:47 - INFO - __main__ - Step 25759: {'lr': 0.000468876959418743, 'samples': 4945728, 'steps': 25758, 'loss/train': 1.90020751953125} -08/30/2021 17:47:49 - INFO - __main__ - Step 25760: {'lr': 0.0004688743951297726, 'samples': 4945920, 'steps': 25759, 'loss/train': 1.3285982608795166} -08/30/2021 17:47:49 - INFO - __main__ - Step 25761: {'lr': 0.0004688718307421807, 'samples': 4946112, 'steps': 25760, 'loss/train': 0.6641785502433777} -08/30/2021 17:47:50 - INFO - __main__ - Step 25762: {'lr': 0.0004688692662559686, 'samples': 4946304, 'steps': 25761, 'loss/train': 1.5299488306045532} -08/30/2021 17:47:50 - INFO - __main__ - Step 25763: {'lr': 0.00046886670167113734, 'samples': 4946496, 'steps': 25762, 'loss/train': 1.4613096714019775} -08/30/2021 17:47:50 - INFO - __main__ - Step 25764: {'lr': 0.00046886413698768816, 'samples': 4946688, 'steps': 25763, 'loss/train': 1.715574860572815} -08/30/2021 17:47:52 - INFO - __main__ - Step 25765: {'lr': 0.0004688615722056222, 'samples': 4946880, 'steps': 25764, 'loss/train': 1.7326476573944092} -08/30/2021 17:47:52 - INFO - __main__ - Step 25766: {'lr': 0.00046885900732494053, 'samples': 4947072, 'steps': 25765, 'loss/train': 1.8465771675109863} -08/30/2021 17:47:53 - INFO - __main__ - Step 25767: {'lr': 0.0004688564423456444, 'samples': 4947264, 'steps': 25766, 'loss/train': 2.3126943111419678} -08/30/2021 17:47:53 - INFO - __main__ - Step 25768: {'lr': 0.00046885387726773494, 'samples': 4947456, 'steps': 25767, 'loss/train': 1.471281886100769} -08/30/2021 17:47:53 - INFO - __main__ - Step 25769: {'lr': 0.0004688513120912133, 'samples': 4947648, 'steps': 25768, 'loss/train': 1.0972404479980469} -08/30/2021 17:47:55 - INFO - __main__ - Step 25770: {'lr': 0.0004688487468160806, 'samples': 4947840, 'steps': 25769, 'loss/train': 1.7421773672103882} -08/30/2021 17:47:55 - INFO - __main__ - Step 25771: {'lr': 0.000468846181442338, 'samples': 4948032, 'steps': 25770, 'loss/train': 1.0144166946411133} -08/30/2021 17:47:56 - INFO - __main__ - Step 25772: {'lr': 0.0004688436159699868, 'samples': 4948224, 'steps': 25771, 'loss/train': 1.7927099466323853} -08/30/2021 17:47:56 - INFO - __main__ - Step 25773: {'lr': 0.000468841050399028, 'samples': 4948416, 'steps': 25772, 'loss/train': 1.3223836421966553} -08/30/2021 17:47:56 - INFO - __main__ - Step 25774: {'lr': 0.0004688384847294628, 'samples': 4948608, 'steps': 25773, 'loss/train': 1.6288995742797852} -08/30/2021 17:47:58 - INFO - __main__ - Step 25775: {'lr': 0.0004688359189612923, 'samples': 4948800, 'steps': 25774, 'loss/train': 0.46493470668792725} -08/30/2021 17:47:59 - INFO - __main__ - Step 25776: {'lr': 0.0004688333530945178, 'samples': 4948992, 'steps': 25775, 'loss/train': 1.0550819635391235} -08/30/2021 17:47:59 - INFO - __main__ - Step 25777: {'lr': 0.0004688307871291403, 'samples': 4949184, 'steps': 25776, 'loss/train': 1.7852526903152466} -08/30/2021 17:47:59 - INFO - __main__ - Step 25778: {'lr': 0.0004688282210651611, 'samples': 4949376, 'steps': 25777, 'loss/train': 1.324590802192688} -08/30/2021 17:48:00 - INFO - __main__ - Step 25779: {'lr': 0.00046882565490258125, 'samples': 4949568, 'steps': 25778, 'loss/train': 1.9621769189834595} -08/30/2021 17:48:00 - INFO - __main__ - Step 25780: {'lr': 0.0004688230886414019, 'samples': 4949760, 'steps': 25779, 'loss/train': 1.7752286195755005} -08/30/2021 17:48:02 - INFO - __main__ - Step 25781: {'lr': 0.0004688205222816242, 'samples': 4949952, 'steps': 25780, 'loss/train': 1.5793185234069824} -08/30/2021 17:48:02 - INFO - __main__ - Step 25782: {'lr': 0.00046881795582324944, 'samples': 4950144, 'steps': 25781, 'loss/train': 1.5692440271377563} -08/30/2021 17:48:03 - INFO - __main__ - Step 25783: {'lr': 0.00046881538926627864, 'samples': 4950336, 'steps': 25782, 'loss/train': 1.4250872135162354} -08/30/2021 17:48:03 - INFO - __main__ - Step 25784: {'lr': 0.000468812822610713, 'samples': 4950528, 'steps': 25783, 'loss/train': 1.7000045776367188} -08/30/2021 17:48:03 - INFO - __main__ - Step 25785: {'lr': 0.00046881025585655367, 'samples': 4950720, 'steps': 25784, 'loss/train': 1.6478009223937988} -08/30/2021 17:48:05 - INFO - __main__ - Step 25786: {'lr': 0.0004688076890038019, 'samples': 4950912, 'steps': 25785, 'loss/train': 3.8902199268341064} -08/30/2021 17:48:05 - INFO - __main__ - Step 25787: {'lr': 0.00046880512205245867, 'samples': 4951104, 'steps': 25786, 'loss/train': 1.7694299221038818} -08/30/2021 17:48:06 - INFO - __main__ - Step 25788: {'lr': 0.00046880255500252526, 'samples': 4951296, 'steps': 25787, 'loss/train': 1.4008413553237915} -08/30/2021 17:48:06 - INFO - __main__ - Step 25789: {'lr': 0.0004687999878540028, 'samples': 4951488, 'steps': 25788, 'loss/train': 1.402262568473816} -08/30/2021 17:48:06 - INFO - __main__ - Step 25790: {'lr': 0.00046879742060689243, 'samples': 4951680, 'steps': 25789, 'loss/train': 1.4390090703964233} -08/30/2021 17:48:08 - INFO - __main__ - Step 25791: {'lr': 0.0004687948532611953, 'samples': 4951872, 'steps': 25790, 'loss/train': 1.5752841234207153} -08/30/2021 17:48:08 - INFO - __main__ - Step 25792: {'lr': 0.0004687922858169126, 'samples': 4952064, 'steps': 25791, 'loss/train': 1.81866455078125} -08/30/2021 17:48:09 - INFO - __main__ - Step 25793: {'lr': 0.0004687897182740455, 'samples': 4952256, 'steps': 25792, 'loss/train': 1.4577043056488037} -08/30/2021 17:48:09 - INFO - __main__ - Step 25794: {'lr': 0.0004687871506325951, 'samples': 4952448, 'steps': 25793, 'loss/train': 1.6696598529815674} -08/30/2021 17:48:09 - INFO - __main__ - Step 25795: {'lr': 0.00046878458289256264, 'samples': 4952640, 'steps': 25794, 'loss/train': 1.4243284463882446} -08/30/2021 17:48:11 - INFO - __main__ - Step 25796: {'lr': 0.00046878201505394913, 'samples': 4952832, 'steps': 25795, 'loss/train': 1.4257913827896118} -08/30/2021 17:48:12 - INFO - __main__ - Step 25797: {'lr': 0.0004687794471167559, 'samples': 4953024, 'steps': 25796, 'loss/train': 1.295582890510559} -08/30/2021 17:48:12 - INFO - __main__ - Step 25798: {'lr': 0.00046877687908098396, 'samples': 4953216, 'steps': 25797, 'loss/train': 1.5752441883087158} -08/30/2021 17:48:12 - INFO - __main__ - Step 25799: {'lr': 0.0004687743109466346, 'samples': 4953408, 'steps': 25798, 'loss/train': 0.2516460716724396} -08/30/2021 17:48:13 - INFO - __main__ - Step 25800: {'lr': 0.00046877174271370894, 'samples': 4953600, 'steps': 25799, 'loss/train': 1.274735927581787} -08/30/2021 17:48:14 - INFO - __main__ - Step 25801: {'lr': 0.000468769174382208, 'samples': 4953792, 'steps': 25800, 'loss/train': 0.0804050862789154} -08/30/2021 17:48:14 - INFO - __main__ - Step 25802: {'lr': 0.0004687666059521331, 'samples': 4953984, 'steps': 25801, 'loss/train': 1.858128547668457} -08/30/2021 17:48:15 - INFO - __main__ - Step 25803: {'lr': 0.0004687640374234854, 'samples': 4954176, 'steps': 25802, 'loss/train': 1.530103087425232} -08/30/2021 17:48:15 - INFO - __main__ - Step 25804: {'lr': 0.0004687614687962659, 'samples': 4954368, 'steps': 25803, 'loss/train': 0.8512210845947266} -08/30/2021 17:48:16 - INFO - __main__ - Step 25805: {'lr': 0.0004687589000704759, 'samples': 4954560, 'steps': 25804, 'loss/train': 1.9007976055145264} -08/30/2021 17:48:18 - INFO - __main__ - Step 25806: {'lr': 0.0004687563312461165, 'samples': 4954752, 'steps': 25805, 'loss/train': 1.5209821462631226} -08/30/2021 17:48:18 - INFO - __main__ - Step 25807: {'lr': 0.00046875376232318887, 'samples': 4954944, 'steps': 25806, 'loss/train': 1.3787906169891357} -08/30/2021 17:48:19 - INFO - __main__ - Step 25808: {'lr': 0.00046875119330169426, 'samples': 4955136, 'steps': 25807, 'loss/train': 0.5449550747871399} -08/30/2021 17:48:19 - INFO - __main__ - Step 25809: {'lr': 0.00046874862418163363, 'samples': 4955328, 'steps': 25808, 'loss/train': 0.5622909069061279} -08/30/2021 17:48:19 - INFO - __main__ - Step 25810: {'lr': 0.00046874605496300824, 'samples': 4955520, 'steps': 25809, 'loss/train': 1.6267250776290894} -08/30/2021 17:48:20 - INFO - __main__ - Step 25811: {'lr': 0.00046874348564581933, 'samples': 4955712, 'steps': 25810, 'loss/train': 1.5047783851623535} -08/30/2021 17:48:20 - INFO - __main__ - Step 25812: {'lr': 0.00046874091623006793, 'samples': 4955904, 'steps': 25811, 'loss/train': 1.4574873447418213} -08/30/2021 17:48:22 - INFO - __main__ - Step 25813: {'lr': 0.0004687383467157553, 'samples': 4956096, 'steps': 25812, 'loss/train': 1.5586751699447632} -08/30/2021 17:48:22 - INFO - __main__ - Step 25814: {'lr': 0.0004687357771028825, 'samples': 4956288, 'steps': 25813, 'loss/train': 1.671359658241272} -08/30/2021 17:48:22 - INFO - __main__ - Step 25815: {'lr': 0.00046873320739145073, 'samples': 4956480, 'steps': 25814, 'loss/train': 1.4551055431365967} -08/30/2021 17:48:23 - INFO - __main__ - Step 25816: {'lr': 0.0004687306375814612, 'samples': 4956672, 'steps': 25815, 'loss/train': 1.6281694173812866} -08/30/2021 17:48:23 - INFO - __main__ - Step 25817: {'lr': 0.000468728067672915, 'samples': 4956864, 'steps': 25816, 'loss/train': 1.8594871759414673} -08/30/2021 17:48:25 - INFO - __main__ - Step 25818: {'lr': 0.00046872549766581326, 'samples': 4957056, 'steps': 25817, 'loss/train': 1.5035878419876099} -08/30/2021 17:48:25 - INFO - __main__ - Step 25819: {'lr': 0.00046872292756015724, 'samples': 4957248, 'steps': 25818, 'loss/train': 1.4658355712890625} -08/30/2021 17:48:25 - INFO - __main__ - Step 25820: {'lr': 0.000468720357355948, 'samples': 4957440, 'steps': 25819, 'loss/train': 1.4506713151931763} -08/30/2021 17:48:26 - INFO - __main__ - Step 25821: {'lr': 0.00046871778705318673, 'samples': 4957632, 'steps': 25820, 'loss/train': 1.3372007608413696} -08/30/2021 17:48:26 - INFO - __main__ - Step 25822: {'lr': 0.0004687152166518747, 'samples': 4957824, 'steps': 25821, 'loss/train': 2.044471502304077} -08/30/2021 17:48:28 - INFO - __main__ - Step 25823: {'lr': 0.0004687126461520128, 'samples': 4958016, 'steps': 25822, 'loss/train': 1.5280523300170898} -08/30/2021 17:48:28 - INFO - __main__ - Step 25824: {'lr': 0.0004687100755536025, 'samples': 4958208, 'steps': 25823, 'loss/train': 1.6051236391067505} -08/30/2021 17:48:29 - INFO - __main__ - Step 25825: {'lr': 0.00046870750485664484, 'samples': 4958400, 'steps': 25824, 'loss/train': 0.11616300791501999} -08/30/2021 17:48:29 - INFO - __main__ - Step 25826: {'lr': 0.00046870493406114084, 'samples': 4958592, 'steps': 25825, 'loss/train': 1.6234893798828125} -08/30/2021 17:48:29 - INFO - __main__ - Step 25827: {'lr': 0.0004687023631670918, 'samples': 4958784, 'steps': 25826, 'loss/train': 1.6770555973052979} -08/30/2021 17:48:31 - INFO - __main__ - Step 25828: {'lr': 0.0004686997921744989, 'samples': 4958976, 'steps': 25827, 'loss/train': 0.9241091012954712} -08/30/2021 17:48:32 - INFO - __main__ - Step 25829: {'lr': 0.0004686972210833632, 'samples': 4959168, 'steps': 25828, 'loss/train': 0.8609564900398254} -08/30/2021 17:48:32 - INFO - __main__ - Step 25830: {'lr': 0.0004686946498936859, 'samples': 4959360, 'steps': 25829, 'loss/train': 0.9588181972503662} -08/30/2021 17:48:33 - INFO - __main__ - Step 25831: {'lr': 0.00046869207860546826, 'samples': 4959552, 'steps': 25830, 'loss/train': 1.30747652053833} -08/30/2021 17:48:33 - INFO - __main__ - Step 25832: {'lr': 0.00046868950721871126, 'samples': 4959744, 'steps': 25831, 'loss/train': 0.08194424957036972} -08/30/2021 17:48:35 - INFO - __main__ - Step 25833: {'lr': 0.00046868693573341616, 'samples': 4959936, 'steps': 25832, 'loss/train': 1.5127626657485962} -08/30/2021 17:48:35 - INFO - __main__ - Step 25834: {'lr': 0.00046868436414958405, 'samples': 4960128, 'steps': 25833, 'loss/train': 1.5270503759384155} -08/30/2021 17:48:35 - INFO - __main__ - Step 25835: {'lr': 0.00046868179246721623, 'samples': 4960320, 'steps': 25834, 'loss/train': 1.227791428565979} -08/30/2021 17:48:36 - INFO - __main__ - Step 25836: {'lr': 0.00046867922068631374, 'samples': 4960512, 'steps': 25835, 'loss/train': 1.333652377128601} -08/30/2021 17:48:36 - INFO - __main__ - Step 25837: {'lr': 0.00046867664880687775, 'samples': 4960704, 'steps': 25836, 'loss/train': 1.6279029846191406} -08/30/2021 17:48:37 - INFO - __main__ - Step 25838: {'lr': 0.00046867407682890937, 'samples': 4960896, 'steps': 25837, 'loss/train': 2.670116662979126} -08/30/2021 17:48:38 - INFO - __main__ - Step 25839: {'lr': 0.00046867150475240994, 'samples': 4961088, 'steps': 25838, 'loss/train': 1.530759334564209} -08/30/2021 17:48:39 - INFO - __main__ - Step 25840: {'lr': 0.0004686689325773805, 'samples': 4961280, 'steps': 25839, 'loss/train': 0.8202062845230103} -08/30/2021 17:48:39 - INFO - __main__ - Step 25841: {'lr': 0.00046866636030382217, 'samples': 4961472, 'steps': 25840, 'loss/train': 0.588380753993988} -08/30/2021 17:48:40 - INFO - __main__ - Step 25842: {'lr': 0.00046866378793173616, 'samples': 4961664, 'steps': 25841, 'loss/train': 0.047773007303476334} -08/30/2021 17:48:40 - INFO - __main__ - Step 25843: {'lr': 0.0004686612154611236, 'samples': 4961856, 'steps': 25842, 'loss/train': 0.8975650668144226} -08/30/2021 17:48:40 - INFO - __main__ - Step 25844: {'lr': 0.0004686586428919857, 'samples': 4962048, 'steps': 25843, 'loss/train': 1.4415950775146484} -08/30/2021 17:48:42 - INFO - __main__ - Step 25845: {'lr': 0.00046865607022432356, 'samples': 4962240, 'steps': 25844, 'loss/train': 1.4818027019500732} -08/30/2021 17:48:43 - INFO - __main__ - Step 25846: {'lr': 0.00046865349745813835, 'samples': 4962432, 'steps': 25845, 'loss/train': 0.41203126311302185} -08/30/2021 17:48:43 - INFO - __main__ - Step 25847: {'lr': 0.00046865092459343126, 'samples': 4962624, 'steps': 25846, 'loss/train': 0.39638659358024597} -08/30/2021 17:48:43 - INFO - __main__ - Step 25848: {'lr': 0.00046864835163020353, 'samples': 4962816, 'steps': 25847, 'loss/train': 3.1060988903045654} -08/30/2021 17:48:44 - INFO - __main__ - Step 25849: {'lr': 0.00046864577856845613, 'samples': 4963008, 'steps': 25848, 'loss/train': 1.3016031980514526} -08/30/2021 17:48:45 - INFO - __main__ - Step 25850: {'lr': 0.0004686432054081904, 'samples': 4963200, 'steps': 25849, 'loss/train': 1.7076200246810913} -08/30/2021 17:48:46 - INFO - __main__ - Step 25851: {'lr': 0.00046864063214940735, 'samples': 4963392, 'steps': 25850, 'loss/train': 1.5625218152999878} -08/30/2021 17:48:46 - INFO - __main__ - Step 25852: {'lr': 0.0004686380587921082, 'samples': 4963584, 'steps': 25851, 'loss/train': 1.1658756732940674} -08/30/2021 17:48:46 - INFO - __main__ - Step 25853: {'lr': 0.00046863548533629406, 'samples': 4963776, 'steps': 25852, 'loss/train': 1.4682843685150146} -08/30/2021 17:48:47 - INFO - __main__ - Step 25854: {'lr': 0.00046863291178196625, 'samples': 4963968, 'steps': 25853, 'loss/train': 1.3993884325027466} -08/30/2021 17:48:48 - INFO - __main__ - Step 25855: {'lr': 0.0004686303381291258, 'samples': 4964160, 'steps': 25854, 'loss/train': 1.115661382675171} -08/30/2021 17:48:49 - INFO - __main__ - Step 25856: {'lr': 0.00046862776437777386, 'samples': 4964352, 'steps': 25855, 'loss/train': 1.8204008340835571} -08/30/2021 17:48:49 - INFO - __main__ - Step 25857: {'lr': 0.00046862519052791166, 'samples': 4964544, 'steps': 25856, 'loss/train': 1.7891380786895752} -08/30/2021 17:48:49 - INFO - __main__ - Step 25858: {'lr': 0.00046862261657954033, 'samples': 4964736, 'steps': 25857, 'loss/train': 1.8477543592453003} -08/30/2021 17:48:50 - INFO - __main__ - Step 25859: {'lr': 0.000468620042532661, 'samples': 4964928, 'steps': 25858, 'loss/train': 1.9821393489837646} -08/30/2021 17:48:50 - INFO - __main__ - Step 25860: {'lr': 0.0004686174683872748, 'samples': 4965120, 'steps': 25859, 'loss/train': 1.1302052736282349} -08/30/2021 17:48:52 - INFO - __main__ - Step 25861: {'lr': 0.00046861489414338304, 'samples': 4965312, 'steps': 25860, 'loss/train': 1.3140689134597778} -08/30/2021 17:48:52 - INFO - __main__ - Step 25862: {'lr': 0.0004686123198009867, 'samples': 4965504, 'steps': 25861, 'loss/train': 1.688848853111267} -08/30/2021 17:48:52 - INFO - __main__ - Step 25863: {'lr': 0.00046860974536008706, 'samples': 4965696, 'steps': 25862, 'loss/train': 2.353419065475464} -08/30/2021 17:48:53 - INFO - __main__ - Step 25864: {'lr': 0.0004686071708206853, 'samples': 4965888, 'steps': 25863, 'loss/train': 1.376936912536621} -08/30/2021 17:48:53 - INFO - __main__ - Step 25865: {'lr': 0.0004686045961827824, 'samples': 4966080, 'steps': 25864, 'loss/train': 1.745242714881897} -08/30/2021 17:48:55 - INFO - __main__ - Step 25866: {'lr': 0.00046860202144637976, 'samples': 4966272, 'steps': 25865, 'loss/train': 1.4062267541885376} -08/30/2021 17:48:55 - INFO - __main__ - Step 25867: {'lr': 0.00046859944661147837, 'samples': 4966464, 'steps': 25866, 'loss/train': 1.6638727188110352} -08/30/2021 17:48:55 - INFO - __main__ - Step 25868: {'lr': 0.00046859687167807943, 'samples': 4966656, 'steps': 25867, 'loss/train': 1.9906589984893799} -08/30/2021 17:48:56 - INFO - __main__ - Step 25869: {'lr': 0.0004685942966461841, 'samples': 4966848, 'steps': 25868, 'loss/train': 0.9553824663162231} -08/30/2021 17:48:56 - INFO - __main__ - Step 25870: {'lr': 0.00046859172151579354, 'samples': 4967040, 'steps': 25869, 'loss/train': 1.0746548175811768} -08/30/2021 17:48:58 - INFO - __main__ - Step 25871: {'lr': 0.00046858914628690896, 'samples': 4967232, 'steps': 25870, 'loss/train': 1.5431541204452515} -08/30/2021 17:48:58 - INFO - __main__ - Step 25872: {'lr': 0.0004685865709595315, 'samples': 4967424, 'steps': 25871, 'loss/train': 0.1604749858379364} -08/30/2021 17:48:59 - INFO - __main__ - Step 25873: {'lr': 0.00046858399553366224, 'samples': 4967616, 'steps': 25872, 'loss/train': 0.8738030791282654} -08/30/2021 17:48:59 - INFO - __main__ - Step 25874: {'lr': 0.0004685814200093025, 'samples': 4967808, 'steps': 25873, 'loss/train': 1.4320909976959229} -08/30/2021 17:48:59 - INFO - __main__ - Step 25875: {'lr': 0.00046857884438645327, 'samples': 4968000, 'steps': 25874, 'loss/train': 1.1554865837097168} -08/30/2021 17:49:01 - INFO - __main__ - Step 25876: {'lr': 0.0004685762686651158, 'samples': 4968192, 'steps': 25875, 'loss/train': 1.8846144676208496} -08/30/2021 17:49:02 - INFO - __main__ - Step 25877: {'lr': 0.0004685736928452913, 'samples': 4968384, 'steps': 25876, 'loss/train': 0.9436670541763306} -08/30/2021 17:49:02 - INFO - __main__ - Step 25878: {'lr': 0.00046857111692698083, 'samples': 4968576, 'steps': 25877, 'loss/train': 1.8042160272598267} -08/30/2021 17:49:02 - INFO - __main__ - Step 25879: {'lr': 0.0004685685409101855, 'samples': 4968768, 'steps': 25878, 'loss/train': 1.3830060958862305} -08/30/2021 17:49:03 - INFO - __main__ - Step 25880: {'lr': 0.00046856596479490667, 'samples': 4968960, 'steps': 25879, 'loss/train': 0.16645364463329315} -08/30/2021 17:49:05 - INFO - __main__ - Step 25881: {'lr': 0.0004685633885811453, 'samples': 4969152, 'steps': 25880, 'loss/train': 1.3824928998947144} -08/30/2021 17:49:05 - INFO - __main__ - Step 25882: {'lr': 0.0004685608122689027, 'samples': 4969344, 'steps': 25881, 'loss/train': 0.9586479663848877} -08/30/2021 17:49:06 - INFO - __main__ - Step 25883: {'lr': 0.00046855823585818004, 'samples': 4969536, 'steps': 25882, 'loss/train': 1.8196073770523071} -08/30/2021 17:49:06 - INFO - __main__ - Step 25884: {'lr': 0.0004685556593489783, 'samples': 4969728, 'steps': 25883, 'loss/train': 1.5329629182815552} -08/30/2021 17:49:06 - INFO - __main__ - Step 25885: {'lr': 0.0004685530827412988, 'samples': 4969920, 'steps': 25884, 'loss/train': 1.9199702739715576} -08/30/2021 17:49:08 - INFO - __main__ - Step 25886: {'lr': 0.0004685505060351426, 'samples': 4970112, 'steps': 25885, 'loss/train': 0.08527534455060959} -08/30/2021 17:49:08 - INFO - __main__ - Step 25887: {'lr': 0.00046854792923051094, 'samples': 4970304, 'steps': 25886, 'loss/train': 1.6177213191986084} -08/30/2021 17:49:09 - INFO - __main__ - Step 25888: {'lr': 0.00046854535232740505, 'samples': 4970496, 'steps': 25887, 'loss/train': 1.8536111116409302} -08/30/2021 17:49:09 - INFO - __main__ - Step 25889: {'lr': 0.00046854277532582585, 'samples': 4970688, 'steps': 25888, 'loss/train': 1.2673453092575073} -08/30/2021 17:49:10 - INFO - __main__ - Step 25890: {'lr': 0.0004685401982257747, 'samples': 4970880, 'steps': 25889, 'loss/train': 1.2118864059448242} -08/30/2021 17:49:11 - INFO - __main__ - Step 25891: {'lr': 0.0004685376210272527, 'samples': 4971072, 'steps': 25890, 'loss/train': 1.2783883810043335} -08/30/2021 17:49:11 - INFO - __main__ - Step 25892: {'lr': 0.00046853504373026107, 'samples': 4971264, 'steps': 25891, 'loss/train': 1.3913556337356567} -08/30/2021 17:49:12 - INFO - __main__ - Step 25893: {'lr': 0.00046853246633480087, 'samples': 4971456, 'steps': 25892, 'loss/train': 0.5311654806137085} -08/30/2021 17:49:12 - INFO - __main__ - Step 25894: {'lr': 0.0004685298888408733, 'samples': 4971648, 'steps': 25893, 'loss/train': 1.2150635719299316} -08/30/2021 17:49:13 - INFO - __main__ - Step 25895: {'lr': 0.0004685273112484796, 'samples': 4971840, 'steps': 25894, 'loss/train': 1.3217010498046875} -08/30/2021 17:49:14 - INFO - __main__ - Step 25896: {'lr': 0.0004685247335576209, 'samples': 4972032, 'steps': 25895, 'loss/train': 1.5537326335906982} -08/30/2021 17:49:15 - INFO - __main__ - Step 25897: {'lr': 0.00046852215576829824, 'samples': 4972224, 'steps': 25896, 'loss/train': 2.15730881690979} -08/30/2021 17:49:15 - INFO - __main__ - Step 25898: {'lr': 0.0004685195778805129, 'samples': 4972416, 'steps': 25897, 'loss/train': 1.7009484767913818} -08/30/2021 17:49:15 - INFO - __main__ - Step 25899: {'lr': 0.000468516999894266, 'samples': 4972608, 'steps': 25898, 'loss/train': 1.350884199142456} -08/30/2021 17:49:16 - INFO - __main__ - Step 25900: {'lr': 0.0004685144218095587, 'samples': 4972800, 'steps': 25899, 'loss/train': 1.6464431285858154} -08/30/2021 17:49:16 - INFO - __main__ - Step 25901: {'lr': 0.00046851184362639223, 'samples': 4972992, 'steps': 25900, 'loss/train': 1.436650037765503} -08/30/2021 17:49:18 - INFO - __main__ - Step 25902: {'lr': 0.0004685092653447676, 'samples': 4973184, 'steps': 25901, 'loss/train': 1.5484634637832642} -08/30/2021 17:49:18 - INFO - __main__ - Step 25903: {'lr': 0.00046850668696468614, 'samples': 4973376, 'steps': 25902, 'loss/train': 1.5408024787902832} -08/30/2021 17:49:19 - INFO - __main__ - Step 25904: {'lr': 0.0004685041084861489, 'samples': 4973568, 'steps': 25903, 'loss/train': 1.5481486320495605} -08/30/2021 17:49:19 - INFO - __main__ - Step 25905: {'lr': 0.00046850152990915705, 'samples': 4973760, 'steps': 25904, 'loss/train': 2.10436749458313} -08/30/2021 17:49:19 - INFO - __main__ - Step 25906: {'lr': 0.0004684989512337119, 'samples': 4973952, 'steps': 25905, 'loss/train': 1.1209992170333862} -08/30/2021 17:49:21 - INFO - __main__ - Step 25907: {'lr': 0.00046849637245981434, 'samples': 4974144, 'steps': 25906, 'loss/train': 1.4587196111679077} -08/30/2021 17:49:21 - INFO - __main__ - Step 25908: {'lr': 0.0004684937935874658, 'samples': 4974336, 'steps': 25907, 'loss/train': 1.7507963180541992} -08/30/2021 17:49:22 - INFO - __main__ - Step 25909: {'lr': 0.00046849121461666734, 'samples': 4974528, 'steps': 25908, 'loss/train': 1.6651357412338257} -08/30/2021 17:49:22 - INFO - __main__ - Step 25910: {'lr': 0.00046848863554742006, 'samples': 4974720, 'steps': 25909, 'loss/train': 0.44157132506370544} -08/30/2021 17:49:22 - INFO - __main__ - Step 25911: {'lr': 0.0004684860563797252, 'samples': 4974912, 'steps': 25910, 'loss/train': 1.385323166847229} -08/30/2021 17:49:24 - INFO - __main__ - Step 25912: {'lr': 0.00046848347711358384, 'samples': 4975104, 'steps': 25911, 'loss/train': 1.5163391828536987} -08/30/2021 17:49:24 - INFO - __main__ - Step 25913: {'lr': 0.0004684808977489973, 'samples': 4975296, 'steps': 25912, 'loss/train': 1.2386027574539185} -08/30/2021 17:49:25 - INFO - __main__ - Step 25914: {'lr': 0.00046847831828596647, 'samples': 4975488, 'steps': 25913, 'loss/train': 1.4422698020935059} -08/30/2021 17:49:25 - INFO - __main__ - Step 25915: {'lr': 0.0004684757387244928, 'samples': 4975680, 'steps': 25914, 'loss/train': 1.869231104850769} -08/30/2021 17:49:25 - INFO - __main__ - Step 25916: {'lr': 0.00046847315906457733, 'samples': 4975872, 'steps': 25915, 'loss/train': 1.5322262048721313} -08/30/2021 17:49:27 - INFO - __main__ - Step 25917: {'lr': 0.0004684705793062212, 'samples': 4976064, 'steps': 25916, 'loss/train': 1.3759723901748657} -08/30/2021 17:49:27 - INFO - __main__ - Step 25918: {'lr': 0.00046846799944942564, 'samples': 4976256, 'steps': 25917, 'loss/train': 1.4368705749511719} -08/30/2021 17:49:28 - INFO - __main__ - Step 25919: {'lr': 0.00046846541949419177, 'samples': 4976448, 'steps': 25918, 'loss/train': 0.6463767886161804} -08/30/2021 17:49:28 - INFO - __main__ - Step 25920: {'lr': 0.00046846283944052073, 'samples': 4976640, 'steps': 25919, 'loss/train': 1.723982334136963} -08/30/2021 17:49:28 - INFO - __main__ - Step 25921: {'lr': 0.0004684602592884136, 'samples': 4976832, 'steps': 25920, 'loss/train': 0.3706967830657959} -08/30/2021 17:49:30 - INFO - __main__ - Step 25922: {'lr': 0.0004684576790378718, 'samples': 4977024, 'steps': 25921, 'loss/train': 1.5728548765182495} -08/30/2021 17:49:31 - INFO - __main__ - Step 25923: {'lr': 0.00046845509868889625, 'samples': 4977216, 'steps': 25922, 'loss/train': 1.5348352193832397} -08/30/2021 17:49:31 - INFO - __main__ - Step 25924: {'lr': 0.00046845251824148825, 'samples': 4977408, 'steps': 25923, 'loss/train': 1.6719447374343872} -08/30/2021 17:49:31 - INFO - __main__ - Step 25925: {'lr': 0.0004684499376956489, 'samples': 4977600, 'steps': 25924, 'loss/train': 0.8076337575912476} -08/30/2021 17:49:32 - INFO - __main__ - Step 25926: {'lr': 0.00046844735705137944, 'samples': 4977792, 'steps': 25925, 'loss/train': 1.2432372570037842} -08/30/2021 17:49:32 - INFO - __main__ - Step 25927: {'lr': 0.0004684447763086809, 'samples': 4977984, 'steps': 25926, 'loss/train': 1.2376854419708252} -08/30/2021 17:49:34 - INFO - __main__ - Step 25928: {'lr': 0.00046844219546755454, 'samples': 4978176, 'steps': 25927, 'loss/train': 2.077136754989624} -08/30/2021 17:49:34 - INFO - __main__ - Step 25929: {'lr': 0.0004684396145280014, 'samples': 4978368, 'steps': 25928, 'loss/train': 1.3480955362319946} -08/30/2021 17:49:34 - INFO - __main__ - Step 25930: {'lr': 0.00046843703349002286, 'samples': 4978560, 'steps': 25929, 'loss/train': 1.5316728353500366} -08/30/2021 17:49:35 - INFO - __main__ - Step 25931: {'lr': 0.00046843445235361994, 'samples': 4978752, 'steps': 25930, 'loss/train': 0.6487564444541931} -08/30/2021 17:49:35 - INFO - __main__ - Step 25932: {'lr': 0.0004684318711187938, 'samples': 4978944, 'steps': 25931, 'loss/train': 0.9000486135482788} -08/30/2021 17:49:37 - INFO - __main__ - Step 25933: {'lr': 0.0004684292897855457, 'samples': 4979136, 'steps': 25932, 'loss/train': 1.7701318264007568} -08/30/2021 17:49:37 - INFO - __main__ - Step 25934: {'lr': 0.00046842670835387667, 'samples': 4979328, 'steps': 25933, 'loss/train': 1.7426519393920898} -08/30/2021 17:49:38 - INFO - __main__ - Step 25935: {'lr': 0.00046842412682378796, 'samples': 4979520, 'steps': 25934, 'loss/train': 2.0687735080718994} -08/30/2021 17:49:38 - INFO - __main__ - Step 25936: {'lr': 0.0004684215451952807, 'samples': 4979712, 'steps': 25935, 'loss/train': 0.18766005337238312} -08/30/2021 17:49:38 - INFO - __main__ - Step 25937: {'lr': 0.000468418963468356, 'samples': 4979904, 'steps': 25936, 'loss/train': 0.8473954200744629} -08/30/2021 17:49:40 - INFO - __main__ - Step 25938: {'lr': 0.0004684163816430152, 'samples': 4980096, 'steps': 25937, 'loss/train': 1.2398358583450317} -08/30/2021 17:49:41 - INFO - __main__ - Step 25939: {'lr': 0.00046841379971925923, 'samples': 4980288, 'steps': 25938, 'loss/train': 2.2545342445373535} -08/30/2021 17:49:41 - INFO - __main__ - Step 25940: {'lr': 0.0004684112176970895, 'samples': 4980480, 'steps': 25939, 'loss/train': 0.9708952307701111} -08/30/2021 17:49:42 - INFO - __main__ - Step 25941: {'lr': 0.0004684086355765069, 'samples': 4980672, 'steps': 25940, 'loss/train': 1.5442172288894653} -08/30/2021 17:49:42 - INFO - __main__ - Step 25942: {'lr': 0.00046840605335751284, 'samples': 4980864, 'steps': 25941, 'loss/train': 0.12289529293775558} -08/30/2021 17:49:42 - INFO - __main__ - Step 25943: {'lr': 0.0004684034710401084, 'samples': 4981056, 'steps': 25942, 'loss/train': 1.1677873134613037} -08/30/2021 17:49:44 - INFO - __main__ - Step 25944: {'lr': 0.00046840088862429465, 'samples': 4981248, 'steps': 25943, 'loss/train': 0.9567702412605286} -08/30/2021 17:49:44 - INFO - __main__ - Step 25945: {'lr': 0.00046839830611007297, 'samples': 4981440, 'steps': 25944, 'loss/train': 1.7980859279632568} -08/30/2021 17:49:44 - INFO - __main__ - Step 25946: {'lr': 0.00046839572349744417, 'samples': 4981632, 'steps': 25945, 'loss/train': 1.9469941854476929} -08/30/2021 17:49:45 - INFO - __main__ - Step 25947: {'lr': 0.0004683931407864098, 'samples': 4981824, 'steps': 25946, 'loss/train': 1.7215113639831543} -08/30/2021 17:49:45 - INFO - __main__ - Step 25948: {'lr': 0.0004683905579769708, 'samples': 4982016, 'steps': 25947, 'loss/train': 1.8378640413284302} -08/30/2021 17:49:47 - INFO - __main__ - Step 25949: {'lr': 0.0004683879750691283, 'samples': 4982208, 'steps': 25948, 'loss/train': 1.6385730504989624} -08/30/2021 17:49:47 - INFO - __main__ - Step 25950: {'lr': 0.00046838539206288366, 'samples': 4982400, 'steps': 25949, 'loss/train': 0.9481050968170166} -08/30/2021 17:49:48 - INFO - __main__ - Step 25951: {'lr': 0.00046838280895823795, 'samples': 4982592, 'steps': 25950, 'loss/train': 1.8381636142730713} -08/30/2021 17:49:48 - INFO - __main__ - Step 25952: {'lr': 0.0004683802257551922, 'samples': 4982784, 'steps': 25951, 'loss/train': 0.21413718163967133} -08/30/2021 17:49:48 - INFO - __main__ - Step 25953: {'lr': 0.00046837764245374777, 'samples': 4982976, 'steps': 25952, 'loss/train': 1.6276837587356567} -08/30/2021 17:49:50 - INFO - __main__ - Step 25954: {'lr': 0.0004683750590539057, 'samples': 4983168, 'steps': 25953, 'loss/train': 1.499752163887024} -08/30/2021 17:49:51 - INFO - __main__ - Step 25955: {'lr': 0.00046837247555566727, 'samples': 4983360, 'steps': 25954, 'loss/train': 1.5714073181152344} -08/30/2021 17:49:51 - INFO - __main__ - Step 25956: {'lr': 0.00046836989195903344, 'samples': 4983552, 'steps': 25955, 'loss/train': 1.6329160928726196} -08/30/2021 17:49:51 - INFO - __main__ - Step 25957: {'lr': 0.00046836730826400565, 'samples': 4983744, 'steps': 25956, 'loss/train': 0.05928225815296173} -08/30/2021 17:49:52 - INFO - __main__ - Step 25958: {'lr': 0.00046836472447058485, 'samples': 4983936, 'steps': 25957, 'loss/train': 1.316361427307129} -08/30/2021 17:49:52 - INFO - __main__ - Step 25959: {'lr': 0.0004683621405787723, 'samples': 4984128, 'steps': 25958, 'loss/train': 1.761487364768982} -08/30/2021 17:49:54 - INFO - __main__ - Step 25960: {'lr': 0.0004683595565885691, 'samples': 4984320, 'steps': 25959, 'loss/train': 1.3059948682785034} -08/30/2021 17:49:54 - INFO - __main__ - Step 25961: {'lr': 0.0004683569724999765, 'samples': 4984512, 'steps': 25960, 'loss/train': 1.4094239473342896} -08/30/2021 17:49:54 - INFO - __main__ - Step 25962: {'lr': 0.0004683543883129956, 'samples': 4984704, 'steps': 25961, 'loss/train': 1.1170181035995483} -08/30/2021 17:49:55 - INFO - __main__ - Step 25963: {'lr': 0.00046835180402762756, 'samples': 4984896, 'steps': 25962, 'loss/train': 1.4737088680267334} -08/30/2021 17:49:55 - INFO - __main__ - Step 25964: {'lr': 0.00046834921964387363, 'samples': 4985088, 'steps': 25963, 'loss/train': 1.6293675899505615} -08/30/2021 17:49:57 - INFO - __main__ - Step 25965: {'lr': 0.0004683466351617348, 'samples': 4985280, 'steps': 25964, 'loss/train': 1.4512293338775635} -08/30/2021 17:49:57 - INFO - __main__ - Step 25966: {'lr': 0.00046834405058121244, 'samples': 4985472, 'steps': 25965, 'loss/train': 1.2718610763549805} -08/30/2021 17:49:58 - INFO - __main__ - Step 25967: {'lr': 0.0004683414659023076, 'samples': 4985664, 'steps': 25966, 'loss/train': 1.3894829750061035} -08/30/2021 17:49:58 - INFO - __main__ - Step 25968: {'lr': 0.0004683388811250214, 'samples': 4985856, 'steps': 25967, 'loss/train': 0.07728894799947739} -08/30/2021 17:49:58 - INFO - __main__ - Step 25969: {'lr': 0.0004683362962493552, 'samples': 4986048, 'steps': 25968, 'loss/train': 1.0849885940551758} -08/30/2021 17:50:00 - INFO - __main__ - Step 25970: {'lr': 0.00046833371127530995, 'samples': 4986240, 'steps': 25969, 'loss/train': 1.3206024169921875} -08/30/2021 17:50:00 - INFO - __main__ - Step 25971: {'lr': 0.00046833112620288684, 'samples': 4986432, 'steps': 25970, 'loss/train': 1.8398730754852295} -08/30/2021 17:50:01 - INFO - __main__ - Step 25972: {'lr': 0.0004683285410320872, 'samples': 4986624, 'steps': 25971, 'loss/train': 1.4553896188735962} -08/30/2021 17:50:01 - INFO - __main__ - Step 25973: {'lr': 0.000468325955762912, 'samples': 4986816, 'steps': 25972, 'loss/train': 2.4145243167877197} -08/30/2021 17:50:01 - INFO - __main__ - Step 25974: {'lr': 0.0004683233703953626, 'samples': 4987008, 'steps': 25973, 'loss/train': 0.05586782097816467} -08/30/2021 17:50:03 - INFO - __main__ - Step 25975: {'lr': 0.00046832078492944, 'samples': 4987200, 'steps': 25974, 'loss/train': 1.1521482467651367} -08/30/2021 17:50:04 - INFO - __main__ - Step 25976: {'lr': 0.0004683181993651454, 'samples': 4987392, 'steps': 25975, 'loss/train': 1.6343966722488403} -08/30/2021 17:50:04 - INFO - __main__ - Step 25977: {'lr': 0.0004683156137024801, 'samples': 4987584, 'steps': 25976, 'loss/train': 1.1978342533111572} -08/30/2021 17:50:05 - INFO - __main__ - Step 25978: {'lr': 0.00046831302794144504, 'samples': 4987776, 'steps': 25977, 'loss/train': 1.5771232843399048} -08/30/2021 17:50:05 - INFO - __main__ - Step 25979: {'lr': 0.00046831044208204154, 'samples': 4987968, 'steps': 25978, 'loss/train': 0.8119454383850098} -08/30/2021 17:50:05 - INFO - __main__ - Step 25980: {'lr': 0.0004683078561242707, 'samples': 4988160, 'steps': 25979, 'loss/train': 1.2827008962631226} -08/30/2021 17:50:06 - INFO - __main__ - Step 25981: {'lr': 0.00046830527006813373, 'samples': 4988352, 'steps': 25980, 'loss/train': 1.6679977178573608} -08/30/2021 17:50:07 - INFO - __main__ - Step 25982: {'lr': 0.00046830268391363176, 'samples': 4988544, 'steps': 25981, 'loss/train': 1.65229332447052} -08/30/2021 17:50:08 - INFO - __main__ - Step 25983: {'lr': 0.0004683000976607659, 'samples': 4988736, 'steps': 25982, 'loss/train': 1.8264904022216797} -08/30/2021 17:50:08 - INFO - __main__ - Step 25984: {'lr': 0.00046829751130953747, 'samples': 4988928, 'steps': 25983, 'loss/train': 1.3469122648239136} -08/30/2021 17:50:08 - INFO - __main__ - Step 25985: {'lr': 0.0004682949248599476, 'samples': 4989120, 'steps': 25984, 'loss/train': 1.5895007848739624} -08/30/2021 17:50:09 - INFO - __main__ - Step 25986: {'lr': 0.0004682923383119973, 'samples': 4989312, 'steps': 25985, 'loss/train': 1.8001866340637207} -08/30/2021 17:50:10 - INFO - __main__ - Step 25987: {'lr': 0.0004682897516656879, 'samples': 4989504, 'steps': 25986, 'loss/train': 1.8371360301971436} -08/30/2021 17:50:11 - INFO - __main__ - Step 25988: {'lr': 0.00046828716492102043, 'samples': 4989696, 'steps': 25987, 'loss/train': 1.1633650064468384} -08/30/2021 17:50:11 - INFO - __main__ - Step 25989: {'lr': 0.0004682845780779962, 'samples': 4989888, 'steps': 25988, 'loss/train': 1.2397024631500244} -08/30/2021 17:50:11 - INFO - __main__ - Step 25990: {'lr': 0.00046828199113661627, 'samples': 4990080, 'steps': 25989, 'loss/train': 1.7234729528427124} -08/30/2021 17:50:12 - INFO - __main__ - Step 25991: {'lr': 0.0004682794040968819, 'samples': 4990272, 'steps': 25990, 'loss/train': 1.2466639280319214} -08/30/2021 17:50:14 - INFO - __main__ - Step 25992: {'lr': 0.0004682768169587942, 'samples': 4990464, 'steps': 25991, 'loss/train': 1.100614070892334} -08/30/2021 17:50:15 - INFO - __main__ - Step 25993: {'lr': 0.0004682742297223543, 'samples': 4990656, 'steps': 25992, 'loss/train': 1.6922521591186523} -08/30/2021 17:50:15 - INFO - __main__ - Step 25994: {'lr': 0.00046827164238756337, 'samples': 4990848, 'steps': 25993, 'loss/train': 0.9433560371398926} -08/30/2021 17:50:15 - INFO - __main__ - Step 25995: {'lr': 0.00046826905495442263, 'samples': 4991040, 'steps': 25994, 'loss/train': 0.9941039681434631} -08/30/2021 17:50:16 - INFO - __main__ - Step 25996: {'lr': 0.00046826646742293326, 'samples': 4991232, 'steps': 25995, 'loss/train': 1.782634973526001} -08/30/2021 17:50:16 - INFO - __main__ - Step 25997: {'lr': 0.00046826387979309635, 'samples': 4991424, 'steps': 25996, 'loss/train': 3.086235761642456} -08/30/2021 17:50:18 - INFO - __main__ - Step 25998: {'lr': 0.0004682612920649131, 'samples': 4991616, 'steps': 25997, 'loss/train': 0.8794245719909668} -08/30/2021 17:50:18 - INFO - __main__ - Step 25999: {'lr': 0.00046825870423838466, 'samples': 4991808, 'steps': 25998, 'loss/train': 0.8561205863952637} -08/30/2021 17:50:18 - INFO - __main__ - Step 26000: {'lr': 0.00046825611631351227, 'samples': 4992000, 'steps': 25999, 'loss/train': 0.7992864847183228} -08/30/2021 17:50:19 - INFO - __main__ - Step 26001: {'lr': 0.00046825352829029705, 'samples': 4992192, 'steps': 26000, 'loss/train': 1.2635619640350342} -08/30/2021 17:50:19 - INFO - __main__ - Step 26002: {'lr': 0.00046825094016874014, 'samples': 4992384, 'steps': 26001, 'loss/train': 0.7718640565872192} -08/30/2021 17:50:21 - INFO - __main__ - Step 26003: {'lr': 0.00046824835194884273, 'samples': 4992576, 'steps': 26002, 'loss/train': 2.029985189437866} -08/30/2021 17:50:21 - INFO - __main__ - Step 26004: {'lr': 0.0004682457636306059, 'samples': 4992768, 'steps': 26003, 'loss/train': 0.8590334057807922} -08/30/2021 17:50:22 - INFO - __main__ - Step 26005: {'lr': 0.000468243175214031, 'samples': 4992960, 'steps': 26004, 'loss/train': 1.890396237373352} -08/30/2021 17:50:22 - INFO - __main__ - Step 26006: {'lr': 0.00046824058669911906, 'samples': 4993152, 'steps': 26005, 'loss/train': 1.6611837148666382} -08/30/2021 17:50:22 - INFO - __main__ - Step 26007: {'lr': 0.00046823799808587126, 'samples': 4993344, 'steps': 26006, 'loss/train': 1.3633774518966675} -08/30/2021 17:50:23 - INFO - __main__ - Step 26008: {'lr': 0.00046823540937428876, 'samples': 4993536, 'steps': 26007, 'loss/train': 1.5682960748672485} -08/30/2021 17:50:24 - INFO - __main__ - Step 26009: {'lr': 0.0004682328205643728, 'samples': 4993728, 'steps': 26008, 'loss/train': 1.2900131940841675} -08/30/2021 17:50:25 - INFO - __main__ - Step 26010: {'lr': 0.00046823023165612455, 'samples': 4993920, 'steps': 26009, 'loss/train': 1.6659449338912964} -08/30/2021 17:50:25 - INFO - __main__ - Step 26011: {'lr': 0.000468227642649545, 'samples': 4994112, 'steps': 26010, 'loss/train': 1.5601441860198975} -08/30/2021 17:50:25 - INFO - __main__ - Step 26012: {'lr': 0.00046822505354463553, 'samples': 4994304, 'steps': 26011, 'loss/train': 1.3833215236663818} -08/30/2021 17:50:26 - INFO - __main__ - Step 26013: {'lr': 0.0004682224643413972, 'samples': 4994496, 'steps': 26012, 'loss/train': 1.6717795133590698} -08/30/2021 17:50:27 - INFO - __main__ - Step 26014: {'lr': 0.0004682198750398312, 'samples': 4994688, 'steps': 26013, 'loss/train': 1.347379446029663} -08/30/2021 17:50:28 - INFO - __main__ - Step 26015: {'lr': 0.00046821728563993867, 'samples': 4994880, 'steps': 26014, 'loss/train': 0.42934542894363403} -08/30/2021 17:50:28 - INFO - __main__ - Step 26016: {'lr': 0.0004682146961417208, 'samples': 4995072, 'steps': 26015, 'loss/train': 1.59308922290802} -08/30/2021 17:50:28 - INFO - __main__ - Step 26017: {'lr': 0.00046821210654517874, 'samples': 4995264, 'steps': 26016, 'loss/train': 1.338724970817566} -08/30/2021 17:50:29 - INFO - __main__ - Step 26018: {'lr': 0.0004682095168503137, 'samples': 4995456, 'steps': 26017, 'loss/train': 1.399625539779663} -08/30/2021 17:50:30 - INFO - __main__ - Step 26019: {'lr': 0.00046820692705712685, 'samples': 4995648, 'steps': 26018, 'loss/train': 1.3258057832717896} -08/30/2021 17:50:31 - INFO - __main__ - Step 26020: {'lr': 0.00046820433716561927, 'samples': 4995840, 'steps': 26019, 'loss/train': 0.8071329593658447} -08/30/2021 17:50:31 - INFO - __main__ - Step 26021: {'lr': 0.0004682017471757922, 'samples': 4996032, 'steps': 26020, 'loss/train': 1.1271674633026123} -08/30/2021 17:50:32 - INFO - __main__ - Step 26022: {'lr': 0.0004681991570876468, 'samples': 4996224, 'steps': 26021, 'loss/train': 1.7399072647094727} -08/30/2021 17:50:32 - INFO - __main__ - Step 26023: {'lr': 0.00046819656690118424, 'samples': 4996416, 'steps': 26022, 'loss/train': 0.3772258162498474} -08/30/2021 17:50:32 - INFO - __main__ - Step 26024: {'lr': 0.00046819397661640563, 'samples': 4996608, 'steps': 26023, 'loss/train': 1.1453603506088257} -08/30/2021 17:50:34 - INFO - __main__ - Step 26025: {'lr': 0.0004681913862333122, 'samples': 4996800, 'steps': 26024, 'loss/train': 1.5894954204559326} -08/30/2021 17:50:34 - INFO - __main__ - Step 26026: {'lr': 0.0004681887957519051, 'samples': 4996992, 'steps': 26025, 'loss/train': 1.5680606365203857} -08/30/2021 17:50:35 - INFO - __main__ - Step 26027: {'lr': 0.00046818620517218544, 'samples': 4997184, 'steps': 26026, 'loss/train': 1.8114136457443237} -08/30/2021 17:50:35 - INFO - __main__ - Step 26028: {'lr': 0.00046818361449415456, 'samples': 4997376, 'steps': 26027, 'loss/train': 1.4232066869735718} -08/30/2021 17:50:35 - INFO - __main__ - Step 26029: {'lr': 0.00046818102371781343, 'samples': 4997568, 'steps': 26028, 'loss/train': 1.4627221822738647} -08/30/2021 17:50:37 - INFO - __main__ - Step 26030: {'lr': 0.0004681784328431633, 'samples': 4997760, 'steps': 26029, 'loss/train': 1.7061995267868042} -08/30/2021 17:50:37 - INFO - __main__ - Step 26031: {'lr': 0.0004681758418702054, 'samples': 4997952, 'steps': 26030, 'loss/train': 1.5513299703598022} -08/30/2021 17:50:37 - INFO - __main__ - Step 26032: {'lr': 0.0004681732507989408, 'samples': 4998144, 'steps': 26031, 'loss/train': 1.32917320728302} -08/30/2021 17:50:38 - INFO - __main__ - Step 26033: {'lr': 0.00046817065962937067, 'samples': 4998336, 'steps': 26032, 'loss/train': 1.118119478225708} -08/30/2021 17:50:38 - INFO - __main__ - Step 26034: {'lr': 0.00046816806836149624, 'samples': 4998528, 'steps': 26033, 'loss/train': 1.4400163888931274} -08/30/2021 17:50:40 - INFO - __main__ - Step 26035: {'lr': 0.00046816547699531866, 'samples': 4998720, 'steps': 26034, 'loss/train': 1.7957981824874878} -08/30/2021 17:50:40 - INFO - __main__ - Step 26036: {'lr': 0.000468162885530839, 'samples': 4998912, 'steps': 26035, 'loss/train': 1.4501303434371948} -08/30/2021 17:50:40 - INFO - __main__ - Step 26037: {'lr': 0.00046816029396805857, 'samples': 4999104, 'steps': 26036, 'loss/train': 1.2901222705841064} -08/30/2021 17:50:41 - INFO - __main__ - Step 26038: {'lr': 0.00046815770230697844, 'samples': 4999296, 'steps': 26037, 'loss/train': 1.858233094215393} -08/30/2021 17:50:41 - INFO - __main__ - Step 26039: {'lr': 0.0004681551105475999, 'samples': 4999488, 'steps': 26038, 'loss/train': 1.8129796981811523} -08/30/2021 17:50:41 - INFO - __main__ - Step 26040: {'lr': 0.0004681525186899239, 'samples': 4999680, 'steps': 26039, 'loss/train': 1.7217713594436646} -08/30/2021 17:50:43 - INFO - __main__ - Step 26041: {'lr': 0.00046814992673395185, 'samples': 4999872, 'steps': 26040, 'loss/train': 1.1990773677825928} -08/30/2021 17:50:44 - INFO - __main__ - Step 26042: {'lr': 0.0004681473346796848, 'samples': 5000064, 'steps': 26041, 'loss/train': 1.7544848918914795} -08/30/2021 17:50:44 - INFO - __main__ - Step 26043: {'lr': 0.0004681447425271239, 'samples': 5000256, 'steps': 26042, 'loss/train': 1.2271026372909546} -08/30/2021 17:50:44 - INFO - __main__ - Step 26044: {'lr': 0.0004681421502762704, 'samples': 5000448, 'steps': 26043, 'loss/train': 1.074222207069397} -08/30/2021 17:50:45 - INFO - __main__ - Step 26045: {'lr': 0.0004681395579271253, 'samples': 5000640, 'steps': 26044, 'loss/train': 2.0768239498138428} -08/30/2021 17:50:47 - INFO - __main__ - Step 26046: {'lr': 0.00046813696547969, 'samples': 5000832, 'steps': 26045, 'loss/train': 1.8352888822555542} -08/30/2021 17:50:48 - INFO - __main__ - Step 26047: {'lr': 0.00046813437293396543, 'samples': 5001024, 'steps': 26046, 'loss/train': 1.2411599159240723} -08/30/2021 17:50:48 - INFO - __main__ - Step 26048: {'lr': 0.000468131780289953, 'samples': 5001216, 'steps': 26047, 'loss/train': 4.784865379333496} -08/30/2021 17:50:48 - INFO - __main__ - Step 26049: {'lr': 0.00046812918754765364, 'samples': 5001408, 'steps': 26048, 'loss/train': 2.1499345302581787} -08/30/2021 17:50:49 - INFO - __main__ - Step 26050: {'lr': 0.00046812659470706877, 'samples': 5001600, 'steps': 26049, 'loss/train': 1.6595525741577148} -08/30/2021 17:50:49 - INFO - __main__ - Step 26051: {'lr': 0.0004681240017681993, 'samples': 5001792, 'steps': 26050, 'loss/train': 0.07554569095373154} -08/30/2021 17:50:51 - INFO - __main__ - Step 26052: {'lr': 0.00046812140873104657, 'samples': 5001984, 'steps': 26051, 'loss/train': 0.09549978375434875} -08/30/2021 17:50:51 - INFO - __main__ - Step 26053: {'lr': 0.00046811881559561167, 'samples': 5002176, 'steps': 26052, 'loss/train': 1.808426856994629} -08/30/2021 17:50:51 - INFO - __main__ - Step 26054: {'lr': 0.00046811622236189585, 'samples': 5002368, 'steps': 26053, 'loss/train': 2.0313563346862793} -08/30/2021 17:50:52 - INFO - __main__ - Step 26055: {'lr': 0.0004681136290299002, 'samples': 5002560, 'steps': 26054, 'loss/train': 1.5682562589645386} -08/30/2021 17:50:52 - INFO - __main__ - Step 26056: {'lr': 0.00046811103559962585, 'samples': 5002752, 'steps': 26055, 'loss/train': 1.0956287384033203} -08/30/2021 17:50:54 - INFO - __main__ - Step 26057: {'lr': 0.00046810844207107415, 'samples': 5002944, 'steps': 26056, 'loss/train': 1.8528767824172974} -08/30/2021 17:50:54 - INFO - __main__ - Step 26058: {'lr': 0.0004681058484442461, 'samples': 5003136, 'steps': 26057, 'loss/train': 1.6794477701187134} -08/30/2021 17:50:54 - INFO - __main__ - Step 26059: {'lr': 0.00046810325471914295, 'samples': 5003328, 'steps': 26058, 'loss/train': 1.7115200757980347} -08/30/2021 17:50:55 - INFO - __main__ - Step 26060: {'lr': 0.00046810066089576573, 'samples': 5003520, 'steps': 26059, 'loss/train': 1.1765812635421753} -08/30/2021 17:50:55 - INFO - __main__ - Step 26061: {'lr': 0.00046809806697411583, 'samples': 5003712, 'steps': 26060, 'loss/train': 2.1888034343719482} -08/30/2021 17:50:55 - INFO - __main__ - Step 26062: {'lr': 0.0004680954729541942, 'samples': 5003904, 'steps': 26061, 'loss/train': 1.1539087295532227} -08/30/2021 17:50:57 - INFO - __main__ - Step 26063: {'lr': 0.00046809287883600227, 'samples': 5004096, 'steps': 26062, 'loss/train': 2.0836567878723145} -08/30/2021 17:50:57 - INFO - __main__ - Step 26064: {'lr': 0.00046809028461954093, 'samples': 5004288, 'steps': 26063, 'loss/train': 1.8824714422225952} -08/30/2021 17:50:58 - INFO - __main__ - Step 26065: {'lr': 0.00046808769030481153, 'samples': 5004480, 'steps': 26064, 'loss/train': 1.9013277292251587} -08/30/2021 17:50:58 - INFO - __main__ - Step 26066: {'lr': 0.00046808509589181513, 'samples': 5004672, 'steps': 26065, 'loss/train': 1.2778221368789673} -08/30/2021 17:50:58 - INFO - __main__ - Step 26067: {'lr': 0.00046808250138055305, 'samples': 5004864, 'steps': 26066, 'loss/train': 1.5713587999343872} -08/30/2021 17:51:00 - INFO - __main__ - Step 26068: {'lr': 0.0004680799067710263, 'samples': 5005056, 'steps': 26067, 'loss/train': 1.123359203338623} -08/30/2021 17:51:00 - INFO - __main__ - Step 26069: {'lr': 0.00046807731206323605, 'samples': 5005248, 'steps': 26068, 'loss/train': 1.8972338438034058} -08/30/2021 17:51:01 - INFO - __main__ - Step 26070: {'lr': 0.00046807471725718357, 'samples': 5005440, 'steps': 26069, 'loss/train': 1.82386314868927} -08/30/2021 17:51:01 - INFO - __main__ - Step 26071: {'lr': 0.00046807212235287, 'samples': 5005632, 'steps': 26070, 'loss/train': 2.1682937145233154} -08/30/2021 17:51:01 - INFO - __main__ - Step 26072: {'lr': 0.0004680695273502965, 'samples': 5005824, 'steps': 26071, 'loss/train': 1.6509768962860107} -08/30/2021 17:51:03 - INFO - __main__ - Step 26073: {'lr': 0.00046806693224946426, 'samples': 5006016, 'steps': 26072, 'loss/train': 1.665516972541809} -08/30/2021 17:51:03 - INFO - __main__ - Step 26074: {'lr': 0.00046806433705037445, 'samples': 5006208, 'steps': 26073, 'loss/train': 1.6082911491394043} -08/30/2021 17:51:04 - INFO - __main__ - Step 26075: {'lr': 0.00046806174175302806, 'samples': 5006400, 'steps': 26074, 'loss/train': 1.735235571861267} -08/30/2021 17:51:04 - INFO - __main__ - Step 26076: {'lr': 0.00046805914635742656, 'samples': 5006592, 'steps': 26075, 'loss/train': 1.4829130172729492} -08/30/2021 17:51:04 - INFO - __main__ - Step 26077: {'lr': 0.0004680565508635709, 'samples': 5006784, 'steps': 26076, 'loss/train': 1.7443983554840088} -08/30/2021 17:51:06 - INFO - __main__ - Step 26078: {'lr': 0.00046805395527146237, 'samples': 5006976, 'steps': 26077, 'loss/train': 1.7859952449798584} -08/30/2021 17:51:06 - INFO - __main__ - Step 26079: {'lr': 0.0004680513595811021, 'samples': 5007168, 'steps': 26078, 'loss/train': 2.150747060775757} -08/30/2021 17:51:07 - INFO - __main__ - Step 26080: {'lr': 0.0004680487637924912, 'samples': 5007360, 'steps': 26079, 'loss/train': 1.501441478729248} -08/30/2021 17:51:07 - INFO - __main__ - Step 26081: {'lr': 0.0004680461679056309, 'samples': 5007552, 'steps': 26080, 'loss/train': 1.599752426147461} -08/30/2021 17:51:07 - INFO - __main__ - Step 26082: {'lr': 0.00046804357192052246, 'samples': 5007744, 'steps': 26081, 'loss/train': 1.835063099861145} -08/30/2021 17:51:08 - INFO - __main__ - Step 26083: {'lr': 0.00046804097583716685, 'samples': 5007936, 'steps': 26082, 'loss/train': 1.6404485702514648} -08/30/2021 17:51:09 - INFO - __main__ - Step 26084: {'lr': 0.0004680383796555654, 'samples': 5008128, 'steps': 26083, 'loss/train': 1.8288980722427368} -08/30/2021 17:51:10 - INFO - __main__ - Step 26085: {'lr': 0.00046803578337571917, 'samples': 5008320, 'steps': 26084, 'loss/train': 1.72828209400177} -08/30/2021 17:51:10 - INFO - __main__ - Step 26086: {'lr': 0.00046803318699762937, 'samples': 5008512, 'steps': 26085, 'loss/train': 1.5738255977630615} -08/30/2021 17:51:10 - INFO - __main__ - Step 26087: {'lr': 0.0004680305905212972, 'samples': 5008704, 'steps': 26086, 'loss/train': 1.195892095565796} -08/30/2021 17:51:11 - INFO - __main__ - Step 26088: {'lr': 0.0004680279939467238, 'samples': 5008896, 'steps': 26087, 'loss/train': 1.6134518384933472} -08/30/2021 17:51:12 - INFO - __main__ - Step 26089: {'lr': 0.00046802539727391033, 'samples': 5009088, 'steps': 26088, 'loss/train': 1.4556657075881958} -08/30/2021 17:51:13 - INFO - __main__ - Step 26090: {'lr': 0.0004680228005028581, 'samples': 5009280, 'steps': 26089, 'loss/train': 1.530471682548523} -08/30/2021 17:51:13 - INFO - __main__ - Step 26091: {'lr': 0.000468020203633568, 'samples': 5009472, 'steps': 26090, 'loss/train': 1.8344494104385376} -08/30/2021 17:51:13 - INFO - __main__ - Step 26092: {'lr': 0.0004680176066660415, 'samples': 5009664, 'steps': 26091, 'loss/train': 1.8249365091323853} -08/30/2021 17:51:14 - INFO - __main__ - Step 26093: {'lr': 0.00046801500960027957, 'samples': 5009856, 'steps': 26092, 'loss/train': 1.8713473081588745} -08/30/2021 17:51:15 - INFO - __main__ - Step 26094: {'lr': 0.00046801241243628344, 'samples': 5010048, 'steps': 26093, 'loss/train': 1.3450409173965454} -08/30/2021 17:51:16 - INFO - __main__ - Step 26095: {'lr': 0.00046800981517405426, 'samples': 5010240, 'steps': 26094, 'loss/train': 1.082474708557129} -08/30/2021 17:51:16 - INFO - __main__ - Step 26096: {'lr': 0.0004680072178135932, 'samples': 5010432, 'steps': 26095, 'loss/train': 2.279996871948242} -08/30/2021 17:51:17 - INFO - __main__ - Step 26097: {'lr': 0.00046800462035490156, 'samples': 5010624, 'steps': 26096, 'loss/train': 0.10333873331546783} -08/30/2021 17:51:17 - INFO - __main__ - Step 26098: {'lr': 0.0004680020227979803, 'samples': 5010816, 'steps': 26097, 'loss/train': 1.4143881797790527} -08/30/2021 17:51:18 - INFO - __main__ - Step 26099: {'lr': 0.0004679994251428308, 'samples': 5011008, 'steps': 26098, 'loss/train': 0.8577102422714233} -08/30/2021 17:51:19 - INFO - __main__ - Step 26100: {'lr': 0.00046799682738945397, 'samples': 5011200, 'steps': 26099, 'loss/train': 1.9826905727386475} -08/30/2021 17:51:19 - INFO - __main__ - Step 26101: {'lr': 0.00046799422953785124, 'samples': 5011392, 'steps': 26100, 'loss/train': 0.7031465768814087} -08/30/2021 17:51:20 - INFO - __main__ - Step 26102: {'lr': 0.00046799163158802365, 'samples': 5011584, 'steps': 26101, 'loss/train': 0.7783217430114746} -08/30/2021 17:51:20 - INFO - __main__ - Step 26103: {'lr': 0.00046798903353997243, 'samples': 5011776, 'steps': 26102, 'loss/train': 1.5363852977752686} -08/30/2021 17:51:22 - INFO - __main__ - Step 26104: {'lr': 0.0004679864353936987, 'samples': 5011968, 'steps': 26103, 'loss/train': 1.148025393486023} -08/30/2021 17:51:23 - INFO - __main__ - Step 26105: {'lr': 0.0004679838371492036, 'samples': 5012160, 'steps': 26104, 'loss/train': 1.8366453647613525} -08/30/2021 17:51:23 - INFO - __main__ - Step 26106: {'lr': 0.00046798123880648833, 'samples': 5012352, 'steps': 26105, 'loss/train': 0.735233724117279} -08/30/2021 17:51:23 - INFO - __main__ - Step 26107: {'lr': 0.0004679786403655542, 'samples': 5012544, 'steps': 26106, 'loss/train': 0.5969606637954712} -08/30/2021 17:51:24 - INFO - __main__ - Step 26108: {'lr': 0.0004679760418264021, 'samples': 5012736, 'steps': 26107, 'loss/train': 1.3180538415908813} -08/30/2021 17:51:25 - INFO - __main__ - Step 26109: {'lr': 0.00046797344318903343, 'samples': 5012928, 'steps': 26108, 'loss/train': 1.8988051414489746} -08/30/2021 17:51:26 - INFO - __main__ - Step 26110: {'lr': 0.0004679708444534493, 'samples': 5013120, 'steps': 26109, 'loss/train': 1.5253174304962158} -08/30/2021 17:51:26 - INFO - __main__ - Step 26111: {'lr': 0.0004679682456196509, 'samples': 5013312, 'steps': 26110, 'loss/train': 0.9396080374717712} -08/30/2021 17:51:26 - INFO - __main__ - Step 26112: {'lr': 0.0004679656466876393, 'samples': 5013504, 'steps': 26111, 'loss/train': 1.5866893529891968} -08/30/2021 17:51:27 - INFO - __main__ - Step 26113: {'lr': 0.00046796304765741583, 'samples': 5013696, 'steps': 26112, 'loss/train': 1.6055492162704468} -08/30/2021 17:51:27 - INFO - __main__ - Step 26114: {'lr': 0.00046796044852898144, 'samples': 5013888, 'steps': 26113, 'loss/train': 1.7148551940917969} -08/30/2021 17:51:28 - INFO - __main__ - Step 26115: {'lr': 0.0004679578493023375, 'samples': 5014080, 'steps': 26114, 'loss/train': 1.5810562372207642} -08/30/2021 17:51:29 - INFO - __main__ - Step 26116: {'lr': 0.00046795524997748515, 'samples': 5014272, 'steps': 26115, 'loss/train': 1.0068461894989014} -08/30/2021 17:51:29 - INFO - __main__ - Step 26117: {'lr': 0.0004679526505544256, 'samples': 5014464, 'steps': 26116, 'loss/train': 1.168715000152588} -08/30/2021 17:51:30 - INFO - __main__ - Step 26118: {'lr': 0.0004679500510331598, 'samples': 5014656, 'steps': 26117, 'loss/train': 2.080726385116577} -08/30/2021 17:51:30 - INFO - __main__ - Step 26119: {'lr': 0.00046794745141368917, 'samples': 5014848, 'steps': 26118, 'loss/train': 1.7851732969284058} -08/30/2021 17:51:32 - INFO - __main__ - Step 26120: {'lr': 0.00046794485169601474, 'samples': 5015040, 'steps': 26119, 'loss/train': 1.5185885429382324} -08/30/2021 17:51:32 - INFO - __main__ - Step 26121: {'lr': 0.00046794225188013773, 'samples': 5015232, 'steps': 26120, 'loss/train': 1.8581764698028564} -08/30/2021 17:51:32 - INFO - __main__ - Step 26122: {'lr': 0.00046793965196605927, 'samples': 5015424, 'steps': 26121, 'loss/train': 1.7707773447036743} -08/30/2021 17:51:33 - INFO - __main__ - Step 26123: {'lr': 0.00046793705195378066, 'samples': 5015616, 'steps': 26122, 'loss/train': 1.5318524837493896} -08/30/2021 17:51:33 - INFO - __main__ - Step 26124: {'lr': 0.0004679344518433029, 'samples': 5015808, 'steps': 26123, 'loss/train': 1.4481995105743408} -08/30/2021 17:51:35 - INFO - __main__ - Step 26125: {'lr': 0.0004679318516346273, 'samples': 5016000, 'steps': 26124, 'loss/train': 1.2897790670394897} -08/30/2021 17:51:35 - INFO - __main__ - Step 26126: {'lr': 0.0004679292513277549, 'samples': 5016192, 'steps': 26125, 'loss/train': 1.6501446962356567} -08/30/2021 17:51:35 - INFO - __main__ - Step 26127: {'lr': 0.0004679266509226869, 'samples': 5016384, 'steps': 26126, 'loss/train': 1.3101930618286133} -08/30/2021 17:51:36 - INFO - __main__ - Step 26128: {'lr': 0.0004679240504194246, 'samples': 5016576, 'steps': 26127, 'loss/train': 1.645825982093811} -08/30/2021 17:51:36 - INFO - __main__ - Step 26129: {'lr': 0.00046792144981796905, 'samples': 5016768, 'steps': 26128, 'loss/train': 0.7791157364845276} -08/30/2021 17:51:38 - INFO - __main__ - Step 26130: {'lr': 0.0004679188491183215, 'samples': 5016960, 'steps': 26129, 'loss/train': 1.2416889667510986} -08/30/2021 17:51:38 - INFO - __main__ - Step 26131: {'lr': 0.00046791624832048307, 'samples': 5017152, 'steps': 26130, 'loss/train': 1.7181764841079712} -08/30/2021 17:51:39 - INFO - __main__ - Step 26132: {'lr': 0.0004679136474244549, 'samples': 5017344, 'steps': 26131, 'loss/train': 1.6692501306533813} -08/30/2021 17:51:39 - INFO - __main__ - Step 26133: {'lr': 0.00046791104643023823, 'samples': 5017536, 'steps': 26132, 'loss/train': 1.8287296295166016} -08/30/2021 17:51:39 - INFO - __main__ - Step 26134: {'lr': 0.0004679084453378342, 'samples': 5017728, 'steps': 26133, 'loss/train': 0.9401084780693054} -08/30/2021 17:51:41 - INFO - __main__ - Step 26135: {'lr': 0.00046790584414724404, 'samples': 5017920, 'steps': 26134, 'loss/train': 1.7611048221588135} -08/30/2021 17:51:41 - INFO - __main__ - Step 26136: {'lr': 0.0004679032428584687, 'samples': 5018112, 'steps': 26135, 'loss/train': 1.5844484567642212} -08/30/2021 17:51:42 - INFO - __main__ - Step 26137: {'lr': 0.0004679006414715097, 'samples': 5018304, 'steps': 26136, 'loss/train': 0.9440152645111084} -08/30/2021 17:51:42 - INFO - __main__ - Step 26138: {'lr': 0.00046789803998636796, 'samples': 5018496, 'steps': 26137, 'loss/train': 2.4105002880096436} -08/30/2021 17:51:42 - INFO - __main__ - Step 26139: {'lr': 0.0004678954384030448, 'samples': 5018688, 'steps': 26138, 'loss/train': 1.4241313934326172} -08/30/2021 17:51:44 - INFO - __main__ - Step 26140: {'lr': 0.00046789283672154125, 'samples': 5018880, 'steps': 26139, 'loss/train': 0.9175655841827393} -08/30/2021 17:51:44 - INFO - __main__ - Step 26141: {'lr': 0.00046789023494185855, 'samples': 5019072, 'steps': 26140, 'loss/train': 1.0826953649520874} -08/30/2021 17:51:45 - INFO - __main__ - Step 26142: {'lr': 0.0004678876330639978, 'samples': 5019264, 'steps': 26141, 'loss/train': 1.167996883392334} -08/30/2021 17:51:45 - INFO - __main__ - Step 26143: {'lr': 0.0004678850310879604, 'samples': 5019456, 'steps': 26142, 'loss/train': 1.8836358785629272} -08/30/2021 17:51:45 - INFO - __main__ - Step 26144: {'lr': 0.0004678824290137473, 'samples': 5019648, 'steps': 26143, 'loss/train': 1.3544318675994873} -08/30/2021 17:51:47 - INFO - __main__ - Step 26145: {'lr': 0.0004678798268413597, 'samples': 5019840, 'steps': 26144, 'loss/train': 1.3764623403549194} -08/30/2021 17:51:47 - INFO - __main__ - Step 26146: {'lr': 0.00046787722457079887, 'samples': 5020032, 'steps': 26145, 'loss/train': 1.5148603916168213} -08/30/2021 17:51:48 - INFO - __main__ - Step 26147: {'lr': 0.00046787462220206587, 'samples': 5020224, 'steps': 26146, 'loss/train': 1.8436599969863892} -08/30/2021 17:51:48 - INFO - __main__ - Step 26148: {'lr': 0.00046787201973516195, 'samples': 5020416, 'steps': 26147, 'loss/train': 0.5548301339149475} -08/30/2021 17:51:48 - INFO - __main__ - Step 26149: {'lr': 0.00046786941717008823, 'samples': 5020608, 'steps': 26148, 'loss/train': 0.637928307056427} -08/30/2021 17:51:49 - INFO - __main__ - Step 26150: {'lr': 0.00046786681450684597, 'samples': 5020800, 'steps': 26149, 'loss/train': 2.0019750595092773} -08/30/2021 17:51:50 - INFO - __main__ - Step 26151: {'lr': 0.00046786421174543625, 'samples': 5020992, 'steps': 26150, 'loss/train': 1.213064193725586} -08/30/2021 17:51:51 - INFO - __main__ - Step 26152: {'lr': 0.0004678616088858603, 'samples': 5021184, 'steps': 26151, 'loss/train': 1.6105926036834717} -08/30/2021 17:51:51 - INFO - __main__ - Step 26153: {'lr': 0.0004678590059281193, 'samples': 5021376, 'steps': 26152, 'loss/train': 1.7457095384597778} -08/30/2021 17:51:51 - INFO - __main__ - Step 26154: {'lr': 0.0004678564028722143, 'samples': 5021568, 'steps': 26153, 'loss/train': 2.446765184402466} -08/30/2021 17:51:52 - INFO - __main__ - Step 26155: {'lr': 0.0004678537997181467, 'samples': 5021760, 'steps': 26154, 'loss/train': 1.2729811668395996} -08/30/2021 17:51:54 - INFO - __main__ - Step 26156: {'lr': 0.00046785119646591746, 'samples': 5021952, 'steps': 26155, 'loss/train': 1.7035256624221802} -08/30/2021 17:51:54 - INFO - __main__ - Step 26157: {'lr': 0.0004678485931155278, 'samples': 5022144, 'steps': 26156, 'loss/train': 1.5122156143188477} -08/30/2021 17:51:55 - INFO - __main__ - Step 26158: {'lr': 0.000467845989666979, 'samples': 5022336, 'steps': 26157, 'loss/train': 1.3289146423339844} -08/30/2021 17:51:55 - INFO - __main__ - Step 26159: {'lr': 0.0004678433861202721, 'samples': 5022528, 'steps': 26158, 'loss/train': 1.6197569370269775} -08/30/2021 17:51:55 - INFO - __main__ - Step 26160: {'lr': 0.0004678407824754083, 'samples': 5022720, 'steps': 26159, 'loss/train': 1.7705466747283936} -08/30/2021 17:51:56 - INFO - __main__ - Step 26161: {'lr': 0.00046783817873238885, 'samples': 5022912, 'steps': 26160, 'loss/train': 0.09180153906345367} -08/30/2021 17:51:57 - INFO - __main__ - Step 26162: {'lr': 0.0004678355748912149, 'samples': 5023104, 'steps': 26161, 'loss/train': 0.6512777209281921} -08/30/2021 17:51:58 - INFO - __main__ - Step 26163: {'lr': 0.0004678329709518876, 'samples': 5023296, 'steps': 26162, 'loss/train': 1.0051910877227783} -08/30/2021 17:51:58 - INFO - __main__ - Step 26164: {'lr': 0.0004678303669144081, 'samples': 5023488, 'steps': 26163, 'loss/train': 1.294397234916687} -08/30/2021 17:51:58 - INFO - __main__ - Step 26165: {'lr': 0.0004678277627787776, 'samples': 5023680, 'steps': 26164, 'loss/train': 0.5985181927680969} -08/30/2021 17:51:59 - INFO - __main__ - Step 26166: {'lr': 0.0004678251585449973, 'samples': 5023872, 'steps': 26165, 'loss/train': 1.6224207878112793} -08/30/2021 17:52:00 - INFO - __main__ - Step 26167: {'lr': 0.0004678225542130683, 'samples': 5024064, 'steps': 26166, 'loss/train': 1.5821278095245361} -08/30/2021 17:52:01 - INFO - __main__ - Step 26168: {'lr': 0.0004678199497829919, 'samples': 5024256, 'steps': 26167, 'loss/train': 1.2952234745025635} -08/30/2021 17:52:01 - INFO - __main__ - Step 26169: {'lr': 0.0004678173452547691, 'samples': 5024448, 'steps': 26168, 'loss/train': 1.4567570686340332} -08/30/2021 17:52:01 - INFO - __main__ - Step 26170: {'lr': 0.00046781474062840126, 'samples': 5024640, 'steps': 26169, 'loss/train': 1.1379626989364624} -08/30/2021 17:52:02 - INFO - __main__ - Step 26171: {'lr': 0.0004678121359038894, 'samples': 5024832, 'steps': 26170, 'loss/train': 1.627280831336975} -08/30/2021 17:52:04 - INFO - __main__ - Step 26172: {'lr': 0.0004678095310812347, 'samples': 5025024, 'steps': 26171, 'loss/train': 0.38083937764167786} -08/30/2021 17:52:04 - INFO - __main__ - Step 26173: {'lr': 0.0004678069261604384, 'samples': 5025216, 'steps': 26172, 'loss/train': 1.146022081375122} -08/30/2021 17:52:05 - INFO - __main__ - Step 26174: {'lr': 0.00046780432114150173, 'samples': 5025408, 'steps': 26173, 'loss/train': 1.4485677480697632} -08/30/2021 17:52:05 - INFO - __main__ - Step 26175: {'lr': 0.0004678017160244258, 'samples': 5025600, 'steps': 26174, 'loss/train': 1.5082147121429443} -08/30/2021 17:52:05 - INFO - __main__ - Step 26176: {'lr': 0.00046779911080921166, 'samples': 5025792, 'steps': 26175, 'loss/train': 2.016350269317627} -08/30/2021 17:52:06 - INFO - __main__ - Step 26177: {'lr': 0.00046779650549586075, 'samples': 5025984, 'steps': 26176, 'loss/train': 1.5053982734680176} -08/30/2021 17:52:07 - INFO - __main__ - Step 26178: {'lr': 0.000467793900084374, 'samples': 5026176, 'steps': 26177, 'loss/train': 0.363174706697464} -08/30/2021 17:52:08 - INFO - __main__ - Step 26179: {'lr': 0.0004677912945747527, 'samples': 5026368, 'steps': 26178, 'loss/train': 2.0944387912750244} -08/30/2021 17:52:08 - INFO - __main__ - Step 26180: {'lr': 0.000467788688966998, 'samples': 5026560, 'steps': 26179, 'loss/train': 1.557246446609497} -08/30/2021 17:52:08 - INFO - __main__ - Step 26181: {'lr': 0.00046778608326111104, 'samples': 5026752, 'steps': 26180, 'loss/train': 2.4179751873016357} -08/30/2021 17:52:09 - INFO - __main__ - Step 26182: {'lr': 0.00046778347745709317, 'samples': 5026944, 'steps': 26181, 'loss/train': 1.5029606819152832} -08/30/2021 17:52:10 - INFO - __main__ - Step 26183: {'lr': 0.0004677808715549453, 'samples': 5027136, 'steps': 26182, 'loss/train': 0.08202935755252838} -08/30/2021 17:52:11 - INFO - __main__ - Step 26184: {'lr': 0.0004677782655546687, 'samples': 5027328, 'steps': 26183, 'loss/train': 2.0947749614715576} -08/30/2021 17:52:11 - INFO - __main__ - Step 26185: {'lr': 0.00046777565945626463, 'samples': 5027520, 'steps': 26184, 'loss/train': 0.14571039378643036} -08/30/2021 17:52:12 - INFO - __main__ - Step 26186: {'lr': 0.0004677730532597343, 'samples': 5027712, 'steps': 26185, 'loss/train': 0.664777398109436} -08/30/2021 17:52:12 - INFO - __main__ - Step 26187: {'lr': 0.00046777044696507867, 'samples': 5027904, 'steps': 26186, 'loss/train': 1.4623806476593018} -08/30/2021 17:52:14 - INFO - __main__ - Step 26188: {'lr': 0.00046776784057229906, 'samples': 5028096, 'steps': 26187, 'loss/train': 1.3610191345214844} -08/30/2021 17:52:14 - INFO - __main__ - Step 26189: {'lr': 0.00046776523408139666, 'samples': 5028288, 'steps': 26188, 'loss/train': 1.5496939420700073} -08/30/2021 17:52:14 - INFO - __main__ - Step 26190: {'lr': 0.0004677626274923726, 'samples': 5028480, 'steps': 26189, 'loss/train': 1.611902117729187} -08/30/2021 17:52:15 - INFO - __main__ - Step 26191: {'lr': 0.000467760020805228, 'samples': 5028672, 'steps': 26190, 'loss/train': 1.2484333515167236} -08/30/2021 17:52:15 - INFO - __main__ - Step 26192: {'lr': 0.0004677574140199642, 'samples': 5028864, 'steps': 26191, 'loss/train': 1.459053635597229} -08/30/2021 17:52:16 - INFO - __main__ - Step 26193: {'lr': 0.00046775480713658215, 'samples': 5029056, 'steps': 26192, 'loss/train': 1.6826428174972534} -08/30/2021 17:52:17 - INFO - __main__ - Step 26194: {'lr': 0.00046775220015508325, 'samples': 5029248, 'steps': 26193, 'loss/train': 1.5191541910171509} -08/30/2021 17:52:17 - INFO - __main__ - Step 26195: {'lr': 0.0004677495930754685, 'samples': 5029440, 'steps': 26194, 'loss/train': 1.6067183017730713} -08/30/2021 17:52:18 - INFO - __main__ - Step 26196: {'lr': 0.0004677469858977391, 'samples': 5029632, 'steps': 26195, 'loss/train': 1.3620458841323853} -08/30/2021 17:52:18 - INFO - __main__ - Step 26197: {'lr': 0.00046774437862189634, 'samples': 5029824, 'steps': 26196, 'loss/train': 1.465554118156433} -08/30/2021 17:52:19 - INFO - __main__ - Step 26198: {'lr': 0.00046774177124794136, 'samples': 5030016, 'steps': 26197, 'loss/train': 0.8533470034599304} -08/30/2021 17:52:20 - INFO - __main__ - Step 26199: {'lr': 0.00046773916377587524, 'samples': 5030208, 'steps': 26198, 'loss/train': 1.480251431465149} -08/30/2021 17:52:20 - INFO - __main__ - Step 26200: {'lr': 0.00046773655620569924, 'samples': 5030400, 'steps': 26199, 'loss/train': 1.3872203826904297} -08/30/2021 17:52:20 - INFO - __main__ - Step 26201: {'lr': 0.0004677339485374145, 'samples': 5030592, 'steps': 26200, 'loss/train': 1.836183786392212} -08/30/2021 17:52:21 - INFO - __main__ - Step 26202: {'lr': 0.00046773134077102217, 'samples': 5030784, 'steps': 26201, 'loss/train': 1.560879111289978} -08/30/2021 17:52:22 - INFO - __main__ - Step 26203: {'lr': 0.00046772873290652344, 'samples': 5030976, 'steps': 26202, 'loss/train': 1.932642936706543} -08/30/2021 17:52:23 - INFO - __main__ - Step 26204: {'lr': 0.0004677261249439196, 'samples': 5031168, 'steps': 26203, 'loss/train': 1.487125039100647} -08/30/2021 17:52:23 - INFO - __main__ - Step 26205: {'lr': 0.0004677235168832117, 'samples': 5031360, 'steps': 26204, 'loss/train': 0.585166871547699} -08/30/2021 17:52:24 - INFO - __main__ - Step 26206: {'lr': 0.0004677209087244009, 'samples': 5031552, 'steps': 26205, 'loss/train': 1.2288188934326172} -08/30/2021 17:52:24 - INFO - __main__ - Step 26207: {'lr': 0.0004677183004674884, 'samples': 5031744, 'steps': 26206, 'loss/train': 1.764260172843933} -08/30/2021 17:52:24 - INFO - __main__ - Step 26208: {'lr': 0.00046771569211247546, 'samples': 5031936, 'steps': 26207, 'loss/train': 1.874774694442749} -08/30/2021 17:52:27 - INFO - __main__ - Step 26209: {'lr': 0.00046771308365936315, 'samples': 5032128, 'steps': 26208, 'loss/train': 1.7931764125823975} -08/30/2021 17:52:27 - INFO - __main__ - Step 26210: {'lr': 0.00046771047510815267, 'samples': 5032320, 'steps': 26209, 'loss/train': 1.2996633052825928} -08/30/2021 17:52:27 - INFO - __main__ - Step 26211: {'lr': 0.0004677078664588452, 'samples': 5032512, 'steps': 26210, 'loss/train': 1.447281002998352} -08/30/2021 17:52:28 - INFO - __main__ - Step 26212: {'lr': 0.000467705257711442, 'samples': 5032704, 'steps': 26211, 'loss/train': 1.5091127157211304} -08/30/2021 17:52:28 - INFO - __main__ - Step 26213: {'lr': 0.0004677026488659441, 'samples': 5032896, 'steps': 26212, 'loss/train': 1.8863173723220825} -08/30/2021 17:52:29 - INFO - __main__ - Step 26214: {'lr': 0.0004677000399223528, 'samples': 5033088, 'steps': 26213, 'loss/train': 2.09542179107666} -08/30/2021 17:52:30 - INFO - __main__ - Step 26215: {'lr': 0.0004676974308806692, 'samples': 5033280, 'steps': 26214, 'loss/train': 1.9482330083847046} -08/30/2021 17:52:30 - INFO - __main__ - Step 26216: {'lr': 0.00046769482174089446, 'samples': 5033472, 'steps': 26215, 'loss/train': 1.2161154747009277} -08/30/2021 17:52:31 - INFO - __main__ - Step 26217: {'lr': 0.00046769221250302984, 'samples': 5033664, 'steps': 26216, 'loss/train': 0.5359983444213867} -08/30/2021 17:52:31 - INFO - __main__ - Step 26218: {'lr': 0.0004676896031670764, 'samples': 5033856, 'steps': 26217, 'loss/train': 1.6811681985855103} -08/30/2021 17:52:32 - INFO - __main__ - Step 26219: {'lr': 0.00046768699373303546, 'samples': 5034048, 'steps': 26218, 'loss/train': 1.6467416286468506} -08/30/2021 17:52:33 - INFO - __main__ - Step 26220: {'lr': 0.00046768438420090807, 'samples': 5034240, 'steps': 26219, 'loss/train': 1.2183287143707275} -08/30/2021 17:52:33 - INFO - __main__ - Step 26221: {'lr': 0.0004676817745706955, 'samples': 5034432, 'steps': 26220, 'loss/train': 1.2806841135025024} -08/30/2021 17:52:34 - INFO - __main__ - Step 26222: {'lr': 0.0004676791648423989, 'samples': 5034624, 'steps': 26221, 'loss/train': 1.8384215831756592} -08/30/2021 17:52:34 - INFO - __main__ - Step 26223: {'lr': 0.00046767655501601935, 'samples': 5034816, 'steps': 26222, 'loss/train': 1.3472853899002075} -08/30/2021 17:52:36 - INFO - __main__ - Step 26224: {'lr': 0.0004676739450915581, 'samples': 5035008, 'steps': 26223, 'loss/train': 1.0090837478637695} -08/30/2021 17:52:36 - INFO - __main__ - Step 26225: {'lr': 0.0004676713350690164, 'samples': 5035200, 'steps': 26224, 'loss/train': 1.7016509771347046} -08/30/2021 17:52:36 - INFO - __main__ - Step 26226: {'lr': 0.0004676687249483953, 'samples': 5035392, 'steps': 26225, 'loss/train': 2.773500919342041} -08/30/2021 17:52:37 - INFO - __main__ - Step 26227: {'lr': 0.0004676661147296961, 'samples': 5035584, 'steps': 26226, 'loss/train': 1.444489598274231} -08/30/2021 17:52:37 - INFO - __main__ - Step 26228: {'lr': 0.00046766350441291985, 'samples': 5035776, 'steps': 26227, 'loss/train': 1.0572092533111572} -08/30/2021 17:52:39 - INFO - __main__ - Step 26229: {'lr': 0.00046766089399806775, 'samples': 5035968, 'steps': 26228, 'loss/train': 0.6948620080947876} -08/30/2021 17:52:39 - INFO - __main__ - Step 26230: {'lr': 0.0004676582834851411, 'samples': 5036160, 'steps': 26229, 'loss/train': 1.6123915910720825} -08/30/2021 17:52:39 - INFO - __main__ - Step 26231: {'lr': 0.0004676556728741409, 'samples': 5036352, 'steps': 26230, 'loss/train': 0.19862884283065796} -08/30/2021 17:52:40 - INFO - __main__ - Step 26232: {'lr': 0.0004676530621650685, 'samples': 5036544, 'steps': 26231, 'loss/train': 1.3207002878189087} -08/30/2021 17:52:40 - INFO - __main__ - Step 26233: {'lr': 0.00046765045135792495, 'samples': 5036736, 'steps': 26232, 'loss/train': 2.133751153945923} -08/30/2021 17:52:42 - INFO - __main__ - Step 26234: {'lr': 0.00046764784045271146, 'samples': 5036928, 'steps': 26233, 'loss/train': 1.8287540674209595} -08/30/2021 17:52:42 - INFO - __main__ - Step 26235: {'lr': 0.0004676452294494292, 'samples': 5037120, 'steps': 26234, 'loss/train': 1.5834941864013672} -08/30/2021 17:52:42 - INFO - __main__ - Step 26236: {'lr': 0.00046764261834807944, 'samples': 5037312, 'steps': 26235, 'loss/train': 2.87629771232605} -08/30/2021 17:52:43 - INFO - __main__ - Step 26237: {'lr': 0.0004676400071486632, 'samples': 5037504, 'steps': 26236, 'loss/train': 2.2349281311035156} -08/30/2021 17:52:43 - INFO - __main__ - Step 26238: {'lr': 0.0004676373958511817, 'samples': 5037696, 'steps': 26237, 'loss/train': 1.0710747241973877} -08/30/2021 17:52:45 - INFO - __main__ - Step 26239: {'lr': 0.00046763478445563617, 'samples': 5037888, 'steps': 26238, 'loss/train': 2.6107187271118164} -08/30/2021 17:52:45 - INFO - __main__ - Step 26240: {'lr': 0.0004676321729620278, 'samples': 5038080, 'steps': 26239, 'loss/train': 1.5706325769424438} -08/30/2021 17:52:46 - INFO - __main__ - Step 26241: {'lr': 0.0004676295613703577, 'samples': 5038272, 'steps': 26240, 'loss/train': 1.8564623594284058} -08/30/2021 17:52:46 - INFO - __main__ - Step 26242: {'lr': 0.00046762694968062706, 'samples': 5038464, 'steps': 26241, 'loss/train': 1.5979385375976562} -08/30/2021 17:52:46 - INFO - __main__ - Step 26243: {'lr': 0.0004676243378928371, 'samples': 5038656, 'steps': 26242, 'loss/train': 2.0918338298797607} -08/30/2021 17:52:47 - INFO - __main__ - Step 26244: {'lr': 0.000467621726006989, 'samples': 5038848, 'steps': 26243, 'loss/train': 0.6312897205352783} -08/30/2021 17:52:48 - INFO - __main__ - Step 26245: {'lr': 0.0004676191140230839, 'samples': 5039040, 'steps': 26244, 'loss/train': 1.396957516670227} -08/30/2021 17:52:49 - INFO - __main__ - Step 26246: {'lr': 0.0004676165019411229, 'samples': 5039232, 'steps': 26245, 'loss/train': 1.4047967195510864} -08/30/2021 17:52:49 - INFO - __main__ - Step 26247: {'lr': 0.00046761388976110737, 'samples': 5039424, 'steps': 26246, 'loss/train': 1.378141164779663} -08/30/2021 17:52:49 - INFO - __main__ - Step 26248: {'lr': 0.00046761127748303833, 'samples': 5039616, 'steps': 26247, 'loss/train': 1.552869439125061} -08/30/2021 17:52:50 - INFO - __main__ - Step 26249: {'lr': 0.000467608665106917, 'samples': 5039808, 'steps': 26248, 'loss/train': 1.6121121644973755} -08/30/2021 17:52:51 - INFO - __main__ - Step 26250: {'lr': 0.0004676060526327446, 'samples': 5040000, 'steps': 26249, 'loss/train': 1.5323083400726318} -08/30/2021 17:52:52 - INFO - __main__ - Step 26251: {'lr': 0.00046760344006052223, 'samples': 5040192, 'steps': 26250, 'loss/train': 1.0000609159469604} -08/30/2021 17:52:52 - INFO - __main__ - Step 26252: {'lr': 0.00046760082739025113, 'samples': 5040384, 'steps': 26251, 'loss/train': 1.5879063606262207} -08/30/2021 17:52:52 - INFO - __main__ - Step 26253: {'lr': 0.0004675982146219324, 'samples': 5040576, 'steps': 26252, 'loss/train': 0.24589650332927704} -08/30/2021 17:52:53 - INFO - __main__ - Step 26254: {'lr': 0.00046759560175556737, 'samples': 5040768, 'steps': 26253, 'loss/train': 1.4122611284255981} -08/30/2021 17:52:54 - INFO - __main__ - Step 26255: {'lr': 0.0004675929887911571, 'samples': 5040960, 'steps': 26254, 'loss/train': 1.3601524829864502} -08/30/2021 17:52:55 - INFO - __main__ - Step 26256: {'lr': 0.0004675903757287027, 'samples': 5041152, 'steps': 26255, 'loss/train': 1.5401798486709595} -08/30/2021 17:52:55 - INFO - __main__ - Step 26257: {'lr': 0.0004675877625682055, 'samples': 5041344, 'steps': 26256, 'loss/train': 1.829728126525879} -08/30/2021 17:52:55 - INFO - __main__ - Step 26258: {'lr': 0.00046758514930966664, 'samples': 5041536, 'steps': 26257, 'loss/train': 1.5436458587646484} -08/30/2021 17:52:56 - INFO - __main__ - Step 26259: {'lr': 0.0004675825359530872, 'samples': 5041728, 'steps': 26258, 'loss/train': 1.1547647714614868} -08/30/2021 17:52:58 - INFO - __main__ - Step 26260: {'lr': 0.0004675799224984685, 'samples': 5041920, 'steps': 26259, 'loss/train': 1.8499315977096558} -08/30/2021 17:52:58 - INFO - __main__ - Step 26261: {'lr': 0.00046757730894581164, 'samples': 5042112, 'steps': 26260, 'loss/train': 1.8405916690826416} -08/30/2021 17:52:58 - INFO - __main__ - Step 26262: {'lr': 0.00046757469529511777, 'samples': 5042304, 'steps': 26261, 'loss/train': 1.6968600749969482} -08/30/2021 17:52:59 - INFO - __main__ - Step 26263: {'lr': 0.0004675720815463881, 'samples': 5042496, 'steps': 26262, 'loss/train': 1.6263556480407715} -08/30/2021 17:52:59 - INFO - __main__ - Step 26264: {'lr': 0.00046756946769962375, 'samples': 5042688, 'steps': 26263, 'loss/train': 1.757317066192627} -08/30/2021 17:53:01 - INFO - __main__ - Step 26265: {'lr': 0.000467566853754826, 'samples': 5042880, 'steps': 26264, 'loss/train': 1.6671481132507324} -08/30/2021 17:53:01 - INFO - __main__ - Step 26266: {'lr': 0.00046756423971199603, 'samples': 5043072, 'steps': 26265, 'loss/train': 1.3835176229476929} -08/30/2021 17:53:02 - INFO - __main__ - Step 26267: {'lr': 0.0004675616255711349, 'samples': 5043264, 'steps': 26266, 'loss/train': 5.911319732666016} -08/30/2021 17:53:02 - INFO - __main__ - Step 26268: {'lr': 0.0004675590113322439, 'samples': 5043456, 'steps': 26267, 'loss/train': 1.204235315322876} -08/30/2021 17:53:02 - INFO - __main__ - Step 26269: {'lr': 0.00046755639699532414, 'samples': 5043648, 'steps': 26268, 'loss/train': 1.2118866443634033} -08/30/2021 17:53:03 - INFO - __main__ - Step 26270: {'lr': 0.00046755378256037685, 'samples': 5043840, 'steps': 26269, 'loss/train': 1.761609435081482} -08/30/2021 17:53:04 - INFO - __main__ - Step 26271: {'lr': 0.00046755116802740316, 'samples': 5044032, 'steps': 26270, 'loss/train': 1.9451550245285034} -08/30/2021 17:53:05 - INFO - __main__ - Step 26272: {'lr': 0.00046754855339640436, 'samples': 5044224, 'steps': 26271, 'loss/train': 0.941116213798523} -08/30/2021 17:53:05 - INFO - __main__ - Step 26273: {'lr': 0.00046754593866738144, 'samples': 5044416, 'steps': 26272, 'loss/train': 1.11298668384552} -08/30/2021 17:53:06 - INFO - __main__ - Step 26274: {'lr': 0.0004675433238403357, 'samples': 5044608, 'steps': 26273, 'loss/train': 1.162381887435913} -08/30/2021 17:53:06 - INFO - __main__ - Step 26275: {'lr': 0.0004675407089152683, 'samples': 5044800, 'steps': 26274, 'loss/train': 1.1345688104629517} -08/30/2021 17:53:06 - INFO - __main__ - Step 26276: {'lr': 0.00046753809389218036, 'samples': 5044992, 'steps': 26275, 'loss/train': 1.559865117073059} -08/30/2021 17:53:08 - INFO - __main__ - Step 26277: {'lr': 0.0004675354787710732, 'samples': 5045184, 'steps': 26276, 'loss/train': 1.0282788276672363} -08/30/2021 17:53:08 - INFO - __main__ - Step 26278: {'lr': 0.0004675328635519479, 'samples': 5045376, 'steps': 26277, 'loss/train': 0.7387611269950867} -08/30/2021 17:53:08 - INFO - __main__ - Step 26279: {'lr': 0.0004675302482348056, 'samples': 5045568, 'steps': 26278, 'loss/train': 1.364940881729126} -08/30/2021 17:53:09 - INFO - __main__ - Step 26280: {'lr': 0.00046752763281964757, 'samples': 5045760, 'steps': 26279, 'loss/train': 1.4897438287734985} -08/30/2021 17:53:09 - INFO - __main__ - Step 26281: {'lr': 0.0004675250173064749, 'samples': 5045952, 'steps': 26280, 'loss/train': 1.7558190822601318} -08/30/2021 17:53:11 - INFO - __main__ - Step 26282: {'lr': 0.0004675224016952888, 'samples': 5046144, 'steps': 26281, 'loss/train': 1.4290552139282227} -08/30/2021 17:53:11 - INFO - __main__ - Step 26283: {'lr': 0.00046751978598609056, 'samples': 5046336, 'steps': 26282, 'loss/train': 1.4846059083938599} -08/30/2021 17:53:11 - INFO - __main__ - Step 26284: {'lr': 0.00046751717017888116, 'samples': 5046528, 'steps': 26283, 'loss/train': 1.951148509979248} -08/30/2021 17:53:12 - INFO - __main__ - Step 26285: {'lr': 0.00046751455427366194, 'samples': 5046720, 'steps': 26284, 'loss/train': 1.6930569410324097} -08/30/2021 17:53:12 - INFO - __main__ - Step 26286: {'lr': 0.00046751193827043405, 'samples': 5046912, 'steps': 26285, 'loss/train': 1.0926343202590942} -08/30/2021 17:53:14 - INFO - __main__ - Step 26287: {'lr': 0.0004675093221691985, 'samples': 5047104, 'steps': 26286, 'loss/train': 1.2144969701766968} -08/30/2021 17:53:14 - INFO - __main__ - Step 26288: {'lr': 0.0004675067059699567, 'samples': 5047296, 'steps': 26287, 'loss/train': 1.193758249282837} -08/30/2021 17:53:15 - INFO - __main__ - Step 26289: {'lr': 0.00046750408967270973, 'samples': 5047488, 'steps': 26288, 'loss/train': 1.3849986791610718} -08/30/2021 17:53:15 - INFO - __main__ - Step 26290: {'lr': 0.0004675014732774588, 'samples': 5047680, 'steps': 26289, 'loss/train': 1.406269907951355} -08/30/2021 17:53:15 - INFO - __main__ - Step 26291: {'lr': 0.000467498856784205, 'samples': 5047872, 'steps': 26290, 'loss/train': 1.1837278604507446} -08/30/2021 17:53:17 - INFO - __main__ - Step 26292: {'lr': 0.0004674962401929496, 'samples': 5048064, 'steps': 26291, 'loss/train': 1.9569282531738281} -08/30/2021 17:53:17 - INFO - __main__ - Step 26293: {'lr': 0.0004674936235036938, 'samples': 5048256, 'steps': 26292, 'loss/train': 1.192387580871582} -08/30/2021 17:53:18 - INFO - __main__ - Step 26294: {'lr': 0.00046749100671643866, 'samples': 5048448, 'steps': 26293, 'loss/train': 0.874843418598175} -08/30/2021 17:53:18 - INFO - __main__ - Step 26295: {'lr': 0.00046748838983118546, 'samples': 5048640, 'steps': 26294, 'loss/train': 0.8066315650939941} -08/30/2021 17:53:18 - INFO - __main__ - Step 26296: {'lr': 0.00046748577284793535, 'samples': 5048832, 'steps': 26295, 'loss/train': 1.4623510837554932} -08/30/2021 17:53:20 - INFO - __main__ - Step 26297: {'lr': 0.00046748315576668946, 'samples': 5049024, 'steps': 26296, 'loss/train': 1.4491009712219238} -08/30/2021 17:53:20 - INFO - __main__ - Step 26298: {'lr': 0.0004674805385874491, 'samples': 5049216, 'steps': 26297, 'loss/train': 2.0263445377349854} -08/30/2021 17:53:21 - INFO - __main__ - Step 26299: {'lr': 0.0004674779213102153, 'samples': 5049408, 'steps': 26298, 'loss/train': 0.7796643972396851} -08/30/2021 17:53:21 - INFO - __main__ - Step 26300: {'lr': 0.00046747530393498934, 'samples': 5049600, 'steps': 26299, 'loss/train': 5.412769317626953} -08/30/2021 17:53:21 - INFO - __main__ - Step 26301: {'lr': 0.0004674726864617723, 'samples': 5049792, 'steps': 26300, 'loss/train': 1.9228533506393433} -08/30/2021 17:53:22 - INFO - __main__ - Step 26302: {'lr': 0.00046747006889056556, 'samples': 5049984, 'steps': 26301, 'loss/train': 2.1370584964752197} -08/30/2021 17:53:23 - INFO - __main__ - Step 26303: {'lr': 0.00046746745122137, 'samples': 5050176, 'steps': 26302, 'loss/train': 1.3682295083999634} -08/30/2021 17:53:24 - INFO - __main__ - Step 26304: {'lr': 0.000467464833454187, 'samples': 5050368, 'steps': 26303, 'loss/train': 1.6545788049697876} -08/30/2021 17:53:24 - INFO - __main__ - Step 26305: {'lr': 0.0004674622155890178, 'samples': 5050560, 'steps': 26304, 'loss/train': 1.717965006828308} -08/30/2021 17:53:25 - INFO - __main__ - Step 26306: {'lr': 0.00046745959762586344, 'samples': 5050752, 'steps': 26305, 'loss/train': 0.475311279296875} -08/30/2021 17:53:25 - INFO - __main__ - Step 26307: {'lr': 0.0004674569795647251, 'samples': 5050944, 'steps': 26306, 'loss/train': 1.924486756324768} -08/30/2021 17:53:27 - INFO - __main__ - Step 26308: {'lr': 0.00046745436140560397, 'samples': 5051136, 'steps': 26307, 'loss/train': 1.3409497737884521} -08/30/2021 17:53:27 - INFO - __main__ - Step 26309: {'lr': 0.00046745174314850136, 'samples': 5051328, 'steps': 26308, 'loss/train': 1.4483742713928223} -08/30/2021 17:53:27 - INFO - __main__ - Step 26310: {'lr': 0.00046744912479341826, 'samples': 5051520, 'steps': 26309, 'loss/train': 0.8104193806648254} -08/30/2021 17:53:28 - INFO - __main__ - Step 26311: {'lr': 0.00046744650634035603, 'samples': 5051712, 'steps': 26310, 'loss/train': 1.873723030090332} -08/30/2021 17:53:28 - INFO - __main__ - Step 26312: {'lr': 0.0004674438877893157, 'samples': 5051904, 'steps': 26311, 'loss/train': 2.0275466442108154} -08/30/2021 17:53:29 - INFO - __main__ - Step 26313: {'lr': 0.0004674412691402985, 'samples': 5052096, 'steps': 26312, 'loss/train': 1.306639552116394} -08/30/2021 17:53:30 - INFO - __main__ - Step 26314: {'lr': 0.00046743865039330565, 'samples': 5052288, 'steps': 26313, 'loss/train': 1.2984265089035034} -08/30/2021 17:53:30 - INFO - __main__ - Step 26315: {'lr': 0.00046743603154833827, 'samples': 5052480, 'steps': 26314, 'loss/train': 0.90952467918396} -08/30/2021 17:53:31 - INFO - __main__ - Step 26316: {'lr': 0.00046743341260539756, 'samples': 5052672, 'steps': 26315, 'loss/train': 1.4084138870239258} -08/30/2021 17:53:31 - INFO - __main__ - Step 26317: {'lr': 0.00046743079356448476, 'samples': 5052864, 'steps': 26316, 'loss/train': 1.8966929912567139} -08/30/2021 17:53:33 - INFO - __main__ - Step 26318: {'lr': 0.000467428174425601, 'samples': 5053056, 'steps': 26317, 'loss/train': 1.3839093446731567} -08/30/2021 17:53:33 - INFO - __main__ - Step 26319: {'lr': 0.0004674255551887474, 'samples': 5053248, 'steps': 26318, 'loss/train': 1.144919753074646} -08/30/2021 17:53:34 - INFO - __main__ - Step 26320: {'lr': 0.0004674229358539253, 'samples': 5053440, 'steps': 26319, 'loss/train': 1.1010702848434448} -08/30/2021 17:53:34 - INFO - __main__ - Step 26321: {'lr': 0.0004674203164211357, 'samples': 5053632, 'steps': 26320, 'loss/train': 1.3001075983047485} -08/30/2021 17:53:34 - INFO - __main__ - Step 26322: {'lr': 0.00046741769689037985, 'samples': 5053824, 'steps': 26321, 'loss/train': 1.4087958335876465} -08/30/2021 17:53:36 - INFO - __main__ - Step 26323: {'lr': 0.0004674150772616589, 'samples': 5054016, 'steps': 26322, 'loss/train': 1.2034153938293457} -08/30/2021 17:53:36 - INFO - __main__ - Step 26324: {'lr': 0.0004674124575349742, 'samples': 5054208, 'steps': 26323, 'loss/train': 1.8088667392730713} -08/30/2021 17:53:37 - INFO - __main__ - Step 26325: {'lr': 0.00046740983771032674, 'samples': 5054400, 'steps': 26324, 'loss/train': 5.845498085021973} -08/30/2021 17:53:37 - INFO - __main__ - Step 26326: {'lr': 0.0004674072177877178, 'samples': 5054592, 'steps': 26325, 'loss/train': 1.6823536157608032} -08/30/2021 17:53:37 - INFO - __main__ - Step 26327: {'lr': 0.0004674045977671484, 'samples': 5054784, 'steps': 26326, 'loss/train': 1.9012107849121094} -08/30/2021 17:53:38 - INFO - __main__ - Step 26328: {'lr': 0.00046740197764862, 'samples': 5054976, 'steps': 26327, 'loss/train': 2.1735944747924805} -08/30/2021 17:53:39 - INFO - __main__ - Step 26329: {'lr': 0.00046739935743213344, 'samples': 5055168, 'steps': 26328, 'loss/train': 1.2146939039230347} -08/30/2021 17:53:40 - INFO - __main__ - Step 26330: {'lr': 0.00046739673711769026, 'samples': 5055360, 'steps': 26329, 'loss/train': 1.8299793004989624} -08/30/2021 17:53:40 - INFO - __main__ - Step 26331: {'lr': 0.0004673941167052914, 'samples': 5055552, 'steps': 26330, 'loss/train': 1.4739185571670532} -08/30/2021 17:53:41 - INFO - __main__ - Step 26332: {'lr': 0.0004673914961949381, 'samples': 5055744, 'steps': 26331, 'loss/train': 2.0954718589782715} -08/30/2021 17:53:41 - INFO - __main__ - Step 26333: {'lr': 0.0004673888755866316, 'samples': 5055936, 'steps': 26332, 'loss/train': 0.09940269589424133} -08/30/2021 17:53:42 - INFO - __main__ - Step 26334: {'lr': 0.0004673862548803729, 'samples': 5056128, 'steps': 26333, 'loss/train': 2.0142016410827637} -08/30/2021 17:53:43 - INFO - __main__ - Step 26335: {'lr': 0.0004673836340761634, 'samples': 5056320, 'steps': 26334, 'loss/train': 1.219390630722046} -08/30/2021 17:53:43 - INFO - __main__ - Step 26336: {'lr': 0.00046738101317400415, 'samples': 5056512, 'steps': 26335, 'loss/train': 1.3998562097549438} -08/30/2021 17:53:44 - INFO - __main__ - Step 26337: {'lr': 0.00046737839217389645, 'samples': 5056704, 'steps': 26336, 'loss/train': 0.6932715773582458} -08/30/2021 17:53:44 - INFO - __main__ - Step 26338: {'lr': 0.0004673757710758413, 'samples': 5056896, 'steps': 26337, 'loss/train': 1.809666395187378} -08/30/2021 17:53:46 - INFO - __main__ - Step 26339: {'lr': 0.00046737314987984, 'samples': 5057088, 'steps': 26338, 'loss/train': 1.7099965810775757} -08/30/2021 17:53:46 - INFO - __main__ - Step 26340: {'lr': 0.0004673705285858938, 'samples': 5057280, 'steps': 26339, 'loss/train': 1.4753388166427612} -08/30/2021 17:53:47 - INFO - __main__ - Step 26341: {'lr': 0.00046736790719400373, 'samples': 5057472, 'steps': 26340, 'loss/train': 1.5072438716888428} -08/30/2021 17:53:47 - INFO - __main__ - Step 26342: {'lr': 0.000467365285704171, 'samples': 5057664, 'steps': 26341, 'loss/train': 1.5418766736984253} -08/30/2021 17:53:48 - INFO - __main__ - Step 26343: {'lr': 0.00046736266411639694, 'samples': 5057856, 'steps': 26342, 'loss/train': 1.4100966453552246} -08/30/2021 17:53:49 - INFO - __main__ - Step 26344: {'lr': 0.00046736004243068255, 'samples': 5058048, 'steps': 26343, 'loss/train': 0.12519323825836182} -08/30/2021 17:53:50 - INFO - __main__ - Step 26345: {'lr': 0.00046735742064702904, 'samples': 5058240, 'steps': 26344, 'loss/train': 1.8921748399734497} -08/30/2021 17:53:50 - INFO - __main__ - Step 26346: {'lr': 0.00046735479876543765, 'samples': 5058432, 'steps': 26345, 'loss/train': 1.4676744937896729} -08/30/2021 17:53:51 - INFO - __main__ - Step 26347: {'lr': 0.00046735217678590957, 'samples': 5058624, 'steps': 26346, 'loss/train': 0.17673909664154053} -08/30/2021 17:53:51 - INFO - __main__ - Step 26348: {'lr': 0.00046734955470844594, 'samples': 5058816, 'steps': 26347, 'loss/train': 1.8397572040557861} -08/30/2021 17:53:51 - INFO - __main__ - Step 26349: {'lr': 0.00046734693253304795, 'samples': 5059008, 'steps': 26348, 'loss/train': 1.236518144607544} -08/30/2021 17:53:53 - INFO - __main__ - Step 26350: {'lr': 0.0004673443102597168, 'samples': 5059200, 'steps': 26349, 'loss/train': 1.5384405851364136} -08/30/2021 17:53:53 - INFO - __main__ - Step 26351: {'lr': 0.00046734168788845363, 'samples': 5059392, 'steps': 26350, 'loss/train': 1.015964150428772} -08/30/2021 17:53:54 - INFO - __main__ - Step 26352: {'lr': 0.00046733906541925963, 'samples': 5059584, 'steps': 26351, 'loss/train': 0.9438610076904297} -08/30/2021 17:53:54 - INFO - __main__ - Step 26353: {'lr': 0.00046733644285213604, 'samples': 5059776, 'steps': 26352, 'loss/train': 1.6680570840835571} -08/30/2021 17:53:54 - INFO - __main__ - Step 26354: {'lr': 0.00046733382018708405, 'samples': 5059968, 'steps': 26353, 'loss/train': 1.1922476291656494} -08/30/2021 17:53:56 - INFO - __main__ - Step 26355: {'lr': 0.00046733119742410476, 'samples': 5060160, 'steps': 26354, 'loss/train': 1.4690243005752563} -08/30/2021 17:53:56 - INFO - __main__ - Step 26356: {'lr': 0.0004673285745631993, 'samples': 5060352, 'steps': 26355, 'loss/train': 1.4539414644241333} -08/30/2021 17:53:57 - INFO - __main__ - Step 26357: {'lr': 0.000467325951604369, 'samples': 5060544, 'steps': 26356, 'loss/train': 2.1293528079986572} -08/30/2021 17:53:57 - INFO - __main__ - Step 26358: {'lr': 0.00046732332854761507, 'samples': 5060736, 'steps': 26357, 'loss/train': 1.4316747188568115} -08/30/2021 17:53:57 - INFO - __main__ - Step 26359: {'lr': 0.00046732070539293847, 'samples': 5060928, 'steps': 26358, 'loss/train': 1.9339829683303833} -08/30/2021 17:53:59 - INFO - __main__ - Step 26360: {'lr': 0.0004673180821403405, 'samples': 5061120, 'steps': 26359, 'loss/train': 3.5390784740448} -08/30/2021 17:53:59 - INFO - __main__ - Step 26361: {'lr': 0.00046731545878982253, 'samples': 5061312, 'steps': 26360, 'loss/train': 1.214211344718933} -08/30/2021 17:54:00 - INFO - __main__ - Step 26362: {'lr': 0.0004673128353413854, 'samples': 5061504, 'steps': 26361, 'loss/train': 1.7859796285629272} -08/30/2021 17:54:00 - INFO - __main__ - Step 26363: {'lr': 0.00046731021179503054, 'samples': 5061696, 'steps': 26362, 'loss/train': 5.96531343460083} -08/30/2021 17:54:00 - INFO - __main__ - Step 26364: {'lr': 0.00046730758815075903, 'samples': 5061888, 'steps': 26363, 'loss/train': 1.6871147155761719} -08/30/2021 17:54:01 - INFO - __main__ - Step 26365: {'lr': 0.0004673049644085721, 'samples': 5062080, 'steps': 26364, 'loss/train': 1.836182951927185} -08/30/2021 17:54:02 - INFO - __main__ - Step 26366: {'lr': 0.00046730234056847084, 'samples': 5062272, 'steps': 26365, 'loss/train': 1.4646716117858887} -08/30/2021 17:54:03 - INFO - __main__ - Step 26367: {'lr': 0.00046729971663045654, 'samples': 5062464, 'steps': 26366, 'loss/train': 0.11875174939632416} -08/30/2021 17:54:03 - INFO - __main__ - Step 26368: {'lr': 0.00046729709259453033, 'samples': 5062656, 'steps': 26367, 'loss/train': 0.17010241746902466} -08/30/2021 17:54:04 - INFO - __main__ - Step 26369: {'lr': 0.0004672944684606934, 'samples': 5062848, 'steps': 26368, 'loss/train': 2.159951686859131} -08/30/2021 17:54:04 - INFO - __main__ - Step 26370: {'lr': 0.000467291844228947, 'samples': 5063040, 'steps': 26369, 'loss/train': 1.3013253211975098} -08/30/2021 17:54:05 - INFO - __main__ - Step 26371: {'lr': 0.00046728921989929215, 'samples': 5063232, 'steps': 26370, 'loss/train': 1.547684669494629} -08/30/2021 17:54:06 - INFO - __main__ - Step 26372: {'lr': 0.0004672865954717301, 'samples': 5063424, 'steps': 26371, 'loss/train': 1.6107161045074463} -08/30/2021 17:54:06 - INFO - __main__ - Step 26373: {'lr': 0.00046728397094626217, 'samples': 5063616, 'steps': 26372, 'loss/train': 1.6851725578308105} -08/30/2021 17:54:06 - INFO - __main__ - Step 26374: {'lr': 0.0004672813463228894, 'samples': 5063808, 'steps': 26373, 'loss/train': 1.5158199071884155} -08/30/2021 17:54:07 - INFO - __main__ - Step 26375: {'lr': 0.00046727872160161305, 'samples': 5064000, 'steps': 26374, 'loss/train': 1.4802353382110596} -08/30/2021 17:54:09 - INFO - __main__ - Step 26376: {'lr': 0.0004672760967824342, 'samples': 5064192, 'steps': 26375, 'loss/train': 1.8279871940612793} -08/30/2021 17:54:09 - INFO - __main__ - Step 26377: {'lr': 0.0004672734718653541, 'samples': 5064384, 'steps': 26376, 'loss/train': 0.11590936779975891} -08/30/2021 17:54:10 - INFO - __main__ - Step 26378: {'lr': 0.00046727084685037394, 'samples': 5064576, 'steps': 26377, 'loss/train': 3.5200276374816895} -08/30/2021 17:54:10 - INFO - __main__ - Step 26379: {'lr': 0.00046726822173749497, 'samples': 5064768, 'steps': 26378, 'loss/train': 1.3514212369918823} -08/30/2021 17:54:11 - INFO - __main__ - Step 26380: {'lr': 0.0004672655965267182, 'samples': 5064960, 'steps': 26379, 'loss/train': 1.2324953079223633} -08/30/2021 17:54:12 - INFO - __main__ - Step 26381: {'lr': 0.0004672629712180448, 'samples': 5065152, 'steps': 26380, 'loss/train': 1.6526532173156738} -08/30/2021 17:54:13 - INFO - __main__ - Step 26382: {'lr': 0.00046726034581147624, 'samples': 5065344, 'steps': 26381, 'loss/train': 0.951452910900116} -08/30/2021 17:54:13 - INFO - __main__ - Step 26383: {'lr': 0.0004672577203070135, 'samples': 5065536, 'steps': 26382, 'loss/train': 1.8518738746643066} -08/30/2021 17:54:13 - INFO - __main__ - Step 26384: {'lr': 0.0004672550947046577, 'samples': 5065728, 'steps': 26383, 'loss/train': 0.9917610883712769} -08/30/2021 17:54:14 - INFO - __main__ - Step 26385: {'lr': 0.0004672524690044102, 'samples': 5065920, 'steps': 26384, 'loss/train': 2.4184682369232178} -08/30/2021 17:54:14 - INFO - __main__ - Step 26386: {'lr': 0.000467249843206272, 'samples': 5066112, 'steps': 26385, 'loss/train': 1.4285353422164917} -08/30/2021 17:54:15 - INFO - __main__ - Step 26387: {'lr': 0.00046724721731024446, 'samples': 5066304, 'steps': 26386, 'loss/train': 1.8097509145736694} -08/30/2021 17:54:16 - INFO - __main__ - Step 26388: {'lr': 0.00046724459131632854, 'samples': 5066496, 'steps': 26387, 'loss/train': 1.3934749364852905} -08/30/2021 17:54:16 - INFO - __main__ - Step 26389: {'lr': 0.00046724196522452565, 'samples': 5066688, 'steps': 26388, 'loss/train': 1.9031007289886475} -08/30/2021 17:54:17 - INFO - __main__ - Step 26390: {'lr': 0.00046723933903483687, 'samples': 5066880, 'steps': 26389, 'loss/train': 1.7344425916671753} -08/30/2021 17:54:17 - INFO - __main__ - Step 26391: {'lr': 0.00046723671274726344, 'samples': 5067072, 'steps': 26390, 'loss/train': 1.6269930601119995} -08/30/2021 17:54:18 - INFO - __main__ - Step 26392: {'lr': 0.00046723408636180645, 'samples': 5067264, 'steps': 26391, 'loss/train': 1.904179334640503} -08/30/2021 17:54:19 - INFO - __main__ - Step 26393: {'lr': 0.00046723145987846715, 'samples': 5067456, 'steps': 26392, 'loss/train': 1.6348963975906372} -08/30/2021 17:54:19 - INFO - __main__ - Step 26394: {'lr': 0.00046722883329724667, 'samples': 5067648, 'steps': 26393, 'loss/train': 1.3784867525100708} -08/30/2021 17:54:19 - INFO - __main__ - Step 26395: {'lr': 0.0004672262066181463, 'samples': 5067840, 'steps': 26394, 'loss/train': 1.7997623682022095} -08/30/2021 17:54:20 - INFO - __main__ - Step 26396: {'lr': 0.00046722357984116717, 'samples': 5068032, 'steps': 26395, 'loss/train': 1.4385432004928589} -08/30/2021 17:54:21 - INFO - __main__ - Step 26397: {'lr': 0.0004672209529663103, 'samples': 5068224, 'steps': 26396, 'loss/train': 1.9246010780334473} -08/30/2021 17:54:22 - INFO - __main__ - Step 26398: {'lr': 0.00046721832599357717, 'samples': 5068416, 'steps': 26397, 'loss/train': 1.470102071762085} -08/30/2021 17:54:22 - INFO - __main__ - Step 26399: {'lr': 0.00046721569892296875, 'samples': 5068608, 'steps': 26398, 'loss/train': 1.6469706296920776} -08/30/2021 17:54:22 - INFO - __main__ - Step 26400: {'lr': 0.00046721307175448626, 'samples': 5068800, 'steps': 26399, 'loss/train': 1.223879337310791} -08/30/2021 17:54:23 - INFO - __main__ - Step 26401: {'lr': 0.000467210444488131, 'samples': 5068992, 'steps': 26400, 'loss/train': 0.6934109330177307} -08/30/2021 17:54:25 - INFO - __main__ - Step 26402: {'lr': 0.000467207817123904, 'samples': 5069184, 'steps': 26401, 'loss/train': 1.8567276000976562} -08/30/2021 17:54:25 - INFO - __main__ - Step 26403: {'lr': 0.0004672051896618065, 'samples': 5069376, 'steps': 26402, 'loss/train': 0.9742704033851624} -08/30/2021 17:54:25 - INFO - __main__ - Step 26404: {'lr': 0.0004672025621018397, 'samples': 5069568, 'steps': 26403, 'loss/train': 0.0499262660741806} -08/30/2021 17:54:26 - INFO - __main__ - Step 26405: {'lr': 0.00046719993444400477, 'samples': 5069760, 'steps': 26404, 'loss/train': 1.4353646039962769} -08/30/2021 17:54:26 - INFO - __main__ - Step 26406: {'lr': 0.00046719730668830293, 'samples': 5069952, 'steps': 26405, 'loss/train': 1.8499877452850342} -08/30/2021 17:54:27 - INFO - __main__ - Step 26407: {'lr': 0.0004671946788347353, 'samples': 5070144, 'steps': 26406, 'loss/train': 1.4248777627944946} -08/30/2021 17:54:27 - INFO - __main__ - Step 26408: {'lr': 0.00046719205088330317, 'samples': 5070336, 'steps': 26407, 'loss/train': 1.6838206052780151} -08/30/2021 17:54:28 - INFO - __main__ - Step 26409: {'lr': 0.0004671894228340076, 'samples': 5070528, 'steps': 26408, 'loss/train': 1.920997977256775} -08/30/2021 17:54:29 - INFO - __main__ - Step 26410: {'lr': 0.0004671867946868499, 'samples': 5070720, 'steps': 26409, 'loss/train': 1.8226802349090576} -08/30/2021 17:54:29 - INFO - __main__ - Step 26411: {'lr': 0.000467184166441831, 'samples': 5070912, 'steps': 26410, 'loss/train': 1.7642099857330322} -08/30/2021 17:54:29 - INFO - __main__ - Step 26412: {'lr': 0.0004671815380989525, 'samples': 5071104, 'steps': 26411, 'loss/train': 0.9808248281478882} -08/30/2021 17:54:30 - INFO - __main__ - Step 26413: {'lr': 0.0004671789096582152, 'samples': 5071296, 'steps': 26412, 'loss/train': 1.769890546798706} -08/30/2021 17:54:32 - INFO - __main__ - Step 26414: {'lr': 0.00046717628111962045, 'samples': 5071488, 'steps': 26413, 'loss/train': 1.6621394157409668} -08/30/2021 17:54:32 - INFO - __main__ - Step 26415: {'lr': 0.00046717365248316947, 'samples': 5071680, 'steps': 26414, 'loss/train': 1.7568658590316772} -08/30/2021 17:54:33 - INFO - __main__ - Step 26416: {'lr': 0.00046717102374886334, 'samples': 5071872, 'steps': 26415, 'loss/train': 0.8884730935096741} -08/30/2021 17:54:33 - INFO - __main__ - Step 26417: {'lr': 0.0004671683949167033, 'samples': 5072064, 'steps': 26416, 'loss/train': 1.5018233060836792} -08/30/2021 17:54:33 - INFO - __main__ - Step 26418: {'lr': 0.0004671657659866906, 'samples': 5072256, 'steps': 26417, 'loss/train': 2.1330373287200928} -08/30/2021 17:54:34 - INFO - __main__ - Step 26419: {'lr': 0.00046716313695882626, 'samples': 5072448, 'steps': 26418, 'loss/train': 0.3153764307498932} -08/30/2021 17:54:36 - INFO - __main__ - Step 26420: {'lr': 0.00046716050783311166, 'samples': 5072640, 'steps': 26419, 'loss/train': 0.04831329733133316} -08/30/2021 17:54:36 - INFO - __main__ - Step 26421: {'lr': 0.00046715787860954785, 'samples': 5072832, 'steps': 26420, 'loss/train': 1.573830008506775} -08/30/2021 17:54:36 - INFO - __main__ - Step 26422: {'lr': 0.000467155249288136, 'samples': 5073024, 'steps': 26421, 'loss/train': 1.1698150634765625} -08/30/2021 17:54:37 - INFO - __main__ - Step 26423: {'lr': 0.00046715261986887734, 'samples': 5073216, 'steps': 26422, 'loss/train': 1.5478065013885498} -08/30/2021 17:54:37 - INFO - __main__ - Step 26424: {'lr': 0.0004671499903517732, 'samples': 5073408, 'steps': 26423, 'loss/train': 1.3033256530761719} -08/30/2021 17:54:39 - INFO - __main__ - Step 26425: {'lr': 0.00046714736073682453, 'samples': 5073600, 'steps': 26424, 'loss/train': 0.21836160123348236} -08/30/2021 17:54:39 - INFO - __main__ - Step 26426: {'lr': 0.00046714473102403255, 'samples': 5073792, 'steps': 26425, 'loss/train': 1.481293797492981} -08/30/2021 17:54:39 - INFO - __main__ - Step 26427: {'lr': 0.0004671421012133986, 'samples': 5073984, 'steps': 26426, 'loss/train': 1.5887008905410767} -08/30/2021 17:54:40 - INFO - __main__ - Step 26428: {'lr': 0.00046713947130492373, 'samples': 5074176, 'steps': 26427, 'loss/train': 1.770939826965332} -08/30/2021 17:54:40 - INFO - __main__ - Step 26429: {'lr': 0.0004671368412986091, 'samples': 5074368, 'steps': 26428, 'loss/train': 1.5196409225463867} -08/30/2021 17:54:43 - INFO - __main__ - Step 26430: {'lr': 0.0004671342111944561, 'samples': 5074560, 'steps': 26429, 'loss/train': 1.2715877294540405} -08/30/2021 17:54:44 - INFO - __main__ - Step 26431: {'lr': 0.00046713158099246564, 'samples': 5074752, 'steps': 26430, 'loss/train': 1.879807710647583} -08/30/2021 17:54:44 - INFO - __main__ - Step 26432: {'lr': 0.00046712895069263917, 'samples': 5074944, 'steps': 26431, 'loss/train': 1.8316450119018555} -08/30/2021 17:54:44 - INFO - __main__ - Step 26433: {'lr': 0.00046712632029497766, 'samples': 5075136, 'steps': 26432, 'loss/train': 1.1785908937454224} -08/30/2021 17:54:45 - INFO - __main__ - Step 26434: {'lr': 0.0004671236897994824, 'samples': 5075328, 'steps': 26433, 'loss/train': 1.2271547317504883} -08/30/2021 17:54:45 - INFO - __main__ - Step 26435: {'lr': 0.00046712105920615455, 'samples': 5075520, 'steps': 26434, 'loss/train': 2.026353120803833} -08/30/2021 17:54:45 - INFO - __main__ - Step 26436: {'lr': 0.00046711842851499533, 'samples': 5075712, 'steps': 26435, 'loss/train': 3.067622661590576} -08/30/2021 17:54:46 - INFO - __main__ - Step 26437: {'lr': 0.0004671157977260059, 'samples': 5075904, 'steps': 26436, 'loss/train': 1.6393345594406128} -08/30/2021 17:54:47 - INFO - __main__ - Step 26438: {'lr': 0.0004671131668391874, 'samples': 5076096, 'steps': 26437, 'loss/train': 0.8563994765281677} -08/30/2021 17:54:48 - INFO - __main__ - Step 26439: {'lr': 0.00046711053585454104, 'samples': 5076288, 'steps': 26438, 'loss/train': 1.2317432165145874} -08/30/2021 17:54:48 - INFO - __main__ - Step 26440: {'lr': 0.0004671079047720681, 'samples': 5076480, 'steps': 26439, 'loss/train': 1.503592610359192} -08/30/2021 17:54:49 - INFO - __main__ - Step 26441: {'lr': 0.00046710527359176957, 'samples': 5076672, 'steps': 26440, 'loss/train': 1.7058897018432617} -08/30/2021 17:54:49 - INFO - __main__ - Step 26442: {'lr': 0.0004671026423136469, 'samples': 5076864, 'steps': 26441, 'loss/train': 1.1538952589035034} -08/30/2021 17:54:50 - INFO - __main__ - Step 26443: {'lr': 0.00046710001093770107, 'samples': 5077056, 'steps': 26442, 'loss/train': 1.1952552795410156} -08/30/2021 17:54:51 - INFO - __main__ - Step 26444: {'lr': 0.0004670973794639333, 'samples': 5077248, 'steps': 26443, 'loss/train': 1.5073482990264893} -08/30/2021 17:54:51 - INFO - __main__ - Step 26445: {'lr': 0.0004670947478923447, 'samples': 5077440, 'steps': 26444, 'loss/train': 1.3746172189712524} -08/30/2021 17:54:52 - INFO - __main__ - Step 26446: {'lr': 0.00046709211622293677, 'samples': 5077632, 'steps': 26445, 'loss/train': 1.3588981628417969} -08/30/2021 17:54:52 - INFO - __main__ - Step 26447: {'lr': 0.00046708948445571037, 'samples': 5077824, 'steps': 26446, 'loss/train': 1.8258367776870728} -08/30/2021 17:54:54 - INFO - __main__ - Step 26448: {'lr': 0.0004670868525906668, 'samples': 5078016, 'steps': 26447, 'loss/train': 1.0081768035888672} -08/30/2021 17:54:55 - INFO - __main__ - Step 26449: {'lr': 0.00046708422062780725, 'samples': 5078208, 'steps': 26448, 'loss/train': 1.5623821020126343} -08/30/2021 17:54:55 - INFO - __main__ - Step 26450: {'lr': 0.0004670815885671329, 'samples': 5078400, 'steps': 26449, 'loss/train': 1.381220817565918} -08/30/2021 17:54:56 - INFO - __main__ - Step 26451: {'lr': 0.00046707895640864494, 'samples': 5078592, 'steps': 26450, 'loss/train': 0.7613924145698547} -08/30/2021 17:54:56 - INFO - __main__ - Step 26452: {'lr': 0.0004670763241523446, 'samples': 5078784, 'steps': 26451, 'loss/train': 0.6841173768043518} -08/30/2021 17:54:56 - INFO - __main__ - Step 26453: {'lr': 0.00046707369179823294, 'samples': 5078976, 'steps': 26452, 'loss/train': 0.5758198499679565} -08/30/2021 17:54:57 - INFO - __main__ - Step 26454: {'lr': 0.00046707105934631123, 'samples': 5079168, 'steps': 26453, 'loss/train': 0.5321375727653503} -08/30/2021 17:54:58 - INFO - __main__ - Step 26455: {'lr': 0.00046706842679658067, 'samples': 5079360, 'steps': 26454, 'loss/train': 1.0598952770233154} -08/30/2021 17:54:59 - INFO - __main__ - Step 26456: {'lr': 0.0004670657941490425, 'samples': 5079552, 'steps': 26455, 'loss/train': 0.2264997810125351} -08/30/2021 17:54:59 - INFO - __main__ - Step 26457: {'lr': 0.00046706316140369774, 'samples': 5079744, 'steps': 26456, 'loss/train': 1.4735705852508545} -08/30/2021 17:54:59 - INFO - __main__ - Step 26458: {'lr': 0.0004670605285605477, 'samples': 5079936, 'steps': 26457, 'loss/train': 1.39555025100708} -08/30/2021 17:55:00 - INFO - __main__ - Step 26459: {'lr': 0.0004670578956195935, 'samples': 5080128, 'steps': 26458, 'loss/train': 1.5469558238983154} -08/30/2021 17:55:01 - INFO - __main__ - Step 26460: {'lr': 0.00046705526258083643, 'samples': 5080320, 'steps': 26459, 'loss/train': 1.3662614822387695} -08/30/2021 17:55:02 - INFO - __main__ - Step 26461: {'lr': 0.0004670526294442775, 'samples': 5080512, 'steps': 26460, 'loss/train': 1.7535197734832764} -08/30/2021 17:55:02 - INFO - __main__ - Step 26462: {'lr': 0.0004670499962099181, 'samples': 5080704, 'steps': 26461, 'loss/train': 2.2103404998779297} -08/30/2021 17:55:02 - INFO - __main__ - Step 26463: {'lr': 0.0004670473628777593, 'samples': 5080896, 'steps': 26462, 'loss/train': 1.1556077003479004} -08/30/2021 17:55:03 - INFO - __main__ - Step 26464: {'lr': 0.0004670447294478023, 'samples': 5081088, 'steps': 26463, 'loss/train': 1.4666619300842285} -08/30/2021 17:55:04 - INFO - __main__ - Step 26465: {'lr': 0.0004670420959200483, 'samples': 5081280, 'steps': 26464, 'loss/train': 1.7490825653076172} -08/30/2021 17:55:05 - INFO - __main__ - Step 26466: {'lr': 0.00046703946229449846, 'samples': 5081472, 'steps': 26465, 'loss/train': 1.3428783416748047} -08/30/2021 17:55:05 - INFO - __main__ - Step 26467: {'lr': 0.00046703682857115406, 'samples': 5081664, 'steps': 26466, 'loss/train': 1.2313660383224487} -08/30/2021 17:55:06 - INFO - __main__ - Step 26468: {'lr': 0.0004670341947500161, 'samples': 5081856, 'steps': 26467, 'loss/train': 1.5175172090530396} -08/30/2021 17:55:06 - INFO - __main__ - Step 26469: {'lr': 0.00046703156083108597, 'samples': 5082048, 'steps': 26468, 'loss/train': 1.4003242254257202} -08/30/2021 17:55:07 - INFO - __main__ - Step 26470: {'lr': 0.0004670289268143647, 'samples': 5082240, 'steps': 26469, 'loss/train': 0.4863508343696594} -08/30/2021 17:55:08 - INFO - __main__ - Step 26471: {'lr': 0.0004670262926998536, 'samples': 5082432, 'steps': 26470, 'loss/train': 1.4212708473205566} -08/30/2021 17:55:08 - INFO - __main__ - Step 26472: {'lr': 0.00046702365848755377, 'samples': 5082624, 'steps': 26471, 'loss/train': 1.6410430669784546} -08/30/2021 17:55:08 - INFO - __main__ - Step 26473: {'lr': 0.0004670210241774664, 'samples': 5082816, 'steps': 26472, 'loss/train': 1.008784294128418} -08/30/2021 17:55:09 - INFO - __main__ - Step 26474: {'lr': 0.0004670183897695928, 'samples': 5083008, 'steps': 26473, 'loss/train': 1.7928823232650757} -08/30/2021 17:55:10 - INFO - __main__ - Step 26475: {'lr': 0.00046701575526393395, 'samples': 5083200, 'steps': 26474, 'loss/train': 1.339598536491394} -08/30/2021 17:55:11 - INFO - __main__ - Step 26476: {'lr': 0.00046701312066049126, 'samples': 5083392, 'steps': 26475, 'loss/train': 1.4918270111083984} -08/30/2021 17:55:11 - INFO - __main__ - Step 26477: {'lr': 0.00046701048595926574, 'samples': 5083584, 'steps': 26476, 'loss/train': 2.120662212371826} -08/30/2021 17:55:12 - INFO - __main__ - Step 26478: {'lr': 0.00046700785116025867, 'samples': 5083776, 'steps': 26477, 'loss/train': 1.672579050064087} -08/30/2021 17:55:12 - INFO - __main__ - Step 26479: {'lr': 0.0004670052162634712, 'samples': 5083968, 'steps': 26478, 'loss/train': 1.7572641372680664} -08/30/2021 17:55:12 - INFO - __main__ - Step 26480: {'lr': 0.0004670025812689045, 'samples': 5084160, 'steps': 26479, 'loss/train': 1.507641315460205} -08/30/2021 17:55:14 - INFO - __main__ - Step 26481: {'lr': 0.00046699994617655985, 'samples': 5084352, 'steps': 26480, 'loss/train': 1.281359314918518} -08/30/2021 17:55:14 - INFO - __main__ - Step 26482: {'lr': 0.0004669973109864383, 'samples': 5084544, 'steps': 26481, 'loss/train': 1.397874116897583} -08/30/2021 17:55:14 - INFO - __main__ - Step 26483: {'lr': 0.00046699467569854115, 'samples': 5084736, 'steps': 26482, 'loss/train': 1.1106603145599365} -08/30/2021 17:55:15 - INFO - __main__ - Step 26484: {'lr': 0.0004669920403128696, 'samples': 5084928, 'steps': 26483, 'loss/train': 1.7543003559112549} -08/30/2021 17:55:15 - INFO - __main__ - Step 26485: {'lr': 0.00046698940482942466, 'samples': 5085120, 'steps': 26484, 'loss/train': 1.2458912134170532} -08/30/2021 17:55:17 - INFO - __main__ - Step 26486: {'lr': 0.0004669867692482077, 'samples': 5085312, 'steps': 26485, 'loss/train': 1.9360105991363525} -08/30/2021 17:55:18 - INFO - __main__ - Step 26487: {'lr': 0.00046698413356921985, 'samples': 5085504, 'steps': 26486, 'loss/train': 0.9060123562812805} -08/30/2021 17:55:18 - INFO - __main__ - Step 26488: {'lr': 0.00046698149779246235, 'samples': 5085696, 'steps': 26487, 'loss/train': 1.7709970474243164} -08/30/2021 17:55:18 - INFO - __main__ - Step 26489: {'lr': 0.0004669788619179363, 'samples': 5085888, 'steps': 26488, 'loss/train': 1.8481642007827759} -08/30/2021 17:55:19 - INFO - __main__ - Step 26490: {'lr': 0.0004669762259456429, 'samples': 5086080, 'steps': 26489, 'loss/train': 1.6907516717910767} -08/30/2021 17:55:20 - INFO - __main__ - Step 26491: {'lr': 0.00046697358987558336, 'samples': 5086272, 'steps': 26490, 'loss/train': 1.2334203720092773} -08/30/2021 17:55:21 - INFO - __main__ - Step 26492: {'lr': 0.0004669709537077589, 'samples': 5086464, 'steps': 26491, 'loss/train': 1.840136170387268} -08/30/2021 17:55:21 - INFO - __main__ - Step 26493: {'lr': 0.00046696831744217065, 'samples': 5086656, 'steps': 26492, 'loss/train': 0.9647053480148315} -08/30/2021 17:55:21 - INFO - __main__ - Step 26494: {'lr': 0.0004669656810788199, 'samples': 5086848, 'steps': 26493, 'loss/train': 1.555384635925293} -08/30/2021 17:55:22 - INFO - __main__ - Step 26495: {'lr': 0.0004669630446177077, 'samples': 5087040, 'steps': 26494, 'loss/train': 0.9002858400344849} -08/30/2021 17:55:24 - INFO - __main__ - Step 26496: {'lr': 0.0004669604080588352, 'samples': 5087232, 'steps': 26495, 'loss/train': 2.0909271240234375} -08/30/2021 17:55:24 - INFO - __main__ - Step 26497: {'lr': 0.0004669577714022039, 'samples': 5087424, 'steps': 26496, 'loss/train': 1.7274521589279175} -08/30/2021 17:55:24 - INFO - __main__ - Step 26498: {'lr': 0.00046695513464781456, 'samples': 5087616, 'steps': 26497, 'loss/train': 1.4134820699691772} -08/30/2021 17:55:25 - INFO - __main__ - Step 26499: {'lr': 0.00046695249779566875, 'samples': 5087808, 'steps': 26498, 'loss/train': 1.7090868949890137} -08/30/2021 17:55:25 - INFO - __main__ - Step 26500: {'lr': 0.0004669498608457674, 'samples': 5088000, 'steps': 26499, 'loss/train': 2.725168466567993} -08/30/2021 17:55:25 - INFO - __main__ - Step 26501: {'lr': 0.0004669472237981118, 'samples': 5088192, 'steps': 26500, 'loss/train': 1.5974403619766235} -08/30/2021 17:55:27 - INFO - __main__ - Step 26502: {'lr': 0.00046694458665270315, 'samples': 5088384, 'steps': 26501, 'loss/train': 1.7336952686309814} -08/30/2021 17:55:28 - INFO - __main__ - Step 26503: {'lr': 0.0004669419494095426, 'samples': 5088576, 'steps': 26502, 'loss/train': 1.2236595153808594} -08/30/2021 17:55:28 - INFO - __main__ - Step 26504: {'lr': 0.0004669393120686314, 'samples': 5088768, 'steps': 26503, 'loss/train': 1.8604410886764526} -08/30/2021 17:55:28 - INFO - __main__ - Step 26505: {'lr': 0.0004669366746299707, 'samples': 5088960, 'steps': 26504, 'loss/train': 4.852655410766602} -08/30/2021 17:55:29 - INFO - __main__ - Step 26506: {'lr': 0.00046693403709356163, 'samples': 5089152, 'steps': 26505, 'loss/train': 1.74601149559021} -08/30/2021 17:55:29 - INFO - __main__ - Step 26507: {'lr': 0.00046693139945940546, 'samples': 5089344, 'steps': 26506, 'loss/train': 1.7411202192306519} -08/30/2021 17:55:31 - INFO - __main__ - Step 26508: {'lr': 0.0004669287617275033, 'samples': 5089536, 'steps': 26507, 'loss/train': 2.4722275733947754} -08/30/2021 17:55:31 - INFO - __main__ - Step 26509: {'lr': 0.0004669261238978564, 'samples': 5089728, 'steps': 26508, 'loss/train': 1.3681408166885376} -08/30/2021 17:55:31 - INFO - __main__ - Step 26510: {'lr': 0.00046692348597046596, 'samples': 5089920, 'steps': 26509, 'loss/train': 1.345752239227295} -08/30/2021 17:55:32 - INFO - __main__ - Step 26511: {'lr': 0.0004669208479453332, 'samples': 5090112, 'steps': 26510, 'loss/train': 1.8200063705444336} -08/30/2021 17:55:32 - INFO - __main__ - Step 26512: {'lr': 0.00046691820982245913, 'samples': 5090304, 'steps': 26511, 'loss/train': 1.7139945030212402} -08/30/2021 17:55:34 - INFO - __main__ - Step 26513: {'lr': 0.00046691557160184516, 'samples': 5090496, 'steps': 26512, 'loss/train': 1.4040721654891968} -08/30/2021 17:55:34 - INFO - __main__ - Step 26514: {'lr': 0.0004669129332834923, 'samples': 5090688, 'steps': 26513, 'loss/train': 1.6137622594833374} -08/30/2021 17:55:34 - INFO - __main__ - Step 26515: {'lr': 0.0004669102948674019, 'samples': 5090880, 'steps': 26514, 'loss/train': 1.3544131517410278} -08/30/2021 17:55:35 - INFO - __main__ - Step 26516: {'lr': 0.000466907656353575, 'samples': 5091072, 'steps': 26515, 'loss/train': 1.6316208839416504} -08/30/2021 17:55:35 - INFO - __main__ - Step 26517: {'lr': 0.0004669050177420129, 'samples': 5091264, 'steps': 26516, 'loss/train': 1.7549480199813843} -08/30/2021 17:55:35 - INFO - __main__ - Step 26518: {'lr': 0.0004669023790327168, 'samples': 5091456, 'steps': 26517, 'loss/train': 1.9351155757904053} -08/30/2021 17:55:37 - INFO - __main__ - Step 26519: {'lr': 0.0004668997402256877, 'samples': 5091648, 'steps': 26518, 'loss/train': 1.75971519947052} -08/30/2021 17:55:37 - INFO - __main__ - Step 26520: {'lr': 0.00046689710132092704, 'samples': 5091840, 'steps': 26519, 'loss/train': 1.475289225578308} -08/30/2021 17:55:38 - INFO - __main__ - Step 26521: {'lr': 0.00046689446231843585, 'samples': 5092032, 'steps': 26520, 'loss/train': 0.4546389579772949} -08/30/2021 17:55:38 - INFO - __main__ - Step 26522: {'lr': 0.0004668918232182153, 'samples': 5092224, 'steps': 26521, 'loss/train': 1.20957612991333} -08/30/2021 17:55:38 - INFO - __main__ - Step 26523: {'lr': 0.0004668891840202668, 'samples': 5092416, 'steps': 26522, 'loss/train': 1.6378568410873413} -08/30/2021 17:55:40 - INFO - __main__ - Step 26524: {'lr': 0.00046688654472459124, 'samples': 5092608, 'steps': 26523, 'loss/train': 1.5544283390045166} -08/30/2021 17:55:41 - INFO - __main__ - Step 26525: {'lr': 0.00046688390533119003, 'samples': 5092800, 'steps': 26524, 'loss/train': 1.7190724611282349} -08/30/2021 17:55:41 - INFO - __main__ - Step 26526: {'lr': 0.00046688126584006425, 'samples': 5092992, 'steps': 26525, 'loss/train': 2.415898323059082} -08/30/2021 17:55:41 - INFO - __main__ - Step 26527: {'lr': 0.00046687862625121505, 'samples': 5093184, 'steps': 26526, 'loss/train': 1.759015679359436} -08/30/2021 17:55:42 - INFO - __main__ - Step 26528: {'lr': 0.0004668759865646438, 'samples': 5093376, 'steps': 26527, 'loss/train': 0.3155175745487213} -08/30/2021 17:55:43 - INFO - __main__ - Step 26529: {'lr': 0.00046687334678035153, 'samples': 5093568, 'steps': 26528, 'loss/train': 1.1815344095230103} -08/30/2021 17:55:44 - INFO - __main__ - Step 26530: {'lr': 0.00046687070689833943, 'samples': 5093760, 'steps': 26529, 'loss/train': 1.4764231443405151} -08/30/2021 17:55:44 - INFO - __main__ - Step 26531: {'lr': 0.00046686806691860884, 'samples': 5093952, 'steps': 26530, 'loss/train': 1.9032479524612427} -08/30/2021 17:55:44 - INFO - __main__ - Step 26532: {'lr': 0.00046686542684116073, 'samples': 5094144, 'steps': 26531, 'loss/train': 1.7096304893493652} -08/30/2021 17:55:45 - INFO - __main__ - Step 26533: {'lr': 0.00046686278666599647, 'samples': 5094336, 'steps': 26532, 'loss/train': 1.3388385772705078} -08/30/2021 17:55:46 - INFO - __main__ - Step 26534: {'lr': 0.0004668601463931172, 'samples': 5094528, 'steps': 26533, 'loss/train': 1.315308928489685} -08/30/2021 17:55:47 - INFO - __main__ - Step 26535: {'lr': 0.00046685750602252406, 'samples': 5094720, 'steps': 26534, 'loss/train': 1.5765104293823242} -08/30/2021 17:55:47 - INFO - __main__ - Step 26536: {'lr': 0.0004668548655542183, 'samples': 5094912, 'steps': 26535, 'loss/train': 1.4822983741760254} -08/30/2021 17:55:47 - INFO - __main__ - Step 26537: {'lr': 0.000466852224988201, 'samples': 5095104, 'steps': 26536, 'loss/train': 0.7185746431350708} -08/30/2021 17:55:48 - INFO - __main__ - Step 26538: {'lr': 0.00046684958432447355, 'samples': 5095296, 'steps': 26537, 'loss/train': 1.265125036239624} -08/30/2021 17:55:50 - INFO - __main__ - Step 26539: {'lr': 0.00046684694356303693, 'samples': 5095488, 'steps': 26538, 'loss/train': 1.5037517547607422} -08/30/2021 17:55:50 - INFO - __main__ - Step 26540: {'lr': 0.0004668443027038925, 'samples': 5095680, 'steps': 26539, 'loss/train': 2.094182252883911} -08/30/2021 17:55:50 - INFO - __main__ - Step 26541: {'lr': 0.00046684166174704134, 'samples': 5095872, 'steps': 26540, 'loss/train': 1.6000418663024902} -08/30/2021 17:55:51 - INFO - __main__ - Step 26542: {'lr': 0.00046683902069248465, 'samples': 5096064, 'steps': 26541, 'loss/train': 1.3042372465133667} -08/30/2021 17:55:51 - INFO - __main__ - Step 26543: {'lr': 0.0004668363795402237, 'samples': 5096256, 'steps': 26542, 'loss/train': 1.4274382591247559} -08/30/2021 17:55:53 - INFO - __main__ - Step 26544: {'lr': 0.00046683373829025954, 'samples': 5096448, 'steps': 26543, 'loss/train': 1.6654459238052368} -08/30/2021 17:55:53 - INFO - __main__ - Step 26545: {'lr': 0.0004668310969425935, 'samples': 5096640, 'steps': 26544, 'loss/train': 1.9225696325302124} -08/30/2021 17:55:53 - INFO - __main__ - Step 26546: {'lr': 0.00046682845549722677, 'samples': 5096832, 'steps': 26545, 'loss/train': 1.6828829050064087} -08/30/2021 17:55:54 - INFO - __main__ - Step 26547: {'lr': 0.0004668258139541604, 'samples': 5097024, 'steps': 26546, 'loss/train': 2.350262403488159} -08/30/2021 17:55:54 - INFO - __main__ - Step 26548: {'lr': 0.00046682317231339565, 'samples': 5097216, 'steps': 26547, 'loss/train': 1.8005173206329346} -08/30/2021 17:55:56 - INFO - __main__ - Step 26549: {'lr': 0.00046682053057493377, 'samples': 5097408, 'steps': 26548, 'loss/train': 1.7175638675689697} -08/30/2021 17:55:56 - INFO - __main__ - Step 26550: {'lr': 0.00046681788873877595, 'samples': 5097600, 'steps': 26549, 'loss/train': 1.4173011779785156} -08/30/2021 17:55:57 - INFO - __main__ - Step 26551: {'lr': 0.00046681524680492327, 'samples': 5097792, 'steps': 26550, 'loss/train': 2.0777764320373535} -08/30/2021 17:55:57 - INFO - __main__ - Step 26552: {'lr': 0.00046681260477337693, 'samples': 5097984, 'steps': 26551, 'loss/train': 0.9717393517494202} -08/30/2021 17:55:57 - INFO - __main__ - Step 26553: {'lr': 0.0004668099626441383, 'samples': 5098176, 'steps': 26552, 'loss/train': 4.609521389007568} -08/30/2021 17:55:58 - INFO - __main__ - Step 26554: {'lr': 0.00046680732041720836, 'samples': 5098368, 'steps': 26553, 'loss/train': 1.4219341278076172} -08/30/2021 17:55:59 - INFO - __main__ - Step 26555: {'lr': 0.0004668046780925884, 'samples': 5098560, 'steps': 26554, 'loss/train': 1.711804747581482} -08/30/2021 17:56:00 - INFO - __main__ - Step 26556: {'lr': 0.0004668020356702796, 'samples': 5098752, 'steps': 26555, 'loss/train': 1.7388359308242798} -08/30/2021 17:56:00 - INFO - __main__ - Step 26557: {'lr': 0.0004667993931502832, 'samples': 5098944, 'steps': 26556, 'loss/train': 1.4576250314712524} -08/30/2021 17:56:00 - INFO - __main__ - Step 26558: {'lr': 0.00046679675053260027, 'samples': 5099136, 'steps': 26557, 'loss/train': 2.0638508796691895} -08/30/2021 17:56:01 - INFO - __main__ - Step 26559: {'lr': 0.00046679410781723206, 'samples': 5099328, 'steps': 26558, 'loss/train': 1.4840946197509766} -08/30/2021 17:56:02 - INFO - __main__ - Step 26560: {'lr': 0.0004667914650041799, 'samples': 5099520, 'steps': 26559, 'loss/train': 2.2055389881134033} -08/30/2021 17:56:03 - INFO - __main__ - Step 26561: {'lr': 0.00046678882209344474, 'samples': 5099712, 'steps': 26560, 'loss/train': 1.8977118730545044} -08/30/2021 17:56:03 - INFO - __main__ - Step 26562: {'lr': 0.00046678617908502785, 'samples': 5099904, 'steps': 26561, 'loss/train': 0.975948691368103} -08/30/2021 17:56:04 - INFO - __main__ - Step 26563: {'lr': 0.00046678353597893053, 'samples': 5100096, 'steps': 26562, 'loss/train': 0.4861288368701935} -08/30/2021 17:56:04 - INFO - __main__ - Step 26564: {'lr': 0.0004667808927751539, 'samples': 5100288, 'steps': 26563, 'loss/train': 0.9822503924369812} -08/30/2021 17:56:06 - INFO - __main__ - Step 26565: {'lr': 0.00046677824947369907, 'samples': 5100480, 'steps': 26564, 'loss/train': 1.2419246435165405} -08/30/2021 17:56:06 - INFO - __main__ - Step 26566: {'lr': 0.0004667756060745674, 'samples': 5100672, 'steps': 26565, 'loss/train': 1.6193146705627441} -08/30/2021 17:56:06 - INFO - __main__ - Step 26567: {'lr': 0.0004667729625777599, 'samples': 5100864, 'steps': 26566, 'loss/train': 1.7757670879364014} -08/30/2021 17:56:07 - INFO - __main__ - Step 26568: {'lr': 0.0004667703189832779, 'samples': 5101056, 'steps': 26567, 'loss/train': 1.699609637260437} -08/30/2021 17:56:07 - INFO - __main__ - Step 26569: {'lr': 0.00046676767529112254, 'samples': 5101248, 'steps': 26568, 'loss/train': 1.9243919849395752} -08/30/2021 17:56:07 - INFO - __main__ - Step 26570: {'lr': 0.000466765031501295, 'samples': 5101440, 'steps': 26569, 'loss/train': 1.4580461978912354} -08/30/2021 17:56:09 - INFO - __main__ - Step 26571: {'lr': 0.0004667623876137965, 'samples': 5101632, 'steps': 26570, 'loss/train': 1.9228307008743286} -08/30/2021 17:56:09 - INFO - __main__ - Step 26572: {'lr': 0.00046675974362862815, 'samples': 5101824, 'steps': 26571, 'loss/train': 1.4032305479049683} -08/30/2021 17:56:10 - INFO - __main__ - Step 26573: {'lr': 0.00046675709954579125, 'samples': 5102016, 'steps': 26572, 'loss/train': 1.2667769193649292} -08/30/2021 17:56:10 - INFO - __main__ - Step 26574: {'lr': 0.0004667544553652869, 'samples': 5102208, 'steps': 26573, 'loss/train': 1.661678671836853} -08/30/2021 17:56:10 - INFO - __main__ - Step 26575: {'lr': 0.0004667518110871164, 'samples': 5102400, 'steps': 26574, 'loss/train': 0.1847216784954071} -08/30/2021 17:56:12 - INFO - __main__ - Step 26576: {'lr': 0.0004667491667112809, 'samples': 5102592, 'steps': 26575, 'loss/train': 0.9313610196113586} -08/30/2021 17:56:12 - INFO - __main__ - Step 26577: {'lr': 0.0004667465222377815, 'samples': 5102784, 'steps': 26576, 'loss/train': 1.1827235221862793} -08/30/2021 17:56:13 - INFO - __main__ - Step 26578: {'lr': 0.0004667438776666195, 'samples': 5102976, 'steps': 26577, 'loss/train': 1.0463329553604126} -08/30/2021 17:56:13 - INFO - __main__ - Step 26579: {'lr': 0.00046674123299779603, 'samples': 5103168, 'steps': 26578, 'loss/train': 1.9854336977005005} -08/30/2021 17:56:13 - INFO - __main__ - Step 26580: {'lr': 0.0004667385882313123, 'samples': 5103360, 'steps': 26579, 'loss/train': 0.7418782711029053} -08/30/2021 17:56:15 - INFO - __main__ - Step 26581: {'lr': 0.0004667359433671695, 'samples': 5103552, 'steps': 26580, 'loss/train': 1.5804579257965088} -08/30/2021 17:56:15 - INFO - __main__ - Step 26582: {'lr': 0.0004667332984053689, 'samples': 5103744, 'steps': 26581, 'loss/train': 1.3505744934082031} -08/30/2021 17:56:16 - INFO - __main__ - Step 26583: {'lr': 0.00046673065334591155, 'samples': 5103936, 'steps': 26582, 'loss/train': 1.6267030239105225} -08/30/2021 17:56:16 - INFO - __main__ - Step 26584: {'lr': 0.00046672800818879873, 'samples': 5104128, 'steps': 26583, 'loss/train': 1.9608153104782104} -08/30/2021 17:56:16 - INFO - __main__ - Step 26585: {'lr': 0.0004667253629340316, 'samples': 5104320, 'steps': 26584, 'loss/train': 1.3606011867523193} -08/30/2021 17:56:17 - INFO - __main__ - Step 26586: {'lr': 0.0004667227175816114, 'samples': 5104512, 'steps': 26585, 'loss/train': 1.891992449760437} -08/30/2021 17:56:18 - INFO - __main__ - Step 26587: {'lr': 0.0004667200721315393, 'samples': 5104704, 'steps': 26586, 'loss/train': 1.6568644046783447} -08/30/2021 17:56:19 - INFO - __main__ - Step 26588: {'lr': 0.00046671742658381646, 'samples': 5104896, 'steps': 26587, 'loss/train': 1.5922542810440063} -08/30/2021 17:56:19 - INFO - __main__ - Step 26589: {'lr': 0.000466714780938444, 'samples': 5105088, 'steps': 26588, 'loss/train': 0.1373966485261917} -08/30/2021 17:56:20 - INFO - __main__ - Step 26590: {'lr': 0.0004667121351954233, 'samples': 5105280, 'steps': 26589, 'loss/train': 1.6285159587860107} -08/30/2021 17:56:20 - INFO - __main__ - Step 26591: {'lr': 0.00046670948935475544, 'samples': 5105472, 'steps': 26590, 'loss/train': 1.7560625076293945} -08/30/2021 17:56:21 - INFO - __main__ - Step 26592: {'lr': 0.00046670684341644167, 'samples': 5105664, 'steps': 26591, 'loss/train': 1.802418828010559} -08/30/2021 17:56:22 - INFO - __main__ - Step 26593: {'lr': 0.0004667041973804831, 'samples': 5105856, 'steps': 26592, 'loss/train': 1.8346643447875977} -08/30/2021 17:56:22 - INFO - __main__ - Step 26594: {'lr': 0.00046670155124688096, 'samples': 5106048, 'steps': 26593, 'loss/train': 2.776232957839966} -08/30/2021 17:56:23 - INFO - __main__ - Step 26595: {'lr': 0.00046669890501563636, 'samples': 5106240, 'steps': 26594, 'loss/train': 0.9451594948768616} -08/30/2021 17:56:23 - INFO - __main__ - Step 26596: {'lr': 0.0004666962586867507, 'samples': 5106432, 'steps': 26595, 'loss/train': 1.706702709197998} -08/30/2021 17:56:25 - INFO - __main__ - Step 26597: {'lr': 0.000466693612260225, 'samples': 5106624, 'steps': 26596, 'loss/train': 2.128802537918091} -08/30/2021 17:56:26 - INFO - __main__ - Step 26598: {'lr': 0.00046669096573606053, 'samples': 5106816, 'steps': 26597, 'loss/train': 1.3077977895736694} -08/30/2021 17:56:26 - INFO - __main__ - Step 26599: {'lr': 0.00046668831911425844, 'samples': 5107008, 'steps': 26598, 'loss/train': 0.24058596789836884} -08/30/2021 17:56:26 - INFO - __main__ - Step 26600: {'lr': 0.00046668567239481994, 'samples': 5107200, 'steps': 26599, 'loss/train': 1.5694202184677124} -08/30/2021 17:56:27 - INFO - __main__ - Step 26601: {'lr': 0.0004666830255777462, 'samples': 5107392, 'steps': 26600, 'loss/train': 1.5089735984802246} -08/30/2021 17:56:28 - INFO - __main__ - Step 26602: {'lr': 0.00046668037866303845, 'samples': 5107584, 'steps': 26601, 'loss/train': 1.3394880294799805} -08/30/2021 17:56:29 - INFO - __main__ - Step 26603: {'lr': 0.0004666777316506979, 'samples': 5107776, 'steps': 26602, 'loss/train': 1.7052606344223022} -08/30/2021 17:56:29 - INFO - __main__ - Step 26604: {'lr': 0.00046667508454072566, 'samples': 5107968, 'steps': 26603, 'loss/train': 1.8480103015899658} -08/30/2021 17:56:29 - INFO - __main__ - Step 26605: {'lr': 0.00046667243733312296, 'samples': 5108160, 'steps': 26604, 'loss/train': 1.675742745399475} -08/30/2021 17:56:30 - INFO - __main__ - Step 26606: {'lr': 0.000466669790027891, 'samples': 5108352, 'steps': 26605, 'loss/train': 1.3788155317306519} -08/30/2021 17:56:31 - INFO - __main__ - Step 26607: {'lr': 0.00046666714262503107, 'samples': 5108544, 'steps': 26606, 'loss/train': 1.5237983465194702} -08/30/2021 17:56:32 - INFO - __main__ - Step 26608: {'lr': 0.00046666449512454416, 'samples': 5108736, 'steps': 26607, 'loss/train': 1.323991060256958} -08/30/2021 17:56:32 - INFO - __main__ - Step 26609: {'lr': 0.0004666618475264316, 'samples': 5108928, 'steps': 26608, 'loss/train': 1.3702112436294556} -08/30/2021 17:56:32 - INFO - __main__ - Step 26610: {'lr': 0.0004666591998306946, 'samples': 5109120, 'steps': 26609, 'loss/train': 1.3449513912200928} -08/30/2021 17:56:33 - INFO - __main__ - Step 26611: {'lr': 0.0004666565520373343, 'samples': 5109312, 'steps': 26610, 'loss/train': 1.2981202602386475} -08/30/2021 17:56:33 - INFO - __main__ - Step 26612: {'lr': 0.00046665390414635184, 'samples': 5109504, 'steps': 26611, 'loss/train': 1.5928764343261719} -08/30/2021 17:56:34 - INFO - __main__ - Step 26613: {'lr': 0.0004666512561577485, 'samples': 5109696, 'steps': 26612, 'loss/train': 1.3780946731567383} -08/30/2021 17:56:35 - INFO - __main__ - Step 26614: {'lr': 0.0004666486080715255, 'samples': 5109888, 'steps': 26613, 'loss/train': 1.5655570030212402} -08/30/2021 17:56:35 - INFO - __main__ - Step 26615: {'lr': 0.0004666459598876839, 'samples': 5110080, 'steps': 26614, 'loss/train': 1.0367977619171143} -08/30/2021 17:56:36 - INFO - __main__ - Step 26616: {'lr': 0.000466643311606225, 'samples': 5110272, 'steps': 26615, 'loss/train': 1.6685724258422852} -08/30/2021 17:56:36 - INFO - __main__ - Step 26617: {'lr': 0.00046664066322715006, 'samples': 5110464, 'steps': 26616, 'loss/train': 1.5906468629837036} -08/30/2021 17:56:38 - INFO - __main__ - Step 26618: {'lr': 0.00046663801475046004, 'samples': 5110656, 'steps': 26617, 'loss/train': 1.2674009799957275} -08/30/2021 17:56:38 - INFO - __main__ - Step 26619: {'lr': 0.0004666353661761563, 'samples': 5110848, 'steps': 26618, 'loss/train': 1.5779671669006348} -08/30/2021 17:56:39 - INFO - __main__ - Step 26620: {'lr': 0.0004666327175042401, 'samples': 5111040, 'steps': 26619, 'loss/train': 0.14954562485218048} -08/30/2021 17:56:39 - INFO - __main__ - Step 26621: {'lr': 0.00046663006873471247, 'samples': 5111232, 'steps': 26620, 'loss/train': 1.7937462329864502} -08/30/2021 17:56:39 - INFO - __main__ - Step 26622: {'lr': 0.00046662741986757463, 'samples': 5111424, 'steps': 26621, 'loss/train': 1.360806941986084} -08/30/2021 17:56:41 - INFO - __main__ - Step 26623: {'lr': 0.0004666247709028279, 'samples': 5111616, 'steps': 26622, 'loss/train': 1.251752257347107} -08/30/2021 17:56:41 - INFO - __main__ - Step 26624: {'lr': 0.00046662212184047334, 'samples': 5111808, 'steps': 26623, 'loss/train': 1.4638067483901978} -08/30/2021 17:56:42 - INFO - __main__ - Step 26625: {'lr': 0.0004666194726805122, 'samples': 5112000, 'steps': 26624, 'loss/train': 0.9021357297897339} -08/30/2021 17:56:42 - INFO - __main__ - Step 26626: {'lr': 0.0004666168234229457, 'samples': 5112192, 'steps': 26625, 'loss/train': 2.011953592300415} -08/30/2021 17:56:42 - INFO - __main__ - Step 26627: {'lr': 0.000466614174067775, 'samples': 5112384, 'steps': 26626, 'loss/train': 0.7863146066665649} -08/30/2021 17:56:44 - INFO - __main__ - Step 26628: {'lr': 0.00046661152461500126, 'samples': 5112576, 'steps': 26627, 'loss/train': 2.0708909034729004} -08/30/2021 17:56:45 - INFO - __main__ - Step 26629: {'lr': 0.0004666088750646257, 'samples': 5112768, 'steps': 26628, 'loss/train': 1.9464064836502075} -08/30/2021 17:56:45 - INFO - __main__ - Step 26630: {'lr': 0.0004666062254166496, 'samples': 5112960, 'steps': 26629, 'loss/train': 0.6118735671043396} -08/30/2021 17:56:45 - INFO - __main__ - Step 26631: {'lr': 0.000466603575671074, 'samples': 5113152, 'steps': 26630, 'loss/train': 1.2635018825531006} -08/30/2021 17:56:46 - INFO - __main__ - Step 26632: {'lr': 0.00046660092582790025, 'samples': 5113344, 'steps': 26631, 'loss/train': 1.6213116645812988} -08/30/2021 17:56:46 - INFO - __main__ - Step 26633: {'lr': 0.0004665982758871294, 'samples': 5113536, 'steps': 26632, 'loss/train': 1.2657393217086792} -08/30/2021 17:56:48 - INFO - __main__ - Step 26634: {'lr': 0.0004665956258487627, 'samples': 5113728, 'steps': 26633, 'loss/train': 1.2259384393692017} -08/30/2021 17:56:48 - INFO - __main__ - Step 26635: {'lr': 0.0004665929757128014, 'samples': 5113920, 'steps': 26634, 'loss/train': 1.1367225646972656} -08/30/2021 17:56:48 - INFO - __main__ - Step 26636: {'lr': 0.0004665903254792466, 'samples': 5114112, 'steps': 26635, 'loss/train': 1.2556160688400269} -08/30/2021 17:56:49 - INFO - __main__ - Step 26637: {'lr': 0.0004665876751480996, 'samples': 5114304, 'steps': 26636, 'loss/train': 1.492944359779358} -08/30/2021 17:56:49 - INFO - __main__ - Step 26638: {'lr': 0.0004665850247193615, 'samples': 5114496, 'steps': 26637, 'loss/train': 1.5703942775726318} -08/30/2021 17:56:51 - INFO - __main__ - Step 26639: {'lr': 0.0004665823741930335, 'samples': 5114688, 'steps': 26638, 'loss/train': 1.1665278673171997} -08/30/2021 17:56:51 - INFO - __main__ - Step 26640: {'lr': 0.00046657972356911696, 'samples': 5114880, 'steps': 26639, 'loss/train': 0.4462893307209015} -08/30/2021 17:56:51 - INFO - __main__ - Step 26641: {'lr': 0.00046657707284761274, 'samples': 5115072, 'steps': 26640, 'loss/train': 1.648575782775879} -08/30/2021 17:56:52 - INFO - __main__ - Step 26642: {'lr': 0.0004665744220285224, 'samples': 5115264, 'steps': 26641, 'loss/train': 1.681076169013977} -08/30/2021 17:56:52 - INFO - __main__ - Step 26643: {'lr': 0.0004665717711118469, 'samples': 5115456, 'steps': 26642, 'loss/train': 2.1270596981048584} -08/30/2021 17:56:54 - INFO - __main__ - Step 26644: {'lr': 0.00046656912009758743, 'samples': 5115648, 'steps': 26643, 'loss/train': 1.60477614402771} -08/30/2021 17:56:54 - INFO - __main__ - Step 26645: {'lr': 0.0004665664689857454, 'samples': 5115840, 'steps': 26644, 'loss/train': 1.2852739095687866} -08/30/2021 17:56:55 - INFO - __main__ - Step 26646: {'lr': 0.00046656381777632173, 'samples': 5116032, 'steps': 26645, 'loss/train': 1.433002233505249} -08/30/2021 17:56:55 - INFO - __main__ - Step 26647: {'lr': 0.0004665611664693178, 'samples': 5116224, 'steps': 26646, 'loss/train': 0.8877944350242615} -08/30/2021 17:56:55 - INFO - __main__ - Step 26648: {'lr': 0.0004665585150647348, 'samples': 5116416, 'steps': 26647, 'loss/train': 0.9069812893867493} -08/30/2021 17:56:57 - INFO - __main__ - Step 26649: {'lr': 0.0004665558635625738, 'samples': 5116608, 'steps': 26648, 'loss/train': 1.624466896057129} -08/30/2021 17:56:57 - INFO - __main__ - Step 26650: {'lr': 0.00046655321196283604, 'samples': 5116800, 'steps': 26649, 'loss/train': 1.2025951147079468} -08/30/2021 17:56:58 - INFO - __main__ - Step 26651: {'lr': 0.00046655056026552287, 'samples': 5116992, 'steps': 26650, 'loss/train': 1.448067307472229} -08/30/2021 17:56:58 - INFO - __main__ - Step 26652: {'lr': 0.0004665479084706353, 'samples': 5117184, 'steps': 26651, 'loss/train': 1.4956330060958862} -08/30/2021 17:56:58 - INFO - __main__ - Step 26653: {'lr': 0.00046654525657817457, 'samples': 5117376, 'steps': 26652, 'loss/train': 1.2684885263442993} -08/30/2021 17:57:00 - INFO - __main__ - Step 26654: {'lr': 0.0004665426045881419, 'samples': 5117568, 'steps': 26653, 'loss/train': 1.571487307548523} -08/30/2021 17:57:01 - INFO - __main__ - Step 26655: {'lr': 0.00046653995250053843, 'samples': 5117760, 'steps': 26654, 'loss/train': 1.648902416229248} -08/30/2021 17:57:01 - INFO - __main__ - Step 26656: {'lr': 0.00046653730031536545, 'samples': 5117952, 'steps': 26655, 'loss/train': 0.6627792119979858} -08/30/2021 17:57:02 - INFO - __main__ - Step 26657: {'lr': 0.0004665346480326241, 'samples': 5118144, 'steps': 26656, 'loss/train': 1.4905503988265991} -08/30/2021 17:57:02 - INFO - __main__ - Step 26658: {'lr': 0.00046653199565231554, 'samples': 5118336, 'steps': 26657, 'loss/train': 1.935055136680603} -08/30/2021 17:57:03 - INFO - __main__ - Step 26659: {'lr': 0.00046652934317444104, 'samples': 5118528, 'steps': 26658, 'loss/train': 1.2012574672698975} -08/30/2021 17:57:04 - INFO - __main__ - Step 26660: {'lr': 0.00046652669059900174, 'samples': 5118720, 'steps': 26659, 'loss/train': 1.693825364112854} -08/30/2021 17:57:04 - INFO - __main__ - Step 26661: {'lr': 0.0004665240379259989, 'samples': 5118912, 'steps': 26660, 'loss/train': 2.019569158554077} -08/30/2021 17:57:05 - INFO - __main__ - Step 26662: {'lr': 0.00046652138515543366, 'samples': 5119104, 'steps': 26661, 'loss/train': 1.3235939741134644} -08/30/2021 17:57:05 - INFO - __main__ - Step 26663: {'lr': 0.00046651873228730715, 'samples': 5119296, 'steps': 26662, 'loss/train': 0.3999435007572174} -08/30/2021 17:57:05 - INFO - __main__ - Step 26664: {'lr': 0.0004665160793216207, 'samples': 5119488, 'steps': 26663, 'loss/train': 1.3439934253692627} -08/30/2021 17:57:07 - INFO - __main__ - Step 26665: {'lr': 0.00046651342625837544, 'samples': 5119680, 'steps': 26664, 'loss/train': 1.6201248168945312} -08/30/2021 17:57:07 - INFO - __main__ - Step 26666: {'lr': 0.00046651077309757256, 'samples': 5119872, 'steps': 26665, 'loss/train': 1.9719942808151245} -08/30/2021 17:57:08 - INFO - __main__ - Step 26667: {'lr': 0.0004665081198392133, 'samples': 5120064, 'steps': 26666, 'loss/train': 1.5221664905548096} -08/30/2021 17:57:08 - INFO - __main__ - Step 26668: {'lr': 0.0004665054664832988, 'samples': 5120256, 'steps': 26667, 'loss/train': 1.5162558555603027} -08/30/2021 17:57:08 - INFO - __main__ - Step 26669: {'lr': 0.00046650281302983024, 'samples': 5120448, 'steps': 26668, 'loss/train': 1.4170496463775635} -08/30/2021 17:57:10 - INFO - __main__ - Step 26670: {'lr': 0.00046650015947880886, 'samples': 5120640, 'steps': 26669, 'loss/train': 1.8704843521118164} -08/30/2021 17:57:10 - INFO - __main__ - Step 26671: {'lr': 0.00046649750583023595, 'samples': 5120832, 'steps': 26670, 'loss/train': 1.5668845176696777} -08/30/2021 17:57:11 - INFO - __main__ - Step 26672: {'lr': 0.00046649485208411244, 'samples': 5121024, 'steps': 26671, 'loss/train': 1.3336966037750244} -08/30/2021 17:57:11 - INFO - __main__ - Step 26673: {'lr': 0.00046649219824043984, 'samples': 5121216, 'steps': 26672, 'loss/train': 1.2383750677108765} -08/30/2021 17:57:11 - INFO - __main__ - Step 26674: {'lr': 0.00046648954429921914, 'samples': 5121408, 'steps': 26673, 'loss/train': 1.6487102508544922} -08/30/2021 17:57:13 - INFO - __main__ - Step 26675: {'lr': 0.00046648689026045157, 'samples': 5121600, 'steps': 26674, 'loss/train': 1.3962541818618774} -08/30/2021 17:57:13 - INFO - __main__ - Step 26676: {'lr': 0.0004664842361241384, 'samples': 5121792, 'steps': 26675, 'loss/train': 1.617918848991394} -08/30/2021 17:57:14 - INFO - __main__ - Step 26677: {'lr': 0.00046648158189028073, 'samples': 5121984, 'steps': 26676, 'loss/train': 1.6024278402328491} -08/30/2021 17:57:14 - INFO - __main__ - Step 26678: {'lr': 0.0004664789275588798, 'samples': 5122176, 'steps': 26677, 'loss/train': 1.7752492427825928} -08/30/2021 17:57:14 - INFO - __main__ - Step 26679: {'lr': 0.0004664762731299368, 'samples': 5122368, 'steps': 26678, 'loss/train': 0.10728741437196732} -08/30/2021 17:57:16 - INFO - __main__ - Step 26680: {'lr': 0.00046647361860345293, 'samples': 5122560, 'steps': 26679, 'loss/train': 1.3969312906265259} -08/30/2021 17:57:16 - INFO - __main__ - Step 26681: {'lr': 0.00046647096397942945, 'samples': 5122752, 'steps': 26680, 'loss/train': 1.6737064123153687} -08/30/2021 17:57:17 - INFO - __main__ - Step 26682: {'lr': 0.0004664683092578674, 'samples': 5122944, 'steps': 26681, 'loss/train': 1.1327248811721802} -08/30/2021 17:57:17 - INFO - __main__ - Step 26683: {'lr': 0.00046646565443876815, 'samples': 5123136, 'steps': 26682, 'loss/train': 1.356799602508545} -08/30/2021 17:57:17 - INFO - __main__ - Step 26684: {'lr': 0.00046646299952213277, 'samples': 5123328, 'steps': 26683, 'loss/train': 0.6211066842079163} -08/30/2021 17:57:19 - INFO - __main__ - Step 26685: {'lr': 0.00046646034450796255, 'samples': 5123520, 'steps': 26684, 'loss/train': 2.2446956634521484} -08/30/2021 17:57:19 - INFO - __main__ - Step 26686: {'lr': 0.0004664576893962586, 'samples': 5123712, 'steps': 26685, 'loss/train': 1.8335237503051758} -08/30/2021 17:57:20 - INFO - __main__ - Step 26687: {'lr': 0.0004664550341870222, 'samples': 5123904, 'steps': 26686, 'loss/train': 1.1680623292922974} -08/30/2021 17:57:20 - INFO - __main__ - Step 26688: {'lr': 0.00046645237888025444, 'samples': 5124096, 'steps': 26687, 'loss/train': 2.169955253601074} -08/30/2021 17:57:20 - INFO - __main__ - Step 26689: {'lr': 0.0004664497234759566, 'samples': 5124288, 'steps': 26688, 'loss/train': 0.5427646040916443} -08/30/2021 17:57:21 - INFO - __main__ - Step 26690: {'lr': 0.00046644706797412984, 'samples': 5124480, 'steps': 26689, 'loss/train': 1.4893057346343994} -08/30/2021 17:57:22 - INFO - __main__ - Step 26691: {'lr': 0.00046644441237477544, 'samples': 5124672, 'steps': 26690, 'loss/train': 1.658414602279663} -08/30/2021 17:57:23 - INFO - __main__ - Step 26692: {'lr': 0.00046644175667789444, 'samples': 5124864, 'steps': 26691, 'loss/train': 1.52473783493042} -08/30/2021 17:57:23 - INFO - __main__ - Step 26693: {'lr': 0.00046643910088348817, 'samples': 5125056, 'steps': 26692, 'loss/train': 0.9235119819641113} -08/30/2021 17:57:23 - INFO - __main__ - Step 26694: {'lr': 0.0004664364449915578, 'samples': 5125248, 'steps': 26693, 'loss/train': 1.717477560043335} -08/30/2021 17:57:24 - INFO - __main__ - Step 26695: {'lr': 0.0004664337890021044, 'samples': 5125440, 'steps': 26694, 'loss/train': 1.2940359115600586} -08/30/2021 17:57:25 - INFO - __main__ - Step 26696: {'lr': 0.0004664311329151294, 'samples': 5125632, 'steps': 26695, 'loss/train': 1.9891644716262817} -08/30/2021 17:57:26 - INFO - __main__ - Step 26697: {'lr': 0.0004664284767306338, 'samples': 5125824, 'steps': 26696, 'loss/train': 1.8456469774246216} -08/30/2021 17:57:26 - INFO - __main__ - Step 26698: {'lr': 0.0004664258204486189, 'samples': 5126016, 'steps': 26697, 'loss/train': 1.663969874382019} -08/30/2021 17:57:27 - INFO - __main__ - Step 26699: {'lr': 0.0004664231640690859, 'samples': 5126208, 'steps': 26698, 'loss/train': 1.5915356874465942} -08/30/2021 17:57:27 - INFO - __main__ - Step 26700: {'lr': 0.0004664205075920359, 'samples': 5126400, 'steps': 26699, 'loss/train': 1.0144003629684448} -08/30/2021 17:57:29 - INFO - __main__ - Step 26701: {'lr': 0.0004664178510174702, 'samples': 5126592, 'steps': 26700, 'loss/train': 1.863483190536499} -08/30/2021 17:57:30 - INFO - __main__ - Step 26702: {'lr': 0.0004664151943453899, 'samples': 5126784, 'steps': 26701, 'loss/train': 1.5355284214019775} -08/30/2021 17:57:30 - INFO - __main__ - Step 26703: {'lr': 0.0004664125375757963, 'samples': 5126976, 'steps': 26702, 'loss/train': 1.4345295429229736} -08/30/2021 17:57:30 - INFO - __main__ - Step 26704: {'lr': 0.00046640988070869053, 'samples': 5127168, 'steps': 26703, 'loss/train': 1.6513216495513916} -08/30/2021 17:57:31 - INFO - __main__ - Step 26705: {'lr': 0.00046640722374407384, 'samples': 5127360, 'steps': 26704, 'loss/train': 1.3768072128295898} -08/30/2021 17:57:31 - INFO - __main__ - Step 26706: {'lr': 0.00046640456668194737, 'samples': 5127552, 'steps': 26705, 'loss/train': 1.8468369245529175} -08/30/2021 17:57:32 - INFO - __main__ - Step 26707: {'lr': 0.0004664019095223123, 'samples': 5127744, 'steps': 26706, 'loss/train': 2.6544859409332275} -08/30/2021 17:57:33 - INFO - __main__ - Step 26708: {'lr': 0.00046639925226517, 'samples': 5127936, 'steps': 26707, 'loss/train': 1.6677361726760864} -08/30/2021 17:57:33 - INFO - __main__ - Step 26709: {'lr': 0.0004663965949105214, 'samples': 5128128, 'steps': 26708, 'loss/train': 1.158858060836792} -08/30/2021 17:57:34 - INFO - __main__ - Step 26710: {'lr': 0.0004663939374583679, 'samples': 5128320, 'steps': 26709, 'loss/train': 1.6500035524368286} -08/30/2021 17:57:34 - INFO - __main__ - Step 26711: {'lr': 0.00046639127990871055, 'samples': 5128512, 'steps': 26710, 'loss/train': 1.7814421653747559} -08/30/2021 17:57:36 - INFO - __main__ - Step 26712: {'lr': 0.00046638862226155075, 'samples': 5128704, 'steps': 26711, 'loss/train': 1.1269235610961914} -08/30/2021 17:57:36 - INFO - __main__ - Step 26713: {'lr': 0.0004663859645168895, 'samples': 5128896, 'steps': 26712, 'loss/train': 1.0910543203353882} -08/30/2021 17:57:36 - INFO - __main__ - Step 26714: {'lr': 0.00046638330667472805, 'samples': 5129088, 'steps': 26713, 'loss/train': 1.7232025861740112} -08/30/2021 17:57:37 - INFO - __main__ - Step 26715: {'lr': 0.0004663806487350677, 'samples': 5129280, 'steps': 26714, 'loss/train': 1.5871376991271973} -08/30/2021 17:57:37 - INFO - __main__ - Step 26716: {'lr': 0.00046637799069790953, 'samples': 5129472, 'steps': 26715, 'loss/train': 0.08858071267604828} -08/30/2021 17:57:39 - INFO - __main__ - Step 26717: {'lr': 0.00046637533256325476, 'samples': 5129664, 'steps': 26716, 'loss/train': 1.5392704010009766} -08/30/2021 17:57:39 - INFO - __main__ - Step 26718: {'lr': 0.0004663726743311046, 'samples': 5129856, 'steps': 26717, 'loss/train': 1.4603545665740967} -08/30/2021 17:57:40 - INFO - __main__ - Step 26719: {'lr': 0.00046637001600146027, 'samples': 5130048, 'steps': 26718, 'loss/train': 0.09331375360488892} -08/30/2021 17:57:40 - INFO - __main__ - Step 26720: {'lr': 0.000466367357574323, 'samples': 5130240, 'steps': 26719, 'loss/train': 1.9333102703094482} -08/30/2021 17:57:41 - INFO - __main__ - Step 26721: {'lr': 0.00046636469904969387, 'samples': 5130432, 'steps': 26720, 'loss/train': 1.365154504776001} -08/30/2021 17:57:41 - INFO - __main__ - Step 26722: {'lr': 0.0004663620404275741, 'samples': 5130624, 'steps': 26721, 'loss/train': 1.0078293085098267} -08/30/2021 17:57:42 - INFO - __main__ - Step 26723: {'lr': 0.00046635938170796505, 'samples': 5130816, 'steps': 26722, 'loss/train': 1.0311357975006104} -08/30/2021 17:57:43 - INFO - __main__ - Step 26724: {'lr': 0.00046635672289086774, 'samples': 5131008, 'steps': 26723, 'loss/train': 1.319662094116211} -08/30/2021 17:57:43 - INFO - __main__ - Step 26725: {'lr': 0.00046635406397628346, 'samples': 5131200, 'steps': 26724, 'loss/train': 1.5365781784057617} -08/30/2021 17:57:44 - INFO - __main__ - Step 26726: {'lr': 0.00046635140496421336, 'samples': 5131392, 'steps': 26725, 'loss/train': 1.5976406335830688} -08/30/2021 17:57:44 - INFO - __main__ - Step 26727: {'lr': 0.0004663487458546586, 'samples': 5131584, 'steps': 26726, 'loss/train': 1.6156132221221924} -08/30/2021 17:57:45 - INFO - __main__ - Step 26728: {'lr': 0.0004663460866476205, 'samples': 5131776, 'steps': 26727, 'loss/train': 1.5820831060409546} -08/30/2021 17:57:46 - INFO - __main__ - Step 26729: {'lr': 0.00046634342734310023, 'samples': 5131968, 'steps': 26728, 'loss/train': 1.461832880973816} -08/30/2021 17:57:46 - INFO - __main__ - Step 26730: {'lr': 0.0004663407679410988, 'samples': 5132160, 'steps': 26729, 'loss/train': 0.21380048990249634} -08/30/2021 17:57:47 - INFO - __main__ - Step 26731: {'lr': 0.0004663381084416177, 'samples': 5132352, 'steps': 26730, 'loss/train': 1.8571300506591797} -08/30/2021 17:57:47 - INFO - __main__ - Step 26732: {'lr': 0.00046633544884465796, 'samples': 5132544, 'steps': 26731, 'loss/train': 1.300208330154419} -08/30/2021 17:57:48 - INFO - __main__ - Step 26733: {'lr': 0.0004663327891502208, 'samples': 5132736, 'steps': 26732, 'loss/train': 0.3474135100841522} -08/30/2021 17:57:49 - INFO - __main__ - Step 26734: {'lr': 0.0004663301293583073, 'samples': 5132928, 'steps': 26733, 'loss/train': 1.2446075677871704} -08/30/2021 17:57:49 - INFO - __main__ - Step 26735: {'lr': 0.000466327469468919, 'samples': 5133120, 'steps': 26734, 'loss/train': 1.6891194581985474} -08/30/2021 17:57:50 - INFO - __main__ - Step 26736: {'lr': 0.0004663248094820567, 'samples': 5133312, 'steps': 26735, 'loss/train': 1.2903902530670166} -08/30/2021 17:57:50 - INFO - __main__ - Step 26737: {'lr': 0.00046632214939772187, 'samples': 5133504, 'steps': 26736, 'loss/train': 1.6359522342681885} -08/30/2021 17:57:52 - INFO - __main__ - Step 26738: {'lr': 0.0004663194892159156, 'samples': 5133696, 'steps': 26737, 'loss/train': 1.2313135862350464} -08/30/2021 17:57:52 - INFO - __main__ - Step 26739: {'lr': 0.0004663168289366391, 'samples': 5133888, 'steps': 26738, 'loss/train': 1.1805410385131836} -08/30/2021 17:57:52 - INFO - __main__ - Step 26740: {'lr': 0.0004663141685598936, 'samples': 5134080, 'steps': 26739, 'loss/train': 4.346454620361328} -08/30/2021 17:57:53 - INFO - __main__ - Step 26741: {'lr': 0.00046631150808568026, 'samples': 5134272, 'steps': 26740, 'loss/train': 1.359296441078186} -08/30/2021 17:57:53 - INFO - __main__ - Step 26742: {'lr': 0.00046630884751400024, 'samples': 5134464, 'steps': 26741, 'loss/train': 1.4907121658325195} -08/30/2021 17:57:53 - INFO - __main__ - Step 26743: {'lr': 0.0004663061868448548, 'samples': 5134656, 'steps': 26742, 'loss/train': 1.8572890758514404} -08/30/2021 17:57:55 - INFO - __main__ - Step 26744: {'lr': 0.0004663035260782452, 'samples': 5134848, 'steps': 26743, 'loss/train': 1.7632564306259155} -08/30/2021 17:57:55 - INFO - __main__ - Step 26745: {'lr': 0.0004663008652141726, 'samples': 5135040, 'steps': 26744, 'loss/train': 1.5466748476028442} -08/30/2021 17:57:56 - INFO - __main__ - Step 26746: {'lr': 0.00046629820425263805, 'samples': 5135232, 'steps': 26745, 'loss/train': 1.1536327600479126} -08/30/2021 17:57:56 - INFO - __main__ - Step 26747: {'lr': 0.00046629554319364293, 'samples': 5135424, 'steps': 26746, 'loss/train': 1.0963774919509888} -08/30/2021 17:57:56 - INFO - __main__ - Step 26748: {'lr': 0.00046629288203718834, 'samples': 5135616, 'steps': 26747, 'loss/train': 1.7901570796966553} -08/30/2021 17:57:58 - INFO - __main__ - Step 26749: {'lr': 0.00046629022078327557, 'samples': 5135808, 'steps': 26748, 'loss/train': 1.4945642948150635} -08/30/2021 17:57:58 - INFO - __main__ - Step 26750: {'lr': 0.0004662875594319057, 'samples': 5136000, 'steps': 26749, 'loss/train': 1.3612560033798218} -08/30/2021 17:57:59 - INFO - __main__ - Step 26751: {'lr': 0.00046628489798308006, 'samples': 5136192, 'steps': 26750, 'loss/train': 1.6134798526763916} -08/30/2021 17:57:59 - INFO - __main__ - Step 26752: {'lr': 0.0004662822364367997, 'samples': 5136384, 'steps': 26751, 'loss/train': 1.331142783164978} -08/30/2021 17:57:59 - INFO - __main__ - Step 26753: {'lr': 0.000466279574793066, 'samples': 5136576, 'steps': 26752, 'loss/train': 1.8044636249542236} -08/30/2021 17:58:01 - INFO - __main__ - Step 26754: {'lr': 0.00046627691305188004, 'samples': 5136768, 'steps': 26753, 'loss/train': 0.5285789966583252} -08/30/2021 17:58:02 - INFO - __main__ - Step 26755: {'lr': 0.00046627425121324294, 'samples': 5136960, 'steps': 26754, 'loss/train': 2.230715751647949} -08/30/2021 17:58:02 - INFO - __main__ - Step 26756: {'lr': 0.0004662715892771561, 'samples': 5137152, 'steps': 26755, 'loss/train': 1.5442594289779663} -08/30/2021 17:58:03 - INFO - __main__ - Step 26757: {'lr': 0.0004662689272436206, 'samples': 5137344, 'steps': 26756, 'loss/train': 1.7846076488494873} -08/30/2021 17:58:03 - INFO - __main__ - Step 26758: {'lr': 0.00046626626511263764, 'samples': 5137536, 'steps': 26757, 'loss/train': 0.08230098336935043} -08/30/2021 17:58:03 - INFO - __main__ - Step 26759: {'lr': 0.00046626360288420845, 'samples': 5137728, 'steps': 26758, 'loss/train': 1.536605715751648} -08/30/2021 17:58:05 - INFO - __main__ - Step 26760: {'lr': 0.00046626094055833426, 'samples': 5137920, 'steps': 26759, 'loss/train': 1.6113698482513428} -08/30/2021 17:58:06 - INFO - __main__ - Step 26761: {'lr': 0.0004662582781350161, 'samples': 5138112, 'steps': 26760, 'loss/train': 1.4732036590576172} -08/30/2021 17:58:06 - INFO - __main__ - Step 26762: {'lr': 0.00046625561561425543, 'samples': 5138304, 'steps': 26761, 'loss/train': 1.2604283094406128} -08/30/2021 17:58:06 - INFO - __main__ - Step 26763: {'lr': 0.00046625295299605323, 'samples': 5138496, 'steps': 26762, 'loss/train': 1.4922982454299927} -08/30/2021 17:58:07 - INFO - __main__ - Step 26764: {'lr': 0.0004662502902804109, 'samples': 5138688, 'steps': 26763, 'loss/train': 1.4694780111312866} -08/30/2021 17:58:07 - INFO - __main__ - Step 26765: {'lr': 0.0004662476274673294, 'samples': 5138880, 'steps': 26764, 'loss/train': 1.683996319770813} -08/30/2021 17:58:09 - INFO - __main__ - Step 26766: {'lr': 0.00046624496455681006, 'samples': 5139072, 'steps': 26765, 'loss/train': 1.5728793144226074} -08/30/2021 17:58:09 - INFO - __main__ - Step 26767: {'lr': 0.00046624230154885415, 'samples': 5139264, 'steps': 26766, 'loss/train': 1.5897480249404907} -08/30/2021 17:58:10 - INFO - __main__ - Step 26768: {'lr': 0.0004662396384434627, 'samples': 5139456, 'steps': 26767, 'loss/train': 1.5656379461288452} -08/30/2021 17:58:10 - INFO - __main__ - Step 26769: {'lr': 0.00046623697524063713, 'samples': 5139648, 'steps': 26768, 'loss/train': 1.7227659225463867} -08/30/2021 17:58:10 - INFO - __main__ - Step 26770: {'lr': 0.00046623431194037847, 'samples': 5139840, 'steps': 26769, 'loss/train': 1.4630969762802124} -08/30/2021 17:58:12 - INFO - __main__ - Step 26771: {'lr': 0.000466231648542688, 'samples': 5140032, 'steps': 26770, 'loss/train': 1.9150218963623047} -08/30/2021 17:58:12 - INFO - __main__ - Step 26772: {'lr': 0.0004662289850475668, 'samples': 5140224, 'steps': 26771, 'loss/train': 1.0994112491607666} -08/30/2021 17:58:13 - INFO - __main__ - Step 26773: {'lr': 0.0004662263214550162, 'samples': 5140416, 'steps': 26772, 'loss/train': 1.8346391916275024} -08/30/2021 17:58:13 - INFO - __main__ - Step 26774: {'lr': 0.00046622365776503735, 'samples': 5140608, 'steps': 26773, 'loss/train': 1.2081940174102783} -08/30/2021 17:58:14 - INFO - __main__ - Step 26775: {'lr': 0.0004662209939776315, 'samples': 5140800, 'steps': 26774, 'loss/train': 1.7097142934799194} -08/30/2021 17:58:15 - INFO - __main__ - Step 26776: {'lr': 0.0004662183300927997, 'samples': 5140992, 'steps': 26775, 'loss/train': 1.4779356718063354} -08/30/2021 17:58:16 - INFO - __main__ - Step 26777: {'lr': 0.0004662156661105433, 'samples': 5141184, 'steps': 26776, 'loss/train': 1.3889614343643188} -08/30/2021 17:58:16 - INFO - __main__ - Step 26778: {'lr': 0.0004662130020308635, 'samples': 5141376, 'steps': 26777, 'loss/train': 1.6845752000808716} -08/30/2021 17:58:16 - INFO - __main__ - Step 26779: {'lr': 0.00046621033785376146, 'samples': 5141568, 'steps': 26778, 'loss/train': 1.0824769735336304} -08/30/2021 17:58:17 - INFO - __main__ - Step 26780: {'lr': 0.00046620767357923834, 'samples': 5141760, 'steps': 26779, 'loss/train': 1.6082614660263062} -08/30/2021 17:58:18 - INFO - __main__ - Step 26781: {'lr': 0.0004662050092072954, 'samples': 5141952, 'steps': 26780, 'loss/train': 1.775464653968811} -08/30/2021 17:58:19 - INFO - __main__ - Step 26782: {'lr': 0.0004662023447379338, 'samples': 5142144, 'steps': 26781, 'loss/train': 1.8717602491378784} -08/30/2021 17:58:19 - INFO - __main__ - Step 26783: {'lr': 0.0004661996801711548, 'samples': 5142336, 'steps': 26782, 'loss/train': 1.1960712671279907} -08/30/2021 17:58:19 - INFO - __main__ - Step 26784: {'lr': 0.0004661970155069595, 'samples': 5142528, 'steps': 26783, 'loss/train': 1.3057440519332886} -08/30/2021 17:58:20 - INFO - __main__ - Step 26785: {'lr': 0.00046619435074534923, 'samples': 5142720, 'steps': 26784, 'loss/train': 1.7113823890686035} -08/30/2021 17:58:22 - INFO - __main__ - Step 26786: {'lr': 0.0004661916858863251, 'samples': 5142912, 'steps': 26785, 'loss/train': 1.7824463844299316} -08/30/2021 17:58:22 - INFO - __main__ - Step 26787: {'lr': 0.00046618902092988824, 'samples': 5143104, 'steps': 26786, 'loss/train': 1.6778502464294434} -08/30/2021 17:58:22 - INFO - __main__ - Step 26788: {'lr': 0.00046618635587604006, 'samples': 5143296, 'steps': 26787, 'loss/train': 0.2964571714401245} -08/30/2021 17:58:23 - INFO - __main__ - Step 26789: {'lr': 0.00046618369072478163, 'samples': 5143488, 'steps': 26788, 'loss/train': 1.3270459175109863} -08/30/2021 17:58:23 - INFO - __main__ - Step 26790: {'lr': 0.0004661810254761141, 'samples': 5143680, 'steps': 26789, 'loss/train': 0.05226729065179825} -08/30/2021 17:58:23 - INFO - __main__ - Step 26791: {'lr': 0.0004661783601300388, 'samples': 5143872, 'steps': 26790, 'loss/train': 1.418766975402832} -08/30/2021 17:58:25 - INFO - __main__ - Step 26792: {'lr': 0.00046617569468655686, 'samples': 5144064, 'steps': 26791, 'loss/train': 1.2048664093017578} -08/30/2021 17:58:25 - INFO - __main__ - Step 26793: {'lr': 0.00046617302914566945, 'samples': 5144256, 'steps': 26792, 'loss/train': 0.2802641987800598} -08/30/2021 17:58:26 - INFO - __main__ - Step 26794: {'lr': 0.00046617036350737786, 'samples': 5144448, 'steps': 26793, 'loss/train': 2.003206729888916} -08/30/2021 17:58:26 - INFO - __main__ - Step 26795: {'lr': 0.0004661676977716832, 'samples': 5144640, 'steps': 26794, 'loss/train': 1.377181887626648} -08/30/2021 17:58:26 - INFO - __main__ - Step 26796: {'lr': 0.0004661650319385867, 'samples': 5144832, 'steps': 26795, 'loss/train': 1.4903490543365479} -08/30/2021 17:58:28 - INFO - __main__ - Step 26797: {'lr': 0.0004661623660080896, 'samples': 5145024, 'steps': 26796, 'loss/train': 1.5612714290618896} -08/30/2021 17:58:28 - INFO - __main__ - Step 26798: {'lr': 0.000466159699980193, 'samples': 5145216, 'steps': 26797, 'loss/train': 2.395564556121826} -08/30/2021 17:58:29 - INFO - __main__ - Step 26799: {'lr': 0.0004661570338548983, 'samples': 5145408, 'steps': 26798, 'loss/train': 1.3965349197387695} -08/30/2021 17:58:29 - INFO - __main__ - Step 26800: {'lr': 0.00046615436763220645, 'samples': 5145600, 'steps': 26799, 'loss/train': 1.2196152210235596} -08/30/2021 17:58:29 - INFO - __main__ - Step 26801: {'lr': 0.0004661517013121189, 'samples': 5145792, 'steps': 26800, 'loss/train': 1.6071802377700806} -08/30/2021 17:58:31 - INFO - __main__ - Step 26802: {'lr': 0.00046614903489463667, 'samples': 5145984, 'steps': 26801, 'loss/train': 1.6098366975784302} -08/30/2021 17:58:31 - INFO - __main__ - Step 26803: {'lr': 0.000466146368379761, 'samples': 5146176, 'steps': 26802, 'loss/train': 1.8973139524459839} -08/30/2021 17:58:32 - INFO - __main__ - Step 26804: {'lr': 0.0004661437017674931, 'samples': 5146368, 'steps': 26803, 'loss/train': 1.0908960103988647} -08/30/2021 17:58:32 - INFO - __main__ - Step 26805: {'lr': 0.00046614103505783423, 'samples': 5146560, 'steps': 26804, 'loss/train': 1.4314018487930298} -08/30/2021 17:58:32 - INFO - __main__ - Step 26806: {'lr': 0.0004661383682507856, 'samples': 5146752, 'steps': 26805, 'loss/train': 1.9222533702850342} -08/30/2021 17:58:34 - INFO - __main__ - Step 26807: {'lr': 0.00046613570134634825, 'samples': 5146944, 'steps': 26806, 'loss/train': 1.7310898303985596} -08/30/2021 17:58:34 - INFO - __main__ - Step 26808: {'lr': 0.00046613303434452346, 'samples': 5147136, 'steps': 26807, 'loss/train': 1.17205810546875} -08/30/2021 17:58:35 - INFO - __main__ - Step 26809: {'lr': 0.00046613036724531254, 'samples': 5147328, 'steps': 26808, 'loss/train': 0.9658483862876892} -08/30/2021 17:58:35 - INFO - __main__ - Step 26810: {'lr': 0.00046612770004871663, 'samples': 5147520, 'steps': 26809, 'loss/train': 1.5939700603485107} -08/30/2021 17:58:35 - INFO - __main__ - Step 26811: {'lr': 0.00046612503275473687, 'samples': 5147712, 'steps': 26810, 'loss/train': 1.7550020217895508} -08/30/2021 17:58:37 - INFO - __main__ - Step 26812: {'lr': 0.00046612236536337456, 'samples': 5147904, 'steps': 26811, 'loss/train': 1.9856510162353516} -08/30/2021 17:58:38 - INFO - __main__ - Step 26813: {'lr': 0.00046611969787463083, 'samples': 5148096, 'steps': 26812, 'loss/train': 4.578228950500488} -08/30/2021 17:58:38 - INFO - __main__ - Step 26814: {'lr': 0.00046611703028850683, 'samples': 5148288, 'steps': 26813, 'loss/train': 1.394594430923462} -08/30/2021 17:58:38 - INFO - __main__ - Step 26815: {'lr': 0.00046611436260500386, 'samples': 5148480, 'steps': 26814, 'loss/train': 1.1023682355880737} -08/30/2021 17:58:39 - INFO - __main__ - Step 26816: {'lr': 0.00046611169482412305, 'samples': 5148672, 'steps': 26815, 'loss/train': 1.971582055091858} -08/30/2021 17:58:39 - INFO - __main__ - Step 26817: {'lr': 0.00046610902694586576, 'samples': 5148864, 'steps': 26816, 'loss/train': 0.7202461957931519} -08/30/2021 17:58:41 - INFO - __main__ - Step 26818: {'lr': 0.00046610635897023303, 'samples': 5149056, 'steps': 26817, 'loss/train': 1.480725646018982} -08/30/2021 17:58:41 - INFO - __main__ - Step 26819: {'lr': 0.0004661036908972261, 'samples': 5149248, 'steps': 26818, 'loss/train': 2.1650359630584717} -08/30/2021 17:58:41 - INFO - __main__ - Step 26820: {'lr': 0.0004661010227268462, 'samples': 5149440, 'steps': 26819, 'loss/train': 1.171453595161438} -08/30/2021 17:58:42 - INFO - __main__ - Step 26821: {'lr': 0.0004660983544590944, 'samples': 5149632, 'steps': 26820, 'loss/train': 1.4449701309204102} -08/30/2021 17:58:42 - INFO - __main__ - Step 26822: {'lr': 0.0004660956860939722, 'samples': 5149824, 'steps': 26821, 'loss/train': 1.9287570714950562} -08/30/2021 17:58:44 - INFO - __main__ - Step 26823: {'lr': 0.0004660930176314805, 'samples': 5150016, 'steps': 26822, 'loss/train': 1.3852072954177856} -08/30/2021 17:58:44 - INFO - __main__ - Step 26824: {'lr': 0.0004660903490716206, 'samples': 5150208, 'steps': 26823, 'loss/train': 1.145975112915039} -08/30/2021 17:58:44 - INFO - __main__ - Step 26825: {'lr': 0.0004660876804143938, 'samples': 5150400, 'steps': 26824, 'loss/train': 1.3981616497039795} -08/30/2021 17:58:45 - INFO - __main__ - Step 26826: {'lr': 0.0004660850116598012, 'samples': 5150592, 'steps': 26825, 'loss/train': 1.5617139339447021} -08/30/2021 17:58:45 - INFO - __main__ - Step 26827: {'lr': 0.00046608234280784406, 'samples': 5150784, 'steps': 26826, 'loss/train': 1.561122179031372} -08/30/2021 17:58:47 - INFO - __main__ - Step 26828: {'lr': 0.0004660796738585235, 'samples': 5150976, 'steps': 26827, 'loss/train': 1.611430287361145} -08/30/2021 17:58:47 - INFO - __main__ - Step 26829: {'lr': 0.0004660770048118408, 'samples': 5151168, 'steps': 26828, 'loss/train': 1.7318994998931885} -08/30/2021 17:58:47 - INFO - __main__ - Step 26830: {'lr': 0.00046607433566779713, 'samples': 5151360, 'steps': 26829, 'loss/train': 1.8213824033737183} -08/30/2021 17:58:48 - INFO - __main__ - Step 26831: {'lr': 0.00046607166642639365, 'samples': 5151552, 'steps': 26830, 'loss/train': 1.9512497186660767} -08/30/2021 17:58:48 - INFO - __main__ - Step 26832: {'lr': 0.00046606899708763174, 'samples': 5151744, 'steps': 26831, 'loss/train': 1.0352290868759155} -08/30/2021 17:58:50 - INFO - __main__ - Step 26833: {'lr': 0.0004660663276515124, 'samples': 5151936, 'steps': 26832, 'loss/train': 1.424996256828308} -08/30/2021 17:58:50 - INFO - __main__ - Step 26834: {'lr': 0.00046606365811803686, 'samples': 5152128, 'steps': 26833, 'loss/train': 1.511102557182312} -08/30/2021 17:58:50 - INFO - __main__ - Step 26835: {'lr': 0.0004660609884872064, 'samples': 5152320, 'steps': 26834, 'loss/train': 1.5556164979934692} -08/30/2021 17:58:51 - INFO - __main__ - Step 26836: {'lr': 0.00046605831875902215, 'samples': 5152512, 'steps': 26835, 'loss/train': 1.4919860363006592} -08/30/2021 17:58:51 - INFO - __main__ - Step 26837: {'lr': 0.00046605564893348545, 'samples': 5152704, 'steps': 26836, 'loss/train': 1.5208078622817993} -08/30/2021 17:58:52 - INFO - __main__ - Step 26838: {'lr': 0.0004660529790105974, 'samples': 5152896, 'steps': 26837, 'loss/train': 1.2910549640655518} -08/30/2021 17:58:53 - INFO - __main__ - Step 26839: {'lr': 0.00046605030899035915, 'samples': 5153088, 'steps': 26838, 'loss/train': 1.374462366104126} -08/30/2021 17:58:53 - INFO - __main__ - Step 26840: {'lr': 0.000466047638872772, 'samples': 5153280, 'steps': 26839, 'loss/train': 2.2235822677612305} -08/30/2021 17:58:54 - INFO - __main__ - Step 26841: {'lr': 0.0004660449686578371, 'samples': 5153472, 'steps': 26840, 'loss/train': 1.8461415767669678} -08/30/2021 17:58:54 - INFO - __main__ - Step 26842: {'lr': 0.0004660422983455557, 'samples': 5153664, 'steps': 26841, 'loss/train': 1.227088451385498} -08/30/2021 17:58:56 - INFO - __main__ - Step 26843: {'lr': 0.0004660396279359289, 'samples': 5153856, 'steps': 26842, 'loss/train': 1.391221284866333} -08/30/2021 17:58:56 - INFO - __main__ - Step 26844: {'lr': 0.000466036957428958, 'samples': 5154048, 'steps': 26843, 'loss/train': 1.4195990562438965} -08/30/2021 17:58:57 - INFO - __main__ - Step 26845: {'lr': 0.0004660342868246442, 'samples': 5154240, 'steps': 26844, 'loss/train': 1.849786400794983} -08/30/2021 17:58:57 - INFO - __main__ - Step 26846: {'lr': 0.0004660316161229887, 'samples': 5154432, 'steps': 26845, 'loss/train': 0.9779144525527954} -08/30/2021 17:58:57 - INFO - __main__ - Step 26847: {'lr': 0.00046602894532399275, 'samples': 5154624, 'steps': 26846, 'loss/train': 1.4024840593338013} -08/30/2021 17:58:59 - INFO - __main__ - Step 26848: {'lr': 0.00046602627442765744, 'samples': 5154816, 'steps': 26847, 'loss/train': 1.672475814819336} -08/30/2021 17:58:59 - INFO - __main__ - Step 26849: {'lr': 0.00046602360343398397, 'samples': 5155008, 'steps': 26848, 'loss/train': 2.846569061279297} -08/30/2021 17:58:59 - INFO - __main__ - Step 26850: {'lr': 0.0004660209323429736, 'samples': 5155200, 'steps': 26849, 'loss/train': 1.5409947633743286} -08/30/2021 17:59:00 - INFO - __main__ - Step 26851: {'lr': 0.0004660182611546276, 'samples': 5155392, 'steps': 26850, 'loss/train': 1.9352277517318726} -08/30/2021 17:59:00 - INFO - __main__ - Step 26852: {'lr': 0.0004660155898689471, 'samples': 5155584, 'steps': 26851, 'loss/train': 1.462173581123352} -08/30/2021 17:59:01 - INFO - __main__ - Step 26853: {'lr': 0.0004660129184859332, 'samples': 5155776, 'steps': 26852, 'loss/train': 1.3452694416046143} -08/30/2021 17:59:02 - INFO - __main__ - Step 26854: {'lr': 0.00046601024700558736, 'samples': 5155968, 'steps': 26853, 'loss/train': 1.82614004611969} -08/30/2021 17:59:02 - INFO - __main__ - Step 26855: {'lr': 0.0004660075754279105, 'samples': 5156160, 'steps': 26854, 'loss/train': 0.9493875503540039} -08/30/2021 17:59:03 - INFO - __main__ - Step 26856: {'lr': 0.00046600490375290406, 'samples': 5156352, 'steps': 26855, 'loss/train': 1.6828885078430176} -08/30/2021 17:59:03 - INFO - __main__ - Step 26857: {'lr': 0.0004660022319805691, 'samples': 5156544, 'steps': 26856, 'loss/train': 1.6080266237258911} -08/30/2021 17:59:03 - INFO - __main__ - Step 26858: {'lr': 0.0004659995601109069, 'samples': 5156736, 'steps': 26857, 'loss/train': 1.231449007987976} -08/30/2021 17:59:05 - INFO - __main__ - Step 26859: {'lr': 0.0004659968881439186, 'samples': 5156928, 'steps': 26858, 'loss/train': 0.4787122309207916} -08/30/2021 17:59:06 - INFO - __main__ - Step 26860: {'lr': 0.00046599421607960545, 'samples': 5157120, 'steps': 26859, 'loss/train': 1.3173683881759644} -08/30/2021 17:59:06 - INFO - __main__ - Step 26861: {'lr': 0.0004659915439179686, 'samples': 5157312, 'steps': 26860, 'loss/train': 0.1036704033613205} -08/30/2021 17:59:06 - INFO - __main__ - Step 26862: {'lr': 0.0004659888716590094, 'samples': 5157504, 'steps': 26861, 'loss/train': 1.4828739166259766} -08/30/2021 17:59:07 - INFO - __main__ - Step 26863: {'lr': 0.00046598619930272883, 'samples': 5157696, 'steps': 26862, 'loss/train': 1.2362053394317627} -08/30/2021 17:59:08 - INFO - __main__ - Step 26864: {'lr': 0.00046598352684912824, 'samples': 5157888, 'steps': 26863, 'loss/train': 1.6815341711044312} -08/30/2021 17:59:09 - INFO - __main__ - Step 26865: {'lr': 0.0004659808542982088, 'samples': 5158080, 'steps': 26864, 'loss/train': 1.1082732677459717} -08/30/2021 17:59:09 - INFO - __main__ - Step 26866: {'lr': 0.0004659781816499718, 'samples': 5158272, 'steps': 26865, 'loss/train': 1.7296682596206665} -08/30/2021 17:59:09 - INFO - __main__ - Step 26867: {'lr': 0.0004659755089044183, 'samples': 5158464, 'steps': 26866, 'loss/train': 1.1451698541641235} -08/30/2021 17:59:10 - INFO - __main__ - Step 26868: {'lr': 0.00046597283606154957, 'samples': 5158656, 'steps': 26867, 'loss/train': 1.3216966390609741} -08/30/2021 17:59:12 - INFO - __main__ - Step 26869: {'lr': 0.0004659701631213668, 'samples': 5158848, 'steps': 26868, 'loss/train': 0.9072578549385071} -08/30/2021 17:59:12 - INFO - __main__ - Step 26870: {'lr': 0.00046596749008387124, 'samples': 5159040, 'steps': 26869, 'loss/train': 1.7794842720031738} -08/30/2021 17:59:13 - INFO - __main__ - Step 26871: {'lr': 0.00046596481694906403, 'samples': 5159232, 'steps': 26870, 'loss/train': 1.610386610031128} -08/30/2021 17:59:13 - INFO - __main__ - Step 26872: {'lr': 0.00046596214371694643, 'samples': 5159424, 'steps': 26871, 'loss/train': 1.3272669315338135} -08/30/2021 17:59:13 - INFO - __main__ - Step 26873: {'lr': 0.00046595947038751963, 'samples': 5159616, 'steps': 26872, 'loss/train': 1.3920873403549194} -08/30/2021 17:59:15 - INFO - __main__ - Step 26874: {'lr': 0.00046595679696078476, 'samples': 5159808, 'steps': 26873, 'loss/train': 2.0769612789154053} -08/30/2021 17:59:15 - INFO - __main__ - Step 26875: {'lr': 0.00046595412343674317, 'samples': 5160000, 'steps': 26874, 'loss/train': 1.1637133359909058} -08/30/2021 17:59:15 - INFO - __main__ - Step 26876: {'lr': 0.00046595144981539596, 'samples': 5160192, 'steps': 26875, 'loss/train': 1.4622235298156738} -08/30/2021 17:59:16 - INFO - __main__ - Step 26877: {'lr': 0.00046594877609674437, 'samples': 5160384, 'steps': 26876, 'loss/train': 1.3788200616836548} -08/30/2021 17:59:16 - INFO - __main__ - Step 26878: {'lr': 0.00046594610228078954, 'samples': 5160576, 'steps': 26877, 'loss/train': 1.8409117460250854} -08/30/2021 17:59:18 - INFO - __main__ - Step 26879: {'lr': 0.00046594342836753276, 'samples': 5160768, 'steps': 26878, 'loss/train': 1.4835433959960938} -08/30/2021 17:59:18 - INFO - __main__ - Step 26880: {'lr': 0.0004659407543569752, 'samples': 5160960, 'steps': 26879, 'loss/train': 0.2934632897377014} -08/30/2021 17:59:19 - INFO - __main__ - Step 26881: {'lr': 0.0004659380802491181, 'samples': 5161152, 'steps': 26880, 'loss/train': 0.262529581785202} -08/30/2021 17:59:19 - INFO - __main__ - Step 26882: {'lr': 0.00046593540604396256, 'samples': 5161344, 'steps': 26881, 'loss/train': 1.2058743238449097} -08/30/2021 17:59:19 - INFO - __main__ - Step 26883: {'lr': 0.00046593273174150995, 'samples': 5161536, 'steps': 26882, 'loss/train': 1.7408865690231323} -08/30/2021 17:59:20 - INFO - __main__ - Step 26884: {'lr': 0.0004659300573417613, 'samples': 5161728, 'steps': 26883, 'loss/train': 0.8488700985908508} -08/30/2021 17:59:22 - INFO - __main__ - Step 26885: {'lr': 0.00046592738284471794, 'samples': 5161920, 'steps': 26884, 'loss/train': 1.6995694637298584} -08/30/2021 17:59:22 - INFO - __main__ - Step 26886: {'lr': 0.000465924708250381, 'samples': 5162112, 'steps': 26885, 'loss/train': 1.3161303997039795} -08/30/2021 17:59:22 - INFO - __main__ - Step 26887: {'lr': 0.00046592203355875177, 'samples': 5162304, 'steps': 26886, 'loss/train': 1.1734241247177124} -08/30/2021 17:59:23 - INFO - __main__ - Step 26888: {'lr': 0.00046591935876983136, 'samples': 5162496, 'steps': 26887, 'loss/train': 0.04021792858839035} -08/30/2021 17:59:23 - INFO - __main__ - Step 26889: {'lr': 0.0004659166838836211, 'samples': 5162688, 'steps': 26888, 'loss/train': 1.476667046546936} -08/30/2021 17:59:24 - INFO - __main__ - Step 26890: {'lr': 0.000465914008900122, 'samples': 5162880, 'steps': 26889, 'loss/train': 2.0075557231903076} -08/30/2021 17:59:25 - INFO - __main__ - Step 26891: {'lr': 0.00046591133381933546, 'samples': 5163072, 'steps': 26890, 'loss/train': 1.437656044960022} -08/30/2021 17:59:26 - INFO - __main__ - Step 26892: {'lr': 0.0004659086586412626, 'samples': 5163264, 'steps': 26891, 'loss/train': 0.061180729418992996} -08/30/2021 17:59:26 - INFO - __main__ - Step 26893: {'lr': 0.0004659059833659046, 'samples': 5163456, 'steps': 26892, 'loss/train': 0.9740949869155884} -08/30/2021 17:59:26 - INFO - __main__ - Step 26894: {'lr': 0.0004659033079932627, 'samples': 5163648, 'steps': 26893, 'loss/train': 2.013864278793335} -08/30/2021 17:59:27 - INFO - __main__ - Step 26895: {'lr': 0.00046590063252333806, 'samples': 5163840, 'steps': 26894, 'loss/train': 1.2683641910552979} -08/30/2021 17:59:28 - INFO - __main__ - Step 26896: {'lr': 0.000465897956956132, 'samples': 5164032, 'steps': 26895, 'loss/train': 0.9575828313827515} -08/30/2021 17:59:29 - INFO - __main__ - Step 26897: {'lr': 0.0004658952812916456, 'samples': 5164224, 'steps': 26896, 'loss/train': 1.3946799039840698} -08/30/2021 17:59:29 - INFO - __main__ - Step 26898: {'lr': 0.0004658926055298802, 'samples': 5164416, 'steps': 26897, 'loss/train': 1.4117990732192993} -08/30/2021 17:59:29 - INFO - __main__ - Step 26899: {'lr': 0.0004658899296708369, 'samples': 5164608, 'steps': 26898, 'loss/train': 1.3764944076538086} -08/30/2021 17:59:30 - INFO - __main__ - Step 26900: {'lr': 0.00046588725371451685, 'samples': 5164800, 'steps': 26899, 'loss/train': 1.512864589691162} -08/30/2021 17:59:31 - INFO - __main__ - Step 26901: {'lr': 0.00046588457766092134, 'samples': 5164992, 'steps': 26900, 'loss/train': 1.5008000135421753} -08/30/2021 17:59:31 - INFO - __main__ - Step 26902: {'lr': 0.00046588190151005163, 'samples': 5165184, 'steps': 26901, 'loss/train': 1.5895146131515503} -08/30/2021 17:59:32 - INFO - __main__ - Step 26903: {'lr': 0.00046587922526190883, 'samples': 5165376, 'steps': 26902, 'loss/train': 1.352649211883545} -08/30/2021 17:59:32 - INFO - __main__ - Step 26904: {'lr': 0.00046587654891649423, 'samples': 5165568, 'steps': 26903, 'loss/train': 2.2640106678009033} -08/30/2021 17:59:32 - INFO - __main__ - Step 26905: {'lr': 0.00046587387247380897, 'samples': 5165760, 'steps': 26904, 'loss/train': 1.7070716619491577} -08/30/2021 17:59:34 - INFO - __main__ - Step 26906: {'lr': 0.00046587119593385424, 'samples': 5165952, 'steps': 26905, 'loss/train': 1.495260238647461} -08/30/2021 17:59:34 - INFO - __main__ - Step 26907: {'lr': 0.00046586851929663134, 'samples': 5166144, 'steps': 26906, 'loss/train': 1.2227405309677124} -08/30/2021 17:59:35 - INFO - __main__ - Step 26908: {'lr': 0.00046586584256214135, 'samples': 5166336, 'steps': 26907, 'loss/train': 1.274914026260376} -08/30/2021 17:59:35 - INFO - __main__ - Step 26909: {'lr': 0.0004658631657303856, 'samples': 5166528, 'steps': 26908, 'loss/train': 0.8560934662818909} -08/30/2021 17:59:36 - INFO - __main__ - Step 26910: {'lr': 0.0004658604888013652, 'samples': 5166720, 'steps': 26909, 'loss/train': 1.6615206003189087} -08/30/2021 17:59:36 - INFO - __main__ - Step 26911: {'lr': 0.00046585781177508137, 'samples': 5166912, 'steps': 26910, 'loss/train': 2.079286813735962} -08/30/2021 17:59:38 - INFO - __main__ - Step 26912: {'lr': 0.0004658551346515354, 'samples': 5167104, 'steps': 26911, 'loss/train': 0.07465283572673798} -08/30/2021 17:59:38 - INFO - __main__ - Step 26913: {'lr': 0.00046585245743072833, 'samples': 5167296, 'steps': 26912, 'loss/train': 1.620635986328125} -08/30/2021 17:59:39 - INFO - __main__ - Step 26914: {'lr': 0.0004658497801126616, 'samples': 5167488, 'steps': 26913, 'loss/train': 1.3414040803909302} -08/30/2021 17:59:39 - INFO - __main__ - Step 26915: {'lr': 0.00046584710269733623, 'samples': 5167680, 'steps': 26914, 'loss/train': 1.435752272605896} -08/30/2021 17:59:39 - INFO - __main__ - Step 26916: {'lr': 0.00046584442518475354, 'samples': 5167872, 'steps': 26915, 'loss/train': 1.3708261251449585} -08/30/2021 17:59:41 - INFO - __main__ - Step 26917: {'lr': 0.0004658417475749146, 'samples': 5168064, 'steps': 26916, 'loss/train': 0.06692387163639069} -08/30/2021 17:59:41 - INFO - __main__ - Step 26918: {'lr': 0.00046583906986782074, 'samples': 5168256, 'steps': 26917, 'loss/train': 1.6083214282989502} -08/30/2021 17:59:42 - INFO - __main__ - Step 26919: {'lr': 0.0004658363920634732, 'samples': 5168448, 'steps': 26918, 'loss/train': 1.3549399375915527} -08/30/2021 17:59:42 - INFO - __main__ - Step 26920: {'lr': 0.000465833714161873, 'samples': 5168640, 'steps': 26919, 'loss/train': 1.7720448970794678} -08/30/2021 17:59:42 - INFO - __main__ - Step 26921: {'lr': 0.00046583103616302146, 'samples': 5168832, 'steps': 26920, 'loss/train': 0.20303179323673248} -08/30/2021 17:59:43 - INFO - __main__ - Step 26922: {'lr': 0.0004658283580669198, 'samples': 5169024, 'steps': 26921, 'loss/train': 1.0080013275146484} -08/30/2021 17:59:45 - INFO - __main__ - Step 26923: {'lr': 0.0004658256798735693, 'samples': 5169216, 'steps': 26922, 'loss/train': 1.368169903755188} -08/30/2021 17:59:45 - INFO - __main__ - Step 26924: {'lr': 0.000465823001582971, 'samples': 5169408, 'steps': 26923, 'loss/train': 1.1282775402069092} -08/30/2021 17:59:46 - INFO - __main__ - Step 26925: {'lr': 0.00046582032319512624, 'samples': 5169600, 'steps': 26924, 'loss/train': 2.120058536529541} -08/30/2021 17:59:46 - INFO - __main__ - Step 26926: {'lr': 0.00046581764471003605, 'samples': 5169792, 'steps': 26925, 'loss/train': 1.5686094760894775} -08/30/2021 17:59:46 - INFO - __main__ - Step 26927: {'lr': 0.0004658149661277019, 'samples': 5169984, 'steps': 26926, 'loss/train': 1.1897062063217163} -08/30/2021 17:59:48 - INFO - __main__ - Step 26928: {'lr': 0.0004658122874481248, 'samples': 5170176, 'steps': 26927, 'loss/train': 1.6875969171524048} -08/30/2021 17:59:48 - INFO - __main__ - Step 26929: {'lr': 0.000465809608671306, 'samples': 5170368, 'steps': 26928, 'loss/train': 1.5299280881881714} -08/30/2021 17:59:49 - INFO - __main__ - Step 26930: {'lr': 0.0004658069297972467, 'samples': 5170560, 'steps': 26929, 'loss/train': 1.452596664428711} -08/30/2021 17:59:49 - INFO - __main__ - Step 26931: {'lr': 0.00046580425082594823, 'samples': 5170752, 'steps': 26930, 'loss/train': 1.6443637609481812} -08/30/2021 17:59:49 - INFO - __main__ - Step 26932: {'lr': 0.00046580157175741155, 'samples': 5170944, 'steps': 26931, 'loss/train': 1.6452678442001343} -08/30/2021 17:59:51 - INFO - __main__ - Step 26933: {'lr': 0.0004657988925916381, 'samples': 5171136, 'steps': 26932, 'loss/train': 1.4347848892211914} -08/30/2021 17:59:51 - INFO - __main__ - Step 26934: {'lr': 0.000465796213328629, 'samples': 5171328, 'steps': 26933, 'loss/train': 1.8302736282348633} -08/30/2021 17:59:52 - INFO - __main__ - Step 26935: {'lr': 0.00046579353396838545, 'samples': 5171520, 'steps': 26934, 'loss/train': 1.3067013025283813} -08/30/2021 17:59:52 - INFO - __main__ - Step 26936: {'lr': 0.00046579085451090864, 'samples': 5171712, 'steps': 26935, 'loss/train': 2.155531406402588} -08/30/2021 17:59:52 - INFO - __main__ - Step 26937: {'lr': 0.00046578817495619983, 'samples': 5171904, 'steps': 26936, 'loss/train': 1.717665672302246} -08/30/2021 17:59:54 - INFO - __main__ - Step 26938: {'lr': 0.0004657854953042602, 'samples': 5172096, 'steps': 26937, 'loss/train': 1.2332600355148315} -08/30/2021 17:59:55 - INFO - __main__ - Step 26939: {'lr': 0.00046578281555509094, 'samples': 5172288, 'steps': 26938, 'loss/train': 1.4292773008346558} -08/30/2021 17:59:55 - INFO - __main__ - Step 26940: {'lr': 0.00046578013570869325, 'samples': 5172480, 'steps': 26939, 'loss/train': 0.8554905652999878} -08/30/2021 17:59:55 - INFO - __main__ - Step 26941: {'lr': 0.00046577745576506844, 'samples': 5172672, 'steps': 26940, 'loss/train': 1.1735535860061646} -08/30/2021 17:59:56 - INFO - __main__ - Step 26942: {'lr': 0.00046577477572421757, 'samples': 5172864, 'steps': 26941, 'loss/train': 1.6115187406539917} -08/30/2021 17:59:57 - INFO - __main__ - Step 26943: {'lr': 0.0004657720955861419, 'samples': 5173056, 'steps': 26942, 'loss/train': 1.2197036743164062} -08/30/2021 17:59:58 - INFO - __main__ - Step 26944: {'lr': 0.00046576941535084274, 'samples': 5173248, 'steps': 26943, 'loss/train': 1.4582329988479614} -08/30/2021 17:59:58 - INFO - __main__ - Step 26945: {'lr': 0.0004657667350183211, 'samples': 5173440, 'steps': 26944, 'loss/train': 1.435172200202942} -08/30/2021 17:59:58 - INFO - __main__ - Step 26946: {'lr': 0.00046576405458857836, 'samples': 5173632, 'steps': 26945, 'loss/train': 1.965851068496704} -08/30/2021 17:59:59 - INFO - __main__ - Step 26947: {'lr': 0.0004657613740616157, 'samples': 5173824, 'steps': 26946, 'loss/train': 1.4533733129501343} -08/30/2021 18:00:00 - INFO - __main__ - Step 26948: {'lr': 0.0004657586934374342, 'samples': 5174016, 'steps': 26947, 'loss/train': 2.0454695224761963} -08/30/2021 18:00:01 - INFO - __main__ - Step 26949: {'lr': 0.0004657560127160352, 'samples': 5174208, 'steps': 26948, 'loss/train': 0.8816270232200623} -08/30/2021 18:00:01 - INFO - __main__ - Step 26950: {'lr': 0.00046575333189741993, 'samples': 5174400, 'steps': 26949, 'loss/train': 1.6166325807571411} -08/30/2021 18:00:01 - INFO - __main__ - Step 26951: {'lr': 0.00046575065098158945, 'samples': 5174592, 'steps': 26950, 'loss/train': 1.4760130643844604} -08/30/2021 18:00:02 - INFO - __main__ - Step 26952: {'lr': 0.0004657479699685451, 'samples': 5174784, 'steps': 26951, 'loss/train': 1.284529447555542} -08/30/2021 18:00:03 - INFO - __main__ - Step 26953: {'lr': 0.00046574528885828803, 'samples': 5174976, 'steps': 26952, 'loss/train': 1.1363043785095215} -08/30/2021 18:00:04 - INFO - __main__ - Step 26954: {'lr': 0.0004657426076508195, 'samples': 5175168, 'steps': 26953, 'loss/train': 0.8876258134841919} -08/30/2021 18:00:04 - INFO - __main__ - Step 26955: {'lr': 0.00046573992634614064, 'samples': 5175360, 'steps': 26954, 'loss/train': 1.6934928894042969} -08/30/2021 18:00:04 - INFO - __main__ - Step 26956: {'lr': 0.00046573724494425274, 'samples': 5175552, 'steps': 26955, 'loss/train': 1.5810352563858032} -08/30/2021 18:00:05 - INFO - __main__ - Step 26957: {'lr': 0.00046573456344515694, 'samples': 5175744, 'steps': 26956, 'loss/train': 1.250922679901123} -08/30/2021 18:00:06 - INFO - __main__ - Step 26958: {'lr': 0.00046573188184885445, 'samples': 5175936, 'steps': 26957, 'loss/train': 1.3188906908035278} -08/30/2021 18:00:07 - INFO - __main__ - Step 26959: {'lr': 0.0004657292001553465, 'samples': 5176128, 'steps': 26958, 'loss/train': 0.06328149139881134} -08/30/2021 18:00:07 - INFO - __main__ - Step 26960: {'lr': 0.0004657265183646344, 'samples': 5176320, 'steps': 26959, 'loss/train': 1.6511822938919067} -08/30/2021 18:00:07 - INFO - __main__ - Step 26961: {'lr': 0.00046572383647671913, 'samples': 5176512, 'steps': 26960, 'loss/train': 1.7765454053878784} -08/30/2021 18:00:08 - INFO - __main__ - Step 26962: {'lr': 0.0004657211544916021, 'samples': 5176704, 'steps': 26961, 'loss/train': 0.3017668128013611} -08/30/2021 18:00:08 - INFO - __main__ - Step 26963: {'lr': 0.00046571847240928444, 'samples': 5176896, 'steps': 26962, 'loss/train': 1.1066577434539795} -08/30/2021 18:00:10 - INFO - __main__ - Step 26964: {'lr': 0.0004657157902297674, 'samples': 5177088, 'steps': 26963, 'loss/train': 1.6019381284713745} -08/30/2021 18:00:10 - INFO - __main__ - Step 26965: {'lr': 0.00046571310795305213, 'samples': 5177280, 'steps': 26964, 'loss/train': 1.538810133934021} -08/30/2021 18:00:10 - INFO - __main__ - Step 26966: {'lr': 0.0004657104255791398, 'samples': 5177472, 'steps': 26965, 'loss/train': 1.459782600402832} -08/30/2021 18:00:11 - INFO - __main__ - Step 26967: {'lr': 0.0004657077431080317, 'samples': 5177664, 'steps': 26966, 'loss/train': 0.059555113315582275} -08/30/2021 18:00:11 - INFO - __main__ - Step 26968: {'lr': 0.00046570506053972906, 'samples': 5177856, 'steps': 26967, 'loss/train': 0.24769888818264008} -08/30/2021 18:00:13 - INFO - __main__ - Step 26969: {'lr': 0.000465702377874233, 'samples': 5178048, 'steps': 26968, 'loss/train': 1.255476474761963} -08/30/2021 18:00:13 - INFO - __main__ - Step 26970: {'lr': 0.00046569969511154485, 'samples': 5178240, 'steps': 26969, 'loss/train': 1.66780424118042} -08/30/2021 18:00:13 - INFO - __main__ - Step 26971: {'lr': 0.0004656970122516657, 'samples': 5178432, 'steps': 26970, 'loss/train': 1.5754352807998657} -08/30/2021 18:00:14 - INFO - __main__ - Step 26972: {'lr': 0.0004656943292945968, 'samples': 5178624, 'steps': 26971, 'loss/train': 1.924007773399353} -08/30/2021 18:00:14 - INFO - __main__ - Step 26973: {'lr': 0.0004656916462403394, 'samples': 5178816, 'steps': 26972, 'loss/train': 1.4658902883529663} -08/30/2021 18:00:17 - INFO - __main__ - Step 26974: {'lr': 0.0004656889630888946, 'samples': 5179008, 'steps': 26973, 'loss/train': 2.0741961002349854} -08/30/2021 18:00:18 - INFO - __main__ - Step 26975: {'lr': 0.0004656862798402638, 'samples': 5179200, 'steps': 26974, 'loss/train': 1.6244912147521973} -08/30/2021 18:00:18 - INFO - __main__ - Step 26976: {'lr': 0.00046568359649444796, 'samples': 5179392, 'steps': 26975, 'loss/train': 1.8216925859451294} -08/30/2021 18:00:18 - INFO - __main__ - Step 26977: {'lr': 0.0004656809130514485, 'samples': 5179584, 'steps': 26976, 'loss/train': 1.8022947311401367} -08/30/2021 18:00:19 - INFO - __main__ - Step 26978: {'lr': 0.00046567822951126646, 'samples': 5179776, 'steps': 26977, 'loss/train': 1.8025085926055908} -08/30/2021 18:00:19 - INFO - __main__ - Step 26979: {'lr': 0.00046567554587390324, 'samples': 5179968, 'steps': 26978, 'loss/train': 1.7827305793762207} -08/30/2021 18:00:19 - INFO - __main__ - Step 26980: {'lr': 0.00046567286213935994, 'samples': 5180160, 'steps': 26979, 'loss/train': 1.6404439210891724} -08/30/2021 18:00:20 - INFO - __main__ - Step 26981: {'lr': 0.00046567017830763776, 'samples': 5180352, 'steps': 26980, 'loss/train': 1.7375833988189697} -08/30/2021 18:00:22 - INFO - __main__ - Step 26982: {'lr': 0.0004656674943787379, 'samples': 5180544, 'steps': 26981, 'loss/train': 1.5636651515960693} -08/30/2021 18:00:22 - INFO - __main__ - Step 26983: {'lr': 0.0004656648103526616, 'samples': 5180736, 'steps': 26982, 'loss/train': 1.382455825805664} -08/30/2021 18:00:23 - INFO - __main__ - Step 26984: {'lr': 0.00046566212622941005, 'samples': 5180928, 'steps': 26983, 'loss/train': 1.688787579536438} -08/30/2021 18:00:23 - INFO - __main__ - Step 26985: {'lr': 0.00046565944200898453, 'samples': 5181120, 'steps': 26984, 'loss/train': 1.9001823663711548} -08/30/2021 18:00:23 - INFO - __main__ - Step 26986: {'lr': 0.00046565675769138614, 'samples': 5181312, 'steps': 26985, 'loss/train': 0.9823494553565979} -08/30/2021 18:00:25 - INFO - __main__ - Step 26987: {'lr': 0.00046565407327661614, 'samples': 5181504, 'steps': 26986, 'loss/train': 1.2785985469818115} -08/30/2021 18:00:25 - INFO - __main__ - Step 26988: {'lr': 0.0004656513887646758, 'samples': 5181696, 'steps': 26987, 'loss/train': 0.9510458707809448} -08/30/2021 18:00:26 - INFO - __main__ - Step 26989: {'lr': 0.00046564870415556625, 'samples': 5181888, 'steps': 26988, 'loss/train': 1.7741374969482422} -08/30/2021 18:00:26 - INFO - __main__ - Step 26990: {'lr': 0.0004656460194492887, 'samples': 5182080, 'steps': 26989, 'loss/train': 1.8898942470550537} -08/30/2021 18:00:26 - INFO - __main__ - Step 26991: {'lr': 0.0004656433346458444, 'samples': 5182272, 'steps': 26990, 'loss/train': 1.4533418416976929} -08/30/2021 18:00:28 - INFO - __main__ - Step 26992: {'lr': 0.0004656406497452345, 'samples': 5182464, 'steps': 26991, 'loss/train': 0.4570915102958679} -08/30/2021 18:00:29 - INFO - __main__ - Step 26993: {'lr': 0.0004656379647474603, 'samples': 5182656, 'steps': 26992, 'loss/train': 1.7154120206832886} -08/30/2021 18:00:29 - INFO - __main__ - Step 26994: {'lr': 0.0004656352796525229, 'samples': 5182848, 'steps': 26993, 'loss/train': 1.6002998352050781} -08/30/2021 18:00:29 - INFO - __main__ - Step 26995: {'lr': 0.0004656325944604236, 'samples': 5183040, 'steps': 26994, 'loss/train': 2.3379414081573486} -08/30/2021 18:00:30 - INFO - __main__ - Step 26996: {'lr': 0.00046562990917116366, 'samples': 5183232, 'steps': 26995, 'loss/train': 2.3268332481384277} -08/30/2021 18:00:30 - INFO - __main__ - Step 26997: {'lr': 0.0004656272237847441, 'samples': 5183424, 'steps': 26996, 'loss/train': 1.5761443376541138} -08/30/2021 18:00:31 - INFO - __main__ - Step 26998: {'lr': 0.0004656245383011663, 'samples': 5183616, 'steps': 26997, 'loss/train': 1.7556006908416748} -08/30/2021 18:00:32 - INFO - __main__ - Step 26999: {'lr': 0.00046562185272043137, 'samples': 5183808, 'steps': 26998, 'loss/train': 1.1383898258209229} -08/30/2021 18:00:32 - INFO - __main__ - Step 27000: {'lr': 0.00046561916704254057, 'samples': 5184000, 'steps': 26999, 'loss/train': 1.391679048538208} -08/30/2021 18:00:33 - INFO - __main__ - Step 27001: {'lr': 0.0004656164812674951, 'samples': 5184192, 'steps': 27000, 'loss/train': 1.0219672918319702} -08/30/2021 18:00:33 - INFO - __main__ - Step 27002: {'lr': 0.00046561379539529626, 'samples': 5184384, 'steps': 27001, 'loss/train': 1.7161716222763062} -08/30/2021 18:00:34 - INFO - __main__ - Step 27003: {'lr': 0.0004656111094259451, 'samples': 5184576, 'steps': 27002, 'loss/train': 1.537265658378601} -08/30/2021 18:00:35 - INFO - __main__ - Step 27004: {'lr': 0.0004656084233594429, 'samples': 5184768, 'steps': 27003, 'loss/train': 1.6356860399246216} -08/30/2021 18:00:35 - INFO - __main__ - Step 27005: {'lr': 0.0004656057371957908, 'samples': 5184960, 'steps': 27004, 'loss/train': 1.807446837425232} -08/30/2021 18:00:36 - INFO - __main__ - Step 27006: {'lr': 0.00046560305093499015, 'samples': 5185152, 'steps': 27005, 'loss/train': 1.366638422012329} -08/30/2021 18:00:36 - INFO - __main__ - Step 27007: {'lr': 0.00046560036457704215, 'samples': 5185344, 'steps': 27006, 'loss/train': 1.4681525230407715} -08/30/2021 18:00:37 - INFO - __main__ - Step 27008: {'lr': 0.00046559767812194786, 'samples': 5185536, 'steps': 27007, 'loss/train': 1.4224255084991455} -08/30/2021 18:00:38 - INFO - __main__ - Step 27009: {'lr': 0.0004655949915697086, 'samples': 5185728, 'steps': 27008, 'loss/train': 1.3201313018798828} -08/30/2021 18:00:38 - INFO - __main__ - Step 27010: {'lr': 0.0004655923049203256, 'samples': 5185920, 'steps': 27009, 'loss/train': 1.4706474542617798} -08/30/2021 18:00:39 - INFO - __main__ - Step 27011: {'lr': 0.00046558961817380005, 'samples': 5186112, 'steps': 27010, 'loss/train': 2.05584454536438} -08/30/2021 18:00:39 - INFO - __main__ - Step 27012: {'lr': 0.00046558693133013306, 'samples': 5186304, 'steps': 27011, 'loss/train': 1.6807987689971924} -08/30/2021 18:00:39 - INFO - __main__ - Step 27013: {'lr': 0.000465584244389326, 'samples': 5186496, 'steps': 27012, 'loss/train': 1.2257968187332153} -08/30/2021 18:00:41 - INFO - __main__ - Step 27014: {'lr': 0.00046558155735137996, 'samples': 5186688, 'steps': 27013, 'loss/train': 1.448624610900879} -08/30/2021 18:00:41 - INFO - __main__ - Step 27015: {'lr': 0.00046557887021629623, 'samples': 5186880, 'steps': 27014, 'loss/train': 1.1582815647125244} -08/30/2021 18:00:41 - INFO - __main__ - Step 27016: {'lr': 0.000465576182984076, 'samples': 5187072, 'steps': 27015, 'loss/train': 2.0148961544036865} -08/30/2021 18:00:42 - INFO - __main__ - Step 27017: {'lr': 0.0004655734956547204, 'samples': 5187264, 'steps': 27016, 'loss/train': 1.5241016149520874} -08/30/2021 18:00:42 - INFO - __main__ - Step 27018: {'lr': 0.00046557080822823076, 'samples': 5187456, 'steps': 27017, 'loss/train': 1.4491941928863525} -08/30/2021 18:00:44 - INFO - __main__ - Step 27019: {'lr': 0.0004655681207046083, 'samples': 5187648, 'steps': 27018, 'loss/train': 0.8379098176956177} -08/30/2021 18:00:44 - INFO - __main__ - Step 27020: {'lr': 0.0004655654330838541, 'samples': 5187840, 'steps': 27019, 'loss/train': 1.3857444524765015} -08/30/2021 18:00:44 - INFO - __main__ - Step 27021: {'lr': 0.00046556274536596945, 'samples': 5188032, 'steps': 27020, 'loss/train': 1.6075927019119263} -08/30/2021 18:00:45 - INFO - __main__ - Step 27022: {'lr': 0.00046556005755095555, 'samples': 5188224, 'steps': 27021, 'loss/train': 1.4196367263793945} -08/30/2021 18:00:45 - INFO - __main__ - Step 27023: {'lr': 0.00046555736963881355, 'samples': 5188416, 'steps': 27022, 'loss/train': 1.0890384912490845} -08/30/2021 18:00:47 - INFO - __main__ - Step 27024: {'lr': 0.0004655546816295448, 'samples': 5188608, 'steps': 27023, 'loss/train': 1.5265403985977173} -08/30/2021 18:00:47 - INFO - __main__ - Step 27025: {'lr': 0.0004655519935231505, 'samples': 5188800, 'steps': 27024, 'loss/train': 1.6783900260925293} -08/30/2021 18:00:47 - INFO - __main__ - Step 27026: {'lr': 0.00046554930531963166, 'samples': 5188992, 'steps': 27025, 'loss/train': 1.0980746746063232} -08/30/2021 18:00:48 - INFO - __main__ - Step 27027: {'lr': 0.0004655466170189897, 'samples': 5189184, 'steps': 27026, 'loss/train': 1.1677947044372559} -08/30/2021 18:00:48 - INFO - __main__ - Step 27028: {'lr': 0.0004655439286212257, 'samples': 5189376, 'steps': 27027, 'loss/train': 1.392407774925232} -08/30/2021 18:00:50 - INFO - __main__ - Step 27029: {'lr': 0.00046554124012634105, 'samples': 5189568, 'steps': 27028, 'loss/train': 1.6881626844406128} -08/30/2021 18:00:50 - INFO - __main__ - Step 27030: {'lr': 0.0004655385515343368, 'samples': 5189760, 'steps': 27029, 'loss/train': 1.3778564929962158} -08/30/2021 18:00:51 - INFO - __main__ - Step 27031: {'lr': 0.0004655358628452142, 'samples': 5189952, 'steps': 27030, 'loss/train': 1.9335951805114746} -08/30/2021 18:00:51 - INFO - __main__ - Step 27032: {'lr': 0.00046553317405897444, 'samples': 5190144, 'steps': 27031, 'loss/train': 1.3064842224121094} -08/30/2021 18:00:51 - INFO - __main__ - Step 27033: {'lr': 0.0004655304851756188, 'samples': 5190336, 'steps': 27032, 'loss/train': 1.3732681274414062} -08/30/2021 18:00:53 - INFO - __main__ - Step 27034: {'lr': 0.0004655277961951484, 'samples': 5190528, 'steps': 27033, 'loss/train': 1.7316031455993652} -08/30/2021 18:00:54 - INFO - __main__ - Step 27035: {'lr': 0.00046552510711756444, 'samples': 5190720, 'steps': 27034, 'loss/train': 1.9706547260284424} -08/30/2021 18:00:54 - INFO - __main__ - Step 27036: {'lr': 0.0004655224179428683, 'samples': 5190912, 'steps': 27035, 'loss/train': 1.7437993288040161} -08/30/2021 18:00:54 - INFO - __main__ - Step 27037: {'lr': 0.00046551972867106106, 'samples': 5191104, 'steps': 27036, 'loss/train': 1.3878881931304932} -08/30/2021 18:00:55 - INFO - __main__ - Step 27038: {'lr': 0.00046551703930214393, 'samples': 5191296, 'steps': 27037, 'loss/train': 1.2605842351913452} -08/30/2021 18:00:56 - INFO - __main__ - Step 27039: {'lr': 0.00046551434983611823, 'samples': 5191488, 'steps': 27038, 'loss/train': 1.619400143623352} -08/30/2021 18:00:57 - INFO - __main__ - Step 27040: {'lr': 0.00046551166027298505, 'samples': 5191680, 'steps': 27039, 'loss/train': 1.4501162767410278} -08/30/2021 18:00:57 - INFO - __main__ - Step 27041: {'lr': 0.0004655089706127456, 'samples': 5191872, 'steps': 27040, 'loss/train': 1.5991936922073364} -08/30/2021 18:00:57 - INFO - __main__ - Step 27042: {'lr': 0.00046550628085540114, 'samples': 5192064, 'steps': 27041, 'loss/train': 1.3747488260269165} -08/30/2021 18:00:58 - INFO - __main__ - Step 27043: {'lr': 0.0004655035910009529, 'samples': 5192256, 'steps': 27042, 'loss/train': 1.0718268156051636} -08/30/2021 18:00:58 - INFO - __main__ - Step 27044: {'lr': 0.00046550090104940207, 'samples': 5192448, 'steps': 27043, 'loss/train': 1.4601668119430542} -08/30/2021 18:00:59 - INFO - __main__ - Step 27045: {'lr': 0.00046549821100074987, 'samples': 5192640, 'steps': 27044, 'loss/train': 1.5553958415985107} -08/30/2021 18:01:00 - INFO - __main__ - Step 27046: {'lr': 0.0004654955208549975, 'samples': 5192832, 'steps': 27045, 'loss/train': 0.8060368895530701} -08/30/2021 18:01:00 - INFO - __main__ - Step 27047: {'lr': 0.0004654928306121461, 'samples': 5193024, 'steps': 27046, 'loss/train': 1.4210699796676636} -08/30/2021 18:01:00 - INFO - __main__ - Step 27048: {'lr': 0.000465490140272197, 'samples': 5193216, 'steps': 27047, 'loss/train': 1.130094289779663} -08/30/2021 18:01:01 - INFO - __main__ - Step 27049: {'lr': 0.00046548744983515133, 'samples': 5193408, 'steps': 27048, 'loss/train': 1.4835467338562012} -08/30/2021 18:01:02 - INFO - __main__ - Step 27050: {'lr': 0.0004654847593010104, 'samples': 5193600, 'steps': 27049, 'loss/train': 1.7109342813491821} -08/30/2021 18:01:03 - INFO - __main__ - Step 27051: {'lr': 0.0004654820686697754, 'samples': 5193792, 'steps': 27050, 'loss/train': 1.5904674530029297} -08/30/2021 18:01:03 - INFO - __main__ - Step 27052: {'lr': 0.00046547937794144743, 'samples': 5193984, 'steps': 27051, 'loss/train': 0.756737470626831} -08/30/2021 18:01:03 - INFO - __main__ - Step 27053: {'lr': 0.00046547668711602774, 'samples': 5194176, 'steps': 27052, 'loss/train': 2.063991069793701} -08/30/2021 18:01:04 - INFO - __main__ - Step 27054: {'lr': 0.0004654739961935177, 'samples': 5194368, 'steps': 27053, 'loss/train': 1.1815845966339111} -08/30/2021 18:01:06 - INFO - __main__ - Step 27055: {'lr': 0.0004654713051739183, 'samples': 5194560, 'steps': 27054, 'loss/train': 1.8301626443862915} -08/30/2021 18:01:06 - INFO - __main__ - Step 27056: {'lr': 0.000465468614057231, 'samples': 5194752, 'steps': 27055, 'loss/train': 1.7003332376480103} -08/30/2021 18:01:06 - INFO - __main__ - Step 27057: {'lr': 0.0004654659228434567, 'samples': 5194944, 'steps': 27056, 'loss/train': 1.5856363773345947} -08/30/2021 18:01:07 - INFO - __main__ - Step 27058: {'lr': 0.00046546323153259686, 'samples': 5195136, 'steps': 27057, 'loss/train': 0.06997363269329071} -08/30/2021 18:01:07 - INFO - __main__ - Step 27059: {'lr': 0.00046546054012465253, 'samples': 5195328, 'steps': 27058, 'loss/train': 1.8706170320510864} -08/30/2021 18:01:09 - INFO - __main__ - Step 27060: {'lr': 0.00046545784861962516, 'samples': 5195520, 'steps': 27059, 'loss/train': 1.5879230499267578} -08/30/2021 18:01:09 - INFO - __main__ - Step 27061: {'lr': 0.00046545515701751567, 'samples': 5195712, 'steps': 27060, 'loss/train': 1.664392113685608} -08/30/2021 18:01:10 - INFO - __main__ - Step 27062: {'lr': 0.00046545246531832547, 'samples': 5195904, 'steps': 27061, 'loss/train': 1.0261359214782715} -08/30/2021 18:01:10 - INFO - __main__ - Step 27063: {'lr': 0.0004654497735220557, 'samples': 5196096, 'steps': 27062, 'loss/train': 1.1374526023864746} -08/30/2021 18:01:10 - INFO - __main__ - Step 27064: {'lr': 0.0004654470816287076, 'samples': 5196288, 'steps': 27063, 'loss/train': 1.4947664737701416} -08/30/2021 18:01:12 - INFO - __main__ - Step 27065: {'lr': 0.0004654443896382824, 'samples': 5196480, 'steps': 27064, 'loss/train': 1.6301007270812988} -08/30/2021 18:01:13 - INFO - __main__ - Step 27066: {'lr': 0.0004654416975507812, 'samples': 5196672, 'steps': 27065, 'loss/train': 1.6354727745056152} -08/30/2021 18:01:13 - INFO - __main__ - Step 27067: {'lr': 0.0004654390053662053, 'samples': 5196864, 'steps': 27066, 'loss/train': 1.7120006084442139} -08/30/2021 18:01:13 - INFO - __main__ - Step 27068: {'lr': 0.000465436313084556, 'samples': 5197056, 'steps': 27067, 'loss/train': 0.16369417309761047} -08/30/2021 18:01:14 - INFO - __main__ - Step 27069: {'lr': 0.0004654336207058344, 'samples': 5197248, 'steps': 27068, 'loss/train': 0.050382111221551895} -08/30/2021 18:01:14 - INFO - __main__ - Step 27070: {'lr': 0.0004654309282300416, 'samples': 5197440, 'steps': 27069, 'loss/train': 1.7151918411254883} -08/30/2021 18:01:16 - INFO - __main__ - Step 27071: {'lr': 0.00046542823565717914, 'samples': 5197632, 'steps': 27070, 'loss/train': 1.1886026859283447} -08/30/2021 18:01:16 - INFO - __main__ - Step 27072: {'lr': 0.00046542554298724793, 'samples': 5197824, 'steps': 27071, 'loss/train': 2.072775363922119} -08/30/2021 18:01:17 - INFO - __main__ - Step 27073: {'lr': 0.00046542285022024935, 'samples': 5198016, 'steps': 27072, 'loss/train': 1.4394422769546509} -08/30/2021 18:01:17 - INFO - __main__ - Step 27074: {'lr': 0.0004654201573561845, 'samples': 5198208, 'steps': 27073, 'loss/train': 1.8477309942245483} -08/30/2021 18:01:17 - INFO - __main__ - Step 27075: {'lr': 0.00046541746439505467, 'samples': 5198400, 'steps': 27074, 'loss/train': 1.052707314491272} -08/30/2021 18:01:19 - INFO - __main__ - Step 27076: {'lr': 0.00046541477133686107, 'samples': 5198592, 'steps': 27075, 'loss/train': 1.182202696800232} -08/30/2021 18:01:19 - INFO - __main__ - Step 27077: {'lr': 0.0004654120781816049, 'samples': 5198784, 'steps': 27076, 'loss/train': 1.7987797260284424} -08/30/2021 18:01:20 - INFO - __main__ - Step 27078: {'lr': 0.00046540938492928735, 'samples': 5198976, 'steps': 27077, 'loss/train': 0.34112757444381714} -08/30/2021 18:01:20 - INFO - __main__ - Step 27079: {'lr': 0.0004654066915799097, 'samples': 5199168, 'steps': 27078, 'loss/train': 1.1117234230041504} -08/30/2021 18:01:20 - INFO - __main__ - Step 27080: {'lr': 0.000465403998133473, 'samples': 5199360, 'steps': 27079, 'loss/train': 1.4834051132202148} -08/30/2021 18:01:22 - INFO - __main__ - Step 27081: {'lr': 0.0004654013045899788, 'samples': 5199552, 'steps': 27080, 'loss/train': 1.434158444404602} -08/30/2021 18:01:22 - INFO - __main__ - Step 27082: {'lr': 0.00046539861094942794, 'samples': 5199744, 'steps': 27081, 'loss/train': 1.2534668445587158} -08/30/2021 18:01:23 - INFO - __main__ - Step 27083: {'lr': 0.00046539591721182175, 'samples': 5199936, 'steps': 27082, 'loss/train': 1.9246628284454346} -08/30/2021 18:01:23 - INFO - __main__ - Step 27084: {'lr': 0.00046539322337716153, 'samples': 5200128, 'steps': 27083, 'loss/train': 3.3916218280792236} -08/30/2021 18:01:23 - INFO - __main__ - Step 27085: {'lr': 0.00046539052944544846, 'samples': 5200320, 'steps': 27084, 'loss/train': 1.1483354568481445} -08/30/2021 18:01:26 - INFO - __main__ - Step 27086: {'lr': 0.0004653878354166838, 'samples': 5200512, 'steps': 27085, 'loss/train': 0.10694511234760284} -08/30/2021 18:01:26 - INFO - __main__ - Step 27087: {'lr': 0.0004653851412908686, 'samples': 5200704, 'steps': 27086, 'loss/train': 1.6052772998809814} -08/30/2021 18:01:27 - INFO - __main__ - Step 27088: {'lr': 0.0004653824470680043, 'samples': 5200896, 'steps': 27087, 'loss/train': 1.2588305473327637} -08/30/2021 18:01:27 - INFO - __main__ - Step 27089: {'lr': 0.00046537975274809186, 'samples': 5201088, 'steps': 27088, 'loss/train': 0.16034357249736786} -08/30/2021 18:01:27 - INFO - __main__ - Step 27090: {'lr': 0.0004653770583311327, 'samples': 5201280, 'steps': 27089, 'loss/train': 1.302323579788208} -08/30/2021 18:01:29 - INFO - __main__ - Step 27091: {'lr': 0.00046537436381712796, 'samples': 5201472, 'steps': 27090, 'loss/train': 1.091360330581665} -08/30/2021 18:01:29 - INFO - __main__ - Step 27092: {'lr': 0.00046537166920607886, 'samples': 5201664, 'steps': 27091, 'loss/train': 1.9743883609771729} -08/30/2021 18:01:30 - INFO - __main__ - Step 27093: {'lr': 0.00046536897449798656, 'samples': 5201856, 'steps': 27092, 'loss/train': 1.6381726264953613} -08/30/2021 18:01:30 - INFO - __main__ - Step 27094: {'lr': 0.00046536627969285236, 'samples': 5202048, 'steps': 27093, 'loss/train': 1.96189546585083} -08/30/2021 18:01:30 - INFO - __main__ - Step 27095: {'lr': 0.0004653635847906774, 'samples': 5202240, 'steps': 27094, 'loss/train': 1.8539103269577026} -08/30/2021 18:01:31 - INFO - __main__ - Step 27096: {'lr': 0.000465360889791463, 'samples': 5202432, 'steps': 27095, 'loss/train': 1.4487504959106445} -08/30/2021 18:01:32 - INFO - __main__ - Step 27097: {'lr': 0.0004653581946952103, 'samples': 5202624, 'steps': 27096, 'loss/train': 2.0275697708129883} -08/30/2021 18:01:33 - INFO - __main__ - Step 27098: {'lr': 0.0004653554995019205, 'samples': 5202816, 'steps': 27097, 'loss/train': 1.635689377784729} -08/30/2021 18:01:33 - INFO - __main__ - Step 27099: {'lr': 0.0004653528042115948, 'samples': 5203008, 'steps': 27098, 'loss/train': 1.2576196193695068} -08/30/2021 18:01:33 - INFO - __main__ - Step 27100: {'lr': 0.0004653501088242345, 'samples': 5203200, 'steps': 27099, 'loss/train': 1.8818833827972412} -08/30/2021 18:01:34 - INFO - __main__ - Step 27101: {'lr': 0.0004653474133398408, 'samples': 5203392, 'steps': 27100, 'loss/train': 1.4839212894439697} -08/30/2021 18:01:35 - INFO - __main__ - Step 27102: {'lr': 0.00046534471775841474, 'samples': 5203584, 'steps': 27101, 'loss/train': 0.7570738196372986} -08/30/2021 18:01:36 - INFO - __main__ - Step 27103: {'lr': 0.0004653420220799578, 'samples': 5203776, 'steps': 27102, 'loss/train': 0.6034243702888489} -08/30/2021 18:01:36 - INFO - __main__ - Step 27104: {'lr': 0.000465339326304471, 'samples': 5203968, 'steps': 27103, 'loss/train': 0.27861687541007996} -08/30/2021 18:01:37 - INFO - __main__ - Step 27105: {'lr': 0.0004653366304319556, 'samples': 5204160, 'steps': 27104, 'loss/train': 1.9334520101547241} -08/30/2021 18:01:37 - INFO - __main__ - Step 27106: {'lr': 0.0004653339344624129, 'samples': 5204352, 'steps': 27105, 'loss/train': 1.6144770383834839} -08/30/2021 18:01:38 - INFO - __main__ - Step 27107: {'lr': 0.00046533123839584406, 'samples': 5204544, 'steps': 27106, 'loss/train': 0.9711307883262634} -08/30/2021 18:01:39 - INFO - __main__ - Step 27108: {'lr': 0.0004653285422322503, 'samples': 5204736, 'steps': 27107, 'loss/train': 2.1607308387756348} -08/30/2021 18:01:39 - INFO - __main__ - Step 27109: {'lr': 0.00046532584597163275, 'samples': 5204928, 'steps': 27108, 'loss/train': 1.4216431379318237} -08/30/2021 18:01:40 - INFO - __main__ - Step 27110: {'lr': 0.0004653231496139927, 'samples': 5205120, 'steps': 27109, 'loss/train': 1.1179980039596558} -08/30/2021 18:01:40 - INFO - __main__ - Step 27111: {'lr': 0.0004653204531593315, 'samples': 5205312, 'steps': 27110, 'loss/train': 1.4066784381866455} -08/30/2021 18:01:42 - INFO - __main__ - Step 27112: {'lr': 0.0004653177566076501, 'samples': 5205504, 'steps': 27111, 'loss/train': 1.4669851064682007} -08/30/2021 18:01:42 - INFO - __main__ - Step 27113: {'lr': 0.0004653150599589498, 'samples': 5205696, 'steps': 27112, 'loss/train': 2.0896048545837402} -08/30/2021 18:01:42 - INFO - __main__ - Step 27114: {'lr': 0.0004653123632132319, 'samples': 5205888, 'steps': 27113, 'loss/train': 2.693441867828369} -08/30/2021 18:01:43 - INFO - __main__ - Step 27115: {'lr': 0.0004653096663704976, 'samples': 5206080, 'steps': 27114, 'loss/train': 1.4360371828079224} -08/30/2021 18:01:43 - INFO - __main__ - Step 27116: {'lr': 0.0004653069694307481, 'samples': 5206272, 'steps': 27115, 'loss/train': 1.2330105304718018} -08/30/2021 18:01:44 - INFO - __main__ - Step 27117: {'lr': 0.00046530427239398453, 'samples': 5206464, 'steps': 27116, 'loss/train': 1.0283563137054443} -08/30/2021 18:01:45 - INFO - __main__ - Step 27118: {'lr': 0.0004653015752602082, 'samples': 5206656, 'steps': 27117, 'loss/train': 1.6964225769042969} -08/30/2021 18:01:45 - INFO - __main__ - Step 27119: {'lr': 0.0004652988780294204, 'samples': 5206848, 'steps': 27118, 'loss/train': 1.095198392868042} -08/30/2021 18:01:46 - INFO - __main__ - Step 27120: {'lr': 0.00046529618070162215, 'samples': 5207040, 'steps': 27119, 'loss/train': 1.318901777267456} -08/30/2021 18:01:46 - INFO - __main__ - Step 27121: {'lr': 0.00046529348327681476, 'samples': 5207232, 'steps': 27120, 'loss/train': 1.682550311088562} -08/30/2021 18:01:46 - INFO - __main__ - Step 27122: {'lr': 0.0004652907857549995, 'samples': 5207424, 'steps': 27121, 'loss/train': 1.5472487211227417} -08/30/2021 18:01:48 - INFO - __main__ - Step 27123: {'lr': 0.0004652880881361775, 'samples': 5207616, 'steps': 27122, 'loss/train': 0.8448706865310669} -08/30/2021 18:01:48 - INFO - __main__ - Step 27124: {'lr': 0.00046528539042035, 'samples': 5207808, 'steps': 27123, 'loss/train': 1.7188612222671509} -08/30/2021 18:01:49 - INFO - __main__ - Step 27125: {'lr': 0.0004652826926075183, 'samples': 5208000, 'steps': 27124, 'loss/train': 1.3044096231460571} -08/30/2021 18:01:49 - INFO - __main__ - Step 27126: {'lr': 0.00046527999469768346, 'samples': 5208192, 'steps': 27125, 'loss/train': 1.2946099042892456} -08/30/2021 18:01:49 - INFO - __main__ - Step 27127: {'lr': 0.0004652772966908468, 'samples': 5208384, 'steps': 27126, 'loss/train': 1.1339104175567627} -08/30/2021 18:01:51 - INFO - __main__ - Step 27128: {'lr': 0.0004652745985870095, 'samples': 5208576, 'steps': 27127, 'loss/train': 1.3347536325454712} -08/30/2021 18:01:51 - INFO - __main__ - Step 27129: {'lr': 0.0004652719003861728, 'samples': 5208768, 'steps': 27128, 'loss/train': 1.338863730430603} -08/30/2021 18:01:52 - INFO - __main__ - Step 27130: {'lr': 0.0004652692020883379, 'samples': 5208960, 'steps': 27129, 'loss/train': 0.1407596915960312} -08/30/2021 18:01:52 - INFO - __main__ - Step 27131: {'lr': 0.00046526650369350605, 'samples': 5209152, 'steps': 27130, 'loss/train': 1.8553941249847412} -08/30/2021 18:01:53 - INFO - __main__ - Step 27132: {'lr': 0.0004652638052016784, 'samples': 5209344, 'steps': 27131, 'loss/train': 1.689576268196106} -08/30/2021 18:01:54 - INFO - __main__ - Step 27133: {'lr': 0.00046526110661285615, 'samples': 5209536, 'steps': 27132, 'loss/train': 1.757028341293335} -08/30/2021 18:01:55 - INFO - __main__ - Step 27134: {'lr': 0.00046525840792704064, 'samples': 5209728, 'steps': 27133, 'loss/train': 2.376382350921631} -08/30/2021 18:01:55 - INFO - __main__ - Step 27135: {'lr': 0.000465255709144233, 'samples': 5209920, 'steps': 27134, 'loss/train': 1.4509390592575073} -08/30/2021 18:01:55 - INFO - __main__ - Step 27136: {'lr': 0.00046525301026443443, 'samples': 5210112, 'steps': 27135, 'loss/train': 1.6816036701202393} -08/30/2021 18:01:56 - INFO - __main__ - Step 27137: {'lr': 0.0004652503112876463, 'samples': 5210304, 'steps': 27136, 'loss/train': 1.2493385076522827} -08/30/2021 18:01:57 - INFO - __main__ - Step 27138: {'lr': 0.00046524761221386956, 'samples': 5210496, 'steps': 27137, 'loss/train': 1.4471927881240845} -08/30/2021 18:01:58 - INFO - __main__ - Step 27139: {'lr': 0.0004652449130431056, 'samples': 5210688, 'steps': 27138, 'loss/train': 1.7560170888900757} -08/30/2021 18:01:58 - INFO - __main__ - Step 27140: {'lr': 0.00046524221377535564, 'samples': 5210880, 'steps': 27139, 'loss/train': 1.0139490365982056} -08/30/2021 18:01:58 - INFO - __main__ - Step 27141: {'lr': 0.00046523951441062087, 'samples': 5211072, 'steps': 27140, 'loss/train': 1.6119662523269653} -08/30/2021 18:01:59 - INFO - __main__ - Step 27142: {'lr': 0.0004652368149489024, 'samples': 5211264, 'steps': 27141, 'loss/train': 1.7705886363983154} -08/30/2021 18:02:01 - INFO - __main__ - Step 27143: {'lr': 0.0004652341153902016, 'samples': 5211456, 'steps': 27142, 'loss/train': 1.0436846017837524} -08/30/2021 18:02:01 - INFO - __main__ - Step 27144: {'lr': 0.00046523141573451965, 'samples': 5211648, 'steps': 27143, 'loss/train': 0.8901267051696777} -08/30/2021 18:02:02 - INFO - __main__ - Step 27145: {'lr': 0.0004652287159818577, 'samples': 5211840, 'steps': 27144, 'loss/train': 1.3173696994781494} -08/30/2021 18:02:02 - INFO - __main__ - Step 27146: {'lr': 0.00046522601613221704, 'samples': 5212032, 'steps': 27145, 'loss/train': 1.683090329170227} -08/30/2021 18:02:02 - INFO - __main__ - Step 27147: {'lr': 0.0004652233161855989, 'samples': 5212224, 'steps': 27146, 'loss/train': 1.6737595796585083} -08/30/2021 18:02:04 - INFO - __main__ - Step 27148: {'lr': 0.0004652206161420044, 'samples': 5212416, 'steps': 27147, 'loss/train': 1.9634326696395874} -08/30/2021 18:02:04 - INFO - __main__ - Step 27149: {'lr': 0.00046521791600143483, 'samples': 5212608, 'steps': 27148, 'loss/train': 1.0778173208236694} -08/30/2021 18:02:05 - INFO - __main__ - Step 27150: {'lr': 0.00046521521576389134, 'samples': 5212800, 'steps': 27149, 'loss/train': 1.6184779405593872} -08/30/2021 18:02:05 - INFO - __main__ - Step 27151: {'lr': 0.00046521251542937524, 'samples': 5212992, 'steps': 27150, 'loss/train': 1.2396254539489746} -08/30/2021 18:02:05 - INFO - __main__ - Step 27152: {'lr': 0.0004652098149978877, 'samples': 5213184, 'steps': 27151, 'loss/train': 1.4671834707260132} -08/30/2021 18:02:06 - INFO - __main__ - Step 27153: {'lr': 0.00046520711446943, 'samples': 5213376, 'steps': 27152, 'loss/train': 1.4779397249221802} -08/30/2021 18:02:07 - INFO - __main__ - Step 27154: {'lr': 0.0004652044138440032, 'samples': 5213568, 'steps': 27153, 'loss/train': 1.2149711847305298} -08/30/2021 18:02:08 - INFO - __main__ - Step 27155: {'lr': 0.00046520171312160863, 'samples': 5213760, 'steps': 27154, 'loss/train': 1.5334635972976685} -08/30/2021 18:02:08 - INFO - __main__ - Step 27156: {'lr': 0.00046519901230224756, 'samples': 5213952, 'steps': 27155, 'loss/train': 1.6847068071365356} -08/30/2021 18:02:08 - INFO - __main__ - Step 27157: {'lr': 0.000465196311385921, 'samples': 5214144, 'steps': 27156, 'loss/train': 1.1634342670440674} -08/30/2021 18:02:09 - INFO - __main__ - Step 27158: {'lr': 0.0004651936103726304, 'samples': 5214336, 'steps': 27157, 'loss/train': 1.6953181028366089} -08/30/2021 18:02:10 - INFO - __main__ - Step 27159: {'lr': 0.0004651909092623769, 'samples': 5214528, 'steps': 27158, 'loss/train': 1.682037115097046} -08/30/2021 18:02:11 - INFO - __main__ - Step 27160: {'lr': 0.00046518820805516165, 'samples': 5214720, 'steps': 27159, 'loss/train': 2.1666359901428223} -08/30/2021 18:02:11 - INFO - __main__ - Step 27161: {'lr': 0.0004651855067509859, 'samples': 5214912, 'steps': 27160, 'loss/train': 0.923642635345459} -08/30/2021 18:02:11 - INFO - __main__ - Step 27162: {'lr': 0.0004651828053498509, 'samples': 5215104, 'steps': 27161, 'loss/train': 0.15039899945259094} -08/30/2021 18:02:12 - INFO - __main__ - Step 27163: {'lr': 0.0004651801038517579, 'samples': 5215296, 'steps': 27162, 'loss/train': 1.6620742082595825} -08/30/2021 18:02:13 - INFO - __main__ - Step 27164: {'lr': 0.000465177402256708, 'samples': 5215488, 'steps': 27163, 'loss/train': 1.2420668601989746} -08/30/2021 18:02:14 - INFO - __main__ - Step 27165: {'lr': 0.00046517470056470244, 'samples': 5215680, 'steps': 27164, 'loss/train': 1.8143824338912964} -08/30/2021 18:02:14 - INFO - __main__ - Step 27166: {'lr': 0.00046517199877574257, 'samples': 5215872, 'steps': 27165, 'loss/train': 1.2720283269882202} -08/30/2021 18:02:14 - INFO - __main__ - Step 27167: {'lr': 0.0004651692968898295, 'samples': 5216064, 'steps': 27166, 'loss/train': 1.4383347034454346} -08/30/2021 18:02:15 - INFO - __main__ - Step 27168: {'lr': 0.00046516659490696444, 'samples': 5216256, 'steps': 27167, 'loss/train': 1.142825722694397} -08/30/2021 18:02:16 - INFO - __main__ - Step 27169: {'lr': 0.0004651638928271487, 'samples': 5216448, 'steps': 27168, 'loss/train': 1.1730382442474365} -08/30/2021 18:02:17 - INFO - __main__ - Step 27170: {'lr': 0.00046516119065038335, 'samples': 5216640, 'steps': 27169, 'loss/train': 1.4490641355514526} -08/30/2021 18:02:17 - INFO - __main__ - Step 27171: {'lr': 0.00046515848837666975, 'samples': 5216832, 'steps': 27170, 'loss/train': 1.3089524507522583} -08/30/2021 18:02:17 - INFO - __main__ - Step 27172: {'lr': 0.00046515578600600895, 'samples': 5217024, 'steps': 27171, 'loss/train': 1.6375516653060913} -08/30/2021 18:02:18 - INFO - __main__ - Step 27173: {'lr': 0.0004651530835384024, 'samples': 5217216, 'steps': 27172, 'loss/train': 0.993874192237854} -08/30/2021 18:02:20 - INFO - __main__ - Step 27174: {'lr': 0.0004651503809738511, 'samples': 5217408, 'steps': 27173, 'loss/train': 1.8553403615951538} -08/30/2021 18:02:20 - INFO - __main__ - Step 27175: {'lr': 0.0004651476783123564, 'samples': 5217600, 'steps': 27174, 'loss/train': 0.7931986451148987} -08/30/2021 18:02:20 - INFO - __main__ - Step 27176: {'lr': 0.00046514497555391946, 'samples': 5217792, 'steps': 27175, 'loss/train': 1.2725205421447754} -08/30/2021 18:02:21 - INFO - __main__ - Step 27177: {'lr': 0.0004651422726985415, 'samples': 5217984, 'steps': 27176, 'loss/train': 1.2557040452957153} -08/30/2021 18:02:21 - INFO - __main__ - Step 27178: {'lr': 0.00046513956974622377, 'samples': 5218176, 'steps': 27177, 'loss/train': 1.3666027784347534} -08/30/2021 18:02:21 - INFO - __main__ - Step 27179: {'lr': 0.00046513686669696756, 'samples': 5218368, 'steps': 27178, 'loss/train': 1.3838618993759155} -08/30/2021 18:02:23 - INFO - __main__ - Step 27180: {'lr': 0.00046513416355077386, 'samples': 5218560, 'steps': 27179, 'loss/train': 0.4842136800289154} -08/30/2021 18:02:23 - INFO - __main__ - Step 27181: {'lr': 0.0004651314603076441, 'samples': 5218752, 'steps': 27180, 'loss/train': 0.9858081936836243} -08/30/2021 18:02:24 - INFO - __main__ - Step 27182: {'lr': 0.00046512875696757937, 'samples': 5218944, 'steps': 27181, 'loss/train': 1.5500998497009277} -08/30/2021 18:02:24 - INFO - __main__ - Step 27183: {'lr': 0.00046512605353058096, 'samples': 5219136, 'steps': 27182, 'loss/train': 1.9521722793579102} -08/30/2021 18:02:24 - INFO - __main__ - Step 27184: {'lr': 0.00046512334999665006, 'samples': 5219328, 'steps': 27183, 'loss/train': 1.0258973836898804} -08/30/2021 18:02:26 - INFO - __main__ - Step 27185: {'lr': 0.000465120646365788, 'samples': 5219520, 'steps': 27184, 'loss/train': 1.4164693355560303} -08/30/2021 18:02:26 - INFO - __main__ - Step 27186: {'lr': 0.0004651179426379958, 'samples': 5219712, 'steps': 27185, 'loss/train': 1.3320482969284058} -08/30/2021 18:02:27 - INFO - __main__ - Step 27187: {'lr': 0.00046511523881327476, 'samples': 5219904, 'steps': 27186, 'loss/train': 1.5076208114624023} -08/30/2021 18:02:27 - INFO - __main__ - Step 27188: {'lr': 0.00046511253489162616, 'samples': 5220096, 'steps': 27187, 'loss/train': 1.540059208869934} -08/30/2021 18:02:27 - INFO - __main__ - Step 27189: {'lr': 0.00046510983087305114, 'samples': 5220288, 'steps': 27188, 'loss/train': 1.2916322946548462} -08/30/2021 18:02:29 - INFO - __main__ - Step 27190: {'lr': 0.00046510712675755094, 'samples': 5220480, 'steps': 27189, 'loss/train': 1.959316611289978} -08/30/2021 18:02:29 - INFO - __main__ - Step 27191: {'lr': 0.00046510442254512686, 'samples': 5220672, 'steps': 27190, 'loss/train': 1.4867103099822998} -08/30/2021 18:02:30 - INFO - __main__ - Step 27192: {'lr': 0.00046510171823578, 'samples': 5220864, 'steps': 27191, 'loss/train': 1.876558542251587} -08/30/2021 18:02:30 - INFO - __main__ - Step 27193: {'lr': 0.0004650990138295116, 'samples': 5221056, 'steps': 27192, 'loss/train': 1.6605374813079834} -08/30/2021 18:02:30 - INFO - __main__ - Step 27194: {'lr': 0.00046509630932632293, 'samples': 5221248, 'steps': 27193, 'loss/train': 1.2944283485412598} -08/30/2021 18:02:31 - INFO - __main__ - Step 27195: {'lr': 0.0004650936047262152, 'samples': 5221440, 'steps': 27194, 'loss/train': 1.754934310913086} -08/30/2021 18:02:33 - INFO - __main__ - Step 27196: {'lr': 0.0004650909000291895, 'samples': 5221632, 'steps': 27195, 'loss/train': 0.21176883578300476} -08/30/2021 18:02:33 - INFO - __main__ - Step 27197: {'lr': 0.00046508819523524724, 'samples': 5221824, 'steps': 27196, 'loss/train': 1.88222336769104} -08/30/2021 18:02:33 - INFO - __main__ - Step 27198: {'lr': 0.0004650854903443896, 'samples': 5222016, 'steps': 27197, 'loss/train': 1.7587685585021973} -08/30/2021 18:02:34 - INFO - __main__ - Step 27199: {'lr': 0.00046508278535661775, 'samples': 5222208, 'steps': 27198, 'loss/train': 1.02782142162323} -08/30/2021 18:02:34 - INFO - __main__ - Step 27200: {'lr': 0.00046508008027193286, 'samples': 5222400, 'steps': 27199, 'loss/train': 1.965057373046875} -08/30/2021 18:02:36 - INFO - __main__ - Step 27201: {'lr': 0.0004650773750903363, 'samples': 5222592, 'steps': 27200, 'loss/train': 1.212222695350647} -08/30/2021 18:02:36 - INFO - __main__ - Step 27202: {'lr': 0.0004650746698118291, 'samples': 5222784, 'steps': 27201, 'loss/train': 1.7200069427490234} -08/30/2021 18:02:36 - INFO - __main__ - Step 27203: {'lr': 0.0004650719644364126, 'samples': 5222976, 'steps': 27202, 'loss/train': 1.4639238119125366} -08/30/2021 18:02:37 - INFO - __main__ - Step 27204: {'lr': 0.000465069258964088, 'samples': 5223168, 'steps': 27203, 'loss/train': 1.1928578615188599} -08/30/2021 18:02:37 - INFO - __main__ - Step 27205: {'lr': 0.0004650665533948565, 'samples': 5223360, 'steps': 27204, 'loss/train': 1.671126127243042} -08/30/2021 18:02:39 - INFO - __main__ - Step 27206: {'lr': 0.00046506384772871935, 'samples': 5223552, 'steps': 27205, 'loss/train': 1.2450087070465088} -08/30/2021 18:02:39 - INFO - __main__ - Step 27207: {'lr': 0.0004650611419656777, 'samples': 5223744, 'steps': 27206, 'loss/train': 1.1245115995407104} -08/30/2021 18:02:39 - INFO - __main__ - Step 27208: {'lr': 0.0004650584361057328, 'samples': 5223936, 'steps': 27207, 'loss/train': 0.17484788596630096} -08/30/2021 18:02:40 - INFO - __main__ - Step 27209: {'lr': 0.00046505573014888604, 'samples': 5224128, 'steps': 27208, 'loss/train': 1.763199806213379} -08/30/2021 18:02:40 - INFO - __main__ - Step 27210: {'lr': 0.0004650530240951383, 'samples': 5224320, 'steps': 27209, 'loss/train': 1.5048365592956543} -08/30/2021 18:02:42 - INFO - __main__ - Step 27211: {'lr': 0.0004650503179444911, 'samples': 5224512, 'steps': 27210, 'loss/train': 1.3131428956985474} -08/30/2021 18:02:42 - INFO - __main__ - Step 27212: {'lr': 0.00046504761169694555, 'samples': 5224704, 'steps': 27211, 'loss/train': 1.455526351928711} -08/30/2021 18:02:42 - INFO - __main__ - Step 27213: {'lr': 0.0004650449053525028, 'samples': 5224896, 'steps': 27212, 'loss/train': 1.5415327548980713} -08/30/2021 18:02:43 - INFO - __main__ - Step 27214: {'lr': 0.00046504219891116416, 'samples': 5225088, 'steps': 27213, 'loss/train': 1.2887331247329712} -08/30/2021 18:02:43 - INFO - __main__ - Step 27215: {'lr': 0.0004650394923729309, 'samples': 5225280, 'steps': 27214, 'loss/train': 1.2204267978668213} -08/30/2021 18:02:45 - INFO - __main__ - Step 27216: {'lr': 0.00046503678573780403, 'samples': 5225472, 'steps': 27215, 'loss/train': 1.389278531074524} -08/30/2021 18:02:45 - INFO - __main__ - Step 27217: {'lr': 0.000465034079005785, 'samples': 5225664, 'steps': 27216, 'loss/train': 2.055776596069336} -08/30/2021 18:02:46 - INFO - __main__ - Step 27218: {'lr': 0.00046503137217687485, 'samples': 5225856, 'steps': 27217, 'loss/train': 0.0949811041355133} -08/30/2021 18:02:46 - INFO - __main__ - Step 27219: {'lr': 0.0004650286652510749, 'samples': 5226048, 'steps': 27218, 'loss/train': 1.3490337133407593} -08/30/2021 18:02:46 - INFO - __main__ - Step 27220: {'lr': 0.0004650259582283864, 'samples': 5226240, 'steps': 27219, 'loss/train': 1.026698112487793} -08/30/2021 18:02:48 - INFO - __main__ - Step 27221: {'lr': 0.0004650232511088105, 'samples': 5226432, 'steps': 27220, 'loss/train': 1.5688090324401855} -08/30/2021 18:02:48 - INFO - __main__ - Step 27222: {'lr': 0.00046502054389234844, 'samples': 5226624, 'steps': 27221, 'loss/train': 1.7997719049453735} -08/30/2021 18:02:49 - INFO - __main__ - Step 27223: {'lr': 0.0004650178365790014, 'samples': 5226816, 'steps': 27222, 'loss/train': 0.0738530382514} -08/30/2021 18:02:49 - INFO - __main__ - Step 27224: {'lr': 0.0004650151291687707, 'samples': 5227008, 'steps': 27223, 'loss/train': 1.3296082019805908} -08/30/2021 18:02:49 - INFO - __main__ - Step 27225: {'lr': 0.00046501242166165747, 'samples': 5227200, 'steps': 27224, 'loss/train': 1.095910906791687} -08/30/2021 18:02:51 - INFO - __main__ - Step 27226: {'lr': 0.000465009714057663, 'samples': 5227392, 'steps': 27225, 'loss/train': 1.1816964149475098} -08/30/2021 18:02:51 - INFO - __main__ - Step 27227: {'lr': 0.00046500700635678844, 'samples': 5227584, 'steps': 27226, 'loss/train': 1.519883155822754} -08/30/2021 18:02:52 - INFO - __main__ - Step 27228: {'lr': 0.000465004298559035, 'samples': 5227776, 'steps': 27227, 'loss/train': 1.5541470050811768} -08/30/2021 18:02:52 - INFO - __main__ - Step 27229: {'lr': 0.00046500159066440404, 'samples': 5227968, 'steps': 27228, 'loss/train': 1.4665356874465942} -08/30/2021 18:02:52 - INFO - __main__ - Step 27230: {'lr': 0.0004649988826728966, 'samples': 5228160, 'steps': 27229, 'loss/train': 0.8733643889427185} -08/30/2021 18:02:53 - INFO - __main__ - Step 27231: {'lr': 0.000464996174584514, 'samples': 5228352, 'steps': 27230, 'loss/train': 1.6681219339370728} -08/30/2021 18:02:54 - INFO - __main__ - Step 27232: {'lr': 0.00046499346639925746, 'samples': 5228544, 'steps': 27231, 'loss/train': 1.3323636054992676} -08/30/2021 18:02:55 - INFO - __main__ - Step 27233: {'lr': 0.0004649907581171282, 'samples': 5228736, 'steps': 27232, 'loss/train': 1.2746250629425049} -08/30/2021 18:02:55 - INFO - __main__ - Step 27234: {'lr': 0.00046498804973812735, 'samples': 5228928, 'steps': 27233, 'loss/train': 1.0236037969589233} -08/30/2021 18:02:56 - INFO - __main__ - Step 27235: {'lr': 0.00046498534126225625, 'samples': 5229120, 'steps': 27234, 'loss/train': 1.393905520439148} -08/30/2021 18:02:56 - INFO - __main__ - Step 27236: {'lr': 0.0004649826326895161, 'samples': 5229312, 'steps': 27235, 'loss/train': 1.0438834428787231} -08/30/2021 18:02:57 - INFO - __main__ - Step 27237: {'lr': 0.0004649799240199081, 'samples': 5229504, 'steps': 27236, 'loss/train': 0.7269102931022644} -08/30/2021 18:02:58 - INFO - __main__ - Step 27238: {'lr': 0.0004649772152534334, 'samples': 5229696, 'steps': 27237, 'loss/train': 1.5188666582107544} -08/30/2021 18:02:58 - INFO - __main__ - Step 27239: {'lr': 0.0004649745063900933, 'samples': 5229888, 'steps': 27238, 'loss/train': 1.9725725650787354} -08/30/2021 18:02:58 - INFO - __main__ - Step 27240: {'lr': 0.000464971797429889, 'samples': 5230080, 'steps': 27239, 'loss/train': 1.210260033607483} -08/30/2021 18:02:59 - INFO - __main__ - Step 27241: {'lr': 0.00046496908837282173, 'samples': 5230272, 'steps': 27240, 'loss/train': 1.168676495552063} -08/30/2021 18:03:00 - INFO - __main__ - Step 27242: {'lr': 0.00046496637921889276, 'samples': 5230464, 'steps': 27241, 'loss/train': 1.859948992729187} -08/30/2021 18:03:01 - INFO - __main__ - Step 27243: {'lr': 0.0004649636699681031, 'samples': 5230656, 'steps': 27242, 'loss/train': 1.5435638427734375} -08/30/2021 18:03:01 - INFO - __main__ - Step 27244: {'lr': 0.00046496096062045427, 'samples': 5230848, 'steps': 27243, 'loss/train': 1.488871693611145} -08/30/2021 18:03:02 - INFO - __main__ - Step 27245: {'lr': 0.00046495825117594735, 'samples': 5231040, 'steps': 27244, 'loss/train': 1.4715319871902466} -08/30/2021 18:03:02 - INFO - __main__ - Step 27246: {'lr': 0.0004649555416345835, 'samples': 5231232, 'steps': 27245, 'loss/train': 1.8495218753814697} -08/30/2021 18:03:04 - INFO - __main__ - Step 27247: {'lr': 0.0004649528319963641, 'samples': 5231424, 'steps': 27246, 'loss/train': 1.6618481874465942} -08/30/2021 18:03:04 - INFO - __main__ - Step 27248: {'lr': 0.0004649501222612901, 'samples': 5231616, 'steps': 27247, 'loss/train': 1.2079572677612305} -08/30/2021 18:03:05 - INFO - __main__ - Step 27249: {'lr': 0.000464947412429363, 'samples': 5231808, 'steps': 27248, 'loss/train': 1.9796838760375977} -08/30/2021 18:03:05 - INFO - __main__ - Step 27250: {'lr': 0.000464944702500584, 'samples': 5232000, 'steps': 27249, 'loss/train': 1.690522313117981} -08/30/2021 18:03:05 - INFO - __main__ - Step 27251: {'lr': 0.0004649419924749541, 'samples': 5232192, 'steps': 27250, 'loss/train': 1.7213099002838135} -08/30/2021 18:03:06 - INFO - __main__ - Step 27252: {'lr': 0.0004649392823524746, 'samples': 5232384, 'steps': 27251, 'loss/train': 0.9100295901298523} -08/30/2021 18:03:07 - INFO - __main__ - Step 27253: {'lr': 0.0004649365721331469, 'samples': 5232576, 'steps': 27252, 'loss/train': 1.5809015035629272} -08/30/2021 18:03:08 - INFO - __main__ - Step 27254: {'lr': 0.00046493386181697206, 'samples': 5232768, 'steps': 27253, 'loss/train': 1.7417445182800293} -08/30/2021 18:03:08 - INFO - __main__ - Step 27255: {'lr': 0.00046493115140395136, 'samples': 5232960, 'steps': 27254, 'loss/train': 1.5555888414382935} -08/30/2021 18:03:08 - INFO - __main__ - Step 27256: {'lr': 0.000464928440894086, 'samples': 5233152, 'steps': 27255, 'loss/train': 1.2720096111297607} -08/30/2021 18:03:09 - INFO - __main__ - Step 27257: {'lr': 0.00046492573028737716, 'samples': 5233344, 'steps': 27256, 'loss/train': 1.5129177570343018} -08/30/2021 18:03:10 - INFO - __main__ - Step 27258: {'lr': 0.0004649230195838261, 'samples': 5233536, 'steps': 27257, 'loss/train': 1.2692806720733643} -08/30/2021 18:03:11 - INFO - __main__ - Step 27259: {'lr': 0.00046492030878343406, 'samples': 5233728, 'steps': 27258, 'loss/train': 1.562685251235962} -08/30/2021 18:03:11 - INFO - __main__ - Step 27260: {'lr': 0.00046491759788620227, 'samples': 5233920, 'steps': 27259, 'loss/train': 1.3309409618377686} -08/30/2021 18:03:12 - INFO - __main__ - Step 27261: {'lr': 0.0004649148868921319, 'samples': 5234112, 'steps': 27260, 'loss/train': 1.4846631288528442} -08/30/2021 18:03:12 - INFO - __main__ - Step 27262: {'lr': 0.00046491217580122427, 'samples': 5234304, 'steps': 27261, 'loss/train': 1.4535695314407349} -08/30/2021 18:03:14 - INFO - __main__ - Step 27263: {'lr': 0.00046490946461348045, 'samples': 5234496, 'steps': 27262, 'loss/train': 0.7473717927932739} -08/30/2021 18:03:14 - INFO - __main__ - Step 27264: {'lr': 0.00046490675332890177, 'samples': 5234688, 'steps': 27263, 'loss/train': 0.19532035291194916} -08/30/2021 18:03:14 - INFO - __main__ - Step 27265: {'lr': 0.00046490404194748935, 'samples': 5234880, 'steps': 27264, 'loss/train': 1.9025545120239258} -08/30/2021 18:03:15 - INFO - __main__ - Step 27266: {'lr': 0.00046490133046924457, 'samples': 5235072, 'steps': 27265, 'loss/train': 0.9349351525306702} -08/30/2021 18:03:15 - INFO - __main__ - Step 27267: {'lr': 0.0004648986188941685, 'samples': 5235264, 'steps': 27266, 'loss/train': 0.78515625} -08/30/2021 18:03:16 - INFO - __main__ - Step 27268: {'lr': 0.0004648959072222625, 'samples': 5235456, 'steps': 27267, 'loss/train': 1.3551311492919922} -08/30/2021 18:03:17 - INFO - __main__ - Step 27269: {'lr': 0.0004648931954535277, 'samples': 5235648, 'steps': 27268, 'loss/train': 1.1315070390701294} -08/30/2021 18:03:17 - INFO - __main__ - Step 27270: {'lr': 0.0004648904835879654, 'samples': 5235840, 'steps': 27269, 'loss/train': 1.0739414691925049} -08/30/2021 18:03:18 - INFO - __main__ - Step 27271: {'lr': 0.0004648877716255766, 'samples': 5236032, 'steps': 27270, 'loss/train': 1.052010178565979} -08/30/2021 18:03:18 - INFO - __main__ - Step 27272: {'lr': 0.00046488505956636286, 'samples': 5236224, 'steps': 27271, 'loss/train': 0.9770748019218445} -08/30/2021 18:03:20 - INFO - __main__ - Step 27273: {'lr': 0.0004648823474103251, 'samples': 5236416, 'steps': 27272, 'loss/train': 1.6778689622879028} -08/30/2021 18:03:20 - INFO - __main__ - Step 27274: {'lr': 0.0004648796351574648, 'samples': 5236608, 'steps': 27273, 'loss/train': 1.8462250232696533} -08/30/2021 18:03:20 - INFO - __main__ - Step 27275: {'lr': 0.0004648769228077829, 'samples': 5236800, 'steps': 27274, 'loss/train': 1.6655688285827637} -08/30/2021 18:03:21 - INFO - __main__ - Step 27276: {'lr': 0.00046487421036128085, 'samples': 5236992, 'steps': 27275, 'loss/train': 1.4138898849487305} -08/30/2021 18:03:21 - INFO - __main__ - Step 27277: {'lr': 0.00046487149781795976, 'samples': 5237184, 'steps': 27276, 'loss/train': 0.10334265977144241} -08/30/2021 18:03:21 - INFO - __main__ - Step 27278: {'lr': 0.00046486878517782094, 'samples': 5237376, 'steps': 27277, 'loss/train': 1.682212471961975} -08/30/2021 18:03:23 - INFO - __main__ - Step 27279: {'lr': 0.0004648660724408656, 'samples': 5237568, 'steps': 27278, 'loss/train': 1.694521427154541} -08/30/2021 18:03:23 - INFO - __main__ - Step 27280: {'lr': 0.00046486335960709485, 'samples': 5237760, 'steps': 27279, 'loss/train': 1.7350554466247559} -08/30/2021 18:03:24 - INFO - __main__ - Step 27281: {'lr': 0.00046486064667651, 'samples': 5237952, 'steps': 27280, 'loss/train': 1.4675053358078003} -08/30/2021 18:03:24 - INFO - __main__ - Step 27282: {'lr': 0.0004648579336491123, 'samples': 5238144, 'steps': 27281, 'loss/train': 1.6293554306030273} -08/30/2021 18:03:24 - INFO - __main__ - Step 27283: {'lr': 0.0004648552205249029, 'samples': 5238336, 'steps': 27282, 'loss/train': 1.2510106563568115} -08/30/2021 18:03:26 - INFO - __main__ - Step 27284: {'lr': 0.000464852507303883, 'samples': 5238528, 'steps': 27283, 'loss/train': 2.3260385990142822} -08/30/2021 18:03:26 - INFO - __main__ - Step 27285: {'lr': 0.0004648497939860539, 'samples': 5238720, 'steps': 27284, 'loss/train': 1.5813488960266113} -08/30/2021 18:03:27 - INFO - __main__ - Step 27286: {'lr': 0.0004648470805714169, 'samples': 5238912, 'steps': 27285, 'loss/train': 1.4133464097976685} -08/30/2021 18:03:27 - INFO - __main__ - Step 27287: {'lr': 0.00046484436705997303, 'samples': 5239104, 'steps': 27286, 'loss/train': 1.6518265008926392} -08/30/2021 18:03:27 - INFO - __main__ - Step 27288: {'lr': 0.0004648416534517236, 'samples': 5239296, 'steps': 27287, 'loss/train': 1.3845692873001099} -08/30/2021 18:03:29 - INFO - __main__ - Step 27289: {'lr': 0.00046483893974666983, 'samples': 5239488, 'steps': 27288, 'loss/train': 3.8499529361724854} -08/30/2021 18:03:30 - INFO - __main__ - Step 27290: {'lr': 0.000464836225944813, 'samples': 5239680, 'steps': 27289, 'loss/train': 2.0362470149993896} -08/30/2021 18:03:30 - INFO - __main__ - Step 27291: {'lr': 0.00046483351204615423, 'samples': 5239872, 'steps': 27290, 'loss/train': 1.3258978128433228} -08/30/2021 18:03:30 - INFO - __main__ - Step 27292: {'lr': 0.0004648307980506948, 'samples': 5240064, 'steps': 27291, 'loss/train': 1.7532356977462769} -08/30/2021 18:03:31 - INFO - __main__ - Step 27293: {'lr': 0.00046482808395843594, 'samples': 5240256, 'steps': 27292, 'loss/train': 0.10539980977773666} -08/30/2021 18:03:31 - INFO - __main__ - Step 27294: {'lr': 0.0004648253697693789, 'samples': 5240448, 'steps': 27293, 'loss/train': 0.046046182513237} -08/30/2021 18:03:32 - INFO - __main__ - Step 27295: {'lr': 0.0004648226554835248, 'samples': 5240640, 'steps': 27294, 'loss/train': 1.7988481521606445} -08/30/2021 18:03:33 - INFO - __main__ - Step 27296: {'lr': 0.000464819941100875, 'samples': 5240832, 'steps': 27295, 'loss/train': 1.3836617469787598} -08/30/2021 18:03:33 - INFO - __main__ - Step 27297: {'lr': 0.00046481722662143057, 'samples': 5241024, 'steps': 27296, 'loss/train': 1.6231448650360107} -08/30/2021 18:03:34 - INFO - __main__ - Step 27298: {'lr': 0.0004648145120451929, 'samples': 5241216, 'steps': 27297, 'loss/train': 1.3917350769042969} -08/30/2021 18:03:34 - INFO - __main__ - Step 27299: {'lr': 0.000464811797372163, 'samples': 5241408, 'steps': 27298, 'loss/train': 1.4628976583480835} -08/30/2021 18:03:36 - INFO - __main__ - Step 27300: {'lr': 0.00046480908260234234, 'samples': 5241600, 'steps': 27299, 'loss/train': 1.3640955686569214} -08/30/2021 18:03:36 - INFO - __main__ - Step 27301: {'lr': 0.0004648063677357319, 'samples': 5241792, 'steps': 27300, 'loss/train': 0.8540429472923279} -08/30/2021 18:03:36 - INFO - __main__ - Step 27302: {'lr': 0.00046480365277233316, 'samples': 5241984, 'steps': 27301, 'loss/train': 1.4378702640533447} -08/30/2021 18:03:37 - INFO - __main__ - Step 27303: {'lr': 0.00046480093771214716, 'samples': 5242176, 'steps': 27302, 'loss/train': 1.3795442581176758} -08/30/2021 18:03:37 - INFO - __main__ - Step 27304: {'lr': 0.0004647982225551751, 'samples': 5242368, 'steps': 27303, 'loss/train': 1.8644474744796753} -08/30/2021 18:03:39 - INFO - __main__ - Step 27305: {'lr': 0.0004647955073014184, 'samples': 5242560, 'steps': 27304, 'loss/train': 1.4457502365112305} -08/30/2021 18:03:39 - INFO - __main__ - Step 27306: {'lr': 0.00046479279195087804, 'samples': 5242752, 'steps': 27305, 'loss/train': 0.8158540725708008} -08/30/2021 18:03:40 - INFO - __main__ - Step 27307: {'lr': 0.0004647900765035554, 'samples': 5242944, 'steps': 27306, 'loss/train': 1.3061364889144897} -08/30/2021 18:03:40 - INFO - __main__ - Step 27308: {'lr': 0.0004647873609594517, 'samples': 5243136, 'steps': 27307, 'loss/train': 1.8341137170791626} -08/30/2021 18:03:40 - INFO - __main__ - Step 27309: {'lr': 0.0004647846453185681, 'samples': 5243328, 'steps': 27308, 'loss/train': 1.4347705841064453} -08/30/2021 18:03:42 - INFO - __main__ - Step 27310: {'lr': 0.0004647819295809059, 'samples': 5243520, 'steps': 27309, 'loss/train': 1.2835569381713867} -08/30/2021 18:03:43 - INFO - __main__ - Step 27311: {'lr': 0.00046477921374646624, 'samples': 5243712, 'steps': 27310, 'loss/train': 1.5727505683898926} -08/30/2021 18:03:43 - INFO - __main__ - Step 27312: {'lr': 0.0004647764978152503, 'samples': 5243904, 'steps': 27311, 'loss/train': 1.3658605813980103} -08/30/2021 18:03:43 - INFO - __main__ - Step 27313: {'lr': 0.0004647737817872595, 'samples': 5244096, 'steps': 27312, 'loss/train': 0.8591522574424744} -08/30/2021 18:03:44 - INFO - __main__ - Step 27314: {'lr': 0.0004647710656624949, 'samples': 5244288, 'steps': 27313, 'loss/train': 1.8187135457992554} -08/30/2021 18:03:45 - INFO - __main__ - Step 27315: {'lr': 0.0004647683494409578, 'samples': 5244480, 'steps': 27314, 'loss/train': 1.6067172288894653} -08/30/2021 18:03:45 - INFO - __main__ - Step 27316: {'lr': 0.0004647656331226494, 'samples': 5244672, 'steps': 27315, 'loss/train': 1.51498281955719} -08/30/2021 18:03:46 - INFO - __main__ - Step 27317: {'lr': 0.0004647629167075709, 'samples': 5244864, 'steps': 27316, 'loss/train': 1.5694047212600708} -08/30/2021 18:03:46 - INFO - __main__ - Step 27318: {'lr': 0.00046476020019572354, 'samples': 5245056, 'steps': 27317, 'loss/train': 1.5925524234771729} -08/30/2021 18:03:46 - INFO - __main__ - Step 27319: {'lr': 0.00046475748358710856, 'samples': 5245248, 'steps': 27318, 'loss/train': 1.0620713233947754} -08/30/2021 18:03:47 - INFO - __main__ - Step 27320: {'lr': 0.0004647547668817271, 'samples': 5245440, 'steps': 27319, 'loss/train': 1.2808213233947754} -08/30/2021 18:03:49 - INFO - __main__ - Step 27321: {'lr': 0.00046475205007958054, 'samples': 5245632, 'steps': 27320, 'loss/train': 1.625947117805481} -08/30/2021 18:03:49 - INFO - __main__ - Step 27322: {'lr': 0.00046474933318067004, 'samples': 5245824, 'steps': 27321, 'loss/train': 1.7700499296188354} -08/30/2021 18:03:49 - INFO - __main__ - Step 27323: {'lr': 0.0004647466161849968, 'samples': 5246016, 'steps': 27322, 'loss/train': 1.7060738801956177} -08/30/2021 18:03:50 - INFO - __main__ - Step 27324: {'lr': 0.000464743899092562, 'samples': 5246208, 'steps': 27323, 'loss/train': 1.4622997045516968} -08/30/2021 18:03:50 - INFO - __main__ - Step 27325: {'lr': 0.0004647411819033669, 'samples': 5246400, 'steps': 27324, 'loss/train': 0.04158177599310875} -08/30/2021 18:03:50 - INFO - __main__ - Step 27326: {'lr': 0.00046473846461741276, 'samples': 5246592, 'steps': 27325, 'loss/train': 1.4114559888839722} -08/30/2021 18:03:52 - INFO - __main__ - Step 27327: {'lr': 0.0004647357472347008, 'samples': 5246784, 'steps': 27326, 'loss/train': 1.964754343032837} -08/30/2021 18:03:52 - INFO - __main__ - Step 27328: {'lr': 0.00046473302975523224, 'samples': 5246976, 'steps': 27327, 'loss/train': 1.4276273250579834} -08/30/2021 18:03:53 - INFO - __main__ - Step 27329: {'lr': 0.0004647303121790082, 'samples': 5247168, 'steps': 27328, 'loss/train': 1.6231714487075806} -08/30/2021 18:03:53 - INFO - __main__ - Step 27330: {'lr': 0.0004647275945060301, 'samples': 5247360, 'steps': 27329, 'loss/train': 1.151721715927124} -08/30/2021 18:03:53 - INFO - __main__ - Step 27331: {'lr': 0.000464724876736299, 'samples': 5247552, 'steps': 27330, 'loss/train': 2.5251708030700684} -08/30/2021 18:03:55 - INFO - __main__ - Step 27332: {'lr': 0.00046472215886981616, 'samples': 5247744, 'steps': 27331, 'loss/train': 0.6353248953819275} -08/30/2021 18:03:55 - INFO - __main__ - Step 27333: {'lr': 0.00046471944090658294, 'samples': 5247936, 'steps': 27332, 'loss/train': 1.8478977680206299} -08/30/2021 18:03:56 - INFO - __main__ - Step 27334: {'lr': 0.0004647167228466004, 'samples': 5248128, 'steps': 27333, 'loss/train': 0.6284403800964355} -08/30/2021 18:03:56 - INFO - __main__ - Step 27335: {'lr': 0.0004647140046898697, 'samples': 5248320, 'steps': 27334, 'loss/train': 1.6182653903961182} -08/30/2021 18:03:56 - INFO - __main__ - Step 27336: {'lr': 0.0004647112864363923, 'samples': 5248512, 'steps': 27335, 'loss/train': 1.2258281707763672} -08/30/2021 18:03:58 - INFO - __main__ - Step 27337: {'lr': 0.00046470856808616934, 'samples': 5248704, 'steps': 27336, 'loss/train': 1.7995223999023438} -08/30/2021 18:03:58 - INFO - __main__ - Step 27338: {'lr': 0.0004647058496392019, 'samples': 5248896, 'steps': 27337, 'loss/train': 0.9250343441963196} -08/30/2021 18:03:59 - INFO - __main__ - Step 27339: {'lr': 0.0004647031310954914, 'samples': 5249088, 'steps': 27338, 'loss/train': 1.7553257942199707} -08/30/2021 18:03:59 - INFO - __main__ - Step 27340: {'lr': 0.00046470041245503895, 'samples': 5249280, 'steps': 27339, 'loss/train': 1.399047613143921} -08/30/2021 18:03:59 - INFO - __main__ - Step 27341: {'lr': 0.0004646976937178459, 'samples': 5249472, 'steps': 27340, 'loss/train': 2.1510541439056396} -08/30/2021 18:04:01 - INFO - __main__ - Step 27342: {'lr': 0.0004646949748839132, 'samples': 5249664, 'steps': 27341, 'loss/train': 0.9165777564048767} -08/30/2021 18:04:01 - INFO - __main__ - Step 27343: {'lr': 0.0004646922559532424, 'samples': 5249856, 'steps': 27342, 'loss/train': 1.3690391778945923} -08/30/2021 18:04:02 - INFO - __main__ - Step 27344: {'lr': 0.0004646895369258345, 'samples': 5250048, 'steps': 27343, 'loss/train': 0.8818331360816956} -08/30/2021 18:04:02 - INFO - __main__ - Step 27345: {'lr': 0.00046468681780169086, 'samples': 5250240, 'steps': 27344, 'loss/train': 1.3514323234558105} -08/30/2021 18:04:02 - INFO - __main__ - Step 27346: {'lr': 0.0004646840985808126, 'samples': 5250432, 'steps': 27345, 'loss/train': 1.0465266704559326} -08/30/2021 18:04:04 - INFO - __main__ - Step 27347: {'lr': 0.0004646813792632011, 'samples': 5250624, 'steps': 27346, 'loss/train': 1.541799545288086} -08/30/2021 18:04:04 - INFO - __main__ - Step 27348: {'lr': 0.00046467865984885736, 'samples': 5250816, 'steps': 27347, 'loss/train': 1.7342004776000977} -08/30/2021 18:04:05 - INFO - __main__ - Step 27349: {'lr': 0.0004646759403377828, 'samples': 5251008, 'steps': 27348, 'loss/train': 1.3066784143447876} -08/30/2021 18:04:05 - INFO - __main__ - Step 27350: {'lr': 0.00046467322072997865, 'samples': 5251200, 'steps': 27349, 'loss/train': 1.6642979383468628} -08/30/2021 18:04:05 - INFO - __main__ - Step 27351: {'lr': 0.00046467050102544594, 'samples': 5251392, 'steps': 27350, 'loss/train': 1.3448563814163208} -08/30/2021 18:04:06 - INFO - __main__ - Step 27352: {'lr': 0.0004646677812241861, 'samples': 5251584, 'steps': 27351, 'loss/train': 1.191585659980774} -08/30/2021 18:04:07 - INFO - __main__ - Step 27353: {'lr': 0.0004646650613262001, 'samples': 5251776, 'steps': 27352, 'loss/train': 0.6744791865348816} -08/30/2021 18:04:08 - INFO - __main__ - Step 27354: {'lr': 0.00046466234133148957, 'samples': 5251968, 'steps': 27353, 'loss/train': 1.1724281311035156} -08/30/2021 18:04:08 - INFO - __main__ - Step 27355: {'lr': 0.00046465962124005535, 'samples': 5252160, 'steps': 27354, 'loss/train': 1.4432481527328491} -08/30/2021 18:04:08 - INFO - __main__ - Step 27356: {'lr': 0.0004646569010518988, 'samples': 5252352, 'steps': 27355, 'loss/train': 1.5820986032485962} -08/30/2021 18:04:09 - INFO - __main__ - Step 27357: {'lr': 0.00046465418076702125, 'samples': 5252544, 'steps': 27356, 'loss/train': 1.2430405616760254} -08/30/2021 18:04:11 - INFO - __main__ - Step 27358: {'lr': 0.00046465146038542375, 'samples': 5252736, 'steps': 27357, 'loss/train': 1.4338152408599854} -08/30/2021 18:04:11 - INFO - __main__ - Step 27359: {'lr': 0.0004646487399071077, 'samples': 5252928, 'steps': 27358, 'loss/train': 1.0728802680969238} -08/30/2021 18:04:12 - INFO - __main__ - Step 27360: {'lr': 0.00046464601933207417, 'samples': 5253120, 'steps': 27359, 'loss/train': 1.418859839439392} -08/30/2021 18:04:12 - INFO - __main__ - Step 27361: {'lr': 0.0004646432986603245, 'samples': 5253312, 'steps': 27360, 'loss/train': 1.0611650943756104} -08/30/2021 18:04:12 - INFO - __main__ - Step 27362: {'lr': 0.00046464057789185985, 'samples': 5253504, 'steps': 27361, 'loss/train': 0.5609676241874695} -08/30/2021 18:04:15 - INFO - __main__ - Step 27363: {'lr': 0.00046463785702668156, 'samples': 5253696, 'steps': 27362, 'loss/train': 2.100377082824707} -08/30/2021 18:04:15 - INFO - __main__ - Step 27364: {'lr': 0.0004646351360647907, 'samples': 5253888, 'steps': 27363, 'loss/train': 1.3934309482574463} -08/30/2021 18:04:16 - INFO - __main__ - Step 27365: {'lr': 0.00046463241500618846, 'samples': 5254080, 'steps': 27364, 'loss/train': 1.6407395601272583} -08/30/2021 18:04:16 - INFO - __main__ - Step 27366: {'lr': 0.00046462969385087626, 'samples': 5254272, 'steps': 27365, 'loss/train': 1.9130204916000366} -08/30/2021 18:04:16 - INFO - __main__ - Step 27367: {'lr': 0.00046462697259885523, 'samples': 5254464, 'steps': 27366, 'loss/train': 3.333629846572876} -08/30/2021 18:04:17 - INFO - __main__ - Step 27368: {'lr': 0.0004646242512501266, 'samples': 5254656, 'steps': 27367, 'loss/train': 2.2948241233825684} -08/30/2021 18:04:18 - INFO - __main__ - Step 27369: {'lr': 0.0004646215298046916, 'samples': 5254848, 'steps': 27368, 'loss/train': 2.367582082748413} -08/30/2021 18:04:19 - INFO - __main__ - Step 27370: {'lr': 0.00046461880826255143, 'samples': 5255040, 'steps': 27369, 'loss/train': 1.4502631425857544} -08/30/2021 18:04:19 - INFO - __main__ - Step 27371: {'lr': 0.00046461608662370734, 'samples': 5255232, 'steps': 27370, 'loss/train': 1.9257307052612305} -08/30/2021 18:04:19 - INFO - __main__ - Step 27372: {'lr': 0.0004646133648881606, 'samples': 5255424, 'steps': 27371, 'loss/train': 1.5148178339004517} -08/30/2021 18:04:20 - INFO - __main__ - Step 27373: {'lr': 0.00046461064305591235, 'samples': 5255616, 'steps': 27372, 'loss/train': 1.9873127937316895} -08/30/2021 18:04:20 - INFO - __main__ - Step 27374: {'lr': 0.00046460792112696384, 'samples': 5255808, 'steps': 27373, 'loss/train': 0.8149328231811523} -08/30/2021 18:04:21 - INFO - __main__ - Step 27375: {'lr': 0.0004646051991013163, 'samples': 5256000, 'steps': 27374, 'loss/train': 1.8680310249328613} -08/30/2021 18:04:22 - INFO - __main__ - Step 27376: {'lr': 0.000464602476978971, 'samples': 5256192, 'steps': 27375, 'loss/train': 0.9939104318618774} -08/30/2021 18:04:22 - INFO - __main__ - Step 27377: {'lr': 0.00046459975475992914, 'samples': 5256384, 'steps': 27376, 'loss/train': 1.577289342880249} -08/30/2021 18:04:23 - INFO - __main__ - Step 27378: {'lr': 0.00046459703244419194, 'samples': 5256576, 'steps': 27377, 'loss/train': 1.6684318780899048} -08/30/2021 18:04:23 - INFO - __main__ - Step 27379: {'lr': 0.0004645943100317606, 'samples': 5256768, 'steps': 27378, 'loss/train': 1.620996356010437} -08/30/2021 18:04:25 - INFO - __main__ - Step 27380: {'lr': 0.00046459158752263643, 'samples': 5256960, 'steps': 27379, 'loss/train': 1.4244303703308105} -08/30/2021 18:04:25 - INFO - __main__ - Step 27381: {'lr': 0.0004645888649168205, 'samples': 5257152, 'steps': 27380, 'loss/train': 1.8420264720916748} -08/30/2021 18:04:25 - INFO - __main__ - Step 27382: {'lr': 0.0004645861422143143, 'samples': 5257344, 'steps': 27381, 'loss/train': 1.68105149269104} -08/30/2021 18:04:26 - INFO - __main__ - Step 27383: {'lr': 0.0004645834194151187, 'samples': 5257536, 'steps': 27382, 'loss/train': 1.6556614637374878} -08/30/2021 18:04:26 - INFO - __main__ - Step 27384: {'lr': 0.0004645806965192353, 'samples': 5257728, 'steps': 27383, 'loss/train': 1.6255290508270264} -08/30/2021 18:04:28 - INFO - __main__ - Step 27385: {'lr': 0.000464577973526665, 'samples': 5257920, 'steps': 27384, 'loss/train': 1.6095224618911743} -08/30/2021 18:04:28 - INFO - __main__ - Step 27386: {'lr': 0.00046457525043740926, 'samples': 5258112, 'steps': 27385, 'loss/train': 1.5118950605392456} -08/30/2021 18:04:29 - INFO - __main__ - Step 27387: {'lr': 0.0004645725272514693, 'samples': 5258304, 'steps': 27386, 'loss/train': 1.5710792541503906} -08/30/2021 18:04:29 - INFO - __main__ - Step 27388: {'lr': 0.0004645698039688461, 'samples': 5258496, 'steps': 27387, 'loss/train': 1.990828514099121} -08/30/2021 18:04:29 - INFO - __main__ - Step 27389: {'lr': 0.00046456708058954116, 'samples': 5258688, 'steps': 27388, 'loss/train': 1.6931428909301758} -08/30/2021 18:04:31 - INFO - __main__ - Step 27390: {'lr': 0.0004645643571135556, 'samples': 5258880, 'steps': 27389, 'loss/train': 1.568619966506958} -08/30/2021 18:04:31 - INFO - __main__ - Step 27391: {'lr': 0.00046456163354089065, 'samples': 5259072, 'steps': 27390, 'loss/train': 1.7756857872009277} -08/30/2021 18:04:31 - INFO - __main__ - Step 27392: {'lr': 0.00046455890987154747, 'samples': 5259264, 'steps': 27391, 'loss/train': 2.837989330291748} -08/30/2021 18:04:32 - INFO - __main__ - Step 27393: {'lr': 0.0004645561861055274, 'samples': 5259456, 'steps': 27392, 'loss/train': 1.8848211765289307} -08/30/2021 18:04:32 - INFO - __main__ - Step 27394: {'lr': 0.00046455346224283167, 'samples': 5259648, 'steps': 27393, 'loss/train': 0.8997451663017273} -08/30/2021 18:04:34 - INFO - __main__ - Step 27395: {'lr': 0.00046455073828346137, 'samples': 5259840, 'steps': 27394, 'loss/train': 1.7699164152145386} -08/30/2021 18:04:34 - INFO - __main__ - Step 27396: {'lr': 0.0004645480142274179, 'samples': 5260032, 'steps': 27395, 'loss/train': 1.2306593656539917} -08/30/2021 18:04:34 - INFO - __main__ - Step 27397: {'lr': 0.0004645452900747024, 'samples': 5260224, 'steps': 27396, 'loss/train': 1.6315412521362305} -08/30/2021 18:04:35 - INFO - __main__ - Step 27398: {'lr': 0.00046454256582531604, 'samples': 5260416, 'steps': 27397, 'loss/train': 2.2044410705566406} -08/30/2021 18:04:35 - INFO - __main__ - Step 27399: {'lr': 0.0004645398414792602, 'samples': 5260608, 'steps': 27398, 'loss/train': 0.7364284992218018} -08/30/2021 18:04:37 - INFO - __main__ - Step 27400: {'lr': 0.000464537117036536, 'samples': 5260800, 'steps': 27399, 'loss/train': 1.4160264730453491} -08/30/2021 18:04:37 - INFO - __main__ - Step 27401: {'lr': 0.00046453439249714466, 'samples': 5260992, 'steps': 27400, 'loss/train': 2.031721830368042} -08/30/2021 18:04:37 - INFO - __main__ - Step 27402: {'lr': 0.00046453166786108736, 'samples': 5261184, 'steps': 27401, 'loss/train': 1.9949887990951538} -08/30/2021 18:04:38 - INFO - __main__ - Step 27403: {'lr': 0.00046452894312836547, 'samples': 5261376, 'steps': 27402, 'loss/train': 1.9851300716400146} -08/30/2021 18:04:38 - INFO - __main__ - Step 27404: {'lr': 0.0004645262182989802, 'samples': 5261568, 'steps': 27403, 'loss/train': 1.0105459690093994} -08/30/2021 18:04:40 - INFO - __main__ - Step 27405: {'lr': 0.0004645234933729327, 'samples': 5261760, 'steps': 27404, 'loss/train': 0.06788698583841324} -08/30/2021 18:04:40 - INFO - __main__ - Step 27406: {'lr': 0.00046452076835022416, 'samples': 5261952, 'steps': 27405, 'loss/train': 1.4818108081817627} -08/30/2021 18:04:41 - INFO - __main__ - Step 27407: {'lr': 0.0004645180432308559, 'samples': 5262144, 'steps': 27406, 'loss/train': 1.0781244039535522} -08/30/2021 18:04:41 - INFO - __main__ - Step 27408: {'lr': 0.00046451531801482913, 'samples': 5262336, 'steps': 27407, 'loss/train': 1.3619756698608398} -08/30/2021 18:04:41 - INFO - __main__ - Step 27409: {'lr': 0.00046451259270214505, 'samples': 5262528, 'steps': 27408, 'loss/train': 1.224409580230713} -08/30/2021 18:04:42 - INFO - __main__ - Step 27410: {'lr': 0.00046450986729280495, 'samples': 5262720, 'steps': 27409, 'loss/train': 1.8427653312683105} -08/30/2021 18:04:43 - INFO - __main__ - Step 27411: {'lr': 0.00046450714178680996, 'samples': 5262912, 'steps': 27410, 'loss/train': 1.615390658378601} -08/30/2021 18:04:44 - INFO - __main__ - Step 27412: {'lr': 0.0004645044161841614, 'samples': 5263104, 'steps': 27411, 'loss/train': 1.1181161403656006} -08/30/2021 18:04:44 - INFO - __main__ - Step 27413: {'lr': 0.00046450169048486045, 'samples': 5263296, 'steps': 27412, 'loss/train': 1.1217595338821411} -08/30/2021 18:04:44 - INFO - __main__ - Step 27414: {'lr': 0.0004644989646889084, 'samples': 5263488, 'steps': 27413, 'loss/train': 1.69459068775177} -08/30/2021 18:04:45 - INFO - __main__ - Step 27415: {'lr': 0.0004644962387963063, 'samples': 5263680, 'steps': 27414, 'loss/train': 1.5929012298583984} -08/30/2021 18:04:47 - INFO - __main__ - Step 27416: {'lr': 0.0004644935128070556, 'samples': 5263872, 'steps': 27415, 'loss/train': 1.9933714866638184} -08/30/2021 18:04:47 - INFO - __main__ - Step 27417: {'lr': 0.0004644907867211574, 'samples': 5264064, 'steps': 27416, 'loss/train': 1.4617135524749756} -08/30/2021 18:04:47 - INFO - __main__ - Step 27418: {'lr': 0.000464488060538613, 'samples': 5264256, 'steps': 27417, 'loss/train': 1.5432010889053345} -08/30/2021 18:04:48 - INFO - __main__ - Step 27419: {'lr': 0.0004644853342594235, 'samples': 5264448, 'steps': 27418, 'loss/train': 1.5122867822647095} -08/30/2021 18:04:48 - INFO - __main__ - Step 27420: {'lr': 0.0004644826078835903, 'samples': 5264640, 'steps': 27419, 'loss/train': 1.713381290435791} -08/30/2021 18:04:50 - INFO - __main__ - Step 27421: {'lr': 0.00046447988141111457, 'samples': 5264832, 'steps': 27420, 'loss/train': 1.7288973331451416} -08/30/2021 18:04:50 - INFO - __main__ - Step 27422: {'lr': 0.0004644771548419975, 'samples': 5265024, 'steps': 27421, 'loss/train': 1.3567960262298584} -08/30/2021 18:04:51 - INFO - __main__ - Step 27423: {'lr': 0.0004644744281762403, 'samples': 5265216, 'steps': 27422, 'loss/train': 2.2251620292663574} -08/30/2021 18:04:51 - INFO - __main__ - Step 27424: {'lr': 0.0004644717014138442, 'samples': 5265408, 'steps': 27423, 'loss/train': 1.5661921501159668} -08/30/2021 18:04:51 - INFO - __main__ - Step 27425: {'lr': 0.0004644689745548105, 'samples': 5265600, 'steps': 27424, 'loss/train': 0.5250753164291382} -08/30/2021 18:04:53 - INFO - __main__ - Step 27426: {'lr': 0.00046446624759914043, 'samples': 5265792, 'steps': 27425, 'loss/train': 1.2815206050872803} -08/30/2021 18:04:53 - INFO - __main__ - Step 27427: {'lr': 0.0004644635205468351, 'samples': 5265984, 'steps': 27426, 'loss/train': 1.7290304899215698} -08/30/2021 18:04:54 - INFO - __main__ - Step 27428: {'lr': 0.00046446079339789587, 'samples': 5266176, 'steps': 27427, 'loss/train': 1.6286661624908447} -08/30/2021 18:04:54 - INFO - __main__ - Step 27429: {'lr': 0.0004644580661523239, 'samples': 5266368, 'steps': 27428, 'loss/train': 1.294432520866394} -08/30/2021 18:04:54 - INFO - __main__ - Step 27430: {'lr': 0.00046445533881012043, 'samples': 5266560, 'steps': 27429, 'loss/train': 1.2775497436523438} -08/30/2021 18:04:56 - INFO - __main__ - Step 27431: {'lr': 0.0004644526113712867, 'samples': 5266752, 'steps': 27430, 'loss/train': 1.9153541326522827} -08/30/2021 18:04:57 - INFO - __main__ - Step 27432: {'lr': 0.00046444988383582394, 'samples': 5266944, 'steps': 27431, 'loss/train': 1.5451918840408325} -08/30/2021 18:04:57 - INFO - __main__ - Step 27433: {'lr': 0.0004644471562037333, 'samples': 5267136, 'steps': 27432, 'loss/train': 0.24773718416690826} -08/30/2021 18:04:57 - INFO - __main__ - Step 27434: {'lr': 0.0004644444284750162, 'samples': 5267328, 'steps': 27433, 'loss/train': 1.4150580167770386} -08/30/2021 18:04:58 - INFO - __main__ - Step 27435: {'lr': 0.0004644417006496737, 'samples': 5267520, 'steps': 27434, 'loss/train': 1.601648211479187} -08/30/2021 18:04:59 - INFO - __main__ - Step 27436: {'lr': 0.0004644389727277071, 'samples': 5267712, 'steps': 27435, 'loss/train': 1.2211816310882568} -08/30/2021 18:05:00 - INFO - __main__ - Step 27437: {'lr': 0.00046443624470911754, 'samples': 5267904, 'steps': 27436, 'loss/train': 1.636705994606018} -08/30/2021 18:05:00 - INFO - __main__ - Step 27438: {'lr': 0.00046443351659390637, 'samples': 5268096, 'steps': 27437, 'loss/train': 1.3936412334442139} -08/30/2021 18:05:01 - INFO - __main__ - Step 27439: {'lr': 0.00046443078838207474, 'samples': 5268288, 'steps': 27438, 'loss/train': 1.8843578100204468} -08/30/2021 18:05:01 - INFO - __main__ - Step 27440: {'lr': 0.00046442806007362394, 'samples': 5268480, 'steps': 27439, 'loss/train': 1.2439494132995605} -08/30/2021 18:05:01 - INFO - __main__ - Step 27441: {'lr': 0.00046442533166855517, 'samples': 5268672, 'steps': 27440, 'loss/train': 0.8290183544158936} -08/30/2021 18:05:03 - INFO - __main__ - Step 27442: {'lr': 0.00046442260316686957, 'samples': 5268864, 'steps': 27441, 'loss/train': 1.4382227659225464} -08/30/2021 18:05:03 - INFO - __main__ - Step 27443: {'lr': 0.0004644198745685685, 'samples': 5269056, 'steps': 27442, 'loss/train': 1.6046395301818848} -08/30/2021 18:05:04 - INFO - __main__ - Step 27444: {'lr': 0.00046441714587365317, 'samples': 5269248, 'steps': 27443, 'loss/train': 2.005960464477539} -08/30/2021 18:05:04 - INFO - __main__ - Step 27445: {'lr': 0.00046441441708212477, 'samples': 5269440, 'steps': 27444, 'loss/train': 2.0347695350646973} -08/30/2021 18:05:04 - INFO - __main__ - Step 27446: {'lr': 0.00046441168819398457, 'samples': 5269632, 'steps': 27445, 'loss/train': 1.2989490032196045} -08/30/2021 18:05:06 - INFO - __main__ - Step 27447: {'lr': 0.0004644089592092338, 'samples': 5269824, 'steps': 27446, 'loss/train': 1.4103548526763916} -08/30/2021 18:05:07 - INFO - __main__ - Step 27448: {'lr': 0.0004644062301278735, 'samples': 5270016, 'steps': 27447, 'loss/train': 1.3690731525421143} -08/30/2021 18:05:07 - INFO - __main__ - Step 27449: {'lr': 0.0004644035009499052, 'samples': 5270208, 'steps': 27448, 'loss/train': 1.497934103012085} -08/30/2021 18:05:07 - INFO - __main__ - Step 27450: {'lr': 0.0004644007716753299, 'samples': 5270400, 'steps': 27449, 'loss/train': 1.3804068565368652} -08/30/2021 18:05:08 - INFO - __main__ - Step 27451: {'lr': 0.00046439804230414904, 'samples': 5270592, 'steps': 27450, 'loss/train': 1.993382215499878} -08/30/2021 18:05:09 - INFO - __main__ - Step 27452: {'lr': 0.0004643953128363637, 'samples': 5270784, 'steps': 27451, 'loss/train': 0.4664199650287628} -08/30/2021 18:05:10 - INFO - __main__ - Step 27453: {'lr': 0.0004643925832719751, 'samples': 5270976, 'steps': 27452, 'loss/train': 1.0037028789520264} -08/30/2021 18:05:10 - INFO - __main__ - Step 27454: {'lr': 0.0004643898536109845, 'samples': 5271168, 'steps': 27453, 'loss/train': 1.2655574083328247} -08/30/2021 18:05:10 - INFO - __main__ - Step 27455: {'lr': 0.0004643871238533931, 'samples': 5271360, 'steps': 27454, 'loss/train': 1.277710199356079} -08/30/2021 18:05:11 - INFO - __main__ - Step 27456: {'lr': 0.0004643843939992022, 'samples': 5271552, 'steps': 27455, 'loss/train': 1.315433144569397} -08/30/2021 18:05:11 - INFO - __main__ - Step 27457: {'lr': 0.0004643816640484131, 'samples': 5271744, 'steps': 27456, 'loss/train': 1.73223876953125} -08/30/2021 18:05:13 - INFO - __main__ - Step 27458: {'lr': 0.0004643789340010268, 'samples': 5271936, 'steps': 27457, 'loss/train': 1.7017115354537964} -08/30/2021 18:05:13 - INFO - __main__ - Step 27459: {'lr': 0.00046437620385704476, 'samples': 5272128, 'steps': 27458, 'loss/train': 1.2132965326309204} -08/30/2021 18:05:13 - INFO - __main__ - Step 27460: {'lr': 0.0004643734736164681, 'samples': 5272320, 'steps': 27459, 'loss/train': 1.5949082374572754} -08/30/2021 18:05:14 - INFO - __main__ - Step 27461: {'lr': 0.00046437074327929795, 'samples': 5272512, 'steps': 27460, 'loss/train': 1.6055718660354614} -08/30/2021 18:05:14 - INFO - __main__ - Step 27462: {'lr': 0.0004643680128455358, 'samples': 5272704, 'steps': 27461, 'loss/train': 1.2206093072891235} -08/30/2021 18:05:15 - INFO - __main__ - Step 27463: {'lr': 0.00046436528231518263, 'samples': 5272896, 'steps': 27462, 'loss/train': 1.6541802883148193} -08/30/2021 18:05:16 - INFO - __main__ - Step 27464: {'lr': 0.0004643625516882398, 'samples': 5273088, 'steps': 27463, 'loss/train': 0.5171638131141663} -08/30/2021 18:05:16 - INFO - __main__ - Step 27465: {'lr': 0.0004643598209647085, 'samples': 5273280, 'steps': 27464, 'loss/train': 1.495107650756836} -08/30/2021 18:05:17 - INFO - __main__ - Step 27466: {'lr': 0.00046435709014459, 'samples': 5273472, 'steps': 27465, 'loss/train': 0.47101113200187683} -08/30/2021 18:05:17 - INFO - __main__ - Step 27467: {'lr': 0.0004643543592278855, 'samples': 5273664, 'steps': 27466, 'loss/train': 1.4665911197662354} -08/30/2021 18:05:19 - INFO - __main__ - Step 27468: {'lr': 0.0004643516282145962, 'samples': 5273856, 'steps': 27467, 'loss/train': 1.4858365058898926} -08/30/2021 18:05:20 - INFO - __main__ - Step 27469: {'lr': 0.0004643488971047234, 'samples': 5274048, 'steps': 27468, 'loss/train': 1.8858387470245361} -08/30/2021 18:05:20 - INFO - __main__ - Step 27470: {'lr': 0.0004643461658982683, 'samples': 5274240, 'steps': 27469, 'loss/train': 1.5373194217681885} -08/30/2021 18:05:20 - INFO - __main__ - Step 27471: {'lr': 0.00046434343459523207, 'samples': 5274432, 'steps': 27470, 'loss/train': 1.1708983182907104} -08/30/2021 18:05:21 - INFO - __main__ - Step 27472: {'lr': 0.00046434070319561604, 'samples': 5274624, 'steps': 27471, 'loss/train': 2.240302324295044} -08/30/2021 18:05:21 - INFO - __main__ - Step 27473: {'lr': 0.0004643379716994214, 'samples': 5274816, 'steps': 27472, 'loss/train': 1.2890220880508423} -08/30/2021 18:05:23 - INFO - __main__ - Step 27474: {'lr': 0.0004643352401066494, 'samples': 5275008, 'steps': 27473, 'loss/train': 1.1141462326049805} -08/30/2021 18:05:23 - INFO - __main__ - Step 27475: {'lr': 0.00046433250841730123, 'samples': 5275200, 'steps': 27474, 'loss/train': 1.5007108449935913} -08/30/2021 18:05:23 - INFO - __main__ - Step 27476: {'lr': 0.0004643297766313781, 'samples': 5275392, 'steps': 27475, 'loss/train': 0.09506670385599136} -08/30/2021 18:05:24 - INFO - __main__ - Step 27477: {'lr': 0.0004643270447488813, 'samples': 5275584, 'steps': 27476, 'loss/train': 1.9615954160690308} -08/30/2021 18:05:24 - INFO - __main__ - Step 27478: {'lr': 0.000464324312769812, 'samples': 5275776, 'steps': 27477, 'loss/train': 0.7599114179611206} -08/30/2021 18:05:25 - INFO - __main__ - Step 27479: {'lr': 0.0004643215806941716, 'samples': 5275968, 'steps': 27478, 'loss/train': 1.615844488143921} -08/30/2021 18:05:26 - INFO - __main__ - Step 27480: {'lr': 0.00046431884852196105, 'samples': 5276160, 'steps': 27479, 'loss/train': 1.6542208194732666} -08/30/2021 18:05:26 - INFO - __main__ - Step 27481: {'lr': 0.0004643161162531818, 'samples': 5276352, 'steps': 27480, 'loss/train': 0.086514413356781} -08/30/2021 18:05:27 - INFO - __main__ - Step 27482: {'lr': 0.00046431338388783504, 'samples': 5276544, 'steps': 27481, 'loss/train': 1.6083823442459106} -08/30/2021 18:05:27 - INFO - __main__ - Step 27483: {'lr': 0.000464310651425922, 'samples': 5276736, 'steps': 27482, 'loss/train': 1.7101365327835083} -08/30/2021 18:05:28 - INFO - __main__ - Step 27484: {'lr': 0.00046430791886744384, 'samples': 5276928, 'steps': 27483, 'loss/train': 1.96410071849823} -08/30/2021 18:05:29 - INFO - __main__ - Step 27485: {'lr': 0.0004643051862124018, 'samples': 5277120, 'steps': 27484, 'loss/train': 1.3670763969421387} -08/30/2021 18:05:29 - INFO - __main__ - Step 27486: {'lr': 0.0004643024534607973, 'samples': 5277312, 'steps': 27485, 'loss/train': 1.7785871028900146} -08/30/2021 18:05:30 - INFO - __main__ - Step 27487: {'lr': 0.00046429972061263125, 'samples': 5277504, 'steps': 27486, 'loss/train': 1.5298993587493896} -08/30/2021 18:05:30 - INFO - __main__ - Step 27488: {'lr': 0.0004642969876679051, 'samples': 5277696, 'steps': 27487, 'loss/train': 1.6133230924606323} -08/30/2021 18:05:32 - INFO - __main__ - Step 27489: {'lr': 0.00046429425462662, 'samples': 5277888, 'steps': 27488, 'loss/train': 1.0676636695861816} -08/30/2021 18:05:32 - INFO - __main__ - Step 27490: {'lr': 0.00046429152148877727, 'samples': 5278080, 'steps': 27489, 'loss/train': 0.8648391962051392} -08/30/2021 18:05:32 - INFO - __main__ - Step 27491: {'lr': 0.00046428878825437815, 'samples': 5278272, 'steps': 27490, 'loss/train': 1.1295976638793945} -08/30/2021 18:05:33 - INFO - __main__ - Step 27492: {'lr': 0.00046428605492342367, 'samples': 5278464, 'steps': 27491, 'loss/train': 1.5803020000457764} -08/30/2021 18:05:33 - INFO - __main__ - Step 27493: {'lr': 0.00046428332149591535, 'samples': 5278656, 'steps': 27492, 'loss/train': 1.3380845785140991} -08/30/2021 18:05:35 - INFO - __main__ - Step 27494: {'lr': 0.0004642805879718541, 'samples': 5278848, 'steps': 27493, 'loss/train': 0.903255820274353} -08/30/2021 18:05:35 - INFO - __main__ - Step 27495: {'lr': 0.00046427785435124147, 'samples': 5279040, 'steps': 27494, 'loss/train': 1.5985044240951538} -08/30/2021 18:05:35 - INFO - __main__ - Step 27496: {'lr': 0.0004642751206340785, 'samples': 5279232, 'steps': 27495, 'loss/train': 1.9975924491882324} -08/30/2021 18:05:36 - INFO - __main__ - Step 27497: {'lr': 0.00046427238682036643, 'samples': 5279424, 'steps': 27496, 'loss/train': 1.249411940574646} -08/30/2021 18:05:36 - INFO - __main__ - Step 27498: {'lr': 0.0004642696529101066, 'samples': 5279616, 'steps': 27497, 'loss/train': 2.1159005165100098} -08/30/2021 18:05:38 - INFO - __main__ - Step 27499: {'lr': 0.0004642669189033001, 'samples': 5279808, 'steps': 27498, 'loss/train': 1.5861256122589111} -08/30/2021 18:05:38 - INFO - __main__ - Step 27500: {'lr': 0.0004642641847999483, 'samples': 5280000, 'steps': 27499, 'loss/train': 1.195245623588562} -08/30/2021 18:05:39 - INFO - __main__ - Step 27501: {'lr': 0.0004642614506000523, 'samples': 5280192, 'steps': 27500, 'loss/train': 1.4239248037338257} -08/30/2021 18:05:39 - INFO - __main__ - Step 27502: {'lr': 0.00046425871630361343, 'samples': 5280384, 'steps': 27501, 'loss/train': 0.8084686398506165} -08/30/2021 18:05:39 - INFO - __main__ - Step 27503: {'lr': 0.0004642559819106329, 'samples': 5280576, 'steps': 27502, 'loss/train': 0.9394906759262085} -08/30/2021 18:05:41 - INFO - __main__ - Step 27504: {'lr': 0.0004642532474211119, 'samples': 5280768, 'steps': 27503, 'loss/train': 0.7073948979377747} -08/30/2021 18:05:41 - INFO - __main__ - Step 27505: {'lr': 0.0004642505128350517, 'samples': 5280960, 'steps': 27504, 'loss/train': 1.5602253675460815} -08/30/2021 18:05:42 - INFO - __main__ - Step 27506: {'lr': 0.00046424777815245354, 'samples': 5281152, 'steps': 27505, 'loss/train': 1.404266595840454} -08/30/2021 18:05:42 - INFO - __main__ - Step 27507: {'lr': 0.0004642450433733186, 'samples': 5281344, 'steps': 27506, 'loss/train': 1.1671524047851562} -08/30/2021 18:05:42 - INFO - __main__ - Step 27508: {'lr': 0.0004642423084976482, 'samples': 5281536, 'steps': 27507, 'loss/train': 1.3224974870681763} -08/30/2021 18:05:43 - INFO - __main__ - Step 27509: {'lr': 0.0004642395735254435, 'samples': 5281728, 'steps': 27508, 'loss/train': 1.2267792224884033} -08/30/2021 18:05:44 - INFO - __main__ - Step 27510: {'lr': 0.0004642368384567058, 'samples': 5281920, 'steps': 27509, 'loss/train': 1.0123409032821655} -08/30/2021 18:05:45 - INFO - __main__ - Step 27511: {'lr': 0.0004642341032914362, 'samples': 5282112, 'steps': 27510, 'loss/train': 1.685687780380249} -08/30/2021 18:05:45 - INFO - __main__ - Step 27512: {'lr': 0.00046423136802963607, 'samples': 5282304, 'steps': 27511, 'loss/train': 1.1748380661010742} -08/30/2021 18:05:45 - INFO - __main__ - Step 27513: {'lr': 0.0004642286326713065, 'samples': 5282496, 'steps': 27512, 'loss/train': 0.4168582260608673} -08/30/2021 18:05:46 - INFO - __main__ - Step 27514: {'lr': 0.000464225897216449, 'samples': 5282688, 'steps': 27513, 'loss/train': 1.7291203737258911} -08/30/2021 18:05:47 - INFO - __main__ - Step 27515: {'lr': 0.0004642231616650645, 'samples': 5282880, 'steps': 27514, 'loss/train': 1.0879120826721191} -08/30/2021 18:05:48 - INFO - __main__ - Step 27516: {'lr': 0.00046422042601715433, 'samples': 5283072, 'steps': 27515, 'loss/train': 1.5452195405960083} -08/30/2021 18:05:48 - INFO - __main__ - Step 27517: {'lr': 0.00046421769027271974, 'samples': 5283264, 'steps': 27516, 'loss/train': 1.001875638961792} -08/30/2021 18:05:48 - INFO - __main__ - Step 27518: {'lr': 0.00046421495443176204, 'samples': 5283456, 'steps': 27517, 'loss/train': 1.0665472745895386} -08/30/2021 18:05:49 - INFO - __main__ - Step 27519: {'lr': 0.0004642122184942824, 'samples': 5283648, 'steps': 27518, 'loss/train': 1.7137739658355713} -08/30/2021 18:05:49 - INFO - __main__ - Step 27520: {'lr': 0.00046420948246028194, 'samples': 5283840, 'steps': 27519, 'loss/train': 1.6226041316986084} -08/30/2021 18:05:51 - INFO - __main__ - Step 27521: {'lr': 0.000464206746329762, 'samples': 5284032, 'steps': 27520, 'loss/train': 0.6680510640144348} -08/30/2021 18:05:52 - INFO - __main__ - Step 27522: {'lr': 0.00046420401010272385, 'samples': 5284224, 'steps': 27521, 'loss/train': 0.7357050776481628} -08/30/2021 18:05:52 - INFO - __main__ - Step 27523: {'lr': 0.00046420127377916863, 'samples': 5284416, 'steps': 27522, 'loss/train': 1.5431907176971436} -08/30/2021 18:05:53 - INFO - __main__ - Step 27524: {'lr': 0.0004641985373590977, 'samples': 5284608, 'steps': 27523, 'loss/train': 1.854203224182129} -08/30/2021 18:05:53 - INFO - __main__ - Step 27525: {'lr': 0.00046419580084251224, 'samples': 5284800, 'steps': 27524, 'loss/train': 1.321053147315979} -08/30/2021 18:05:55 - INFO - __main__ - Step 27526: {'lr': 0.0004641930642294133, 'samples': 5284992, 'steps': 27525, 'loss/train': 1.2070436477661133} -08/30/2021 18:05:55 - INFO - __main__ - Step 27527: {'lr': 0.0004641903275198024, 'samples': 5285184, 'steps': 27526, 'loss/train': 1.359650731086731} -08/30/2021 18:05:56 - INFO - __main__ - Step 27528: {'lr': 0.0004641875907136806, 'samples': 5285376, 'steps': 27527, 'loss/train': 2.0673930644989014} -08/30/2021 18:05:56 - INFO - __main__ - Step 27529: {'lr': 0.0004641848538110492, 'samples': 5285568, 'steps': 27528, 'loss/train': 1.2977995872497559} -08/30/2021 18:05:56 - INFO - __main__ - Step 27530: {'lr': 0.00046418211681190937, 'samples': 5285760, 'steps': 27529, 'loss/train': 0.6407142877578735} -08/30/2021 18:05:57 - INFO - __main__ - Step 27531: {'lr': 0.00046417937971626245, 'samples': 5285952, 'steps': 27530, 'loss/train': 1.3707348108291626} -08/30/2021 18:05:59 - INFO - __main__ - Step 27532: {'lr': 0.0004641766425241095, 'samples': 5286144, 'steps': 27531, 'loss/train': 1.8964557647705078} -08/30/2021 18:05:59 - INFO - __main__ - Step 27533: {'lr': 0.000464173905235452, 'samples': 5286336, 'steps': 27532, 'loss/train': 1.7082087993621826} -08/30/2021 18:06:00 - INFO - __main__ - Step 27534: {'lr': 0.0004641711678502909, 'samples': 5286528, 'steps': 27533, 'loss/train': 0.717869758605957} -08/30/2021 18:06:00 - INFO - __main__ - Step 27535: {'lr': 0.00046416843036862766, 'samples': 5286720, 'steps': 27534, 'loss/train': 1.10735023021698} -08/30/2021 18:06:00 - INFO - __main__ - Step 27536: {'lr': 0.0004641656927904634, 'samples': 5286912, 'steps': 27535, 'loss/train': 1.5429867506027222} -08/30/2021 18:06:01 - INFO - __main__ - Step 27537: {'lr': 0.00046416295511579944, 'samples': 5287104, 'steps': 27536, 'loss/train': 1.511547565460205} -08/30/2021 18:06:02 - INFO - __main__ - Step 27538: {'lr': 0.0004641602173446369, 'samples': 5287296, 'steps': 27537, 'loss/train': 1.8700331449508667} -08/30/2021 18:06:03 - INFO - __main__ - Step 27539: {'lr': 0.00046415747947697704, 'samples': 5287488, 'steps': 27538, 'loss/train': 1.083155870437622} -08/30/2021 18:06:03 - INFO - __main__ - Step 27540: {'lr': 0.00046415474151282124, 'samples': 5287680, 'steps': 27539, 'loss/train': 1.6107252836227417} -08/30/2021 18:06:04 - INFO - __main__ - Step 27541: {'lr': 0.0004641520034521705, 'samples': 5287872, 'steps': 27540, 'loss/train': 1.9646943807601929} -08/30/2021 18:06:04 - INFO - __main__ - Step 27542: {'lr': 0.0004641492652950262, 'samples': 5288064, 'steps': 27541, 'loss/train': 1.8504058122634888} -08/30/2021 18:06:06 - INFO - __main__ - Step 27543: {'lr': 0.0004641465270413896, 'samples': 5288256, 'steps': 27542, 'loss/train': 1.7035349607467651} -08/30/2021 18:06:06 - INFO - __main__ - Step 27544: {'lr': 0.00046414378869126185, 'samples': 5288448, 'steps': 27543, 'loss/train': 1.5890493392944336} -08/30/2021 18:06:06 - INFO - __main__ - Step 27545: {'lr': 0.0004641410502446442, 'samples': 5288640, 'steps': 27544, 'loss/train': 1.467052698135376} -08/30/2021 18:06:07 - INFO - __main__ - Step 27546: {'lr': 0.00046413831170153785, 'samples': 5288832, 'steps': 27545, 'loss/train': 1.6460683345794678} -08/30/2021 18:06:07 - INFO - __main__ - Step 27547: {'lr': 0.0004641355730619442, 'samples': 5289024, 'steps': 27546, 'loss/train': 1.3892771005630493} -08/30/2021 18:06:08 - INFO - __main__ - Step 27548: {'lr': 0.0004641328343258643, 'samples': 5289216, 'steps': 27547, 'loss/train': 1.299553632736206} -08/30/2021 18:06:09 - INFO - __main__ - Step 27549: {'lr': 0.00046413009549329946, 'samples': 5289408, 'steps': 27548, 'loss/train': 1.835012435913086} -08/30/2021 18:06:09 - INFO - __main__ - Step 27550: {'lr': 0.0004641273565642509, 'samples': 5289600, 'steps': 27549, 'loss/train': 1.6101205348968506} -08/30/2021 18:06:10 - INFO - __main__ - Step 27551: {'lr': 0.0004641246175387198, 'samples': 5289792, 'steps': 27550, 'loss/train': 1.294134497642517} -08/30/2021 18:06:10 - INFO - __main__ - Step 27552: {'lr': 0.0004641218784167075, 'samples': 5289984, 'steps': 27551, 'loss/train': 1.0548399686813354} -08/30/2021 18:06:11 - INFO - __main__ - Step 27553: {'lr': 0.0004641191391982152, 'samples': 5290176, 'steps': 27552, 'loss/train': 0.045883212238550186} -08/30/2021 18:06:12 - INFO - __main__ - Step 27554: {'lr': 0.00046411639988324407, 'samples': 5290368, 'steps': 27553, 'loss/train': 1.2484043836593628} -08/30/2021 18:06:12 - INFO - __main__ - Step 27555: {'lr': 0.00046411366047179547, 'samples': 5290560, 'steps': 27554, 'loss/train': 1.6914410591125488} -08/30/2021 18:06:13 - INFO - __main__ - Step 27556: {'lr': 0.00046411092096387054, 'samples': 5290752, 'steps': 27555, 'loss/train': 1.036177396774292} -08/30/2021 18:06:13 - INFO - __main__ - Step 27557: {'lr': 0.0004641081813594705, 'samples': 5290944, 'steps': 27556, 'loss/train': 1.6183223724365234} -08/30/2021 18:06:14 - INFO - __main__ - Step 27558: {'lr': 0.0004641054416585966, 'samples': 5291136, 'steps': 27557, 'loss/train': 1.4377225637435913} -08/30/2021 18:06:15 - INFO - __main__ - Step 27559: {'lr': 0.00046410270186125014, 'samples': 5291328, 'steps': 27558, 'loss/train': 1.66042959690094} -08/30/2021 18:06:15 - INFO - __main__ - Step 27560: {'lr': 0.0004640999619674323, 'samples': 5291520, 'steps': 27559, 'loss/train': 1.374444603919983} -08/30/2021 18:06:16 - INFO - __main__ - Step 27561: {'lr': 0.0004640972219771443, 'samples': 5291712, 'steps': 27560, 'loss/train': 1.6468956470489502} -08/30/2021 18:06:16 - INFO - __main__ - Step 27562: {'lr': 0.00046409448189038737, 'samples': 5291904, 'steps': 27561, 'loss/train': 0.9795956611633301} -08/30/2021 18:06:16 - INFO - __main__ - Step 27563: {'lr': 0.00046409174170716284, 'samples': 5292096, 'steps': 27562, 'loss/train': 1.2625643014907837} -08/30/2021 18:06:18 - INFO - __main__ - Step 27564: {'lr': 0.0004640890014274718, 'samples': 5292288, 'steps': 27563, 'loss/train': 1.4325306415557861} -08/30/2021 18:06:18 - INFO - __main__ - Step 27565: {'lr': 0.0004640862610513156, 'samples': 5292480, 'steps': 27564, 'loss/train': 1.565487265586853} -08/30/2021 18:06:19 - INFO - __main__ - Step 27566: {'lr': 0.00046408352057869545, 'samples': 5292672, 'steps': 27565, 'loss/train': 1.7046473026275635} -08/30/2021 18:06:19 - INFO - __main__ - Step 27567: {'lr': 0.0004640807800096126, 'samples': 5292864, 'steps': 27566, 'loss/train': 1.3343174457550049} -08/30/2021 18:06:19 - INFO - __main__ - Step 27568: {'lr': 0.0004640780393440682, 'samples': 5293056, 'steps': 27567, 'loss/train': 1.3126369714736938} -08/30/2021 18:06:21 - INFO - __main__ - Step 27569: {'lr': 0.0004640752985820635, 'samples': 5293248, 'steps': 27568, 'loss/train': 1.5438686609268188} -08/30/2021 18:06:21 - INFO - __main__ - Step 27570: {'lr': 0.0004640725577235998, 'samples': 5293440, 'steps': 27569, 'loss/train': 1.6290587186813354} -08/30/2021 18:06:22 - INFO - __main__ - Step 27571: {'lr': 0.00046406981676867836, 'samples': 5293632, 'steps': 27570, 'loss/train': 1.1571675539016724} -08/30/2021 18:06:22 - INFO - __main__ - Step 27572: {'lr': 0.00046406707571730035, 'samples': 5293824, 'steps': 27571, 'loss/train': 1.7105413675308228} -08/30/2021 18:06:22 - INFO - __main__ - Step 27573: {'lr': 0.000464064334569467, 'samples': 5294016, 'steps': 27572, 'loss/train': 1.4792060852050781} -08/30/2021 18:06:23 - INFO - __main__ - Step 27574: {'lr': 0.00046406159332517956, 'samples': 5294208, 'steps': 27573, 'loss/train': 1.5216033458709717} -08/30/2021 18:06:24 - INFO - __main__ - Step 27575: {'lr': 0.00046405885198443926, 'samples': 5294400, 'steps': 27574, 'loss/train': 1.0698562860488892} -08/30/2021 18:06:25 - INFO - __main__ - Step 27576: {'lr': 0.00046405611054724737, 'samples': 5294592, 'steps': 27575, 'loss/train': 0.6250839829444885} -08/30/2021 18:06:25 - INFO - __main__ - Step 27577: {'lr': 0.00046405336901360507, 'samples': 5294784, 'steps': 27576, 'loss/train': 1.4426932334899902} -08/30/2021 18:06:26 - INFO - __main__ - Step 27578: {'lr': 0.00046405062738351366, 'samples': 5294976, 'steps': 27577, 'loss/train': 1.29835844039917} -08/30/2021 18:06:26 - INFO - __main__ - Step 27579: {'lr': 0.00046404788565697434, 'samples': 5295168, 'steps': 27578, 'loss/train': 1.392787218093872} -08/30/2021 18:06:29 - INFO - __main__ - Step 27580: {'lr': 0.00046404514383398835, 'samples': 5295360, 'steps': 27579, 'loss/train': 1.0488930940628052} -08/30/2021 18:06:29 - INFO - __main__ - Step 27581: {'lr': 0.0004640424019145568, 'samples': 5295552, 'steps': 27580, 'loss/train': 1.4656857252120972} -08/30/2021 18:06:29 - INFO - __main__ - Step 27582: {'lr': 0.00046403965989868124, 'samples': 5295744, 'steps': 27581, 'loss/train': 1.8126304149627686} -08/30/2021 18:06:30 - INFO - __main__ - Step 27583: {'lr': 0.0004640369177863626, 'samples': 5295936, 'steps': 27582, 'loss/train': 7.011992454528809} -08/30/2021 18:06:30 - INFO - __main__ - Step 27584: {'lr': 0.00046403417557760226, 'samples': 5296128, 'steps': 27583, 'loss/train': 6.432428359985352} -08/30/2021 18:06:30 - INFO - __main__ - Step 27585: {'lr': 0.00046403143327240136, 'samples': 5296320, 'steps': 27584, 'loss/train': 1.8334565162658691} -08/30/2021 18:06:32 - INFO - __main__ - Step 27586: {'lr': 0.00046402869087076127, 'samples': 5296512, 'steps': 27585, 'loss/train': 1.7581672668457031} -08/30/2021 18:06:32 - INFO - __main__ - Step 27587: {'lr': 0.00046402594837268314, 'samples': 5296704, 'steps': 27586, 'loss/train': 1.6860690116882324} -08/30/2021 18:06:33 - INFO - __main__ - Step 27588: {'lr': 0.0004640232057781682, 'samples': 5296896, 'steps': 27587, 'loss/train': 1.6744991540908813} -08/30/2021 18:06:33 - INFO - __main__ - Step 27589: {'lr': 0.00046402046308721776, 'samples': 5297088, 'steps': 27588, 'loss/train': 1.4241410493850708} -08/30/2021 18:06:33 - INFO - __main__ - Step 27590: {'lr': 0.0004640177202998329, 'samples': 5297280, 'steps': 27589, 'loss/train': 1.7457475662231445} -08/30/2021 18:06:35 - INFO - __main__ - Step 27591: {'lr': 0.00046401497741601505, 'samples': 5297472, 'steps': 27590, 'loss/train': 1.491798996925354} -08/30/2021 18:06:35 - INFO - __main__ - Step 27592: {'lr': 0.00046401223443576537, 'samples': 5297664, 'steps': 27591, 'loss/train': 1.9089938402175903} -08/30/2021 18:06:36 - INFO - __main__ - Step 27593: {'lr': 0.00046400949135908497, 'samples': 5297856, 'steps': 27592, 'loss/train': 1.1968921422958374} -08/30/2021 18:06:36 - INFO - __main__ - Step 27594: {'lr': 0.0004640067481859753, 'samples': 5298048, 'steps': 27593, 'loss/train': 1.713312029838562} -08/30/2021 18:06:36 - INFO - __main__ - Step 27595: {'lr': 0.00046400400491643744, 'samples': 5298240, 'steps': 27594, 'loss/train': 1.557417392730713} -08/30/2021 18:06:38 - INFO - __main__ - Step 27596: {'lr': 0.00046400126155047265, 'samples': 5298432, 'steps': 27595, 'loss/train': 1.3746501207351685} -08/30/2021 18:06:38 - INFO - __main__ - Step 27597: {'lr': 0.0004639985180880822, 'samples': 5298624, 'steps': 27596, 'loss/train': 1.3247319459915161} -08/30/2021 18:06:39 - INFO - __main__ - Step 27598: {'lr': 0.0004639957745292674, 'samples': 5298816, 'steps': 27597, 'loss/train': 2.03164005279541} -08/30/2021 18:06:39 - INFO - __main__ - Step 27599: {'lr': 0.00046399303087402935, 'samples': 5299008, 'steps': 27598, 'loss/train': 2.0356204509735107} -08/30/2021 18:06:39 - INFO - __main__ - Step 27600: {'lr': 0.00046399028712236935, 'samples': 5299200, 'steps': 27599, 'loss/train': 1.4001091718673706} -08/30/2021 18:06:40 - INFO - __main__ - Step 27601: {'lr': 0.0004639875432742886, 'samples': 5299392, 'steps': 27600, 'loss/train': 1.5931395292282104} -08/30/2021 18:06:41 - INFO - __main__ - Step 27602: {'lr': 0.0004639847993297884, 'samples': 5299584, 'steps': 27601, 'loss/train': 1.3520549535751343} -08/30/2021 18:06:42 - INFO - __main__ - Step 27603: {'lr': 0.00046398205528886994, 'samples': 5299776, 'steps': 27602, 'loss/train': 1.39707350730896} -08/30/2021 18:06:42 - INFO - __main__ - Step 27604: {'lr': 0.00046397931115153444, 'samples': 5299968, 'steps': 27603, 'loss/train': 1.2671536207199097} -08/30/2021 18:06:42 - INFO - __main__ - Step 27605: {'lr': 0.0004639765669177833, 'samples': 5300160, 'steps': 27604, 'loss/train': 1.5328627824783325} -08/30/2021 18:06:43 - INFO - __main__ - Step 27606: {'lr': 0.00046397382258761744, 'samples': 5300352, 'steps': 27605, 'loss/train': 1.51702082157135} -08/30/2021 18:06:44 - INFO - __main__ - Step 27607: {'lr': 0.0004639710781610384, 'samples': 5300544, 'steps': 27606, 'loss/train': 1.5836141109466553} -08/30/2021 18:06:45 - INFO - __main__ - Step 27608: {'lr': 0.00046396833363804724, 'samples': 5300736, 'steps': 27607, 'loss/train': 1.9068845510482788} -08/30/2021 18:06:45 - INFO - __main__ - Step 27609: {'lr': 0.00046396558901864527, 'samples': 5300928, 'steps': 27608, 'loss/train': 1.3824971914291382} -08/30/2021 18:06:45 - INFO - __main__ - Step 27610: {'lr': 0.0004639628443028337, 'samples': 5301120, 'steps': 27609, 'loss/train': 1.9928569793701172} -08/30/2021 18:06:46 - INFO - __main__ - Step 27611: {'lr': 0.0004639600994906138, 'samples': 5301312, 'steps': 27610, 'loss/train': 1.3614623546600342} -08/30/2021 18:06:47 - INFO - __main__ - Step 27612: {'lr': 0.00046395735458198674, 'samples': 5301504, 'steps': 27611, 'loss/train': 1.3806707859039307} -08/30/2021 18:06:48 - INFO - __main__ - Step 27613: {'lr': 0.0004639546095769538, 'samples': 5301696, 'steps': 27612, 'loss/train': 1.3501548767089844} -08/30/2021 18:06:48 - INFO - __main__ - Step 27614: {'lr': 0.00046395186447551617, 'samples': 5301888, 'steps': 27613, 'loss/train': 1.0119539499282837} -08/30/2021 18:06:48 - INFO - __main__ - Step 27615: {'lr': 0.00046394911927767526, 'samples': 5302080, 'steps': 27614, 'loss/train': 1.538619875907898} -08/30/2021 18:06:49 - INFO - __main__ - Step 27616: {'lr': 0.0004639463739834321, 'samples': 5302272, 'steps': 27615, 'loss/train': 1.4405438899993896} -08/30/2021 18:06:50 - INFO - __main__ - Step 27617: {'lr': 0.00046394362859278793, 'samples': 5302464, 'steps': 27616, 'loss/train': 1.3817137479782104} -08/30/2021 18:06:51 - INFO - __main__ - Step 27618: {'lr': 0.00046394088310574416, 'samples': 5302656, 'steps': 27617, 'loss/train': 1.5324381589889526} -08/30/2021 18:06:51 - INFO - __main__ - Step 27619: {'lr': 0.000463938137522302, 'samples': 5302848, 'steps': 27618, 'loss/train': 0.08424973487854004} -08/30/2021 18:06:52 - INFO - __main__ - Step 27620: {'lr': 0.00046393539184246246, 'samples': 5303040, 'steps': 27619, 'loss/train': 2.311727523803711} -08/30/2021 18:06:52 - INFO - __main__ - Step 27621: {'lr': 0.000463932646066227, 'samples': 5303232, 'steps': 27620, 'loss/train': 1.9144822359085083} -08/30/2021 18:06:54 - INFO - __main__ - Step 27622: {'lr': 0.0004639299001935968, 'samples': 5303424, 'steps': 27621, 'loss/train': 2.442072629928589} -08/30/2021 18:06:54 - INFO - __main__ - Step 27623: {'lr': 0.0004639271542245731, 'samples': 5303616, 'steps': 27622, 'loss/train': 1.1727242469787598} -08/30/2021 18:06:55 - INFO - __main__ - Step 27624: {'lr': 0.000463924408159157, 'samples': 5303808, 'steps': 27623, 'loss/train': 1.5860928297042847} -08/30/2021 18:06:55 - INFO - __main__ - Step 27625: {'lr': 0.00046392166199735, 'samples': 5304000, 'steps': 27624, 'loss/train': 4.4631733894348145} -08/30/2021 18:06:55 - INFO - __main__ - Step 27626: {'lr': 0.00046391891573915325, 'samples': 5304192, 'steps': 27625, 'loss/train': 1.963142991065979} -08/30/2021 18:06:56 - INFO - __main__ - Step 27627: {'lr': 0.0004639161693845678, 'samples': 5304384, 'steps': 27626, 'loss/train': 1.4789601564407349} -08/30/2021 18:06:58 - INFO - __main__ - Step 27628: {'lr': 0.0004639134229335951, 'samples': 5304576, 'steps': 27627, 'loss/train': 1.5334399938583374} -08/30/2021 18:06:58 - INFO - __main__ - Step 27629: {'lr': 0.0004639106763862363, 'samples': 5304768, 'steps': 27628, 'loss/train': 2.497802495956421} -08/30/2021 18:06:59 - INFO - __main__ - Step 27630: {'lr': 0.00046390792974249263, 'samples': 5304960, 'steps': 27629, 'loss/train': 1.5521652698516846} -08/30/2021 18:06:59 - INFO - __main__ - Step 27631: {'lr': 0.00046390518300236535, 'samples': 5305152, 'steps': 27630, 'loss/train': 0.13609883189201355} -08/30/2021 18:07:00 - INFO - __main__ - Step 27632: {'lr': 0.0004639024361658557, 'samples': 5305344, 'steps': 27631, 'loss/train': 1.7635130882263184} -08/30/2021 18:07:00 - INFO - __main__ - Step 27633: {'lr': 0.00046389968923296496, 'samples': 5305536, 'steps': 27632, 'loss/train': 0.6495070457458496} -08/30/2021 18:07:00 - INFO - __main__ - Step 27634: {'lr': 0.0004638969422036943, 'samples': 5305728, 'steps': 27633, 'loss/train': 0.4948667287826538} -08/30/2021 18:07:02 - INFO - __main__ - Step 27635: {'lr': 0.00046389419507804493, 'samples': 5305920, 'steps': 27634, 'loss/train': 0.7599722146987915} -08/30/2021 18:07:03 - INFO - __main__ - Step 27636: {'lr': 0.00046389144785601813, 'samples': 5306112, 'steps': 27635, 'loss/train': 1.4174884557724} -08/30/2021 18:07:03 - INFO - __main__ - Step 27637: {'lr': 0.0004638887005376152, 'samples': 5306304, 'steps': 27636, 'loss/train': 1.350616693496704} -08/30/2021 18:07:03 - INFO - __main__ - Step 27638: {'lr': 0.0004638859531228373, 'samples': 5306496, 'steps': 27637, 'loss/train': 1.6200162172317505} -08/30/2021 18:07:04 - INFO - __main__ - Step 27639: {'lr': 0.00046388320561168567, 'samples': 5306688, 'steps': 27638, 'loss/train': 1.3006216287612915} -08/30/2021 18:07:05 - INFO - __main__ - Step 27640: {'lr': 0.00046388045800416157, 'samples': 5306880, 'steps': 27639, 'loss/train': 1.7380802631378174} -08/30/2021 18:07:06 - INFO - __main__ - Step 27641: {'lr': 0.00046387771030026627, 'samples': 5307072, 'steps': 27640, 'loss/train': 1.850737452507019} -08/30/2021 18:07:06 - INFO - __main__ - Step 27642: {'lr': 0.00046387496250000095, 'samples': 5307264, 'steps': 27641, 'loss/train': 1.9918535947799683} -08/30/2021 18:07:06 - INFO - __main__ - Step 27643: {'lr': 0.0004638722146033669, 'samples': 5307456, 'steps': 27642, 'loss/train': 1.4941896200180054} -08/30/2021 18:07:07 - INFO - __main__ - Step 27644: {'lr': 0.0004638694666103653, 'samples': 5307648, 'steps': 27643, 'loss/train': 2.074228525161743} -08/30/2021 18:07:08 - INFO - __main__ - Step 27645: {'lr': 0.00046386671852099743, 'samples': 5307840, 'steps': 27644, 'loss/train': 1.5714284181594849} -08/30/2021 18:07:09 - INFO - __main__ - Step 27646: {'lr': 0.0004638639703352645, 'samples': 5308032, 'steps': 27645, 'loss/train': 1.7330057621002197} -08/30/2021 18:07:09 - INFO - __main__ - Step 27647: {'lr': 0.00046386122205316783, 'samples': 5308224, 'steps': 27646, 'loss/train': 1.4205405712127686} -08/30/2021 18:07:09 - INFO - __main__ - Step 27648: {'lr': 0.0004638584736747085, 'samples': 5308416, 'steps': 27647, 'loss/train': 1.7681492567062378} -08/30/2021 18:07:10 - INFO - __main__ - Step 27649: {'lr': 0.00046385572519988793, 'samples': 5308608, 'steps': 27648, 'loss/train': 1.0372158288955688} -08/30/2021 18:07:11 - INFO - __main__ - Step 27650: {'lr': 0.00046385297662870716, 'samples': 5308800, 'steps': 27649, 'loss/train': 1.9399640560150146} -08/30/2021 18:07:12 - INFO - __main__ - Step 27651: {'lr': 0.00046385022796116766, 'samples': 5308992, 'steps': 27650, 'loss/train': 1.3714888095855713} -08/30/2021 18:07:12 - INFO - __main__ - Step 27652: {'lr': 0.0004638474791972705, 'samples': 5309184, 'steps': 27651, 'loss/train': 1.6928040981292725} -08/30/2021 18:07:12 - INFO - __main__ - Step 27653: {'lr': 0.000463844730337017, 'samples': 5309376, 'steps': 27652, 'loss/train': 0.8629988431930542} -08/30/2021 18:07:13 - INFO - __main__ - Step 27654: {'lr': 0.00046384198138040825, 'samples': 5309568, 'steps': 27653, 'loss/train': 1.1709786653518677} -08/30/2021 18:07:14 - INFO - __main__ - Step 27655: {'lr': 0.00046383923232744565, 'samples': 5309760, 'steps': 27654, 'loss/train': 1.6784054040908813} -08/30/2021 18:07:15 - INFO - __main__ - Step 27656: {'lr': 0.00046383648317813045, 'samples': 5309952, 'steps': 27655, 'loss/train': 1.5674488544464111} -08/30/2021 18:07:15 - INFO - __main__ - Step 27657: {'lr': 0.0004638337339324638, 'samples': 5310144, 'steps': 27656, 'loss/train': 0.7143456935882568} -08/30/2021 18:07:16 - INFO - __main__ - Step 27658: {'lr': 0.00046383098459044697, 'samples': 5310336, 'steps': 27657, 'loss/train': 1.4924540519714355} -08/30/2021 18:07:16 - INFO - __main__ - Step 27659: {'lr': 0.0004638282351520812, 'samples': 5310528, 'steps': 27658, 'loss/train': 1.1130164861679077} -08/30/2021 18:07:18 - INFO - __main__ - Step 27660: {'lr': 0.00046382548561736773, 'samples': 5310720, 'steps': 27659, 'loss/train': 1.682997226715088} -08/30/2021 18:07:18 - INFO - __main__ - Step 27661: {'lr': 0.0004638227359863078, 'samples': 5310912, 'steps': 27660, 'loss/train': 1.1483876705169678} -08/30/2021 18:07:18 - INFO - __main__ - Step 27662: {'lr': 0.0004638199862589026, 'samples': 5311104, 'steps': 27661, 'loss/train': 1.8646984100341797} -08/30/2021 18:07:19 - INFO - __main__ - Step 27663: {'lr': 0.0004638172364351535, 'samples': 5311296, 'steps': 27662, 'loss/train': 1.0410184860229492} -08/30/2021 18:07:19 - INFO - __main__ - Step 27664: {'lr': 0.00046381448651506153, 'samples': 5311488, 'steps': 27663, 'loss/train': 1.3917937278747559} -08/30/2021 18:07:21 - INFO - __main__ - Step 27665: {'lr': 0.00046381173649862815, 'samples': 5311680, 'steps': 27664, 'loss/train': 1.5901403427124023} -08/30/2021 18:07:21 - INFO - __main__ - Step 27666: {'lr': 0.00046380898638585447, 'samples': 5311872, 'steps': 27665, 'loss/train': 1.7387356758117676} -08/30/2021 18:07:22 - INFO - __main__ - Step 27667: {'lr': 0.0004638062361767418, 'samples': 5312064, 'steps': 27666, 'loss/train': 0.9809238314628601} -08/30/2021 18:07:22 - INFO - __main__ - Step 27668: {'lr': 0.00046380348587129127, 'samples': 5312256, 'steps': 27667, 'loss/train': 1.879568099975586} -08/30/2021 18:07:22 - INFO - __main__ - Step 27669: {'lr': 0.0004638007354695042, 'samples': 5312448, 'steps': 27668, 'loss/train': 2.2002036571502686} -08/30/2021 18:07:23 - INFO - __main__ - Step 27670: {'lr': 0.0004637979849713818, 'samples': 5312640, 'steps': 27669, 'loss/train': 1.5881483554840088} -08/30/2021 18:07:25 - INFO - __main__ - Step 27671: {'lr': 0.0004637952343769254, 'samples': 5312832, 'steps': 27670, 'loss/train': 1.7404872179031372} -08/30/2021 18:07:25 - INFO - __main__ - Step 27672: {'lr': 0.00046379248368613615, 'samples': 5313024, 'steps': 27671, 'loss/train': 1.6770353317260742} -08/30/2021 18:07:25 - INFO - __main__ - Step 27673: {'lr': 0.0004637897328990153, 'samples': 5313216, 'steps': 27672, 'loss/train': 1.2560689449310303} -08/30/2021 18:07:26 - INFO - __main__ - Step 27674: {'lr': 0.000463786982015564, 'samples': 5313408, 'steps': 27673, 'loss/train': 1.4442033767700195} -08/30/2021 18:07:26 - INFO - __main__ - Step 27675: {'lr': 0.00046378423103578373, 'samples': 5313600, 'steps': 27674, 'loss/train': 1.6111303567886353} -08/30/2021 18:07:28 - INFO - __main__ - Step 27676: {'lr': 0.0004637814799596755, 'samples': 5313792, 'steps': 27675, 'loss/train': 0.23090513050556183} -08/30/2021 18:07:28 - INFO - __main__ - Step 27677: {'lr': 0.00046377872878724066, 'samples': 5313984, 'steps': 27676, 'loss/train': 1.3465864658355713} -08/30/2021 18:07:29 - INFO - __main__ - Step 27678: {'lr': 0.0004637759775184804, 'samples': 5314176, 'steps': 27677, 'loss/train': 0.9396185278892517} -08/30/2021 18:07:29 - INFO - __main__ - Step 27679: {'lr': 0.000463773226153396, 'samples': 5314368, 'steps': 27678, 'loss/train': 1.0420961380004883} -08/30/2021 18:07:29 - INFO - __main__ - Step 27680: {'lr': 0.00046377047469198875, 'samples': 5314560, 'steps': 27679, 'loss/train': 0.2202690839767456} -08/30/2021 18:07:30 - INFO - __main__ - Step 27681: {'lr': 0.00046376772313425974, 'samples': 5314752, 'steps': 27680, 'loss/train': 1.2297792434692383} -08/30/2021 18:07:31 - INFO - __main__ - Step 27682: {'lr': 0.0004637649714802102, 'samples': 5314944, 'steps': 27681, 'loss/train': 1.2670255899429321} -08/30/2021 18:07:32 - INFO - __main__ - Step 27683: {'lr': 0.0004637622197298417, 'samples': 5315136, 'steps': 27682, 'loss/train': 1.1371203660964966} -08/30/2021 18:07:32 - INFO - __main__ - Step 27684: {'lr': 0.000463759467883155, 'samples': 5315328, 'steps': 27683, 'loss/train': 1.7195202112197876} -08/30/2021 18:07:32 - INFO - __main__ - Step 27685: {'lr': 0.0004637567159401518, 'samples': 5315520, 'steps': 27684, 'loss/train': 2.2589163780212402} -08/30/2021 18:07:33 - INFO - __main__ - Step 27686: {'lr': 0.00046375396390083303, 'samples': 5315712, 'steps': 27685, 'loss/train': 1.4878872632980347} -08/30/2021 18:07:35 - INFO - __main__ - Step 27687: {'lr': 0.0004637512117652, 'samples': 5315904, 'steps': 27686, 'loss/train': 0.6817157864570618} -08/30/2021 18:07:35 - INFO - __main__ - Step 27688: {'lr': 0.00046374845953325394, 'samples': 5316096, 'steps': 27687, 'loss/train': 1.3332120180130005} -08/30/2021 18:07:36 - INFO - __main__ - Step 27689: {'lr': 0.0004637457072049962, 'samples': 5316288, 'steps': 27688, 'loss/train': 1.6221702098846436} -08/30/2021 18:07:36 - INFO - __main__ - Step 27690: {'lr': 0.0004637429547804279, 'samples': 5316480, 'steps': 27689, 'loss/train': 0.9120870232582092} -08/30/2021 18:07:36 - INFO - __main__ - Step 27691: {'lr': 0.0004637402022595503, 'samples': 5316672, 'steps': 27690, 'loss/train': 3.143947124481201} -08/30/2021 18:07:38 - INFO - __main__ - Step 27692: {'lr': 0.0004637374496423647, 'samples': 5316864, 'steps': 27691, 'loss/train': 1.8292323350906372} -08/30/2021 18:07:39 - INFO - __main__ - Step 27693: {'lr': 0.0004637346969288723, 'samples': 5317056, 'steps': 27692, 'loss/train': 1.2111611366271973} -08/30/2021 18:07:39 - INFO - __main__ - Step 27694: {'lr': 0.0004637319441190743, 'samples': 5317248, 'steps': 27693, 'loss/train': 1.5030843019485474} -08/30/2021 18:07:39 - INFO - __main__ - Step 27695: {'lr': 0.00046372919121297207, 'samples': 5317440, 'steps': 27694, 'loss/train': 1.5317778587341309} -08/30/2021 18:07:40 - INFO - __main__ - Step 27696: {'lr': 0.0004637264382105667, 'samples': 5317632, 'steps': 27695, 'loss/train': 6.138783931732178} -08/30/2021 18:07:40 - INFO - __main__ - Step 27697: {'lr': 0.00046372368511185953, 'samples': 5317824, 'steps': 27696, 'loss/train': 1.5839647054672241} -08/30/2021 18:07:41 - INFO - __main__ - Step 27698: {'lr': 0.0004637209319168517, 'samples': 5318016, 'steps': 27697, 'loss/train': 1.3210899829864502} -08/30/2021 18:07:42 - INFO - __main__ - Step 27699: {'lr': 0.0004637181786255446, 'samples': 5318208, 'steps': 27698, 'loss/train': 1.011793613433838} -08/30/2021 18:07:42 - INFO - __main__ - Step 27700: {'lr': 0.0004637154252379394, 'samples': 5318400, 'steps': 27699, 'loss/train': 1.6124320030212402} -08/30/2021 18:07:42 - INFO - __main__ - Step 27701: {'lr': 0.00046371267175403724, 'samples': 5318592, 'steps': 27700, 'loss/train': 1.9815433025360107} -08/30/2021 18:07:43 - INFO - __main__ - Step 27702: {'lr': 0.0004637099181738395, 'samples': 5318784, 'steps': 27701, 'loss/train': 1.3882966041564941} -08/30/2021 18:07:44 - INFO - __main__ - Step 27703: {'lr': 0.00046370716449734733, 'samples': 5318976, 'steps': 27702, 'loss/train': 1.6488699913024902} -08/30/2021 18:07:45 - INFO - __main__ - Step 27704: {'lr': 0.00046370441072456206, 'samples': 5319168, 'steps': 27703, 'loss/train': 1.132298231124878} -08/30/2021 18:07:45 - INFO - __main__ - Step 27705: {'lr': 0.00046370165685548484, 'samples': 5319360, 'steps': 27704, 'loss/train': 1.264633297920227} -08/30/2021 18:07:45 - INFO - __main__ - Step 27706: {'lr': 0.00046369890289011696, 'samples': 5319552, 'steps': 27705, 'loss/train': 1.7231214046478271} -08/30/2021 18:07:46 - INFO - __main__ - Step 27707: {'lr': 0.0004636961488284597, 'samples': 5319744, 'steps': 27706, 'loss/train': 1.0639294385910034} -08/30/2021 18:07:47 - INFO - __main__ - Step 27708: {'lr': 0.0004636933946705142, 'samples': 5319936, 'steps': 27707, 'loss/train': 1.6238598823547363} -08/30/2021 18:07:48 - INFO - __main__ - Step 27709: {'lr': 0.00046369064041628175, 'samples': 5320128, 'steps': 27708, 'loss/train': 1.059350609779358} -08/30/2021 18:07:48 - INFO - __main__ - Step 27710: {'lr': 0.00046368788606576363, 'samples': 5320320, 'steps': 27709, 'loss/train': 0.749843418598175} -08/30/2021 18:07:48 - INFO - __main__ - Step 27711: {'lr': 0.00046368513161896104, 'samples': 5320512, 'steps': 27710, 'loss/train': 0.402189701795578} -08/30/2021 18:07:49 - INFO - __main__ - Step 27712: {'lr': 0.0004636823770758752, 'samples': 5320704, 'steps': 27711, 'loss/train': 2.0030534267425537} -08/30/2021 18:07:49 - INFO - __main__ - Step 27713: {'lr': 0.0004636796224365074, 'samples': 5320896, 'steps': 27712, 'loss/train': 0.44293150305747986} -08/30/2021 18:07:51 - INFO - __main__ - Step 27714: {'lr': 0.0004636768677008588, 'samples': 5321088, 'steps': 27713, 'loss/train': 1.1427805423736572} -08/30/2021 18:07:51 - INFO - __main__ - Step 27715: {'lr': 0.0004636741128689308, 'samples': 5321280, 'steps': 27714, 'loss/train': 1.3262362480163574} -08/30/2021 18:07:52 - INFO - __main__ - Step 27716: {'lr': 0.00046367135794072445, 'samples': 5321472, 'steps': 27715, 'loss/train': 1.7071841955184937} -08/30/2021 18:07:52 - INFO - __main__ - Step 27717: {'lr': 0.0004636686029162411, 'samples': 5321664, 'steps': 27716, 'loss/train': 1.0002169609069824} -08/30/2021 18:07:52 - INFO - __main__ - Step 27718: {'lr': 0.000463665847795482, 'samples': 5321856, 'steps': 27717, 'loss/train': 1.683854341506958} -08/30/2021 18:07:54 - INFO - __main__ - Step 27719: {'lr': 0.0004636630925784484, 'samples': 5322048, 'steps': 27718, 'loss/train': 1.710624098777771} -08/30/2021 18:07:54 - INFO - __main__ - Step 27720: {'lr': 0.0004636603372651415, 'samples': 5322240, 'steps': 27719, 'loss/train': 1.7615082263946533} -08/30/2021 18:07:54 - INFO - __main__ - Step 27721: {'lr': 0.0004636575818555625, 'samples': 5322432, 'steps': 27720, 'loss/train': 1.3039824962615967} -08/30/2021 18:07:55 - INFO - __main__ - Step 27722: {'lr': 0.00046365482634971275, 'samples': 5322624, 'steps': 27721, 'loss/train': 1.5380810499191284} -08/30/2021 18:07:55 - INFO - __main__ - Step 27723: {'lr': 0.00046365207074759344, 'samples': 5322816, 'steps': 27722, 'loss/train': 1.315588355064392} -08/30/2021 18:07:57 - INFO - __main__ - Step 27724: {'lr': 0.0004636493150492057, 'samples': 5323008, 'steps': 27723, 'loss/train': 1.7833211421966553} -08/30/2021 18:07:57 - INFO - __main__ - Step 27725: {'lr': 0.00046364655925455094, 'samples': 5323200, 'steps': 27724, 'loss/train': 1.352582335472107} -08/30/2021 18:07:57 - INFO - __main__ - Step 27726: {'lr': 0.0004636438033636303, 'samples': 5323392, 'steps': 27725, 'loss/train': 1.3288015127182007} -08/30/2021 18:07:58 - INFO - __main__ - Step 27727: {'lr': 0.00046364104737644515, 'samples': 5323584, 'steps': 27726, 'loss/train': 1.1080595254898071} -08/30/2021 18:07:58 - INFO - __main__ - Step 27728: {'lr': 0.00046363829129299655, 'samples': 5323776, 'steps': 27727, 'loss/train': 1.3275203704833984} -08/30/2021 18:08:00 - INFO - __main__ - Step 27729: {'lr': 0.0004636355351132859, 'samples': 5323968, 'steps': 27728, 'loss/train': 1.7928476333618164} -08/30/2021 18:08:00 - INFO - __main__ - Step 27730: {'lr': 0.00046363277883731437, 'samples': 5324160, 'steps': 27729, 'loss/train': 1.2326266765594482} -08/30/2021 18:08:01 - INFO - __main__ - Step 27731: {'lr': 0.0004636300224650831, 'samples': 5324352, 'steps': 27730, 'loss/train': 1.0478222370147705} -08/30/2021 18:08:01 - INFO - __main__ - Step 27732: {'lr': 0.00046362726599659355, 'samples': 5324544, 'steps': 27731, 'loss/train': 1.4498744010925293} -08/30/2021 18:08:01 - INFO - __main__ - Step 27733: {'lr': 0.0004636245094318468, 'samples': 5324736, 'steps': 27732, 'loss/train': 1.5391539335250854} -08/30/2021 18:08:03 - INFO - __main__ - Step 27734: {'lr': 0.0004636217527708442, 'samples': 5324928, 'steps': 27733, 'loss/train': 1.9058687686920166} -08/30/2021 18:08:03 - INFO - __main__ - Step 27735: {'lr': 0.0004636189960135869, 'samples': 5325120, 'steps': 27734, 'loss/train': 1.4752416610717773} -08/30/2021 18:08:04 - INFO - __main__ - Step 27736: {'lr': 0.0004636162391600761, 'samples': 5325312, 'steps': 27735, 'loss/train': 1.8577532768249512} -08/30/2021 18:08:04 - INFO - __main__ - Step 27737: {'lr': 0.00046361348221031316, 'samples': 5325504, 'steps': 27736, 'loss/train': 1.8980063199996948} -08/30/2021 18:08:04 - INFO - __main__ - Step 27738: {'lr': 0.00046361072516429936, 'samples': 5325696, 'steps': 27737, 'loss/train': 1.3145451545715332} -08/30/2021 18:08:06 - INFO - __main__ - Step 27739: {'lr': 0.0004636079680220358, 'samples': 5325888, 'steps': 27738, 'loss/train': 4.672932147979736} -08/30/2021 18:08:06 - INFO - __main__ - Step 27740: {'lr': 0.0004636052107835238, 'samples': 5326080, 'steps': 27739, 'loss/train': 1.2719616889953613} -08/30/2021 18:08:07 - INFO - __main__ - Step 27741: {'lr': 0.0004636024534487646, 'samples': 5326272, 'steps': 27740, 'loss/train': 1.4490892887115479} -08/30/2021 18:08:07 - INFO - __main__ - Step 27742: {'lr': 0.0004635996960177594, 'samples': 5326464, 'steps': 27741, 'loss/train': 0.4310019612312317} -08/30/2021 18:08:07 - INFO - __main__ - Step 27743: {'lr': 0.0004635969384905095, 'samples': 5326656, 'steps': 27742, 'loss/train': 1.8816343545913696} -08/30/2021 18:08:10 - INFO - __main__ - Step 27744: {'lr': 0.0004635941808670161, 'samples': 5326848, 'steps': 27743, 'loss/train': 1.5247331857681274} -08/30/2021 18:08:10 - INFO - __main__ - Step 27745: {'lr': 0.00046359142314728047, 'samples': 5327040, 'steps': 27744, 'loss/train': 1.325038194656372} -08/30/2021 18:08:10 - INFO - __main__ - Step 27746: {'lr': 0.00046358866533130385, 'samples': 5327232, 'steps': 27745, 'loss/train': 1.7034525871276855} -08/30/2021 18:08:11 - INFO - __main__ - Step 27747: {'lr': 0.00046358590741908744, 'samples': 5327424, 'steps': 27746, 'loss/train': 0.06704515218734741} -08/30/2021 18:08:11 - INFO - __main__ - Step 27748: {'lr': 0.0004635831494106325, 'samples': 5327616, 'steps': 27747, 'loss/train': 1.8906948566436768} -08/30/2021 18:08:11 - INFO - __main__ - Step 27749: {'lr': 0.0004635803913059404, 'samples': 5327808, 'steps': 27748, 'loss/train': 1.3078497648239136} -08/30/2021 18:08:13 - INFO - __main__ - Step 27750: {'lr': 0.00046357763310501216, 'samples': 5328000, 'steps': 27749, 'loss/train': 0.392612099647522} -08/30/2021 18:08:13 - INFO - __main__ - Step 27751: {'lr': 0.0004635748748078492, 'samples': 5328192, 'steps': 27750, 'loss/train': 1.9263042211532593} -08/30/2021 18:08:14 - INFO - __main__ - Step 27752: {'lr': 0.0004635721164144526, 'samples': 5328384, 'steps': 27751, 'loss/train': 1.4707145690917969} -08/30/2021 18:08:14 - INFO - __main__ - Step 27753: {'lr': 0.0004635693579248238, 'samples': 5328576, 'steps': 27752, 'loss/train': 1.5500909090042114} -08/30/2021 18:08:14 - INFO - __main__ - Step 27754: {'lr': 0.00046356659933896393, 'samples': 5328768, 'steps': 27753, 'loss/train': 1.6524235010147095} -08/30/2021 18:08:16 - INFO - __main__ - Step 27755: {'lr': 0.0004635638406568742, 'samples': 5328960, 'steps': 27754, 'loss/train': 1.7313227653503418} -08/30/2021 18:08:16 - INFO - __main__ - Step 27756: {'lr': 0.00046356108187855594, 'samples': 5329152, 'steps': 27755, 'loss/train': 1.8637701272964478} -08/30/2021 18:08:17 - INFO - __main__ - Step 27757: {'lr': 0.00046355832300401035, 'samples': 5329344, 'steps': 27756, 'loss/train': 2.080235481262207} -08/30/2021 18:08:17 - INFO - __main__ - Step 27758: {'lr': 0.0004635555640332386, 'samples': 5329536, 'steps': 27757, 'loss/train': 0.8100613951683044} -08/30/2021 18:08:17 - INFO - __main__ - Step 27759: {'lr': 0.0004635528049662421, 'samples': 5329728, 'steps': 27758, 'loss/train': 1.736909031867981} -08/30/2021 18:08:19 - INFO - __main__ - Step 27760: {'lr': 0.000463550045803022, 'samples': 5329920, 'steps': 27759, 'loss/train': 1.4985519647598267} -08/30/2021 18:08:19 - INFO - __main__ - Step 27761: {'lr': 0.00046354728654357947, 'samples': 5330112, 'steps': 27760, 'loss/train': 1.5650149583816528} -08/30/2021 18:08:20 - INFO - __main__ - Step 27762: {'lr': 0.00046354452718791586, 'samples': 5330304, 'steps': 27761, 'loss/train': 1.3432813882827759} -08/30/2021 18:08:20 - INFO - __main__ - Step 27763: {'lr': 0.0004635417677360324, 'samples': 5330496, 'steps': 27762, 'loss/train': 1.792452096939087} -08/30/2021 18:08:21 - INFO - __main__ - Step 27764: {'lr': 0.0004635390081879303, 'samples': 5330688, 'steps': 27763, 'loss/train': 1.4342265129089355} -08/30/2021 18:08:22 - INFO - __main__ - Step 27765: {'lr': 0.0004635362485436109, 'samples': 5330880, 'steps': 27764, 'loss/train': 1.653233289718628} -08/30/2021 18:08:22 - INFO - __main__ - Step 27766: {'lr': 0.00046353348880307524, 'samples': 5331072, 'steps': 27765, 'loss/train': 0.8268206715583801} -08/30/2021 18:08:23 - INFO - __main__ - Step 27767: {'lr': 0.0004635307289663248, 'samples': 5331264, 'steps': 27766, 'loss/train': 1.4286202192306519} -08/30/2021 18:08:23 - INFO - __main__ - Step 27768: {'lr': 0.0004635279690333606, 'samples': 5331456, 'steps': 27767, 'loss/train': 1.7019968032836914} -08/30/2021 18:08:23 - INFO - __main__ - Step 27769: {'lr': 0.00046352520900418403, 'samples': 5331648, 'steps': 27768, 'loss/train': 1.6425319910049438} -08/30/2021 18:08:24 - INFO - __main__ - Step 27770: {'lr': 0.00046352244887879623, 'samples': 5331840, 'steps': 27769, 'loss/train': 1.5490469932556152} -08/30/2021 18:08:25 - INFO - __main__ - Step 27771: {'lr': 0.0004635196886571986, 'samples': 5332032, 'steps': 27770, 'loss/train': 1.528705358505249} -08/30/2021 18:08:26 - INFO - __main__ - Step 27772: {'lr': 0.0004635169283393923, 'samples': 5332224, 'steps': 27771, 'loss/train': 1.4694417715072632} -08/30/2021 18:08:26 - INFO - __main__ - Step 27773: {'lr': 0.0004635141679253785, 'samples': 5332416, 'steps': 27772, 'loss/train': 1.395058512687683} -08/30/2021 18:08:27 - INFO - __main__ - Step 27774: {'lr': 0.0004635114074151586, 'samples': 5332608, 'steps': 27773, 'loss/train': 1.6506497859954834} -08/30/2021 18:08:27 - INFO - __main__ - Step 27775: {'lr': 0.00046350864680873375, 'samples': 5332800, 'steps': 27774, 'loss/train': 1.5567878484725952} -08/30/2021 18:08:29 - INFO - __main__ - Step 27776: {'lr': 0.0004635058861061051, 'samples': 5332992, 'steps': 27775, 'loss/train': 0.40147650241851807} -08/30/2021 18:08:30 - INFO - __main__ - Step 27777: {'lr': 0.00046350312530727403, 'samples': 5333184, 'steps': 27776, 'loss/train': 1.261691689491272} -08/30/2021 18:08:30 - INFO - __main__ - Step 27778: {'lr': 0.00046350036441224175, 'samples': 5333376, 'steps': 27777, 'loss/train': 0.7986395955085754} -08/30/2021 18:08:30 - INFO - __main__ - Step 27779: {'lr': 0.00046349760342100955, 'samples': 5333568, 'steps': 27778, 'loss/train': 0.9109395146369934} -08/30/2021 18:08:31 - INFO - __main__ - Step 27780: {'lr': 0.00046349484233357854, 'samples': 5333760, 'steps': 27779, 'loss/train': 0.8990795016288757} -08/30/2021 18:08:31 - INFO - __main__ - Step 27781: {'lr': 0.0004634920811499501, 'samples': 5333952, 'steps': 27780, 'loss/train': 1.3686414957046509} -08/30/2021 18:08:32 - INFO - __main__ - Step 27782: {'lr': 0.00046348931987012543, 'samples': 5334144, 'steps': 27781, 'loss/train': 1.518345594406128} -08/30/2021 18:08:33 - INFO - __main__ - Step 27783: {'lr': 0.00046348655849410577, 'samples': 5334336, 'steps': 27782, 'loss/train': 1.1290329694747925} -08/30/2021 18:08:33 - INFO - __main__ - Step 27784: {'lr': 0.0004634837970218924, 'samples': 5334528, 'steps': 27783, 'loss/train': 1.4776440858840942} -08/30/2021 18:08:34 - INFO - __main__ - Step 27785: {'lr': 0.0004634810354534864, 'samples': 5334720, 'steps': 27784, 'loss/train': 1.881790280342102} -08/30/2021 18:08:34 - INFO - __main__ - Step 27786: {'lr': 0.0004634782737888892, 'samples': 5334912, 'steps': 27785, 'loss/train': 1.4031047821044922} -08/30/2021 18:08:35 - INFO - __main__ - Step 27787: {'lr': 0.000463475512028102, 'samples': 5335104, 'steps': 27786, 'loss/train': 1.4787510633468628} -08/30/2021 18:08:36 - INFO - __main__ - Step 27788: {'lr': 0.000463472750171126, 'samples': 5335296, 'steps': 27787, 'loss/train': 0.08194834738969803} -08/30/2021 18:08:36 - INFO - __main__ - Step 27789: {'lr': 0.0004634699882179625, 'samples': 5335488, 'steps': 27788, 'loss/train': 1.0469577312469482} -08/30/2021 18:08:37 - INFO - __main__ - Step 27790: {'lr': 0.0004634672261686127, 'samples': 5335680, 'steps': 27789, 'loss/train': 1.6386882066726685} -08/30/2021 18:08:37 - INFO - __main__ - Step 27791: {'lr': 0.0004634644640230779, 'samples': 5335872, 'steps': 27790, 'loss/train': 0.704902708530426} -08/30/2021 18:08:39 - INFO - __main__ - Step 27792: {'lr': 0.0004634617017813593, 'samples': 5336064, 'steps': 27791, 'loss/train': 1.4183684587478638} -08/30/2021 18:08:39 - INFO - __main__ - Step 27793: {'lr': 0.00046345893944345806, 'samples': 5336256, 'steps': 27792, 'loss/train': 2.2018020153045654} -08/30/2021 18:08:39 - INFO - __main__ - Step 27794: {'lr': 0.00046345617700937564, 'samples': 5336448, 'steps': 27793, 'loss/train': 1.7258145809173584} -08/30/2021 18:08:40 - INFO - __main__ - Step 27795: {'lr': 0.0004634534144791131, 'samples': 5336640, 'steps': 27794, 'loss/train': 0.2126784771680832} -08/30/2021 18:08:40 - INFO - __main__ - Step 27796: {'lr': 0.0004634506518526718, 'samples': 5336832, 'steps': 27795, 'loss/train': 1.3140028715133667} -08/30/2021 18:08:40 - INFO - __main__ - Step 27797: {'lr': 0.00046344788913005286, 'samples': 5337024, 'steps': 27796, 'loss/train': 1.5470367670059204} -08/30/2021 18:08:42 - INFO - __main__ - Step 27798: {'lr': 0.00046344512631125756, 'samples': 5337216, 'steps': 27797, 'loss/train': 1.9504424333572388} -08/30/2021 18:08:43 - INFO - __main__ - Step 27799: {'lr': 0.00046344236339628724, 'samples': 5337408, 'steps': 27798, 'loss/train': 0.5643483400344849} -08/30/2021 18:08:43 - INFO - __main__ - Step 27800: {'lr': 0.0004634396003851431, 'samples': 5337600, 'steps': 27799, 'loss/train': 1.915980577468872} -08/30/2021 18:08:43 - INFO - __main__ - Step 27801: {'lr': 0.00046343683727782635, 'samples': 5337792, 'steps': 27800, 'loss/train': 1.5329633951187134} -08/30/2021 18:08:44 - INFO - __main__ - Step 27802: {'lr': 0.0004634340740743382, 'samples': 5337984, 'steps': 27801, 'loss/train': 1.385451078414917} -08/30/2021 18:08:46 - INFO - __main__ - Step 27803: {'lr': 0.00046343131077468, 'samples': 5338176, 'steps': 27802, 'loss/train': 0.9860138893127441} -08/30/2021 18:08:46 - INFO - __main__ - Step 27804: {'lr': 0.00046342854737885296, 'samples': 5338368, 'steps': 27803, 'loss/train': 1.3522201776504517} -08/30/2021 18:08:46 - INFO - __main__ - Step 27805: {'lr': 0.00046342578388685837, 'samples': 5338560, 'steps': 27804, 'loss/train': 1.868133544921875} -08/30/2021 18:08:47 - INFO - __main__ - Step 27806: {'lr': 0.0004634230202986973, 'samples': 5338752, 'steps': 27805, 'loss/train': 1.3344823122024536} -08/30/2021 18:08:47 - INFO - __main__ - Step 27807: {'lr': 0.0004634202566143712, 'samples': 5338944, 'steps': 27806, 'loss/train': 1.7863492965698242} -08/30/2021 18:08:49 - INFO - __main__ - Step 27808: {'lr': 0.00046341749283388117, 'samples': 5339136, 'steps': 27807, 'loss/train': 1.4219354391098022} -08/30/2021 18:08:49 - INFO - __main__ - Step 27809: {'lr': 0.0004634147289572285, 'samples': 5339328, 'steps': 27808, 'loss/train': 1.2044622898101807} -08/30/2021 18:08:49 - INFO - __main__ - Step 27810: {'lr': 0.00046341196498441453, 'samples': 5339520, 'steps': 27809, 'loss/train': 1.3901963233947754} -08/30/2021 18:08:50 - INFO - __main__ - Step 27811: {'lr': 0.0004634092009154403, 'samples': 5339712, 'steps': 27810, 'loss/train': 1.82839834690094} -08/30/2021 18:08:50 - INFO - __main__ - Step 27812: {'lr': 0.0004634064367503072, 'samples': 5339904, 'steps': 27811, 'loss/train': 0.2811654508113861} -08/30/2021 18:08:52 - INFO - __main__ - Step 27813: {'lr': 0.00046340367248901655, 'samples': 5340096, 'steps': 27812, 'loss/train': 1.6390193700790405} -08/30/2021 18:08:52 - INFO - __main__ - Step 27814: {'lr': 0.00046340090813156944, 'samples': 5340288, 'steps': 27813, 'loss/train': 1.7161142826080322} -08/30/2021 18:08:53 - INFO - __main__ - Step 27815: {'lr': 0.00046339814367796716, 'samples': 5340480, 'steps': 27814, 'loss/train': 1.2551450729370117} -08/30/2021 18:08:53 - INFO - __main__ - Step 27816: {'lr': 0.00046339537912821094, 'samples': 5340672, 'steps': 27815, 'loss/train': 2.1397149562835693} -08/30/2021 18:08:53 - INFO - __main__ - Step 27817: {'lr': 0.0004633926144823022, 'samples': 5340864, 'steps': 27816, 'loss/train': 1.7750980854034424} -08/30/2021 18:08:54 - INFO - __main__ - Step 27818: {'lr': 0.0004633898497402419, 'samples': 5341056, 'steps': 27817, 'loss/train': 1.7932462692260742} -08/30/2021 18:08:55 - INFO - __main__ - Step 27819: {'lr': 0.0004633870849020314, 'samples': 5341248, 'steps': 27818, 'loss/train': 0.15541088581085205} -08/30/2021 18:08:56 - INFO - __main__ - Step 27820: {'lr': 0.00046338431996767205, 'samples': 5341440, 'steps': 27819, 'loss/train': 5.489909648895264} -08/30/2021 18:08:56 - INFO - __main__ - Step 27821: {'lr': 0.00046338155493716503, 'samples': 5341632, 'steps': 27820, 'loss/train': 1.8474998474121094} -08/30/2021 18:08:56 - INFO - __main__ - Step 27822: {'lr': 0.0004633787898105115, 'samples': 5341824, 'steps': 27821, 'loss/train': 1.2274061441421509} -08/30/2021 18:08:57 - INFO - __main__ - Step 27823: {'lr': 0.0004633760245877129, 'samples': 5342016, 'steps': 27822, 'loss/train': 1.5886231660842896} -08/30/2021 18:08:58 - INFO - __main__ - Step 27824: {'lr': 0.0004633732592687703, 'samples': 5342208, 'steps': 27823, 'loss/train': 0.9894622564315796} -08/30/2021 18:08:59 - INFO - __main__ - Step 27825: {'lr': 0.00046337049385368495, 'samples': 5342400, 'steps': 27824, 'loss/train': 1.9861916303634644} -08/30/2021 18:08:59 - INFO - __main__ - Step 27826: {'lr': 0.00046336772834245824, 'samples': 5342592, 'steps': 27825, 'loss/train': 1.5195856094360352} -08/30/2021 18:08:59 - INFO - __main__ - Step 27827: {'lr': 0.0004633649627350912, 'samples': 5342784, 'steps': 27826, 'loss/train': 1.1240161657333374} -08/30/2021 18:09:00 - INFO - __main__ - Step 27828: {'lr': 0.00046336219703158526, 'samples': 5342976, 'steps': 27827, 'loss/train': 1.9857053756713867} -08/30/2021 18:09:02 - INFO - __main__ - Step 27829: {'lr': 0.00046335943123194164, 'samples': 5343168, 'steps': 27828, 'loss/train': 1.4039204120635986} -08/30/2021 18:09:02 - INFO - __main__ - Step 27830: {'lr': 0.0004633566653361615, 'samples': 5343360, 'steps': 27829, 'loss/train': 1.4734183549880981} -08/30/2021 18:09:03 - INFO - __main__ - Step 27831: {'lr': 0.0004633538993442462, 'samples': 5343552, 'steps': 27830, 'loss/train': 1.527032732963562} -08/30/2021 18:09:03 - INFO - __main__ - Step 27832: {'lr': 0.00046335113325619685, 'samples': 5343744, 'steps': 27831, 'loss/train': 1.4288867712020874} -08/30/2021 18:09:03 - INFO - __main__ - Step 27833: {'lr': 0.00046334836707201486, 'samples': 5343936, 'steps': 27832, 'loss/train': 1.7638781070709229} -08/30/2021 18:09:04 - INFO - __main__ - Step 27834: {'lr': 0.0004633456007917013, 'samples': 5344128, 'steps': 27833, 'loss/train': 1.0613548755645752} -08/30/2021 18:09:04 - INFO - __main__ - Step 27835: {'lr': 0.0004633428344152576, 'samples': 5344320, 'steps': 27834, 'loss/train': 1.0412993431091309} -08/30/2021 18:09:06 - INFO - __main__ - Step 27836: {'lr': 0.0004633400679426848, 'samples': 5344512, 'steps': 27835, 'loss/train': 1.024503231048584} -08/30/2021 18:09:06 - INFO - __main__ - Step 27837: {'lr': 0.00046333730137398433, 'samples': 5344704, 'steps': 27836, 'loss/train': 0.8051562309265137} -08/30/2021 18:09:07 - INFO - __main__ - Step 27838: {'lr': 0.00046333453470915736, 'samples': 5344896, 'steps': 27837, 'loss/train': 0.09756675362586975} -08/30/2021 18:09:07 - INFO - __main__ - Step 27839: {'lr': 0.0004633317679482051, 'samples': 5345088, 'steps': 27838, 'loss/train': 1.6739451885223389} -08/30/2021 18:09:07 - INFO - __main__ - Step 27840: {'lr': 0.00046332900109112893, 'samples': 5345280, 'steps': 27839, 'loss/train': 1.2744837999343872} -08/30/2021 18:09:09 - INFO - __main__ - Step 27841: {'lr': 0.0004633262341379299, 'samples': 5345472, 'steps': 27840, 'loss/train': 1.4695515632629395} -08/30/2021 18:09:09 - INFO - __main__ - Step 27842: {'lr': 0.0004633234670886094, 'samples': 5345664, 'steps': 27841, 'loss/train': 1.4233691692352295} -08/30/2021 18:09:10 - INFO - __main__ - Step 27843: {'lr': 0.0004633206999431686, 'samples': 5345856, 'steps': 27842, 'loss/train': 1.7822850942611694} -08/30/2021 18:09:10 - INFO - __main__ - Step 27844: {'lr': 0.00046331793270160885, 'samples': 5346048, 'steps': 27843, 'loss/train': 1.6514739990234375} -08/30/2021 18:09:10 - INFO - __main__ - Step 27845: {'lr': 0.0004633151653639314, 'samples': 5346240, 'steps': 27844, 'loss/train': 2.3348324298858643} -08/30/2021 18:09:12 - INFO - __main__ - Step 27846: {'lr': 0.00046331239793013726, 'samples': 5346432, 'steps': 27845, 'loss/train': 1.9039591550827026} -08/30/2021 18:09:12 - INFO - __main__ - Step 27847: {'lr': 0.0004633096304002279, 'samples': 5346624, 'steps': 27846, 'loss/train': 1.19235360622406} -08/30/2021 18:09:13 - INFO - __main__ - Step 27848: {'lr': 0.00046330686277420454, 'samples': 5346816, 'steps': 27847, 'loss/train': 1.4089248180389404} -08/30/2021 18:09:13 - INFO - __main__ - Step 27849: {'lr': 0.00046330409505206837, 'samples': 5347008, 'steps': 27848, 'loss/train': 1.5183302164077759} -08/30/2021 18:09:13 - INFO - __main__ - Step 27850: {'lr': 0.00046330132723382066, 'samples': 5347200, 'steps': 27849, 'loss/train': 1.5850435495376587} -08/30/2021 18:09:15 - INFO - __main__ - Step 27851: {'lr': 0.0004632985593194627, 'samples': 5347392, 'steps': 27850, 'loss/train': 1.0716716051101685} -08/30/2021 18:09:15 - INFO - __main__ - Step 27852: {'lr': 0.00046329579130899567, 'samples': 5347584, 'steps': 27851, 'loss/train': 1.5987440347671509} -08/30/2021 18:09:16 - INFO - __main__ - Step 27853: {'lr': 0.0004632930232024209, 'samples': 5347776, 'steps': 27852, 'loss/train': 1.7953028678894043} -08/30/2021 18:09:16 - INFO - __main__ - Step 27854: {'lr': 0.0004632902549997395, 'samples': 5347968, 'steps': 27853, 'loss/train': 1.2598515748977661} -08/30/2021 18:09:16 - INFO - __main__ - Step 27855: {'lr': 0.00046328748670095287, 'samples': 5348160, 'steps': 27854, 'loss/train': 1.3424211740493774} -08/30/2021 18:09:18 - INFO - __main__ - Step 27856: {'lr': 0.0004632847183060622, 'samples': 5348352, 'steps': 27855, 'loss/train': 1.6653623580932617} -08/30/2021 18:09:19 - INFO - __main__ - Step 27857: {'lr': 0.0004632819498150688, 'samples': 5348544, 'steps': 27856, 'loss/train': 1.4488108158111572} -08/30/2021 18:09:19 - INFO - __main__ - Step 27858: {'lr': 0.00046327918122797363, 'samples': 5348736, 'steps': 27857, 'loss/train': 1.2262461185455322} -08/30/2021 18:09:20 - INFO - __main__ - Step 27859: {'lr': 0.00046327641254477833, 'samples': 5348928, 'steps': 27858, 'loss/train': 1.7536661624908447} -08/30/2021 18:09:20 - INFO - __main__ - Step 27860: {'lr': 0.00046327364376548384, 'samples': 5349120, 'steps': 27859, 'loss/train': 0.9308289885520935} -08/30/2021 18:09:21 - INFO - __main__ - Step 27861: {'lr': 0.0004632708748900917, 'samples': 5349312, 'steps': 27860, 'loss/train': 1.4292386770248413} -08/30/2021 18:09:22 - INFO - __main__ - Step 27862: {'lr': 0.00046326810591860285, 'samples': 5349504, 'steps': 27861, 'loss/train': 1.91312575340271} -08/30/2021 18:09:22 - INFO - __main__ - Step 27863: {'lr': 0.0004632653368510187, 'samples': 5349696, 'steps': 27862, 'loss/train': 1.5734388828277588} -08/30/2021 18:09:23 - INFO - __main__ - Step 27864: {'lr': 0.00046326256768734053, 'samples': 5349888, 'steps': 27863, 'loss/train': 1.2745591402053833} -08/30/2021 18:09:23 - INFO - __main__ - Step 27865: {'lr': 0.0004632597984275695, 'samples': 5350080, 'steps': 27864, 'loss/train': 0.9460969567298889} -08/30/2021 18:09:23 - INFO - __main__ - Step 27866: {'lr': 0.00046325702907170697, 'samples': 5350272, 'steps': 27865, 'loss/train': 1.5940924882888794} -08/30/2021 18:09:25 - INFO - __main__ - Step 27867: {'lr': 0.000463254259619754, 'samples': 5350464, 'steps': 27866, 'loss/train': 1.37678861618042} -08/30/2021 18:09:25 - INFO - __main__ - Step 27868: {'lr': 0.000463251490071712, 'samples': 5350656, 'steps': 27867, 'loss/train': 1.644361138343811} -08/30/2021 18:09:26 - INFO - __main__ - Step 27869: {'lr': 0.0004632487204275822, 'samples': 5350848, 'steps': 27868, 'loss/train': 1.1219329833984375} -08/30/2021 18:09:26 - INFO - __main__ - Step 27870: {'lr': 0.0004632459506873658, 'samples': 5351040, 'steps': 27869, 'loss/train': 1.184278964996338} -08/30/2021 18:09:26 - INFO - __main__ - Step 27871: {'lr': 0.0004632431808510641, 'samples': 5351232, 'steps': 27870, 'loss/train': 1.9152334928512573} -08/30/2021 18:09:28 - INFO - __main__ - Step 27872: {'lr': 0.0004632404109186782, 'samples': 5351424, 'steps': 27871, 'loss/train': 1.5471254587173462} -08/30/2021 18:09:28 - INFO - __main__ - Step 27873: {'lr': 0.0004632376408902096, 'samples': 5351616, 'steps': 27872, 'loss/train': 1.623543620109558} -08/30/2021 18:09:29 - INFO - __main__ - Step 27874: {'lr': 0.0004632348707656593, 'samples': 5351808, 'steps': 27873, 'loss/train': 1.6411412954330444} -08/30/2021 18:09:29 - INFO - __main__ - Step 27875: {'lr': 0.00046323210054502874, 'samples': 5352000, 'steps': 27874, 'loss/train': 1.30329167842865} -08/30/2021 18:09:29 - INFO - __main__ - Step 27876: {'lr': 0.00046322933022831903, 'samples': 5352192, 'steps': 27875, 'loss/train': 1.4236921072006226} -08/30/2021 18:09:31 - INFO - __main__ - Step 27877: {'lr': 0.0004632265598155315, 'samples': 5352384, 'steps': 27876, 'loss/train': 1.4609565734863281} -08/30/2021 18:09:31 - INFO - __main__ - Step 27878: {'lr': 0.00046322378930666736, 'samples': 5352576, 'steps': 27877, 'loss/train': 1.5716593265533447} -08/30/2021 18:09:32 - INFO - __main__ - Step 27879: {'lr': 0.0004632210187017278, 'samples': 5352768, 'steps': 27878, 'loss/train': 0.8533258438110352} -08/30/2021 18:09:32 - INFO - __main__ - Step 27880: {'lr': 0.00046321824800071425, 'samples': 5352960, 'steps': 27879, 'loss/train': 1.2530912160873413} -08/30/2021 18:09:32 - INFO - __main__ - Step 27881: {'lr': 0.0004632154772036279, 'samples': 5353152, 'steps': 27880, 'loss/train': 1.4827314615249634} -08/30/2021 18:09:34 - INFO - __main__ - Step 27882: {'lr': 0.0004632127063104698, 'samples': 5353344, 'steps': 27881, 'loss/train': 1.599303126335144} -08/30/2021 18:09:34 - INFO - __main__ - Step 27883: {'lr': 0.00046320993532124137, 'samples': 5353536, 'steps': 27882, 'loss/train': 1.5524917840957642} -08/30/2021 18:09:35 - INFO - __main__ - Step 27884: {'lr': 0.0004632071642359439, 'samples': 5353728, 'steps': 27883, 'loss/train': 1.8457468748092651} -08/30/2021 18:09:35 - INFO - __main__ - Step 27885: {'lr': 0.0004632043930545785, 'samples': 5353920, 'steps': 27884, 'loss/train': 0.07377669960260391} -08/30/2021 18:09:35 - INFO - __main__ - Step 27886: {'lr': 0.00046320162177714653, 'samples': 5354112, 'steps': 27885, 'loss/train': 1.8720864057540894} -08/30/2021 18:09:37 - INFO - __main__ - Step 27887: {'lr': 0.00046319885040364925, 'samples': 5354304, 'steps': 27886, 'loss/train': 1.5645158290863037} -08/30/2021 18:09:38 - INFO - __main__ - Step 27888: {'lr': 0.00046319607893408776, 'samples': 5354496, 'steps': 27887, 'loss/train': 1.0230780839920044} -08/30/2021 18:09:38 - INFO - __main__ - Step 27889: {'lr': 0.0004631933073684635, 'samples': 5354688, 'steps': 27888, 'loss/train': 0.8020130395889282} -08/30/2021 18:09:38 - INFO - __main__ - Step 27890: {'lr': 0.00046319053570677754, 'samples': 5354880, 'steps': 27889, 'loss/train': 1.6323224306106567} -08/30/2021 18:09:39 - INFO - __main__ - Step 27891: {'lr': 0.0004631877639490313, 'samples': 5355072, 'steps': 27890, 'loss/train': 1.1596242189407349} -08/30/2021 18:09:40 - INFO - __main__ - Step 27892: {'lr': 0.0004631849920952259, 'samples': 5355264, 'steps': 27891, 'loss/train': 1.720773458480835} -08/30/2021 18:09:40 - INFO - __main__ - Step 27893: {'lr': 0.0004631822201453626, 'samples': 5355456, 'steps': 27892, 'loss/train': 1.4729856252670288} -08/30/2021 18:09:41 - INFO - __main__ - Step 27894: {'lr': 0.0004631794480994427, 'samples': 5355648, 'steps': 27893, 'loss/train': 1.6313401460647583} -08/30/2021 18:09:41 - INFO - __main__ - Step 27895: {'lr': 0.0004631766759574675, 'samples': 5355840, 'steps': 27894, 'loss/train': 0.4398038983345032} -08/30/2021 18:09:42 - INFO - __main__ - Step 27896: {'lr': 0.0004631739037194381, 'samples': 5356032, 'steps': 27895, 'loss/train': 1.3815815448760986} -08/30/2021 18:09:43 - INFO - __main__ - Step 27897: {'lr': 0.00046317113138535584, 'samples': 5356224, 'steps': 27896, 'loss/train': 1.543875813484192} -08/30/2021 18:09:44 - INFO - __main__ - Step 27898: {'lr': 0.0004631683589552219, 'samples': 5356416, 'steps': 27897, 'loss/train': 1.45516836643219} -08/30/2021 18:09:44 - INFO - __main__ - Step 27899: {'lr': 0.00046316558642903774, 'samples': 5356608, 'steps': 27898, 'loss/train': 1.6084994077682495} -08/30/2021 18:09:44 - INFO - __main__ - Step 27900: {'lr': 0.0004631628138068043, 'samples': 5356800, 'steps': 27899, 'loss/train': 1.3844728469848633} -08/30/2021 18:09:45 - INFO - __main__ - Step 27901: {'lr': 0.00046316004108852305, 'samples': 5356992, 'steps': 27900, 'loss/train': 1.730255365371704} -08/30/2021 18:09:45 - INFO - __main__ - Step 27902: {'lr': 0.0004631572682741952, 'samples': 5357184, 'steps': 27901, 'loss/train': 1.5052891969680786} -08/30/2021 18:09:47 - INFO - __main__ - Step 27903: {'lr': 0.0004631544953638219, 'samples': 5357376, 'steps': 27902, 'loss/train': 0.9532438516616821} -08/30/2021 18:09:47 - INFO - __main__ - Step 27904: {'lr': 0.00046315172235740455, 'samples': 5357568, 'steps': 27903, 'loss/train': 0.07877084612846375} -08/30/2021 18:09:47 - INFO - __main__ - Step 27905: {'lr': 0.0004631489492549443, 'samples': 5357760, 'steps': 27904, 'loss/train': 1.857937216758728} -08/30/2021 18:09:48 - INFO - __main__ - Step 27906: {'lr': 0.00046314617605644243, 'samples': 5357952, 'steps': 27905, 'loss/train': 1.09197199344635} -08/30/2021 18:09:48 - INFO - __main__ - Step 27907: {'lr': 0.0004631434027619001, 'samples': 5358144, 'steps': 27906, 'loss/train': 0.6468884944915771} -08/30/2021 18:09:50 - INFO - __main__ - Step 27908: {'lr': 0.0004631406293713188, 'samples': 5358336, 'steps': 27907, 'loss/train': 0.38434073328971863} -08/30/2021 18:09:51 - INFO - __main__ - Step 27909: {'lr': 0.0004631378558846995, 'samples': 5358528, 'steps': 27908, 'loss/train': 1.4693931341171265} -08/30/2021 18:09:51 - INFO - __main__ - Step 27910: {'lr': 0.00046313508230204364, 'samples': 5358720, 'steps': 27909, 'loss/train': 1.861594319343567} -08/30/2021 18:09:51 - INFO - __main__ - Step 27911: {'lr': 0.00046313230862335235, 'samples': 5358912, 'steps': 27910, 'loss/train': 1.4517710208892822} -08/30/2021 18:09:52 - INFO - __main__ - Step 27912: {'lr': 0.000463129534848627, 'samples': 5359104, 'steps': 27911, 'loss/train': 1.1970484256744385} -08/30/2021 18:09:53 - INFO - __main__ - Step 27913: {'lr': 0.0004631267609778687, 'samples': 5359296, 'steps': 27912, 'loss/train': 1.354780912399292} -08/30/2021 18:09:54 - INFO - __main__ - Step 27914: {'lr': 0.0004631239870110788, 'samples': 5359488, 'steps': 27913, 'loss/train': 0.8847267031669617} -08/30/2021 18:09:54 - INFO - __main__ - Step 27915: {'lr': 0.00046312121294825846, 'samples': 5359680, 'steps': 27914, 'loss/train': 2.010751485824585} -08/30/2021 18:09:54 - INFO - __main__ - Step 27916: {'lr': 0.00046311843878940904, 'samples': 5359872, 'steps': 27915, 'loss/train': 1.421433925628662} -08/30/2021 18:09:55 - INFO - __main__ - Step 27917: {'lr': 0.0004631156645345318, 'samples': 5360064, 'steps': 27916, 'loss/train': 1.6389130353927612} -08/30/2021 18:09:56 - INFO - __main__ - Step 27918: {'lr': 0.0004631128901836278, 'samples': 5360256, 'steps': 27917, 'loss/train': 2.283113479614258} -08/30/2021 18:09:57 - INFO - __main__ - Step 27919: {'lr': 0.0004631101157366985, 'samples': 5360448, 'steps': 27918, 'loss/train': 0.6903948187828064} -08/30/2021 18:09:57 - INFO - __main__ - Step 27920: {'lr': 0.0004631073411937451, 'samples': 5360640, 'steps': 27919, 'loss/train': 1.649309515953064} -08/30/2021 18:09:57 - INFO - __main__ - Step 27921: {'lr': 0.00046310456655476875, 'samples': 5360832, 'steps': 27920, 'loss/train': 1.745056390762329} -08/30/2021 18:09:58 - INFO - __main__ - Step 27922: {'lr': 0.0004631017918197709, 'samples': 5361024, 'steps': 27921, 'loss/train': 1.7016445398330688} -08/30/2021 18:09:59 - INFO - __main__ - Step 27923: {'lr': 0.00046309901698875244, 'samples': 5361216, 'steps': 27922, 'loss/train': 1.6440163850784302} -08/30/2021 18:10:00 - INFO - __main__ - Step 27924: {'lr': 0.00046309624206171505, 'samples': 5361408, 'steps': 27923, 'loss/train': 2.148451328277588} -08/30/2021 18:10:00 - INFO - __main__ - Step 27925: {'lr': 0.00046309346703865973, 'samples': 5361600, 'steps': 27924, 'loss/train': 1.5376533269882202} -08/30/2021 18:10:00 - INFO - __main__ - Step 27926: {'lr': 0.00046309069191958775, 'samples': 5361792, 'steps': 27925, 'loss/train': 1.7108235359191895} -08/30/2021 18:10:01 - INFO - __main__ - Step 27927: {'lr': 0.00046308791670450033, 'samples': 5361984, 'steps': 27926, 'loss/train': 1.6991583108901978} -08/30/2021 18:10:02 - INFO - __main__ - Step 27928: {'lr': 0.00046308514139339896, 'samples': 5362176, 'steps': 27927, 'loss/train': 1.648048758506775} -08/30/2021 18:10:03 - INFO - __main__ - Step 27929: {'lr': 0.0004630823659862846, 'samples': 5362368, 'steps': 27928, 'loss/train': 1.1558430194854736} -08/30/2021 18:10:03 - INFO - __main__ - Step 27930: {'lr': 0.0004630795904831586, 'samples': 5362560, 'steps': 27929, 'loss/train': 1.4804942607879639} -08/30/2021 18:10:03 - INFO - __main__ - Step 27931: {'lr': 0.0004630768148840223, 'samples': 5362752, 'steps': 27930, 'loss/train': 0.8264032006263733} -08/30/2021 18:10:04 - INFO - __main__ - Step 27932: {'lr': 0.0004630740391888768, 'samples': 5362944, 'steps': 27931, 'loss/train': 1.671456217765808} -08/30/2021 18:10:04 - INFO - __main__ - Step 27933: {'lr': 0.0004630712633977234, 'samples': 5363136, 'steps': 27932, 'loss/train': 1.25258469581604} -08/30/2021 18:10:05 - INFO - __main__ - Step 27934: {'lr': 0.00046306848751056346, 'samples': 5363328, 'steps': 27933, 'loss/train': 0.786181628704071} -08/30/2021 18:10:06 - INFO - __main__ - Step 27935: {'lr': 0.0004630657115273981, 'samples': 5363520, 'steps': 27934, 'loss/train': 1.7340360879898071} -08/30/2021 18:10:06 - INFO - __main__ - Step 27936: {'lr': 0.0004630629354482286, 'samples': 5363712, 'steps': 27935, 'loss/train': 1.613985538482666} -08/30/2021 18:10:07 - INFO - __main__ - Step 27937: {'lr': 0.00046306015927305633, 'samples': 5363904, 'steps': 27936, 'loss/train': 1.5055582523345947} -08/30/2021 18:10:07 - INFO - __main__ - Step 27938: {'lr': 0.0004630573830018824, 'samples': 5364096, 'steps': 27937, 'loss/train': 0.9066299200057983} -08/30/2021 18:10:08 - INFO - __main__ - Step 27939: {'lr': 0.00046305460663470803, 'samples': 5364288, 'steps': 27938, 'loss/train': 1.687584638595581} -08/30/2021 18:10:09 - INFO - __main__ - Step 27940: {'lr': 0.0004630518301715346, 'samples': 5364480, 'steps': 27939, 'loss/train': 1.1913965940475464} -08/30/2021 18:10:09 - INFO - __main__ - Step 27941: {'lr': 0.00046304905361236335, 'samples': 5364672, 'steps': 27940, 'loss/train': 1.8258600234985352} -08/30/2021 18:10:09 - INFO - __main__ - Step 27942: {'lr': 0.00046304627695719535, 'samples': 5364864, 'steps': 27941, 'loss/train': 1.5701454877853394} -08/30/2021 18:10:10 - INFO - __main__ - Step 27943: {'lr': 0.0004630435002060321, 'samples': 5365056, 'steps': 27942, 'loss/train': 1.3512667417526245} -08/30/2021 18:10:12 - INFO - __main__ - Step 27944: {'lr': 0.0004630407233588747, 'samples': 5365248, 'steps': 27943, 'loss/train': 1.5550307035446167} -08/30/2021 18:10:12 - INFO - __main__ - Step 27945: {'lr': 0.00046303794641572445, 'samples': 5365440, 'steps': 27944, 'loss/train': 1.9324413537979126} -08/30/2021 18:10:12 - INFO - __main__ - Step 27946: {'lr': 0.0004630351693765825, 'samples': 5365632, 'steps': 27945, 'loss/train': 1.4949580430984497} -08/30/2021 18:10:13 - INFO - __main__ - Step 27947: {'lr': 0.0004630323922414503, 'samples': 5365824, 'steps': 27946, 'loss/train': 1.6540135145187378} -08/30/2021 18:10:13 - INFO - __main__ - Step 27948: {'lr': 0.00046302961501032896, 'samples': 5366016, 'steps': 27947, 'loss/train': 1.3547570705413818} -08/30/2021 18:10:15 - INFO - __main__ - Step 27949: {'lr': 0.00046302683768321973, 'samples': 5366208, 'steps': 27948, 'loss/train': 0.8375091552734375} -08/30/2021 18:10:15 - INFO - __main__ - Step 27950: {'lr': 0.00046302406026012396, 'samples': 5366400, 'steps': 27949, 'loss/train': 1.5853266716003418} -08/30/2021 18:10:16 - INFO - __main__ - Step 27951: {'lr': 0.0004630212827410428, 'samples': 5366592, 'steps': 27950, 'loss/train': 2.0909345149993896} -08/30/2021 18:10:16 - INFO - __main__ - Step 27952: {'lr': 0.00046301850512597755, 'samples': 5366784, 'steps': 27951, 'loss/train': 1.000041127204895} -08/30/2021 18:10:16 - INFO - __main__ - Step 27953: {'lr': 0.0004630157274149294, 'samples': 5366976, 'steps': 27952, 'loss/train': 1.8751729726791382} -08/30/2021 18:10:18 - INFO - __main__ - Step 27954: {'lr': 0.0004630129496078997, 'samples': 5367168, 'steps': 27953, 'loss/train': 1.3810734748840332} -08/30/2021 18:10:18 - INFO - __main__ - Step 27955: {'lr': 0.00046301017170488965, 'samples': 5367360, 'steps': 27954, 'loss/train': 1.148566484451294} -08/30/2021 18:10:19 - INFO - __main__ - Step 27956: {'lr': 0.0004630073937059005, 'samples': 5367552, 'steps': 27955, 'loss/train': 0.05812060460448265} -08/30/2021 18:10:19 - INFO - __main__ - Step 27957: {'lr': 0.0004630046156109334, 'samples': 5367744, 'steps': 27956, 'loss/train': 0.6879861354827881} -08/30/2021 18:10:19 - INFO - __main__ - Step 27958: {'lr': 0.0004630018374199899, 'samples': 5367936, 'steps': 27957, 'loss/train': 1.4244699478149414} -08/30/2021 18:10:21 - INFO - __main__ - Step 27959: {'lr': 0.00046299905913307096, 'samples': 5368128, 'steps': 27958, 'loss/train': 1.2281049489974976} -08/30/2021 18:10:22 - INFO - __main__ - Step 27960: {'lr': 0.00046299628075017785, 'samples': 5368320, 'steps': 27959, 'loss/train': 1.7666549682617188} -08/30/2021 18:10:22 - INFO - __main__ - Step 27961: {'lr': 0.000462993502271312, 'samples': 5368512, 'steps': 27960, 'loss/train': 1.5040251016616821} -08/30/2021 18:10:22 - INFO - __main__ - Step 27962: {'lr': 0.00046299072369647453, 'samples': 5368704, 'steps': 27961, 'loss/train': 1.8474175930023193} -08/30/2021 18:10:23 - INFO - __main__ - Step 27963: {'lr': 0.00046298794502566676, 'samples': 5368896, 'steps': 27962, 'loss/train': 1.0150020122528076} -08/30/2021 18:10:24 - INFO - __main__ - Step 27964: {'lr': 0.0004629851662588899, 'samples': 5369088, 'steps': 27963, 'loss/train': 1.4271022081375122} -08/30/2021 18:10:25 - INFO - __main__ - Step 27965: {'lr': 0.00046298238739614524, 'samples': 5369280, 'steps': 27964, 'loss/train': 1.410161018371582} -08/30/2021 18:10:25 - INFO - __main__ - Step 27966: {'lr': 0.0004629796084374339, 'samples': 5369472, 'steps': 27965, 'loss/train': 1.77895987033844} -08/30/2021 18:10:25 - INFO - __main__ - Step 27967: {'lr': 0.00046297682938275733, 'samples': 5369664, 'steps': 27966, 'loss/train': 1.7697396278381348} -08/30/2021 18:10:26 - INFO - __main__ - Step 27968: {'lr': 0.0004629740502321167, 'samples': 5369856, 'steps': 27967, 'loss/train': 1.216433048248291} -08/30/2021 18:10:27 - INFO - __main__ - Step 27969: {'lr': 0.00046297127098551317, 'samples': 5370048, 'steps': 27968, 'loss/train': 1.5631228685379028} -08/30/2021 18:10:28 - INFO - __main__ - Step 27970: {'lr': 0.00046296849164294816, 'samples': 5370240, 'steps': 27969, 'loss/train': 1.7805249691009521} -08/30/2021 18:10:28 - INFO - __main__ - Step 27971: {'lr': 0.00046296571220442274, 'samples': 5370432, 'steps': 27970, 'loss/train': 1.0356769561767578} -08/30/2021 18:10:28 - INFO - __main__ - Step 27972: {'lr': 0.00046296293266993833, 'samples': 5370624, 'steps': 27971, 'loss/train': 1.3386609554290771} -08/30/2021 18:10:29 - INFO - __main__ - Step 27973: {'lr': 0.00046296015303949606, 'samples': 5370816, 'steps': 27972, 'loss/train': 1.3475388288497925} -08/30/2021 18:10:29 - INFO - __main__ - Step 27974: {'lr': 0.0004629573733130973, 'samples': 5371008, 'steps': 27973, 'loss/train': 1.4497339725494385} -08/30/2021 18:10:31 - INFO - __main__ - Step 27975: {'lr': 0.00046295459349074316, 'samples': 5371200, 'steps': 27974, 'loss/train': 1.2262866497039795} -08/30/2021 18:10:31 - INFO - __main__ - Step 27976: {'lr': 0.000462951813572435, 'samples': 5371392, 'steps': 27975, 'loss/train': 0.8015449643135071} -08/30/2021 18:10:31 - INFO - __main__ - Step 27977: {'lr': 0.00046294903355817397, 'samples': 5371584, 'steps': 27976, 'loss/train': 1.5901968479156494} -08/30/2021 18:10:32 - INFO - __main__ - Step 27978: {'lr': 0.0004629462534479615, 'samples': 5371776, 'steps': 27977, 'loss/train': 1.8777004480361938} -08/30/2021 18:10:32 - INFO - __main__ - Step 27979: {'lr': 0.0004629434732417986, 'samples': 5371968, 'steps': 27978, 'loss/train': 1.5026010274887085} -08/30/2021 18:10:34 - INFO - __main__ - Step 27980: {'lr': 0.0004629406929396868, 'samples': 5372160, 'steps': 27979, 'loss/train': 1.3599811792373657} -08/30/2021 18:10:34 - INFO - __main__ - Step 27981: {'lr': 0.00046293791254162713, 'samples': 5372352, 'steps': 27980, 'loss/train': 1.7414216995239258} -08/30/2021 18:10:35 - INFO - __main__ - Step 27982: {'lr': 0.0004629351320476209, 'samples': 5372544, 'steps': 27981, 'loss/train': 1.5243333578109741} -08/30/2021 18:10:35 - INFO - __main__ - Step 27983: {'lr': 0.00046293235145766955, 'samples': 5372736, 'steps': 27982, 'loss/train': 1.3205631971359253} -08/30/2021 18:10:35 - INFO - __main__ - Step 27984: {'lr': 0.000462929570771774, 'samples': 5372928, 'steps': 27983, 'loss/train': 1.3177266120910645} -08/30/2021 18:10:36 - INFO - __main__ - Step 27985: {'lr': 0.0004629267899899358, 'samples': 5373120, 'steps': 27984, 'loss/train': 0.0660424679517746} -08/30/2021 18:10:37 - INFO - __main__ - Step 27986: {'lr': 0.00046292400911215594, 'samples': 5373312, 'steps': 27985, 'loss/train': 0.288720041513443} -08/30/2021 18:10:38 - INFO - __main__ - Step 27987: {'lr': 0.00046292122813843586, 'samples': 5373504, 'steps': 27986, 'loss/train': 1.9169349670410156} -08/30/2021 18:10:38 - INFO - __main__ - Step 27988: {'lr': 0.00046291844706877674, 'samples': 5373696, 'steps': 27987, 'loss/train': 0.8314317464828491} -08/30/2021 18:10:38 - INFO - __main__ - Step 27989: {'lr': 0.0004629156659031799, 'samples': 5373888, 'steps': 27988, 'loss/train': 1.9417732954025269} -08/30/2021 18:10:39 - INFO - __main__ - Step 27990: {'lr': 0.0004629128846416465, 'samples': 5374080, 'steps': 27989, 'loss/train': 1.337670087814331} -08/30/2021 18:10:40 - INFO - __main__ - Step 27991: {'lr': 0.00046291010328417784, 'samples': 5374272, 'steps': 27990, 'loss/train': 1.6752270460128784} -08/30/2021 18:10:41 - INFO - __main__ - Step 27992: {'lr': 0.0004629073218307752, 'samples': 5374464, 'steps': 27991, 'loss/train': 1.6669642925262451} -08/30/2021 18:10:41 - INFO - __main__ - Step 27993: {'lr': 0.0004629045402814398, 'samples': 5374656, 'steps': 27992, 'loss/train': 1.9049948453903198} -08/30/2021 18:10:41 - INFO - __main__ - Step 27994: {'lr': 0.0004629017586361729, 'samples': 5374848, 'steps': 27993, 'loss/train': 0.12876975536346436} -08/30/2021 18:10:42 - INFO - __main__ - Step 27995: {'lr': 0.0004628989768949757, 'samples': 5375040, 'steps': 27994, 'loss/train': 1.8217722177505493} -08/30/2021 18:10:44 - INFO - __main__ - Step 27996: {'lr': 0.0004628961950578496, 'samples': 5375232, 'steps': 27995, 'loss/train': 1.3383779525756836} -08/30/2021 18:10:44 - INFO - __main__ - Step 27997: {'lr': 0.00046289341312479574, 'samples': 5375424, 'steps': 27996, 'loss/train': 1.4796178340911865} -08/30/2021 18:10:44 - INFO - __main__ - Step 27998: {'lr': 0.0004628906310958153, 'samples': 5375616, 'steps': 27997, 'loss/train': 1.280945062637329} -08/30/2021 18:10:45 - INFO - __main__ - Step 27999: {'lr': 0.00046288784897090973, 'samples': 5375808, 'steps': 27998, 'loss/train': 1.3560783863067627} -08/30/2021 18:10:45 - INFO - __main__ - Step 28000: {'lr': 0.00046288506675008014, 'samples': 5376000, 'steps': 27999, 'loss/train': 1.3295682668685913} -08/30/2021 18:10:45 - INFO - __main__ - Step 28001: {'lr': 0.0004628822844333278, 'samples': 5376192, 'steps': 28000, 'loss/train': 0.049830805510282516} -08/30/2021 18:10:47 - INFO - __main__ - Step 28002: {'lr': 0.0004628795020206541, 'samples': 5376384, 'steps': 28001, 'loss/train': 1.1427934169769287} -08/30/2021 18:10:47 - INFO - __main__ - Step 28003: {'lr': 0.00046287671951206004, 'samples': 5376576, 'steps': 28002, 'loss/train': 1.6543828248977661} -08/30/2021 18:10:48 - INFO - __main__ - Step 28004: {'lr': 0.0004628739369075471, 'samples': 5376768, 'steps': 28003, 'loss/train': 1.4621587991714478} -08/30/2021 18:10:48 - INFO - __main__ - Step 28005: {'lr': 0.00046287115420711643, 'samples': 5376960, 'steps': 28004, 'loss/train': 1.7530735731124878} -08/30/2021 18:10:48 - INFO - __main__ - Step 28006: {'lr': 0.00046286837141076934, 'samples': 5377152, 'steps': 28005, 'loss/train': 1.7326995134353638} -08/30/2021 18:10:50 - INFO - __main__ - Step 28007: {'lr': 0.0004628655885185069, 'samples': 5377344, 'steps': 28006, 'loss/train': 1.432509422302246} -08/30/2021 18:10:50 - INFO - __main__ - Step 28008: {'lr': 0.00046286280553033067, 'samples': 5377536, 'steps': 28007, 'loss/train': 1.2272719144821167} -08/30/2021 18:10:51 - INFO - __main__ - Step 28009: {'lr': 0.0004628600224462417, 'samples': 5377728, 'steps': 28008, 'loss/train': 1.5074902772903442} -08/30/2021 18:10:51 - INFO - __main__ - Step 28010: {'lr': 0.00046285723926624126, 'samples': 5377920, 'steps': 28009, 'loss/train': 1.5878270864486694} -08/30/2021 18:10:51 - INFO - __main__ - Step 28011: {'lr': 0.00046285445599033063, 'samples': 5378112, 'steps': 28010, 'loss/train': 1.471692681312561} -08/30/2021 18:10:54 - INFO - __main__ - Step 28012: {'lr': 0.00046285167261851114, 'samples': 5378304, 'steps': 28011, 'loss/train': 1.634076714515686} -08/30/2021 18:10:54 - INFO - __main__ - Step 28013: {'lr': 0.00046284888915078384, 'samples': 5378496, 'steps': 28012, 'loss/train': 1.475229024887085} -08/30/2021 18:10:54 - INFO - __main__ - Step 28014: {'lr': 0.00046284610558715024, 'samples': 5378688, 'steps': 28013, 'loss/train': 0.9592087268829346} -08/30/2021 18:10:55 - INFO - __main__ - Step 28015: {'lr': 0.00046284332192761136, 'samples': 5378880, 'steps': 28014, 'loss/train': 1.7823725938796997} -08/30/2021 18:10:55 - INFO - __main__ - Step 28016: {'lr': 0.0004628405381721686, 'samples': 5379072, 'steps': 28015, 'loss/train': 0.370857298374176} -08/30/2021 18:10:57 - INFO - __main__ - Step 28017: {'lr': 0.00046283775432082327, 'samples': 5379264, 'steps': 28016, 'loss/train': 0.9909529685974121} -08/30/2021 18:10:57 - INFO - __main__ - Step 28018: {'lr': 0.0004628349703735765, 'samples': 5379456, 'steps': 28017, 'loss/train': 1.7473207712173462} -08/30/2021 18:10:57 - INFO - __main__ - Step 28019: {'lr': 0.0004628321863304295, 'samples': 5379648, 'steps': 28018, 'loss/train': 1.4742985963821411} -08/30/2021 18:10:58 - INFO - __main__ - Step 28020: {'lr': 0.00046282940219138366, 'samples': 5379840, 'steps': 28019, 'loss/train': 0.8732110857963562} -08/30/2021 18:10:58 - INFO - __main__ - Step 28021: {'lr': 0.0004628266179564401, 'samples': 5380032, 'steps': 28020, 'loss/train': 0.06682850420475006} -08/30/2021 18:11:00 - INFO - __main__ - Step 28022: {'lr': 0.0004628238336256002, 'samples': 5380224, 'steps': 28021, 'loss/train': 1.029103398323059} -08/30/2021 18:11:00 - INFO - __main__ - Step 28023: {'lr': 0.0004628210491988652, 'samples': 5380416, 'steps': 28022, 'loss/train': 0.6956168413162231} -08/30/2021 18:11:00 - INFO - __main__ - Step 28024: {'lr': 0.0004628182646762363, 'samples': 5380608, 'steps': 28023, 'loss/train': 1.4460898637771606} -08/30/2021 18:11:01 - INFO - __main__ - Step 28025: {'lr': 0.00046281548005771476, 'samples': 5380800, 'steps': 28024, 'loss/train': 1.5885947942733765} -08/30/2021 18:11:01 - INFO - __main__ - Step 28026: {'lr': 0.0004628126953433018, 'samples': 5380992, 'steps': 28025, 'loss/train': 0.1988345831632614} -08/30/2021 18:11:03 - INFO - __main__ - Step 28027: {'lr': 0.00046280991053299883, 'samples': 5381184, 'steps': 28026, 'loss/train': 1.525325059890747} -08/30/2021 18:11:03 - INFO - __main__ - Step 28028: {'lr': 0.00046280712562680695, 'samples': 5381376, 'steps': 28027, 'loss/train': 1.526443600654602} -08/30/2021 18:11:03 - INFO - __main__ - Step 28029: {'lr': 0.0004628043406247274, 'samples': 5381568, 'steps': 28028, 'loss/train': 1.3917332887649536} -08/30/2021 18:11:04 - INFO - __main__ - Step 28030: {'lr': 0.0004628015555267616, 'samples': 5381760, 'steps': 28029, 'loss/train': 1.0822982788085938} -08/30/2021 18:11:04 - INFO - __main__ - Step 28031: {'lr': 0.00046279877033291063, 'samples': 5381952, 'steps': 28030, 'loss/train': 1.3407223224639893} -08/30/2021 18:11:04 - INFO - __main__ - Step 28032: {'lr': 0.0004627959850431759, 'samples': 5382144, 'steps': 28031, 'loss/train': 1.6693180799484253} -08/30/2021 18:11:06 - INFO - __main__ - Step 28033: {'lr': 0.0004627931996575585, 'samples': 5382336, 'steps': 28032, 'loss/train': 1.3858481645584106} -08/30/2021 18:11:06 - INFO - __main__ - Step 28034: {'lr': 0.0004627904141760598, 'samples': 5382528, 'steps': 28033, 'loss/train': 1.325707197189331} -08/30/2021 18:11:07 - INFO - __main__ - Step 28035: {'lr': 0.000462787628598681, 'samples': 5382720, 'steps': 28034, 'loss/train': 1.443479299545288} -08/30/2021 18:11:07 - INFO - __main__ - Step 28036: {'lr': 0.00046278484292542346, 'samples': 5382912, 'steps': 28035, 'loss/train': 1.2646863460540771} -08/30/2021 18:11:07 - INFO - __main__ - Step 28037: {'lr': 0.0004627820571562883, 'samples': 5383104, 'steps': 28036, 'loss/train': 0.8303531408309937} -08/30/2021 18:11:09 - INFO - __main__ - Step 28038: {'lr': 0.0004627792712912768, 'samples': 5383296, 'steps': 28037, 'loss/train': 1.3916767835617065} -08/30/2021 18:11:10 - INFO - __main__ - Step 28039: {'lr': 0.0004627764853303902, 'samples': 5383488, 'steps': 28038, 'loss/train': 1.7772756814956665} -08/30/2021 18:11:10 - INFO - __main__ - Step 28040: {'lr': 0.00046277369927362987, 'samples': 5383680, 'steps': 28039, 'loss/train': 0.15569743514060974} -08/30/2021 18:11:10 - INFO - __main__ - Step 28041: {'lr': 0.00046277091312099704, 'samples': 5383872, 'steps': 28040, 'loss/train': 0.9434666633605957} -08/30/2021 18:11:11 - INFO - __main__ - Step 28042: {'lr': 0.00046276812687249283, 'samples': 5384064, 'steps': 28041, 'loss/train': 2.144589900970459} -08/30/2021 18:11:12 - INFO - __main__ - Step 28043: {'lr': 0.00046276534052811863, 'samples': 5384256, 'steps': 28042, 'loss/train': 1.721571683883667} -08/30/2021 18:11:13 - INFO - __main__ - Step 28044: {'lr': 0.00046276255408787565, 'samples': 5384448, 'steps': 28043, 'loss/train': 2.0207138061523438} -08/30/2021 18:11:13 - INFO - __main__ - Step 28045: {'lr': 0.0004627597675517652, 'samples': 5384640, 'steps': 28044, 'loss/train': 1.3871874809265137} -08/30/2021 18:11:13 - INFO - __main__ - Step 28046: {'lr': 0.00046275698091978836, 'samples': 5384832, 'steps': 28045, 'loss/train': 1.3740190267562866} -08/30/2021 18:11:14 - INFO - __main__ - Step 28047: {'lr': 0.0004627541941919466, 'samples': 5385024, 'steps': 28046, 'loss/train': 1.1003849506378174} -08/30/2021 18:11:15 - INFO - __main__ - Step 28048: {'lr': 0.00046275140736824104, 'samples': 5385216, 'steps': 28047, 'loss/train': 1.3855782747268677} -08/30/2021 18:11:16 - INFO - __main__ - Step 28049: {'lr': 0.000462748620448673, 'samples': 5385408, 'steps': 28048, 'loss/train': 1.782700538635254} -08/30/2021 18:11:16 - INFO - __main__ - Step 28050: {'lr': 0.0004627458334332437, 'samples': 5385600, 'steps': 28049, 'loss/train': 1.8163042068481445} -08/30/2021 18:11:16 - INFO - __main__ - Step 28051: {'lr': 0.0004627430463219544, 'samples': 5385792, 'steps': 28050, 'loss/train': 1.3694815635681152} -08/30/2021 18:11:17 - INFO - __main__ - Step 28052: {'lr': 0.0004627402591148064, 'samples': 5385984, 'steps': 28051, 'loss/train': 1.3943809270858765} -08/30/2021 18:11:19 - INFO - __main__ - Step 28053: {'lr': 0.0004627374718118009, 'samples': 5386176, 'steps': 28052, 'loss/train': 1.8527545928955078} -08/30/2021 18:11:19 - INFO - __main__ - Step 28054: {'lr': 0.0004627346844129392, 'samples': 5386368, 'steps': 28053, 'loss/train': 1.161802887916565} -08/30/2021 18:11:19 - INFO - __main__ - Step 28055: {'lr': 0.0004627318969182225, 'samples': 5386560, 'steps': 28054, 'loss/train': 0.08127857744693756} -08/30/2021 18:11:20 - INFO - __main__ - Step 28056: {'lr': 0.0004627291093276521, 'samples': 5386752, 'steps': 28055, 'loss/train': 1.6853795051574707} -08/30/2021 18:11:20 - INFO - __main__ - Step 28057: {'lr': 0.0004627263216412292, 'samples': 5386944, 'steps': 28056, 'loss/train': 0.6058462858200073} -08/30/2021 18:11:20 - INFO - __main__ - Step 28058: {'lr': 0.00046272353385895515, 'samples': 5387136, 'steps': 28057, 'loss/train': 1.2188124656677246} -08/30/2021 18:11:22 - INFO - __main__ - Step 28059: {'lr': 0.0004627207459808312, 'samples': 5387328, 'steps': 28058, 'loss/train': 1.4666595458984375} -08/30/2021 18:11:22 - INFO - __main__ - Step 28060: {'lr': 0.00046271795800685854, 'samples': 5387520, 'steps': 28059, 'loss/train': 1.025999903678894} -08/30/2021 18:11:23 - INFO - __main__ - Step 28061: {'lr': 0.00046271516993703844, 'samples': 5387712, 'steps': 28060, 'loss/train': 1.3338897228240967} -08/30/2021 18:11:23 - INFO - __main__ - Step 28062: {'lr': 0.00046271238177137216, 'samples': 5387904, 'steps': 28061, 'loss/train': 1.6672204732894897} -08/30/2021 18:11:23 - INFO - __main__ - Step 28063: {'lr': 0.00046270959350986095, 'samples': 5388096, 'steps': 28062, 'loss/train': 1.9613392353057861} -08/30/2021 18:11:25 - INFO - __main__ - Step 28064: {'lr': 0.0004627068051525061, 'samples': 5388288, 'steps': 28063, 'loss/train': 1.6687133312225342} -08/30/2021 18:11:25 - INFO - __main__ - Step 28065: {'lr': 0.00046270401669930885, 'samples': 5388480, 'steps': 28064, 'loss/train': 2.189272165298462} -08/30/2021 18:11:26 - INFO - __main__ - Step 28066: {'lr': 0.0004627012281502704, 'samples': 5388672, 'steps': 28065, 'loss/train': 1.5187551975250244} -08/30/2021 18:11:26 - INFO - __main__ - Step 28067: {'lr': 0.00046269843950539214, 'samples': 5388864, 'steps': 28066, 'loss/train': 0.9895861148834229} -08/30/2021 18:11:26 - INFO - __main__ - Step 28068: {'lr': 0.00046269565076467517, 'samples': 5389056, 'steps': 28067, 'loss/train': 1.294631004333496} -08/30/2021 18:11:28 - INFO - __main__ - Step 28069: {'lr': 0.0004626928619281209, 'samples': 5389248, 'steps': 28068, 'loss/train': 1.447240948677063} -08/30/2021 18:11:29 - INFO - __main__ - Step 28070: {'lr': 0.0004626900729957305, 'samples': 5389440, 'steps': 28069, 'loss/train': 0.9354313015937805} -08/30/2021 18:11:29 - INFO - __main__ - Step 28071: {'lr': 0.00046268728396750515, 'samples': 5389632, 'steps': 28070, 'loss/train': 1.1724275350570679} -08/30/2021 18:11:29 - INFO - __main__ - Step 28072: {'lr': 0.0004626844948434462, 'samples': 5389824, 'steps': 28071, 'loss/train': 1.544147253036499} -08/30/2021 18:11:30 - INFO - __main__ - Step 28073: {'lr': 0.00046268170562355497, 'samples': 5390016, 'steps': 28072, 'loss/train': 0.8086039423942566} -08/30/2021 18:11:30 - INFO - __main__ - Step 28074: {'lr': 0.0004626789163078327, 'samples': 5390208, 'steps': 28073, 'loss/train': 2.0508766174316406} -08/30/2021 18:11:32 - INFO - __main__ - Step 28075: {'lr': 0.00046267612689628046, 'samples': 5390400, 'steps': 28074, 'loss/train': 1.5743684768676758} -08/30/2021 18:11:32 - INFO - __main__ - Step 28076: {'lr': 0.00046267333738889973, 'samples': 5390592, 'steps': 28075, 'loss/train': 1.4540815353393555} -08/30/2021 18:11:33 - INFO - __main__ - Step 28077: {'lr': 0.00046267054778569163, 'samples': 5390784, 'steps': 28076, 'loss/train': 1.152719497680664} -08/30/2021 18:11:33 - INFO - __main__ - Step 28078: {'lr': 0.0004626677580866574, 'samples': 5390976, 'steps': 28077, 'loss/train': 1.2343814373016357} -08/30/2021 18:11:33 - INFO - __main__ - Step 28079: {'lr': 0.00046266496829179847, 'samples': 5391168, 'steps': 28078, 'loss/train': 1.8133282661437988} -08/30/2021 18:11:35 - INFO - __main__ - Step 28080: {'lr': 0.0004626621784011159, 'samples': 5391360, 'steps': 28079, 'loss/train': 1.8737905025482178} -08/30/2021 18:11:35 - INFO - __main__ - Step 28081: {'lr': 0.0004626593884146111, 'samples': 5391552, 'steps': 28080, 'loss/train': 1.972983956336975} -08/30/2021 18:11:36 - INFO - __main__ - Step 28082: {'lr': 0.00046265659833228523, 'samples': 5391744, 'steps': 28081, 'loss/train': 1.348278522491455} -08/30/2021 18:11:36 - INFO - __main__ - Step 28083: {'lr': 0.0004626538081541396, 'samples': 5391936, 'steps': 28082, 'loss/train': 1.663896918296814} -08/30/2021 18:11:36 - INFO - __main__ - Step 28084: {'lr': 0.00046265101788017543, 'samples': 5392128, 'steps': 28083, 'loss/train': 1.6296148300170898} -08/30/2021 18:11:38 - INFO - __main__ - Step 28085: {'lr': 0.00046264822751039406, 'samples': 5392320, 'steps': 28084, 'loss/train': 1.5372482538223267} -08/30/2021 18:11:38 - INFO - __main__ - Step 28086: {'lr': 0.00046264543704479654, 'samples': 5392512, 'steps': 28085, 'loss/train': 1.3979026079177856} -08/30/2021 18:11:38 - INFO - __main__ - Step 28087: {'lr': 0.0004626426464833844, 'samples': 5392704, 'steps': 28086, 'loss/train': 1.364237666130066} -08/30/2021 18:11:39 - INFO - __main__ - Step 28088: {'lr': 0.0004626398558261586, 'samples': 5392896, 'steps': 28087, 'loss/train': 1.6765680313110352} -08/30/2021 18:11:39 - INFO - __main__ - Step 28089: {'lr': 0.00046263706507312073, 'samples': 5393088, 'steps': 28088, 'loss/train': 1.1328810453414917} -08/30/2021 18:11:41 - INFO - __main__ - Step 28090: {'lr': 0.00046263427422427183, 'samples': 5393280, 'steps': 28089, 'loss/train': 1.327867865562439} -08/30/2021 18:11:41 - INFO - __main__ - Step 28091: {'lr': 0.00046263148327961324, 'samples': 5393472, 'steps': 28090, 'loss/train': 1.3953214883804321} -08/30/2021 18:11:42 - INFO - __main__ - Step 28092: {'lr': 0.00046262869223914613, 'samples': 5393664, 'steps': 28091, 'loss/train': 1.0453213453292847} -08/30/2021 18:11:42 - INFO - __main__ - Step 28093: {'lr': 0.00046262590110287183, 'samples': 5393856, 'steps': 28092, 'loss/train': 1.854308843612671} -08/30/2021 18:11:42 - INFO - __main__ - Step 28094: {'lr': 0.00046262310987079156, 'samples': 5394048, 'steps': 28093, 'loss/train': 1.4553587436676025} -08/30/2021 18:11:44 - INFO - __main__ - Step 28095: {'lr': 0.0004626203185429066, 'samples': 5394240, 'steps': 28094, 'loss/train': 1.2204734086990356} -08/30/2021 18:11:45 - INFO - __main__ - Step 28096: {'lr': 0.00046261752711921825, 'samples': 5394432, 'steps': 28095, 'loss/train': 1.5668973922729492} -08/30/2021 18:11:45 - INFO - __main__ - Step 28097: {'lr': 0.00046261473559972764, 'samples': 5394624, 'steps': 28096, 'loss/train': 1.6996465921401978} -08/30/2021 18:11:45 - INFO - __main__ - Step 28098: {'lr': 0.00046261194398443617, 'samples': 5394816, 'steps': 28097, 'loss/train': 1.5285561084747314} -08/30/2021 18:11:46 - INFO - __main__ - Step 28099: {'lr': 0.00046260915227334503, 'samples': 5395008, 'steps': 28098, 'loss/train': 1.1275972127914429} -08/30/2021 18:11:47 - INFO - __main__ - Step 28100: {'lr': 0.0004626063604664555, 'samples': 5395200, 'steps': 28099, 'loss/train': 0.4824984073638916} -08/30/2021 18:11:48 - INFO - __main__ - Step 28101: {'lr': 0.00046260356856376884, 'samples': 5395392, 'steps': 28100, 'loss/train': 1.8263745307922363} -08/30/2021 18:11:48 - INFO - __main__ - Step 28102: {'lr': 0.0004626007765652862, 'samples': 5395584, 'steps': 28101, 'loss/train': 1.334649920463562} -08/30/2021 18:11:48 - INFO - __main__ - Step 28103: {'lr': 0.00046259798447100903, 'samples': 5395776, 'steps': 28102, 'loss/train': 0.9247645735740662} -08/30/2021 18:11:49 - INFO - __main__ - Step 28104: {'lr': 0.0004625951922809385, 'samples': 5395968, 'steps': 28103, 'loss/train': 1.1381335258483887} -08/30/2021 18:11:50 - INFO - __main__ - Step 28105: {'lr': 0.0004625923999950758, 'samples': 5396160, 'steps': 28104, 'loss/train': 1.7762413024902344} -08/30/2021 18:11:51 - INFO - __main__ - Step 28106: {'lr': 0.0004625896076134222, 'samples': 5396352, 'steps': 28105, 'loss/train': 1.751448154449463} -08/30/2021 18:11:51 - INFO - __main__ - Step 28107: {'lr': 0.00046258681513597913, 'samples': 5396544, 'steps': 28106, 'loss/train': 1.4575424194335938} -08/30/2021 18:11:51 - INFO - __main__ - Step 28108: {'lr': 0.0004625840225627476, 'samples': 5396736, 'steps': 28107, 'loss/train': 1.5888158082962036} -08/30/2021 18:11:52 - INFO - __main__ - Step 28109: {'lr': 0.0004625812298937291, 'samples': 5396928, 'steps': 28108, 'loss/train': 1.4933538436889648} -08/30/2021 18:11:53 - INFO - __main__ - Step 28110: {'lr': 0.0004625784371289247, 'samples': 5397120, 'steps': 28109, 'loss/train': 1.0874392986297607} -08/30/2021 18:11:54 - INFO - __main__ - Step 28111: {'lr': 0.00046257564426833574, 'samples': 5397312, 'steps': 28110, 'loss/train': 2.6032867431640625} -08/30/2021 18:11:54 - INFO - __main__ - Step 28112: {'lr': 0.0004625728513119635, 'samples': 5397504, 'steps': 28111, 'loss/train': 0.4529555141925812} -08/30/2021 18:11:54 - INFO - __main__ - Step 28113: {'lr': 0.0004625700582598092, 'samples': 5397696, 'steps': 28112, 'loss/train': 1.5608940124511719} -08/30/2021 18:11:55 - INFO - __main__ - Step 28114: {'lr': 0.00046256726511187407, 'samples': 5397888, 'steps': 28113, 'loss/train': 1.8138625621795654} -08/30/2021 18:11:56 - INFO - __main__ - Step 28115: {'lr': 0.0004625644718681595, 'samples': 5398080, 'steps': 28114, 'loss/train': 1.496962070465088} -08/30/2021 18:11:57 - INFO - __main__ - Step 28116: {'lr': 0.0004625616785286666, 'samples': 5398272, 'steps': 28115, 'loss/train': 1.181666612625122} -08/30/2021 18:11:57 - INFO - __main__ - Step 28117: {'lr': 0.0004625588850933967, 'samples': 5398464, 'steps': 28116, 'loss/train': 1.881162166595459} -08/30/2021 18:11:58 - INFO - __main__ - Step 28118: {'lr': 0.00046255609156235105, 'samples': 5398656, 'steps': 28117, 'loss/train': 1.7869846820831299} -08/30/2021 18:11:58 - INFO - __main__ - Step 28119: {'lr': 0.0004625532979355309, 'samples': 5398848, 'steps': 28118, 'loss/train': 1.6022080183029175} -08/30/2021 18:11:58 - INFO - __main__ - Step 28120: {'lr': 0.00046255050421293756, 'samples': 5399040, 'steps': 28119, 'loss/train': 1.5461374521255493} -08/30/2021 18:12:00 - INFO - __main__ - Step 28121: {'lr': 0.0004625477103945722, 'samples': 5399232, 'steps': 28120, 'loss/train': 1.3789361715316772} -08/30/2021 18:12:01 - INFO - __main__ - Step 28122: {'lr': 0.00046254491648043604, 'samples': 5399424, 'steps': 28121, 'loss/train': 0.5235848426818848} -08/30/2021 18:12:01 - INFO - __main__ - Step 28123: {'lr': 0.00046254212247053055, 'samples': 5399616, 'steps': 28122, 'loss/train': 1.7202489376068115} -08/30/2021 18:12:01 - INFO - __main__ - Step 28124: {'lr': 0.0004625393283648568, 'samples': 5399808, 'steps': 28123, 'loss/train': 1.5611282587051392} -08/30/2021 18:12:02 - INFO - __main__ - Step 28125: {'lr': 0.0004625365341634161, 'samples': 5400000, 'steps': 28124, 'loss/train': 1.266133427619934} -08/30/2021 18:12:03 - INFO - __main__ - Step 28126: {'lr': 0.00046253373986620985, 'samples': 5400192, 'steps': 28125, 'loss/train': 1.058297872543335} -08/30/2021 18:12:04 - INFO - __main__ - Step 28127: {'lr': 0.00046253094547323904, 'samples': 5400384, 'steps': 28126, 'loss/train': 1.3797509670257568} -08/30/2021 18:12:04 - INFO - __main__ - Step 28128: {'lr': 0.0004625281509845051, 'samples': 5400576, 'steps': 28127, 'loss/train': 1.6242307424545288} -08/30/2021 18:12:04 - INFO - __main__ - Step 28129: {'lr': 0.0004625253564000092, 'samples': 5400768, 'steps': 28128, 'loss/train': 0.6565216183662415} -08/30/2021 18:12:05 - INFO - __main__ - Step 28130: {'lr': 0.00046252256171975273, 'samples': 5400960, 'steps': 28129, 'loss/train': 1.4239695072174072} -08/30/2021 18:12:06 - INFO - __main__ - Step 28131: {'lr': 0.0004625197669437368, 'samples': 5401152, 'steps': 28130, 'loss/train': 2.020134449005127} -08/30/2021 18:12:07 - INFO - __main__ - Step 28132: {'lr': 0.0004625169720719628, 'samples': 5401344, 'steps': 28131, 'loss/train': 1.8320237398147583} -08/30/2021 18:12:07 - INFO - __main__ - Step 28133: {'lr': 0.0004625141771044319, 'samples': 5401536, 'steps': 28132, 'loss/train': 1.5916252136230469} -08/30/2021 18:12:08 - INFO - __main__ - Step 28134: {'lr': 0.0004625113820411454, 'samples': 5401728, 'steps': 28133, 'loss/train': 1.3905489444732666} -08/30/2021 18:12:08 - INFO - __main__ - Step 28135: {'lr': 0.0004625085868821046, 'samples': 5401920, 'steps': 28134, 'loss/train': 1.620387077331543} -08/30/2021 18:12:09 - INFO - __main__ - Step 28136: {'lr': 0.0004625057916273107, 'samples': 5402112, 'steps': 28135, 'loss/train': 1.5118495225906372} -08/30/2021 18:12:10 - INFO - __main__ - Step 28137: {'lr': 0.00046250299627676486, 'samples': 5402304, 'steps': 28136, 'loss/train': 1.7144805192947388} -08/30/2021 18:12:10 - INFO - __main__ - Step 28138: {'lr': 0.0004625002008304685, 'samples': 5402496, 'steps': 28137, 'loss/train': 0.9722861051559448} -08/30/2021 18:12:11 - INFO - __main__ - Step 28139: {'lr': 0.00046249740528842286, 'samples': 5402688, 'steps': 28138, 'loss/train': 1.4861527681350708} -08/30/2021 18:12:11 - INFO - __main__ - Step 28140: {'lr': 0.00046249460965062917, 'samples': 5402880, 'steps': 28139, 'loss/train': 0.9521327018737793} -08/30/2021 18:12:11 - INFO - __main__ - Step 28141: {'lr': 0.0004624918139170887, 'samples': 5403072, 'steps': 28140, 'loss/train': 1.579189658164978} -08/30/2021 18:12:13 - INFO - __main__ - Step 28142: {'lr': 0.0004624890180878027, 'samples': 5403264, 'steps': 28141, 'loss/train': 2.330486297607422} -08/30/2021 18:12:13 - INFO - __main__ - Step 28143: {'lr': 0.00046248622216277235, 'samples': 5403456, 'steps': 28142, 'loss/train': 1.2355427742004395} -08/30/2021 18:12:13 - INFO - __main__ - Step 28144: {'lr': 0.0004624834261419991, 'samples': 5403648, 'steps': 28143, 'loss/train': 1.6283841133117676} -08/30/2021 18:12:14 - INFO - __main__ - Step 28145: {'lr': 0.000462480630025484, 'samples': 5403840, 'steps': 28144, 'loss/train': 0.5533981323242188} -08/30/2021 18:12:14 - INFO - __main__ - Step 28146: {'lr': 0.0004624778338132285, 'samples': 5404032, 'steps': 28145, 'loss/train': 1.2688381671905518} -08/30/2021 18:12:16 - INFO - __main__ - Step 28147: {'lr': 0.0004624750375052337, 'samples': 5404224, 'steps': 28146, 'loss/train': 1.3087410926818848} -08/30/2021 18:12:17 - INFO - __main__ - Step 28148: {'lr': 0.0004624722411015009, 'samples': 5404416, 'steps': 28147, 'loss/train': 1.15404212474823} -08/30/2021 18:12:17 - INFO - __main__ - Step 28149: {'lr': 0.0004624694446020314, 'samples': 5404608, 'steps': 28148, 'loss/train': 1.3155434131622314} -08/30/2021 18:12:17 - INFO - __main__ - Step 28150: {'lr': 0.0004624666480068265, 'samples': 5404800, 'steps': 28149, 'loss/train': 0.2286374717950821} -08/30/2021 18:12:18 - INFO - __main__ - Step 28151: {'lr': 0.0004624638513158874, 'samples': 5404992, 'steps': 28150, 'loss/train': 1.9606057405471802} -08/30/2021 18:12:19 - INFO - __main__ - Step 28152: {'lr': 0.0004624610545292154, 'samples': 5405184, 'steps': 28151, 'loss/train': 1.2808737754821777} -08/30/2021 18:12:20 - INFO - __main__ - Step 28153: {'lr': 0.00046245825764681166, 'samples': 5405376, 'steps': 28152, 'loss/train': 2.141594409942627} -08/30/2021 18:12:20 - INFO - __main__ - Step 28154: {'lr': 0.0004624554606686775, 'samples': 5405568, 'steps': 28153, 'loss/train': 1.5030946731567383} -08/30/2021 18:12:21 - INFO - __main__ - Step 28155: {'lr': 0.0004624526635948142, 'samples': 5405760, 'steps': 28154, 'loss/train': 0.11189009994268417} -08/30/2021 18:12:21 - INFO - __main__ - Step 28156: {'lr': 0.000462449866425223, 'samples': 5405952, 'steps': 28155, 'loss/train': 0.05983877554535866} -08/30/2021 18:12:21 - INFO - __main__ - Step 28157: {'lr': 0.0004624470691599052, 'samples': 5406144, 'steps': 28156, 'loss/train': 1.673291802406311} -08/30/2021 18:12:23 - INFO - __main__ - Step 28158: {'lr': 0.00046244427179886207, 'samples': 5406336, 'steps': 28157, 'loss/train': 1.4050617218017578} -08/30/2021 18:12:23 - INFO - __main__ - Step 28159: {'lr': 0.0004624414743420947, 'samples': 5406528, 'steps': 28158, 'loss/train': 2.366166353225708} -08/30/2021 18:12:24 - INFO - __main__ - Step 28160: {'lr': 0.00046243867678960463, 'samples': 5406720, 'steps': 28159, 'loss/train': 1.3358148336410522} -08/30/2021 18:12:24 - INFO - __main__ - Step 28161: {'lr': 0.00046243587914139285, 'samples': 5406912, 'steps': 28160, 'loss/train': 1.6666492223739624} -08/30/2021 18:12:24 - INFO - __main__ - Step 28162: {'lr': 0.00046243308139746076, 'samples': 5407104, 'steps': 28161, 'loss/train': 1.4736043214797974} -08/30/2021 18:12:26 - INFO - __main__ - Step 28163: {'lr': 0.00046243028355780967, 'samples': 5407296, 'steps': 28162, 'loss/train': 1.0821442604064941} -08/30/2021 18:12:26 - INFO - __main__ - Step 28164: {'lr': 0.00046242748562244076, 'samples': 5407488, 'steps': 28163, 'loss/train': 0.5729638934135437} -08/30/2021 18:12:27 - INFO - __main__ - Step 28165: {'lr': 0.00046242468759135523, 'samples': 5407680, 'steps': 28164, 'loss/train': 1.7088289260864258} -08/30/2021 18:12:27 - INFO - __main__ - Step 28166: {'lr': 0.00046242188946455444, 'samples': 5407872, 'steps': 28165, 'loss/train': 1.187338948249817} -08/30/2021 18:12:28 - INFO - __main__ - Step 28167: {'lr': 0.0004624190912420397, 'samples': 5408064, 'steps': 28166, 'loss/train': 1.3360848426818848} -08/30/2021 18:12:29 - INFO - __main__ - Step 28168: {'lr': 0.0004624162929238121, 'samples': 5408256, 'steps': 28167, 'loss/train': 1.753943920135498} -08/30/2021 18:12:30 - INFO - __main__ - Step 28169: {'lr': 0.000462413494509873, 'samples': 5408448, 'steps': 28168, 'loss/train': 1.607373833656311} -08/30/2021 18:12:30 - INFO - __main__ - Step 28170: {'lr': 0.0004624106960002237, 'samples': 5408640, 'steps': 28169, 'loss/train': 1.3224910497665405} -08/30/2021 18:12:30 - INFO - __main__ - Step 28171: {'lr': 0.0004624078973948654, 'samples': 5408832, 'steps': 28170, 'loss/train': 0.07940766960382462} -08/30/2021 18:12:31 - INFO - __main__ - Step 28172: {'lr': 0.00046240509869379943, 'samples': 5409024, 'steps': 28171, 'loss/train': 1.4734846353530884} -08/30/2021 18:12:31 - INFO - __main__ - Step 28173: {'lr': 0.00046240229989702697, 'samples': 5409216, 'steps': 28172, 'loss/train': 1.5718226432800293} -08/30/2021 18:12:33 - INFO - __main__ - Step 28174: {'lr': 0.0004623995010045493, 'samples': 5409408, 'steps': 28173, 'loss/train': 1.8593250513076782} -08/30/2021 18:12:34 - INFO - __main__ - Step 28175: {'lr': 0.0004623967020163677, 'samples': 5409600, 'steps': 28174, 'loss/train': 1.6550480127334595} -08/30/2021 18:12:34 - INFO - __main__ - Step 28176: {'lr': 0.0004623939029324834, 'samples': 5409792, 'steps': 28175, 'loss/train': 1.3389935493469238} -08/30/2021 18:12:34 - INFO - __main__ - Step 28177: {'lr': 0.0004623911037528977, 'samples': 5409984, 'steps': 28176, 'loss/train': 1.6478055715560913} -08/30/2021 18:12:35 - INFO - __main__ - Step 28178: {'lr': 0.00046238830447761184, 'samples': 5410176, 'steps': 28177, 'loss/train': 1.7442591190338135} -08/30/2021 18:12:35 - INFO - __main__ - Step 28179: {'lr': 0.0004623855051066271, 'samples': 5410368, 'steps': 28178, 'loss/train': 1.2677836418151855} -08/30/2021 18:12:37 - INFO - __main__ - Step 28180: {'lr': 0.00046238270563994465, 'samples': 5410560, 'steps': 28179, 'loss/train': 1.6171486377716064} -08/30/2021 18:12:38 - INFO - __main__ - Step 28181: {'lr': 0.00046237990607756596, 'samples': 5410752, 'steps': 28180, 'loss/train': 1.4700666666030884} -08/30/2021 18:12:38 - INFO - __main__ - Step 28182: {'lr': 0.0004623771064194921, 'samples': 5410944, 'steps': 28181, 'loss/train': 0.5983209609985352} -08/30/2021 18:12:38 - INFO - __main__ - Step 28183: {'lr': 0.0004623743066657244, 'samples': 5411136, 'steps': 28182, 'loss/train': 0.4780607223510742} -08/30/2021 18:12:39 - INFO - __main__ - Step 28184: {'lr': 0.00046237150681626414, 'samples': 5411328, 'steps': 28183, 'loss/train': 0.4769774377346039} -08/30/2021 18:12:39 - INFO - __main__ - Step 28185: {'lr': 0.00046236870687111254, 'samples': 5411520, 'steps': 28184, 'loss/train': 1.4490569829940796} -08/30/2021 18:12:41 - INFO - __main__ - Step 28186: {'lr': 0.0004623659068302708, 'samples': 5411712, 'steps': 28185, 'loss/train': 0.22667363286018372} -08/30/2021 18:12:41 - INFO - __main__ - Step 28187: {'lr': 0.00046236310669374035, 'samples': 5411904, 'steps': 28186, 'loss/train': 2.009615898132324} -08/30/2021 18:12:41 - INFO - __main__ - Step 28188: {'lr': 0.0004623603064615223, 'samples': 5412096, 'steps': 28187, 'loss/train': 0.99207603931427} -08/30/2021 18:12:42 - INFO - __main__ - Step 28189: {'lr': 0.000462357506133618, 'samples': 5412288, 'steps': 28188, 'loss/train': 1.8395366668701172} -08/30/2021 18:12:42 - INFO - __main__ - Step 28190: {'lr': 0.00046235470571002877, 'samples': 5412480, 'steps': 28189, 'loss/train': 1.4065794944763184} -08/30/2021 18:12:42 - INFO - __main__ - Step 28191: {'lr': 0.00046235190519075564, 'samples': 5412672, 'steps': 28190, 'loss/train': 1.8146851062774658} -08/30/2021 18:12:44 - INFO - __main__ - Step 28192: {'lr': 0.00046234910457580014, 'samples': 5412864, 'steps': 28191, 'loss/train': 1.6898690462112427} -08/30/2021 18:12:45 - INFO - __main__ - Step 28193: {'lr': 0.0004623463038651633, 'samples': 5413056, 'steps': 28192, 'loss/train': 0.153415709733963} -08/30/2021 18:12:45 - INFO - __main__ - Step 28194: {'lr': 0.0004623435030588466, 'samples': 5413248, 'steps': 28193, 'loss/train': 1.0885311365127563} -08/30/2021 18:12:45 - INFO - __main__ - Step 28195: {'lr': 0.00046234070215685116, 'samples': 5413440, 'steps': 28194, 'loss/train': 1.56862473487854} -08/30/2021 18:12:46 - INFO - __main__ - Step 28196: {'lr': 0.0004623379011591782, 'samples': 5413632, 'steps': 28195, 'loss/train': 0.537412703037262} -08/30/2021 18:12:47 - INFO - __main__ - Step 28197: {'lr': 0.00046233510006582913, 'samples': 5413824, 'steps': 28196, 'loss/train': 1.6278892755508423} -08/30/2021 18:12:48 - INFO - __main__ - Step 28198: {'lr': 0.00046233229887680517, 'samples': 5414016, 'steps': 28197, 'loss/train': 2.501605749130249} -08/30/2021 18:12:48 - INFO - __main__ - Step 28199: {'lr': 0.00046232949759210753, 'samples': 5414208, 'steps': 28198, 'loss/train': 1.147364854812622} -08/30/2021 18:12:48 - INFO - __main__ - Step 28200: {'lr': 0.00046232669621173745, 'samples': 5414400, 'steps': 28199, 'loss/train': 1.6096371412277222} -08/30/2021 18:12:49 - INFO - __main__ - Step 28201: {'lr': 0.00046232389473569623, 'samples': 5414592, 'steps': 28200, 'loss/train': 1.3819606304168701} -08/30/2021 18:12:50 - INFO - __main__ - Step 28202: {'lr': 0.0004623210931639852, 'samples': 5414784, 'steps': 28201, 'loss/train': 2.25793719291687} -08/30/2021 18:12:51 - INFO - __main__ - Step 28203: {'lr': 0.00046231829149660553, 'samples': 5414976, 'steps': 28202, 'loss/train': 1.1932913064956665} -08/30/2021 18:12:51 - INFO - __main__ - Step 28204: {'lr': 0.00046231548973355854, 'samples': 5415168, 'steps': 28203, 'loss/train': 1.3090009689331055} -08/30/2021 18:12:51 - INFO - __main__ - Step 28205: {'lr': 0.00046231268787484545, 'samples': 5415360, 'steps': 28204, 'loss/train': 2.3537867069244385} -08/30/2021 18:12:52 - INFO - __main__ - Step 28206: {'lr': 0.0004623098859204675, 'samples': 5415552, 'steps': 28205, 'loss/train': 1.8150583505630493} -08/30/2021 18:12:53 - INFO - __main__ - Step 28207: {'lr': 0.00046230708387042603, 'samples': 5415744, 'steps': 28206, 'loss/train': 1.7018022537231445} -08/30/2021 18:12:54 - INFO - __main__ - Step 28208: {'lr': 0.0004623042817247223, 'samples': 5415936, 'steps': 28207, 'loss/train': 1.6013038158416748} -08/30/2021 18:12:54 - INFO - __main__ - Step 28209: {'lr': 0.00046230147948335746, 'samples': 5416128, 'steps': 28208, 'loss/train': 1.664321780204773} -08/30/2021 18:12:54 - INFO - __main__ - Step 28210: {'lr': 0.0004622986771463329, 'samples': 5416320, 'steps': 28209, 'loss/train': 1.4428523778915405} -08/30/2021 18:12:55 - INFO - __main__ - Step 28211: {'lr': 0.0004622958747136498, 'samples': 5416512, 'steps': 28210, 'loss/train': 1.4926539659500122} -08/30/2021 18:12:56 - INFO - __main__ - Step 28212: {'lr': 0.00046229307218530945, 'samples': 5416704, 'steps': 28211, 'loss/train': 1.5020993947982788} -08/30/2021 18:12:57 - INFO - __main__ - Step 28213: {'lr': 0.0004622902695613131, 'samples': 5416896, 'steps': 28212, 'loss/train': 1.1484891176223755} -08/30/2021 18:12:57 - INFO - __main__ - Step 28214: {'lr': 0.00046228746684166214, 'samples': 5417088, 'steps': 28213, 'loss/train': 1.8509457111358643} -08/30/2021 18:12:57 - INFO - __main__ - Step 28215: {'lr': 0.00046228466402635764, 'samples': 5417280, 'steps': 28214, 'loss/train': 1.9831180572509766} -08/30/2021 18:12:58 - INFO - __main__ - Step 28216: {'lr': 0.0004622818611154009, 'samples': 5417472, 'steps': 28215, 'loss/train': 1.021217942237854} -08/30/2021 18:12:58 - INFO - __main__ - Step 28217: {'lr': 0.00046227905810879334, 'samples': 5417664, 'steps': 28216, 'loss/train': 0.9175899028778076} -08/30/2021 18:13:00 - INFO - __main__ - Step 28218: {'lr': 0.0004622762550065361, 'samples': 5417856, 'steps': 28217, 'loss/train': 1.1760281324386597} -08/30/2021 18:13:00 - INFO - __main__ - Step 28219: {'lr': 0.0004622734518086304, 'samples': 5418048, 'steps': 28218, 'loss/train': 1.3560354709625244} -08/30/2021 18:13:01 - INFO - __main__ - Step 28220: {'lr': 0.0004622706485150776, 'samples': 5418240, 'steps': 28219, 'loss/train': 1.9772204160690308} -08/30/2021 18:13:01 - INFO - __main__ - Step 28221: {'lr': 0.0004622678451258788, 'samples': 5418432, 'steps': 28220, 'loss/train': 2.1146113872528076} -08/30/2021 18:13:01 - INFO - __main__ - Step 28222: {'lr': 0.00046226504164103557, 'samples': 5418624, 'steps': 28221, 'loss/train': 1.2535582780838013} -08/30/2021 18:13:03 - INFO - __main__ - Step 28223: {'lr': 0.0004622622380605489, 'samples': 5418816, 'steps': 28222, 'loss/train': 0.22345010936260223} -08/30/2021 18:13:03 - INFO - __main__ - Step 28224: {'lr': 0.0004622594343844201, 'samples': 5419008, 'steps': 28223, 'loss/train': 1.1060556173324585} -08/30/2021 18:13:04 - INFO - __main__ - Step 28225: {'lr': 0.00046225663061265056, 'samples': 5419200, 'steps': 28224, 'loss/train': 1.5601060390472412} -08/30/2021 18:13:04 - INFO - __main__ - Step 28226: {'lr': 0.0004622538267452414, 'samples': 5419392, 'steps': 28225, 'loss/train': 1.9933298826217651} -08/30/2021 18:13:04 - INFO - __main__ - Step 28227: {'lr': 0.00046225102278219394, 'samples': 5419584, 'steps': 28226, 'loss/train': 1.4421290159225464} -08/30/2021 18:13:07 - INFO - __main__ - Step 28228: {'lr': 0.0004622482187235094, 'samples': 5419776, 'steps': 28227, 'loss/train': 1.6272094249725342} -08/30/2021 18:13:07 - INFO - __main__ - Step 28229: {'lr': 0.00046224541456918916, 'samples': 5419968, 'steps': 28228, 'loss/train': 1.554030418395996} -08/30/2021 18:13:07 - INFO - __main__ - Step 28230: {'lr': 0.0004622426103192344, 'samples': 5420160, 'steps': 28229, 'loss/train': 1.3759022951126099} -08/30/2021 18:13:08 - INFO - __main__ - Step 28231: {'lr': 0.00046223980597364647, 'samples': 5420352, 'steps': 28230, 'loss/train': 1.3608697652816772} -08/30/2021 18:13:08 - INFO - __main__ - Step 28232: {'lr': 0.0004622370015324264, 'samples': 5420544, 'steps': 28231, 'loss/train': 2.0276691913604736} -08/30/2021 18:13:08 - INFO - __main__ - Step 28233: {'lr': 0.0004622341969955757, 'samples': 5420736, 'steps': 28232, 'loss/train': 1.8577359914779663} -08/30/2021 18:13:10 - INFO - __main__ - Step 28234: {'lr': 0.00046223139236309553, 'samples': 5420928, 'steps': 28233, 'loss/train': 0.9461192488670349} -08/30/2021 18:13:11 - INFO - __main__ - Step 28235: {'lr': 0.0004622285876349872, 'samples': 5421120, 'steps': 28234, 'loss/train': 0.7482120990753174} -08/30/2021 18:13:11 - INFO - __main__ - Step 28236: {'lr': 0.00046222578281125194, 'samples': 5421312, 'steps': 28235, 'loss/train': 1.4742566347122192} -08/30/2021 18:13:11 - INFO - __main__ - Step 28237: {'lr': 0.0004622229778918909, 'samples': 5421504, 'steps': 28236, 'loss/train': 0.9649300575256348} -08/30/2021 18:13:12 - INFO - __main__ - Step 28238: {'lr': 0.00046222017287690566, 'samples': 5421696, 'steps': 28237, 'loss/train': 1.6385213136672974} -08/30/2021 18:13:14 - INFO - __main__ - Step 28239: {'lr': 0.00046221736776629713, 'samples': 5421888, 'steps': 28238, 'loss/train': 1.564038872718811} -08/30/2021 18:13:14 - INFO - __main__ - Step 28240: {'lr': 0.0004622145625600668, 'samples': 5422080, 'steps': 28239, 'loss/train': 1.3118025064468384} -08/30/2021 18:13:15 - INFO - __main__ - Step 28241: {'lr': 0.00046221175725821585, 'samples': 5422272, 'steps': 28240, 'loss/train': 1.225050687789917} -08/30/2021 18:13:15 - INFO - __main__ - Step 28242: {'lr': 0.00046220895186074553, 'samples': 5422464, 'steps': 28241, 'loss/train': 1.1002739667892456} -08/30/2021 18:13:15 - INFO - __main__ - Step 28243: {'lr': 0.0004622061463676572, 'samples': 5422656, 'steps': 28242, 'loss/train': 1.6412336826324463} -08/30/2021 18:13:16 - INFO - __main__ - Step 28244: {'lr': 0.000462203340778952, 'samples': 5422848, 'steps': 28243, 'loss/train': 1.8457484245300293} -08/30/2021 18:13:16 - INFO - __main__ - Step 28245: {'lr': 0.0004622005350946312, 'samples': 5423040, 'steps': 28244, 'loss/train': 0.09960411489009857} -08/30/2021 18:13:17 - INFO - __main__ - Step 28246: {'lr': 0.00046219772931469617, 'samples': 5423232, 'steps': 28245, 'loss/train': 1.8270965814590454} -08/30/2021 18:13:18 - INFO - __main__ - Step 28247: {'lr': 0.00046219492343914815, 'samples': 5423424, 'steps': 28246, 'loss/train': 1.3844245672225952} -08/30/2021 18:13:18 - INFO - __main__ - Step 28248: {'lr': 0.00046219211746798835, 'samples': 5423616, 'steps': 28247, 'loss/train': 1.5090340375900269} -08/30/2021 18:13:19 - INFO - __main__ - Step 28249: {'lr': 0.000462189311401218, 'samples': 5423808, 'steps': 28248, 'loss/train': 1.3838329315185547} -08/30/2021 18:13:20 - INFO - __main__ - Step 28250: {'lr': 0.0004621865052388385, 'samples': 5424000, 'steps': 28249, 'loss/train': 1.3188226222991943} -08/30/2021 18:13:20 - INFO - __main__ - Step 28251: {'lr': 0.00046218369898085097, 'samples': 5424192, 'steps': 28250, 'loss/train': 0.8289266228675842} -08/30/2021 18:13:21 - INFO - __main__ - Step 28252: {'lr': 0.0004621808926272568, 'samples': 5424384, 'steps': 28251, 'loss/train': 1.43550705909729} -08/30/2021 18:13:21 - INFO - __main__ - Step 28253: {'lr': 0.0004621780861780572, 'samples': 5424576, 'steps': 28252, 'loss/train': 1.619834303855896} -08/30/2021 18:13:21 - INFO - __main__ - Step 28254: {'lr': 0.00046217527963325335, 'samples': 5424768, 'steps': 28253, 'loss/train': 1.370830774307251} -08/30/2021 18:13:22 - INFO - __main__ - Step 28255: {'lr': 0.00046217247299284666, 'samples': 5424960, 'steps': 28254, 'loss/train': 1.5683119297027588} -08/30/2021 18:13:23 - INFO - __main__ - Step 28256: {'lr': 0.00046216966625683834, 'samples': 5425152, 'steps': 28255, 'loss/train': 1.78057861328125} -08/30/2021 18:13:24 - INFO - __main__ - Step 28257: {'lr': 0.00046216685942522957, 'samples': 5425344, 'steps': 28256, 'loss/train': 1.5489559173583984} -08/30/2021 18:13:24 - INFO - __main__ - Step 28258: {'lr': 0.00046216405249802176, 'samples': 5425536, 'steps': 28257, 'loss/train': 0.8627528548240662} -08/30/2021 18:13:25 - INFO - __main__ - Step 28259: {'lr': 0.000462161245475216, 'samples': 5425728, 'steps': 28258, 'loss/train': 1.8499099016189575} -08/30/2021 18:13:25 - INFO - __main__ - Step 28260: {'lr': 0.0004621584383568137, 'samples': 5425920, 'steps': 28259, 'loss/train': 1.62791907787323} -08/30/2021 18:13:27 - INFO - __main__ - Step 28261: {'lr': 0.00046215563114281613, 'samples': 5426112, 'steps': 28260, 'loss/train': 1.87300443649292} -08/30/2021 18:13:27 - INFO - __main__ - Step 28262: {'lr': 0.0004621528238332245, 'samples': 5426304, 'steps': 28261, 'loss/train': 1.4125200510025024} -08/30/2021 18:13:28 - INFO - __main__ - Step 28263: {'lr': 0.00046215001642804, 'samples': 5426496, 'steps': 28262, 'loss/train': 1.8862314224243164} -08/30/2021 18:13:28 - INFO - __main__ - Step 28264: {'lr': 0.0004621472089272641, 'samples': 5426688, 'steps': 28263, 'loss/train': 1.7736948728561401} -08/30/2021 18:13:28 - INFO - __main__ - Step 28265: {'lr': 0.0004621444013308979, 'samples': 5426880, 'steps': 28264, 'loss/train': 0.8786599636077881} -08/30/2021 18:13:30 - INFO - __main__ - Step 28266: {'lr': 0.00046214159363894264, 'samples': 5427072, 'steps': 28265, 'loss/train': 1.8863425254821777} -08/30/2021 18:13:30 - INFO - __main__ - Step 28267: {'lr': 0.0004621387858513997, 'samples': 5427264, 'steps': 28266, 'loss/train': 1.5940356254577637} -08/30/2021 18:13:31 - INFO - __main__ - Step 28268: {'lr': 0.0004621359779682703, 'samples': 5427456, 'steps': 28267, 'loss/train': 1.152202844619751} -08/30/2021 18:13:31 - INFO - __main__ - Step 28269: {'lr': 0.0004621331699895557, 'samples': 5427648, 'steps': 28268, 'loss/train': 1.841621994972229} -08/30/2021 18:13:31 - INFO - __main__ - Step 28270: {'lr': 0.00046213036191525714, 'samples': 5427840, 'steps': 28269, 'loss/train': 1.209489107131958} -08/30/2021 18:13:33 - INFO - __main__ - Step 28271: {'lr': 0.00046212755374537594, 'samples': 5428032, 'steps': 28270, 'loss/train': 2.1603636741638184} -08/30/2021 18:13:34 - INFO - __main__ - Step 28272: {'lr': 0.0004621247454799133, 'samples': 5428224, 'steps': 28271, 'loss/train': 2.1762497425079346} -08/30/2021 18:13:34 - INFO - __main__ - Step 28273: {'lr': 0.0004621219371188706, 'samples': 5428416, 'steps': 28272, 'loss/train': 1.7961615324020386} -08/30/2021 18:13:34 - INFO - __main__ - Step 28274: {'lr': 0.0004621191286622489, 'samples': 5428608, 'steps': 28273, 'loss/train': 1.6145116090774536} -08/30/2021 18:13:35 - INFO - __main__ - Step 28275: {'lr': 0.00046211632011004973, 'samples': 5428800, 'steps': 28274, 'loss/train': 1.9258496761322021} -08/30/2021 18:13:35 - INFO - __main__ - Step 28276: {'lr': 0.0004621135114622742, 'samples': 5428992, 'steps': 28275, 'loss/train': 1.7441402673721313} -08/30/2021 18:13:37 - INFO - __main__ - Step 28277: {'lr': 0.00046211070271892353, 'samples': 5429184, 'steps': 28276, 'loss/train': 1.7774789333343506} -08/30/2021 18:13:37 - INFO - __main__ - Step 28278: {'lr': 0.00046210789387999906, 'samples': 5429376, 'steps': 28277, 'loss/train': 1.2015700340270996} -08/30/2021 18:13:37 - INFO - __main__ - Step 28279: {'lr': 0.00046210508494550206, 'samples': 5429568, 'steps': 28278, 'loss/train': 1.683435082435608} -08/30/2021 18:13:38 - INFO - __main__ - Step 28280: {'lr': 0.0004621022759154338, 'samples': 5429760, 'steps': 28279, 'loss/train': 1.4273407459259033} -08/30/2021 18:13:38 - INFO - __main__ - Step 28281: {'lr': 0.0004620994667897955, 'samples': 5429952, 'steps': 28280, 'loss/train': 1.6851435899734497} -08/30/2021 18:13:40 - INFO - __main__ - Step 28282: {'lr': 0.0004620966575685885, 'samples': 5430144, 'steps': 28281, 'loss/train': 1.733172059059143} -08/30/2021 18:13:40 - INFO - __main__ - Step 28283: {'lr': 0.000462093848251814, 'samples': 5430336, 'steps': 28282, 'loss/train': 2.0656027793884277} -08/30/2021 18:13:40 - INFO - __main__ - Step 28284: {'lr': 0.00046209103883947323, 'samples': 5430528, 'steps': 28283, 'loss/train': 2.0980305671691895} -08/30/2021 18:13:41 - INFO - __main__ - Step 28285: {'lr': 0.00046208822933156756, 'samples': 5430720, 'steps': 28284, 'loss/train': 0.9545504450798035} -08/30/2021 18:13:41 - INFO - __main__ - Step 28286: {'lr': 0.00046208541972809824, 'samples': 5430912, 'steps': 28285, 'loss/train': 1.118975281715393} -08/30/2021 18:13:43 - INFO - __main__ - Step 28287: {'lr': 0.00046208261002906643, 'samples': 5431104, 'steps': 28286, 'loss/train': 1.6077806949615479} -08/30/2021 18:13:44 - INFO - __main__ - Step 28288: {'lr': 0.00046207980023447347, 'samples': 5431296, 'steps': 28287, 'loss/train': 1.4952181577682495} -08/30/2021 18:13:44 - INFO - __main__ - Step 28289: {'lr': 0.0004620769903443207, 'samples': 5431488, 'steps': 28288, 'loss/train': 1.4617315530776978} -08/30/2021 18:13:44 - INFO - __main__ - Step 28290: {'lr': 0.00046207418035860927, 'samples': 5431680, 'steps': 28289, 'loss/train': 1.4859063625335693} -08/30/2021 18:13:45 - INFO - __main__ - Step 28291: {'lr': 0.00046207137027734046, 'samples': 5431872, 'steps': 28290, 'loss/train': 1.8514564037322998} -08/30/2021 18:13:47 - INFO - __main__ - Step 28292: {'lr': 0.00046206856010051555, 'samples': 5432064, 'steps': 28291, 'loss/train': 2.224961757659912} -08/30/2021 18:13:47 - INFO - __main__ - Step 28293: {'lr': 0.0004620657498281359, 'samples': 5432256, 'steps': 28292, 'loss/train': 0.8435643911361694} -08/30/2021 18:13:47 - INFO - __main__ - Step 28294: {'lr': 0.0004620629394602027, 'samples': 5432448, 'steps': 28293, 'loss/train': 1.0814980268478394} -08/30/2021 18:13:48 - INFO - __main__ - Step 28295: {'lr': 0.00046206012899671715, 'samples': 5432640, 'steps': 28294, 'loss/train': 1.6488440036773682} -08/30/2021 18:13:48 - INFO - __main__ - Step 28296: {'lr': 0.00046205731843768056, 'samples': 5432832, 'steps': 28295, 'loss/train': 0.16759580373764038} -08/30/2021 18:13:48 - INFO - __main__ - Step 28297: {'lr': 0.0004620545077830942, 'samples': 5433024, 'steps': 28296, 'loss/train': 1.2041758298873901} -08/30/2021 18:13:50 - INFO - __main__ - Step 28298: {'lr': 0.00046205169703295945, 'samples': 5433216, 'steps': 28297, 'loss/train': 0.05389319732785225} -08/30/2021 18:13:50 - INFO - __main__ - Step 28299: {'lr': 0.00046204888618727743, 'samples': 5433408, 'steps': 28298, 'loss/train': 1.9713691473007202} -08/30/2021 18:13:51 - INFO - __main__ - Step 28300: {'lr': 0.00046204607524604944, 'samples': 5433600, 'steps': 28299, 'loss/train': 1.9003307819366455} -08/30/2021 18:13:51 - INFO - __main__ - Step 28301: {'lr': 0.0004620432642092768, 'samples': 5433792, 'steps': 28300, 'loss/train': 1.5967423915863037} -08/30/2021 18:13:51 - INFO - __main__ - Step 28302: {'lr': 0.00046204045307696065, 'samples': 5433984, 'steps': 28301, 'loss/train': 1.4647635221481323} -08/30/2021 18:13:53 - INFO - __main__ - Step 28303: {'lr': 0.0004620376418491024, 'samples': 5434176, 'steps': 28302, 'loss/train': 1.2555168867111206} -08/30/2021 18:13:53 - INFO - __main__ - Step 28304: {'lr': 0.0004620348305257033, 'samples': 5434368, 'steps': 28303, 'loss/train': 1.426172137260437} -08/30/2021 18:13:54 - INFO - __main__ - Step 28305: {'lr': 0.00046203201910676453, 'samples': 5434560, 'steps': 28304, 'loss/train': 2.701510429382324} -08/30/2021 18:13:54 - INFO - __main__ - Step 28306: {'lr': 0.0004620292075922874, 'samples': 5434752, 'steps': 28305, 'loss/train': 0.5252964496612549} -08/30/2021 18:13:55 - INFO - __main__ - Step 28307: {'lr': 0.0004620263959822732, 'samples': 5434944, 'steps': 28306, 'loss/train': 1.3321943283081055} -08/30/2021 18:13:56 - INFO - __main__ - Step 28308: {'lr': 0.00046202358427672313, 'samples': 5435136, 'steps': 28307, 'loss/train': 1.5458296537399292} -08/30/2021 18:13:56 - INFO - __main__ - Step 28309: {'lr': 0.0004620207724756386, 'samples': 5435328, 'steps': 28308, 'loss/train': 2.0445430278778076} -08/30/2021 18:13:57 - INFO - __main__ - Step 28310: {'lr': 0.0004620179605790207, 'samples': 5435520, 'steps': 28309, 'loss/train': 1.6305828094482422} -08/30/2021 18:13:57 - INFO - __main__ - Step 28311: {'lr': 0.00046201514858687075, 'samples': 5435712, 'steps': 28310, 'loss/train': 1.4723097085952759} -08/30/2021 18:13:57 - INFO - __main__ - Step 28312: {'lr': 0.00046201233649919015, 'samples': 5435904, 'steps': 28311, 'loss/train': 1.7970898151397705} -08/30/2021 18:13:58 - INFO - __main__ - Step 28313: {'lr': 0.00046200952431598, 'samples': 5436096, 'steps': 28312, 'loss/train': 1.403132438659668} -08/30/2021 18:13:59 - INFO - __main__ - Step 28314: {'lr': 0.00046200671203724166, 'samples': 5436288, 'steps': 28313, 'loss/train': 1.559372067451477} -08/30/2021 18:14:00 - INFO - __main__ - Step 28315: {'lr': 0.00046200389966297633, 'samples': 5436480, 'steps': 28314, 'loss/train': 1.3774646520614624} -08/30/2021 18:14:00 - INFO - __main__ - Step 28316: {'lr': 0.00046200108719318537, 'samples': 5436672, 'steps': 28315, 'loss/train': 1.62782883644104} -08/30/2021 18:14:01 - INFO - __main__ - Step 28317: {'lr': 0.0004619982746278699, 'samples': 5436864, 'steps': 28316, 'loss/train': 1.450161099433899} -08/30/2021 18:14:01 - INFO - __main__ - Step 28318: {'lr': 0.00046199546196703134, 'samples': 5437056, 'steps': 28317, 'loss/train': 1.4043141603469849} -08/30/2021 18:14:02 - INFO - __main__ - Step 28319: {'lr': 0.0004619926492106709, 'samples': 5437248, 'steps': 28318, 'loss/train': 1.6663156747817993} -08/30/2021 18:14:03 - INFO - __main__ - Step 28320: {'lr': 0.0004619898363587899, 'samples': 5437440, 'steps': 28319, 'loss/train': 1.7252740859985352} -08/30/2021 18:14:03 - INFO - __main__ - Step 28321: {'lr': 0.00046198702341138944, 'samples': 5437632, 'steps': 28320, 'loss/train': 1.3548163175582886} -08/30/2021 18:14:04 - INFO - __main__ - Step 28322: {'lr': 0.00046198421036847093, 'samples': 5437824, 'steps': 28321, 'loss/train': 1.4695861339569092} -08/30/2021 18:14:04 - INFO - __main__ - Step 28323: {'lr': 0.00046198139723003563, 'samples': 5438016, 'steps': 28322, 'loss/train': 1.5358189344406128} -08/30/2021 18:14:05 - INFO - __main__ - Step 28324: {'lr': 0.00046197858399608477, 'samples': 5438208, 'steps': 28323, 'loss/train': 1.2871755361557007} -08/30/2021 18:14:06 - INFO - __main__ - Step 28325: {'lr': 0.00046197577066661965, 'samples': 5438400, 'steps': 28324, 'loss/train': 1.3666163682937622} -08/30/2021 18:14:06 - INFO - __main__ - Step 28326: {'lr': 0.0004619729572416415, 'samples': 5438592, 'steps': 28325, 'loss/train': 2.72617244720459} -08/30/2021 18:14:07 - INFO - __main__ - Step 28327: {'lr': 0.0004619701437211516, 'samples': 5438784, 'steps': 28326, 'loss/train': 1.4934099912643433} -08/30/2021 18:14:07 - INFO - __main__ - Step 28328: {'lr': 0.00046196733010515125, 'samples': 5438976, 'steps': 28327, 'loss/train': 1.6686969995498657} -08/30/2021 18:14:08 - INFO - __main__ - Step 28329: {'lr': 0.0004619645163936417, 'samples': 5439168, 'steps': 28328, 'loss/train': 1.957667350769043} -08/30/2021 18:14:09 - INFO - __main__ - Step 28330: {'lr': 0.0004619617025866242, 'samples': 5439360, 'steps': 28329, 'loss/train': 1.5146355628967285} -08/30/2021 18:14:09 - INFO - __main__ - Step 28331: {'lr': 0.00046195888868409994, 'samples': 5439552, 'steps': 28330, 'loss/train': 1.9308141469955444} -08/30/2021 18:14:10 - INFO - __main__ - Step 28332: {'lr': 0.0004619560746860704, 'samples': 5439744, 'steps': 28331, 'loss/train': 1.9257309436798096} -08/30/2021 18:14:10 - INFO - __main__ - Step 28333: {'lr': 0.0004619532605925366, 'samples': 5439936, 'steps': 28332, 'loss/train': 1.0161665678024292} -08/30/2021 18:14:10 - INFO - __main__ - Step 28334: {'lr': 0.00046195044640350003, 'samples': 5440128, 'steps': 28333, 'loss/train': 1.4778785705566406} -08/30/2021 18:14:12 - INFO - __main__ - Step 28335: {'lr': 0.00046194763211896187, 'samples': 5440320, 'steps': 28334, 'loss/train': 1.8597382307052612} -08/30/2021 18:14:12 - INFO - __main__ - Step 28336: {'lr': 0.0004619448177389233, 'samples': 5440512, 'steps': 28335, 'loss/train': 1.4075936079025269} -08/30/2021 18:14:13 - INFO - __main__ - Step 28337: {'lr': 0.0004619420032633857, 'samples': 5440704, 'steps': 28336, 'loss/train': 2.8559982776641846} -08/30/2021 18:14:13 - INFO - __main__ - Step 28338: {'lr': 0.0004619391886923503, 'samples': 5440896, 'steps': 28337, 'loss/train': 1.4946178197860718} -08/30/2021 18:14:13 - INFO - __main__ - Step 28339: {'lr': 0.0004619363740258184, 'samples': 5441088, 'steps': 28338, 'loss/train': 0.7726243138313293} -08/30/2021 18:14:15 - INFO - __main__ - Step 28340: {'lr': 0.00046193355926379124, 'samples': 5441280, 'steps': 28339, 'loss/train': 1.4866501092910767} -08/30/2021 18:14:16 - INFO - __main__ - Step 28341: {'lr': 0.00046193074440627, 'samples': 5441472, 'steps': 28340, 'loss/train': 1.4543671607971191} -08/30/2021 18:14:16 - INFO - __main__ - Step 28342: {'lr': 0.0004619279294532561, 'samples': 5441664, 'steps': 28341, 'loss/train': 1.950999140739441} -08/30/2021 18:14:16 - INFO - __main__ - Step 28343: {'lr': 0.00046192511440475083, 'samples': 5441856, 'steps': 28342, 'loss/train': 1.2707509994506836} -08/30/2021 18:14:17 - INFO - __main__ - Step 28344: {'lr': 0.00046192229926075526, 'samples': 5442048, 'steps': 28343, 'loss/train': 1.6523293256759644} -08/30/2021 18:14:18 - INFO - __main__ - Step 28345: {'lr': 0.0004619194840212708, 'samples': 5442240, 'steps': 28344, 'loss/train': 1.6364619731903076} -08/30/2021 18:14:19 - INFO - __main__ - Step 28346: {'lr': 0.0004619166686862987, 'samples': 5442432, 'steps': 28345, 'loss/train': 1.5701013803482056} -08/30/2021 18:14:19 - INFO - __main__ - Step 28347: {'lr': 0.0004619138532558402, 'samples': 5442624, 'steps': 28346, 'loss/train': 1.5248124599456787} -08/30/2021 18:14:19 - INFO - __main__ - Step 28348: {'lr': 0.00046191103772989664, 'samples': 5442816, 'steps': 28347, 'loss/train': 1.0147887468338013} -08/30/2021 18:14:20 - INFO - __main__ - Step 28349: {'lr': 0.00046190822210846917, 'samples': 5443008, 'steps': 28348, 'loss/train': 1.3319716453552246} -08/30/2021 18:14:21 - INFO - __main__ - Step 28350: {'lr': 0.0004619054063915592, 'samples': 5443200, 'steps': 28349, 'loss/train': 1.3324525356292725} -08/30/2021 18:14:22 - INFO - __main__ - Step 28351: {'lr': 0.00046190259057916786, 'samples': 5443392, 'steps': 28350, 'loss/train': 0.8180599212646484} -08/30/2021 18:14:22 - INFO - __main__ - Step 28352: {'lr': 0.0004618997746712965, 'samples': 5443584, 'steps': 28351, 'loss/train': 1.5923995971679688} -08/30/2021 18:14:22 - INFO - __main__ - Step 28353: {'lr': 0.00046189695866794635, 'samples': 5443776, 'steps': 28352, 'loss/train': 1.2761247158050537} -08/30/2021 18:14:23 - INFO - __main__ - Step 28354: {'lr': 0.00046189414256911875, 'samples': 5443968, 'steps': 28353, 'loss/train': 2.637528419494629} -08/30/2021 18:14:25 - INFO - __main__ - Step 28355: {'lr': 0.0004618913263748149, 'samples': 5444160, 'steps': 28354, 'loss/train': 1.7462899684906006} -08/30/2021 18:14:25 - INFO - __main__ - Step 28356: {'lr': 0.0004618885100850361, 'samples': 5444352, 'steps': 28355, 'loss/train': 1.6216866970062256} -08/30/2021 18:14:26 - INFO - __main__ - Step 28357: {'lr': 0.0004618856936997836, 'samples': 5444544, 'steps': 28356, 'loss/train': 1.2861307859420776} -08/30/2021 18:14:26 - INFO - __main__ - Step 28358: {'lr': 0.0004618828772190586, 'samples': 5444736, 'steps': 28357, 'loss/train': 1.8551957607269287} -08/30/2021 18:14:26 - INFO - __main__ - Step 28359: {'lr': 0.0004618800606428626, 'samples': 5444928, 'steps': 28358, 'loss/train': 1.779967188835144} -08/30/2021 18:14:27 - INFO - __main__ - Step 28360: {'lr': 0.00046187724397119657, 'samples': 5445120, 'steps': 28359, 'loss/train': 1.662474513053894} -08/30/2021 18:14:29 - INFO - __main__ - Step 28361: {'lr': 0.000461874427204062, 'samples': 5445312, 'steps': 28360, 'loss/train': 1.8396095037460327} -08/30/2021 18:14:29 - INFO - __main__ - Step 28362: {'lr': 0.00046187161034146, 'samples': 5445504, 'steps': 28361, 'loss/train': 1.1978753805160522} -08/30/2021 18:14:29 - INFO - __main__ - Step 28363: {'lr': 0.00046186879338339207, 'samples': 5445696, 'steps': 28362, 'loss/train': 1.5329073667526245} -08/30/2021 18:14:30 - INFO - __main__ - Step 28364: {'lr': 0.0004618659763298592, 'samples': 5445888, 'steps': 28363, 'loss/train': 1.1845771074295044} -08/30/2021 18:14:30 - INFO - __main__ - Step 28365: {'lr': 0.00046186315918086285, 'samples': 5446080, 'steps': 28364, 'loss/train': 1.5781322717666626} -08/30/2021 18:14:30 - INFO - __main__ - Step 28366: {'lr': 0.0004618603419364042, 'samples': 5446272, 'steps': 28365, 'loss/train': 1.47245192527771} -08/30/2021 18:14:32 - INFO - __main__ - Step 28367: {'lr': 0.00046185752459648456, 'samples': 5446464, 'steps': 28366, 'loss/train': 0.07523348927497864} -08/30/2021 18:14:33 - INFO - __main__ - Step 28368: {'lr': 0.00046185470716110516, 'samples': 5446656, 'steps': 28367, 'loss/train': 1.4055206775665283} -08/30/2021 18:14:33 - INFO - __main__ - Step 28369: {'lr': 0.00046185188963026734, 'samples': 5446848, 'steps': 28368, 'loss/train': 3.3890609741210938} -08/30/2021 18:14:33 - INFO - __main__ - Step 28370: {'lr': 0.0004618490720039723, 'samples': 5447040, 'steps': 28369, 'loss/train': 1.3116455078125} -08/30/2021 18:14:34 - INFO - __main__ - Step 28371: {'lr': 0.0004618462542822214, 'samples': 5447232, 'steps': 28370, 'loss/train': 1.5488499402999878} -08/30/2021 18:14:34 - INFO - __main__ - Step 28372: {'lr': 0.0004618434364650158, 'samples': 5447424, 'steps': 28371, 'loss/train': 1.957581639289856} -08/30/2021 18:14:36 - INFO - __main__ - Step 28373: {'lr': 0.00046184061855235683, 'samples': 5447616, 'steps': 28372, 'loss/train': 1.416306495666504} -08/30/2021 18:14:36 - INFO - __main__ - Step 28374: {'lr': 0.00046183780054424574, 'samples': 5447808, 'steps': 28373, 'loss/train': 1.3398233652114868} -08/30/2021 18:14:36 - INFO - __main__ - Step 28375: {'lr': 0.00046183498244068376, 'samples': 5448000, 'steps': 28374, 'loss/train': 1.2787036895751953} -08/30/2021 18:14:37 - INFO - __main__ - Step 28376: {'lr': 0.00046183216424167226, 'samples': 5448192, 'steps': 28375, 'loss/train': 1.8297516107559204} -08/30/2021 18:14:37 - INFO - __main__ - Step 28377: {'lr': 0.0004618293459472124, 'samples': 5448384, 'steps': 28376, 'loss/train': 1.5445353984832764} -08/30/2021 18:14:39 - INFO - __main__ - Step 28378: {'lr': 0.0004618265275573056, 'samples': 5448576, 'steps': 28377, 'loss/train': 2.1174182891845703} -08/30/2021 18:14:39 - INFO - __main__ - Step 28379: {'lr': 0.00046182370907195294, 'samples': 5448768, 'steps': 28378, 'loss/train': 1.0556801557540894} -08/30/2021 18:14:40 - INFO - __main__ - Step 28380: {'lr': 0.00046182089049115585, 'samples': 5448960, 'steps': 28379, 'loss/train': 4.267399787902832} -08/30/2021 18:14:40 - INFO - __main__ - Step 28381: {'lr': 0.0004618180718149155, 'samples': 5449152, 'steps': 28380, 'loss/train': 1.6334525346755981} -08/30/2021 18:14:40 - INFO - __main__ - Step 28382: {'lr': 0.00046181525304323325, 'samples': 5449344, 'steps': 28381, 'loss/train': 1.448195219039917} -08/30/2021 18:14:42 - INFO - __main__ - Step 28383: {'lr': 0.0004618124341761102, 'samples': 5449536, 'steps': 28382, 'loss/train': 1.6182572841644287} -08/30/2021 18:14:42 - INFO - __main__ - Step 28384: {'lr': 0.0004618096152135478, 'samples': 5449728, 'steps': 28383, 'loss/train': 2.207749366760254} -08/30/2021 18:14:42 - INFO - __main__ - Step 28385: {'lr': 0.00046180679615554735, 'samples': 5449920, 'steps': 28384, 'loss/train': 2.3146650791168213} -08/30/2021 18:14:43 - INFO - __main__ - Step 28386: {'lr': 0.00046180397700210985, 'samples': 5450112, 'steps': 28385, 'loss/train': 1.8278053998947144} -08/30/2021 18:14:43 - INFO - __main__ - Step 28387: {'lr': 0.0004618011577532368, 'samples': 5450304, 'steps': 28386, 'loss/train': 1.7210609912872314} -08/30/2021 18:14:45 - INFO - __main__ - Step 28388: {'lr': 0.0004617983384089295, 'samples': 5450496, 'steps': 28387, 'loss/train': 1.3940378427505493} -08/30/2021 18:14:45 - INFO - __main__ - Step 28389: {'lr': 0.00046179551896918916, 'samples': 5450688, 'steps': 28388, 'loss/train': 0.582719624042511} -08/30/2021 18:14:46 - INFO - __main__ - Step 28390: {'lr': 0.00046179269943401693, 'samples': 5450880, 'steps': 28389, 'loss/train': 2.3339428901672363} -08/30/2021 18:14:46 - INFO - __main__ - Step 28391: {'lr': 0.00046178987980341414, 'samples': 5451072, 'steps': 28390, 'loss/train': 1.3789128065109253} -08/30/2021 18:14:47 - INFO - __main__ - Step 28392: {'lr': 0.00046178706007738227, 'samples': 5451264, 'steps': 28391, 'loss/train': 0.16868636012077332} -08/30/2021 18:14:47 - INFO - __main__ - Step 28393: {'lr': 0.0004617842402559223, 'samples': 5451456, 'steps': 28392, 'loss/train': 0.0908598005771637} -08/30/2021 18:14:48 - INFO - __main__ - Step 28394: {'lr': 0.0004617814203390356, 'samples': 5451648, 'steps': 28393, 'loss/train': 2.0442283153533936} -08/30/2021 18:14:49 - INFO - __main__ - Step 28395: {'lr': 0.0004617786003267235, 'samples': 5451840, 'steps': 28394, 'loss/train': 1.7698763608932495} -08/30/2021 18:14:49 - INFO - __main__ - Step 28396: {'lr': 0.00046177578021898717, 'samples': 5452032, 'steps': 28395, 'loss/train': 0.9512029886245728} -08/30/2021 18:14:50 - INFO - __main__ - Step 28397: {'lr': 0.000461772960015828, 'samples': 5452224, 'steps': 28396, 'loss/train': 1.8937252759933472} -08/30/2021 18:14:50 - INFO - __main__ - Step 28398: {'lr': 0.00046177013971724723, 'samples': 5452416, 'steps': 28397, 'loss/train': 2.0061144828796387} -08/30/2021 18:14:50 - INFO - __main__ - Step 28399: {'lr': 0.00046176731932324604, 'samples': 5452608, 'steps': 28398, 'loss/train': 1.6485087871551514} -08/30/2021 18:14:52 - INFO - __main__ - Step 28400: {'lr': 0.0004617644988338258, 'samples': 5452800, 'steps': 28399, 'loss/train': 1.1261181831359863} -08/30/2021 18:14:53 - INFO - __main__ - Step 28401: {'lr': 0.0004617616782489877, 'samples': 5452992, 'steps': 28400, 'loss/train': 0.9156551957130432} -08/30/2021 18:14:53 - INFO - __main__ - Step 28402: {'lr': 0.00046175885756873314, 'samples': 5453184, 'steps': 28401, 'loss/train': 0.07958393543958664} -08/30/2021 18:14:54 - INFO - __main__ - Step 28403: {'lr': 0.00046175603679306324, 'samples': 5453376, 'steps': 28402, 'loss/train': 1.9514942169189453} -08/30/2021 18:14:54 - INFO - __main__ - Step 28404: {'lr': 0.0004617532159219794, 'samples': 5453568, 'steps': 28403, 'loss/train': 1.5115739107131958} -08/30/2021 18:14:55 - INFO - __main__ - Step 28405: {'lr': 0.0004617503949554828, 'samples': 5453760, 'steps': 28404, 'loss/train': 2.2763118743896484} -08/30/2021 18:14:56 - INFO - __main__ - Step 28406: {'lr': 0.0004617475738935747, 'samples': 5453952, 'steps': 28405, 'loss/train': 1.9992116689682007} -08/30/2021 18:14:56 - INFO - __main__ - Step 28407: {'lr': 0.0004617447527362564, 'samples': 5454144, 'steps': 28406, 'loss/train': 1.4851759672164917} -08/30/2021 18:14:57 - INFO - __main__ - Step 28408: {'lr': 0.00046174193148352914, 'samples': 5454336, 'steps': 28407, 'loss/train': 1.3432347774505615} -08/30/2021 18:14:57 - INFO - __main__ - Step 28409: {'lr': 0.00046173911013539437, 'samples': 5454528, 'steps': 28408, 'loss/train': 2.709536075592041} -08/30/2021 18:14:58 - INFO - __main__ - Step 28410: {'lr': 0.0004617362886918531, 'samples': 5454720, 'steps': 28409, 'loss/train': 1.2044527530670166} -08/30/2021 18:14:59 - INFO - __main__ - Step 28411: {'lr': 0.0004617334671529069, 'samples': 5454912, 'steps': 28410, 'loss/train': 2.171020030975342} -08/30/2021 18:14:59 - INFO - __main__ - Step 28412: {'lr': 0.0004617306455185567, 'samples': 5455104, 'steps': 28411, 'loss/train': 1.7233283519744873} -08/30/2021 18:15:00 - INFO - __main__ - Step 28413: {'lr': 0.00046172782378880404, 'samples': 5455296, 'steps': 28412, 'loss/train': 1.5373201370239258} -08/30/2021 18:15:00 - INFO - __main__ - Step 28414: {'lr': 0.00046172500196364996, 'samples': 5455488, 'steps': 28413, 'loss/train': 1.5885015726089478} -08/30/2021 18:15:02 - INFO - __main__ - Step 28415: {'lr': 0.000461722180043096, 'samples': 5455680, 'steps': 28414, 'loss/train': 1.087518572807312} -08/30/2021 18:15:02 - INFO - __main__ - Step 28416: {'lr': 0.0004617193580271433, 'samples': 5455872, 'steps': 28415, 'loss/train': 1.7424510717391968} -08/30/2021 18:15:03 - INFO - __main__ - Step 28417: {'lr': 0.000461716535915793, 'samples': 5456064, 'steps': 28416, 'loss/train': 1.5177549123764038} -08/30/2021 18:15:03 - INFO - __main__ - Step 28418: {'lr': 0.0004617137137090466, 'samples': 5456256, 'steps': 28417, 'loss/train': 1.6655724048614502} -08/30/2021 18:15:03 - INFO - __main__ - Step 28419: {'lr': 0.0004617108914069052, 'samples': 5456448, 'steps': 28418, 'loss/train': 1.6813396215438843} -08/30/2021 18:15:04 - INFO - __main__ - Step 28420: {'lr': 0.0004617080690093701, 'samples': 5456640, 'steps': 28419, 'loss/train': 0.90381920337677} -08/30/2021 18:15:05 - INFO - __main__ - Step 28421: {'lr': 0.00046170524651644276, 'samples': 5456832, 'steps': 28420, 'loss/train': 1.3693146705627441} -08/30/2021 18:15:06 - INFO - __main__ - Step 28422: {'lr': 0.00046170242392812425, 'samples': 5457024, 'steps': 28421, 'loss/train': 1.5474826097488403} -08/30/2021 18:15:06 - INFO - __main__ - Step 28423: {'lr': 0.0004616996012444158, 'samples': 5457216, 'steps': 28422, 'loss/train': 2.1661765575408936} -08/30/2021 18:15:06 - INFO - __main__ - Step 28424: {'lr': 0.00046169677846531884, 'samples': 5457408, 'steps': 28423, 'loss/train': 1.5340081453323364} -08/30/2021 18:15:07 - INFO - __main__ - Step 28425: {'lr': 0.0004616939555908346, 'samples': 5457600, 'steps': 28424, 'loss/train': 1.557504415512085} -08/30/2021 18:15:08 - INFO - __main__ - Step 28426: {'lr': 0.0004616911326209643, 'samples': 5457792, 'steps': 28425, 'loss/train': 2.089592456817627} -08/30/2021 18:15:09 - INFO - __main__ - Step 28427: {'lr': 0.0004616883095557092, 'samples': 5457984, 'steps': 28426, 'loss/train': 1.8241089582443237} -08/30/2021 18:15:09 - INFO - __main__ - Step 28428: {'lr': 0.0004616854863950707, 'samples': 5458176, 'steps': 28427, 'loss/train': 0.5400580167770386} -08/30/2021 18:15:09 - INFO - __main__ - Step 28429: {'lr': 0.00046168266313904995, 'samples': 5458368, 'steps': 28428, 'loss/train': 2.1024491786956787} -08/30/2021 18:15:10 - INFO - __main__ - Step 28430: {'lr': 0.00046167983978764827, 'samples': 5458560, 'steps': 28429, 'loss/train': 1.6214874982833862} -08/30/2021 18:15:11 - INFO - __main__ - Step 28431: {'lr': 0.0004616770163408669, 'samples': 5458752, 'steps': 28430, 'loss/train': 1.847511649131775} -08/30/2021 18:15:12 - INFO - __main__ - Step 28432: {'lr': 0.00046167419279870715, 'samples': 5458944, 'steps': 28431, 'loss/train': 1.8810951709747314} -08/30/2021 18:15:12 - INFO - __main__ - Step 28433: {'lr': 0.00046167136916117025, 'samples': 5459136, 'steps': 28432, 'loss/train': 1.4094552993774414} -08/30/2021 18:15:12 - INFO - __main__ - Step 28434: {'lr': 0.00046166854542825756, 'samples': 5459328, 'steps': 28433, 'loss/train': 1.757566213607788} -08/30/2021 18:15:13 - INFO - __main__ - Step 28435: {'lr': 0.0004616657215999702, 'samples': 5459520, 'steps': 28434, 'loss/train': 1.060879111289978} -08/30/2021 18:15:14 - INFO - __main__ - Step 28436: {'lr': 0.0004616628976763096, 'samples': 5459712, 'steps': 28435, 'loss/train': 1.269731044769287} -08/30/2021 18:15:14 - INFO - __main__ - Step 28437: {'lr': 0.0004616600736572769, 'samples': 5459904, 'steps': 28436, 'loss/train': 1.401597261428833} -08/30/2021 18:15:15 - INFO - __main__ - Step 28438: {'lr': 0.0004616572495428735, 'samples': 5460096, 'steps': 28437, 'loss/train': 1.4698482751846313} -08/30/2021 18:15:15 - INFO - __main__ - Step 28439: {'lr': 0.0004616544253331006, 'samples': 5460288, 'steps': 28438, 'loss/train': 0.9774594902992249} -08/30/2021 18:15:15 - INFO - __main__ - Step 28440: {'lr': 0.00046165160102795943, 'samples': 5460480, 'steps': 28439, 'loss/train': 1.3149068355560303} -08/30/2021 18:15:17 - INFO - __main__ - Step 28441: {'lr': 0.0004616487766274514, 'samples': 5460672, 'steps': 28440, 'loss/train': 1.6768009662628174} -08/30/2021 18:15:18 - INFO - __main__ - Step 28442: {'lr': 0.0004616459521315777, 'samples': 5460864, 'steps': 28441, 'loss/train': 1.2131375074386597} -08/30/2021 18:15:18 - INFO - __main__ - Step 28443: {'lr': 0.0004616431275403395, 'samples': 5461056, 'steps': 28442, 'loss/train': 1.0739957094192505} -08/30/2021 18:15:18 - INFO - __main__ - Step 28444: {'lr': 0.0004616403028537382, 'samples': 5461248, 'steps': 28443, 'loss/train': 3.931757926940918} -08/30/2021 18:15:19 - INFO - __main__ - Step 28445: {'lr': 0.0004616374780717751, 'samples': 5461440, 'steps': 28444, 'loss/train': 1.139050841331482} -08/30/2021 18:15:19 - INFO - __main__ - Step 28446: {'lr': 0.0004616346531944514, 'samples': 5461632, 'steps': 28445, 'loss/train': 1.621245265007019} -08/30/2021 18:15:21 - INFO - __main__ - Step 28447: {'lr': 0.00046163182822176835, 'samples': 5461824, 'steps': 28446, 'loss/train': 1.4106972217559814} -08/30/2021 18:15:21 - INFO - __main__ - Step 28448: {'lr': 0.0004616290031537273, 'samples': 5462016, 'steps': 28447, 'loss/train': 0.29630017280578613} -08/30/2021 18:15:21 - INFO - __main__ - Step 28449: {'lr': 0.0004616261779903295, 'samples': 5462208, 'steps': 28448, 'loss/train': 1.1605528593063354} -08/30/2021 18:15:22 - INFO - __main__ - Step 28450: {'lr': 0.0004616233527315762, 'samples': 5462400, 'steps': 28449, 'loss/train': 1.7201234102249146} -08/30/2021 18:15:22 - INFO - __main__ - Step 28451: {'lr': 0.0004616205273774686, 'samples': 5462592, 'steps': 28450, 'loss/train': 1.6046078205108643} -08/30/2021 18:15:22 - INFO - __main__ - Step 28452: {'lr': 0.00046161770192800817, 'samples': 5462784, 'steps': 28451, 'loss/train': 1.3255046606063843} -08/30/2021 18:15:24 - INFO - __main__ - Step 28453: {'lr': 0.000461614876383196, 'samples': 5462976, 'steps': 28452, 'loss/train': 1.2627551555633545} -08/30/2021 18:15:25 - INFO - __main__ - Step 28454: {'lr': 0.0004616120507430335, 'samples': 5463168, 'steps': 28453, 'loss/train': 1.7005821466445923} -08/30/2021 18:15:25 - INFO - __main__ - Step 28455: {'lr': 0.00046160922500752176, 'samples': 5463360, 'steps': 28454, 'loss/train': 0.6630153656005859} -08/30/2021 18:15:25 - INFO - __main__ - Step 28456: {'lr': 0.0004616063991766623, 'samples': 5463552, 'steps': 28455, 'loss/train': 1.7326027154922485} -08/30/2021 18:15:26 - INFO - __main__ - Step 28457: {'lr': 0.0004616035732504562, 'samples': 5463744, 'steps': 28456, 'loss/train': 1.629073143005371} -08/30/2021 18:15:27 - INFO - __main__ - Step 28458: {'lr': 0.0004616007472289048, 'samples': 5463936, 'steps': 28457, 'loss/train': 1.4131532907485962} -08/30/2021 18:15:28 - INFO - __main__ - Step 28459: {'lr': 0.00046159792111200937, 'samples': 5464128, 'steps': 28458, 'loss/train': 1.3037713766098022} -08/30/2021 18:15:28 - INFO - __main__ - Step 28460: {'lr': 0.0004615950948997711, 'samples': 5464320, 'steps': 28459, 'loss/train': 1.4961373805999756} -08/30/2021 18:15:29 - INFO - __main__ - Step 28461: {'lr': 0.0004615922685921915, 'samples': 5464512, 'steps': 28460, 'loss/train': 1.4120932817459106} -08/30/2021 18:15:29 - INFO - __main__ - Step 28462: {'lr': 0.0004615894421892716, 'samples': 5464704, 'steps': 28461, 'loss/train': 1.5001535415649414} -08/30/2021 18:15:31 - INFO - __main__ - Step 28463: {'lr': 0.0004615866156910128, 'samples': 5464896, 'steps': 28462, 'loss/train': 1.1565515995025635} -08/30/2021 18:15:31 - INFO - __main__ - Step 28464: {'lr': 0.00046158378909741626, 'samples': 5465088, 'steps': 28463, 'loss/train': 2.036403179168701} -08/30/2021 18:15:31 - INFO - __main__ - Step 28465: {'lr': 0.00046158096240848343, 'samples': 5465280, 'steps': 28464, 'loss/train': 1.703019618988037} -08/30/2021 18:15:32 - INFO - __main__ - Step 28466: {'lr': 0.00046157813562421545, 'samples': 5465472, 'steps': 28465, 'loss/train': 1.6842516660690308} -08/30/2021 18:15:32 - INFO - __main__ - Step 28467: {'lr': 0.0004615753087446136, 'samples': 5465664, 'steps': 28466, 'loss/train': 1.8737887144088745} -08/30/2021 18:15:34 - INFO - __main__ - Step 28468: {'lr': 0.00046157248176967915, 'samples': 5465856, 'steps': 28467, 'loss/train': 1.8135250806808472} -08/30/2021 18:15:34 - INFO - __main__ - Step 28469: {'lr': 0.0004615696546994135, 'samples': 5466048, 'steps': 28468, 'loss/train': 1.4749095439910889} -08/30/2021 18:15:35 - INFO - __main__ - Step 28470: {'lr': 0.00046156682753381774, 'samples': 5466240, 'steps': 28469, 'loss/train': 1.223831295967102} -08/30/2021 18:15:35 - INFO - __main__ - Step 28471: {'lr': 0.0004615640002728932, 'samples': 5466432, 'steps': 28470, 'loss/train': 1.4210262298583984} -08/30/2021 18:15:35 - INFO - __main__ - Step 28472: {'lr': 0.00046156117291664133, 'samples': 5466624, 'steps': 28471, 'loss/train': 1.3265413045883179} -08/30/2021 18:15:36 - INFO - __main__ - Step 28473: {'lr': 0.0004615583454650632, 'samples': 5466816, 'steps': 28472, 'loss/train': 1.6798558235168457} -08/30/2021 18:15:37 - INFO - __main__ - Step 28474: {'lr': 0.00046155551791816007, 'samples': 5467008, 'steps': 28473, 'loss/train': 0.0545647032558918} -08/30/2021 18:15:38 - INFO - __main__ - Step 28475: {'lr': 0.00046155269027593337, 'samples': 5467200, 'steps': 28474, 'loss/train': 1.4392448663711548} -08/30/2021 18:15:38 - INFO - __main__ - Step 28476: {'lr': 0.00046154986253838426, 'samples': 5467392, 'steps': 28475, 'loss/train': 1.3955795764923096} -08/30/2021 18:15:38 - INFO - __main__ - Step 28477: {'lr': 0.00046154703470551405, 'samples': 5467584, 'steps': 28476, 'loss/train': 1.797864556312561} -08/30/2021 18:15:39 - INFO - __main__ - Step 28478: {'lr': 0.000461544206777324, 'samples': 5467776, 'steps': 28477, 'loss/train': 0.6715664267539978} -08/30/2021 18:15:40 - INFO - __main__ - Step 28479: {'lr': 0.00046154137875381547, 'samples': 5467968, 'steps': 28478, 'loss/train': 1.7450462579727173} -08/30/2021 18:15:41 - INFO - __main__ - Step 28480: {'lr': 0.00046153855063498964, 'samples': 5468160, 'steps': 28479, 'loss/train': 1.654579758644104} -08/30/2021 18:15:41 - INFO - __main__ - Step 28481: {'lr': 0.00046153572242084776, 'samples': 5468352, 'steps': 28480, 'loss/train': 1.3318246603012085} -08/30/2021 18:15:41 - INFO - __main__ - Step 28482: {'lr': 0.0004615328941113911, 'samples': 5468544, 'steps': 28481, 'loss/train': 1.3417713642120361} -08/30/2021 18:15:42 - INFO - __main__ - Step 28483: {'lr': 0.00046153006570662106, 'samples': 5468736, 'steps': 28482, 'loss/train': 1.5684040784835815} -08/30/2021 18:15:43 - INFO - __main__ - Step 28484: {'lr': 0.0004615272372065388, 'samples': 5468928, 'steps': 28483, 'loss/train': 1.7049928903579712} -08/30/2021 18:15:44 - INFO - __main__ - Step 28485: {'lr': 0.0004615244086111456, 'samples': 5469120, 'steps': 28484, 'loss/train': 1.32969331741333} -08/30/2021 18:15:44 - INFO - __main__ - Step 28486: {'lr': 0.00046152157992044283, 'samples': 5469312, 'steps': 28485, 'loss/train': 1.4608381986618042} -08/30/2021 18:15:44 - INFO - __main__ - Step 28487: {'lr': 0.0004615187511344316, 'samples': 5469504, 'steps': 28486, 'loss/train': 1.3725831508636475} -08/30/2021 18:15:45 - INFO - __main__ - Step 28488: {'lr': 0.00046151592225311347, 'samples': 5469696, 'steps': 28487, 'loss/train': 1.6761726140975952} -08/30/2021 18:15:46 - INFO - __main__ - Step 28489: {'lr': 0.0004615130932764894, 'samples': 5469888, 'steps': 28488, 'loss/train': 1.3599092960357666} -08/30/2021 18:15:46 - INFO - __main__ - Step 28490: {'lr': 0.0004615102642045608, 'samples': 5470080, 'steps': 28489, 'loss/train': 1.5636268854141235} -08/30/2021 18:15:47 - INFO - __main__ - Step 28491: {'lr': 0.00046150743503732897, 'samples': 5470272, 'steps': 28490, 'loss/train': 1.3444204330444336} -08/30/2021 18:15:47 - INFO - __main__ - Step 28492: {'lr': 0.0004615046057747951, 'samples': 5470464, 'steps': 28491, 'loss/train': 1.6677089929580688} -08/30/2021 18:15:48 - INFO - __main__ - Step 28493: {'lr': 0.0004615017764169606, 'samples': 5470656, 'steps': 28492, 'loss/train': 1.0866971015930176} -08/30/2021 18:15:49 - INFO - __main__ - Step 28494: {'lr': 0.00046149894696382655, 'samples': 5470848, 'steps': 28493, 'loss/train': 1.7957838773727417} -08/30/2021 18:15:50 - INFO - __main__ - Step 28495: {'lr': 0.00046149611741539445, 'samples': 5471040, 'steps': 28494, 'loss/train': 1.851419448852539} -08/30/2021 18:15:50 - INFO - __main__ - Step 28496: {'lr': 0.00046149328777166543, 'samples': 5471232, 'steps': 28495, 'loss/train': 1.5098599195480347} -08/30/2021 18:15:50 - INFO - __main__ - Step 28497: {'lr': 0.0004614904580326408, 'samples': 5471424, 'steps': 28496, 'loss/train': 1.1656744480133057} -08/30/2021 18:15:51 - INFO - __main__ - Step 28498: {'lr': 0.0004614876281983218, 'samples': 5471616, 'steps': 28497, 'loss/train': 2.112806797027588} -08/30/2021 18:15:51 - INFO - __main__ - Step 28499: {'lr': 0.0004614847982687097, 'samples': 5471808, 'steps': 28498, 'loss/train': 0.9596072435379028} -08/30/2021 18:15:53 - INFO - __main__ - Step 28500: {'lr': 0.0004614819682438059, 'samples': 5472000, 'steps': 28499, 'loss/train': 1.330038070678711} -08/30/2021 18:15:53 - INFO - __main__ - Step 28501: {'lr': 0.00046147913812361155, 'samples': 5472192, 'steps': 28500, 'loss/train': 0.7673311233520508} -08/30/2021 18:15:53 - INFO - __main__ - Step 28502: {'lr': 0.000461476307908128, 'samples': 5472384, 'steps': 28501, 'loss/train': 0.8263532519340515} -08/30/2021 18:15:54 - INFO - __main__ - Step 28503: {'lr': 0.00046147347759735647, 'samples': 5472576, 'steps': 28502, 'loss/train': 1.9476468563079834} -08/30/2021 18:15:54 - INFO - __main__ - Step 28504: {'lr': 0.00046147064719129823, 'samples': 5472768, 'steps': 28503, 'loss/train': 1.6908648014068604} -08/30/2021 18:15:56 - INFO - __main__ - Step 28505: {'lr': 0.00046146781668995456, 'samples': 5472960, 'steps': 28504, 'loss/train': 1.075881004333496} -08/30/2021 18:15:57 - INFO - __main__ - Step 28506: {'lr': 0.0004614649860933268, 'samples': 5473152, 'steps': 28505, 'loss/train': 1.9262429475784302} -08/30/2021 18:15:57 - INFO - __main__ - Step 28507: {'lr': 0.0004614621554014162, 'samples': 5473344, 'steps': 28506, 'loss/train': 1.8057692050933838} -08/30/2021 18:15:58 - INFO - __main__ - Step 28508: {'lr': 0.00046145932461422396, 'samples': 5473536, 'steps': 28507, 'loss/train': 1.4998582601547241} -08/30/2021 18:15:58 - INFO - __main__ - Step 28509: {'lr': 0.00046145649373175145, 'samples': 5473728, 'steps': 28508, 'loss/train': 1.477571725845337} -08/30/2021 18:15:58 - INFO - __main__ - Step 28510: {'lr': 0.0004614536627539999, 'samples': 5473920, 'steps': 28509, 'loss/train': 1.7403695583343506} -08/30/2021 18:16:00 - INFO - __main__ - Step 28511: {'lr': 0.0004614508316809706, 'samples': 5474112, 'steps': 28510, 'loss/train': 2.421569347381592} -08/30/2021 18:16:00 - INFO - __main__ - Step 28512: {'lr': 0.00046144800051266477, 'samples': 5474304, 'steps': 28511, 'loss/train': 1.2638709545135498} -08/30/2021 18:16:01 - INFO - __main__ - Step 28513: {'lr': 0.00046144516924908377, 'samples': 5474496, 'steps': 28512, 'loss/train': 1.592155933380127} -08/30/2021 18:16:01 - INFO - __main__ - Step 28514: {'lr': 0.0004614423378902289, 'samples': 5474688, 'steps': 28513, 'loss/train': 1.9909541606903076} -08/30/2021 18:16:01 - INFO - __main__ - Step 28515: {'lr': 0.0004614395064361013, 'samples': 5474880, 'steps': 28514, 'loss/train': 0.7892037630081177} -08/30/2021 18:16:03 - INFO - __main__ - Step 28516: {'lr': 0.00046143667488670226, 'samples': 5475072, 'steps': 28515, 'loss/train': 1.0137324333190918} -08/30/2021 18:16:04 - INFO - __main__ - Step 28517: {'lr': 0.00046143384324203325, 'samples': 5475264, 'steps': 28516, 'loss/train': 1.8772464990615845} -08/30/2021 18:16:04 - INFO - __main__ - Step 28518: {'lr': 0.00046143101150209533, 'samples': 5475456, 'steps': 28517, 'loss/train': 0.062400247901678085} -08/30/2021 18:16:04 - INFO - __main__ - Step 28519: {'lr': 0.0004614281796668899, 'samples': 5475648, 'steps': 28518, 'loss/train': 1.7559754848480225} -08/30/2021 18:16:05 - INFO - __main__ - Step 28520: {'lr': 0.0004614253477364182, 'samples': 5475840, 'steps': 28519, 'loss/train': 1.6631942987442017} -08/30/2021 18:16:05 - INFO - __main__ - Step 28521: {'lr': 0.0004614225157106815, 'samples': 5476032, 'steps': 28520, 'loss/train': 1.5449906587600708} -08/30/2021 18:16:06 - INFO - __main__ - Step 28522: {'lr': 0.00046141968358968103, 'samples': 5476224, 'steps': 28521, 'loss/train': 2.165684223175049} -08/30/2021 18:16:07 - INFO - __main__ - Step 28523: {'lr': 0.00046141685137341814, 'samples': 5476416, 'steps': 28522, 'loss/train': 1.218667984008789} -08/30/2021 18:16:07 - INFO - __main__ - Step 28524: {'lr': 0.00046141401906189404, 'samples': 5476608, 'steps': 28523, 'loss/train': 1.5562207698822021} -08/30/2021 18:16:07 - INFO - __main__ - Step 28525: {'lr': 0.0004614111866551101, 'samples': 5476800, 'steps': 28524, 'loss/train': 1.8598761558532715} -08/30/2021 18:16:08 - INFO - __main__ - Step 28526: {'lr': 0.0004614083541530675, 'samples': 5476992, 'steps': 28525, 'loss/train': 1.8451690673828125} -08/30/2021 18:16:09 - INFO - __main__ - Step 28527: {'lr': 0.00046140552155576767, 'samples': 5477184, 'steps': 28526, 'loss/train': 1.7072362899780273} -08/30/2021 18:16:10 - INFO - __main__ - Step 28528: {'lr': 0.0004614026888632116, 'samples': 5477376, 'steps': 28527, 'loss/train': 1.3507329225540161} -08/30/2021 18:16:10 - INFO - __main__ - Step 28529: {'lr': 0.00046139985607540087, 'samples': 5477568, 'steps': 28528, 'loss/train': 1.6900264024734497} -08/30/2021 18:16:10 - INFO - __main__ - Step 28530: {'lr': 0.00046139702319233656, 'samples': 5477760, 'steps': 28529, 'loss/train': 1.7837227582931519} -08/30/2021 18:16:11 - INFO - __main__ - Step 28531: {'lr': 0.00046139419021402005, 'samples': 5477952, 'steps': 28530, 'loss/train': 1.7546217441558838} -08/30/2021 18:16:11 - INFO - __main__ - Step 28532: {'lr': 0.00046139135714045253, 'samples': 5478144, 'steps': 28531, 'loss/train': 1.699596881866455} -08/30/2021 18:16:13 - INFO - __main__ - Step 28533: {'lr': 0.00046138852397163547, 'samples': 5478336, 'steps': 28532, 'loss/train': 1.8266007900238037} -08/30/2021 18:16:13 - INFO - __main__ - Step 28534: {'lr': 0.00046138569070756984, 'samples': 5478528, 'steps': 28533, 'loss/train': 0.06760618835687637} -08/30/2021 18:16:14 - INFO - __main__ - Step 28535: {'lr': 0.00046138285734825715, 'samples': 5478720, 'steps': 28534, 'loss/train': 1.34406578540802} -08/30/2021 18:16:14 - INFO - __main__ - Step 28536: {'lr': 0.0004613800238936986, 'samples': 5478912, 'steps': 28535, 'loss/train': 1.4671729803085327} -08/30/2021 18:16:14 - INFO - __main__ - Step 28537: {'lr': 0.0004613771903438955, 'samples': 5479104, 'steps': 28536, 'loss/train': 1.3227908611297607} -08/30/2021 18:16:16 - INFO - __main__ - Step 28538: {'lr': 0.00046137435669884897, 'samples': 5479296, 'steps': 28537, 'loss/train': 1.5423678159713745} -08/30/2021 18:16:17 - INFO - __main__ - Step 28539: {'lr': 0.00046137152295856054, 'samples': 5479488, 'steps': 28538, 'loss/train': 0.17428183555603027} -08/30/2021 18:16:17 - INFO - __main__ - Step 28540: {'lr': 0.0004613686891230313, 'samples': 5479680, 'steps': 28539, 'loss/train': 1.2126985788345337} -08/30/2021 18:16:17 - INFO - __main__ - Step 28541: {'lr': 0.0004613658551922627, 'samples': 5479872, 'steps': 28540, 'loss/train': 2.0219058990478516} -08/30/2021 18:16:18 - INFO - __main__ - Step 28542: {'lr': 0.0004613630211662558, 'samples': 5480064, 'steps': 28541, 'loss/train': 1.5777045488357544} -08/30/2021 18:16:19 - INFO - __main__ - Step 28543: {'lr': 0.00046136018704501203, 'samples': 5480256, 'steps': 28542, 'loss/train': 1.443447232246399} -08/30/2021 18:16:19 - INFO - __main__ - Step 28544: {'lr': 0.00046135735282853263, 'samples': 5480448, 'steps': 28543, 'loss/train': 1.5230565071105957} -08/30/2021 18:16:20 - INFO - __main__ - Step 28545: {'lr': 0.0004613545185168188, 'samples': 5480640, 'steps': 28544, 'loss/train': 1.427353024482727} -08/30/2021 18:16:20 - INFO - __main__ - Step 28546: {'lr': 0.0004613516841098719, 'samples': 5480832, 'steps': 28545, 'loss/train': 2.22821307182312} -08/30/2021 18:16:21 - INFO - __main__ - Step 28547: {'lr': 0.0004613488496076933, 'samples': 5481024, 'steps': 28546, 'loss/train': 1.7149930000305176} -08/30/2021 18:16:22 - INFO - __main__ - Step 28548: {'lr': 0.00046134601501028404, 'samples': 5481216, 'steps': 28547, 'loss/train': 1.4018101692199707} -08/30/2021 18:16:23 - INFO - __main__ - Step 28549: {'lr': 0.0004613431803176456, 'samples': 5481408, 'steps': 28548, 'loss/train': 0.6721023321151733} -08/30/2021 18:16:23 - INFO - __main__ - Step 28550: {'lr': 0.00046134034552977924, 'samples': 5481600, 'steps': 28549, 'loss/train': 1.870675802230835} -08/30/2021 18:16:23 - INFO - __main__ - Step 28551: {'lr': 0.00046133751064668605, 'samples': 5481792, 'steps': 28550, 'loss/train': 1.046642780303955} -08/30/2021 18:16:24 - INFO - __main__ - Step 28552: {'lr': 0.0004613346756683675, 'samples': 5481984, 'steps': 28551, 'loss/train': 1.702518343925476} -08/30/2021 18:16:25 - INFO - __main__ - Step 28553: {'lr': 0.0004613318405948248, 'samples': 5482176, 'steps': 28552, 'loss/train': 1.886941909790039} -08/30/2021 18:16:26 - INFO - __main__ - Step 28554: {'lr': 0.00046132900542605925, 'samples': 5482368, 'steps': 28553, 'loss/train': 1.116611123085022} -08/30/2021 18:16:26 - INFO - __main__ - Step 28555: {'lr': 0.0004613261701620721, 'samples': 5482560, 'steps': 28554, 'loss/train': 1.2434521913528442} -08/30/2021 18:16:26 - INFO - __main__ - Step 28556: {'lr': 0.0004613233348028646, 'samples': 5482752, 'steps': 28555, 'loss/train': 0.9997589588165283} -08/30/2021 18:16:27 - INFO - __main__ - Step 28557: {'lr': 0.0004613204993484381, 'samples': 5482944, 'steps': 28556, 'loss/train': 1.574049472808838} -08/30/2021 18:16:29 - INFO - __main__ - Step 28558: {'lr': 0.00046131766379879386, 'samples': 5483136, 'steps': 28557, 'loss/train': 1.684670329093933} -08/30/2021 18:16:29 - INFO - __main__ - Step 28559: {'lr': 0.0004613148281539331, 'samples': 5483328, 'steps': 28558, 'loss/train': 1.2109357118606567} -08/30/2021 18:16:30 - INFO - __main__ - Step 28560: {'lr': 0.00046131199241385726, 'samples': 5483520, 'steps': 28559, 'loss/train': 1.1717592477798462} -08/30/2021 18:16:30 - INFO - __main__ - Step 28561: {'lr': 0.0004613091565785673, 'samples': 5483712, 'steps': 28560, 'loss/train': 1.4759520292282104} -08/30/2021 18:16:30 - INFO - __main__ - Step 28562: {'lr': 0.0004613063206480649, 'samples': 5483904, 'steps': 28561, 'loss/train': 1.250970482826233} -08/30/2021 18:16:31 - INFO - __main__ - Step 28563: {'lr': 0.000461303484622351, 'samples': 5484096, 'steps': 28562, 'loss/train': 1.0326673984527588} -08/30/2021 18:16:32 - INFO - __main__ - Step 28564: {'lr': 0.00046130064850142703, 'samples': 5484288, 'steps': 28563, 'loss/train': 1.2959872484207153} -08/30/2021 18:16:33 - INFO - __main__ - Step 28565: {'lr': 0.0004612978122852942, 'samples': 5484480, 'steps': 28564, 'loss/train': 2.220444440841675} -08/30/2021 18:16:33 - INFO - __main__ - Step 28566: {'lr': 0.000461294975973954, 'samples': 5484672, 'steps': 28565, 'loss/train': 1.4092081785202026} -08/30/2021 18:16:34 - INFO - __main__ - Step 28567: {'lr': 0.0004612921395674074, 'samples': 5484864, 'steps': 28566, 'loss/train': 1.0749324560165405} -08/30/2021 18:16:34 - INFO - __main__ - Step 28568: {'lr': 0.0004612893030656559, 'samples': 5485056, 'steps': 28567, 'loss/train': 0.9329726099967957} -08/30/2021 18:16:36 - INFO - __main__ - Step 28569: {'lr': 0.0004612864664687007, 'samples': 5485248, 'steps': 28568, 'loss/train': 1.4765939712524414} -08/30/2021 18:16:36 - INFO - __main__ - Step 28570: {'lr': 0.0004612836297765429, 'samples': 5485440, 'steps': 28569, 'loss/train': 1.9534573554992676} -08/30/2021 18:16:37 - INFO - __main__ - Step 28571: {'lr': 0.00046128079298918414, 'samples': 5485632, 'steps': 28570, 'loss/train': 0.09738225489854813} -08/30/2021 18:16:37 - INFO - __main__ - Step 28572: {'lr': 0.00046127795610662547, 'samples': 5485824, 'steps': 28571, 'loss/train': 0.056263361126184464} -08/30/2021 18:16:37 - INFO - __main__ - Step 28573: {'lr': 0.0004612751191288682, 'samples': 5486016, 'steps': 28572, 'loss/train': 2.102567434310913} -08/30/2021 18:16:38 - INFO - __main__ - Step 28574: {'lr': 0.00046127228205591366, 'samples': 5486208, 'steps': 28573, 'loss/train': 0.9623347520828247} -08/30/2021 18:16:39 - INFO - __main__ - Step 28575: {'lr': 0.0004612694448877631, 'samples': 5486400, 'steps': 28574, 'loss/train': 0.7900848984718323} -08/30/2021 18:16:40 - INFO - __main__ - Step 28576: {'lr': 0.00046126660762441774, 'samples': 5486592, 'steps': 28575, 'loss/train': 1.0455816984176636} -08/30/2021 18:16:40 - INFO - __main__ - Step 28577: {'lr': 0.00046126377026587897, 'samples': 5486784, 'steps': 28576, 'loss/train': 1.4658417701721191} -08/30/2021 18:16:40 - INFO - __main__ - Step 28578: {'lr': 0.0004612609328121479, 'samples': 5486976, 'steps': 28577, 'loss/train': 0.8452721834182739} -08/30/2021 18:16:41 - INFO - __main__ - Step 28579: {'lr': 0.000461258095263226, 'samples': 5487168, 'steps': 28578, 'loss/train': 1.8922438621520996} -08/30/2021 18:16:43 - INFO - __main__ - Step 28580: {'lr': 0.00046125525761911445, 'samples': 5487360, 'steps': 28579, 'loss/train': 2.147704839706421} -08/30/2021 18:16:43 - INFO - __main__ - Step 28581: {'lr': 0.00046125241987981445, 'samples': 5487552, 'steps': 28580, 'loss/train': 1.194510817527771} -08/30/2021 18:16:44 - INFO - __main__ - Step 28582: {'lr': 0.0004612495820453275, 'samples': 5487744, 'steps': 28581, 'loss/train': 1.61212956905365} -08/30/2021 18:16:44 - INFO - __main__ - Step 28583: {'lr': 0.0004612467441156547, 'samples': 5487936, 'steps': 28582, 'loss/train': 1.9254000186920166} -08/30/2021 18:16:44 - INFO - __main__ - Step 28584: {'lr': 0.00046124390609079735, 'samples': 5488128, 'steps': 28583, 'loss/train': 1.859422206878662} -08/30/2021 18:16:45 - INFO - __main__ - Step 28585: {'lr': 0.00046124106797075683, 'samples': 5488320, 'steps': 28584, 'loss/train': 1.4304039478302002} -08/30/2021 18:16:46 - INFO - __main__ - Step 28586: {'lr': 0.00046123822975553425, 'samples': 5488512, 'steps': 28585, 'loss/train': 0.14914561808109283} -08/30/2021 18:16:47 - INFO - __main__ - Step 28587: {'lr': 0.00046123539144513103, 'samples': 5488704, 'steps': 28586, 'loss/train': 1.3258082866668701} -08/30/2021 18:16:47 - INFO - __main__ - Step 28588: {'lr': 0.00046123255303954835, 'samples': 5488896, 'steps': 28587, 'loss/train': 1.047844409942627} -08/30/2021 18:16:47 - INFO - __main__ - Step 28589: {'lr': 0.0004612297145387876, 'samples': 5489088, 'steps': 28588, 'loss/train': 1.5251235961914062} -08/30/2021 18:16:48 - INFO - __main__ - Step 28590: {'lr': 0.00046122687594285, 'samples': 5489280, 'steps': 28589, 'loss/train': 1.2259701490402222} -08/30/2021 18:16:49 - INFO - __main__ - Step 28591: {'lr': 0.0004612240372517368, 'samples': 5489472, 'steps': 28590, 'loss/train': 1.267090916633606} -08/30/2021 18:16:50 - INFO - __main__ - Step 28592: {'lr': 0.00046122119846544936, 'samples': 5489664, 'steps': 28591, 'loss/train': 1.0689455270767212} -08/30/2021 18:16:50 - INFO - __main__ - Step 28593: {'lr': 0.00046121835958398883, 'samples': 5489856, 'steps': 28592, 'loss/train': 1.6659600734710693} -08/30/2021 18:16:50 - INFO - __main__ - Step 28594: {'lr': 0.0004612155206073566, 'samples': 5490048, 'steps': 28593, 'loss/train': 1.393333911895752} -08/30/2021 18:16:51 - INFO - __main__ - Step 28595: {'lr': 0.000461212681535554, 'samples': 5490240, 'steps': 28594, 'loss/train': 1.847856879234314} -08/30/2021 18:16:51 - INFO - __main__ - Step 28596: {'lr': 0.0004612098423685821, 'samples': 5490432, 'steps': 28595, 'loss/train': 1.8090723752975464} -08/30/2021 18:16:53 - INFO - __main__ - Step 28597: {'lr': 0.0004612070031064424, 'samples': 5490624, 'steps': 28596, 'loss/train': 1.2842819690704346} -08/30/2021 18:16:54 - INFO - __main__ - Step 28598: {'lr': 0.000461204163749136, 'samples': 5490816, 'steps': 28597, 'loss/train': 1.440927505493164} -08/30/2021 18:16:54 - INFO - __main__ - Step 28599: {'lr': 0.0004612013242966643, 'samples': 5491008, 'steps': 28598, 'loss/train': 1.4508466720581055} -08/30/2021 18:16:54 - INFO - __main__ - Step 28600: {'lr': 0.0004611984847490285, 'samples': 5491200, 'steps': 28599, 'loss/train': 2.039684534072876} -08/30/2021 18:16:55 - INFO - __main__ - Step 28601: {'lr': 0.00046119564510623, 'samples': 5491392, 'steps': 28600, 'loss/train': 1.1459662914276123} -08/30/2021 18:16:57 - INFO - __main__ - Step 28602: {'lr': 0.00046119280536827, 'samples': 5491584, 'steps': 28601, 'loss/train': 9.737241744995117} -08/30/2021 18:16:57 - INFO - __main__ - Step 28603: {'lr': 0.0004611899655351497, 'samples': 5491776, 'steps': 28602, 'loss/train': 1.809079647064209} -08/30/2021 18:16:57 - INFO - __main__ - Step 28604: {'lr': 0.0004611871256068705, 'samples': 5491968, 'steps': 28603, 'loss/train': 1.655714988708496} -08/30/2021 18:16:58 - INFO - __main__ - Step 28605: {'lr': 0.0004611842855834336, 'samples': 5492160, 'steps': 28604, 'loss/train': 1.823891520500183} -08/30/2021 18:16:58 - INFO - __main__ - Step 28606: {'lr': 0.00046118144546484043, 'samples': 5492352, 'steps': 28605, 'loss/train': 0.7643401026725769} -08/30/2021 18:16:58 - INFO - __main__ - Step 28607: {'lr': 0.0004611786052510921, 'samples': 5492544, 'steps': 28606, 'loss/train': 1.5874062776565552} -08/30/2021 18:17:00 - INFO - __main__ - Step 28608: {'lr': 0.0004611757649421899, 'samples': 5492736, 'steps': 28607, 'loss/train': 1.956817626953125} -08/30/2021 18:17:01 - INFO - __main__ - Step 28609: {'lr': 0.0004611729245381352, 'samples': 5492928, 'steps': 28608, 'loss/train': 1.2808642387390137} -08/30/2021 18:17:01 - INFO - __main__ - Step 28610: {'lr': 0.00046117008403892925, 'samples': 5493120, 'steps': 28609, 'loss/train': 1.8965907096862793} -08/30/2021 18:17:01 - INFO - __main__ - Step 28611: {'lr': 0.0004611672434445733, 'samples': 5493312, 'steps': 28610, 'loss/train': 1.635274052619934} -08/30/2021 18:17:02 - INFO - __main__ - Step 28612: {'lr': 0.0004611644027550687, 'samples': 5493504, 'steps': 28611, 'loss/train': 1.6674134731292725} -08/30/2021 18:17:03 - INFO - __main__ - Step 28613: {'lr': 0.00046116156197041657, 'samples': 5493696, 'steps': 28612, 'loss/train': 1.4661076068878174} -08/30/2021 18:17:04 - INFO - __main__ - Step 28614: {'lr': 0.0004611587210906184, 'samples': 5493888, 'steps': 28613, 'loss/train': 1.6048845052719116} -08/30/2021 18:17:04 - INFO - __main__ - Step 28615: {'lr': 0.0004611558801156753, 'samples': 5494080, 'steps': 28614, 'loss/train': 0.12729088962078094} -08/30/2021 18:17:04 - INFO - __main__ - Step 28616: {'lr': 0.0004611530390455887, 'samples': 5494272, 'steps': 28615, 'loss/train': 1.6169594526290894} -08/30/2021 18:17:05 - INFO - __main__ - Step 28617: {'lr': 0.00046115019788035974, 'samples': 5494464, 'steps': 28616, 'loss/train': 1.4557987451553345} -08/30/2021 18:17:07 - INFO - __main__ - Step 28618: {'lr': 0.00046114735661998975, 'samples': 5494656, 'steps': 28617, 'loss/train': 2.5542166233062744} -08/30/2021 18:17:07 - INFO - __main__ - Step 28619: {'lr': 0.0004611445152644801, 'samples': 5494848, 'steps': 28618, 'loss/train': 0.11091788113117218} -08/30/2021 18:17:08 - INFO - __main__ - Step 28620: {'lr': 0.00046114167381383186, 'samples': 5495040, 'steps': 28619, 'loss/train': 1.2085102796554565} -08/30/2021 18:17:08 - INFO - __main__ - Step 28621: {'lr': 0.0004611388322680465, 'samples': 5495232, 'steps': 28620, 'loss/train': 1.140795111656189} -08/30/2021 18:17:08 - INFO - __main__ - Step 28622: {'lr': 0.0004611359906271253, 'samples': 5495424, 'steps': 28621, 'loss/train': 1.7540414333343506} -08/30/2021 18:17:10 - INFO - __main__ - Step 28623: {'lr': 0.0004611331488910694, 'samples': 5495616, 'steps': 28622, 'loss/train': 1.9007771015167236} -08/30/2021 18:17:10 - INFO - __main__ - Step 28624: {'lr': 0.00046113030705988026, 'samples': 5495808, 'steps': 28623, 'loss/train': 1.7109884023666382} -08/30/2021 18:17:11 - INFO - __main__ - Step 28625: {'lr': 0.000461127465133559, 'samples': 5496000, 'steps': 28624, 'loss/train': 1.7091494798660278} -08/30/2021 18:17:11 - INFO - __main__ - Step 28626: {'lr': 0.0004611246231121069, 'samples': 5496192, 'steps': 28625, 'loss/train': 1.8191943168640137} -08/30/2021 18:17:12 - INFO - __main__ - Step 28627: {'lr': 0.00046112178099552535, 'samples': 5496384, 'steps': 28626, 'loss/train': 1.2781901359558105} -08/30/2021 18:17:13 - INFO - __main__ - Step 28628: {'lr': 0.0004611189387838156, 'samples': 5496576, 'steps': 28627, 'loss/train': 0.9486587047576904} -08/30/2021 18:17:13 - INFO - __main__ - Step 28629: {'lr': 0.00046111609647697893, 'samples': 5496768, 'steps': 28628, 'loss/train': 0.8507620692253113} -08/30/2021 18:17:14 - INFO - __main__ - Step 28630: {'lr': 0.0004611132540750166, 'samples': 5496960, 'steps': 28629, 'loss/train': 2.0000696182250977} -08/30/2021 18:17:14 - INFO - __main__ - Step 28631: {'lr': 0.00046111041157792987, 'samples': 5497152, 'steps': 28630, 'loss/train': 1.7961006164550781} -08/30/2021 18:17:14 - INFO - __main__ - Step 28632: {'lr': 0.00046110756898572, 'samples': 5497344, 'steps': 28631, 'loss/train': 1.5291951894760132} -08/30/2021 18:17:15 - INFO - __main__ - Step 28633: {'lr': 0.0004611047262983884, 'samples': 5497536, 'steps': 28632, 'loss/train': 1.3961063623428345} -08/30/2021 18:17:16 - INFO - __main__ - Step 28634: {'lr': 0.00046110188351593625, 'samples': 5497728, 'steps': 28633, 'loss/train': 1.6091190576553345} -08/30/2021 18:17:17 - INFO - __main__ - Step 28635: {'lr': 0.0004610990406383648, 'samples': 5497920, 'steps': 28634, 'loss/train': 0.5210306644439697} -08/30/2021 18:17:17 - INFO - __main__ - Step 28636: {'lr': 0.00046109619766567547, 'samples': 5498112, 'steps': 28635, 'loss/train': 1.5592787265777588} -08/30/2021 18:17:18 - INFO - __main__ - Step 28637: {'lr': 0.0004610933545978694, 'samples': 5498304, 'steps': 28636, 'loss/train': 0.9747006297111511} -08/30/2021 18:17:18 - INFO - __main__ - Step 28638: {'lr': 0.0004610905114349478, 'samples': 5498496, 'steps': 28637, 'loss/train': 1.6787627935409546} -08/30/2021 18:17:19 - INFO - __main__ - Step 28639: {'lr': 0.0004610876681769123, 'samples': 5498688, 'steps': 28638, 'loss/train': 1.808143973350525} -08/30/2021 18:17:20 - INFO - __main__ - Step 28640: {'lr': 0.0004610848248237638, 'samples': 5498880, 'steps': 28639, 'loss/train': 1.4617542028427124} -08/30/2021 18:17:20 - INFO - __main__ - Step 28641: {'lr': 0.00046108198137550377, 'samples': 5499072, 'steps': 28640, 'loss/train': 1.4664337635040283} -08/30/2021 18:17:21 - INFO - __main__ - Step 28642: {'lr': 0.0004610791378321335, 'samples': 5499264, 'steps': 28641, 'loss/train': 1.9164260625839233} -08/30/2021 18:17:21 - INFO - __main__ - Step 28643: {'lr': 0.0004610762941936542, 'samples': 5499456, 'steps': 28642, 'loss/train': 1.7378405332565308} -08/30/2021 18:17:23 - INFO - __main__ - Step 28644: {'lr': 0.0004610734504600671, 'samples': 5499648, 'steps': 28643, 'loss/train': 1.5796711444854736} -08/30/2021 18:17:23 - INFO - __main__ - Step 28645: {'lr': 0.00046107060663137366, 'samples': 5499840, 'steps': 28644, 'loss/train': 1.4716848134994507} -08/30/2021 18:17:23 - INFO - __main__ - Step 28646: {'lr': 0.00046106776270757506, 'samples': 5500032, 'steps': 28645, 'loss/train': 1.6572840213775635} -08/30/2021 18:17:24 - INFO - __main__ - Step 28647: {'lr': 0.0004610649186886725, 'samples': 5500224, 'steps': 28646, 'loss/train': 1.657213568687439} -08/30/2021 18:17:24 - INFO - __main__ - Step 28648: {'lr': 0.00046106207457466744, 'samples': 5500416, 'steps': 28647, 'loss/train': 1.7196182012557983} -08/30/2021 18:17:26 - INFO - __main__ - Step 28649: {'lr': 0.0004610592303655611, 'samples': 5500608, 'steps': 28648, 'loss/train': 1.4266602993011475} -08/30/2021 18:17:26 - INFO - __main__ - Step 28650: {'lr': 0.0004610563860613546, 'samples': 5500800, 'steps': 28649, 'loss/train': 2.1116340160369873} -08/30/2021 18:17:27 - INFO - __main__ - Step 28651: {'lr': 0.00046105354166204937, 'samples': 5500992, 'steps': 28650, 'loss/train': 1.671355962753296} -08/30/2021 18:17:27 - INFO - __main__ - Step 28652: {'lr': 0.00046105069716764676, 'samples': 5501184, 'steps': 28651, 'loss/train': 0.30662935972213745} -08/30/2021 18:17:27 - INFO - __main__ - Step 28653: {'lr': 0.00046104785257814786, 'samples': 5501376, 'steps': 28652, 'loss/train': 1.6948570013046265} -08/30/2021 18:17:28 - INFO - __main__ - Step 28654: {'lr': 0.0004610450078935541, 'samples': 5501568, 'steps': 28653, 'loss/train': 1.4901260137557983} -08/30/2021 18:17:29 - INFO - __main__ - Step 28655: {'lr': 0.00046104216311386676, 'samples': 5501760, 'steps': 28654, 'loss/train': 1.6524717807769775} -08/30/2021 18:17:30 - INFO - __main__ - Step 28656: {'lr': 0.000461039318239087, 'samples': 5501952, 'steps': 28655, 'loss/train': 1.4687788486480713} -08/30/2021 18:17:30 - INFO - __main__ - Step 28657: {'lr': 0.00046103647326921625, 'samples': 5502144, 'steps': 28656, 'loss/train': 1.4570131301879883} -08/30/2021 18:17:30 - INFO - __main__ - Step 28658: {'lr': 0.00046103362820425567, 'samples': 5502336, 'steps': 28657, 'loss/train': 0.17846554517745972} -08/30/2021 18:17:31 - INFO - __main__ - Step 28659: {'lr': 0.00046103078304420665, 'samples': 5502528, 'steps': 28658, 'loss/train': 1.890275239944458} -08/30/2021 18:17:32 - INFO - __main__ - Step 28660: {'lr': 0.0004610279377890704, 'samples': 5502720, 'steps': 28659, 'loss/train': 1.4584637880325317} -08/30/2021 18:17:33 - INFO - __main__ - Step 28661: {'lr': 0.00046102509243884813, 'samples': 5502912, 'steps': 28660, 'loss/train': 1.3846909999847412} -08/30/2021 18:17:33 - INFO - __main__ - Step 28662: {'lr': 0.0004610222469935413, 'samples': 5503104, 'steps': 28661, 'loss/train': 1.1878535747528076} -08/30/2021 18:17:33 - INFO - __main__ - Step 28663: {'lr': 0.000461019401453151, 'samples': 5503296, 'steps': 28662, 'loss/train': 1.9918683767318726} -08/30/2021 18:17:34 - INFO - __main__ - Step 28664: {'lr': 0.00046101655581767874, 'samples': 5503488, 'steps': 28663, 'loss/train': 1.6148306131362915} -08/30/2021 18:17:35 - INFO - __main__ - Step 28665: {'lr': 0.0004610137100871257, 'samples': 5503680, 'steps': 28664, 'loss/train': 2.0255563259124756} -08/30/2021 18:17:36 - INFO - __main__ - Step 28666: {'lr': 0.00046101086426149297, 'samples': 5503872, 'steps': 28665, 'loss/train': 1.5599926710128784} -08/30/2021 18:17:36 - INFO - __main__ - Step 28667: {'lr': 0.0004610080183407821, 'samples': 5504064, 'steps': 28666, 'loss/train': 1.6037590503692627} -08/30/2021 18:17:36 - INFO - __main__ - Step 28668: {'lr': 0.0004610051723249943, 'samples': 5504256, 'steps': 28667, 'loss/train': 1.7684967517852783} -08/30/2021 18:17:37 - INFO - __main__ - Step 28669: {'lr': 0.0004610023262141308, 'samples': 5504448, 'steps': 28668, 'loss/train': 1.2390328645706177} -08/30/2021 18:17:39 - INFO - __main__ - Step 28670: {'lr': 0.00046099948000819294, 'samples': 5504640, 'steps': 28669, 'loss/train': 0.09077593684196472} -08/30/2021 18:17:40 - INFO - __main__ - Step 28671: {'lr': 0.0004609966337071819, 'samples': 5504832, 'steps': 28670, 'loss/train': 1.1359988451004028} -08/30/2021 18:17:40 - INFO - __main__ - Step 28672: {'lr': 0.00046099378731109906, 'samples': 5505024, 'steps': 28671, 'loss/train': 0.1055753082036972} -08/30/2021 18:17:40 - INFO - __main__ - Step 28673: {'lr': 0.00046099094081994565, 'samples': 5505216, 'steps': 28672, 'loss/train': 1.326877474784851} -08/30/2021 18:17:41 - INFO - __main__ - Step 28674: {'lr': 0.000460988094233723, 'samples': 5505408, 'steps': 28673, 'loss/train': 1.7359426021575928} -08/30/2021 18:17:42 - INFO - __main__ - Step 28675: {'lr': 0.00046098524755243246, 'samples': 5505600, 'steps': 28674, 'loss/train': 2.0015597343444824} -08/30/2021 18:17:43 - INFO - __main__ - Step 28676: {'lr': 0.0004609824007760751, 'samples': 5505792, 'steps': 28675, 'loss/train': 1.6945456266403198} -08/30/2021 18:17:43 - INFO - __main__ - Step 28677: {'lr': 0.0004609795539046524, 'samples': 5505984, 'steps': 28676, 'loss/train': 1.8516099452972412} -08/30/2021 18:17:43 - INFO - __main__ - Step 28678: {'lr': 0.0004609767069381655, 'samples': 5506176, 'steps': 28677, 'loss/train': 0.09904380142688751} -08/30/2021 18:17:44 - INFO - __main__ - Step 28679: {'lr': 0.00046097385987661576, 'samples': 5506368, 'steps': 28678, 'loss/train': 1.4202141761779785} -08/30/2021 18:17:46 - INFO - __main__ - Step 28680: {'lr': 0.00046097101272000454, 'samples': 5506560, 'steps': 28679, 'loss/train': 1.6175774335861206} -08/30/2021 18:17:46 - INFO - __main__ - Step 28681: {'lr': 0.0004609681654683329, 'samples': 5506752, 'steps': 28680, 'loss/train': 0.10689815133810043} -08/30/2021 18:17:46 - INFO - __main__ - Step 28682: {'lr': 0.0004609653181216024, 'samples': 5506944, 'steps': 28681, 'loss/train': 1.893286108970642} -08/30/2021 18:17:47 - INFO - __main__ - Step 28683: {'lr': 0.0004609624706798141, 'samples': 5507136, 'steps': 28682, 'loss/train': 1.6242172718048096} -08/30/2021 18:17:47 - INFO - __main__ - Step 28684: {'lr': 0.00046095962314296934, 'samples': 5507328, 'steps': 28683, 'loss/train': 1.661780834197998} -08/30/2021 18:17:49 - INFO - __main__ - Step 28685: {'lr': 0.00046095677551106953, 'samples': 5507520, 'steps': 28684, 'loss/train': 1.8052581548690796} -08/30/2021 18:17:49 - INFO - __main__ - Step 28686: {'lr': 0.00046095392778411576, 'samples': 5507712, 'steps': 28685, 'loss/train': 1.7522753477096558} -08/30/2021 18:17:49 - INFO - __main__ - Step 28687: {'lr': 0.0004609510799621095, 'samples': 5507904, 'steps': 28686, 'loss/train': 0.726565420627594} -08/30/2021 18:17:50 - INFO - __main__ - Step 28688: {'lr': 0.0004609482320450519, 'samples': 5508096, 'steps': 28687, 'loss/train': 1.686182975769043} -08/30/2021 18:17:50 - INFO - __main__ - Step 28689: {'lr': 0.00046094538403294416, 'samples': 5508288, 'steps': 28688, 'loss/train': 2.193859100341797} -08/30/2021 18:17:51 - INFO - __main__ - Step 28690: {'lr': 0.00046094253592578784, 'samples': 5508480, 'steps': 28689, 'loss/train': 2.0816071033477783} -08/30/2021 18:17:52 - INFO - __main__ - Step 28691: {'lr': 0.000460939687723584, 'samples': 5508672, 'steps': 28690, 'loss/train': 1.7358242273330688} -08/30/2021 18:17:52 - INFO - __main__ - Step 28692: {'lr': 0.000460936839426334, 'samples': 5508864, 'steps': 28691, 'loss/train': 1.5767308473587036} -08/30/2021 18:17:53 - INFO - __main__ - Step 28693: {'lr': 0.00046093399103403913, 'samples': 5509056, 'steps': 28692, 'loss/train': 1.9537839889526367} -08/30/2021 18:17:53 - INFO - __main__ - Step 28694: {'lr': 0.00046093114254670066, 'samples': 5509248, 'steps': 28693, 'loss/train': 0.5270798206329346} -08/30/2021 18:17:55 - INFO - __main__ - Step 28695: {'lr': 0.0004609282939643199, 'samples': 5509440, 'steps': 28694, 'loss/train': 1.5301392078399658} -08/30/2021 18:17:55 - INFO - __main__ - Step 28696: {'lr': 0.00046092544528689806, 'samples': 5509632, 'steps': 28695, 'loss/train': 1.502647876739502} -08/30/2021 18:17:55 - INFO - __main__ - Step 28697: {'lr': 0.0004609225965144365, 'samples': 5509824, 'steps': 28696, 'loss/train': 1.330797791481018} -08/30/2021 18:17:56 - INFO - __main__ - Step 28698: {'lr': 0.00046091974764693645, 'samples': 5510016, 'steps': 28697, 'loss/train': 1.330105185508728} -08/30/2021 18:17:56 - INFO - __main__ - Step 28699: {'lr': 0.0004609168986843992, 'samples': 5510208, 'steps': 28698, 'loss/train': 1.7887258529663086} -08/30/2021 18:17:56 - INFO - __main__ - Step 28700: {'lr': 0.000460914049626826, 'samples': 5510400, 'steps': 28699, 'loss/train': 2.4512386322021484} -08/30/2021 18:17:58 - INFO - __main__ - Step 28701: {'lr': 0.0004609112004742183, 'samples': 5510592, 'steps': 28700, 'loss/train': 1.8095072507858276} -08/30/2021 18:17:59 - INFO - __main__ - Step 28702: {'lr': 0.0004609083512265773, 'samples': 5510784, 'steps': 28701, 'loss/train': 1.917091727256775} -08/30/2021 18:17:59 - INFO - __main__ - Step 28703: {'lr': 0.0004609055018839041, 'samples': 5510976, 'steps': 28702, 'loss/train': 1.2911368608474731} -08/30/2021 18:17:59 - INFO - __main__ - Step 28704: {'lr': 0.0004609026524462002, 'samples': 5511168, 'steps': 28703, 'loss/train': 0.9765636324882507} -08/30/2021 18:18:00 - INFO - __main__ - Step 28705: {'lr': 0.00046089980291346685, 'samples': 5511360, 'steps': 28704, 'loss/train': 1.4764583110809326} -08/30/2021 18:18:00 - INFO - __main__ - Step 28706: {'lr': 0.00046089695328570523, 'samples': 5511552, 'steps': 28705, 'loss/train': 1.5844409465789795} -08/30/2021 18:18:02 - INFO - __main__ - Step 28707: {'lr': 0.0004608941035629168, 'samples': 5511744, 'steps': 28706, 'loss/train': 1.1635280847549438} -08/30/2021 18:18:02 - INFO - __main__ - Step 28708: {'lr': 0.0004608912537451027, 'samples': 5511936, 'steps': 28707, 'loss/train': 1.0059483051300049} -08/30/2021 18:18:02 - INFO - __main__ - Step 28709: {'lr': 0.0004608884038322642, 'samples': 5512128, 'steps': 28708, 'loss/train': 2.412945032119751} -08/30/2021 18:18:03 - INFO - __main__ - Step 28710: {'lr': 0.00046088555382440275, 'samples': 5512320, 'steps': 28709, 'loss/train': 1.2494611740112305} -08/30/2021 18:18:03 - INFO - __main__ - Step 28711: {'lr': 0.0004608827037215194, 'samples': 5512512, 'steps': 28710, 'loss/train': 1.1306918859481812} -08/30/2021 18:18:04 - INFO - __main__ - Step 28712: {'lr': 0.0004608798535236156, 'samples': 5512704, 'steps': 28711, 'loss/train': 1.6654123067855835} -08/30/2021 18:18:05 - INFO - __main__ - Step 28713: {'lr': 0.0004608770032306926, 'samples': 5512896, 'steps': 28712, 'loss/train': 1.8448811769485474} -08/30/2021 18:18:05 - INFO - __main__ - Step 28714: {'lr': 0.0004608741528427517, 'samples': 5513088, 'steps': 28713, 'loss/train': 1.4382745027542114} -08/30/2021 18:18:06 - INFO - __main__ - Step 28715: {'lr': 0.0004608713023597941, 'samples': 5513280, 'steps': 28714, 'loss/train': 1.543492317199707} -08/30/2021 18:18:06 - INFO - __main__ - Step 28716: {'lr': 0.00046086845178182123, 'samples': 5513472, 'steps': 28715, 'loss/train': 1.132645845413208} -08/30/2021 18:18:08 - INFO - __main__ - Step 28717: {'lr': 0.00046086560110883423, 'samples': 5513664, 'steps': 28716, 'loss/train': 1.647782325744629} -08/30/2021 18:18:08 - INFO - __main__ - Step 28718: {'lr': 0.00046086275034083453, 'samples': 5513856, 'steps': 28717, 'loss/train': 1.545560359954834} -08/30/2021 18:18:09 - INFO - __main__ - Step 28719: {'lr': 0.00046085989947782327, 'samples': 5514048, 'steps': 28718, 'loss/train': 1.9469356536865234} -08/30/2021 18:18:09 - INFO - __main__ - Step 28720: {'lr': 0.00046085704851980174, 'samples': 5514240, 'steps': 28719, 'loss/train': 0.14269833266735077} -08/30/2021 18:18:09 - INFO - __main__ - Step 28721: {'lr': 0.00046085419746677136, 'samples': 5514432, 'steps': 28720, 'loss/train': 1.31236732006073} -08/30/2021 18:18:11 - INFO - __main__ - Step 28722: {'lr': 0.00046085134631873326, 'samples': 5514624, 'steps': 28721, 'loss/train': 1.4599498510360718} -08/30/2021 18:18:11 - INFO - __main__ - Step 28723: {'lr': 0.0004608484950756888, 'samples': 5514816, 'steps': 28722, 'loss/train': 1.5662461519241333} -08/30/2021 18:18:11 - INFO - __main__ - Step 28724: {'lr': 0.0004608456437376393, 'samples': 5515008, 'steps': 28723, 'loss/train': 1.6499756574630737} -08/30/2021 18:18:12 - INFO - __main__ - Step 28725: {'lr': 0.000460842792304586, 'samples': 5515200, 'steps': 28724, 'loss/train': 1.1057729721069336} -08/30/2021 18:18:12 - INFO - __main__ - Step 28726: {'lr': 0.00046083994077653024, 'samples': 5515392, 'steps': 28725, 'loss/train': 1.292879581451416} -08/30/2021 18:18:14 - INFO - __main__ - Step 28727: {'lr': 0.0004608370891534732, 'samples': 5515584, 'steps': 28726, 'loss/train': 1.3703200817108154} -08/30/2021 18:18:15 - INFO - __main__ - Step 28728: {'lr': 0.0004608342374354162, 'samples': 5515776, 'steps': 28727, 'loss/train': 1.7802619934082031} -08/30/2021 18:18:15 - INFO - __main__ - Step 28729: {'lr': 0.0004608313856223606, 'samples': 5515968, 'steps': 28728, 'loss/train': 2.003765106201172} -08/30/2021 18:18:16 - INFO - __main__ - Step 28730: {'lr': 0.00046082853371430754, 'samples': 5516160, 'steps': 28729, 'loss/train': 1.603506088256836} -08/30/2021 18:18:16 - INFO - __main__ - Step 28731: {'lr': 0.0004608256817112585, 'samples': 5516352, 'steps': 28730, 'loss/train': 1.374673843383789} -08/30/2021 18:18:17 - INFO - __main__ - Step 28732: {'lr': 0.00046082282961321466, 'samples': 5516544, 'steps': 28731, 'loss/train': 1.6801224946975708} -08/30/2021 18:18:18 - INFO - __main__ - Step 28733: {'lr': 0.00046081997742017725, 'samples': 5516736, 'steps': 28732, 'loss/train': 1.1425230503082275} -08/30/2021 18:18:18 - INFO - __main__ - Step 28734: {'lr': 0.00046081712513214757, 'samples': 5516928, 'steps': 28733, 'loss/train': 1.9179368019104004} -08/30/2021 18:18:19 - INFO - __main__ - Step 28735: {'lr': 0.0004608142727491271, 'samples': 5517120, 'steps': 28734, 'loss/train': 1.8448516130447388} -08/30/2021 18:18:19 - INFO - __main__ - Step 28736: {'lr': 0.00046081142027111683, 'samples': 5517312, 'steps': 28735, 'loss/train': 1.168526530265808} -08/30/2021 18:18:21 - INFO - __main__ - Step 28737: {'lr': 0.0004608085676981182, 'samples': 5517504, 'steps': 28736, 'loss/train': 1.8542293310165405} -08/30/2021 18:18:21 - INFO - __main__ - Step 28738: {'lr': 0.0004608057150301326, 'samples': 5517696, 'steps': 28737, 'loss/train': 0.9919119477272034} -08/30/2021 18:18:21 - INFO - __main__ - Step 28739: {'lr': 0.00046080286226716106, 'samples': 5517888, 'steps': 28738, 'loss/train': 0.2748536765575409} -08/30/2021 18:18:22 - INFO - __main__ - Step 28740: {'lr': 0.00046080000940920506, 'samples': 5518080, 'steps': 28739, 'loss/train': 1.6069672107696533} -08/30/2021 18:18:22 - INFO - __main__ - Step 28741: {'lr': 0.00046079715645626584, 'samples': 5518272, 'steps': 28740, 'loss/train': 0.7914718389511108} -08/30/2021 18:18:23 - INFO - __main__ - Step 28742: {'lr': 0.00046079430340834467, 'samples': 5518464, 'steps': 28741, 'loss/train': 1.358385443687439} -08/30/2021 18:18:24 - INFO - __main__ - Step 28743: {'lr': 0.00046079145026544277, 'samples': 5518656, 'steps': 28742, 'loss/train': 1.2105307579040527} -08/30/2021 18:18:24 - INFO - __main__ - Step 28744: {'lr': 0.0004607885970275616, 'samples': 5518848, 'steps': 28743, 'loss/train': 1.393981695175171} -08/30/2021 18:18:25 - INFO - __main__ - Step 28745: {'lr': 0.0004607857436947023, 'samples': 5519040, 'steps': 28744, 'loss/train': 1.690173864364624} -08/30/2021 18:18:25 - INFO - __main__ - Step 28746: {'lr': 0.00046078289026686616, 'samples': 5519232, 'steps': 28745, 'loss/train': 1.5842844247817993} -08/30/2021 18:18:25 - INFO - __main__ - Step 28747: {'lr': 0.00046078003674405457, 'samples': 5519424, 'steps': 28746, 'loss/train': 1.2636808156967163} -08/30/2021 18:18:27 - INFO - __main__ - Step 28748: {'lr': 0.0004607771831262687, 'samples': 5519616, 'steps': 28747, 'loss/train': 0.9195443391799927} -08/30/2021 18:18:27 - INFO - __main__ - Step 28749: {'lr': 0.00046077432941350993, 'samples': 5519808, 'steps': 28748, 'loss/train': 1.424353837966919} -08/30/2021 18:18:28 - INFO - __main__ - Step 28750: {'lr': 0.00046077147560577943, 'samples': 5520000, 'steps': 28749, 'loss/train': 1.416340947151184} -08/30/2021 18:18:28 - INFO - __main__ - Step 28751: {'lr': 0.0004607686217030786, 'samples': 5520192, 'steps': 28750, 'loss/train': 1.5812209844589233} -08/30/2021 18:18:28 - INFO - __main__ - Step 28752: {'lr': 0.00046076576770540865, 'samples': 5520384, 'steps': 28751, 'loss/train': 1.2292712926864624} -08/30/2021 18:18:30 - INFO - __main__ - Step 28753: {'lr': 0.00046076291361277097, 'samples': 5520576, 'steps': 28752, 'loss/train': 1.74449622631073} -08/30/2021 18:18:31 - INFO - __main__ - Step 28754: {'lr': 0.00046076005942516666, 'samples': 5520768, 'steps': 28753, 'loss/train': 1.7540959119796753} -08/30/2021 18:18:31 - INFO - __main__ - Step 28755: {'lr': 0.0004607572051425972, 'samples': 5520960, 'steps': 28754, 'loss/train': 1.4322564601898193} -08/30/2021 18:18:32 - INFO - __main__ - Step 28756: {'lr': 0.00046075435076506376, 'samples': 5521152, 'steps': 28755, 'loss/train': 0.1628573089838028} -08/30/2021 18:18:32 - INFO - __main__ - Step 28757: {'lr': 0.0004607514962925677, 'samples': 5521344, 'steps': 28756, 'loss/train': 1.1711376905441284} -08/30/2021 18:18:33 - INFO - __main__ - Step 28758: {'lr': 0.00046074864172511025, 'samples': 5521536, 'steps': 28757, 'loss/train': 0.9528539776802063} -08/30/2021 18:18:34 - INFO - __main__ - Step 28759: {'lr': 0.0004607457870626928, 'samples': 5521728, 'steps': 28758, 'loss/train': 1.6156426668167114} -08/30/2021 18:18:34 - INFO - __main__ - Step 28760: {'lr': 0.0004607429323053164, 'samples': 5521920, 'steps': 28759, 'loss/train': 1.670474648475647} -08/30/2021 18:18:34 - INFO - __main__ - Step 28761: {'lr': 0.0004607400774529825, 'samples': 5522112, 'steps': 28760, 'loss/train': 1.3794561624526978} -08/30/2021 18:18:35 - INFO - __main__ - Step 28762: {'lr': 0.0004607372225056925, 'samples': 5522304, 'steps': 28761, 'loss/train': 1.0120388269424438} -08/30/2021 18:18:36 - INFO - __main__ - Step 28763: {'lr': 0.00046073436746344744, 'samples': 5522496, 'steps': 28762, 'loss/train': 1.1292396783828735} -08/30/2021 18:18:37 - INFO - __main__ - Step 28764: {'lr': 0.0004607315123262488, 'samples': 5522688, 'steps': 28763, 'loss/train': 1.728515625} -08/30/2021 18:18:37 - INFO - __main__ - Step 28765: {'lr': 0.0004607286570940977, 'samples': 5522880, 'steps': 28764, 'loss/train': 1.4552578926086426} -08/30/2021 18:18:37 - INFO - __main__ - Step 28766: {'lr': 0.0004607258017669956, 'samples': 5523072, 'steps': 28765, 'loss/train': 1.4807502031326294} -08/30/2021 18:18:38 - INFO - __main__ - Step 28767: {'lr': 0.0004607229463449437, 'samples': 5523264, 'steps': 28766, 'loss/train': 1.7356168031692505} -08/30/2021 18:18:38 - INFO - __main__ - Step 28768: {'lr': 0.00046072009082794333, 'samples': 5523456, 'steps': 28767, 'loss/train': 1.394574522972107} -08/30/2021 18:18:40 - INFO - __main__ - Step 28769: {'lr': 0.00046071723521599563, 'samples': 5523648, 'steps': 28768, 'loss/train': 1.4062213897705078} -08/30/2021 18:18:40 - INFO - __main__ - Step 28770: {'lr': 0.000460714379509102, 'samples': 5523840, 'steps': 28769, 'loss/train': 1.4895013570785522} -08/30/2021 18:18:40 - INFO - __main__ - Step 28771: {'lr': 0.0004607115237072638, 'samples': 5524032, 'steps': 28770, 'loss/train': 1.6866536140441895} -08/30/2021 18:18:41 - INFO - __main__ - Step 28772: {'lr': 0.00046070866781048225, 'samples': 5524224, 'steps': 28771, 'loss/train': 0.6956020593643188} -08/30/2021 18:18:41 - INFO - __main__ - Step 28773: {'lr': 0.0004607058118187586, 'samples': 5524416, 'steps': 28772, 'loss/train': 1.3922953605651855} -08/30/2021 18:18:43 - INFO - __main__ - Step 28774: {'lr': 0.00046070295573209406, 'samples': 5524608, 'steps': 28773, 'loss/train': 1.3464394807815552} -08/30/2021 18:18:43 - INFO - __main__ - Step 28775: {'lr': 0.00046070009955049017, 'samples': 5524800, 'steps': 28774, 'loss/train': 1.44407057762146} -08/30/2021 18:18:43 - INFO - __main__ - Step 28776: {'lr': 0.000460697243273948, 'samples': 5524992, 'steps': 28775, 'loss/train': 1.6780152320861816} -08/30/2021 18:18:44 - INFO - __main__ - Step 28777: {'lr': 0.0004606943869024689, 'samples': 5525184, 'steps': 28776, 'loss/train': 1.5969003438949585} -08/30/2021 18:18:44 - INFO - __main__ - Step 28778: {'lr': 0.0004606915304360542, 'samples': 5525376, 'steps': 28777, 'loss/train': 2.0217835903167725} -08/30/2021 18:18:46 - INFO - __main__ - Step 28779: {'lr': 0.00046068867387470507, 'samples': 5525568, 'steps': 28778, 'loss/train': 1.3903378248214722} -08/30/2021 18:18:47 - INFO - __main__ - Step 28780: {'lr': 0.00046068581721842294, 'samples': 5525760, 'steps': 28779, 'loss/train': 1.7632614374160767} -08/30/2021 18:18:47 - INFO - __main__ - Step 28781: {'lr': 0.00046068296046720904, 'samples': 5525952, 'steps': 28780, 'loss/train': 1.5530871152877808} -08/30/2021 18:18:48 - INFO - __main__ - Step 28782: {'lr': 0.0004606801036210646, 'samples': 5526144, 'steps': 28781, 'loss/train': 1.5877370834350586} -08/30/2021 18:18:48 - INFO - __main__ - Step 28783: {'lr': 0.000460677246679991, 'samples': 5526336, 'steps': 28782, 'loss/train': 0.5917261242866516} -08/30/2021 18:18:49 - INFO - __main__ - Step 28784: {'lr': 0.00046067438964398944, 'samples': 5526528, 'steps': 28783, 'loss/train': 1.719201683998108} -08/30/2021 18:18:50 - INFO - __main__ - Step 28785: {'lr': 0.00046067153251306127, 'samples': 5526720, 'steps': 28784, 'loss/train': 0.9624534249305725} -08/30/2021 18:18:50 - INFO - __main__ - Step 28786: {'lr': 0.0004606686752872078, 'samples': 5526912, 'steps': 28785, 'loss/train': 1.9532489776611328} -08/30/2021 18:18:50 - INFO - __main__ - Step 28787: {'lr': 0.0004606658179664302, 'samples': 5527104, 'steps': 28786, 'loss/train': 1.748219609260559} -08/30/2021 18:18:51 - INFO - __main__ - Step 28788: {'lr': 0.00046066296055072986, 'samples': 5527296, 'steps': 28787, 'loss/train': 1.2918643951416016} -08/30/2021 18:18:52 - INFO - __main__ - Step 28789: {'lr': 0.0004606601030401081, 'samples': 5527488, 'steps': 28788, 'loss/train': 1.6055225133895874} -08/30/2021 18:18:53 - INFO - __main__ - Step 28790: {'lr': 0.0004606572454345661, 'samples': 5527680, 'steps': 28789, 'loss/train': 2.2760958671569824} -08/30/2021 18:18:53 - INFO - __main__ - Step 28791: {'lr': 0.0004606543877341052, 'samples': 5527872, 'steps': 28790, 'loss/train': 1.3080912828445435} -08/30/2021 18:18:54 - INFO - __main__ - Step 28792: {'lr': 0.00046065152993872665, 'samples': 5528064, 'steps': 28791, 'loss/train': 0.6149696111679077} -08/30/2021 18:18:54 - INFO - __main__ - Step 28793: {'lr': 0.0004606486720484318, 'samples': 5528256, 'steps': 28792, 'loss/train': 1.9276411533355713} -08/30/2021 18:18:55 - INFO - __main__ - Step 28794: {'lr': 0.0004606458140632219, 'samples': 5528448, 'steps': 28793, 'loss/train': 1.213881015777588} -08/30/2021 18:18:56 - INFO - __main__ - Step 28795: {'lr': 0.0004606429559830982, 'samples': 5528640, 'steps': 28794, 'loss/train': 1.8192152976989746} -08/30/2021 18:18:56 - INFO - __main__ - Step 28796: {'lr': 0.00046064009780806217, 'samples': 5528832, 'steps': 28795, 'loss/train': 1.3204809427261353} -08/30/2021 18:18:57 - INFO - __main__ - Step 28797: {'lr': 0.0004606372395381149, 'samples': 5529024, 'steps': 28796, 'loss/train': 1.1457908153533936} -08/30/2021 18:18:57 - INFO - __main__ - Step 28798: {'lr': 0.0004606343811732577, 'samples': 5529216, 'steps': 28797, 'loss/train': 1.4433735609054565} -08/30/2021 18:18:58 - INFO - __main__ - Step 28799: {'lr': 0.0004606315227134919, 'samples': 5529408, 'steps': 28798, 'loss/train': 1.2644931077957153} -08/30/2021 18:18:59 - INFO - __main__ - Step 28800: {'lr': 0.0004606286641588188, 'samples': 5529600, 'steps': 28799, 'loss/train': 1.5006144046783447} -08/30/2021 18:18:59 - INFO - __main__ - Step 28801: {'lr': 0.0004606258055092397, 'samples': 5529792, 'steps': 28800, 'loss/train': 1.426822304725647} -08/30/2021 18:19:00 - INFO - __main__ - Step 28802: {'lr': 0.00046062294676475584, 'samples': 5529984, 'steps': 28801, 'loss/train': 1.4379661083221436} -08/30/2021 18:19:00 - INFO - __main__ - Step 28803: {'lr': 0.0004606200879253685, 'samples': 5530176, 'steps': 28802, 'loss/train': 1.4996684789657593} -08/30/2021 18:19:02 - INFO - __main__ - Step 28804: {'lr': 0.00046061722899107905, 'samples': 5530368, 'steps': 28803, 'loss/train': 1.2916420698165894} -08/30/2021 18:19:02 - INFO - __main__ - Step 28805: {'lr': 0.0004606143699618888, 'samples': 5530560, 'steps': 28804, 'loss/train': 1.4700864553451538} -08/30/2021 18:19:02 - INFO - __main__ - Step 28806: {'lr': 0.00046061151083779886, 'samples': 5530752, 'steps': 28805, 'loss/train': 1.9744372367858887} -08/30/2021 18:19:03 - INFO - __main__ - Step 28807: {'lr': 0.0004606086516188106, 'samples': 5530944, 'steps': 28806, 'loss/train': 1.173879861831665} -08/30/2021 18:19:03 - INFO - __main__ - Step 28808: {'lr': 0.00046060579230492533, 'samples': 5531136, 'steps': 28807, 'loss/train': 1.6978788375854492} -08/30/2021 18:19:04 - INFO - __main__ - Step 28809: {'lr': 0.0004606029328961444, 'samples': 5531328, 'steps': 28808, 'loss/train': 1.7924799919128418} -08/30/2021 18:19:05 - INFO - __main__ - Step 28810: {'lr': 0.000460600073392469, 'samples': 5531520, 'steps': 28809, 'loss/train': 1.2540429830551147} -08/30/2021 18:19:05 - INFO - __main__ - Step 28811: {'lr': 0.00046059721379390053, 'samples': 5531712, 'steps': 28810, 'loss/train': 0.6633529663085938} -08/30/2021 18:19:06 - INFO - __main__ - Step 28812: {'lr': 0.0004605943541004401, 'samples': 5531904, 'steps': 28811, 'loss/train': 1.1641274690628052} -08/30/2021 18:19:06 - INFO - __main__ - Step 28813: {'lr': 0.00046059149431208914, 'samples': 5532096, 'steps': 28812, 'loss/train': 1.72393000125885} -08/30/2021 18:19:06 - INFO - __main__ - Step 28814: {'lr': 0.0004605886344288489, 'samples': 5532288, 'steps': 28813, 'loss/train': 1.344095230102539} -08/30/2021 18:19:08 - INFO - __main__ - Step 28815: {'lr': 0.0004605857744507207, 'samples': 5532480, 'steps': 28814, 'loss/train': 1.4743280410766602} -08/30/2021 18:19:08 - INFO - __main__ - Step 28816: {'lr': 0.00046058291437770584, 'samples': 5532672, 'steps': 28815, 'loss/train': 1.1923967599868774} -08/30/2021 18:19:09 - INFO - __main__ - Step 28817: {'lr': 0.0004605800542098054, 'samples': 5532864, 'steps': 28816, 'loss/train': 1.0488197803497314} -08/30/2021 18:19:09 - INFO - __main__ - Step 28818: {'lr': 0.00046057719394702103, 'samples': 5533056, 'steps': 28817, 'loss/train': 1.435438632965088} -08/30/2021 18:19:09 - INFO - __main__ - Step 28819: {'lr': 0.00046057433358935373, 'samples': 5533248, 'steps': 28818, 'loss/train': 0.1840985119342804} -08/30/2021 18:19:11 - INFO - __main__ - Step 28820: {'lr': 0.0004605714731368049, 'samples': 5533440, 'steps': 28819, 'loss/train': 1.9750401973724365} -08/30/2021 18:19:12 - INFO - __main__ - Step 28821: {'lr': 0.0004605686125893758, 'samples': 5533632, 'steps': 28820, 'loss/train': 1.3374357223510742} -08/30/2021 18:19:12 - INFO - __main__ - Step 28822: {'lr': 0.00046056575194706773, 'samples': 5533824, 'steps': 28821, 'loss/train': 0.9989317655563354} -08/30/2021 18:19:12 - INFO - __main__ - Step 28823: {'lr': 0.000460562891209882, 'samples': 5534016, 'steps': 28822, 'loss/train': 1.727424144744873} -08/30/2021 18:19:13 - INFO - __main__ - Step 28824: {'lr': 0.0004605600303778199, 'samples': 5534208, 'steps': 28823, 'loss/train': 1.3220311403274536} -08/30/2021 18:19:13 - INFO - __main__ - Step 28825: {'lr': 0.0004605571694508827, 'samples': 5534400, 'steps': 28824, 'loss/train': 1.4859980344772339} -08/30/2021 18:19:14 - INFO - __main__ - Step 28826: {'lr': 0.0004605543084290716, 'samples': 5534592, 'steps': 28825, 'loss/train': 1.5253325700759888} -08/30/2021 18:19:15 - INFO - __main__ - Step 28827: {'lr': 0.00046055144731238805, 'samples': 5534784, 'steps': 28826, 'loss/train': 1.4258514642715454} -08/30/2021 18:19:15 - INFO - __main__ - Step 28828: {'lr': 0.00046054858610083325, 'samples': 5534976, 'steps': 28827, 'loss/train': 1.5617334842681885} -08/30/2021 18:19:16 - INFO - __main__ - Step 28829: {'lr': 0.0004605457247944086, 'samples': 5535168, 'steps': 28828, 'loss/train': 1.6477042436599731} -08/30/2021 18:19:16 - INFO - __main__ - Step 28830: {'lr': 0.0004605428633931152, 'samples': 5535360, 'steps': 28829, 'loss/train': 1.5681991577148438} -08/30/2021 18:19:18 - INFO - __main__ - Step 28831: {'lr': 0.00046054000189695444, 'samples': 5535552, 'steps': 28830, 'loss/train': 1.8616143465042114} -08/30/2021 18:19:18 - INFO - __main__ - Step 28832: {'lr': 0.00046053714030592764, 'samples': 5535744, 'steps': 28831, 'loss/train': 5.211965084075928} -08/30/2021 18:19:19 - INFO - __main__ - Step 28833: {'lr': 0.0004605342786200359, 'samples': 5535936, 'steps': 28832, 'loss/train': 5.299749374389648} -08/30/2021 18:19:19 - INFO - __main__ - Step 28834: {'lr': 0.0004605314168392809, 'samples': 5536128, 'steps': 28833, 'loss/train': 1.5922120809555054} -08/30/2021 18:19:19 - INFO - __main__ - Step 28835: {'lr': 0.00046052855496366354, 'samples': 5536320, 'steps': 28834, 'loss/train': 2.2216432094573975} -08/30/2021 18:19:20 - INFO - __main__ - Step 28836: {'lr': 0.0004605256929931853, 'samples': 5536512, 'steps': 28835, 'loss/train': 1.0870556831359863} -08/30/2021 18:19:22 - INFO - __main__ - Step 28837: {'lr': 0.0004605228309278474, 'samples': 5536704, 'steps': 28836, 'loss/train': 1.584465503692627} -08/30/2021 18:19:22 - INFO - __main__ - Step 28838: {'lr': 0.0004605199687676512, 'samples': 5536896, 'steps': 28837, 'loss/train': 1.690821886062622} -08/30/2021 18:19:23 - INFO - __main__ - Step 28839: {'lr': 0.00046051710651259797, 'samples': 5537088, 'steps': 28838, 'loss/train': 1.9488508701324463} -08/30/2021 18:19:23 - INFO - __main__ - Step 28840: {'lr': 0.00046051424416268896, 'samples': 5537280, 'steps': 28839, 'loss/train': 1.453596591949463} -08/30/2021 18:19:23 - INFO - __main__ - Step 28841: {'lr': 0.0004605113817179255, 'samples': 5537472, 'steps': 28840, 'loss/train': 1.7849009037017822} -08/30/2021 18:19:25 - INFO - __main__ - Step 28842: {'lr': 0.00046050851917830884, 'samples': 5537664, 'steps': 28841, 'loss/train': 1.0420764684677124} -08/30/2021 18:19:25 - INFO - __main__ - Step 28843: {'lr': 0.00046050565654384023, 'samples': 5537856, 'steps': 28842, 'loss/train': 1.6934154033660889} -08/30/2021 18:19:26 - INFO - __main__ - Step 28844: {'lr': 0.0004605027938145211, 'samples': 5538048, 'steps': 28843, 'loss/train': 1.946616768836975} -08/30/2021 18:19:26 - INFO - __main__ - Step 28845: {'lr': 0.0004604999309903526, 'samples': 5538240, 'steps': 28844, 'loss/train': 1.6108081340789795} -08/30/2021 18:19:26 - INFO - __main__ - Step 28846: {'lr': 0.0004604970680713362, 'samples': 5538432, 'steps': 28845, 'loss/train': 2.1126925945281982} -08/30/2021 18:19:27 - INFO - __main__ - Step 28847: {'lr': 0.00046049420505747294, 'samples': 5538624, 'steps': 28846, 'loss/train': 1.4479706287384033} -08/30/2021 18:19:28 - INFO - __main__ - Step 28848: {'lr': 0.0004604913419487643, 'samples': 5538816, 'steps': 28847, 'loss/train': 1.1913269758224487} -08/30/2021 18:19:29 - INFO - __main__ - Step 28849: {'lr': 0.00046048847874521144, 'samples': 5539008, 'steps': 28848, 'loss/train': 1.337689995765686} -08/30/2021 18:19:29 - INFO - __main__ - Step 28850: {'lr': 0.00046048561544681575, 'samples': 5539200, 'steps': 28849, 'loss/train': 1.0054725408554077} -08/30/2021 18:19:29 - INFO - __main__ - Step 28851: {'lr': 0.00046048275205357855, 'samples': 5539392, 'steps': 28850, 'loss/train': 1.068784475326538} -08/30/2021 18:19:30 - INFO - __main__ - Step 28852: {'lr': 0.00046047988856550104, 'samples': 5539584, 'steps': 28851, 'loss/train': 1.2208802700042725} -08/30/2021 18:19:31 - INFO - __main__ - Step 28853: {'lr': 0.00046047702498258446, 'samples': 5539776, 'steps': 28852, 'loss/train': 1.698395848274231} -08/30/2021 18:19:32 - INFO - __main__ - Step 28854: {'lr': 0.00046047416130483033, 'samples': 5539968, 'steps': 28853, 'loss/train': 1.7481921911239624} -08/30/2021 18:19:32 - INFO - __main__ - Step 28855: {'lr': 0.00046047129753223973, 'samples': 5540160, 'steps': 28854, 'loss/train': 1.0832093954086304} -08/30/2021 18:19:32 - INFO - __main__ - Step 28856: {'lr': 0.0004604684336648139, 'samples': 5540352, 'steps': 28855, 'loss/train': 1.8524690866470337} -08/30/2021 18:19:33 - INFO - __main__ - Step 28857: {'lr': 0.00046046556970255435, 'samples': 5540544, 'steps': 28856, 'loss/train': 1.2693358659744263} -08/30/2021 18:19:34 - INFO - __main__ - Step 28858: {'lr': 0.0004604627056454622, 'samples': 5540736, 'steps': 28857, 'loss/train': 1.1964995861053467} -08/30/2021 18:19:34 - INFO - __main__ - Step 28859: {'lr': 0.00046045984149353894, 'samples': 5540928, 'steps': 28858, 'loss/train': 1.4220203161239624} -08/30/2021 18:19:35 - INFO - __main__ - Step 28860: {'lr': 0.0004604569772467856, 'samples': 5541120, 'steps': 28859, 'loss/train': 1.0095555782318115} -08/30/2021 18:19:35 - INFO - __main__ - Step 28861: {'lr': 0.00046045411290520364, 'samples': 5541312, 'steps': 28860, 'loss/train': 1.8971298933029175} -08/30/2021 18:19:36 - INFO - __main__ - Step 28862: {'lr': 0.00046045124846879427, 'samples': 5541504, 'steps': 28861, 'loss/train': 1.142421007156372} -08/30/2021 18:19:37 - INFO - __main__ - Step 28863: {'lr': 0.00046044838393755885, 'samples': 5541696, 'steps': 28862, 'loss/train': 1.459968090057373} -08/30/2021 18:19:38 - INFO - __main__ - Step 28864: {'lr': 0.00046044551931149856, 'samples': 5541888, 'steps': 28863, 'loss/train': 0.4833144247531891} -08/30/2021 18:19:38 - INFO - __main__ - Step 28865: {'lr': 0.0004604426545906149, 'samples': 5542080, 'steps': 28864, 'loss/train': 1.4947117567062378} -08/30/2021 18:19:38 - INFO - __main__ - Step 28866: {'lr': 0.0004604397897749089, 'samples': 5542272, 'steps': 28865, 'loss/train': 1.7568550109863281} -08/30/2021 18:19:39 - INFO - __main__ - Step 28867: {'lr': 0.00046043692486438207, 'samples': 5542464, 'steps': 28866, 'loss/train': 1.0612441301345825} -08/30/2021 18:19:40 - INFO - __main__ - Step 28868: {'lr': 0.00046043405985903555, 'samples': 5542656, 'steps': 28867, 'loss/train': 1.6154786348342896} -08/30/2021 18:19:41 - INFO - __main__ - Step 28869: {'lr': 0.00046043119475887073, 'samples': 5542848, 'steps': 28868, 'loss/train': 1.5218857526779175} -08/30/2021 18:19:41 - INFO - __main__ - Step 28870: {'lr': 0.0004604283295638888, 'samples': 5543040, 'steps': 28869, 'loss/train': 1.3188573122024536} -08/30/2021 18:19:42 - INFO - __main__ - Step 28871: {'lr': 0.00046042546427409116, 'samples': 5543232, 'steps': 28870, 'loss/train': 0.7918139696121216} -08/30/2021 18:19:42 - INFO - __main__ - Step 28872: {'lr': 0.000460422598889479, 'samples': 5543424, 'steps': 28871, 'loss/train': 1.4799987077713013} -08/30/2021 18:19:43 - INFO - __main__ - Step 28873: {'lr': 0.0004604197334100537, 'samples': 5543616, 'steps': 28872, 'loss/train': 1.4581646919250488} -08/30/2021 18:19:44 - INFO - __main__ - Step 28874: {'lr': 0.0004604168678358166, 'samples': 5543808, 'steps': 28873, 'loss/train': 1.1605101823806763} -08/30/2021 18:19:44 - INFO - __main__ - Step 28875: {'lr': 0.00046041400216676874, 'samples': 5544000, 'steps': 28874, 'loss/train': 1.4286561012268066} -08/30/2021 18:19:45 - INFO - __main__ - Step 28876: {'lr': 0.0004604111364029118, 'samples': 5544192, 'steps': 28875, 'loss/train': 1.7455028295516968} -08/30/2021 18:19:45 - INFO - __main__ - Step 28877: {'lr': 0.0004604082705442466, 'samples': 5544384, 'steps': 28876, 'loss/train': 1.7974566221237183} -08/30/2021 18:19:46 - INFO - __main__ - Step 28878: {'lr': 0.00046040540459077483, 'samples': 5544576, 'steps': 28877, 'loss/train': 0.9158125519752502} -08/30/2021 18:19:47 - INFO - __main__ - Step 28879: {'lr': 0.0004604025385424976, 'samples': 5544768, 'steps': 28878, 'loss/train': 1.5195859670639038} -08/30/2021 18:19:47 - INFO - __main__ - Step 28880: {'lr': 0.00046039967239941626, 'samples': 5544960, 'steps': 28879, 'loss/train': 1.4470536708831787} -08/30/2021 18:19:48 - INFO - __main__ - Step 28881: {'lr': 0.000460396806161532, 'samples': 5545152, 'steps': 28880, 'loss/train': 1.6458234786987305} -08/30/2021 18:19:48 - INFO - __main__ - Step 28882: {'lr': 0.0004603939398288463, 'samples': 5545344, 'steps': 28881, 'loss/train': 1.1609463691711426} -08/30/2021 18:19:49 - INFO - __main__ - Step 28883: {'lr': 0.00046039107340136023, 'samples': 5545536, 'steps': 28882, 'loss/train': 1.6444604396820068} -08/30/2021 18:19:50 - INFO - __main__ - Step 28884: {'lr': 0.00046038820687907523, 'samples': 5545728, 'steps': 28883, 'loss/train': 1.0269838571548462} -08/30/2021 18:19:50 - INFO - __main__ - Step 28885: {'lr': 0.0004603853402619925, 'samples': 5545920, 'steps': 28884, 'loss/train': 1.2960134744644165} -08/30/2021 18:19:51 - INFO - __main__ - Step 28886: {'lr': 0.00046038247355011347, 'samples': 5546112, 'steps': 28885, 'loss/train': 1.117455005645752} -08/30/2021 18:19:51 - INFO - __main__ - Step 28887: {'lr': 0.00046037960674343925, 'samples': 5546304, 'steps': 28886, 'loss/train': 0.9311093688011169} -08/30/2021 18:19:51 - INFO - __main__ - Step 28888: {'lr': 0.0004603767398419713, 'samples': 5546496, 'steps': 28887, 'loss/train': 1.880321741104126} -08/30/2021 18:19:54 - INFO - __main__ - Step 28889: {'lr': 0.0004603738728457109, 'samples': 5546688, 'steps': 28888, 'loss/train': 1.6211706399917603} -08/30/2021 18:19:54 - INFO - __main__ - Step 28890: {'lr': 0.0004603710057546592, 'samples': 5546880, 'steps': 28889, 'loss/train': 0.2054881751537323} -08/30/2021 18:19:55 - INFO - __main__ - Step 28891: {'lr': 0.0004603681385688175, 'samples': 5547072, 'steps': 28890, 'loss/train': 0.07243458181619644} -08/30/2021 18:19:55 - INFO - __main__ - Step 28892: {'lr': 0.00046036527128818724, 'samples': 5547264, 'steps': 28891, 'loss/train': 1.0678194761276245} -08/30/2021 18:19:55 - INFO - __main__ - Step 28893: {'lr': 0.0004603624039127696, 'samples': 5547456, 'steps': 28892, 'loss/train': 1.3182927370071411} -08/30/2021 18:19:56 - INFO - __main__ - Step 28894: {'lr': 0.00046035953644256596, 'samples': 5547648, 'steps': 28893, 'loss/train': 1.3891026973724365} -08/30/2021 18:19:57 - INFO - __main__ - Step 28895: {'lr': 0.00046035666887757755, 'samples': 5547840, 'steps': 28894, 'loss/train': 0.2706478536128998} -08/30/2021 18:19:58 - INFO - __main__ - Step 28896: {'lr': 0.00046035380121780563, 'samples': 5548032, 'steps': 28895, 'loss/train': 0.8166786432266235} -08/30/2021 18:19:58 - INFO - __main__ - Step 28897: {'lr': 0.0004603509334632515, 'samples': 5548224, 'steps': 28896, 'loss/train': 1.5154094696044922} -08/30/2021 18:19:58 - INFO - __main__ - Step 28898: {'lr': 0.00046034806561391655, 'samples': 5548416, 'steps': 28897, 'loss/train': 1.4594331979751587} -08/30/2021 18:19:59 - INFO - __main__ - Step 28899: {'lr': 0.000460345197669802, 'samples': 5548608, 'steps': 28898, 'loss/train': 1.543952465057373} -08/30/2021 18:19:59 - INFO - __main__ - Step 28900: {'lr': 0.0004603423296309092, 'samples': 5548800, 'steps': 28899, 'loss/train': 1.7093851566314697} -08/30/2021 18:20:01 - INFO - __main__ - Step 28901: {'lr': 0.0004603394614972393, 'samples': 5548992, 'steps': 28900, 'loss/train': 1.3952860832214355} -08/30/2021 18:20:01 - INFO - __main__ - Step 28902: {'lr': 0.00046033659326879373, 'samples': 5549184, 'steps': 28901, 'loss/train': 2.4770402908325195} -08/30/2021 18:20:02 - INFO - __main__ - Step 28903: {'lr': 0.00046033372494557373, 'samples': 5549376, 'steps': 28902, 'loss/train': 0.9451573491096497} -08/30/2021 18:20:02 - INFO - __main__ - Step 28904: {'lr': 0.00046033085652758053, 'samples': 5549568, 'steps': 28903, 'loss/train': 0.03911512717604637} -08/30/2021 18:20:02 - INFO - __main__ - Step 28905: {'lr': 0.00046032798801481564, 'samples': 5549760, 'steps': 28904, 'loss/train': 1.26829993724823} -08/30/2021 18:20:03 - INFO - __main__ - Step 28906: {'lr': 0.0004603251194072801, 'samples': 5549952, 'steps': 28905, 'loss/train': 1.5318100452423096} -08/30/2021 18:20:04 - INFO - __main__ - Step 28907: {'lr': 0.0004603222507049754, 'samples': 5550144, 'steps': 28906, 'loss/train': 1.6907885074615479} -08/30/2021 18:20:05 - INFO - __main__ - Step 28908: {'lr': 0.00046031938190790254, 'samples': 5550336, 'steps': 28907, 'loss/train': 1.842464804649353} -08/30/2021 18:20:05 - INFO - __main__ - Step 28909: {'lr': 0.0004603165130160633, 'samples': 5550528, 'steps': 28908, 'loss/train': 1.7786346673965454} -08/30/2021 18:20:05 - INFO - __main__ - Step 28910: {'lr': 0.0004603136440294584, 'samples': 5550720, 'steps': 28909, 'loss/train': 1.5675617456436157} -08/30/2021 18:20:06 - INFO - __main__ - Step 28911: {'lr': 0.0004603107749480896, 'samples': 5550912, 'steps': 28910, 'loss/train': 1.4550175666809082} -08/30/2021 18:20:07 - INFO - __main__ - Step 28912: {'lr': 0.0004603079057719579, 'samples': 5551104, 'steps': 28911, 'loss/train': 1.8844538927078247} -08/30/2021 18:20:08 - INFO - __main__ - Step 28913: {'lr': 0.0004603050365010648, 'samples': 5551296, 'steps': 28912, 'loss/train': 1.815502405166626} -08/30/2021 18:20:08 - INFO - __main__ - Step 28914: {'lr': 0.00046030216713541147, 'samples': 5551488, 'steps': 28913, 'loss/train': 1.5247673988342285} -08/30/2021 18:20:08 - INFO - __main__ - Step 28915: {'lr': 0.00046029929767499924, 'samples': 5551680, 'steps': 28914, 'loss/train': 1.4302256107330322} -08/30/2021 18:20:09 - INFO - __main__ - Step 28916: {'lr': 0.0004602964281198293, 'samples': 5551872, 'steps': 28915, 'loss/train': 1.7288661003112793} -08/30/2021 18:20:10 - INFO - __main__ - Step 28917: {'lr': 0.0004602935584699031, 'samples': 5552064, 'steps': 28916, 'loss/train': 1.8400119543075562} -08/30/2021 18:20:11 - INFO - __main__ - Step 28918: {'lr': 0.00046029068872522185, 'samples': 5552256, 'steps': 28917, 'loss/train': 1.44405198097229} -08/30/2021 18:20:11 - INFO - __main__ - Step 28919: {'lr': 0.0004602878188857869, 'samples': 5552448, 'steps': 28918, 'loss/train': 1.474245548248291} -08/30/2021 18:20:11 - INFO - __main__ - Step 28920: {'lr': 0.0004602849489515995, 'samples': 5552640, 'steps': 28919, 'loss/train': 1.9890936613082886} -08/30/2021 18:20:12 - INFO - __main__ - Step 28921: {'lr': 0.00046028207892266095, 'samples': 5552832, 'steps': 28920, 'loss/train': 1.5841706991195679} -08/30/2021 18:20:13 - INFO - __main__ - Step 28922: {'lr': 0.00046027920879897243, 'samples': 5553024, 'steps': 28921, 'loss/train': 0.14850802719593048} -08/30/2021 18:20:14 - INFO - __main__ - Step 28923: {'lr': 0.00046027633858053554, 'samples': 5553216, 'steps': 28922, 'loss/train': 1.1777100563049316} -08/30/2021 18:20:14 - INFO - __main__ - Step 28924: {'lr': 0.0004602734682673512, 'samples': 5553408, 'steps': 28923, 'loss/train': 1.2692878246307373} -08/30/2021 18:20:14 - INFO - __main__ - Step 28925: {'lr': 0.0004602705978594209, 'samples': 5553600, 'steps': 28924, 'loss/train': 1.4671497344970703} -08/30/2021 18:20:15 - INFO - __main__ - Step 28926: {'lr': 0.00046026772735674606, 'samples': 5553792, 'steps': 28925, 'loss/train': 1.2502681016921997} -08/30/2021 18:20:16 - INFO - __main__ - Step 28927: {'lr': 0.00046026485675932765, 'samples': 5553984, 'steps': 28926, 'loss/train': 1.571979284286499} -08/30/2021 18:20:17 - INFO - __main__ - Step 28928: {'lr': 0.0004602619860671672, 'samples': 5554176, 'steps': 28927, 'loss/train': 0.8823884129524231} -08/30/2021 18:20:17 - INFO - __main__ - Step 28929: {'lr': 0.000460259115280266, 'samples': 5554368, 'steps': 28928, 'loss/train': 2.0176033973693848} -08/30/2021 18:20:17 - INFO - __main__ - Step 28930: {'lr': 0.00046025624439862523, 'samples': 5554560, 'steps': 28929, 'loss/train': 1.8027647733688354} -08/30/2021 18:20:18 - INFO - __main__ - Step 28931: {'lr': 0.0004602533734222463, 'samples': 5554752, 'steps': 28930, 'loss/train': 1.4804277420043945} -08/30/2021 18:20:18 - INFO - __main__ - Step 28932: {'lr': 0.00046025050235113036, 'samples': 5554944, 'steps': 28931, 'loss/train': 1.4038063287734985} -08/30/2021 18:20:20 - INFO - __main__ - Step 28933: {'lr': 0.00046024763118527885, 'samples': 5555136, 'steps': 28932, 'loss/train': 1.8037775754928589} -08/30/2021 18:20:20 - INFO - __main__ - Step 28934: {'lr': 0.00046024475992469295, 'samples': 5555328, 'steps': 28933, 'loss/train': 1.4444252252578735} -08/30/2021 18:20:20 - INFO - __main__ - Step 28935: {'lr': 0.0004602418885693741, 'samples': 5555520, 'steps': 28934, 'loss/train': 1.142490029335022} -08/30/2021 18:20:21 - INFO - __main__ - Step 28936: {'lr': 0.0004602390171193234, 'samples': 5555712, 'steps': 28935, 'loss/train': 1.1529531478881836} -08/30/2021 18:20:21 - INFO - __main__ - Step 28937: {'lr': 0.0004602361455745423, 'samples': 5555904, 'steps': 28936, 'loss/train': 1.541255235671997} -08/30/2021 18:20:23 - INFO - __main__ - Step 28938: {'lr': 0.000460233273935032, 'samples': 5556096, 'steps': 28937, 'loss/train': 1.4332858324050903} -08/30/2021 18:20:23 - INFO - __main__ - Step 28939: {'lr': 0.00046023040220079383, 'samples': 5556288, 'steps': 28938, 'loss/train': 1.8582457304000854} -08/30/2021 18:20:23 - INFO - __main__ - Step 28940: {'lr': 0.00046022753037182915, 'samples': 5556480, 'steps': 28939, 'loss/train': 1.4308955669403076} -08/30/2021 18:20:24 - INFO - __main__ - Step 28941: {'lr': 0.0004602246584481391, 'samples': 5556672, 'steps': 28940, 'loss/train': 2.558939218521118} -08/30/2021 18:20:24 - INFO - __main__ - Step 28942: {'lr': 0.00046022178642972513, 'samples': 5556864, 'steps': 28941, 'loss/train': 0.9509792327880859} -08/30/2021 18:20:26 - INFO - __main__ - Step 28943: {'lr': 0.00046021891431658845, 'samples': 5557056, 'steps': 28942, 'loss/train': 1.919646143913269} -08/30/2021 18:20:27 - INFO - __main__ - Step 28944: {'lr': 0.00046021604210873035, 'samples': 5557248, 'steps': 28943, 'loss/train': 0.7934926748275757} -08/30/2021 18:20:27 - INFO - __main__ - Step 28945: {'lr': 0.0004602131698061521, 'samples': 5557440, 'steps': 28944, 'loss/train': 1.622161626815796} -08/30/2021 18:20:27 - INFO - __main__ - Step 28946: {'lr': 0.0004602102974088551, 'samples': 5557632, 'steps': 28945, 'loss/train': 0.7455008029937744} -08/30/2021 18:20:28 - INFO - __main__ - Step 28947: {'lr': 0.00046020742491684067, 'samples': 5557824, 'steps': 28946, 'loss/train': 1.1160584688186646} -08/30/2021 18:20:29 - INFO - __main__ - Step 28948: {'lr': 0.0004602045523301099, 'samples': 5558016, 'steps': 28947, 'loss/train': 2.048121213912964} -08/30/2021 18:20:30 - INFO - __main__ - Step 28949: {'lr': 0.0004602016796486642, 'samples': 5558208, 'steps': 28948, 'loss/train': 1.2027957439422607} -08/30/2021 18:20:30 - INFO - __main__ - Step 28950: {'lr': 0.00046019880687250494, 'samples': 5558400, 'steps': 28949, 'loss/train': 1.0947144031524658} -08/30/2021 18:20:30 - INFO - __main__ - Step 28951: {'lr': 0.0004601959340016333, 'samples': 5558592, 'steps': 28950, 'loss/train': 0.3539426922798157} -08/30/2021 18:20:31 - INFO - __main__ - Step 28952: {'lr': 0.0004601930610360506, 'samples': 5558784, 'steps': 28951, 'loss/train': 1.6546393632888794} -08/30/2021 18:20:32 - INFO - __main__ - Step 28953: {'lr': 0.0004601901879757582, 'samples': 5558976, 'steps': 28952, 'loss/train': 1.4125444889068604} -08/30/2021 18:20:33 - INFO - __main__ - Step 28954: {'lr': 0.0004601873148207573, 'samples': 5559168, 'steps': 28953, 'loss/train': 1.53622305393219} -08/30/2021 18:20:33 - INFO - __main__ - Step 28955: {'lr': 0.00046018444157104924, 'samples': 5559360, 'steps': 28954, 'loss/train': 1.8789094686508179} -08/30/2021 18:20:33 - INFO - __main__ - Step 28956: {'lr': 0.0004601815682266353, 'samples': 5559552, 'steps': 28955, 'loss/train': 0.9152023196220398} -08/30/2021 18:20:34 - INFO - __main__ - Step 28957: {'lr': 0.00046017869478751685, 'samples': 5559744, 'steps': 28956, 'loss/train': 1.435634970664978} -08/30/2021 18:20:36 - INFO - __main__ - Step 28958: {'lr': 0.00046017582125369505, 'samples': 5559936, 'steps': 28957, 'loss/train': 2.5206053256988525} -08/30/2021 18:20:36 - INFO - __main__ - Step 28959: {'lr': 0.00046017294762517127, 'samples': 5560128, 'steps': 28958, 'loss/train': 1.719394564628601} -08/30/2021 18:20:36 - INFO - __main__ - Step 28960: {'lr': 0.0004601700739019469, 'samples': 5560320, 'steps': 28959, 'loss/train': 1.458498477935791} -08/30/2021 18:20:37 - INFO - __main__ - Step 28961: {'lr': 0.000460167200084023, 'samples': 5560512, 'steps': 28960, 'loss/train': 0.8339565992355347} -08/30/2021 18:20:37 - INFO - __main__ - Step 28962: {'lr': 0.00046016432617140113, 'samples': 5560704, 'steps': 28961, 'loss/train': 1.3075861930847168} -08/30/2021 18:20:38 - INFO - __main__ - Step 28963: {'lr': 0.0004601614521640824, 'samples': 5560896, 'steps': 28962, 'loss/train': 1.3877896070480347} -08/30/2021 18:20:38 - INFO - __main__ - Step 28964: {'lr': 0.00046015857806206816, 'samples': 5561088, 'steps': 28963, 'loss/train': 0.10883594304323196} -08/30/2021 18:20:40 - INFO - __main__ - Step 28965: {'lr': 0.0004601557038653597, 'samples': 5561280, 'steps': 28964, 'loss/train': 0.3230167329311371} -08/30/2021 18:20:40 - INFO - __main__ - Step 28966: {'lr': 0.0004601528295739583, 'samples': 5561472, 'steps': 28965, 'loss/train': 0.9901770353317261} -08/30/2021 18:20:40 - INFO - __main__ - Step 28967: {'lr': 0.00046014995518786536, 'samples': 5561664, 'steps': 28966, 'loss/train': 2.1910712718963623} -08/30/2021 18:20:41 - INFO - __main__ - Step 28968: {'lr': 0.000460147080707082, 'samples': 5561856, 'steps': 28967, 'loss/train': 1.1445995569229126} -08/30/2021 18:20:41 - INFO - __main__ - Step 28969: {'lr': 0.00046014420613160967, 'samples': 5562048, 'steps': 28968, 'loss/train': 1.4583795070648193} -08/30/2021 18:20:42 - INFO - __main__ - Step 28970: {'lr': 0.00046014133146144966, 'samples': 5562240, 'steps': 28969, 'loss/train': 1.804777979850769} -08/30/2021 18:20:43 - INFO - __main__ - Step 28971: {'lr': 0.0004601384566966031, 'samples': 5562432, 'steps': 28970, 'loss/train': 1.1418389081954956} -08/30/2021 18:20:43 - INFO - __main__ - Step 28972: {'lr': 0.0004601355818370714, 'samples': 5562624, 'steps': 28971, 'loss/train': 1.0044198036193848} -08/30/2021 18:20:44 - INFO - __main__ - Step 28973: {'lr': 0.0004601327068828559, 'samples': 5562816, 'steps': 28972, 'loss/train': 1.4819682836532593} -08/30/2021 18:20:44 - INFO - __main__ - Step 28974: {'lr': 0.0004601298318339578, 'samples': 5563008, 'steps': 28973, 'loss/train': 1.3393051624298096} -08/30/2021 18:20:46 - INFO - __main__ - Step 28975: {'lr': 0.0004601269566903785, 'samples': 5563200, 'steps': 28974, 'loss/train': 0.6184431910514832} -08/30/2021 18:20:46 - INFO - __main__ - Step 28976: {'lr': 0.0004601240814521192, 'samples': 5563392, 'steps': 28975, 'loss/train': 1.1198714971542358} -08/30/2021 18:20:47 - INFO - __main__ - Step 28977: {'lr': 0.00046012120611918126, 'samples': 5563584, 'steps': 28976, 'loss/train': 2.6182427406311035} -08/30/2021 18:20:47 - INFO - __main__ - Step 28978: {'lr': 0.0004601183306915659, 'samples': 5563776, 'steps': 28977, 'loss/train': 0.9519802927970886} -08/30/2021 18:20:47 - INFO - __main__ - Step 28979: {'lr': 0.0004601154551692745, 'samples': 5563968, 'steps': 28978, 'loss/train': 1.9191051721572876} -08/30/2021 18:20:48 - INFO - __main__ - Step 28980: {'lr': 0.00046011257955230826, 'samples': 5564160, 'steps': 28979, 'loss/train': 1.1937226057052612} -08/30/2021 18:20:49 - INFO - __main__ - Step 28981: {'lr': 0.00046010970384066863, 'samples': 5564352, 'steps': 28980, 'loss/train': 0.980539083480835} -08/30/2021 18:20:50 - INFO - __main__ - Step 28982: {'lr': 0.00046010682803435674, 'samples': 5564544, 'steps': 28981, 'loss/train': 1.0843158960342407} -08/30/2021 18:20:50 - INFO - __main__ - Step 28983: {'lr': 0.000460103952133374, 'samples': 5564736, 'steps': 28982, 'loss/train': 1.4898028373718262} -08/30/2021 18:20:50 - INFO - __main__ - Step 28984: {'lr': 0.00046010107613772154, 'samples': 5564928, 'steps': 28983, 'loss/train': 1.7888057231903076} -08/30/2021 18:20:51 - INFO - __main__ - Step 28985: {'lr': 0.0004600982000474009, 'samples': 5565120, 'steps': 28984, 'loss/train': 1.3882951736450195} -08/30/2021 18:20:53 - INFO - __main__ - Step 28986: {'lr': 0.0004600953238624133, 'samples': 5565312, 'steps': 28985, 'loss/train': 1.7313249111175537} -08/30/2021 18:20:53 - INFO - __main__ - Step 28987: {'lr': 0.00046009244758275986, 'samples': 5565504, 'steps': 28986, 'loss/train': 1.7693266868591309} -08/30/2021 18:20:54 - INFO - __main__ - Step 28988: {'lr': 0.0004600895712084421, 'samples': 5565696, 'steps': 28987, 'loss/train': 0.8204891085624695} -08/30/2021 18:20:54 - INFO - __main__ - Step 28989: {'lr': 0.0004600866947394611, 'samples': 5565888, 'steps': 28988, 'loss/train': 1.4293334484100342} -08/30/2021 18:20:54 - INFO - __main__ - Step 28990: {'lr': 0.0004600838181758184, 'samples': 5566080, 'steps': 28989, 'loss/train': 0.9987662434577942} -08/30/2021 18:20:55 - INFO - __main__ - Step 28991: {'lr': 0.00046008094151751513, 'samples': 5566272, 'steps': 28990, 'loss/train': 1.6933869123458862} -08/30/2021 18:20:56 - INFO - __main__ - Step 28992: {'lr': 0.0004600780647645526, 'samples': 5566464, 'steps': 28991, 'loss/train': 0.10519556701183319} -08/30/2021 18:20:57 - INFO - __main__ - Step 28993: {'lr': 0.0004600751879169321, 'samples': 5566656, 'steps': 28992, 'loss/train': 1.2371454238891602} -08/30/2021 18:20:57 - INFO - __main__ - Step 28994: {'lr': 0.00046007231097465505, 'samples': 5566848, 'steps': 28993, 'loss/train': 1.0152714252471924} -08/30/2021 18:20:57 - INFO - __main__ - Step 28995: {'lr': 0.00046006943393772274, 'samples': 5567040, 'steps': 28994, 'loss/train': 1.2526971101760864} -08/30/2021 18:20:58 - INFO - __main__ - Step 28996: {'lr': 0.00046006655680613616, 'samples': 5567232, 'steps': 28995, 'loss/train': 1.8520199060440063} -08/30/2021 18:20:59 - INFO - __main__ - Step 28997: {'lr': 0.00046006367957989705, 'samples': 5567424, 'steps': 28996, 'loss/train': 1.6551318168640137} -08/30/2021 18:21:00 - INFO - __main__ - Step 28998: {'lr': 0.0004600608022590064, 'samples': 5567616, 'steps': 28997, 'loss/train': 1.4023603200912476} -08/30/2021 18:21:00 - INFO - __main__ - Step 28999: {'lr': 0.0004600579248434655, 'samples': 5567808, 'steps': 28998, 'loss/train': 1.3744001388549805} -08/30/2021 18:21:01 - INFO - __main__ - Step 29000: {'lr': 0.0004600550473332759, 'samples': 5568000, 'steps': 28999, 'loss/train': 5.890665531158447} -08/30/2021 18:21:01 - INFO - __main__ - Step 29001: {'lr': 0.0004600521697284386, 'samples': 5568192, 'steps': 29000, 'loss/train': 1.5829437971115112} -08/30/2021 18:21:01 - INFO - __main__ - Step 29002: {'lr': 0.0004600492920289551, 'samples': 5568384, 'steps': 29001, 'loss/train': 1.630038857460022} -08/30/2021 18:21:03 - INFO - __main__ - Step 29003: {'lr': 0.00046004641423482665, 'samples': 5568576, 'steps': 29002, 'loss/train': 1.9166052341461182} -08/30/2021 18:21:04 - INFO - __main__ - Step 29004: {'lr': 0.00046004353634605447, 'samples': 5568768, 'steps': 29003, 'loss/train': 1.3703222274780273} -08/30/2021 18:21:04 - INFO - __main__ - Step 29005: {'lr': 0.00046004065836263995, 'samples': 5568960, 'steps': 29004, 'loss/train': 1.461896300315857} -08/30/2021 18:21:04 - INFO - __main__ - Step 29006: {'lr': 0.00046003778028458434, 'samples': 5569152, 'steps': 29005, 'loss/train': 1.6786259412765503} -08/30/2021 18:21:05 - INFO - __main__ - Step 29007: {'lr': 0.00046003490211188894, 'samples': 5569344, 'steps': 29006, 'loss/train': 1.2999341487884521} -08/30/2021 18:21:06 - INFO - __main__ - Step 29008: {'lr': 0.00046003202384455505, 'samples': 5569536, 'steps': 29007, 'loss/train': 0.8424675464630127} -08/30/2021 18:21:07 - INFO - __main__ - Step 29009: {'lr': 0.000460029145482584, 'samples': 5569728, 'steps': 29008, 'loss/train': 1.7033573389053345} -08/30/2021 18:21:07 - INFO - __main__ - Step 29010: {'lr': 0.00046002626702597706, 'samples': 5569920, 'steps': 29009, 'loss/train': 1.7456250190734863} -08/30/2021 18:21:07 - INFO - __main__ - Step 29011: {'lr': 0.00046002338847473545, 'samples': 5570112, 'steps': 29010, 'loss/train': 1.8192698955535889} -08/30/2021 18:21:08 - INFO - __main__ - Step 29012: {'lr': 0.0004600205098288606, 'samples': 5570304, 'steps': 29011, 'loss/train': 1.402625560760498} -08/30/2021 18:21:09 - INFO - __main__ - Step 29013: {'lr': 0.00046001763108835384, 'samples': 5570496, 'steps': 29012, 'loss/train': 0.7089826464653015} -08/30/2021 18:21:10 - INFO - __main__ - Step 29014: {'lr': 0.0004600147522532162, 'samples': 5570688, 'steps': 29013, 'loss/train': 2.035728931427002} -08/30/2021 18:21:10 - INFO - __main__ - Step 29015: {'lr': 0.0004600118733234493, 'samples': 5570880, 'steps': 29014, 'loss/train': 1.5968133211135864} -08/30/2021 18:21:10 - INFO - __main__ - Step 29016: {'lr': 0.0004600089942990542, 'samples': 5571072, 'steps': 29015, 'loss/train': 1.2618802785873413} -08/30/2021 18:21:11 - INFO - __main__ - Step 29017: {'lr': 0.00046000611518003234, 'samples': 5571264, 'steps': 29016, 'loss/train': 1.3774456977844238} -08/30/2021 18:21:11 - INFO - __main__ - Step 29018: {'lr': 0.00046000323596638495, 'samples': 5571456, 'steps': 29017, 'loss/train': 1.3386033773422241} -08/30/2021 18:21:13 - INFO - __main__ - Step 29019: {'lr': 0.0004600003566581133, 'samples': 5571648, 'steps': 29018, 'loss/train': 1.303830623626709} -08/30/2021 18:21:13 - INFO - __main__ - Step 29020: {'lr': 0.00045999747725521876, 'samples': 5571840, 'steps': 29019, 'loss/train': 1.6431649923324585} -08/30/2021 18:21:14 - INFO - __main__ - Step 29021: {'lr': 0.0004599945977577026, 'samples': 5572032, 'steps': 29020, 'loss/train': 0.18844221532344818} -08/30/2021 18:21:14 - INFO - __main__ - Step 29022: {'lr': 0.0004599917181655661, 'samples': 5572224, 'steps': 29021, 'loss/train': 2.0019733905792236} -08/30/2021 18:21:14 - INFO - __main__ - Step 29023: {'lr': 0.00045998883847881057, 'samples': 5572416, 'steps': 29022, 'loss/train': 1.8991312980651855} -08/30/2021 18:21:16 - INFO - __main__ - Step 29024: {'lr': 0.00045998595869743735, 'samples': 5572608, 'steps': 29023, 'loss/train': 1.6134456396102905} -08/30/2021 18:21:16 - INFO - __main__ - Step 29025: {'lr': 0.0004599830788214477, 'samples': 5572800, 'steps': 29024, 'loss/train': 0.056618429720401764} -08/30/2021 18:21:17 - INFO - __main__ - Step 29026: {'lr': 0.0004599801988508429, 'samples': 5572992, 'steps': 29025, 'loss/train': 1.6746482849121094} -08/30/2021 18:21:17 - INFO - __main__ - Step 29027: {'lr': 0.00045997731878562423, 'samples': 5573184, 'steps': 29026, 'loss/train': 1.0732512474060059} -08/30/2021 18:21:18 - INFO - __main__ - Step 29028: {'lr': 0.000459974438625793, 'samples': 5573376, 'steps': 29027, 'loss/train': 1.6636924743652344} -08/30/2021 18:21:19 - INFO - __main__ - Step 29029: {'lr': 0.0004599715583713506, 'samples': 5573568, 'steps': 29028, 'loss/train': 2.3188862800598145} -08/30/2021 18:21:20 - INFO - __main__ - Step 29030: {'lr': 0.00045996867802229824, 'samples': 5573760, 'steps': 29029, 'loss/train': 1.6132086515426636} -08/30/2021 18:21:20 - INFO - __main__ - Step 29031: {'lr': 0.0004599657975786372, 'samples': 5573952, 'steps': 29030, 'loss/train': 0.8914322257041931} -08/30/2021 18:21:20 - INFO - __main__ - Step 29032: {'lr': 0.00045996291704036884, 'samples': 5574144, 'steps': 29031, 'loss/train': 1.1770182847976685} -08/30/2021 18:21:21 - INFO - __main__ - Step 29033: {'lr': 0.00045996003640749446, 'samples': 5574336, 'steps': 29032, 'loss/train': 1.8061771392822266} -08/30/2021 18:21:21 - INFO - __main__ - Step 29034: {'lr': 0.0004599571556800153, 'samples': 5574528, 'steps': 29033, 'loss/train': 1.0761033296585083} -08/30/2021 18:21:23 - INFO - __main__ - Step 29035: {'lr': 0.00045995427485793263, 'samples': 5574720, 'steps': 29034, 'loss/train': 4.809989929199219} -08/30/2021 18:21:23 - INFO - __main__ - Step 29036: {'lr': 0.00045995139394124784, 'samples': 5574912, 'steps': 29035, 'loss/train': 1.8105863332748413} -08/30/2021 18:21:24 - INFO - __main__ - Step 29037: {'lr': 0.0004599485129299622, 'samples': 5575104, 'steps': 29036, 'loss/train': 1.9833271503448486} -08/30/2021 18:21:24 - INFO - __main__ - Step 29038: {'lr': 0.000459945631824077, 'samples': 5575296, 'steps': 29037, 'loss/train': 2.1372933387756348} -08/30/2021 18:21:24 - INFO - __main__ - Step 29039: {'lr': 0.0004599427506235936, 'samples': 5575488, 'steps': 29038, 'loss/train': 1.6469768285751343} -08/30/2021 18:21:26 - INFO - __main__ - Step 29040: {'lr': 0.0004599398693285132, 'samples': 5575680, 'steps': 29039, 'loss/train': 1.6811004877090454} -08/30/2021 18:21:26 - INFO - __main__ - Step 29041: {'lr': 0.0004599369879388371, 'samples': 5575872, 'steps': 29040, 'loss/train': 2.101963996887207} -08/30/2021 18:21:27 - INFO - __main__ - Step 29042: {'lr': 0.0004599341064545666, 'samples': 5576064, 'steps': 29041, 'loss/train': 1.8116940259933472} -08/30/2021 18:21:27 - INFO - __main__ - Step 29043: {'lr': 0.00045993122487570303, 'samples': 5576256, 'steps': 29042, 'loss/train': 1.2629058361053467} -08/30/2021 18:21:27 - INFO - __main__ - Step 29044: {'lr': 0.00045992834320224773, 'samples': 5576448, 'steps': 29043, 'loss/train': 1.6439467668533325} -08/30/2021 18:21:29 - INFO - __main__ - Step 29045: {'lr': 0.000459925461434202, 'samples': 5576640, 'steps': 29044, 'loss/train': 1.284886121749878} -08/30/2021 18:21:29 - INFO - __main__ - Step 29046: {'lr': 0.00045992257957156704, 'samples': 5576832, 'steps': 29045, 'loss/train': 1.5194182395935059} -08/30/2021 18:21:29 - INFO - __main__ - Step 29047: {'lr': 0.00045991969761434426, 'samples': 5577024, 'steps': 29046, 'loss/train': 0.9067851305007935} -08/30/2021 18:21:30 - INFO - __main__ - Step 29048: {'lr': 0.0004599168155625348, 'samples': 5577216, 'steps': 29047, 'loss/train': 1.4850435256958008} -08/30/2021 18:21:30 - INFO - __main__ - Step 29049: {'lr': 0.00045991393341614017, 'samples': 5577408, 'steps': 29048, 'loss/train': 1.5920634269714355} -08/30/2021 18:21:32 - INFO - __main__ - Step 29050: {'lr': 0.0004599110511751615, 'samples': 5577600, 'steps': 29049, 'loss/train': 2.0021350383758545} -08/30/2021 18:21:32 - INFO - __main__ - Step 29051: {'lr': 0.0004599081688396002, 'samples': 5577792, 'steps': 29050, 'loss/train': 1.9680159091949463} -08/30/2021 18:21:32 - INFO - __main__ - Step 29052: {'lr': 0.0004599052864094575, 'samples': 5577984, 'steps': 29051, 'loss/train': 1.4609522819519043} -08/30/2021 18:21:33 - INFO - __main__ - Step 29053: {'lr': 0.0004599024038847347, 'samples': 5578176, 'steps': 29052, 'loss/train': 1.6223266124725342} -08/30/2021 18:21:33 - INFO - __main__ - Step 29054: {'lr': 0.0004598995212654331, 'samples': 5578368, 'steps': 29053, 'loss/train': 1.5891494750976562} -08/30/2021 18:21:35 - INFO - __main__ - Step 29055: {'lr': 0.0004598966385515541, 'samples': 5578560, 'steps': 29054, 'loss/train': 1.203086018562317} -08/30/2021 18:21:36 - INFO - __main__ - Step 29056: {'lr': 0.00045989375574309875, 'samples': 5578752, 'steps': 29055, 'loss/train': 1.7755188941955566} -08/30/2021 18:21:36 - INFO - __main__ - Step 29057: {'lr': 0.00045989087284006863, 'samples': 5578944, 'steps': 29056, 'loss/train': 1.4583615064620972} -08/30/2021 18:21:36 - INFO - __main__ - Step 29058: {'lr': 0.00045988798984246496, 'samples': 5579136, 'steps': 29057, 'loss/train': 1.4929167032241821} -08/30/2021 18:21:37 - INFO - __main__ - Step 29059: {'lr': 0.0004598851067502889, 'samples': 5579328, 'steps': 29058, 'loss/train': 0.9355854392051697} -08/30/2021 18:21:37 - INFO - __main__ - Step 29060: {'lr': 0.00045988222356354186, 'samples': 5579520, 'steps': 29059, 'loss/train': 1.2193325757980347} -08/30/2021 18:21:39 - INFO - __main__ - Step 29061: {'lr': 0.00045987934028222515, 'samples': 5579712, 'steps': 29060, 'loss/train': 1.1979621648788452} -08/30/2021 18:21:39 - INFO - __main__ - Step 29062: {'lr': 0.00045987645690634003, 'samples': 5579904, 'steps': 29061, 'loss/train': 0.2693827152252197} -08/30/2021 18:21:39 - INFO - __main__ - Step 29063: {'lr': 0.0004598735734358879, 'samples': 5580096, 'steps': 29062, 'loss/train': 1.5783582925796509} -08/30/2021 18:21:40 - INFO - __main__ - Step 29064: {'lr': 0.0004598706898708699, 'samples': 5580288, 'steps': 29063, 'loss/train': 0.9061970710754395} -08/30/2021 18:21:40 - INFO - __main__ - Step 29065: {'lr': 0.00045986780621128743, 'samples': 5580480, 'steps': 29064, 'loss/train': 1.7659823894500732} -08/30/2021 18:21:42 - INFO - __main__ - Step 29066: {'lr': 0.00045986492245714175, 'samples': 5580672, 'steps': 29065, 'loss/train': 1.4529715776443481} -08/30/2021 18:21:42 - INFO - __main__ - Step 29067: {'lr': 0.0004598620386084342, 'samples': 5580864, 'steps': 29066, 'loss/train': 1.672145962715149} -08/30/2021 18:21:42 - INFO - __main__ - Step 29068: {'lr': 0.00045985915466516605, 'samples': 5581056, 'steps': 29067, 'loss/train': 1.891939640045166} -08/30/2021 18:21:43 - INFO - __main__ - Step 29069: {'lr': 0.0004598562706273386, 'samples': 5581248, 'steps': 29068, 'loss/train': 1.370741367340088} -08/30/2021 18:21:43 - INFO - __main__ - Step 29070: {'lr': 0.0004598533864949531, 'samples': 5581440, 'steps': 29069, 'loss/train': 1.5381206274032593} -08/30/2021 18:21:45 - INFO - __main__ - Step 29071: {'lr': 0.00045985050226801097, 'samples': 5581632, 'steps': 29070, 'loss/train': 1.79341459274292} -08/30/2021 18:21:45 - INFO - __main__ - Step 29072: {'lr': 0.0004598476179465134, 'samples': 5581824, 'steps': 29071, 'loss/train': 1.566278338432312} -08/30/2021 18:21:46 - INFO - __main__ - Step 29073: {'lr': 0.00045984473353046174, 'samples': 5582016, 'steps': 29072, 'loss/train': 2.284355401992798} -08/30/2021 18:21:46 - INFO - __main__ - Step 29074: {'lr': 0.00045984184901985735, 'samples': 5582208, 'steps': 29073, 'loss/train': 0.9142330288887024} -08/30/2021 18:21:46 - INFO - __main__ - Step 29075: {'lr': 0.00045983896441470143, 'samples': 5582400, 'steps': 29074, 'loss/train': 0.06127826124429703} -08/30/2021 18:21:48 - INFO - __main__ - Step 29076: {'lr': 0.00045983607971499527, 'samples': 5582592, 'steps': 29075, 'loss/train': 1.9395575523376465} -08/30/2021 18:21:48 - INFO - __main__ - Step 29077: {'lr': 0.0004598331949207402, 'samples': 5582784, 'steps': 29076, 'loss/train': 0.9161554574966431} -08/30/2021 18:21:49 - INFO - __main__ - Step 29078: {'lr': 0.00045983031003193756, 'samples': 5582976, 'steps': 29077, 'loss/train': 1.269913911819458} -08/30/2021 18:21:49 - INFO - __main__ - Step 29079: {'lr': 0.0004598274250485886, 'samples': 5583168, 'steps': 29078, 'loss/train': 1.933900237083435} -08/30/2021 18:21:49 - INFO - __main__ - Step 29080: {'lr': 0.00045982453997069463, 'samples': 5583360, 'steps': 29079, 'loss/train': 1.6913996934890747} -08/30/2021 18:21:50 - INFO - __main__ - Step 29081: {'lr': 0.00045982165479825697, 'samples': 5583552, 'steps': 29080, 'loss/train': 0.9966526627540588} -08/30/2021 18:21:51 - INFO - __main__ - Step 29082: {'lr': 0.000459818769531277, 'samples': 5583744, 'steps': 29081, 'loss/train': 1.1565251350402832} -08/30/2021 18:21:52 - INFO - __main__ - Step 29083: {'lr': 0.00045981588416975583, 'samples': 5583936, 'steps': 29082, 'loss/train': 1.4232019186019897} -08/30/2021 18:21:52 - INFO - __main__ - Step 29084: {'lr': 0.00045981299871369484, 'samples': 5584128, 'steps': 29083, 'loss/train': 1.2171101570129395} -08/30/2021 18:21:53 - INFO - __main__ - Step 29085: {'lr': 0.0004598101131630954, 'samples': 5584320, 'steps': 29084, 'loss/train': 0.9350250363349915} -08/30/2021 18:21:53 - INFO - __main__ - Step 29086: {'lr': 0.0004598072275179588, 'samples': 5584512, 'steps': 29085, 'loss/train': 1.704522728919983} -08/30/2021 18:21:54 - INFO - __main__ - Step 29087: {'lr': 0.00045980434177828625, 'samples': 5584704, 'steps': 29086, 'loss/train': 0.9867247343063354} -08/30/2021 18:21:55 - INFO - __main__ - Step 29088: {'lr': 0.00045980145594407907, 'samples': 5584896, 'steps': 29087, 'loss/train': 1.415088176727295} -08/30/2021 18:21:55 - INFO - __main__ - Step 29089: {'lr': 0.00045979857001533867, 'samples': 5585088, 'steps': 29088, 'loss/train': 0.9071172475814819} -08/30/2021 18:21:56 - INFO - __main__ - Step 29090: {'lr': 0.0004597956839920662, 'samples': 5585280, 'steps': 29089, 'loss/train': 2.0894312858581543} -08/30/2021 18:21:56 - INFO - __main__ - Step 29091: {'lr': 0.00045979279787426307, 'samples': 5585472, 'steps': 29090, 'loss/train': 1.352568507194519} -08/30/2021 18:21:57 - INFO - __main__ - Step 29092: {'lr': 0.00045978991166193057, 'samples': 5585664, 'steps': 29091, 'loss/train': 0.5328934192657471} -08/30/2021 18:21:58 - INFO - __main__ - Step 29093: {'lr': 0.0004597870253550699, 'samples': 5585856, 'steps': 29092, 'loss/train': 1.7023544311523438} -08/30/2021 18:21:58 - INFO - __main__ - Step 29094: {'lr': 0.0004597841389536825, 'samples': 5586048, 'steps': 29093, 'loss/train': 1.6095505952835083} -08/30/2021 18:21:58 - INFO - __main__ - Step 29095: {'lr': 0.00045978125245776957, 'samples': 5586240, 'steps': 29094, 'loss/train': 1.1898564100265503} -08/30/2021 18:21:59 - INFO - __main__ - Step 29096: {'lr': 0.00045977836586733246, 'samples': 5586432, 'steps': 29095, 'loss/train': 1.627050518989563} -08/30/2021 18:22:00 - INFO - __main__ - Step 29097: {'lr': 0.00045977547918237243, 'samples': 5586624, 'steps': 29096, 'loss/train': 1.6160439252853394} -08/30/2021 18:22:01 - INFO - __main__ - Step 29098: {'lr': 0.0004597725924028908, 'samples': 5586816, 'steps': 29097, 'loss/train': 2.4444825649261475} -08/30/2021 18:22:01 - INFO - __main__ - Step 29099: {'lr': 0.00045976970552888896, 'samples': 5587008, 'steps': 29098, 'loss/train': 1.269550085067749} -08/30/2021 18:22:01 - INFO - __main__ - Step 29100: {'lr': 0.00045976681856036805, 'samples': 5587200, 'steps': 29099, 'loss/train': 1.4420042037963867} -08/30/2021 18:22:02 - INFO - __main__ - Step 29101: {'lr': 0.00045976393149732943, 'samples': 5587392, 'steps': 29100, 'loss/train': 1.3307113647460938} -08/30/2021 18:22:04 - INFO - __main__ - Step 29102: {'lr': 0.0004597610443397745, 'samples': 5587584, 'steps': 29101, 'loss/train': 1.515670657157898} -08/30/2021 18:22:04 - INFO - __main__ - Step 29103: {'lr': 0.0004597581570877044, 'samples': 5587776, 'steps': 29102, 'loss/train': 1.5040066242218018} -08/30/2021 18:22:05 - INFO - __main__ - Step 29104: {'lr': 0.00045975526974112056, 'samples': 5587968, 'steps': 29103, 'loss/train': 1.9000853300094604} -08/30/2021 18:22:05 - INFO - __main__ - Step 29105: {'lr': 0.0004597523823000243, 'samples': 5588160, 'steps': 29104, 'loss/train': 1.9205955266952515} -08/30/2021 18:22:05 - INFO - __main__ - Step 29106: {'lr': 0.0004597494947644167, 'samples': 5588352, 'steps': 29105, 'loss/train': 0.8787484169006348} -08/30/2021 18:22:06 - INFO - __main__ - Step 29107: {'lr': 0.0004597466071342993, 'samples': 5588544, 'steps': 29106, 'loss/train': 0.05248590558767319} -08/30/2021 18:22:08 - INFO - __main__ - Step 29108: {'lr': 0.0004597437194096733, 'samples': 5588736, 'steps': 29107, 'loss/train': 1.3961764574050903} -08/30/2021 18:22:08 - INFO - __main__ - Step 29109: {'lr': 0.00045974083159054, 'samples': 5588928, 'steps': 29108, 'loss/train': 1.5835131406784058} -08/30/2021 18:22:09 - INFO - __main__ - Step 29110: {'lr': 0.0004597379436769008, 'samples': 5589120, 'steps': 29109, 'loss/train': 1.570286750793457} -08/30/2021 18:22:09 - INFO - __main__ - Step 29111: {'lr': 0.00045973505566875684, 'samples': 5589312, 'steps': 29110, 'loss/train': 1.2224258184432983} -08/30/2021 18:22:09 - INFO - __main__ - Step 29112: {'lr': 0.00045973216756610945, 'samples': 5589504, 'steps': 29111, 'loss/train': 2.063640832901001} -08/30/2021 18:22:11 - INFO - __main__ - Step 29113: {'lr': 0.00045972927936896007, 'samples': 5589696, 'steps': 29112, 'loss/train': 1.0846408605575562} -08/30/2021 18:22:11 - INFO - __main__ - Step 29114: {'lr': 0.0004597263910773099, 'samples': 5589888, 'steps': 29113, 'loss/train': 1.6578137874603271} -08/30/2021 18:22:12 - INFO - __main__ - Step 29115: {'lr': 0.0004597235026911603, 'samples': 5590080, 'steps': 29114, 'loss/train': 1.6081702709197998} -08/30/2021 18:22:12 - INFO - __main__ - Step 29116: {'lr': 0.0004597206142105124, 'samples': 5590272, 'steps': 29115, 'loss/train': 1.46647310256958} -08/30/2021 18:22:12 - INFO - __main__ - Step 29117: {'lr': 0.0004597177256353677, 'samples': 5590464, 'steps': 29116, 'loss/train': 1.7984187602996826} -08/30/2021 18:22:14 - INFO - __main__ - Step 29118: {'lr': 0.0004597148369657275, 'samples': 5590656, 'steps': 29117, 'loss/train': 2.0254669189453125} -08/30/2021 18:22:14 - INFO - __main__ - Step 29119: {'lr': 0.0004597119482015929, 'samples': 5590848, 'steps': 29118, 'loss/train': 1.6421504020690918} -08/30/2021 18:22:15 - INFO - __main__ - Step 29120: {'lr': 0.00045970905934296537, 'samples': 5591040, 'steps': 29119, 'loss/train': 1.6421531438827515} -08/30/2021 18:22:15 - INFO - __main__ - Step 29121: {'lr': 0.0004597061703898462, 'samples': 5591232, 'steps': 29120, 'loss/train': 1.3585336208343506} -08/30/2021 18:22:15 - INFO - __main__ - Step 29122: {'lr': 0.0004597032813422367, 'samples': 5591424, 'steps': 29121, 'loss/train': 1.2464593648910522} -08/30/2021 18:22:17 - INFO - __main__ - Step 29123: {'lr': 0.00045970039220013804, 'samples': 5591616, 'steps': 29122, 'loss/train': 1.6743971109390259} -08/30/2021 18:22:17 - INFO - __main__ - Step 29124: {'lr': 0.00045969750296355173, 'samples': 5591808, 'steps': 29123, 'loss/train': 1.6649267673492432} -08/30/2021 18:22:18 - INFO - __main__ - Step 29125: {'lr': 0.0004596946136324789, 'samples': 5592000, 'steps': 29124, 'loss/train': 1.6004528999328613} -08/30/2021 18:22:18 - INFO - __main__ - Step 29126: {'lr': 0.0004596917242069209, 'samples': 5592192, 'steps': 29125, 'loss/train': 2.043062686920166} -08/30/2021 18:22:18 - INFO - __main__ - Step 29127: {'lr': 0.00045968883468687906, 'samples': 5592384, 'steps': 29126, 'loss/train': 1.749453067779541} -08/30/2021 18:22:19 - INFO - __main__ - Step 29128: {'lr': 0.00045968594507235467, 'samples': 5592576, 'steps': 29127, 'loss/train': 1.4296698570251465} -08/30/2021 18:22:20 - INFO - __main__ - Step 29129: {'lr': 0.00045968305536334906, 'samples': 5592768, 'steps': 29128, 'loss/train': 1.8172740936279297} -08/30/2021 18:22:21 - INFO - __main__ - Step 29130: {'lr': 0.00045968016555986347, 'samples': 5592960, 'steps': 29129, 'loss/train': 1.2048875093460083} -08/30/2021 18:22:21 - INFO - __main__ - Step 29131: {'lr': 0.0004596772756618992, 'samples': 5593152, 'steps': 29130, 'loss/train': 0.16799619793891907} -08/30/2021 18:22:21 - INFO - __main__ - Step 29132: {'lr': 0.0004596743856694576, 'samples': 5593344, 'steps': 29131, 'loss/train': 1.5724396705627441} -08/30/2021 18:22:22 - INFO - __main__ - Step 29133: {'lr': 0.00045967149558254, 'samples': 5593536, 'steps': 29132, 'loss/train': 1.320733666419983} -08/30/2021 18:22:23 - INFO - __main__ - Step 29134: {'lr': 0.0004596686054011476, 'samples': 5593728, 'steps': 29133, 'loss/train': 1.5041048526763916} -08/30/2021 18:22:24 - INFO - __main__ - Step 29135: {'lr': 0.0004596657151252819, 'samples': 5593920, 'steps': 29134, 'loss/train': 1.3871675729751587} -08/30/2021 18:22:24 - INFO - __main__ - Step 29136: {'lr': 0.0004596628247549439, 'samples': 5594112, 'steps': 29135, 'loss/train': 1.1521623134613037} -08/30/2021 18:22:24 - INFO - __main__ - Step 29137: {'lr': 0.00045965993429013507, 'samples': 5594304, 'steps': 29136, 'loss/train': 1.2652631998062134} -08/30/2021 18:22:25 - INFO - __main__ - Step 29138: {'lr': 0.0004596570437308568, 'samples': 5594496, 'steps': 29137, 'loss/train': 1.6733323335647583} -08/30/2021 18:22:26 - INFO - __main__ - Step 29139: {'lr': 0.0004596541530771103, 'samples': 5594688, 'steps': 29138, 'loss/train': 1.4596182107925415} -08/30/2021 18:22:27 - INFO - __main__ - Step 29140: {'lr': 0.0004596512623288969, 'samples': 5594880, 'steps': 29139, 'loss/train': 1.0607844591140747} -08/30/2021 18:22:27 - INFO - __main__ - Step 29141: {'lr': 0.00045964837148621776, 'samples': 5595072, 'steps': 29140, 'loss/train': 1.5667705535888672} -08/30/2021 18:22:27 - INFO - __main__ - Step 29142: {'lr': 0.00045964548054907434, 'samples': 5595264, 'steps': 29141, 'loss/train': 1.7079411745071411} -08/30/2021 18:22:28 - INFO - __main__ - Step 29143: {'lr': 0.00045964258951746795, 'samples': 5595456, 'steps': 29142, 'loss/train': 1.4324219226837158} -08/30/2021 18:22:29 - INFO - __main__ - Step 29144: {'lr': 0.0004596396983913998, 'samples': 5595648, 'steps': 29143, 'loss/train': 1.4762330055236816} -08/30/2021 18:22:30 - INFO - __main__ - Step 29145: {'lr': 0.00045963680717087124, 'samples': 5595840, 'steps': 29144, 'loss/train': 0.9415585994720459} -08/30/2021 18:22:30 - INFO - __main__ - Step 29146: {'lr': 0.0004596339158558835, 'samples': 5596032, 'steps': 29145, 'loss/train': 1.843888759613037} -08/30/2021 18:22:30 - INFO - __main__ - Step 29147: {'lr': 0.0004596310244464381, 'samples': 5596224, 'steps': 29146, 'loss/train': 1.2072358131408691} -08/30/2021 18:22:31 - INFO - __main__ - Step 29148: {'lr': 0.0004596281329425361, 'samples': 5596416, 'steps': 29147, 'loss/train': 1.0851892232894897} -08/30/2021 18:22:32 - INFO - __main__ - Step 29149: {'lr': 0.0004596252413441789, 'samples': 5596608, 'steps': 29148, 'loss/train': 1.4955570697784424} -08/30/2021 18:22:33 - INFO - __main__ - Step 29150: {'lr': 0.00045962234965136783, 'samples': 5596800, 'steps': 29149, 'loss/train': 2.4021732807159424} -08/30/2021 18:22:33 - INFO - __main__ - Step 29151: {'lr': 0.0004596194578641042, 'samples': 5596992, 'steps': 29150, 'loss/train': 1.2575191259384155} -08/30/2021 18:22:33 - INFO - __main__ - Step 29152: {'lr': 0.00045961656598238925, 'samples': 5597184, 'steps': 29151, 'loss/train': 1.2860348224639893} -08/30/2021 18:22:34 - INFO - __main__ - Step 29153: {'lr': 0.00045961367400622436, 'samples': 5597376, 'steps': 29152, 'loss/train': 1.8073841333389282} -08/30/2021 18:22:35 - INFO - __main__ - Step 29154: {'lr': 0.00045961078193561066, 'samples': 5597568, 'steps': 29153, 'loss/train': 1.476631760597229} -08/30/2021 18:22:36 - INFO - __main__ - Step 29155: {'lr': 0.00045960788977054967, 'samples': 5597760, 'steps': 29154, 'loss/train': 1.0465525388717651} -08/30/2021 18:22:36 - INFO - __main__ - Step 29156: {'lr': 0.0004596049975110426, 'samples': 5597952, 'steps': 29155, 'loss/train': 1.152707576751709} -08/30/2021 18:22:36 - INFO - __main__ - Step 29157: {'lr': 0.00045960210515709064, 'samples': 5598144, 'steps': 29156, 'loss/train': 0.7667427062988281} -08/30/2021 18:22:37 - INFO - __main__ - Step 29158: {'lr': 0.0004595992127086953, 'samples': 5598336, 'steps': 29157, 'loss/train': 1.2475523948669434} -08/30/2021 18:22:37 - INFO - __main__ - Step 29159: {'lr': 0.00045959632016585774, 'samples': 5598528, 'steps': 29158, 'loss/train': 1.6949416399002075} -08/30/2021 18:22:39 - INFO - __main__ - Step 29160: {'lr': 0.0004595934275285794, 'samples': 5598720, 'steps': 29159, 'loss/train': 1.3139251470565796} -08/30/2021 18:22:39 - INFO - __main__ - Step 29161: {'lr': 0.00045959053479686143, 'samples': 5598912, 'steps': 29160, 'loss/train': 1.4462741613388062} -08/30/2021 18:22:40 - INFO - __main__ - Step 29162: {'lr': 0.0004595876419707052, 'samples': 5599104, 'steps': 29161, 'loss/train': 1.3975965976715088} -08/30/2021 18:22:40 - INFO - __main__ - Step 29163: {'lr': 0.00045958474905011205, 'samples': 5599296, 'steps': 29162, 'loss/train': 1.3741061687469482} -08/30/2021 18:22:40 - INFO - __main__ - Step 29164: {'lr': 0.0004595818560350832, 'samples': 5599488, 'steps': 29163, 'loss/train': 1.5134464502334595} -08/30/2021 18:22:42 - INFO - __main__ - Step 29165: {'lr': 0.00045957896292562003, 'samples': 5599680, 'steps': 29164, 'loss/train': 0.25229430198669434} -08/30/2021 18:22:43 - INFO - __main__ - Step 29166: {'lr': 0.0004595760697217238, 'samples': 5599872, 'steps': 29165, 'loss/train': 0.8913015723228455} -08/30/2021 18:22:43 - INFO - __main__ - Step 29167: {'lr': 0.0004595731764233958, 'samples': 5600064, 'steps': 29166, 'loss/train': 1.661893367767334} -08/30/2021 18:22:43 - INFO - __main__ - Step 29168: {'lr': 0.0004595702830306374, 'samples': 5600256, 'steps': 29167, 'loss/train': 1.9168347120285034} -08/30/2021 18:22:44 - INFO - __main__ - Step 29169: {'lr': 0.0004595673895434498, 'samples': 5600448, 'steps': 29168, 'loss/train': 0.8361132144927979} -08/30/2021 18:22:45 - INFO - __main__ - Step 29170: {'lr': 0.00045956449596183446, 'samples': 5600640, 'steps': 29169, 'loss/train': 1.3470408916473389} -08/30/2021 18:22:46 - INFO - __main__ - Step 29171: {'lr': 0.00045956160228579257, 'samples': 5600832, 'steps': 29170, 'loss/train': 1.165398120880127} -08/30/2021 18:22:46 - INFO - __main__ - Step 29172: {'lr': 0.00045955870851532545, 'samples': 5601024, 'steps': 29171, 'loss/train': 1.80191171169281} -08/30/2021 18:22:46 - INFO - __main__ - Step 29173: {'lr': 0.0004595558146504344, 'samples': 5601216, 'steps': 29172, 'loss/train': 2.0715763568878174} -08/30/2021 18:22:47 - INFO - __main__ - Step 29174: {'lr': 0.0004595529206911207, 'samples': 5601408, 'steps': 29173, 'loss/train': 1.1101596355438232} -08/30/2021 18:22:48 - INFO - __main__ - Step 29175: {'lr': 0.00045955002663738574, 'samples': 5601600, 'steps': 29174, 'loss/train': 0.09882716089487076} -08/30/2021 18:22:49 - INFO - __main__ - Step 29176: {'lr': 0.0004595471324892307, 'samples': 5601792, 'steps': 29175, 'loss/train': 1.6886543035507202} -08/30/2021 18:22:49 - INFO - __main__ - Step 29177: {'lr': 0.00045954423824665704, 'samples': 5601984, 'steps': 29176, 'loss/train': 1.2996711730957031} -08/30/2021 18:22:49 - INFO - __main__ - Step 29178: {'lr': 0.00045954134390966593, 'samples': 5602176, 'steps': 29177, 'loss/train': 1.4013592004776} -08/30/2021 18:22:50 - INFO - __main__ - Step 29179: {'lr': 0.00045953844947825876, 'samples': 5602368, 'steps': 29178, 'loss/train': 1.9827604293823242} -08/30/2021 18:22:52 - INFO - __main__ - Step 29180: {'lr': 0.0004595355549524368, 'samples': 5602560, 'steps': 29179, 'loss/train': 1.980088233947754} -08/30/2021 18:22:52 - INFO - __main__ - Step 29181: {'lr': 0.0004595326603322013, 'samples': 5602752, 'steps': 29180, 'loss/train': 1.4789692163467407} -08/30/2021 18:22:52 - INFO - __main__ - Step 29182: {'lr': 0.00045952976561755365, 'samples': 5602944, 'steps': 29181, 'loss/train': 1.647566556930542} -08/30/2021 18:22:53 - INFO - __main__ - Step 29183: {'lr': 0.00045952687080849517, 'samples': 5603136, 'steps': 29182, 'loss/train': 0.47545647621154785} -08/30/2021 18:22:53 - INFO - __main__ - Step 29184: {'lr': 0.000459523975905027, 'samples': 5603328, 'steps': 29183, 'loss/train': 1.475440502166748} -08/30/2021 18:22:53 - INFO - __main__ - Step 29185: {'lr': 0.0004595210809071506, 'samples': 5603520, 'steps': 29184, 'loss/train': 0.9235596656799316} -08/30/2021 18:22:55 - INFO - __main__ - Step 29186: {'lr': 0.0004595181858148673, 'samples': 5603712, 'steps': 29185, 'loss/train': 1.172926664352417} -08/30/2021 18:22:55 - INFO - __main__ - Step 29187: {'lr': 0.00045951529062817834, 'samples': 5603904, 'steps': 29186, 'loss/train': 2.1116085052490234} -08/30/2021 18:22:56 - INFO - __main__ - Step 29188: {'lr': 0.00045951239534708496, 'samples': 5604096, 'steps': 29187, 'loss/train': 0.9593750238418579} -08/30/2021 18:22:56 - INFO - __main__ - Step 29189: {'lr': 0.0004595094999715885, 'samples': 5604288, 'steps': 29188, 'loss/train': 1.3687018156051636} -08/30/2021 18:22:56 - INFO - __main__ - Step 29190: {'lr': 0.00045950660450169034, 'samples': 5604480, 'steps': 29189, 'loss/train': 1.3395719528198242} -08/30/2021 18:22:58 - INFO - __main__ - Step 29191: {'lr': 0.0004595037089373918, 'samples': 5604672, 'steps': 29190, 'loss/train': 1.7803689241409302} -08/30/2021 18:22:59 - INFO - __main__ - Step 29192: {'lr': 0.000459500813278694, 'samples': 5604864, 'steps': 29191, 'loss/train': 1.9081834554672241} -08/30/2021 18:22:59 - INFO - __main__ - Step 29193: {'lr': 0.0004594979175255984, 'samples': 5605056, 'steps': 29192, 'loss/train': 1.6339938640594482} -08/30/2021 18:22:59 - INFO - __main__ - Step 29194: {'lr': 0.0004594950216781063, 'samples': 5605248, 'steps': 29193, 'loss/train': 1.5923702716827393} -08/30/2021 18:23:00 - INFO - __main__ - Step 29195: {'lr': 0.000459492125736219, 'samples': 5605440, 'steps': 29194, 'loss/train': 1.3523986339569092} -08/30/2021 18:23:00 - INFO - __main__ - Step 29196: {'lr': 0.00045948922969993777, 'samples': 5605632, 'steps': 29195, 'loss/train': 1.2019221782684326} -08/30/2021 18:23:02 - INFO - __main__ - Step 29197: {'lr': 0.0004594863335692639, 'samples': 5605824, 'steps': 29196, 'loss/train': 1.6492379903793335} -08/30/2021 18:23:02 - INFO - __main__ - Step 29198: {'lr': 0.00045948343734419873, 'samples': 5606016, 'steps': 29197, 'loss/train': 1.7129063606262207} -08/30/2021 18:23:03 - INFO - __main__ - Step 29199: {'lr': 0.00045948054102474357, 'samples': 5606208, 'steps': 29198, 'loss/train': 1.426788091659546} -08/30/2021 18:23:03 - INFO - __main__ - Step 29200: {'lr': 0.00045947764461089967, 'samples': 5606400, 'steps': 29199, 'loss/train': 0.5952116847038269} -08/30/2021 18:23:03 - INFO - __main__ - Step 29201: {'lr': 0.00045947474810266844, 'samples': 5606592, 'steps': 29200, 'loss/train': 1.5822315216064453} -08/30/2021 18:23:05 - INFO - __main__ - Step 29202: {'lr': 0.00045947185150005106, 'samples': 5606784, 'steps': 29201, 'loss/train': 2.031177520751953} -08/30/2021 18:23:05 - INFO - __main__ - Step 29203: {'lr': 0.0004594689548030489, 'samples': 5606976, 'steps': 29202, 'loss/train': 1.9758672714233398} -08/30/2021 18:23:06 - INFO - __main__ - Step 29204: {'lr': 0.0004594660580116633, 'samples': 5607168, 'steps': 29203, 'loss/train': 1.39204740524292} -08/30/2021 18:23:06 - INFO - __main__ - Step 29205: {'lr': 0.00045946316112589546, 'samples': 5607360, 'steps': 29204, 'loss/train': 1.5581611394882202} -08/30/2021 18:23:06 - INFO - __main__ - Step 29206: {'lr': 0.0004594602641457468, 'samples': 5607552, 'steps': 29205, 'loss/train': 1.5157995223999023} -08/30/2021 18:23:08 - INFO - __main__ - Step 29207: {'lr': 0.0004594573670712186, 'samples': 5607744, 'steps': 29206, 'loss/train': 1.6905176639556885} -08/30/2021 18:23:08 - INFO - __main__ - Step 29208: {'lr': 0.0004594544699023121, 'samples': 5607936, 'steps': 29207, 'loss/train': 1.2826634645462036} -08/30/2021 18:23:09 - INFO - __main__ - Step 29209: {'lr': 0.0004594515726390287, 'samples': 5608128, 'steps': 29208, 'loss/train': 0.9444410800933838} -08/30/2021 18:23:09 - INFO - __main__ - Step 29210: {'lr': 0.00045944867528136956, 'samples': 5608320, 'steps': 29209, 'loss/train': 1.087119460105896} -08/30/2021 18:23:09 - INFO - __main__ - Step 29211: {'lr': 0.00045944577782933615, 'samples': 5608512, 'steps': 29210, 'loss/train': 1.0510333776474} -08/30/2021 18:23:10 - INFO - __main__ - Step 29212: {'lr': 0.0004594428802829297, 'samples': 5608704, 'steps': 29211, 'loss/train': 1.255640983581543} -08/30/2021 18:23:11 - INFO - __main__ - Step 29213: {'lr': 0.00045943998264215153, 'samples': 5608896, 'steps': 29212, 'loss/train': 1.7238624095916748} -08/30/2021 18:23:12 - INFO - __main__ - Step 29214: {'lr': 0.0004594370849070029, 'samples': 5609088, 'steps': 29213, 'loss/train': 1.659794569015503} -08/30/2021 18:23:12 - INFO - __main__ - Step 29215: {'lr': 0.00045943418707748517, 'samples': 5609280, 'steps': 29214, 'loss/train': 1.7247980833053589} -08/30/2021 18:23:12 - INFO - __main__ - Step 29216: {'lr': 0.00045943128915359966, 'samples': 5609472, 'steps': 29215, 'loss/train': 1.1598666906356812} -08/30/2021 18:23:13 - INFO - __main__ - Step 29217: {'lr': 0.0004594283911353476, 'samples': 5609664, 'steps': 29216, 'loss/train': 1.5883209705352783} -08/30/2021 18:23:15 - INFO - __main__ - Step 29218: {'lr': 0.0004594254930227303, 'samples': 5609856, 'steps': 29217, 'loss/train': 1.5780142545700073} -08/30/2021 18:23:15 - INFO - __main__ - Step 29219: {'lr': 0.0004594225948157492, 'samples': 5610048, 'steps': 29218, 'loss/train': 1.6981172561645508} -08/30/2021 18:23:16 - INFO - __main__ - Step 29220: {'lr': 0.0004594196965144054, 'samples': 5610240, 'steps': 29219, 'loss/train': 1.4002854824066162} -08/30/2021 18:23:16 - INFO - __main__ - Step 29221: {'lr': 0.0004594167981187004, 'samples': 5610432, 'steps': 29220, 'loss/train': 1.4901771545410156} -08/30/2021 18:23:16 - INFO - __main__ - Step 29222: {'lr': 0.00045941389962863546, 'samples': 5610624, 'steps': 29221, 'loss/train': 1.5295490026474} -08/30/2021 18:23:18 - INFO - __main__ - Step 29223: {'lr': 0.00045941100104421176, 'samples': 5610816, 'steps': 29222, 'loss/train': 1.678505539894104} -08/30/2021 18:23:18 - INFO - __main__ - Step 29224: {'lr': 0.0004594081023654307, 'samples': 5611008, 'steps': 29223, 'loss/train': 1.438895344734192} -08/30/2021 18:23:19 - INFO - __main__ - Step 29225: {'lr': 0.00045940520359229366, 'samples': 5611200, 'steps': 29224, 'loss/train': 1.273938536643982} -08/30/2021 18:23:19 - INFO - __main__ - Step 29226: {'lr': 0.0004594023047248018, 'samples': 5611392, 'steps': 29225, 'loss/train': 1.7192295789718628} -08/30/2021 18:23:19 - INFO - __main__ - Step 29227: {'lr': 0.0004593994057629565, 'samples': 5611584, 'steps': 29226, 'loss/train': 1.2510654926300049} -08/30/2021 18:23:21 - INFO - __main__ - Step 29228: {'lr': 0.000459396506706759, 'samples': 5611776, 'steps': 29227, 'loss/train': 0.9602096676826477} -08/30/2021 18:23:21 - INFO - __main__ - Step 29229: {'lr': 0.00045939360755621074, 'samples': 5611968, 'steps': 29228, 'loss/train': 1.667063593864441} -08/30/2021 18:23:22 - INFO - __main__ - Step 29230: {'lr': 0.00045939070831131293, 'samples': 5612160, 'steps': 29229, 'loss/train': 1.843064546585083} -08/30/2021 18:23:22 - INFO - __main__ - Step 29231: {'lr': 0.00045938780897206686, 'samples': 5612352, 'steps': 29230, 'loss/train': 1.830507755279541} -08/30/2021 18:23:22 - INFO - __main__ - Step 29232: {'lr': 0.000459384909538474, 'samples': 5612544, 'steps': 29231, 'loss/train': 1.4795317649841309} -08/30/2021 18:23:24 - INFO - __main__ - Step 29233: {'lr': 0.00045938201001053546, 'samples': 5612736, 'steps': 29232, 'loss/train': 1.0575584173202515} -08/30/2021 18:23:24 - INFO - __main__ - Step 29234: {'lr': 0.00045937911038825257, 'samples': 5612928, 'steps': 29233, 'loss/train': 1.151182770729065} -08/30/2021 18:23:24 - INFO - __main__ - Step 29235: {'lr': 0.00045937621067162674, 'samples': 5613120, 'steps': 29234, 'loss/train': 1.608346700668335} -08/30/2021 18:23:25 - INFO - __main__ - Step 29236: {'lr': 0.0004593733108606592, 'samples': 5613312, 'steps': 29235, 'loss/train': 1.6283247470855713} -08/30/2021 18:23:25 - INFO - __main__ - Step 29237: {'lr': 0.00045937041095535125, 'samples': 5613504, 'steps': 29236, 'loss/train': 0.992626965045929} -08/30/2021 18:23:27 - INFO - __main__ - Step 29238: {'lr': 0.00045936751095570426, 'samples': 5613696, 'steps': 29237, 'loss/train': 1.8615106344223022} -08/30/2021 18:23:27 - INFO - __main__ - Step 29239: {'lr': 0.0004593646108617195, 'samples': 5613888, 'steps': 29238, 'loss/train': 1.2490863800048828} -08/30/2021 18:23:28 - INFO - __main__ - Step 29240: {'lr': 0.00045936171067339826, 'samples': 5614080, 'steps': 29239, 'loss/train': 0.8721458911895752} -08/30/2021 18:23:28 - INFO - __main__ - Step 29241: {'lr': 0.0004593588103907419, 'samples': 5614272, 'steps': 29240, 'loss/train': 1.4577882289886475} -08/30/2021 18:23:28 - INFO - __main__ - Step 29242: {'lr': 0.00045935591001375163, 'samples': 5614464, 'steps': 29241, 'loss/train': 1.1836299896240234} -08/30/2021 18:23:30 - INFO - __main__ - Step 29243: {'lr': 0.0004593530095424289, 'samples': 5614656, 'steps': 29242, 'loss/train': 1.4437614679336548} -08/30/2021 18:23:30 - INFO - __main__ - Step 29244: {'lr': 0.0004593501089767749, 'samples': 5614848, 'steps': 29243, 'loss/train': 1.8363823890686035} -08/30/2021 18:23:31 - INFO - __main__ - Step 29245: {'lr': 0.00045934720831679093, 'samples': 5615040, 'steps': 29244, 'loss/train': 1.7396713495254517} -08/30/2021 18:23:31 - INFO - __main__ - Step 29246: {'lr': 0.00045934430756247835, 'samples': 5615232, 'steps': 29245, 'loss/train': 1.134104609489441} -08/30/2021 18:23:31 - INFO - __main__ - Step 29247: {'lr': 0.0004593414067138385, 'samples': 5615424, 'steps': 29246, 'loss/train': 1.3727607727050781} -08/30/2021 18:23:33 - INFO - __main__ - Step 29248: {'lr': 0.0004593385057708726, 'samples': 5615616, 'steps': 29247, 'loss/train': 2.2144601345062256} -08/30/2021 18:23:33 - INFO - __main__ - Step 29249: {'lr': 0.00045933560473358206, 'samples': 5615808, 'steps': 29248, 'loss/train': 0.8779964447021484} -08/30/2021 18:23:34 - INFO - __main__ - Step 29250: {'lr': 0.00045933270360196804, 'samples': 5616000, 'steps': 29249, 'loss/train': 0.9211687445640564} -08/30/2021 18:23:34 - INFO - __main__ - Step 29251: {'lr': 0.00045932980237603196, 'samples': 5616192, 'steps': 29250, 'loss/train': 1.9939184188842773} -08/30/2021 18:23:34 - INFO - __main__ - Step 29252: {'lr': 0.0004593269010557751, 'samples': 5616384, 'steps': 29251, 'loss/train': 1.875595211982727} -08/30/2021 18:23:36 - INFO - __main__ - Step 29253: {'lr': 0.00045932399964119884, 'samples': 5616576, 'steps': 29252, 'loss/train': 0.7005326151847839} -08/30/2021 18:23:36 - INFO - __main__ - Step 29254: {'lr': 0.00045932109813230437, 'samples': 5616768, 'steps': 29253, 'loss/train': 0.7504449486732483} -08/30/2021 18:23:37 - INFO - __main__ - Step 29255: {'lr': 0.00045931819652909303, 'samples': 5616960, 'steps': 29254, 'loss/train': 1.004144310951233} -08/30/2021 18:23:37 - INFO - __main__ - Step 29256: {'lr': 0.0004593152948315661, 'samples': 5617152, 'steps': 29255, 'loss/train': 2.0227677822113037} -08/30/2021 18:23:37 - INFO - __main__ - Step 29257: {'lr': 0.000459312393039725, 'samples': 5617344, 'steps': 29256, 'loss/train': 1.3434467315673828} -08/30/2021 18:23:39 - INFO - __main__ - Step 29258: {'lr': 0.0004593094911535709, 'samples': 5617536, 'steps': 29257, 'loss/train': 1.2487927675247192} -08/30/2021 18:23:39 - INFO - __main__ - Step 29259: {'lr': 0.00045930658917310525, 'samples': 5617728, 'steps': 29258, 'loss/train': 1.1003031730651855} -08/30/2021 18:23:40 - INFO - __main__ - Step 29260: {'lr': 0.0004593036870983293, 'samples': 5617920, 'steps': 29259, 'loss/train': 0.5249273777008057} -08/30/2021 18:23:40 - INFO - __main__ - Step 29261: {'lr': 0.0004593007849292442, 'samples': 5618112, 'steps': 29260, 'loss/train': 1.3971539735794067} -08/30/2021 18:23:40 - INFO - __main__ - Step 29262: {'lr': 0.0004592978826658515, 'samples': 5618304, 'steps': 29261, 'loss/train': 1.1266720294952393} -08/30/2021 18:23:41 - INFO - __main__ - Step 29263: {'lr': 0.0004592949803081524, 'samples': 5618496, 'steps': 29262, 'loss/train': 1.3973729610443115} -08/30/2021 18:23:42 - INFO - __main__ - Step 29264: {'lr': 0.0004592920778561481, 'samples': 5618688, 'steps': 29263, 'loss/train': 1.573115587234497} -08/30/2021 18:23:43 - INFO - __main__ - Step 29265: {'lr': 0.00045928917530984014, 'samples': 5618880, 'steps': 29264, 'loss/train': 1.5579097270965576} -08/30/2021 18:23:43 - INFO - __main__ - Step 29266: {'lr': 0.00045928627266922974, 'samples': 5619072, 'steps': 29265, 'loss/train': 1.3227323293685913} -08/30/2021 18:23:43 - INFO - __main__ - Step 29267: {'lr': 0.0004592833699343181, 'samples': 5619264, 'steps': 29266, 'loss/train': 1.3814913034439087} -08/30/2021 18:23:44 - INFO - __main__ - Step 29268: {'lr': 0.0004592804671051066, 'samples': 5619456, 'steps': 29267, 'loss/train': 1.4172732830047607} -08/30/2021 18:23:46 - INFO - __main__ - Step 29269: {'lr': 0.0004592775641815966, 'samples': 5619648, 'steps': 29268, 'loss/train': 1.255063772201538} -08/30/2021 18:23:46 - INFO - __main__ - Step 29270: {'lr': 0.0004592746611637893, 'samples': 5619840, 'steps': 29269, 'loss/train': 1.000472068786621} -08/30/2021 18:23:46 - INFO - __main__ - Step 29271: {'lr': 0.00045927175805168607, 'samples': 5620032, 'steps': 29270, 'loss/train': 1.4347294569015503} -08/30/2021 18:23:47 - INFO - __main__ - Step 29272: {'lr': 0.00045926885484528823, 'samples': 5620224, 'steps': 29271, 'loss/train': 1.3716964721679688} -08/30/2021 18:23:47 - INFO - __main__ - Step 29273: {'lr': 0.0004592659515445971, 'samples': 5620416, 'steps': 29272, 'loss/train': 1.3793617486953735} -08/30/2021 18:23:49 - INFO - __main__ - Step 29274: {'lr': 0.00045926304814961397, 'samples': 5620608, 'steps': 29273, 'loss/train': 2.1355173587799072} -08/30/2021 18:23:49 - INFO - __main__ - Step 29275: {'lr': 0.00045926014466034004, 'samples': 5620800, 'steps': 29274, 'loss/train': 1.9838016033172607} -08/30/2021 18:23:49 - INFO - __main__ - Step 29276: {'lr': 0.0004592572410767768, 'samples': 5620992, 'steps': 29275, 'loss/train': 1.316576600074768} -08/30/2021 18:23:50 - INFO - __main__ - Step 29277: {'lr': 0.0004592543373989255, 'samples': 5621184, 'steps': 29276, 'loss/train': 1.364548921585083} -08/30/2021 18:23:50 - INFO - __main__ - Step 29278: {'lr': 0.0004592514336267874, 'samples': 5621376, 'steps': 29277, 'loss/train': 0.8687638640403748} -08/30/2021 18:23:52 - INFO - __main__ - Step 29279: {'lr': 0.0004592485297603638, 'samples': 5621568, 'steps': 29278, 'loss/train': 1.6683703660964966} -08/30/2021 18:23:52 - INFO - __main__ - Step 29280: {'lr': 0.0004592456257996561, 'samples': 5621760, 'steps': 29279, 'loss/train': 1.223831295967102} -08/30/2021 18:23:53 - INFO - __main__ - Step 29281: {'lr': 0.0004592427217446655, 'samples': 5621952, 'steps': 29280, 'loss/train': 1.568655014038086} -08/30/2021 18:23:53 - INFO - __main__ - Step 29282: {'lr': 0.00045923981759539336, 'samples': 5622144, 'steps': 29281, 'loss/train': 0.8661690950393677} -08/30/2021 18:23:53 - INFO - __main__ - Step 29283: {'lr': 0.000459236913351841, 'samples': 5622336, 'steps': 29282, 'loss/train': 2.0108747482299805} -08/30/2021 18:23:54 - INFO - __main__ - Step 29284: {'lr': 0.0004592340090140097, 'samples': 5622528, 'steps': 29283, 'loss/train': 0.9387965202331543} -08/30/2021 18:23:55 - INFO - __main__ - Step 29285: {'lr': 0.0004592311045819008, 'samples': 5622720, 'steps': 29284, 'loss/train': 1.8075882196426392} -08/30/2021 18:23:56 - INFO - __main__ - Step 29286: {'lr': 0.00045922820005551556, 'samples': 5622912, 'steps': 29285, 'loss/train': 0.9452568292617798} -08/30/2021 18:23:56 - INFO - __main__ - Step 29287: {'lr': 0.0004592252954348554, 'samples': 5623104, 'steps': 29286, 'loss/train': 1.3390796184539795} -08/30/2021 18:23:56 - INFO - __main__ - Step 29288: {'lr': 0.0004592223907199215, 'samples': 5623296, 'steps': 29287, 'loss/train': 1.1554780006408691} -08/30/2021 18:23:57 - INFO - __main__ - Step 29289: {'lr': 0.0004592194859107153, 'samples': 5623488, 'steps': 29288, 'loss/train': 1.4837032556533813} -08/30/2021 18:23:58 - INFO - __main__ - Step 29290: {'lr': 0.0004592165810072379, 'samples': 5623680, 'steps': 29289, 'loss/train': 1.022546648979187} -08/30/2021 18:23:58 - INFO - __main__ - Step 29291: {'lr': 0.00045921367600949077, 'samples': 5623872, 'steps': 29290, 'loss/train': 2.0431230068206787} -08/30/2021 18:23:59 - INFO - __main__ - Step 29292: {'lr': 0.0004592107709174752, 'samples': 5624064, 'steps': 29291, 'loss/train': 1.0799243450164795} -08/30/2021 18:23:59 - INFO - __main__ - Step 29293: {'lr': 0.0004592078657311925, 'samples': 5624256, 'steps': 29292, 'loss/train': 1.9466733932495117} -08/30/2021 18:24:00 - INFO - __main__ - Step 29294: {'lr': 0.000459204960450644, 'samples': 5624448, 'steps': 29293, 'loss/train': 1.696338415145874} -08/30/2021 18:24:01 - INFO - __main__ - Step 29295: {'lr': 0.0004592020550758309, 'samples': 5624640, 'steps': 29294, 'loss/train': 1.9128203392028809} -08/30/2021 18:24:02 - INFO - __main__ - Step 29296: {'lr': 0.0004591991496067546, 'samples': 5624832, 'steps': 29295, 'loss/train': 0.7891136407852173} -08/30/2021 18:24:02 - INFO - __main__ - Step 29297: {'lr': 0.00045919624404341643, 'samples': 5625024, 'steps': 29296, 'loss/train': 0.862982988357544} -08/30/2021 18:24:02 - INFO - __main__ - Step 29298: {'lr': 0.00045919333838581757, 'samples': 5625216, 'steps': 29297, 'loss/train': 1.9168561697006226} -08/30/2021 18:24:03 - INFO - __main__ - Step 29299: {'lr': 0.00045919043263395953, 'samples': 5625408, 'steps': 29298, 'loss/train': 2.242788076400757} -08/30/2021 18:24:05 - INFO - __main__ - Step 29300: {'lr': 0.00045918752678784344, 'samples': 5625600, 'steps': 29299, 'loss/train': 0.987244725227356} -08/30/2021 18:24:05 - INFO - __main__ - Step 29301: {'lr': 0.0004591846208474707, 'samples': 5625792, 'steps': 29300, 'loss/train': 1.4617302417755127} -08/30/2021 18:24:05 - INFO - __main__ - Step 29302: {'lr': 0.00045918171481284256, 'samples': 5625984, 'steps': 29301, 'loss/train': 1.0888047218322754} -08/30/2021 18:24:06 - INFO - __main__ - Step 29303: {'lr': 0.0004591788086839604, 'samples': 5626176, 'steps': 29302, 'loss/train': 1.3656442165374756} -08/30/2021 18:24:06 - INFO - __main__ - Step 29304: {'lr': 0.0004591759024608255, 'samples': 5626368, 'steps': 29303, 'loss/train': 0.27926814556121826} -08/30/2021 18:24:08 - INFO - __main__ - Step 29305: {'lr': 0.0004591729961434392, 'samples': 5626560, 'steps': 29304, 'loss/train': 0.8646825551986694} -08/30/2021 18:24:08 - INFO - __main__ - Step 29306: {'lr': 0.00045917008973180273, 'samples': 5626752, 'steps': 29305, 'loss/train': 1.7475866079330444} -08/30/2021 18:24:09 - INFO - __main__ - Step 29307: {'lr': 0.0004591671832259174, 'samples': 5626944, 'steps': 29306, 'loss/train': 1.5658386945724487} -08/30/2021 18:24:09 - INFO - __main__ - Step 29308: {'lr': 0.00045916427662578464, 'samples': 5627136, 'steps': 29307, 'loss/train': 1.567349910736084} -08/30/2021 18:24:09 - INFO - __main__ - Step 29309: {'lr': 0.00045916136993140574, 'samples': 5627328, 'steps': 29308, 'loss/train': 1.929797649383545} -08/30/2021 18:24:11 - INFO - __main__ - Step 29310: {'lr': 0.00045915846314278187, 'samples': 5627520, 'steps': 29309, 'loss/train': 1.587865948677063} -08/30/2021 18:24:11 - INFO - __main__ - Step 29311: {'lr': 0.0004591555562599144, 'samples': 5627712, 'steps': 29310, 'loss/train': 1.904259443283081} -08/30/2021 18:24:11 - INFO - __main__ - Step 29312: {'lr': 0.00045915264928280476, 'samples': 5627904, 'steps': 29311, 'loss/train': 0.4572484493255615} -08/30/2021 18:24:12 - INFO - __main__ - Step 29313: {'lr': 0.00045914974221145403, 'samples': 5628096, 'steps': 29312, 'loss/train': 1.4013017416000366} -08/30/2021 18:24:12 - INFO - __main__ - Step 29314: {'lr': 0.00045914683504586374, 'samples': 5628288, 'steps': 29313, 'loss/train': 1.0001164674758911} -08/30/2021 18:24:13 - INFO - __main__ - Step 29315: {'lr': 0.0004591439277860351, 'samples': 5628480, 'steps': 29314, 'loss/train': 1.1321221590042114} -08/30/2021 18:24:14 - INFO - __main__ - Step 29316: {'lr': 0.00045914102043196947, 'samples': 5628672, 'steps': 29315, 'loss/train': 1.1323622465133667} -08/30/2021 18:24:14 - INFO - __main__ - Step 29317: {'lr': 0.00045913811298366804, 'samples': 5628864, 'steps': 29316, 'loss/train': 0.9505067467689514} -08/30/2021 18:24:15 - INFO - __main__ - Step 29318: {'lr': 0.0004591352054411323, 'samples': 5629056, 'steps': 29317, 'loss/train': 1.6290580034255981} -08/30/2021 18:24:15 - INFO - __main__ - Step 29319: {'lr': 0.00045913229780436337, 'samples': 5629248, 'steps': 29318, 'loss/train': 1.8942209482192993} -08/30/2021 18:24:16 - INFO - __main__ - Step 29320: {'lr': 0.00045912939007336273, 'samples': 5629440, 'steps': 29319, 'loss/train': 1.6758254766464233} -08/30/2021 18:24:17 - INFO - __main__ - Step 29321: {'lr': 0.0004591264822481316, 'samples': 5629632, 'steps': 29320, 'loss/train': 1.3814494609832764} -08/30/2021 18:24:17 - INFO - __main__ - Step 29322: {'lr': 0.00045912357432867124, 'samples': 5629824, 'steps': 29321, 'loss/train': 1.2043546438217163} -08/30/2021 18:24:18 - INFO - __main__ - Step 29323: {'lr': 0.00045912066631498304, 'samples': 5630016, 'steps': 29322, 'loss/train': 2.0598459243774414} -08/30/2021 18:24:18 - INFO - __main__ - Step 29324: {'lr': 0.00045911775820706835, 'samples': 5630208, 'steps': 29323, 'loss/train': 0.9047432541847229} -08/30/2021 18:24:18 - INFO - __main__ - Step 29325: {'lr': 0.0004591148500049284, 'samples': 5630400, 'steps': 29324, 'loss/train': 0.9984139800071716} -08/30/2021 18:24:21 - INFO - __main__ - Step 29326: {'lr': 0.00045911194170856454, 'samples': 5630592, 'steps': 29325, 'loss/train': 1.636504888534546} -08/30/2021 18:24:21 - INFO - __main__ - Step 29327: {'lr': 0.00045910903331797807, 'samples': 5630784, 'steps': 29326, 'loss/train': 2.1306819915771484} -08/30/2021 18:24:22 - INFO - __main__ - Step 29328: {'lr': 0.00045910612483317025, 'samples': 5630976, 'steps': 29327, 'loss/train': 1.4284075498580933} -08/30/2021 18:24:22 - INFO - __main__ - Step 29329: {'lr': 0.00045910321625414245, 'samples': 5631168, 'steps': 29328, 'loss/train': 1.2354590892791748} -08/30/2021 18:24:22 - INFO - __main__ - Step 29330: {'lr': 0.00045910030758089597, 'samples': 5631360, 'steps': 29329, 'loss/train': 1.5467263460159302} -08/30/2021 18:24:24 - INFO - __main__ - Step 29331: {'lr': 0.00045909739881343215, 'samples': 5631552, 'steps': 29330, 'loss/train': 1.8582510948181152} -08/30/2021 18:24:24 - INFO - __main__ - Step 29332: {'lr': 0.00045909448995175224, 'samples': 5631744, 'steps': 29331, 'loss/train': 1.2985451221466064} -08/30/2021 18:24:25 - INFO - __main__ - Step 29333: {'lr': 0.00045909158099585756, 'samples': 5631936, 'steps': 29332, 'loss/train': 1.6099449396133423} -08/30/2021 18:24:25 - INFO - __main__ - Step 29334: {'lr': 0.00045908867194574955, 'samples': 5632128, 'steps': 29333, 'loss/train': 2.1385371685028076} -08/30/2021 18:24:25 - INFO - __main__ - Step 29335: {'lr': 0.00045908576280142925, 'samples': 5632320, 'steps': 29334, 'loss/train': 1.5409995317459106} -08/30/2021 18:24:26 - INFO - __main__ - Step 29336: {'lr': 0.00045908285356289824, 'samples': 5632512, 'steps': 29335, 'loss/train': 1.1011066436767578} -08/30/2021 18:24:27 - INFO - __main__ - Step 29337: {'lr': 0.0004590799442301577, 'samples': 5632704, 'steps': 29336, 'loss/train': 1.2381199598312378} -08/30/2021 18:24:28 - INFO - __main__ - Step 29338: {'lr': 0.00045907703480320894, 'samples': 5632896, 'steps': 29337, 'loss/train': 1.1147611141204834} -08/30/2021 18:24:28 - INFO - __main__ - Step 29339: {'lr': 0.0004590741252820533, 'samples': 5633088, 'steps': 29338, 'loss/train': 1.4083908796310425} -08/30/2021 18:24:29 - INFO - __main__ - Step 29340: {'lr': 0.00045907121566669216, 'samples': 5633280, 'steps': 29339, 'loss/train': 1.5535962581634521} -08/30/2021 18:24:29 - INFO - __main__ - Step 29341: {'lr': 0.0004590683059571267, 'samples': 5633472, 'steps': 29340, 'loss/train': 1.7197771072387695} -08/30/2021 18:24:30 - INFO - __main__ - Step 29342: {'lr': 0.0004590653961533582, 'samples': 5633664, 'steps': 29341, 'loss/train': 1.7851433753967285} -08/30/2021 18:24:31 - INFO - __main__ - Step 29343: {'lr': 0.00045906248625538816, 'samples': 5633856, 'steps': 29342, 'loss/train': 1.4537101984024048} -08/30/2021 18:24:31 - INFO - __main__ - Step 29344: {'lr': 0.00045905957626321775, 'samples': 5634048, 'steps': 29343, 'loss/train': 1.348261833190918} -08/30/2021 18:24:32 - INFO - __main__ - Step 29345: {'lr': 0.0004590566661768484, 'samples': 5634240, 'steps': 29344, 'loss/train': 1.3653773069381714} -08/30/2021 18:24:32 - INFO - __main__ - Step 29346: {'lr': 0.00045905375599628127, 'samples': 5634432, 'steps': 29345, 'loss/train': 0.8258079290390015} -08/30/2021 18:24:33 - INFO - __main__ - Step 29347: {'lr': 0.00045905084572151774, 'samples': 5634624, 'steps': 29346, 'loss/train': 1.3003286123275757} -08/30/2021 18:24:34 - INFO - __main__ - Step 29348: {'lr': 0.0004590479353525591, 'samples': 5634816, 'steps': 29347, 'loss/train': 1.6447889804840088} -08/30/2021 18:24:34 - INFO - __main__ - Step 29349: {'lr': 0.00045904502488940677, 'samples': 5635008, 'steps': 29348, 'loss/train': 1.581138253211975} -08/30/2021 18:24:35 - INFO - __main__ - Step 29350: {'lr': 0.0004590421143320619, 'samples': 5635200, 'steps': 29349, 'loss/train': 1.915869116783142} -08/30/2021 18:24:35 - INFO - __main__ - Step 29351: {'lr': 0.0004590392036805259, 'samples': 5635392, 'steps': 29350, 'loss/train': 1.9172983169555664} -08/30/2021 18:24:35 - INFO - __main__ - Step 29352: {'lr': 0.0004590362929348001, 'samples': 5635584, 'steps': 29351, 'loss/train': 2.118647336959839} -08/30/2021 18:24:37 - INFO - __main__ - Step 29353: {'lr': 0.00045903338209488575, 'samples': 5635776, 'steps': 29352, 'loss/train': 1.2624213695526123} -08/30/2021 18:24:37 - INFO - __main__ - Step 29354: {'lr': 0.0004590304711607842, 'samples': 5635968, 'steps': 29353, 'loss/train': 0.9841771721839905} -08/30/2021 18:24:38 - INFO - __main__ - Step 29355: {'lr': 0.0004590275601324967, 'samples': 5636160, 'steps': 29354, 'loss/train': 1.7141315937042236} -08/30/2021 18:24:38 - INFO - __main__ - Step 29356: {'lr': 0.0004590246490100246, 'samples': 5636352, 'steps': 29355, 'loss/train': 1.6033127307891846} -08/30/2021 18:24:38 - INFO - __main__ - Step 29357: {'lr': 0.00045902173779336925, 'samples': 5636544, 'steps': 29356, 'loss/train': 1.4778285026550293} -08/30/2021 18:24:40 - INFO - __main__ - Step 29358: {'lr': 0.0004590188264825319, 'samples': 5636736, 'steps': 29357, 'loss/train': 1.6052192449569702} -08/30/2021 18:24:41 - INFO - __main__ - Step 29359: {'lr': 0.00045901591507751393, 'samples': 5636928, 'steps': 29358, 'loss/train': 3.5689525604248047} -08/30/2021 18:24:41 - INFO - __main__ - Step 29360: {'lr': 0.00045901300357831666, 'samples': 5637120, 'steps': 29359, 'loss/train': 9.343769073486328} -08/30/2021 18:24:41 - INFO - __main__ - Step 29361: {'lr': 0.00045901009198494124, 'samples': 5637312, 'steps': 29360, 'loss/train': 1.572585940361023} -08/30/2021 18:24:42 - INFO - __main__ - Step 29362: {'lr': 0.0004590071802973892, 'samples': 5637504, 'steps': 29361, 'loss/train': 1.0418428182601929} -08/30/2021 18:24:42 - INFO - __main__ - Step 29363: {'lr': 0.0004590042685156617, 'samples': 5637696, 'steps': 29362, 'loss/train': 1.0124503374099731} -08/30/2021 18:24:43 - INFO - __main__ - Step 29364: {'lr': 0.0004590013566397601, 'samples': 5637888, 'steps': 29363, 'loss/train': 1.5964131355285645} -08/30/2021 18:24:44 - INFO - __main__ - Step 29365: {'lr': 0.00045899844466968574, 'samples': 5638080, 'steps': 29364, 'loss/train': 1.4689416885375977} -08/30/2021 18:24:44 - INFO - __main__ - Step 29366: {'lr': 0.00045899553260543986, 'samples': 5638272, 'steps': 29365, 'loss/train': 1.0361446142196655} -08/30/2021 18:24:45 - INFO - __main__ - Step 29367: {'lr': 0.0004589926204470238, 'samples': 5638464, 'steps': 29366, 'loss/train': 1.4815704822540283} -08/30/2021 18:24:45 - INFO - __main__ - Step 29368: {'lr': 0.000458989708194439, 'samples': 5638656, 'steps': 29367, 'loss/train': 1.4048242568969727} -08/30/2021 18:24:45 - INFO - __main__ - Step 29369: {'lr': 0.0004589867958476866, 'samples': 5638848, 'steps': 29368, 'loss/train': 1.5980817079544067} -08/30/2021 18:24:47 - INFO - __main__ - Step 29370: {'lr': 0.000458983883406768, 'samples': 5639040, 'steps': 29369, 'loss/train': 1.6755766868591309} -08/30/2021 18:24:48 - INFO - __main__ - Step 29371: {'lr': 0.0004589809708716844, 'samples': 5639232, 'steps': 29370, 'loss/train': 1.5317788124084473} -08/30/2021 18:24:48 - INFO - __main__ - Step 29372: {'lr': 0.0004589780582424373, 'samples': 5639424, 'steps': 29371, 'loss/train': 1.7573219537734985} -08/30/2021 18:24:48 - INFO - __main__ - Step 29373: {'lr': 0.00045897514551902785, 'samples': 5639616, 'steps': 29372, 'loss/train': 1.8937082290649414} -08/30/2021 18:24:49 - INFO - __main__ - Step 29374: {'lr': 0.0004589722327014575, 'samples': 5639808, 'steps': 29373, 'loss/train': 0.046694349497556686} -08/30/2021 18:24:50 - INFO - __main__ - Step 29375: {'lr': 0.0004589693197897274, 'samples': 5640000, 'steps': 29374, 'loss/train': 1.5517034530639648} -08/30/2021 18:24:51 - INFO - __main__ - Step 29376: {'lr': 0.0004589664067838389, 'samples': 5640192, 'steps': 29375, 'loss/train': 1.9797797203063965} -08/30/2021 18:24:51 - INFO - __main__ - Step 29377: {'lr': 0.00045896349368379356, 'samples': 5640384, 'steps': 29376, 'loss/train': 1.8868993520736694} -08/30/2021 18:24:51 - INFO - __main__ - Step 29378: {'lr': 0.00045896058048959233, 'samples': 5640576, 'steps': 29377, 'loss/train': 1.7486587762832642} -08/30/2021 18:24:52 - INFO - __main__ - Step 29379: {'lr': 0.00045895766720123677, 'samples': 5640768, 'steps': 29378, 'loss/train': 1.639821171760559} -08/30/2021 18:24:52 - INFO - __main__ - Step 29380: {'lr': 0.0004589547538187281, 'samples': 5640960, 'steps': 29379, 'loss/train': 1.2783039808273315} -08/30/2021 18:24:54 - INFO - __main__ - Step 29381: {'lr': 0.0004589518403420676, 'samples': 5641152, 'steps': 29380, 'loss/train': 1.9844601154327393} -08/30/2021 18:24:54 - INFO - __main__ - Step 29382: {'lr': 0.00045894892677125667, 'samples': 5641344, 'steps': 29381, 'loss/train': 0.6697326302528381} -08/30/2021 18:24:54 - INFO - __main__ - Step 29383: {'lr': 0.0004589460131062965, 'samples': 5641536, 'steps': 29382, 'loss/train': 1.7014347314834595} -08/30/2021 18:24:55 - INFO - __main__ - Step 29384: {'lr': 0.00045894309934718853, 'samples': 5641728, 'steps': 29383, 'loss/train': 1.9141618013381958} -08/30/2021 18:24:55 - INFO - __main__ - Step 29385: {'lr': 0.00045894018549393404, 'samples': 5641920, 'steps': 29384, 'loss/train': 1.6436084508895874} -08/30/2021 18:24:57 - INFO - __main__ - Step 29386: {'lr': 0.0004589372715465343, 'samples': 5642112, 'steps': 29385, 'loss/train': 1.6123789548873901} -08/30/2021 18:24:57 - INFO - __main__ - Step 29387: {'lr': 0.0004589343575049907, 'samples': 5642304, 'steps': 29386, 'loss/train': 0.6841147541999817} -08/30/2021 18:24:58 - INFO - __main__ - Step 29388: {'lr': 0.0004589314433693044, 'samples': 5642496, 'steps': 29387, 'loss/train': 1.6462756395339966} -08/30/2021 18:24:58 - INFO - __main__ - Step 29389: {'lr': 0.0004589285291394769, 'samples': 5642688, 'steps': 29388, 'loss/train': 3.1464827060699463} -08/30/2021 18:24:58 - INFO - __main__ - Step 29390: {'lr': 0.00045892561481550943, 'samples': 5642880, 'steps': 29389, 'loss/train': 1.0138169527053833} -08/30/2021 18:25:00 - INFO - __main__ - Step 29391: {'lr': 0.0004589227003974032, 'samples': 5643072, 'steps': 29390, 'loss/train': 1.6912964582443237} -08/30/2021 18:25:00 - INFO - __main__ - Step 29392: {'lr': 0.00045891978588515975, 'samples': 5643264, 'steps': 29391, 'loss/train': 2.052468776702881} -08/30/2021 18:25:01 - INFO - __main__ - Step 29393: {'lr': 0.0004589168712787802, 'samples': 5643456, 'steps': 29392, 'loss/train': 1.9062495231628418} -08/30/2021 18:25:01 - INFO - __main__ - Step 29394: {'lr': 0.00045891395657826595, 'samples': 5643648, 'steps': 29393, 'loss/train': 1.2196245193481445} -08/30/2021 18:25:01 - INFO - __main__ - Step 29395: {'lr': 0.0004589110417836183, 'samples': 5643840, 'steps': 29394, 'loss/train': 1.4842808246612549} -08/30/2021 18:25:03 - INFO - __main__ - Step 29396: {'lr': 0.0004589081268948386, 'samples': 5644032, 'steps': 29395, 'loss/train': 1.4386818408966064} -08/30/2021 18:25:04 - INFO - __main__ - Step 29397: {'lr': 0.00045890521191192807, 'samples': 5644224, 'steps': 29396, 'loss/train': 0.10482214391231537} -08/30/2021 18:25:04 - INFO - __main__ - Step 29398: {'lr': 0.0004589022968348881, 'samples': 5644416, 'steps': 29397, 'loss/train': 1.5119930505752563} -08/30/2021 18:25:04 - INFO - __main__ - Step 29399: {'lr': 0.0004588993816637199, 'samples': 5644608, 'steps': 29398, 'loss/train': 1.028935194015503} -08/30/2021 18:25:05 - INFO - __main__ - Step 29400: {'lr': 0.00045889646639842496, 'samples': 5644800, 'steps': 29399, 'loss/train': 1.5866012573242188} -08/30/2021 18:25:06 - INFO - __main__ - Step 29401: {'lr': 0.0004588935510390045, 'samples': 5644992, 'steps': 29400, 'loss/train': 1.3974342346191406} -08/30/2021 18:25:07 - INFO - __main__ - Step 29402: {'lr': 0.00045889063558545974, 'samples': 5645184, 'steps': 29401, 'loss/train': 1.3678932189941406} -08/30/2021 18:25:07 - INFO - __main__ - Step 29403: {'lr': 0.0004588877200377921, 'samples': 5645376, 'steps': 29402, 'loss/train': 2.091094970703125} -08/30/2021 18:25:07 - INFO - __main__ - Step 29404: {'lr': 0.000458884804396003, 'samples': 5645568, 'steps': 29403, 'loss/train': 0.39705920219421387} -08/30/2021 18:25:08 - INFO - __main__ - Step 29405: {'lr': 0.0004588818886600935, 'samples': 5645760, 'steps': 29404, 'loss/train': 1.5316617488861084} -08/30/2021 18:25:09 - INFO - __main__ - Step 29406: {'lr': 0.00045887897283006506, 'samples': 5645952, 'steps': 29405, 'loss/train': 1.222008228302002} -08/30/2021 18:25:10 - INFO - __main__ - Step 29407: {'lr': 0.00045887605690591904, 'samples': 5646144, 'steps': 29406, 'loss/train': 1.6904852390289307} -08/30/2021 18:25:10 - INFO - __main__ - Step 29408: {'lr': 0.0004588731408876566, 'samples': 5646336, 'steps': 29407, 'loss/train': 1.104187250137329} -08/30/2021 18:25:11 - INFO - __main__ - Step 29409: {'lr': 0.00045887022477527923, 'samples': 5646528, 'steps': 29408, 'loss/train': 0.0872500017285347} -08/30/2021 18:25:11 - INFO - __main__ - Step 29410: {'lr': 0.0004588673085687881, 'samples': 5646720, 'steps': 29409, 'loss/train': 3.6997017860412598} -08/30/2021 18:25:11 - INFO - __main__ - Step 29411: {'lr': 0.00045886439226818464, 'samples': 5646912, 'steps': 29410, 'loss/train': 1.5496467351913452} -08/30/2021 18:25:13 - INFO - __main__ - Step 29412: {'lr': 0.0004588614758734701, 'samples': 5647104, 'steps': 29411, 'loss/train': 1.7699309587478638} -08/30/2021 18:25:14 - INFO - __main__ - Step 29413: {'lr': 0.0004588585593846458, 'samples': 5647296, 'steps': 29412, 'loss/train': 0.24823713302612305} -08/30/2021 18:25:14 - INFO - __main__ - Step 29414: {'lr': 0.000458855642801713, 'samples': 5647488, 'steps': 29413, 'loss/train': 1.5737879276275635} -08/30/2021 18:25:14 - INFO - __main__ - Step 29415: {'lr': 0.00045885272612467313, 'samples': 5647680, 'steps': 29414, 'loss/train': 0.5294879078865051} -08/30/2021 18:25:15 - INFO - __main__ - Step 29416: {'lr': 0.0004588498093535274, 'samples': 5647872, 'steps': 29415, 'loss/train': 1.0835024118423462} -08/30/2021 18:25:15 - INFO - __main__ - Step 29417: {'lr': 0.0004588468924882772, 'samples': 5648064, 'steps': 29416, 'loss/train': 1.8900400400161743} -08/30/2021 18:25:17 - INFO - __main__ - Step 29418: {'lr': 0.0004588439755289238, 'samples': 5648256, 'steps': 29417, 'loss/train': 1.8867288827896118} -08/30/2021 18:25:18 - INFO - __main__ - Step 29419: {'lr': 0.00045884105847546853, 'samples': 5648448, 'steps': 29418, 'loss/train': 1.3944100141525269} -08/30/2021 18:25:18 - INFO - __main__ - Step 29420: {'lr': 0.00045883814132791274, 'samples': 5648640, 'steps': 29419, 'loss/train': 1.8383020162582397} -08/30/2021 18:25:18 - INFO - __main__ - Step 29421: {'lr': 0.0004588352240862577, 'samples': 5648832, 'steps': 29420, 'loss/train': 1.4362998008728027} -08/30/2021 18:25:19 - INFO - __main__ - Step 29422: {'lr': 0.0004588323067505047, 'samples': 5649024, 'steps': 29421, 'loss/train': 1.4182742834091187} -08/30/2021 18:25:20 - INFO - __main__ - Step 29423: {'lr': 0.00045882938932065504, 'samples': 5649216, 'steps': 29422, 'loss/train': 1.8948737382888794} -08/30/2021 18:25:21 - INFO - __main__ - Step 29424: {'lr': 0.0004588264717967101, 'samples': 5649408, 'steps': 29423, 'loss/train': 1.822411060333252} -08/30/2021 18:25:21 - INFO - __main__ - Step 29425: {'lr': 0.00045882355417867124, 'samples': 5649600, 'steps': 29424, 'loss/train': 0.877035915851593} -08/30/2021 18:25:21 - INFO - __main__ - Step 29426: {'lr': 0.00045882063646653966, 'samples': 5649792, 'steps': 29425, 'loss/train': 0.966000497341156} -08/30/2021 18:25:22 - INFO - __main__ - Step 29427: {'lr': 0.00045881771866031673, 'samples': 5649984, 'steps': 29426, 'loss/train': 1.2050514221191406} -08/30/2021 18:25:23 - INFO - __main__ - Step 29428: {'lr': 0.00045881480076000376, 'samples': 5650176, 'steps': 29427, 'loss/train': 1.1730661392211914} -08/30/2021 18:25:24 - INFO - __main__ - Step 29429: {'lr': 0.00045881188276560204, 'samples': 5650368, 'steps': 29428, 'loss/train': 1.0626200437545776} -08/30/2021 18:25:24 - INFO - __main__ - Step 29430: {'lr': 0.000458808964677113, 'samples': 5650560, 'steps': 29429, 'loss/train': 1.5473029613494873} -08/30/2021 18:25:24 - INFO - __main__ - Step 29431: {'lr': 0.00045880604649453774, 'samples': 5650752, 'steps': 29430, 'loss/train': 1.8532428741455078} -08/30/2021 18:25:25 - INFO - __main__ - Step 29432: {'lr': 0.00045880312821787775, 'samples': 5650944, 'steps': 29431, 'loss/train': 1.6421610116958618} -08/30/2021 18:25:26 - INFO - __main__ - Step 29433: {'lr': 0.00045880020984713434, 'samples': 5651136, 'steps': 29432, 'loss/train': 1.980318546295166} -08/30/2021 18:25:27 - INFO - __main__ - Step 29434: {'lr': 0.0004587972913823087, 'samples': 5651328, 'steps': 29433, 'loss/train': 1.8178534507751465} -08/30/2021 18:25:27 - INFO - __main__ - Step 29435: {'lr': 0.00045879437282340225, 'samples': 5651520, 'steps': 29434, 'loss/train': 1.2301417589187622} -08/30/2021 18:25:27 - INFO - __main__ - Step 29436: {'lr': 0.00045879145417041623, 'samples': 5651712, 'steps': 29435, 'loss/train': 1.4887574911117554} -08/30/2021 18:25:28 - INFO - __main__ - Step 29437: {'lr': 0.0004587885354233521, 'samples': 5651904, 'steps': 29436, 'loss/train': 1.3315002918243408} -08/30/2021 18:25:29 - INFO - __main__ - Step 29438: {'lr': 0.0004587856165822111, 'samples': 5652096, 'steps': 29437, 'loss/train': 1.6939550638198853} -08/30/2021 18:25:30 - INFO - __main__ - Step 29439: {'lr': 0.0004587826976469944, 'samples': 5652288, 'steps': 29438, 'loss/train': 1.3654032945632935} -08/30/2021 18:25:30 - INFO - __main__ - Step 29440: {'lr': 0.0004587797786177035, 'samples': 5652480, 'steps': 29439, 'loss/train': 1.600990891456604} -08/30/2021 18:25:30 - INFO - __main__ - Step 29441: {'lr': 0.0004587768594943396, 'samples': 5652672, 'steps': 29440, 'loss/train': 1.4263916015625} -08/30/2021 18:25:31 - INFO - __main__ - Step 29442: {'lr': 0.00045877394027690413, 'samples': 5652864, 'steps': 29441, 'loss/train': 1.4905107021331787} -08/30/2021 18:25:31 - INFO - __main__ - Step 29443: {'lr': 0.0004587710209653984, 'samples': 5653056, 'steps': 29442, 'loss/train': 1.9826242923736572} -08/30/2021 18:25:32 - INFO - __main__ - Step 29444: {'lr': 0.0004587681015598235, 'samples': 5653248, 'steps': 29443, 'loss/train': 1.6064846515655518} -08/30/2021 18:25:33 - INFO - __main__ - Step 29445: {'lr': 0.00045876518206018103, 'samples': 5653440, 'steps': 29444, 'loss/train': 1.5464205741882324} -08/30/2021 18:25:33 - INFO - __main__ - Step 29446: {'lr': 0.00045876226246647226, 'samples': 5653632, 'steps': 29445, 'loss/train': 1.4796415567398071} -08/30/2021 18:25:34 - INFO - __main__ - Step 29447: {'lr': 0.0004587593427786983, 'samples': 5653824, 'steps': 29446, 'loss/train': 0.5536571741104126} -08/30/2021 18:25:34 - INFO - __main__ - Step 29448: {'lr': 0.0004587564229968606, 'samples': 5654016, 'steps': 29447, 'loss/train': 1.7594894170761108} -08/30/2021 18:25:35 - INFO - __main__ - Step 29449: {'lr': 0.00045875350312096053, 'samples': 5654208, 'steps': 29448, 'loss/train': 1.3968859910964966} -08/30/2021 18:25:36 - INFO - __main__ - Step 29450: {'lr': 0.0004587505831509994, 'samples': 5654400, 'steps': 29449, 'loss/train': 1.7576875686645508} -08/30/2021 18:25:36 - INFO - __main__ - Step 29451: {'lr': 0.0004587476630869784, 'samples': 5654592, 'steps': 29450, 'loss/train': 1.3094887733459473} -08/30/2021 18:25:37 - INFO - __main__ - Step 29452: {'lr': 0.000458744742928899, 'samples': 5654784, 'steps': 29451, 'loss/train': 1.0282065868377686} -08/30/2021 18:25:37 - INFO - __main__ - Step 29453: {'lr': 0.00045874182267676236, 'samples': 5654976, 'steps': 29452, 'loss/train': 1.4678053855895996} -08/30/2021 18:25:39 - INFO - __main__ - Step 29454: {'lr': 0.0004587389023305699, 'samples': 5655168, 'steps': 29453, 'loss/train': 1.8546245098114014} -08/30/2021 18:25:39 - INFO - __main__ - Step 29455: {'lr': 0.00045873598189032295, 'samples': 5655360, 'steps': 29454, 'loss/train': 0.6133260130882263} -08/30/2021 18:25:39 - INFO - __main__ - Step 29456: {'lr': 0.00045873306135602276, 'samples': 5655552, 'steps': 29455, 'loss/train': 1.0019116401672363} -08/30/2021 18:25:40 - INFO - __main__ - Step 29457: {'lr': 0.00045873014072767064, 'samples': 5655744, 'steps': 29456, 'loss/train': 0.6915490627288818} -08/30/2021 18:25:40 - INFO - __main__ - Step 29458: {'lr': 0.000458727220005268, 'samples': 5655936, 'steps': 29457, 'loss/train': 1.015907645225525} -08/30/2021 18:25:40 - INFO - __main__ - Step 29459: {'lr': 0.00045872429918881606, 'samples': 5656128, 'steps': 29458, 'loss/train': 0.957791268825531} -08/30/2021 18:25:42 - INFO - __main__ - Step 29460: {'lr': 0.00045872137827831616, 'samples': 5656320, 'steps': 29459, 'loss/train': 1.2022985219955444} -08/30/2021 18:25:42 - INFO - __main__ - Step 29461: {'lr': 0.00045871845727376973, 'samples': 5656512, 'steps': 29460, 'loss/train': 1.2923895120620728} -08/30/2021 18:25:43 - INFO - __main__ - Step 29462: {'lr': 0.0004587155361751778, 'samples': 5656704, 'steps': 29461, 'loss/train': 0.9164935350418091} -08/30/2021 18:25:43 - INFO - __main__ - Step 29463: {'lr': 0.000458712614982542, 'samples': 5656896, 'steps': 29462, 'loss/train': 1.6710330247879028} -08/30/2021 18:25:43 - INFO - __main__ - Step 29464: {'lr': 0.00045870969369586346, 'samples': 5657088, 'steps': 29463, 'loss/train': 2.187263011932373} -08/30/2021 18:25:45 - INFO - __main__ - Step 29465: {'lr': 0.00045870677231514356, 'samples': 5657280, 'steps': 29464, 'loss/train': 1.160699486732483} -08/30/2021 18:25:45 - INFO - __main__ - Step 29466: {'lr': 0.0004587038508403837, 'samples': 5657472, 'steps': 29465, 'loss/train': 1.2791696786880493} -08/30/2021 18:25:46 - INFO - __main__ - Step 29467: {'lr': 0.000458700929271585, 'samples': 5657664, 'steps': 29466, 'loss/train': 1.6932755708694458} -08/30/2021 18:25:46 - INFO - __main__ - Step 29468: {'lr': 0.0004586980076087489, 'samples': 5657856, 'steps': 29467, 'loss/train': 1.0619211196899414} -08/30/2021 18:25:46 - INFO - __main__ - Step 29469: {'lr': 0.0004586950858518767, 'samples': 5658048, 'steps': 29468, 'loss/train': 0.9249522686004639} -08/30/2021 18:25:48 - INFO - __main__ - Step 29470: {'lr': 0.0004586921640009697, 'samples': 5658240, 'steps': 29469, 'loss/train': 1.277970790863037} -08/30/2021 18:25:49 - INFO - __main__ - Step 29471: {'lr': 0.0004586892420560294, 'samples': 5658432, 'steps': 29470, 'loss/train': 1.4958105087280273} -08/30/2021 18:25:49 - INFO - __main__ - Step 29472: {'lr': 0.0004586863200170567, 'samples': 5658624, 'steps': 29471, 'loss/train': 1.5742889642715454} -08/30/2021 18:25:50 - INFO - __main__ - Step 29473: {'lr': 0.00045868339788405333, 'samples': 5658816, 'steps': 29472, 'loss/train': 1.2178361415863037} -08/30/2021 18:25:50 - INFO - __main__ - Step 29474: {'lr': 0.0004586804756570204, 'samples': 5659008, 'steps': 29473, 'loss/train': 0.9887757301330566} -08/30/2021 18:25:52 - INFO - __main__ - Step 29475: {'lr': 0.0004586775533359592, 'samples': 5659200, 'steps': 29474, 'loss/train': 1.120389461517334} -08/30/2021 18:25:52 - INFO - __main__ - Step 29476: {'lr': 0.00045867463092087116, 'samples': 5659392, 'steps': 29475, 'loss/train': 1.218640923500061} -08/30/2021 18:25:52 - INFO - __main__ - Step 29477: {'lr': 0.00045867170841175755, 'samples': 5659584, 'steps': 29476, 'loss/train': 1.182020902633667} -08/30/2021 18:25:53 - INFO - __main__ - Step 29478: {'lr': 0.0004586687858086197, 'samples': 5659776, 'steps': 29477, 'loss/train': 0.715477466583252} -08/30/2021 18:25:53 - INFO - __main__ - Step 29479: {'lr': 0.0004586658631114589, 'samples': 5659968, 'steps': 29478, 'loss/train': 1.6136478185653687} -08/30/2021 18:25:55 - INFO - __main__ - Step 29480: {'lr': 0.0004586629403202765, 'samples': 5660160, 'steps': 29479, 'loss/train': 1.5179307460784912} -08/30/2021 18:25:55 - INFO - __main__ - Step 29481: {'lr': 0.0004586600174350738, 'samples': 5660352, 'steps': 29480, 'loss/train': 0.09195207059383392} -08/30/2021 18:25:56 - INFO - __main__ - Step 29482: {'lr': 0.0004586570944558521, 'samples': 5660544, 'steps': 29481, 'loss/train': 1.2771415710449219} -08/30/2021 18:25:56 - INFO - __main__ - Step 29483: {'lr': 0.00045865417138261276, 'samples': 5660736, 'steps': 29482, 'loss/train': 0.06736479699611664} -08/30/2021 18:25:56 - INFO - __main__ - Step 29484: {'lr': 0.00045865124821535704, 'samples': 5660928, 'steps': 29483, 'loss/train': 0.6730112433433533} -08/30/2021 18:25:58 - INFO - __main__ - Step 29485: {'lr': 0.00045864832495408624, 'samples': 5661120, 'steps': 29484, 'loss/train': 2.730788230895996} -08/30/2021 18:25:59 - INFO - __main__ - Step 29486: {'lr': 0.0004586454015988019, 'samples': 5661312, 'steps': 29485, 'loss/train': 0.9634883403778076} -08/30/2021 18:25:59 - INFO - __main__ - Step 29487: {'lr': 0.000458642478149505, 'samples': 5661504, 'steps': 29486, 'loss/train': 1.6337947845458984} -08/30/2021 18:25:59 - INFO - __main__ - Step 29488: {'lr': 0.00045863955460619707, 'samples': 5661696, 'steps': 29487, 'loss/train': 1.7172850370407104} -08/30/2021 18:26:00 - INFO - __main__ - Step 29489: {'lr': 0.0004586366309688793, 'samples': 5661888, 'steps': 29488, 'loss/train': 0.0479944609105587} -08/30/2021 18:26:00 - INFO - __main__ - Step 29490: {'lr': 0.00045863370723755315, 'samples': 5662080, 'steps': 29489, 'loss/train': 0.6843440532684326} -08/30/2021 18:26:01 - INFO - __main__ - Step 29491: {'lr': 0.00045863078341221993, 'samples': 5662272, 'steps': 29490, 'loss/train': 1.3027055263519287} -08/30/2021 18:26:02 - INFO - __main__ - Step 29492: {'lr': 0.0004586278594928808, 'samples': 5662464, 'steps': 29491, 'loss/train': 0.09501402080059052} -08/30/2021 18:26:02 - INFO - __main__ - Step 29493: {'lr': 0.0004586249354795372, 'samples': 5662656, 'steps': 29492, 'loss/train': 1.4198743104934692} -08/30/2021 18:26:03 - INFO - __main__ - Step 29494: {'lr': 0.0004586220113721905, 'samples': 5662848, 'steps': 29493, 'loss/train': 1.2894880771636963} -08/30/2021 18:26:03 - INFO - __main__ - Step 29495: {'lr': 0.0004586190871708419, 'samples': 5663040, 'steps': 29494, 'loss/train': 1.7419530153274536} -08/30/2021 18:26:03 - INFO - __main__ - Step 29496: {'lr': 0.0004586161628754927, 'samples': 5663232, 'steps': 29495, 'loss/train': 1.8950157165527344} -08/30/2021 18:26:06 - INFO - __main__ - Step 29497: {'lr': 0.0004586132384861443, 'samples': 5663424, 'steps': 29496, 'loss/train': 0.32504117488861084} -08/30/2021 18:26:06 - INFO - __main__ - Step 29498: {'lr': 0.000458610314002798, 'samples': 5663616, 'steps': 29497, 'loss/train': 1.5534977912902832} -08/30/2021 18:26:07 - INFO - __main__ - Step 29499: {'lr': 0.0004586073894254551, 'samples': 5663808, 'steps': 29498, 'loss/train': 1.144694447517395} -08/30/2021 18:26:07 - INFO - __main__ - Step 29500: {'lr': 0.000458604464754117, 'samples': 5664000, 'steps': 29499, 'loss/train': 1.829520583152771} -08/30/2021 18:26:07 - INFO - __main__ - Step 29501: {'lr': 0.0004586015399887849, 'samples': 5664192, 'steps': 29500, 'loss/train': 0.6112343668937683} -08/30/2021 18:26:08 - INFO - __main__ - Step 29502: {'lr': 0.0004585986151294602, 'samples': 5664384, 'steps': 29501, 'loss/train': 0.5225926637649536} -08/30/2021 18:26:09 - INFO - __main__ - Step 29503: {'lr': 0.0004585956901761441, 'samples': 5664576, 'steps': 29502, 'loss/train': 0.5445204377174377} -08/30/2021 18:26:10 - INFO - __main__ - Step 29504: {'lr': 0.00045859276512883807, 'samples': 5664768, 'steps': 29503, 'loss/train': 1.7337385416030884} -08/30/2021 18:26:10 - INFO - __main__ - Step 29505: {'lr': 0.00045858983998754336, 'samples': 5664960, 'steps': 29504, 'loss/train': 1.2972288131713867} -08/30/2021 18:26:10 - INFO - __main__ - Step 29506: {'lr': 0.0004585869147522612, 'samples': 5665152, 'steps': 29505, 'loss/train': 1.3692007064819336} -08/30/2021 18:26:11 - INFO - __main__ - Step 29507: {'lr': 0.00045858398942299306, 'samples': 5665344, 'steps': 29506, 'loss/train': 2.033146858215332} -08/30/2021 18:26:12 - INFO - __main__ - Step 29508: {'lr': 0.0004585810639997402, 'samples': 5665536, 'steps': 29507, 'loss/train': 1.3620285987854004} -08/30/2021 18:26:13 - INFO - __main__ - Step 29509: {'lr': 0.0004585781384825039, 'samples': 5665728, 'steps': 29508, 'loss/train': 1.6803773641586304} -08/30/2021 18:26:13 - INFO - __main__ - Step 29510: {'lr': 0.00045857521287128556, 'samples': 5665920, 'steps': 29509, 'loss/train': 0.9989269971847534} -08/30/2021 18:26:13 - INFO - __main__ - Step 29511: {'lr': 0.0004585722871660864, 'samples': 5666112, 'steps': 29510, 'loss/train': 1.6287176609039307} -08/30/2021 18:26:14 - INFO - __main__ - Step 29512: {'lr': 0.0004585693613669078, 'samples': 5666304, 'steps': 29511, 'loss/train': 1.455241322517395} -08/30/2021 18:26:15 - INFO - __main__ - Step 29513: {'lr': 0.0004585664354737511, 'samples': 5666496, 'steps': 29512, 'loss/train': 1.7103053331375122} -08/30/2021 18:26:16 - INFO - __main__ - Step 29514: {'lr': 0.0004585635094866175, 'samples': 5666688, 'steps': 29513, 'loss/train': 1.5950748920440674} -08/30/2021 18:26:16 - INFO - __main__ - Step 29515: {'lr': 0.0004585605834055084, 'samples': 5666880, 'steps': 29514, 'loss/train': 0.6312817335128784} -08/30/2021 18:26:16 - INFO - __main__ - Step 29516: {'lr': 0.00045855765723042526, 'samples': 5667072, 'steps': 29515, 'loss/train': 1.4721404314041138} -08/30/2021 18:26:17 - INFO - __main__ - Step 29517: {'lr': 0.00045855473096136914, 'samples': 5667264, 'steps': 29516, 'loss/train': 1.3437658548355103} -08/30/2021 18:26:18 - INFO - __main__ - Step 29518: {'lr': 0.00045855180459834153, 'samples': 5667456, 'steps': 29517, 'loss/train': 1.1570112705230713} -08/30/2021 18:26:19 - INFO - __main__ - Step 29519: {'lr': 0.0004585488781413437, 'samples': 5667648, 'steps': 29518, 'loss/train': 1.4586642980575562} -08/30/2021 18:26:19 - INFO - __main__ - Step 29520: {'lr': 0.00045854595159037695, 'samples': 5667840, 'steps': 29519, 'loss/train': 1.6733678579330444} -08/30/2021 18:26:19 - INFO - __main__ - Step 29521: {'lr': 0.0004585430249454425, 'samples': 5668032, 'steps': 29520, 'loss/train': 1.654155969619751} -08/30/2021 18:26:20 - INFO - __main__ - Step 29522: {'lr': 0.000458540098206542, 'samples': 5668224, 'steps': 29521, 'loss/train': 1.9122824668884277} -08/30/2021 18:26:21 - INFO - __main__ - Step 29523: {'lr': 0.00045853717137367634, 'samples': 5668416, 'steps': 29522, 'loss/train': 1.2130546569824219} -08/30/2021 18:26:22 - INFO - __main__ - Step 29524: {'lr': 0.0004585342444468471, 'samples': 5668608, 'steps': 29523, 'loss/train': 1.0073513984680176} -08/30/2021 18:26:22 - INFO - __main__ - Step 29525: {'lr': 0.00045853131742605563, 'samples': 5668800, 'steps': 29524, 'loss/train': 1.2143741846084595} -08/30/2021 18:26:22 - INFO - __main__ - Step 29526: {'lr': 0.0004585283903113031, 'samples': 5668992, 'steps': 29525, 'loss/train': 1.5078721046447754} -08/30/2021 18:26:23 - INFO - __main__ - Step 29527: {'lr': 0.00045852546310259093, 'samples': 5669184, 'steps': 29526, 'loss/train': 1.5619242191314697} -08/30/2021 18:26:23 - INFO - __main__ - Step 29528: {'lr': 0.00045852253579992043, 'samples': 5669376, 'steps': 29527, 'loss/train': 1.0531502962112427} -08/30/2021 18:26:25 - INFO - __main__ - Step 29529: {'lr': 0.0004585196084032928, 'samples': 5669568, 'steps': 29528, 'loss/train': 1.3731187582015991} -08/30/2021 18:26:26 - INFO - __main__ - Step 29530: {'lr': 0.0004585166809127095, 'samples': 5669760, 'steps': 29529, 'loss/train': 1.3357107639312744} -08/30/2021 18:26:26 - INFO - __main__ - Step 29531: {'lr': 0.0004585137533281718, 'samples': 5669952, 'steps': 29530, 'loss/train': 0.8998951315879822} -08/30/2021 18:26:27 - INFO - __main__ - Step 29532: {'lr': 0.00045851082564968103, 'samples': 5670144, 'steps': 29531, 'loss/train': 1.4392424821853638} -08/30/2021 18:26:27 - INFO - __main__ - Step 29533: {'lr': 0.0004585078978772385, 'samples': 5670336, 'steps': 29532, 'loss/train': 1.5617882013320923} -08/30/2021 18:26:29 - INFO - __main__ - Step 29534: {'lr': 0.0004585049700108455, 'samples': 5670528, 'steps': 29533, 'loss/train': 1.0490193367004395} -08/30/2021 18:26:29 - INFO - __main__ - Step 29535: {'lr': 0.00045850204205050344, 'samples': 5670720, 'steps': 29534, 'loss/train': 1.2691662311553955} -08/30/2021 18:26:30 - INFO - __main__ - Step 29536: {'lr': 0.0004584991139962135, 'samples': 5670912, 'steps': 29535, 'loss/train': 1.3712712526321411} -08/30/2021 18:26:30 - INFO - __main__ - Step 29537: {'lr': 0.00045849618584797717, 'samples': 5671104, 'steps': 29536, 'loss/train': 1.5839011669158936} -08/30/2021 18:26:30 - INFO - __main__ - Step 29538: {'lr': 0.0004584932576057956, 'samples': 5671296, 'steps': 29537, 'loss/train': 0.07783497124910355} -08/30/2021 18:26:31 - INFO - __main__ - Step 29539: {'lr': 0.00045849032926967016, 'samples': 5671488, 'steps': 29538, 'loss/train': 0.04371124133467674} -08/30/2021 18:26:32 - INFO - __main__ - Step 29540: {'lr': 0.0004584874008396023, 'samples': 5671680, 'steps': 29539, 'loss/train': 1.6364810466766357} -08/30/2021 18:26:33 - INFO - __main__ - Step 29541: {'lr': 0.00045848447231559315, 'samples': 5671872, 'steps': 29540, 'loss/train': 1.350569248199463} -08/30/2021 18:26:33 - INFO - __main__ - Step 29542: {'lr': 0.00045848154369764415, 'samples': 5672064, 'steps': 29541, 'loss/train': 1.412458896636963} -08/30/2021 18:26:33 - INFO - __main__ - Step 29543: {'lr': 0.0004584786149857566, 'samples': 5672256, 'steps': 29542, 'loss/train': 1.7077301740646362} -08/30/2021 18:26:34 - INFO - __main__ - Step 29544: {'lr': 0.00045847568617993174, 'samples': 5672448, 'steps': 29543, 'loss/train': 1.4265661239624023} -08/30/2021 18:26:35 - INFO - __main__ - Step 29545: {'lr': 0.000458472757280171, 'samples': 5672640, 'steps': 29544, 'loss/train': 1.2461732625961304} -08/30/2021 18:26:36 - INFO - __main__ - Step 29546: {'lr': 0.0004584698282864757, 'samples': 5672832, 'steps': 29545, 'loss/train': 0.269072026014328} -08/30/2021 18:26:36 - INFO - __main__ - Step 29547: {'lr': 0.000458466899198847, 'samples': 5673024, 'steps': 29546, 'loss/train': 0.7153891324996948} -08/30/2021 18:26:36 - INFO - __main__ - Step 29548: {'lr': 0.0004584639700172863, 'samples': 5673216, 'steps': 29547, 'loss/train': 1.3654835224151611} -08/30/2021 18:26:37 - INFO - __main__ - Step 29549: {'lr': 0.00045846104074179504, 'samples': 5673408, 'steps': 29548, 'loss/train': 2.0023417472839355} -08/30/2021 18:26:37 - INFO - __main__ - Step 29550: {'lr': 0.00045845811137237445, 'samples': 5673600, 'steps': 29549, 'loss/train': 1.5485824346542358} -08/30/2021 18:26:39 - INFO - __main__ - Step 29551: {'lr': 0.0004584551819090259, 'samples': 5673792, 'steps': 29550, 'loss/train': 0.6402052640914917} -08/30/2021 18:26:39 - INFO - __main__ - Step 29552: {'lr': 0.0004584522523517506, 'samples': 5673984, 'steps': 29551, 'loss/train': 1.4533443450927734} -08/30/2021 18:26:40 - INFO - __main__ - Step 29553: {'lr': 0.00045844932270054997, 'samples': 5674176, 'steps': 29552, 'loss/train': 1.2149449586868286} -08/30/2021 18:26:40 - INFO - __main__ - Step 29554: {'lr': 0.00045844639295542525, 'samples': 5674368, 'steps': 29553, 'loss/train': 0.05344089865684509} -08/30/2021 18:26:40 - INFO - __main__ - Step 29555: {'lr': 0.0004584434631163779, 'samples': 5674560, 'steps': 29554, 'loss/train': 3.456982135772705} -08/30/2021 18:26:41 - INFO - __main__ - Step 29556: {'lr': 0.000458440533183409, 'samples': 5674752, 'steps': 29555, 'loss/train': 2.0972509384155273} -08/30/2021 18:26:42 - INFO - __main__ - Step 29557: {'lr': 0.0004584376031565201, 'samples': 5674944, 'steps': 29556, 'loss/train': 1.2078018188476562} -08/30/2021 18:26:43 - INFO - __main__ - Step 29558: {'lr': 0.0004584346730357124, 'samples': 5675136, 'steps': 29557, 'loss/train': 1.2920725345611572} -08/30/2021 18:26:43 - INFO - __main__ - Step 29559: {'lr': 0.0004584317428209872, 'samples': 5675328, 'steps': 29558, 'loss/train': 0.9063498377799988} -08/30/2021 18:26:43 - INFO - __main__ - Step 29560: {'lr': 0.0004584288125123459, 'samples': 5675520, 'steps': 29559, 'loss/train': 0.9930772185325623} -08/30/2021 18:26:44 - INFO - __main__ - Step 29561: {'lr': 0.0004584258821097899, 'samples': 5675712, 'steps': 29560, 'loss/train': 1.6734131574630737} -08/30/2021 18:26:45 - INFO - __main__ - Step 29562: {'lr': 0.0004584229516133203, 'samples': 5675904, 'steps': 29561, 'loss/train': 1.4462260007858276} -08/30/2021 18:26:46 - INFO - __main__ - Step 29563: {'lr': 0.00045842002102293856, 'samples': 5676096, 'steps': 29562, 'loss/train': 1.4785751104354858} -08/30/2021 18:26:46 - INFO - __main__ - Step 29564: {'lr': 0.000458417090338646, 'samples': 5676288, 'steps': 29563, 'loss/train': 2.1335296630859375} -08/30/2021 18:26:46 - INFO - __main__ - Step 29565: {'lr': 0.00045841415956044394, 'samples': 5676480, 'steps': 29564, 'loss/train': 1.2591972351074219} -08/30/2021 18:26:47 - INFO - __main__ - Step 29566: {'lr': 0.0004584112286883336, 'samples': 5676672, 'steps': 29565, 'loss/train': 0.08477567136287689} -08/30/2021 18:26:48 - INFO - __main__ - Step 29567: {'lr': 0.0004584082977223164, 'samples': 5676864, 'steps': 29566, 'loss/train': 1.3854612112045288} -08/30/2021 18:26:48 - INFO - __main__ - Step 29568: {'lr': 0.0004584053666623937, 'samples': 5677056, 'steps': 29567, 'loss/train': 1.5562198162078857} -08/30/2021 18:26:49 - INFO - __main__ - Step 29569: {'lr': 0.00045840243550856666, 'samples': 5677248, 'steps': 29568, 'loss/train': 1.6854863166809082} -08/30/2021 18:26:49 - INFO - __main__ - Step 29570: {'lr': 0.00045839950426083677, 'samples': 5677440, 'steps': 29569, 'loss/train': 1.2686117887496948} -08/30/2021 18:26:50 - INFO - __main__ - Step 29571: {'lr': 0.0004583965729192052, 'samples': 5677632, 'steps': 29570, 'loss/train': 1.0729773044586182} -08/30/2021 18:26:51 - INFO - __main__ - Step 29572: {'lr': 0.00045839364148367345, 'samples': 5677824, 'steps': 29571, 'loss/train': 1.7262150049209595} -08/30/2021 18:26:52 - INFO - __main__ - Step 29573: {'lr': 0.00045839070995424273, 'samples': 5678016, 'steps': 29572, 'loss/train': 1.5303738117218018} -08/30/2021 18:26:52 - INFO - __main__ - Step 29574: {'lr': 0.00045838777833091425, 'samples': 5678208, 'steps': 29573, 'loss/train': 1.3324564695358276} -08/30/2021 18:26:53 - INFO - __main__ - Step 29575: {'lr': 0.00045838484661368963, 'samples': 5678400, 'steps': 29574, 'loss/train': 1.9263807535171509} -08/30/2021 18:26:53 - INFO - __main__ - Step 29576: {'lr': 0.00045838191480256985, 'samples': 5678592, 'steps': 29575, 'loss/train': 0.2690824866294861} -08/30/2021 18:26:53 - INFO - __main__ - Step 29577: {'lr': 0.00045837898289755654, 'samples': 5678784, 'steps': 29576, 'loss/train': 0.047330599278211594} -08/30/2021 18:26:55 - INFO - __main__ - Step 29578: {'lr': 0.0004583760508986508, 'samples': 5678976, 'steps': 29577, 'loss/train': 1.3086485862731934} -08/30/2021 18:26:55 - INFO - __main__ - Step 29579: {'lr': 0.000458373118805854, 'samples': 5679168, 'steps': 29578, 'loss/train': 1.364263653755188} -08/30/2021 18:26:56 - INFO - __main__ - Step 29580: {'lr': 0.00045837018661916754, 'samples': 5679360, 'steps': 29579, 'loss/train': 1.464563250541687} -08/30/2021 18:26:56 - INFO - __main__ - Step 29581: {'lr': 0.00045836725433859266, 'samples': 5679552, 'steps': 29580, 'loss/train': 1.7931222915649414} -08/30/2021 18:26:56 - INFO - __main__ - Step 29582: {'lr': 0.0004583643219641307, 'samples': 5679744, 'steps': 29581, 'loss/train': 1.1459400653839111} -08/30/2021 18:26:59 - INFO - __main__ - Step 29583: {'lr': 0.00045836138949578297, 'samples': 5679936, 'steps': 29582, 'loss/train': 1.4620206356048584} -08/30/2021 18:26:59 - INFO - __main__ - Step 29584: {'lr': 0.00045835845693355096, 'samples': 5680128, 'steps': 29583, 'loss/train': 1.4040746688842773} -08/30/2021 18:26:59 - INFO - __main__ - Step 29585: {'lr': 0.00045835552427743567, 'samples': 5680320, 'steps': 29584, 'loss/train': 1.2760283946990967} -08/30/2021 18:27:00 - INFO - __main__ - Step 29586: {'lr': 0.00045835259152743866, 'samples': 5680512, 'steps': 29585, 'loss/train': 1.6704434156417847} -08/30/2021 18:27:00 - INFO - __main__ - Step 29587: {'lr': 0.0004583496586835612, 'samples': 5680704, 'steps': 29586, 'loss/train': 0.11828450858592987} -08/30/2021 18:27:01 - INFO - __main__ - Step 29588: {'lr': 0.0004583467257458046, 'samples': 5680896, 'steps': 29587, 'loss/train': 1.6639827489852905} -08/30/2021 18:27:02 - INFO - __main__ - Step 29589: {'lr': 0.00045834379271417013, 'samples': 5681088, 'steps': 29588, 'loss/train': 1.6343023777008057} -08/30/2021 18:27:02 - INFO - __main__ - Step 29590: {'lr': 0.0004583408595886592, 'samples': 5681280, 'steps': 29589, 'loss/train': 1.898882508277893} -08/30/2021 18:27:03 - INFO - __main__ - Step 29591: {'lr': 0.0004583379263692732, 'samples': 5681472, 'steps': 29590, 'loss/train': 2.0787954330444336} -08/30/2021 18:27:03 - INFO - __main__ - Step 29592: {'lr': 0.0004583349930560132, 'samples': 5681664, 'steps': 29591, 'loss/train': 2.2682175636291504} -08/30/2021 18:27:06 - INFO - __main__ - Step 29593: {'lr': 0.0004583320596488807, 'samples': 5681856, 'steps': 29592, 'loss/train': 1.465067982673645} -08/30/2021 18:27:06 - INFO - __main__ - Step 29594: {'lr': 0.000458329126147877, 'samples': 5682048, 'steps': 29593, 'loss/train': 1.508357048034668} -08/30/2021 18:27:06 - INFO - __main__ - Step 29595: {'lr': 0.00045832619255300344, 'samples': 5682240, 'steps': 29594, 'loss/train': 1.2611652612686157} -08/30/2021 18:27:07 - INFO - __main__ - Step 29596: {'lr': 0.00045832325886426125, 'samples': 5682432, 'steps': 29595, 'loss/train': 1.4101680517196655} -08/30/2021 18:27:07 - INFO - __main__ - Step 29597: {'lr': 0.0004583203250816518, 'samples': 5682624, 'steps': 29596, 'loss/train': 0.9930189847946167} -08/30/2021 18:27:07 - INFO - __main__ - Step 29598: {'lr': 0.0004583173912051765, 'samples': 5682816, 'steps': 29597, 'loss/train': 0.9272570610046387} -08/30/2021 18:27:08 - INFO - __main__ - Step 29599: {'lr': 0.00045831445723483656, 'samples': 5683008, 'steps': 29598, 'loss/train': 0.8228551745414734} -08/30/2021 18:27:08 - INFO - __main__ - Step 29600: {'lr': 0.0004583115231706334, 'samples': 5683200, 'steps': 29599, 'loss/train': 0.8430296182632446} -08/30/2021 18:27:10 - INFO - __main__ - Step 29601: {'lr': 0.0004583085890125682, 'samples': 5683392, 'steps': 29600, 'loss/train': 0.9320297241210938} -08/30/2021 18:27:10 - INFO - __main__ - Step 29602: {'lr': 0.0004583056547606424, 'samples': 5683584, 'steps': 29601, 'loss/train': 1.4654074907302856} -08/30/2021 18:27:10 - INFO - __main__ - Step 29603: {'lr': 0.0004583027204148573, 'samples': 5683776, 'steps': 29602, 'loss/train': 1.8659985065460205} -08/30/2021 18:27:11 - INFO - __main__ - Step 29604: {'lr': 0.0004582997859752142, 'samples': 5683968, 'steps': 29603, 'loss/train': 1.5351128578186035} -08/30/2021 18:27:11 - INFO - __main__ - Step 29605: {'lr': 0.0004582968514417144, 'samples': 5684160, 'steps': 29604, 'loss/train': 1.4761664867401123} -08/30/2021 18:27:14 - INFO - __main__ - Step 29606: {'lr': 0.00045829391681435926, 'samples': 5684352, 'steps': 29605, 'loss/train': 1.10630464553833} -08/30/2021 18:27:14 - INFO - __main__ - Step 29607: {'lr': 0.0004582909820931501, 'samples': 5684544, 'steps': 29606, 'loss/train': 1.7708563804626465} -08/30/2021 18:27:15 - INFO - __main__ - Step 29608: {'lr': 0.00045828804727808824, 'samples': 5684736, 'steps': 29607, 'loss/train': 1.4790401458740234} -08/30/2021 18:27:15 - INFO - __main__ - Step 29609: {'lr': 0.000458285112369175, 'samples': 5684928, 'steps': 29608, 'loss/train': 1.481463074684143} -08/30/2021 18:27:15 - INFO - __main__ - Step 29610: {'lr': 0.0004582821773664118, 'samples': 5685120, 'steps': 29609, 'loss/train': 1.332221269607544} -08/30/2021 18:27:16 - INFO - __main__ - Step 29611: {'lr': 0.0004582792422697997, 'samples': 5685312, 'steps': 29610, 'loss/train': 1.6628471612930298} -08/30/2021 18:27:16 - INFO - __main__ - Step 29612: {'lr': 0.0004582763070793403, 'samples': 5685504, 'steps': 29611, 'loss/train': 2.3646347522735596} -08/30/2021 18:27:18 - INFO - __main__ - Step 29613: {'lr': 0.0004582733717950347, 'samples': 5685696, 'steps': 29612, 'loss/train': 5.348879337310791} -08/30/2021 18:27:18 - INFO - __main__ - Step 29614: {'lr': 0.00045827043641688444, 'samples': 5685888, 'steps': 29613, 'loss/train': 2.010775327682495} -08/30/2021 18:27:18 - INFO - __main__ - Step 29615: {'lr': 0.00045826750094489065, 'samples': 5686080, 'steps': 29614, 'loss/train': 1.7838435173034668} -08/30/2021 18:27:19 - INFO - __main__ - Step 29616: {'lr': 0.00045826456537905483, 'samples': 5686272, 'steps': 29615, 'loss/train': 1.4085440635681152} -08/30/2021 18:27:19 - INFO - __main__ - Step 29617: {'lr': 0.0004582616297193781, 'samples': 5686464, 'steps': 29616, 'loss/train': 1.5924851894378662} -08/30/2021 18:27:19 - INFO - __main__ - Step 29618: {'lr': 0.000458258693965862, 'samples': 5686656, 'steps': 29617, 'loss/train': 1.6739227771759033} -08/30/2021 18:27:21 - INFO - __main__ - Step 29619: {'lr': 0.0004582557581185077, 'samples': 5686848, 'steps': 29618, 'loss/train': 1.4708425998687744} -08/30/2021 18:27:21 - INFO - __main__ - Step 29620: {'lr': 0.00045825282217731655, 'samples': 5687040, 'steps': 29619, 'loss/train': 1.946986436843872} -08/30/2021 18:27:22 - INFO - __main__ - Step 29621: {'lr': 0.00045824988614228995, 'samples': 5687232, 'steps': 29620, 'loss/train': 2.37992262840271} -08/30/2021 18:27:22 - INFO - __main__ - Step 29622: {'lr': 0.0004582469500134292, 'samples': 5687424, 'steps': 29621, 'loss/train': 1.5118401050567627} -08/30/2021 18:27:22 - INFO - __main__ - Step 29623: {'lr': 0.00045824401379073544, 'samples': 5687616, 'steps': 29622, 'loss/train': 1.385564923286438} -08/30/2021 18:27:24 - INFO - __main__ - Step 29624: {'lr': 0.0004582410774742103, 'samples': 5687808, 'steps': 29623, 'loss/train': 1.0063823461532593} -08/30/2021 18:27:25 - INFO - __main__ - Step 29625: {'lr': 0.00045823814106385485, 'samples': 5688000, 'steps': 29624, 'loss/train': 1.956981897354126} -08/30/2021 18:27:25 - INFO - __main__ - Step 29626: {'lr': 0.0004582352045596705, 'samples': 5688192, 'steps': 29625, 'loss/train': 1.6747437715530396} -08/30/2021 18:27:26 - INFO - __main__ - Step 29627: {'lr': 0.0004582322679616586, 'samples': 5688384, 'steps': 29626, 'loss/train': 1.8953553438186646} -08/30/2021 18:27:26 - INFO - __main__ - Step 29628: {'lr': 0.0004582293312698205, 'samples': 5688576, 'steps': 29627, 'loss/train': 1.556592583656311} -08/30/2021 18:27:26 - INFO - __main__ - Step 29629: {'lr': 0.00045822639448415736, 'samples': 5688768, 'steps': 29628, 'loss/train': 2.9476187229156494} -08/30/2021 18:27:28 - INFO - __main__ - Step 29630: {'lr': 0.0004582234576046707, 'samples': 5688960, 'steps': 29629, 'loss/train': 0.1175139769911766} -08/30/2021 18:27:28 - INFO - __main__ - Step 29631: {'lr': 0.00045822052063136177, 'samples': 5689152, 'steps': 29630, 'loss/train': 1.4863507747650146} -08/30/2021 18:27:29 - INFO - __main__ - Step 29632: {'lr': 0.0004582175835642319, 'samples': 5689344, 'steps': 29631, 'loss/train': 1.4567972421646118} -08/30/2021 18:27:29 - INFO - __main__ - Step 29633: {'lr': 0.0004582146464032824, 'samples': 5689536, 'steps': 29632, 'loss/train': 2.4604380130767822} -08/30/2021 18:27:29 - INFO - __main__ - Step 29634: {'lr': 0.0004582117091485145, 'samples': 5689728, 'steps': 29633, 'loss/train': 1.3318003416061401} -08/30/2021 18:27:31 - INFO - __main__ - Step 29635: {'lr': 0.0004582087717999297, 'samples': 5689920, 'steps': 29634, 'loss/train': 1.550450325012207} -08/30/2021 18:27:31 - INFO - __main__ - Step 29636: {'lr': 0.0004582058343575292, 'samples': 5690112, 'steps': 29635, 'loss/train': 1.9619405269622803} -08/30/2021 18:27:32 - INFO - __main__ - Step 29637: {'lr': 0.00045820289682131437, 'samples': 5690304, 'steps': 29636, 'loss/train': 1.9311447143554688} -08/30/2021 18:27:32 - INFO - __main__ - Step 29638: {'lr': 0.0004581999591912865, 'samples': 5690496, 'steps': 29637, 'loss/train': 1.916884183883667} -08/30/2021 18:27:32 - INFO - __main__ - Step 29639: {'lr': 0.000458197021467447, 'samples': 5690688, 'steps': 29638, 'loss/train': 1.9588192701339722} -08/30/2021 18:27:34 - INFO - __main__ - Step 29640: {'lr': 0.00045819408364979714, 'samples': 5690880, 'steps': 29639, 'loss/train': 1.8672581911087036} -08/30/2021 18:27:34 - INFO - __main__ - Step 29641: {'lr': 0.0004581911457383382, 'samples': 5691072, 'steps': 29640, 'loss/train': 1.2657244205474854} -08/30/2021 18:27:35 - INFO - __main__ - Step 29642: {'lr': 0.0004581882077330716, 'samples': 5691264, 'steps': 29641, 'loss/train': 2.0068185329437256} -08/30/2021 18:27:35 - INFO - __main__ - Step 29643: {'lr': 0.0004581852696339985, 'samples': 5691456, 'steps': 29642, 'loss/train': 1.3693592548370361} -08/30/2021 18:27:35 - INFO - __main__ - Step 29644: {'lr': 0.00045818233144112044, 'samples': 5691648, 'steps': 29643, 'loss/train': 1.9072682857513428} -08/30/2021 18:27:37 - INFO - __main__ - Step 29645: {'lr': 0.00045817939315443855, 'samples': 5691840, 'steps': 29644, 'loss/train': 1.1360223293304443} -08/30/2021 18:27:38 - INFO - __main__ - Step 29646: {'lr': 0.0004581764547739543, 'samples': 5692032, 'steps': 29645, 'loss/train': 1.7882003784179688} -08/30/2021 18:27:38 - INFO - __main__ - Step 29647: {'lr': 0.00045817351629966896, 'samples': 5692224, 'steps': 29646, 'loss/train': 2.02164626121521} -08/30/2021 18:27:38 - INFO - __main__ - Step 29648: {'lr': 0.00045817057773158375, 'samples': 5692416, 'steps': 29647, 'loss/train': 1.7786821126937866} -08/30/2021 18:27:39 - INFO - __main__ - Step 29649: {'lr': 0.0004581676390697002, 'samples': 5692608, 'steps': 29648, 'loss/train': 1.0712475776672363} -08/30/2021 18:27:40 - INFO - __main__ - Step 29650: {'lr': 0.00045816470031401945, 'samples': 5692800, 'steps': 29649, 'loss/train': 0.9194968938827515} -08/30/2021 18:27:41 - INFO - __main__ - Step 29651: {'lr': 0.00045816176146454296, 'samples': 5692992, 'steps': 29650, 'loss/train': 1.670853614807129} -08/30/2021 18:27:41 - INFO - __main__ - Step 29652: {'lr': 0.00045815882252127197, 'samples': 5693184, 'steps': 29651, 'loss/train': 0.986540675163269} -08/30/2021 18:27:41 - INFO - __main__ - Step 29653: {'lr': 0.0004581558834842078, 'samples': 5693376, 'steps': 29652, 'loss/train': 1.2599154710769653} -08/30/2021 18:27:42 - INFO - __main__ - Step 29654: {'lr': 0.00045815294435335184, 'samples': 5693568, 'steps': 29653, 'loss/train': 1.7173832654953003} -08/30/2021 18:27:43 - INFO - __main__ - Step 29655: {'lr': 0.0004581500051287053, 'samples': 5693760, 'steps': 29654, 'loss/train': 1.1453946828842163} -08/30/2021 18:27:44 - INFO - __main__ - Step 29656: {'lr': 0.00045814706581026967, 'samples': 5693952, 'steps': 29655, 'loss/train': 1.1144442558288574} -08/30/2021 18:27:44 - INFO - __main__ - Step 29657: {'lr': 0.0004581441263980461, 'samples': 5694144, 'steps': 29656, 'loss/train': 0.86360764503479} -08/30/2021 18:27:44 - INFO - __main__ - Step 29658: {'lr': 0.0004581411868920361, 'samples': 5694336, 'steps': 29657, 'loss/train': 1.7170466184616089} -08/30/2021 18:27:45 - INFO - __main__ - Step 29659: {'lr': 0.00045813824729224085, 'samples': 5694528, 'steps': 29658, 'loss/train': 1.596787452697754} -08/30/2021 18:27:45 - INFO - __main__ - Step 29660: {'lr': 0.0004581353075986617, 'samples': 5694720, 'steps': 29659, 'loss/train': 1.4135023355484009} -08/30/2021 18:27:47 - INFO - __main__ - Step 29661: {'lr': 0.00045813236781129996, 'samples': 5694912, 'steps': 29660, 'loss/train': 1.6739174127578735} -08/30/2021 18:27:47 - INFO - __main__ - Step 29662: {'lr': 0.00045812942793015707, 'samples': 5695104, 'steps': 29661, 'loss/train': 1.202912449836731} -08/30/2021 18:27:47 - INFO - __main__ - Step 29663: {'lr': 0.0004581264879552342, 'samples': 5695296, 'steps': 29662, 'loss/train': 0.19049958884716034} -08/30/2021 18:27:48 - INFO - __main__ - Step 29664: {'lr': 0.00045812354788653275, 'samples': 5695488, 'steps': 29663, 'loss/train': 1.0727471113204956} -08/30/2021 18:27:48 - INFO - __main__ - Step 29665: {'lr': 0.00045812060772405403, 'samples': 5695680, 'steps': 29664, 'loss/train': 1.5303667783737183} -08/30/2021 18:27:50 - INFO - __main__ - Step 29666: {'lr': 0.0004581176674677995, 'samples': 5695872, 'steps': 29665, 'loss/train': 1.313496708869934} -08/30/2021 18:27:50 - INFO - __main__ - Step 29667: {'lr': 0.00045811472711777026, 'samples': 5696064, 'steps': 29666, 'loss/train': 1.6279692649841309} -08/30/2021 18:27:50 - INFO - __main__ - Step 29668: {'lr': 0.0004581117866739677, 'samples': 5696256, 'steps': 29667, 'loss/train': 1.3790535926818848} -08/30/2021 18:27:51 - INFO - __main__ - Step 29669: {'lr': 0.00045810884613639325, 'samples': 5696448, 'steps': 29668, 'loss/train': 1.1239794492721558} -08/30/2021 18:27:51 - INFO - __main__ - Step 29670: {'lr': 0.00045810590550504816, 'samples': 5696640, 'steps': 29669, 'loss/train': 1.9284592866897583} -08/30/2021 18:27:53 - INFO - __main__ - Step 29671: {'lr': 0.0004581029647799337, 'samples': 5696832, 'steps': 29670, 'loss/train': 1.4202970266342163} -08/30/2021 18:27:53 - INFO - __main__ - Step 29672: {'lr': 0.0004581000239610513, 'samples': 5697024, 'steps': 29671, 'loss/train': 1.2471117973327637} -08/30/2021 18:27:53 - INFO - __main__ - Step 29673: {'lr': 0.0004580970830484023, 'samples': 5697216, 'steps': 29672, 'loss/train': 1.6633930206298828} -08/30/2021 18:27:54 - INFO - __main__ - Step 29674: {'lr': 0.00045809414204198785, 'samples': 5697408, 'steps': 29673, 'loss/train': 1.426016926765442} -08/30/2021 18:27:54 - INFO - __main__ - Step 29675: {'lr': 0.00045809120094180946, 'samples': 5697600, 'steps': 29674, 'loss/train': 1.453947901725769} -08/30/2021 18:27:56 - INFO - __main__ - Step 29676: {'lr': 0.00045808825974786834, 'samples': 5697792, 'steps': 29675, 'loss/train': 1.6104342937469482} -08/30/2021 18:27:56 - INFO - __main__ - Step 29677: {'lr': 0.0004580853184601659, 'samples': 5697984, 'steps': 29676, 'loss/train': 1.46486234664917} -08/30/2021 18:27:57 - INFO - __main__ - Step 29678: {'lr': 0.0004580823770787034, 'samples': 5698176, 'steps': 29677, 'loss/train': 1.7360520362854004} -08/30/2021 18:27:57 - INFO - __main__ - Step 29679: {'lr': 0.0004580794356034822, 'samples': 5698368, 'steps': 29678, 'loss/train': 1.6491705179214478} -08/30/2021 18:27:57 - INFO - __main__ - Step 29680: {'lr': 0.0004580764940345036, 'samples': 5698560, 'steps': 29679, 'loss/train': 1.6530210971832275} -08/30/2021 18:27:59 - INFO - __main__ - Step 29681: {'lr': 0.00045807355237176896, 'samples': 5698752, 'steps': 29680, 'loss/train': 1.5946695804595947} -08/30/2021 18:27:59 - INFO - __main__ - Step 29682: {'lr': 0.0004580706106152796, 'samples': 5698944, 'steps': 29681, 'loss/train': 1.322835922241211} -08/30/2021 18:28:00 - INFO - __main__ - Step 29683: {'lr': 0.00045806766876503683, 'samples': 5699136, 'steps': 29682, 'loss/train': 2.5335166454315186} -08/30/2021 18:28:00 - INFO - __main__ - Step 29684: {'lr': 0.000458064726821042, 'samples': 5699328, 'steps': 29683, 'loss/train': 1.5357316732406616} -08/30/2021 18:28:00 - INFO - __main__ - Step 29685: {'lr': 0.0004580617847832964, 'samples': 5699520, 'steps': 29684, 'loss/train': 1.5088759660720825} -08/30/2021 18:28:02 - INFO - __main__ - Step 29686: {'lr': 0.0004580588426518013, 'samples': 5699712, 'steps': 29685, 'loss/train': 1.354177474975586} -08/30/2021 18:28:02 - INFO - __main__ - Step 29687: {'lr': 0.0004580559004265582, 'samples': 5699904, 'steps': 29686, 'loss/train': 1.7243818044662476} -08/30/2021 18:28:03 - INFO - __main__ - Step 29688: {'lr': 0.0004580529581075683, 'samples': 5700096, 'steps': 29687, 'loss/train': 1.3967630863189697} -08/30/2021 18:28:03 - INFO - __main__ - Step 29689: {'lr': 0.0004580500156948329, 'samples': 5700288, 'steps': 29688, 'loss/train': 1.497321367263794} -08/30/2021 18:28:03 - INFO - __main__ - Step 29690: {'lr': 0.0004580470731883534, 'samples': 5700480, 'steps': 29689, 'loss/train': 1.810050129890442} -08/30/2021 18:28:04 - INFO - __main__ - Step 29691: {'lr': 0.0004580441305881311, 'samples': 5700672, 'steps': 29690, 'loss/train': 0.927593469619751} -08/30/2021 18:28:05 - INFO - __main__ - Step 29692: {'lr': 0.0004580411878941673, 'samples': 5700864, 'steps': 29691, 'loss/train': 2.807532548904419} -08/30/2021 18:28:06 - INFO - __main__ - Step 29693: {'lr': 0.0004580382451064634, 'samples': 5701056, 'steps': 29692, 'loss/train': 1.5563640594482422} -08/30/2021 18:28:06 - INFO - __main__ - Step 29694: {'lr': 0.00045803530222502065, 'samples': 5701248, 'steps': 29693, 'loss/train': 1.595654010772705} -08/30/2021 18:28:07 - INFO - __main__ - Step 29695: {'lr': 0.0004580323592498404, 'samples': 5701440, 'steps': 29694, 'loss/train': 1.2515085935592651} -08/30/2021 18:28:07 - INFO - __main__ - Step 29696: {'lr': 0.00045802941618092397, 'samples': 5701632, 'steps': 29695, 'loss/train': 0.2638806700706482} -08/30/2021 18:28:09 - INFO - __main__ - Step 29697: {'lr': 0.0004580264730182727, 'samples': 5701824, 'steps': 29696, 'loss/train': 1.4753319025039673} -08/30/2021 18:28:10 - INFO - __main__ - Step 29698: {'lr': 0.000458023529761888, 'samples': 5702016, 'steps': 29697, 'loss/train': 1.6588515043258667} -08/30/2021 18:28:10 - INFO - __main__ - Step 29699: {'lr': 0.00045802058641177104, 'samples': 5702208, 'steps': 29698, 'loss/train': 1.7861418724060059} -08/30/2021 18:28:10 - INFO - __main__ - Step 29700: {'lr': 0.00045801764296792317, 'samples': 5702400, 'steps': 29699, 'loss/train': 1.6370424032211304} -08/30/2021 18:28:11 - INFO - __main__ - Step 29701: {'lr': 0.0004580146994303458, 'samples': 5702592, 'steps': 29700, 'loss/train': 1.1859413385391235} -08/30/2021 18:28:12 - INFO - __main__ - Step 29702: {'lr': 0.0004580117557990402, 'samples': 5702784, 'steps': 29701, 'loss/train': 1.4897328615188599} -08/30/2021 18:28:13 - INFO - __main__ - Step 29703: {'lr': 0.0004580088120740077, 'samples': 5702976, 'steps': 29702, 'loss/train': 1.4795736074447632} -08/30/2021 18:28:13 - INFO - __main__ - Step 29704: {'lr': 0.0004580058682552497, 'samples': 5703168, 'steps': 29703, 'loss/train': 2.0447490215301514} -08/30/2021 18:28:13 - INFO - __main__ - Step 29705: {'lr': 0.00045800292434276736, 'samples': 5703360, 'steps': 29704, 'loss/train': 1.5913904905319214} -08/30/2021 18:28:14 - INFO - __main__ - Step 29706: {'lr': 0.0004579999803365622, 'samples': 5703552, 'steps': 29705, 'loss/train': 1.6796106100082397} -08/30/2021 18:28:15 - INFO - __main__ - Step 29707: {'lr': 0.00045799703623663546, 'samples': 5703744, 'steps': 29706, 'loss/train': 1.5506706237792969} -08/30/2021 18:28:16 - INFO - __main__ - Step 29708: {'lr': 0.00045799409204298844, 'samples': 5703936, 'steps': 29707, 'loss/train': 1.0952070951461792} -08/30/2021 18:28:16 - INFO - __main__ - Step 29709: {'lr': 0.00045799114775562245, 'samples': 5704128, 'steps': 29708, 'loss/train': 1.8405007123947144} -08/30/2021 18:28:16 - INFO - __main__ - Step 29710: {'lr': 0.00045798820337453894, 'samples': 5704320, 'steps': 29709, 'loss/train': 1.6173516511917114} -08/30/2021 18:28:17 - INFO - __main__ - Step 29711: {'lr': 0.00045798525889973905, 'samples': 5704512, 'steps': 29710, 'loss/train': 1.2189722061157227} -08/30/2021 18:28:18 - INFO - __main__ - Step 29712: {'lr': 0.00045798231433122436, 'samples': 5704704, 'steps': 29711, 'loss/train': 1.2220425605773926} -08/30/2021 18:28:19 - INFO - __main__ - Step 29713: {'lr': 0.00045797936966899595, 'samples': 5704896, 'steps': 29712, 'loss/train': 1.3528696298599243} -08/30/2021 18:28:19 - INFO - __main__ - Step 29714: {'lr': 0.00045797642491305523, 'samples': 5705088, 'steps': 29713, 'loss/train': 1.8279149532318115} -08/30/2021 18:28:19 - INFO - __main__ - Step 29715: {'lr': 0.0004579734800634036, 'samples': 5705280, 'steps': 29714, 'loss/train': 1.3975285291671753} -08/30/2021 18:28:20 - INFO - __main__ - Step 29716: {'lr': 0.0004579705351200423, 'samples': 5705472, 'steps': 29715, 'loss/train': 1.6372387409210205} -08/30/2021 18:28:21 - INFO - __main__ - Step 29717: {'lr': 0.0004579675900829727, 'samples': 5705664, 'steps': 29716, 'loss/train': 1.507022738456726} -08/30/2021 18:28:22 - INFO - __main__ - Step 29718: {'lr': 0.00045796464495219614, 'samples': 5705856, 'steps': 29717, 'loss/train': 1.4987457990646362} -08/30/2021 18:28:22 - INFO - __main__ - Step 29719: {'lr': 0.00045796169972771387, 'samples': 5706048, 'steps': 29718, 'loss/train': 1.08888840675354} -08/30/2021 18:28:23 - INFO - __main__ - Step 29720: {'lr': 0.00045795875440952726, 'samples': 5706240, 'steps': 29719, 'loss/train': 1.1902862787246704} -08/30/2021 18:28:23 - INFO - __main__ - Step 29721: {'lr': 0.00045795580899763767, 'samples': 5706432, 'steps': 29720, 'loss/train': 1.6228948831558228} -08/30/2021 18:28:23 - INFO - __main__ - Step 29722: {'lr': 0.00045795286349204633, 'samples': 5706624, 'steps': 29721, 'loss/train': 1.4023505449295044} -08/30/2021 18:28:25 - INFO - __main__ - Step 29723: {'lr': 0.0004579499178927547, 'samples': 5706816, 'steps': 29722, 'loss/train': 1.3119184970855713} -08/30/2021 18:28:25 - INFO - __main__ - Step 29724: {'lr': 0.0004579469721997641, 'samples': 5707008, 'steps': 29723, 'loss/train': 1.5725725889205933} -08/30/2021 18:28:26 - INFO - __main__ - Step 29725: {'lr': 0.0004579440264130758, 'samples': 5707200, 'steps': 29724, 'loss/train': 1.6831140518188477} -08/30/2021 18:28:26 - INFO - __main__ - Step 29726: {'lr': 0.000457941080532691, 'samples': 5707392, 'steps': 29725, 'loss/train': 1.8906539678573608} -08/30/2021 18:28:26 - INFO - __main__ - Step 29727: {'lr': 0.0004579381345586113, 'samples': 5707584, 'steps': 29726, 'loss/train': 1.6148093938827515} -08/30/2021 18:28:28 - INFO - __main__ - Step 29728: {'lr': 0.0004579351884908378, 'samples': 5707776, 'steps': 29727, 'loss/train': 1.54594886302948} -08/30/2021 18:28:28 - INFO - __main__ - Step 29729: {'lr': 0.00045793224232937193, 'samples': 5707968, 'steps': 29728, 'loss/train': 1.3913178443908691} -08/30/2021 18:28:29 - INFO - __main__ - Step 29730: {'lr': 0.0004579292960742151, 'samples': 5708160, 'steps': 29729, 'loss/train': 1.354109764099121} -08/30/2021 18:28:29 - INFO - __main__ - Step 29731: {'lr': 0.0004579263497253684, 'samples': 5708352, 'steps': 29730, 'loss/train': 2.0978946685791016} -08/30/2021 18:28:29 - INFO - __main__ - Step 29732: {'lr': 0.00045792340328283334, 'samples': 5708544, 'steps': 29731, 'loss/train': 1.5430909395217896} -08/30/2021 18:28:31 - INFO - __main__ - Step 29733: {'lr': 0.0004579204567466112, 'samples': 5708736, 'steps': 29732, 'loss/train': 1.5453301668167114} -08/30/2021 18:28:31 - INFO - __main__ - Step 29734: {'lr': 0.0004579175101167033, 'samples': 5708928, 'steps': 29733, 'loss/train': 1.5608700513839722} -08/30/2021 18:28:32 - INFO - __main__ - Step 29735: {'lr': 0.000457914563393111, 'samples': 5709120, 'steps': 29734, 'loss/train': 0.512084424495697} -08/30/2021 18:28:32 - INFO - __main__ - Step 29736: {'lr': 0.00045791161657583555, 'samples': 5709312, 'steps': 29735, 'loss/train': 1.3737982511520386} -08/30/2021 18:28:32 - INFO - __main__ - Step 29737: {'lr': 0.00045790866966487843, 'samples': 5709504, 'steps': 29736, 'loss/train': 0.9926096796989441} -08/30/2021 18:28:34 - INFO - __main__ - Step 29738: {'lr': 0.0004579057226602408, 'samples': 5709696, 'steps': 29737, 'loss/train': 0.20578551292419434} -08/30/2021 18:28:34 - INFO - __main__ - Step 29739: {'lr': 0.00045790277556192414, 'samples': 5709888, 'steps': 29738, 'loss/train': 1.2388333082199097} -08/30/2021 18:28:35 - INFO - __main__ - Step 29740: {'lr': 0.0004578998283699296, 'samples': 5710080, 'steps': 29739, 'loss/train': 1.7845193147659302} -08/30/2021 18:28:35 - INFO - __main__ - Step 29741: {'lr': 0.0004578968810842586, 'samples': 5710272, 'steps': 29740, 'loss/train': 1.3406702280044556} -08/30/2021 18:28:35 - INFO - __main__ - Step 29742: {'lr': 0.0004578939337049126, 'samples': 5710464, 'steps': 29741, 'loss/train': 1.8162589073181152} -08/30/2021 18:28:37 - INFO - __main__ - Step 29743: {'lr': 0.0004578909862318927, 'samples': 5710656, 'steps': 29742, 'loss/train': 0.7952150702476501} -08/30/2021 18:28:37 - INFO - __main__ - Step 29744: {'lr': 0.00045788803866520037, 'samples': 5710848, 'steps': 29743, 'loss/train': 2.365987539291382} -08/30/2021 18:28:38 - INFO - __main__ - Step 29745: {'lr': 0.0004578850910048369, 'samples': 5711040, 'steps': 29744, 'loss/train': 1.553279161453247} -08/30/2021 18:28:38 - INFO - __main__ - Step 29746: {'lr': 0.0004578821432508036, 'samples': 5711232, 'steps': 29745, 'loss/train': 1.640616774559021} -08/30/2021 18:28:38 - INFO - __main__ - Step 29747: {'lr': 0.00045787919540310175, 'samples': 5711424, 'steps': 29746, 'loss/train': 1.5358890295028687} -08/30/2021 18:28:39 - INFO - __main__ - Step 29748: {'lr': 0.0004578762474617328, 'samples': 5711616, 'steps': 29747, 'loss/train': 1.5220602750778198} -08/30/2021 18:28:40 - INFO - __main__ - Step 29749: {'lr': 0.00045787329942669803, 'samples': 5711808, 'steps': 29748, 'loss/train': 1.587807059288025} -08/30/2021 18:28:41 - INFO - __main__ - Step 29750: {'lr': 0.0004578703512979988, 'samples': 5712000, 'steps': 29749, 'loss/train': 1.354875087738037} -08/30/2021 18:28:41 - INFO - __main__ - Step 29751: {'lr': 0.00045786740307563633, 'samples': 5712192, 'steps': 29750, 'loss/train': 1.7917624711990356} -08/30/2021 18:28:41 - INFO - __main__ - Step 29752: {'lr': 0.000457864454759612, 'samples': 5712384, 'steps': 29751, 'loss/train': 2.8033447265625} -08/30/2021 18:28:42 - INFO - __main__ - Step 29753: {'lr': 0.00045786150634992716, 'samples': 5712576, 'steps': 29752, 'loss/train': 1.4662129878997803} -08/30/2021 18:28:44 - INFO - __main__ - Step 29754: {'lr': 0.0004578585578465833, 'samples': 5712768, 'steps': 29753, 'loss/train': 1.7054139375686646} -08/30/2021 18:28:44 - INFO - __main__ - Step 29755: {'lr': 0.00045785560924958135, 'samples': 5712960, 'steps': 29754, 'loss/train': 1.5506590604782104} -08/30/2021 18:28:45 - INFO - __main__ - Step 29756: {'lr': 0.00045785266055892296, 'samples': 5713152, 'steps': 29755, 'loss/train': 0.8969353437423706} -08/30/2021 18:28:45 - INFO - __main__ - Step 29757: {'lr': 0.0004578497117746094, 'samples': 5713344, 'steps': 29756, 'loss/train': 1.6206135749816895} -08/30/2021 18:28:45 - INFO - __main__ - Step 29758: {'lr': 0.00045784676289664194, 'samples': 5713536, 'steps': 29757, 'loss/train': 2.000650405883789} -08/30/2021 18:28:47 - INFO - __main__ - Step 29759: {'lr': 0.00045784381392502193, 'samples': 5713728, 'steps': 29758, 'loss/train': 1.9538886547088623} -08/30/2021 18:28:47 - INFO - __main__ - Step 29760: {'lr': 0.00045784086485975076, 'samples': 5713920, 'steps': 29759, 'loss/train': 1.460592269897461} -08/30/2021 18:28:48 - INFO - __main__ - Step 29761: {'lr': 0.00045783791570082956, 'samples': 5714112, 'steps': 29760, 'loss/train': 1.3283790349960327} -08/30/2021 18:28:48 - INFO - __main__ - Step 29762: {'lr': 0.00045783496644825997, 'samples': 5714304, 'steps': 29761, 'loss/train': 1.9077951908111572} -08/30/2021 18:28:48 - INFO - __main__ - Step 29763: {'lr': 0.000457832017102043, 'samples': 5714496, 'steps': 29762, 'loss/train': 1.3710795640945435} -08/30/2021 18:28:50 - INFO - __main__ - Step 29764: {'lr': 0.00045782906766218026, 'samples': 5714688, 'steps': 29763, 'loss/train': 1.4096707105636597} -08/30/2021 18:28:50 - INFO - __main__ - Step 29765: {'lr': 0.00045782611812867285, 'samples': 5714880, 'steps': 29764, 'loss/train': 1.261650562286377} -08/30/2021 18:28:51 - INFO - __main__ - Step 29766: {'lr': 0.0004578231685015223, 'samples': 5715072, 'steps': 29765, 'loss/train': 1.4897416830062866} -08/30/2021 18:28:51 - INFO - __main__ - Step 29767: {'lr': 0.00045782021878072976, 'samples': 5715264, 'steps': 29766, 'loss/train': 1.155381202697754} -08/30/2021 18:28:51 - INFO - __main__ - Step 29768: {'lr': 0.0004578172689662967, 'samples': 5715456, 'steps': 29767, 'loss/train': 1.8191925287246704} -08/30/2021 18:28:53 - INFO - __main__ - Step 29769: {'lr': 0.0004578143190582243, 'samples': 5715648, 'steps': 29768, 'loss/train': 1.3403890132904053} -08/30/2021 18:28:53 - INFO - __main__ - Step 29770: {'lr': 0.000457811369056514, 'samples': 5715840, 'steps': 29769, 'loss/train': 1.5078458786010742} -08/30/2021 18:28:53 - INFO - __main__ - Step 29771: {'lr': 0.0004578084189611671, 'samples': 5716032, 'steps': 29770, 'loss/train': 1.5487326383590698} -08/30/2021 18:28:54 - INFO - __main__ - Step 29772: {'lr': 0.000457805468772185, 'samples': 5716224, 'steps': 29771, 'loss/train': 1.6098134517669678} -08/30/2021 18:28:54 - INFO - __main__ - Step 29773: {'lr': 0.00045780251848956887, 'samples': 5716416, 'steps': 29772, 'loss/train': 0.9175944924354553} -08/30/2021 18:28:56 - INFO - __main__ - Step 29774: {'lr': 0.0004577995681133202, 'samples': 5716608, 'steps': 29773, 'loss/train': 1.8215703964233398} -08/30/2021 18:28:56 - INFO - __main__ - Step 29775: {'lr': 0.00045779661764344025, 'samples': 5716800, 'steps': 29774, 'loss/train': 1.6772704124450684} -08/30/2021 18:28:56 - INFO - __main__ - Step 29776: {'lr': 0.0004577936670799303, 'samples': 5716992, 'steps': 29775, 'loss/train': 1.6390513181686401} -08/30/2021 18:28:57 - INFO - __main__ - Step 29777: {'lr': 0.00045779071642279177, 'samples': 5717184, 'steps': 29776, 'loss/train': 1.5799801349639893} -08/30/2021 18:28:57 - INFO - __main__ - Step 29778: {'lr': 0.00045778776567202597, 'samples': 5717376, 'steps': 29777, 'loss/train': 1.326113224029541} -08/30/2021 18:28:57 - INFO - __main__ - Step 29779: {'lr': 0.0004577848148276341, 'samples': 5717568, 'steps': 29778, 'loss/train': 1.3282570838928223} -08/30/2021 18:28:59 - INFO - __main__ - Step 29780: {'lr': 0.00045778186388961776, 'samples': 5717760, 'steps': 29779, 'loss/train': 1.3016703128814697} -08/30/2021 18:28:59 - INFO - __main__ - Step 29781: {'lr': 0.000457778912857978, 'samples': 5717952, 'steps': 29780, 'loss/train': 1.7542059421539307} -08/30/2021 18:29:00 - INFO - __main__ - Step 29782: {'lr': 0.0004577759617327163, 'samples': 5718144, 'steps': 29781, 'loss/train': 1.3037378787994385} -08/30/2021 18:29:00 - INFO - __main__ - Step 29783: {'lr': 0.000457773010513834, 'samples': 5718336, 'steps': 29782, 'loss/train': 1.2276067733764648} -08/30/2021 18:29:00 - INFO - __main__ - Step 29784: {'lr': 0.0004577700592013323, 'samples': 5718528, 'steps': 29783, 'loss/train': 1.6257506608963013} -08/30/2021 18:29:02 - INFO - __main__ - Step 29785: {'lr': 0.0004577671077952127, 'samples': 5718720, 'steps': 29784, 'loss/train': 1.7140051126480103} -08/30/2021 18:29:03 - INFO - __main__ - Step 29786: {'lr': 0.0004577641562954764, 'samples': 5718912, 'steps': 29785, 'loss/train': 0.15526026487350464} -08/30/2021 18:29:03 - INFO - __main__ - Step 29787: {'lr': 0.00045776120470212477, 'samples': 5719104, 'steps': 29786, 'loss/train': 1.3239808082580566} -08/30/2021 18:29:03 - INFO - __main__ - Step 29788: {'lr': 0.00045775825301515923, 'samples': 5719296, 'steps': 29787, 'loss/train': 1.4864088296890259} -08/30/2021 18:29:04 - INFO - __main__ - Step 29789: {'lr': 0.00045775530123458096, 'samples': 5719488, 'steps': 29788, 'loss/train': 2.255086898803711} -08/30/2021 18:29:05 - INFO - __main__ - Step 29790: {'lr': 0.00045775234936039133, 'samples': 5719680, 'steps': 29789, 'loss/train': 1.44126558303833} -08/30/2021 18:29:05 - INFO - __main__ - Step 29791: {'lr': 0.00045774939739259173, 'samples': 5719872, 'steps': 29790, 'loss/train': 1.770522117614746} -08/30/2021 18:29:06 - INFO - __main__ - Step 29792: {'lr': 0.0004577464453311835, 'samples': 5720064, 'steps': 29791, 'loss/train': 0.2801794409751892} -08/30/2021 18:29:06 - INFO - __main__ - Step 29793: {'lr': 0.00045774349317616786, 'samples': 5720256, 'steps': 29792, 'loss/train': 1.2711302042007446} -08/30/2021 18:29:07 - INFO - __main__ - Step 29794: {'lr': 0.00045774054092754624, 'samples': 5720448, 'steps': 29793, 'loss/train': 1.5915980339050293} -08/30/2021 18:29:08 - INFO - __main__ - Step 29795: {'lr': 0.00045773758858531997, 'samples': 5720640, 'steps': 29794, 'loss/train': 1.4245502948760986} -08/30/2021 18:29:09 - INFO - __main__ - Step 29796: {'lr': 0.0004577346361494903, 'samples': 5720832, 'steps': 29795, 'loss/train': 0.8146663904190063} -08/30/2021 18:29:09 - INFO - __main__ - Step 29797: {'lr': 0.0004577316836200586, 'samples': 5721024, 'steps': 29796, 'loss/train': 0.95196133852005} -08/30/2021 18:29:09 - INFO - __main__ - Step 29798: {'lr': 0.0004577287309970262, 'samples': 5721216, 'steps': 29797, 'loss/train': 0.8967983722686768} -08/30/2021 18:29:10 - INFO - __main__ - Step 29799: {'lr': 0.0004577257782803945, 'samples': 5721408, 'steps': 29798, 'loss/train': 1.5457720756530762} -08/30/2021 18:29:11 - INFO - __main__ - Step 29800: {'lr': 0.00045772282547016475, 'samples': 5721600, 'steps': 29799, 'loss/train': 1.2335726022720337} -08/30/2021 18:29:12 - INFO - __main__ - Step 29801: {'lr': 0.0004577198725663383, 'samples': 5721792, 'steps': 29800, 'loss/train': 1.3536510467529297} -08/30/2021 18:29:12 - INFO - __main__ - Step 29802: {'lr': 0.00045771691956891645, 'samples': 5721984, 'steps': 29801, 'loss/train': 1.571109652519226} -08/30/2021 18:29:12 - INFO - __main__ - Step 29803: {'lr': 0.00045771396647790053, 'samples': 5722176, 'steps': 29802, 'loss/train': 0.9780459403991699} -08/30/2021 18:29:13 - INFO - __main__ - Step 29804: {'lr': 0.00045771101329329195, 'samples': 5722368, 'steps': 29803, 'loss/train': 1.5371843576431274} -08/30/2021 18:29:13 - INFO - __main__ - Step 29805: {'lr': 0.00045770806001509205, 'samples': 5722560, 'steps': 29804, 'loss/train': 1.6407279968261719} -08/30/2021 18:29:15 - INFO - __main__ - Step 29806: {'lr': 0.00045770510664330203, 'samples': 5722752, 'steps': 29805, 'loss/train': 3.0229039192199707} -08/30/2021 18:29:16 - INFO - __main__ - Step 29807: {'lr': 0.0004577021531779233, 'samples': 5722944, 'steps': 29806, 'loss/train': 1.6292167901992798} -08/30/2021 18:29:16 - INFO - __main__ - Step 29808: {'lr': 0.00045769919961895716, 'samples': 5723136, 'steps': 29807, 'loss/train': 1.7189383506774902} -08/30/2021 18:29:17 - INFO - __main__ - Step 29809: {'lr': 0.000457696245966405, 'samples': 5723328, 'steps': 29808, 'loss/train': 1.4111695289611816} -08/30/2021 18:29:17 - INFO - __main__ - Step 29810: {'lr': 0.0004576932922202681, 'samples': 5723520, 'steps': 29809, 'loss/train': 1.9019224643707275} -08/30/2021 18:29:19 - INFO - __main__ - Step 29811: {'lr': 0.00045769033838054783, 'samples': 5723712, 'steps': 29810, 'loss/train': 1.5190767049789429} -08/30/2021 18:29:19 - INFO - __main__ - Step 29812: {'lr': 0.0004576873844472455, 'samples': 5723904, 'steps': 29811, 'loss/train': 1.2523224353790283} -08/30/2021 18:29:19 - INFO - __main__ - Step 29813: {'lr': 0.00045768443042036247, 'samples': 5724096, 'steps': 29812, 'loss/train': 1.69696843624115} -08/30/2021 18:29:20 - INFO - __main__ - Step 29814: {'lr': 0.0004576814762999, 'samples': 5724288, 'steps': 29813, 'loss/train': 0.5058253407478333} -08/30/2021 18:29:20 - INFO - __main__ - Step 29815: {'lr': 0.00045767852208585945, 'samples': 5724480, 'steps': 29814, 'loss/train': 1.6717995405197144} -08/30/2021 18:29:21 - INFO - __main__ - Step 29816: {'lr': 0.00045767556777824217, 'samples': 5724672, 'steps': 29815, 'loss/train': 1.5186625719070435} -08/30/2021 18:29:22 - INFO - __main__ - Step 29817: {'lr': 0.00045767261337704946, 'samples': 5724864, 'steps': 29816, 'loss/train': 1.3946292400360107} -08/30/2021 18:29:22 - INFO - __main__ - Step 29818: {'lr': 0.00045766965888228273, 'samples': 5725056, 'steps': 29817, 'loss/train': 1.4422296285629272} -08/30/2021 18:29:23 - INFO - __main__ - Step 29819: {'lr': 0.00045766670429394317, 'samples': 5725248, 'steps': 29818, 'loss/train': 1.076311469078064} -08/30/2021 18:29:23 - INFO - __main__ - Step 29820: {'lr': 0.00045766374961203236, 'samples': 5725440, 'steps': 29819, 'loss/train': 1.0208680629730225} -08/30/2021 18:29:25 - INFO - __main__ - Step 29821: {'lr': 0.0004576607948365513, 'samples': 5725632, 'steps': 29820, 'loss/train': 1.6473058462142944} -08/30/2021 18:29:25 - INFO - __main__ - Step 29822: {'lr': 0.0004576578399675015, 'samples': 5725824, 'steps': 29821, 'loss/train': 1.4750052690505981} -08/30/2021 18:29:25 - INFO - __main__ - Step 29823: {'lr': 0.00045765488500488437, 'samples': 5726016, 'steps': 29822, 'loss/train': 1.0241910219192505} -08/30/2021 18:29:26 - INFO - __main__ - Step 29824: {'lr': 0.0004576519299487012, 'samples': 5726208, 'steps': 29823, 'loss/train': 1.5517184734344482} -08/30/2021 18:29:26 - INFO - __main__ - Step 29825: {'lr': 0.00045764897479895315, 'samples': 5726400, 'steps': 29824, 'loss/train': 1.3328709602355957} -08/30/2021 18:29:28 - INFO - __main__ - Step 29826: {'lr': 0.0004576460195556418, 'samples': 5726592, 'steps': 29825, 'loss/train': 1.3228015899658203} -08/30/2021 18:29:28 - INFO - __main__ - Step 29827: {'lr': 0.0004576430642187682, 'samples': 5726784, 'steps': 29826, 'loss/train': 1.466692328453064} -08/30/2021 18:29:28 - INFO - __main__ - Step 29828: {'lr': 0.00045764010878833396, 'samples': 5726976, 'steps': 29827, 'loss/train': 1.0952364206314087} -08/30/2021 18:29:29 - INFO - __main__ - Step 29829: {'lr': 0.00045763715326434023, 'samples': 5727168, 'steps': 29828, 'loss/train': 1.3330249786376953} -08/30/2021 18:29:29 - INFO - __main__ - Step 29830: {'lr': 0.0004576341976467884, 'samples': 5727360, 'steps': 29829, 'loss/train': 1.300980567932129} -08/30/2021 18:29:29 - INFO - __main__ - Step 29831: {'lr': 0.00045763124193567983, 'samples': 5727552, 'steps': 29830, 'loss/train': 1.2432913780212402} -08/30/2021 18:29:31 - INFO - __main__ - Step 29832: {'lr': 0.0004576282861310158, 'samples': 5727744, 'steps': 29831, 'loss/train': 1.5756326913833618} -08/30/2021 18:29:31 - INFO - __main__ - Step 29833: {'lr': 0.00045762533023279773, 'samples': 5727936, 'steps': 29832, 'loss/train': 1.3727688789367676} -08/30/2021 18:29:32 - INFO - __main__ - Step 29834: {'lr': 0.00045762237424102687, 'samples': 5728128, 'steps': 29833, 'loss/train': 1.3507001399993896} -08/30/2021 18:29:32 - INFO - __main__ - Step 29835: {'lr': 0.0004576194181557045, 'samples': 5728320, 'steps': 29834, 'loss/train': 1.5258768796920776} -08/30/2021 18:29:32 - INFO - __main__ - Step 29836: {'lr': 0.00045761646197683216, 'samples': 5728512, 'steps': 29835, 'loss/train': 1.6856153011322021} -08/30/2021 18:29:34 - INFO - __main__ - Step 29837: {'lr': 0.00045761350570441096, 'samples': 5728704, 'steps': 29836, 'loss/train': 1.1569122076034546} -08/30/2021 18:29:34 - INFO - __main__ - Step 29838: {'lr': 0.0004576105493384423, 'samples': 5728896, 'steps': 29837, 'loss/train': 1.3239467144012451} -08/30/2021 18:29:35 - INFO - __main__ - Step 29839: {'lr': 0.00045760759287892755, 'samples': 5729088, 'steps': 29838, 'loss/train': 0.49414050579071045} -08/30/2021 18:29:35 - INFO - __main__ - Step 29840: {'lr': 0.000457604636325868, 'samples': 5729280, 'steps': 29839, 'loss/train': 1.2491590976715088} -08/30/2021 18:29:35 - INFO - __main__ - Step 29841: {'lr': 0.00045760167967926504, 'samples': 5729472, 'steps': 29840, 'loss/train': 1.202050805091858} -08/30/2021 18:29:37 - INFO - __main__ - Step 29842: {'lr': 0.00045759872293911995, 'samples': 5729664, 'steps': 29841, 'loss/train': 1.5716712474822998} -08/30/2021 18:29:37 - INFO - __main__ - Step 29843: {'lr': 0.00045759576610543407, 'samples': 5729856, 'steps': 29842, 'loss/train': 1.3601289987564087} -08/30/2021 18:29:38 - INFO - __main__ - Step 29844: {'lr': 0.0004575928091782088, 'samples': 5730048, 'steps': 29843, 'loss/train': 1.9324127435684204} -08/30/2021 18:29:38 - INFO - __main__ - Step 29845: {'lr': 0.00045758985215744536, 'samples': 5730240, 'steps': 29844, 'loss/train': 1.5306636095046997} -08/30/2021 18:29:38 - INFO - __main__ - Step 29846: {'lr': 0.0004575868950431452, 'samples': 5730432, 'steps': 29845, 'loss/train': 1.7896960973739624} -08/30/2021 18:29:40 - INFO - __main__ - Step 29847: {'lr': 0.0004575839378353095, 'samples': 5730624, 'steps': 29846, 'loss/train': 1.4041900634765625} -08/30/2021 18:29:40 - INFO - __main__ - Step 29848: {'lr': 0.0004575809805339397, 'samples': 5730816, 'steps': 29847, 'loss/train': 0.7040590047836304} -08/30/2021 18:29:41 - INFO - __main__ - Step 29849: {'lr': 0.0004575780231390371, 'samples': 5731008, 'steps': 29848, 'loss/train': 0.7328097820281982} -08/30/2021 18:29:41 - INFO - __main__ - Step 29850: {'lr': 0.0004575750656506031, 'samples': 5731200, 'steps': 29849, 'loss/train': 1.475000262260437} -08/30/2021 18:29:41 - INFO - __main__ - Step 29851: {'lr': 0.00045757210806863895, 'samples': 5731392, 'steps': 29850, 'loss/train': 0.813751757144928} -08/30/2021 18:29:43 - INFO - __main__ - Step 29852: {'lr': 0.0004575691503931461, 'samples': 5731584, 'steps': 29851, 'loss/train': 1.2440426349639893} -08/30/2021 18:29:43 - INFO - __main__ - Step 29853: {'lr': 0.00045756619262412565, 'samples': 5731776, 'steps': 29852, 'loss/train': 1.576850175857544} -08/30/2021 18:29:44 - INFO - __main__ - Step 29854: {'lr': 0.0004575632347615791, 'samples': 5731968, 'steps': 29853, 'loss/train': 1.7223079204559326} -08/30/2021 18:29:44 - INFO - __main__ - Step 29855: {'lr': 0.0004575602768055078, 'samples': 5732160, 'steps': 29854, 'loss/train': 1.3341399431228638} -08/30/2021 18:29:44 - INFO - __main__ - Step 29856: {'lr': 0.00045755731875591303, 'samples': 5732352, 'steps': 29855, 'loss/train': 0.9654378294944763} -08/30/2021 18:29:47 - INFO - __main__ - Step 29857: {'lr': 0.0004575543606127961, 'samples': 5732544, 'steps': 29856, 'loss/train': 1.348114252090454} -08/30/2021 18:29:47 - INFO - __main__ - Step 29858: {'lr': 0.0004575514023761585, 'samples': 5732736, 'steps': 29857, 'loss/train': 1.888065218925476} -08/30/2021 18:29:48 - INFO - __main__ - Step 29859: {'lr': 0.00045754844404600136, 'samples': 5732928, 'steps': 29858, 'loss/train': 2.2803468704223633} -08/30/2021 18:29:48 - INFO - __main__ - Step 29860: {'lr': 0.00045754548562232605, 'samples': 5733120, 'steps': 29859, 'loss/train': 1.4766547679901123} -08/30/2021 18:29:48 - INFO - __main__ - Step 29861: {'lr': 0.00045754252710513397, 'samples': 5733312, 'steps': 29860, 'loss/train': 1.2961032390594482} -08/30/2021 18:29:49 - INFO - __main__ - Step 29862: {'lr': 0.00045753956849442647, 'samples': 5733504, 'steps': 29861, 'loss/train': 1.358559250831604} -08/30/2021 18:29:50 - INFO - __main__ - Step 29863: {'lr': 0.00045753660979020485, 'samples': 5733696, 'steps': 29862, 'loss/train': 1.7077391147613525} -08/30/2021 18:29:51 - INFO - __main__ - Step 29864: {'lr': 0.0004575336509924704, 'samples': 5733888, 'steps': 29863, 'loss/train': 1.4787989854812622} -08/30/2021 18:29:51 - INFO - __main__ - Step 29865: {'lr': 0.0004575306921012245, 'samples': 5734080, 'steps': 29864, 'loss/train': 2.005549907684326} -08/30/2021 18:29:51 - INFO - __main__ - Step 29866: {'lr': 0.00045752773311646846, 'samples': 5734272, 'steps': 29865, 'loss/train': 1.8861044645309448} -08/30/2021 18:29:52 - INFO - __main__ - Step 29867: {'lr': 0.0004575247740382037, 'samples': 5734464, 'steps': 29866, 'loss/train': 1.520192265510559} -08/30/2021 18:29:52 - INFO - __main__ - Step 29868: {'lr': 0.0004575218148664314, 'samples': 5734656, 'steps': 29867, 'loss/train': 0.6959830522537231} -08/30/2021 18:29:54 - INFO - __main__ - Step 29869: {'lr': 0.00045751885560115294, 'samples': 5734848, 'steps': 29868, 'loss/train': 1.4108071327209473} -08/30/2021 18:29:54 - INFO - __main__ - Step 29870: {'lr': 0.0004575158962423698, 'samples': 5735040, 'steps': 29869, 'loss/train': 2.066143751144409} -08/30/2021 18:29:55 - INFO - __main__ - Step 29871: {'lr': 0.0004575129367900831, 'samples': 5735232, 'steps': 29870, 'loss/train': 1.474915623664856} -08/30/2021 18:29:55 - INFO - __main__ - Step 29872: {'lr': 0.0004575099772442943, 'samples': 5735424, 'steps': 29871, 'loss/train': 1.578248143196106} -08/30/2021 18:29:55 - INFO - __main__ - Step 29873: {'lr': 0.0004575070176050047, 'samples': 5735616, 'steps': 29872, 'loss/train': 0.0819786787033081} -08/30/2021 18:29:57 - INFO - __main__ - Step 29874: {'lr': 0.00045750405787221566, 'samples': 5735808, 'steps': 29873, 'loss/train': 2.4636528491973877} -08/30/2021 18:29:57 - INFO - __main__ - Step 29875: {'lr': 0.0004575010980459285, 'samples': 5736000, 'steps': 29874, 'loss/train': 1.9061830043792725} -08/30/2021 18:29:58 - INFO - __main__ - Step 29876: {'lr': 0.0004574981381261445, 'samples': 5736192, 'steps': 29875, 'loss/train': 1.2713805437088013} -08/30/2021 18:29:58 - INFO - __main__ - Step 29877: {'lr': 0.0004574951781128651, 'samples': 5736384, 'steps': 29876, 'loss/train': 1.6363621950149536} -08/30/2021 18:29:59 - INFO - __main__ - Step 29878: {'lr': 0.0004574922180060915, 'samples': 5736576, 'steps': 29877, 'loss/train': 1.4786618947982788} -08/30/2021 18:30:00 - INFO - __main__ - Step 29879: {'lr': 0.0004574892578058252, 'samples': 5736768, 'steps': 29878, 'loss/train': 1.4830291271209717} -08/30/2021 18:30:01 - INFO - __main__ - Step 29880: {'lr': 0.0004574862975120674, 'samples': 5736960, 'steps': 29879, 'loss/train': 1.4662595987319946} -08/30/2021 18:30:01 - INFO - __main__ - Step 29881: {'lr': 0.0004574833371248195, 'samples': 5737152, 'steps': 29880, 'loss/train': 2.465188503265381} -08/30/2021 18:30:01 - INFO - __main__ - Step 29882: {'lr': 0.00045748037664408275, 'samples': 5737344, 'steps': 29881, 'loss/train': 1.308503270149231} -08/30/2021 18:30:02 - INFO - __main__ - Step 29883: {'lr': 0.0004574774160698586, 'samples': 5737536, 'steps': 29882, 'loss/train': 0.6008021831512451} -08/30/2021 18:30:03 - INFO - __main__ - Step 29884: {'lr': 0.00045747445540214826, 'samples': 5737728, 'steps': 29883, 'loss/train': 1.2538586854934692} -08/30/2021 18:30:04 - INFO - __main__ - Step 29885: {'lr': 0.00045747149464095324, 'samples': 5737920, 'steps': 29884, 'loss/train': 1.5160785913467407} -08/30/2021 18:30:04 - INFO - __main__ - Step 29886: {'lr': 0.00045746853378627467, 'samples': 5738112, 'steps': 29885, 'loss/train': 1.453216791152954} -08/30/2021 18:30:04 - INFO - __main__ - Step 29887: {'lr': 0.000457465572838114, 'samples': 5738304, 'steps': 29886, 'loss/train': 1.4027401208877563} -08/30/2021 18:30:05 - INFO - __main__ - Step 29888: {'lr': 0.0004574626117964726, 'samples': 5738496, 'steps': 29887, 'loss/train': 1.1967679262161255} -08/30/2021 18:30:05 - INFO - __main__ - Step 29889: {'lr': 0.00045745965066135163, 'samples': 5738688, 'steps': 29888, 'loss/train': 1.338134527206421} -08/30/2021 18:30:07 - INFO - __main__ - Step 29890: {'lr': 0.00045745668943275266, 'samples': 5738880, 'steps': 29889, 'loss/train': 1.9230146408081055} -08/30/2021 18:30:07 - INFO - __main__ - Step 29891: {'lr': 0.00045745372811067687, 'samples': 5739072, 'steps': 29890, 'loss/train': 0.5520074963569641} -08/30/2021 18:30:07 - INFO - __main__ - Step 29892: {'lr': 0.00045745076669512566, 'samples': 5739264, 'steps': 29891, 'loss/train': 1.6947280168533325} -08/30/2021 18:30:08 - INFO - __main__ - Step 29893: {'lr': 0.0004574478051861003, 'samples': 5739456, 'steps': 29892, 'loss/train': 1.720933198928833} -08/30/2021 18:30:08 - INFO - __main__ - Step 29894: {'lr': 0.00045744484358360216, 'samples': 5739648, 'steps': 29893, 'loss/train': 1.9582308530807495} -08/30/2021 18:30:09 - INFO - __main__ - Step 29895: {'lr': 0.0004574418818876326, 'samples': 5739840, 'steps': 29894, 'loss/train': 0.9471269845962524} -08/30/2021 18:30:10 - INFO - __main__ - Step 29896: {'lr': 0.0004574389200981929, 'samples': 5740032, 'steps': 29895, 'loss/train': 1.3663339614868164} -08/30/2021 18:30:10 - INFO - __main__ - Step 29897: {'lr': 0.00045743595821528437, 'samples': 5740224, 'steps': 29896, 'loss/train': 1.9239739179611206} -08/30/2021 18:30:11 - INFO - __main__ - Step 29898: {'lr': 0.0004574329962389085, 'samples': 5740416, 'steps': 29897, 'loss/train': 1.5327961444854736} -08/30/2021 18:30:11 - INFO - __main__ - Step 29899: {'lr': 0.0004574300341690665, 'samples': 5740608, 'steps': 29898, 'loss/train': 1.6033366918563843} -08/30/2021 18:30:12 - INFO - __main__ - Step 29900: {'lr': 0.00045742707200575975, 'samples': 5740800, 'steps': 29899, 'loss/train': 1.089516282081604} -08/30/2021 18:30:13 - INFO - __main__ - Step 29901: {'lr': 0.00045742410974898947, 'samples': 5740992, 'steps': 29900, 'loss/train': 1.4063479900360107} -08/30/2021 18:30:13 - INFO - __main__ - Step 29902: {'lr': 0.0004574211473987571, 'samples': 5741184, 'steps': 29901, 'loss/train': 1.282423496246338} -08/30/2021 18:30:13 - INFO - __main__ - Step 29903: {'lr': 0.00045741818495506403, 'samples': 5741376, 'steps': 29902, 'loss/train': 1.4164947271347046} -08/30/2021 18:30:14 - INFO - __main__ - Step 29904: {'lr': 0.0004574152224179115, 'samples': 5741568, 'steps': 29903, 'loss/train': 1.2825496196746826} -08/30/2021 18:30:15 - INFO - __main__ - Step 29905: {'lr': 0.0004574122597873008, 'samples': 5741760, 'steps': 29904, 'loss/train': 1.7941032648086548} -08/30/2021 18:30:16 - INFO - __main__ - Step 29906: {'lr': 0.0004574092970632335, 'samples': 5741952, 'steps': 29905, 'loss/train': 1.6563183069229126} -08/30/2021 18:30:16 - INFO - __main__ - Step 29907: {'lr': 0.00045740633424571064, 'samples': 5742144, 'steps': 29906, 'loss/train': 0.6336389183998108} -08/30/2021 18:30:17 - INFO - __main__ - Step 29908: {'lr': 0.00045740337133473374, 'samples': 5742336, 'steps': 29907, 'loss/train': 1.3014731407165527} -08/30/2021 18:30:17 - INFO - __main__ - Step 29909: {'lr': 0.00045740040833030404, 'samples': 5742528, 'steps': 29908, 'loss/train': 1.1213966608047485} -08/30/2021 18:30:20 - INFO - __main__ - Step 29910: {'lr': 0.00045739744523242294, 'samples': 5742720, 'steps': 29909, 'loss/train': 1.2861236333847046} -08/30/2021 18:30:21 - INFO - __main__ - Step 29911: {'lr': 0.0004573944820410918, 'samples': 5742912, 'steps': 29910, 'loss/train': 1.6103925704956055} -08/30/2021 18:30:21 - INFO - __main__ - Step 29912: {'lr': 0.0004573915187563118, 'samples': 5743104, 'steps': 29911, 'loss/train': 1.726737141609192} -08/30/2021 18:30:21 - INFO - __main__ - Step 29913: {'lr': 0.00045738855537808443, 'samples': 5743296, 'steps': 29912, 'loss/train': 1.719698190689087} -08/30/2021 18:30:22 - INFO - __main__ - Step 29914: {'lr': 0.000457385591906411, 'samples': 5743488, 'steps': 29913, 'loss/train': 1.1147890090942383} -08/30/2021 18:30:22 - INFO - __main__ - Step 29915: {'lr': 0.00045738262834129283, 'samples': 5743680, 'steps': 29914, 'loss/train': 1.87599515914917} -08/30/2021 18:30:22 - INFO - __main__ - Step 29916: {'lr': 0.0004573796646827312, 'samples': 5743872, 'steps': 29915, 'loss/train': 1.8886315822601318} -08/30/2021 18:30:23 - INFO - __main__ - Step 29917: {'lr': 0.0004573767009307276, 'samples': 5744064, 'steps': 29916, 'loss/train': 1.277214527130127} -08/30/2021 18:30:24 - INFO - __main__ - Step 29918: {'lr': 0.0004573737370852831, 'samples': 5744256, 'steps': 29917, 'loss/train': 2.1520116329193115} -08/30/2021 18:30:25 - INFO - __main__ - Step 29919: {'lr': 0.0004573707731463993, 'samples': 5744448, 'steps': 29918, 'loss/train': 1.8385660648345947} -08/30/2021 18:30:25 - INFO - __main__ - Step 29920: {'lr': 0.00045736780911407736, 'samples': 5744640, 'steps': 29919, 'loss/train': 1.6175665855407715} -08/30/2021 18:30:25 - INFO - __main__ - Step 29921: {'lr': 0.00045736484498831877, 'samples': 5744832, 'steps': 29920, 'loss/train': 1.7936135530471802} -08/30/2021 18:30:26 - INFO - __main__ - Step 29922: {'lr': 0.0004573618807691248, 'samples': 5745024, 'steps': 29921, 'loss/train': 1.5341824293136597} -08/30/2021 18:30:27 - INFO - __main__ - Step 29923: {'lr': 0.0004573589164564966, 'samples': 5745216, 'steps': 29922, 'loss/train': 1.5022945404052734} -08/30/2021 18:30:28 - INFO - __main__ - Step 29924: {'lr': 0.00045735595205043583, 'samples': 5745408, 'steps': 29923, 'loss/train': 1.0516347885131836} -08/30/2021 18:30:28 - INFO - __main__ - Step 29925: {'lr': 0.00045735298755094364, 'samples': 5745600, 'steps': 29924, 'loss/train': 1.4194567203521729} -08/30/2021 18:30:29 - INFO - __main__ - Step 29926: {'lr': 0.00045735002295802137, 'samples': 5745792, 'steps': 29925, 'loss/train': 1.909565806388855} -08/30/2021 18:30:29 - INFO - __main__ - Step 29927: {'lr': 0.00045734705827167035, 'samples': 5745984, 'steps': 29926, 'loss/train': 1.2392679452896118} -08/30/2021 18:30:31 - INFO - __main__ - Step 29928: {'lr': 0.000457344093491892, 'samples': 5746176, 'steps': 29927, 'loss/train': 0.4013739824295044} -08/30/2021 18:30:31 - INFO - __main__ - Step 29929: {'lr': 0.00045734112861868753, 'samples': 5746368, 'steps': 29928, 'loss/train': 1.5148979425430298} -08/30/2021 18:30:32 - INFO - __main__ - Step 29930: {'lr': 0.0004573381636520584, 'samples': 5746560, 'steps': 29929, 'loss/train': 0.2414027750492096} -08/30/2021 18:30:32 - INFO - __main__ - Step 29931: {'lr': 0.0004573351985920059, 'samples': 5746752, 'steps': 29930, 'loss/train': 0.13806553184986115} -08/30/2021 18:30:32 - INFO - __main__ - Step 29932: {'lr': 0.0004573322334385314, 'samples': 5746944, 'steps': 29931, 'loss/train': 0.06139226257801056} -08/30/2021 18:30:33 - INFO - __main__ - Step 29933: {'lr': 0.0004573292681916361, 'samples': 5747136, 'steps': 29932, 'loss/train': 2.4596898555755615} -08/30/2021 18:30:34 - INFO - __main__ - Step 29934: {'lr': 0.0004573263028513214, 'samples': 5747328, 'steps': 29933, 'loss/train': 1.724640130996704} -08/30/2021 18:30:35 - INFO - __main__ - Step 29935: {'lr': 0.0004573233374175888, 'samples': 5747520, 'steps': 29934, 'loss/train': 1.6728287935256958} -08/30/2021 18:30:35 - INFO - __main__ - Step 29936: {'lr': 0.0004573203718904394, 'samples': 5747712, 'steps': 29935, 'loss/train': 1.489703893661499} -08/30/2021 18:30:36 - INFO - __main__ - Step 29937: {'lr': 0.00045731740626987473, 'samples': 5747904, 'steps': 29936, 'loss/train': 1.1529443264007568} -08/30/2021 18:30:36 - INFO - __main__ - Step 29938: {'lr': 0.00045731444055589597, 'samples': 5748096, 'steps': 29937, 'loss/train': 1.6943330764770508} -08/30/2021 18:30:36 - INFO - __main__ - Step 29939: {'lr': 0.0004573114747485045, 'samples': 5748288, 'steps': 29938, 'loss/train': 1.0642552375793457} -08/30/2021 18:30:38 - INFO - __main__ - Step 29940: {'lr': 0.0004573085088477017, 'samples': 5748480, 'steps': 29939, 'loss/train': 1.3704547882080078} -08/30/2021 18:30:38 - INFO - __main__ - Step 29941: {'lr': 0.0004573055428534889, 'samples': 5748672, 'steps': 29940, 'loss/train': 1.265084981918335} -08/30/2021 18:30:39 - INFO - __main__ - Step 29942: {'lr': 0.00045730257676586747, 'samples': 5748864, 'steps': 29941, 'loss/train': 1.354390025138855} -08/30/2021 18:30:39 - INFO - __main__ - Step 29943: {'lr': 0.0004572996105848386, 'samples': 5749056, 'steps': 29942, 'loss/train': 1.4503631591796875} -08/30/2021 18:30:39 - INFO - __main__ - Step 29944: {'lr': 0.0004572966443104038, 'samples': 5749248, 'steps': 29943, 'loss/train': 1.7153041362762451} -08/30/2021 18:30:41 - INFO - __main__ - Step 29945: {'lr': 0.00045729367794256434, 'samples': 5749440, 'steps': 29944, 'loss/train': 0.713683009147644} -08/30/2021 18:30:41 - INFO - __main__ - Step 29946: {'lr': 0.0004572907114813215, 'samples': 5749632, 'steps': 29945, 'loss/train': 1.6766033172607422} -08/30/2021 18:30:42 - INFO - __main__ - Step 29947: {'lr': 0.0004572877449266767, 'samples': 5749824, 'steps': 29946, 'loss/train': 1.700985074043274} -08/30/2021 18:30:42 - INFO - __main__ - Step 29948: {'lr': 0.0004572847782786312, 'samples': 5750016, 'steps': 29947, 'loss/train': 1.3387649059295654} -08/30/2021 18:30:42 - INFO - __main__ - Step 29949: {'lr': 0.0004572818115371864, 'samples': 5750208, 'steps': 29948, 'loss/train': 1.493436574935913} -08/30/2021 18:30:44 - INFO - __main__ - Step 29950: {'lr': 0.0004572788447023436, 'samples': 5750400, 'steps': 29949, 'loss/train': 1.8604241609573364} -08/30/2021 18:30:44 - INFO - __main__ - Step 29951: {'lr': 0.00045727587777410415, 'samples': 5750592, 'steps': 29950, 'loss/train': 1.41011381149292} -08/30/2021 18:30:45 - INFO - __main__ - Step 29952: {'lr': 0.00045727291075246937, 'samples': 5750784, 'steps': 29951, 'loss/train': 1.568453073501587} -08/30/2021 18:30:45 - INFO - __main__ - Step 29953: {'lr': 0.0004572699436374407, 'samples': 5750976, 'steps': 29952, 'loss/train': 2.2069711685180664} -08/30/2021 18:30:45 - INFO - __main__ - Step 29954: {'lr': 0.00045726697642901925, 'samples': 5751168, 'steps': 29953, 'loss/train': 0.19367405772209167} -08/30/2021 18:30:47 - INFO - __main__ - Step 29955: {'lr': 0.0004572640091272066, 'samples': 5751360, 'steps': 29954, 'loss/train': 1.5525058507919312} -08/30/2021 18:30:48 - INFO - __main__ - Step 29956: {'lr': 0.000457261041732004, 'samples': 5751552, 'steps': 29955, 'loss/train': 1.349680781364441} -08/30/2021 18:30:48 - INFO - __main__ - Step 29957: {'lr': 0.0004572580742434127, 'samples': 5751744, 'steps': 29956, 'loss/train': 1.949102759361267} -08/30/2021 18:30:48 - INFO - __main__ - Step 29958: {'lr': 0.00045725510666143424, 'samples': 5751936, 'steps': 29957, 'loss/train': 1.4559065103530884} -08/30/2021 18:30:49 - INFO - __main__ - Step 29959: {'lr': 0.0004572521389860697, 'samples': 5752128, 'steps': 29958, 'loss/train': 1.6270986795425415} -08/30/2021 18:30:50 - INFO - __main__ - Step 29960: {'lr': 0.00045724917121732055, 'samples': 5752320, 'steps': 29959, 'loss/train': 1.2723875045776367} -08/30/2021 18:30:51 - INFO - __main__ - Step 29961: {'lr': 0.0004572462033551882, 'samples': 5752512, 'steps': 29960, 'loss/train': 2.9785878658294678} -08/30/2021 18:30:51 - INFO - __main__ - Step 29962: {'lr': 0.00045724323539967385, 'samples': 5752704, 'steps': 29961, 'loss/train': 1.342309832572937} -08/30/2021 18:30:51 - INFO - __main__ - Step 29963: {'lr': 0.00045724026735077886, 'samples': 5752896, 'steps': 29962, 'loss/train': 1.3100159168243408} -08/30/2021 18:30:52 - INFO - __main__ - Step 29964: {'lr': 0.00045723729920850464, 'samples': 5753088, 'steps': 29963, 'loss/train': 1.652289628982544} -08/30/2021 18:30:54 - INFO - __main__ - Step 29965: {'lr': 0.00045723433097285247, 'samples': 5753280, 'steps': 29964, 'loss/train': 1.4638392925262451} -08/30/2021 18:30:55 - INFO - __main__ - Step 29966: {'lr': 0.0004572313626438238, 'samples': 5753472, 'steps': 29965, 'loss/train': 1.4360930919647217} -08/30/2021 18:30:55 - INFO - __main__ - Step 29967: {'lr': 0.00045722839422141984, 'samples': 5753664, 'steps': 29966, 'loss/train': 1.658735990524292} -08/30/2021 18:30:55 - INFO - __main__ - Step 29968: {'lr': 0.000457225425705642, 'samples': 5753856, 'steps': 29967, 'loss/train': 1.8419651985168457} -08/30/2021 18:30:56 - INFO - __main__ - Step 29969: {'lr': 0.0004572224570964915, 'samples': 5754048, 'steps': 29968, 'loss/train': 1.4746346473693848} -08/30/2021 18:30:56 - INFO - __main__ - Step 29970: {'lr': 0.0004572194883939697, 'samples': 5754240, 'steps': 29969, 'loss/train': 0.20525215566158295} -08/30/2021 18:30:58 - INFO - __main__ - Step 29971: {'lr': 0.0004572165195980781, 'samples': 5754432, 'steps': 29970, 'loss/train': 1.2932289838790894} -08/30/2021 18:30:59 - INFO - __main__ - Step 29972: {'lr': 0.0004572135507088179, 'samples': 5754624, 'steps': 29971, 'loss/train': 1.5811430215835571} -08/30/2021 18:30:59 - INFO - __main__ - Step 29973: {'lr': 0.00045721058172619043, 'samples': 5754816, 'steps': 29972, 'loss/train': 0.12158104032278061} -08/30/2021 18:30:59 - INFO - __main__ - Step 29974: {'lr': 0.0004572076126501972, 'samples': 5755008, 'steps': 29973, 'loss/train': 1.4291597604751587} -08/30/2021 18:31:00 - INFO - __main__ - Step 29975: {'lr': 0.00045720464348083937, 'samples': 5755200, 'steps': 29974, 'loss/train': 1.1311383247375488} -08/30/2021 18:31:00 - INFO - __main__ - Step 29976: {'lr': 0.0004572016742181182, 'samples': 5755392, 'steps': 29975, 'loss/train': 2.0455069541931152} -08/30/2021 18:31:02 - INFO - __main__ - Step 29977: {'lr': 0.0004571987048620353, 'samples': 5755584, 'steps': 29976, 'loss/train': 1.865699052810669} -08/30/2021 18:31:02 - INFO - __main__ - Step 29978: {'lr': 0.0004571957354125918, 'samples': 5755776, 'steps': 29977, 'loss/train': 1.4434974193572998} -08/30/2021 18:31:03 - INFO - __main__ - Step 29979: {'lr': 0.00045719276586978907, 'samples': 5755968, 'steps': 29978, 'loss/train': 1.4251376390457153} -08/30/2021 18:31:03 - INFO - __main__ - Step 29980: {'lr': 0.00045718979623362855, 'samples': 5756160, 'steps': 29979, 'loss/train': 2.0122334957122803} -08/30/2021 18:31:04 - INFO - __main__ - Step 29981: {'lr': 0.00045718682650411146, 'samples': 5756352, 'steps': 29980, 'loss/train': 1.199205994606018} -08/30/2021 18:31:05 - INFO - __main__ - Step 29982: {'lr': 0.0004571838566812392, 'samples': 5756544, 'steps': 29981, 'loss/train': 0.8048202991485596} -08/30/2021 18:31:05 - INFO - __main__ - Step 29983: {'lr': 0.00045718088676501305, 'samples': 5756736, 'steps': 29982, 'loss/train': 1.4998470544815063} -08/30/2021 18:31:06 - INFO - __main__ - Step 29984: {'lr': 0.0004571779167554344, 'samples': 5756928, 'steps': 29983, 'loss/train': 1.5507581233978271} -08/30/2021 18:31:06 - INFO - __main__ - Step 29985: {'lr': 0.0004571749466525046, 'samples': 5757120, 'steps': 29984, 'loss/train': 0.9107785224914551} -08/30/2021 18:31:06 - INFO - __main__ - Step 29986: {'lr': 0.000457171976456225, 'samples': 5757312, 'steps': 29985, 'loss/train': 1.2444286346435547} -08/30/2021 18:31:08 - INFO - __main__ - Step 29987: {'lr': 0.00045716900616659686, 'samples': 5757504, 'steps': 29986, 'loss/train': 1.2106409072875977} -08/30/2021 18:31:08 - INFO - __main__ - Step 29988: {'lr': 0.00045716603578362157, 'samples': 5757696, 'steps': 29987, 'loss/train': 1.3851398229599} -08/30/2021 18:31:09 - INFO - __main__ - Step 29989: {'lr': 0.00045716306530730043, 'samples': 5757888, 'steps': 29988, 'loss/train': 1.0019110441207886} -08/30/2021 18:31:09 - INFO - __main__ - Step 29990: {'lr': 0.00045716009473763486, 'samples': 5758080, 'steps': 29989, 'loss/train': 1.4916727542877197} -08/30/2021 18:31:09 - INFO - __main__ - Step 29991: {'lr': 0.0004571571240746262, 'samples': 5758272, 'steps': 29990, 'loss/train': 1.093345046043396} -08/30/2021 18:31:10 - INFO - __main__ - Step 29992: {'lr': 0.00045715415331827564, 'samples': 5758464, 'steps': 29991, 'loss/train': 1.9349569082260132} -08/30/2021 18:31:11 - INFO - __main__ - Step 29993: {'lr': 0.00045715118246858466, 'samples': 5758656, 'steps': 29992, 'loss/train': 1.2344725131988525} -08/30/2021 18:31:12 - INFO - __main__ - Step 29994: {'lr': 0.0004571482115255545, 'samples': 5758848, 'steps': 29993, 'loss/train': 2.0704667568206787} -08/30/2021 18:31:12 - INFO - __main__ - Step 29995: {'lr': 0.0004571452404891866, 'samples': 5759040, 'steps': 29994, 'loss/train': 1.8195703029632568} -08/30/2021 18:31:12 - INFO - __main__ - Step 29996: {'lr': 0.0004571422693594822, 'samples': 5759232, 'steps': 29995, 'loss/train': 1.6077555418014526} -08/30/2021 18:31:14 - INFO - __main__ - Step 29997: {'lr': 0.00045713929813644274, 'samples': 5759424, 'steps': 29996, 'loss/train': 2.4970226287841797} -08/30/2021 18:31:14 - INFO - __main__ - Step 29998: {'lr': 0.0004571363268200695, 'samples': 5759616, 'steps': 29997, 'loss/train': 1.3227806091308594} -08/30/2021 18:31:15 - INFO - __main__ - Step 29999: {'lr': 0.0004571333554103638, 'samples': 5759808, 'steps': 29998, 'loss/train': 1.6352428197860718} -08/30/2021 18:31:15 - INFO - __main__ - Step 30000: {'lr': 0.0004571303839073271, 'samples': 5760000, 'steps': 29999, 'loss/train': 1.503125548362732} -08/30/2021 18:31:15 - INFO - __main__ - Evaluating model checkpoint -08/30/2021 18:40:00 - INFO - __main__ - Step 30000: {'loss/eval': 1.3865768909454346, 'perplexity': 4.0011305809021} -08/30/2021 18:40:00 - INFO - __main__ - Saving model checkpoint -08/30/2021 18:40:12 - WARNING - huggingface_hub.repository - Adding files tracked by Git LFS: ['wandb/run-20210830_131354-2654p8r7/logs/debug-internal.log', 'wandb/run-20210830_131354-2654p8r7/run-2654p8r7.wandb']. This may take a bit of time if the files are large. -08/30/2021 18:41:13 - INFO - __main__ - Step 30001: {'lr': 0.00045712741231096054, 'samples': 5760192, 'steps': 30000, 'loss/train': 0.998179018497467} -08/30/2021 18:41:14 - INFO - __main__ - Step 30002: {'lr': 0.0004571244406212656, 'samples': 5760384, 'steps': 30001, 'loss/train': 1.0569742918014526} -08/30/2021 18:41:16 - INFO - __main__ - Step 30003: {'lr': 0.00045712146883824357, 'samples': 5760576, 'steps': 30002, 'loss/train': 1.2649835348129272} -08/30/2021 18:41:16 - INFO - __main__ - Step 30004: {'lr': 0.00045711849696189585, 'samples': 5760768, 'steps': 30003, 'loss/train': 0.07835978269577026} -08/30/2021 18:41:17 - INFO - __main__ - Step 30005: {'lr': 0.0004571155249922237, 'samples': 5760960, 'steps': 30004, 'loss/train': 1.3939626216888428} -08/30/2021 18:41:17 - INFO - __main__ - Step 30006: {'lr': 0.00045711255292922847, 'samples': 5761152, 'steps': 30005, 'loss/train': 0.06290615350008011} -08/30/2021 18:41:17 - INFO - __main__ - Step 30007: {'lr': 0.00045710958077291156, 'samples': 5761344, 'steps': 30006, 'loss/train': 1.1841553449630737} -08/30/2021 18:41:18 - INFO - __main__ - Step 30008: {'lr': 0.00045710660852327423, 'samples': 5761536, 'steps': 30007, 'loss/train': 1.169217824935913} -08/30/2021 18:41:19 - INFO - __main__ - Step 30009: {'lr': 0.00045710363618031783, 'samples': 5761728, 'steps': 30008, 'loss/train': 1.5474317073822021} -08/30/2021 18:41:20 - INFO - __main__ - Step 30010: {'lr': 0.0004571006637440438, 'samples': 5761920, 'steps': 30009, 'loss/train': 1.7704938650131226} -08/30/2021 18:41:20 - INFO - __main__ - Step 30011: {'lr': 0.00045709769121445335, 'samples': 5762112, 'steps': 30010, 'loss/train': 1.5660245418548584} -08/30/2021 18:41:20 - INFO - __main__ - Step 30012: {'lr': 0.00045709471859154793, 'samples': 5762304, 'steps': 30011, 'loss/train': 1.7349765300750732} -08/30/2021 18:41:21 - INFO - __main__ - Step 30013: {'lr': 0.0004570917458753288, 'samples': 5762496, 'steps': 30012, 'loss/train': 0.6215084195137024} -08/30/2021 18:41:22 - INFO - __main__ - Step 30014: {'lr': 0.00045708877306579733, 'samples': 5762688, 'steps': 30013, 'loss/train': 1.8880693912506104} -08/30/2021 18:41:23 - INFO - __main__ - Step 30015: {'lr': 0.00045708580016295486, 'samples': 5762880, 'steps': 30014, 'loss/train': 1.5370018482208252} -08/30/2021 18:41:23 - INFO - __main__ - Step 30016: {'lr': 0.0004570828271668027, 'samples': 5763072, 'steps': 30015, 'loss/train': 1.483174443244934} -08/30/2021 18:41:23 - INFO - __main__ - Step 30017: {'lr': 0.0004570798540773422, 'samples': 5763264, 'steps': 30016, 'loss/train': 1.1573729515075684} -08/30/2021 18:41:24 - INFO - __main__ - Step 30018: {'lr': 0.0004570768808945748, 'samples': 5763456, 'steps': 30017, 'loss/train': 1.114778995513916} -08/30/2021 18:41:26 - INFO - __main__ - Step 30019: {'lr': 0.00045707390761850163, 'samples': 5763648, 'steps': 30018, 'loss/train': 1.649596095085144} -08/30/2021 18:41:26 - INFO - __main__ - Step 30020: {'lr': 0.00045707093424912426, 'samples': 5763840, 'steps': 30019, 'loss/train': 1.4206477403640747} -08/30/2021 18:41:27 - INFO - __main__ - Step 30021: {'lr': 0.00045706796078644386, 'samples': 5764032, 'steps': 30020, 'loss/train': 1.3503787517547607} -08/30/2021 18:41:27 - INFO - __main__ - Step 30022: {'lr': 0.00045706498723046185, 'samples': 5764224, 'steps': 30021, 'loss/train': 0.04716811329126358} -08/30/2021 18:41:27 - INFO - __main__ - Step 30023: {'lr': 0.0004570620135811795, 'samples': 5764416, 'steps': 30022, 'loss/train': 0.066108338534832} -08/30/2021 18:41:28 - INFO - __main__ - Step 30024: {'lr': 0.0004570590398385983, 'samples': 5764608, 'steps': 30023, 'loss/train': 0.515494167804718} -08/30/2021 18:41:30 - INFO - __main__ - Step 30025: {'lr': 0.0004570560660027194, 'samples': 5764800, 'steps': 30024, 'loss/train': 1.3453384637832642} -08/30/2021 18:41:31 - INFO - __main__ - Step 30026: {'lr': 0.00045705309207354433, 'samples': 5764992, 'steps': 30025, 'loss/train': 1.5587120056152344} -08/30/2021 18:41:31 - INFO - __main__ - Step 30027: {'lr': 0.00045705011805107426, 'samples': 5765184, 'steps': 30026, 'loss/train': 0.08149411529302597} -08/30/2021 18:41:31 - INFO - __main__ - Step 30028: {'lr': 0.00045704714393531064, 'samples': 5765376, 'steps': 30027, 'loss/train': 1.3082835674285889} -08/30/2021 18:41:32 - INFO - __main__ - Step 30029: {'lr': 0.00045704416972625474, 'samples': 5765568, 'steps': 30028, 'loss/train': 1.4769291877746582} -08/30/2021 18:41:33 - INFO - __main__ - Step 30030: {'lr': 0.000457041195423908, 'samples': 5765760, 'steps': 30029, 'loss/train': 1.6035698652267456} -08/30/2021 18:41:34 - INFO - __main__ - Step 30031: {'lr': 0.0004570382210282716, 'samples': 5765952, 'steps': 30030, 'loss/train': 0.7443256378173828} -08/30/2021 18:41:34 - INFO - __main__ - Step 30032: {'lr': 0.00045703524653934705, 'samples': 5766144, 'steps': 30031, 'loss/train': 1.4345024824142456} -08/30/2021 18:41:34 - INFO - __main__ - Step 30033: {'lr': 0.0004570322719571355, 'samples': 5766336, 'steps': 30032, 'loss/train': 1.4624621868133545} -08/30/2021 18:41:35 - INFO - __main__ - Step 30034: {'lr': 0.00045702929728163845, 'samples': 5766528, 'steps': 30033, 'loss/train': 0.891118049621582} -08/30/2021 18:41:36 - INFO - __main__ - Step 30035: {'lr': 0.00045702632251285727, 'samples': 5766720, 'steps': 30034, 'loss/train': 1.084511637687683} -08/30/2021 18:41:37 - INFO - __main__ - Step 30036: {'lr': 0.0004570233476507931, 'samples': 5766912, 'steps': 30035, 'loss/train': 1.583155632019043} -08/30/2021 18:41:37 - INFO - __main__ - Step 30037: {'lr': 0.0004570203726954475, 'samples': 5767104, 'steps': 30036, 'loss/train': 1.0263639688491821} -08/30/2021 18:41:38 - INFO - __main__ - Step 30038: {'lr': 0.0004570173976468217, 'samples': 5767296, 'steps': 30037, 'loss/train': 1.6417723894119263} -08/30/2021 18:41:38 - INFO - __main__ - Step 30039: {'lr': 0.0004570144225049171, 'samples': 5767488, 'steps': 30038, 'loss/train': 0.33097851276397705} -08/30/2021 18:41:38 - INFO - __main__ - Step 30040: {'lr': 0.00045701144726973487, 'samples': 5767680, 'steps': 30039, 'loss/train': 1.404439926147461} -08/30/2021 18:41:40 - INFO - __main__ - Step 30041: {'lr': 0.0004570084719412766, 'samples': 5767872, 'steps': 30040, 'loss/train': 1.8676258325576782} -08/30/2021 18:41:40 - INFO - __main__ - Step 30042: {'lr': 0.00045700549651954344, 'samples': 5768064, 'steps': 30041, 'loss/train': 2.0991251468658447} -08/30/2021 18:41:41 - INFO - __main__ - Step 30043: {'lr': 0.0004570025210045368, 'samples': 5768256, 'steps': 30042, 'loss/train': 1.5457230806350708} -08/30/2021 18:41:41 - INFO - __main__ - Step 30044: {'lr': 0.00045699954539625803, 'samples': 5768448, 'steps': 30043, 'loss/train': 0.7517519593238831} -08/30/2021 18:41:41 - INFO - __main__ - Step 30045: {'lr': 0.0004569965696947085, 'samples': 5768640, 'steps': 30044, 'loss/train': 0.6729482412338257} -08/30/2021 18:41:43 - INFO - __main__ - Step 30046: {'lr': 0.00045699359389988944, 'samples': 5768832, 'steps': 30045, 'loss/train': 1.2487704753875732} -08/30/2021 18:41:43 - INFO - __main__ - Step 30047: {'lr': 0.0004569906180118023, 'samples': 5769024, 'steps': 30046, 'loss/train': 2.0153775215148926} -08/30/2021 18:41:44 - INFO - __main__ - Step 30048: {'lr': 0.0004569876420304484, 'samples': 5769216, 'steps': 30047, 'loss/train': 1.7277010679244995} -08/30/2021 18:41:44 - INFO - __main__ - Step 30049: {'lr': 0.000456984665955829, 'samples': 5769408, 'steps': 30048, 'loss/train': 1.4386290311813354} -08/30/2021 18:41:44 - INFO - __main__ - Step 30050: {'lr': 0.00045698168978794553, 'samples': 5769600, 'steps': 30049, 'loss/train': 2.3809890747070312} -08/30/2021 18:41:46 - INFO - __main__ - Step 30051: {'lr': 0.0004569787135267993, 'samples': 5769792, 'steps': 30050, 'loss/train': 1.340345859527588} -08/30/2021 18:41:46 - INFO - __main__ - Step 30052: {'lr': 0.00045697573717239174, 'samples': 5769984, 'steps': 30051, 'loss/train': 1.8033154010772705} -08/30/2021 18:41:47 - INFO - __main__ - Step 30053: {'lr': 0.0004569727607247239, 'samples': 5770176, 'steps': 30052, 'loss/train': 1.4956620931625366} -08/30/2021 18:41:47 - INFO - __main__ - Step 30054: {'lr': 0.00045696978418379754, 'samples': 5770368, 'steps': 30053, 'loss/train': 1.053975224494934} -08/30/2021 18:41:48 - INFO - __main__ - Step 30055: {'lr': 0.0004569668075496137, 'samples': 5770560, 'steps': 30054, 'loss/train': 1.7737561464309692} -08/30/2021 18:41:49 - INFO - __main__ - Step 30056: {'lr': 0.00045696383082217387, 'samples': 5770752, 'steps': 30055, 'loss/train': 1.7106996774673462} -08/30/2021 18:41:50 - INFO - __main__ - Step 30057: {'lr': 0.00045696085400147925, 'samples': 5770944, 'steps': 30056, 'loss/train': 1.1695518493652344} -08/30/2021 18:41:50 - INFO - __main__ - Step 30058: {'lr': 0.00045695787708753126, 'samples': 5771136, 'steps': 30057, 'loss/train': 1.4438533782958984} -08/30/2021 18:41:50 - INFO - __main__ - Step 30059: {'lr': 0.0004569549000803313, 'samples': 5771328, 'steps': 30058, 'loss/train': 1.486721158027649} -08/30/2021 18:41:51 - INFO - __main__ - Step 30060: {'lr': 0.00045695192297988066, 'samples': 5771520, 'steps': 30059, 'loss/train': 1.2105164527893066} -08/30/2021 18:41:52 - INFO - __main__ - Step 30061: {'lr': 0.00045694894578618064, 'samples': 5771712, 'steps': 30060, 'loss/train': 1.2889257669448853} -08/30/2021 18:41:53 - INFO - __main__ - Step 30062: {'lr': 0.00045694596849923263, 'samples': 5771904, 'steps': 30061, 'loss/train': 1.5918667316436768} -08/30/2021 18:41:53 - INFO - __main__ - Step 30063: {'lr': 0.0004569429911190379, 'samples': 5772096, 'steps': 30062, 'loss/train': 2.0897765159606934} -08/30/2021 18:41:54 - INFO - __main__ - Step 30064: {'lr': 0.00045694001364559797, 'samples': 5772288, 'steps': 30063, 'loss/train': 1.5740864276885986} -08/30/2021 18:41:54 - INFO - __main__ - Step 30065: {'lr': 0.00045693703607891403, 'samples': 5772480, 'steps': 30064, 'loss/train': 1.585219144821167} -08/30/2021 18:41:55 - INFO - __main__ - Step 30066: {'lr': 0.0004569340584189874, 'samples': 5772672, 'steps': 30065, 'loss/train': 1.149450421333313} -08/30/2021 18:41:56 - INFO - __main__ - Step 30067: {'lr': 0.0004569310806658195, 'samples': 5772864, 'steps': 30066, 'loss/train': 1.5242985486984253} -08/30/2021 18:41:56 - INFO - __main__ - Step 30068: {'lr': 0.0004569281028194117, 'samples': 5773056, 'steps': 30067, 'loss/train': 1.5530261993408203} -08/30/2021 18:41:57 - INFO - __main__ - Step 30069: {'lr': 0.0004569251248797652, 'samples': 5773248, 'steps': 30068, 'loss/train': 1.6106735467910767} -08/30/2021 18:41:57 - INFO - __main__ - Step 30070: {'lr': 0.0004569221468468815, 'samples': 5773440, 'steps': 30069, 'loss/train': 1.7459301948547363} -08/30/2021 18:41:58 - INFO - __main__ - Step 30071: {'lr': 0.0004569191687207618, 'samples': 5773632, 'steps': 30070, 'loss/train': 1.5610826015472412} -08/30/2021 18:41:59 - INFO - __main__ - Step 30072: {'lr': 0.0004569161905014076, 'samples': 5773824, 'steps': 30071, 'loss/train': 1.1051338911056519} -08/30/2021 18:41:59 - INFO - __main__ - Step 30073: {'lr': 0.0004569132121888201, 'samples': 5774016, 'steps': 30072, 'loss/train': 1.6672340631484985} -08/30/2021 18:42:00 - INFO - __main__ - Step 30074: {'lr': 0.0004569102337830007, 'samples': 5774208, 'steps': 30073, 'loss/train': 1.3058487176895142} -08/30/2021 18:42:00 - INFO - __main__ - Step 30075: {'lr': 0.00045690725528395077, 'samples': 5774400, 'steps': 30074, 'loss/train': 1.5243455171585083} -08/30/2021 18:42:01 - INFO - __main__ - Step 30076: {'lr': 0.0004569042766916717, 'samples': 5774592, 'steps': 30075, 'loss/train': 1.4671909809112549} -08/30/2021 18:42:02 - INFO - __main__ - Step 30077: {'lr': 0.0004569012980061646, 'samples': 5774784, 'steps': 30076, 'loss/train': 1.5543147325515747} -08/30/2021 18:42:02 - INFO - __main__ - Step 30078: {'lr': 0.00045689831922743107, 'samples': 5774976, 'steps': 30077, 'loss/train': 1.1969438791275024} -08/30/2021 18:42:03 - INFO - __main__ - Step 30079: {'lr': 0.0004568953403554723, 'samples': 5775168, 'steps': 30078, 'loss/train': 0.6715759038925171} -08/30/2021 18:42:03 - INFO - __main__ - Step 30080: {'lr': 0.0004568923613902897, 'samples': 5775360, 'steps': 30079, 'loss/train': 1.2134110927581787} -08/30/2021 18:42:05 - INFO - __main__ - Step 30081: {'lr': 0.0004568893823318846, 'samples': 5775552, 'steps': 30080, 'loss/train': 1.4327408075332642} -08/30/2021 18:42:06 - INFO - __main__ - Step 30082: {'lr': 0.0004568864031802583, 'samples': 5775744, 'steps': 30081, 'loss/train': 1.0073317289352417} -08/30/2021 18:42:06 - INFO - __main__ - Step 30083: {'lr': 0.00045688342393541227, 'samples': 5775936, 'steps': 30082, 'loss/train': 2.255936622619629} -08/30/2021 18:42:06 - INFO - __main__ - Step 30084: {'lr': 0.00045688044459734766, 'samples': 5776128, 'steps': 30083, 'loss/train': 0.9807066917419434} -08/30/2021 18:42:07 - INFO - __main__ - Step 30085: {'lr': 0.000456877465166066, 'samples': 5776320, 'steps': 30084, 'loss/train': 1.2674349546432495} -08/30/2021 18:42:08 - INFO - __main__ - Step 30086: {'lr': 0.0004568744856415685, 'samples': 5776512, 'steps': 30085, 'loss/train': 0.4089215397834778} -08/30/2021 18:42:09 - INFO - __main__ - Step 30087: {'lr': 0.0004568715060238565, 'samples': 5776704, 'steps': 30086, 'loss/train': 1.612135887145996} -08/30/2021 18:42:09 - INFO - __main__ - Step 30088: {'lr': 0.0004568685263129315, 'samples': 5776896, 'steps': 30087, 'loss/train': 1.5005519390106201} -08/30/2021 18:42:09 - INFO - __main__ - Step 30089: {'lr': 0.00045686554650879464, 'samples': 5777088, 'steps': 30088, 'loss/train': 0.9640678763389587} -08/30/2021 18:42:10 - INFO - __main__ - Step 30090: {'lr': 0.0004568625666114474, 'samples': 5777280, 'steps': 30089, 'loss/train': 0.14149634540081024} -08/30/2021 18:42:10 - INFO - __main__ - Step 30091: {'lr': 0.00045685958662089113, 'samples': 5777472, 'steps': 30090, 'loss/train': 1.920926570892334} -08/30/2021 18:42:12 - INFO - __main__ - Step 30092: {'lr': 0.000456856606537127, 'samples': 5777664, 'steps': 30091, 'loss/train': 1.578325629234314} -08/30/2021 18:42:13 - INFO - __main__ - Step 30093: {'lr': 0.00045685362636015657, 'samples': 5777856, 'steps': 30092, 'loss/train': 0.09030758589506149} -08/30/2021 18:42:13 - INFO - __main__ - Step 30094: {'lr': 0.00045685064608998107, 'samples': 5778048, 'steps': 30093, 'loss/train': 1.5328689813613892} -08/30/2021 18:42:13 - INFO - __main__ - Step 30095: {'lr': 0.00045684766572660185, 'samples': 5778240, 'steps': 30094, 'loss/train': 1.6309140920639038} -08/30/2021 18:42:14 - INFO - __main__ - Step 30096: {'lr': 0.0004568446852700203, 'samples': 5778432, 'steps': 30095, 'loss/train': 1.8274109363555908} -08/30/2021 18:42:14 - INFO - __main__ - Step 30097: {'lr': 0.00045684170472023766, 'samples': 5778624, 'steps': 30096, 'loss/train': 0.9138599038124084} -08/30/2021 18:42:15 - INFO - __main__ - Step 30098: {'lr': 0.00045683872407725534, 'samples': 5778816, 'steps': 30097, 'loss/train': 0.04247663542628288} -08/30/2021 18:42:16 - INFO - __main__ - Step 30099: {'lr': 0.00045683574334107473, 'samples': 5779008, 'steps': 30098, 'loss/train': 0.7867898344993591} -08/30/2021 18:42:16 - INFO - __main__ - Step 30100: {'lr': 0.00045683276251169713, 'samples': 5779200, 'steps': 30099, 'loss/train': 1.4865630865097046} -08/30/2021 18:42:17 - INFO - __main__ - Step 30101: {'lr': 0.00045682978158912384, 'samples': 5779392, 'steps': 30100, 'loss/train': 1.869196891784668} -08/30/2021 18:42:17 - INFO - __main__ - Step 30102: {'lr': 0.0004568268005733562, 'samples': 5779584, 'steps': 30101, 'loss/train': 1.3848079442977905} -08/30/2021 18:42:17 - INFO - __main__ - Step 30103: {'lr': 0.0004568238194643958, 'samples': 5779776, 'steps': 30102, 'loss/train': 1.322537899017334} -08/30/2021 18:42:19 - INFO - __main__ - Step 30104: {'lr': 0.00045682083826224356, 'samples': 5779968, 'steps': 30103, 'loss/train': 2.3614344596862793} -08/30/2021 18:42:19 - INFO - __main__ - Step 30105: {'lr': 0.00045681785696690113, 'samples': 5780160, 'steps': 30104, 'loss/train': 1.1650716066360474} -08/30/2021 18:42:20 - INFO - __main__ - Step 30106: {'lr': 0.0004568148755783698, 'samples': 5780352, 'steps': 30105, 'loss/train': 0.8741475343704224} -08/30/2021 18:42:20 - INFO - __main__ - Step 30107: {'lr': 0.00045681189409665083, 'samples': 5780544, 'steps': 30106, 'loss/train': 1.3587108850479126} -08/30/2021 18:42:20 - INFO - __main__ - Step 30108: {'lr': 0.00045680891252174557, 'samples': 5780736, 'steps': 30107, 'loss/train': 2.155973434448242} -08/30/2021 18:42:22 - INFO - __main__ - Step 30109: {'lr': 0.0004568059308536554, 'samples': 5780928, 'steps': 30108, 'loss/train': 0.974151074886322} -08/30/2021 18:42:22 - INFO - __main__ - Step 30110: {'lr': 0.00045680294909238175, 'samples': 5781120, 'steps': 30109, 'loss/train': 1.5513627529144287} -08/30/2021 18:42:23 - INFO - __main__ - Step 30111: {'lr': 0.00045679996723792585, 'samples': 5781312, 'steps': 30110, 'loss/train': 0.06620944291353226} -08/30/2021 18:42:23 - INFO - __main__ - Step 30112: {'lr': 0.00045679698529028906, 'samples': 5781504, 'steps': 30111, 'loss/train': 1.436975121498108} -08/30/2021 18:42:23 - INFO - __main__ - Step 30113: {'lr': 0.00045679400324947274, 'samples': 5781696, 'steps': 30112, 'loss/train': 1.0639758110046387} -08/30/2021 18:42:25 - INFO - __main__ - Step 30114: {'lr': 0.00045679102111547825, 'samples': 5781888, 'steps': 30113, 'loss/train': 1.4798959493637085} -08/30/2021 18:42:25 - INFO - __main__ - Step 30115: {'lr': 0.00045678803888830687, 'samples': 5782080, 'steps': 30114, 'loss/train': 1.3769304752349854} -08/30/2021 18:42:26 - INFO - __main__ - Step 30116: {'lr': 0.0004567850565679601, 'samples': 5782272, 'steps': 30115, 'loss/train': 1.1682536602020264} -08/30/2021 18:42:26 - INFO - __main__ - Step 30117: {'lr': 0.00045678207415443913, 'samples': 5782464, 'steps': 30116, 'loss/train': 0.8671473860740662} -08/30/2021 18:42:26 - INFO - __main__ - Step 30118: {'lr': 0.0004567790916477453, 'samples': 5782656, 'steps': 30117, 'loss/train': 1.9146126508712769} -08/30/2021 18:42:28 - INFO - __main__ - Step 30119: {'lr': 0.00045677610904788004, 'samples': 5782848, 'steps': 30118, 'loss/train': 1.7721564769744873} -08/30/2021 18:42:29 - INFO - __main__ - Step 30120: {'lr': 0.00045677312635484466, 'samples': 5783040, 'steps': 30119, 'loss/train': 1.2302154302597046} -08/30/2021 18:42:29 - INFO - __main__ - Step 30121: {'lr': 0.00045677014356864043, 'samples': 5783232, 'steps': 30120, 'loss/train': 1.424653172492981} -08/30/2021 18:42:30 - INFO - __main__ - Step 30122: {'lr': 0.0004567671606892688, 'samples': 5783424, 'steps': 30121, 'loss/train': 1.5457096099853516} -08/30/2021 18:42:30 - INFO - __main__ - Step 30123: {'lr': 0.00045676417771673116, 'samples': 5783616, 'steps': 30122, 'loss/train': 1.249524474143982} -08/30/2021 18:42:30 - INFO - __main__ - Step 30124: {'lr': 0.0004567611946510287, 'samples': 5783808, 'steps': 30123, 'loss/train': 0.048977646976709366} -08/30/2021 18:42:32 - INFO - __main__ - Step 30125: {'lr': 0.00045675821149216285, 'samples': 5784000, 'steps': 30124, 'loss/train': 1.342484474182129} -08/30/2021 18:42:32 - INFO - __main__ - Step 30126: {'lr': 0.00045675522824013495, 'samples': 5784192, 'steps': 30125, 'loss/train': 1.2320334911346436} -08/30/2021 18:42:33 - INFO - __main__ - Step 30127: {'lr': 0.00045675224489494633, 'samples': 5784384, 'steps': 30126, 'loss/train': 1.5247381925582886} -08/30/2021 18:42:33 - INFO - __main__ - Step 30128: {'lr': 0.00045674926145659834, 'samples': 5784576, 'steps': 30127, 'loss/train': 1.5194438695907593} -08/30/2021 18:42:33 - INFO - __main__ - Step 30129: {'lr': 0.0004567462779250923, 'samples': 5784768, 'steps': 30128, 'loss/train': 1.0988644361495972} -08/30/2021 18:42:35 - INFO - __main__ - Step 30130: {'lr': 0.0004567432943004296, 'samples': 5784960, 'steps': 30129, 'loss/train': 1.6423465013504028} -08/30/2021 18:42:35 - INFO - __main__ - Step 30131: {'lr': 0.00045674031058261157, 'samples': 5785152, 'steps': 30130, 'loss/train': 0.9279747009277344} -08/30/2021 18:42:36 - INFO - __main__ - Step 30132: {'lr': 0.0004567373267716395, 'samples': 5785344, 'steps': 30131, 'loss/train': 1.577731966972351} -08/30/2021 18:42:36 - INFO - __main__ - Step 30133: {'lr': 0.0004567343428675148, 'samples': 5785536, 'steps': 30132, 'loss/train': 0.08979174494743347} -08/30/2021 18:42:36 - INFO - __main__ - Step 30134: {'lr': 0.00045673135887023874, 'samples': 5785728, 'steps': 30133, 'loss/train': 1.2370126247406006} -08/30/2021 18:42:39 - INFO - __main__ - Step 30135: {'lr': 0.0004567283747798128, 'samples': 5785920, 'steps': 30134, 'loss/train': 1.1754133701324463} -08/30/2021 18:42:39 - INFO - __main__ - Step 30136: {'lr': 0.0004567253905962383, 'samples': 5786112, 'steps': 30135, 'loss/train': 1.1998401880264282} -08/30/2021 18:42:39 - INFO - __main__ - Step 30137: {'lr': 0.00045672240631951645, 'samples': 5786304, 'steps': 30136, 'loss/train': 1.383865475654602} -08/30/2021 18:42:40 - INFO - __main__ - Step 30138: {'lr': 0.0004567194219496487, 'samples': 5786496, 'steps': 30137, 'loss/train': 1.4130598306655884} -08/30/2021 18:42:40 - INFO - __main__ - Step 30139: {'lr': 0.0004567164374866363, 'samples': 5786688, 'steps': 30138, 'loss/train': 1.578806757926941} -08/30/2021 18:42:42 - INFO - __main__ - Step 30140: {'lr': 0.00045671345293048075, 'samples': 5786880, 'steps': 30139, 'loss/train': 1.3131394386291504} -08/30/2021 18:42:42 - INFO - __main__ - Step 30141: {'lr': 0.00045671046828118324, 'samples': 5787072, 'steps': 30140, 'loss/train': 1.7229034900665283} -08/30/2021 18:42:42 - INFO - __main__ - Step 30142: {'lr': 0.0004567074835387452, 'samples': 5787264, 'steps': 30141, 'loss/train': 1.0348509550094604} -08/30/2021 18:42:43 - INFO - __main__ - Step 30143: {'lr': 0.000456704498703168, 'samples': 5787456, 'steps': 30142, 'loss/train': 1.679243564605713} -08/30/2021 18:42:43 - INFO - __main__ - Step 30144: {'lr': 0.0004567015137744529, 'samples': 5787648, 'steps': 30143, 'loss/train': 1.3586660623550415} -08/30/2021 18:42:45 - INFO - __main__ - Step 30145: {'lr': 0.00045669852875260134, 'samples': 5787840, 'steps': 30144, 'loss/train': 1.4935890436172485} -08/30/2021 18:42:45 - INFO - __main__ - Step 30146: {'lr': 0.00045669554363761454, 'samples': 5788032, 'steps': 30145, 'loss/train': 1.7534693479537964} -08/30/2021 18:42:45 - INFO - __main__ - Step 30147: {'lr': 0.0004566925584294939, 'samples': 5788224, 'steps': 30146, 'loss/train': 1.4882893562316895} -08/30/2021 18:42:46 - INFO - __main__ - Step 30148: {'lr': 0.00045668957312824086, 'samples': 5788416, 'steps': 30147, 'loss/train': 1.5803802013397217} -08/30/2021 18:42:46 - INFO - __main__ - Step 30149: {'lr': 0.00045668658773385663, 'samples': 5788608, 'steps': 30148, 'loss/train': 1.4983325004577637} -08/30/2021 18:42:48 - INFO - __main__ - Step 30150: {'lr': 0.00045668360224634263, 'samples': 5788800, 'steps': 30149, 'loss/train': 1.3118733167648315} -08/30/2021 18:42:48 - INFO - __main__ - Step 30151: {'lr': 0.00045668061666570027, 'samples': 5788992, 'steps': 30150, 'loss/train': 1.634933352470398} -08/30/2021 18:42:48 - INFO - __main__ - Step 30152: {'lr': 0.0004566776309919307, 'samples': 5789184, 'steps': 30151, 'loss/train': 1.7133467197418213} -08/30/2021 18:42:49 - INFO - __main__ - Step 30153: {'lr': 0.0004566746452250354, 'samples': 5789376, 'steps': 30152, 'loss/train': 1.4850605726242065} -08/30/2021 18:42:49 - INFO - __main__ - Step 30154: {'lr': 0.00045667165936501573, 'samples': 5789568, 'steps': 30153, 'loss/train': 1.2529581785202026} -08/30/2021 18:42:51 - INFO - __main__ - Step 30155: {'lr': 0.000456668673411873, 'samples': 5789760, 'steps': 30154, 'loss/train': 1.7884093523025513} -08/30/2021 18:42:51 - INFO - __main__ - Step 30156: {'lr': 0.00045666568736560853, 'samples': 5789952, 'steps': 30155, 'loss/train': 2.024064779281616} -08/30/2021 18:42:51 - INFO - __main__ - Step 30157: {'lr': 0.0004566627012262238, 'samples': 5790144, 'steps': 30156, 'loss/train': 1.4978951215744019} -08/30/2021 18:42:52 - INFO - __main__ - Step 30158: {'lr': 0.0004566597149937199, 'samples': 5790336, 'steps': 30157, 'loss/train': 1.2400438785552979} -08/30/2021 18:42:52 - INFO - __main__ - Step 30159: {'lr': 0.00045665672866809835, 'samples': 5790528, 'steps': 30158, 'loss/train': 1.5105055570602417} -08/30/2021 18:42:52 - INFO - __main__ - Step 30160: {'lr': 0.0004566537422493605, 'samples': 5790720, 'steps': 30159, 'loss/train': 1.6243542432785034} -08/30/2021 18:42:54 - INFO - __main__ - Step 30161: {'lr': 0.00045665075573750764, 'samples': 5790912, 'steps': 30160, 'loss/train': 0.8696616888046265} -08/30/2021 18:42:55 - INFO - __main__ - Step 30162: {'lr': 0.00045664776913254115, 'samples': 5791104, 'steps': 30161, 'loss/train': 1.4763052463531494} -08/30/2021 18:42:55 - INFO - __main__ - Step 30163: {'lr': 0.0004566447824344624, 'samples': 5791296, 'steps': 30162, 'loss/train': 1.5289149284362793} -08/30/2021 18:42:55 - INFO - __main__ - Step 30164: {'lr': 0.00045664179564327266, 'samples': 5791488, 'steps': 30163, 'loss/train': 1.2755883932113647} -08/30/2021 18:42:56 - INFO - __main__ - Step 30165: {'lr': 0.00045663880875897325, 'samples': 5791680, 'steps': 30164, 'loss/train': 1.2715866565704346} -08/30/2021 18:42:57 - INFO - __main__ - Step 30166: {'lr': 0.00045663582178156564, 'samples': 5791872, 'steps': 30165, 'loss/train': 1.1453654766082764} -08/30/2021 18:42:58 - INFO - __main__ - Step 30167: {'lr': 0.00045663283471105115, 'samples': 5792064, 'steps': 30166, 'loss/train': 1.3923983573913574} -08/30/2021 18:42:58 - INFO - __main__ - Step 30168: {'lr': 0.00045662984754743106, 'samples': 5792256, 'steps': 30167, 'loss/train': 1.6533193588256836} -08/30/2021 18:42:58 - INFO - __main__ - Step 30169: {'lr': 0.00045662686029070674, 'samples': 5792448, 'steps': 30168, 'loss/train': 1.6843254566192627} -08/30/2021 18:42:59 - INFO - __main__ - Step 30170: {'lr': 0.0004566238729408796, 'samples': 5792640, 'steps': 30169, 'loss/train': 0.06722897291183472} -08/30/2021 18:43:00 - INFO - __main__ - Step 30171: {'lr': 0.00045662088549795087, 'samples': 5792832, 'steps': 30170, 'loss/train': 1.1034841537475586} -08/30/2021 18:43:01 - INFO - __main__ - Step 30172: {'lr': 0.000456617897961922, 'samples': 5793024, 'steps': 30171, 'loss/train': 1.658542513847351} -08/30/2021 18:43:01 - INFO - __main__ - Step 30173: {'lr': 0.00045661491033279427, 'samples': 5793216, 'steps': 30172, 'loss/train': 0.5844011902809143} -08/30/2021 18:43:01 - INFO - __main__ - Step 30174: {'lr': 0.00045661192261056905, 'samples': 5793408, 'steps': 30173, 'loss/train': 2.0529794692993164} -08/30/2021 18:43:02 - INFO - __main__ - Step 30175: {'lr': 0.00045660893479524767, 'samples': 5793600, 'steps': 30174, 'loss/train': 1.4518444538116455} -08/30/2021 18:43:02 - INFO - __main__ - Step 30176: {'lr': 0.00045660594688683154, 'samples': 5793792, 'steps': 30175, 'loss/train': 1.4589122533798218} -08/30/2021 18:43:03 - INFO - __main__ - Step 30177: {'lr': 0.00045660295888532196, 'samples': 5793984, 'steps': 30176, 'loss/train': 1.7479100227355957} -08/30/2021 18:43:04 - INFO - __main__ - Step 30178: {'lr': 0.00045659997079072024, 'samples': 5794176, 'steps': 30177, 'loss/train': 1.6250731945037842} -08/30/2021 18:43:04 - INFO - __main__ - Step 30179: {'lr': 0.00045659698260302773, 'samples': 5794368, 'steps': 30178, 'loss/train': 1.00252103805542} -08/30/2021 18:43:04 - INFO - __main__ - Step 30180: {'lr': 0.00045659399432224583, 'samples': 5794560, 'steps': 30179, 'loss/train': 1.6312451362609863} -08/30/2021 18:43:05 - INFO - __main__ - Step 30181: {'lr': 0.00045659100594837586, 'samples': 5794752, 'steps': 30180, 'loss/train': 0.9336314797401428} -08/30/2021 18:43:06 - INFO - __main__ - Step 30182: {'lr': 0.0004565880174814192, 'samples': 5794944, 'steps': 30181, 'loss/train': 1.6134107112884521} -08/30/2021 18:43:07 - INFO - __main__ - Step 30183: {'lr': 0.0004565850289213772, 'samples': 5795136, 'steps': 30182, 'loss/train': 1.3392689228057861} -08/30/2021 18:43:07 - INFO - __main__ - Step 30184: {'lr': 0.0004565820402682511, 'samples': 5795328, 'steps': 30183, 'loss/train': 1.3019702434539795} -08/30/2021 18:43:08 - INFO - __main__ - Step 30185: {'lr': 0.00045657905152204236, 'samples': 5795520, 'steps': 30184, 'loss/train': 1.1344388723373413} -08/30/2021 18:43:08 - INFO - __main__ - Step 30186: {'lr': 0.0004565760626827523, 'samples': 5795712, 'steps': 30185, 'loss/train': 1.4040650129318237} -08/30/2021 18:43:09 - INFO - __main__ - Step 30187: {'lr': 0.00045657307375038226, 'samples': 5795904, 'steps': 30186, 'loss/train': 1.4295676946640015} -08/30/2021 18:43:10 - INFO - __main__ - Step 30188: {'lr': 0.00045657008472493356, 'samples': 5796096, 'steps': 30187, 'loss/train': 1.5498725175857544} -08/30/2021 18:43:10 - INFO - __main__ - Step 30189: {'lr': 0.0004565670956064075, 'samples': 5796288, 'steps': 30188, 'loss/train': 1.233457326889038} -08/30/2021 18:43:11 - INFO - __main__ - Step 30190: {'lr': 0.00045656410639480563, 'samples': 5796480, 'steps': 30189, 'loss/train': 1.3556773662567139} -08/30/2021 18:43:11 - INFO - __main__ - Step 30191: {'lr': 0.00045656111709012906, 'samples': 5796672, 'steps': 30190, 'loss/train': 1.4870336055755615} -08/30/2021 18:43:13 - INFO - __main__ - Step 30192: {'lr': 0.00045655812769237927, 'samples': 5796864, 'steps': 30191, 'loss/train': 1.584865689277649} -08/30/2021 18:43:13 - INFO - __main__ - Step 30193: {'lr': 0.00045655513820155755, 'samples': 5797056, 'steps': 30192, 'loss/train': 1.6792405843734741} -08/30/2021 18:43:14 - INFO - __main__ - Step 30194: {'lr': 0.00045655214861766525, 'samples': 5797248, 'steps': 30193, 'loss/train': 1.3730969429016113} -08/30/2021 18:43:14 - INFO - __main__ - Step 30195: {'lr': 0.0004565491589407038, 'samples': 5797440, 'steps': 30194, 'loss/train': 1.281630277633667} -08/30/2021 18:43:14 - INFO - __main__ - Step 30196: {'lr': 0.0004565461691706745, 'samples': 5797632, 'steps': 30195, 'loss/train': 1.7849072217941284} -08/30/2021 18:43:16 - INFO - __main__ - Step 30197: {'lr': 0.0004565431793075786, 'samples': 5797824, 'steps': 30196, 'loss/train': 1.6919240951538086} -08/30/2021 18:43:16 - INFO - __main__ - Step 30198: {'lr': 0.0004565401893514176, 'samples': 5798016, 'steps': 30197, 'loss/train': 1.2529618740081787} -08/30/2021 18:43:17 - INFO - __main__ - Step 30199: {'lr': 0.0004565371993021927, 'samples': 5798208, 'steps': 30198, 'loss/train': 1.8620270490646362} -08/30/2021 18:43:17 - INFO - __main__ - Step 30200: {'lr': 0.00045653420915990546, 'samples': 5798400, 'steps': 30199, 'loss/train': 0.07246321439743042} -08/30/2021 18:43:18 - INFO - __main__ - Step 30201: {'lr': 0.000456531218924557, 'samples': 5798592, 'steps': 30200, 'loss/train': 1.1189396381378174} -08/30/2021 18:43:19 - INFO - __main__ - Step 30202: {'lr': 0.0004565282285961488, 'samples': 5798784, 'steps': 30201, 'loss/train': 1.650571346282959} -08/30/2021 18:43:20 - INFO - __main__ - Step 30203: {'lr': 0.0004565252381746821, 'samples': 5798976, 'steps': 30202, 'loss/train': 1.138083577156067} -08/30/2021 18:43:20 - INFO - __main__ - Step 30204: {'lr': 0.0004565222476601584, 'samples': 5799168, 'steps': 30203, 'loss/train': 1.4301347732543945} -08/30/2021 18:43:20 - INFO - __main__ - Step 30205: {'lr': 0.0004565192570525789, 'samples': 5799360, 'steps': 30204, 'loss/train': 1.7329448461532593} -08/30/2021 18:43:21 - INFO - __main__ - Step 30206: {'lr': 0.00045651626635194497, 'samples': 5799552, 'steps': 30205, 'loss/train': 1.1468639373779297} -08/30/2021 18:43:21 - INFO - __main__ - Step 30207: {'lr': 0.0004565132755582581, 'samples': 5799744, 'steps': 30206, 'loss/train': 1.754542350769043} -08/30/2021 18:43:22 - INFO - __main__ - Step 30208: {'lr': 0.0004565102846715195, 'samples': 5799936, 'steps': 30207, 'loss/train': 1.1099430322647095} -08/30/2021 18:43:23 - INFO - __main__ - Step 30209: {'lr': 0.0004565072936917305, 'samples': 5800128, 'steps': 30208, 'loss/train': 0.9972745180130005} -08/30/2021 18:43:23 - INFO - __main__ - Step 30210: {'lr': 0.0004565043026188926, 'samples': 5800320, 'steps': 30209, 'loss/train': 1.6816481351852417} -08/30/2021 18:43:24 - INFO - __main__ - Step 30211: {'lr': 0.000456501311453007, 'samples': 5800512, 'steps': 30210, 'loss/train': 1.667494297027588} -08/30/2021 18:43:24 - INFO - __main__ - Step 30212: {'lr': 0.00045649832019407504, 'samples': 5800704, 'steps': 30211, 'loss/train': 0.8554044961929321} -08/30/2021 18:43:26 - INFO - __main__ - Step 30213: {'lr': 0.0004564953288420982, 'samples': 5800896, 'steps': 30212, 'loss/train': 1.314995288848877} -08/30/2021 18:43:26 - INFO - __main__ - Step 30214: {'lr': 0.00045649233739707774, 'samples': 5801088, 'steps': 30213, 'loss/train': 1.822932243347168} -08/30/2021 18:43:27 - INFO - __main__ - Step 30215: {'lr': 0.00045648934585901496, 'samples': 5801280, 'steps': 30214, 'loss/train': 2.0202341079711914} -08/30/2021 18:43:27 - INFO - __main__ - Step 30216: {'lr': 0.0004564863542279113, 'samples': 5801472, 'steps': 30215, 'loss/train': 1.5291169881820679} -08/30/2021 18:43:27 - INFO - __main__ - Step 30217: {'lr': 0.0004564833625037681, 'samples': 5801664, 'steps': 30216, 'loss/train': 0.048660457134246826} -08/30/2021 18:43:28 - INFO - __main__ - Step 30218: {'lr': 0.00045648037068658667, 'samples': 5801856, 'steps': 30217, 'loss/train': 0.1317969411611557} -08/30/2021 18:43:29 - INFO - __main__ - Step 30219: {'lr': 0.00045647737877636834, 'samples': 5802048, 'steps': 30218, 'loss/train': 1.5373785495758057} -08/30/2021 18:43:30 - INFO - __main__ - Step 30220: {'lr': 0.0004564743867731145, 'samples': 5802240, 'steps': 30219, 'loss/train': 1.494742512702942} -08/30/2021 18:43:30 - INFO - __main__ - Step 30221: {'lr': 0.0004564713946768265, 'samples': 5802432, 'steps': 30220, 'loss/train': 1.335472583770752} -08/30/2021 18:43:30 - INFO - __main__ - Step 30222: {'lr': 0.0004564684024875057, 'samples': 5802624, 'steps': 30221, 'loss/train': 1.1151351928710938} -08/30/2021 18:43:31 - INFO - __main__ - Step 30223: {'lr': 0.0004564654102051534, 'samples': 5802816, 'steps': 30222, 'loss/train': 2.1353673934936523} -08/30/2021 18:43:33 - INFO - __main__ - Step 30224: {'lr': 0.000456462417829771, 'samples': 5803008, 'steps': 30223, 'loss/train': 1.6881850957870483} -08/30/2021 18:43:33 - INFO - __main__ - Step 30225: {'lr': 0.0004564594253613598, 'samples': 5803200, 'steps': 30224, 'loss/train': 1.6358420848846436} -08/30/2021 18:43:33 - INFO - __main__ - Step 30226: {'lr': 0.0004564564327999211, 'samples': 5803392, 'steps': 30225, 'loss/train': 1.6034457683563232} -08/30/2021 18:43:34 - INFO - __main__ - Step 30227: {'lr': 0.00045645344014545643, 'samples': 5803584, 'steps': 30226, 'loss/train': 1.9370226860046387} -08/30/2021 18:43:34 - INFO - __main__ - Step 30228: {'lr': 0.00045645044739796694, 'samples': 5803776, 'steps': 30227, 'loss/train': 0.7137978076934814} -08/30/2021 18:43:36 - INFO - __main__ - Step 30229: {'lr': 0.00045644745455745414, 'samples': 5803968, 'steps': 30228, 'loss/train': 1.1334476470947266} -08/30/2021 18:43:36 - INFO - __main__ - Step 30230: {'lr': 0.0004564444616239193, 'samples': 5804160, 'steps': 30229, 'loss/train': 1.7633591890335083} -08/30/2021 18:43:37 - INFO - __main__ - Step 30231: {'lr': 0.0004564414685973637, 'samples': 5804352, 'steps': 30230, 'loss/train': 2.0532965660095215} -08/30/2021 18:43:37 - INFO - __main__ - Step 30232: {'lr': 0.0004564384754777888, 'samples': 5804544, 'steps': 30231, 'loss/train': 0.8657008409500122} -08/30/2021 18:43:37 - INFO - __main__ - Step 30233: {'lr': 0.00045643548226519587, 'samples': 5804736, 'steps': 30232, 'loss/train': 1.361954927444458} -08/30/2021 18:43:39 - INFO - __main__ - Step 30234: {'lr': 0.00045643248895958636, 'samples': 5804928, 'steps': 30233, 'loss/train': 1.7255884408950806} -08/30/2021 18:43:40 - INFO - __main__ - Step 30235: {'lr': 0.00045642949556096146, 'samples': 5805120, 'steps': 30234, 'loss/train': 1.2330719232559204} -08/30/2021 18:43:40 - INFO - __main__ - Step 30236: {'lr': 0.0004564265020693227, 'samples': 5805312, 'steps': 30235, 'loss/train': 1.0297609567642212} -08/30/2021 18:43:40 - INFO - __main__ - Step 30237: {'lr': 0.0004564235084846713, 'samples': 5805504, 'steps': 30236, 'loss/train': 0.3304782509803772} -08/30/2021 18:43:41 - INFO - __main__ - Step 30238: {'lr': 0.00045642051480700873, 'samples': 5805696, 'steps': 30237, 'loss/train': 1.4655193090438843} -08/30/2021 18:43:43 - INFO - __main__ - Step 30239: {'lr': 0.0004564175210363362, 'samples': 5805888, 'steps': 30238, 'loss/train': 1.2773939371109009} -08/30/2021 18:43:43 - INFO - __main__ - Step 30240: {'lr': 0.00045641452717265507, 'samples': 5806080, 'steps': 30239, 'loss/train': 1.745729923248291} -08/30/2021 18:43:43 - INFO - __main__ - Step 30241: {'lr': 0.00045641153321596687, 'samples': 5806272, 'steps': 30240, 'loss/train': 1.2591203451156616} -08/30/2021 18:43:44 - INFO - __main__ - Step 30242: {'lr': 0.0004564085391662727, 'samples': 5806464, 'steps': 30241, 'loss/train': 1.8606942892074585} -08/30/2021 18:43:44 - INFO - __main__ - Step 30243: {'lr': 0.00045640554502357413, 'samples': 5806656, 'steps': 30242, 'loss/train': 1.4952788352966309} -08/30/2021 18:43:45 - INFO - __main__ - Step 30244: {'lr': 0.0004564025507878723, 'samples': 5806848, 'steps': 30243, 'loss/train': 0.05463343858718872} -08/30/2021 18:43:46 - INFO - __main__ - Step 30245: {'lr': 0.00045639955645916875, 'samples': 5807040, 'steps': 30244, 'loss/train': 1.0868946313858032} -08/30/2021 18:43:47 - INFO - __main__ - Step 30246: {'lr': 0.0004563965620374647, 'samples': 5807232, 'steps': 30245, 'loss/train': 1.633384108543396} -08/30/2021 18:43:47 - INFO - __main__ - Step 30247: {'lr': 0.0004563935675227615, 'samples': 5807424, 'steps': 30246, 'loss/train': 2.012517213821411} -08/30/2021 18:43:48 - INFO - __main__ - Step 30248: {'lr': 0.00045639057291506065, 'samples': 5807616, 'steps': 30247, 'loss/train': 1.6251734495162964} -08/30/2021 18:43:48 - INFO - __main__ - Step 30249: {'lr': 0.0004563875782143633, 'samples': 5807808, 'steps': 30248, 'loss/train': 1.6240020990371704} -08/30/2021 18:43:50 - INFO - __main__ - Step 30250: {'lr': 0.000456384583420671, 'samples': 5808000, 'steps': 30249, 'loss/train': 1.500151515007019} -08/30/2021 18:43:50 - INFO - __main__ - Step 30251: {'lr': 0.0004563815885339849, 'samples': 5808192, 'steps': 30250, 'loss/train': 1.3753119707107544} -08/30/2021 18:43:50 - INFO - __main__ - Step 30252: {'lr': 0.00045637859355430647, 'samples': 5808384, 'steps': 30251, 'loss/train': 3.035808801651001} -08/30/2021 18:43:51 - INFO - __main__ - Step 30253: {'lr': 0.000456375598481637, 'samples': 5808576, 'steps': 30252, 'loss/train': 1.6513733863830566} -08/30/2021 18:43:51 - INFO - __main__ - Step 30254: {'lr': 0.00045637260331597793, 'samples': 5808768, 'steps': 30253, 'loss/train': 1.4726425409317017} -08/30/2021 18:43:52 - INFO - __main__ - Step 30255: {'lr': 0.00045636960805733054, 'samples': 5808960, 'steps': 30254, 'loss/train': 1.8462722301483154} -08/30/2021 18:43:53 - INFO - __main__ - Step 30256: {'lr': 0.0004563666127056961, 'samples': 5809152, 'steps': 30255, 'loss/train': 1.6160821914672852} -08/30/2021 18:43:54 - INFO - __main__ - Step 30257: {'lr': 0.0004563636172610761, 'samples': 5809344, 'steps': 30256, 'loss/train': 1.7190073728561401} -08/30/2021 18:43:54 - INFO - __main__ - Step 30258: {'lr': 0.00045636062172347186, 'samples': 5809536, 'steps': 30257, 'loss/train': 1.7073683738708496} -08/30/2021 18:43:55 - INFO - __main__ - Step 30259: {'lr': 0.0004563576260928847, 'samples': 5809728, 'steps': 30258, 'loss/train': 1.3867048025131226} -08/30/2021 18:43:55 - INFO - __main__ - Step 30260: {'lr': 0.000456354630369316, 'samples': 5809920, 'steps': 30259, 'loss/train': 1.340516448020935} -08/30/2021 18:43:57 - INFO - __main__ - Step 30261: {'lr': 0.00045635163455276707, 'samples': 5810112, 'steps': 30260, 'loss/train': 1.2688188552856445} -08/30/2021 18:43:57 - INFO - __main__ - Step 30262: {'lr': 0.0004563486386432393, 'samples': 5810304, 'steps': 30261, 'loss/train': 1.3179888725280762} -08/30/2021 18:43:57 - INFO - __main__ - Step 30263: {'lr': 0.00045634564264073396, 'samples': 5810496, 'steps': 30262, 'loss/train': 1.367193579673767} -08/30/2021 18:43:58 - INFO - __main__ - Step 30264: {'lr': 0.0004563426465452525, 'samples': 5810688, 'steps': 30263, 'loss/train': 2.21877121925354} -08/30/2021 18:43:58 - INFO - __main__ - Step 30265: {'lr': 0.00045633965035679614, 'samples': 5810880, 'steps': 30264, 'loss/train': 1.3574408292770386} -08/30/2021 18:44:00 - INFO - __main__ - Step 30266: {'lr': 0.0004563366540753664, 'samples': 5811072, 'steps': 30265, 'loss/train': 0.5013177990913391} -08/30/2021 18:44:00 - INFO - __main__ - Step 30267: {'lr': 0.00045633365770096456, 'samples': 5811264, 'steps': 30266, 'loss/train': 1.197783350944519} -08/30/2021 18:44:00 - INFO - __main__ - Step 30268: {'lr': 0.000456330661233592, 'samples': 5811456, 'steps': 30267, 'loss/train': 1.3258761167526245} -08/30/2021 18:44:01 - INFO - __main__ - Step 30269: {'lr': 0.00045632766467324995, 'samples': 5811648, 'steps': 30268, 'loss/train': 1.1505438089370728} -08/30/2021 18:44:01 - INFO - __main__ - Step 30270: {'lr': 0.0004563246680199398, 'samples': 5811840, 'steps': 30269, 'loss/train': 1.3651236295700073} -08/30/2021 18:44:03 - INFO - __main__ - Step 30271: {'lr': 0.000456321671273663, 'samples': 5812032, 'steps': 30270, 'loss/train': 1.547912359237671} -08/30/2021 18:44:03 - INFO - __main__ - Step 30272: {'lr': 0.00045631867443442084, 'samples': 5812224, 'steps': 30271, 'loss/train': 1.3571466207504272} -08/30/2021 18:44:03 - INFO - __main__ - Step 30273: {'lr': 0.00045631567750221465, 'samples': 5812416, 'steps': 30272, 'loss/train': 0.5563685894012451} -08/30/2021 18:44:04 - INFO - __main__ - Step 30274: {'lr': 0.0004563126804770458, 'samples': 5812608, 'steps': 30273, 'loss/train': 0.21116133034229279} -08/30/2021 18:44:04 - INFO - __main__ - Step 30275: {'lr': 0.00045630968335891564, 'samples': 5812800, 'steps': 30274, 'loss/train': 1.1514426469802856} -08/30/2021 18:44:06 - INFO - __main__ - Step 30276: {'lr': 0.00045630668614782553, 'samples': 5812992, 'steps': 30275, 'loss/train': 1.4305827617645264} -08/30/2021 18:44:06 - INFO - __main__ - Step 30277: {'lr': 0.0004563036888437768, 'samples': 5813184, 'steps': 30276, 'loss/train': 1.6732763051986694} -08/30/2021 18:44:07 - INFO - __main__ - Step 30278: {'lr': 0.0004563006914467709, 'samples': 5813376, 'steps': 30277, 'loss/train': 1.6876115798950195} -08/30/2021 18:44:07 - INFO - __main__ - Step 30279: {'lr': 0.000456297693956809, 'samples': 5813568, 'steps': 30278, 'loss/train': 2.2432475090026855} -08/30/2021 18:44:07 - INFO - __main__ - Step 30280: {'lr': 0.0004562946963738925, 'samples': 5813760, 'steps': 30279, 'loss/train': 0.1259242445230484} -08/30/2021 18:44:09 - INFO - __main__ - Step 30281: {'lr': 0.0004562916986980229, 'samples': 5813952, 'steps': 30280, 'loss/train': 1.3225913047790527} -08/30/2021 18:44:09 - INFO - __main__ - Step 30282: {'lr': 0.0004562887009292014, 'samples': 5814144, 'steps': 30281, 'loss/train': 1.4863812923431396} -08/30/2021 18:44:10 - INFO - __main__ - Step 30283: {'lr': 0.0004562857030674293, 'samples': 5814336, 'steps': 30282, 'loss/train': 2.1995954513549805} -08/30/2021 18:44:10 - INFO - __main__ - Step 30284: {'lr': 0.0004562827051127082, 'samples': 5814528, 'steps': 30283, 'loss/train': 1.700416088104248} -08/30/2021 18:44:10 - INFO - __main__ - Step 30285: {'lr': 0.0004562797070650392, 'samples': 5814720, 'steps': 30284, 'loss/train': 1.8413176536560059} -08/30/2021 18:44:11 - INFO - __main__ - Step 30286: {'lr': 0.00045627670892442376, 'samples': 5814912, 'steps': 30285, 'loss/train': 1.8634073734283447} -08/30/2021 18:44:12 - INFO - __main__ - Step 30287: {'lr': 0.0004562737106908632, 'samples': 5815104, 'steps': 30286, 'loss/train': 0.5496020913124084} -08/30/2021 18:44:13 - INFO - __main__ - Step 30288: {'lr': 0.00045627071236435896, 'samples': 5815296, 'steps': 30287, 'loss/train': 1.1342387199401855} -08/30/2021 18:44:13 - INFO - __main__ - Step 30289: {'lr': 0.0004562677139449123, 'samples': 5815488, 'steps': 30288, 'loss/train': 1.2350637912750244} -08/30/2021 18:44:13 - INFO - __main__ - Step 30290: {'lr': 0.0004562647154325246, 'samples': 5815680, 'steps': 30289, 'loss/train': 1.3664730787277222} -08/30/2021 18:44:14 - INFO - __main__ - Step 30291: {'lr': 0.0004562617168271971, 'samples': 5815872, 'steps': 30290, 'loss/train': 1.5584747791290283} -08/30/2021 18:44:15 - INFO - __main__ - Step 30292: {'lr': 0.0004562587181289314, 'samples': 5816064, 'steps': 30291, 'loss/train': 1.0992379188537598} -08/30/2021 18:44:16 - INFO - __main__ - Step 30293: {'lr': 0.00045625571933772857, 'samples': 5816256, 'steps': 30292, 'loss/train': 1.3232252597808838} -08/30/2021 18:44:16 - INFO - __main__ - Step 30294: {'lr': 0.0004562527204535902, 'samples': 5816448, 'steps': 30293, 'loss/train': 1.5896888971328735} -08/30/2021 18:44:16 - INFO - __main__ - Step 30295: {'lr': 0.00045624972147651746, 'samples': 5816640, 'steps': 30294, 'loss/train': 1.650687336921692} -08/30/2021 18:44:17 - INFO - __main__ - Step 30296: {'lr': 0.00045624672240651183, 'samples': 5816832, 'steps': 30295, 'loss/train': 1.091670274734497} -08/30/2021 18:44:19 - INFO - __main__ - Step 30297: {'lr': 0.00045624372324357457, 'samples': 5817024, 'steps': 30296, 'loss/train': 1.6191810369491577} -08/30/2021 18:44:19 - INFO - __main__ - Step 30298: {'lr': 0.0004562407239877071, 'samples': 5817216, 'steps': 30297, 'loss/train': 1.0923471450805664} -08/30/2021 18:44:20 - INFO - __main__ - Step 30299: {'lr': 0.0004562377246389108, 'samples': 5817408, 'steps': 30298, 'loss/train': 1.4671701192855835} -08/30/2021 18:44:20 - INFO - __main__ - Step 30300: {'lr': 0.00045623472519718683, 'samples': 5817600, 'steps': 30299, 'loss/train': 1.7130595445632935} -08/30/2021 18:44:20 - INFO - __main__ - Step 30301: {'lr': 0.00045623172566253676, 'samples': 5817792, 'steps': 30300, 'loss/train': 1.9406265020370483} -08/30/2021 18:44:22 - INFO - __main__ - Step 30302: {'lr': 0.00045622872603496184, 'samples': 5817984, 'steps': 30301, 'loss/train': 1.835220217704773} -08/30/2021 18:44:22 - INFO - __main__ - Step 30303: {'lr': 0.0004562257263144635, 'samples': 5818176, 'steps': 30302, 'loss/train': 1.2928903102874756} -08/30/2021 18:44:23 - INFO - __main__ - Step 30304: {'lr': 0.0004562227265010429, 'samples': 5818368, 'steps': 30303, 'loss/train': 1.152180552482605} -08/30/2021 18:44:23 - INFO - __main__ - Step 30305: {'lr': 0.00045621972659470156, 'samples': 5818560, 'steps': 30304, 'loss/train': 1.1183836460113525} -08/30/2021 18:44:23 - INFO - __main__ - Step 30306: {'lr': 0.0004562167265954409, 'samples': 5818752, 'steps': 30305, 'loss/train': 1.7545011043548584} -08/30/2021 18:44:25 - INFO - __main__ - Step 30307: {'lr': 0.000456213726503262, 'samples': 5818944, 'steps': 30306, 'loss/train': 1.2700676918029785} -08/30/2021 18:44:25 - INFO - __main__ - Step 30308: {'lr': 0.0004562107263181665, 'samples': 5819136, 'steps': 30307, 'loss/train': 1.3349676132202148} -08/30/2021 18:44:26 - INFO - __main__ - Step 30309: {'lr': 0.0004562077260401556, 'samples': 5819328, 'steps': 30308, 'loss/train': 1.5274112224578857} -08/30/2021 18:44:26 - INFO - __main__ - Step 30310: {'lr': 0.00045620472566923064, 'samples': 5819520, 'steps': 30309, 'loss/train': 1.1159486770629883} -08/30/2021 18:44:26 - INFO - __main__ - Step 30311: {'lr': 0.0004562017252053931, 'samples': 5819712, 'steps': 30310, 'loss/train': 2.038820505142212} -08/30/2021 18:44:27 - INFO - __main__ - Step 30312: {'lr': 0.0004561987246486442, 'samples': 5819904, 'steps': 30311, 'loss/train': 1.2197567224502563} -08/30/2021 18:44:28 - INFO - __main__ - Step 30313: {'lr': 0.00045619572399898534, 'samples': 5820096, 'steps': 30312, 'loss/train': 1.556435227394104} -08/30/2021 18:44:29 - INFO - __main__ - Step 30314: {'lr': 0.0004561927232564179, 'samples': 5820288, 'steps': 30313, 'loss/train': 2.0947604179382324} -08/30/2021 18:44:29 - INFO - __main__ - Step 30315: {'lr': 0.00045618972242094313, 'samples': 5820480, 'steps': 30314, 'loss/train': 1.6830512285232544} -08/30/2021 18:44:30 - INFO - __main__ - Step 30316: {'lr': 0.00045618672149256244, 'samples': 5820672, 'steps': 30315, 'loss/train': 4.369750499725342} -08/30/2021 18:44:30 - INFO - __main__ - Step 30317: {'lr': 0.0004561837204712773, 'samples': 5820864, 'steps': 30316, 'loss/train': 1.4061806201934814} -08/30/2021 18:44:31 - INFO - __main__ - Step 30318: {'lr': 0.0004561807193570888, 'samples': 5821056, 'steps': 30317, 'loss/train': 1.1020888090133667} -08/30/2021 18:44:32 - INFO - __main__ - Step 30319: {'lr': 0.0004561777181499986, 'samples': 5821248, 'steps': 30318, 'loss/train': 1.3973207473754883} -08/30/2021 18:44:32 - INFO - __main__ - Step 30320: {'lr': 0.00045617471685000785, 'samples': 5821440, 'steps': 30319, 'loss/train': 1.3725110292434692} -08/30/2021 18:44:33 - INFO - __main__ - Step 30321: {'lr': 0.00045617171545711793, 'samples': 5821632, 'steps': 30320, 'loss/train': 1.4897971153259277} -08/30/2021 18:44:33 - INFO - __main__ - Step 30322: {'lr': 0.0004561687139713302, 'samples': 5821824, 'steps': 30321, 'loss/train': 1.5724416971206665} -08/30/2021 18:44:34 - INFO - __main__ - Step 30323: {'lr': 0.00045616571239264614, 'samples': 5822016, 'steps': 30322, 'loss/train': 3.423105239868164} -08/30/2021 18:44:35 - INFO - __main__ - Step 30324: {'lr': 0.0004561627107210669, 'samples': 5822208, 'steps': 30323, 'loss/train': 1.1945616006851196} -08/30/2021 18:44:35 - INFO - __main__ - Step 30325: {'lr': 0.00045615970895659393, 'samples': 5822400, 'steps': 30324, 'loss/train': 1.3767011165618896} -08/30/2021 18:44:36 - INFO - __main__ - Step 30326: {'lr': 0.00045615670709922855, 'samples': 5822592, 'steps': 30325, 'loss/train': 1.2165873050689697} -08/30/2021 18:44:36 - INFO - __main__ - Step 30327: {'lr': 0.0004561537051489722, 'samples': 5822784, 'steps': 30326, 'loss/train': 1.6331738233566284} -08/30/2021 18:44:38 - INFO - __main__ - Step 30328: {'lr': 0.00045615070310582617, 'samples': 5822976, 'steps': 30327, 'loss/train': 1.5106899738311768} -08/30/2021 18:44:38 - INFO - __main__ - Step 30329: {'lr': 0.00045614770096979177, 'samples': 5823168, 'steps': 30328, 'loss/train': 1.4452539682388306} -08/30/2021 18:44:39 - INFO - __main__ - Step 30330: {'lr': 0.0004561446987408704, 'samples': 5823360, 'steps': 30329, 'loss/train': 1.6874357461929321} -08/30/2021 18:44:39 - INFO - __main__ - Step 30331: {'lr': 0.00045614169641906344, 'samples': 5823552, 'steps': 30330, 'loss/train': 1.418391466140747} -08/30/2021 18:44:39 - INFO - __main__ - Step 30332: {'lr': 0.00045613869400437223, 'samples': 5823744, 'steps': 30331, 'loss/train': 1.51357102394104} -08/30/2021 18:44:40 - INFO - __main__ - Step 30333: {'lr': 0.000456135691496798, 'samples': 5823936, 'steps': 30332, 'loss/train': 2.1403818130493164} -08/30/2021 18:44:41 - INFO - __main__ - Step 30334: {'lr': 0.0004561326888963423, 'samples': 5824128, 'steps': 30333, 'loss/train': 0.5983277559280396} -08/30/2021 18:44:42 - INFO - __main__ - Step 30335: {'lr': 0.0004561296862030064, 'samples': 5824320, 'steps': 30334, 'loss/train': 2.2367749214172363} -08/30/2021 18:44:42 - INFO - __main__ - Step 30336: {'lr': 0.00045612668341679164, 'samples': 5824512, 'steps': 30335, 'loss/train': 1.6840192079544067} -08/30/2021 18:44:42 - INFO - __main__ - Step 30337: {'lr': 0.0004561236805376994, 'samples': 5824704, 'steps': 30336, 'loss/train': 1.0896717309951782} -08/30/2021 18:44:43 - INFO - __main__ - Step 30338: {'lr': 0.00045612067756573097, 'samples': 5824896, 'steps': 30337, 'loss/train': 1.8446327447891235} -08/30/2021 18:44:44 - INFO - __main__ - Step 30339: {'lr': 0.0004561176745008877, 'samples': 5825088, 'steps': 30338, 'loss/train': 1.6288559436798096} -08/30/2021 18:44:45 - INFO - __main__ - Step 30340: {'lr': 0.000456114671343171, 'samples': 5825280, 'steps': 30339, 'loss/train': 0.8107740879058838} -08/30/2021 18:44:45 - INFO - __main__ - Step 30341: {'lr': 0.00045611166809258227, 'samples': 5825472, 'steps': 30340, 'loss/train': 1.2054505348205566} -08/30/2021 18:44:45 - INFO - __main__ - Step 30342: {'lr': 0.0004561086647491227, 'samples': 5825664, 'steps': 30341, 'loss/train': 1.3367034196853638} -08/30/2021 18:44:46 - INFO - __main__ - Step 30343: {'lr': 0.00045610566131279386, 'samples': 5825856, 'steps': 30342, 'loss/train': 1.408198356628418} -08/30/2021 18:44:47 - INFO - __main__ - Step 30344: {'lr': 0.00045610265778359696, 'samples': 5826048, 'steps': 30343, 'loss/train': 2.10677433013916} -08/30/2021 18:44:48 - INFO - __main__ - Step 30345: {'lr': 0.00045609965416153333, 'samples': 5826240, 'steps': 30344, 'loss/train': 1.135197401046753} -08/30/2021 18:44:48 - INFO - __main__ - Step 30346: {'lr': 0.0004560966504466044, 'samples': 5826432, 'steps': 30345, 'loss/train': 1.3828952312469482} -08/30/2021 18:44:48 - INFO - __main__ - Step 30347: {'lr': 0.00045609364663881153, 'samples': 5826624, 'steps': 30346, 'loss/train': 0.8147543668746948} -08/30/2021 18:44:49 - INFO - __main__ - Step 30348: {'lr': 0.000456090642738156, 'samples': 5826816, 'steps': 30347, 'loss/train': 1.7437959909439087} -08/30/2021 18:44:49 - INFO - __main__ - Step 30349: {'lr': 0.00045608763874463925, 'samples': 5827008, 'steps': 30348, 'loss/train': 1.5902305841445923} -08/30/2021 18:44:51 - INFO - __main__ - Step 30350: {'lr': 0.00045608463465826257, 'samples': 5827200, 'steps': 30349, 'loss/train': 1.5159223079681396} -08/30/2021 18:44:51 - INFO - __main__ - Step 30351: {'lr': 0.0004560816304790274, 'samples': 5827392, 'steps': 30350, 'loss/train': 1.2611470222473145} -08/30/2021 18:44:51 - INFO - __main__ - Step 30352: {'lr': 0.0004560786262069349, 'samples': 5827584, 'steps': 30351, 'loss/train': 1.564341425895691} -08/30/2021 18:44:52 - INFO - __main__ - Step 30353: {'lr': 0.00045607562184198666, 'samples': 5827776, 'steps': 30352, 'loss/train': 1.856213927268982} -08/30/2021 18:44:52 - INFO - __main__ - Step 30354: {'lr': 0.00045607261738418384, 'samples': 5827968, 'steps': 30353, 'loss/train': 1.079045295715332} -08/30/2021 18:44:54 - INFO - __main__ - Step 30355: {'lr': 0.00045606961283352793, 'samples': 5828160, 'steps': 30354, 'loss/train': 1.1943246126174927} -08/30/2021 18:44:55 - INFO - __main__ - Step 30356: {'lr': 0.0004560666081900202, 'samples': 5828352, 'steps': 30355, 'loss/train': 1.3076484203338623} -08/30/2021 18:44:55 - INFO - __main__ - Step 30357: {'lr': 0.00045606360345366203, 'samples': 5828544, 'steps': 30356, 'loss/train': 2.0070269107818604} -08/30/2021 18:44:55 - INFO - __main__ - Step 30358: {'lr': 0.00045606059862445485, 'samples': 5828736, 'steps': 30357, 'loss/train': 1.4410141706466675} -08/30/2021 18:44:56 - INFO - __main__ - Step 30359: {'lr': 0.0004560575937023999, 'samples': 5828928, 'steps': 30358, 'loss/train': 1.287891149520874} -08/30/2021 18:44:56 - INFO - __main__ - Step 30360: {'lr': 0.0004560545886874986, 'samples': 5829120, 'steps': 30359, 'loss/train': 1.121692180633545} -08/30/2021 18:44:58 - INFO - __main__ - Step 30361: {'lr': 0.00045605158357975225, 'samples': 5829312, 'steps': 30360, 'loss/train': 0.9509807825088501} -08/30/2021 18:44:58 - INFO - __main__ - Step 30362: {'lr': 0.00045604857837916224, 'samples': 5829504, 'steps': 30361, 'loss/train': 1.219749927520752} -08/30/2021 18:44:58 - INFO - __main__ - Step 30363: {'lr': 0.0004560455730857299, 'samples': 5829696, 'steps': 30362, 'loss/train': 1.771064043045044} -08/30/2021 18:44:59 - INFO - __main__ - Step 30364: {'lr': 0.0004560425676994566, 'samples': 5829888, 'steps': 30363, 'loss/train': 2.072871208190918} -08/30/2021 18:44:59 - INFO - __main__ - Step 30365: {'lr': 0.00045603956222034384, 'samples': 5830080, 'steps': 30364, 'loss/train': 1.4741034507751465} -08/30/2021 18:45:00 - INFO - __main__ - Step 30366: {'lr': 0.0004560365566483927, 'samples': 5830272, 'steps': 30365, 'loss/train': 1.9049711227416992} -08/30/2021 18:45:01 - INFO - __main__ - Step 30367: {'lr': 0.00045603355098360466, 'samples': 5830464, 'steps': 30366, 'loss/train': 1.1554251909255981} -08/30/2021 18:45:01 - INFO - __main__ - Step 30368: {'lr': 0.00045603054522598107, 'samples': 5830656, 'steps': 30367, 'loss/train': 1.33742094039917} -08/30/2021 18:45:02 - INFO - __main__ - Step 30369: {'lr': 0.0004560275393755233, 'samples': 5830848, 'steps': 30368, 'loss/train': 1.3915207386016846} -08/30/2021 18:45:02 - INFO - __main__ - Step 30370: {'lr': 0.0004560245334322328, 'samples': 5831040, 'steps': 30369, 'loss/train': 1.3620425462722778} -08/30/2021 18:45:03 - INFO - __main__ - Step 30371: {'lr': 0.00045602152739611075, 'samples': 5831232, 'steps': 30370, 'loss/train': 1.658311367034912} -08/30/2021 18:45:04 - INFO - __main__ - Step 30372: {'lr': 0.0004560185212671586, 'samples': 5831424, 'steps': 30371, 'loss/train': 1.6842811107635498} -08/30/2021 18:45:04 - INFO - __main__ - Step 30373: {'lr': 0.00045601551504537765, 'samples': 5831616, 'steps': 30372, 'loss/train': 1.5125207901000977} -08/30/2021 18:45:05 - INFO - __main__ - Step 30374: {'lr': 0.0004560125087307693, 'samples': 5831808, 'steps': 30373, 'loss/train': 1.4070923328399658} -08/30/2021 18:45:05 - INFO - __main__ - Step 30375: {'lr': 0.00045600950232333495, 'samples': 5832000, 'steps': 30374, 'loss/train': 1.6056480407714844} -08/30/2021 18:45:07 - INFO - __main__ - Step 30376: {'lr': 0.00045600649582307586, 'samples': 5832192, 'steps': 30375, 'loss/train': 1.4013153314590454} -08/30/2021 18:45:07 - INFO - __main__ - Step 30377: {'lr': 0.00045600348922999334, 'samples': 5832384, 'steps': 30376, 'loss/train': 2.0876340866088867} -08/30/2021 18:45:07 - INFO - __main__ - Step 30378: {'lr': 0.0004560004825440889, 'samples': 5832576, 'steps': 30377, 'loss/train': 1.4471242427825928} -08/30/2021 18:45:08 - INFO - __main__ - Step 30379: {'lr': 0.0004559974757653639, 'samples': 5832768, 'steps': 30378, 'loss/train': 1.370341420173645} -08/30/2021 18:45:08 - INFO - __main__ - Step 30380: {'lr': 0.0004559944688938195, 'samples': 5832960, 'steps': 30379, 'loss/train': 0.9219102263450623} -08/30/2021 18:45:10 - INFO - __main__ - Step 30381: {'lr': 0.0004559914619294572, 'samples': 5833152, 'steps': 30380, 'loss/train': 1.3011467456817627} -08/30/2021 18:45:10 - INFO - __main__ - Step 30382: {'lr': 0.00045598845487227835, 'samples': 5833344, 'steps': 30381, 'loss/train': 1.8089731931686401} -08/30/2021 18:45:10 - INFO - __main__ - Step 30383: {'lr': 0.0004559854477222842, 'samples': 5833536, 'steps': 30382, 'loss/train': 0.9662899971008301} -08/30/2021 18:45:11 - INFO - __main__ - Step 30384: {'lr': 0.0004559824404794763, 'samples': 5833728, 'steps': 30383, 'loss/train': 1.0928486585617065} -08/30/2021 18:45:11 - INFO - __main__ - Step 30385: {'lr': 0.0004559794331438558, 'samples': 5833920, 'steps': 30384, 'loss/train': 1.5999665260314941} -08/30/2021 18:45:13 - INFO - __main__ - Step 30386: {'lr': 0.0004559764257154242, 'samples': 5834112, 'steps': 30385, 'loss/train': 1.3363968133926392} -08/30/2021 18:45:13 - INFO - __main__ - Step 30387: {'lr': 0.0004559734181941828, 'samples': 5834304, 'steps': 30386, 'loss/train': 0.4445675015449524} -08/30/2021 18:45:14 - INFO - __main__ - Step 30388: {'lr': 0.0004559704105801329, 'samples': 5834496, 'steps': 30387, 'loss/train': 0.03256768360733986} -08/30/2021 18:45:14 - INFO - __main__ - Step 30389: {'lr': 0.00045596740287327597, 'samples': 5834688, 'steps': 30388, 'loss/train': 1.8979212045669556} -08/30/2021 18:45:14 - INFO - __main__ - Step 30390: {'lr': 0.0004559643950736133, 'samples': 5834880, 'steps': 30389, 'loss/train': 1.4951472282409668} -08/30/2021 18:45:15 - INFO - __main__ - Step 30391: {'lr': 0.00045596138718114626, 'samples': 5835072, 'steps': 30390, 'loss/train': 1.3925122022628784} -08/30/2021 18:45:16 - INFO - __main__ - Step 30392: {'lr': 0.00045595837919587616, 'samples': 5835264, 'steps': 30391, 'loss/train': 1.2257037162780762} -08/30/2021 18:45:17 - INFO - __main__ - Step 30393: {'lr': 0.0004559553711178044, 'samples': 5835456, 'steps': 30392, 'loss/train': 1.2412104606628418} -08/30/2021 18:45:17 - INFO - __main__ - Step 30394: {'lr': 0.00045595236294693236, 'samples': 5835648, 'steps': 30393, 'loss/train': 1.705388069152832} -08/30/2021 18:45:17 - INFO - __main__ - Step 30395: {'lr': 0.00045594935468326137, 'samples': 5835840, 'steps': 30394, 'loss/train': 1.5520269870758057} -08/30/2021 18:45:18 - INFO - __main__ - Step 30396: {'lr': 0.00045594634632679275, 'samples': 5836032, 'steps': 30395, 'loss/train': 1.4333055019378662} -08/30/2021 18:45:19 - INFO - __main__ - Step 30397: {'lr': 0.0004559433378775278, 'samples': 5836224, 'steps': 30396, 'loss/train': 1.3411235809326172} -08/30/2021 18:45:20 - INFO - __main__ - Step 30398: {'lr': 0.00045594032933546813, 'samples': 5836416, 'steps': 30397, 'loss/train': 1.3540788888931274} -08/30/2021 18:45:20 - INFO - __main__ - Step 30399: {'lr': 0.00045593732070061484, 'samples': 5836608, 'steps': 30398, 'loss/train': 2.5351898670196533} -08/30/2021 18:45:20 - INFO - __main__ - Step 30400: {'lr': 0.00045593431197296934, 'samples': 5836800, 'steps': 30399, 'loss/train': 1.4136940240859985} -08/30/2021 18:45:21 - INFO - __main__ - Step 30401: {'lr': 0.00045593130315253305, 'samples': 5836992, 'steps': 30400, 'loss/train': 1.7455699443817139} -08/30/2021 18:45:21 - INFO - __main__ - Step 30402: {'lr': 0.0004559282942393073, 'samples': 5837184, 'steps': 30401, 'loss/train': 1.6552643775939941} -08/30/2021 18:45:22 - INFO - __main__ - Step 30403: {'lr': 0.00045592528523329346, 'samples': 5837376, 'steps': 30402, 'loss/train': 1.1807719469070435} -08/30/2021 18:45:23 - INFO - __main__ - Step 30404: {'lr': 0.0004559222761344928, 'samples': 5837568, 'steps': 30403, 'loss/train': 1.7294528484344482} -08/30/2021 18:45:23 - INFO - __main__ - Step 30405: {'lr': 0.0004559192669429068, 'samples': 5837760, 'steps': 30404, 'loss/train': 0.8706862926483154} -08/30/2021 18:45:24 - INFO - __main__ - Step 30406: {'lr': 0.0004559162576585367, 'samples': 5837952, 'steps': 30405, 'loss/train': 1.2970597743988037} -08/30/2021 18:45:24 - INFO - __main__ - Step 30407: {'lr': 0.00045591324828138396, 'samples': 5838144, 'steps': 30406, 'loss/train': 0.31338775157928467} -08/30/2021 18:45:26 - INFO - __main__ - Step 30408: {'lr': 0.0004559102388114499, 'samples': 5838336, 'steps': 30407, 'loss/train': 1.484430193901062} -08/30/2021 18:45:27 - INFO - __main__ - Step 30409: {'lr': 0.00045590722924873585, 'samples': 5838528, 'steps': 30408, 'loss/train': 1.5280474424362183} -08/30/2021 18:45:27 - INFO - __main__ - Step 30410: {'lr': 0.00045590421959324314, 'samples': 5838720, 'steps': 30409, 'loss/train': 1.1062175035476685} -08/30/2021 18:45:27 - INFO - __main__ - Step 30411: {'lr': 0.0004559012098449732, 'samples': 5838912, 'steps': 30410, 'loss/train': 1.1596845388412476} -08/30/2021 18:45:28 - INFO - __main__ - Step 30412: {'lr': 0.00045589820000392736, 'samples': 5839104, 'steps': 30411, 'loss/train': 1.6687703132629395} -08/30/2021 18:45:29 - INFO - __main__ - Step 30413: {'lr': 0.00045589519007010695, 'samples': 5839296, 'steps': 30412, 'loss/train': 1.4259675741195679} -08/30/2021 18:45:30 - INFO - __main__ - Step 30414: {'lr': 0.0004558921800435133, 'samples': 5839488, 'steps': 30413, 'loss/train': 1.2854440212249756} -08/30/2021 18:45:30 - INFO - __main__ - Step 30415: {'lr': 0.00045588916992414784, 'samples': 5839680, 'steps': 30414, 'loss/train': 0.9629214406013489} -08/30/2021 18:45:30 - INFO - __main__ - Step 30416: {'lr': 0.0004558861597120119, 'samples': 5839872, 'steps': 30415, 'loss/train': 1.0737756490707397} -08/30/2021 18:45:31 - INFO - __main__ - Step 30417: {'lr': 0.00045588314940710683, 'samples': 5840064, 'steps': 30416, 'loss/train': 1.508437156677246} -08/30/2021 18:45:32 - INFO - __main__ - Step 30418: {'lr': 0.00045588013900943404, 'samples': 5840256, 'steps': 30417, 'loss/train': 1.1975007057189941} -08/30/2021 18:45:33 - INFO - __main__ - Step 30419: {'lr': 0.0004558771285189948, 'samples': 5840448, 'steps': 30418, 'loss/train': 2.858619213104248} -08/30/2021 18:45:33 - INFO - __main__ - Step 30420: {'lr': 0.00045587411793579047, 'samples': 5840640, 'steps': 30419, 'loss/train': 1.9410632848739624} -08/30/2021 18:45:33 - INFO - __main__ - Step 30421: {'lr': 0.0004558711072598225, 'samples': 5840832, 'steps': 30420, 'loss/train': 1.23379647731781} -08/30/2021 18:45:34 - INFO - __main__ - Step 30422: {'lr': 0.0004558680964910922, 'samples': 5841024, 'steps': 30421, 'loss/train': 0.27774685621261597} -08/30/2021 18:45:35 - INFO - __main__ - Step 30423: {'lr': 0.0004558650856296008, 'samples': 5841216, 'steps': 30422, 'loss/train': 2.0526790618896484} -08/30/2021 18:45:36 - INFO - __main__ - Step 30424: {'lr': 0.0004558620746753499, 'samples': 5841408, 'steps': 30423, 'loss/train': 1.662615418434143} -08/30/2021 18:45:36 - INFO - __main__ - Step 30425: {'lr': 0.00045585906362834063, 'samples': 5841600, 'steps': 30424, 'loss/train': 1.230448842048645} -08/30/2021 18:45:36 - INFO - __main__ - Step 30426: {'lr': 0.00045585605248857456, 'samples': 5841792, 'steps': 30425, 'loss/train': 1.2588797807693481} -08/30/2021 18:45:37 - INFO - __main__ - Step 30427: {'lr': 0.00045585304125605276, 'samples': 5841984, 'steps': 30426, 'loss/train': 1.6771354675292969} -08/30/2021 18:45:37 - INFO - __main__ - Step 30428: {'lr': 0.0004558500299307768, 'samples': 5842176, 'steps': 30427, 'loss/train': 1.565519094467163} -08/30/2021 18:45:39 - INFO - __main__ - Step 30429: {'lr': 0.00045584701851274814, 'samples': 5842368, 'steps': 30428, 'loss/train': 0.7025896906852722} -08/30/2021 18:45:39 - INFO - __main__ - Step 30430: {'lr': 0.0004558440070019678, 'samples': 5842560, 'steps': 30429, 'loss/train': 0.9535374641418457} -08/30/2021 18:45:40 - INFO - __main__ - Step 30431: {'lr': 0.0004558409953984375, 'samples': 5842752, 'steps': 30430, 'loss/train': 1.8976178169250488} -08/30/2021 18:45:40 - INFO - __main__ - Step 30432: {'lr': 0.00045583798370215837, 'samples': 5842944, 'steps': 30431, 'loss/train': 1.605116605758667} -08/30/2021 18:45:40 - INFO - __main__ - Step 30433: {'lr': 0.00045583497191313175, 'samples': 5843136, 'steps': 30432, 'loss/train': 1.421343445777893} -08/30/2021 18:45:42 - INFO - __main__ - Step 30434: {'lr': 0.00045583196003135906, 'samples': 5843328, 'steps': 30433, 'loss/train': 1.241392970085144} -08/30/2021 18:45:42 - INFO - __main__ - Step 30435: {'lr': 0.0004558289480568417, 'samples': 5843520, 'steps': 30434, 'loss/train': 1.3463464975357056} -08/30/2021 18:45:43 - INFO - __main__ - Step 30436: {'lr': 0.00045582593598958107, 'samples': 5843712, 'steps': 30435, 'loss/train': 1.0346914529800415} -08/30/2021 18:45:43 - INFO - __main__ - Step 30437: {'lr': 0.00045582292382957836, 'samples': 5843904, 'steps': 30436, 'loss/train': 1.015781283378601} -08/30/2021 18:45:43 - INFO - __main__ - Step 30438: {'lr': 0.000455819911576835, 'samples': 5844096, 'steps': 30437, 'loss/train': 0.68913334608078} -08/30/2021 18:45:45 - INFO - __main__ - Step 30439: {'lr': 0.00045581689923135247, 'samples': 5844288, 'steps': 30438, 'loss/train': 1.3282723426818848} -08/30/2021 18:45:45 - INFO - __main__ - Step 30440: {'lr': 0.00045581388679313194, 'samples': 5844480, 'steps': 30439, 'loss/train': 1.3578760623931885} -08/30/2021 18:45:46 - INFO - __main__ - Step 30441: {'lr': 0.0004558108742621748, 'samples': 5844672, 'steps': 30440, 'loss/train': 1.2686543464660645} -08/30/2021 18:45:46 - INFO - __main__ - Step 30442: {'lr': 0.00045580786163848254, 'samples': 5844864, 'steps': 30441, 'loss/train': 1.8725361824035645} -08/30/2021 18:45:47 - INFO - __main__ - Step 30443: {'lr': 0.00045580484892205643, 'samples': 5845056, 'steps': 30442, 'loss/train': 0.21499814093112946} -08/30/2021 18:45:48 - INFO - __main__ - Step 30444: {'lr': 0.0004558018361128978, 'samples': 5845248, 'steps': 30443, 'loss/train': 1.5177667140960693} -08/30/2021 18:45:48 - INFO - __main__ - Step 30445: {'lr': 0.0004557988232110081, 'samples': 5845440, 'steps': 30444, 'loss/train': 1.489311933517456} -08/30/2021 18:45:49 - INFO - __main__ - Step 30446: {'lr': 0.00045579581021638855, 'samples': 5845632, 'steps': 30445, 'loss/train': 1.3952984809875488} -08/30/2021 18:45:49 - INFO - __main__ - Step 30447: {'lr': 0.00045579279712904057, 'samples': 5845824, 'steps': 30446, 'loss/train': 1.918003797531128} -08/30/2021 18:45:49 - INFO - __main__ - Step 30448: {'lr': 0.00045578978394896565, 'samples': 5846016, 'steps': 30447, 'loss/train': 1.2355464696884155} -08/30/2021 18:45:51 - INFO - __main__ - Step 30449: {'lr': 0.00045578677067616494, 'samples': 5846208, 'steps': 30448, 'loss/train': 1.6813616752624512} -08/30/2021 18:45:52 - INFO - __main__ - Step 30450: {'lr': 0.0004557837573106399, 'samples': 5846400, 'steps': 30449, 'loss/train': 1.2796074151992798} -08/30/2021 18:45:52 - INFO - __main__ - Step 30451: {'lr': 0.0004557807438523919, 'samples': 5846592, 'steps': 30450, 'loss/train': 6.387538433074951} -08/30/2021 18:45:53 - INFO - __main__ - Step 30452: {'lr': 0.00045577773030142224, 'samples': 5846784, 'steps': 30451, 'loss/train': 1.488860011100769} -08/30/2021 18:45:53 - INFO - __main__ - Step 30453: {'lr': 0.0004557747166577323, 'samples': 5846976, 'steps': 30452, 'loss/train': 1.4834585189819336} -08/30/2021 18:45:53 - INFO - __main__ - Step 30454: {'lr': 0.0004557717029213234, 'samples': 5847168, 'steps': 30453, 'loss/train': 1.0458354949951172} -08/30/2021 18:45:54 - INFO - __main__ - Step 30455: {'lr': 0.00045576868909219704, 'samples': 5847360, 'steps': 30454, 'loss/train': 0.03212663531303406} -08/30/2021 18:45:55 - INFO - __main__ - Step 30456: {'lr': 0.0004557656751703544, 'samples': 5847552, 'steps': 30455, 'loss/train': 1.2394939661026} -08/30/2021 18:45:55 - INFO - __main__ - Step 30457: {'lr': 0.000455762661155797, 'samples': 5847744, 'steps': 30456, 'loss/train': 1.448106050491333} -08/30/2021 18:45:56 - INFO - __main__ - Step 30458: {'lr': 0.0004557596470485261, 'samples': 5847936, 'steps': 30457, 'loss/train': 1.1777966022491455} -08/30/2021 18:45:56 - INFO - __main__ - Step 30459: {'lr': 0.0004557566328485431, 'samples': 5848128, 'steps': 30458, 'loss/train': 1.5696755647659302} -08/30/2021 18:45:57 - INFO - __main__ - Step 30460: {'lr': 0.00045575361855584927, 'samples': 5848320, 'steps': 30459, 'loss/train': 1.4418385028839111} -08/30/2021 18:45:59 - INFO - __main__ - Step 30461: {'lr': 0.00045575060417044614, 'samples': 5848512, 'steps': 30460, 'loss/train': 1.3801296949386597} -08/30/2021 18:45:59 - INFO - __main__ - Step 30462: {'lr': 0.0004557475896923349, 'samples': 5848704, 'steps': 30461, 'loss/train': 1.2891565561294556} -08/30/2021 18:46:00 - INFO - __main__ - Step 30463: {'lr': 0.0004557445751215169, 'samples': 5848896, 'steps': 30462, 'loss/train': 0.852066695690155} -08/30/2021 18:46:00 - INFO - __main__ - Step 30464: {'lr': 0.00045574156045799367, 'samples': 5849088, 'steps': 30463, 'loss/train': 1.145896077156067} -08/30/2021 18:46:00 - INFO - __main__ - Step 30465: {'lr': 0.0004557385457017664, 'samples': 5849280, 'steps': 30464, 'loss/train': 0.06214486062526703} -08/30/2021 18:46:02 - INFO - __main__ - Step 30466: {'lr': 0.0004557355308528366, 'samples': 5849472, 'steps': 30465, 'loss/train': 1.7655445337295532} -08/30/2021 18:46:02 - INFO - __main__ - Step 30467: {'lr': 0.00045573251591120545, 'samples': 5849664, 'steps': 30466, 'loss/train': 1.5356248617172241} -08/30/2021 18:46:03 - INFO - __main__ - Step 30468: {'lr': 0.00045572950087687447, 'samples': 5849856, 'steps': 30467, 'loss/train': 0.8759242296218872} -08/30/2021 18:46:03 - INFO - __main__ - Step 30469: {'lr': 0.0004557264857498449, 'samples': 5850048, 'steps': 30468, 'loss/train': 1.3312257528305054} -08/30/2021 18:46:03 - INFO - __main__ - Step 30470: {'lr': 0.0004557234705301182, 'samples': 5850240, 'steps': 30469, 'loss/train': 1.327883005142212} -08/30/2021 18:46:05 - INFO - __main__ - Step 30471: {'lr': 0.0004557204552176957, 'samples': 5850432, 'steps': 30470, 'loss/train': 1.6778514385223389} -08/30/2021 18:46:06 - INFO - __main__ - Step 30472: {'lr': 0.0004557174398125786, 'samples': 5850624, 'steps': 30471, 'loss/train': 2.120680332183838} -08/30/2021 18:46:06 - INFO - __main__ - Step 30473: {'lr': 0.00045571442431476856, 'samples': 5850816, 'steps': 30472, 'loss/train': 0.0953216403722763} -08/30/2021 18:46:06 - INFO - __main__ - Step 30474: {'lr': 0.0004557114087242667, 'samples': 5851008, 'steps': 30473, 'loss/train': 0.33750244975090027} -08/30/2021 18:46:07 - INFO - __main__ - Step 30475: {'lr': 0.0004557083930410745, 'samples': 5851200, 'steps': 30474, 'loss/train': 1.6529700756072998} -08/30/2021 18:46:08 - INFO - __main__ - Step 30476: {'lr': 0.0004557053772651932, 'samples': 5851392, 'steps': 30475, 'loss/train': 1.3859875202178955} -08/30/2021 18:46:09 - INFO - __main__ - Step 30477: {'lr': 0.00045570236139662426, 'samples': 5851584, 'steps': 30476, 'loss/train': 1.657836675643921} -08/30/2021 18:46:09 - INFO - __main__ - Step 30478: {'lr': 0.000455699345435369, 'samples': 5851776, 'steps': 30477, 'loss/train': 0.9254941344261169} -08/30/2021 18:46:09 - INFO - __main__ - Step 30479: {'lr': 0.0004556963293814288, 'samples': 5851968, 'steps': 30478, 'loss/train': 1.3769621849060059} -08/30/2021 18:46:10 - INFO - __main__ - Step 30480: {'lr': 0.000455693313234805, 'samples': 5852160, 'steps': 30479, 'loss/train': 1.717210054397583} -08/30/2021 18:46:11 - INFO - __main__ - Step 30481: {'lr': 0.000455690296995499, 'samples': 5852352, 'steps': 30480, 'loss/train': 1.1527591943740845} -08/30/2021 18:46:12 - INFO - __main__ - Step 30482: {'lr': 0.00045568728066351205, 'samples': 5852544, 'steps': 30481, 'loss/train': 1.7294851541519165} -08/30/2021 18:46:12 - INFO - __main__ - Step 30483: {'lr': 0.0004556842642388457, 'samples': 5852736, 'steps': 30482, 'loss/train': 1.99919855594635} -08/30/2021 18:46:12 - INFO - __main__ - Step 30484: {'lr': 0.0004556812477215011, 'samples': 5852928, 'steps': 30483, 'loss/train': 1.4838645458221436} -08/30/2021 18:46:13 - INFO - __main__ - Step 30485: {'lr': 0.0004556782311114798, 'samples': 5853120, 'steps': 30484, 'loss/train': 1.397320032119751} -08/30/2021 18:46:14 - INFO - __main__ - Step 30486: {'lr': 0.00045567521440878294, 'samples': 5853312, 'steps': 30485, 'loss/train': 0.9859090447425842} -08/30/2021 18:46:15 - INFO - __main__ - Step 30487: {'lr': 0.000455672197613412, 'samples': 5853504, 'steps': 30486, 'loss/train': 1.4842674732208252} -08/30/2021 18:46:15 - INFO - __main__ - Step 30488: {'lr': 0.00045566918072536844, 'samples': 5853696, 'steps': 30487, 'loss/train': 1.6535218954086304} -08/30/2021 18:46:15 - INFO - __main__ - Step 30489: {'lr': 0.00045566616374465355, 'samples': 5853888, 'steps': 30488, 'loss/train': 1.4215378761291504} -08/30/2021 18:46:16 - INFO - __main__ - Step 30490: {'lr': 0.0004556631466712686, 'samples': 5854080, 'steps': 30489, 'loss/train': 1.4654356241226196} -08/30/2021 18:46:17 - INFO - __main__ - Step 30491: {'lr': 0.00045566012950521497, 'samples': 5854272, 'steps': 30490, 'loss/train': 1.2836042642593384} -08/30/2021 18:46:18 - INFO - __main__ - Step 30492: {'lr': 0.0004556571122464941, 'samples': 5854464, 'steps': 30491, 'loss/train': 0.877436101436615} -08/30/2021 18:46:18 - INFO - __main__ - Step 30493: {'lr': 0.0004556540948951073, 'samples': 5854656, 'steps': 30492, 'loss/train': 1.3347598314285278} -08/30/2021 18:46:18 - INFO - __main__ - Step 30494: {'lr': 0.00045565107745105594, 'samples': 5854848, 'steps': 30493, 'loss/train': 1.2189784049987793} -08/30/2021 18:46:19 - INFO - __main__ - Step 30495: {'lr': 0.00045564805991434135, 'samples': 5855040, 'steps': 30494, 'loss/train': 0.9045740365982056} -08/30/2021 18:46:19 - INFO - __main__ - Step 30496: {'lr': 0.00045564504228496494, 'samples': 5855232, 'steps': 30495, 'loss/train': 1.2949351072311401} -08/30/2021 18:46:21 - INFO - __main__ - Step 30497: {'lr': 0.0004556420245629281, 'samples': 5855424, 'steps': 30496, 'loss/train': 1.397195816040039} -08/30/2021 18:46:21 - INFO - __main__ - Step 30498: {'lr': 0.00045563900674823205, 'samples': 5855616, 'steps': 30497, 'loss/train': 1.7661831378936768} -08/30/2021 18:46:21 - INFO - __main__ - Step 30499: {'lr': 0.0004556359888408783, 'samples': 5855808, 'steps': 30498, 'loss/train': 1.0134663581848145} -08/30/2021 18:46:22 - INFO - __main__ - Step 30500: {'lr': 0.00045563297084086807, 'samples': 5856000, 'steps': 30499, 'loss/train': 1.4503636360168457} -08/30/2021 18:46:22 - INFO - __main__ - Step 30501: {'lr': 0.00045562995274820285, 'samples': 5856192, 'steps': 30500, 'loss/train': 0.9922452569007874} -08/30/2021 18:46:24 - INFO - __main__ - Step 30502: {'lr': 0.00045562693456288394, 'samples': 5856384, 'steps': 30501, 'loss/train': 2.010448455810547} -08/30/2021 18:46:24 - INFO - __main__ - Step 30503: {'lr': 0.00045562391628491274, 'samples': 5856576, 'steps': 30502, 'loss/train': 1.1344683170318604} -08/30/2021 18:46:24 - INFO - __main__ - Step 30504: {'lr': 0.00045562089791429056, 'samples': 5856768, 'steps': 30503, 'loss/train': 1.7426371574401855} -08/30/2021 18:46:25 - INFO - __main__ - Step 30505: {'lr': 0.00045561787945101875, 'samples': 5856960, 'steps': 30504, 'loss/train': 1.4198999404907227} -08/30/2021 18:46:25 - INFO - __main__ - Step 30506: {'lr': 0.0004556148608950987, 'samples': 5857152, 'steps': 30505, 'loss/train': 1.4265637397766113} -08/30/2021 18:46:27 - INFO - __main__ - Step 30507: {'lr': 0.0004556118422465319, 'samples': 5857344, 'steps': 30506, 'loss/train': 1.5557074546813965} -08/30/2021 18:46:27 - INFO - __main__ - Step 30508: {'lr': 0.00045560882350531936, 'samples': 5857536, 'steps': 30507, 'loss/train': 1.7879557609558105} -08/30/2021 18:46:28 - INFO - __main__ - Step 30509: {'lr': 0.00045560580467146275, 'samples': 5857728, 'steps': 30508, 'loss/train': 1.1841042041778564} -08/30/2021 18:46:28 - INFO - __main__ - Step 30510: {'lr': 0.00045560278574496334, 'samples': 5857920, 'steps': 30509, 'loss/train': 1.4868690967559814} -08/30/2021 18:46:28 - INFO - __main__ - Step 30511: {'lr': 0.0004555997667258225, 'samples': 5858112, 'steps': 30510, 'loss/train': 1.1867871284484863} -08/30/2021 18:46:30 - INFO - __main__ - Step 30512: {'lr': 0.0004555967476140416, 'samples': 5858304, 'steps': 30511, 'loss/train': 1.388865351676941} -08/30/2021 18:46:31 - INFO - __main__ - Step 30513: {'lr': 0.00045559372840962186, 'samples': 5858496, 'steps': 30512, 'loss/train': 1.6118932962417603} -08/30/2021 18:46:31 - INFO - __main__ - Step 30514: {'lr': 0.00045559070911256486, 'samples': 5858688, 'steps': 30513, 'loss/train': 1.347998023033142} -08/30/2021 18:46:31 - INFO - __main__ - Step 30515: {'lr': 0.00045558768972287183, 'samples': 5858880, 'steps': 30514, 'loss/train': 2.067528486251831} -08/30/2021 18:46:32 - INFO - __main__ - Step 30516: {'lr': 0.0004555846702405442, 'samples': 5859072, 'steps': 30515, 'loss/train': 1.5631417036056519} -08/30/2021 18:46:34 - INFO - __main__ - Step 30517: {'lr': 0.0004555816506655832, 'samples': 5859264, 'steps': 30516, 'loss/train': 1.0549486875534058} -08/30/2021 18:46:34 - INFO - __main__ - Step 30518: {'lr': 0.00045557863099799034, 'samples': 5859456, 'steps': 30517, 'loss/train': 1.077292799949646} -08/30/2021 18:46:35 - INFO - __main__ - Step 30519: {'lr': 0.000455575611237767, 'samples': 5859648, 'steps': 30518, 'loss/train': 0.03098430298268795} -08/30/2021 18:46:35 - INFO - __main__ - Step 30520: {'lr': 0.00045557259138491435, 'samples': 5859840, 'steps': 30519, 'loss/train': 1.6459323167800903} -08/30/2021 18:46:35 - INFO - __main__ - Step 30521: {'lr': 0.0004555695714394339, 'samples': 5860032, 'steps': 30520, 'loss/train': 1.690779209136963} -08/30/2021 18:46:36 - INFO - __main__ - Step 30522: {'lr': 0.00045556655140132696, 'samples': 5860224, 'steps': 30521, 'loss/train': 0.7677645087242126} -08/30/2021 18:46:36 - INFO - __main__ - Step 30523: {'lr': 0.00045556353127059493, 'samples': 5860416, 'steps': 30522, 'loss/train': 0.35487547516822815} -08/30/2021 18:46:38 - INFO - __main__ - Step 30524: {'lr': 0.0004555605110472391, 'samples': 5860608, 'steps': 30523, 'loss/train': 0.0684698075056076} -08/30/2021 18:46:38 - INFO - __main__ - Step 30525: {'lr': 0.0004555574907312609, 'samples': 5860800, 'steps': 30524, 'loss/train': 2.669593095779419} -08/30/2021 18:46:39 - INFO - __main__ - Step 30526: {'lr': 0.00045555447032266167, 'samples': 5860992, 'steps': 30525, 'loss/train': 0.06736353784799576} -08/30/2021 18:46:39 - INFO - __main__ - Step 30527: {'lr': 0.0004555514498214428, 'samples': 5861184, 'steps': 30526, 'loss/train': 0.20482386648654938} -08/30/2021 18:46:39 - INFO - __main__ - Step 30528: {'lr': 0.0004555484292276055, 'samples': 5861376, 'steps': 30527, 'loss/train': 1.2516772747039795} -08/30/2021 18:46:41 - INFO - __main__ - Step 30529: {'lr': 0.0004555454085411514, 'samples': 5861568, 'steps': 30528, 'loss/train': 1.602391242980957} -08/30/2021 18:46:41 - INFO - __main__ - Step 30530: {'lr': 0.0004555423877620817, 'samples': 5861760, 'steps': 30529, 'loss/train': 1.408811330795288} -08/30/2021 18:46:42 - INFO - __main__ - Step 30531: {'lr': 0.00045553936689039765, 'samples': 5861952, 'steps': 30530, 'loss/train': 1.4809492826461792} -08/30/2021 18:46:42 - INFO - __main__ - Step 30532: {'lr': 0.00045553634592610084, 'samples': 5862144, 'steps': 30531, 'loss/train': 1.6968696117401123} -08/30/2021 18:46:42 - INFO - __main__ - Step 30533: {'lr': 0.00045553332486919246, 'samples': 5862336, 'steps': 30532, 'loss/train': 1.3688582181930542} -08/30/2021 18:46:44 - INFO - __main__ - Step 30534: {'lr': 0.000455530303719674, 'samples': 5862528, 'steps': 30533, 'loss/train': 1.5412429571151733} -08/30/2021 18:46:45 - INFO - __main__ - Step 30535: {'lr': 0.00045552728247754673, 'samples': 5862720, 'steps': 30534, 'loss/train': 1.7840511798858643} -08/30/2021 18:46:45 - INFO - __main__ - Step 30536: {'lr': 0.000455524261142812, 'samples': 5862912, 'steps': 30535, 'loss/train': 1.3917664289474487} -08/30/2021 18:46:45 - INFO - __main__ - Step 30537: {'lr': 0.00045552123971547123, 'samples': 5863104, 'steps': 30536, 'loss/train': 1.1540929079055786} -08/30/2021 18:46:46 - INFO - __main__ - Step 30538: {'lr': 0.00045551821819552575, 'samples': 5863296, 'steps': 30537, 'loss/train': 1.5662599802017212} -08/30/2021 18:46:46 - INFO - __main__ - Step 30539: {'lr': 0.0004555151965829769, 'samples': 5863488, 'steps': 30538, 'loss/train': 2.3214945793151855} -08/30/2021 18:46:46 - INFO - __main__ - Step 30540: {'lr': 0.0004555121748778261, 'samples': 5863680, 'steps': 30539, 'loss/train': 1.051978349685669} -08/30/2021 18:46:48 - INFO - __main__ - Step 30541: {'lr': 0.0004555091530800748, 'samples': 5863872, 'steps': 30540, 'loss/train': 0.8701170086860657} -08/30/2021 18:46:49 - INFO - __main__ - Step 30542: {'lr': 0.0004555061311897241, 'samples': 5864064, 'steps': 30541, 'loss/train': 1.3463091850280762} -08/30/2021 18:46:49 - INFO - __main__ - Step 30543: {'lr': 0.0004555031092067756, 'samples': 5864256, 'steps': 30542, 'loss/train': 2.326798439025879} -08/30/2021 18:46:50 - INFO - __main__ - Step 30544: {'lr': 0.00045550008713123047, 'samples': 5864448, 'steps': 30543, 'loss/train': 1.2083103656768799} -08/30/2021 18:46:50 - INFO - __main__ - Step 30545: {'lr': 0.00045549706496309027, 'samples': 5864640, 'steps': 30544, 'loss/train': 1.6895496845245361} -08/30/2021 18:46:50 - INFO - __main__ - Step 30546: {'lr': 0.0004554940427023562, 'samples': 5864832, 'steps': 30545, 'loss/train': 6.210311412811279} -08/30/2021 18:46:52 - INFO - __main__ - Step 30547: {'lr': 0.00045549102034902973, 'samples': 5865024, 'steps': 30546, 'loss/train': 6.09959602355957} -08/30/2021 18:46:53 - INFO - __main__ - Step 30548: {'lr': 0.0004554879979031121, 'samples': 5865216, 'steps': 30547, 'loss/train': 2.1539881229400635} -08/30/2021 18:46:53 - INFO - __main__ - Step 30549: {'lr': 0.00045548497536460487, 'samples': 5865408, 'steps': 30548, 'loss/train': 1.7157001495361328} -08/30/2021 18:46:54 - INFO - __main__ - Step 30550: {'lr': 0.00045548195273350926, 'samples': 5865600, 'steps': 30549, 'loss/train': 0.7891212701797485} -08/30/2021 18:46:54 - INFO - __main__ - Step 30551: {'lr': 0.0004554789300098265, 'samples': 5865792, 'steps': 30550, 'loss/train': 1.369751214981079} -08/30/2021 18:46:54 - INFO - __main__ - Step 30552: {'lr': 0.00045547590719355823, 'samples': 5865984, 'steps': 30551, 'loss/train': 1.878090500831604} -08/30/2021 18:46:56 - INFO - __main__ - Step 30553: {'lr': 0.00045547288428470574, 'samples': 5866176, 'steps': 30552, 'loss/train': 1.9719336032867432} -08/30/2021 18:46:56 - INFO - __main__ - Step 30554: {'lr': 0.0004554698612832703, 'samples': 5866368, 'steps': 30553, 'loss/train': 1.7289650440216064} -08/30/2021 18:46:57 - INFO - __main__ - Step 30555: {'lr': 0.00045546683818925327, 'samples': 5866560, 'steps': 30554, 'loss/train': 1.6674176454544067} -08/30/2021 18:46:57 - INFO - __main__ - Step 30556: {'lr': 0.000455463815002656, 'samples': 5866752, 'steps': 30555, 'loss/train': 1.6973453760147095} -08/30/2021 18:46:57 - INFO - __main__ - Step 30557: {'lr': 0.00045546079172348, 'samples': 5866944, 'steps': 30556, 'loss/train': 1.1133997440338135} -08/30/2021 18:46:59 - INFO - __main__ - Step 30558: {'lr': 0.00045545776835172647, 'samples': 5867136, 'steps': 30557, 'loss/train': 1.8632644414901733} -08/30/2021 18:46:59 - INFO - __main__ - Step 30559: {'lr': 0.00045545474488739693, 'samples': 5867328, 'steps': 30558, 'loss/train': 1.7757090330123901} -08/30/2021 18:47:00 - INFO - __main__ - Step 30560: {'lr': 0.0004554517213304926, 'samples': 5867520, 'steps': 30559, 'loss/train': 1.501355528831482} -08/30/2021 18:47:00 - INFO - __main__ - Step 30561: {'lr': 0.00045544869768101486, 'samples': 5867712, 'steps': 30560, 'loss/train': 1.4714609384536743} -08/30/2021 18:47:00 - INFO - __main__ - Step 30562: {'lr': 0.0004554456739389652, 'samples': 5867904, 'steps': 30561, 'loss/train': 1.2786227464675903} -08/30/2021 18:47:02 - INFO - __main__ - Step 30563: {'lr': 0.00045544265010434484, 'samples': 5868096, 'steps': 30562, 'loss/train': 1.601311445236206} -08/30/2021 18:47:03 - INFO - __main__ - Step 30564: {'lr': 0.0004554396261771552, 'samples': 5868288, 'steps': 30563, 'loss/train': 0.894614040851593} -08/30/2021 18:47:03 - INFO - __main__ - Step 30565: {'lr': 0.00045543660215739755, 'samples': 5868480, 'steps': 30564, 'loss/train': 0.070391945540905} -08/30/2021 18:47:04 - INFO - __main__ - Step 30566: {'lr': 0.00045543357804507344, 'samples': 5868672, 'steps': 30565, 'loss/train': 0.0783257707953453} -08/30/2021 18:47:04 - INFO - __main__ - Step 30567: {'lr': 0.00045543055384018405, 'samples': 5868864, 'steps': 30566, 'loss/train': 1.2704730033874512} -08/30/2021 18:47:04 - INFO - __main__ - Step 30568: {'lr': 0.0004554275295427309, 'samples': 5869056, 'steps': 30567, 'loss/train': 2.2178378105163574} -08/30/2021 18:47:05 - INFO - __main__ - Step 30569: {'lr': 0.0004554245051527153, 'samples': 5869248, 'steps': 30568, 'loss/train': 1.5451369285583496} -08/30/2021 18:47:06 - INFO - __main__ - Step 30570: {'lr': 0.0004554214806701384, 'samples': 5869440, 'steps': 30569, 'loss/train': 1.0610790252685547} -08/30/2021 18:47:07 - INFO - __main__ - Step 30571: {'lr': 0.000455418456095002, 'samples': 5869632, 'steps': 30570, 'loss/train': 0.13574184477329254} -08/30/2021 18:47:07 - INFO - __main__ - Step 30572: {'lr': 0.000455415431427307, 'samples': 5869824, 'steps': 30571, 'loss/train': 1.4240336418151855} -08/30/2021 18:47:08 - INFO - __main__ - Step 30573: {'lr': 0.00045541240666705516, 'samples': 5870016, 'steps': 30572, 'loss/train': 1.0464187860488892} -08/30/2021 18:47:08 - INFO - __main__ - Step 30574: {'lr': 0.0004554093818142475, 'samples': 5870208, 'steps': 30573, 'loss/train': 1.1992316246032715} -08/30/2021 18:47:10 - INFO - __main__ - Step 30575: {'lr': 0.0004554063568688857, 'samples': 5870400, 'steps': 30574, 'loss/train': 0.9268847107887268} -08/30/2021 18:47:11 - INFO - __main__ - Step 30576: {'lr': 0.0004554033318309708, 'samples': 5870592, 'steps': 30575, 'loss/train': 1.431304931640625} -08/30/2021 18:47:11 - INFO - __main__ - Step 30577: {'lr': 0.00045540030670050447, 'samples': 5870784, 'steps': 30576, 'loss/train': 0.63565593957901} -08/30/2021 18:47:11 - INFO - __main__ - Step 30578: {'lr': 0.0004553972814774878, 'samples': 5870976, 'steps': 30577, 'loss/train': 1.849929928779602} -08/30/2021 18:47:12 - INFO - __main__ - Step 30579: {'lr': 0.00045539425616192243, 'samples': 5871168, 'steps': 30578, 'loss/train': 1.5432122945785522} -08/30/2021 18:47:13 - INFO - __main__ - Step 30580: {'lr': 0.0004553912307538095, 'samples': 5871360, 'steps': 30579, 'loss/train': 1.8094135522842407} -08/30/2021 18:47:14 - INFO - __main__ - Step 30581: {'lr': 0.0004553882052531504, 'samples': 5871552, 'steps': 30580, 'loss/train': 0.36771920323371887} -08/30/2021 18:47:14 - INFO - __main__ - Step 30582: {'lr': 0.00045538517965994663, 'samples': 5871744, 'steps': 30581, 'loss/train': 1.361254334449768} -08/30/2021 18:47:14 - INFO - __main__ - Step 30583: {'lr': 0.0004553821539741994, 'samples': 5871936, 'steps': 30582, 'loss/train': 2.047004222869873} -08/30/2021 18:47:15 - INFO - __main__ - Step 30584: {'lr': 0.0004553791281959102, 'samples': 5872128, 'steps': 30583, 'loss/train': 0.8175615072250366} -08/30/2021 18:47:16 - INFO - __main__ - Step 30585: {'lr': 0.00045537610232508033, 'samples': 5872320, 'steps': 30584, 'loss/train': 2.0487401485443115} -08/30/2021 18:47:17 - INFO - __main__ - Step 30586: {'lr': 0.0004553730763617111, 'samples': 5872512, 'steps': 30585, 'loss/train': 1.3200666904449463} -08/30/2021 18:47:17 - INFO - __main__ - Step 30587: {'lr': 0.000455370050305804, 'samples': 5872704, 'steps': 30586, 'loss/train': 1.4460279941558838} -08/30/2021 18:47:17 - INFO - __main__ - Step 30588: {'lr': 0.0004553670241573603, 'samples': 5872896, 'steps': 30587, 'loss/train': 1.4460350275039673} -08/30/2021 18:47:18 - INFO - __main__ - Step 30589: {'lr': 0.00045536399791638133, 'samples': 5873088, 'steps': 30588, 'loss/train': 1.5300310850143433} -08/30/2021 18:47:19 - INFO - __main__ - Step 30590: {'lr': 0.0004553609715828686, 'samples': 5873280, 'steps': 30589, 'loss/train': 1.2519655227661133} -08/30/2021 18:47:20 - INFO - __main__ - Step 30591: {'lr': 0.00045535794515682334, 'samples': 5873472, 'steps': 30590, 'loss/train': 1.3778111934661865} -08/30/2021 18:47:20 - INFO - __main__ - Step 30592: {'lr': 0.00045535491863824695, 'samples': 5873664, 'steps': 30591, 'loss/train': 1.2975655794143677} -08/30/2021 18:47:20 - INFO - __main__ - Step 30593: {'lr': 0.0004553518920271408, 'samples': 5873856, 'steps': 30592, 'loss/train': 1.4341940879821777} -08/30/2021 18:47:21 - INFO - __main__ - Step 30594: {'lr': 0.00045534886532350627, 'samples': 5874048, 'steps': 30593, 'loss/train': 1.7200616598129272} -08/30/2021 18:47:22 - INFO - __main__ - Step 30595: {'lr': 0.00045534583852734474, 'samples': 5874240, 'steps': 30594, 'loss/train': 1.616725206375122} -08/30/2021 18:47:23 - INFO - __main__ - Step 30596: {'lr': 0.00045534281163865756, 'samples': 5874432, 'steps': 30595, 'loss/train': 0.9719061851501465} -08/30/2021 18:47:23 - INFO - __main__ - Step 30597: {'lr': 0.000455339784657446, 'samples': 5874624, 'steps': 30596, 'loss/train': 1.596483826637268} -08/30/2021 18:47:23 - INFO - __main__ - Step 30598: {'lr': 0.0004553367575837115, 'samples': 5874816, 'steps': 30597, 'loss/train': 1.2679634094238281} -08/30/2021 18:47:24 - INFO - __main__ - Step 30599: {'lr': 0.00045533373041745545, 'samples': 5875008, 'steps': 30598, 'loss/train': 1.1390831470489502} -08/30/2021 18:47:24 - INFO - __main__ - Step 30600: {'lr': 0.00045533070315867917, 'samples': 5875200, 'steps': 30599, 'loss/train': 1.7121864557266235} -08/30/2021 18:47:26 - INFO - __main__ - Step 30601: {'lr': 0.0004553276758073841, 'samples': 5875392, 'steps': 30600, 'loss/train': 1.8994885683059692} -08/30/2021 18:47:26 - INFO - __main__ - Step 30602: {'lr': 0.00045532464836357155, 'samples': 5875584, 'steps': 30601, 'loss/train': 1.7125836610794067} -08/30/2021 18:47:26 - INFO - __main__ - Step 30603: {'lr': 0.0004553216208272428, 'samples': 5875776, 'steps': 30602, 'loss/train': 1.7440612316131592} -08/30/2021 18:47:27 - INFO - __main__ - Step 30604: {'lr': 0.0004553185931983994, 'samples': 5875968, 'steps': 30603, 'loss/train': 1.6306486129760742} -08/30/2021 18:47:27 - INFO - __main__ - Step 30605: {'lr': 0.00045531556547704255, 'samples': 5876160, 'steps': 30604, 'loss/train': 1.2530897855758667} -08/30/2021 18:47:29 - INFO - __main__ - Step 30606: {'lr': 0.00045531253766317373, 'samples': 5876352, 'steps': 30605, 'loss/train': 1.349639654159546} -08/30/2021 18:47:29 - INFO - __main__ - Step 30607: {'lr': 0.0004553095097567942, 'samples': 5876544, 'steps': 30606, 'loss/train': 1.7893048524856567} -08/30/2021 18:47:30 - INFO - __main__ - Step 30608: {'lr': 0.0004553064817579053, 'samples': 5876736, 'steps': 30607, 'loss/train': 1.4117324352264404} -08/30/2021 18:47:30 - INFO - __main__ - Step 30609: {'lr': 0.0004553034536665086, 'samples': 5876928, 'steps': 30608, 'loss/train': 0.6804377436637878} -08/30/2021 18:47:30 - INFO - __main__ - Step 30610: {'lr': 0.0004553004254826053, 'samples': 5877120, 'steps': 30609, 'loss/train': 0.7034269571304321} -08/30/2021 18:47:32 - INFO - __main__ - Step 30611: {'lr': 0.0004552973972061967, 'samples': 5877312, 'steps': 30610, 'loss/train': 0.9731603860855103} -08/30/2021 18:47:33 - INFO - __main__ - Step 30612: {'lr': 0.00045529436883728436, 'samples': 5877504, 'steps': 30611, 'loss/train': 1.7750425338745117} -08/30/2021 18:47:33 - INFO - __main__ - Step 30613: {'lr': 0.0004552913403758695, 'samples': 5877696, 'steps': 30612, 'loss/train': 1.576848030090332} -08/30/2021 18:47:33 - INFO - __main__ - Step 30614: {'lr': 0.00045528831182195355, 'samples': 5877888, 'steps': 30613, 'loss/train': 1.0929534435272217} -08/30/2021 18:47:34 - INFO - __main__ - Step 30615: {'lr': 0.00045528528317553786, 'samples': 5878080, 'steps': 30614, 'loss/train': 1.2400987148284912} -08/30/2021 18:47:35 - INFO - __main__ - Step 30616: {'lr': 0.0004552822544366238, 'samples': 5878272, 'steps': 30615, 'loss/train': 1.3178428411483765} -08/30/2021 18:47:35 - INFO - __main__ - Step 30617: {'lr': 0.00045527922560521274, 'samples': 5878464, 'steps': 30616, 'loss/train': 1.4441092014312744} -08/30/2021 18:47:36 - INFO - __main__ - Step 30618: {'lr': 0.0004552761966813059, 'samples': 5878656, 'steps': 30617, 'loss/train': 0.24038703739643097} -08/30/2021 18:47:36 - INFO - __main__ - Step 30619: {'lr': 0.00045527316766490487, 'samples': 5878848, 'steps': 30618, 'loss/train': 1.0963329076766968} -08/30/2021 18:47:37 - INFO - __main__ - Step 30620: {'lr': 0.000455270138556011, 'samples': 5879040, 'steps': 30619, 'loss/train': 1.7947168350219727} -08/30/2021 18:47:38 - INFO - __main__ - Step 30621: {'lr': 0.00045526710935462543, 'samples': 5879232, 'steps': 30620, 'loss/train': 0.8949249982833862} -08/30/2021 18:47:38 - INFO - __main__ - Step 30622: {'lr': 0.00045526408006074973, 'samples': 5879424, 'steps': 30621, 'loss/train': 1.1506030559539795} -08/30/2021 18:47:39 - INFO - __main__ - Step 30623: {'lr': 0.00045526105067438525, 'samples': 5879616, 'steps': 30622, 'loss/train': 1.6091824769973755} -08/30/2021 18:47:39 - INFO - __main__ - Step 30624: {'lr': 0.00045525802119553323, 'samples': 5879808, 'steps': 30623, 'loss/train': 0.46725350618362427} -08/30/2021 18:47:39 - INFO - __main__ - Step 30625: {'lr': 0.0004552549916241951, 'samples': 5880000, 'steps': 30624, 'loss/train': 0.8923364281654358} -08/30/2021 18:47:42 - INFO - __main__ - Step 30626: {'lr': 0.0004552519619603723, 'samples': 5880192, 'steps': 30625, 'loss/train': 0.7296211123466492} -08/30/2021 18:47:42 - INFO - __main__ - Step 30627: {'lr': 0.00045524893220406617, 'samples': 5880384, 'steps': 30626, 'loss/train': 1.4573044776916504} -08/30/2021 18:47:43 - INFO - __main__ - Step 30628: {'lr': 0.00045524590235527796, 'samples': 5880576, 'steps': 30627, 'loss/train': 1.6401554346084595} -08/30/2021 18:47:43 - INFO - __main__ - Step 30629: {'lr': 0.0004552428724140091, 'samples': 5880768, 'steps': 30628, 'loss/train': 1.5434536933898926} -08/30/2021 18:47:43 - INFO - __main__ - Step 30630: {'lr': 0.000455239842380261, 'samples': 5880960, 'steps': 30629, 'loss/train': 0.11715385317802429} -08/30/2021 18:47:44 - INFO - __main__ - Step 30631: {'lr': 0.000455236812254035, 'samples': 5881152, 'steps': 30630, 'loss/train': 1.755092978477478} -08/30/2021 18:47:45 - INFO - __main__ - Step 30632: {'lr': 0.0004552337820353325, 'samples': 5881344, 'steps': 30631, 'loss/train': 1.6778576374053955} -08/30/2021 18:47:46 - INFO - __main__ - Step 30633: {'lr': 0.00045523075172415476, 'samples': 5881536, 'steps': 30632, 'loss/train': 1.6777456998825073} -08/30/2021 18:47:46 - INFO - __main__ - Step 30634: {'lr': 0.0004552277213205032, 'samples': 5881728, 'steps': 30633, 'loss/train': 1.7205262184143066} -08/30/2021 18:47:46 - INFO - __main__ - Step 30635: {'lr': 0.0004552246908243792, 'samples': 5881920, 'steps': 30634, 'loss/train': 1.7409580945968628} -08/30/2021 18:47:47 - INFO - __main__ - Step 30636: {'lr': 0.00045522166023578413, 'samples': 5882112, 'steps': 30635, 'loss/train': 1.3704737424850464} -08/30/2021 18:47:48 - INFO - __main__ - Step 30637: {'lr': 0.0004552186295547194, 'samples': 5882304, 'steps': 30636, 'loss/train': 1.5701302289962769} -08/30/2021 18:47:49 - INFO - __main__ - Step 30638: {'lr': 0.0004552155987811863, 'samples': 5882496, 'steps': 30637, 'loss/train': 1.1240133047103882} -08/30/2021 18:47:49 - INFO - __main__ - Step 30639: {'lr': 0.00045521256791518616, 'samples': 5882688, 'steps': 30638, 'loss/train': 1.3252633810043335} -08/30/2021 18:47:50 - INFO - __main__ - Step 30640: {'lr': 0.0004552095369567205, 'samples': 5882880, 'steps': 30639, 'loss/train': 1.6989467144012451} -08/30/2021 18:47:50 - INFO - __main__ - Step 30641: {'lr': 0.00045520650590579056, 'samples': 5883072, 'steps': 30640, 'loss/train': 1.7590097188949585} -08/30/2021 18:47:52 - INFO - __main__ - Step 30642: {'lr': 0.00045520347476239763, 'samples': 5883264, 'steps': 30641, 'loss/train': 1.7956620454788208} -08/30/2021 18:47:52 - INFO - __main__ - Step 30643: {'lr': 0.00045520044352654335, 'samples': 5883456, 'steps': 30642, 'loss/train': 1.5946303606033325} -08/30/2021 18:47:52 - INFO - __main__ - Step 30644: {'lr': 0.0004551974121982288, 'samples': 5883648, 'steps': 30643, 'loss/train': 0.7562167048454285} -08/30/2021 18:47:53 - INFO - __main__ - Step 30645: {'lr': 0.00045519438077745543, 'samples': 5883840, 'steps': 30644, 'loss/train': 2.0622270107269287} -08/30/2021 18:47:53 - INFO - __main__ - Step 30646: {'lr': 0.0004551913492642248, 'samples': 5884032, 'steps': 30645, 'loss/train': 1.2649282217025757} -08/30/2021 18:47:55 - INFO - __main__ - Step 30647: {'lr': 0.00045518831765853796, 'samples': 5884224, 'steps': 30646, 'loss/train': 2.056971788406372} -08/30/2021 18:47:55 - INFO - __main__ - Step 30648: {'lr': 0.0004551852859603965, 'samples': 5884416, 'steps': 30647, 'loss/train': 0.9747715592384338} -08/30/2021 18:47:55 - INFO - __main__ - Step 30649: {'lr': 0.0004551822541698017, 'samples': 5884608, 'steps': 30648, 'loss/train': 1.5507370233535767} -08/30/2021 18:47:56 - INFO - __main__ - Step 30650: {'lr': 0.0004551792222867549, 'samples': 5884800, 'steps': 30649, 'loss/train': 1.4265443086624146} -08/30/2021 18:47:56 - INFO - __main__ - Step 30651: {'lr': 0.0004551761903112576, 'samples': 5884992, 'steps': 30650, 'loss/train': 1.2638945579528809} -08/30/2021 18:47:56 - INFO - __main__ - Step 30652: {'lr': 0.000455173158243311, 'samples': 5885184, 'steps': 30651, 'loss/train': 1.5258312225341797} -08/30/2021 18:47:58 - INFO - __main__ - Step 30653: {'lr': 0.0004551701260829166, 'samples': 5885376, 'steps': 30652, 'loss/train': 1.4410654306411743} -08/30/2021 18:47:59 - INFO - __main__ - Step 30654: {'lr': 0.00045516709383007563, 'samples': 5885568, 'steps': 30653, 'loss/train': 1.0258395671844482} -08/30/2021 18:47:59 - INFO - __main__ - Step 30655: {'lr': 0.0004551640614847896, 'samples': 5885760, 'steps': 30654, 'loss/train': 0.9390184879302979} -08/30/2021 18:47:59 - INFO - __main__ - Step 30656: {'lr': 0.00045516102904705983, 'samples': 5885952, 'steps': 30655, 'loss/train': 0.891115665435791} -08/30/2021 18:48:00 - INFO - __main__ - Step 30657: {'lr': 0.0004551579965168876, 'samples': 5886144, 'steps': 30656, 'loss/train': 1.3206318616867065} -08/30/2021 18:48:01 - INFO - __main__ - Step 30658: {'lr': 0.00045515496389427433, 'samples': 5886336, 'steps': 30657, 'loss/train': 1.5702022314071655} -08/30/2021 18:48:02 - INFO - __main__ - Step 30659: {'lr': 0.0004551519311792215, 'samples': 5886528, 'steps': 30658, 'loss/train': 1.701112985610962} -08/30/2021 18:48:02 - INFO - __main__ - Step 30660: {'lr': 0.00045514889837173025, 'samples': 5886720, 'steps': 30659, 'loss/train': 0.7067428231239319} -08/30/2021 18:48:02 - INFO - __main__ - Step 30661: {'lr': 0.00045514586547180214, 'samples': 5886912, 'steps': 30660, 'loss/train': 1.7332934141159058} -08/30/2021 18:48:03 - INFO - __main__ - Step 30662: {'lr': 0.0004551428324794385, 'samples': 5887104, 'steps': 30661, 'loss/train': 1.528985619544983} -08/30/2021 18:48:04 - INFO - __main__ - Step 30663: {'lr': 0.00045513979939464056, 'samples': 5887296, 'steps': 30662, 'loss/train': 1.7021403312683105} -08/30/2021 18:48:05 - INFO - __main__ - Step 30664: {'lr': 0.0004551367662174099, 'samples': 5887488, 'steps': 30663, 'loss/train': 1.4849344491958618} -08/30/2021 18:48:05 - INFO - __main__ - Step 30665: {'lr': 0.0004551337329477477, 'samples': 5887680, 'steps': 30664, 'loss/train': 1.1916885375976562} -08/30/2021 18:48:05 - INFO - __main__ - Step 30666: {'lr': 0.00045513069958565545, 'samples': 5887872, 'steps': 30665, 'loss/train': 1.1948695182800293} -08/30/2021 18:48:06 - INFO - __main__ - Step 30667: {'lr': 0.00045512766613113457, 'samples': 5888064, 'steps': 30666, 'loss/train': 1.4168646335601807} -08/30/2021 18:48:07 - INFO - __main__ - Step 30668: {'lr': 0.00045512463258418615, 'samples': 5888256, 'steps': 30667, 'loss/train': 1.3707149028778076} -08/30/2021 18:48:07 - INFO - __main__ - Step 30669: {'lr': 0.00045512159894481183, 'samples': 5888448, 'steps': 30668, 'loss/train': 0.6929999589920044} -08/30/2021 18:48:08 - INFO - __main__ - Step 30670: {'lr': 0.00045511856521301286, 'samples': 5888640, 'steps': 30669, 'loss/train': 1.3104997873306274} -08/30/2021 18:48:08 - INFO - __main__ - Step 30671: {'lr': 0.0004551155313887906, 'samples': 5888832, 'steps': 30670, 'loss/train': 1.3301658630371094} -08/30/2021 18:48:08 - INFO - __main__ - Step 30672: {'lr': 0.0004551124974721465, 'samples': 5889024, 'steps': 30671, 'loss/train': 1.4518308639526367} -08/30/2021 18:48:10 - INFO - __main__ - Step 30673: {'lr': 0.00045510946346308186, 'samples': 5889216, 'steps': 30672, 'loss/train': 1.6256787776947021} -08/30/2021 18:48:10 - INFO - __main__ - Step 30674: {'lr': 0.0004551064293615981, 'samples': 5889408, 'steps': 30673, 'loss/train': 1.4367645978927612} -08/30/2021 18:48:11 - INFO - __main__ - Step 30675: {'lr': 0.00045510339516769647, 'samples': 5889600, 'steps': 30674, 'loss/train': 1.4962762594223022} -08/30/2021 18:48:11 - INFO - __main__ - Step 30676: {'lr': 0.0004551003608813784, 'samples': 5889792, 'steps': 30675, 'loss/train': 1.5136266946792603} -08/30/2021 18:48:12 - INFO - __main__ - Step 30677: {'lr': 0.00045509732650264535, 'samples': 5889984, 'steps': 30676, 'loss/train': 1.123766303062439} -08/30/2021 18:48:14 - INFO - __main__ - Step 30678: {'lr': 0.00045509429203149856, 'samples': 5890176, 'steps': 30677, 'loss/train': 1.3877636194229126} -08/30/2021 18:48:14 - INFO - __main__ - Step 30679: {'lr': 0.00045509125746793946, 'samples': 5890368, 'steps': 30678, 'loss/train': 1.4114665985107422} -08/30/2021 18:48:14 - INFO - __main__ - Step 30680: {'lr': 0.00045508822281196937, 'samples': 5890560, 'steps': 30679, 'loss/train': 1.6636769771575928} -08/30/2021 18:48:15 - INFO - __main__ - Step 30681: {'lr': 0.0004550851880635898, 'samples': 5890752, 'steps': 30680, 'loss/train': 1.3811922073364258} -08/30/2021 18:48:15 - INFO - __main__ - Step 30682: {'lr': 0.0004550821532228019, 'samples': 5890944, 'steps': 30681, 'loss/train': 1.508966088294983} -08/30/2021 18:48:15 - INFO - __main__ - Step 30683: {'lr': 0.00045507911828960717, 'samples': 5891136, 'steps': 30682, 'loss/train': 1.3214455842971802} -08/30/2021 18:48:17 - INFO - __main__ - Step 30684: {'lr': 0.000455076083264007, 'samples': 5891328, 'steps': 30683, 'loss/train': 1.7156789302825928} -08/30/2021 18:48:17 - INFO - __main__ - Step 30685: {'lr': 0.0004550730481460027, 'samples': 5891520, 'steps': 30684, 'loss/train': 1.3713898658752441} -08/30/2021 18:48:18 - INFO - __main__ - Step 30686: {'lr': 0.0004550700129355956, 'samples': 5891712, 'steps': 30685, 'loss/train': 1.6096270084381104} -08/30/2021 18:48:18 - INFO - __main__ - Step 30687: {'lr': 0.0004550669776327871, 'samples': 5891904, 'steps': 30686, 'loss/train': 1.3394801616668701} -08/30/2021 18:48:18 - INFO - __main__ - Step 30688: {'lr': 0.00045506394223757867, 'samples': 5892096, 'steps': 30687, 'loss/train': 1.3650274276733398} -08/30/2021 18:48:20 - INFO - __main__ - Step 30689: {'lr': 0.00045506090674997157, 'samples': 5892288, 'steps': 30688, 'loss/train': 1.1812090873718262} -08/30/2021 18:48:21 - INFO - __main__ - Step 30690: {'lr': 0.00045505787116996714, 'samples': 5892480, 'steps': 30689, 'loss/train': 1.7855641841888428} -08/30/2021 18:48:21 - INFO - __main__ - Step 30691: {'lr': 0.0004550548354975669, 'samples': 5892672, 'steps': 30690, 'loss/train': 0.6450674533843994} -08/30/2021 18:48:21 - INFO - __main__ - Step 30692: {'lr': 0.000455051799732772, 'samples': 5892864, 'steps': 30691, 'loss/train': 1.6922450065612793} -08/30/2021 18:48:22 - INFO - __main__ - Step 30693: {'lr': 0.000455048763875584, 'samples': 5893056, 'steps': 30692, 'loss/train': 1.6246510744094849} -08/30/2021 18:48:23 - INFO - __main__ - Step 30694: {'lr': 0.00045504572792600415, 'samples': 5893248, 'steps': 30693, 'loss/train': 1.4271252155303955} -08/30/2021 18:48:24 - INFO - __main__ - Step 30695: {'lr': 0.00045504269188403386, 'samples': 5893440, 'steps': 30694, 'loss/train': 1.8969249725341797} -08/30/2021 18:48:24 - INFO - __main__ - Step 30696: {'lr': 0.00045503965574967447, 'samples': 5893632, 'steps': 30695, 'loss/train': 1.5949009656906128} -08/30/2021 18:48:24 - INFO - __main__ - Step 30697: {'lr': 0.0004550366195229274, 'samples': 5893824, 'steps': 30696, 'loss/train': 1.5189149379730225} -08/30/2021 18:48:25 - INFO - __main__ - Step 30698: {'lr': 0.00045503358320379405, 'samples': 5894016, 'steps': 30697, 'loss/train': 1.1654564142227173} -08/30/2021 18:48:26 - INFO - __main__ - Step 30699: {'lr': 0.00045503054679227567, 'samples': 5894208, 'steps': 30698, 'loss/train': 1.540948510169983} -08/30/2021 18:48:27 - INFO - __main__ - Step 30700: {'lr': 0.00045502751028837367, 'samples': 5894400, 'steps': 30699, 'loss/train': 2.7859644889831543} -08/30/2021 18:48:27 - INFO - __main__ - Step 30701: {'lr': 0.00045502447369208957, 'samples': 5894592, 'steps': 30700, 'loss/train': 1.3823413848876953} -08/30/2021 18:48:27 - INFO - __main__ - Step 30702: {'lr': 0.00045502143700342445, 'samples': 5894784, 'steps': 30701, 'loss/train': 1.1010650396347046} -08/30/2021 18:48:28 - INFO - __main__ - Step 30703: {'lr': 0.0004550184002223799, 'samples': 5894976, 'steps': 30702, 'loss/train': 1.6398025751113892} -08/30/2021 18:48:28 - INFO - __main__ - Step 30704: {'lr': 0.0004550153633489572, 'samples': 5895168, 'steps': 30703, 'loss/train': 2.0717668533325195} -08/30/2021 18:48:30 - INFO - __main__ - Step 30705: {'lr': 0.0004550123263831578, 'samples': 5895360, 'steps': 30704, 'loss/train': 1.3576658964157104} -08/30/2021 18:48:30 - INFO - __main__ - Step 30706: {'lr': 0.0004550092893249829, 'samples': 5895552, 'steps': 30705, 'loss/train': 0.08371548354625702} -08/30/2021 18:48:31 - INFO - __main__ - Step 30707: {'lr': 0.00045500625217443404, 'samples': 5895744, 'steps': 30706, 'loss/train': 0.07402755320072174} -08/30/2021 18:48:31 - INFO - __main__ - Step 30708: {'lr': 0.0004550032149315125, 'samples': 5895936, 'steps': 30707, 'loss/train': 1.021190881729126} -08/30/2021 18:48:31 - INFO - __main__ - Step 30709: {'lr': 0.00045500017759621974, 'samples': 5896128, 'steps': 30708, 'loss/train': 0.8101719617843628} -08/30/2021 18:48:33 - INFO - __main__ - Step 30710: {'lr': 0.00045499714016855705, 'samples': 5896320, 'steps': 30709, 'loss/train': 1.648227334022522} -08/30/2021 18:48:33 - INFO - __main__ - Step 30711: {'lr': 0.0004549941026485258, 'samples': 5896512, 'steps': 30710, 'loss/train': 1.285312294960022} -08/30/2021 18:48:34 - INFO - __main__ - Step 30712: {'lr': 0.00045499106503612733, 'samples': 5896704, 'steps': 30711, 'loss/train': 0.16413173079490662} -08/30/2021 18:48:34 - INFO - __main__ - Step 30713: {'lr': 0.00045498802733136306, 'samples': 5896896, 'steps': 30712, 'loss/train': 1.5749156475067139} -08/30/2021 18:48:34 - INFO - __main__ - Step 30714: {'lr': 0.0004549849895342344, 'samples': 5897088, 'steps': 30713, 'loss/train': 1.2998645305633545} -08/30/2021 18:48:36 - INFO - __main__ - Step 30715: {'lr': 0.00045498195164474264, 'samples': 5897280, 'steps': 30714, 'loss/train': 1.4540531635284424} -08/30/2021 18:48:36 - INFO - __main__ - Step 30716: {'lr': 0.00045497891366288914, 'samples': 5897472, 'steps': 30715, 'loss/train': 0.9984238743782043} -08/30/2021 18:48:37 - INFO - __main__ - Step 30717: {'lr': 0.0004549758755886754, 'samples': 5897664, 'steps': 30716, 'loss/train': 1.2595840692520142} -08/30/2021 18:48:37 - INFO - __main__ - Step 30718: {'lr': 0.00045497283742210263, 'samples': 5897856, 'steps': 30717, 'loss/train': 1.497979760169983} -08/30/2021 18:48:37 - INFO - __main__ - Step 30719: {'lr': 0.0004549697991631722, 'samples': 5898048, 'steps': 30718, 'loss/train': 1.5174351930618286} -08/30/2021 18:48:39 - INFO - __main__ - Step 30720: {'lr': 0.0004549667608118856, 'samples': 5898240, 'steps': 30719, 'loss/train': 1.0492194890975952} -08/30/2021 18:48:39 - INFO - __main__ - Step 30721: {'lr': 0.0004549637223682441, 'samples': 5898432, 'steps': 30720, 'loss/train': 1.41859769821167} -08/30/2021 18:48:40 - INFO - __main__ - Step 30722: {'lr': 0.0004549606838322492, 'samples': 5898624, 'steps': 30721, 'loss/train': 0.7829442620277405} -08/30/2021 18:48:40 - INFO - __main__ - Step 30723: {'lr': 0.00045495764520390216, 'samples': 5898816, 'steps': 30722, 'loss/train': 1.7781620025634766} -08/30/2021 18:48:41 - INFO - __main__ - Step 30724: {'lr': 0.0004549546064832043, 'samples': 5899008, 'steps': 30723, 'loss/train': 1.6704813241958618} -08/30/2021 18:48:41 - INFO - __main__ - Step 30725: {'lr': 0.0004549515676701571, 'samples': 5899200, 'steps': 30724, 'loss/train': 1.4118534326553345} -08/30/2021 18:48:42 - INFO - __main__ - Step 30726: {'lr': 0.0004549485287647619, 'samples': 5899392, 'steps': 30725, 'loss/train': 1.3349955081939697} -08/30/2021 18:48:43 - INFO - __main__ - Step 30727: {'lr': 0.00045494548976702, 'samples': 5899584, 'steps': 30726, 'loss/train': 1.1516207456588745} -08/30/2021 18:48:43 - INFO - __main__ - Step 30728: {'lr': 0.0004549424506769329, 'samples': 5899776, 'steps': 30727, 'loss/train': 1.6635746955871582} -08/30/2021 18:48:44 - INFO - __main__ - Step 30729: {'lr': 0.00045493941149450185, 'samples': 5899968, 'steps': 30728, 'loss/train': 1.3222459554672241} -08/30/2021 18:48:44 - INFO - __main__ - Step 30730: {'lr': 0.00045493637221972826, 'samples': 5900160, 'steps': 30729, 'loss/train': 1.2599328756332397} -08/30/2021 18:48:45 - INFO - __main__ - Step 30731: {'lr': 0.0004549333328526135, 'samples': 5900352, 'steps': 30730, 'loss/train': 1.7270764112472534} -08/30/2021 18:48:46 - INFO - __main__ - Step 30732: {'lr': 0.0004549302933931589, 'samples': 5900544, 'steps': 30731, 'loss/train': 1.7319059371948242} -08/30/2021 18:48:46 - INFO - __main__ - Step 30733: {'lr': 0.000454927253841366, 'samples': 5900736, 'steps': 30732, 'loss/train': 1.3709053993225098} -08/30/2021 18:48:47 - INFO - __main__ - Step 30734: {'lr': 0.00045492421419723595, 'samples': 5900928, 'steps': 30733, 'loss/train': 1.575917363166809} -08/30/2021 18:48:47 - INFO - __main__ - Step 30735: {'lr': 0.00045492117446077027, 'samples': 5901120, 'steps': 30734, 'loss/train': 1.0894339084625244} -08/30/2021 18:48:49 - INFO - __main__ - Step 30736: {'lr': 0.0004549181346319702, 'samples': 5901312, 'steps': 30735, 'loss/train': 1.6368627548217773} -08/30/2021 18:48:50 - INFO - __main__ - Step 30737: {'lr': 0.00045491509471083717, 'samples': 5901504, 'steps': 30736, 'loss/train': 1.760408878326416} -08/30/2021 18:48:50 - INFO - __main__ - Step 30738: {'lr': 0.00045491205469737263, 'samples': 5901696, 'steps': 30737, 'loss/train': 0.0563410185277462} -08/30/2021 18:48:50 - INFO - __main__ - Step 30739: {'lr': 0.00045490901459157787, 'samples': 5901888, 'steps': 30738, 'loss/train': 0.8755281567573547} -08/30/2021 18:48:51 - INFO - __main__ - Step 30740: {'lr': 0.0004549059743934543, 'samples': 5902080, 'steps': 30739, 'loss/train': 2.1990723609924316} -08/30/2021 18:48:51 - INFO - __main__ - Step 30741: {'lr': 0.00045490293410300315, 'samples': 5902272, 'steps': 30740, 'loss/train': 1.7682366371154785} -08/30/2021 18:48:53 - INFO - __main__ - Step 30742: {'lr': 0.000454899893720226, 'samples': 5902464, 'steps': 30741, 'loss/train': 1.7818737030029297} -08/30/2021 18:48:53 - INFO - __main__ - Step 30743: {'lr': 0.000454896853245124, 'samples': 5902656, 'steps': 30742, 'loss/train': 1.4426699876785278} -08/30/2021 18:48:54 - INFO - __main__ - Step 30744: {'lr': 0.00045489381267769873, 'samples': 5902848, 'steps': 30743, 'loss/train': 2.0978569984436035} -08/30/2021 18:48:54 - INFO - __main__ - Step 30745: {'lr': 0.00045489077201795147, 'samples': 5903040, 'steps': 30744, 'loss/train': 0.0938764363527298} -08/30/2021 18:48:54 - INFO - __main__ - Step 30746: {'lr': 0.0004548877312658836, 'samples': 5903232, 'steps': 30745, 'loss/train': 0.2202833890914917} -08/30/2021 18:48:56 - INFO - __main__ - Step 30747: {'lr': 0.0004548846904214964, 'samples': 5903424, 'steps': 30746, 'loss/train': 0.2757856845855713} -08/30/2021 18:48:57 - INFO - __main__ - Step 30748: {'lr': 0.00045488164948479144, 'samples': 5903616, 'steps': 30747, 'loss/train': 5.178355693817139} -08/30/2021 18:48:57 - INFO - __main__ - Step 30749: {'lr': 0.0004548786084557699, 'samples': 5903808, 'steps': 30748, 'loss/train': 2.07846999168396} -08/30/2021 18:48:58 - INFO - __main__ - Step 30750: {'lr': 0.00045487556733443327, 'samples': 5904000, 'steps': 30749, 'loss/train': 2.0349440574645996} -08/30/2021 18:48:58 - INFO - __main__ - Step 30751: {'lr': 0.0004548725261207828, 'samples': 5904192, 'steps': 30750, 'loss/train': 1.6126673221588135} -08/30/2021 18:49:00 - INFO - __main__ - Step 30752: {'lr': 0.0004548694848148199, 'samples': 5904384, 'steps': 30751, 'loss/train': 1.5104974508285522} -08/30/2021 18:49:00 - INFO - __main__ - Step 30753: {'lr': 0.0004548664434165461, 'samples': 5904576, 'steps': 30752, 'loss/train': 1.4509780406951904} -08/30/2021 18:49:00 - INFO - __main__ - Step 30754: {'lr': 0.0004548634019259625, 'samples': 5904768, 'steps': 30753, 'loss/train': 1.9487842321395874} -08/30/2021 18:49:01 - INFO - __main__ - Step 30755: {'lr': 0.0004548603603430708, 'samples': 5904960, 'steps': 30754, 'loss/train': 1.8448978662490845} -08/30/2021 18:49:01 - INFO - __main__ - Step 30756: {'lr': 0.00045485731866787206, 'samples': 5905152, 'steps': 30755, 'loss/train': 2.021697759628296} -08/30/2021 18:49:01 - INFO - __main__ - Step 30757: {'lr': 0.00045485427690036774, 'samples': 5905344, 'steps': 30756, 'loss/train': 1.3422011137008667} -08/30/2021 18:49:03 - INFO - __main__ - Step 30758: {'lr': 0.0004548512350405593, 'samples': 5905536, 'steps': 30757, 'loss/train': 2.2996208667755127} -08/30/2021 18:49:04 - INFO - __main__ - Step 30759: {'lr': 0.00045484819308844806, 'samples': 5905728, 'steps': 30758, 'loss/train': 0.22292634844779968} -08/30/2021 18:49:04 - INFO - __main__ - Step 30760: {'lr': 0.00045484515104403535, 'samples': 5905920, 'steps': 30759, 'loss/train': 1.8509353399276733} -08/30/2021 18:49:04 - INFO - __main__ - Step 30761: {'lr': 0.00045484210890732257, 'samples': 5906112, 'steps': 30760, 'loss/train': 4.3263840675354} -08/30/2021 18:49:05 - INFO - __main__ - Step 30762: {'lr': 0.0004548390666783111, 'samples': 5906304, 'steps': 30761, 'loss/train': 1.7753716707229614} -08/30/2021 18:49:06 - INFO - __main__ - Step 30763: {'lr': 0.00045483602435700233, 'samples': 5906496, 'steps': 30762, 'loss/train': 1.623103380203247} -08/30/2021 18:49:07 - INFO - __main__ - Step 30764: {'lr': 0.0004548329819433976, 'samples': 5906688, 'steps': 30763, 'loss/train': 1.4231101274490356} -08/30/2021 18:49:07 - INFO - __main__ - Step 30765: {'lr': 0.00045482993943749835, 'samples': 5906880, 'steps': 30764, 'loss/train': 1.7214608192443848} -08/30/2021 18:49:07 - INFO - __main__ - Step 30766: {'lr': 0.0004548268968393058, 'samples': 5907072, 'steps': 30765, 'loss/train': 1.5821691751480103} -08/30/2021 18:49:08 - INFO - __main__ - Step 30767: {'lr': 0.0004548238541488214, 'samples': 5907264, 'steps': 30766, 'loss/train': 1.4154331684112549} -08/30/2021 18:49:09 - INFO - __main__ - Step 30768: {'lr': 0.00045482081136604665, 'samples': 5907456, 'steps': 30767, 'loss/train': 2.2561757564544678} -08/30/2021 18:49:10 - INFO - __main__ - Step 30769: {'lr': 0.0004548177684909827, 'samples': 5907648, 'steps': 30768, 'loss/train': 2.097651481628418} -08/30/2021 18:49:10 - INFO - __main__ - Step 30770: {'lr': 0.0004548147255236311, 'samples': 5907840, 'steps': 30769, 'loss/train': 1.6543786525726318} -08/30/2021 18:49:11 - INFO - __main__ - Step 30771: {'lr': 0.0004548116824639931, 'samples': 5908032, 'steps': 30770, 'loss/train': 0.8371409177780151} -08/30/2021 18:49:11 - INFO - __main__ - Step 30772: {'lr': 0.00045480863931207004, 'samples': 5908224, 'steps': 30771, 'loss/train': 1.294622540473938} -08/30/2021 18:49:12 - INFO - __main__ - Step 30773: {'lr': 0.0004548055960678635, 'samples': 5908416, 'steps': 30772, 'loss/train': 0.9668754935264587} -08/30/2021 18:49:13 - INFO - __main__ - Step 30774: {'lr': 0.0004548025527313746, 'samples': 5908608, 'steps': 30773, 'loss/train': 1.2499743700027466} -08/30/2021 18:49:13 - INFO - __main__ - Step 30775: {'lr': 0.00045479950930260495, 'samples': 5908800, 'steps': 30774, 'loss/train': 1.503238320350647} -08/30/2021 18:49:13 - INFO - __main__ - Step 30776: {'lr': 0.0004547964657815558, 'samples': 5908992, 'steps': 30775, 'loss/train': 2.233491897583008} -08/30/2021 18:49:14 - INFO - __main__ - Step 30777: {'lr': 0.0004547934221682284, 'samples': 5909184, 'steps': 30776, 'loss/train': 1.6315377950668335} -08/30/2021 18:49:15 - INFO - __main__ - Step 30778: {'lr': 0.00045479037846262436, 'samples': 5909376, 'steps': 30777, 'loss/train': 1.4964544773101807} -08/30/2021 18:49:16 - INFO - __main__ - Step 30779: {'lr': 0.00045478733466474487, 'samples': 5909568, 'steps': 30778, 'loss/train': 1.3854427337646484} -08/30/2021 18:49:16 - INFO - __main__ - Step 30780: {'lr': 0.0004547842907745914, 'samples': 5909760, 'steps': 30779, 'loss/train': 2.303678512573242} -08/30/2021 18:49:16 - INFO - __main__ - Step 30781: {'lr': 0.00045478124679216523, 'samples': 5909952, 'steps': 30780, 'loss/train': 0.6042447686195374} -08/30/2021 18:49:17 - INFO - __main__ - Step 30782: {'lr': 0.00045477820271746784, 'samples': 5910144, 'steps': 30781, 'loss/train': 1.8237941265106201} -08/30/2021 18:49:18 - INFO - __main__ - Step 30783: {'lr': 0.00045477515855050056, 'samples': 5910336, 'steps': 30782, 'loss/train': 1.467685341835022} -08/30/2021 18:49:19 - INFO - __main__ - Step 30784: {'lr': 0.0004547721142912647, 'samples': 5910528, 'steps': 30783, 'loss/train': 1.4459495544433594} -08/30/2021 18:49:19 - INFO - __main__ - Step 30785: {'lr': 0.00045476906993976177, 'samples': 5910720, 'steps': 30784, 'loss/train': 1.0934888124465942} -08/30/2021 18:49:19 - INFO - __main__ - Step 30786: {'lr': 0.000454766025495993, 'samples': 5910912, 'steps': 30785, 'loss/train': 1.7733380794525146} -08/30/2021 18:49:20 - INFO - __main__ - Step 30787: {'lr': 0.00045476298095995985, 'samples': 5911104, 'steps': 30786, 'loss/train': 1.3310542106628418} -08/30/2021 18:49:21 - INFO - __main__ - Step 30788: {'lr': 0.00045475993633166357, 'samples': 5911296, 'steps': 30787, 'loss/train': 2.087355375289917} -08/30/2021 18:49:22 - INFO - __main__ - Step 30789: {'lr': 0.00045475689161110565, 'samples': 5911488, 'steps': 30788, 'loss/train': 1.472395658493042} -08/30/2021 18:49:22 - INFO - __main__ - Step 30790: {'lr': 0.0004547538467982876, 'samples': 5911680, 'steps': 30789, 'loss/train': 1.384239673614502} -08/30/2021 18:49:22 - INFO - __main__ - Step 30791: {'lr': 0.00045475080189321044, 'samples': 5911872, 'steps': 30790, 'loss/train': 1.9620822668075562} -08/30/2021 18:49:23 - INFO - __main__ - Step 30792: {'lr': 0.00045474775689587576, 'samples': 5912064, 'steps': 30791, 'loss/train': 0.883018434047699} -08/30/2021 18:49:25 - INFO - __main__ - Step 30793: {'lr': 0.00045474471180628496, 'samples': 5912256, 'steps': 30792, 'loss/train': 1.6669585704803467} -08/30/2021 18:49:25 - INFO - __main__ - Step 30794: {'lr': 0.0004547416666244393, 'samples': 5912448, 'steps': 30793, 'loss/train': 1.5542956590652466} -08/30/2021 18:49:25 - INFO - __main__ - Step 30795: {'lr': 0.00045473862135034026, 'samples': 5912640, 'steps': 30794, 'loss/train': 2.344510078430176} -08/30/2021 18:49:26 - INFO - __main__ - Step 30796: {'lr': 0.0004547355759839891, 'samples': 5912832, 'steps': 30795, 'loss/train': 1.3065285682678223} -08/30/2021 18:49:26 - INFO - __main__ - Step 30797: {'lr': 0.00045473253052538725, 'samples': 5913024, 'steps': 30796, 'loss/train': 1.646628737449646} -08/30/2021 18:49:26 - INFO - __main__ - Step 30798: {'lr': 0.00045472948497453613, 'samples': 5913216, 'steps': 30797, 'loss/train': 0.9493818879127502} -08/30/2021 18:49:28 - INFO - __main__ - Step 30799: {'lr': 0.00045472643933143703, 'samples': 5913408, 'steps': 30798, 'loss/train': 1.842537760734558} -08/30/2021 18:49:28 - INFO - __main__ - Step 30800: {'lr': 0.0004547233935960914, 'samples': 5913600, 'steps': 30799, 'loss/train': 1.8786332607269287} -08/30/2021 18:49:29 - INFO - __main__ - Step 30801: {'lr': 0.00045472034776850045, 'samples': 5913792, 'steps': 30800, 'loss/train': 1.1885528564453125} -08/30/2021 18:49:29 - INFO - __main__ - Step 30802: {'lr': 0.0004547173018486658, 'samples': 5913984, 'steps': 30801, 'loss/train': 1.4817523956298828} -08/30/2021 18:49:30 - INFO - __main__ - Step 30803: {'lr': 0.0004547142558365887, 'samples': 5914176, 'steps': 30802, 'loss/train': 1.4305671453475952} -08/30/2021 18:49:31 - INFO - __main__ - Step 30804: {'lr': 0.0004547112097322704, 'samples': 5914368, 'steps': 30803, 'loss/train': 1.8907513618469238} -08/30/2021 18:49:32 - INFO - __main__ - Step 30805: {'lr': 0.00045470816353571244, 'samples': 5914560, 'steps': 30804, 'loss/train': 2.446058988571167} -08/30/2021 18:49:32 - INFO - __main__ - Step 30806: {'lr': 0.00045470511724691613, 'samples': 5914752, 'steps': 30805, 'loss/train': 1.7583787441253662} -08/30/2021 18:49:32 - INFO - __main__ - Step 30807: {'lr': 0.0004547020708658829, 'samples': 5914944, 'steps': 30806, 'loss/train': 2.3162994384765625} -08/30/2021 18:49:33 - INFO - __main__ - Step 30808: {'lr': 0.000454699024392614, 'samples': 5915136, 'steps': 30807, 'loss/train': 1.706202507019043} -08/30/2021 18:49:35 - INFO - __main__ - Step 30809: {'lr': 0.0004546959778271109, 'samples': 5915328, 'steps': 30808, 'loss/train': 1.5376631021499634} -08/30/2021 18:49:35 - INFO - __main__ - Step 30810: {'lr': 0.00045469293116937504, 'samples': 5915520, 'steps': 30809, 'loss/train': 1.5420583486557007} -08/30/2021 18:49:36 - INFO - __main__ - Step 30811: {'lr': 0.0004546898844194076, 'samples': 5915712, 'steps': 30810, 'loss/train': 2.193227529525757} -08/30/2021 18:49:36 - INFO - __main__ - Step 30812: {'lr': 0.00045468683757721005, 'samples': 5915904, 'steps': 30811, 'loss/train': 1.6837040185928345} -08/30/2021 18:49:36 - INFO - __main__ - Step 30813: {'lr': 0.0004546837906427839, 'samples': 5916096, 'steps': 30812, 'loss/train': 0.13308674097061157} -08/30/2021 18:49:38 - INFO - __main__ - Step 30814: {'lr': 0.00045468074361613026, 'samples': 5916288, 'steps': 30813, 'loss/train': 1.2525848150253296} -08/30/2021 18:49:38 - INFO - __main__ - Step 30815: {'lr': 0.0004546776964972507, 'samples': 5916480, 'steps': 30814, 'loss/train': 1.945178508758545} -08/30/2021 18:49:38 - INFO - __main__ - Step 30816: {'lr': 0.00045467464928614657, 'samples': 5916672, 'steps': 30815, 'loss/train': 6.111526012420654} -08/30/2021 18:49:39 - INFO - __main__ - Step 30817: {'lr': 0.0004546716019828191, 'samples': 5916864, 'steps': 30816, 'loss/train': 1.3960533142089844} -08/30/2021 18:49:39 - INFO - __main__ - Step 30818: {'lr': 0.00045466855458726975, 'samples': 5917056, 'steps': 30817, 'loss/train': 2.6399331092834473} -08/30/2021 18:49:40 - INFO - __main__ - Step 30819: {'lr': 0.0004546655070995, 'samples': 5917248, 'steps': 30818, 'loss/train': 1.5689665079116821} -08/30/2021 18:49:41 - INFO - __main__ - Step 30820: {'lr': 0.0004546624595195111, 'samples': 5917440, 'steps': 30819, 'loss/train': 0.791919469833374} -08/30/2021 18:49:42 - INFO - __main__ - Step 30821: {'lr': 0.0004546594118473044, 'samples': 5917632, 'steps': 30820, 'loss/train': 1.7441242933273315} -08/30/2021 18:49:43 - INFO - __main__ - Step 30822: {'lr': 0.0004546563640828814, 'samples': 5917824, 'steps': 30821, 'loss/train': 1.2575478553771973} -08/30/2021 18:49:43 - INFO - __main__ - Step 30823: {'lr': 0.0004546533162262434, 'samples': 5918016, 'steps': 30822, 'loss/train': 1.7007139921188354} -08/30/2021 18:49:43 - INFO - __main__ - Step 30824: {'lr': 0.00045465026827739175, 'samples': 5918208, 'steps': 30823, 'loss/train': 1.6082549095153809} -08/30/2021 18:49:44 - INFO - __main__ - Step 30825: {'lr': 0.00045464722023632784, 'samples': 5918400, 'steps': 30824, 'loss/train': 1.9467318058013916} -08/30/2021 18:49:45 - INFO - __main__ - Step 30826: {'lr': 0.00045464417210305303, 'samples': 5918592, 'steps': 30825, 'loss/train': 1.5734565258026123} -08/30/2021 18:49:45 - INFO - __main__ - Step 30827: {'lr': 0.0004546411238775687, 'samples': 5918784, 'steps': 30826, 'loss/train': 1.1093934774398804} -08/30/2021 18:49:46 - INFO - __main__ - Step 30828: {'lr': 0.00045463807555987633, 'samples': 5918976, 'steps': 30827, 'loss/train': 1.1093077659606934} -08/30/2021 18:49:46 - INFO - __main__ - Step 30829: {'lr': 0.0004546350271499772, 'samples': 5919168, 'steps': 30828, 'loss/train': 1.193590760231018} -08/30/2021 18:49:47 - INFO - __main__ - Step 30830: {'lr': 0.0004546319786478726, 'samples': 5919360, 'steps': 30829, 'loss/train': 2.011993646621704} -08/30/2021 18:49:48 - INFO - __main__ - Step 30831: {'lr': 0.000454628930053564, 'samples': 5919552, 'steps': 30830, 'loss/train': 1.3023673295974731} -08/30/2021 18:49:48 - INFO - __main__ - Step 30832: {'lr': 0.0004546258813670528, 'samples': 5919744, 'steps': 30831, 'loss/train': 1.8731135129928589} -08/30/2021 18:49:49 - INFO - __main__ - Step 30833: {'lr': 0.0004546228325883403, 'samples': 5919936, 'steps': 30832, 'loss/train': 1.9937634468078613} -08/30/2021 18:49:49 - INFO - __main__ - Step 30834: {'lr': 0.00045461978371742794, 'samples': 5920128, 'steps': 30833, 'loss/train': 1.5370526313781738} -08/30/2021 18:49:50 - INFO - __main__ - Step 30835: {'lr': 0.00045461673475431704, 'samples': 5920320, 'steps': 30834, 'loss/train': 1.700066089630127} -08/30/2021 18:49:50 - INFO - __main__ - Step 30836: {'lr': 0.00045461368569900895, 'samples': 5920512, 'steps': 30835, 'loss/train': 0.6655746102333069} -08/30/2021 18:49:51 - INFO - __main__ - Step 30837: {'lr': 0.0004546106365515052, 'samples': 5920704, 'steps': 30836, 'loss/train': 1.4005099534988403} -08/30/2021 18:49:52 - INFO - __main__ - Step 30838: {'lr': 0.000454607587311807, 'samples': 5920896, 'steps': 30837, 'loss/train': 1.4010639190673828} -08/30/2021 18:49:52 - INFO - __main__ - Step 30839: {'lr': 0.00045460453797991577, 'samples': 5921088, 'steps': 30838, 'loss/train': 2.6396536827087402} -08/30/2021 18:49:52 - INFO - __main__ - Step 30840: {'lr': 0.00045460148855583295, 'samples': 5921280, 'steps': 30839, 'loss/train': 0.8429959416389465} -08/30/2021 18:49:53 - INFO - __main__ - Step 30841: {'lr': 0.00045459843903955977, 'samples': 5921472, 'steps': 30840, 'loss/train': 2.4020378589630127} -08/30/2021 18:49:54 - INFO - __main__ - Step 30842: {'lr': 0.00045459538943109774, 'samples': 5921664, 'steps': 30841, 'loss/train': 2.0796077251434326} -08/30/2021 18:49:55 - INFO - __main__ - Step 30843: {'lr': 0.0004545923397304482, 'samples': 5921856, 'steps': 30842, 'loss/train': 1.5825914144515991} -08/30/2021 18:49:55 - INFO - __main__ - Step 30844: {'lr': 0.0004545892899376125, 'samples': 5922048, 'steps': 30843, 'loss/train': 1.1890977621078491} -08/30/2021 18:49:56 - INFO - __main__ - Step 30845: {'lr': 0.000454586240052592, 'samples': 5922240, 'steps': 30844, 'loss/train': 1.7922642230987549} -08/30/2021 18:49:56 - INFO - __main__ - Step 30846: {'lr': 0.00045458319007538804, 'samples': 5922432, 'steps': 30845, 'loss/train': 0.11606493592262268} -08/30/2021 18:49:58 - INFO - __main__ - Step 30847: {'lr': 0.00045458014000600213, 'samples': 5922624, 'steps': 30846, 'loss/train': 2.962897300720215} -08/30/2021 18:49:58 - INFO - __main__ - Step 30848: {'lr': 0.00045457708984443556, 'samples': 5922816, 'steps': 30847, 'loss/train': 1.8580104112625122} -08/30/2021 18:49:59 - INFO - __main__ - Step 30849: {'lr': 0.0004545740395906897, 'samples': 5923008, 'steps': 30848, 'loss/train': 1.2826155424118042} -08/30/2021 18:49:59 - INFO - __main__ - Step 30850: {'lr': 0.0004545709892447659, 'samples': 5923200, 'steps': 30849, 'loss/train': 1.5987087488174438} -08/30/2021 18:49:59 - INFO - __main__ - Step 30851: {'lr': 0.00045456793880666556, 'samples': 5923392, 'steps': 30850, 'loss/train': 1.9053318500518799} -08/30/2021 18:50:01 - INFO - __main__ - Step 30852: {'lr': 0.0004545648882763902, 'samples': 5923584, 'steps': 30851, 'loss/train': 2.3845627307891846} -08/30/2021 18:50:01 - INFO - __main__ - Step 30853: {'lr': 0.0004545618376539409, 'samples': 5923776, 'steps': 30852, 'loss/train': 1.5275685787200928} -08/30/2021 18:50:02 - INFO - __main__ - Step 30854: {'lr': 0.0004545587869393193, 'samples': 5923968, 'steps': 30853, 'loss/train': 1.8131331205368042} -08/30/2021 18:50:02 - INFO - __main__ - Step 30855: {'lr': 0.00045455573613252667, 'samples': 5924160, 'steps': 30854, 'loss/train': 1.545103907585144} -08/30/2021 18:50:02 - INFO - __main__ - Step 30856: {'lr': 0.0004545526852335643, 'samples': 5924352, 'steps': 30855, 'loss/train': 0.4495946764945984} -08/30/2021 18:50:03 - INFO - __main__ - Step 30857: {'lr': 0.0004545496342424337, 'samples': 5924544, 'steps': 30856, 'loss/train': 1.836046814918518} -08/30/2021 18:50:04 - INFO - __main__ - Step 30858: {'lr': 0.00045454658315913617, 'samples': 5924736, 'steps': 30857, 'loss/train': 1.7491945028305054} -08/30/2021 18:50:05 - INFO - __main__ - Step 30859: {'lr': 0.0004545435319836731, 'samples': 5924928, 'steps': 30858, 'loss/train': 1.735776662826538} -08/30/2021 18:50:05 - INFO - __main__ - Step 30860: {'lr': 0.00045454048071604593, 'samples': 5925120, 'steps': 30859, 'loss/train': 1.489484190940857} -08/30/2021 18:50:05 - INFO - __main__ - Step 30861: {'lr': 0.0004545374293562559, 'samples': 5925312, 'steps': 30860, 'loss/train': 1.7237929105758667} -08/30/2021 18:50:06 - INFO - __main__ - Step 30862: {'lr': 0.00045453437790430446, 'samples': 5925504, 'steps': 30861, 'loss/train': 1.4091020822525024} -08/30/2021 18:50:07 - INFO - __main__ - Step 30863: {'lr': 0.000454531326360193, 'samples': 5925696, 'steps': 30862, 'loss/train': 1.1842780113220215} -08/30/2021 18:50:08 - INFO - __main__ - Step 30864: {'lr': 0.00045452827472392286, 'samples': 5925888, 'steps': 30863, 'loss/train': 1.3570895195007324} -08/30/2021 18:50:08 - INFO - __main__ - Step 30865: {'lr': 0.0004545252229954955, 'samples': 5926080, 'steps': 30864, 'loss/train': 1.746134638786316} -08/30/2021 18:50:08 - INFO - __main__ - Step 30866: {'lr': 0.00045452217117491225, 'samples': 5926272, 'steps': 30865, 'loss/train': 1.3915296792984009} -08/30/2021 18:50:09 - INFO - __main__ - Step 30867: {'lr': 0.00045451911926217437, 'samples': 5926464, 'steps': 30866, 'loss/train': 2.1020700931549072} -08/30/2021 18:50:10 - INFO - __main__ - Step 30868: {'lr': 0.00045451606725728337, 'samples': 5926656, 'steps': 30867, 'loss/train': 1.5282713174819946} -08/30/2021 18:50:11 - INFO - __main__ - Step 30869: {'lr': 0.0004545130151602406, 'samples': 5926848, 'steps': 30868, 'loss/train': 1.4010648727416992} -08/30/2021 18:50:11 - INFO - __main__ - Step 30870: {'lr': 0.00045450996297104743, 'samples': 5927040, 'steps': 30869, 'loss/train': 1.5088531970977783} -08/30/2021 18:50:11 - INFO - __main__ - Step 30871: {'lr': 0.00045450691068970515, 'samples': 5927232, 'steps': 30870, 'loss/train': 1.042020559310913} -08/30/2021 18:50:12 - INFO - __main__ - Step 30872: {'lr': 0.00045450385831621534, 'samples': 5927424, 'steps': 30871, 'loss/train': 0.8496931195259094} -08/30/2021 18:50:13 - INFO - __main__ - Step 30873: {'lr': 0.0004545008058505792, 'samples': 5927616, 'steps': 30872, 'loss/train': 1.6761102676391602} -08/30/2021 18:50:14 - INFO - __main__ - Step 30874: {'lr': 0.0004544977532927981, 'samples': 5927808, 'steps': 30873, 'loss/train': 1.7711992263793945} -08/30/2021 18:50:14 - INFO - __main__ - Step 30875: {'lr': 0.0004544947006428735, 'samples': 5928000, 'steps': 30874, 'loss/train': 1.7140474319458008} -08/30/2021 18:50:14 - INFO - __main__ - Step 30876: {'lr': 0.00045449164790080675, 'samples': 5928192, 'steps': 30875, 'loss/train': 2.2052786350250244} -08/30/2021 18:50:15 - INFO - __main__ - Step 30877: {'lr': 0.00045448859506659926, 'samples': 5928384, 'steps': 30876, 'loss/train': 1.2395455837249756} -08/30/2021 18:50:16 - INFO - __main__ - Step 30878: {'lr': 0.0004544855421402523, 'samples': 5928576, 'steps': 30877, 'loss/train': 0.8298559188842773} -08/30/2021 18:50:17 - INFO - __main__ - Step 30879: {'lr': 0.00045448248912176726, 'samples': 5928768, 'steps': 30878, 'loss/train': 1.4166877269744873} -08/30/2021 18:50:17 - INFO - __main__ - Step 30880: {'lr': 0.00045447943601114563, 'samples': 5928960, 'steps': 30879, 'loss/train': 1.4694899320602417} -08/30/2021 18:50:17 - INFO - __main__ - Step 30881: {'lr': 0.00045447638280838877, 'samples': 5929152, 'steps': 30880, 'loss/train': 2.2456774711608887} -08/30/2021 18:50:18 - INFO - __main__ - Step 30882: {'lr': 0.000454473329513498, 'samples': 5929344, 'steps': 30881, 'loss/train': 1.9202115535736084} -08/30/2021 18:50:19 - INFO - __main__ - Step 30883: {'lr': 0.0004544702761264746, 'samples': 5929536, 'steps': 30882, 'loss/train': 1.6379255056381226} -08/30/2021 18:50:20 - INFO - __main__ - Step 30884: {'lr': 0.0004544672226473201, 'samples': 5929728, 'steps': 30883, 'loss/train': 1.4454952478408813} -08/30/2021 18:50:20 - INFO - __main__ - Step 30885: {'lr': 0.00045446416907603585, 'samples': 5929920, 'steps': 30884, 'loss/train': 0.6298514008522034} -08/30/2021 18:50:21 - INFO - __main__ - Step 30886: {'lr': 0.00045446111541262317, 'samples': 5930112, 'steps': 30885, 'loss/train': 1.408557653427124} -08/30/2021 18:50:21 - INFO - __main__ - Step 30887: {'lr': 0.0004544580616570835, 'samples': 5930304, 'steps': 30886, 'loss/train': 1.8558675050735474} -08/30/2021 18:50:21 - INFO - __main__ - Step 30888: {'lr': 0.0004544550078094182, 'samples': 5930496, 'steps': 30887, 'loss/train': 2.537599563598633} -08/30/2021 18:50:23 - INFO - __main__ - Step 30889: {'lr': 0.00045445195386962855, 'samples': 5930688, 'steps': 30888, 'loss/train': 1.8573321104049683} -08/30/2021 18:50:23 - INFO - __main__ - Step 30890: {'lr': 0.0004544488998377161, 'samples': 5930880, 'steps': 30889, 'loss/train': 1.3963596820831299} -08/30/2021 18:50:23 - INFO - __main__ - Step 30891: {'lr': 0.000454445845713682, 'samples': 5931072, 'steps': 30890, 'loss/train': 1.4934232234954834} -08/30/2021 18:50:24 - INFO - __main__ - Step 30892: {'lr': 0.0004544427914975279, 'samples': 5931264, 'steps': 30891, 'loss/train': 1.6173315048217773} -08/30/2021 18:50:24 - INFO - __main__ - Step 30893: {'lr': 0.0004544397371892549, 'samples': 5931456, 'steps': 30892, 'loss/train': 1.3055099248886108} -08/30/2021 18:50:26 - INFO - __main__ - Step 30894: {'lr': 0.00045443668278886463, 'samples': 5931648, 'steps': 30893, 'loss/train': 2.3843724727630615} -08/30/2021 18:50:26 - INFO - __main__ - Step 30895: {'lr': 0.00045443362829635826, 'samples': 5931840, 'steps': 30894, 'loss/train': 1.3252021074295044} -08/30/2021 18:50:27 - INFO - __main__ - Step 30896: {'lr': 0.00045443057371173727, 'samples': 5932032, 'steps': 30895, 'loss/train': 1.3170150518417358} -08/30/2021 18:50:27 - INFO - __main__ - Step 30897: {'lr': 0.00045442751903500305, 'samples': 5932224, 'steps': 30896, 'loss/train': 1.4374134540557861} -08/30/2021 18:50:27 - INFO - __main__ - Step 30898: {'lr': 0.0004544244642661569, 'samples': 5932416, 'steps': 30897, 'loss/train': 1.7875052690505981} -08/30/2021 18:50:29 - INFO - __main__ - Step 30899: {'lr': 0.00045442140940520027, 'samples': 5932608, 'steps': 30898, 'loss/train': 1.4098151922225952} -08/30/2021 18:50:30 - INFO - __main__ - Step 30900: {'lr': 0.0004544183544521345, 'samples': 5932800, 'steps': 30899, 'loss/train': 1.2480617761611938} -08/30/2021 18:50:30 - INFO - __main__ - Step 30901: {'lr': 0.00045441529940696104, 'samples': 5932992, 'steps': 30900, 'loss/train': 0.08100544661283493} -08/30/2021 18:50:31 - INFO - __main__ - Step 30902: {'lr': 0.0004544122442696811, 'samples': 5933184, 'steps': 30901, 'loss/train': 1.4734858274459839} -08/30/2021 18:50:31 - INFO - __main__ - Step 30903: {'lr': 0.0004544091890402962, 'samples': 5933376, 'steps': 30902, 'loss/train': 5.889724254608154} -08/30/2021 18:50:31 - INFO - __main__ - Step 30904: {'lr': 0.0004544061337188077, 'samples': 5933568, 'steps': 30903, 'loss/train': 1.1169508695602417} -08/30/2021 18:50:33 - INFO - __main__ - Step 30905: {'lr': 0.0004544030783052169, 'samples': 5933760, 'steps': 30904, 'loss/train': 1.4590866565704346} -08/30/2021 18:50:33 - INFO - __main__ - Step 30906: {'lr': 0.0004544000227995253, 'samples': 5933952, 'steps': 30905, 'loss/train': 1.4959120750427246} -08/30/2021 18:50:34 - INFO - __main__ - Step 30907: {'lr': 0.00045439696720173405, 'samples': 5934144, 'steps': 30906, 'loss/train': 1.5704470872879028} -08/30/2021 18:50:34 - INFO - __main__ - Step 30908: {'lr': 0.00045439391151184483, 'samples': 5934336, 'steps': 30907, 'loss/train': 0.8742191195487976} -08/30/2021 18:50:34 - INFO - __main__ - Step 30909: {'lr': 0.0004543908557298588, 'samples': 5934528, 'steps': 30908, 'loss/train': 6.299698829650879} -08/30/2021 18:50:36 - INFO - __main__ - Step 30910: {'lr': 0.0004543877998557775, 'samples': 5934720, 'steps': 30909, 'loss/train': 1.4043680429458618} -08/30/2021 18:50:36 - INFO - __main__ - Step 30911: {'lr': 0.00045438474388960205, 'samples': 5934912, 'steps': 30910, 'loss/train': 1.7212448120117188} -08/30/2021 18:50:37 - INFO - __main__ - Step 30912: {'lr': 0.0004543816878313341, 'samples': 5935104, 'steps': 30911, 'loss/train': 0.9468260407447815} -08/30/2021 18:50:37 - INFO - __main__ - Step 30913: {'lr': 0.0004543786316809749, 'samples': 5935296, 'steps': 30912, 'loss/train': 1.539900302886963} -08/30/2021 18:50:37 - INFO - __main__ - Step 30914: {'lr': 0.0004543755754385258, 'samples': 5935488, 'steps': 30913, 'loss/train': 1.3757702112197876} -08/30/2021 18:50:39 - INFO - __main__ - Step 30915: {'lr': 0.00045437251910398824, 'samples': 5935680, 'steps': 30914, 'loss/train': 1.5696769952774048} -08/30/2021 18:50:39 - INFO - __main__ - Step 30916: {'lr': 0.00045436946267736364, 'samples': 5935872, 'steps': 30915, 'loss/train': 1.4715920686721802} -08/30/2021 18:50:40 - INFO - __main__ - Step 30917: {'lr': 0.0004543664061586532, 'samples': 5936064, 'steps': 30916, 'loss/train': 1.9693139791488647} -08/30/2021 18:50:40 - INFO - __main__ - Step 30918: {'lr': 0.00045436334954785854, 'samples': 5936256, 'steps': 30917, 'loss/train': 1.5209686756134033} -08/30/2021 18:50:40 - INFO - __main__ - Step 30919: {'lr': 0.0004543602928449808, 'samples': 5936448, 'steps': 30918, 'loss/train': 1.678979516029358} -08/30/2021 18:50:42 - INFO - __main__ - Step 30920: {'lr': 0.00045435723605002156, 'samples': 5936640, 'steps': 30919, 'loss/train': 1.150206208229065} -08/30/2021 18:50:43 - INFO - __main__ - Step 30921: {'lr': 0.00045435417916298205, 'samples': 5936832, 'steps': 30920, 'loss/train': 1.7728164196014404} -08/30/2021 18:50:43 - INFO - __main__ - Step 30922: {'lr': 0.00045435112218386364, 'samples': 5937024, 'steps': 30921, 'loss/train': 1.5260149240493774} -08/30/2021 18:50:43 - INFO - __main__ - Step 30923: {'lr': 0.00045434806511266784, 'samples': 5937216, 'steps': 30922, 'loss/train': 1.8596521615982056} -08/30/2021 18:50:44 - INFO - __main__ - Step 30924: {'lr': 0.0004543450079493959, 'samples': 5937408, 'steps': 30923, 'loss/train': 1.4759269952774048} -08/30/2021 18:50:44 - INFO - __main__ - Step 30925: {'lr': 0.0004543419506940494, 'samples': 5937600, 'steps': 30924, 'loss/train': 1.5433435440063477} -08/30/2021 18:50:46 - INFO - __main__ - Step 30926: {'lr': 0.0004543388933466294, 'samples': 5937792, 'steps': 30925, 'loss/train': 1.554054617881775} -08/30/2021 18:50:46 - INFO - __main__ - Step 30927: {'lr': 0.00045433583590713756, 'samples': 5937984, 'steps': 30926, 'loss/train': 1.2592685222625732} -08/30/2021 18:50:46 - INFO - __main__ - Step 30928: {'lr': 0.0004543327783755751, 'samples': 5938176, 'steps': 30927, 'loss/train': 1.513053297996521} -08/30/2021 18:50:47 - INFO - __main__ - Step 30929: {'lr': 0.0004543297207519434, 'samples': 5938368, 'steps': 30928, 'loss/train': 1.5072624683380127} -08/30/2021 18:50:47 - INFO - __main__ - Step 30930: {'lr': 0.0004543266630362439, 'samples': 5938560, 'steps': 30929, 'loss/train': 1.7903330326080322} -08/30/2021 18:50:49 - INFO - __main__ - Step 30931: {'lr': 0.00045432360522847803, 'samples': 5938752, 'steps': 30930, 'loss/train': 1.0317519903182983} -08/30/2021 18:50:49 - INFO - __main__ - Step 30932: {'lr': 0.000454320547328647, 'samples': 5938944, 'steps': 30931, 'loss/train': 1.5009169578552246} -08/30/2021 18:50:49 - INFO - __main__ - Step 30933: {'lr': 0.00045431748933675236, 'samples': 5939136, 'steps': 30932, 'loss/train': 1.7834892272949219} -08/30/2021 18:50:50 - INFO - __main__ - Step 30934: {'lr': 0.00045431443125279534, 'samples': 5939328, 'steps': 30933, 'loss/train': 1.3241400718688965} -08/30/2021 18:50:50 - INFO - __main__ - Step 30935: {'lr': 0.00045431137307677753, 'samples': 5939520, 'steps': 30934, 'loss/train': 1.6047395467758179} -08/30/2021 18:50:50 - INFO - __main__ - Step 30936: {'lr': 0.00045430831480870005, 'samples': 5939712, 'steps': 30935, 'loss/train': 2.9298365116119385} -08/30/2021 18:50:52 - INFO - __main__ - Step 30937: {'lr': 0.0004543052564485644, 'samples': 5939904, 'steps': 30936, 'loss/train': 1.4615219831466675} -08/30/2021 18:50:53 - INFO - __main__ - Step 30938: {'lr': 0.00045430219799637197, 'samples': 5940096, 'steps': 30937, 'loss/train': 1.4555654525756836} -08/30/2021 18:50:53 - INFO - __main__ - Step 30939: {'lr': 0.0004542991394521241, 'samples': 5940288, 'steps': 30938, 'loss/train': 0.75577712059021} -08/30/2021 18:50:54 - INFO - __main__ - Step 30940: {'lr': 0.00045429608081582216, 'samples': 5940480, 'steps': 30939, 'loss/train': 1.7842686176300049} -08/30/2021 18:50:54 - INFO - __main__ - Step 30941: {'lr': 0.0004542930220874677, 'samples': 5940672, 'steps': 30940, 'loss/train': 1.5237113237380981} -08/30/2021 18:50:54 - INFO - __main__ - Step 30942: {'lr': 0.00045428996326706185, 'samples': 5940864, 'steps': 30941, 'loss/train': 1.1260379552841187} -08/30/2021 18:50:56 - INFO - __main__ - Step 30943: {'lr': 0.0004542869043546061, 'samples': 5941056, 'steps': 30942, 'loss/train': 0.05700213089585304} -08/30/2021 18:50:56 - INFO - __main__ - Step 30944: {'lr': 0.0004542838453501018, 'samples': 5941248, 'steps': 30943, 'loss/train': 1.2519384622573853} -08/30/2021 18:50:57 - INFO - __main__ - Step 30945: {'lr': 0.0004542807862535504, 'samples': 5941440, 'steps': 30944, 'loss/train': 1.4879227876663208} -08/30/2021 18:50:57 - INFO - __main__ - Step 30946: {'lr': 0.0004542777270649533, 'samples': 5941632, 'steps': 30945, 'loss/train': 1.4120968580245972} -08/30/2021 18:50:57 - INFO - __main__ - Step 30947: {'lr': 0.0004542746677843117, 'samples': 5941824, 'steps': 30946, 'loss/train': 1.5219526290893555} -08/30/2021 18:50:59 - INFO - __main__ - Step 30948: {'lr': 0.0004542716084116271, 'samples': 5942016, 'steps': 30947, 'loss/train': 1.6526983976364136} -08/30/2021 18:50:59 - INFO - __main__ - Step 30949: {'lr': 0.0004542685489469008, 'samples': 5942208, 'steps': 30948, 'loss/train': 1.6261321306228638} -08/30/2021 18:51:00 - INFO - __main__ - Step 30950: {'lr': 0.0004542654893901344, 'samples': 5942400, 'steps': 30949, 'loss/train': 1.5929393768310547} -08/30/2021 18:51:00 - INFO - __main__ - Step 30951: {'lr': 0.00045426242974132904, 'samples': 5942592, 'steps': 30950, 'loss/train': 1.4672390222549438} -08/30/2021 18:51:00 - INFO - __main__ - Step 30952: {'lr': 0.0004542593700004862, 'samples': 5942784, 'steps': 30951, 'loss/train': 0.5524551272392273} -08/30/2021 18:51:02 - INFO - __main__ - Step 30953: {'lr': 0.0004542563101676072, 'samples': 5942976, 'steps': 30952, 'loss/train': 2.3349385261535645} -08/30/2021 18:51:03 - INFO - __main__ - Step 30954: {'lr': 0.0004542532502426935, 'samples': 5943168, 'steps': 30953, 'loss/train': 1.7408747673034668} -08/30/2021 18:51:03 - INFO - __main__ - Step 30955: {'lr': 0.0004542501902257464, 'samples': 5943360, 'steps': 30954, 'loss/train': 0.8640762567520142} -08/30/2021 18:51:03 - INFO - __main__ - Step 30956: {'lr': 0.0004542471301167673, 'samples': 5943552, 'steps': 30955, 'loss/train': 1.533851146697998} -08/30/2021 18:51:04 - INFO - __main__ - Step 30957: {'lr': 0.0004542440699157577, 'samples': 5943744, 'steps': 30956, 'loss/train': 1.377493143081665} -08/30/2021 18:51:04 - INFO - __main__ - Step 30958: {'lr': 0.00045424100962271883, 'samples': 5943936, 'steps': 30957, 'loss/train': 0.5838767290115356} -08/30/2021 18:51:06 - INFO - __main__ - Step 30959: {'lr': 0.00045423794923765204, 'samples': 5944128, 'steps': 30958, 'loss/train': 1.1220017671585083} -08/30/2021 18:51:06 - INFO - __main__ - Step 30960: {'lr': 0.00045423488876055883, 'samples': 5944320, 'steps': 30959, 'loss/train': 1.49917471408844} -08/30/2021 18:51:06 - INFO - __main__ - Step 30961: {'lr': 0.00045423182819144054, 'samples': 5944512, 'steps': 30960, 'loss/train': 1.4788119792938232} -08/30/2021 18:51:07 - INFO - __main__ - Step 30962: {'lr': 0.00045422876753029853, 'samples': 5944704, 'steps': 30961, 'loss/train': 2.0732154846191406} -08/30/2021 18:51:07 - INFO - __main__ - Step 30963: {'lr': 0.0004542257067771342, 'samples': 5944896, 'steps': 30962, 'loss/train': 1.7146772146224976} -08/30/2021 18:51:09 - INFO - __main__ - Step 30964: {'lr': 0.0004542226459319489, 'samples': 5945088, 'steps': 30963, 'loss/train': 1.3630406856536865} -08/30/2021 18:51:09 - INFO - __main__ - Step 30965: {'lr': 0.000454219584994744, 'samples': 5945280, 'steps': 30964, 'loss/train': 1.5847492218017578} -08/30/2021 18:51:09 - INFO - __main__ - Step 30966: {'lr': 0.00045421652396552094, 'samples': 5945472, 'steps': 30965, 'loss/train': 1.6061770915985107} -08/30/2021 18:51:10 - INFO - __main__ - Step 30967: {'lr': 0.0004542134628442811, 'samples': 5945664, 'steps': 30966, 'loss/train': 1.8897978067398071} -08/30/2021 18:51:10 - INFO - __main__ - Step 30968: {'lr': 0.0004542104016310258, 'samples': 5945856, 'steps': 30967, 'loss/train': 1.4476398229599} -08/30/2021 18:51:12 - INFO - __main__ - Step 30969: {'lr': 0.0004542073403257564, 'samples': 5946048, 'steps': 30968, 'loss/train': 1.5867505073547363} -08/30/2021 18:51:12 - INFO - __main__ - Step 30970: {'lr': 0.0004542042789284744, 'samples': 5946240, 'steps': 30969, 'loss/train': 0.815251886844635} -08/30/2021 18:51:13 - INFO - __main__ - Step 30971: {'lr': 0.0004542012174391811, 'samples': 5946432, 'steps': 30970, 'loss/train': 1.3785136938095093} -08/30/2021 18:51:13 - INFO - __main__ - Step 30972: {'lr': 0.0004541981558578778, 'samples': 5946624, 'steps': 30971, 'loss/train': 1.2928060293197632} -08/30/2021 18:51:14 - INFO - __main__ - Step 30973: {'lr': 0.00045419509418456603, 'samples': 5946816, 'steps': 30972, 'loss/train': 0.06197367236018181} -08/30/2021 18:51:14 - INFO - __main__ - Step 30974: {'lr': 0.00045419203241924705, 'samples': 5947008, 'steps': 30973, 'loss/train': 0.049440354108810425} -08/30/2021 18:51:15 - INFO - __main__ - Step 30975: {'lr': 0.00045418897056192234, 'samples': 5947200, 'steps': 30974, 'loss/train': 1.4731558561325073} -08/30/2021 18:51:16 - INFO - __main__ - Step 30976: {'lr': 0.00045418590861259317, 'samples': 5947392, 'steps': 30975, 'loss/train': 1.7465013265609741} -08/30/2021 18:51:16 - INFO - __main__ - Step 30977: {'lr': 0.0004541828465712611, 'samples': 5947584, 'steps': 30976, 'loss/train': 2.1222403049468994} -08/30/2021 18:51:17 - INFO - __main__ - Step 30978: {'lr': 0.0004541797844379273, 'samples': 5947776, 'steps': 30977, 'loss/train': 1.5453827381134033} -08/30/2021 18:51:17 - INFO - __main__ - Step 30979: {'lr': 0.0004541767222125932, 'samples': 5947968, 'steps': 30978, 'loss/train': 0.9147385358810425} -08/30/2021 18:51:18 - INFO - __main__ - Step 30980: {'lr': 0.0004541736598952603, 'samples': 5948160, 'steps': 30979, 'loss/train': 1.868829607963562} -08/30/2021 18:51:19 - INFO - __main__ - Step 30981: {'lr': 0.0004541705974859298, 'samples': 5948352, 'steps': 30980, 'loss/train': 1.7710955142974854} -08/30/2021 18:51:19 - INFO - __main__ - Step 30982: {'lr': 0.0004541675349846033, 'samples': 5948544, 'steps': 30981, 'loss/train': 1.6964755058288574} -08/30/2021 18:51:20 - INFO - __main__ - Step 30983: {'lr': 0.000454164472391282, 'samples': 5948736, 'steps': 30982, 'loss/train': 1.7199519872665405} -08/30/2021 18:51:20 - INFO - __main__ - Step 30984: {'lr': 0.00045416140970596736, 'samples': 5948928, 'steps': 30983, 'loss/train': 1.543184518814087} -08/30/2021 18:51:21 - INFO - __main__ - Step 30985: {'lr': 0.0004541583469286607, 'samples': 5949120, 'steps': 30984, 'loss/train': 1.5816707611083984} -08/30/2021 18:51:22 - INFO - __main__ - Step 30986: {'lr': 0.00045415528405936347, 'samples': 5949312, 'steps': 30985, 'loss/train': 0.5726720690727234} -08/30/2021 18:51:22 - INFO - __main__ - Step 30987: {'lr': 0.000454152221098077, 'samples': 5949504, 'steps': 30986, 'loss/train': 2.082681179046631} -08/30/2021 18:51:23 - INFO - __main__ - Step 30988: {'lr': 0.0004541491580448027, 'samples': 5949696, 'steps': 30987, 'loss/train': 0.43030846118927} -08/30/2021 18:51:23 - INFO - __main__ - Step 30989: {'lr': 0.00045414609489954195, 'samples': 5949888, 'steps': 30988, 'loss/train': 1.1053502559661865} -08/30/2021 18:51:24 - INFO - __main__ - Step 30990: {'lr': 0.00045414303166229616, 'samples': 5950080, 'steps': 30989, 'loss/train': 1.3367358446121216} -08/30/2021 18:51:25 - INFO - __main__ - Step 30991: {'lr': 0.0004541399683330666, 'samples': 5950272, 'steps': 30990, 'loss/train': 1.6095401048660278} -08/30/2021 18:51:25 - INFO - __main__ - Step 30992: {'lr': 0.00045413690491185476, 'samples': 5950464, 'steps': 30991, 'loss/train': 1.5008652210235596} -08/30/2021 18:51:25 - INFO - __main__ - Step 30993: {'lr': 0.00045413384139866196, 'samples': 5950656, 'steps': 30992, 'loss/train': 1.0580347776412964} -08/30/2021 18:51:26 - INFO - __main__ - Step 30994: {'lr': 0.0004541307777934896, 'samples': 5950848, 'steps': 30993, 'loss/train': 1.4069619178771973} -08/30/2021 18:51:27 - INFO - __main__ - Step 30995: {'lr': 0.00045412771409633905, 'samples': 5951040, 'steps': 30994, 'loss/train': 1.3995437622070312} -08/30/2021 18:51:28 - INFO - __main__ - Step 30996: {'lr': 0.0004541246503072117, 'samples': 5951232, 'steps': 30995, 'loss/train': 1.1555570363998413} -08/30/2021 18:51:28 - INFO - __main__ - Step 30997: {'lr': 0.000454121586426109, 'samples': 5951424, 'steps': 30996, 'loss/train': 0.0732298418879509} -08/30/2021 18:51:28 - INFO - __main__ - Step 30998: {'lr': 0.0004541185224530322, 'samples': 5951616, 'steps': 30997, 'loss/train': 1.7845025062561035} -08/30/2021 18:51:29 - INFO - __main__ - Step 30999: {'lr': 0.00045411545838798273, 'samples': 5951808, 'steps': 30998, 'loss/train': 2.0827035903930664} -08/30/2021 18:51:31 - INFO - __main__ - Step 31000: {'lr': 0.00045411239423096206, 'samples': 5952000, 'steps': 30999, 'loss/train': 1.3978526592254639} -08/30/2021 18:51:31 - INFO - __main__ - Step 31001: {'lr': 0.0004541093299819714, 'samples': 5952192, 'steps': 31000, 'loss/train': 1.2286460399627686} -08/30/2021 18:51:31 - INFO - __main__ - Step 31002: {'lr': 0.0004541062656410123, 'samples': 5952384, 'steps': 31001, 'loss/train': 1.4909310340881348} -08/30/2021 18:51:32 - INFO - __main__ - Step 31003: {'lr': 0.000454103201208086, 'samples': 5952576, 'steps': 31002, 'loss/train': 1.0090872049331665} -08/30/2021 18:51:32 - INFO - __main__ - Step 31004: {'lr': 0.00045410013668319404, 'samples': 5952768, 'steps': 31003, 'loss/train': 1.0905442237854004} -08/30/2021 18:51:34 - INFO - __main__ - Step 31005: {'lr': 0.00045409707206633764, 'samples': 5952960, 'steps': 31004, 'loss/train': 1.5193109512329102} -08/30/2021 18:51:34 - INFO - __main__ - Step 31006: {'lr': 0.0004540940073575183, 'samples': 5953152, 'steps': 31005, 'loss/train': 1.1039931774139404} -08/30/2021 18:51:35 - INFO - __main__ - Step 31007: {'lr': 0.00045409094255673734, 'samples': 5953344, 'steps': 31006, 'loss/train': 0.048871610313653946} -08/30/2021 18:51:35 - INFO - __main__ - Step 31008: {'lr': 0.00045408787766399605, 'samples': 5953536, 'steps': 31007, 'loss/train': 1.1516616344451904} -08/30/2021 18:51:36 - INFO - __main__ - Step 31009: {'lr': 0.00045408481267929604, 'samples': 5953728, 'steps': 31008, 'loss/train': 1.1795395612716675} -08/30/2021 18:51:36 - INFO - __main__ - Step 31010: {'lr': 0.0004540817476026385, 'samples': 5953920, 'steps': 31009, 'loss/train': 1.6250652074813843} -08/30/2021 18:51:38 - INFO - __main__ - Step 31011: {'lr': 0.00045407868243402483, 'samples': 5954112, 'steps': 31010, 'loss/train': 1.7105629444122314} -08/30/2021 18:51:39 - INFO - __main__ - Step 31012: {'lr': 0.0004540756171734565, 'samples': 5954304, 'steps': 31011, 'loss/train': 1.6094919443130493} -08/30/2021 18:51:39 - INFO - __main__ - Step 31013: {'lr': 0.0004540725518209349, 'samples': 5954496, 'steps': 31012, 'loss/train': 1.7254704236984253} -08/30/2021 18:51:40 - INFO - __main__ - Step 31014: {'lr': 0.0004540694863764613, 'samples': 5954688, 'steps': 31013, 'loss/train': 1.6626132726669312} -08/30/2021 18:51:40 - INFO - __main__ - Step 31015: {'lr': 0.0004540664208400371, 'samples': 5954880, 'steps': 31014, 'loss/train': 1.1268343925476074} -08/30/2021 18:51:40 - INFO - __main__ - Step 31016: {'lr': 0.0004540633552116638, 'samples': 5955072, 'steps': 31015, 'loss/train': 0.9672594666481018} -08/30/2021 18:51:42 - INFO - __main__ - Step 31017: {'lr': 0.0004540602894913427, 'samples': 5955264, 'steps': 31016, 'loss/train': 1.5981063842773438} -08/30/2021 18:51:42 - INFO - __main__ - Step 31018: {'lr': 0.0004540572236790751, 'samples': 5955456, 'steps': 31017, 'loss/train': 1.673006534576416} -08/30/2021 18:51:43 - INFO - __main__ - Step 31019: {'lr': 0.0004540541577748625, 'samples': 5955648, 'steps': 31018, 'loss/train': 1.6203272342681885} -08/30/2021 18:51:43 - INFO - __main__ - Step 31020: {'lr': 0.0004540510917787063, 'samples': 5955840, 'steps': 31019, 'loss/train': 1.5703866481781006} -08/30/2021 18:51:43 - INFO - __main__ - Step 31021: {'lr': 0.00045404802569060776, 'samples': 5956032, 'steps': 31020, 'loss/train': 1.4292266368865967} -08/30/2021 18:51:45 - INFO - __main__ - Step 31022: {'lr': 0.00045404495951056835, 'samples': 5956224, 'steps': 31021, 'loss/train': 0.05232563614845276} -08/30/2021 18:51:46 - INFO - __main__ - Step 31023: {'lr': 0.00045404189323858946, 'samples': 5956416, 'steps': 31022, 'loss/train': 1.0030027627944946} -08/30/2021 18:51:46 - INFO - __main__ - Step 31024: {'lr': 0.0004540388268746724, 'samples': 5956608, 'steps': 31023, 'loss/train': 1.4967166185379028} -08/30/2021 18:51:46 - INFO - __main__ - Step 31025: {'lr': 0.0004540357604188186, 'samples': 5956800, 'steps': 31024, 'loss/train': 1.2149097919464111} -08/30/2021 18:51:47 - INFO - __main__ - Step 31026: {'lr': 0.0004540326938710295, 'samples': 5956992, 'steps': 31025, 'loss/train': 1.8220106363296509} -08/30/2021 18:51:48 - INFO - __main__ - Step 31027: {'lr': 0.0004540296272313064, 'samples': 5957184, 'steps': 31026, 'loss/train': 1.1777232885360718} -08/30/2021 18:51:48 - INFO - __main__ - Step 31028: {'lr': 0.00045402656049965055, 'samples': 5957376, 'steps': 31027, 'loss/train': 1.8113280534744263} -08/30/2021 18:51:49 - INFO - __main__ - Step 31029: {'lr': 0.0004540234936760636, 'samples': 5957568, 'steps': 31028, 'loss/train': 0.05803866684436798} -08/30/2021 18:51:49 - INFO - __main__ - Step 31030: {'lr': 0.00045402042676054684, 'samples': 5957760, 'steps': 31029, 'loss/train': 1.611311912536621} -08/30/2021 18:51:50 - INFO - __main__ - Step 31031: {'lr': 0.0004540173597531015, 'samples': 5957952, 'steps': 31030, 'loss/train': 1.4595378637313843} -08/30/2021 18:51:51 - INFO - __main__ - Step 31032: {'lr': 0.00045401429265372925, 'samples': 5958144, 'steps': 31031, 'loss/train': 1.6035057306289673} -08/30/2021 18:51:52 - INFO - __main__ - Step 31033: {'lr': 0.0004540112254624312, 'samples': 5958336, 'steps': 31032, 'loss/train': 1.3567496538162231} -08/30/2021 18:51:52 - INFO - __main__ - Step 31034: {'lr': 0.0004540081581792089, 'samples': 5958528, 'steps': 31033, 'loss/train': 1.5247254371643066} -08/30/2021 18:51:52 - INFO - __main__ - Step 31035: {'lr': 0.0004540050908040636, 'samples': 5958720, 'steps': 31034, 'loss/train': 1.4087685346603394} -08/30/2021 18:51:53 - INFO - __main__ - Step 31036: {'lr': 0.0004540020233369968, 'samples': 5958912, 'steps': 31035, 'loss/train': 1.0668528079986572} -08/30/2021 18:51:53 - INFO - __main__ - Step 31037: {'lr': 0.00045399895577800985, 'samples': 5959104, 'steps': 31036, 'loss/train': 1.4852564334869385} -08/30/2021 18:51:55 - INFO - __main__ - Step 31038: {'lr': 0.00045399588812710415, 'samples': 5959296, 'steps': 31037, 'loss/train': 1.8841310739517212} -08/30/2021 18:51:55 - INFO - __main__ - Step 31039: {'lr': 0.0004539928203842809, 'samples': 5959488, 'steps': 31038, 'loss/train': 1.509718894958496} -08/30/2021 18:51:56 - INFO - __main__ - Step 31040: {'lr': 0.0004539897525495418, 'samples': 5959680, 'steps': 31039, 'loss/train': 1.5329985618591309} -08/30/2021 18:51:56 - INFO - __main__ - Step 31041: {'lr': 0.0004539866846228879, 'samples': 5959872, 'steps': 31040, 'loss/train': 0.9507527947425842} -08/30/2021 18:51:56 - INFO - __main__ - Step 31042: {'lr': 0.0004539836166043209, 'samples': 5960064, 'steps': 31041, 'loss/train': 2.8790485858917236} -08/30/2021 18:51:57 - INFO - __main__ - Step 31043: {'lr': 0.00045398054849384197, 'samples': 5960256, 'steps': 31042, 'loss/train': 1.3953723907470703} -08/30/2021 18:51:58 - INFO - __main__ - Step 31044: {'lr': 0.0004539774802914526, 'samples': 5960448, 'steps': 31043, 'loss/train': 0.906587541103363} -08/30/2021 18:51:59 - INFO - __main__ - Step 31045: {'lr': 0.00045397441199715406, 'samples': 5960640, 'steps': 31044, 'loss/train': 1.4648103713989258} -08/30/2021 18:51:59 - INFO - __main__ - Step 31046: {'lr': 0.0004539713436109478, 'samples': 5960832, 'steps': 31045, 'loss/train': 1.0116899013519287} -08/30/2021 18:51:59 - INFO - __main__ - Step 31047: {'lr': 0.0004539682751328352, 'samples': 5961024, 'steps': 31046, 'loss/train': 0.8836275935173035} -08/30/2021 18:52:00 - INFO - __main__ - Step 31048: {'lr': 0.0004539652065628177, 'samples': 5961216, 'steps': 31047, 'loss/train': 1.0747270584106445} -08/30/2021 18:52:01 - INFO - __main__ - Step 31049: {'lr': 0.00045396213790089657, 'samples': 5961408, 'steps': 31048, 'loss/train': 1.699660062789917} -08/30/2021 18:52:02 - INFO - __main__ - Step 31050: {'lr': 0.0004539590691470733, 'samples': 5961600, 'steps': 31049, 'loss/train': 1.7925145626068115} -08/30/2021 18:52:02 - INFO - __main__ - Step 31051: {'lr': 0.0004539560003013492, 'samples': 5961792, 'steps': 31050, 'loss/train': 1.9361777305603027} -08/30/2021 18:52:02 - INFO - __main__ - Step 31052: {'lr': 0.0004539529313637256, 'samples': 5961984, 'steps': 31051, 'loss/train': 0.6117641925811768} -08/30/2021 18:52:03 - INFO - __main__ - Step 31053: {'lr': 0.0004539498623342041, 'samples': 5962176, 'steps': 31052, 'loss/train': 1.6726100444793701} -08/30/2021 18:52:03 - INFO - __main__ - Step 31054: {'lr': 0.0004539467932127858, 'samples': 5962368, 'steps': 31053, 'loss/train': 1.8790496587753296} -08/30/2021 18:52:05 - INFO - __main__ - Step 31055: {'lr': 0.00045394372399947225, 'samples': 5962560, 'steps': 31054, 'loss/train': 1.194793939590454} -08/30/2021 18:52:05 - INFO - __main__ - Step 31056: {'lr': 0.0004539406546942649, 'samples': 5962752, 'steps': 31055, 'loss/train': 1.072791576385498} -08/30/2021 18:52:06 - INFO - __main__ - Step 31057: {'lr': 0.00045393758529716497, 'samples': 5962944, 'steps': 31056, 'loss/train': 1.4414101839065552} -08/30/2021 18:52:06 - INFO - __main__ - Step 31058: {'lr': 0.0004539345158081739, 'samples': 5963136, 'steps': 31057, 'loss/train': 1.4591870307922363} -08/30/2021 18:52:06 - INFO - __main__ - Step 31059: {'lr': 0.0004539314462272931, 'samples': 5963328, 'steps': 31058, 'loss/train': 0.067268967628479} -08/30/2021 18:52:08 - INFO - __main__ - Step 31060: {'lr': 0.0004539283765545239, 'samples': 5963520, 'steps': 31059, 'loss/train': 1.6859824657440186} -08/30/2021 18:52:08 - INFO - __main__ - Step 31061: {'lr': 0.00045392530678986775, 'samples': 5963712, 'steps': 31060, 'loss/train': 1.5808331966400146} -08/30/2021 18:52:09 - INFO - __main__ - Step 31062: {'lr': 0.00045392223693332604, 'samples': 5963904, 'steps': 31061, 'loss/train': 1.3589439392089844} -08/30/2021 18:52:09 - INFO - __main__ - Step 31063: {'lr': 0.0004539191669849001, 'samples': 5964096, 'steps': 31062, 'loss/train': 1.4981449842453003} -08/30/2021 18:52:09 - INFO - __main__ - Step 31064: {'lr': 0.0004539160969445913, 'samples': 5964288, 'steps': 31063, 'loss/train': 1.7644106149673462} -08/30/2021 18:52:11 - INFO - __main__ - Step 31065: {'lr': 0.0004539130268124011, 'samples': 5964480, 'steps': 31064, 'loss/train': 2.0092480182647705} -08/30/2021 18:52:12 - INFO - __main__ - Step 31066: {'lr': 0.0004539099565883308, 'samples': 5964672, 'steps': 31065, 'loss/train': 1.1268682479858398} -08/30/2021 18:52:12 - INFO - __main__ - Step 31067: {'lr': 0.0004539068862723818, 'samples': 5964864, 'steps': 31066, 'loss/train': 1.950039029121399} -08/30/2021 18:52:12 - INFO - __main__ - Step 31068: {'lr': 0.0004539038158645555, 'samples': 5965056, 'steps': 31067, 'loss/train': 1.7845966815948486} -08/30/2021 18:52:13 - INFO - __main__ - Step 31069: {'lr': 0.00045390074536485336, 'samples': 5965248, 'steps': 31068, 'loss/train': 1.6465349197387695} -08/30/2021 18:52:15 - INFO - __main__ - Step 31070: {'lr': 0.00045389767477327657, 'samples': 5965440, 'steps': 31069, 'loss/train': 1.3320573568344116} -08/30/2021 18:52:15 - INFO - __main__ - Step 31071: {'lr': 0.00045389460408982676, 'samples': 5965632, 'steps': 31070, 'loss/train': 1.6265623569488525} -08/30/2021 18:52:15 - INFO - __main__ - Step 31072: {'lr': 0.0004538915333145052, 'samples': 5965824, 'steps': 31071, 'loss/train': 1.2257441282272339} -08/30/2021 18:52:16 - INFO - __main__ - Step 31073: {'lr': 0.00045388846244731314, 'samples': 5966016, 'steps': 31072, 'loss/train': 1.6296617984771729} -08/30/2021 18:52:16 - INFO - __main__ - Step 31074: {'lr': 0.00045388539148825214, 'samples': 5966208, 'steps': 31073, 'loss/train': 0.9754083156585693} -08/30/2021 18:52:18 - INFO - __main__ - Step 31075: {'lr': 0.0004538823204373235, 'samples': 5966400, 'steps': 31074, 'loss/train': 2.2619900703430176} -08/30/2021 18:52:18 - INFO - __main__ - Step 31076: {'lr': 0.00045387924929452873, 'samples': 5966592, 'steps': 31075, 'loss/train': 1.3385144472122192} -08/30/2021 18:52:18 - INFO - __main__ - Step 31077: {'lr': 0.000453876178059869, 'samples': 5966784, 'steps': 31076, 'loss/train': 0.9936423897743225} -08/30/2021 18:52:19 - INFO - __main__ - Step 31078: {'lr': 0.0004538731067333459, 'samples': 5966976, 'steps': 31077, 'loss/train': 1.4712036848068237} -08/30/2021 18:52:19 - INFO - __main__ - Step 31079: {'lr': 0.00045387003531496064, 'samples': 5967168, 'steps': 31078, 'loss/train': 1.9899890422821045} -08/30/2021 18:52:21 - INFO - __main__ - Step 31080: {'lr': 0.00045386696380471473, 'samples': 5967360, 'steps': 31079, 'loss/train': 0.9737958312034607} -08/30/2021 18:52:21 - INFO - __main__ - Step 31081: {'lr': 0.0004538638922026095, 'samples': 5967552, 'steps': 31080, 'loss/train': 1.493228554725647} -08/30/2021 18:52:22 - INFO - __main__ - Step 31082: {'lr': 0.0004538608205086464, 'samples': 5967744, 'steps': 31081, 'loss/train': 1.5865614414215088} -08/30/2021 18:52:22 - INFO - __main__ - Step 31083: {'lr': 0.0004538577487228267, 'samples': 5967936, 'steps': 31082, 'loss/train': 3.5823469161987305} -08/30/2021 18:52:22 - INFO - __main__ - Step 31084: {'lr': 0.00045385467684515193, 'samples': 5968128, 'steps': 31083, 'loss/train': 1.3502602577209473} -08/30/2021 18:52:23 - INFO - __main__ - Step 31085: {'lr': 0.0004538516048756233, 'samples': 5968320, 'steps': 31084, 'loss/train': 1.6726070642471313} -08/30/2021 18:52:24 - INFO - __main__ - Step 31086: {'lr': 0.00045384853281424235, 'samples': 5968512, 'steps': 31085, 'loss/train': 1.6115013360977173} -08/30/2021 18:52:25 - INFO - __main__ - Step 31087: {'lr': 0.0004538454606610103, 'samples': 5968704, 'steps': 31086, 'loss/train': 1.8925801515579224} -08/30/2021 18:52:25 - INFO - __main__ - Step 31088: {'lr': 0.0004538423884159287, 'samples': 5968896, 'steps': 31087, 'loss/train': 1.3612579107284546} -08/30/2021 18:52:25 - INFO - __main__ - Step 31089: {'lr': 0.0004538393160789988, 'samples': 5969088, 'steps': 31088, 'loss/train': 1.130507469177246} -08/30/2021 18:52:26 - INFO - __main__ - Step 31090: {'lr': 0.0004538362436502221, 'samples': 5969280, 'steps': 31089, 'loss/train': 1.4128400087356567} -08/30/2021 18:52:27 - INFO - __main__ - Step 31091: {'lr': 0.00045383317112959997, 'samples': 5969472, 'steps': 31090, 'loss/train': 1.4794267416000366} -08/30/2021 18:52:28 - INFO - __main__ - Step 31092: {'lr': 0.0004538300985171337, 'samples': 5969664, 'steps': 31091, 'loss/train': 0.6922190189361572} -08/30/2021 18:52:28 - INFO - __main__ - Step 31093: {'lr': 0.00045382702581282477, 'samples': 5969856, 'steps': 31092, 'loss/train': 1.3636902570724487} -08/30/2021 18:52:28 - INFO - __main__ - Step 31094: {'lr': 0.0004538239530166745, 'samples': 5970048, 'steps': 31093, 'loss/train': 1.274987816810608} -08/30/2021 18:52:29 - INFO - __main__ - Step 31095: {'lr': 0.0004538208801286843, 'samples': 5970240, 'steps': 31094, 'loss/train': 1.672188401222229} -08/30/2021 18:52:30 - INFO - __main__ - Step 31096: {'lr': 0.0004538178071488556, 'samples': 5970432, 'steps': 31095, 'loss/train': 1.1953009366989136} -08/30/2021 18:52:31 - INFO - __main__ - Step 31097: {'lr': 0.00045381473407718963, 'samples': 5970624, 'steps': 31096, 'loss/train': 0.9305090308189392} -08/30/2021 18:52:31 - INFO - __main__ - Step 31098: {'lr': 0.000453811660913688, 'samples': 5970816, 'steps': 31097, 'loss/train': 1.1199299097061157} -08/30/2021 18:52:31 - INFO - __main__ - Step 31099: {'lr': 0.000453808587658352, 'samples': 5971008, 'steps': 31098, 'loss/train': 1.1736019849777222} -08/30/2021 18:52:32 - INFO - __main__ - Step 31100: {'lr': 0.0004538055143111829, 'samples': 5971200, 'steps': 31099, 'loss/train': 1.5111671686172485} -08/30/2021 18:52:33 - INFO - __main__ - Step 31101: {'lr': 0.00045380244087218224, 'samples': 5971392, 'steps': 31100, 'loss/train': 1.2263879776000977} -08/30/2021 18:52:34 - INFO - __main__ - Step 31102: {'lr': 0.0004537993673413513, 'samples': 5971584, 'steps': 31101, 'loss/train': 1.2177152633666992} -08/30/2021 18:52:34 - INFO - __main__ - Step 31103: {'lr': 0.0004537962937186916, 'samples': 5971776, 'steps': 31102, 'loss/train': 5.836368560791016} -08/30/2021 18:52:35 - INFO - __main__ - Step 31104: {'lr': 0.00045379322000420433, 'samples': 5971968, 'steps': 31103, 'loss/train': 1.0182262659072876} -08/30/2021 18:52:35 - INFO - __main__ - Step 31105: {'lr': 0.00045379014619789106, 'samples': 5972160, 'steps': 31104, 'loss/train': 0.6063989996910095} -08/30/2021 18:52:35 - INFO - __main__ - Step 31106: {'lr': 0.00045378707229975303, 'samples': 5972352, 'steps': 31105, 'loss/train': 1.6027045249938965} -08/30/2021 18:52:37 - INFO - __main__ - Step 31107: {'lr': 0.0004537839983097917, 'samples': 5972544, 'steps': 31106, 'loss/train': 1.9376516342163086} -08/30/2021 18:52:38 - INFO - __main__ - Step 31108: {'lr': 0.0004537809242280085, 'samples': 5972736, 'steps': 31107, 'loss/train': 1.4661369323730469} -08/30/2021 18:52:38 - INFO - __main__ - Step 31109: {'lr': 0.0004537778500544047, 'samples': 5972928, 'steps': 31108, 'loss/train': 1.029530644416809} -08/30/2021 18:52:38 - INFO - __main__ - Step 31110: {'lr': 0.0004537747757889817, 'samples': 5973120, 'steps': 31109, 'loss/train': 0.9133874177932739} -08/30/2021 18:52:39 - INFO - __main__ - Step 31111: {'lr': 0.0004537717014317411, 'samples': 5973312, 'steps': 31110, 'loss/train': 1.3333266973495483} -08/30/2021 18:52:39 - INFO - __main__ - Step 31112: {'lr': 0.00045376862698268393, 'samples': 5973504, 'steps': 31111, 'loss/train': 0.038941286504268646} -08/30/2021 18:52:41 - INFO - __main__ - Step 31113: {'lr': 0.0004537655524418119, 'samples': 5973696, 'steps': 31112, 'loss/train': 1.2564735412597656} -08/30/2021 18:52:41 - INFO - __main__ - Step 31114: {'lr': 0.00045376247780912616, 'samples': 5973888, 'steps': 31113, 'loss/train': 1.5433170795440674} -08/30/2021 18:52:42 - INFO - __main__ - Step 31115: {'lr': 0.00045375940308462826, 'samples': 5974080, 'steps': 31114, 'loss/train': 1.9497753381729126} -08/30/2021 18:52:42 - INFO - __main__ - Step 31116: {'lr': 0.00045375632826831947, 'samples': 5974272, 'steps': 31115, 'loss/train': 1.3061171770095825} -08/30/2021 18:52:42 - INFO - __main__ - Step 31117: {'lr': 0.00045375325336020124, 'samples': 5974464, 'steps': 31116, 'loss/train': 1.7052353620529175} -08/30/2021 18:52:44 - INFO - __main__ - Step 31118: {'lr': 0.000453750178360275, 'samples': 5974656, 'steps': 31117, 'loss/train': 1.971119999885559} -08/30/2021 18:52:45 - INFO - __main__ - Step 31119: {'lr': 0.00045374710326854194, 'samples': 5974848, 'steps': 31118, 'loss/train': 1.877492904663086} -08/30/2021 18:52:45 - INFO - __main__ - Step 31120: {'lr': 0.0004537440280850037, 'samples': 5975040, 'steps': 31119, 'loss/train': 1.414506435394287} -08/30/2021 18:52:46 - INFO - __main__ - Step 31121: {'lr': 0.00045374095280966147, 'samples': 5975232, 'steps': 31120, 'loss/train': 1.2564905881881714} -08/30/2021 18:52:46 - INFO - __main__ - Step 31122: {'lr': 0.00045373787744251677, 'samples': 5975424, 'steps': 31121, 'loss/train': 1.7289631366729736} -08/30/2021 18:52:48 - INFO - __main__ - Step 31123: {'lr': 0.0004537348019835709, 'samples': 5975616, 'steps': 31122, 'loss/train': 2.0682358741760254} -08/30/2021 18:52:48 - INFO - __main__ - Step 31124: {'lr': 0.0004537317264328252, 'samples': 5975808, 'steps': 31123, 'loss/train': 1.8440382480621338} -08/30/2021 18:52:49 - INFO - __main__ - Step 31125: {'lr': 0.00045372865079028123, 'samples': 5976000, 'steps': 31124, 'loss/train': 1.3663311004638672} -08/30/2021 18:52:49 - INFO - __main__ - Step 31126: {'lr': 0.00045372557505594024, 'samples': 5976192, 'steps': 31125, 'loss/train': 1.004639744758606} -08/30/2021 18:52:49 - INFO - __main__ - Step 31127: {'lr': 0.0004537224992298037, 'samples': 5976384, 'steps': 31126, 'loss/train': 1.444261908531189} -08/30/2021 18:52:51 - INFO - __main__ - Step 31128: {'lr': 0.00045371942331187286, 'samples': 5976576, 'steps': 31127, 'loss/train': 1.231874704360962} -08/30/2021 18:52:52 - INFO - __main__ - Step 31129: {'lr': 0.00045371634730214923, 'samples': 5976768, 'steps': 31128, 'loss/train': 1.3735706806182861} -08/30/2021 18:52:52 - INFO - __main__ - Step 31130: {'lr': 0.00045371327120063417, 'samples': 5976960, 'steps': 31129, 'loss/train': 1.311033844947815} -08/30/2021 18:52:52 - INFO - __main__ - Step 31131: {'lr': 0.00045371019500732904, 'samples': 5977152, 'steps': 31130, 'loss/train': 1.4586528539657593} -08/30/2021 18:52:53 - INFO - __main__ - Step 31132: {'lr': 0.00045370711872223525, 'samples': 5977344, 'steps': 31131, 'loss/train': 1.6951950788497925} -08/30/2021 18:52:54 - INFO - __main__ - Step 31133: {'lr': 0.00045370404234535414, 'samples': 5977536, 'steps': 31132, 'loss/train': 1.6540215015411377} -08/30/2021 18:52:55 - INFO - __main__ - Step 31134: {'lr': 0.00045370096587668714, 'samples': 5977728, 'steps': 31133, 'loss/train': 1.3159565925598145} -08/30/2021 18:52:55 - INFO - __main__ - Step 31135: {'lr': 0.0004536978893162357, 'samples': 5977920, 'steps': 31134, 'loss/train': 1.6009652614593506} -08/30/2021 18:52:56 - INFO - __main__ - Step 31136: {'lr': 0.000453694812664001, 'samples': 5978112, 'steps': 31135, 'loss/train': 0.08150231093168259} -08/30/2021 18:52:56 - INFO - __main__ - Step 31137: {'lr': 0.00045369173591998466, 'samples': 5978304, 'steps': 31136, 'loss/train': 1.1977040767669678} -08/30/2021 18:52:58 - INFO - __main__ - Step 31138: {'lr': 0.00045368865908418794, 'samples': 5978496, 'steps': 31137, 'loss/train': 1.5556244850158691} -08/30/2021 18:52:58 - INFO - __main__ - Step 31139: {'lr': 0.00045368558215661225, 'samples': 5978688, 'steps': 31138, 'loss/train': 0.7230245471000671} -08/30/2021 18:52:58 - INFO - __main__ - Step 31140: {'lr': 0.00045368250513725896, 'samples': 5978880, 'steps': 31139, 'loss/train': 1.637417197227478} -08/30/2021 18:52:59 - INFO - __main__ - Step 31141: {'lr': 0.00045367942802612953, 'samples': 5979072, 'steps': 31140, 'loss/train': 1.6077171564102173} -08/30/2021 18:52:59 - INFO - __main__ - Step 31142: {'lr': 0.0004536763508232252, 'samples': 5979264, 'steps': 31141, 'loss/train': 1.339439034461975} -08/30/2021 18:52:59 - INFO - __main__ - Step 31143: {'lr': 0.0004536732735285476, 'samples': 5979456, 'steps': 31142, 'loss/train': 5.863194465637207} -08/30/2021 18:53:01 - INFO - __main__ - Step 31144: {'lr': 0.00045367019614209783, 'samples': 5979648, 'steps': 31143, 'loss/train': 1.6931700706481934} -08/30/2021 18:53:02 - INFO - __main__ - Step 31145: {'lr': 0.0004536671186638775, 'samples': 5979840, 'steps': 31144, 'loss/train': 0.042302314192056656} -08/30/2021 18:53:02 - INFO - __main__ - Step 31146: {'lr': 0.0004536640410938879, 'samples': 5980032, 'steps': 31145, 'loss/train': 0.03146910294890404} -08/30/2021 18:53:02 - INFO - __main__ - Step 31147: {'lr': 0.00045366096343213034, 'samples': 5980224, 'steps': 31146, 'loss/train': 2.091280698776245} -08/30/2021 18:53:03 - INFO - __main__ - Step 31148: {'lr': 0.0004536578856786064, 'samples': 5980416, 'steps': 31147, 'loss/train': 0.04584484174847603} -08/30/2021 18:53:03 - INFO - __main__ - Step 31149: {'lr': 0.0004536548078333172, 'samples': 5980608, 'steps': 31148, 'loss/train': 1.5256032943725586} -08/30/2021 18:53:05 - INFO - __main__ - Step 31150: {'lr': 0.0004536517298962645, 'samples': 5980800, 'steps': 31149, 'loss/train': 1.3211700916290283} -08/30/2021 18:53:05 - INFO - __main__ - Step 31151: {'lr': 0.00045364865186744936, 'samples': 5980992, 'steps': 31150, 'loss/train': 1.3922449350357056} -08/30/2021 18:53:06 - INFO - __main__ - Step 31152: {'lr': 0.0004536455737468733, 'samples': 5981184, 'steps': 31151, 'loss/train': 1.3153488636016846} -08/30/2021 18:53:06 - INFO - __main__ - Step 31153: {'lr': 0.00045364249553453764, 'samples': 5981376, 'steps': 31152, 'loss/train': 1.6068469285964966} -08/30/2021 18:53:06 - INFO - __main__ - Step 31154: {'lr': 0.00045363941723044386, 'samples': 5981568, 'steps': 31153, 'loss/train': 0.43992772698402405} -08/30/2021 18:53:08 - INFO - __main__ - Step 31155: {'lr': 0.0004536363388345933, 'samples': 5981760, 'steps': 31154, 'loss/train': 0.6110499501228333} -08/30/2021 18:53:08 - INFO - __main__ - Step 31156: {'lr': 0.0004536332603469873, 'samples': 5981952, 'steps': 31155, 'loss/train': 2.086655378341675} -08/30/2021 18:53:09 - INFO - __main__ - Step 31157: {'lr': 0.0004536301817676274, 'samples': 5982144, 'steps': 31156, 'loss/train': 1.5639941692352295} -08/30/2021 18:53:09 - INFO - __main__ - Step 31158: {'lr': 0.0004536271030965148, 'samples': 5982336, 'steps': 31157, 'loss/train': 1.645655632019043} -08/30/2021 18:53:09 - INFO - __main__ - Step 31159: {'lr': 0.00045362402433365094, 'samples': 5982528, 'steps': 31158, 'loss/train': 0.9686564207077026} -08/30/2021 18:53:11 - INFO - __main__ - Step 31160: {'lr': 0.0004536209454790373, 'samples': 5982720, 'steps': 31159, 'loss/train': 1.864017367362976} -08/30/2021 18:53:12 - INFO - __main__ - Step 31161: {'lr': 0.00045361786653267517, 'samples': 5982912, 'steps': 31160, 'loss/train': 0.12420680373907089} -08/30/2021 18:53:12 - INFO - __main__ - Step 31162: {'lr': 0.00045361478749456595, 'samples': 5983104, 'steps': 31161, 'loss/train': 3.0237133502960205} -08/30/2021 18:53:12 - INFO - __main__ - Step 31163: {'lr': 0.0004536117083647111, 'samples': 5983296, 'steps': 31162, 'loss/train': 1.8580105304718018} -08/30/2021 18:53:13 - INFO - __main__ - Step 31164: {'lr': 0.00045360862914311194, 'samples': 5983488, 'steps': 31163, 'loss/train': 1.566408634185791} -08/30/2021 18:53:13 - INFO - __main__ - Step 31165: {'lr': 0.0004536055498297699, 'samples': 5983680, 'steps': 31164, 'loss/train': 1.535684585571289} -08/30/2021 18:53:15 - INFO - __main__ - Step 31166: {'lr': 0.00045360247042468635, 'samples': 5983872, 'steps': 31165, 'loss/train': 1.7129974365234375} -08/30/2021 18:53:15 - INFO - __main__ - Step 31167: {'lr': 0.0004535993909278626, 'samples': 5984064, 'steps': 31166, 'loss/train': 0.8563997149467468} -08/30/2021 18:53:16 - INFO - __main__ - Step 31168: {'lr': 0.00045359631133930016, 'samples': 5984256, 'steps': 31167, 'loss/train': 0.9915846586227417} -08/30/2021 18:53:16 - INFO - __main__ - Step 31169: {'lr': 0.0004535932316590003, 'samples': 5984448, 'steps': 31168, 'loss/train': 1.1800521612167358} -08/30/2021 18:53:16 - INFO - __main__ - Step 31170: {'lr': 0.00045359015188696457, 'samples': 5984640, 'steps': 31169, 'loss/train': 1.218472957611084} -08/30/2021 18:53:18 - INFO - __main__ - Step 31171: {'lr': 0.00045358707202319414, 'samples': 5984832, 'steps': 31170, 'loss/train': 0.2905478775501251} -08/30/2021 18:53:18 - INFO - __main__ - Step 31172: {'lr': 0.0004535839920676906, 'samples': 5985024, 'steps': 31171, 'loss/train': 1.4037226438522339} -08/30/2021 18:53:19 - INFO - __main__ - Step 31173: {'lr': 0.0004535809120204553, 'samples': 5985216, 'steps': 31172, 'loss/train': 1.6890603303909302} -08/30/2021 18:53:19 - INFO - __main__ - Step 31174: {'lr': 0.0004535778318814895, 'samples': 5985408, 'steps': 31173, 'loss/train': 2.3607726097106934} -08/30/2021 18:53:19 - INFO - __main__ - Step 31175: {'lr': 0.0004535747516507947, 'samples': 5985600, 'steps': 31174, 'loss/train': 1.3518590927124023} -08/30/2021 18:53:21 - INFO - __main__ - Step 31176: {'lr': 0.00045357167132837223, 'samples': 5985792, 'steps': 31175, 'loss/train': 1.698056697845459} -08/30/2021 18:53:22 - INFO - __main__ - Step 31177: {'lr': 0.00045356859091422354, 'samples': 5985984, 'steps': 31176, 'loss/train': 1.3519233465194702} -08/30/2021 18:53:22 - INFO - __main__ - Step 31178: {'lr': 0.00045356551040835, 'samples': 5986176, 'steps': 31177, 'loss/train': 1.9519325494766235} -08/30/2021 18:53:23 - INFO - __main__ - Step 31179: {'lr': 0.0004535624298107529, 'samples': 5986368, 'steps': 31178, 'loss/train': 0.7612841129302979} -08/30/2021 18:53:23 - INFO - __main__ - Step 31180: {'lr': 0.00045355934912143383, 'samples': 5986560, 'steps': 31179, 'loss/train': 1.4055265188217163} -08/30/2021 18:53:25 - INFO - __main__ - Step 31181: {'lr': 0.00045355626834039394, 'samples': 5986752, 'steps': 31180, 'loss/train': 1.1429792642593384} -08/30/2021 18:53:25 - INFO - __main__ - Step 31182: {'lr': 0.00045355318746763477, 'samples': 5986944, 'steps': 31181, 'loss/train': 1.7932724952697754} -08/30/2021 18:53:25 - INFO - __main__ - Step 31183: {'lr': 0.0004535501065031577, 'samples': 5987136, 'steps': 31182, 'loss/train': 1.4591612815856934} -08/30/2021 18:53:26 - INFO - __main__ - Step 31184: {'lr': 0.0004535470254469641, 'samples': 5987328, 'steps': 31183, 'loss/train': 1.613660216331482} -08/30/2021 18:53:26 - INFO - __main__ - Step 31185: {'lr': 0.00045354394429905534, 'samples': 5987520, 'steps': 31184, 'loss/train': 1.0812500715255737} -08/30/2021 18:53:26 - INFO - __main__ - Step 31186: {'lr': 0.0004535408630594328, 'samples': 5987712, 'steps': 31185, 'loss/train': 1.4802604913711548} -08/30/2021 18:53:28 - INFO - __main__ - Step 31187: {'lr': 0.0004535377817280979, 'samples': 5987904, 'steps': 31186, 'loss/train': 1.2999248504638672} -08/30/2021 18:53:29 - INFO - __main__ - Step 31188: {'lr': 0.0004535347003050521, 'samples': 5988096, 'steps': 31187, 'loss/train': 1.9061965942382812} -08/30/2021 18:53:29 - INFO - __main__ - Step 31189: {'lr': 0.0004535316187902966, 'samples': 5988288, 'steps': 31188, 'loss/train': 1.8329979181289673} -08/30/2021 18:53:29 - INFO - __main__ - Step 31190: {'lr': 0.00045352853718383287, 'samples': 5988480, 'steps': 31189, 'loss/train': 1.17955482006073} -08/30/2021 18:53:30 - INFO - __main__ - Step 31191: {'lr': 0.00045352545548566235, 'samples': 5988672, 'steps': 31190, 'loss/train': 0.9641557931900024} -08/30/2021 18:53:31 - INFO - __main__ - Step 31192: {'lr': 0.00045352237369578643, 'samples': 5988864, 'steps': 31191, 'loss/train': 1.7571990489959717} -08/30/2021 18:53:32 - INFO - __main__ - Step 31193: {'lr': 0.00045351929181420647, 'samples': 5989056, 'steps': 31192, 'loss/train': 1.1081897020339966} -08/30/2021 18:53:32 - INFO - __main__ - Step 31194: {'lr': 0.0004535162098409238, 'samples': 5989248, 'steps': 31193, 'loss/train': 1.587311029434204} -08/30/2021 18:53:32 - INFO - __main__ - Step 31195: {'lr': 0.00045351312777593995, 'samples': 5989440, 'steps': 31194, 'loss/train': 1.9999451637268066} -08/30/2021 18:53:33 - INFO - __main__ - Step 31196: {'lr': 0.0004535100456192562, 'samples': 5989632, 'steps': 31195, 'loss/train': 1.288652777671814} -08/30/2021 18:53:34 - INFO - __main__ - Step 31197: {'lr': 0.00045350696337087396, 'samples': 5989824, 'steps': 31196, 'loss/train': 2.101027250289917} -08/30/2021 18:53:35 - INFO - __main__ - Step 31198: {'lr': 0.0004535038810307946, 'samples': 5990016, 'steps': 31197, 'loss/train': 1.3536226749420166} -08/30/2021 18:53:35 - INFO - __main__ - Step 31199: {'lr': 0.00045350079859901956, 'samples': 5990208, 'steps': 31198, 'loss/train': 0.947283148765564} -08/30/2021 18:53:35 - INFO - __main__ - Step 31200: {'lr': 0.00045349771607555017, 'samples': 5990400, 'steps': 31199, 'loss/train': 1.8714150190353394} -08/30/2021 18:53:36 - INFO - __main__ - Step 31201: {'lr': 0.0004534946334603879, 'samples': 5990592, 'steps': 31200, 'loss/train': 1.0475910902023315} -08/30/2021 18:53:37 - INFO - __main__ - Step 31202: {'lr': 0.000453491550753534, 'samples': 5990784, 'steps': 31201, 'loss/train': 1.507918119430542} -08/30/2021 18:53:38 - INFO - __main__ - Step 31203: {'lr': 0.00045348846795499, 'samples': 5990976, 'steps': 31202, 'loss/train': 1.7241178750991821} -08/30/2021 18:53:38 - INFO - __main__ - Step 31204: {'lr': 0.0004534853850647572, 'samples': 5991168, 'steps': 31203, 'loss/train': 1.460509181022644} -08/30/2021 18:53:39 - INFO - __main__ - Step 31205: {'lr': 0.00045348230208283716, 'samples': 5991360, 'steps': 31204, 'loss/train': 1.3862348794937134} -08/30/2021 18:53:39 - INFO - __main__ - Step 31206: {'lr': 0.000453479219009231, 'samples': 5991552, 'steps': 31205, 'loss/train': 1.6321722269058228} -08/30/2021 18:53:40 - INFO - __main__ - Step 31207: {'lr': 0.00045347613584394034, 'samples': 5991744, 'steps': 31206, 'loss/train': 0.8021978139877319} -08/30/2021 18:53:41 - INFO - __main__ - Step 31208: {'lr': 0.0004534730525869664, 'samples': 5991936, 'steps': 31207, 'loss/train': 1.1721975803375244} -08/30/2021 18:53:41 - INFO - __main__ - Step 31209: {'lr': 0.0004534699692383106, 'samples': 5992128, 'steps': 31208, 'loss/train': 0.846610963344574} -08/30/2021 18:53:42 - INFO - __main__ - Step 31210: {'lr': 0.00045346688579797444, 'samples': 5992320, 'steps': 31209, 'loss/train': 0.8035076856613159} -08/30/2021 18:53:42 - INFO - __main__ - Step 31211: {'lr': 0.0004534638022659592, 'samples': 5992512, 'steps': 31210, 'loss/train': 1.509392499923706} -08/30/2021 18:53:43 - INFO - __main__ - Step 31212: {'lr': 0.00045346071864226634, 'samples': 5992704, 'steps': 31211, 'loss/train': 1.76493239402771} -08/30/2021 18:53:44 - INFO - __main__ - Step 31213: {'lr': 0.0004534576349268973, 'samples': 5992896, 'steps': 31212, 'loss/train': 1.8032407760620117} -08/30/2021 18:53:44 - INFO - __main__ - Step 31214: {'lr': 0.00045345455111985326, 'samples': 5993088, 'steps': 31213, 'loss/train': 1.8356369733810425} -08/30/2021 18:53:44 - INFO - __main__ - Step 31215: {'lr': 0.0004534514672211358, 'samples': 5993280, 'steps': 31214, 'loss/train': 1.2564467191696167} -08/30/2021 18:53:45 - INFO - __main__ - Step 31216: {'lr': 0.0004534483832307462, 'samples': 5993472, 'steps': 31215, 'loss/train': 1.5392696857452393} -08/30/2021 18:53:46 - INFO - __main__ - Step 31217: {'lr': 0.00045344529914868593, 'samples': 5993664, 'steps': 31216, 'loss/train': 1.8809454441070557} -08/30/2021 18:53:47 - INFO - __main__ - Step 31218: {'lr': 0.0004534422149749564, 'samples': 5993856, 'steps': 31217, 'loss/train': 1.578195333480835} -08/30/2021 18:53:47 - INFO - __main__ - Step 31219: {'lr': 0.0004534391307095589, 'samples': 5994048, 'steps': 31218, 'loss/train': 1.394371509552002} -08/30/2021 18:53:47 - INFO - __main__ - Step 31220: {'lr': 0.0004534360463524948, 'samples': 5994240, 'steps': 31219, 'loss/train': 0.3241921663284302} -08/30/2021 18:53:48 - INFO - __main__ - Step 31221: {'lr': 0.00045343296190376566, 'samples': 5994432, 'steps': 31220, 'loss/train': 1.0528323650360107} -08/30/2021 18:53:48 - INFO - __main__ - Step 31222: {'lr': 0.0004534298773633727, 'samples': 5994624, 'steps': 31221, 'loss/train': 1.6575772762298584} -08/30/2021 18:53:50 - INFO - __main__ - Step 31223: {'lr': 0.00045342679273131743, 'samples': 5994816, 'steps': 31222, 'loss/train': 1.2128381729125977} -08/30/2021 18:53:50 - INFO - __main__ - Step 31224: {'lr': 0.0004534237080076011, 'samples': 5995008, 'steps': 31223, 'loss/train': 1.5789028406143188} -08/30/2021 18:53:51 - INFO - __main__ - Step 31225: {'lr': 0.0004534206231922253, 'samples': 5995200, 'steps': 31224, 'loss/train': 1.637815237045288} -08/30/2021 18:53:51 - INFO - __main__ - Step 31226: {'lr': 0.0004534175382851913, 'samples': 5995392, 'steps': 31225, 'loss/train': 0.10047882050275803} -08/30/2021 18:53:52 - INFO - __main__ - Step 31227: {'lr': 0.0004534144532865004, 'samples': 5995584, 'steps': 31226, 'loss/train': 1.4280861616134644} -08/30/2021 18:53:53 - INFO - __main__ - Step 31228: {'lr': 0.00045341136819615415, 'samples': 5995776, 'steps': 31227, 'loss/train': 1.901550531387329} -08/30/2021 18:53:53 - INFO - __main__ - Step 31229: {'lr': 0.0004534082830141538, 'samples': 5995968, 'steps': 31228, 'loss/train': 1.124707818031311} -08/30/2021 18:53:54 - INFO - __main__ - Step 31230: {'lr': 0.00045340519774050093, 'samples': 5996160, 'steps': 31229, 'loss/train': 1.548142671585083} -08/30/2021 18:53:54 - INFO - __main__ - Step 31231: {'lr': 0.0004534021123751968, 'samples': 5996352, 'steps': 31230, 'loss/train': 1.187740683555603} -08/30/2021 18:53:54 - INFO - __main__ - Step 31232: {'lr': 0.00045339902691824275, 'samples': 5996544, 'steps': 31231, 'loss/train': 0.921841561794281} -08/30/2021 18:53:57 - INFO - __main__ - Step 31233: {'lr': 0.0004533959413696402, 'samples': 5996736, 'steps': 31232, 'loss/train': 1.111497163772583} -08/30/2021 18:53:57 - INFO - __main__ - Step 31234: {'lr': 0.0004533928557293907, 'samples': 5996928, 'steps': 31233, 'loss/train': 1.761494755744934} -08/30/2021 18:53:57 - INFO - __main__ - Step 31235: {'lr': 0.00045338976999749546, 'samples': 5997120, 'steps': 31234, 'loss/train': 5.979400157928467} -08/30/2021 18:53:58 - INFO - __main__ - Step 31236: {'lr': 0.00045338668417395595, 'samples': 5997312, 'steps': 31235, 'loss/train': 1.8501466512680054} -08/30/2021 18:53:58 - INFO - __main__ - Step 31237: {'lr': 0.0004533835982587735, 'samples': 5997504, 'steps': 31236, 'loss/train': 1.6291043758392334} -08/30/2021 18:54:00 - INFO - __main__ - Step 31238: {'lr': 0.00045338051225194954, 'samples': 5997696, 'steps': 31237, 'loss/train': 0.855450451374054} -08/30/2021 18:54:00 - INFO - __main__ - Step 31239: {'lr': 0.0004533774261534855, 'samples': 5997888, 'steps': 31238, 'loss/train': 1.2634632587432861} -08/30/2021 18:54:01 - INFO - __main__ - Step 31240: {'lr': 0.00045337433996338274, 'samples': 5998080, 'steps': 31239, 'loss/train': 1.4583642482757568} -08/30/2021 18:54:01 - INFO - __main__ - Step 31241: {'lr': 0.0004533712536816426, 'samples': 5998272, 'steps': 31240, 'loss/train': 1.8149352073669434} -08/30/2021 18:54:01 - INFO - __main__ - Step 31242: {'lr': 0.0004533681673082665, 'samples': 5998464, 'steps': 31241, 'loss/train': 1.7026433944702148} -08/30/2021 18:54:03 - INFO - __main__ - Step 31243: {'lr': 0.00045336508084325587, 'samples': 5998656, 'steps': 31242, 'loss/train': 1.615867018699646} -08/30/2021 18:54:04 - INFO - __main__ - Step 31244: {'lr': 0.0004533619942866121, 'samples': 5998848, 'steps': 31243, 'loss/train': 2.039458990097046} -08/30/2021 18:54:04 - INFO - __main__ - Step 31245: {'lr': 0.00045335890763833646, 'samples': 5999040, 'steps': 31244, 'loss/train': 1.0180801153182983} -08/30/2021 18:54:04 - INFO - __main__ - Step 31246: {'lr': 0.0004533558208984305, 'samples': 5999232, 'steps': 31245, 'loss/train': 0.043132055550813675} -08/30/2021 18:54:05 - INFO - __main__ - Step 31247: {'lr': 0.0004533527340668956, 'samples': 5999424, 'steps': 31246, 'loss/train': 1.7107980251312256} -08/30/2021 18:54:05 - INFO - __main__ - Step 31248: {'lr': 0.000453349647143733, 'samples': 5999616, 'steps': 31247, 'loss/train': 1.1968151330947876} -08/30/2021 18:54:07 - INFO - __main__ - Step 31249: {'lr': 0.00045334656012894424, 'samples': 5999808, 'steps': 31248, 'loss/train': 1.3520599603652954} -08/30/2021 18:54:07 - INFO - __main__ - Step 31250: {'lr': 0.00045334347302253064, 'samples': 6000000, 'steps': 31249, 'loss/train': 1.1168391704559326} -08/30/2021 18:54:07 - INFO - __main__ - Step 31251: {'lr': 0.00045334038582449355, 'samples': 6000192, 'steps': 31250, 'loss/train': 1.3352669477462769} -08/30/2021 18:54:08 - INFO - __main__ - Step 31252: {'lr': 0.0004533372985348345, 'samples': 6000384, 'steps': 31251, 'loss/train': 1.621696949005127} -08/30/2021 18:54:08 - INFO - __main__ - Step 31253: {'lr': 0.00045333421115355477, 'samples': 6000576, 'steps': 31252, 'loss/train': 1.339316487312317} -08/30/2021 18:54:08 - INFO - __main__ - Step 31254: {'lr': 0.00045333112368065585, 'samples': 6000768, 'steps': 31253, 'loss/train': 1.694393515586853} -08/30/2021 18:54:10 - INFO - __main__ - Step 31255: {'lr': 0.00045332803611613896, 'samples': 6000960, 'steps': 31254, 'loss/train': 0.0778266042470932} -08/30/2021 18:54:10 - INFO - __main__ - Step 31256: {'lr': 0.00045332494846000564, 'samples': 6001152, 'steps': 31255, 'loss/train': 1.0283511877059937} -08/30/2021 18:54:11 - INFO - __main__ - Step 31257: {'lr': 0.00045332186071225724, 'samples': 6001344, 'steps': 31256, 'loss/train': 1.4047452211380005} -08/30/2021 18:54:11 - INFO - __main__ - Step 31258: {'lr': 0.00045331877287289516, 'samples': 6001536, 'steps': 31257, 'loss/train': 1.6048741340637207} -08/30/2021 18:54:11 - INFO - __main__ - Step 31259: {'lr': 0.00045331568494192076, 'samples': 6001728, 'steps': 31258, 'loss/train': 0.8484418392181396} -08/30/2021 18:54:13 - INFO - __main__ - Step 31260: {'lr': 0.00045331259691933545, 'samples': 6001920, 'steps': 31259, 'loss/train': 6.402412414550781} -08/30/2021 18:54:13 - INFO - __main__ - Step 31261: {'lr': 0.00045330950880514065, 'samples': 6002112, 'steps': 31260, 'loss/train': 1.2930322885513306} -08/30/2021 18:54:14 - INFO - __main__ - Step 31262: {'lr': 0.0004533064205993377, 'samples': 6002304, 'steps': 31261, 'loss/train': 1.5986852645874023} -08/30/2021 18:54:14 - INFO - __main__ - Step 31263: {'lr': 0.000453303332301928, 'samples': 6002496, 'steps': 31262, 'loss/train': 1.3185456991195679} -08/30/2021 18:54:14 - INFO - __main__ - Step 31264: {'lr': 0.00045330024391291294, 'samples': 6002688, 'steps': 31263, 'loss/train': 1.3373768329620361} -08/30/2021 18:54:16 - INFO - __main__ - Step 31265: {'lr': 0.00045329715543229396, 'samples': 6002880, 'steps': 31264, 'loss/train': 1.2572249174118042} -08/30/2021 18:54:16 - INFO - __main__ - Step 31266: {'lr': 0.0004532940668600724, 'samples': 6003072, 'steps': 31265, 'loss/train': 1.8223615884780884} -08/30/2021 18:54:17 - INFO - __main__ - Step 31267: {'lr': 0.00045329097819624966, 'samples': 6003264, 'steps': 31266, 'loss/train': 1.4032493829727173} -08/30/2021 18:54:17 - INFO - __main__ - Step 31268: {'lr': 0.00045328788944082717, 'samples': 6003456, 'steps': 31267, 'loss/train': 1.6533368825912476} -08/30/2021 18:54:17 - INFO - __main__ - Step 31269: {'lr': 0.0004532848005938063, 'samples': 6003648, 'steps': 31268, 'loss/train': 1.693549394607544} -08/30/2021 18:54:19 - INFO - __main__ - Step 31270: {'lr': 0.0004532817116551884, 'samples': 6003840, 'steps': 31269, 'loss/train': 1.7190295457839966} -08/30/2021 18:54:20 - INFO - __main__ - Step 31271: {'lr': 0.00045327862262497495, 'samples': 6004032, 'steps': 31270, 'loss/train': 1.8468612432479858} -08/30/2021 18:54:20 - INFO - __main__ - Step 31272: {'lr': 0.00045327553350316726, 'samples': 6004224, 'steps': 31271, 'loss/train': 0.09141149371862411} -08/30/2021 18:54:20 - INFO - __main__ - Step 31273: {'lr': 0.00045327244428976677, 'samples': 6004416, 'steps': 31272, 'loss/train': 1.839314579963684} -08/30/2021 18:54:21 - INFO - __main__ - Step 31274: {'lr': 0.00045326935498477477, 'samples': 6004608, 'steps': 31273, 'loss/train': 1.3692504167556763} -08/30/2021 18:54:22 - INFO - __main__ - Step 31275: {'lr': 0.00045326626558819284, 'samples': 6004800, 'steps': 31274, 'loss/train': 1.6184078454971313} -08/30/2021 18:54:23 - INFO - __main__ - Step 31276: {'lr': 0.00045326317610002223, 'samples': 6004992, 'steps': 31275, 'loss/train': 1.3882378339767456} -08/30/2021 18:54:23 - INFO - __main__ - Step 31277: {'lr': 0.00045326008652026435, 'samples': 6005184, 'steps': 31276, 'loss/train': 1.4430707693099976} -08/30/2021 18:54:24 - INFO - __main__ - Step 31278: {'lr': 0.00045325699684892065, 'samples': 6005376, 'steps': 31277, 'loss/train': 1.4224860668182373} -08/30/2021 18:54:24 - INFO - __main__ - Step 31279: {'lr': 0.00045325390708599245, 'samples': 6005568, 'steps': 31278, 'loss/train': 1.0058977603912354} -08/30/2021 18:54:26 - INFO - __main__ - Step 31280: {'lr': 0.0004532508172314812, 'samples': 6005760, 'steps': 31279, 'loss/train': 1.684635043144226} -08/30/2021 18:54:26 - INFO - __main__ - Step 31281: {'lr': 0.0004532477272853882, 'samples': 6005952, 'steps': 31280, 'loss/train': 1.741889476776123} -08/30/2021 18:54:26 - INFO - __main__ - Step 31282: {'lr': 0.000453244637247715, 'samples': 6006144, 'steps': 31281, 'loss/train': 1.5113399028778076} -08/30/2021 18:54:27 - INFO - __main__ - Step 31283: {'lr': 0.0004532415471184629, 'samples': 6006336, 'steps': 31282, 'loss/train': 1.4530400037765503} -08/30/2021 18:54:27 - INFO - __main__ - Step 31284: {'lr': 0.0004532384568976332, 'samples': 6006528, 'steps': 31283, 'loss/train': 0.9999569654464722} -08/30/2021 18:54:27 - INFO - __main__ - Step 31285: {'lr': 0.00045323536658522747, 'samples': 6006720, 'steps': 31284, 'loss/train': 0.04194250330328941} -08/30/2021 18:54:29 - INFO - __main__ - Step 31286: {'lr': 0.00045323227618124695, 'samples': 6006912, 'steps': 31285, 'loss/train': 1.6435213088989258} -08/30/2021 18:54:30 - INFO - __main__ - Step 31287: {'lr': 0.00045322918568569315, 'samples': 6007104, 'steps': 31286, 'loss/train': 0.9105099439620972} -08/30/2021 18:54:30 - INFO - __main__ - Step 31288: {'lr': 0.0004532260950985675, 'samples': 6007296, 'steps': 31287, 'loss/train': 1.2265020608901978} -08/30/2021 18:54:31 - INFO - __main__ - Step 31289: {'lr': 0.0004532230044198712, 'samples': 6007488, 'steps': 31288, 'loss/train': 1.3852030038833618} -08/30/2021 18:54:31 - INFO - __main__ - Step 31290: {'lr': 0.00045321991364960577, 'samples': 6007680, 'steps': 31289, 'loss/train': 1.4569660425186157} -08/30/2021 18:54:33 - INFO - __main__ - Step 31291: {'lr': 0.00045321682278777253, 'samples': 6007872, 'steps': 31290, 'loss/train': 1.7157217264175415} -08/30/2021 18:54:33 - INFO - __main__ - Step 31292: {'lr': 0.00045321373183437305, 'samples': 6008064, 'steps': 31291, 'loss/train': 1.6974905729293823} -08/30/2021 18:54:34 - INFO - __main__ - Step 31293: {'lr': 0.0004532106407894085, 'samples': 6008256, 'steps': 31292, 'loss/train': 1.9059391021728516} -08/30/2021 18:54:34 - INFO - __main__ - Step 31294: {'lr': 0.0004532075496528804, 'samples': 6008448, 'steps': 31293, 'loss/train': 2.8428099155426025} -08/30/2021 18:54:34 - INFO - __main__ - Step 31295: {'lr': 0.0004532044584247901, 'samples': 6008640, 'steps': 31294, 'loss/train': 1.1328047513961792} -08/30/2021 18:54:36 - INFO - __main__ - Step 31296: {'lr': 0.00045320136710513907, 'samples': 6008832, 'steps': 31295, 'loss/train': 1.3786119222640991} -08/30/2021 18:54:36 - INFO - __main__ - Step 31297: {'lr': 0.00045319827569392855, 'samples': 6009024, 'steps': 31296, 'loss/train': 1.9237794876098633} -08/30/2021 18:54:37 - INFO - __main__ - Step 31298: {'lr': 0.00045319518419116014, 'samples': 6009216, 'steps': 31297, 'loss/train': 1.0042014122009277} -08/30/2021 18:54:37 - INFO - __main__ - Step 31299: {'lr': 0.00045319209259683503, 'samples': 6009408, 'steps': 31298, 'loss/train': 3.9404237270355225} -08/30/2021 18:54:37 - INFO - __main__ - Step 31300: {'lr': 0.0004531890009109547, 'samples': 6009600, 'steps': 31299, 'loss/train': 0.8712418079376221} -08/30/2021 18:54:38 - INFO - __main__ - Step 31301: {'lr': 0.0004531859091335205, 'samples': 6009792, 'steps': 31300, 'loss/train': 1.7124570608139038} -08/30/2021 18:54:39 - INFO - __main__ - Step 31302: {'lr': 0.00045318281726453393, 'samples': 6009984, 'steps': 31301, 'loss/train': 1.4082034826278687} -08/30/2021 18:54:40 - INFO - __main__ - Step 31303: {'lr': 0.00045317972530399634, 'samples': 6010176, 'steps': 31302, 'loss/train': 1.479798674583435} -08/30/2021 18:54:40 - INFO - __main__ - Step 31304: {'lr': 0.00045317663325190904, 'samples': 6010368, 'steps': 31303, 'loss/train': 0.6503819823265076} -08/30/2021 18:54:40 - INFO - __main__ - Step 31305: {'lr': 0.00045317354110827344, 'samples': 6010560, 'steps': 31304, 'loss/train': 1.4694414138793945} -08/30/2021 18:54:41 - INFO - __main__ - Step 31306: {'lr': 0.0004531704488730911, 'samples': 6010752, 'steps': 31305, 'loss/train': 1.2119567394256592} -08/30/2021 18:54:43 - INFO - __main__ - Step 31307: {'lr': 0.0004531673565463632, 'samples': 6010944, 'steps': 31306, 'loss/train': 1.1974531412124634} -08/30/2021 18:54:44 - INFO - __main__ - Step 31308: {'lr': 0.0004531642641280913, 'samples': 6011136, 'steps': 31307, 'loss/train': 2.1453826427459717} -08/30/2021 18:54:44 - INFO - __main__ - Step 31309: {'lr': 0.0004531611716182767, 'samples': 6011328, 'steps': 31308, 'loss/train': 1.3563406467437744} -08/30/2021 18:54:44 - INFO - __main__ - Step 31310: {'lr': 0.0004531580790169207, 'samples': 6011520, 'steps': 31309, 'loss/train': 1.5168622732162476} -08/30/2021 18:54:45 - INFO - __main__ - Step 31311: {'lr': 0.00045315498632402494, 'samples': 6011712, 'steps': 31310, 'loss/train': 1.71764075756073} -08/30/2021 18:54:45 - INFO - __main__ - Step 31312: {'lr': 0.0004531518935395906, 'samples': 6011904, 'steps': 31311, 'loss/train': 1.6577080488204956} -08/30/2021 18:54:45 - INFO - __main__ - Step 31313: {'lr': 0.00045314880066361923, 'samples': 6012096, 'steps': 31312, 'loss/train': 1.8008569478988647} -08/30/2021 18:54:47 - INFO - __main__ - Step 31314: {'lr': 0.00045314570769611207, 'samples': 6012288, 'steps': 31313, 'loss/train': 1.7289601564407349} -08/30/2021 18:54:47 - INFO - __main__ - Step 31315: {'lr': 0.00045314261463707064, 'samples': 6012480, 'steps': 31314, 'loss/train': 0.739951491355896} -08/30/2021 18:54:48 - INFO - __main__ - Step 31316: {'lr': 0.00045313952148649626, 'samples': 6012672, 'steps': 31315, 'loss/train': 1.1222769021987915} -08/30/2021 18:54:48 - INFO - __main__ - Step 31317: {'lr': 0.0004531364282443904, 'samples': 6012864, 'steps': 31316, 'loss/train': 1.603251338005066} -08/30/2021 18:54:48 - INFO - __main__ - Step 31318: {'lr': 0.00045313333491075433, 'samples': 6013056, 'steps': 31317, 'loss/train': 1.1627026796340942} -08/30/2021 18:54:50 - INFO - __main__ - Step 31319: {'lr': 0.0004531302414855895, 'samples': 6013248, 'steps': 31318, 'loss/train': 1.9969780445098877} -08/30/2021 18:54:50 - INFO - __main__ - Step 31320: {'lr': 0.0004531271479688974, 'samples': 6013440, 'steps': 31319, 'loss/train': 1.1127108335494995} -08/30/2021 18:54:51 - INFO - __main__ - Step 31321: {'lr': 0.00045312405436067927, 'samples': 6013632, 'steps': 31320, 'loss/train': 1.810063362121582} -08/30/2021 18:54:51 - INFO - __main__ - Step 31322: {'lr': 0.00045312096066093654, 'samples': 6013824, 'steps': 31321, 'loss/train': 1.625144600868225} -08/30/2021 18:54:52 - INFO - __main__ - Step 31323: {'lr': 0.0004531178668696707, 'samples': 6014016, 'steps': 31322, 'loss/train': 1.8409335613250732} -08/30/2021 18:54:53 - INFO - __main__ - Step 31324: {'lr': 0.00045311477298688306, 'samples': 6014208, 'steps': 31323, 'loss/train': 1.6044880151748657} -08/30/2021 18:54:54 - INFO - __main__ - Step 31325: {'lr': 0.0004531116790125751, 'samples': 6014400, 'steps': 31324, 'loss/train': 0.9908980131149292} -08/30/2021 18:54:54 - INFO - __main__ - Step 31326: {'lr': 0.00045310858494674813, 'samples': 6014592, 'steps': 31325, 'loss/train': 2.1294140815734863} -08/30/2021 18:54:54 - INFO - __main__ - Step 31327: {'lr': 0.00045310549078940356, 'samples': 6014784, 'steps': 31326, 'loss/train': 4.76400899887085} -08/30/2021 18:54:55 - INFO - __main__ - Step 31328: {'lr': 0.00045310239654054274, 'samples': 6014976, 'steps': 31327, 'loss/train': 1.372968077659607} -08/30/2021 18:54:55 - INFO - __main__ - Step 31329: {'lr': 0.0004530993022001672, 'samples': 6015168, 'steps': 31328, 'loss/train': 1.0646507740020752} -08/30/2021 18:54:57 - INFO - __main__ - Step 31330: {'lr': 0.00045309620776827817, 'samples': 6015360, 'steps': 31329, 'loss/train': 1.1996066570281982} -08/30/2021 18:54:57 - INFO - __main__ - Step 31331: {'lr': 0.00045309311324487713, 'samples': 6015552, 'steps': 31330, 'loss/train': 1.597009539604187} -08/30/2021 18:54:58 - INFO - __main__ - Step 31332: {'lr': 0.0004530900186299655, 'samples': 6015744, 'steps': 31331, 'loss/train': 1.5069334506988525} -08/30/2021 18:54:58 - INFO - __main__ - Step 31333: {'lr': 0.0004530869239235446, 'samples': 6015936, 'steps': 31332, 'loss/train': 1.3375705480575562} -08/30/2021 18:54:58 - INFO - __main__ - Step 31334: {'lr': 0.0004530838291256159, 'samples': 6016128, 'steps': 31333, 'loss/train': 1.0631095170974731} -08/30/2021 18:55:00 - INFO - __main__ - Step 31335: {'lr': 0.0004530807342361807, 'samples': 6016320, 'steps': 31334, 'loss/train': 0.0816582441329956} -08/30/2021 18:55:00 - INFO - __main__ - Step 31336: {'lr': 0.0004530776392552406, 'samples': 6016512, 'steps': 31335, 'loss/train': 1.9605308771133423} -08/30/2021 18:55:00 - INFO - __main__ - Step 31337: {'lr': 0.0004530745441827967, 'samples': 6016704, 'steps': 31336, 'loss/train': 2.09440016746521} -08/30/2021 18:55:01 - INFO - __main__ - Step 31338: {'lr': 0.0004530714490188506, 'samples': 6016896, 'steps': 31337, 'loss/train': 1.6025139093399048} -08/30/2021 18:55:01 - INFO - __main__ - Step 31339: {'lr': 0.00045306835376340366, 'samples': 6017088, 'steps': 31338, 'loss/train': 1.575194001197815} -08/30/2021 18:55:03 - INFO - __main__ - Step 31340: {'lr': 0.00045306525841645723, 'samples': 6017280, 'steps': 31339, 'loss/train': 1.8693315982818604} -08/30/2021 18:55:04 - INFO - __main__ - Step 31341: {'lr': 0.0004530621629780127, 'samples': 6017472, 'steps': 31340, 'loss/train': 0.5270640254020691} -08/30/2021 18:55:04 - INFO - __main__ - Step 31342: {'lr': 0.00045305906744807156, 'samples': 6017664, 'steps': 31341, 'loss/train': 1.7819008827209473} -08/30/2021 18:55:05 - INFO - __main__ - Step 31343: {'lr': 0.0004530559718266351, 'samples': 6017856, 'steps': 31342, 'loss/train': 1.6175544261932373} -08/30/2021 18:55:05 - INFO - __main__ - Step 31344: {'lr': 0.0004530528761137047, 'samples': 6018048, 'steps': 31343, 'loss/train': 1.6291863918304443} -08/30/2021 18:55:06 - INFO - __main__ - Step 31345: {'lr': 0.0004530497803092819, 'samples': 6018240, 'steps': 31344, 'loss/train': 0.08060912042856216} -08/30/2021 18:55:07 - INFO - __main__ - Step 31346: {'lr': 0.000453046684413368, 'samples': 6018432, 'steps': 31345, 'loss/train': 0.9258426427841187} -08/30/2021 18:55:07 - INFO - __main__ - Step 31347: {'lr': 0.0004530435884259644, 'samples': 6018624, 'steps': 31346, 'loss/train': 1.0339792966842651} -08/30/2021 18:55:07 - INFO - __main__ - Step 31348: {'lr': 0.0004530404923470724, 'samples': 6018816, 'steps': 31347, 'loss/train': 1.7208458185195923} -08/30/2021 18:55:08 - INFO - __main__ - Step 31349: {'lr': 0.0004530373961766935, 'samples': 6019008, 'steps': 31348, 'loss/train': 1.387402892112732} -08/30/2021 18:55:09 - INFO - __main__ - Step 31350: {'lr': 0.00045303429991482914, 'samples': 6019200, 'steps': 31349, 'loss/train': 2.0206618309020996} -08/30/2021 18:55:10 - INFO - __main__ - Step 31351: {'lr': 0.00045303120356148067, 'samples': 6019392, 'steps': 31350, 'loss/train': 1.4462023973464966} -08/30/2021 18:55:10 - INFO - __main__ - Step 31352: {'lr': 0.00045302810711664944, 'samples': 6019584, 'steps': 31351, 'loss/train': 1.499739408493042} -08/30/2021 18:55:10 - INFO - __main__ - Step 31353: {'lr': 0.00045302501058033687, 'samples': 6019776, 'steps': 31352, 'loss/train': 2.4195618629455566} -08/30/2021 18:55:11 - INFO - __main__ - Step 31354: {'lr': 0.0004530219139525444, 'samples': 6019968, 'steps': 31353, 'loss/train': 1.561851978302002} -08/30/2021 18:55:12 - INFO - __main__ - Step 31355: {'lr': 0.0004530188172332733, 'samples': 6020160, 'steps': 31354, 'loss/train': 1.1478394269943237} -08/30/2021 18:55:13 - INFO - __main__ - Step 31356: {'lr': 0.00045301572042252516, 'samples': 6020352, 'steps': 31355, 'loss/train': 1.4215891361236572} -08/30/2021 18:55:13 - INFO - __main__ - Step 31357: {'lr': 0.00045301262352030123, 'samples': 6020544, 'steps': 31356, 'loss/train': 1.1591626405715942} -08/30/2021 18:55:13 - INFO - __main__ - Step 31358: {'lr': 0.00045300952652660296, 'samples': 6020736, 'steps': 31357, 'loss/train': 1.556175708770752} -08/30/2021 18:55:14 - INFO - __main__ - Step 31359: {'lr': 0.0004530064294414317, 'samples': 6020928, 'steps': 31358, 'loss/train': 1.4957365989685059} -08/30/2021 18:55:15 - INFO - __main__ - Step 31360: {'lr': 0.00045300333226478887, 'samples': 6021120, 'steps': 31359, 'loss/train': 1.3405539989471436} -08/30/2021 18:55:16 - INFO - __main__ - Step 31361: {'lr': 0.0004530002349966759, 'samples': 6021312, 'steps': 31360, 'loss/train': 2.0852339267730713} -08/30/2021 18:55:16 - INFO - __main__ - Step 31362: {'lr': 0.0004529971376370941, 'samples': 6021504, 'steps': 31361, 'loss/train': 2.0898191928863525} -08/30/2021 18:55:17 - INFO - __main__ - Step 31363: {'lr': 0.00045299404018604494, 'samples': 6021696, 'steps': 31362, 'loss/train': 1.0498466491699219} -08/30/2021 18:55:17 - INFO - __main__ - Step 31364: {'lr': 0.00045299094264352987, 'samples': 6021888, 'steps': 31363, 'loss/train': 1.621506929397583} -08/30/2021 18:55:17 - INFO - __main__ - Step 31365: {'lr': 0.00045298784500955014, 'samples': 6022080, 'steps': 31364, 'loss/train': 0.7947888374328613} -08/30/2021 18:55:19 - INFO - __main__ - Step 31366: {'lr': 0.0004529847472841073, 'samples': 6022272, 'steps': 31365, 'loss/train': 0.6868574619293213} -08/30/2021 18:55:19 - INFO - __main__ - Step 31367: {'lr': 0.00045298164946720254, 'samples': 6022464, 'steps': 31366, 'loss/train': 1.34158194065094} -08/30/2021 18:55:20 - INFO - __main__ - Step 31368: {'lr': 0.0004529785515588375, 'samples': 6022656, 'steps': 31367, 'loss/train': 3.5043113231658936} -08/30/2021 18:55:20 - INFO - __main__ - Step 31369: {'lr': 0.00045297545355901336, 'samples': 6022848, 'steps': 31368, 'loss/train': 2.601215124130249} -08/30/2021 18:55:20 - INFO - __main__ - Step 31370: {'lr': 0.00045297235546773175, 'samples': 6023040, 'steps': 31369, 'loss/train': 1.8250067234039307} -08/30/2021 18:55:22 - INFO - __main__ - Step 31371: {'lr': 0.0004529692572849938, 'samples': 6023232, 'steps': 31370, 'loss/train': 1.4554429054260254} -08/30/2021 18:55:22 - INFO - __main__ - Step 31372: {'lr': 0.00045296615901080107, 'samples': 6023424, 'steps': 31371, 'loss/train': 2.171494960784912} -08/30/2021 18:55:23 - INFO - __main__ - Step 31373: {'lr': 0.00045296306064515493, 'samples': 6023616, 'steps': 31372, 'loss/train': 0.9765689373016357} -08/30/2021 18:55:23 - INFO - __main__ - Step 31374: {'lr': 0.0004529599621880567, 'samples': 6023808, 'steps': 31373, 'loss/train': 0.9462294578552246} -08/30/2021 18:55:23 - INFO - __main__ - Step 31375: {'lr': 0.00045295686363950796, 'samples': 6024000, 'steps': 31374, 'loss/train': 1.7525094747543335} -08/30/2021 18:55:24 - INFO - __main__ - Step 31376: {'lr': 0.0004529537649995099, 'samples': 6024192, 'steps': 31375, 'loss/train': 1.6631157398223877} -08/30/2021 18:55:25 - INFO - __main__ - Step 31377: {'lr': 0.0004529506662680641, 'samples': 6024384, 'steps': 31376, 'loss/train': 1.1652833223342896} -08/30/2021 18:55:26 - INFO - __main__ - Step 31378: {'lr': 0.00045294756744517173, 'samples': 6024576, 'steps': 31377, 'loss/train': 1.4136176109313965} -08/30/2021 18:55:26 - INFO - __main__ - Step 31379: {'lr': 0.00045294446853083446, 'samples': 6024768, 'steps': 31378, 'loss/train': 0.5691795945167542} -08/30/2021 18:55:26 - INFO - __main__ - Step 31380: {'lr': 0.00045294136952505346, 'samples': 6024960, 'steps': 31379, 'loss/train': 1.966015338897705} -08/30/2021 18:55:27 - INFO - __main__ - Step 31381: {'lr': 0.0004529382704278302, 'samples': 6025152, 'steps': 31380, 'loss/train': 1.1273294687271118} -08/30/2021 18:55:29 - INFO - __main__ - Step 31382: {'lr': 0.0004529351712391661, 'samples': 6025344, 'steps': 31381, 'loss/train': 1.627261757850647} -08/30/2021 18:55:29 - INFO - __main__ - Step 31383: {'lr': 0.0004529320719590626, 'samples': 6025536, 'steps': 31382, 'loss/train': 1.3488986492156982} -08/30/2021 18:55:30 - INFO - __main__ - Step 31384: {'lr': 0.00045292897258752095, 'samples': 6025728, 'steps': 31383, 'loss/train': 0.031087197363376617} -08/30/2021 18:55:30 - INFO - __main__ - Step 31385: {'lr': 0.0004529258731245427, 'samples': 6025920, 'steps': 31384, 'loss/train': 1.359673023223877} -08/30/2021 18:55:30 - INFO - __main__ - Step 31386: {'lr': 0.0004529227735701291, 'samples': 6026112, 'steps': 31385, 'loss/train': 1.7532901763916016} -08/30/2021 18:55:31 - INFO - __main__ - Step 31387: {'lr': 0.00045291967392428175, 'samples': 6026304, 'steps': 31386, 'loss/train': 1.397007942199707} -08/30/2021 18:55:32 - INFO - __main__ - Step 31388: {'lr': 0.0004529165741870018, 'samples': 6026496, 'steps': 31387, 'loss/train': 2.2244186401367188} -08/30/2021 18:55:32 - INFO - __main__ - Step 31389: {'lr': 0.00045291347435829087, 'samples': 6026688, 'steps': 31388, 'loss/train': 1.6940562725067139} -08/30/2021 18:55:33 - INFO - __main__ - Step 31390: {'lr': 0.0004529103744381503, 'samples': 6026880, 'steps': 31389, 'loss/train': 1.3574824333190918} -08/30/2021 18:55:33 - INFO - __main__ - Step 31391: {'lr': 0.0004529072744265813, 'samples': 6027072, 'steps': 31390, 'loss/train': 0.9527828693389893} -08/30/2021 18:55:34 - INFO - __main__ - Step 31392: {'lr': 0.00045290417432358553, 'samples': 6027264, 'steps': 31391, 'loss/train': 1.5479423999786377} -08/30/2021 18:55:35 - INFO - __main__ - Step 31393: {'lr': 0.00045290107412916425, 'samples': 6027456, 'steps': 31392, 'loss/train': 1.2887177467346191} -08/30/2021 18:55:36 - INFO - __main__ - Step 31394: {'lr': 0.0004528979738433189, 'samples': 6027648, 'steps': 31393, 'loss/train': 1.2290927171707153} -08/30/2021 18:55:36 - INFO - __main__ - Step 31395: {'lr': 0.00045289487346605075, 'samples': 6027840, 'steps': 31394, 'loss/train': 1.4486130475997925} -08/30/2021 18:55:37 - INFO - __main__ - Step 31396: {'lr': 0.0004528917729973614, 'samples': 6028032, 'steps': 31395, 'loss/train': 2.506225824356079} -08/30/2021 18:55:37 - INFO - __main__ - Step 31397: {'lr': 0.00045288867243725207, 'samples': 6028224, 'steps': 31396, 'loss/train': 1.55485999584198} -08/30/2021 18:55:39 - INFO - __main__ - Step 31398: {'lr': 0.00045288557178572433, 'samples': 6028416, 'steps': 31397, 'loss/train': 1.430517315864563} -08/30/2021 18:55:39 - INFO - __main__ - Step 31399: {'lr': 0.00045288247104277937, 'samples': 6028608, 'steps': 31398, 'loss/train': 1.623408317565918} -08/30/2021 18:55:39 - INFO - __main__ - Step 31400: {'lr': 0.0004528793702084187, 'samples': 6028800, 'steps': 31399, 'loss/train': 1.3323373794555664} -08/30/2021 18:55:40 - INFO - __main__ - Step 31401: {'lr': 0.0004528762692826439, 'samples': 6028992, 'steps': 31400, 'loss/train': 2.479332208633423} -08/30/2021 18:55:40 - INFO - __main__ - Step 31402: {'lr': 0.000452873168265456, 'samples': 6029184, 'steps': 31401, 'loss/train': 1.2642860412597656} -08/30/2021 18:55:42 - INFO - __main__ - Step 31403: {'lr': 0.00045287006715685665, 'samples': 6029376, 'steps': 31402, 'loss/train': 0.9872164726257324} -08/30/2021 18:55:42 - INFO - __main__ - Step 31404: {'lr': 0.0004528669659568472, 'samples': 6029568, 'steps': 31403, 'loss/train': 0.9204387068748474} -08/30/2021 18:55:42 - INFO - __main__ - Step 31405: {'lr': 0.00045286386466542896, 'samples': 6029760, 'steps': 31404, 'loss/train': 1.208727240562439} -08/30/2021 18:55:43 - INFO - __main__ - Step 31406: {'lr': 0.0004528607632826034, 'samples': 6029952, 'steps': 31405, 'loss/train': 0.7143217325210571} -08/30/2021 18:55:43 - INFO - __main__ - Step 31407: {'lr': 0.00045285766180837197, 'samples': 6030144, 'steps': 31406, 'loss/train': 1.926500916481018} -08/30/2021 18:55:45 - INFO - __main__ - Step 31408: {'lr': 0.000452854560242736, 'samples': 6030336, 'steps': 31407, 'loss/train': 1.125378966331482} -08/30/2021 18:55:45 - INFO - __main__ - Step 31409: {'lr': 0.0004528514585856968, 'samples': 6030528, 'steps': 31408, 'loss/train': 1.475826621055603} -08/30/2021 18:55:46 - INFO - __main__ - Step 31410: {'lr': 0.0004528483568372559, 'samples': 6030720, 'steps': 31409, 'loss/train': 1.1945854425430298} -08/30/2021 18:55:46 - INFO - __main__ - Step 31411: {'lr': 0.00045284525499741474, 'samples': 6030912, 'steps': 31410, 'loss/train': 1.4862995147705078} -08/30/2021 18:55:46 - INFO - __main__ - Step 31412: {'lr': 0.0004528421530661746, 'samples': 6031104, 'steps': 31411, 'loss/train': 1.360161542892456} -08/30/2021 18:55:47 - INFO - __main__ - Step 31413: {'lr': 0.0004528390510435368, 'samples': 6031296, 'steps': 31412, 'loss/train': 2.8024587631225586} -08/30/2021 18:55:48 - INFO - __main__ - Step 31414: {'lr': 0.0004528359489295031, 'samples': 6031488, 'steps': 31413, 'loss/train': 1.5121667385101318} -08/30/2021 18:55:49 - INFO - __main__ - Step 31415: {'lr': 0.00045283284672407444, 'samples': 6031680, 'steps': 31414, 'loss/train': 1.7138633728027344} -08/30/2021 18:55:49 - INFO - __main__ - Step 31416: {'lr': 0.0004528297444272525, 'samples': 6031872, 'steps': 31415, 'loss/train': 1.478971004486084} -08/30/2021 18:55:49 - INFO - __main__ - Step 31417: {'lr': 0.0004528266420390386, 'samples': 6032064, 'steps': 31416, 'loss/train': 1.2854008674621582} -08/30/2021 18:55:50 - INFO - __main__ - Step 31418: {'lr': 0.00045282353955943417, 'samples': 6032256, 'steps': 31417, 'loss/train': 1.2074687480926514} -08/30/2021 18:55:51 - INFO - __main__ - Step 31419: {'lr': 0.00045282043698844054, 'samples': 6032448, 'steps': 31418, 'loss/train': 1.638526439666748} -08/30/2021 18:55:52 - INFO - __main__ - Step 31420: {'lr': 0.0004528173343260592, 'samples': 6032640, 'steps': 31419, 'loss/train': 0.10108483582735062} -08/30/2021 18:55:52 - INFO - __main__ - Step 31421: {'lr': 0.0004528142315722915, 'samples': 6032832, 'steps': 31420, 'loss/train': 1.5083378553390503} -08/30/2021 18:55:52 - INFO - __main__ - Step 31422: {'lr': 0.0004528111287271388, 'samples': 6033024, 'steps': 31421, 'loss/train': 1.3909136056900024} -08/30/2021 18:55:53 - INFO - __main__ - Step 31423: {'lr': 0.00045280802579060253, 'samples': 6033216, 'steps': 31422, 'loss/train': 0.7654160857200623} -08/30/2021 18:55:55 - INFO - __main__ - Step 31424: {'lr': 0.00045280492276268414, 'samples': 6033408, 'steps': 31423, 'loss/train': 1.332148551940918} -08/30/2021 18:55:55 - INFO - __main__ - Step 31425: {'lr': 0.0004528018196433849, 'samples': 6033600, 'steps': 31424, 'loss/train': 1.2332581281661987} -08/30/2021 18:55:55 - INFO - __main__ - Step 31426: {'lr': 0.0004527987164327063, 'samples': 6033792, 'steps': 31425, 'loss/train': 0.6418870091438293} -08/30/2021 18:55:56 - INFO - __main__ - Step 31427: {'lr': 0.0004527956131306498, 'samples': 6033984, 'steps': 31426, 'loss/train': 0.9826205372810364} -08/30/2021 18:55:56 - INFO - __main__ - Step 31428: {'lr': 0.0004527925097372168, 'samples': 6034176, 'steps': 31427, 'loss/train': 1.4369760751724243} -08/30/2021 18:55:56 - INFO - __main__ - Step 31429: {'lr': 0.0004527894062524084, 'samples': 6034368, 'steps': 31428, 'loss/train': 1.886527180671692} -08/30/2021 18:55:58 - INFO - __main__ - Step 31430: {'lr': 0.00045278630267622637, 'samples': 6034560, 'steps': 31429, 'loss/train': 1.3181524276733398} -08/30/2021 18:55:58 - INFO - __main__ - Step 31431: {'lr': 0.0004527831990086719, 'samples': 6034752, 'steps': 31430, 'loss/train': 1.613345742225647} -08/30/2021 18:55:59 - INFO - __main__ - Step 31432: {'lr': 0.0004527800952497465, 'samples': 6034944, 'steps': 31431, 'loss/train': 1.1999479532241821} -08/30/2021 18:55:59 - INFO - __main__ - Step 31433: {'lr': 0.0004527769913994515, 'samples': 6035136, 'steps': 31432, 'loss/train': 0.2586987614631653} -08/30/2021 18:55:59 - INFO - __main__ - Step 31434: {'lr': 0.00045277388745778836, 'samples': 6035328, 'steps': 31433, 'loss/train': 1.6988682746887207} -08/30/2021 18:56:01 - INFO - __main__ - Step 31435: {'lr': 0.00045277078342475835, 'samples': 6035520, 'steps': 31434, 'loss/train': 1.606391191482544} -08/30/2021 18:56:01 - INFO - __main__ - Step 31436: {'lr': 0.000452767679300363, 'samples': 6035712, 'steps': 31435, 'loss/train': 1.1598868370056152} -08/30/2021 18:56:02 - INFO - __main__ - Step 31437: {'lr': 0.00045276457508460367, 'samples': 6035904, 'steps': 31436, 'loss/train': 1.789568543434143} -08/30/2021 18:56:02 - INFO - __main__ - Step 31438: {'lr': 0.00045276147077748176, 'samples': 6036096, 'steps': 31437, 'loss/train': 1.4439555406570435} -08/30/2021 18:56:02 - INFO - __main__ - Step 31439: {'lr': 0.0004527583663789986, 'samples': 6036288, 'steps': 31438, 'loss/train': 1.4716142416000366} -08/30/2021 18:56:04 - INFO - __main__ - Step 31440: {'lr': 0.0004527552618891557, 'samples': 6036480, 'steps': 31439, 'loss/train': 1.370036244392395} -08/30/2021 18:56:04 - INFO - __main__ - Step 31441: {'lr': 0.0004527521573079544, 'samples': 6036672, 'steps': 31440, 'loss/train': 1.1786279678344727} -08/30/2021 18:56:05 - INFO - __main__ - Step 31442: {'lr': 0.0004527490526353961, 'samples': 6036864, 'steps': 31441, 'loss/train': 1.855455994606018} -08/30/2021 18:56:05 - INFO - __main__ - Step 31443: {'lr': 0.0004527459478714822, 'samples': 6037056, 'steps': 31442, 'loss/train': 0.9614437818527222} -08/30/2021 18:56:05 - INFO - __main__ - Step 31444: {'lr': 0.00045274284301621414, 'samples': 6037248, 'steps': 31443, 'loss/train': 1.296837568283081} -08/30/2021 18:56:07 - INFO - __main__ - Step 31445: {'lr': 0.00045273973806959325, 'samples': 6037440, 'steps': 31444, 'loss/train': 0.8728410005569458} -08/30/2021 18:56:07 - INFO - __main__ - Step 31446: {'lr': 0.00045273663303162096, 'samples': 6037632, 'steps': 31445, 'loss/train': 1.9406379461288452} -08/30/2021 18:56:08 - INFO - __main__ - Step 31447: {'lr': 0.00045273352790229873, 'samples': 6037824, 'steps': 31446, 'loss/train': 1.4328932762145996} -08/30/2021 18:56:08 - INFO - __main__ - Step 31448: {'lr': 0.0004527304226816278, 'samples': 6038016, 'steps': 31447, 'loss/train': 1.1640315055847168} -08/30/2021 18:56:08 - INFO - __main__ - Step 31449: {'lr': 0.0004527273173696097, 'samples': 6038208, 'steps': 31448, 'loss/train': 1.3157843351364136} -08/30/2021 18:56:10 - INFO - __main__ - Step 31450: {'lr': 0.0004527242119662458, 'samples': 6038400, 'steps': 31449, 'loss/train': 1.4977264404296875} -08/30/2021 18:56:11 - INFO - __main__ - Step 31451: {'lr': 0.00045272110647153754, 'samples': 6038592, 'steps': 31450, 'loss/train': 1.9133837223052979} -08/30/2021 18:56:11 - INFO - __main__ - Step 31452: {'lr': 0.00045271800088548625, 'samples': 6038784, 'steps': 31451, 'loss/train': 1.0430338382720947} -08/30/2021 18:56:12 - INFO - __main__ - Step 31453: {'lr': 0.00045271489520809337, 'samples': 6038976, 'steps': 31452, 'loss/train': 0.23288923501968384} -08/30/2021 18:56:12 - INFO - __main__ - Step 31454: {'lr': 0.0004527117894393603, 'samples': 6039168, 'steps': 31453, 'loss/train': 1.496104121208191} -08/30/2021 18:56:12 - INFO - __main__ - Step 31455: {'lr': 0.0004527086835792884, 'samples': 6039360, 'steps': 31454, 'loss/train': 1.5991955995559692} -08/30/2021 18:56:14 - INFO - __main__ - Step 31456: {'lr': 0.0004527055776278791, 'samples': 6039552, 'steps': 31455, 'loss/train': 2.231074094772339} -08/30/2021 18:56:14 - INFO - __main__ - Step 31457: {'lr': 0.00045270247158513377, 'samples': 6039744, 'steps': 31456, 'loss/train': 1.1377114057540894} -08/30/2021 18:56:15 - INFO - __main__ - Step 31458: {'lr': 0.00045269936545105384, 'samples': 6039936, 'steps': 31457, 'loss/train': 1.273699164390564} -08/30/2021 18:56:15 - INFO - __main__ - Step 31459: {'lr': 0.0004526962592256407, 'samples': 6040128, 'steps': 31458, 'loss/train': 1.3193888664245605} -08/30/2021 18:56:15 - INFO - __main__ - Step 31460: {'lr': 0.00045269315290889583, 'samples': 6040320, 'steps': 31459, 'loss/train': 1.9876859188079834} -08/30/2021 18:56:17 - INFO - __main__ - Step 31461: {'lr': 0.00045269004650082045, 'samples': 6040512, 'steps': 31460, 'loss/train': 1.8289393186569214} -08/30/2021 18:56:17 - INFO - __main__ - Step 31462: {'lr': 0.0004526869400014162, 'samples': 6040704, 'steps': 31461, 'loss/train': 1.0538196563720703} -08/30/2021 18:56:18 - INFO - __main__ - Step 31463: {'lr': 0.0004526838334106842, 'samples': 6040896, 'steps': 31462, 'loss/train': 2.3195483684539795} -08/30/2021 18:56:18 - INFO - __main__ - Step 31464: {'lr': 0.000452680726728626, 'samples': 6041088, 'steps': 31463, 'loss/train': 1.1052652597427368} -08/30/2021 18:56:18 - INFO - __main__ - Step 31465: {'lr': 0.00045267761995524314, 'samples': 6041280, 'steps': 31464, 'loss/train': 1.0972288846969604} -08/30/2021 18:56:20 - INFO - __main__ - Step 31466: {'lr': 0.00045267451309053677, 'samples': 6041472, 'steps': 31465, 'loss/train': 1.22018563747406} -08/30/2021 18:56:21 - INFO - __main__ - Step 31467: {'lr': 0.0004526714061345084, 'samples': 6041664, 'steps': 31466, 'loss/train': 1.823421835899353} -08/30/2021 18:56:21 - INFO - __main__ - Step 31468: {'lr': 0.0004526682990871593, 'samples': 6041856, 'steps': 31467, 'loss/train': 1.3162624835968018} -08/30/2021 18:56:21 - INFO - __main__ - Step 31469: {'lr': 0.0004526651919484912, 'samples': 6042048, 'steps': 31468, 'loss/train': 1.4950264692306519} -08/30/2021 18:56:22 - INFO - __main__ - Step 31470: {'lr': 0.00045266208471850516, 'samples': 6042240, 'steps': 31469, 'loss/train': 1.1708528995513916} -08/30/2021 18:56:23 - INFO - __main__ - Step 31471: {'lr': 0.00045265897739720277, 'samples': 6042432, 'steps': 31470, 'loss/train': 1.3910452127456665} -08/30/2021 18:56:24 - INFO - __main__ - Step 31472: {'lr': 0.00045265586998458534, 'samples': 6042624, 'steps': 31471, 'loss/train': 1.279205322265625} -08/30/2021 18:56:24 - INFO - __main__ - Step 31473: {'lr': 0.00045265276248065436, 'samples': 6042816, 'steps': 31472, 'loss/train': 1.2575830221176147} -08/30/2021 18:56:24 - INFO - __main__ - Step 31474: {'lr': 0.0004526496548854111, 'samples': 6043008, 'steps': 31473, 'loss/train': 1.222016453742981} -08/30/2021 18:56:25 - INFO - __main__ - Step 31475: {'lr': 0.000452646547198857, 'samples': 6043200, 'steps': 31474, 'loss/train': 1.686367392539978} -08/30/2021 18:56:25 - INFO - __main__ - Step 31476: {'lr': 0.0004526434394209936, 'samples': 6043392, 'steps': 31475, 'loss/train': 1.1926203966140747} -08/30/2021 18:56:27 - INFO - __main__ - Step 31477: {'lr': 0.00045264033155182216, 'samples': 6043584, 'steps': 31476, 'loss/train': 1.3968989849090576} -08/30/2021 18:56:27 - INFO - __main__ - Step 31478: {'lr': 0.0004526372235913441, 'samples': 6043776, 'steps': 31477, 'loss/train': 0.8984674215316772} -08/30/2021 18:56:27 - INFO - __main__ - Step 31479: {'lr': 0.0004526341155395608, 'samples': 6043968, 'steps': 31478, 'loss/train': 1.6023017168045044} -08/30/2021 18:56:28 - INFO - __main__ - Step 31480: {'lr': 0.00045263100739647373, 'samples': 6044160, 'steps': 31479, 'loss/train': 1.2159675359725952} -08/30/2021 18:56:28 - INFO - __main__ - Step 31481: {'lr': 0.00045262789916208424, 'samples': 6044352, 'steps': 31480, 'loss/train': 0.6490748524665833} -08/30/2021 18:56:30 - INFO - __main__ - Step 31482: {'lr': 0.00045262479083639376, 'samples': 6044544, 'steps': 31481, 'loss/train': 0.8157838582992554} -08/30/2021 18:56:30 - INFO - __main__ - Step 31483: {'lr': 0.0004526216824194037, 'samples': 6044736, 'steps': 31482, 'loss/train': 2.0911879539489746} -08/30/2021 18:56:30 - INFO - __main__ - Step 31484: {'lr': 0.00045261857391111536, 'samples': 6044928, 'steps': 31483, 'loss/train': 1.2063584327697754} -08/30/2021 18:56:31 - INFO - __main__ - Step 31485: {'lr': 0.0004526154653115303, 'samples': 6045120, 'steps': 31484, 'loss/train': 1.706596851348877} -08/30/2021 18:56:31 - INFO - __main__ - Step 31486: {'lr': 0.0004526123566206498, 'samples': 6045312, 'steps': 31485, 'loss/train': 0.9205894470214844} -08/30/2021 18:56:33 - INFO - __main__ - Step 31487: {'lr': 0.0004526092478384753, 'samples': 6045504, 'steps': 31486, 'loss/train': 1.7218198776245117} -08/30/2021 18:56:33 - INFO - __main__ - Step 31488: {'lr': 0.00045260613896500827, 'samples': 6045696, 'steps': 31487, 'loss/train': 1.2149503231048584} -08/30/2021 18:56:33 - INFO - __main__ - Step 31489: {'lr': 0.00045260303000024994, 'samples': 6045888, 'steps': 31488, 'loss/train': 1.7236899137496948} -08/30/2021 18:56:34 - INFO - __main__ - Step 31490: {'lr': 0.0004525999209442018, 'samples': 6046080, 'steps': 31489, 'loss/train': 1.7597769498825073} -08/30/2021 18:56:34 - INFO - __main__ - Step 31491: {'lr': 0.0004525968117968653, 'samples': 6046272, 'steps': 31490, 'loss/train': 0.8732706308364868} -08/30/2021 18:56:34 - INFO - __main__ - Step 31492: {'lr': 0.00045259370255824183, 'samples': 6046464, 'steps': 31491, 'loss/train': 5.7229084968566895} -08/30/2021 18:56:36 - INFO - __main__ - Step 31493: {'lr': 0.0004525905932283327, 'samples': 6046656, 'steps': 31492, 'loss/train': 1.1895314455032349} -08/30/2021 18:56:37 - INFO - __main__ - Step 31494: {'lr': 0.00045258748380713943, 'samples': 6046848, 'steps': 31493, 'loss/train': 1.7025678157806396} -08/30/2021 18:56:37 - INFO - __main__ - Step 31495: {'lr': 0.00045258437429466337, 'samples': 6047040, 'steps': 31494, 'loss/train': 1.4857701063156128} -08/30/2021 18:56:37 - INFO - __main__ - Step 31496: {'lr': 0.0004525812646909059, 'samples': 6047232, 'steps': 31495, 'loss/train': 0.993442952632904} -08/30/2021 18:56:38 - INFO - __main__ - Step 31497: {'lr': 0.0004525781549958684, 'samples': 6047424, 'steps': 31496, 'loss/train': 1.1009951829910278} -08/30/2021 18:56:39 - INFO - __main__ - Step 31498: {'lr': 0.0004525750452095524, 'samples': 6047616, 'steps': 31497, 'loss/train': 1.534775972366333} -08/30/2021 18:56:40 - INFO - __main__ - Step 31499: {'lr': 0.00045257193533195916, 'samples': 6047808, 'steps': 31498, 'loss/train': 1.2641210556030273} -08/30/2021 18:56:40 - INFO - __main__ - Step 31500: {'lr': 0.0004525688253630901, 'samples': 6048000, 'steps': 31499, 'loss/train': 1.6611754894256592} -08/30/2021 18:56:40 - INFO - __main__ - Step 31501: {'lr': 0.00045256571530294664, 'samples': 6048192, 'steps': 31500, 'loss/train': 1.4023146629333496} -08/30/2021 18:56:41 - INFO - __main__ - Step 31502: {'lr': 0.0004525626051515302, 'samples': 6048384, 'steps': 31501, 'loss/train': 1.5561954975128174} -08/30/2021 18:56:42 - INFO - __main__ - Step 31503: {'lr': 0.0004525594949088423, 'samples': 6048576, 'steps': 31502, 'loss/train': 2.238656520843506} -08/30/2021 18:56:43 - INFO - __main__ - Step 31504: {'lr': 0.00045255638457488415, 'samples': 6048768, 'steps': 31503, 'loss/train': 0.05404098704457283} -08/30/2021 18:56:43 - INFO - __main__ - Step 31505: {'lr': 0.0004525532741496572, 'samples': 6048960, 'steps': 31504, 'loss/train': 1.7800315618515015} -08/30/2021 18:56:43 - INFO - __main__ - Step 31506: {'lr': 0.0004525501636331628, 'samples': 6049152, 'steps': 31505, 'loss/train': 1.8348767757415771} -08/30/2021 18:56:44 - INFO - __main__ - Step 31507: {'lr': 0.00045254705302540257, 'samples': 6049344, 'steps': 31506, 'loss/train': 1.6852188110351562} -08/30/2021 18:56:46 - INFO - __main__ - Step 31508: {'lr': 0.00045254394232637765, 'samples': 6049536, 'steps': 31507, 'loss/train': 1.7218661308288574} -08/30/2021 18:56:46 - INFO - __main__ - Step 31509: {'lr': 0.0004525408315360896, 'samples': 6049728, 'steps': 31508, 'loss/train': 1.3552794456481934} -08/30/2021 18:56:47 - INFO - __main__ - Step 31510: {'lr': 0.00045253772065453977, 'samples': 6049920, 'steps': 31509, 'loss/train': 1.0921895503997803} -08/30/2021 18:56:47 - INFO - __main__ - Step 31511: {'lr': 0.00045253460968172957, 'samples': 6050112, 'steps': 31510, 'loss/train': 1.7306175231933594} -08/30/2021 18:56:47 - INFO - __main__ - Step 31512: {'lr': 0.0004525314986176604, 'samples': 6050304, 'steps': 31511, 'loss/train': 0.8179535865783691} -08/30/2021 18:56:49 - INFO - __main__ - Step 31513: {'lr': 0.0004525283874623336, 'samples': 6050496, 'steps': 31512, 'loss/train': 1.351931095123291} -08/30/2021 18:56:50 - INFO - __main__ - Step 31514: {'lr': 0.00045252527621575075, 'samples': 6050688, 'steps': 31513, 'loss/train': 1.6400539875030518} -08/30/2021 18:56:50 - INFO - __main__ - Step 31515: {'lr': 0.0004525221648779131, 'samples': 6050880, 'steps': 31514, 'loss/train': 1.9648393392562866} -08/30/2021 18:56:50 - INFO - __main__ - Step 31516: {'lr': 0.00045251905344882205, 'samples': 6051072, 'steps': 31515, 'loss/train': 1.9522805213928223} -08/30/2021 18:56:51 - INFO - __main__ - Step 31517: {'lr': 0.000452515941928479, 'samples': 6051264, 'steps': 31516, 'loss/train': 1.3978352546691895} -08/30/2021 18:56:51 - INFO - __main__ - Step 31518: {'lr': 0.0004525128303168855, 'samples': 6051456, 'steps': 31517, 'loss/train': 1.381455421447754} -08/30/2021 18:56:52 - INFO - __main__ - Step 31519: {'lr': 0.00045250971861404276, 'samples': 6051648, 'steps': 31518, 'loss/train': 1.6752939224243164} -08/30/2021 18:56:53 - INFO - __main__ - Step 31520: {'lr': 0.0004525066068199523, 'samples': 6051840, 'steps': 31519, 'loss/train': 1.2719836235046387} -08/30/2021 18:56:53 - INFO - __main__ - Step 31521: {'lr': 0.0004525034949346155, 'samples': 6052032, 'steps': 31520, 'loss/train': 1.4441601037979126} -08/30/2021 18:56:54 - INFO - __main__ - Step 31522: {'lr': 0.0004525003829580337, 'samples': 6052224, 'steps': 31521, 'loss/train': 2.3608810901641846} -08/30/2021 18:56:54 - INFO - __main__ - Step 31523: {'lr': 0.0004524972708902084, 'samples': 6052416, 'steps': 31522, 'loss/train': 1.4365335702896118} -08/30/2021 18:56:56 - INFO - __main__ - Step 31524: {'lr': 0.0004524941587311409, 'samples': 6052608, 'steps': 31523, 'loss/train': 1.589581847190857} -08/30/2021 18:56:56 - INFO - __main__ - Step 31525: {'lr': 0.0004524910464808327, 'samples': 6052800, 'steps': 31524, 'loss/train': 1.5015918016433716} -08/30/2021 18:56:56 - INFO - __main__ - Step 31526: {'lr': 0.00045248793413928514, 'samples': 6052992, 'steps': 31525, 'loss/train': 1.3970669507980347} -08/30/2021 18:56:57 - INFO - __main__ - Step 31527: {'lr': 0.0004524848217064997, 'samples': 6053184, 'steps': 31526, 'loss/train': 1.0029394626617432} -08/30/2021 18:56:57 - INFO - __main__ - Step 31528: {'lr': 0.0004524817091824777, 'samples': 6053376, 'steps': 31527, 'loss/train': 1.034461259841919} -08/30/2021 18:56:59 - INFO - __main__ - Step 31529: {'lr': 0.00045247859656722056, 'samples': 6053568, 'steps': 31528, 'loss/train': 1.2880207300186157} -08/30/2021 18:56:59 - INFO - __main__ - Step 31530: {'lr': 0.0004524754838607297, 'samples': 6053760, 'steps': 31529, 'loss/train': 1.7482061386108398} -08/30/2021 18:56:59 - INFO - __main__ - Step 31531: {'lr': 0.0004524723710630064, 'samples': 6053952, 'steps': 31530, 'loss/train': 1.3517693281173706} -08/30/2021 18:57:00 - INFO - __main__ - Step 31532: {'lr': 0.0004524692581740523, 'samples': 6054144, 'steps': 31531, 'loss/train': 1.4645726680755615} -08/30/2021 18:57:00 - INFO - __main__ - Step 31533: {'lr': 0.00045246614519386865, 'samples': 6054336, 'steps': 31532, 'loss/train': 1.362823247909546} -08/30/2021 18:57:02 - INFO - __main__ - Step 31534: {'lr': 0.0004524630321224569, 'samples': 6054528, 'steps': 31533, 'loss/train': 1.1384767293930054} -08/30/2021 18:57:02 - INFO - __main__ - Step 31535: {'lr': 0.0004524599189598183, 'samples': 6054720, 'steps': 31534, 'loss/train': 1.7595208883285522} -08/30/2021 18:57:03 - INFO - __main__ - Step 31536: {'lr': 0.0004524568057059545, 'samples': 6054912, 'steps': 31535, 'loss/train': 1.2609013319015503} -08/30/2021 18:57:03 - INFO - __main__ - Step 31537: {'lr': 0.00045245369236086673, 'samples': 6055104, 'steps': 31536, 'loss/train': 1.063708782196045} -08/30/2021 18:57:03 - INFO - __main__ - Step 31538: {'lr': 0.00045245057892455653, 'samples': 6055296, 'steps': 31537, 'loss/train': 1.398468255996704} -08/30/2021 18:57:05 - INFO - __main__ - Step 31539: {'lr': 0.0004524474653970252, 'samples': 6055488, 'steps': 31538, 'loss/train': 1.3290035724639893} -08/30/2021 18:57:05 - INFO - __main__ - Step 31540: {'lr': 0.00045244435177827413, 'samples': 6055680, 'steps': 31539, 'loss/train': 0.9209257960319519} -08/30/2021 18:57:06 - INFO - __main__ - Step 31541: {'lr': 0.00045244123806830486, 'samples': 6055872, 'steps': 31540, 'loss/train': 2.057265520095825} -08/30/2021 18:57:06 - INFO - __main__ - Step 31542: {'lr': 0.00045243812426711856, 'samples': 6056064, 'steps': 31541, 'loss/train': 1.5249072313308716} -08/30/2021 18:57:06 - INFO - __main__ - Step 31543: {'lr': 0.0004524350103747168, 'samples': 6056256, 'steps': 31542, 'loss/train': 1.7326353788375854} -08/30/2021 18:57:07 - INFO - __main__ - Step 31544: {'lr': 0.00045243189639110093, 'samples': 6056448, 'steps': 31543, 'loss/train': 1.630940318107605} -08/30/2021 18:57:09 - INFO - __main__ - Step 31545: {'lr': 0.00045242878231627247, 'samples': 6056640, 'steps': 31544, 'loss/train': 1.7212327718734741} -08/30/2021 18:57:09 - INFO - __main__ - Step 31546: {'lr': 0.0004524256681502327, 'samples': 6056832, 'steps': 31545, 'loss/train': 1.0421826839447021} -08/30/2021 18:57:10 - INFO - __main__ - Step 31547: {'lr': 0.0004524225538929829, 'samples': 6057024, 'steps': 31546, 'loss/train': 1.0967950820922852} -08/30/2021 18:57:10 - INFO - __main__ - Step 31548: {'lr': 0.0004524194395445248, 'samples': 6057216, 'steps': 31547, 'loss/train': 1.576261281967163} -08/30/2021 18:57:10 - INFO - __main__ - Step 31549: {'lr': 0.0004524163251048595, 'samples': 6057408, 'steps': 31548, 'loss/train': 1.1451524496078491} -08/30/2021 18:57:11 - INFO - __main__ - Step 31550: {'lr': 0.0004524132105739886, 'samples': 6057600, 'steps': 31549, 'loss/train': 0.09778346121311188} -08/30/2021 18:57:12 - INFO - __main__ - Step 31551: {'lr': 0.0004524100959519134, 'samples': 6057792, 'steps': 31550, 'loss/train': 0.08346326649188995} -08/30/2021 18:57:13 - INFO - __main__ - Step 31552: {'lr': 0.00045240698123863535, 'samples': 6057984, 'steps': 31551, 'loss/train': 2.0149972438812256} -08/30/2021 18:57:13 - INFO - __main__ - Step 31553: {'lr': 0.0004524038664341558, 'samples': 6058176, 'steps': 31552, 'loss/train': 1.7667441368103027} -08/30/2021 18:57:13 - INFO - __main__ - Step 31554: {'lr': 0.00045240075153847625, 'samples': 6058368, 'steps': 31553, 'loss/train': 1.8250231742858887} -08/30/2021 18:57:14 - INFO - __main__ - Step 31555: {'lr': 0.00045239763655159805, 'samples': 6058560, 'steps': 31554, 'loss/train': 1.6269919872283936} -08/30/2021 18:57:15 - INFO - __main__ - Step 31556: {'lr': 0.00045239452147352257, 'samples': 6058752, 'steps': 31555, 'loss/train': 1.7754318714141846} -08/30/2021 18:57:16 - INFO - __main__ - Step 31557: {'lr': 0.0004523914063042512, 'samples': 6058944, 'steps': 31556, 'loss/train': 1.6464051008224487} -08/30/2021 18:57:16 - INFO - __main__ - Step 31558: {'lr': 0.00045238829104378545, 'samples': 6059136, 'steps': 31557, 'loss/train': 2.1267404556274414} -08/30/2021 18:57:16 - INFO - __main__ - Step 31559: {'lr': 0.0004523851756921266, 'samples': 6059328, 'steps': 31558, 'loss/train': 1.0851868391036987} -08/30/2021 18:57:17 - INFO - __main__ - Step 31560: {'lr': 0.00045238206024927614, 'samples': 6059520, 'steps': 31559, 'loss/train': 1.1838688850402832} -08/30/2021 18:57:19 - INFO - __main__ - Step 31561: {'lr': 0.00045237894471523543, 'samples': 6059712, 'steps': 31560, 'loss/train': 1.5186291933059692} -08/30/2021 18:57:20 - INFO - __main__ - Step 31562: {'lr': 0.00045237582909000594, 'samples': 6059904, 'steps': 31561, 'loss/train': 1.5224990844726562} -08/30/2021 18:57:20 - INFO - __main__ - Step 31563: {'lr': 0.00045237271337358897, 'samples': 6060096, 'steps': 31562, 'loss/train': 0.7331939935684204} -08/30/2021 18:57:20 - INFO - __main__ - Step 31564: {'lr': 0.00045236959756598605, 'samples': 6060288, 'steps': 31563, 'loss/train': 1.7170697450637817} -08/30/2021 18:57:21 - INFO - __main__ - Step 31565: {'lr': 0.0004523664816671985, 'samples': 6060480, 'steps': 31564, 'loss/train': 1.411661982536316} -08/30/2021 18:57:22 - INFO - __main__ - Step 31566: {'lr': 0.0004523633656772277, 'samples': 6060672, 'steps': 31565, 'loss/train': 1.6969722509384155} -08/30/2021 18:57:23 - INFO - __main__ - Step 31567: {'lr': 0.00045236024959607505, 'samples': 6060864, 'steps': 31566, 'loss/train': 1.627051591873169} -08/30/2021 18:57:23 - INFO - __main__ - Step 31568: {'lr': 0.00045235713342374207, 'samples': 6061056, 'steps': 31567, 'loss/train': 1.966498851776123} -08/30/2021 18:57:23 - INFO - __main__ - Step 31569: {'lr': 0.00045235401716023, 'samples': 6061248, 'steps': 31568, 'loss/train': 1.27817702293396} -08/30/2021 18:57:24 - INFO - __main__ - Step 31570: {'lr': 0.0004523509008055404, 'samples': 6061440, 'steps': 31569, 'loss/train': 0.9885744452476501} -08/30/2021 18:57:24 - INFO - __main__ - Step 31571: {'lr': 0.0004523477843596746, 'samples': 6061632, 'steps': 31570, 'loss/train': 1.8031383752822876} -08/30/2021 18:57:26 - INFO - __main__ - Step 31572: {'lr': 0.00045234466782263403, 'samples': 6061824, 'steps': 31571, 'loss/train': 1.3130309581756592} -08/30/2021 18:57:26 - INFO - __main__ - Step 31573: {'lr': 0.00045234155119442, 'samples': 6062016, 'steps': 31572, 'loss/train': 1.1655257940292358} -08/30/2021 18:57:26 - INFO - __main__ - Step 31574: {'lr': 0.00045233843447503407, 'samples': 6062208, 'steps': 31573, 'loss/train': 1.9268194437026978} -08/30/2021 18:57:27 - INFO - __main__ - Step 31575: {'lr': 0.00045233531766447757, 'samples': 6062400, 'steps': 31574, 'loss/train': 1.5363763570785522} -08/30/2021 18:57:27 - INFO - __main__ - Step 31576: {'lr': 0.00045233220076275186, 'samples': 6062592, 'steps': 31575, 'loss/train': 1.273422122001648} -08/30/2021 18:57:29 - INFO - __main__ - Step 31577: {'lr': 0.0004523290837698583, 'samples': 6062784, 'steps': 31576, 'loss/train': 1.2363674640655518} -08/30/2021 18:57:29 - INFO - __main__ - Step 31578: {'lr': 0.0004523259666857985, 'samples': 6062976, 'steps': 31577, 'loss/train': 2.001171827316284} -08/30/2021 18:57:29 - INFO - __main__ - Step 31579: {'lr': 0.00045232284951057366, 'samples': 6063168, 'steps': 31578, 'loss/train': 2.232010841369629} -08/30/2021 18:57:30 - INFO - __main__ - Step 31580: {'lr': 0.00045231973224418533, 'samples': 6063360, 'steps': 31579, 'loss/train': 1.2469266653060913} -08/30/2021 18:57:30 - INFO - __main__ - Step 31581: {'lr': 0.00045231661488663485, 'samples': 6063552, 'steps': 31580, 'loss/train': 1.5800751447677612} -08/30/2021 18:57:32 - INFO - __main__ - Step 31582: {'lr': 0.0004523134974379236, 'samples': 6063744, 'steps': 31581, 'loss/train': 1.8041555881500244} -08/30/2021 18:57:32 - INFO - __main__ - Step 31583: {'lr': 0.000452310379898053, 'samples': 6063936, 'steps': 31582, 'loss/train': 1.0503699779510498} -08/30/2021 18:57:32 - INFO - __main__ - Step 31584: {'lr': 0.00045230726226702444, 'samples': 6064128, 'steps': 31583, 'loss/train': 1.2031890153884888} -08/30/2021 18:57:33 - INFO - __main__ - Step 31585: {'lr': 0.0004523041445448394, 'samples': 6064320, 'steps': 31584, 'loss/train': 1.5853074789047241} -08/30/2021 18:57:33 - INFO - __main__ - Step 31586: {'lr': 0.00045230102673149923, 'samples': 6064512, 'steps': 31585, 'loss/train': 1.3289752006530762} -08/30/2021 18:57:35 - INFO - __main__ - Step 31587: {'lr': 0.00045229790882700535, 'samples': 6064704, 'steps': 31586, 'loss/train': 0.9187049269676208} -08/30/2021 18:57:35 - INFO - __main__ - Step 31588: {'lr': 0.00045229479083135917, 'samples': 6064896, 'steps': 31587, 'loss/train': 1.7024964094161987} -08/30/2021 18:57:35 - INFO - __main__ - Step 31589: {'lr': 0.000452291672744562, 'samples': 6065088, 'steps': 31588, 'loss/train': 1.8442749977111816} -08/30/2021 18:57:36 - INFO - __main__ - Step 31590: {'lr': 0.0004522885545666153, 'samples': 6065280, 'steps': 31589, 'loss/train': 0.8489173054695129} -08/30/2021 18:57:36 - INFO - __main__ - Step 31591: {'lr': 0.0004522854362975206, 'samples': 6065472, 'steps': 31590, 'loss/train': 1.4772372245788574} -08/30/2021 18:57:38 - INFO - __main__ - Step 31592: {'lr': 0.00045228231793727924, 'samples': 6065664, 'steps': 31591, 'loss/train': 1.51474928855896} -08/30/2021 18:57:39 - INFO - __main__ - Step 31593: {'lr': 0.00045227919948589247, 'samples': 6065856, 'steps': 31592, 'loss/train': 1.716181755065918} -08/30/2021 18:57:39 - INFO - __main__ - Step 31594: {'lr': 0.0004522760809433619, 'samples': 6066048, 'steps': 31593, 'loss/train': 0.03369634971022606} -08/30/2021 18:57:39 - INFO - __main__ - Step 31595: {'lr': 0.0004522729623096888, 'samples': 6066240, 'steps': 31594, 'loss/train': 0.9508997201919556} -08/30/2021 18:57:40 - INFO - __main__ - Step 31596: {'lr': 0.0004522698435848747, 'samples': 6066432, 'steps': 31595, 'loss/train': 1.5020116567611694} -08/30/2021 18:57:40 - INFO - __main__ - Step 31597: {'lr': 0.0004522667247689208, 'samples': 6066624, 'steps': 31596, 'loss/train': 1.4500706195831299} -08/30/2021 18:57:40 - INFO - __main__ - Step 31598: {'lr': 0.0004522636058618287, 'samples': 6066816, 'steps': 31597, 'loss/train': 1.1037218570709229} -08/30/2021 18:57:42 - INFO - __main__ - Step 31599: {'lr': 0.0004522604868635998, 'samples': 6067008, 'steps': 31598, 'loss/train': 1.8208473920822144} -08/30/2021 18:57:42 - INFO - __main__ - Step 31600: {'lr': 0.0004522573677742353, 'samples': 6067200, 'steps': 31599, 'loss/train': 1.5743062496185303} -08/30/2021 18:57:43 - INFO - __main__ - Step 31601: {'lr': 0.0004522542485937369, 'samples': 6067392, 'steps': 31600, 'loss/train': 0.9678654074668884} -08/30/2021 18:57:43 - INFO - __main__ - Step 31602: {'lr': 0.0004522511293221058, 'samples': 6067584, 'steps': 31601, 'loss/train': 1.4245835542678833} -08/30/2021 18:57:43 - INFO - __main__ - Step 31603: {'lr': 0.00045224800995934345, 'samples': 6067776, 'steps': 31602, 'loss/train': 1.0812561511993408} -08/30/2021 18:57:45 - INFO - __main__ - Step 31604: {'lr': 0.00045224489050545125, 'samples': 6067968, 'steps': 31603, 'loss/train': 1.6551666259765625} -08/30/2021 18:57:46 - INFO - __main__ - Step 31605: {'lr': 0.0004522417709604306, 'samples': 6068160, 'steps': 31604, 'loss/train': 1.3745955228805542} -08/30/2021 18:57:46 - INFO - __main__ - Step 31606: {'lr': 0.000452238651324283, 'samples': 6068352, 'steps': 31605, 'loss/train': 1.4644901752471924} -08/30/2021 18:57:46 - INFO - __main__ - Step 31607: {'lr': 0.0004522355315970098, 'samples': 6068544, 'steps': 31606, 'loss/train': 0.9497048258781433} -08/30/2021 18:57:47 - INFO - __main__ - Step 31608: {'lr': 0.0004522324117786123, 'samples': 6068736, 'steps': 31607, 'loss/train': 1.3428709506988525} -08/30/2021 18:57:48 - INFO - __main__ - Step 31609: {'lr': 0.0004522292918690921, 'samples': 6068928, 'steps': 31608, 'loss/train': 1.5631051063537598} -08/30/2021 18:57:49 - INFO - __main__ - Step 31610: {'lr': 0.0004522261718684504, 'samples': 6069120, 'steps': 31609, 'loss/train': 1.394026279449463} -08/30/2021 18:57:49 - INFO - __main__ - Step 31611: {'lr': 0.00045222305177668875, 'samples': 6069312, 'steps': 31610, 'loss/train': 1.3956263065338135} -08/30/2021 18:57:49 - INFO - __main__ - Step 31612: {'lr': 0.00045221993159380857, 'samples': 6069504, 'steps': 31611, 'loss/train': 1.617452621459961} -08/30/2021 18:57:50 - INFO - __main__ - Step 31613: {'lr': 0.00045221681131981116, 'samples': 6069696, 'steps': 31612, 'loss/train': 1.3847172260284424} -08/30/2021 18:57:52 - INFO - __main__ - Step 31614: {'lr': 0.00045221369095469795, 'samples': 6069888, 'steps': 31613, 'loss/train': 1.5455043315887451} -08/30/2021 18:57:52 - INFO - __main__ - Step 31615: {'lr': 0.00045221057049847044, 'samples': 6070080, 'steps': 31614, 'loss/train': 0.05985480174422264} -08/30/2021 18:57:53 - INFO - __main__ - Step 31616: {'lr': 0.0004522074499511299, 'samples': 6070272, 'steps': 31615, 'loss/train': 1.373349666595459} -08/30/2021 18:57:53 - INFO - __main__ - Step 31617: {'lr': 0.0004522043293126778, 'samples': 6070464, 'steps': 31616, 'loss/train': 1.349117398262024} -08/30/2021 18:57:53 - INFO - __main__ - Step 31618: {'lr': 0.00045220120858311557, 'samples': 6070656, 'steps': 31617, 'loss/train': 1.4376928806304932} -08/30/2021 18:57:55 - INFO - __main__ - Step 31619: {'lr': 0.0004521980877624446, 'samples': 6070848, 'steps': 31618, 'loss/train': 2.031606912612915} -08/30/2021 18:57:56 - INFO - __main__ - Step 31620: {'lr': 0.0004521949668506663, 'samples': 6071040, 'steps': 31619, 'loss/train': 0.059158165007829666} -08/30/2021 18:57:56 - INFO - __main__ - Step 31621: {'lr': 0.00045219184584778207, 'samples': 6071232, 'steps': 31620, 'loss/train': 1.1033680438995361} -08/30/2021 18:57:57 - INFO - __main__ - Step 31622: {'lr': 0.0004521887247537933, 'samples': 6071424, 'steps': 31621, 'loss/train': 1.3772066831588745} -08/30/2021 18:57:57 - INFO - __main__ - Step 31623: {'lr': 0.00045218560356870144, 'samples': 6071616, 'steps': 31622, 'loss/train': 1.6896253824234009} -08/30/2021 18:57:57 - INFO - __main__ - Step 31624: {'lr': 0.0004521824822925078, 'samples': 6071808, 'steps': 31623, 'loss/train': 0.02434605173766613} -08/30/2021 18:57:59 - INFO - __main__ - Step 31625: {'lr': 0.00045217936092521396, 'samples': 6072000, 'steps': 31624, 'loss/train': 1.350623607635498} -08/30/2021 18:57:59 - INFO - __main__ - Step 31626: {'lr': 0.00045217623946682114, 'samples': 6072192, 'steps': 31625, 'loss/train': 1.9136111736297607} -08/30/2021 18:58:00 - INFO - __main__ - Step 31627: {'lr': 0.00045217311791733084, 'samples': 6072384, 'steps': 31626, 'loss/train': 1.8074136972427368} -08/30/2021 18:58:00 - INFO - __main__ - Step 31628: {'lr': 0.00045216999627674436, 'samples': 6072576, 'steps': 31627, 'loss/train': 1.3274154663085938} -08/30/2021 18:58:00 - INFO - __main__ - Step 31629: {'lr': 0.0004521668745450633, 'samples': 6072768, 'steps': 31628, 'loss/train': 1.2185918092727661} -08/30/2021 18:58:02 - INFO - __main__ - Step 31630: {'lr': 0.00045216375272228907, 'samples': 6072960, 'steps': 31629, 'loss/train': 1.561006784439087} -08/30/2021 18:58:03 - INFO - __main__ - Step 31631: {'lr': 0.00045216063080842287, 'samples': 6073152, 'steps': 31630, 'loss/train': 0.7294368743896484} -08/30/2021 18:58:03 - INFO - __main__ - Step 31632: {'lr': 0.00045215750880346617, 'samples': 6073344, 'steps': 31631, 'loss/train': 1.4684414863586426} -08/30/2021 18:58:03 - INFO - __main__ - Step 31633: {'lr': 0.00045215438670742045, 'samples': 6073536, 'steps': 31632, 'loss/train': 2.2386507987976074} -08/30/2021 18:58:04 - INFO - __main__ - Step 31634: {'lr': 0.00045215126452028705, 'samples': 6073728, 'steps': 31633, 'loss/train': 1.715134859085083} -08/30/2021 18:58:05 - INFO - __main__ - Step 31635: {'lr': 0.00045214814224206744, 'samples': 6073920, 'steps': 31634, 'loss/train': 1.5047531127929688} -08/30/2021 18:58:06 - INFO - __main__ - Step 31636: {'lr': 0.00045214501987276304, 'samples': 6074112, 'steps': 31635, 'loss/train': 1.7091227769851685} -08/30/2021 18:58:06 - INFO - __main__ - Step 31637: {'lr': 0.0004521418974123751, 'samples': 6074304, 'steps': 31636, 'loss/train': 1.8161869049072266} -08/30/2021 18:58:06 - INFO - __main__ - Step 31638: {'lr': 0.00045213877486090524, 'samples': 6074496, 'steps': 31637, 'loss/train': 1.9217665195465088} -08/30/2021 18:58:07 - INFO - __main__ - Step 31639: {'lr': 0.00045213565221835473, 'samples': 6074688, 'steps': 31638, 'loss/train': 1.0621533393859863} -08/30/2021 18:58:08 - INFO - __main__ - Step 31640: {'lr': 0.00045213252948472505, 'samples': 6074880, 'steps': 31639, 'loss/train': 1.606001853942871} -08/30/2021 18:58:09 - INFO - __main__ - Step 31641: {'lr': 0.0004521294066600175, 'samples': 6075072, 'steps': 31640, 'loss/train': 0.17081789672374725} -08/30/2021 18:58:09 - INFO - __main__ - Step 31642: {'lr': 0.0004521262837442336, 'samples': 6075264, 'steps': 31641, 'loss/train': 1.6975547075271606} -08/30/2021 18:58:09 - INFO - __main__ - Step 31643: {'lr': 0.0004521231607373747, 'samples': 6075456, 'steps': 31642, 'loss/train': 1.6854227781295776} -08/30/2021 18:58:10 - INFO - __main__ - Step 31644: {'lr': 0.00045212003763944226, 'samples': 6075648, 'steps': 31643, 'loss/train': 0.9941006302833557} -08/30/2021 18:58:11 - INFO - __main__ - Step 31645: {'lr': 0.00045211691445043765, 'samples': 6075840, 'steps': 31644, 'loss/train': 1.147262692451477} -08/30/2021 18:58:12 - INFO - __main__ - Step 31646: {'lr': 0.0004521137911703622, 'samples': 6076032, 'steps': 31645, 'loss/train': 1.5758424997329712} -08/30/2021 18:58:12 - INFO - __main__ - Step 31647: {'lr': 0.0004521106677992175, 'samples': 6076224, 'steps': 31646, 'loss/train': 1.4871608018875122} -08/30/2021 18:58:12 - INFO - __main__ - Step 31648: {'lr': 0.0004521075443370048, 'samples': 6076416, 'steps': 31647, 'loss/train': 1.315496563911438} -08/30/2021 18:58:13 - INFO - __main__ - Step 31649: {'lr': 0.0004521044207837256, 'samples': 6076608, 'steps': 31648, 'loss/train': 1.3405646085739136} -08/30/2021 18:58:13 - INFO - __main__ - Step 31650: {'lr': 0.0004521012971393812, 'samples': 6076800, 'steps': 31649, 'loss/train': 1.6827404499053955} -08/30/2021 18:58:14 - INFO - __main__ - Step 31651: {'lr': 0.0004520981734039731, 'samples': 6076992, 'steps': 31650, 'loss/train': 1.050052523612976} -08/30/2021 18:58:15 - INFO - __main__ - Step 31652: {'lr': 0.0004520950495775027, 'samples': 6077184, 'steps': 31651, 'loss/train': 0.9302839636802673} -08/30/2021 18:58:15 - INFO - __main__ - Step 31653: {'lr': 0.00045209192565997137, 'samples': 6077376, 'steps': 31652, 'loss/train': 1.246191382408142} -08/30/2021 18:58:16 - INFO - __main__ - Step 31654: {'lr': 0.00045208880165138054, 'samples': 6077568, 'steps': 31653, 'loss/train': 1.934869408607483} -08/30/2021 18:58:16 - INFO - __main__ - Step 31655: {'lr': 0.0004520856775517316, 'samples': 6077760, 'steps': 31654, 'loss/train': 1.8992890119552612} -08/30/2021 18:58:17 - INFO - __main__ - Step 31656: {'lr': 0.00045208255336102597, 'samples': 6077952, 'steps': 31655, 'loss/train': 1.8047153949737549} -08/30/2021 18:58:18 - INFO - __main__ - Step 31657: {'lr': 0.0004520794290792651, 'samples': 6078144, 'steps': 31656, 'loss/train': 2.0793232917785645} -08/30/2021 18:58:18 - INFO - __main__ - Step 31658: {'lr': 0.0004520763047064503, 'samples': 6078336, 'steps': 31657, 'loss/train': 1.329634189605713} -08/30/2021 18:58:19 - INFO - __main__ - Step 31659: {'lr': 0.0004520731802425831, 'samples': 6078528, 'steps': 31658, 'loss/train': 2.406625270843506} -08/30/2021 18:58:19 - INFO - __main__ - Step 31660: {'lr': 0.0004520700556876648, 'samples': 6078720, 'steps': 31659, 'loss/train': 1.5261276960372925} -08/30/2021 18:58:21 - INFO - __main__ - Step 31661: {'lr': 0.0004520669310416969, 'samples': 6078912, 'steps': 31660, 'loss/train': 1.557644248008728} -08/30/2021 18:58:21 - INFO - __main__ - Step 31662: {'lr': 0.0004520638063046807, 'samples': 6079104, 'steps': 31661, 'loss/train': 0.18460960686206818} -08/30/2021 18:58:22 - INFO - __main__ - Step 31663: {'lr': 0.0004520606814766177, 'samples': 6079296, 'steps': 31662, 'loss/train': 1.4834038019180298} -08/30/2021 18:58:22 - INFO - __main__ - Step 31664: {'lr': 0.00045205755655750924, 'samples': 6079488, 'steps': 31663, 'loss/train': 1.5257419347763062} -08/30/2021 18:58:22 - INFO - __main__ - Step 31665: {'lr': 0.0004520544315473568, 'samples': 6079680, 'steps': 31664, 'loss/train': 1.2246757745742798} -08/30/2021 18:58:24 - INFO - __main__ - Step 31666: {'lr': 0.00045205130644616177, 'samples': 6079872, 'steps': 31665, 'loss/train': 1.3707243204116821} -08/30/2021 18:58:24 - INFO - __main__ - Step 31667: {'lr': 0.0004520481812539255, 'samples': 6080064, 'steps': 31666, 'loss/train': 1.2511168718338013} -08/30/2021 18:58:25 - INFO - __main__ - Step 31668: {'lr': 0.00045204505597064943, 'samples': 6080256, 'steps': 31667, 'loss/train': 1.4564611911773682} -08/30/2021 18:58:25 - INFO - __main__ - Step 31669: {'lr': 0.00045204193059633505, 'samples': 6080448, 'steps': 31668, 'loss/train': 1.3521690368652344} -08/30/2021 18:58:25 - INFO - __main__ - Step 31670: {'lr': 0.0004520388051309836, 'samples': 6080640, 'steps': 31669, 'loss/train': 1.8957232236862183} -08/30/2021 18:58:27 - INFO - __main__ - Step 31671: {'lr': 0.00045203567957459657, 'samples': 6080832, 'steps': 31670, 'loss/train': 1.3604124784469604} -08/30/2021 18:58:28 - INFO - __main__ - Step 31672: {'lr': 0.00045203255392717545, 'samples': 6081024, 'steps': 31671, 'loss/train': 1.3457673788070679} -08/30/2021 18:58:28 - INFO - __main__ - Step 31673: {'lr': 0.00045202942818872157, 'samples': 6081216, 'steps': 31672, 'loss/train': 0.9692102074623108} -08/30/2021 18:58:29 - INFO - __main__ - Step 31674: {'lr': 0.0004520263023592363, 'samples': 6081408, 'steps': 31673, 'loss/train': 1.018338918685913} -08/30/2021 18:58:29 - INFO - __main__ - Step 31675: {'lr': 0.00045202317643872113, 'samples': 6081600, 'steps': 31674, 'loss/train': 1.7192820310592651} -08/30/2021 18:58:30 - INFO - __main__ - Step 31676: {'lr': 0.00045202005042717743, 'samples': 6081792, 'steps': 31675, 'loss/train': 1.3942060470581055} -08/30/2021 18:58:31 - INFO - __main__ - Step 31677: {'lr': 0.0004520169243246066, 'samples': 6081984, 'steps': 31676, 'loss/train': 0.8433346748352051} -08/30/2021 18:58:31 - INFO - __main__ - Step 31678: {'lr': 0.0004520137981310101, 'samples': 6082176, 'steps': 31677, 'loss/train': 1.0872691869735718} -08/30/2021 18:58:32 - INFO - __main__ - Step 31679: {'lr': 0.0004520106718463893, 'samples': 6082368, 'steps': 31678, 'loss/train': 1.5257447957992554} -08/30/2021 18:58:32 - INFO - __main__ - Step 31680: {'lr': 0.0004520075454707456, 'samples': 6082560, 'steps': 31679, 'loss/train': 1.4212603569030762} -08/30/2021 18:58:32 - INFO - __main__ - Step 31681: {'lr': 0.0004520044190040804, 'samples': 6082752, 'steps': 31680, 'loss/train': 0.8837733864784241} -08/30/2021 18:58:34 - INFO - __main__ - Step 31682: {'lr': 0.0004520012924463951, 'samples': 6082944, 'steps': 31681, 'loss/train': 1.139052152633667} -08/30/2021 18:58:34 - INFO - __main__ - Step 31683: {'lr': 0.0004519981657976912, 'samples': 6083136, 'steps': 31682, 'loss/train': 1.3233985900878906} -08/30/2021 18:58:35 - INFO - __main__ - Step 31684: {'lr': 0.00045199503905797, 'samples': 6083328, 'steps': 31683, 'loss/train': 1.5957056283950806} -08/30/2021 18:58:35 - INFO - __main__ - Step 31685: {'lr': 0.0004519919122272329, 'samples': 6083520, 'steps': 31684, 'loss/train': 1.5648043155670166} -08/30/2021 18:58:35 - INFO - __main__ - Step 31686: {'lr': 0.00045198878530548146, 'samples': 6083712, 'steps': 31685, 'loss/train': 1.677486538887024} -08/30/2021 18:58:37 - INFO - __main__ - Step 31687: {'lr': 0.0004519856582927169, 'samples': 6083904, 'steps': 31686, 'loss/train': 1.679205060005188} -08/30/2021 18:58:38 - INFO - __main__ - Step 31688: {'lr': 0.00045198253118894084, 'samples': 6084096, 'steps': 31687, 'loss/train': 1.8955087661743164} -08/30/2021 18:58:38 - INFO - __main__ - Step 31689: {'lr': 0.0004519794039941545, 'samples': 6084288, 'steps': 31688, 'loss/train': 1.417022943496704} -08/30/2021 18:58:39 - INFO - __main__ - Step 31690: {'lr': 0.0004519762767083593, 'samples': 6084480, 'steps': 31689, 'loss/train': 1.5744907855987549} -08/30/2021 18:58:39 - INFO - __main__ - Step 31691: {'lr': 0.00045197314933155677, 'samples': 6084672, 'steps': 31690, 'loss/train': 1.6208579540252686} -08/30/2021 18:58:40 - INFO - __main__ - Step 31692: {'lr': 0.0004519700218637482, 'samples': 6084864, 'steps': 31691, 'loss/train': 1.584664225578308} -08/30/2021 18:58:41 - INFO - __main__ - Step 31693: {'lr': 0.00045196689430493516, 'samples': 6085056, 'steps': 31692, 'loss/train': 1.574609637260437} -08/30/2021 18:58:41 - INFO - __main__ - Step 31694: {'lr': 0.00045196376665511883, 'samples': 6085248, 'steps': 31693, 'loss/train': 1.546935796737671} -08/30/2021 18:58:42 - INFO - __main__ - Step 31695: {'lr': 0.00045196063891430086, 'samples': 6085440, 'steps': 31694, 'loss/train': 1.5212210416793823} -08/30/2021 18:58:42 - INFO - __main__ - Step 31696: {'lr': 0.0004519575110824825, 'samples': 6085632, 'steps': 31695, 'loss/train': 1.4790048599243164} -08/30/2021 18:58:43 - INFO - __main__ - Step 31697: {'lr': 0.0004519543831596652, 'samples': 6085824, 'steps': 31696, 'loss/train': 1.2932026386260986} -08/30/2021 18:58:44 - INFO - __main__ - Step 31698: {'lr': 0.0004519512551458503, 'samples': 6086016, 'steps': 31697, 'loss/train': 1.4547592401504517} -08/30/2021 18:58:45 - INFO - __main__ - Step 31699: {'lr': 0.0004519481270410394, 'samples': 6086208, 'steps': 31698, 'loss/train': 0.1433655023574829} -08/30/2021 18:58:45 - INFO - __main__ - Step 31700: {'lr': 0.00045194499884523376, 'samples': 6086400, 'steps': 31699, 'loss/train': 0.35211166739463806} -08/30/2021 18:58:46 - INFO - __main__ - Step 31701: {'lr': 0.0004519418705584348, 'samples': 6086592, 'steps': 31700, 'loss/train': 1.0860755443572998} -08/30/2021 18:58:46 - INFO - __main__ - Step 31702: {'lr': 0.0004519387421806439, 'samples': 6086784, 'steps': 31701, 'loss/train': 1.586506724357605} -08/30/2021 18:58:46 - INFO - __main__ - Step 31703: {'lr': 0.0004519356137118625, 'samples': 6086976, 'steps': 31702, 'loss/train': 1.771864414215088} -08/30/2021 18:58:48 - INFO - __main__ - Step 31704: {'lr': 0.00045193248515209216, 'samples': 6087168, 'steps': 31703, 'loss/train': 1.4260754585266113} -08/30/2021 18:58:48 - INFO - __main__ - Step 31705: {'lr': 0.0004519293565013341, 'samples': 6087360, 'steps': 31704, 'loss/train': 1.7522869110107422} -08/30/2021 18:58:49 - INFO - __main__ - Step 31706: {'lr': 0.0004519262277595898, 'samples': 6087552, 'steps': 31705, 'loss/train': 1.347668170928955} -08/30/2021 18:58:49 - INFO - __main__ - Step 31707: {'lr': 0.0004519230989268606, 'samples': 6087744, 'steps': 31706, 'loss/train': 1.5464115142822266} -08/30/2021 18:58:49 - INFO - __main__ - Step 31708: {'lr': 0.000451919970003148, 'samples': 6087936, 'steps': 31707, 'loss/train': 1.296976089477539} -08/30/2021 18:58:51 - INFO - __main__ - Step 31709: {'lr': 0.0004519168409884534, 'samples': 6088128, 'steps': 31708, 'loss/train': 1.6748765707015991} -08/30/2021 18:58:51 - INFO - __main__ - Step 31710: {'lr': 0.00045191371188277817, 'samples': 6088320, 'steps': 31709, 'loss/train': 1.7006301879882812} -08/30/2021 18:58:52 - INFO - __main__ - Step 31711: {'lr': 0.0004519105826861237, 'samples': 6088512, 'steps': 31710, 'loss/train': 1.3849173784255981} -08/30/2021 18:58:52 - INFO - __main__ - Step 31712: {'lr': 0.0004519074533984915, 'samples': 6088704, 'steps': 31711, 'loss/train': 1.2888586521148682} -08/30/2021 18:58:52 - INFO - __main__ - Step 31713: {'lr': 0.0004519043240198829, 'samples': 6088896, 'steps': 31712, 'loss/train': 1.2900900840759277} -08/30/2021 18:58:54 - INFO - __main__ - Step 31714: {'lr': 0.0004519011945502993, 'samples': 6089088, 'steps': 31713, 'loss/train': 1.9359652996063232} -08/30/2021 18:58:55 - INFO - __main__ - Step 31715: {'lr': 0.00045189806498974216, 'samples': 6089280, 'steps': 31714, 'loss/train': 0.8847703337669373} -08/30/2021 18:58:55 - INFO - __main__ - Step 31716: {'lr': 0.00045189493533821285, 'samples': 6089472, 'steps': 31715, 'loss/train': 1.570649266242981} -08/30/2021 18:58:55 - INFO - __main__ - Step 31717: {'lr': 0.0004518918055957128, 'samples': 6089664, 'steps': 31716, 'loss/train': 1.5662107467651367} -08/30/2021 18:58:56 - INFO - __main__ - Step 31718: {'lr': 0.0004518886757622435, 'samples': 6089856, 'steps': 31717, 'loss/train': 1.7837783098220825} -08/30/2021 18:58:56 - INFO - __main__ - Step 31719: {'lr': 0.0004518855458378062, 'samples': 6090048, 'steps': 31718, 'loss/train': 1.583587408065796} -08/30/2021 18:58:58 - INFO - __main__ - Step 31720: {'lr': 0.0004518824158224023, 'samples': 6090240, 'steps': 31719, 'loss/train': 2.0281319618225098} -08/30/2021 18:58:58 - INFO - __main__ - Step 31721: {'lr': 0.00045187928571603343, 'samples': 6090432, 'steps': 31720, 'loss/train': 1.341612458229065} -08/30/2021 18:58:58 - INFO - __main__ - Step 31722: {'lr': 0.0004518761555187008, 'samples': 6090624, 'steps': 31721, 'loss/train': 1.3035047054290771} -08/30/2021 18:58:59 - INFO - __main__ - Step 31723: {'lr': 0.00045187302523040597, 'samples': 6090816, 'steps': 31722, 'loss/train': 1.4077343940734863} -08/30/2021 18:58:59 - INFO - __main__ - Step 31724: {'lr': 0.00045186989485115014, 'samples': 6091008, 'steps': 31723, 'loss/train': 1.2675732374191284} -08/30/2021 18:59:01 - INFO - __main__ - Step 31725: {'lr': 0.000451866764380935, 'samples': 6091200, 'steps': 31724, 'loss/train': 1.6097421646118164} -08/30/2021 18:59:02 - INFO - __main__ - Step 31726: {'lr': 0.0004518636338197617, 'samples': 6091392, 'steps': 31725, 'loss/train': 1.6313509941101074} -08/30/2021 18:59:02 - INFO - __main__ - Step 31727: {'lr': 0.00045186050316763186, 'samples': 6091584, 'steps': 31726, 'loss/train': 1.7014423608779907} -08/30/2021 18:59:02 - INFO - __main__ - Step 31728: {'lr': 0.0004518573724245467, 'samples': 6091776, 'steps': 31727, 'loss/train': 1.5814265012741089} -08/30/2021 18:59:03 - INFO - __main__ - Step 31729: {'lr': 0.00045185424159050776, 'samples': 6091968, 'steps': 31728, 'loss/train': 1.6253712177276611} -08/30/2021 18:59:04 - INFO - __main__ - Step 31730: {'lr': 0.00045185111066551643, 'samples': 6092160, 'steps': 31729, 'loss/train': 1.3151179552078247} -08/30/2021 18:59:05 - INFO - __main__ - Step 31731: {'lr': 0.0004518479796495741, 'samples': 6092352, 'steps': 31730, 'loss/train': 0.9944483041763306} -08/30/2021 18:59:05 - INFO - __main__ - Step 31732: {'lr': 0.00045184484854268216, 'samples': 6092544, 'steps': 31731, 'loss/train': 1.4920777082443237} -08/30/2021 18:59:05 - INFO - __main__ - Step 31733: {'lr': 0.00045184171734484203, 'samples': 6092736, 'steps': 31732, 'loss/train': 1.7822221517562866} -08/30/2021 18:59:06 - INFO - __main__ - Step 31734: {'lr': 0.00045183858605605517, 'samples': 6092928, 'steps': 31733, 'loss/train': 1.2142447233200073} -08/30/2021 18:59:07 - INFO - __main__ - Step 31735: {'lr': 0.00045183545467632295, 'samples': 6093120, 'steps': 31734, 'loss/train': 1.3074018955230713} -08/30/2021 18:59:08 - INFO - __main__ - Step 31736: {'lr': 0.0004518323232056468, 'samples': 6093312, 'steps': 31735, 'loss/train': 0.9198724031448364} -08/30/2021 18:59:08 - INFO - __main__ - Step 31737: {'lr': 0.0004518291916440281, 'samples': 6093504, 'steps': 31736, 'loss/train': 1.4412691593170166} -08/30/2021 18:59:08 - INFO - __main__ - Step 31738: {'lr': 0.0004518260599914683, 'samples': 6093696, 'steps': 31737, 'loss/train': 1.4064964056015015} -08/30/2021 18:59:09 - INFO - __main__ - Step 31739: {'lr': 0.0004518229282479688, 'samples': 6093888, 'steps': 31738, 'loss/train': 1.5702183246612549} -08/30/2021 18:59:11 - INFO - __main__ - Step 31740: {'lr': 0.000451819796413531, 'samples': 6094080, 'steps': 31739, 'loss/train': 1.7810715436935425} -08/30/2021 18:59:11 - INFO - __main__ - Step 31741: {'lr': 0.0004518166644881563, 'samples': 6094272, 'steps': 31740, 'loss/train': 1.648104190826416} -08/30/2021 18:59:12 - INFO - __main__ - Step 31742: {'lr': 0.0004518135324718461, 'samples': 6094464, 'steps': 31741, 'loss/train': 1.4135750532150269} -08/30/2021 18:59:12 - INFO - __main__ - Step 31743: {'lr': 0.00045181040036460185, 'samples': 6094656, 'steps': 31742, 'loss/train': 1.8138679265975952} -08/30/2021 18:59:13 - INFO - __main__ - Step 31744: {'lr': 0.0004518072681664249, 'samples': 6094848, 'steps': 31743, 'loss/train': 1.2215015888214111} -08/30/2021 18:59:13 - INFO - __main__ - Step 31745: {'lr': 0.0004518041358773168, 'samples': 6095040, 'steps': 31744, 'loss/train': 1.128543496131897} -08/30/2021 18:59:14 - INFO - __main__ - Step 31746: {'lr': 0.0004518010034972788, 'samples': 6095232, 'steps': 31745, 'loss/train': 1.211618423461914} -08/30/2021 18:59:15 - INFO - __main__ - Step 31747: {'lr': 0.0004517978710263124, 'samples': 6095424, 'steps': 31746, 'loss/train': 1.0471305847167969} -08/30/2021 18:59:15 - INFO - __main__ - Step 31748: {'lr': 0.0004517947384644191, 'samples': 6095616, 'steps': 31747, 'loss/train': 1.3916995525360107} -08/30/2021 18:59:16 - INFO - __main__ - Step 31749: {'lr': 0.00045179160581160005, 'samples': 6095808, 'steps': 31748, 'loss/train': 1.2283918857574463} -08/30/2021 18:59:16 - INFO - __main__ - Step 31750: {'lr': 0.0004517884730678569, 'samples': 6096000, 'steps': 31749, 'loss/train': 1.175004005432129} -08/30/2021 18:59:16 - INFO - __main__ - Step 31751: {'lr': 0.00045178534023319097, 'samples': 6096192, 'steps': 31750, 'loss/train': 1.2510666847229004} -08/30/2021 18:59:18 - INFO - __main__ - Step 31752: {'lr': 0.00045178220730760367, 'samples': 6096384, 'steps': 31751, 'loss/train': 2.866900682449341} -08/30/2021 18:59:18 - INFO - __main__ - Step 31753: {'lr': 0.0004517790742910964, 'samples': 6096576, 'steps': 31752, 'loss/train': 1.5635515451431274} -08/30/2021 18:59:19 - INFO - __main__ - Step 31754: {'lr': 0.0004517759411836706, 'samples': 6096768, 'steps': 31753, 'loss/train': 1.7726420164108276} -08/30/2021 18:59:19 - INFO - __main__ - Step 31755: {'lr': 0.0004517728079853277, 'samples': 6096960, 'steps': 31754, 'loss/train': 1.9591432809829712} -08/30/2021 18:59:19 - INFO - __main__ - Step 31756: {'lr': 0.0004517696746960691, 'samples': 6097152, 'steps': 31755, 'loss/train': 1.5650672912597656} -08/30/2021 18:59:21 - INFO - __main__ - Step 31757: {'lr': 0.00045176654131589617, 'samples': 6097344, 'steps': 31756, 'loss/train': 0.24385832250118256} -08/30/2021 18:59:21 - INFO - __main__ - Step 31758: {'lr': 0.0004517634078448103, 'samples': 6097536, 'steps': 31757, 'loss/train': 1.4693056344985962} -08/30/2021 18:59:22 - INFO - __main__ - Step 31759: {'lr': 0.0004517602742828131, 'samples': 6097728, 'steps': 31758, 'loss/train': 1.4630427360534668} -08/30/2021 18:59:22 - INFO - __main__ - Step 31760: {'lr': 0.0004517571406299057, 'samples': 6097920, 'steps': 31759, 'loss/train': 2.1614649295806885} -08/30/2021 18:59:23 - INFO - __main__ - Step 31761: {'lr': 0.0004517540068860897, 'samples': 6098112, 'steps': 31760, 'loss/train': 1.2102993726730347} -08/30/2021 18:59:24 - INFO - __main__ - Step 31762: {'lr': 0.0004517508730513664, 'samples': 6098304, 'steps': 31761, 'loss/train': 1.5794097185134888} -08/30/2021 18:59:24 - INFO - __main__ - Step 31763: {'lr': 0.00045174773912573735, 'samples': 6098496, 'steps': 31762, 'loss/train': 1.3294028043746948} -08/30/2021 18:59:25 - INFO - __main__ - Step 31764: {'lr': 0.00045174460510920386, 'samples': 6098688, 'steps': 31763, 'loss/train': 1.0927268266677856} -08/30/2021 18:59:25 - INFO - __main__ - Step 31765: {'lr': 0.00045174147100176734, 'samples': 6098880, 'steps': 31764, 'loss/train': 1.4281386137008667} -08/30/2021 18:59:26 - INFO - __main__ - Step 31766: {'lr': 0.00045173833680342925, 'samples': 6099072, 'steps': 31765, 'loss/train': 1.6285591125488281} -08/30/2021 18:59:26 - INFO - __main__ - Step 31767: {'lr': 0.00045173520251419095, 'samples': 6099264, 'steps': 31766, 'loss/train': 2.077353000640869} -08/30/2021 18:59:27 - INFO - __main__ - Step 31768: {'lr': 0.0004517320681340539, 'samples': 6099456, 'steps': 31767, 'loss/train': 1.163082242012024} -08/30/2021 18:59:28 - INFO - __main__ - Step 31769: {'lr': 0.0004517289336630195, 'samples': 6099648, 'steps': 31768, 'loss/train': 1.5306695699691772} -08/30/2021 18:59:28 - INFO - __main__ - Step 31770: {'lr': 0.0004517257991010891, 'samples': 6099840, 'steps': 31769, 'loss/train': 1.7428069114685059} -08/30/2021 18:59:28 - INFO - __main__ - Step 31771: {'lr': 0.0004517226644482642, 'samples': 6100032, 'steps': 31770, 'loss/train': 1.2836638689041138} -08/30/2021 18:59:29 - INFO - __main__ - Step 31772: {'lr': 0.00045171952970454623, 'samples': 6100224, 'steps': 31771, 'loss/train': 1.0561379194259644} -08/30/2021 18:59:30 - INFO - __main__ - Step 31773: {'lr': 0.0004517163948699365, 'samples': 6100416, 'steps': 31772, 'loss/train': 1.876664638519287} -08/30/2021 18:59:31 - INFO - __main__ - Step 31774: {'lr': 0.00045171325994443644, 'samples': 6100608, 'steps': 31773, 'loss/train': 1.8266552686691284} -08/30/2021 18:59:31 - INFO - __main__ - Step 31775: {'lr': 0.00045171012492804753, 'samples': 6100800, 'steps': 31774, 'loss/train': 1.3269596099853516} -08/30/2021 18:59:32 - INFO - __main__ - Step 31776: {'lr': 0.0004517069898207712, 'samples': 6100992, 'steps': 31775, 'loss/train': 1.5919526815414429} -08/30/2021 18:59:32 - INFO - __main__ - Step 31777: {'lr': 0.00045170385462260876, 'samples': 6101184, 'steps': 31776, 'loss/train': 0.6725611090660095} -08/30/2021 18:59:35 - INFO - __main__ - Step 31778: {'lr': 0.0004517007193335617, 'samples': 6101376, 'steps': 31777, 'loss/train': 1.7358683347702026} -08/30/2021 18:59:35 - INFO - __main__ - Step 31779: {'lr': 0.0004516975839536314, 'samples': 6101568, 'steps': 31778, 'loss/train': 0.10978332161903381} -08/30/2021 18:59:36 - INFO - __main__ - Step 31780: {'lr': 0.0004516944484828193, 'samples': 6101760, 'steps': 31779, 'loss/train': 0.9555991888046265} -08/30/2021 18:59:36 - INFO - __main__ - Step 31781: {'lr': 0.0004516913129211268, 'samples': 6101952, 'steps': 31780, 'loss/train': 1.1444238424301147} -08/30/2021 18:59:36 - INFO - __main__ - Step 31782: {'lr': 0.00045168817726855525, 'samples': 6102144, 'steps': 31781, 'loss/train': 4.335629940032959} -08/30/2021 18:59:37 - INFO - __main__ - Step 31783: {'lr': 0.0004516850415251061, 'samples': 6102336, 'steps': 31782, 'loss/train': 4.193833351135254} -08/30/2021 18:59:38 - INFO - __main__ - Step 31784: {'lr': 0.0004516819056907809, 'samples': 6102528, 'steps': 31783, 'loss/train': 1.4793989658355713} -08/30/2021 18:59:39 - INFO - __main__ - Step 31785: {'lr': 0.0004516787697655809, 'samples': 6102720, 'steps': 31784, 'loss/train': 1.823095440864563} -08/30/2021 18:59:39 - INFO - __main__ - Step 31786: {'lr': 0.0004516756337495075, 'samples': 6102912, 'steps': 31785, 'loss/train': 1.108152985572815} -08/30/2021 18:59:39 - INFO - __main__ - Step 31787: {'lr': 0.0004516724976425622, 'samples': 6103104, 'steps': 31786, 'loss/train': 1.6836150884628296} -08/30/2021 18:59:40 - INFO - __main__ - Step 31788: {'lr': 0.0004516693614447464, 'samples': 6103296, 'steps': 31787, 'loss/train': 1.3794578313827515} -08/30/2021 18:59:41 - INFO - __main__ - Step 31789: {'lr': 0.0004516662251560615, 'samples': 6103488, 'steps': 31788, 'loss/train': 1.2366358041763306} -08/30/2021 18:59:42 - INFO - __main__ - Step 31790: {'lr': 0.0004516630887765089, 'samples': 6103680, 'steps': 31789, 'loss/train': 1.6831117868423462} -08/30/2021 18:59:42 - INFO - __main__ - Step 31791: {'lr': 0.00045165995230609003, 'samples': 6103872, 'steps': 31790, 'loss/train': 1.8927607536315918} -08/30/2021 18:59:42 - INFO - __main__ - Step 31792: {'lr': 0.0004516568157448063, 'samples': 6104064, 'steps': 31791, 'loss/train': 1.3940768241882324} -08/30/2021 18:59:43 - INFO - __main__ - Step 31793: {'lr': 0.00045165367909265916, 'samples': 6104256, 'steps': 31792, 'loss/train': 1.6035305261611938} -08/30/2021 18:59:44 - INFO - __main__ - Step 31794: {'lr': 0.00045165054234964984, 'samples': 6104448, 'steps': 31793, 'loss/train': 1.8415007591247559} -08/30/2021 18:59:45 - INFO - __main__ - Step 31795: {'lr': 0.0004516474055157801, 'samples': 6104640, 'steps': 31794, 'loss/train': 1.4146981239318848} -08/30/2021 18:59:45 - INFO - __main__ - Step 31796: {'lr': 0.000451644268591051, 'samples': 6104832, 'steps': 31795, 'loss/train': 1.3608078956604004} -08/30/2021 18:59:45 - INFO - __main__ - Step 31797: {'lr': 0.00045164113157546414, 'samples': 6105024, 'steps': 31796, 'loss/train': 1.3972551822662354} -08/30/2021 18:59:46 - INFO - __main__ - Step 31798: {'lr': 0.0004516379944690209, 'samples': 6105216, 'steps': 31797, 'loss/train': 0.08837572485208511} -08/30/2021 18:59:47 - INFO - __main__ - Step 31799: {'lr': 0.0004516348572717227, 'samples': 6105408, 'steps': 31798, 'loss/train': 1.6503653526306152} -08/30/2021 18:59:48 - INFO - __main__ - Step 31800: {'lr': 0.000451631719983571, 'samples': 6105600, 'steps': 31799, 'loss/train': 1.1910794973373413} -08/30/2021 18:59:48 - INFO - __main__ - Step 31801: {'lr': 0.00045162858260456705, 'samples': 6105792, 'steps': 31800, 'loss/train': 1.2666096687316895} -08/30/2021 18:59:48 - INFO - __main__ - Step 31802: {'lr': 0.0004516254451347125, 'samples': 6105984, 'steps': 31801, 'loss/train': 1.1145057678222656} -08/30/2021 18:59:49 - INFO - __main__ - Step 31803: {'lr': 0.0004516223075740085, 'samples': 6106176, 'steps': 31802, 'loss/train': 1.3834974765777588} -08/30/2021 18:59:49 - INFO - __main__ - Step 31804: {'lr': 0.00045161916992245664, 'samples': 6106368, 'steps': 31803, 'loss/train': 1.6630232334136963} -08/30/2021 18:59:51 - INFO - __main__ - Step 31805: {'lr': 0.0004516160321800584, 'samples': 6106560, 'steps': 31804, 'loss/train': 1.3498830795288086} -08/30/2021 18:59:51 - INFO - __main__ - Step 31806: {'lr': 0.000451612894346815, 'samples': 6106752, 'steps': 31805, 'loss/train': 1.8217791318893433} -08/30/2021 18:59:51 - INFO - __main__ - Step 31807: {'lr': 0.00045160975642272795, 'samples': 6106944, 'steps': 31806, 'loss/train': 0.37964287400245667} -08/30/2021 18:59:52 - INFO - __main__ - Step 31808: {'lr': 0.0004516066184077986, 'samples': 6107136, 'steps': 31807, 'loss/train': 2.2806687355041504} -08/30/2021 18:59:52 - INFO - __main__ - Step 31809: {'lr': 0.0004516034803020285, 'samples': 6107328, 'steps': 31808, 'loss/train': 2.123850107192993} -08/30/2021 18:59:54 - INFO - __main__ - Step 31810: {'lr': 0.0004516003421054189, 'samples': 6107520, 'steps': 31809, 'loss/train': 1.3058465719223022} -08/30/2021 18:59:54 - INFO - __main__ - Step 31811: {'lr': 0.0004515972038179714, 'samples': 6107712, 'steps': 31810, 'loss/train': 1.8727264404296875} -08/30/2021 18:59:54 - INFO - __main__ - Step 31812: {'lr': 0.0004515940654396872, 'samples': 6107904, 'steps': 31811, 'loss/train': 1.3117345571517944} -08/30/2021 18:59:55 - INFO - __main__ - Step 31813: {'lr': 0.00045159092697056794, 'samples': 6108096, 'steps': 31812, 'loss/train': 1.0136164426803589} -08/30/2021 18:59:55 - INFO - __main__ - Step 31814: {'lr': 0.00045158778841061483, 'samples': 6108288, 'steps': 31813, 'loss/train': 1.5322074890136719} -08/30/2021 18:59:57 - INFO - __main__ - Step 31815: {'lr': 0.0004515846497598294, 'samples': 6108480, 'steps': 31814, 'loss/train': 1.6552120447158813} -08/30/2021 18:59:58 - INFO - __main__ - Step 31816: {'lr': 0.000451581511018213, 'samples': 6108672, 'steps': 31815, 'loss/train': 1.793156385421753} -08/30/2021 18:59:58 - INFO - __main__ - Step 31817: {'lr': 0.00045157837218576713, 'samples': 6108864, 'steps': 31816, 'loss/train': 0.9958736300468445} -08/30/2021 18:59:58 - INFO - __main__ - Step 31818: {'lr': 0.00045157523326249316, 'samples': 6109056, 'steps': 31817, 'loss/train': 1.0163085460662842} -08/30/2021 18:59:59 - INFO - __main__ - Step 31819: {'lr': 0.00045157209424839253, 'samples': 6109248, 'steps': 31818, 'loss/train': 1.5546318292617798} -08/30/2021 19:00:00 - INFO - __main__ - Step 31820: {'lr': 0.0004515689551434665, 'samples': 6109440, 'steps': 31819, 'loss/train': 1.1910486221313477} -08/30/2021 19:00:01 - INFO - __main__ - Step 31821: {'lr': 0.00045156581594771675, 'samples': 6109632, 'steps': 31820, 'loss/train': 2.004864454269409} -08/30/2021 19:00:01 - INFO - __main__ - Step 31822: {'lr': 0.00045156267666114446, 'samples': 6109824, 'steps': 31821, 'loss/train': 1.709044337272644} -08/30/2021 19:00:01 - INFO - __main__ - Step 31823: {'lr': 0.0004515595372837512, 'samples': 6110016, 'steps': 31822, 'loss/train': 0.6816454529762268} -08/30/2021 19:00:02 - INFO - __main__ - Step 31824: {'lr': 0.00045155639781553825, 'samples': 6110208, 'steps': 31823, 'loss/train': 1.6261194944381714} -08/30/2021 19:00:03 - INFO - __main__ - Step 31825: {'lr': 0.00045155325825650715, 'samples': 6110400, 'steps': 31824, 'loss/train': 0.8188231587409973} -08/30/2021 19:00:03 - INFO - __main__ - Step 31826: {'lr': 0.00045155011860665927, 'samples': 6110592, 'steps': 31825, 'loss/train': 1.6089593172073364} -08/30/2021 19:00:04 - INFO - __main__ - Step 31827: {'lr': 0.00045154697886599606, 'samples': 6110784, 'steps': 31826, 'loss/train': 1.368036150932312} -08/30/2021 19:00:04 - INFO - __main__ - Step 31828: {'lr': 0.0004515438390345188, 'samples': 6110976, 'steps': 31827, 'loss/train': 1.291267991065979} -08/30/2021 19:00:05 - INFO - __main__ - Step 31829: {'lr': 0.00045154069911222905, 'samples': 6111168, 'steps': 31828, 'loss/train': 1.6703388690948486} -08/30/2021 19:00:06 - INFO - __main__ - Step 31830: {'lr': 0.0004515375590991281, 'samples': 6111360, 'steps': 31829, 'loss/train': 1.500475287437439} -08/30/2021 19:00:06 - INFO - __main__ - Step 31831: {'lr': 0.0004515344189952175, 'samples': 6111552, 'steps': 31830, 'loss/train': 1.0839345455169678} -08/30/2021 19:00:07 - INFO - __main__ - Step 31832: {'lr': 0.0004515312788004986, 'samples': 6111744, 'steps': 31831, 'loss/train': 1.6793702840805054} -08/30/2021 19:00:07 - INFO - __main__ - Step 31833: {'lr': 0.00045152813851497274, 'samples': 6111936, 'steps': 31832, 'loss/train': 1.1811480522155762} -08/30/2021 19:00:07 - INFO - __main__ - Step 31834: {'lr': 0.0004515249981386416, 'samples': 6112128, 'steps': 31833, 'loss/train': 1.714882254600525} -08/30/2021 19:00:08 - INFO - __main__ - Step 31835: {'lr': 0.0004515218576715062, 'samples': 6112320, 'steps': 31834, 'loss/train': 1.9581176042556763} -08/30/2021 19:00:10 - INFO - __main__ - Step 31836: {'lr': 0.00045151871711356827, 'samples': 6112512, 'steps': 31835, 'loss/train': 0.9482317566871643} -08/30/2021 19:00:10 - INFO - __main__ - Step 31837: {'lr': 0.0004515155764648291, 'samples': 6112704, 'steps': 31836, 'loss/train': 0.9607094526290894} -08/30/2021 19:00:11 - INFO - __main__ - Step 31838: {'lr': 0.0004515124357252901, 'samples': 6112896, 'steps': 31837, 'loss/train': 1.5487853288650513} -08/30/2021 19:00:11 - INFO - __main__ - Step 31839: {'lr': 0.0004515092948949527, 'samples': 6113088, 'steps': 31838, 'loss/train': 1.579304575920105} -08/30/2021 19:00:11 - INFO - __main__ - Step 31840: {'lr': 0.00045150615397381835, 'samples': 6113280, 'steps': 31839, 'loss/train': 1.076081395149231} -08/30/2021 19:00:13 - INFO - __main__ - Step 31841: {'lr': 0.0004515030129618884, 'samples': 6113472, 'steps': 31840, 'loss/train': 1.2970243692398071} -08/30/2021 19:00:13 - INFO - __main__ - Step 31842: {'lr': 0.0004514998718591643, 'samples': 6113664, 'steps': 31841, 'loss/train': 1.2793632745742798} -08/30/2021 19:00:14 - INFO - __main__ - Step 31843: {'lr': 0.0004514967306656475, 'samples': 6113856, 'steps': 31842, 'loss/train': 1.1665675640106201} -08/30/2021 19:00:14 - INFO - __main__ - Step 31844: {'lr': 0.0004514935893813394, 'samples': 6114048, 'steps': 31843, 'loss/train': 1.4917482137680054} -08/30/2021 19:00:14 - INFO - __main__ - Step 31845: {'lr': 0.00045149044800624135, 'samples': 6114240, 'steps': 31844, 'loss/train': 1.6520767211914062} -08/30/2021 19:00:16 - INFO - __main__ - Step 31846: {'lr': 0.0004514873065403549, 'samples': 6114432, 'steps': 31845, 'loss/train': 1.6882444620132446} -08/30/2021 19:00:16 - INFO - __main__ - Step 31847: {'lr': 0.0004514841649836813, 'samples': 6114624, 'steps': 31846, 'loss/train': 1.551079273223877} -08/30/2021 19:00:17 - INFO - __main__ - Step 31848: {'lr': 0.000451481023336222, 'samples': 6114816, 'steps': 31847, 'loss/train': 1.6473387479782104} -08/30/2021 19:00:17 - INFO - __main__ - Step 31849: {'lr': 0.0004514778815979785, 'samples': 6115008, 'steps': 31848, 'loss/train': 2.3100783824920654} -08/30/2021 19:00:17 - INFO - __main__ - Step 31850: {'lr': 0.0004514747397689522, 'samples': 6115200, 'steps': 31849, 'loss/train': 1.0601561069488525} -08/30/2021 19:00:19 - INFO - __main__ - Step 31851: {'lr': 0.0004514715978491445, 'samples': 6115392, 'steps': 31850, 'loss/train': 1.2394394874572754} -08/30/2021 19:00:20 - INFO - __main__ - Step 31852: {'lr': 0.0004514684558385568, 'samples': 6115584, 'steps': 31851, 'loss/train': 1.2615773677825928} -08/30/2021 19:00:20 - INFO - __main__ - Step 31853: {'lr': 0.0004514653137371905, 'samples': 6115776, 'steps': 31852, 'loss/train': 1.584965705871582} -08/30/2021 19:00:20 - INFO - __main__ - Step 31854: {'lr': 0.000451462171545047, 'samples': 6115968, 'steps': 31853, 'loss/train': 2.1311557292938232} -08/30/2021 19:00:21 - INFO - __main__ - Step 31855: {'lr': 0.00045145902926212785, 'samples': 6116160, 'steps': 31854, 'loss/train': 1.3710522651672363} -08/30/2021 19:00:22 - INFO - __main__ - Step 31856: {'lr': 0.0004514558868884343, 'samples': 6116352, 'steps': 31855, 'loss/train': 0.2669915556907654} -08/30/2021 19:00:23 - INFO - __main__ - Step 31857: {'lr': 0.00045145274442396786, 'samples': 6116544, 'steps': 31856, 'loss/train': 1.2853583097457886} -08/30/2021 19:00:23 - INFO - __main__ - Step 31858: {'lr': 0.00045144960186872996, 'samples': 6116736, 'steps': 31857, 'loss/train': 1.2335361242294312} -08/30/2021 19:00:24 - INFO - __main__ - Step 31859: {'lr': 0.0004514464592227219, 'samples': 6116928, 'steps': 31858, 'loss/train': 0.09652159363031387} -08/30/2021 19:00:24 - INFO - __main__ - Step 31860: {'lr': 0.0004514433164859453, 'samples': 6117120, 'steps': 31859, 'loss/train': 1.68108332157135} -08/30/2021 19:00:25 - INFO - __main__ - Step 31861: {'lr': 0.0004514401736584013, 'samples': 6117312, 'steps': 31860, 'loss/train': 1.659725546836853} -08/30/2021 19:00:26 - INFO - __main__ - Step 31862: {'lr': 0.0004514370307400916, 'samples': 6117504, 'steps': 31861, 'loss/train': 1.3923143148422241} -08/30/2021 19:00:26 - INFO - __main__ - Step 31863: {'lr': 0.00045143388773101733, 'samples': 6117696, 'steps': 31862, 'loss/train': 1.657745361328125} -08/30/2021 19:00:26 - INFO - __main__ - Step 31864: {'lr': 0.0004514307446311802, 'samples': 6117888, 'steps': 31863, 'loss/train': 1.300657868385315} -08/30/2021 19:00:27 - INFO - __main__ - Step 31865: {'lr': 0.0004514276014405814, 'samples': 6118080, 'steps': 31864, 'loss/train': 1.5859194993972778} -08/30/2021 19:00:28 - INFO - __main__ - Step 31866: {'lr': 0.00045142445815922244, 'samples': 6118272, 'steps': 31865, 'loss/train': 0.8749393224716187} -08/30/2021 19:00:29 - INFO - __main__ - Step 31867: {'lr': 0.0004514213147871047, 'samples': 6118464, 'steps': 31866, 'loss/train': 2.030456781387329} -08/30/2021 19:00:29 - INFO - __main__ - Step 31868: {'lr': 0.00045141817132422974, 'samples': 6118656, 'steps': 31867, 'loss/train': 1.5580260753631592} -08/30/2021 19:00:30 - INFO - __main__ - Step 31869: {'lr': 0.0004514150277705988, 'samples': 6118848, 'steps': 31868, 'loss/train': 0.9957576990127563} -08/30/2021 19:00:30 - INFO - __main__ - Step 31870: {'lr': 0.0004514118841262133, 'samples': 6119040, 'steps': 31869, 'loss/train': 1.6301734447479248} -08/30/2021 19:00:32 - INFO - __main__ - Step 31871: {'lr': 0.0004514087403910748, 'samples': 6119232, 'steps': 31870, 'loss/train': 1.6173347234725952} -08/30/2021 19:00:32 - INFO - __main__ - Step 31872: {'lr': 0.00045140559656518456, 'samples': 6119424, 'steps': 31871, 'loss/train': 1.7911888360977173} -08/30/2021 19:00:33 - INFO - __main__ - Step 31873: {'lr': 0.0004514024526485441, 'samples': 6119616, 'steps': 31872, 'loss/train': 1.1246349811553955} -08/30/2021 19:00:33 - INFO - __main__ - Step 31874: {'lr': 0.0004513993086411548, 'samples': 6119808, 'steps': 31873, 'loss/train': 1.5424352884292603} -08/30/2021 19:00:33 - INFO - __main__ - Step 31875: {'lr': 0.00045139616454301806, 'samples': 6120000, 'steps': 31874, 'loss/train': 1.4392929077148438} -08/30/2021 19:00:34 - INFO - __main__ - Step 31876: {'lr': 0.00045139302035413534, 'samples': 6120192, 'steps': 31875, 'loss/train': 1.192819356918335} -08/30/2021 19:00:36 - INFO - __main__ - Step 31877: {'lr': 0.00045138987607450803, 'samples': 6120384, 'steps': 31876, 'loss/train': 0.19190813601016998} -08/30/2021 19:00:36 - INFO - __main__ - Step 31878: {'lr': 0.00045138673170413756, 'samples': 6120576, 'steps': 31877, 'loss/train': 0.6537971496582031} -08/30/2021 19:00:36 - INFO - __main__ - Step 31879: {'lr': 0.0004513835872430253, 'samples': 6120768, 'steps': 31878, 'loss/train': 1.7221940755844116} -08/30/2021 19:00:37 - INFO - __main__ - Step 31880: {'lr': 0.0004513804426911727, 'samples': 6120960, 'steps': 31879, 'loss/train': 1.7095563411712646} -08/30/2021 19:00:37 - INFO - __main__ - Step 31881: {'lr': 0.00045137729804858124, 'samples': 6121152, 'steps': 31880, 'loss/train': 1.5729342699050903} -08/30/2021 19:00:37 - INFO - __main__ - Step 31882: {'lr': 0.00045137415331525225, 'samples': 6121344, 'steps': 31881, 'loss/train': 0.029747415333986282} -08/30/2021 19:00:39 - INFO - __main__ - Step 31883: {'lr': 0.0004513710084911872, 'samples': 6121536, 'steps': 31882, 'loss/train': 1.4356582164764404} -08/30/2021 19:00:39 - INFO - __main__ - Step 31884: {'lr': 0.00045136786357638736, 'samples': 6121728, 'steps': 31883, 'loss/train': 1.625819206237793} -08/30/2021 19:00:40 - INFO - __main__ - Step 31885: {'lr': 0.00045136471857085435, 'samples': 6121920, 'steps': 31884, 'loss/train': 0.17441563308238983} -08/30/2021 19:00:40 - INFO - __main__ - Step 31886: {'lr': 0.0004513615734745895, 'samples': 6122112, 'steps': 31885, 'loss/train': 1.51893949508667} -08/30/2021 19:00:40 - INFO - __main__ - Step 31887: {'lr': 0.00045135842828759426, 'samples': 6122304, 'steps': 31886, 'loss/train': 1.7774583101272583} -08/30/2021 19:00:41 - INFO - __main__ - Step 31888: {'lr': 0.00045135528300987006, 'samples': 6122496, 'steps': 31887, 'loss/train': 1.7723816633224487} -08/30/2021 19:00:43 - INFO - __main__ - Step 31889: {'lr': 0.00045135213764141814, 'samples': 6122688, 'steps': 31888, 'loss/train': 1.4298135042190552} -08/30/2021 19:00:43 - INFO - __main__ - Step 31890: {'lr': 0.00045134899218224014, 'samples': 6122880, 'steps': 31889, 'loss/train': 1.2692198753356934} -08/30/2021 19:00:44 - INFO - __main__ - Step 31891: {'lr': 0.0004513458466323374, 'samples': 6123072, 'steps': 31890, 'loss/train': 1.3574681282043457} -08/30/2021 19:00:44 - INFO - __main__ - Step 31892: {'lr': 0.0004513427009917113, 'samples': 6123264, 'steps': 31891, 'loss/train': 1.485721468925476} -08/30/2021 19:00:44 - INFO - __main__ - Step 31893: {'lr': 0.0004513395552603633, 'samples': 6123456, 'steps': 31892, 'loss/train': 1.3511744737625122} -08/30/2021 19:00:46 - INFO - __main__ - Step 31894: {'lr': 0.0004513364094382948, 'samples': 6123648, 'steps': 31893, 'loss/train': 2.151597738265991} -08/30/2021 19:00:46 - INFO - __main__ - Step 31895: {'lr': 0.00045133326352550724, 'samples': 6123840, 'steps': 31894, 'loss/train': 1.3925540447235107} -08/30/2021 19:00:47 - INFO - __main__ - Step 31896: {'lr': 0.000451330117522002, 'samples': 6124032, 'steps': 31895, 'loss/train': 1.5076276063919067} -08/30/2021 19:00:47 - INFO - __main__ - Step 31897: {'lr': 0.00045132697142778044, 'samples': 6124224, 'steps': 31896, 'loss/train': 1.6899641752243042} -08/30/2021 19:00:47 - INFO - __main__ - Step 31898: {'lr': 0.0004513238252428442, 'samples': 6124416, 'steps': 31897, 'loss/train': 1.2655805349349976} -08/30/2021 19:00:49 - INFO - __main__ - Step 31899: {'lr': 0.0004513206789671945, 'samples': 6124608, 'steps': 31898, 'loss/train': 1.8990840911865234} -08/30/2021 19:00:49 - INFO - __main__ - Step 31900: {'lr': 0.00045131753260083276, 'samples': 6124800, 'steps': 31899, 'loss/train': 1.9302457571029663} -08/30/2021 19:00:50 - INFO - __main__ - Step 31901: {'lr': 0.0004513143861437605, 'samples': 6124992, 'steps': 31900, 'loss/train': 0.4033149778842926} -08/30/2021 19:00:50 - INFO - __main__ - Step 31902: {'lr': 0.00045131123959597905, 'samples': 6125184, 'steps': 31901, 'loss/train': 1.51475191116333} -08/30/2021 19:00:50 - INFO - __main__ - Step 31903: {'lr': 0.0004513080929574899, 'samples': 6125376, 'steps': 31902, 'loss/train': 1.2061400413513184} -08/30/2021 19:00:52 - INFO - __main__ - Step 31904: {'lr': 0.0004513049462282943, 'samples': 6125568, 'steps': 31903, 'loss/train': 1.6666240692138672} -08/30/2021 19:00:52 - INFO - __main__ - Step 31905: {'lr': 0.00045130179940839395, 'samples': 6125760, 'steps': 31904, 'loss/train': 0.5576969981193542} -08/30/2021 19:00:53 - INFO - __main__ - Step 31906: {'lr': 0.00045129865249779, 'samples': 6125952, 'steps': 31905, 'loss/train': 1.1238410472869873} -08/30/2021 19:00:53 - INFO - __main__ - Step 31907: {'lr': 0.0004512955054964841, 'samples': 6126144, 'steps': 31906, 'loss/train': 1.5824025869369507} -08/30/2021 19:00:53 - INFO - __main__ - Step 31908: {'lr': 0.0004512923584044775, 'samples': 6126336, 'steps': 31907, 'loss/train': 1.0010976791381836} -08/30/2021 19:00:55 - INFO - __main__ - Step 31909: {'lr': 0.0004512892112217717, 'samples': 6126528, 'steps': 31908, 'loss/train': 1.430724859237671} -08/30/2021 19:00:55 - INFO - __main__ - Step 31910: {'lr': 0.00045128606394836805, 'samples': 6126720, 'steps': 31909, 'loss/train': 1.8850479125976562} -08/30/2021 19:00:56 - INFO - __main__ - Step 31911: {'lr': 0.00045128291658426796, 'samples': 6126912, 'steps': 31910, 'loss/train': 1.333143949508667} -08/30/2021 19:00:56 - INFO - __main__ - Step 31912: {'lr': 0.00045127976912947296, 'samples': 6127104, 'steps': 31911, 'loss/train': 1.5215591192245483} -08/30/2021 19:00:56 - INFO - __main__ - Step 31913: {'lr': 0.00045127662158398434, 'samples': 6127296, 'steps': 31912, 'loss/train': 1.4688621759414673} -08/30/2021 19:00:58 - INFO - __main__ - Step 31914: {'lr': 0.00045127347394780367, 'samples': 6127488, 'steps': 31913, 'loss/train': 1.9251075983047485} -08/30/2021 19:00:59 - INFO - __main__ - Step 31915: {'lr': 0.00045127032622093225, 'samples': 6127680, 'steps': 31914, 'loss/train': 0.5122542977333069} -08/30/2021 19:00:59 - INFO - __main__ - Step 31916: {'lr': 0.0004512671784033715, 'samples': 6127872, 'steps': 31915, 'loss/train': 1.3557204008102417} -08/30/2021 19:00:59 - INFO - __main__ - Step 31917: {'lr': 0.00045126403049512286, 'samples': 6128064, 'steps': 31916, 'loss/train': 1.2790255546569824} -08/30/2021 19:01:00 - INFO - __main__ - Step 31918: {'lr': 0.0004512608824961878, 'samples': 6128256, 'steps': 31917, 'loss/train': 1.243576169013977} -08/30/2021 19:01:00 - INFO - __main__ - Step 31919: {'lr': 0.00045125773440656756, 'samples': 6128448, 'steps': 31918, 'loss/train': 0.7762052416801453} -08/30/2021 19:01:02 - INFO - __main__ - Step 31920: {'lr': 0.0004512545862262638, 'samples': 6128640, 'steps': 31919, 'loss/train': 1.8772687911987305} -08/30/2021 19:01:02 - INFO - __main__ - Step 31921: {'lr': 0.0004512514379552779, 'samples': 6128832, 'steps': 31920, 'loss/train': 1.234052300453186} -08/30/2021 19:01:03 - INFO - __main__ - Step 31922: {'lr': 0.0004512482895936111, 'samples': 6129024, 'steps': 31921, 'loss/train': 0.22858773171901703} -08/30/2021 19:01:03 - INFO - __main__ - Step 31923: {'lr': 0.00045124514114126493, 'samples': 6129216, 'steps': 31922, 'loss/train': 1.7342108488082886} -08/30/2021 19:01:03 - INFO - __main__ - Step 31924: {'lr': 0.0004512419925982408, 'samples': 6129408, 'steps': 31923, 'loss/train': 0.8498665690422058} -08/30/2021 19:01:05 - INFO - __main__ - Step 31925: {'lr': 0.0004512388439645402, 'samples': 6129600, 'steps': 31924, 'loss/train': 0.8713580965995789} -08/30/2021 19:01:05 - INFO - __main__ - Step 31926: {'lr': 0.00045123569524016446, 'samples': 6129792, 'steps': 31925, 'loss/train': 1.5903257131576538} -08/30/2021 19:01:06 - INFO - __main__ - Step 31927: {'lr': 0.00045123254642511504, 'samples': 6129984, 'steps': 31926, 'loss/train': 1.119911789894104} -08/30/2021 19:01:06 - INFO - __main__ - Step 31928: {'lr': 0.0004512293975193933, 'samples': 6130176, 'steps': 31927, 'loss/train': 1.2339699268341064} -08/30/2021 19:01:06 - INFO - __main__ - Step 31929: {'lr': 0.0004512262485230007, 'samples': 6130368, 'steps': 31928, 'loss/train': 1.7451261281967163} -08/30/2021 19:01:08 - INFO - __main__ - Step 31930: {'lr': 0.00045122309943593865, 'samples': 6130560, 'steps': 31929, 'loss/train': 1.791560411453247} -08/30/2021 19:01:09 - INFO - __main__ - Step 31931: {'lr': 0.0004512199502582086, 'samples': 6130752, 'steps': 31930, 'loss/train': 1.3058853149414062} -08/30/2021 19:01:09 - INFO - __main__ - Step 31932: {'lr': 0.00045121680098981186, 'samples': 6130944, 'steps': 31931, 'loss/train': 0.13204734027385712} -08/30/2021 19:01:09 - INFO - __main__ - Step 31933: {'lr': 0.00045121365163075007, 'samples': 6131136, 'steps': 31932, 'loss/train': 0.034868452697992325} -08/30/2021 19:01:10 - INFO - __main__ - Step 31934: {'lr': 0.0004512105021810244, 'samples': 6131328, 'steps': 31933, 'loss/train': 1.3254988193511963} -08/30/2021 19:01:10 - INFO - __main__ - Step 31935: {'lr': 0.0004512073526406365, 'samples': 6131520, 'steps': 31934, 'loss/train': 1.6102142333984375} -08/30/2021 19:01:12 - INFO - __main__ - Step 31936: {'lr': 0.0004512042030095876, 'samples': 6131712, 'steps': 31935, 'loss/train': 1.2111961841583252} -08/30/2021 19:01:12 - INFO - __main__ - Step 31937: {'lr': 0.0004512010532878792, 'samples': 6131904, 'steps': 31936, 'loss/train': 1.2480688095092773} -08/30/2021 19:01:12 - INFO - __main__ - Step 31938: {'lr': 0.0004511979034755127, 'samples': 6132096, 'steps': 31937, 'loss/train': 1.541494369506836} -08/30/2021 19:01:13 - INFO - __main__ - Step 31939: {'lr': 0.0004511947535724895, 'samples': 6132288, 'steps': 31938, 'loss/train': 1.8874555826187134} -08/30/2021 19:01:13 - INFO - __main__ - Step 31940: {'lr': 0.00045119160357881105, 'samples': 6132480, 'steps': 31939, 'loss/train': 2.018998622894287} -08/30/2021 19:01:15 - INFO - __main__ - Step 31941: {'lr': 0.0004511884534944789, 'samples': 6132672, 'steps': 31940, 'loss/train': 1.4498368501663208} -08/30/2021 19:01:15 - INFO - __main__ - Step 31942: {'lr': 0.0004511853033194942, 'samples': 6132864, 'steps': 31941, 'loss/train': 2.2000842094421387} -08/30/2021 19:01:16 - INFO - __main__ - Step 31943: {'lr': 0.00045118215305385855, 'samples': 6133056, 'steps': 31942, 'loss/train': 1.9984976053237915} -08/30/2021 19:01:16 - INFO - __main__ - Step 31944: {'lr': 0.0004511790026975733, 'samples': 6133248, 'steps': 31943, 'loss/train': 5.456791400909424} -08/30/2021 19:01:16 - INFO - __main__ - Step 31945: {'lr': 0.00045117585225063996, 'samples': 6133440, 'steps': 31944, 'loss/train': 1.6796048879623413} -08/30/2021 19:01:18 - INFO - __main__ - Step 31946: {'lr': 0.0004511727017130598, 'samples': 6133632, 'steps': 31945, 'loss/train': 1.5475685596466064} -08/30/2021 19:01:19 - INFO - __main__ - Step 31947: {'lr': 0.00045116955108483436, 'samples': 6133824, 'steps': 31946, 'loss/train': 1.6737676858901978} -08/30/2021 19:01:19 - INFO - __main__ - Step 31948: {'lr': 0.00045116640036596507, 'samples': 6134016, 'steps': 31947, 'loss/train': 1.1156933307647705} -08/30/2021 19:01:20 - INFO - __main__ - Step 31949: {'lr': 0.0004511632495564533, 'samples': 6134208, 'steps': 31948, 'loss/train': 0.9910598993301392} -08/30/2021 19:01:20 - INFO - __main__ - Step 31950: {'lr': 0.00045116009865630034, 'samples': 6134400, 'steps': 31949, 'loss/train': 1.533393144607544} -08/30/2021 19:01:21 - INFO - __main__ - Step 31951: {'lr': 0.0004511569476655079, 'samples': 6134592, 'steps': 31950, 'loss/train': 1.2653424739837646} -08/30/2021 19:01:22 - INFO - __main__ - Step 31952: {'lr': 0.00045115379658407717, 'samples': 6134784, 'steps': 31951, 'loss/train': 1.8291164636611938} -08/30/2021 19:01:22 - INFO - __main__ - Step 31953: {'lr': 0.0004511506454120097, 'samples': 6134976, 'steps': 31952, 'loss/train': 1.805966854095459} -08/30/2021 19:01:23 - INFO - __main__ - Step 31954: {'lr': 0.00045114749414930676, 'samples': 6135168, 'steps': 31953, 'loss/train': 1.410210371017456} -08/30/2021 19:01:23 - INFO - __main__ - Step 31955: {'lr': 0.00045114434279596994, 'samples': 6135360, 'steps': 31954, 'loss/train': 1.5953606367111206} -08/30/2021 19:01:25 - INFO - __main__ - Step 31956: {'lr': 0.0004511411913520006, 'samples': 6135552, 'steps': 31955, 'loss/train': 1.5507489442825317} -08/30/2021 19:01:25 - INFO - __main__ - Step 31957: {'lr': 0.0004511380398174001, 'samples': 6135744, 'steps': 31956, 'loss/train': 0.03353830799460411} -08/30/2021 19:01:26 - INFO - __main__ - Step 31958: {'lr': 0.00045113488819216983, 'samples': 6135936, 'steps': 31957, 'loss/train': 0.0318821482360363} -08/30/2021 19:01:26 - INFO - __main__ - Step 31959: {'lr': 0.00045113173647631143, 'samples': 6136128, 'steps': 31958, 'loss/train': 0.9165999889373779} -08/30/2021 19:01:27 - INFO - __main__ - Step 31960: {'lr': 0.0004511285846698261, 'samples': 6136320, 'steps': 31959, 'loss/train': 1.3535188436508179} -08/30/2021 19:01:27 - INFO - __main__ - Step 31961: {'lr': 0.0004511254327727153, 'samples': 6136512, 'steps': 31960, 'loss/train': 1.6394740343093872} -08/30/2021 19:01:28 - INFO - __main__ - Step 31962: {'lr': 0.00045112228078498053, 'samples': 6136704, 'steps': 31961, 'loss/train': 1.3872450590133667} -08/30/2021 19:01:29 - INFO - __main__ - Step 31963: {'lr': 0.0004511191287066232, 'samples': 6136896, 'steps': 31962, 'loss/train': 1.816772222518921} -08/30/2021 19:01:29 - INFO - __main__ - Step 31964: {'lr': 0.00045111597653764456, 'samples': 6137088, 'steps': 31963, 'loss/train': 0.8778124451637268} -08/30/2021 19:01:30 - INFO - __main__ - Step 31965: {'lr': 0.00045111282427804636, 'samples': 6137280, 'steps': 31964, 'loss/train': 1.6676661968231201} -08/30/2021 19:01:30 - INFO - __main__ - Step 31966: {'lr': 0.0004511096719278297, 'samples': 6137472, 'steps': 31965, 'loss/train': 0.8720130324363708} -08/30/2021 19:01:30 - INFO - __main__ - Step 31967: {'lr': 0.0004511065194869961, 'samples': 6137664, 'steps': 31966, 'loss/train': 1.5493005514144897} -08/30/2021 19:01:32 - INFO - __main__ - Step 31968: {'lr': 0.00045110336695554707, 'samples': 6137856, 'steps': 31967, 'loss/train': 1.0071051120758057} -08/30/2021 19:01:33 - INFO - __main__ - Step 31969: {'lr': 0.0004511002143334839, 'samples': 6138048, 'steps': 31968, 'loss/train': 1.5522947311401367} -08/30/2021 19:01:33 - INFO - __main__ - Step 31970: {'lr': 0.0004510970616208081, 'samples': 6138240, 'steps': 31969, 'loss/train': 1.0230203866958618} -08/30/2021 19:01:33 - INFO - __main__ - Step 31971: {'lr': 0.0004510939088175211, 'samples': 6138432, 'steps': 31970, 'loss/train': 0.026159143075346947} -08/30/2021 19:01:34 - INFO - __main__ - Step 31972: {'lr': 0.00045109075592362433, 'samples': 6138624, 'steps': 31971, 'loss/train': 1.4281119108200073} -08/30/2021 19:01:34 - INFO - __main__ - Step 31973: {'lr': 0.0004510876029391191, 'samples': 6138816, 'steps': 31972, 'loss/train': 1.5089854001998901} -08/30/2021 19:01:36 - INFO - __main__ - Step 31974: {'lr': 0.00045108444986400687, 'samples': 6139008, 'steps': 31973, 'loss/train': 1.476694107055664} -08/30/2021 19:01:36 - INFO - __main__ - Step 31975: {'lr': 0.0004510812966982892, 'samples': 6139200, 'steps': 31974, 'loss/train': 1.355631947517395} -08/30/2021 19:01:36 - INFO - __main__ - Step 31976: {'lr': 0.0004510781434419673, 'samples': 6139392, 'steps': 31975, 'loss/train': 1.3529835939407349} -08/30/2021 19:01:37 - INFO - __main__ - Step 31977: {'lr': 0.0004510749900950427, 'samples': 6139584, 'steps': 31976, 'loss/train': 1.140531301498413} -08/30/2021 19:01:38 - INFO - __main__ - Step 31978: {'lr': 0.00045107183665751686, 'samples': 6139776, 'steps': 31977, 'loss/train': 1.628603219985962} -08/30/2021 19:01:39 - INFO - __main__ - Step 31979: {'lr': 0.00045106868312939116, 'samples': 6139968, 'steps': 31978, 'loss/train': 1.0013000965118408} -08/30/2021 19:01:39 - INFO - __main__ - Step 31980: {'lr': 0.0004510655295106669, 'samples': 6140160, 'steps': 31979, 'loss/train': 1.6773079633712769} -08/30/2021 19:01:39 - INFO - __main__ - Step 31981: {'lr': 0.00045106237580134573, 'samples': 6140352, 'steps': 31980, 'loss/train': 1.6410744190216064} -08/30/2021 19:01:40 - INFO - __main__ - Step 31982: {'lr': 0.000451059222001429, 'samples': 6140544, 'steps': 31981, 'loss/train': 1.2098348140716553} -08/30/2021 19:01:40 - INFO - __main__ - Step 31983: {'lr': 0.0004510560681109179, 'samples': 6140736, 'steps': 31982, 'loss/train': 0.9411579966545105} -08/30/2021 19:01:42 - INFO - __main__ - Step 31984: {'lr': 0.0004510529141298142, 'samples': 6140928, 'steps': 31983, 'loss/train': 1.4893128871917725} -08/30/2021 19:01:42 - INFO - __main__ - Step 31985: {'lr': 0.00045104976005811917, 'samples': 6141120, 'steps': 31984, 'loss/train': 1.3210407495498657} -08/30/2021 19:01:42 - INFO - __main__ - Step 31986: {'lr': 0.00045104660589583413, 'samples': 6141312, 'steps': 31985, 'loss/train': 1.7088764905929565} -08/30/2021 19:01:43 - INFO - __main__ - Step 31987: {'lr': 0.0004510434516429606, 'samples': 6141504, 'steps': 31986, 'loss/train': 1.774092197418213} -08/30/2021 19:01:43 - INFO - __main__ - Step 31988: {'lr': 0.0004510402972995, 'samples': 6141696, 'steps': 31987, 'loss/train': 1.4240888357162476} -08/30/2021 19:01:45 - INFO - __main__ - Step 31989: {'lr': 0.0004510371428654538, 'samples': 6141888, 'steps': 31988, 'loss/train': 1.5147643089294434} -08/30/2021 19:01:46 - INFO - __main__ - Step 31990: {'lr': 0.00045103398834082334, 'samples': 6142080, 'steps': 31989, 'loss/train': 1.8578299283981323} -08/30/2021 19:01:46 - INFO - __main__ - Step 31991: {'lr': 0.00045103083372561003, 'samples': 6142272, 'steps': 31990, 'loss/train': 2.1569173336029053} -08/30/2021 19:01:47 - INFO - __main__ - Step 31992: {'lr': 0.0004510276790198153, 'samples': 6142464, 'steps': 31991, 'loss/train': 1.225195050239563} -08/30/2021 19:01:47 - INFO - __main__ - Step 31993: {'lr': 0.00045102452422344065, 'samples': 6142656, 'steps': 31992, 'loss/train': 1.461816668510437} -08/30/2021 19:01:47 - INFO - __main__ - Step 31994: {'lr': 0.0004510213693364875, 'samples': 6142848, 'steps': 31993, 'loss/train': 1.9749394655227661} -08/30/2021 19:01:48 - INFO - __main__ - Step 31995: {'lr': 0.0004510182143589572, 'samples': 6143040, 'steps': 31994, 'loss/train': 0.16042234003543854} -08/30/2021 19:01:48 - INFO - __main__ - Step 31996: {'lr': 0.0004510150592908511, 'samples': 6143232, 'steps': 31995, 'loss/train': 0.06669739633798599} -08/30/2021 19:01:50 - INFO - __main__ - Step 31997: {'lr': 0.00045101190413217085, 'samples': 6143424, 'steps': 31996, 'loss/train': 0.023171178996562958} -08/30/2021 19:01:51 - INFO - __main__ - Step 31998: {'lr': 0.0004510087488829177, 'samples': 6143616, 'steps': 31997, 'loss/train': 1.195980191230774} -08/30/2021 19:01:51 - INFO - __main__ - Step 31999: {'lr': 0.000451005593543093, 'samples': 6143808, 'steps': 31998, 'loss/train': 1.0919106006622314} -08/30/2021 19:01:51 - INFO - __main__ - Step 32000: {'lr': 0.00045100243811269834, 'samples': 6144000, 'steps': 31999, 'loss/train': 2.045699119567871} -08/30/2021 19:01:52 - INFO - __main__ - Step 32001: {'lr': 0.00045099928259173516, 'samples': 6144192, 'steps': 32000, 'loss/train': 1.139817237854004} -08/30/2021 19:01:53 - INFO - __main__ - Step 32002: {'lr': 0.0004509961269802048, 'samples': 6144384, 'steps': 32001, 'loss/train': 0.9346404075622559} -08/30/2021 19:01:54 - INFO - __main__ - Step 32003: {'lr': 0.00045099297127810855, 'samples': 6144576, 'steps': 32002, 'loss/train': 1.5782743692398071} -08/30/2021 19:01:54 - INFO - __main__ - Step 32004: {'lr': 0.0004509898154854481, 'samples': 6144768, 'steps': 32003, 'loss/train': 2.0786890983581543} -08/30/2021 19:01:55 - INFO - __main__ - Step 32005: {'lr': 0.00045098665960222474, 'samples': 6144960, 'steps': 32004, 'loss/train': 0.2444913387298584} -08/30/2021 19:01:55 - INFO - __main__ - Step 32006: {'lr': 0.00045098350362843975, 'samples': 6145152, 'steps': 32005, 'loss/train': 1.8713760375976562} -08/30/2021 19:01:57 - INFO - __main__ - Step 32007: {'lr': 0.0004509803475640948, 'samples': 6145344, 'steps': 32006, 'loss/train': 1.7312630414962769} -08/30/2021 19:01:57 - INFO - __main__ - Step 32008: {'lr': 0.00045097719140919126, 'samples': 6145536, 'steps': 32007, 'loss/train': 1.240100622177124} -08/30/2021 19:01:57 - INFO - __main__ - Step 32009: {'lr': 0.0004509740351637304, 'samples': 6145728, 'steps': 32008, 'loss/train': 1.5063472986221313} -08/30/2021 19:01:58 - INFO - __main__ - Step 32010: {'lr': 0.0004509708788277138, 'samples': 6145920, 'steps': 32009, 'loss/train': 1.406972050666809} -08/30/2021 19:01:58 - INFO - __main__ - Step 32011: {'lr': 0.0004509677224011428, 'samples': 6146112, 'steps': 32010, 'loss/train': 0.5182023048400879} -08/30/2021 19:01:59 - INFO - __main__ - Step 32012: {'lr': 0.00045096456588401883, 'samples': 6146304, 'steps': 32011, 'loss/train': 1.0053365230560303} -08/30/2021 19:02:00 - INFO - __main__ - Step 32013: {'lr': 0.0004509614092763434, 'samples': 6146496, 'steps': 32012, 'loss/train': 1.512039303779602} -08/30/2021 19:02:00 - INFO - __main__ - Step 32014: {'lr': 0.00045095825257811776, 'samples': 6146688, 'steps': 32013, 'loss/train': 1.7275587320327759} -08/30/2021 19:02:01 - INFO - __main__ - Step 32015: {'lr': 0.00045095509578934353, 'samples': 6146880, 'steps': 32014, 'loss/train': 1.5785534381866455} -08/30/2021 19:02:01 - INFO - __main__ - Step 32016: {'lr': 0.00045095193891002194, 'samples': 6147072, 'steps': 32015, 'loss/train': 1.0299241542816162} -08/30/2021 19:02:03 - INFO - __main__ - Step 32017: {'lr': 0.00045094878194015456, 'samples': 6147264, 'steps': 32016, 'loss/train': 1.275549292564392} -08/30/2021 19:02:03 - INFO - __main__ - Step 32018: {'lr': 0.0004509456248797428, 'samples': 6147456, 'steps': 32017, 'loss/train': 1.5068910121917725} -08/30/2021 19:02:03 - INFO - __main__ - Step 32019: {'lr': 0.000450942467728788, 'samples': 6147648, 'steps': 32018, 'loss/train': 1.353131890296936} -08/30/2021 19:02:04 - INFO - __main__ - Step 32020: {'lr': 0.00045093931048729156, 'samples': 6147840, 'steps': 32019, 'loss/train': 1.4195904731750488} -08/30/2021 19:02:04 - INFO - __main__ - Step 32021: {'lr': 0.00045093615315525506, 'samples': 6148032, 'steps': 32020, 'loss/train': 2.2784926891326904} -08/30/2021 19:02:06 - INFO - __main__ - Step 32022: {'lr': 0.00045093299573267977, 'samples': 6148224, 'steps': 32021, 'loss/train': 1.4593552350997925} -08/30/2021 19:02:06 - INFO - __main__ - Step 32023: {'lr': 0.00045092983821956725, 'samples': 6148416, 'steps': 32022, 'loss/train': 1.4830538034439087} -08/30/2021 19:02:07 - INFO - __main__ - Step 32024: {'lr': 0.00045092668061591875, 'samples': 6148608, 'steps': 32023, 'loss/train': 1.3781323432922363} -08/30/2021 19:02:07 - INFO - __main__ - Step 32025: {'lr': 0.00045092352292173585, 'samples': 6148800, 'steps': 32024, 'loss/train': 1.6769580841064453} -08/30/2021 19:02:07 - INFO - __main__ - Step 32026: {'lr': 0.00045092036513701985, 'samples': 6148992, 'steps': 32025, 'loss/train': 1.435570240020752} -08/30/2021 19:02:08 - INFO - __main__ - Step 32027: {'lr': 0.0004509172072617723, 'samples': 6149184, 'steps': 32026, 'loss/train': 1.203198790550232} -08/30/2021 19:02:09 - INFO - __main__ - Step 32028: {'lr': 0.00045091404929599455, 'samples': 6149376, 'steps': 32027, 'loss/train': 0.8941290378570557} -08/30/2021 19:02:10 - INFO - __main__ - Step 32029: {'lr': 0.00045091089123968796, 'samples': 6149568, 'steps': 32028, 'loss/train': 1.23170006275177} -08/30/2021 19:02:10 - INFO - __main__ - Step 32030: {'lr': 0.0004509077330928541, 'samples': 6149760, 'steps': 32029, 'loss/train': 1.4482344388961792} -08/30/2021 19:02:11 - INFO - __main__ - Step 32031: {'lr': 0.0004509045748554943, 'samples': 6149952, 'steps': 32030, 'loss/train': 3.8524041175842285} -08/30/2021 19:02:11 - INFO - __main__ - Step 32032: {'lr': 0.00045090141652760995, 'samples': 6150144, 'steps': 32031, 'loss/train': 0.08425921946763992} -08/30/2021 19:02:12 - INFO - __main__ - Step 32033: {'lr': 0.0004508982581092026, 'samples': 6150336, 'steps': 32032, 'loss/train': 0.8093934059143066} -08/30/2021 19:02:13 - INFO - __main__ - Step 32034: {'lr': 0.00045089509960027354, 'samples': 6150528, 'steps': 32033, 'loss/train': 2.8101725578308105} -08/30/2021 19:02:13 - INFO - __main__ - Step 32035: {'lr': 0.00045089194100082433, 'samples': 6150720, 'steps': 32034, 'loss/train': 1.4310811758041382} -08/30/2021 19:02:14 - INFO - __main__ - Step 32036: {'lr': 0.00045088878231085616, 'samples': 6150912, 'steps': 32035, 'loss/train': 1.7447528839111328} -08/30/2021 19:02:14 - INFO - __main__ - Step 32037: {'lr': 0.00045088562353037077, 'samples': 6151104, 'steps': 32036, 'loss/train': 1.4019067287445068} -08/30/2021 19:02:16 - INFO - __main__ - Step 32038: {'lr': 0.00045088246465936936, 'samples': 6151296, 'steps': 32037, 'loss/train': 1.4390467405319214} -08/30/2021 19:02:16 - INFO - __main__ - Step 32039: {'lr': 0.0004508793056978534, 'samples': 6151488, 'steps': 32038, 'loss/train': 1.354805588722229} -08/30/2021 19:02:16 - INFO - __main__ - Step 32040: {'lr': 0.00045087614664582424, 'samples': 6151680, 'steps': 32039, 'loss/train': 1.8440057039260864} -08/30/2021 19:02:17 - INFO - __main__ - Step 32041: {'lr': 0.0004508729875032834, 'samples': 6151872, 'steps': 32040, 'loss/train': 1.1266757249832153} -08/30/2021 19:02:17 - INFO - __main__ - Step 32042: {'lr': 0.0004508698282702324, 'samples': 6152064, 'steps': 32041, 'loss/train': 1.6667054891586304} -08/30/2021 19:02:17 - INFO - __main__ - Step 32043: {'lr': 0.0004508666689466725, 'samples': 6152256, 'steps': 32042, 'loss/train': 1.7821850776672363} -08/30/2021 19:02:19 - INFO - __main__ - Step 32044: {'lr': 0.00045086350953260526, 'samples': 6152448, 'steps': 32043, 'loss/train': 1.315334439277649} -08/30/2021 19:02:20 - INFO - __main__ - Step 32045: {'lr': 0.0004508603500280319, 'samples': 6152640, 'steps': 32044, 'loss/train': 1.6057698726654053} -08/30/2021 19:02:20 - INFO - __main__ - Step 32046: {'lr': 0.00045085719043295406, 'samples': 6152832, 'steps': 32045, 'loss/train': 1.2984144687652588} -08/30/2021 19:02:20 - INFO - __main__ - Step 32047: {'lr': 0.00045085403074737295, 'samples': 6153024, 'steps': 32046, 'loss/train': 1.811688780784607} -08/30/2021 19:02:21 - INFO - __main__ - Step 32048: {'lr': 0.0004508508709712902, 'samples': 6153216, 'steps': 32047, 'loss/train': 1.1277586221694946} -08/30/2021 19:02:22 - INFO - __main__ - Step 32049: {'lr': 0.00045084771110470717, 'samples': 6153408, 'steps': 32048, 'loss/train': 2.0934958457946777} -08/30/2021 19:02:22 - INFO - __main__ - Step 32050: {'lr': 0.00045084455114762525, 'samples': 6153600, 'steps': 32049, 'loss/train': 1.2152059078216553} -08/30/2021 19:02:23 - INFO - __main__ - Step 32051: {'lr': 0.00045084139110004585, 'samples': 6153792, 'steps': 32050, 'loss/train': 1.2711853981018066} -08/30/2021 19:02:23 - INFO - __main__ - Step 32052: {'lr': 0.0004508382309619704, 'samples': 6153984, 'steps': 32051, 'loss/train': 2.048680067062378} -08/30/2021 19:02:23 - INFO - __main__ - Step 32053: {'lr': 0.0004508350707334004, 'samples': 6154176, 'steps': 32052, 'loss/train': 2.0509331226348877} -08/30/2021 19:02:24 - INFO - __main__ - Step 32054: {'lr': 0.00045083191041433713, 'samples': 6154368, 'steps': 32053, 'loss/train': 2.210904836654663} -08/30/2021 19:02:26 - INFO - __main__ - Step 32055: {'lr': 0.00045082875000478214, 'samples': 6154560, 'steps': 32054, 'loss/train': 1.6762771606445312} -08/30/2021 19:02:26 - INFO - __main__ - Step 32056: {'lr': 0.0004508255895047368, 'samples': 6154752, 'steps': 32055, 'loss/train': 0.9115856885910034} -08/30/2021 19:02:27 - INFO - __main__ - Step 32057: {'lr': 0.0004508224289142026, 'samples': 6154944, 'steps': 32056, 'loss/train': 0.8742789030075073} -08/30/2021 19:02:27 - INFO - __main__ - Step 32058: {'lr': 0.0004508192682331809, 'samples': 6155136, 'steps': 32057, 'loss/train': 1.793533444404602} -08/30/2021 19:02:28 - INFO - __main__ - Step 32059: {'lr': 0.0004508161074616731, 'samples': 6155328, 'steps': 32058, 'loss/train': 1.273215413093567} -08/30/2021 19:02:29 - INFO - __main__ - Step 32060: {'lr': 0.0004508129465996806, 'samples': 6155520, 'steps': 32059, 'loss/train': 0.08419208973646164} -08/30/2021 19:02:30 - INFO - __main__ - Step 32061: {'lr': 0.00045080978564720505, 'samples': 6155712, 'steps': 32060, 'loss/train': 0.8683608174324036} -08/30/2021 19:02:30 - INFO - __main__ - Step 32062: {'lr': 0.0004508066246042476, 'samples': 6155904, 'steps': 32061, 'loss/train': 1.8320715427398682} -08/30/2021 19:02:30 - INFO - __main__ - Step 32063: {'lr': 0.0004508034634708098, 'samples': 6156096, 'steps': 32062, 'loss/train': 1.0917303562164307} -08/30/2021 19:02:31 - INFO - __main__ - Step 32064: {'lr': 0.0004508003022468931, 'samples': 6156288, 'steps': 32063, 'loss/train': 0.8496731519699097} -08/30/2021 19:02:32 - INFO - __main__ - Step 32065: {'lr': 0.00045079714093249887, 'samples': 6156480, 'steps': 32064, 'loss/train': 1.7927823066711426} -08/30/2021 19:02:33 - INFO - __main__ - Step 32066: {'lr': 0.00045079397952762845, 'samples': 6156672, 'steps': 32065, 'loss/train': 1.335373044013977} -08/30/2021 19:02:33 - INFO - __main__ - Step 32067: {'lr': 0.0004507908180322835, 'samples': 6156864, 'steps': 32066, 'loss/train': 1.1555590629577637} -08/30/2021 19:02:33 - INFO - __main__ - Step 32068: {'lr': 0.00045078765644646524, 'samples': 6157056, 'steps': 32067, 'loss/train': 1.8896679878234863} -08/30/2021 19:02:34 - INFO - __main__ - Step 32069: {'lr': 0.00045078449477017516, 'samples': 6157248, 'steps': 32068, 'loss/train': 1.0979979038238525} -08/30/2021 19:02:36 - INFO - __main__ - Step 32070: {'lr': 0.0004507813330034147, 'samples': 6157440, 'steps': 32069, 'loss/train': 1.8681769371032715} -08/30/2021 19:02:36 - INFO - __main__ - Step 32071: {'lr': 0.00045077817114618526, 'samples': 6157632, 'steps': 32070, 'loss/train': 1.4490727186203003} -08/30/2021 19:02:36 - INFO - __main__ - Step 32072: {'lr': 0.00045077500919848826, 'samples': 6157824, 'steps': 32071, 'loss/train': 1.6575084924697876} -08/30/2021 19:02:37 - INFO - __main__ - Step 32073: {'lr': 0.00045077184716032516, 'samples': 6158016, 'steps': 32072, 'loss/train': 1.455581545829773} -08/30/2021 19:02:37 - INFO - __main__ - Step 32074: {'lr': 0.0004507686850316973, 'samples': 6158208, 'steps': 32073, 'loss/train': 1.3231428861618042} -08/30/2021 19:02:37 - INFO - __main__ - Step 32075: {'lr': 0.00045076552281260625, 'samples': 6158400, 'steps': 32074, 'loss/train': 0.9537262320518494} -08/30/2021 19:02:39 - INFO - __main__ - Step 32076: {'lr': 0.0004507623605030533, 'samples': 6158592, 'steps': 32075, 'loss/train': 5.491367340087891} -08/30/2021 19:02:39 - INFO - __main__ - Step 32077: {'lr': 0.00045075919810304, 'samples': 6158784, 'steps': 32076, 'loss/train': 1.324520468711853} -08/30/2021 19:02:40 - INFO - __main__ - Step 32078: {'lr': 0.0004507560356125676, 'samples': 6158976, 'steps': 32077, 'loss/train': 1.9875439405441284} -08/30/2021 19:02:40 - INFO - __main__ - Step 32079: {'lr': 0.0004507528730316377, 'samples': 6159168, 'steps': 32078, 'loss/train': 1.4204699993133545} -08/30/2021 19:02:40 - INFO - __main__ - Step 32080: {'lr': 0.0004507497103602517, 'samples': 6159360, 'steps': 32079, 'loss/train': 1.8378013372421265} -08/30/2021 19:02:42 - INFO - __main__ - Step 32081: {'lr': 0.00045074654759841087, 'samples': 6159552, 'steps': 32080, 'loss/train': 1.4169636964797974} -08/30/2021 19:02:43 - INFO - __main__ - Step 32082: {'lr': 0.00045074338474611683, 'samples': 6159744, 'steps': 32081, 'loss/train': 1.7404274940490723} -08/30/2021 19:02:43 - INFO - __main__ - Step 32083: {'lr': 0.00045074022180337085, 'samples': 6159936, 'steps': 32082, 'loss/train': 0.18177993595600128} -08/30/2021 19:02:43 - INFO - __main__ - Step 32084: {'lr': 0.0004507370587701745, 'samples': 6160128, 'steps': 32083, 'loss/train': 1.4592140913009644} -08/30/2021 19:02:44 - INFO - __main__ - Step 32085: {'lr': 0.000450733895646529, 'samples': 6160320, 'steps': 32084, 'loss/train': 1.0784831047058105} -08/30/2021 19:02:45 - INFO - __main__ - Step 32086: {'lr': 0.00045073073243243603, 'samples': 6160512, 'steps': 32085, 'loss/train': 1.1648410558700562} -08/30/2021 19:02:45 - INFO - __main__ - Step 32087: {'lr': 0.0004507275691278968, 'samples': 6160704, 'steps': 32086, 'loss/train': 1.5367395877838135} -08/30/2021 19:02:46 - INFO - __main__ - Step 32088: {'lr': 0.00045072440573291293, 'samples': 6160896, 'steps': 32087, 'loss/train': 0.9820032119750977} -08/30/2021 19:02:46 - INFO - __main__ - Step 32089: {'lr': 0.0004507212422474857, 'samples': 6161088, 'steps': 32088, 'loss/train': 1.3043065071105957} -08/30/2021 19:02:46 - INFO - __main__ - Step 32090: {'lr': 0.0004507180786716165, 'samples': 6161280, 'steps': 32089, 'loss/train': 1.593130350112915} -08/30/2021 19:02:48 - INFO - __main__ - Step 32091: {'lr': 0.00045071491500530694, 'samples': 6161472, 'steps': 32090, 'loss/train': 1.9413312673568726} -08/30/2021 19:02:48 - INFO - __main__ - Step 32092: {'lr': 0.0004507117512485582, 'samples': 6161664, 'steps': 32091, 'loss/train': 1.3542094230651855} -08/30/2021 19:02:49 - INFO - __main__ - Step 32093: {'lr': 0.000450708587401372, 'samples': 6161856, 'steps': 32092, 'loss/train': 1.2892329692840576} -08/30/2021 19:02:49 - INFO - __main__ - Step 32094: {'lr': 0.0004507054234637495, 'samples': 6162048, 'steps': 32093, 'loss/train': 1.6318327188491821} -08/30/2021 19:02:49 - INFO - __main__ - Step 32095: {'lr': 0.0004507022594356922, 'samples': 6162240, 'steps': 32094, 'loss/train': 1.459619164466858} -08/30/2021 19:02:51 - INFO - __main__ - Step 32096: {'lr': 0.00045069909531720166, 'samples': 6162432, 'steps': 32095, 'loss/train': 1.9088743925094604} -08/30/2021 19:02:51 - INFO - __main__ - Step 32097: {'lr': 0.0004506959311082792, 'samples': 6162624, 'steps': 32096, 'loss/train': 2.1389622688293457} -08/30/2021 19:02:52 - INFO - __main__ - Step 32098: {'lr': 0.00045069276680892624, 'samples': 6162816, 'steps': 32097, 'loss/train': 1.6033211946487427} -08/30/2021 19:02:52 - INFO - __main__ - Step 32099: {'lr': 0.00045068960241914413, 'samples': 6163008, 'steps': 32098, 'loss/train': 1.2506165504455566} -08/30/2021 19:02:52 - INFO - __main__ - Step 32100: {'lr': 0.00045068643793893447, 'samples': 6163200, 'steps': 32099, 'loss/train': 1.2278567552566528} -08/30/2021 19:02:54 - INFO - __main__ - Step 32101: {'lr': 0.0004506832733682986, 'samples': 6163392, 'steps': 32100, 'loss/train': 0.6025732159614563} -08/30/2021 19:02:55 - INFO - __main__ - Step 32102: {'lr': 0.00045068010870723783, 'samples': 6163584, 'steps': 32101, 'loss/train': 0.7777771353721619} -08/30/2021 19:02:55 - INFO - __main__ - Step 32103: {'lr': 0.00045067694395575385, 'samples': 6163776, 'steps': 32102, 'loss/train': 1.4369356632232666} -08/30/2021 19:02:55 - INFO - __main__ - Step 32104: {'lr': 0.0004506737791138479, 'samples': 6163968, 'steps': 32103, 'loss/train': 1.3069368600845337} -08/30/2021 19:02:56 - INFO - __main__ - Step 32105: {'lr': 0.00045067061418152136, 'samples': 6164160, 'steps': 32104, 'loss/train': 1.2212883234024048} -08/30/2021 19:02:58 - INFO - __main__ - Step 32106: {'lr': 0.00045066744915877585, 'samples': 6164352, 'steps': 32105, 'loss/train': 1.1055688858032227} -08/30/2021 19:02:58 - INFO - __main__ - Step 32107: {'lr': 0.0004506642840456126, 'samples': 6164544, 'steps': 32106, 'loss/train': 1.4533751010894775} -08/30/2021 19:02:58 - INFO - __main__ - Step 32108: {'lr': 0.00045066111884203315, 'samples': 6164736, 'steps': 32107, 'loss/train': 1.2181884050369263} -08/30/2021 19:02:59 - INFO - __main__ - Step 32109: {'lr': 0.0004506579535480389, 'samples': 6164928, 'steps': 32108, 'loss/train': 1.562153935432434} -08/30/2021 19:02:59 - INFO - __main__ - Step 32110: {'lr': 0.00045065478816363124, 'samples': 6165120, 'steps': 32109, 'loss/train': 1.656476616859436} -08/30/2021 19:03:01 - INFO - __main__ - Step 32111: {'lr': 0.00045065162268881164, 'samples': 6165312, 'steps': 32110, 'loss/train': 1.3008641004562378} -08/30/2021 19:03:01 - INFO - __main__ - Step 32112: {'lr': 0.0004506484571235816, 'samples': 6165504, 'steps': 32111, 'loss/train': 1.7591400146484375} -08/30/2021 19:03:02 - INFO - __main__ - Step 32113: {'lr': 0.00045064529146794234, 'samples': 6165696, 'steps': 32112, 'loss/train': 1.3816057443618774} -08/30/2021 19:03:02 - INFO - __main__ - Step 32114: {'lr': 0.0004506421257218955, 'samples': 6165888, 'steps': 32113, 'loss/train': 3.6256494522094727} -08/30/2021 19:03:02 - INFO - __main__ - Step 32115: {'lr': 0.00045063895988544235, 'samples': 6166080, 'steps': 32114, 'loss/train': 1.3191349506378174} -08/30/2021 19:03:03 - INFO - __main__ - Step 32116: {'lr': 0.00045063579395858444, 'samples': 6166272, 'steps': 32115, 'loss/train': 1.3613029718399048} -08/30/2021 19:03:04 - INFO - __main__ - Step 32117: {'lr': 0.0004506326279413231, 'samples': 6166464, 'steps': 32116, 'loss/train': 1.834302306175232} -08/30/2021 19:03:05 - INFO - __main__ - Step 32118: {'lr': 0.0004506294618336598, 'samples': 6166656, 'steps': 32117, 'loss/train': 0.11802104115486145} -08/30/2021 19:03:05 - INFO - __main__ - Step 32119: {'lr': 0.00045062629563559595, 'samples': 6166848, 'steps': 32118, 'loss/train': 1.7002917528152466} -08/30/2021 19:03:06 - INFO - __main__ - Step 32120: {'lr': 0.00045062312934713303, 'samples': 6167040, 'steps': 32119, 'loss/train': 1.4887988567352295} -08/30/2021 19:03:06 - INFO - __main__ - Step 32121: {'lr': 0.00045061996296827237, 'samples': 6167232, 'steps': 32120, 'loss/train': 1.649009346961975} -08/30/2021 19:03:08 - INFO - __main__ - Step 32122: {'lr': 0.00045061679649901543, 'samples': 6167424, 'steps': 32121, 'loss/train': 2.261502265930176} -08/30/2021 19:03:08 - INFO - __main__ - Step 32123: {'lr': 0.00045061362993936374, 'samples': 6167616, 'steps': 32122, 'loss/train': 1.179837703704834} -08/30/2021 19:03:08 - INFO - __main__ - Step 32124: {'lr': 0.0004506104632893185, 'samples': 6167808, 'steps': 32123, 'loss/train': 1.4686287641525269} -08/30/2021 19:03:09 - INFO - __main__ - Step 32125: {'lr': 0.00045060729654888143, 'samples': 6168000, 'steps': 32124, 'loss/train': 1.6186310052871704} -08/30/2021 19:03:09 - INFO - __main__ - Step 32126: {'lr': 0.00045060412971805375, 'samples': 6168192, 'steps': 32125, 'loss/train': 1.0545690059661865} -08/30/2021 19:03:11 - INFO - __main__ - Step 32127: {'lr': 0.00045060096279683694, 'samples': 6168384, 'steps': 32126, 'loss/train': 0.5160688757896423} -08/30/2021 19:03:11 - INFO - __main__ - Step 32128: {'lr': 0.0004505977957852325, 'samples': 6168576, 'steps': 32127, 'loss/train': 1.461456298828125} -08/30/2021 19:03:11 - INFO - __main__ - Step 32129: {'lr': 0.00045059462868324177, 'samples': 6168768, 'steps': 32128, 'loss/train': 0.7838690280914307} -08/30/2021 19:03:12 - INFO - __main__ - Step 32130: {'lr': 0.00045059146149086605, 'samples': 6168960, 'steps': 32129, 'loss/train': 0.9849536418914795} -08/30/2021 19:03:12 - INFO - __main__ - Step 32131: {'lr': 0.00045058829420810707, 'samples': 6169152, 'steps': 32130, 'loss/train': 0.9749042391777039} -08/30/2021 19:03:14 - INFO - __main__ - Step 32132: {'lr': 0.00045058512683496607, 'samples': 6169344, 'steps': 32131, 'loss/train': 1.6814159154891968} -08/30/2021 19:03:14 - INFO - __main__ - Step 32133: {'lr': 0.00045058195937144446, 'samples': 6169536, 'steps': 32132, 'loss/train': 1.3760607242584229} -08/30/2021 19:03:14 - INFO - __main__ - Step 32134: {'lr': 0.00045057879181754375, 'samples': 6169728, 'steps': 32133, 'loss/train': 1.2447855472564697} -08/30/2021 19:03:15 - INFO - __main__ - Step 32135: {'lr': 0.0004505756241732653, 'samples': 6169920, 'steps': 32134, 'loss/train': 1.3355622291564941} -08/30/2021 19:03:15 - INFO - __main__ - Step 32136: {'lr': 0.0004505724564386106, 'samples': 6170112, 'steps': 32135, 'loss/train': 1.7124855518341064} -08/30/2021 19:03:17 - INFO - __main__ - Step 32137: {'lr': 0.00045056928861358106, 'samples': 6170304, 'steps': 32136, 'loss/train': 1.301585078239441} -08/30/2021 19:03:17 - INFO - __main__ - Step 32138: {'lr': 0.000450566120698178, 'samples': 6170496, 'steps': 32137, 'loss/train': 1.8446447849273682} -08/30/2021 19:03:17 - INFO - __main__ - Step 32139: {'lr': 0.0004505629526924031, 'samples': 6170688, 'steps': 32138, 'loss/train': 1.005651593208313} -08/30/2021 19:03:18 - INFO - __main__ - Step 32140: {'lr': 0.0004505597845962575, 'samples': 6170880, 'steps': 32139, 'loss/train': 1.6745375394821167} -08/30/2021 19:03:18 - INFO - __main__ - Step 32141: {'lr': 0.0004505566164097428, 'samples': 6171072, 'steps': 32140, 'loss/train': 1.7593958377838135} -08/30/2021 19:03:20 - INFO - __main__ - Step 32142: {'lr': 0.0004505534481328604, 'samples': 6171264, 'steps': 32141, 'loss/train': 1.1630038022994995} -08/30/2021 19:03:20 - INFO - __main__ - Step 32143: {'lr': 0.0004505502797656117, 'samples': 6171456, 'steps': 32142, 'loss/train': 1.2246348857879639} -08/30/2021 19:03:21 - INFO - __main__ - Step 32144: {'lr': 0.00045054711130799806, 'samples': 6171648, 'steps': 32143, 'loss/train': 1.1393463611602783} -08/30/2021 19:03:21 - INFO - __main__ - Step 32145: {'lr': 0.00045054394276002106, 'samples': 6171840, 'steps': 32144, 'loss/train': 1.0095564126968384} -08/30/2021 19:03:21 - INFO - __main__ - Step 32146: {'lr': 0.00045054077412168215, 'samples': 6172032, 'steps': 32145, 'loss/train': 0.8614693880081177} -08/30/2021 19:03:22 - INFO - __main__ - Step 32147: {'lr': 0.0004505376053929825, 'samples': 6172224, 'steps': 32146, 'loss/train': 1.3967212438583374} -08/30/2021 19:03:24 - INFO - __main__ - Step 32148: {'lr': 0.0004505344365739238, 'samples': 6172416, 'steps': 32147, 'loss/train': 1.4298518896102905} -08/30/2021 19:03:24 - INFO - __main__ - Step 32149: {'lr': 0.0004505312676645073, 'samples': 6172608, 'steps': 32148, 'loss/train': 1.7533395290374756} -08/30/2021 19:03:24 - INFO - __main__ - Step 32150: {'lr': 0.00045052809866473454, 'samples': 6172800, 'steps': 32149, 'loss/train': 1.2677139043807983} -08/30/2021 19:03:25 - INFO - __main__ - Step 32151: {'lr': 0.00045052492957460696, 'samples': 6172992, 'steps': 32150, 'loss/train': 2.278658390045166} -08/30/2021 19:03:25 - INFO - __main__ - Step 32152: {'lr': 0.00045052176039412587, 'samples': 6173184, 'steps': 32151, 'loss/train': 1.4786430597305298} -08/30/2021 19:03:25 - INFO - __main__ - Step 32153: {'lr': 0.0004505185911232928, 'samples': 6173376, 'steps': 32152, 'loss/train': 0.9608216881752014} -08/30/2021 19:03:27 - INFO - __main__ - Step 32154: {'lr': 0.00045051542176210914, 'samples': 6173568, 'steps': 32153, 'loss/train': 1.5493953227996826} -08/30/2021 19:03:28 - INFO - __main__ - Step 32155: {'lr': 0.0004505122523105764, 'samples': 6173760, 'steps': 32154, 'loss/train': 1.5346219539642334} -08/30/2021 19:03:28 - INFO - __main__ - Step 32156: {'lr': 0.00045050908276869585, 'samples': 6173952, 'steps': 32155, 'loss/train': 1.8279955387115479} -08/30/2021 19:03:28 - INFO - __main__ - Step 32157: {'lr': 0.0004505059131364689, 'samples': 6174144, 'steps': 32156, 'loss/train': 1.3577688932418823} -08/30/2021 19:03:29 - INFO - __main__ - Step 32158: {'lr': 0.00045050274341389726, 'samples': 6174336, 'steps': 32157, 'loss/train': 1.3958837985992432} -08/30/2021 19:03:31 - INFO - __main__ - Step 32159: {'lr': 0.00045049957360098207, 'samples': 6174528, 'steps': 32158, 'loss/train': 1.30253267288208} -08/30/2021 19:03:31 - INFO - __main__ - Step 32160: {'lr': 0.0004504964036977249, 'samples': 6174720, 'steps': 32159, 'loss/train': 3.0469815731048584} -08/30/2021 19:03:32 - INFO - __main__ - Step 32161: {'lr': 0.00045049323370412723, 'samples': 6174912, 'steps': 32160, 'loss/train': 1.4968340396881104} -08/30/2021 19:03:32 - INFO - __main__ - Step 32162: {'lr': 0.0004504900636201903, 'samples': 6175104, 'steps': 32161, 'loss/train': 1.395896315574646} -08/30/2021 19:03:32 - INFO - __main__ - Step 32163: {'lr': 0.00045048689344591566, 'samples': 6175296, 'steps': 32162, 'loss/train': 1.3904894590377808} -08/30/2021 19:03:34 - INFO - __main__ - Step 32164: {'lr': 0.0004504837231813047, 'samples': 6175488, 'steps': 32163, 'loss/train': 1.5604084730148315} -08/30/2021 19:03:34 - INFO - __main__ - Step 32165: {'lr': 0.0004504805528263589, 'samples': 6175680, 'steps': 32164, 'loss/train': 1.279072642326355} -08/30/2021 19:03:35 - INFO - __main__ - Step 32166: {'lr': 0.00045047738238107967, 'samples': 6175872, 'steps': 32165, 'loss/train': 1.3723299503326416} -08/30/2021 19:03:35 - INFO - __main__ - Step 32167: {'lr': 0.00045047421184546844, 'samples': 6176064, 'steps': 32166, 'loss/train': 1.8364002704620361} -08/30/2021 19:03:35 - INFO - __main__ - Step 32168: {'lr': 0.0004504710412195265, 'samples': 6176256, 'steps': 32167, 'loss/train': 1.8371309041976929} -08/30/2021 19:03:36 - INFO - __main__ - Step 32169: {'lr': 0.00045046787050325555, 'samples': 6176448, 'steps': 32168, 'loss/train': 1.905853509902954} -08/30/2021 19:03:37 - INFO - __main__ - Step 32170: {'lr': 0.0004504646996966568, 'samples': 6176640, 'steps': 32169, 'loss/train': 1.547277569770813} -08/30/2021 19:03:38 - INFO - __main__ - Step 32171: {'lr': 0.0004504615287997318, 'samples': 6176832, 'steps': 32170, 'loss/train': 1.544297456741333} -08/30/2021 19:03:38 - INFO - __main__ - Step 32172: {'lr': 0.00045045835781248184, 'samples': 6177024, 'steps': 32171, 'loss/train': 1.3578882217407227} -08/30/2021 19:03:38 - INFO - __main__ - Step 32173: {'lr': 0.0004504551867349085, 'samples': 6177216, 'steps': 32172, 'loss/train': 1.6245187520980835} -08/30/2021 19:03:40 - INFO - __main__ - Step 32174: {'lr': 0.0004504520155670131, 'samples': 6177408, 'steps': 32173, 'loss/train': 1.0880186557769775} -08/30/2021 19:03:40 - INFO - __main__ - Step 32175: {'lr': 0.0004504488443087972, 'samples': 6177600, 'steps': 32174, 'loss/train': 1.7720310688018799} -08/30/2021 19:03:41 - INFO - __main__ - Step 32176: {'lr': 0.00045044567296026206, 'samples': 6177792, 'steps': 32175, 'loss/train': 1.6322996616363525} -08/30/2021 19:03:41 - INFO - __main__ - Step 32177: {'lr': 0.0004504425015214092, 'samples': 6177984, 'steps': 32176, 'loss/train': 1.562922716140747} -08/30/2021 19:03:42 - INFO - __main__ - Step 32178: {'lr': 0.00045043932999224015, 'samples': 6178176, 'steps': 32177, 'loss/train': 1.3139508962631226} -08/30/2021 19:03:42 - INFO - __main__ - Step 32179: {'lr': 0.00045043615837275607, 'samples': 6178368, 'steps': 32178, 'loss/train': 1.8337661027908325} -08/30/2021 19:03:44 - INFO - __main__ - Step 32180: {'lr': 0.0004504329866629586, 'samples': 6178560, 'steps': 32179, 'loss/train': 1.4523018598556519} -08/30/2021 19:03:44 - INFO - __main__ - Step 32181: {'lr': 0.0004504298148628492, 'samples': 6178752, 'steps': 32180, 'loss/train': 1.5806210041046143} -08/30/2021 19:03:44 - INFO - __main__ - Step 32182: {'lr': 0.0004504266429724292, 'samples': 6178944, 'steps': 32181, 'loss/train': 0.7032216787338257} -08/30/2021 19:03:45 - INFO - __main__ - Step 32183: {'lr': 0.0004504234709917, 'samples': 6179136, 'steps': 32182, 'loss/train': 1.7409673929214478} -08/30/2021 19:03:45 - INFO - __main__ - Step 32184: {'lr': 0.00045042029892066306, 'samples': 6179328, 'steps': 32183, 'loss/train': 1.07532799243927} -08/30/2021 19:03:47 - INFO - __main__ - Step 32185: {'lr': 0.00045041712675931983, 'samples': 6179520, 'steps': 32184, 'loss/train': 1.0329475402832031} -08/30/2021 19:03:47 - INFO - __main__ - Step 32186: {'lr': 0.0004504139545076717, 'samples': 6179712, 'steps': 32185, 'loss/train': 0.66080242395401} -08/30/2021 19:03:47 - INFO - __main__ - Step 32187: {'lr': 0.0004504107821657203, 'samples': 6179904, 'steps': 32186, 'loss/train': 1.7955132722854614} -08/30/2021 19:03:48 - INFO - __main__ - Step 32188: {'lr': 0.00045040760973346673, 'samples': 6180096, 'steps': 32187, 'loss/train': 1.5316449403762817} -08/30/2021 19:03:48 - INFO - __main__ - Step 32189: {'lr': 0.00045040443721091266, 'samples': 6180288, 'steps': 32188, 'loss/train': 1.0864976644515991} -08/30/2021 19:03:50 - INFO - __main__ - Step 32190: {'lr': 0.0004504012645980594, 'samples': 6180480, 'steps': 32189, 'loss/train': 1.294631838798523} -08/30/2021 19:03:50 - INFO - __main__ - Step 32191: {'lr': 0.0004503980918949085, 'samples': 6180672, 'steps': 32190, 'loss/train': 1.7163926362991333} -08/30/2021 19:03:51 - INFO - __main__ - Step 32192: {'lr': 0.00045039491910146124, 'samples': 6180864, 'steps': 32191, 'loss/train': 1.713707447052002} -08/30/2021 19:03:51 - INFO - __main__ - Step 32193: {'lr': 0.00045039174621771915, 'samples': 6181056, 'steps': 32192, 'loss/train': 1.825025200843811} -08/30/2021 19:03:51 - INFO - __main__ - Step 32194: {'lr': 0.00045038857324368367, 'samples': 6181248, 'steps': 32193, 'loss/train': 1.7011688947677612} -08/30/2021 19:03:52 - INFO - __main__ - Step 32195: {'lr': 0.0004503854001793561, 'samples': 6181440, 'steps': 32194, 'loss/train': 1.7963701486587524} -08/30/2021 19:03:53 - INFO - __main__ - Step 32196: {'lr': 0.00045038222702473797, 'samples': 6181632, 'steps': 32195, 'loss/train': 2.0165152549743652} -08/30/2021 19:03:54 - INFO - __main__ - Step 32197: {'lr': 0.0004503790537798308, 'samples': 6181824, 'steps': 32196, 'loss/train': 0.3313131332397461} -08/30/2021 19:03:54 - INFO - __main__ - Step 32198: {'lr': 0.00045037588044463586, 'samples': 6182016, 'steps': 32197, 'loss/train': 0.11049621552228928} -08/30/2021 19:03:55 - INFO - __main__ - Step 32199: {'lr': 0.00045037270701915464, 'samples': 6182208, 'steps': 32198, 'loss/train': 1.2803524732589722} -08/30/2021 19:03:55 - INFO - __main__ - Step 32200: {'lr': 0.0004503695335033885, 'samples': 6182400, 'steps': 32199, 'loss/train': 0.9892556667327881} -08/30/2021 19:03:56 - INFO - __main__ - Step 32201: {'lr': 0.00045036635989733904, 'samples': 6182592, 'steps': 32200, 'loss/train': 0.8140304684638977} -08/30/2021 19:03:57 - INFO - __main__ - Step 32202: {'lr': 0.0004503631862010076, 'samples': 6182784, 'steps': 32201, 'loss/train': 1.8580771684646606} -08/30/2021 19:03:57 - INFO - __main__ - Step 32203: {'lr': 0.0004503600124143955, 'samples': 6182976, 'steps': 32202, 'loss/train': 1.266331434249878} -08/30/2021 19:03:58 - INFO - __main__ - Step 32204: {'lr': 0.0004503568385375043, 'samples': 6183168, 'steps': 32203, 'loss/train': 1.3279629945755005} -08/30/2021 19:03:58 - INFO - __main__ - Step 32205: {'lr': 0.00045035366457033546, 'samples': 6183360, 'steps': 32204, 'loss/train': 1.6388986110687256} -08/30/2021 19:03:59 - INFO - __main__ - Step 32206: {'lr': 0.00045035049051289037, 'samples': 6183552, 'steps': 32205, 'loss/train': 1.7536370754241943} -08/30/2021 19:04:00 - INFO - __main__ - Step 32207: {'lr': 0.00045034731636517036, 'samples': 6183744, 'steps': 32206, 'loss/train': 1.0209001302719116} -08/30/2021 19:04:00 - INFO - __main__ - Step 32208: {'lr': 0.0004503441421271769, 'samples': 6183936, 'steps': 32207, 'loss/train': 1.4281094074249268} -08/30/2021 19:04:01 - INFO - __main__ - Step 32209: {'lr': 0.0004503409677989115, 'samples': 6184128, 'steps': 32208, 'loss/train': 0.953923761844635} -08/30/2021 19:04:01 - INFO - __main__ - Step 32210: {'lr': 0.00045033779338037565, 'samples': 6184320, 'steps': 32209, 'loss/train': 1.758366346359253} -08/30/2021 19:04:02 - INFO - __main__ - Step 32211: {'lr': 0.0004503346188715706, 'samples': 6184512, 'steps': 32210, 'loss/train': 1.7811731100082397} -08/30/2021 19:04:03 - INFO - __main__ - Step 32212: {'lr': 0.0004503314442724979, 'samples': 6184704, 'steps': 32211, 'loss/train': 1.2624577283859253} -08/30/2021 19:04:03 - INFO - __main__ - Step 32213: {'lr': 0.0004503282695831589, 'samples': 6184896, 'steps': 32212, 'loss/train': 1.461298942565918} -08/30/2021 19:04:04 - INFO - __main__ - Step 32214: {'lr': 0.0004503250948035551, 'samples': 6185088, 'steps': 32213, 'loss/train': 1.3856780529022217} -08/30/2021 19:04:04 - INFO - __main__ - Step 32215: {'lr': 0.0004503219199336879, 'samples': 6185280, 'steps': 32214, 'loss/train': 1.2113443613052368} -08/30/2021 19:04:06 - INFO - __main__ - Step 32216: {'lr': 0.00045031874497355876, 'samples': 6185472, 'steps': 32215, 'loss/train': 2.051064968109131} -08/30/2021 19:04:07 - INFO - __main__ - Step 32217: {'lr': 0.000450315569923169, 'samples': 6185664, 'steps': 32216, 'loss/train': 1.9358235597610474} -08/30/2021 19:04:07 - INFO - __main__ - Step 32218: {'lr': 0.00045031239478252017, 'samples': 6185856, 'steps': 32217, 'loss/train': 1.1065044403076172} -08/30/2021 19:04:07 - INFO - __main__ - Step 32219: {'lr': 0.00045030921955161373, 'samples': 6186048, 'steps': 32218, 'loss/train': 1.314040184020996} -08/30/2021 19:04:08 - INFO - __main__ - Step 32220: {'lr': 0.000450306044230451, 'samples': 6186240, 'steps': 32219, 'loss/train': 0.8560385704040527} -08/30/2021 19:04:08 - INFO - __main__ - Step 32221: {'lr': 0.0004503028688190335, 'samples': 6186432, 'steps': 32220, 'loss/train': 1.723817229270935} -08/30/2021 19:04:10 - INFO - __main__ - Step 32222: {'lr': 0.00045029969331736254, 'samples': 6186624, 'steps': 32221, 'loss/train': 1.112336277961731} -08/30/2021 19:04:10 - INFO - __main__ - Step 32223: {'lr': 0.00045029651772543965, 'samples': 6186816, 'steps': 32222, 'loss/train': 1.5397037267684937} -08/30/2021 19:04:11 - INFO - __main__ - Step 32224: {'lr': 0.0004502933420432662, 'samples': 6187008, 'steps': 32223, 'loss/train': 0.10595818608999252} -08/30/2021 19:04:11 - INFO - __main__ - Step 32225: {'lr': 0.0004502901662708437, 'samples': 6187200, 'steps': 32224, 'loss/train': 1.8684959411621094} -08/30/2021 19:04:11 - INFO - __main__ - Step 32226: {'lr': 0.0004502869904081736, 'samples': 6187392, 'steps': 32225, 'loss/train': 1.5043412446975708} -08/30/2021 19:04:13 - INFO - __main__ - Step 32227: {'lr': 0.00045028381445525725, 'samples': 6187584, 'steps': 32226, 'loss/train': 1.1438548564910889} -08/30/2021 19:04:13 - INFO - __main__ - Step 32228: {'lr': 0.0004502806384120961, 'samples': 6187776, 'steps': 32227, 'loss/train': 0.6093456745147705} -08/30/2021 19:04:14 - INFO - __main__ - Step 32229: {'lr': 0.0004502774622786915, 'samples': 6187968, 'steps': 32228, 'loss/train': 1.0948002338409424} -08/30/2021 19:04:14 - INFO - __main__ - Step 32230: {'lr': 0.00045027428605504507, 'samples': 6188160, 'steps': 32229, 'loss/train': 1.5128430128097534} -08/30/2021 19:04:14 - INFO - __main__ - Step 32231: {'lr': 0.00045027110974115814, 'samples': 6188352, 'steps': 32230, 'loss/train': 1.4795303344726562} -08/30/2021 19:04:17 - INFO - __main__ - Step 32232: {'lr': 0.0004502679333370321, 'samples': 6188544, 'steps': 32231, 'loss/train': 1.8321692943572998} -08/30/2021 19:04:17 - INFO - __main__ - Step 32233: {'lr': 0.0004502647568426684, 'samples': 6188736, 'steps': 32232, 'loss/train': 1.2319809198379517} -08/30/2021 19:04:17 - INFO - __main__ - Step 32234: {'lr': 0.0004502615802580685, 'samples': 6188928, 'steps': 32233, 'loss/train': 0.9736570715904236} -08/30/2021 19:04:18 - INFO - __main__ - Step 32235: {'lr': 0.0004502584035832338, 'samples': 6189120, 'steps': 32234, 'loss/train': 1.2968236207962036} -08/30/2021 19:04:18 - INFO - __main__ - Step 32236: {'lr': 0.00045025522681816586, 'samples': 6189312, 'steps': 32235, 'loss/train': 1.3304810523986816} -08/30/2021 19:04:19 - INFO - __main__ - Step 32237: {'lr': 0.0004502520499628659, 'samples': 6189504, 'steps': 32236, 'loss/train': 1.0280253887176514} -08/30/2021 19:04:20 - INFO - __main__ - Step 32238: {'lr': 0.00045024887301733555, 'samples': 6189696, 'steps': 32237, 'loss/train': 0.15719056129455566} -08/30/2021 19:04:20 - INFO - __main__ - Step 32239: {'lr': 0.0004502456959815761, 'samples': 6189888, 'steps': 32238, 'loss/train': 1.4826220273971558} -08/30/2021 19:04:21 - INFO - __main__ - Step 32240: {'lr': 0.000450242518855589, 'samples': 6190080, 'steps': 32239, 'loss/train': 1.3655624389648438} -08/30/2021 19:04:21 - INFO - __main__ - Step 32241: {'lr': 0.00045023934163937565, 'samples': 6190272, 'steps': 32240, 'loss/train': 1.304955244064331} -08/30/2021 19:04:21 - INFO - __main__ - Step 32242: {'lr': 0.00045023616433293763, 'samples': 6190464, 'steps': 32241, 'loss/train': 1.8752590417861938} -08/30/2021 19:04:23 - INFO - __main__ - Step 32243: {'lr': 0.00045023298693627626, 'samples': 6190656, 'steps': 32242, 'loss/train': 1.9656401872634888} -08/30/2021 19:04:23 - INFO - __main__ - Step 32244: {'lr': 0.000450229809449393, 'samples': 6190848, 'steps': 32243, 'loss/train': 1.1609612703323364} -08/30/2021 19:04:24 - INFO - __main__ - Step 32245: {'lr': 0.00045022663187228927, 'samples': 6191040, 'steps': 32244, 'loss/train': 1.9598662853240967} -08/30/2021 19:04:24 - INFO - __main__ - Step 32246: {'lr': 0.0004502234542049666, 'samples': 6191232, 'steps': 32245, 'loss/train': 1.390787959098816} -08/30/2021 19:04:24 - INFO - __main__ - Step 32247: {'lr': 0.00045022027644742624, 'samples': 6191424, 'steps': 32246, 'loss/train': 1.2588329315185547} -08/30/2021 19:04:26 - INFO - __main__ - Step 32248: {'lr': 0.0004502170985996697, 'samples': 6191616, 'steps': 32247, 'loss/train': 1.6045222282409668} -08/30/2021 19:04:27 - INFO - __main__ - Step 32249: {'lr': 0.00045021392066169844, 'samples': 6191808, 'steps': 32248, 'loss/train': 1.5523520708084106} -08/30/2021 19:04:27 - INFO - __main__ - Step 32250: {'lr': 0.0004502107426335139, 'samples': 6192000, 'steps': 32249, 'loss/train': 0.8603515625} -08/30/2021 19:04:27 - INFO - __main__ - Step 32251: {'lr': 0.0004502075645151175, 'samples': 6192192, 'steps': 32250, 'loss/train': 1.7081907987594604} -08/30/2021 19:04:28 - INFO - __main__ - Step 32252: {'lr': 0.0004502043863065106, 'samples': 6192384, 'steps': 32251, 'loss/train': 0.9449916481971741} -08/30/2021 19:04:28 - INFO - __main__ - Step 32253: {'lr': 0.00045020120800769474, 'samples': 6192576, 'steps': 32252, 'loss/train': 1.5930087566375732} -08/30/2021 19:04:29 - INFO - __main__ - Step 32254: {'lr': 0.0004501980296186713, 'samples': 6192768, 'steps': 32253, 'loss/train': 1.470438003540039} -08/30/2021 19:04:30 - INFO - __main__ - Step 32255: {'lr': 0.0004501948511394417, 'samples': 6192960, 'steps': 32254, 'loss/train': 1.4525355100631714} -08/30/2021 19:04:30 - INFO - __main__ - Step 32256: {'lr': 0.0004501916725700074, 'samples': 6193152, 'steps': 32255, 'loss/train': 1.394317626953125} -08/30/2021 19:04:31 - INFO - __main__ - Step 32257: {'lr': 0.00045018849391036987, 'samples': 6193344, 'steps': 32256, 'loss/train': 1.58014976978302} -08/30/2021 19:04:31 - INFO - __main__ - Step 32258: {'lr': 0.00045018531516053046, 'samples': 6193536, 'steps': 32257, 'loss/train': 0.9133492708206177} -08/30/2021 19:04:32 - INFO - __main__ - Step 32259: {'lr': 0.0004501821363204906, 'samples': 6193728, 'steps': 32258, 'loss/train': 1.1269924640655518} -08/30/2021 19:04:33 - INFO - __main__ - Step 32260: {'lr': 0.00045017895739025185, 'samples': 6193920, 'steps': 32259, 'loss/train': 1.0067967176437378} -08/30/2021 19:04:33 - INFO - __main__ - Step 32261: {'lr': 0.0004501757783698154, 'samples': 6194112, 'steps': 32260, 'loss/train': 1.3653923273086548} -08/30/2021 19:04:33 - INFO - __main__ - Step 32262: {'lr': 0.00045017259925918295, 'samples': 6194304, 'steps': 32261, 'loss/train': 0.9848375916481018} -08/30/2021 19:04:34 - INFO - __main__ - Step 32263: {'lr': 0.0004501694200583558, 'samples': 6194496, 'steps': 32262, 'loss/train': 1.7003496885299683} -08/30/2021 19:04:35 - INFO - __main__ - Step 32264: {'lr': 0.0004501662407673354, 'samples': 6194688, 'steps': 32263, 'loss/train': 1.3231052160263062} -08/30/2021 19:04:36 - INFO - __main__ - Step 32265: {'lr': 0.00045016306138612313, 'samples': 6194880, 'steps': 32264, 'loss/train': 1.0903302431106567} -08/30/2021 19:04:36 - INFO - __main__ - Step 32266: {'lr': 0.0004501598819147205, 'samples': 6195072, 'steps': 32265, 'loss/train': 1.4201833009719849} -08/30/2021 19:04:36 - INFO - __main__ - Step 32267: {'lr': 0.00045015670235312895, 'samples': 6195264, 'steps': 32266, 'loss/train': 2.0665924549102783} -08/30/2021 19:04:37 - INFO - __main__ - Step 32268: {'lr': 0.0004501535227013498, 'samples': 6195456, 'steps': 32267, 'loss/train': 1.9269461631774902} -08/30/2021 19:04:39 - INFO - __main__ - Step 32269: {'lr': 0.0004501503429593846, 'samples': 6195648, 'steps': 32268, 'loss/train': 1.0294262170791626} -08/30/2021 19:04:39 - INFO - __main__ - Step 32270: {'lr': 0.0004501471631272348, 'samples': 6195840, 'steps': 32269, 'loss/train': 1.0452120304107666} -08/30/2021 19:04:40 - INFO - __main__ - Step 32271: {'lr': 0.00045014398320490173, 'samples': 6196032, 'steps': 32270, 'loss/train': 1.3407011032104492} -08/30/2021 19:04:40 - INFO - __main__ - Step 32272: {'lr': 0.00045014080319238686, 'samples': 6196224, 'steps': 32271, 'loss/train': 1.2327735424041748} -08/30/2021 19:04:40 - INFO - __main__ - Step 32273: {'lr': 0.00045013762308969164, 'samples': 6196416, 'steps': 32272, 'loss/train': 1.2885394096374512} -08/30/2021 19:04:41 - INFO - __main__ - Step 32274: {'lr': 0.00045013444289681757, 'samples': 6196608, 'steps': 32273, 'loss/train': 1.5427135229110718} -08/30/2021 19:04:42 - INFO - __main__ - Step 32275: {'lr': 0.0004501312626137659, 'samples': 6196800, 'steps': 32274, 'loss/train': 1.1621025800704956} -08/30/2021 19:04:43 - INFO - __main__ - Step 32276: {'lr': 0.0004501280822405382, 'samples': 6196992, 'steps': 32275, 'loss/train': 1.6799015998840332} -08/30/2021 19:04:43 - INFO - __main__ - Step 32277: {'lr': 0.00045012490177713586, 'samples': 6197184, 'steps': 32276, 'loss/train': 1.6742160320281982} -08/30/2021 19:04:43 - INFO - __main__ - Step 32278: {'lr': 0.00045012172122356036, 'samples': 6197376, 'steps': 32277, 'loss/train': 0.9062545299530029} -08/30/2021 19:04:44 - INFO - __main__ - Step 32279: {'lr': 0.0004501185405798131, 'samples': 6197568, 'steps': 32278, 'loss/train': 1.3616219758987427} -08/30/2021 19:04:45 - INFO - __main__ - Step 32280: {'lr': 0.00045011535984589544, 'samples': 6197760, 'steps': 32279, 'loss/train': 1.1179317235946655} -08/30/2021 19:04:46 - INFO - __main__ - Step 32281: {'lr': 0.000450112179021809, 'samples': 6197952, 'steps': 32280, 'loss/train': 1.7102910280227661} -08/30/2021 19:04:46 - INFO - __main__ - Step 32282: {'lr': 0.00045010899810755506, 'samples': 6198144, 'steps': 32281, 'loss/train': 1.355440378189087} -08/30/2021 19:04:46 - INFO - __main__ - Step 32283: {'lr': 0.00045010581710313506, 'samples': 6198336, 'steps': 32282, 'loss/train': 1.5274758338928223} -08/30/2021 19:04:47 - INFO - __main__ - Step 32284: {'lr': 0.0004501026360085505, 'samples': 6198528, 'steps': 32283, 'loss/train': 1.785041332244873} -08/30/2021 19:04:48 - INFO - __main__ - Step 32285: {'lr': 0.0004500994548238028, 'samples': 6198720, 'steps': 32284, 'loss/train': 1.2113220691680908} -08/30/2021 19:04:49 - INFO - __main__ - Step 32286: {'lr': 0.00045009627354889337, 'samples': 6198912, 'steps': 32285, 'loss/train': 0.9600415825843811} -08/30/2021 19:04:49 - INFO - __main__ - Step 32287: {'lr': 0.0004500930921838236, 'samples': 6199104, 'steps': 32286, 'loss/train': 1.620591640472412} -08/30/2021 19:04:49 - INFO - __main__ - Step 32288: {'lr': 0.000450089910728595, 'samples': 6199296, 'steps': 32287, 'loss/train': 1.697812795639038} -08/30/2021 19:04:50 - INFO - __main__ - Step 32289: {'lr': 0.0004500867291832089, 'samples': 6199488, 'steps': 32288, 'loss/train': 1.4883240461349487} -08/30/2021 19:04:51 - INFO - __main__ - Step 32290: {'lr': 0.00045008354754766687, 'samples': 6199680, 'steps': 32289, 'loss/train': 1.4518771171569824} -08/30/2021 19:04:52 - INFO - __main__ - Step 32291: {'lr': 0.0004500803658219703, 'samples': 6199872, 'steps': 32290, 'loss/train': 1.5694080591201782} -08/30/2021 19:04:52 - INFO - __main__ - Step 32292: {'lr': 0.0004500771840061206, 'samples': 6200064, 'steps': 32291, 'loss/train': 1.7950413227081299} -08/30/2021 19:04:52 - INFO - __main__ - Step 32293: {'lr': 0.00045007400210011925, 'samples': 6200256, 'steps': 32292, 'loss/train': 1.6159052848815918} -08/30/2021 19:04:53 - INFO - __main__ - Step 32294: {'lr': 0.0004500708201039676, 'samples': 6200448, 'steps': 32293, 'loss/train': 1.9774682521820068} -08/30/2021 19:04:54 - INFO - __main__ - Step 32295: {'lr': 0.0004500676380176671, 'samples': 6200640, 'steps': 32294, 'loss/train': 2.228645086288452} -08/30/2021 19:04:55 - INFO - __main__ - Step 32296: {'lr': 0.00045006445584121923, 'samples': 6200832, 'steps': 32295, 'loss/train': 1.2370656728744507} -08/30/2021 19:04:55 - INFO - __main__ - Step 32297: {'lr': 0.00045006127357462533, 'samples': 6201024, 'steps': 32296, 'loss/train': 0.9634670615196228} -08/30/2021 19:04:55 - INFO - __main__ - Step 32298: {'lr': 0.000450058091217887, 'samples': 6201216, 'steps': 32297, 'loss/train': 1.016331434249878} -08/30/2021 19:04:56 - INFO - __main__ - Step 32299: {'lr': 0.0004500549087710056, 'samples': 6201408, 'steps': 32298, 'loss/train': 1.5722503662109375} -08/30/2021 19:04:57 - INFO - __main__ - Step 32300: {'lr': 0.0004500517262339825, 'samples': 6201600, 'steps': 32299, 'loss/train': 1.2954716682434082} -08/30/2021 19:04:58 - INFO - __main__ - Step 32301: {'lr': 0.0004500485436068191, 'samples': 6201792, 'steps': 32300, 'loss/train': 1.697182059288025} -08/30/2021 19:04:58 - INFO - __main__ - Step 32302: {'lr': 0.0004500453608895171, 'samples': 6201984, 'steps': 32301, 'loss/train': 1.104217290878296} -08/30/2021 19:04:58 - INFO - __main__ - Step 32303: {'lr': 0.00045004217808207757, 'samples': 6202176, 'steps': 32302, 'loss/train': 1.3325445652008057} -08/30/2021 19:04:59 - INFO - __main__ - Step 32304: {'lr': 0.0004500389951845022, 'samples': 6202368, 'steps': 32303, 'loss/train': 0.8305303454399109} -08/30/2021 19:05:00 - INFO - __main__ - Step 32305: {'lr': 0.00045003581219679235, 'samples': 6202560, 'steps': 32304, 'loss/train': 1.7760523557662964} -08/30/2021 19:05:01 - INFO - __main__ - Step 32306: {'lr': 0.00045003262911894943, 'samples': 6202752, 'steps': 32305, 'loss/train': 1.6123363971710205} -08/30/2021 19:05:01 - INFO - __main__ - Step 32307: {'lr': 0.00045002944595097494, 'samples': 6202944, 'steps': 32306, 'loss/train': 1.5623363256454468} -08/30/2021 19:05:02 - INFO - __main__ - Step 32308: {'lr': 0.00045002626269287024, 'samples': 6203136, 'steps': 32307, 'loss/train': 1.1931275129318237} -08/30/2021 19:05:02 - INFO - __main__ - Step 32309: {'lr': 0.00045002307934463673, 'samples': 6203328, 'steps': 32308, 'loss/train': 1.2309906482696533} -08/30/2021 19:05:03 - INFO - __main__ - Step 32310: {'lr': 0.000450019895906276, 'samples': 6203520, 'steps': 32309, 'loss/train': 1.2578767538070679} -08/30/2021 19:05:04 - INFO - __main__ - Step 32311: {'lr': 0.0004500167123777894, 'samples': 6203712, 'steps': 32310, 'loss/train': 1.2556978464126587} -08/30/2021 19:05:04 - INFO - __main__ - Step 32312: {'lr': 0.00045001352875917824, 'samples': 6203904, 'steps': 32311, 'loss/train': 1.2942194938659668} -08/30/2021 19:05:05 - INFO - __main__ - Step 32313: {'lr': 0.00045001034505044415, 'samples': 6204096, 'steps': 32312, 'loss/train': 1.7812371253967285} -08/30/2021 19:05:05 - INFO - __main__ - Step 32314: {'lr': 0.00045000716125158846, 'samples': 6204288, 'steps': 32313, 'loss/train': 0.655072033405304} -08/30/2021 19:05:07 - INFO - __main__ - Step 32315: {'lr': 0.0004500039773626127, 'samples': 6204480, 'steps': 32314, 'loss/train': 1.0961158275604248} -08/30/2021 19:05:07 - INFO - __main__ - Step 32316: {'lr': 0.00045000079338351805, 'samples': 6204672, 'steps': 32315, 'loss/train': 1.4331393241882324} -08/30/2021 19:05:07 - INFO - __main__ - Step 32317: {'lr': 0.0004499976093143063, 'samples': 6204864, 'steps': 32316, 'loss/train': 1.7492982149124146} -08/30/2021 19:05:08 - INFO - __main__ - Step 32318: {'lr': 0.00044999442515497866, 'samples': 6205056, 'steps': 32317, 'loss/train': 1.6471707820892334} -08/30/2021 19:05:08 - INFO - __main__ - Step 32319: {'lr': 0.0004499912409055367, 'samples': 6205248, 'steps': 32318, 'loss/train': 1.87456214427948} -08/30/2021 19:05:08 - INFO - __main__ - Step 32320: {'lr': 0.0004499880565659816, 'samples': 6205440, 'steps': 32319, 'loss/train': 1.618486762046814} -08/30/2021 19:05:10 - INFO - __main__ - Step 32321: {'lr': 0.0004499848721363151, 'samples': 6205632, 'steps': 32320, 'loss/train': 2.046422243118286} -08/30/2021 19:05:10 - INFO - __main__ - Step 32322: {'lr': 0.0004499816876165385, 'samples': 6205824, 'steps': 32321, 'loss/train': 1.8166916370391846} -08/30/2021 19:05:11 - INFO - __main__ - Step 32323: {'lr': 0.0004499785030066532, 'samples': 6206016, 'steps': 32322, 'loss/train': 1.499638557434082} -08/30/2021 19:05:11 - INFO - __main__ - Step 32324: {'lr': 0.00044997531830666073, 'samples': 6206208, 'steps': 32323, 'loss/train': 1.3961131572723389} -08/30/2021 19:05:12 - INFO - __main__ - Step 32325: {'lr': 0.00044997213351656237, 'samples': 6206400, 'steps': 32324, 'loss/train': 1.3398165702819824} -08/30/2021 19:05:13 - INFO - __main__ - Step 32326: {'lr': 0.00044996894863635965, 'samples': 6206592, 'steps': 32325, 'loss/train': 1.6897411346435547} -08/30/2021 19:05:14 - INFO - __main__ - Step 32327: {'lr': 0.00044996576366605415, 'samples': 6206784, 'steps': 32326, 'loss/train': 1.694573163986206} -08/30/2021 19:05:14 - INFO - __main__ - Step 32328: {'lr': 0.00044996257860564705, 'samples': 6206976, 'steps': 32327, 'loss/train': 0.9707368016242981} -08/30/2021 19:05:15 - INFO - __main__ - Step 32329: {'lr': 0.0004499593934551399, 'samples': 6207168, 'steps': 32328, 'loss/train': 1.1863114833831787} -08/30/2021 19:05:15 - INFO - __main__ - Step 32330: {'lr': 0.00044995620821453416, 'samples': 6207360, 'steps': 32329, 'loss/train': 1.5414466857910156} -08/30/2021 19:05:15 - INFO - __main__ - Step 32331: {'lr': 0.00044995302288383123, 'samples': 6207552, 'steps': 32330, 'loss/train': 1.4557552337646484} -08/30/2021 19:05:17 - INFO - __main__ - Step 32332: {'lr': 0.0004499498374630325, 'samples': 6207744, 'steps': 32331, 'loss/train': 1.3470616340637207} -08/30/2021 19:05:17 - INFO - __main__ - Step 32333: {'lr': 0.0004499466519521396, 'samples': 6207936, 'steps': 32332, 'loss/train': 1.6630051136016846} -08/30/2021 19:05:18 - INFO - __main__ - Step 32334: {'lr': 0.00044994346635115367, 'samples': 6208128, 'steps': 32333, 'loss/train': 1.2623929977416992} -08/30/2021 19:05:18 - INFO - __main__ - Step 32335: {'lr': 0.00044994028066007636, 'samples': 6208320, 'steps': 32334, 'loss/train': 1.2785216569900513} -08/30/2021 19:05:18 - INFO - __main__ - Step 32336: {'lr': 0.00044993709487890906, 'samples': 6208512, 'steps': 32335, 'loss/train': 1.877227783203125} -08/30/2021 19:05:20 - INFO - __main__ - Step 32337: {'lr': 0.0004499339090076532, 'samples': 6208704, 'steps': 32336, 'loss/train': 1.3354116678237915} -08/30/2021 19:05:21 - INFO - __main__ - Step 32338: {'lr': 0.0004499307230463102, 'samples': 6208896, 'steps': 32337, 'loss/train': 1.001396656036377} -08/30/2021 19:05:21 - INFO - __main__ - Step 32339: {'lr': 0.0004499275369948814, 'samples': 6209088, 'steps': 32338, 'loss/train': 1.76034677028656} -08/30/2021 19:05:21 - INFO - __main__ - Step 32340: {'lr': 0.0004499243508533685, 'samples': 6209280, 'steps': 32339, 'loss/train': 1.459526538848877} -08/30/2021 19:05:22 - INFO - __main__ - Step 32341: {'lr': 0.0004499211646217727, 'samples': 6209472, 'steps': 32340, 'loss/train': 1.0437450408935547} -08/30/2021 19:05:24 - INFO - __main__ - Step 32342: {'lr': 0.00044991797830009543, 'samples': 6209664, 'steps': 32341, 'loss/train': 1.3831251859664917} -08/30/2021 19:05:24 - INFO - __main__ - Step 32343: {'lr': 0.00044991479188833826, 'samples': 6209856, 'steps': 32342, 'loss/train': 1.2098065614700317} -08/30/2021 19:05:24 - INFO - __main__ - Step 32344: {'lr': 0.0004499116053865026, 'samples': 6210048, 'steps': 32343, 'loss/train': 1.765133261680603} -08/30/2021 19:05:25 - INFO - __main__ - Step 32345: {'lr': 0.0004499084187945899, 'samples': 6210240, 'steps': 32344, 'loss/train': 1.629771113395691} -08/30/2021 19:05:25 - INFO - __main__ - Step 32346: {'lr': 0.0004499052321126015, 'samples': 6210432, 'steps': 32345, 'loss/train': 1.3455970287322998} -08/30/2021 19:05:26 - INFO - __main__ - Step 32347: {'lr': 0.0004499020453405388, 'samples': 6210624, 'steps': 32346, 'loss/train': 2.2916319370269775} -08/30/2021 19:05:27 - INFO - __main__ - Step 32348: {'lr': 0.00044989885847840344, 'samples': 6210816, 'steps': 32347, 'loss/train': 1.4424232244491577} -08/30/2021 19:05:27 - INFO - __main__ - Step 32349: {'lr': 0.0004498956715261967, 'samples': 6211008, 'steps': 32348, 'loss/train': 1.686930775642395} -08/30/2021 19:05:28 - INFO - __main__ - Step 32350: {'lr': 0.00044989248448392007, 'samples': 6211200, 'steps': 32349, 'loss/train': 1.4522360563278198} -08/30/2021 19:05:28 - INFO - __main__ - Step 32351: {'lr': 0.000449889297351575, 'samples': 6211392, 'steps': 32350, 'loss/train': 1.6329680681228638} -08/30/2021 19:05:29 - INFO - __main__ - Step 32352: {'lr': 0.0004498861101291628, 'samples': 6211584, 'steps': 32351, 'loss/train': 1.6544710397720337} -08/30/2021 19:05:30 - INFO - __main__ - Step 32353: {'lr': 0.0004498829228166851, 'samples': 6211776, 'steps': 32352, 'loss/train': 1.9228895902633667} -08/30/2021 19:05:30 - INFO - __main__ - Step 32354: {'lr': 0.0004498797354141432, 'samples': 6211968, 'steps': 32353, 'loss/train': 1.1937665939331055} -08/30/2021 19:05:31 - INFO - __main__ - Step 32355: {'lr': 0.00044987654792153853, 'samples': 6212160, 'steps': 32354, 'loss/train': 1.3680614233016968} -08/30/2021 19:05:31 - INFO - __main__ - Step 32356: {'lr': 0.0004498733603388726, 'samples': 6212352, 'steps': 32355, 'loss/train': 1.1955623626708984} -08/30/2021 19:05:31 - INFO - __main__ - Step 32357: {'lr': 0.00044987017266614684, 'samples': 6212544, 'steps': 32356, 'loss/train': 1.751094102859497} -08/30/2021 19:05:33 - INFO - __main__ - Step 32358: {'lr': 0.00044986698490336263, 'samples': 6212736, 'steps': 32357, 'loss/train': 1.5925571918487549} -08/30/2021 19:05:33 - INFO - __main__ - Step 32359: {'lr': 0.0004498637970505215, 'samples': 6212928, 'steps': 32358, 'loss/train': 0.42507418990135193} -08/30/2021 19:05:34 - INFO - __main__ - Step 32360: {'lr': 0.0004498606091076248, 'samples': 6213120, 'steps': 32359, 'loss/train': 1.2136996984481812} -08/30/2021 19:05:34 - INFO - __main__ - Step 32361: {'lr': 0.000449857421074674, 'samples': 6213312, 'steps': 32360, 'loss/train': 0.5065601468086243} -08/30/2021 19:05:34 - INFO - __main__ - Step 32362: {'lr': 0.0004498542329516705, 'samples': 6213504, 'steps': 32361, 'loss/train': 0.4492747187614441} -08/30/2021 19:05:36 - INFO - __main__ - Step 32363: {'lr': 0.00044985104473861583, 'samples': 6213696, 'steps': 32362, 'loss/train': 0.775355875492096} -08/30/2021 19:05:36 - INFO - __main__ - Step 32364: {'lr': 0.0004498478564355113, 'samples': 6213888, 'steps': 32363, 'loss/train': 1.3830183744430542} -08/30/2021 19:05:37 - INFO - __main__ - Step 32365: {'lr': 0.0004498446680423584, 'samples': 6214080, 'steps': 32364, 'loss/train': 1.978040337562561} -08/30/2021 19:05:37 - INFO - __main__ - Step 32366: {'lr': 0.0004498414795591586, 'samples': 6214272, 'steps': 32365, 'loss/train': 1.566407322883606} -08/30/2021 19:05:38 - INFO - __main__ - Step 32367: {'lr': 0.00044983829098591336, 'samples': 6214464, 'steps': 32366, 'loss/train': 1.6484313011169434} -08/30/2021 19:05:38 - INFO - __main__ - Step 32368: {'lr': 0.00044983510232262405, 'samples': 6214656, 'steps': 32367, 'loss/train': 1.1499813795089722} -08/30/2021 19:05:39 - INFO - __main__ - Step 32369: {'lr': 0.0004498319135692921, 'samples': 6214848, 'steps': 32368, 'loss/train': 0.07914281636476517} -08/30/2021 19:05:40 - INFO - __main__ - Step 32370: {'lr': 0.00044982872472591897, 'samples': 6215040, 'steps': 32369, 'loss/train': 1.7727489471435547} -08/30/2021 19:05:40 - INFO - __main__ - Step 32371: {'lr': 0.00044982553579250606, 'samples': 6215232, 'steps': 32370, 'loss/train': 1.999704360961914} -08/30/2021 19:05:41 - INFO - __main__ - Step 32372: {'lr': 0.0004498223467690549, 'samples': 6215424, 'steps': 32371, 'loss/train': 0.9826949834823608} -08/30/2021 19:05:41 - INFO - __main__ - Step 32373: {'lr': 0.0004498191576555669, 'samples': 6215616, 'steps': 32372, 'loss/train': 1.6569430828094482} -08/30/2021 19:05:43 - INFO - __main__ - Step 32374: {'lr': 0.00044981596845204344, 'samples': 6215808, 'steps': 32373, 'loss/train': 0.6701174974441528} -08/30/2021 19:05:43 - INFO - __main__ - Step 32375: {'lr': 0.00044981277915848595, 'samples': 6216000, 'steps': 32374, 'loss/train': 1.1777806282043457} -08/30/2021 19:05:44 - INFO - __main__ - Step 32376: {'lr': 0.00044980958977489593, 'samples': 6216192, 'steps': 32375, 'loss/train': 1.3061331510543823} -08/30/2021 19:05:44 - INFO - __main__ - Step 32377: {'lr': 0.00044980640030127484, 'samples': 6216384, 'steps': 32376, 'loss/train': 1.466526746749878} -08/30/2021 19:05:45 - INFO - __main__ - Step 32378: {'lr': 0.00044980321073762405, 'samples': 6216576, 'steps': 32377, 'loss/train': 1.1577993631362915} -08/30/2021 19:05:46 - INFO - __main__ - Step 32379: {'lr': 0.00044980002108394496, 'samples': 6216768, 'steps': 32378, 'loss/train': 1.4330931901931763} -08/30/2021 19:05:46 - INFO - __main__ - Step 32380: {'lr': 0.0004497968313402391, 'samples': 6216960, 'steps': 32379, 'loss/train': 0.7249764800071716} -08/30/2021 19:05:47 - INFO - __main__ - Step 32381: {'lr': 0.00044979364150650794, 'samples': 6217152, 'steps': 32380, 'loss/train': 1.683530569076538} -08/30/2021 19:05:47 - INFO - __main__ - Step 32382: {'lr': 0.00044979045158275273, 'samples': 6217344, 'steps': 32381, 'loss/train': 1.51314377784729} -08/30/2021 19:05:48 - INFO - __main__ - Step 32383: {'lr': 0.0004497872615689751, 'samples': 6217536, 'steps': 32382, 'loss/train': 0.9352617859840393} -08/30/2021 19:05:49 - INFO - __main__ - Step 32384: {'lr': 0.00044978407146517634, 'samples': 6217728, 'steps': 32383, 'loss/train': 1.4616782665252686} -08/30/2021 19:05:50 - INFO - __main__ - Step 32385: {'lr': 0.0004497808812713581, 'samples': 6217920, 'steps': 32384, 'loss/train': 1.418293833732605} -08/30/2021 19:05:50 - INFO - __main__ - Step 32386: {'lr': 0.00044977769098752154, 'samples': 6218112, 'steps': 32385, 'loss/train': 1.1720964908599854} -08/30/2021 19:05:50 - INFO - __main__ - Step 32387: {'lr': 0.0004497745006136683, 'samples': 6218304, 'steps': 32386, 'loss/train': 1.2890551090240479} -08/30/2021 19:05:51 - INFO - __main__ - Step 32388: {'lr': 0.00044977131014979974, 'samples': 6218496, 'steps': 32387, 'loss/train': 1.3431979417800903} -08/30/2021 19:05:52 - INFO - __main__ - Step 32389: {'lr': 0.0004497681195959173, 'samples': 6218688, 'steps': 32388, 'loss/train': 1.47535240650177} -08/30/2021 19:05:53 - INFO - __main__ - Step 32390: {'lr': 0.0004497649289520224, 'samples': 6218880, 'steps': 32389, 'loss/train': 1.7538362741470337} -08/30/2021 19:05:53 - INFO - __main__ - Step 32391: {'lr': 0.00044976173821811654, 'samples': 6219072, 'steps': 32390, 'loss/train': 1.627745270729065} -08/30/2021 19:05:53 - INFO - __main__ - Step 32392: {'lr': 0.0004497585473942011, 'samples': 6219264, 'steps': 32391, 'loss/train': 1.3706724643707275} -08/30/2021 19:05:54 - INFO - __main__ - Step 32393: {'lr': 0.0004497553564802776, 'samples': 6219456, 'steps': 32392, 'loss/train': 1.976728081703186} -08/30/2021 19:05:55 - INFO - __main__ - Step 32394: {'lr': 0.0004497521654763474, 'samples': 6219648, 'steps': 32393, 'loss/train': 0.543554961681366} -08/30/2021 19:05:56 - INFO - __main__ - Step 32395: {'lr': 0.0004497489743824119, 'samples': 6219840, 'steps': 32394, 'loss/train': 1.6516635417938232} -08/30/2021 19:05:56 - INFO - __main__ - Step 32396: {'lr': 0.0004497457831984727, 'samples': 6220032, 'steps': 32395, 'loss/train': 1.149714708328247} -08/30/2021 19:05:56 - INFO - __main__ - Step 32397: {'lr': 0.00044974259192453103, 'samples': 6220224, 'steps': 32396, 'loss/train': 1.8064905405044556} -08/30/2021 19:05:57 - INFO - __main__ - Step 32398: {'lr': 0.0004497394005605885, 'samples': 6220416, 'steps': 32397, 'loss/train': 1.2958773374557495} -08/30/2021 19:05:57 - INFO - __main__ - Step 32399: {'lr': 0.00044973620910664645, 'samples': 6220608, 'steps': 32398, 'loss/train': 0.8186208605766296} -08/30/2021 19:05:59 - INFO - __main__ - Step 32400: {'lr': 0.00044973301756270635, 'samples': 6220800, 'steps': 32399, 'loss/train': 1.544405221939087} -08/30/2021 19:06:00 - INFO - __main__ - Step 32401: {'lr': 0.0004497298259287696, 'samples': 6220992, 'steps': 32400, 'loss/train': 0.8137536644935608} -08/30/2021 19:06:00 - INFO - __main__ - Step 32402: {'lr': 0.00044972663420483774, 'samples': 6221184, 'steps': 32401, 'loss/train': 1.0207865238189697} -08/30/2021 19:06:00 - INFO - __main__ - Step 32403: {'lr': 0.00044972344239091206, 'samples': 6221376, 'steps': 32402, 'loss/train': 1.5676817893981934} -08/30/2021 19:06:01 - INFO - __main__ - Step 32404: {'lr': 0.0004497202504869941, 'samples': 6221568, 'steps': 32403, 'loss/train': 1.5129809379577637} -08/30/2021 19:06:02 - INFO - __main__ - Step 32405: {'lr': 0.0004497170584930853, 'samples': 6221760, 'steps': 32404, 'loss/train': 1.7797439098358154} -08/30/2021 19:06:03 - INFO - __main__ - Step 32406: {'lr': 0.0004497138664091871, 'samples': 6221952, 'steps': 32405, 'loss/train': 1.3799606561660767} -08/30/2021 19:06:03 - INFO - __main__ - Step 32407: {'lr': 0.00044971067423530087, 'samples': 6222144, 'steps': 32406, 'loss/train': 1.6371674537658691} -08/30/2021 19:06:03 - INFO - __main__ - Step 32408: {'lr': 0.0004497074819714281, 'samples': 6222336, 'steps': 32407, 'loss/train': 1.2462704181671143} -08/30/2021 19:06:04 - INFO - __main__ - Step 32409: {'lr': 0.00044970428961757026, 'samples': 6222528, 'steps': 32408, 'loss/train': 0.6013548374176025} -08/30/2021 19:06:05 - INFO - __main__ - Step 32410: {'lr': 0.00044970109717372864, 'samples': 6222720, 'steps': 32409, 'loss/train': 1.535630702972412} -08/30/2021 19:06:06 - INFO - __main__ - Step 32411: {'lr': 0.0004496979046399049, 'samples': 6222912, 'steps': 32410, 'loss/train': 1.3093996047973633} -08/30/2021 19:06:06 - INFO - __main__ - Step 32412: {'lr': 0.00044969471201610037, 'samples': 6223104, 'steps': 32411, 'loss/train': 1.1339932680130005} -08/30/2021 19:06:06 - INFO - __main__ - Step 32413: {'lr': 0.00044969151930231643, 'samples': 6223296, 'steps': 32412, 'loss/train': 0.5679135918617249} -08/30/2021 19:06:07 - INFO - __main__ - Step 32414: {'lr': 0.00044968832649855455, 'samples': 6223488, 'steps': 32413, 'loss/train': 1.6796916723251343} -08/30/2021 19:06:08 - INFO - __main__ - Step 32415: {'lr': 0.00044968513360481624, 'samples': 6223680, 'steps': 32414, 'loss/train': 1.1908469200134277} -08/30/2021 19:06:09 - INFO - __main__ - Step 32416: {'lr': 0.0004496819406211029, 'samples': 6223872, 'steps': 32415, 'loss/train': 1.2527387142181396} -08/30/2021 19:06:09 - INFO - __main__ - Step 32417: {'lr': 0.0004496787475474159, 'samples': 6224064, 'steps': 32416, 'loss/train': 1.3246748447418213} -08/30/2021 19:06:09 - INFO - __main__ - Step 32418: {'lr': 0.00044967555438375675, 'samples': 6224256, 'steps': 32417, 'loss/train': 1.19204843044281} -08/30/2021 19:06:10 - INFO - __main__ - Step 32419: {'lr': 0.0004496723611301269, 'samples': 6224448, 'steps': 32418, 'loss/train': 1.3817065954208374} -08/30/2021 19:06:11 - INFO - __main__ - Step 32420: {'lr': 0.00044966916778652776, 'samples': 6224640, 'steps': 32419, 'loss/train': 1.2285152673721313} -08/30/2021 19:06:12 - INFO - __main__ - Step 32421: {'lr': 0.0004496659743529608, 'samples': 6224832, 'steps': 32420, 'loss/train': 1.3928989171981812} -08/30/2021 19:06:12 - INFO - __main__ - Step 32422: {'lr': 0.00044966278082942746, 'samples': 6225024, 'steps': 32421, 'loss/train': 1.7617006301879883} -08/30/2021 19:06:12 - INFO - __main__ - Step 32423: {'lr': 0.000449659587215929, 'samples': 6225216, 'steps': 32422, 'loss/train': 0.9510110020637512} -08/30/2021 19:06:13 - INFO - __main__ - Step 32424: {'lr': 0.0004496563935124672, 'samples': 6225408, 'steps': 32423, 'loss/train': 1.676318645477295} -08/30/2021 19:06:15 - INFO - __main__ - Step 32425: {'lr': 0.0004496531997190432, 'samples': 6225600, 'steps': 32424, 'loss/train': 1.7138748168945312} -08/30/2021 19:06:15 - INFO - __main__ - Step 32426: {'lr': 0.0004496500058356586, 'samples': 6225792, 'steps': 32425, 'loss/train': 1.4112449884414673} -08/30/2021 19:06:16 - INFO - __main__ - Step 32427: {'lr': 0.00044964681186231473, 'samples': 6225984, 'steps': 32426, 'loss/train': 1.050158977508545} -08/30/2021 19:06:16 - INFO - __main__ - Step 32428: {'lr': 0.0004496436177990131, 'samples': 6226176, 'steps': 32427, 'loss/train': 1.6112520694732666} -08/30/2021 19:06:16 - INFO - __main__ - Step 32429: {'lr': 0.0004496404236457552, 'samples': 6226368, 'steps': 32428, 'loss/train': 1.1650753021240234} -08/30/2021 19:06:17 - INFO - __main__ - Step 32430: {'lr': 0.0004496372294025424, 'samples': 6226560, 'steps': 32429, 'loss/train': 1.639077067375183} -08/30/2021 19:06:18 - INFO - __main__ - Step 32431: {'lr': 0.00044963403506937603, 'samples': 6226752, 'steps': 32430, 'loss/train': 1.2142544984817505} -08/30/2021 19:06:19 - INFO - __main__ - Step 32432: {'lr': 0.00044963084064625775, 'samples': 6226944, 'steps': 32431, 'loss/train': 0.5049042701721191} -08/30/2021 19:06:19 - INFO - __main__ - Step 32433: {'lr': 0.00044962764613318886, 'samples': 6227136, 'steps': 32432, 'loss/train': 1.779929280281067} -08/30/2021 19:06:20 - INFO - __main__ - Step 32434: {'lr': 0.00044962445153017087, 'samples': 6227328, 'steps': 32433, 'loss/train': 1.0560500621795654} -08/30/2021 19:06:20 - INFO - __main__ - Step 32435: {'lr': 0.00044962125683720513, 'samples': 6227520, 'steps': 32434, 'loss/train': 0.12484985589981079} -08/30/2021 19:06:22 - INFO - __main__ - Step 32436: {'lr': 0.0004496180620542931, 'samples': 6227712, 'steps': 32435, 'loss/train': 1.6861265897750854} -08/30/2021 19:06:22 - INFO - __main__ - Step 32437: {'lr': 0.00044961486718143634, 'samples': 6227904, 'steps': 32436, 'loss/train': 1.753557801246643} -08/30/2021 19:06:23 - INFO - __main__ - Step 32438: {'lr': 0.0004496116722186362, 'samples': 6228096, 'steps': 32437, 'loss/train': 1.2478522062301636} -08/30/2021 19:06:23 - INFO - __main__ - Step 32439: {'lr': 0.00044960847716589403, 'samples': 6228288, 'steps': 32438, 'loss/train': 1.1716833114624023} -08/30/2021 19:06:23 - INFO - __main__ - Step 32440: {'lr': 0.00044960528202321143, 'samples': 6228480, 'steps': 32439, 'loss/train': 1.759860873222351} -08/30/2021 19:06:25 - INFO - __main__ - Step 32441: {'lr': 0.0004496020867905898, 'samples': 6228672, 'steps': 32440, 'loss/train': 1.1499463319778442} -08/30/2021 19:06:26 - INFO - __main__ - Step 32442: {'lr': 0.00044959889146803047, 'samples': 6228864, 'steps': 32441, 'loss/train': 1.2256149053573608} -08/30/2021 19:06:26 - INFO - __main__ - Step 32443: {'lr': 0.00044959569605553494, 'samples': 6229056, 'steps': 32442, 'loss/train': 1.6094967126846313} -08/30/2021 19:06:26 - INFO - __main__ - Step 32444: {'lr': 0.00044959250055310473, 'samples': 6229248, 'steps': 32443, 'loss/train': 0.06210010498762131} -08/30/2021 19:06:27 - INFO - __main__ - Step 32445: {'lr': 0.00044958930496074125, 'samples': 6229440, 'steps': 32444, 'loss/train': 0.2832689583301544} -08/30/2021 19:06:27 - INFO - __main__ - Step 32446: {'lr': 0.0004495861092784459, 'samples': 6229632, 'steps': 32445, 'loss/train': 0.2639256715774536} -08/30/2021 19:06:29 - INFO - __main__ - Step 32447: {'lr': 0.00044958291350622007, 'samples': 6229824, 'steps': 32446, 'loss/train': 1.1941344738006592} -08/30/2021 19:06:29 - INFO - __main__ - Step 32448: {'lr': 0.0004495797176440653, 'samples': 6230016, 'steps': 32447, 'loss/train': 0.17134426534175873} -08/30/2021 19:06:29 - INFO - __main__ - Step 32449: {'lr': 0.000449576521691983, 'samples': 6230208, 'steps': 32448, 'loss/train': 1.2336848974227905} -08/30/2021 19:06:30 - INFO - __main__ - Step 32450: {'lr': 0.00044957332564997453, 'samples': 6230400, 'steps': 32449, 'loss/train': 0.7291089296340942} -08/30/2021 19:06:30 - INFO - __main__ - Step 32451: {'lr': 0.0004495701295180414, 'samples': 6230592, 'steps': 32450, 'loss/train': 1.2721360921859741} -08/30/2021 19:06:32 - INFO - __main__ - Step 32452: {'lr': 0.0004495669332961852, 'samples': 6230784, 'steps': 32451, 'loss/train': 2.9824435710906982} -08/30/2021 19:06:32 - INFO - __main__ - Step 32453: {'lr': 0.0004495637369844071, 'samples': 6230976, 'steps': 32452, 'loss/train': 1.7732491493225098} -08/30/2021 19:06:33 - INFO - __main__ - Step 32454: {'lr': 0.0004495605405827087, 'samples': 6231168, 'steps': 32453, 'loss/train': 0.0652928575873375} -08/30/2021 19:06:33 - INFO - __main__ - Step 32455: {'lr': 0.00044955734409109135, 'samples': 6231360, 'steps': 32454, 'loss/train': 1.4207961559295654} -08/30/2021 19:06:33 - INFO - __main__ - Step 32456: {'lr': 0.0004495541475095566, 'samples': 6231552, 'steps': 32455, 'loss/train': 0.33647459745407104} -08/30/2021 19:06:35 - INFO - __main__ - Step 32457: {'lr': 0.0004495509508381058, 'samples': 6231744, 'steps': 32456, 'loss/train': 1.2550816535949707} -08/30/2021 19:06:35 - INFO - __main__ - Step 32458: {'lr': 0.00044954775407674035, 'samples': 6231936, 'steps': 32457, 'loss/train': 0.05562262982130051} -08/30/2021 19:06:36 - INFO - __main__ - Step 32459: {'lr': 0.00044954455722546186, 'samples': 6232128, 'steps': 32458, 'loss/train': 1.3769316673278809} -08/30/2021 19:06:36 - INFO - __main__ - Step 32460: {'lr': 0.0004495413602842716, 'samples': 6232320, 'steps': 32459, 'loss/train': 0.7638034224510193} -08/30/2021 19:06:37 - INFO - __main__ - Step 32461: {'lr': 0.00044953816325317116, 'samples': 6232512, 'steps': 32460, 'loss/train': 1.360421061515808} -08/30/2021 19:06:38 - INFO - __main__ - Step 32462: {'lr': 0.0004495349661321618, 'samples': 6232704, 'steps': 32461, 'loss/train': 1.007704734802246} -08/30/2021 19:06:39 - INFO - __main__ - Step 32463: {'lr': 0.0004495317689212452, 'samples': 6232896, 'steps': 32462, 'loss/train': 1.2015819549560547} -08/30/2021 19:06:39 - INFO - __main__ - Step 32464: {'lr': 0.0004495285716204226, 'samples': 6233088, 'steps': 32463, 'loss/train': 1.8444645404815674} -08/30/2021 19:06:39 - INFO - __main__ - Step 32465: {'lr': 0.00044952537422969545, 'samples': 6233280, 'steps': 32464, 'loss/train': 1.3284454345703125} -08/30/2021 19:06:40 - INFO - __main__ - Step 32466: {'lr': 0.0004495221767490653, 'samples': 6233472, 'steps': 32465, 'loss/train': 1.1120922565460205} -08/30/2021 19:06:41 - INFO - __main__ - Step 32467: {'lr': 0.00044951897917853355, 'samples': 6233664, 'steps': 32466, 'loss/train': 0.06854413449764252} -08/30/2021 19:06:42 - INFO - __main__ - Step 32468: {'lr': 0.0004495157815181016, 'samples': 6233856, 'steps': 32467, 'loss/train': 0.7765848636627197} -08/30/2021 19:06:42 - INFO - __main__ - Step 32469: {'lr': 0.00044951258376777094, 'samples': 6234048, 'steps': 32468, 'loss/train': 1.8528486490249634} -08/30/2021 19:06:42 - INFO - __main__ - Step 32470: {'lr': 0.00044950938592754297, 'samples': 6234240, 'steps': 32469, 'loss/train': 1.3980793952941895} -08/30/2021 19:06:43 - INFO - __main__ - Step 32471: {'lr': 0.00044950618799741913, 'samples': 6234432, 'steps': 32470, 'loss/train': 1.1394309997558594} -08/30/2021 19:06:44 - INFO - __main__ - Step 32472: {'lr': 0.0004495029899774009, 'samples': 6234624, 'steps': 32471, 'loss/train': 1.2558962106704712} -08/30/2021 19:06:45 - INFO - __main__ - Step 32473: {'lr': 0.00044949979186748967, 'samples': 6234816, 'steps': 32472, 'loss/train': 2.0109009742736816} -08/30/2021 19:06:45 - INFO - __main__ - Step 32474: {'lr': 0.00044949659366768697, 'samples': 6235008, 'steps': 32473, 'loss/train': 0.9980002641677856} -08/30/2021 19:06:45 - INFO - __main__ - Step 32475: {'lr': 0.00044949339537799415, 'samples': 6235200, 'steps': 32474, 'loss/train': 1.5778969526290894} -08/30/2021 19:06:46 - INFO - __main__ - Step 32476: {'lr': 0.0004494901969984127, 'samples': 6235392, 'steps': 32475, 'loss/train': 0.5476223826408386} -08/30/2021 19:06:46 - INFO - __main__ - Step 32477: {'lr': 0.000449486998528944, 'samples': 6235584, 'steps': 32476, 'loss/train': 1.2054213285446167} -08/30/2021 19:06:48 - INFO - __main__ - Step 32478: {'lr': 0.00044948379996958963, 'samples': 6235776, 'steps': 32477, 'loss/train': 1.63673734664917} -08/30/2021 19:06:48 - INFO - __main__ - Step 32479: {'lr': 0.00044948060132035087, 'samples': 6235968, 'steps': 32478, 'loss/train': 1.4490669965744019} -08/30/2021 19:06:48 - INFO - __main__ - Step 32480: {'lr': 0.00044947740258122925, 'samples': 6236160, 'steps': 32479, 'loss/train': 1.7334442138671875} -08/30/2021 19:06:49 - INFO - __main__ - Step 32481: {'lr': 0.00044947420375222614, 'samples': 6236352, 'steps': 32480, 'loss/train': 1.7896943092346191} -08/30/2021 19:06:49 - INFO - __main__ - Step 32482: {'lr': 0.00044947100483334315, 'samples': 6236544, 'steps': 32481, 'loss/train': 1.3345435857772827} -08/30/2021 19:06:51 - INFO - __main__ - Step 32483: {'lr': 0.0004494678058245815, 'samples': 6236736, 'steps': 32482, 'loss/train': 1.724750280380249} -08/30/2021 19:06:52 - INFO - __main__ - Step 32484: {'lr': 0.00044946460672594277, 'samples': 6236928, 'steps': 32483, 'loss/train': 1.6925795078277588} -08/30/2021 19:06:52 - INFO - __main__ - Step 32485: {'lr': 0.0004494614075374283, 'samples': 6237120, 'steps': 32484, 'loss/train': 0.7055851221084595} -08/30/2021 19:06:52 - INFO - __main__ - Step 32486: {'lr': 0.0004494582082590397, 'samples': 6237312, 'steps': 32485, 'loss/train': 1.414989948272705} -08/30/2021 19:06:53 - INFO - __main__ - Step 32487: {'lr': 0.0004494550088907783, 'samples': 6237504, 'steps': 32486, 'loss/train': 1.0751837491989136} -08/30/2021 19:06:54 - INFO - __main__ - Step 32488: {'lr': 0.00044945180943264544, 'samples': 6237696, 'steps': 32487, 'loss/train': 4.433512210845947} -08/30/2021 19:06:55 - INFO - __main__ - Step 32489: {'lr': 0.00044944860988464276, 'samples': 6237888, 'steps': 32488, 'loss/train': 1.269638180732727} -08/30/2021 19:06:55 - INFO - __main__ - Step 32490: {'lr': 0.0004494454102467716, 'samples': 6238080, 'steps': 32489, 'loss/train': 0.6475194692611694} -08/30/2021 19:06:55 - INFO - __main__ - Step 32491: {'lr': 0.00044944221051903345, 'samples': 6238272, 'steps': 32490, 'loss/train': 1.8564822673797607} -08/30/2021 19:06:56 - INFO - __main__ - Step 32492: {'lr': 0.0004494390107014297, 'samples': 6238464, 'steps': 32491, 'loss/train': 1.597392201423645} -08/30/2021 19:06:58 - INFO - __main__ - Step 32493: {'lr': 0.0004494358107939618, 'samples': 6238656, 'steps': 32492, 'loss/train': 1.403234839439392} -08/30/2021 19:06:58 - INFO - __main__ - Step 32494: {'lr': 0.0004494326107966311, 'samples': 6238848, 'steps': 32493, 'loss/train': 2.514643430709839} -08/30/2021 19:06:59 - INFO - __main__ - Step 32495: {'lr': 0.0004494294107094393, 'samples': 6239040, 'steps': 32494, 'loss/train': 1.3124140501022339} -08/30/2021 19:06:59 - INFO - __main__ - Step 32496: {'lr': 0.00044942621053238764, 'samples': 6239232, 'steps': 32495, 'loss/train': 1.5863598585128784} -08/30/2021 19:06:59 - INFO - __main__ - Step 32497: {'lr': 0.00044942301026547755, 'samples': 6239424, 'steps': 32496, 'loss/train': 2.784682035446167} -08/30/2021 19:07:00 - INFO - __main__ - Step 32498: {'lr': 0.0004494198099087106, 'samples': 6239616, 'steps': 32497, 'loss/train': 3.2850253582000732} -08/30/2021 19:07:01 - INFO - __main__ - Step 32499: {'lr': 0.00044941660946208806, 'samples': 6239808, 'steps': 32498, 'loss/train': 1.7977617979049683} -08/30/2021 19:07:02 - INFO - __main__ - Step 32500: {'lr': 0.00044941340892561154, 'samples': 6240000, 'steps': 32499, 'loss/train': 1.5849515199661255} -08/30/2021 19:07:02 - INFO - __main__ - Step 32501: {'lr': 0.00044941020829928247, 'samples': 6240192, 'steps': 32500, 'loss/train': 1.777456521987915} -08/30/2021 19:07:03 - INFO - __main__ - Step 32502: {'lr': 0.00044940700758310214, 'samples': 6240384, 'steps': 32501, 'loss/train': 1.5699900388717651} -08/30/2021 19:07:03 - INFO - __main__ - Step 32503: {'lr': 0.00044940380677707214, 'samples': 6240576, 'steps': 32502, 'loss/train': 3.2387187480926514} -08/30/2021 19:07:04 - INFO - __main__ - Step 32504: {'lr': 0.00044940060588119393, 'samples': 6240768, 'steps': 32503, 'loss/train': 1.9758620262145996} -08/30/2021 19:07:05 - INFO - __main__ - Step 32505: {'lr': 0.00044939740489546875, 'samples': 6240960, 'steps': 32504, 'loss/train': 0.7341508865356445} -08/30/2021 19:07:05 - INFO - __main__ - Step 32506: {'lr': 0.0004493942038198983, 'samples': 6241152, 'steps': 32505, 'loss/train': 0.7989136576652527} -08/30/2021 19:07:06 - INFO - __main__ - Step 32507: {'lr': 0.0004493910026544838, 'samples': 6241344, 'steps': 32506, 'loss/train': 1.3034539222717285} -08/30/2021 19:07:06 - INFO - __main__ - Step 32508: {'lr': 0.0004493878013992268, 'samples': 6241536, 'steps': 32507, 'loss/train': 1.39571213722229} -08/30/2021 19:07:06 - INFO - __main__ - Step 32509: {'lr': 0.0004493846000541287, 'samples': 6241728, 'steps': 32508, 'loss/train': 1.5410791635513306} -08/30/2021 19:07:08 - INFO - __main__ - Step 32510: {'lr': 0.00044938139861919115, 'samples': 6241920, 'steps': 32509, 'loss/train': 1.5987144708633423} -08/30/2021 19:07:08 - INFO - __main__ - Step 32511: {'lr': 0.00044937819709441523, 'samples': 6242112, 'steps': 32510, 'loss/train': 0.9097114205360413} -08/30/2021 19:07:09 - INFO - __main__ - Step 32512: {'lr': 0.00044937499547980265, 'samples': 6242304, 'steps': 32511, 'loss/train': 1.3840765953063965} -08/30/2021 19:07:09 - INFO - __main__ - Step 32513: {'lr': 0.00044937179377535475, 'samples': 6242496, 'steps': 32512, 'loss/train': 1.3453541994094849} -08/30/2021 19:07:09 - INFO - __main__ - Step 32514: {'lr': 0.00044936859198107306, 'samples': 6242688, 'steps': 32513, 'loss/train': 0.22491967678070068} -08/30/2021 19:07:11 - INFO - __main__ - Step 32515: {'lr': 0.0004493653900969589, 'samples': 6242880, 'steps': 32514, 'loss/train': 1.1304253339767456} -08/30/2021 19:07:11 - INFO - __main__ - Step 32516: {'lr': 0.0004493621881230138, 'samples': 6243072, 'steps': 32515, 'loss/train': 0.940894603729248} -08/30/2021 19:07:11 - INFO - __main__ - Step 32517: {'lr': 0.00044935898605923916, 'samples': 6243264, 'steps': 32516, 'loss/train': 1.7782803773880005} -08/30/2021 19:07:12 - INFO - __main__ - Step 32518: {'lr': 0.0004493557839056364, 'samples': 6243456, 'steps': 32517, 'loss/train': 1.2063217163085938} -08/30/2021 19:07:12 - INFO - __main__ - Step 32519: {'lr': 0.00044935258166220704, 'samples': 6243648, 'steps': 32518, 'loss/train': 1.2444733381271362} -08/30/2021 19:07:14 - INFO - __main__ - Step 32520: {'lr': 0.00044934937932895246, 'samples': 6243840, 'steps': 32519, 'loss/train': 1.6143519878387451} -08/30/2021 19:07:15 - INFO - __main__ - Step 32521: {'lr': 0.0004493461769058742, 'samples': 6244032, 'steps': 32520, 'loss/train': 0.03852095082402229} -08/30/2021 19:07:15 - INFO - __main__ - Step 32522: {'lr': 0.00044934297439297357, 'samples': 6244224, 'steps': 32521, 'loss/train': 1.912291169166565} -08/30/2021 19:07:15 - INFO - __main__ - Step 32523: {'lr': 0.0004493397717902521, 'samples': 6244416, 'steps': 32522, 'loss/train': 2.0182244777679443} -08/30/2021 19:07:16 - INFO - __main__ - Step 32524: {'lr': 0.00044933656909771117, 'samples': 6244608, 'steps': 32523, 'loss/train': 1.686921238899231} -08/30/2021 19:07:16 - INFO - __main__ - Step 32525: {'lr': 0.00044933336631535224, 'samples': 6244800, 'steps': 32524, 'loss/train': 1.5616185665130615} -08/30/2021 19:07:17 - INFO - __main__ - Step 32526: {'lr': 0.0004493301634431768, 'samples': 6244992, 'steps': 32525, 'loss/train': 1.2322211265563965} -08/30/2021 19:07:18 - INFO - __main__ - Step 32527: {'lr': 0.0004493269604811863, 'samples': 6245184, 'steps': 32526, 'loss/train': 1.4644622802734375} -08/30/2021 19:07:18 - INFO - __main__ - Step 32528: {'lr': 0.000449323757429382, 'samples': 6245376, 'steps': 32527, 'loss/train': 1.7634228467941284} -08/30/2021 19:07:19 - INFO - __main__ - Step 32529: {'lr': 0.00044932055428776566, 'samples': 6245568, 'steps': 32528, 'loss/train': 1.3370349407196045} -08/30/2021 19:07:19 - INFO - __main__ - Step 32530: {'lr': 0.00044931735105633853, 'samples': 6245760, 'steps': 32529, 'loss/train': 0.9920026063919067} -08/30/2021 19:07:21 - INFO - __main__ - Step 32531: {'lr': 0.00044931414773510207, 'samples': 6245952, 'steps': 32530, 'loss/train': 1.1733609437942505} -08/30/2021 19:07:21 - INFO - __main__ - Step 32532: {'lr': 0.00044931094432405766, 'samples': 6246144, 'steps': 32531, 'loss/train': 2.2634294033050537} -08/30/2021 19:07:21 - INFO - __main__ - Step 32533: {'lr': 0.00044930774082320684, 'samples': 6246336, 'steps': 32532, 'loss/train': 0.9710589647293091} -08/30/2021 19:07:22 - INFO - __main__ - Step 32534: {'lr': 0.00044930453723255107, 'samples': 6246528, 'steps': 32533, 'loss/train': 1.5638251304626465} -08/30/2021 19:07:22 - INFO - __main__ - Step 32535: {'lr': 0.0004493013335520917, 'samples': 6246720, 'steps': 32534, 'loss/train': 0.7228960990905762} -08/30/2021 19:07:24 - INFO - __main__ - Step 32536: {'lr': 0.00044929812978183024, 'samples': 6246912, 'steps': 32535, 'loss/train': 1.6448959112167358} -08/30/2021 19:07:25 - INFO - __main__ - Step 32537: {'lr': 0.0004492949259217681, 'samples': 6247104, 'steps': 32536, 'loss/train': 1.9606547355651855} -08/30/2021 19:07:25 - INFO - __main__ - Step 32538: {'lr': 0.00044929172197190684, 'samples': 6247296, 'steps': 32537, 'loss/train': 2.0524723529815674} -08/30/2021 19:07:26 - INFO - __main__ - Step 32539: {'lr': 0.00044928851793224765, 'samples': 6247488, 'steps': 32538, 'loss/train': 1.821181297302246} -08/30/2021 19:07:26 - INFO - __main__ - Step 32540: {'lr': 0.00044928531380279224, 'samples': 6247680, 'steps': 32539, 'loss/train': 3.168372869491577} -08/30/2021 19:07:27 - INFO - __main__ - Step 32541: {'lr': 0.00044928210958354196, 'samples': 6247872, 'steps': 32540, 'loss/train': 1.0670064687728882} -08/30/2021 19:07:28 - INFO - __main__ - Step 32542: {'lr': 0.0004492789052744982, 'samples': 6248064, 'steps': 32541, 'loss/train': 1.429789662361145} -08/30/2021 19:07:28 - INFO - __main__ - Step 32543: {'lr': 0.0004492757008756624, 'samples': 6248256, 'steps': 32542, 'loss/train': 2.3521363735198975} -08/30/2021 19:07:29 - INFO - __main__ - Step 32544: {'lr': 0.0004492724963870361, 'samples': 6248448, 'steps': 32543, 'loss/train': 1.5605545043945312} -08/30/2021 19:07:29 - INFO - __main__ - Step 32545: {'lr': 0.00044926929180862064, 'samples': 6248640, 'steps': 32544, 'loss/train': 1.149708867073059} -08/30/2021 19:07:30 - INFO - __main__ - Step 32546: {'lr': 0.00044926608714041763, 'samples': 6248832, 'steps': 32545, 'loss/train': 1.1772730350494385} -08/30/2021 19:07:31 - INFO - __main__ - Step 32547: {'lr': 0.0004492628823824282, 'samples': 6249024, 'steps': 32546, 'loss/train': 1.9210500717163086} -08/30/2021 19:07:31 - INFO - __main__ - Step 32548: {'lr': 0.0004492596775346541, 'samples': 6249216, 'steps': 32547, 'loss/train': 1.6220155954360962} -08/30/2021 19:07:31 - INFO - __main__ - Step 32549: {'lr': 0.0004492564725970967, 'samples': 6249408, 'steps': 32548, 'loss/train': 1.5211739540100098} -08/30/2021 19:07:32 - INFO - __main__ - Step 32550: {'lr': 0.00044925326756975736, 'samples': 6249600, 'steps': 32549, 'loss/train': 1.5514802932739258} -08/30/2021 19:07:34 - INFO - __main__ - Step 32551: {'lr': 0.00044925006245263757, 'samples': 6249792, 'steps': 32550, 'loss/train': 1.7511314153671265} -08/30/2021 19:07:34 - INFO - __main__ - Step 32552: {'lr': 0.0004492468572457388, 'samples': 6249984, 'steps': 32551, 'loss/train': 1.5107816457748413} -08/30/2021 19:07:35 - INFO - __main__ - Step 32553: {'lr': 0.0004492436519490625, 'samples': 6250176, 'steps': 32552, 'loss/train': 1.1585731506347656} -08/30/2021 19:07:35 - INFO - __main__ - Step 32554: {'lr': 0.00044924044656260997, 'samples': 6250368, 'steps': 32553, 'loss/train': 1.3378500938415527} -08/30/2021 19:07:35 - INFO - __main__ - Step 32555: {'lr': 0.00044923724108638285, 'samples': 6250560, 'steps': 32554, 'loss/train': 1.756518006324768} -08/30/2021 19:07:36 - INFO - __main__ - Step 32556: {'lr': 0.00044923403552038255, 'samples': 6250752, 'steps': 32555, 'loss/train': 0.6435486674308777} -08/30/2021 19:07:37 - INFO - __main__ - Step 32557: {'lr': 0.0004492308298646104, 'samples': 6250944, 'steps': 32556, 'loss/train': 1.7105737924575806} -08/30/2021 19:07:38 - INFO - __main__ - Step 32558: {'lr': 0.0004492276241190679, 'samples': 6251136, 'steps': 32557, 'loss/train': 1.5998950004577637} -08/30/2021 19:07:38 - INFO - __main__ - Step 32559: {'lr': 0.0004492244182837565, 'samples': 6251328, 'steps': 32558, 'loss/train': 1.4155688285827637} -08/30/2021 19:07:38 - INFO - __main__ - Step 32560: {'lr': 0.00044922121235867776, 'samples': 6251520, 'steps': 32559, 'loss/train': 0.2900150418281555} -08/30/2021 19:07:39 - INFO - __main__ - Step 32561: {'lr': 0.00044921800634383294, 'samples': 6251712, 'steps': 32560, 'loss/train': 1.712533950805664} -08/30/2021 19:07:40 - INFO - __main__ - Step 32562: {'lr': 0.0004492148002392235, 'samples': 6251904, 'steps': 32561, 'loss/train': 1.4608594179153442} -08/30/2021 19:07:41 - INFO - __main__ - Step 32563: {'lr': 0.000449211594044851, 'samples': 6252096, 'steps': 32562, 'loss/train': 0.9620749950408936} -08/30/2021 19:07:41 - INFO - __main__ - Step 32564: {'lr': 0.0004492083877607168, 'samples': 6252288, 'steps': 32563, 'loss/train': 1.4404035806655884} -08/30/2021 19:07:41 - INFO - __main__ - Step 32565: {'lr': 0.00044920518138682244, 'samples': 6252480, 'steps': 32564, 'loss/train': 1.1728283166885376} -08/30/2021 19:07:42 - INFO - __main__ - Step 32566: {'lr': 0.00044920197492316925, 'samples': 6252672, 'steps': 32565, 'loss/train': 2.2622733116149902} -08/30/2021 19:07:43 - INFO - __main__ - Step 32567: {'lr': 0.00044919876836975876, 'samples': 6252864, 'steps': 32566, 'loss/train': 1.2195172309875488} -08/30/2021 19:07:44 - INFO - __main__ - Step 32568: {'lr': 0.0004491955617265924, 'samples': 6253056, 'steps': 32567, 'loss/train': 1.522727131843567} -08/30/2021 19:07:44 - INFO - __main__ - Step 32569: {'lr': 0.0004491923549936715, 'samples': 6253248, 'steps': 32568, 'loss/train': 2.150005578994751} -08/30/2021 19:07:44 - INFO - __main__ - Step 32570: {'lr': 0.0004491891481709977, 'samples': 6253440, 'steps': 32569, 'loss/train': 1.6076627969741821} -08/30/2021 19:07:45 - INFO - __main__ - Step 32571: {'lr': 0.0004491859412585723, 'samples': 6253632, 'steps': 32570, 'loss/train': 1.4843344688415527} -08/30/2021 19:07:46 - INFO - __main__ - Step 32572: {'lr': 0.0004491827342563968, 'samples': 6253824, 'steps': 32571, 'loss/train': 1.1950907707214355} -08/30/2021 19:07:47 - INFO - __main__ - Step 32573: {'lr': 0.0004491795271644726, 'samples': 6254016, 'steps': 32572, 'loss/train': 1.4974056482315063} -08/30/2021 19:07:47 - INFO - __main__ - Step 32574: {'lr': 0.0004491763199828012, 'samples': 6254208, 'steps': 32573, 'loss/train': 1.8395887613296509} -08/30/2021 19:07:47 - INFO - __main__ - Step 32575: {'lr': 0.00044917311271138393, 'samples': 6254400, 'steps': 32574, 'loss/train': 1.5923187732696533} -08/30/2021 19:07:48 - INFO - __main__ - Step 32576: {'lr': 0.00044916990535022244, 'samples': 6254592, 'steps': 32575, 'loss/train': 1.4547021389007568} -08/30/2021 19:07:48 - INFO - __main__ - Step 32577: {'lr': 0.00044916669789931806, 'samples': 6254784, 'steps': 32576, 'loss/train': 1.4893746376037598} -08/30/2021 19:07:50 - INFO - __main__ - Step 32578: {'lr': 0.0004491634903586722, 'samples': 6254976, 'steps': 32577, 'loss/train': 1.569621205329895} -08/30/2021 19:07:50 - INFO - __main__ - Step 32579: {'lr': 0.00044916028272828636, 'samples': 6255168, 'steps': 32578, 'loss/train': 1.984078288078308} -08/30/2021 19:07:50 - INFO - __main__ - Step 32580: {'lr': 0.00044915707500816206, 'samples': 6255360, 'steps': 32579, 'loss/train': 1.2185784578323364} -08/30/2021 19:07:51 - INFO - __main__ - Step 32581: {'lr': 0.0004491538671983005, 'samples': 6255552, 'steps': 32580, 'loss/train': 1.5167152881622314} -08/30/2021 19:07:51 - INFO - __main__ - Step 32582: {'lr': 0.00044915065929870335, 'samples': 6255744, 'steps': 32581, 'loss/train': 1.9794422388076782} -08/30/2021 19:07:53 - INFO - __main__ - Step 32583: {'lr': 0.00044914745130937204, 'samples': 6255936, 'steps': 32582, 'loss/train': 1.558671236038208} -08/30/2021 19:07:53 - INFO - __main__ - Step 32584: {'lr': 0.0004491442432303079, 'samples': 6256128, 'steps': 32583, 'loss/train': 1.2898389101028442} -08/30/2021 19:07:53 - INFO - __main__ - Step 32585: {'lr': 0.0004491410350615124, 'samples': 6256320, 'steps': 32584, 'loss/train': 1.0016385316848755} -08/30/2021 19:07:54 - INFO - __main__ - Step 32586: {'lr': 0.0004491378268029871, 'samples': 6256512, 'steps': 32585, 'loss/train': 0.8425077199935913} -08/30/2021 19:07:54 - INFO - __main__ - Step 32587: {'lr': 0.00044913461845473335, 'samples': 6256704, 'steps': 32586, 'loss/train': 1.7002413272857666} -08/30/2021 19:07:56 - INFO - __main__ - Step 32588: {'lr': 0.0004491314100167526, 'samples': 6256896, 'steps': 32587, 'loss/train': 1.3290108442306519} -08/30/2021 19:07:57 - INFO - __main__ - Step 32589: {'lr': 0.00044912820148904634, 'samples': 6257088, 'steps': 32588, 'loss/train': 1.3872827291488647} -08/30/2021 19:07:57 - INFO - __main__ - Step 32590: {'lr': 0.0004491249928716159, 'samples': 6257280, 'steps': 32589, 'loss/train': 1.028517723083496} -08/30/2021 19:07:57 - INFO - __main__ - Step 32591: {'lr': 0.0004491217841644629, 'samples': 6257472, 'steps': 32590, 'loss/train': 1.346028447151184} -08/30/2021 19:07:58 - INFO - __main__ - Step 32592: {'lr': 0.0004491185753675886, 'samples': 6257664, 'steps': 32591, 'loss/train': 1.70199716091156} -08/30/2021 19:07:59 - INFO - __main__ - Step 32593: {'lr': 0.0004491153664809947, 'samples': 6257856, 'steps': 32592, 'loss/train': 1.3674789667129517} -08/30/2021 19:08:00 - INFO - __main__ - Step 32594: {'lr': 0.00044911215750468236, 'samples': 6258048, 'steps': 32593, 'loss/train': 1.2177053689956665} -08/30/2021 19:08:00 - INFO - __main__ - Step 32595: {'lr': 0.0004491089484386531, 'samples': 6258240, 'steps': 32594, 'loss/train': 0.9989675283432007} -08/30/2021 19:08:01 - INFO - __main__ - Step 32596: {'lr': 0.0004491057392829086, 'samples': 6258432, 'steps': 32595, 'loss/train': 1.5146898031234741} -08/30/2021 19:08:01 - INFO - __main__ - Step 32597: {'lr': 0.00044910253003745007, 'samples': 6258624, 'steps': 32596, 'loss/train': 1.4629703760147095} -08/30/2021 19:08:01 - INFO - __main__ - Step 32598: {'lr': 0.00044909932070227887, 'samples': 6258816, 'steps': 32597, 'loss/train': 1.366084337234497} -08/30/2021 19:08:03 - INFO - __main__ - Step 32599: {'lr': 0.00044909611127739676, 'samples': 6259008, 'steps': 32598, 'loss/train': 1.5730016231536865} -08/30/2021 19:08:03 - INFO - __main__ - Step 32600: {'lr': 0.00044909290176280495, 'samples': 6259200, 'steps': 32599, 'loss/train': 1.157251238822937} -08/30/2021 19:08:03 - INFO - __main__ - Step 32601: {'lr': 0.00044908969215850495, 'samples': 6259392, 'steps': 32600, 'loss/train': 1.4529815912246704} -08/30/2021 19:08:04 - INFO - __main__ - Step 32602: {'lr': 0.0004490864824644982, 'samples': 6259584, 'steps': 32601, 'loss/train': 1.7107728719711304} -08/30/2021 19:08:04 - INFO - __main__ - Step 32603: {'lr': 0.0004490832726807862, 'samples': 6259776, 'steps': 32602, 'loss/train': 0.7558012008666992} -08/30/2021 19:08:06 - INFO - __main__ - Step 32604: {'lr': 0.0004490800628073703, 'samples': 6259968, 'steps': 32603, 'loss/train': 1.6195636987686157} -08/30/2021 19:08:07 - INFO - __main__ - Step 32605: {'lr': 0.000449076852844252, 'samples': 6260160, 'steps': 32604, 'loss/train': 1.308281660079956} -08/30/2021 19:08:07 - INFO - __main__ - Step 32606: {'lr': 0.0004490736427914327, 'samples': 6260352, 'steps': 32605, 'loss/train': 0.5588341355323792} -08/30/2021 19:08:07 - INFO - __main__ - Step 32607: {'lr': 0.000449070432648914, 'samples': 6260544, 'steps': 32606, 'loss/train': 0.08983058482408524} -08/30/2021 19:08:08 - INFO - __main__ - Step 32608: {'lr': 0.0004490672224166972, 'samples': 6260736, 'steps': 32607, 'loss/train': 1.482445240020752} -08/30/2021 19:08:08 - INFO - __main__ - Step 32609: {'lr': 0.00044906401209478367, 'samples': 6260928, 'steps': 32608, 'loss/train': 1.5608757734298706} -08/30/2021 19:08:09 - INFO - __main__ - Step 32610: {'lr': 0.00044906080168317507, 'samples': 6261120, 'steps': 32609, 'loss/train': 1.0697720050811768} -08/30/2021 19:08:10 - INFO - __main__ - Step 32611: {'lr': 0.0004490575911818727, 'samples': 6261312, 'steps': 32610, 'loss/train': 1.4957313537597656} -08/30/2021 19:08:10 - INFO - __main__ - Step 32612: {'lr': 0.0004490543805908781, 'samples': 6261504, 'steps': 32611, 'loss/train': 0.7550933957099915} -08/30/2021 19:08:11 - INFO - __main__ - Step 32613: {'lr': 0.00044905116991019264, 'samples': 6261696, 'steps': 32612, 'loss/train': 1.474701166152954} -08/30/2021 19:08:11 - INFO - __main__ - Step 32614: {'lr': 0.00044904795913981775, 'samples': 6261888, 'steps': 32613, 'loss/train': 1.4788645505905151} -08/30/2021 19:08:12 - INFO - __main__ - Step 32615: {'lr': 0.00044904474827975506, 'samples': 6262080, 'steps': 32614, 'loss/train': 1.5367071628570557} -08/30/2021 19:08:13 - INFO - __main__ - Step 32616: {'lr': 0.00044904153733000575, 'samples': 6262272, 'steps': 32615, 'loss/train': 1.407670259475708} -08/30/2021 19:08:13 - INFO - __main__ - Step 32617: {'lr': 0.0004490383262905714, 'samples': 6262464, 'steps': 32616, 'loss/train': 1.796865463256836} -08/30/2021 19:08:14 - INFO - __main__ - Step 32618: {'lr': 0.00044903511516145353, 'samples': 6262656, 'steps': 32617, 'loss/train': 1.2737195491790771} -08/30/2021 19:08:14 - INFO - __main__ - Step 32619: {'lr': 0.0004490319039426535, 'samples': 6262848, 'steps': 32618, 'loss/train': 2.0644729137420654} -08/30/2021 19:08:15 - INFO - __main__ - Step 32620: {'lr': 0.0004490286926341727, 'samples': 6263040, 'steps': 32619, 'loss/train': 1.6587156057357788} -08/30/2021 19:08:16 - INFO - __main__ - Step 32621: {'lr': 0.0004490254812360126, 'samples': 6263232, 'steps': 32620, 'loss/train': 1.367366909980774} -08/30/2021 19:08:16 - INFO - __main__ - Step 32622: {'lr': 0.0004490222697481748, 'samples': 6263424, 'steps': 32621, 'loss/train': 1.2552974224090576} -08/30/2021 19:08:17 - INFO - __main__ - Step 32623: {'lr': 0.00044901905817066055, 'samples': 6263616, 'steps': 32622, 'loss/train': 1.7514386177062988} -08/30/2021 19:08:17 - INFO - __main__ - Step 32624: {'lr': 0.00044901584650347147, 'samples': 6263808, 'steps': 32623, 'loss/train': 0.8660169839859009} -08/30/2021 19:08:19 - INFO - __main__ - Step 32625: {'lr': 0.00044901263474660894, 'samples': 6264000, 'steps': 32624, 'loss/train': 1.4739148616790771} -08/30/2021 19:08:19 - INFO - __main__ - Step 32626: {'lr': 0.0004490094229000743, 'samples': 6264192, 'steps': 32625, 'loss/train': 1.7914471626281738} -08/30/2021 19:08:19 - INFO - __main__ - Step 32627: {'lr': 0.00044900621096386904, 'samples': 6264384, 'steps': 32626, 'loss/train': 1.9467860460281372} -08/30/2021 19:08:20 - INFO - __main__ - Step 32628: {'lr': 0.00044900299893799476, 'samples': 6264576, 'steps': 32627, 'loss/train': 1.9788882732391357} -08/30/2021 19:08:20 - INFO - __main__ - Step 32629: {'lr': 0.0004489997868224528, 'samples': 6264768, 'steps': 32628, 'loss/train': 1.5747175216674805} -08/30/2021 19:08:21 - INFO - __main__ - Step 32630: {'lr': 0.00044899657461724453, 'samples': 6264960, 'steps': 32629, 'loss/train': 1.2320046424865723} -08/30/2021 19:08:22 - INFO - __main__ - Step 32631: {'lr': 0.00044899336232237156, 'samples': 6265152, 'steps': 32630, 'loss/train': 1.4974302053451538} -08/30/2021 19:08:22 - INFO - __main__ - Step 32632: {'lr': 0.0004489901499378352, 'samples': 6265344, 'steps': 32631, 'loss/train': 1.7678385972976685} -08/30/2021 19:08:23 - INFO - __main__ - Step 32633: {'lr': 0.00044898693746363695, 'samples': 6265536, 'steps': 32632, 'loss/train': 1.7455347776412964} -08/30/2021 19:08:23 - INFO - __main__ - Step 32634: {'lr': 0.00044898372489977825, 'samples': 6265728, 'steps': 32633, 'loss/train': 1.287279486656189} -08/30/2021 19:08:23 - INFO - __main__ - Step 32635: {'lr': 0.0004489805122462606, 'samples': 6265920, 'steps': 32634, 'loss/train': 0.9113028645515442} -08/30/2021 19:08:25 - INFO - __main__ - Step 32636: {'lr': 0.0004489772995030853, 'samples': 6266112, 'steps': 32635, 'loss/train': 1.7554665803909302} -08/30/2021 19:08:25 - INFO - __main__ - Step 32637: {'lr': 0.00044897408667025397, 'samples': 6266304, 'steps': 32636, 'loss/train': 1.6604429483413696} -08/30/2021 19:08:26 - INFO - __main__ - Step 32638: {'lr': 0.000448970873747768, 'samples': 6266496, 'steps': 32637, 'loss/train': 1.1881701946258545} -08/30/2021 19:08:26 - INFO - __main__ - Step 32639: {'lr': 0.0004489676607356288, 'samples': 6266688, 'steps': 32638, 'loss/train': 1.8800278902053833} -08/30/2021 19:08:26 - INFO - __main__ - Step 32640: {'lr': 0.00044896444763383787, 'samples': 6266880, 'steps': 32639, 'loss/train': 1.0191476345062256} -08/30/2021 19:08:28 - INFO - __main__ - Step 32641: {'lr': 0.00044896123444239654, 'samples': 6267072, 'steps': 32640, 'loss/train': 1.2555551528930664} -08/30/2021 19:08:28 - INFO - __main__ - Step 32642: {'lr': 0.00044895802116130644, 'samples': 6267264, 'steps': 32641, 'loss/train': 1.476691722869873} -08/30/2021 19:08:29 - INFO - __main__ - Step 32643: {'lr': 0.0004489548077905689, 'samples': 6267456, 'steps': 32642, 'loss/train': 1.2697087526321411} -08/30/2021 19:08:29 - INFO - __main__ - Step 32644: {'lr': 0.0004489515943301854, 'samples': 6267648, 'steps': 32643, 'loss/train': 1.302669644355774} -08/30/2021 19:08:29 - INFO - __main__ - Step 32645: {'lr': 0.0004489483807801574, 'samples': 6267840, 'steps': 32644, 'loss/train': 1.1378012895584106} -08/30/2021 19:08:31 - INFO - __main__ - Step 32646: {'lr': 0.00044894516714048626, 'samples': 6268032, 'steps': 32645, 'loss/train': 1.2294268608093262} -08/30/2021 19:08:32 - INFO - __main__ - Step 32647: {'lr': 0.0004489419534111736, 'samples': 6268224, 'steps': 32646, 'loss/train': 1.510994791984558} -08/30/2021 19:08:32 - INFO - __main__ - Step 32648: {'lr': 0.0004489387395922207, 'samples': 6268416, 'steps': 32647, 'loss/train': 0.47757887840270996} -08/30/2021 19:08:33 - INFO - __main__ - Step 32649: {'lr': 0.00044893552568362903, 'samples': 6268608, 'steps': 32648, 'loss/train': 1.4998905658721924} -08/30/2021 19:08:33 - INFO - __main__ - Step 32650: {'lr': 0.0004489323116854002, 'samples': 6268800, 'steps': 32649, 'loss/train': 1.0956974029541016} -08/30/2021 19:08:35 - INFO - __main__ - Step 32651: {'lr': 0.00044892909759753545, 'samples': 6268992, 'steps': 32650, 'loss/train': 0.9286983013153076} -08/30/2021 19:08:35 - INFO - __main__ - Step 32652: {'lr': 0.00044892588342003637, 'samples': 6269184, 'steps': 32651, 'loss/train': 0.6986061930656433} -08/30/2021 19:08:35 - INFO - __main__ - Step 32653: {'lr': 0.00044892266915290435, 'samples': 6269376, 'steps': 32652, 'loss/train': 0.6714340448379517} -08/30/2021 19:08:36 - INFO - __main__ - Step 32654: {'lr': 0.00044891945479614084, 'samples': 6269568, 'steps': 32653, 'loss/train': 1.2851635217666626} -08/30/2021 19:08:36 - INFO - __main__ - Step 32655: {'lr': 0.00044891624034974726, 'samples': 6269760, 'steps': 32654, 'loss/train': 1.1897081136703491} -08/30/2021 19:08:37 - INFO - __main__ - Step 32656: {'lr': 0.00044891302581372513, 'samples': 6269952, 'steps': 32655, 'loss/train': 0.8642836809158325} -08/30/2021 19:08:38 - INFO - __main__ - Step 32657: {'lr': 0.00044890981118807585, 'samples': 6270144, 'steps': 32656, 'loss/train': 1.5977660417556763} -08/30/2021 19:08:38 - INFO - __main__ - Step 32658: {'lr': 0.00044890659647280084, 'samples': 6270336, 'steps': 32657, 'loss/train': 1.3554693460464478} -08/30/2021 19:08:39 - INFO - __main__ - Step 32659: {'lr': 0.0004489033816679016, 'samples': 6270528, 'steps': 32658, 'loss/train': 1.808934211730957} -08/30/2021 19:08:39 - INFO - __main__ - Step 32660: {'lr': 0.0004489001667733796, 'samples': 6270720, 'steps': 32659, 'loss/train': 0.5968970060348511} -08/30/2021 19:08:39 - INFO - __main__ - Step 32661: {'lr': 0.0004488969517892363, 'samples': 6270912, 'steps': 32660, 'loss/train': 1.2042478322982788} -08/30/2021 19:08:42 - INFO - __main__ - Step 32662: {'lr': 0.000448893736715473, 'samples': 6271104, 'steps': 32661, 'loss/train': 1.426439642906189} -08/30/2021 19:08:42 - INFO - __main__ - Step 32663: {'lr': 0.0004488905215520913, 'samples': 6271296, 'steps': 32662, 'loss/train': 1.2710903882980347} -08/30/2021 19:08:43 - INFO - __main__ - Step 32664: {'lr': 0.00044888730629909256, 'samples': 6271488, 'steps': 32663, 'loss/train': 1.1173428297042847} -08/30/2021 19:08:43 - INFO - __main__ - Step 32665: {'lr': 0.00044888409095647833, 'samples': 6271680, 'steps': 32664, 'loss/train': 0.5026143789291382} -08/30/2021 19:08:43 - INFO - __main__ - Step 32666: {'lr': 0.00044888087552424997, 'samples': 6271872, 'steps': 32665, 'loss/train': 0.801002025604248} -08/30/2021 19:08:44 - INFO - __main__ - Step 32667: {'lr': 0.00044887766000240893, 'samples': 6272064, 'steps': 32666, 'loss/train': 1.8869332075119019} -08/30/2021 19:08:45 - INFO - __main__ - Step 32668: {'lr': 0.0004488744443909567, 'samples': 6272256, 'steps': 32667, 'loss/train': 0.6987221837043762} -08/30/2021 19:08:45 - INFO - __main__ - Step 32669: {'lr': 0.0004488712286898947, 'samples': 6272448, 'steps': 32668, 'loss/train': 0.9386299252510071} -08/30/2021 19:08:46 - INFO - __main__ - Step 32670: {'lr': 0.0004488680128992244, 'samples': 6272640, 'steps': 32669, 'loss/train': 1.3432233333587646} -08/30/2021 19:08:46 - INFO - __main__ - Step 32671: {'lr': 0.00044886479701894736, 'samples': 6272832, 'steps': 32670, 'loss/train': 1.2272197008132935} -08/30/2021 19:08:47 - INFO - __main__ - Step 32672: {'lr': 0.00044886158104906476, 'samples': 6273024, 'steps': 32671, 'loss/train': 1.0744589567184448} -08/30/2021 19:08:47 - INFO - __main__ - Step 32673: {'lr': 0.0004488583649895782, 'samples': 6273216, 'steps': 32672, 'loss/train': 1.8242857456207275} -08/30/2021 19:08:48 - INFO - __main__ - Step 32674: {'lr': 0.00044885514884048926, 'samples': 6273408, 'steps': 32673, 'loss/train': 1.1331464052200317} -08/30/2021 19:08:49 - INFO - __main__ - Step 32675: {'lr': 0.0004488519326017991, 'samples': 6273600, 'steps': 32674, 'loss/train': 1.195969820022583} -08/30/2021 19:08:49 - INFO - __main__ - Step 32676: {'lr': 0.0004488487162735094, 'samples': 6273792, 'steps': 32675, 'loss/train': 1.6875015497207642} -08/30/2021 19:08:49 - INFO - __main__ - Step 32677: {'lr': 0.00044884549985562165, 'samples': 6273984, 'steps': 32676, 'loss/train': 1.3573211431503296} -08/30/2021 19:08:50 - INFO - __main__ - Step 32678: {'lr': 0.000448842283348137, 'samples': 6274176, 'steps': 32677, 'loss/train': 1.196877360343933} -08/30/2021 19:08:51 - INFO - __main__ - Step 32679: {'lr': 0.0004488390667510572, 'samples': 6274368, 'steps': 32678, 'loss/train': 1.146606683731079} -08/30/2021 19:08:52 - INFO - __main__ - Step 32680: {'lr': 0.00044883585006438354, 'samples': 6274560, 'steps': 32679, 'loss/train': 1.2461488246917725} -08/30/2021 19:08:52 - INFO - __main__ - Step 32681: {'lr': 0.0004488326332881175, 'samples': 6274752, 'steps': 32680, 'loss/train': 1.4318525791168213} -08/30/2021 19:08:52 - INFO - __main__ - Step 32682: {'lr': 0.0004488294164222606, 'samples': 6274944, 'steps': 32681, 'loss/train': 1.6273961067199707} -08/30/2021 19:08:53 - INFO - __main__ - Step 32683: {'lr': 0.0004488261994668142, 'samples': 6275136, 'steps': 32682, 'loss/train': 1.14664888381958} -08/30/2021 19:08:54 - INFO - __main__ - Step 32684: {'lr': 0.00044882298242177976, 'samples': 6275328, 'steps': 32683, 'loss/train': 1.650382161140442} -08/30/2021 19:08:55 - INFO - __main__ - Step 32685: {'lr': 0.00044881976528715877, 'samples': 6275520, 'steps': 32684, 'loss/train': 1.581041693687439} -08/30/2021 19:08:55 - INFO - __main__ - Step 32686: {'lr': 0.0004488165480629527, 'samples': 6275712, 'steps': 32685, 'loss/train': 1.138535976409912} -08/30/2021 19:08:56 - INFO - __main__ - Step 32687: {'lr': 0.00044881333074916287, 'samples': 6275904, 'steps': 32686, 'loss/train': 1.7488389015197754} -08/30/2021 19:08:56 - INFO - __main__ - Step 32688: {'lr': 0.00044881011334579093, 'samples': 6276096, 'steps': 32687, 'loss/train': 1.5472015142440796} -08/30/2021 19:08:57 - INFO - __main__ - Step 32689: {'lr': 0.0004488068958528382, 'samples': 6276288, 'steps': 32688, 'loss/train': 2.2534351348876953} -08/30/2021 19:08:58 - INFO - __main__ - Step 32690: {'lr': 0.0004488036782703061, 'samples': 6276480, 'steps': 32689, 'loss/train': 1.339576244354248} -08/30/2021 19:08:58 - INFO - __main__ - Step 32691: {'lr': 0.00044880046059819615, 'samples': 6276672, 'steps': 32690, 'loss/train': 1.3722784519195557} -08/30/2021 19:08:59 - INFO - __main__ - Step 32692: {'lr': 0.00044879724283650976, 'samples': 6276864, 'steps': 32691, 'loss/train': 1.4898552894592285} -08/30/2021 19:08:59 - INFO - __main__ - Step 32693: {'lr': 0.0004487940249852484, 'samples': 6277056, 'steps': 32692, 'loss/train': 1.76902174949646} -08/30/2021 19:09:00 - INFO - __main__ - Step 32694: {'lr': 0.0004487908070444136, 'samples': 6277248, 'steps': 32693, 'loss/train': 0.06002538278698921} -08/30/2021 19:09:01 - INFO - __main__ - Step 32695: {'lr': 0.00044878758901400665, 'samples': 6277440, 'steps': 32694, 'loss/train': 0.45922979712486267} -08/30/2021 19:09:01 - INFO - __main__ - Step 32696: {'lr': 0.00044878437089402906, 'samples': 6277632, 'steps': 32695, 'loss/train': 1.806343913078308} -08/30/2021 19:09:02 - INFO - __main__ - Step 32697: {'lr': 0.0004487811526844824, 'samples': 6277824, 'steps': 32696, 'loss/train': 1.1682636737823486} -08/30/2021 19:09:02 - INFO - __main__ - Step 32698: {'lr': 0.0004487779343853679, 'samples': 6278016, 'steps': 32697, 'loss/train': 1.624447226524353} -08/30/2021 19:09:04 - INFO - __main__ - Step 32699: {'lr': 0.00044877471599668716, 'samples': 6278208, 'steps': 32698, 'loss/train': 0.7771300077438354} -08/30/2021 19:09:05 - INFO - __main__ - Step 32700: {'lr': 0.00044877149751844164, 'samples': 6278400, 'steps': 32699, 'loss/train': 2.180201768875122} -08/30/2021 19:09:05 - INFO - __main__ - Step 32701: {'lr': 0.00044876827895063277, 'samples': 6278592, 'steps': 32700, 'loss/train': 1.3569248914718628} -08/30/2021 19:09:05 - INFO - __main__ - Step 32702: {'lr': 0.0004487650602932619, 'samples': 6278784, 'steps': 32701, 'loss/train': 1.5192692279815674} -08/30/2021 19:09:06 - INFO - __main__ - Step 32703: {'lr': 0.00044876184154633066, 'samples': 6278976, 'steps': 32702, 'loss/train': 1.6608797311782837} -08/30/2021 19:09:07 - INFO - __main__ - Step 32704: {'lr': 0.00044875862270984035, 'samples': 6279168, 'steps': 32703, 'loss/train': 1.514662742614746} -08/30/2021 19:09:08 - INFO - __main__ - Step 32705: {'lr': 0.0004487554037837925, 'samples': 6279360, 'steps': 32704, 'loss/train': 2.7525267601013184} -08/30/2021 19:09:08 - INFO - __main__ - Step 32706: {'lr': 0.00044875218476818845, 'samples': 6279552, 'steps': 32705, 'loss/train': 1.8895959854125977} -08/30/2021 19:09:08 - INFO - __main__ - Step 32707: {'lr': 0.0004487489656630298, 'samples': 6279744, 'steps': 32706, 'loss/train': 0.6508373022079468} -08/30/2021 19:09:09 - INFO - __main__ - Step 32708: {'lr': 0.00044874574646831794, 'samples': 6279936, 'steps': 32707, 'loss/train': 0.9525187611579895} -08/30/2021 19:09:09 - INFO - __main__ - Step 32709: {'lr': 0.0004487425271840543, 'samples': 6280128, 'steps': 32708, 'loss/train': 2.010841131210327} -08/30/2021 19:09:10 - INFO - __main__ - Step 32710: {'lr': 0.0004487393078102403, 'samples': 6280320, 'steps': 32709, 'loss/train': 1.357568383216858} -08/30/2021 19:09:11 - INFO - __main__ - Step 32711: {'lr': 0.00044873608834687754, 'samples': 6280512, 'steps': 32710, 'loss/train': 1.5007696151733398} -08/30/2021 19:09:11 - INFO - __main__ - Step 32712: {'lr': 0.00044873286879396724, 'samples': 6280704, 'steps': 32711, 'loss/train': 1.4705638885498047} -08/30/2021 19:09:12 - INFO - __main__ - Step 32713: {'lr': 0.00044872964915151106, 'samples': 6280896, 'steps': 32712, 'loss/train': 1.5984336137771606} -08/30/2021 19:09:12 - INFO - __main__ - Step 32714: {'lr': 0.00044872642941951035, 'samples': 6281088, 'steps': 32713, 'loss/train': 1.1912426948547363} -08/30/2021 19:09:13 - INFO - __main__ - Step 32715: {'lr': 0.0004487232095979666, 'samples': 6281280, 'steps': 32714, 'loss/train': 1.02670419216156} -08/30/2021 19:09:14 - INFO - __main__ - Step 32716: {'lr': 0.0004487199896868812, 'samples': 6281472, 'steps': 32715, 'loss/train': 1.3977181911468506} -08/30/2021 19:09:14 - INFO - __main__ - Step 32717: {'lr': 0.00044871676968625564, 'samples': 6281664, 'steps': 32716, 'loss/train': 1.223524808883667} -08/30/2021 19:09:15 - INFO - __main__ - Step 32718: {'lr': 0.00044871354959609135, 'samples': 6281856, 'steps': 32717, 'loss/train': 1.7086668014526367} -08/30/2021 19:09:15 - INFO - __main__ - Step 32719: {'lr': 0.00044871032941638984, 'samples': 6282048, 'steps': 32718, 'loss/train': 1.1339046955108643} -08/30/2021 19:09:16 - INFO - __main__ - Step 32720: {'lr': 0.00044870710914715254, 'samples': 6282240, 'steps': 32719, 'loss/train': 1.5099304914474487} -08/30/2021 19:09:17 - INFO - __main__ - Step 32721: {'lr': 0.00044870388878838084, 'samples': 6282432, 'steps': 32720, 'loss/train': 0.7428812384605408} -08/30/2021 19:09:17 - INFO - __main__ - Step 32722: {'lr': 0.00044870066834007627, 'samples': 6282624, 'steps': 32721, 'loss/train': 1.6752691268920898} -08/30/2021 19:09:18 - INFO - __main__ - Step 32723: {'lr': 0.0004486974478022402, 'samples': 6282816, 'steps': 32722, 'loss/train': 1.742810845375061} -08/30/2021 19:09:18 - INFO - __main__ - Step 32724: {'lr': 0.0004486942271748742, 'samples': 6283008, 'steps': 32723, 'loss/train': 1.631355881690979} -08/30/2021 19:09:20 - INFO - __main__ - Step 32725: {'lr': 0.0004486910064579796, 'samples': 6283200, 'steps': 32724, 'loss/train': 0.8716088533401489} -08/30/2021 19:09:20 - INFO - __main__ - Step 32726: {'lr': 0.00044868778565155783, 'samples': 6283392, 'steps': 32725, 'loss/train': 1.4294098615646362} -08/30/2021 19:09:20 - INFO - __main__ - Step 32727: {'lr': 0.00044868456475561047, 'samples': 6283584, 'steps': 32726, 'loss/train': 0.9342978596687317} -08/30/2021 19:09:21 - INFO - __main__ - Step 32728: {'lr': 0.0004486813437701389, 'samples': 6283776, 'steps': 32727, 'loss/train': 0.8733958005905151} -08/30/2021 19:09:21 - INFO - __main__ - Step 32729: {'lr': 0.0004486781226951446, 'samples': 6283968, 'steps': 32728, 'loss/train': 1.2319986820220947} -08/30/2021 19:09:23 - INFO - __main__ - Step 32730: {'lr': 0.000448674901530629, 'samples': 6284160, 'steps': 32729, 'loss/train': 1.865423560142517} -08/30/2021 19:09:23 - INFO - __main__ - Step 32731: {'lr': 0.00044867168027659356, 'samples': 6284352, 'steps': 32730, 'loss/train': 0.0932878777384758} -08/30/2021 19:09:23 - INFO - __main__ - Step 32732: {'lr': 0.00044866845893303973, 'samples': 6284544, 'steps': 32731, 'loss/train': 1.4628554582595825} -08/30/2021 19:09:24 - INFO - __main__ - Step 32733: {'lr': 0.00044866523749996897, 'samples': 6284736, 'steps': 32732, 'loss/train': 1.3478153944015503} -08/30/2021 19:09:24 - INFO - __main__ - Step 32734: {'lr': 0.0004486620159773827, 'samples': 6284928, 'steps': 32733, 'loss/train': 0.9551073312759399} -08/30/2021 19:09:26 - INFO - __main__ - Step 32735: {'lr': 0.0004486587943652823, 'samples': 6285120, 'steps': 32734, 'loss/train': 1.3273606300354004} -08/30/2021 19:09:26 - INFO - __main__ - Step 32736: {'lr': 0.00044865557266366953, 'samples': 6285312, 'steps': 32735, 'loss/train': 1.0841439962387085} -08/30/2021 19:09:27 - INFO - __main__ - Step 32737: {'lr': 0.0004486523508725454, 'samples': 6285504, 'steps': 32736, 'loss/train': 1.8125394582748413} -08/30/2021 19:09:27 - INFO - __main__ - Step 32738: {'lr': 0.00044864912899191174, 'samples': 6285696, 'steps': 32737, 'loss/train': 1.1985185146331787} -08/30/2021 19:09:27 - INFO - __main__ - Step 32739: {'lr': 0.00044864590702176977, 'samples': 6285888, 'steps': 32738, 'loss/train': 0.8871357440948486} -08/30/2021 19:09:29 - INFO - __main__ - Step 32740: {'lr': 0.000448642684962121, 'samples': 6286080, 'steps': 32739, 'loss/train': 1.1493544578552246} -08/30/2021 19:09:30 - INFO - __main__ - Step 32741: {'lr': 0.000448639462812967, 'samples': 6286272, 'steps': 32740, 'loss/train': 1.3475017547607422} -08/30/2021 19:09:30 - INFO - __main__ - Step 32742: {'lr': 0.0004486362405743091, 'samples': 6286464, 'steps': 32741, 'loss/train': 1.44907808303833} -08/30/2021 19:09:31 - INFO - __main__ - Step 32743: {'lr': 0.0004486330182461487, 'samples': 6286656, 'steps': 32742, 'loss/train': 1.7825427055358887} -08/30/2021 19:09:31 - INFO - __main__ - Step 32744: {'lr': 0.0004486297958284874, 'samples': 6286848, 'steps': 32743, 'loss/train': 0.12823890149593353} -08/30/2021 19:09:31 - INFO - __main__ - Step 32745: {'lr': 0.0004486265733213265, 'samples': 6287040, 'steps': 32744, 'loss/train': 1.411868929862976} -08/30/2021 19:09:32 - INFO - __main__ - Step 32746: {'lr': 0.00044862335072466767, 'samples': 6287232, 'steps': 32745, 'loss/train': 4.230576992034912} -08/30/2021 19:09:33 - INFO - __main__ - Step 32747: {'lr': 0.00044862012803851203, 'samples': 6287424, 'steps': 32746, 'loss/train': 8.016744613647461} -08/30/2021 19:09:34 - INFO - __main__ - Step 32748: {'lr': 0.00044861690526286135, 'samples': 6287616, 'steps': 32747, 'loss/train': 1.3422104120254517} -08/30/2021 19:09:34 - INFO - __main__ - Step 32749: {'lr': 0.00044861368239771694, 'samples': 6287808, 'steps': 32748, 'loss/train': 2.1091575622558594} -08/30/2021 19:09:34 - INFO - __main__ - Step 32750: {'lr': 0.00044861045944308026, 'samples': 6288000, 'steps': 32749, 'loss/train': 1.341341257095337} -08/30/2021 19:09:35 - INFO - __main__ - Step 32751: {'lr': 0.0004486072363989528, 'samples': 6288192, 'steps': 32750, 'loss/train': 1.4784268140792847} -08/30/2021 19:09:37 - INFO - __main__ - Step 32752: {'lr': 0.00044860401326533595, 'samples': 6288384, 'steps': 32751, 'loss/train': 1.5603610277175903} -08/30/2021 19:09:37 - INFO - __main__ - Step 32753: {'lr': 0.0004486007900422312, 'samples': 6288576, 'steps': 32752, 'loss/train': 1.4333299398422241} -08/30/2021 19:09:38 - INFO - __main__ - Step 32754: {'lr': 0.00044859756672964, 'samples': 6288768, 'steps': 32753, 'loss/train': 1.936609148979187} -08/30/2021 19:09:38 - INFO - __main__ - Step 32755: {'lr': 0.00044859434332756383, 'samples': 6288960, 'steps': 32754, 'loss/train': 1.333675742149353} -08/30/2021 19:09:38 - INFO - __main__ - Step 32756: {'lr': 0.0004485911198360041, 'samples': 6289152, 'steps': 32755, 'loss/train': 1.4803684949874878} -08/30/2021 19:09:40 - INFO - __main__ - Step 32757: {'lr': 0.0004485878962549622, 'samples': 6289344, 'steps': 32756, 'loss/train': 0.38887861371040344} -08/30/2021 19:09:40 - INFO - __main__ - Step 32758: {'lr': 0.0004485846725844398, 'samples': 6289536, 'steps': 32757, 'loss/train': 1.8522518873214722} -08/30/2021 19:09:41 - INFO - __main__ - Step 32759: {'lr': 0.0004485814488244381, 'samples': 6289728, 'steps': 32758, 'loss/train': 0.8544082641601562} -08/30/2021 19:09:41 - INFO - __main__ - Step 32760: {'lr': 0.0004485782249749587, 'samples': 6289920, 'steps': 32759, 'loss/train': 1.5086592435836792} -08/30/2021 19:09:41 - INFO - __main__ - Step 32761: {'lr': 0.00044857500103600304, 'samples': 6290112, 'steps': 32760, 'loss/train': 1.417419672012329} -08/30/2021 19:09:42 - INFO - __main__ - Step 32762: {'lr': 0.00044857177700757247, 'samples': 6290304, 'steps': 32761, 'loss/train': 0.10837419331073761} -08/30/2021 19:09:43 - INFO - __main__ - Step 32763: {'lr': 0.00044856855288966856, 'samples': 6290496, 'steps': 32762, 'loss/train': 0.42357853055000305} -08/30/2021 19:09:44 - INFO - __main__ - Step 32764: {'lr': 0.0004485653286822927, 'samples': 6290688, 'steps': 32763, 'loss/train': 1.54203462600708} -08/30/2021 19:09:44 - INFO - __main__ - Step 32765: {'lr': 0.0004485621043854465, 'samples': 6290880, 'steps': 32764, 'loss/train': 1.643184781074524} -08/30/2021 19:09:44 - INFO - __main__ - Step 32766: {'lr': 0.0004485588799991311, 'samples': 6291072, 'steps': 32765, 'loss/train': 1.0635567903518677} -08/30/2021 19:09:45 - INFO - __main__ - Step 32767: {'lr': 0.0004485556555233483, 'samples': 6291264, 'steps': 32766, 'loss/train': 0.9965192079544067} -08/30/2021 19:09:46 - INFO - __main__ - Step 32768: {'lr': 0.0004485524309580993, 'samples': 6291456, 'steps': 32767, 'loss/train': 1.7073910236358643} -08/30/2021 19:09:47 - INFO - __main__ - Step 32769: {'lr': 0.0004485492063033856, 'samples': 6291648, 'steps': 32768, 'loss/train': 1.0999629497528076} -08/30/2021 19:09:47 - INFO - __main__ - Step 32770: {'lr': 0.0004485459815592087, 'samples': 6291840, 'steps': 32769, 'loss/train': 1.7776328325271606} -08/30/2021 19:09:47 - INFO - __main__ - Step 32771: {'lr': 0.0004485427567255701, 'samples': 6292032, 'steps': 32770, 'loss/train': 0.7569795846939087} -08/30/2021 19:09:48 - INFO - __main__ - Step 32772: {'lr': 0.0004485395318024712, 'samples': 6292224, 'steps': 32771, 'loss/train': 1.0346463918685913} -08/30/2021 19:09:49 - INFO - __main__ - Step 32773: {'lr': 0.00044853630678991344, 'samples': 6292416, 'steps': 32772, 'loss/train': 1.0680031776428223} -08/30/2021 19:09:50 - INFO - __main__ - Step 32774: {'lr': 0.00044853308168789824, 'samples': 6292608, 'steps': 32773, 'loss/train': 1.6477960348129272} -08/30/2021 19:09:50 - INFO - __main__ - Step 32775: {'lr': 0.00044852985649642714, 'samples': 6292800, 'steps': 32774, 'loss/train': 1.2744946479797363} -08/30/2021 19:09:50 - INFO - __main__ - Step 32776: {'lr': 0.0004485266312155015, 'samples': 6292992, 'steps': 32775, 'loss/train': 1.7531893253326416} -08/30/2021 19:09:51 - INFO - __main__ - Step 32777: {'lr': 0.00044852340584512285, 'samples': 6293184, 'steps': 32776, 'loss/train': 1.0807465314865112} -08/30/2021 19:09:52 - INFO - __main__ - Step 32778: {'lr': 0.00044852018038529264, 'samples': 6293376, 'steps': 32777, 'loss/train': 2.2647616863250732} -08/30/2021 19:09:53 - INFO - __main__ - Step 32779: {'lr': 0.00044851695483601227, 'samples': 6293568, 'steps': 32778, 'loss/train': 1.55298912525177} -08/30/2021 19:09:53 - INFO - __main__ - Step 32780: {'lr': 0.0004485137291972833, 'samples': 6293760, 'steps': 32779, 'loss/train': 1.605798363685608} -08/30/2021 19:09:53 - INFO - __main__ - Step 32781: {'lr': 0.00044851050346910706, 'samples': 6293952, 'steps': 32780, 'loss/train': 1.4963539838790894} -08/30/2021 19:09:54 - INFO - __main__ - Step 32782: {'lr': 0.00044850727765148504, 'samples': 6294144, 'steps': 32781, 'loss/train': 1.1368192434310913} -08/30/2021 19:09:55 - INFO - __main__ - Step 32783: {'lr': 0.00044850405174441866, 'samples': 6294336, 'steps': 32782, 'loss/train': 1.5403021574020386} -08/30/2021 19:09:56 - INFO - __main__ - Step 32784: {'lr': 0.00044850082574790945, 'samples': 6294528, 'steps': 32783, 'loss/train': 0.9672999382019043} -08/30/2021 19:09:56 - INFO - __main__ - Step 32785: {'lr': 0.0004484975996619589, 'samples': 6294720, 'steps': 32784, 'loss/train': 1.37628173828125} -08/30/2021 19:09:56 - INFO - __main__ - Step 32786: {'lr': 0.0004484943734865683, 'samples': 6294912, 'steps': 32785, 'loss/train': 1.615965723991394} -08/30/2021 19:09:57 - INFO - __main__ - Step 32787: {'lr': 0.0004484911472217392, 'samples': 6295104, 'steps': 32786, 'loss/train': 0.8111220002174377} -08/30/2021 19:09:58 - INFO - __main__ - Step 32788: {'lr': 0.0004484879208674731, 'samples': 6295296, 'steps': 32787, 'loss/train': 1.3192120790481567} -08/30/2021 19:09:59 - INFO - __main__ - Step 32789: {'lr': 0.0004484846944237714, 'samples': 6295488, 'steps': 32788, 'loss/train': 1.085790753364563} -08/30/2021 19:09:59 - INFO - __main__ - Step 32790: {'lr': 0.0004484814678906355, 'samples': 6295680, 'steps': 32789, 'loss/train': 1.0670602321624756} -08/30/2021 19:09:59 - INFO - __main__ - Step 32791: {'lr': 0.00044847824126806703, 'samples': 6295872, 'steps': 32790, 'loss/train': 1.282948613166809} -08/30/2021 19:10:00 - INFO - __main__ - Step 32792: {'lr': 0.0004484750145560672, 'samples': 6296064, 'steps': 32791, 'loss/train': 0.8721528649330139} -08/30/2021 19:10:02 - INFO - __main__ - Step 32793: {'lr': 0.0004484717877546377, 'samples': 6296256, 'steps': 32792, 'loss/train': 1.582984447479248} -08/30/2021 19:10:02 - INFO - __main__ - Step 32794: {'lr': 0.0004484685608637798, 'samples': 6296448, 'steps': 32793, 'loss/train': 0.7589924931526184} -08/30/2021 19:10:02 - INFO - __main__ - Step 32795: {'lr': 0.00044846533388349507, 'samples': 6296640, 'steps': 32794, 'loss/train': 1.3637824058532715} -08/30/2021 19:10:03 - INFO - __main__ - Step 32796: {'lr': 0.00044846210681378487, 'samples': 6296832, 'steps': 32795, 'loss/train': 0.041862208396196365} -08/30/2021 19:10:03 - INFO - __main__ - Step 32797: {'lr': 0.00044845887965465076, 'samples': 6297024, 'steps': 32796, 'loss/train': 0.030864065513014793} -08/30/2021 19:10:04 - INFO - __main__ - Step 32798: {'lr': 0.0004484556524060941, 'samples': 6297216, 'steps': 32797, 'loss/train': 1.4275683164596558} -08/30/2021 19:10:05 - INFO - __main__ - Step 32799: {'lr': 0.00044845242506811646, 'samples': 6297408, 'steps': 32798, 'loss/train': 2.122243881225586} -08/30/2021 19:10:05 - INFO - __main__ - Step 32800: {'lr': 0.0004484491976407192, 'samples': 6297600, 'steps': 32799, 'loss/train': 1.2846108675003052} -08/30/2021 19:10:06 - INFO - __main__ - Step 32801: {'lr': 0.00044844597012390374, 'samples': 6297792, 'steps': 32800, 'loss/train': 1.277563214302063} -08/30/2021 19:10:06 - INFO - __main__ - Step 32802: {'lr': 0.0004484427425176716, 'samples': 6297984, 'steps': 32801, 'loss/train': 1.9680557250976562} -08/30/2021 19:10:06 - INFO - __main__ - Step 32803: {'lr': 0.0004484395148220243, 'samples': 6298176, 'steps': 32802, 'loss/train': 1.4853097200393677} -08/30/2021 19:10:07 - INFO - __main__ - Step 32804: {'lr': 0.000448436287036963, 'samples': 6298368, 'steps': 32803, 'loss/train': 1.9306087493896484} -08/30/2021 19:10:08 - INFO - __main__ - Step 32805: {'lr': 0.0004484330591624896, 'samples': 6298560, 'steps': 32804, 'loss/train': 1.0610910654067993} -08/30/2021 19:10:09 - INFO - __main__ - Step 32806: {'lr': 0.00044842983119860525, 'samples': 6298752, 'steps': 32805, 'loss/train': 1.5891335010528564} -08/30/2021 19:10:09 - INFO - __main__ - Step 32807: {'lr': 0.00044842660314531145, 'samples': 6298944, 'steps': 32806, 'loss/train': 1.5910804271697998} -08/30/2021 19:10:09 - INFO - __main__ - Step 32808: {'lr': 0.0004484233750026098, 'samples': 6299136, 'steps': 32807, 'loss/train': 1.2846381664276123} -08/30/2021 19:10:10 - INFO - __main__ - Step 32809: {'lr': 0.00044842014677050145, 'samples': 6299328, 'steps': 32808, 'loss/train': 2.3574535846710205} -08/30/2021 19:10:12 - INFO - __main__ - Step 32810: {'lr': 0.0004484169184489882, 'samples': 6299520, 'steps': 32809, 'loss/train': 1.4643610715866089} -08/30/2021 19:10:13 - INFO - __main__ - Step 32811: {'lr': 0.0004484136900380713, 'samples': 6299712, 'steps': 32810, 'loss/train': 0.11108077317476273} -08/30/2021 19:10:13 - INFO - __main__ - Step 32812: {'lr': 0.00044841046153775224, 'samples': 6299904, 'steps': 32811, 'loss/train': 1.1247373819351196} -08/30/2021 19:10:13 - INFO - __main__ - Step 32813: {'lr': 0.0004484072329480325, 'samples': 6300096, 'steps': 32812, 'loss/train': 1.5413495302200317} -08/30/2021 19:10:14 - INFO - __main__ - Step 32814: {'lr': 0.00044840400426891347, 'samples': 6300288, 'steps': 32813, 'loss/train': 1.8364087343215942} -08/30/2021 19:10:15 - INFO - __main__ - Step 32815: {'lr': 0.00044840077550039676, 'samples': 6300480, 'steps': 32814, 'loss/train': 2.443309783935547} -08/30/2021 19:10:16 - INFO - __main__ - Step 32816: {'lr': 0.0004483975466424837, 'samples': 6300672, 'steps': 32815, 'loss/train': 1.6044660806655884} -08/30/2021 19:10:16 - INFO - __main__ - Step 32817: {'lr': 0.0004483943176951757, 'samples': 6300864, 'steps': 32816, 'loss/train': 1.4346952438354492} -08/30/2021 19:10:16 - INFO - __main__ - Step 32818: {'lr': 0.0004483910886584743, 'samples': 6301056, 'steps': 32817, 'loss/train': 0.5182101726531982} -08/30/2021 19:10:17 - INFO - __main__ - Step 32819: {'lr': 0.00044838785953238094, 'samples': 6301248, 'steps': 32818, 'loss/train': 1.564134120941162} -08/30/2021 19:10:18 - INFO - __main__ - Step 32820: {'lr': 0.0004483846303168971, 'samples': 6301440, 'steps': 32819, 'loss/train': 5.843997478485107} -08/30/2021 19:10:19 - INFO - __main__ - Step 32821: {'lr': 0.0004483814010120242, 'samples': 6301632, 'steps': 32820, 'loss/train': 0.6713508367538452} -08/30/2021 19:10:19 - INFO - __main__ - Step 32822: {'lr': 0.00044837817161776366, 'samples': 6301824, 'steps': 32821, 'loss/train': 1.1678550243377686} -08/30/2021 19:10:19 - INFO - __main__ - Step 32823: {'lr': 0.000448374942134117, 'samples': 6302016, 'steps': 32822, 'loss/train': 1.200532078742981} -08/30/2021 19:10:20 - INFO - __main__ - Step 32824: {'lr': 0.0004483717125610857, 'samples': 6302208, 'steps': 32823, 'loss/train': 1.3769738674163818} -08/30/2021 19:10:21 - INFO - __main__ - Step 32825: {'lr': 0.0004483684828986712, 'samples': 6302400, 'steps': 32824, 'loss/train': 0.6602734327316284} -08/30/2021 19:10:22 - INFO - __main__ - Step 32826: {'lr': 0.00044836525314687477, 'samples': 6302592, 'steps': 32825, 'loss/train': 1.5529022216796875} -08/30/2021 19:10:22 - INFO - __main__ - Step 32827: {'lr': 0.0004483620233056981, 'samples': 6302784, 'steps': 32826, 'loss/train': 1.3596118688583374} -08/30/2021 19:10:23 - INFO - __main__ - Step 32828: {'lr': 0.00044835879337514254, 'samples': 6302976, 'steps': 32827, 'loss/train': 0.3349132835865021} -08/30/2021 19:10:23 - INFO - __main__ - Step 32829: {'lr': 0.0004483555633552096, 'samples': 6303168, 'steps': 32828, 'loss/train': 1.4111298322677612} -08/30/2021 19:10:23 - INFO - __main__ - Step 32830: {'lr': 0.00044835233324590077, 'samples': 6303360, 'steps': 32829, 'loss/train': 1.9994674921035767} -08/30/2021 19:10:25 - INFO - __main__ - Step 32831: {'lr': 0.0004483491030472173, 'samples': 6303552, 'steps': 32830, 'loss/train': 1.2204504013061523} -08/30/2021 19:10:25 - INFO - __main__ - Step 32832: {'lr': 0.00044834587275916084, 'samples': 6303744, 'steps': 32831, 'loss/train': 1.4277275800704956} -08/30/2021 19:10:25 - INFO - __main__ - Step 32833: {'lr': 0.00044834264238173283, 'samples': 6303936, 'steps': 32832, 'loss/train': 1.8300209045410156} -08/30/2021 19:10:26 - INFO - __main__ - Step 32834: {'lr': 0.00044833941191493463, 'samples': 6304128, 'steps': 32833, 'loss/train': 1.5082029104232788} -08/30/2021 19:10:26 - INFO - __main__ - Step 32835: {'lr': 0.0004483361813587678, 'samples': 6304320, 'steps': 32834, 'loss/train': 1.2829923629760742} -08/30/2021 19:10:28 - INFO - __main__ - Step 32836: {'lr': 0.0004483329507132337, 'samples': 6304512, 'steps': 32835, 'loss/train': 1.0331817865371704} -08/30/2021 19:10:28 - INFO - __main__ - Step 32837: {'lr': 0.0004483297199783338, 'samples': 6304704, 'steps': 32836, 'loss/train': 1.5563338994979858} -08/30/2021 19:10:28 - INFO - __main__ - Step 32838: {'lr': 0.0004483264891540697, 'samples': 6304896, 'steps': 32837, 'loss/train': 1.225629210472107} -08/30/2021 19:10:29 - INFO - __main__ - Step 32839: {'lr': 0.00044832325824044274, 'samples': 6305088, 'steps': 32838, 'loss/train': 1.5003451108932495} -08/30/2021 19:10:29 - INFO - __main__ - Step 32840: {'lr': 0.0004483200272374543, 'samples': 6305280, 'steps': 32839, 'loss/train': 1.928655743598938} -08/30/2021 19:10:31 - INFO - __main__ - Step 32841: {'lr': 0.0004483167961451059, 'samples': 6305472, 'steps': 32840, 'loss/train': 0.3928397297859192} -08/30/2021 19:10:31 - INFO - __main__ - Step 32842: {'lr': 0.00044831356496339913, 'samples': 6305664, 'steps': 32841, 'loss/train': 0.057061389088630676} -08/30/2021 19:10:31 - INFO - __main__ - Step 32843: {'lr': 0.0004483103336923352, 'samples': 6305856, 'steps': 32842, 'loss/train': 0.6988543272018433} -08/30/2021 19:10:32 - INFO - __main__ - Step 32844: {'lr': 0.00044830710233191573, 'samples': 6306048, 'steps': 32843, 'loss/train': 0.26205503940582275} -08/30/2021 19:10:32 - INFO - __main__ - Step 32845: {'lr': 0.0004483038708821422, 'samples': 6306240, 'steps': 32844, 'loss/train': 1.4207615852355957} -08/30/2021 19:10:34 - INFO - __main__ - Step 32846: {'lr': 0.00044830063934301603, 'samples': 6306432, 'steps': 32845, 'loss/train': 1.0527763366699219} -08/30/2021 19:10:34 - INFO - __main__ - Step 32847: {'lr': 0.0004482974077145385, 'samples': 6306624, 'steps': 32846, 'loss/train': 1.5359408855438232} -08/30/2021 19:10:35 - INFO - __main__ - Step 32848: {'lr': 0.0004482941759967113, 'samples': 6306816, 'steps': 32847, 'loss/train': 2.462907552719116} -08/30/2021 19:10:35 - INFO - __main__ - Step 32849: {'lr': 0.00044829094418953586, 'samples': 6307008, 'steps': 32848, 'loss/train': 1.7602477073669434} -08/30/2021 19:10:35 - INFO - __main__ - Step 32850: {'lr': 0.00044828771229301354, 'samples': 6307200, 'steps': 32849, 'loss/train': 1.3864902257919312} -08/30/2021 19:10:37 - INFO - __main__ - Step 32851: {'lr': 0.0004482844803071458, 'samples': 6307392, 'steps': 32850, 'loss/train': 1.4359735250473022} -08/30/2021 19:10:37 - INFO - __main__ - Step 32852: {'lr': 0.00044828124823193417, 'samples': 6307584, 'steps': 32851, 'loss/train': 1.408004879951477} -08/30/2021 19:10:38 - INFO - __main__ - Step 32853: {'lr': 0.00044827801606738004, 'samples': 6307776, 'steps': 32852, 'loss/train': 0.5277725458145142} -08/30/2021 19:10:38 - INFO - __main__ - Step 32854: {'lr': 0.00044827478381348495, 'samples': 6307968, 'steps': 32853, 'loss/train': 1.0319784879684448} -08/30/2021 19:10:38 - INFO - __main__ - Step 32855: {'lr': 0.00044827155147025025, 'samples': 6308160, 'steps': 32854, 'loss/train': 1.5729713439941406} -08/30/2021 19:10:40 - INFO - __main__ - Step 32856: {'lr': 0.00044826831903767745, 'samples': 6308352, 'steps': 32855, 'loss/train': 1.4462401866912842} -08/30/2021 19:10:41 - INFO - __main__ - Step 32857: {'lr': 0.000448265086515768, 'samples': 6308544, 'steps': 32856, 'loss/train': 1.4757256507873535} -08/30/2021 19:10:41 - INFO - __main__ - Step 32858: {'lr': 0.0004482618539045234, 'samples': 6308736, 'steps': 32857, 'loss/train': 1.4521393775939941} -08/30/2021 19:10:41 - INFO - __main__ - Step 32859: {'lr': 0.00044825862120394504, 'samples': 6308928, 'steps': 32858, 'loss/train': 1.6196850538253784} -08/30/2021 19:10:42 - INFO - __main__ - Step 32860: {'lr': 0.00044825538841403444, 'samples': 6309120, 'steps': 32859, 'loss/train': 1.2773644924163818} -08/30/2021 19:10:42 - INFO - __main__ - Step 32861: {'lr': 0.000448252155534793, 'samples': 6309312, 'steps': 32860, 'loss/train': 0.028032349422574043} -08/30/2021 19:10:44 - INFO - __main__ - Step 32862: {'lr': 0.0004482489225662222, 'samples': 6309504, 'steps': 32861, 'loss/train': 1.7170188426971436} -08/30/2021 19:10:45 - INFO - __main__ - Step 32863: {'lr': 0.00044824568950832343, 'samples': 6309696, 'steps': 32862, 'loss/train': 1.2952020168304443} -08/30/2021 19:10:45 - INFO - __main__ - Step 32864: {'lr': 0.0004482424563610983, 'samples': 6309888, 'steps': 32863, 'loss/train': 1.0653008222579956} -08/30/2021 19:10:45 - INFO - __main__ - Step 32865: {'lr': 0.00044823922312454815, 'samples': 6310080, 'steps': 32864, 'loss/train': 1.279534101486206} -08/30/2021 19:10:46 - INFO - __main__ - Step 32866: {'lr': 0.00044823598979867445, 'samples': 6310272, 'steps': 32865, 'loss/train': 1.3014886379241943} -08/30/2021 19:10:46 - INFO - __main__ - Step 32867: {'lr': 0.0004482327563834787, 'samples': 6310464, 'steps': 32866, 'loss/train': 1.071877121925354} -08/30/2021 19:10:48 - INFO - __main__ - Step 32868: {'lr': 0.00044822952287896237, 'samples': 6310656, 'steps': 32867, 'loss/train': 1.4732680320739746} -08/30/2021 19:10:48 - INFO - __main__ - Step 32869: {'lr': 0.00044822628928512675, 'samples': 6310848, 'steps': 32868, 'loss/train': 1.6002378463745117} -08/30/2021 19:10:48 - INFO - __main__ - Step 32870: {'lr': 0.0004482230556019735, 'samples': 6311040, 'steps': 32869, 'loss/train': 1.1972324848175049} -08/30/2021 19:10:49 - INFO - __main__ - Step 32871: {'lr': 0.00044821982182950405, 'samples': 6311232, 'steps': 32870, 'loss/train': 1.9368282556533813} -08/30/2021 19:10:49 - INFO - __main__ - Step 32872: {'lr': 0.0004482165879677197, 'samples': 6311424, 'steps': 32871, 'loss/train': 1.9383968114852905} -08/30/2021 19:10:51 - INFO - __main__ - Step 32873: {'lr': 0.0004482133540166221, 'samples': 6311616, 'steps': 32872, 'loss/train': 2.573394775390625} -08/30/2021 19:10:52 - INFO - __main__ - Step 32874: {'lr': 0.00044821011997621255, 'samples': 6311808, 'steps': 32873, 'loss/train': 0.07509901374578476} -08/30/2021 19:10:52 - INFO - __main__ - Step 32875: {'lr': 0.0004482068858464926, 'samples': 6312000, 'steps': 32874, 'loss/train': 1.333949089050293} -08/30/2021 19:10:52 - INFO - __main__ - Step 32876: {'lr': 0.00044820365162746373, 'samples': 6312192, 'steps': 32875, 'loss/train': 0.07692991942167282} -08/30/2021 19:10:53 - INFO - __main__ - Step 32877: {'lr': 0.00044820041731912733, 'samples': 6312384, 'steps': 32876, 'loss/train': 0.05485493317246437} -08/30/2021 19:10:53 - INFO - __main__ - Step 32878: {'lr': 0.0004481971829214848, 'samples': 6312576, 'steps': 32877, 'loss/train': 1.114728569984436} -08/30/2021 19:10:55 - INFO - __main__ - Step 32879: {'lr': 0.0004481939484345378, 'samples': 6312768, 'steps': 32878, 'loss/train': 1.8709505796432495} -08/30/2021 19:10:55 - INFO - __main__ - Step 32880: {'lr': 0.0004481907138582876, 'samples': 6312960, 'steps': 32879, 'loss/train': 1.565878987312317} -08/30/2021 19:10:56 - INFO - __main__ - Step 32881: {'lr': 0.00044818747919273574, 'samples': 6313152, 'steps': 32880, 'loss/train': 1.45503568649292} -08/30/2021 19:10:56 - INFO - __main__ - Step 32882: {'lr': 0.0004481842444378837, 'samples': 6313344, 'steps': 32881, 'loss/train': 1.6048507690429688} -08/30/2021 19:10:56 - INFO - __main__ - Step 32883: {'lr': 0.0004481810095937329, 'samples': 6313536, 'steps': 32882, 'loss/train': 1.7029558420181274} -08/30/2021 19:10:57 - INFO - __main__ - Step 32884: {'lr': 0.00044817777466028467, 'samples': 6313728, 'steps': 32883, 'loss/train': 1.2898426055908203} -08/30/2021 19:10:58 - INFO - __main__ - Step 32885: {'lr': 0.0004481745396375407, 'samples': 6313920, 'steps': 32884, 'loss/train': 0.8254020810127258} -08/30/2021 19:10:59 - INFO - __main__ - Step 32886: {'lr': 0.0004481713045255023, 'samples': 6314112, 'steps': 32885, 'loss/train': 2.064681053161621} -08/30/2021 19:10:59 - INFO - __main__ - Step 32887: {'lr': 0.000448168069324171, 'samples': 6314304, 'steps': 32886, 'loss/train': 1.5842360258102417} -08/30/2021 19:10:59 - INFO - __main__ - Step 32888: {'lr': 0.0004481648340335482, 'samples': 6314496, 'steps': 32887, 'loss/train': 1.7877769470214844} -08/30/2021 19:11:00 - INFO - __main__ - Step 32889: {'lr': 0.0004481615986536354, 'samples': 6314688, 'steps': 32888, 'loss/train': 2.089043378829956} -08/30/2021 19:11:01 - INFO - __main__ - Step 32890: {'lr': 0.000448158363184434, 'samples': 6314880, 'steps': 32889, 'loss/train': 1.4092888832092285} -08/30/2021 19:11:02 - INFO - __main__ - Step 32891: {'lr': 0.00044815512762594556, 'samples': 6315072, 'steps': 32890, 'loss/train': 1.306431531906128} -08/30/2021 19:11:02 - INFO - __main__ - Step 32892: {'lr': 0.00044815189197817143, 'samples': 6315264, 'steps': 32891, 'loss/train': 1.7321676015853882} -08/30/2021 19:11:03 - INFO - __main__ - Step 32893: {'lr': 0.0004481486562411131, 'samples': 6315456, 'steps': 32892, 'loss/train': 1.692110300064087} -08/30/2021 19:11:03 - INFO - __main__ - Step 32894: {'lr': 0.0004481454204147721, 'samples': 6315648, 'steps': 32893, 'loss/train': 1.518251895904541} -08/30/2021 19:11:05 - INFO - __main__ - Step 32895: {'lr': 0.0004481421844991498, 'samples': 6315840, 'steps': 32894, 'loss/train': 1.3641338348388672} -08/30/2021 19:11:05 - INFO - __main__ - Step 32896: {'lr': 0.00044813894849424777, 'samples': 6316032, 'steps': 32895, 'loss/train': 1.3225665092468262} -08/30/2021 19:11:05 - INFO - __main__ - Step 32897: {'lr': 0.0004481357124000672, 'samples': 6316224, 'steps': 32896, 'loss/train': 1.2750303745269775} -08/30/2021 19:11:06 - INFO - __main__ - Step 32898: {'lr': 0.0004481324762166099, 'samples': 6316416, 'steps': 32897, 'loss/train': 2.331758975982666} -08/30/2021 19:11:06 - INFO - __main__ - Step 32899: {'lr': 0.0004481292399438771, 'samples': 6316608, 'steps': 32898, 'loss/train': 1.3119992017745972} -08/30/2021 19:11:08 - INFO - __main__ - Step 32900: {'lr': 0.0004481260035818704, 'samples': 6316800, 'steps': 32899, 'loss/train': 2.2424676418304443} -08/30/2021 19:11:08 - INFO - __main__ - Step 32901: {'lr': 0.00044812276713059106, 'samples': 6316992, 'steps': 32900, 'loss/train': 1.5014487504959106} -08/30/2021 19:11:08 - INFO - __main__ - Step 32902: {'lr': 0.00044811953059004073, 'samples': 6317184, 'steps': 32901, 'loss/train': 1.6551412343978882} -08/30/2021 19:11:09 - INFO - __main__ - Step 32903: {'lr': 0.0004481162939602208, 'samples': 6317376, 'steps': 32902, 'loss/train': 1.285164713859558} -08/30/2021 19:11:09 - INFO - __main__ - Step 32904: {'lr': 0.0004481130572411327, 'samples': 6317568, 'steps': 32903, 'loss/train': 1.6648117303848267} -08/30/2021 19:11:10 - INFO - __main__ - Step 32905: {'lr': 0.00044810982043277795, 'samples': 6317760, 'steps': 32904, 'loss/train': 0.7461702823638916} -08/30/2021 19:11:11 - INFO - __main__ - Step 32906: {'lr': 0.0004481065835351579, 'samples': 6317952, 'steps': 32905, 'loss/train': 0.8383270502090454} -08/30/2021 19:11:12 - INFO - __main__ - Step 32907: {'lr': 0.0004481033465482741, 'samples': 6318144, 'steps': 32906, 'loss/train': 1.3237212896347046} -08/30/2021 19:11:12 - INFO - __main__ - Step 32908: {'lr': 0.00044810010947212803, 'samples': 6318336, 'steps': 32907, 'loss/train': 1.6517670154571533} -08/30/2021 19:11:13 - INFO - __main__ - Step 32909: {'lr': 0.00044809687230672115, 'samples': 6318528, 'steps': 32908, 'loss/train': 2.0691163539886475} -08/30/2021 19:11:13 - INFO - __main__ - Step 32910: {'lr': 0.0004480936350520548, 'samples': 6318720, 'steps': 32909, 'loss/train': 3.0470848083496094} -08/30/2021 19:11:13 - INFO - __main__ - Step 32911: {'lr': 0.0004480903977081305, 'samples': 6318912, 'steps': 32910, 'loss/train': 1.6182889938354492} -08/30/2021 19:11:15 - INFO - __main__ - Step 32912: {'lr': 0.00044808716027494973, 'samples': 6319104, 'steps': 32911, 'loss/train': 1.622750997543335} -08/30/2021 19:11:15 - INFO - __main__ - Step 32913: {'lr': 0.000448083922752514, 'samples': 6319296, 'steps': 32912, 'loss/train': 1.1536993980407715} -08/30/2021 19:11:16 - INFO - __main__ - Step 32914: {'lr': 0.00044808068514082467, 'samples': 6319488, 'steps': 32913, 'loss/train': 1.4181472063064575} -08/30/2021 19:11:16 - INFO - __main__ - Step 32915: {'lr': 0.0004480774474398832, 'samples': 6319680, 'steps': 32914, 'loss/train': 1.9158234596252441} -08/30/2021 19:11:16 - INFO - __main__ - Step 32916: {'lr': 0.00044807420964969113, 'samples': 6319872, 'steps': 32915, 'loss/train': 1.9926166534423828} -08/30/2021 19:11:18 - INFO - __main__ - Step 32917: {'lr': 0.0004480709717702499, 'samples': 6320064, 'steps': 32916, 'loss/train': 2.0427207946777344} -08/30/2021 19:11:19 - INFO - __main__ - Step 32918: {'lr': 0.000448067733801561, 'samples': 6320256, 'steps': 32917, 'loss/train': 1.439934253692627} -08/30/2021 19:11:19 - INFO - __main__ - Step 32919: {'lr': 0.00044806449574362575, 'samples': 6320448, 'steps': 32918, 'loss/train': 1.6649162769317627} -08/30/2021 19:11:19 - INFO - __main__ - Step 32920: {'lr': 0.00044806125759644567, 'samples': 6320640, 'steps': 32919, 'loss/train': 1.4974573850631714} -08/30/2021 19:11:20 - INFO - __main__ - Step 32921: {'lr': 0.00044805801936002225, 'samples': 6320832, 'steps': 32920, 'loss/train': 7.483266353607178} -08/30/2021 19:11:20 - INFO - __main__ - Step 32922: {'lr': 0.00044805478103435707, 'samples': 6321024, 'steps': 32921, 'loss/train': 1.9284188747406006} -08/30/2021 19:11:22 - INFO - __main__ - Step 32923: {'lr': 0.0004480515426194513, 'samples': 6321216, 'steps': 32922, 'loss/train': 1.7512258291244507} -08/30/2021 19:11:23 - INFO - __main__ - Step 32924: {'lr': 0.0004480483041153066, 'samples': 6321408, 'steps': 32923, 'loss/train': 2.1436784267425537} -08/30/2021 19:11:23 - INFO - __main__ - Step 32925: {'lr': 0.00044804506552192447, 'samples': 6321600, 'steps': 32924, 'loss/train': 1.8077055215835571} -08/30/2021 19:11:23 - INFO - __main__ - Step 32926: {'lr': 0.0004480418268393062, 'samples': 6321792, 'steps': 32925, 'loss/train': 1.9932621717453003} -08/30/2021 19:11:24 - INFO - __main__ - Step 32927: {'lr': 0.0004480385880674534, 'samples': 6321984, 'steps': 32926, 'loss/train': 1.8775341510772705} -08/30/2021 19:11:26 - INFO - __main__ - Step 32928: {'lr': 0.00044803534920636744, 'samples': 6322176, 'steps': 32927, 'loss/train': 1.1780743598937988} -08/30/2021 19:11:26 - INFO - __main__ - Step 32929: {'lr': 0.00044803211025604985, 'samples': 6322368, 'steps': 32928, 'loss/train': 1.2579072713851929} -08/30/2021 19:11:26 - INFO - __main__ - Step 32930: {'lr': 0.000448028871216502, 'samples': 6322560, 'steps': 32929, 'loss/train': 0.7032141089439392} -08/30/2021 19:11:27 - INFO - __main__ - Step 32931: {'lr': 0.0004480256320877254, 'samples': 6322752, 'steps': 32930, 'loss/train': 0.545499324798584} -08/30/2021 19:11:27 - INFO - __main__ - Step 32932: {'lr': 0.00044802239286972147, 'samples': 6322944, 'steps': 32931, 'loss/train': 1.4685508012771606} -08/30/2021 19:11:27 - INFO - __main__ - Step 32933: {'lr': 0.0004480191535624918, 'samples': 6323136, 'steps': 32932, 'loss/train': 0.3264021575450897} -08/30/2021 19:11:29 - INFO - __main__ - Step 32934: {'lr': 0.0004480159141660377, 'samples': 6323328, 'steps': 32933, 'loss/train': 0.9525347948074341} -08/30/2021 19:11:30 - INFO - __main__ - Step 32935: {'lr': 0.00044801267468036064, 'samples': 6323520, 'steps': 32934, 'loss/train': 1.7658441066741943} -08/30/2021 19:11:30 - INFO - __main__ - Step 32936: {'lr': 0.0004480094351054622, 'samples': 6323712, 'steps': 32935, 'loss/train': 1.2192119359970093} -08/30/2021 19:11:30 - INFO - __main__ - Step 32937: {'lr': 0.00044800619544134375, 'samples': 6323904, 'steps': 32936, 'loss/train': 1.8914642333984375} -08/30/2021 19:11:31 - INFO - __main__ - Step 32938: {'lr': 0.00044800295568800673, 'samples': 6324096, 'steps': 32937, 'loss/train': 2.274127721786499} -08/30/2021 19:11:31 - INFO - __main__ - Step 32939: {'lr': 0.0004479997158454526, 'samples': 6324288, 'steps': 32938, 'loss/train': 3.3844077587127686} -08/30/2021 19:11:32 - INFO - __main__ - Step 32940: {'lr': 0.00044799647591368296, 'samples': 6324480, 'steps': 32939, 'loss/train': 1.9486433267593384} -08/30/2021 19:11:33 - INFO - __main__ - Step 32941: {'lr': 0.00044799323589269914, 'samples': 6324672, 'steps': 32940, 'loss/train': 1.6158136129379272} -08/30/2021 19:11:33 - INFO - __main__ - Step 32942: {'lr': 0.00044798999578250255, 'samples': 6324864, 'steps': 32941, 'loss/train': 1.310711145401001} -08/30/2021 19:11:34 - INFO - __main__ - Step 32943: {'lr': 0.0004479867555830948, 'samples': 6325056, 'steps': 32942, 'loss/train': 1.3904486894607544} -08/30/2021 19:11:34 - INFO - __main__ - Step 32944: {'lr': 0.0004479835152944772, 'samples': 6325248, 'steps': 32943, 'loss/train': 1.6982293128967285} -08/30/2021 19:11:35 - INFO - __main__ - Step 32945: {'lr': 0.00044798027491665135, 'samples': 6325440, 'steps': 32944, 'loss/train': 1.9827361106872559} -08/30/2021 19:11:36 - INFO - __main__ - Step 32946: {'lr': 0.00044797703444961857, 'samples': 6325632, 'steps': 32945, 'loss/train': 1.3845924139022827} -08/30/2021 19:11:36 - INFO - __main__ - Step 32947: {'lr': 0.00044797379389338045, 'samples': 6325824, 'steps': 32946, 'loss/train': 2.106088876724243} -08/30/2021 19:11:37 - INFO - __main__ - Step 32948: {'lr': 0.0004479705532479384, 'samples': 6326016, 'steps': 32947, 'loss/train': 1.5674136877059937} -08/30/2021 19:11:37 - INFO - __main__ - Step 32949: {'lr': 0.0004479673125132938, 'samples': 6326208, 'steps': 32948, 'loss/train': 1.493359088897705} -08/30/2021 19:11:39 - INFO - __main__ - Step 32950: {'lr': 0.0004479640716894483, 'samples': 6326400, 'steps': 32949, 'loss/train': 1.832162857055664} -08/30/2021 19:11:39 - INFO - __main__ - Step 32951: {'lr': 0.00044796083077640314, 'samples': 6326592, 'steps': 32950, 'loss/train': 1.3775365352630615} -08/30/2021 19:11:39 - INFO - __main__ - Step 32952: {'lr': 0.00044795758977416, 'samples': 6326784, 'steps': 32951, 'loss/train': 1.848576307296753} -08/30/2021 19:11:40 - INFO - __main__ - Step 32953: {'lr': 0.0004479543486827201, 'samples': 6326976, 'steps': 32952, 'loss/train': 1.3696128129959106} -08/30/2021 19:11:40 - INFO - __main__ - Step 32954: {'lr': 0.0004479511075020851, 'samples': 6327168, 'steps': 32953, 'loss/train': 1.454092025756836} -08/30/2021 19:11:42 - INFO - __main__ - Step 32955: {'lr': 0.00044794786623225636, 'samples': 6327360, 'steps': 32954, 'loss/train': 1.6693100929260254} -08/30/2021 19:11:42 - INFO - __main__ - Step 32956: {'lr': 0.0004479446248732354, 'samples': 6327552, 'steps': 32955, 'loss/train': 1.5475125312805176} -08/30/2021 19:11:43 - INFO - __main__ - Step 32957: {'lr': 0.00044794138342502354, 'samples': 6327744, 'steps': 32956, 'loss/train': 1.6520280838012695} -08/30/2021 19:11:43 - INFO - __main__ - Step 32958: {'lr': 0.0004479381418876225, 'samples': 6327936, 'steps': 32957, 'loss/train': 1.093580722808838} -08/30/2021 19:11:43 - INFO - __main__ - Step 32959: {'lr': 0.00044793490026103346, 'samples': 6328128, 'steps': 32958, 'loss/train': 1.9214324951171875} -08/30/2021 19:11:44 - INFO - __main__ - Step 32960: {'lr': 0.0004479316585452581, 'samples': 6328320, 'steps': 32959, 'loss/train': 1.2760549783706665} -08/30/2021 19:11:45 - INFO - __main__ - Step 32961: {'lr': 0.0004479284167402977, 'samples': 6328512, 'steps': 32960, 'loss/train': 0.21415410935878754} -08/30/2021 19:11:46 - INFO - __main__ - Step 32962: {'lr': 0.00044792517484615384, 'samples': 6328704, 'steps': 32961, 'loss/train': 1.455647349357605} -08/30/2021 19:11:46 - INFO - __main__ - Step 32963: {'lr': 0.000447921932862828, 'samples': 6328896, 'steps': 32962, 'loss/train': 1.6069492101669312} -08/30/2021 19:11:46 - INFO - __main__ - Step 32964: {'lr': 0.00044791869079032154, 'samples': 6329088, 'steps': 32963, 'loss/train': 0.2214856892824173} -08/30/2021 19:11:47 - INFO - __main__ - Step 32965: {'lr': 0.000447915448628636, 'samples': 6329280, 'steps': 32964, 'loss/train': 1.82004714012146} -08/30/2021 19:11:48 - INFO - __main__ - Step 32966: {'lr': 0.0004479122063777728, 'samples': 6329472, 'steps': 32965, 'loss/train': 1.7380435466766357} -08/30/2021 19:11:49 - INFO - __main__ - Step 32967: {'lr': 0.0004479089640377334, 'samples': 6329664, 'steps': 32966, 'loss/train': 1.6890532970428467} -08/30/2021 19:11:49 - INFO - __main__ - Step 32968: {'lr': 0.00044790572160851926, 'samples': 6329856, 'steps': 32967, 'loss/train': 1.6374168395996094} -08/30/2021 19:11:49 - INFO - __main__ - Step 32969: {'lr': 0.00044790247909013195, 'samples': 6330048, 'steps': 32968, 'loss/train': 1.3972340822219849} -08/30/2021 19:11:50 - INFO - __main__ - Step 32970: {'lr': 0.0004478992364825728, 'samples': 6330240, 'steps': 32969, 'loss/train': 2.006917953491211} -08/30/2021 19:11:51 - INFO - __main__ - Step 32971: {'lr': 0.00044789599378584324, 'samples': 6330432, 'steps': 32970, 'loss/train': 2.019718647003174} -08/30/2021 19:11:52 - INFO - __main__ - Step 32972: {'lr': 0.0004478927509999449, 'samples': 6330624, 'steps': 32971, 'loss/train': 1.4682337045669556} -08/30/2021 19:11:52 - INFO - __main__ - Step 32973: {'lr': 0.00044788950812487907, 'samples': 6330816, 'steps': 32972, 'loss/train': 1.6100172996520996} -08/30/2021 19:11:53 - INFO - __main__ - Step 32974: {'lr': 0.0004478862651606472, 'samples': 6331008, 'steps': 32973, 'loss/train': 1.8336241245269775} -08/30/2021 19:11:53 - INFO - __main__ - Step 32975: {'lr': 0.000447883022107251, 'samples': 6331200, 'steps': 32974, 'loss/train': 0.11317329853773117} -08/30/2021 19:11:55 - INFO - __main__ - Step 32976: {'lr': 0.00044787977896469167, 'samples': 6331392, 'steps': 32975, 'loss/train': 1.674653172492981} -08/30/2021 19:11:56 - INFO - __main__ - Step 32977: {'lr': 0.0004478765357329708, 'samples': 6331584, 'steps': 32976, 'loss/train': 0.08602840453386307} -08/30/2021 19:11:56 - INFO - __main__ - Step 32978: {'lr': 0.0004478732924120897, 'samples': 6331776, 'steps': 32977, 'loss/train': 5.00439977645874} -08/30/2021 19:11:56 - INFO - __main__ - Step 32979: {'lr': 0.0004478700490020501, 'samples': 6331968, 'steps': 32978, 'loss/train': 1.5188087224960327} -08/30/2021 19:11:57 - INFO - __main__ - Step 32980: {'lr': 0.0004478668055028533, 'samples': 6332160, 'steps': 32979, 'loss/train': 1.8274298906326294} -08/30/2021 19:11:58 - INFO - __main__ - Step 32981: {'lr': 0.0004478635619145007, 'samples': 6332352, 'steps': 32980, 'loss/train': 0.07970250397920609} -08/30/2021 19:11:59 - INFO - __main__ - Step 32982: {'lr': 0.00044786031823699384, 'samples': 6332544, 'steps': 32981, 'loss/train': 0.8789415955543518} -08/30/2021 19:11:59 - INFO - __main__ - Step 32983: {'lr': 0.0004478570744703342, 'samples': 6332736, 'steps': 32982, 'loss/train': 2.237499475479126} -08/30/2021 19:12:00 - INFO - __main__ - Step 32984: {'lr': 0.00044785383061452324, 'samples': 6332928, 'steps': 32983, 'loss/train': 1.8818144798278809} -08/30/2021 19:12:00 - INFO - __main__ - Step 32985: {'lr': 0.00044785058666956234, 'samples': 6333120, 'steps': 32984, 'loss/train': 1.673393726348877} -08/30/2021 19:12:02 - INFO - __main__ - Step 32986: {'lr': 0.000447847342635453, 'samples': 6333312, 'steps': 32985, 'loss/train': 1.3741319179534912} -08/30/2021 19:12:02 - INFO - __main__ - Step 32987: {'lr': 0.00044784409851219675, 'samples': 6333504, 'steps': 32986, 'loss/train': 1.6277153491973877} -08/30/2021 19:12:02 - INFO - __main__ - Step 32988: {'lr': 0.00044784085429979504, 'samples': 6333696, 'steps': 32987, 'loss/train': 1.3665305376052856} -08/30/2021 19:12:03 - INFO - __main__ - Step 32989: {'lr': 0.00044783760999824926, 'samples': 6333888, 'steps': 32988, 'loss/train': 1.4518558979034424} -08/30/2021 19:12:03 - INFO - __main__ - Step 32990: {'lr': 0.00044783436560756086, 'samples': 6334080, 'steps': 32989, 'loss/train': 1.3715745210647583} -08/30/2021 19:12:05 - INFO - __main__ - Step 32991: {'lr': 0.00044783112112773137, 'samples': 6334272, 'steps': 32990, 'loss/train': 0.1078360378742218} -08/30/2021 19:12:06 - INFO - __main__ - Step 32992: {'lr': 0.0004478278765587623, 'samples': 6334464, 'steps': 32991, 'loss/train': 1.7439976930618286} -08/30/2021 19:12:06 - INFO - __main__ - Step 32993: {'lr': 0.000447824631900655, 'samples': 6334656, 'steps': 32992, 'loss/train': 1.2109761238098145} -08/30/2021 19:12:06 - INFO - __main__ - Step 32994: {'lr': 0.00044782138715341094, 'samples': 6334848, 'steps': 32993, 'loss/train': 1.4433255195617676} -08/30/2021 19:12:07 - INFO - __main__ - Step 32995: {'lr': 0.00044781814231703164, 'samples': 6335040, 'steps': 32994, 'loss/train': 0.19289101660251617} -08/30/2021 19:12:07 - INFO - __main__ - Step 32996: {'lr': 0.00044781489739151856, 'samples': 6335232, 'steps': 32995, 'loss/train': 0.1301116943359375} -08/30/2021 19:12:07 - INFO - __main__ - Step 32997: {'lr': 0.00044781165237687306, 'samples': 6335424, 'steps': 32996, 'loss/train': 1.980476975440979} -08/30/2021 19:12:09 - INFO - __main__ - Step 32998: {'lr': 0.00044780840727309676, 'samples': 6335616, 'steps': 32997, 'loss/train': 1.5653765201568604} -08/30/2021 19:12:10 - INFO - __main__ - Step 32999: {'lr': 0.000447805162080191, 'samples': 6335808, 'steps': 32998, 'loss/train': 1.941420555114746} -08/30/2021 19:12:10 - INFO - __main__ - Step 33000: {'lr': 0.0004478019167981573, 'samples': 6336000, 'steps': 32999, 'loss/train': 2.404331922531128} -08/30/2021 19:12:10 - INFO - __main__ - Step 33001: {'lr': 0.00044779867142699713, 'samples': 6336192, 'steps': 33000, 'loss/train': 1.3778611421585083} -08/30/2021 19:12:11 - INFO - __main__ - Step 33002: {'lr': 0.0004477954259667119, 'samples': 6336384, 'steps': 33001, 'loss/train': 0.4002549648284912} -08/30/2021 19:12:12 - INFO - __main__ - Step 33003: {'lr': 0.00044779218041730314, 'samples': 6336576, 'steps': 33002, 'loss/train': 1.8848958015441895} -08/30/2021 19:12:13 - INFO - __main__ - Step 33004: {'lr': 0.00044778893477877225, 'samples': 6336768, 'steps': 33003, 'loss/train': 1.8599143028259277} -08/30/2021 19:12:13 - INFO - __main__ - Step 33005: {'lr': 0.0004477856890511207, 'samples': 6336960, 'steps': 33004, 'loss/train': 2.093334436416626} -08/30/2021 19:12:13 - INFO - __main__ - Step 33006: {'lr': 0.00044778244323435, 'samples': 6337152, 'steps': 33005, 'loss/train': 0.7927687764167786} -08/30/2021 19:12:14 - INFO - __main__ - Step 33007: {'lr': 0.0004477791973284616, 'samples': 6337344, 'steps': 33006, 'loss/train': 1.536917805671692} -08/30/2021 19:12:15 - INFO - __main__ - Step 33008: {'lr': 0.00044777595133345686, 'samples': 6337536, 'steps': 33007, 'loss/train': 2.1827054023742676} -08/30/2021 19:12:16 - INFO - __main__ - Step 33009: {'lr': 0.0004477727052493374, 'samples': 6337728, 'steps': 33008, 'loss/train': 1.6933008432388306} -08/30/2021 19:12:16 - INFO - __main__ - Step 33010: {'lr': 0.0004477694590761046, 'samples': 6337920, 'steps': 33009, 'loss/train': 1.3053333759307861} -08/30/2021 19:12:16 - INFO - __main__ - Step 33011: {'lr': 0.00044776621281375994, 'samples': 6338112, 'steps': 33010, 'loss/train': 1.5660881996154785} -08/30/2021 19:12:17 - INFO - __main__ - Step 33012: {'lr': 0.00044776296646230487, 'samples': 6338304, 'steps': 33011, 'loss/train': 1.2377856969833374} -08/30/2021 19:12:18 - INFO - __main__ - Step 33013: {'lr': 0.00044775972002174085, 'samples': 6338496, 'steps': 33012, 'loss/train': 1.8807965517044067} -08/30/2021 19:12:19 - INFO - __main__ - Step 33014: {'lr': 0.0004477564734920694, 'samples': 6338688, 'steps': 33013, 'loss/train': 2.111697196960449} -08/30/2021 19:12:19 - INFO - __main__ - Step 33015: {'lr': 0.0004477532268732919, 'samples': 6338880, 'steps': 33014, 'loss/train': 1.398719072341919} -08/30/2021 19:12:19 - INFO - __main__ - Step 33016: {'lr': 0.00044774998016540977, 'samples': 6339072, 'steps': 33015, 'loss/train': 1.5961471796035767} -08/30/2021 19:12:20 - INFO - __main__ - Step 33017: {'lr': 0.00044774673336842464, 'samples': 6339264, 'steps': 33016, 'loss/train': 1.4610909223556519} -08/30/2021 19:12:21 - INFO - __main__ - Step 33018: {'lr': 0.0004477434864823379, 'samples': 6339456, 'steps': 33017, 'loss/train': 1.4359678030014038} -08/30/2021 19:12:22 - INFO - __main__ - Step 33019: {'lr': 0.00044774023950715095, 'samples': 6339648, 'steps': 33018, 'loss/train': 1.4415203332901} -08/30/2021 19:12:22 - INFO - __main__ - Step 33020: {'lr': 0.0004477369924428653, 'samples': 6339840, 'steps': 33019, 'loss/train': 2.5177664756774902} -08/30/2021 19:12:23 - INFO - __main__ - Step 33021: {'lr': 0.0004477337452894824, 'samples': 6340032, 'steps': 33020, 'loss/train': 1.6190192699432373} -08/30/2021 19:12:23 - INFO - __main__ - Step 33022: {'lr': 0.0004477304980470038, 'samples': 6340224, 'steps': 33021, 'loss/train': 1.6459637880325317} -08/30/2021 19:12:23 - INFO - __main__ - Step 33023: {'lr': 0.0004477272507154308, 'samples': 6340416, 'steps': 33022, 'loss/train': 1.5261080265045166} -08/30/2021 19:12:25 - INFO - __main__ - Step 33024: {'lr': 0.00044772400329476505, 'samples': 6340608, 'steps': 33023, 'loss/train': 1.8532192707061768} -08/30/2021 19:12:25 - INFO - __main__ - Step 33025: {'lr': 0.0004477207557850078, 'samples': 6340800, 'steps': 33024, 'loss/train': 2.0004000663757324} -08/30/2021 19:12:26 - INFO - __main__ - Step 33026: {'lr': 0.00044771750818616067, 'samples': 6340992, 'steps': 33025, 'loss/train': 1.6905608177185059} -08/30/2021 19:12:26 - INFO - __main__ - Step 33027: {'lr': 0.0004477142604982251, 'samples': 6341184, 'steps': 33026, 'loss/train': 1.8551526069641113} -08/30/2021 19:12:26 - INFO - __main__ - Step 33028: {'lr': 0.0004477110127212025, 'samples': 6341376, 'steps': 33027, 'loss/train': 1.2083057165145874} -08/30/2021 19:12:28 - INFO - __main__ - Step 33029: {'lr': 0.00044770776485509445, 'samples': 6341568, 'steps': 33028, 'loss/train': 1.5260268449783325} -08/30/2021 19:12:28 - INFO - __main__ - Step 33030: {'lr': 0.00044770451689990227, 'samples': 6341760, 'steps': 33029, 'loss/train': 5.980719089508057} -08/30/2021 19:12:29 - INFO - __main__ - Step 33031: {'lr': 0.0004477012688556275, 'samples': 6341952, 'steps': 33030, 'loss/train': 1.6847401857376099} -08/30/2021 19:12:29 - INFO - __main__ - Step 33032: {'lr': 0.0004476980207222716, 'samples': 6342144, 'steps': 33031, 'loss/train': 1.6102837324142456} -08/30/2021 19:12:29 - INFO - __main__ - Step 33033: {'lr': 0.00044769477249983596, 'samples': 6342336, 'steps': 33032, 'loss/train': 2.2273123264312744} -08/30/2021 19:12:32 - INFO - __main__ - Step 33034: {'lr': 0.00044769152418832215, 'samples': 6342528, 'steps': 33033, 'loss/train': 1.6433876752853394} -08/30/2021 19:12:32 - INFO - __main__ - Step 33035: {'lr': 0.00044768827578773164, 'samples': 6342720, 'steps': 33034, 'loss/train': 2.5449917316436768} -08/30/2021 19:12:32 - INFO - __main__ - Step 33036: {'lr': 0.00044768502729806574, 'samples': 6342912, 'steps': 33035, 'loss/train': 0.0667106881737709} -08/30/2021 19:12:33 - INFO - __main__ - Step 33037: {'lr': 0.0004476817787193261, 'samples': 6343104, 'steps': 33036, 'loss/train': 1.247261881828308} -08/30/2021 19:12:33 - INFO - __main__ - Step 33038: {'lr': 0.0004476785300515141, 'samples': 6343296, 'steps': 33037, 'loss/train': 1.3547941446304321} -08/30/2021 19:12:33 - INFO - __main__ - Step 33039: {'lr': 0.0004476752812946312, 'samples': 6343488, 'steps': 33038, 'loss/train': 1.5243659019470215} -08/30/2021 19:12:35 - INFO - __main__ - Step 33040: {'lr': 0.0004476720324486788, 'samples': 6343680, 'steps': 33039, 'loss/train': 1.8858058452606201} -08/30/2021 19:12:36 - INFO - __main__ - Step 33041: {'lr': 0.0004476687835136585, 'samples': 6343872, 'steps': 33040, 'loss/train': 1.2914764881134033} -08/30/2021 19:12:36 - INFO - __main__ - Step 33042: {'lr': 0.0004476655344895717, 'samples': 6344064, 'steps': 33041, 'loss/train': 1.6910029649734497} -08/30/2021 19:12:36 - INFO - __main__ - Step 33043: {'lr': 0.0004476622853764198, 'samples': 6344256, 'steps': 33042, 'loss/train': 1.7504358291625977} -08/30/2021 19:12:37 - INFO - __main__ - Step 33044: {'lr': 0.00044765903617420436, 'samples': 6344448, 'steps': 33043, 'loss/train': 1.9688754081726074} -08/30/2021 19:12:38 - INFO - __main__ - Step 33045: {'lr': 0.00044765578688292686, 'samples': 6344640, 'steps': 33044, 'loss/train': 0.7051455974578857} -08/30/2021 19:12:39 - INFO - __main__ - Step 33046: {'lr': 0.0004476525375025886, 'samples': 6344832, 'steps': 33045, 'loss/train': 1.9232351779937744} -08/30/2021 19:12:39 - INFO - __main__ - Step 33047: {'lr': 0.00044764928803319126, 'samples': 6345024, 'steps': 33046, 'loss/train': 1.4300377368927002} -08/30/2021 19:12:39 - INFO - __main__ - Step 33048: {'lr': 0.00044764603847473615, 'samples': 6345216, 'steps': 33047, 'loss/train': 0.5969157218933105} -08/30/2021 19:12:40 - INFO - __main__ - Step 33049: {'lr': 0.0004476427888272248, 'samples': 6345408, 'steps': 33048, 'loss/train': 1.9350742101669312} -08/30/2021 19:12:41 - INFO - __main__ - Step 33050: {'lr': 0.0004476395390906586, 'samples': 6345600, 'steps': 33049, 'loss/train': 1.226161241531372} -08/30/2021 19:12:42 - INFO - __main__ - Step 33051: {'lr': 0.0004476362892650392, 'samples': 6345792, 'steps': 33050, 'loss/train': 1.5873152017593384} -08/30/2021 19:12:42 - INFO - __main__ - Step 33052: {'lr': 0.0004476330393503678, 'samples': 6345984, 'steps': 33051, 'loss/train': 1.6476330757141113} -08/30/2021 19:12:43 - INFO - __main__ - Step 33053: {'lr': 0.0004476297893466461, 'samples': 6346176, 'steps': 33052, 'loss/train': 1.7915680408477783} -08/30/2021 19:12:43 - INFO - __main__ - Step 33054: {'lr': 0.0004476265392538754, 'samples': 6346368, 'steps': 33053, 'loss/train': 1.0926499366760254} -08/30/2021 19:12:43 - INFO - __main__ - Step 33055: {'lr': 0.0004476232890720573, 'samples': 6346560, 'steps': 33054, 'loss/train': 1.1330680847167969} -08/30/2021 19:12:45 - INFO - __main__ - Step 33056: {'lr': 0.0004476200388011932, 'samples': 6346752, 'steps': 33055, 'loss/train': 1.607593059539795} -08/30/2021 19:12:46 - INFO - __main__ - Step 33057: {'lr': 0.0004476167884412845, 'samples': 6346944, 'steps': 33056, 'loss/train': 1.01962149143219} -08/30/2021 19:12:46 - INFO - __main__ - Step 33058: {'lr': 0.00044761353799233273, 'samples': 6347136, 'steps': 33057, 'loss/train': 0.11563754081726074} -08/30/2021 19:12:46 - INFO - __main__ - Step 33059: {'lr': 0.00044761028745433934, 'samples': 6347328, 'steps': 33058, 'loss/train': 0.08049215376377106} -08/30/2021 19:12:47 - INFO - __main__ - Step 33060: {'lr': 0.00044760703682730584, 'samples': 6347520, 'steps': 33059, 'loss/train': 1.53285551071167} -08/30/2021 19:12:47 - INFO - __main__ - Step 33061: {'lr': 0.00044760378611123365, 'samples': 6347712, 'steps': 33060, 'loss/train': 1.7963281869888306} -08/30/2021 19:12:48 - INFO - __main__ - Step 33062: {'lr': 0.0004476005353061242, 'samples': 6347904, 'steps': 33061, 'loss/train': 1.6620819568634033} -08/30/2021 19:12:49 - INFO - __main__ - Step 33063: {'lr': 0.00044759728441197904, 'samples': 6348096, 'steps': 33062, 'loss/train': 1.6632779836654663} -08/30/2021 19:12:49 - INFO - __main__ - Step 33064: {'lr': 0.0004475940334287996, 'samples': 6348288, 'steps': 33063, 'loss/train': 1.3440567255020142} -08/30/2021 19:12:50 - INFO - __main__ - Step 33065: {'lr': 0.0004475907823565873, 'samples': 6348480, 'steps': 33064, 'loss/train': 0.9957197904586792} -08/30/2021 19:12:50 - INFO - __main__ - Step 33066: {'lr': 0.00044758753119534373, 'samples': 6348672, 'steps': 33065, 'loss/train': 1.9893556833267212} -08/30/2021 19:12:51 - INFO - __main__ - Step 33067: {'lr': 0.0004475842799450702, 'samples': 6348864, 'steps': 33066, 'loss/train': 1.7364380359649658} -08/30/2021 19:12:52 - INFO - __main__ - Step 33068: {'lr': 0.0004475810286057682, 'samples': 6349056, 'steps': 33067, 'loss/train': 1.8391367197036743} -08/30/2021 19:12:52 - INFO - __main__ - Step 33069: {'lr': 0.0004475777771774393, 'samples': 6349248, 'steps': 33068, 'loss/train': 1.7055121660232544} -08/30/2021 19:12:53 - INFO - __main__ - Step 33070: {'lr': 0.00044757452566008497, 'samples': 6349440, 'steps': 33069, 'loss/train': 1.9024608135223389} -08/30/2021 19:12:53 - INFO - __main__ - Step 33071: {'lr': 0.00044757127405370645, 'samples': 6349632, 'steps': 33070, 'loss/train': 1.6867916584014893} -08/30/2021 19:12:55 - INFO - __main__ - Step 33072: {'lr': 0.00044756802235830544, 'samples': 6349824, 'steps': 33071, 'loss/train': 1.8088105916976929} -08/30/2021 19:12:55 - INFO - __main__ - Step 33073: {'lr': 0.00044756477057388336, 'samples': 6350016, 'steps': 33072, 'loss/train': 1.2027164697647095} -08/30/2021 19:12:55 - INFO - __main__ - Step 33074: {'lr': 0.0004475615187004416, 'samples': 6350208, 'steps': 33073, 'loss/train': 0.9536260366439819} -08/30/2021 19:12:56 - INFO - __main__ - Step 33075: {'lr': 0.0004475582667379817, 'samples': 6350400, 'steps': 33074, 'loss/train': 1.1013617515563965} -08/30/2021 19:12:56 - INFO - __main__ - Step 33076: {'lr': 0.0004475550146865051, 'samples': 6350592, 'steps': 33075, 'loss/train': 1.854211688041687} -08/30/2021 19:12:58 - INFO - __main__ - Step 33077: {'lr': 0.00044755176254601323, 'samples': 6350784, 'steps': 33076, 'loss/train': 1.4084270000457764} -08/30/2021 19:12:58 - INFO - __main__ - Step 33078: {'lr': 0.00044754851031650756, 'samples': 6350976, 'steps': 33077, 'loss/train': 1.800654649734497} -08/30/2021 19:12:58 - INFO - __main__ - Step 33079: {'lr': 0.0004475452579979896, 'samples': 6351168, 'steps': 33078, 'loss/train': 1.0381743907928467} -08/30/2021 19:12:59 - INFO - __main__ - Step 33080: {'lr': 0.00044754200559046076, 'samples': 6351360, 'steps': 33079, 'loss/train': 1.8039509057998657} -08/30/2021 19:12:59 - INFO - __main__ - Step 33081: {'lr': 0.0004475387530939226, 'samples': 6351552, 'steps': 33080, 'loss/train': 1.8570154905319214} -08/30/2021 19:13:00 - INFO - __main__ - Step 33082: {'lr': 0.00044753550050837654, 'samples': 6351744, 'steps': 33081, 'loss/train': 1.701557993888855} -08/30/2021 19:13:01 - INFO - __main__ - Step 33083: {'lr': 0.00044753224783382394, 'samples': 6351936, 'steps': 33082, 'loss/train': 1.9021730422973633} -08/30/2021 19:13:01 - INFO - __main__ - Step 33084: {'lr': 0.00044752899507026646, 'samples': 6352128, 'steps': 33083, 'loss/train': 2.026737689971924} -08/30/2021 19:13:02 - INFO - __main__ - Step 33085: {'lr': 0.00044752574221770537, 'samples': 6352320, 'steps': 33084, 'loss/train': 1.6364058256149292} -08/30/2021 19:13:02 - INFO - __main__ - Step 33086: {'lr': 0.0004475224892761423, 'samples': 6352512, 'steps': 33085, 'loss/train': 1.3327927589416504} -08/30/2021 19:13:04 - INFO - __main__ - Step 33087: {'lr': 0.00044751923624557866, 'samples': 6352704, 'steps': 33086, 'loss/train': 0.6286283731460571} -08/30/2021 19:13:05 - INFO - __main__ - Step 33088: {'lr': 0.0004475159831260158, 'samples': 6352896, 'steps': 33087, 'loss/train': 1.3041417598724365} -08/30/2021 19:13:05 - INFO - __main__ - Step 33089: {'lr': 0.00044751272991745537, 'samples': 6353088, 'steps': 33088, 'loss/train': 3.555285930633545} -08/30/2021 19:13:05 - INFO - __main__ - Step 33090: {'lr': 0.00044750947661989873, 'samples': 6353280, 'steps': 33089, 'loss/train': 1.0919694900512695} -08/30/2021 19:13:06 - INFO - __main__ - Step 33091: {'lr': 0.0004475062232333474, 'samples': 6353472, 'steps': 33090, 'loss/train': 1.493559718132019} -08/30/2021 19:13:06 - INFO - __main__ - Step 33092: {'lr': 0.00044750296975780277, 'samples': 6353664, 'steps': 33091, 'loss/train': 1.5346654653549194} -08/30/2021 19:13:08 - INFO - __main__ - Step 33093: {'lr': 0.00044749971619326633, 'samples': 6353856, 'steps': 33092, 'loss/train': 1.525938868522644} -08/30/2021 19:13:08 - INFO - __main__ - Step 33094: {'lr': 0.0004474964625397396, 'samples': 6354048, 'steps': 33093, 'loss/train': 1.625862956047058} -08/30/2021 19:13:08 - INFO - __main__ - Step 33095: {'lr': 0.000447493208797224, 'samples': 6354240, 'steps': 33094, 'loss/train': 1.7917357683181763} -08/30/2021 19:13:09 - INFO - __main__ - Step 33096: {'lr': 0.00044748995496572105, 'samples': 6354432, 'steps': 33095, 'loss/train': 1.6030538082122803} -08/30/2021 19:13:09 - INFO - __main__ - Step 33097: {'lr': 0.0004474867010452321, 'samples': 6354624, 'steps': 33096, 'loss/train': 1.8729901313781738} -08/30/2021 19:13:10 - INFO - __main__ - Step 33098: {'lr': 0.0004474834470357587, 'samples': 6354816, 'steps': 33097, 'loss/train': 1.107359528541565} -08/30/2021 19:13:11 - INFO - __main__ - Step 33099: {'lr': 0.00044748019293730236, 'samples': 6355008, 'steps': 33098, 'loss/train': 0.8696691393852234} -08/30/2021 19:13:11 - INFO - __main__ - Step 33100: {'lr': 0.0004474769387498645, 'samples': 6355200, 'steps': 33099, 'loss/train': 1.7910774946212769} -08/30/2021 19:13:12 - INFO - __main__ - Step 33101: {'lr': 0.0004474736844734465, 'samples': 6355392, 'steps': 33100, 'loss/train': 1.6372565031051636} -08/30/2021 19:13:12 - INFO - __main__ - Step 33102: {'lr': 0.00044747043010805, 'samples': 6355584, 'steps': 33101, 'loss/train': 1.4538310766220093} -08/30/2021 19:13:13 - INFO - __main__ - Step 33103: {'lr': 0.0004474671756536763, 'samples': 6355776, 'steps': 33102, 'loss/train': 1.3681963682174683} -08/30/2021 19:13:14 - INFO - __main__ - Step 33104: {'lr': 0.00044746392111032695, 'samples': 6355968, 'steps': 33103, 'loss/train': 1.4618077278137207} -08/30/2021 19:13:14 - INFO - __main__ - Step 33105: {'lr': 0.00044746066647800343, 'samples': 6356160, 'steps': 33104, 'loss/train': 0.48403170704841614} -08/30/2021 19:13:15 - INFO - __main__ - Step 33106: {'lr': 0.0004474574117567072, 'samples': 6356352, 'steps': 33105, 'loss/train': 1.8794381618499756} -08/30/2021 19:13:15 - INFO - __main__ - Step 33107: {'lr': 0.00044745415694643964, 'samples': 6356544, 'steps': 33106, 'loss/train': 1.640065312385559} -08/30/2021 19:13:16 - INFO - __main__ - Step 33108: {'lr': 0.0004474509020472023, 'samples': 6356736, 'steps': 33107, 'loss/train': 0.6567052602767944} -08/30/2021 19:13:17 - INFO - __main__ - Step 33109: {'lr': 0.0004474476470589967, 'samples': 6356928, 'steps': 33108, 'loss/train': 1.7657300233840942} -08/30/2021 19:13:17 - INFO - __main__ - Step 33110: {'lr': 0.0004474443919818241, 'samples': 6357120, 'steps': 33109, 'loss/train': 1.5498692989349365} -08/30/2021 19:13:18 - INFO - __main__ - Step 33111: {'lr': 0.0004474411368156862, 'samples': 6357312, 'steps': 33110, 'loss/train': 1.566171407699585} -08/30/2021 19:13:18 - INFO - __main__ - Step 33112: {'lr': 0.00044743788156058437, 'samples': 6357504, 'steps': 33111, 'loss/train': 1.715635061264038} -08/30/2021 19:13:19 - INFO - __main__ - Step 33113: {'lr': 0.00044743462621652007, 'samples': 6357696, 'steps': 33112, 'loss/train': 0.8535028696060181} -08/30/2021 19:13:20 - INFO - __main__ - Step 33114: {'lr': 0.0004474313707834947, 'samples': 6357888, 'steps': 33113, 'loss/train': 1.1664762496948242} -08/30/2021 19:13:20 - INFO - __main__ - Step 33115: {'lr': 0.00044742811526150996, 'samples': 6358080, 'steps': 33114, 'loss/train': 1.467318058013916} -08/30/2021 19:13:21 - INFO - __main__ - Step 33116: {'lr': 0.000447424859650567, 'samples': 6358272, 'steps': 33115, 'loss/train': 1.5273271799087524} -08/30/2021 19:13:21 - INFO - __main__ - Step 33117: {'lr': 0.00044742160395066756, 'samples': 6358464, 'steps': 33116, 'loss/train': 1.3869233131408691} -08/30/2021 19:13:22 - INFO - __main__ - Step 33118: {'lr': 0.0004474183481618129, 'samples': 6358656, 'steps': 33117, 'loss/train': 1.1732172966003418} -08/30/2021 19:13:23 - INFO - __main__ - Step 33119: {'lr': 0.00044741509228400465, 'samples': 6358848, 'steps': 33118, 'loss/train': 1.6598488092422485} -08/30/2021 19:13:23 - INFO - __main__ - Step 33120: {'lr': 0.0004474118363172441, 'samples': 6359040, 'steps': 33119, 'loss/train': 0.9198315739631653} -08/30/2021 19:13:24 - INFO - __main__ - Step 33121: {'lr': 0.000447408580261533, 'samples': 6359232, 'steps': 33120, 'loss/train': 0.8731750845909119} -08/30/2021 19:13:24 - INFO - __main__ - Step 33122: {'lr': 0.0004474053241168725, 'samples': 6359424, 'steps': 33121, 'loss/train': 1.7959306240081787} -08/30/2021 19:13:24 - INFO - __main__ - Step 33123: {'lr': 0.00044740206788326423, 'samples': 6359616, 'steps': 33122, 'loss/train': 1.8095154762268066} -08/30/2021 19:13:26 - INFO - __main__ - Step 33124: {'lr': 0.0004473988115607097, 'samples': 6359808, 'steps': 33123, 'loss/train': 2.0089199542999268} -08/30/2021 19:13:26 - INFO - __main__ - Step 33125: {'lr': 0.00044739555514921025, 'samples': 6360000, 'steps': 33124, 'loss/train': 0.3015340268611908} -08/30/2021 19:13:27 - INFO - __main__ - Step 33126: {'lr': 0.0004473922986487674, 'samples': 6360192, 'steps': 33125, 'loss/train': 1.557114601135254} -08/30/2021 19:13:27 - INFO - __main__ - Step 33127: {'lr': 0.00044738904205938264, 'samples': 6360384, 'steps': 33126, 'loss/train': 0.9553331136703491} -08/30/2021 19:13:27 - INFO - __main__ - Step 33128: {'lr': 0.00044738578538105746, 'samples': 6360576, 'steps': 33127, 'loss/train': 1.7851487398147583} -08/30/2021 19:13:29 - INFO - __main__ - Step 33129: {'lr': 0.0004473825286137933, 'samples': 6360768, 'steps': 33128, 'loss/train': 0.785422682762146} -08/30/2021 19:13:29 - INFO - __main__ - Step 33130: {'lr': 0.0004473792717575915, 'samples': 6360960, 'steps': 33129, 'loss/train': 1.3046597242355347} -08/30/2021 19:13:30 - INFO - __main__ - Step 33131: {'lr': 0.00044737601481245376, 'samples': 6361152, 'steps': 33130, 'loss/train': 1.1152418851852417} -08/30/2021 19:13:30 - INFO - __main__ - Step 33132: {'lr': 0.00044737275777838136, 'samples': 6361344, 'steps': 33131, 'loss/train': 1.2857109308242798} -08/30/2021 19:13:30 - INFO - __main__ - Step 33133: {'lr': 0.0004473695006553759, 'samples': 6361536, 'steps': 33132, 'loss/train': 1.2026758193969727} -08/30/2021 19:13:32 - INFO - __main__ - Step 33134: {'lr': 0.0004473662434434388, 'samples': 6361728, 'steps': 33133, 'loss/train': 1.7568212747573853} -08/30/2021 19:13:32 - INFO - __main__ - Step 33135: {'lr': 0.00044736298614257144, 'samples': 6361920, 'steps': 33134, 'loss/train': 1.3744275569915771} -08/30/2021 19:13:33 - INFO - __main__ - Step 33136: {'lr': 0.0004473597287527754, 'samples': 6362112, 'steps': 33135, 'loss/train': 1.0194183588027954} -08/30/2021 19:13:33 - INFO - __main__ - Step 33137: {'lr': 0.00044735647127405216, 'samples': 6362304, 'steps': 33136, 'loss/train': 0.7607768774032593} -08/30/2021 19:13:33 - INFO - __main__ - Step 33138: {'lr': 0.00044735321370640316, 'samples': 6362496, 'steps': 33137, 'loss/train': 0.8930467367172241} -08/30/2021 19:13:35 - INFO - __main__ - Step 33139: {'lr': 0.00044734995604982973, 'samples': 6362688, 'steps': 33138, 'loss/train': 1.7041476964950562} -08/30/2021 19:13:36 - INFO - __main__ - Step 33140: {'lr': 0.0004473466983043335, 'samples': 6362880, 'steps': 33139, 'loss/train': 1.528459072113037} -08/30/2021 19:13:36 - INFO - __main__ - Step 33141: {'lr': 0.0004473434404699159, 'samples': 6363072, 'steps': 33140, 'loss/train': 1.6524134874343872} -08/30/2021 19:13:37 - INFO - __main__ - Step 33142: {'lr': 0.00044734018254657845, 'samples': 6363264, 'steps': 33141, 'loss/train': 1.5705945491790771} -08/30/2021 19:13:37 - INFO - __main__ - Step 33143: {'lr': 0.00044733692453432253, 'samples': 6363456, 'steps': 33142, 'loss/train': 0.06174716725945473} -08/30/2021 19:13:37 - INFO - __main__ - Step 33144: {'lr': 0.00044733366643314956, 'samples': 6363648, 'steps': 33143, 'loss/train': 1.6433777809143066} -08/30/2021 19:13:39 - INFO - __main__ - Step 33145: {'lr': 0.00044733040824306117, 'samples': 6363840, 'steps': 33144, 'loss/train': 4.694973468780518} -08/30/2021 19:13:39 - INFO - __main__ - Step 33146: {'lr': 0.00044732714996405866, 'samples': 6364032, 'steps': 33145, 'loss/train': 1.737661600112915} -08/30/2021 19:13:40 - INFO - __main__ - Step 33147: {'lr': 0.0004473238915961436, 'samples': 6364224, 'steps': 33146, 'loss/train': 1.7607970237731934} -08/30/2021 19:13:40 - INFO - __main__ - Step 33148: {'lr': 0.0004473206331393175, 'samples': 6364416, 'steps': 33147, 'loss/train': 1.1441699266433716} -08/30/2021 19:13:40 - INFO - __main__ - Step 33149: {'lr': 0.0004473173745935818, 'samples': 6364608, 'steps': 33148, 'loss/train': 1.3013454675674438} -08/30/2021 19:13:42 - INFO - __main__ - Step 33150: {'lr': 0.00044731411595893785, 'samples': 6364800, 'steps': 33149, 'loss/train': 1.5090206861495972} -08/30/2021 19:13:42 - INFO - __main__ - Step 33151: {'lr': 0.00044731085723538725, 'samples': 6364992, 'steps': 33150, 'loss/train': 0.9398083686828613} -08/30/2021 19:13:43 - INFO - __main__ - Step 33152: {'lr': 0.00044730759842293136, 'samples': 6365184, 'steps': 33151, 'loss/train': 0.03872733935713768} -08/30/2021 19:13:43 - INFO - __main__ - Step 33153: {'lr': 0.0004473043395215718, 'samples': 6365376, 'steps': 33152, 'loss/train': 1.6674392223358154} -08/30/2021 19:13:43 - INFO - __main__ - Step 33154: {'lr': 0.00044730108053130986, 'samples': 6365568, 'steps': 33153, 'loss/train': 0.07804340124130249} -08/30/2021 19:13:44 - INFO - __main__ - Step 33155: {'lr': 0.00044729782145214717, 'samples': 6365760, 'steps': 33154, 'loss/train': 1.7033551931381226} -08/30/2021 19:13:45 - INFO - __main__ - Step 33156: {'lr': 0.00044729456228408506, 'samples': 6365952, 'steps': 33155, 'loss/train': 1.7550445795059204} -08/30/2021 19:13:46 - INFO - __main__ - Step 33157: {'lr': 0.00044729130302712504, 'samples': 6366144, 'steps': 33156, 'loss/train': 1.3517141342163086} -08/30/2021 19:13:46 - INFO - __main__ - Step 33158: {'lr': 0.00044728804368126873, 'samples': 6366336, 'steps': 33157, 'loss/train': 1.6131904125213623} -08/30/2021 19:13:46 - INFO - __main__ - Step 33159: {'lr': 0.00044728478424651744, 'samples': 6366528, 'steps': 33158, 'loss/train': 1.727964162826538} -08/30/2021 19:13:47 - INFO - __main__ - Step 33160: {'lr': 0.0004472815247228726, 'samples': 6366720, 'steps': 33159, 'loss/train': 1.8815282583236694} -08/30/2021 19:13:48 - INFO - __main__ - Step 33161: {'lr': 0.00044727826511033577, 'samples': 6366912, 'steps': 33160, 'loss/train': 1.420610785484314} -08/30/2021 19:13:49 - INFO - __main__ - Step 33162: {'lr': 0.0004472750054089084, 'samples': 6367104, 'steps': 33161, 'loss/train': 1.2006685733795166} -08/30/2021 19:13:49 - INFO - __main__ - Step 33163: {'lr': 0.00044727174561859194, 'samples': 6367296, 'steps': 33162, 'loss/train': 1.788468599319458} -08/30/2021 19:13:49 - INFO - __main__ - Step 33164: {'lr': 0.00044726848573938796, 'samples': 6367488, 'steps': 33163, 'loss/train': 1.9293099641799927} -08/30/2021 19:13:50 - INFO - __main__ - Step 33165: {'lr': 0.0004472652257712978, 'samples': 6367680, 'steps': 33164, 'loss/train': 0.9755367636680603} -08/30/2021 19:13:51 - INFO - __main__ - Step 33166: {'lr': 0.0004472619657143229, 'samples': 6367872, 'steps': 33165, 'loss/train': 0.9931578636169434} -08/30/2021 19:13:52 - INFO - __main__ - Step 33167: {'lr': 0.00044725870556846495, 'samples': 6368064, 'steps': 33166, 'loss/train': 1.3051424026489258} -08/30/2021 19:13:52 - INFO - __main__ - Step 33168: {'lr': 0.00044725544533372516, 'samples': 6368256, 'steps': 33167, 'loss/train': 1.2481558322906494} -08/30/2021 19:13:52 - INFO - __main__ - Step 33169: {'lr': 0.00044725218501010514, 'samples': 6368448, 'steps': 33168, 'loss/train': 0.6757267713546753} -08/30/2021 19:13:53 - INFO - __main__ - Step 33170: {'lr': 0.0004472489245976063, 'samples': 6368640, 'steps': 33169, 'loss/train': 0.685947835445404} -08/30/2021 19:13:54 - INFO - __main__ - Step 33171: {'lr': 0.00044724566409623013, 'samples': 6368832, 'steps': 33170, 'loss/train': 1.1848844289779663} -08/30/2021 19:13:55 - INFO - __main__ - Step 33172: {'lr': 0.0004472424035059782, 'samples': 6369024, 'steps': 33171, 'loss/train': 1.8384292125701904} -08/30/2021 19:13:55 - INFO - __main__ - Step 33173: {'lr': 0.0004472391428268518, 'samples': 6369216, 'steps': 33172, 'loss/train': 1.9851698875427246} -08/30/2021 19:13:56 - INFO - __main__ - Step 33174: {'lr': 0.00044723588205885254, 'samples': 6369408, 'steps': 33173, 'loss/train': 1.1953809261322021} -08/30/2021 19:13:56 - INFO - __main__ - Step 33175: {'lr': 0.00044723262120198177, 'samples': 6369600, 'steps': 33174, 'loss/train': 0.8316321969032288} -08/30/2021 19:13:56 - INFO - __main__ - Step 33176: {'lr': 0.00044722936025624107, 'samples': 6369792, 'steps': 33175, 'loss/train': 1.3860183954238892} -08/30/2021 19:13:58 - INFO - __main__ - Step 33177: {'lr': 0.00044722609922163184, 'samples': 6369984, 'steps': 33176, 'loss/train': 1.6508485078811646} -08/30/2021 19:13:58 - INFO - __main__ - Step 33178: {'lr': 0.0004472228380981556, 'samples': 6370176, 'steps': 33177, 'loss/train': 1.204204797744751} -08/30/2021 19:13:59 - INFO - __main__ - Step 33179: {'lr': 0.0004472195768858138, 'samples': 6370368, 'steps': 33178, 'loss/train': 1.1181594133377075} -08/30/2021 19:13:59 - INFO - __main__ - Step 33180: {'lr': 0.0004472163155846078, 'samples': 6370560, 'steps': 33179, 'loss/train': 1.6790850162506104} -08/30/2021 19:13:59 - INFO - __main__ - Step 33181: {'lr': 0.0004472130541945393, 'samples': 6370752, 'steps': 33180, 'loss/train': 0.7559379935264587} -08/30/2021 19:14:01 - INFO - __main__ - Step 33182: {'lr': 0.00044720979271560963, 'samples': 6370944, 'steps': 33181, 'loss/train': 1.9271368980407715} -08/30/2021 19:14:02 - INFO - __main__ - Step 33183: {'lr': 0.00044720653114782024, 'samples': 6371136, 'steps': 33182, 'loss/train': 1.4622468948364258} -08/30/2021 19:14:02 - INFO - __main__ - Step 33184: {'lr': 0.0004472032694911726, 'samples': 6371328, 'steps': 33183, 'loss/train': 1.2617207765579224} -08/30/2021 19:14:02 - INFO - __main__ - Step 33185: {'lr': 0.0004472000077456683, 'samples': 6371520, 'steps': 33184, 'loss/train': 0.11245016753673553} -08/30/2021 19:14:03 - INFO - __main__ - Step 33186: {'lr': 0.0004471967459113086, 'samples': 6371712, 'steps': 33185, 'loss/train': 0.10119623690843582} -08/30/2021 19:14:03 - INFO - __main__ - Step 33187: {'lr': 0.0004471934839880951, 'samples': 6371904, 'steps': 33186, 'loss/train': 1.5234103202819824} -08/30/2021 19:14:05 - INFO - __main__ - Step 33188: {'lr': 0.00044719022197602933, 'samples': 6372096, 'steps': 33187, 'loss/train': 1.8250043392181396} -08/30/2021 19:14:05 - INFO - __main__ - Step 33189: {'lr': 0.0004471869598751127, 'samples': 6372288, 'steps': 33188, 'loss/train': 1.4584451913833618} -08/30/2021 19:14:05 - INFO - __main__ - Step 33190: {'lr': 0.0004471836976853466, 'samples': 6372480, 'steps': 33189, 'loss/train': 1.17582368850708} -08/30/2021 19:14:06 - INFO - __main__ - Step 33191: {'lr': 0.00044718043540673257, 'samples': 6372672, 'steps': 33190, 'loss/train': 1.610975742340088} -08/30/2021 19:14:06 - INFO - __main__ - Step 33192: {'lr': 0.0004471771730392722, 'samples': 6372864, 'steps': 33191, 'loss/train': 1.50669527053833} -08/30/2021 19:14:08 - INFO - __main__ - Step 33193: {'lr': 0.0004471739105829667, 'samples': 6373056, 'steps': 33192, 'loss/train': 1.185469150543213} -08/30/2021 19:14:08 - INFO - __main__ - Step 33194: {'lr': 0.00044717064803781773, 'samples': 6373248, 'steps': 33193, 'loss/train': 1.8157325983047485} -08/30/2021 19:14:08 - INFO - __main__ - Step 33195: {'lr': 0.00044716738540382674, 'samples': 6373440, 'steps': 33194, 'loss/train': 1.206169605255127} -08/30/2021 19:14:09 - INFO - __main__ - Step 33196: {'lr': 0.0004471641226809951, 'samples': 6373632, 'steps': 33195, 'loss/train': 1.158311128616333} -08/30/2021 19:14:09 - INFO - __main__ - Step 33197: {'lr': 0.0004471608598693244, 'samples': 6373824, 'steps': 33196, 'loss/train': 0.8852444291114807} -08/30/2021 19:14:11 - INFO - __main__ - Step 33198: {'lr': 0.000447157596968816, 'samples': 6374016, 'steps': 33197, 'loss/train': 1.7501740455627441} -08/30/2021 19:14:12 - INFO - __main__ - Step 33199: {'lr': 0.0004471543339794715, 'samples': 6374208, 'steps': 33198, 'loss/train': 1.9281806945800781} -08/30/2021 19:14:12 - INFO - __main__ - Step 33200: {'lr': 0.00044715107090129223, 'samples': 6374400, 'steps': 33199, 'loss/train': 1.703927993774414} -08/30/2021 19:14:12 - INFO - __main__ - Step 33201: {'lr': 0.00044714780773427975, 'samples': 6374592, 'steps': 33200, 'loss/train': 1.4577666521072388} -08/30/2021 19:14:13 - INFO - __main__ - Step 33202: {'lr': 0.00044714454447843555, 'samples': 6374784, 'steps': 33201, 'loss/train': 1.494301676750183} -08/30/2021 19:14:14 - INFO - __main__ - Step 33203: {'lr': 0.0004471412811337611, 'samples': 6374976, 'steps': 33202, 'loss/train': 1.0275992155075073} -08/30/2021 19:14:15 - INFO - __main__ - Step 33204: {'lr': 0.00044713801770025774, 'samples': 6375168, 'steps': 33203, 'loss/train': 1.3882516622543335} -08/30/2021 19:14:15 - INFO - __main__ - Step 33205: {'lr': 0.00044713475417792705, 'samples': 6375360, 'steps': 33204, 'loss/train': 1.3328049182891846} -08/30/2021 19:14:15 - INFO - __main__ - Step 33206: {'lr': 0.0004471314905667705, 'samples': 6375552, 'steps': 33205, 'loss/train': 0.15638910233974457} -08/30/2021 19:14:16 - INFO - __main__ - Step 33207: {'lr': 0.00044712822686678955, 'samples': 6375744, 'steps': 33206, 'loss/train': 0.6004116535186768} -08/30/2021 19:14:17 - INFO - __main__ - Step 33208: {'lr': 0.00044712496307798566, 'samples': 6375936, 'steps': 33207, 'loss/train': 1.4914157390594482} -08/30/2021 19:14:18 - INFO - __main__ - Step 33209: {'lr': 0.0004471216992003603, 'samples': 6376128, 'steps': 33208, 'loss/train': 1.911248803138733} -08/30/2021 19:14:18 - INFO - __main__ - Step 33210: {'lr': 0.0004471184352339149, 'samples': 6376320, 'steps': 33209, 'loss/train': 1.4934022426605225} -08/30/2021 19:14:18 - INFO - __main__ - Step 33211: {'lr': 0.00044711517117865105, 'samples': 6376512, 'steps': 33210, 'loss/train': 1.5583490133285522} -08/30/2021 19:14:19 - INFO - __main__ - Step 33212: {'lr': 0.00044711190703457005, 'samples': 6376704, 'steps': 33211, 'loss/train': 1.6493061780929565} -08/30/2021 19:14:20 - INFO - __main__ - Step 33213: {'lr': 0.00044710864280167353, 'samples': 6376896, 'steps': 33212, 'loss/train': 0.8273021578788757} -08/30/2021 19:14:21 - INFO - __main__ - Step 33214: {'lr': 0.0004471053784799629, 'samples': 6377088, 'steps': 33213, 'loss/train': 1.4777802228927612} -08/30/2021 19:14:21 - INFO - __main__ - Step 33215: {'lr': 0.0004471021140694396, 'samples': 6377280, 'steps': 33214, 'loss/train': 1.8512877225875854} -08/30/2021 19:14:21 - INFO - __main__ - Step 33216: {'lr': 0.0004470988495701052, 'samples': 6377472, 'steps': 33215, 'loss/train': 1.847663402557373} -08/30/2021 19:14:22 - INFO - __main__ - Step 33217: {'lr': 0.00044709558498196104, 'samples': 6377664, 'steps': 33216, 'loss/train': 1.509377121925354} -08/30/2021 19:14:24 - INFO - __main__ - Step 33218: {'lr': 0.00044709232030500865, 'samples': 6377856, 'steps': 33217, 'loss/train': 1.7002356052398682} -08/30/2021 19:14:25 - INFO - __main__ - Step 33219: {'lr': 0.0004470890555392495, 'samples': 6378048, 'steps': 33218, 'loss/train': 1.758070707321167} -08/30/2021 19:14:25 - INFO - __main__ - Step 33220: {'lr': 0.00044708579068468505, 'samples': 6378240, 'steps': 33219, 'loss/train': 0.9826855063438416} -08/30/2021 19:14:25 - INFO - __main__ - Step 33221: {'lr': 0.0004470825257413168, 'samples': 6378432, 'steps': 33220, 'loss/train': 1.587417483329773} -08/30/2021 19:14:26 - INFO - __main__ - Step 33222: {'lr': 0.00044707926070914624, 'samples': 6378624, 'steps': 33221, 'loss/train': 1.5655951499938965} -08/30/2021 19:14:26 - INFO - __main__ - Step 33223: {'lr': 0.0004470759955881748, 'samples': 6378816, 'steps': 33222, 'loss/train': 1.2147775888442993} -08/30/2021 19:14:27 - INFO - __main__ - Step 33224: {'lr': 0.0004470727303784039, 'samples': 6379008, 'steps': 33223, 'loss/train': 0.6486656069755554} -08/30/2021 19:14:27 - INFO - __main__ - Step 33225: {'lr': 0.00044706946507983513, 'samples': 6379200, 'steps': 33224, 'loss/train': 0.3323737680912018} -08/30/2021 19:14:29 - INFO - __main__ - Step 33226: {'lr': 0.00044706619969246984, 'samples': 6379392, 'steps': 33225, 'loss/train': 0.5406600832939148} -08/30/2021 19:14:29 - INFO - __main__ - Step 33227: {'lr': 0.0004470629342163096, 'samples': 6379584, 'steps': 33226, 'loss/train': 2.0734059810638428} -08/30/2021 19:14:30 - INFO - __main__ - Step 33228: {'lr': 0.00044705966865135583, 'samples': 6379776, 'steps': 33227, 'loss/train': 1.4940927028656006} -08/30/2021 19:14:30 - INFO - __main__ - Step 33229: {'lr': 0.00044705640299761004, 'samples': 6379968, 'steps': 33228, 'loss/train': 1.134113073348999} -08/30/2021 19:14:30 - INFO - __main__ - Step 33230: {'lr': 0.0004470531372550736, 'samples': 6380160, 'steps': 33229, 'loss/train': 1.7533130645751953} -08/30/2021 19:14:31 - INFO - __main__ - Step 33231: {'lr': 0.00044704987142374814, 'samples': 6380352, 'steps': 33230, 'loss/train': 1.9926685094833374} -08/30/2021 19:14:32 - INFO - __main__ - Step 33232: {'lr': 0.00044704660550363507, 'samples': 6380544, 'steps': 33231, 'loss/train': 1.6889886856079102} -08/30/2021 19:14:33 - INFO - __main__ - Step 33233: {'lr': 0.00044704333949473576, 'samples': 6380736, 'steps': 33232, 'loss/train': 1.570174217224121} -08/30/2021 19:14:33 - INFO - __main__ - Step 33234: {'lr': 0.0004470400733970518, 'samples': 6380928, 'steps': 33233, 'loss/train': 1.585200548171997} -08/30/2021 19:14:33 - INFO - __main__ - Step 33235: {'lr': 0.0004470368072105846, 'samples': 6381120, 'steps': 33234, 'loss/train': 1.4171451330184937} -08/30/2021 19:14:34 - INFO - __main__ - Step 33236: {'lr': 0.00044703354093533564, 'samples': 6381312, 'steps': 33235, 'loss/train': 1.796724796295166} -08/30/2021 19:14:35 - INFO - __main__ - Step 33237: {'lr': 0.0004470302745713065, 'samples': 6381504, 'steps': 33236, 'loss/train': 1.452254056930542} -08/30/2021 19:14:36 - INFO - __main__ - Step 33238: {'lr': 0.0004470270081184985, 'samples': 6381696, 'steps': 33237, 'loss/train': 0.17575830221176147} -08/30/2021 19:14:36 - INFO - __main__ - Step 33239: {'lr': 0.00044702374157691316, 'samples': 6381888, 'steps': 33238, 'loss/train': 1.8308111429214478} -08/30/2021 19:14:37 - INFO - __main__ - Step 33240: {'lr': 0.00044702047494655194, 'samples': 6382080, 'steps': 33239, 'loss/train': 1.3223453760147095} -08/30/2021 19:14:37 - INFO - __main__ - Step 33241: {'lr': 0.0004470172082274164, 'samples': 6382272, 'steps': 33240, 'loss/train': 1.7049347162246704} -08/30/2021 19:14:38 - INFO - __main__ - Step 33242: {'lr': 0.0004470139414195079, 'samples': 6382464, 'steps': 33241, 'loss/train': 1.6486618518829346} -08/30/2021 19:14:39 - INFO - __main__ - Step 33243: {'lr': 0.00044701067452282796, 'samples': 6382656, 'steps': 33242, 'loss/train': 1.2168083190917969} -08/30/2021 19:14:39 - INFO - __main__ - Step 33244: {'lr': 0.00044700740753737806, 'samples': 6382848, 'steps': 33243, 'loss/train': 1.190751075744629} -08/30/2021 19:14:39 - INFO - __main__ - Step 33245: {'lr': 0.0004470041404631597, 'samples': 6383040, 'steps': 33244, 'loss/train': 1.361646056175232} -08/30/2021 19:14:40 - INFO - __main__ - Step 33246: {'lr': 0.0004470008733001742, 'samples': 6383232, 'steps': 33245, 'loss/train': 1.2804499864578247} -08/30/2021 19:14:41 - INFO - __main__ - Step 33247: {'lr': 0.0004469976060484233, 'samples': 6383424, 'steps': 33246, 'loss/train': 1.667539358139038} -08/30/2021 19:14:42 - INFO - __main__ - Step 33248: {'lr': 0.00044699433870790817, 'samples': 6383616, 'steps': 33247, 'loss/train': 1.0871059894561768} -08/30/2021 19:14:42 - INFO - __main__ - Step 33249: {'lr': 0.00044699107127863056, 'samples': 6383808, 'steps': 33248, 'loss/train': 1.4582699537277222} -08/30/2021 19:14:43 - INFO - __main__ - Step 33250: {'lr': 0.0004469878037605917, 'samples': 6384000, 'steps': 33249, 'loss/train': 1.6328154802322388} -08/30/2021 19:14:43 - INFO - __main__ - Step 33251: {'lr': 0.0004469845361537933, 'samples': 6384192, 'steps': 33250, 'loss/train': 1.2056998014450073} -08/30/2021 19:14:45 - INFO - __main__ - Step 33252: {'lr': 0.0004469812684582366, 'samples': 6384384, 'steps': 33251, 'loss/train': 1.3030999898910522} -08/30/2021 19:14:45 - INFO - __main__ - Step 33253: {'lr': 0.00044697800067392327, 'samples': 6384576, 'steps': 33252, 'loss/train': 1.153661847114563} -08/30/2021 19:14:46 - INFO - __main__ - Step 33254: {'lr': 0.00044697473280085455, 'samples': 6384768, 'steps': 33253, 'loss/train': 2.4470200538635254} -08/30/2021 19:14:46 - INFO - __main__ - Step 33255: {'lr': 0.0004469714648390322, 'samples': 6384960, 'steps': 33254, 'loss/train': 1.557395100593567} -08/30/2021 19:14:46 - INFO - __main__ - Step 33256: {'lr': 0.00044696819678845744, 'samples': 6385152, 'steps': 33255, 'loss/train': 1.9589415788650513} -08/30/2021 19:14:48 - INFO - __main__ - Step 33257: {'lr': 0.000446964928649132, 'samples': 6385344, 'steps': 33256, 'loss/train': 1.4761420488357544} -08/30/2021 19:14:48 - INFO - __main__ - Step 33258: {'lr': 0.00044696166042105704, 'samples': 6385536, 'steps': 33257, 'loss/train': 2.0367982387542725} -08/30/2021 19:14:49 - INFO - __main__ - Step 33259: {'lr': 0.0004469583921042343, 'samples': 6385728, 'steps': 33258, 'loss/train': 1.4333654642105103} -08/30/2021 19:14:49 - INFO - __main__ - Step 33260: {'lr': 0.0004469551236986651, 'samples': 6385920, 'steps': 33259, 'loss/train': 1.6459969282150269} -08/30/2021 19:14:49 - INFO - __main__ - Step 33261: {'lr': 0.00044695185520435087, 'samples': 6386112, 'steps': 33260, 'loss/train': 1.6131266355514526} -08/30/2021 19:14:51 - INFO - __main__ - Step 33262: {'lr': 0.00044694858662129333, 'samples': 6386304, 'steps': 33261, 'loss/train': 1.306576132774353} -08/30/2021 19:14:52 - INFO - __main__ - Step 33263: {'lr': 0.0004469453179494938, 'samples': 6386496, 'steps': 33262, 'loss/train': 2.506016731262207} -08/30/2021 19:14:52 - INFO - __main__ - Step 33264: {'lr': 0.00044694204918895367, 'samples': 6386688, 'steps': 33263, 'loss/train': 0.9850426912307739} -08/30/2021 19:14:52 - INFO - __main__ - Step 33265: {'lr': 0.0004469387803396745, 'samples': 6386880, 'steps': 33264, 'loss/train': 1.1219128370285034} -08/30/2021 19:14:53 - INFO - __main__ - Step 33266: {'lr': 0.0004469355114016577, 'samples': 6387072, 'steps': 33265, 'loss/train': 1.5980356931686401} -08/30/2021 19:14:53 - INFO - __main__ - Step 33267: {'lr': 0.00044693224237490485, 'samples': 6387264, 'steps': 33266, 'loss/train': 0.9002454280853271} -08/30/2021 19:14:55 - INFO - __main__ - Step 33268: {'lr': 0.00044692897325941737, 'samples': 6387456, 'steps': 33267, 'loss/train': 1.5177640914916992} -08/30/2021 19:14:55 - INFO - __main__ - Step 33269: {'lr': 0.00044692570405519683, 'samples': 6387648, 'steps': 33268, 'loss/train': 1.3533560037612915} -08/30/2021 19:14:56 - INFO - __main__ - Step 33270: {'lr': 0.0004469224347622445, 'samples': 6387840, 'steps': 33269, 'loss/train': 1.006487488746643} -08/30/2021 19:14:56 - INFO - __main__ - Step 33271: {'lr': 0.000446919165380562, 'samples': 6388032, 'steps': 33270, 'loss/train': 2.077798366546631} -08/30/2021 19:14:56 - INFO - __main__ - Step 33272: {'lr': 0.0004469158959101507, 'samples': 6388224, 'steps': 33271, 'loss/train': 1.2345467805862427} -08/30/2021 19:14:58 - INFO - __main__ - Step 33273: {'lr': 0.00044691262635101223, 'samples': 6388416, 'steps': 33272, 'loss/train': 1.2836799621582031} -08/30/2021 19:14:58 - INFO - __main__ - Step 33274: {'lr': 0.0004469093567031479, 'samples': 6388608, 'steps': 33273, 'loss/train': 1.395310401916504} -08/30/2021 19:14:59 - INFO - __main__ - Step 33275: {'lr': 0.00044690608696655923, 'samples': 6388800, 'steps': 33274, 'loss/train': 1.5411368608474731} -08/30/2021 19:14:59 - INFO - __main__ - Step 33276: {'lr': 0.0004469028171412478, 'samples': 6388992, 'steps': 33275, 'loss/train': 1.7975809574127197} -08/30/2021 19:14:59 - INFO - __main__ - Step 33277: {'lr': 0.00044689954722721494, 'samples': 6389184, 'steps': 33276, 'loss/train': 1.0257220268249512} -08/30/2021 19:15:01 - INFO - __main__ - Step 33278: {'lr': 0.0004468962772244622, 'samples': 6389376, 'steps': 33277, 'loss/train': 1.6012530326843262} -08/30/2021 19:15:02 - INFO - __main__ - Step 33279: {'lr': 0.00044689300713299105, 'samples': 6389568, 'steps': 33278, 'loss/train': 1.7047499418258667} -08/30/2021 19:15:02 - INFO - __main__ - Step 33280: {'lr': 0.0004468897369528029, 'samples': 6389760, 'steps': 33279, 'loss/train': 1.1045327186584473} -08/30/2021 19:15:02 - INFO - __main__ - Step 33281: {'lr': 0.00044688646668389933, 'samples': 6389952, 'steps': 33280, 'loss/train': 1.786787509918213} -08/30/2021 19:15:03 - INFO - __main__ - Step 33282: {'lr': 0.0004468831963262817, 'samples': 6390144, 'steps': 33281, 'loss/train': 1.5973328351974487} -08/30/2021 19:15:03 - INFO - __main__ - Step 33283: {'lr': 0.00044687992587995155, 'samples': 6390336, 'steps': 33282, 'loss/train': 0.1498529613018036} -08/30/2021 19:15:03 - INFO - __main__ - Step 33284: {'lr': 0.0004468766553449104, 'samples': 6390528, 'steps': 33283, 'loss/train': 0.24845431745052338} -08/30/2021 19:15:05 - INFO - __main__ - Step 33285: {'lr': 0.00044687338472115964, 'samples': 6390720, 'steps': 33284, 'loss/train': 1.4345593452453613} -08/30/2021 19:15:06 - INFO - __main__ - Step 33286: {'lr': 0.00044687011400870074, 'samples': 6390912, 'steps': 33285, 'loss/train': 1.9823952913284302} -08/30/2021 19:15:06 - INFO - __main__ - Step 33287: {'lr': 0.00044686684320753524, 'samples': 6391104, 'steps': 33286, 'loss/train': 1.325752854347229} -08/30/2021 19:15:06 - INFO - __main__ - Step 33288: {'lr': 0.00044686357231766454, 'samples': 6391296, 'steps': 33287, 'loss/train': 1.2607601881027222} -08/30/2021 19:15:07 - INFO - __main__ - Step 33289: {'lr': 0.00044686030133909017, 'samples': 6391488, 'steps': 33288, 'loss/train': 0.15953637659549713} -08/30/2021 19:15:08 - INFO - __main__ - Step 33290: {'lr': 0.00044685703027181364, 'samples': 6391680, 'steps': 33289, 'loss/train': 1.1410908699035645} -08/30/2021 19:15:09 - INFO - __main__ - Step 33291: {'lr': 0.0004468537591158363, 'samples': 6391872, 'steps': 33290, 'loss/train': 1.593532681465149} -08/30/2021 19:15:09 - INFO - __main__ - Step 33292: {'lr': 0.0004468504878711597, 'samples': 6392064, 'steps': 33291, 'loss/train': 1.307927131652832} -08/30/2021 19:15:09 - INFO - __main__ - Step 33293: {'lr': 0.00044684721653778537, 'samples': 6392256, 'steps': 33292, 'loss/train': 1.2437483072280884} -08/30/2021 19:15:10 - INFO - __main__ - Step 33294: {'lr': 0.00044684394511571463, 'samples': 6392448, 'steps': 33293, 'loss/train': 1.0610694885253906} -08/30/2021 19:15:11 - INFO - __main__ - Step 33295: {'lr': 0.00044684067360494905, 'samples': 6392640, 'steps': 33294, 'loss/train': 1.6670525074005127} -08/30/2021 19:15:12 - INFO - __main__ - Step 33296: {'lr': 0.00044683740200549015, 'samples': 6392832, 'steps': 33295, 'loss/train': 2.364126205444336} -08/30/2021 19:15:12 - INFO - __main__ - Step 33297: {'lr': 0.00044683413031733945, 'samples': 6393024, 'steps': 33296, 'loss/train': 0.9930689930915833} -08/30/2021 19:15:13 - INFO - __main__ - Step 33298: {'lr': 0.00044683085854049814, 'samples': 6393216, 'steps': 33297, 'loss/train': 2.525376558303833} -08/30/2021 19:15:13 - INFO - __main__ - Step 33299: {'lr': 0.00044682758667496806, 'samples': 6393408, 'steps': 33298, 'loss/train': 1.4268330335617065} -08/30/2021 19:15:14 - INFO - __main__ - Step 33300: {'lr': 0.00044682431472075035, 'samples': 6393600, 'steps': 33299, 'loss/train': 1.1879383325576782} -08/30/2021 19:15:15 - INFO - __main__ - Step 33301: {'lr': 0.00044682104267784674, 'samples': 6393792, 'steps': 33300, 'loss/train': 1.0189604759216309} -08/30/2021 19:15:15 - INFO - __main__ - Step 33302: {'lr': 0.0004468177705462585, 'samples': 6393984, 'steps': 33301, 'loss/train': 1.785483956336975} -08/30/2021 19:15:16 - INFO - __main__ - Step 33303: {'lr': 0.0004468144983259873, 'samples': 6394176, 'steps': 33302, 'loss/train': 1.0390609502792358} -08/30/2021 19:15:16 - INFO - __main__ - Step 33304: {'lr': 0.0004468112260170345, 'samples': 6394368, 'steps': 33303, 'loss/train': 1.4747045040130615} -08/30/2021 19:15:16 - INFO - __main__ - Step 33305: {'lr': 0.0004468079536194016, 'samples': 6394560, 'steps': 33304, 'loss/train': 1.726773977279663} -08/30/2021 19:15:18 - INFO - __main__ - Step 33306: {'lr': 0.00044680468113309006, 'samples': 6394752, 'steps': 33305, 'loss/train': 0.07333415001630783} -08/30/2021 19:15:19 - INFO - __main__ - Step 33307: {'lr': 0.0004468014085581014, 'samples': 6394944, 'steps': 33306, 'loss/train': 1.6688435077667236} -08/30/2021 19:15:19 - INFO - __main__ - Step 33308: {'lr': 0.0004467981358944371, 'samples': 6395136, 'steps': 33307, 'loss/train': 1.917307734489441} -08/30/2021 19:15:20 - INFO - __main__ - Step 33309: {'lr': 0.0004467948631420985, 'samples': 6395328, 'steps': 33308, 'loss/train': 1.5020296573638916} -08/30/2021 19:15:20 - INFO - __main__ - Step 33310: {'lr': 0.0004467915903010872, 'samples': 6395520, 'steps': 33309, 'loss/train': 1.3082365989685059} -08/30/2021 19:15:21 - INFO - __main__ - Step 33311: {'lr': 0.0004467883173714047, 'samples': 6395712, 'steps': 33310, 'loss/train': 1.3763829469680786} -08/30/2021 19:15:22 - INFO - __main__ - Step 33312: {'lr': 0.0004467850443530523, 'samples': 6395904, 'steps': 33311, 'loss/train': 2.2396857738494873} -08/30/2021 19:15:22 - INFO - __main__ - Step 33313: {'lr': 0.0004467817712460317, 'samples': 6396096, 'steps': 33312, 'loss/train': 1.550471305847168} -08/30/2021 19:15:23 - INFO - __main__ - Step 33314: {'lr': 0.00044677849805034424, 'samples': 6396288, 'steps': 33313, 'loss/train': 0.40899306535720825} -08/30/2021 19:15:23 - INFO - __main__ - Step 33315: {'lr': 0.0004467752247659914, 'samples': 6396480, 'steps': 33314, 'loss/train': 1.336354374885559} -08/30/2021 19:15:25 - INFO - __main__ - Step 33316: {'lr': 0.00044677195139297476, 'samples': 6396672, 'steps': 33315, 'loss/train': 1.3725905418395996} -08/30/2021 19:15:25 - INFO - __main__ - Step 33317: {'lr': 0.00044676867793129574, 'samples': 6396864, 'steps': 33316, 'loss/train': 1.360742211341858} -08/30/2021 19:15:26 - INFO - __main__ - Step 33318: {'lr': 0.00044676540438095565, 'samples': 6397056, 'steps': 33317, 'loss/train': 1.090036153793335} -08/30/2021 19:15:26 - INFO - __main__ - Step 33319: {'lr': 0.0004467621307419562, 'samples': 6397248, 'steps': 33318, 'loss/train': 0.1322993040084839} -08/30/2021 19:15:26 - INFO - __main__ - Step 33320: {'lr': 0.00044675885701429873, 'samples': 6397440, 'steps': 33319, 'loss/train': 0.9064639210700989} -08/30/2021 19:15:27 - INFO - __main__ - Step 33321: {'lr': 0.00044675558319798477, 'samples': 6397632, 'steps': 33320, 'loss/train': 1.3307347297668457} -08/30/2021 19:15:28 - INFO - __main__ - Step 33322: {'lr': 0.00044675230929301575, 'samples': 6397824, 'steps': 33321, 'loss/train': 0.08482823520898819} -08/30/2021 19:15:29 - INFO - __main__ - Step 33323: {'lr': 0.0004467490352993932, 'samples': 6398016, 'steps': 33322, 'loss/train': 1.1504961252212524} -08/30/2021 19:15:29 - INFO - __main__ - Step 33324: {'lr': 0.00044674576121711855, 'samples': 6398208, 'steps': 33323, 'loss/train': 1.6718014478683472} -08/30/2021 19:15:29 - INFO - __main__ - Step 33325: {'lr': 0.00044674248704619333, 'samples': 6398400, 'steps': 33324, 'loss/train': 1.4017398357391357} -08/30/2021 19:15:30 - INFO - __main__ - Step 33326: {'lr': 0.000446739212786619, 'samples': 6398592, 'steps': 33325, 'loss/train': 1.4466516971588135} -08/30/2021 19:15:32 - INFO - __main__ - Step 33327: {'lr': 0.000446735938438397, 'samples': 6398784, 'steps': 33326, 'loss/train': 1.4872729778289795} -08/30/2021 19:15:32 - INFO - __main__ - Step 33328: {'lr': 0.0004467326640015288, 'samples': 6398976, 'steps': 33327, 'loss/train': 1.0688589811325073} -08/30/2021 19:15:32 - INFO - __main__ - Step 33329: {'lr': 0.00044672938947601593, 'samples': 6399168, 'steps': 33328, 'loss/train': 1.420457124710083} -08/30/2021 19:15:33 - INFO - __main__ - Step 33330: {'lr': 0.00044672611486185976, 'samples': 6399360, 'steps': 33329, 'loss/train': 0.26510173082351685} -08/30/2021 19:15:33 - INFO - __main__ - Step 33331: {'lr': 0.0004467228401590619, 'samples': 6399552, 'steps': 33330, 'loss/train': 0.49148648977279663} -08/30/2021 19:15:33 - INFO - __main__ - Step 33332: {'lr': 0.00044671956536762375, 'samples': 6399744, 'steps': 33331, 'loss/train': 1.4820618629455566} -08/30/2021 19:15:35 - INFO - __main__ - Step 33333: {'lr': 0.00044671629048754683, 'samples': 6399936, 'steps': 33332, 'loss/train': 1.438414216041565} -08/30/2021 19:15:35 - INFO - __main__ - Step 33334: {'lr': 0.00044671301551883253, 'samples': 6400128, 'steps': 33333, 'loss/train': 1.1546604633331299} -08/30/2021 19:15:36 - INFO - __main__ - Step 33335: {'lr': 0.0004467097404614824, 'samples': 6400320, 'steps': 33334, 'loss/train': 1.3472340106964111} -08/30/2021 19:15:36 - INFO - __main__ - Step 33336: {'lr': 0.0004467064653154979, 'samples': 6400512, 'steps': 33335, 'loss/train': 1.4244062900543213} -08/30/2021 19:15:36 - INFO - __main__ - Step 33337: {'lr': 0.0004467031900808805, 'samples': 6400704, 'steps': 33336, 'loss/train': 1.1101934909820557} -08/30/2021 19:15:38 - INFO - __main__ - Step 33338: {'lr': 0.00044669991475763173, 'samples': 6400896, 'steps': 33337, 'loss/train': 1.6133058071136475} -08/30/2021 19:15:39 - INFO - __main__ - Step 33339: {'lr': 0.00044669663934575294, 'samples': 6401088, 'steps': 33338, 'loss/train': 0.6731969118118286} -08/30/2021 19:15:39 - INFO - __main__ - Step 33340: {'lr': 0.0004466933638452457, 'samples': 6401280, 'steps': 33339, 'loss/train': 1.2125256061553955} -08/30/2021 19:15:39 - INFO - __main__ - Step 33341: {'lr': 0.0004466900882561115, 'samples': 6401472, 'steps': 33340, 'loss/train': 1.2524387836456299} -08/30/2021 19:15:40 - INFO - __main__ - Step 33342: {'lr': 0.00044668681257835173, 'samples': 6401664, 'steps': 33341, 'loss/train': 1.8785761594772339} -08/30/2021 19:15:41 - INFO - __main__ - Step 33343: {'lr': 0.00044668353681196794, 'samples': 6401856, 'steps': 33342, 'loss/train': 1.8011149168014526} -08/30/2021 19:15:42 - INFO - __main__ - Step 33344: {'lr': 0.0004466802609569616, 'samples': 6402048, 'steps': 33343, 'loss/train': 1.8663297891616821} -08/30/2021 19:15:42 - INFO - __main__ - Step 33345: {'lr': 0.00044667698501333415, 'samples': 6402240, 'steps': 33344, 'loss/train': 1.5840978622436523} -08/30/2021 19:15:42 - INFO - __main__ - Step 33346: {'lr': 0.0004466737089810871, 'samples': 6402432, 'steps': 33345, 'loss/train': 1.02379310131073} -08/30/2021 19:15:43 - INFO - __main__ - Step 33347: {'lr': 0.00044667043286022193, 'samples': 6402624, 'steps': 33346, 'loss/train': 1.5514895915985107} -08/30/2021 19:15:45 - INFO - __main__ - Step 33348: {'lr': 0.00044666715665074, 'samples': 6402816, 'steps': 33347, 'loss/train': 2.2234818935394287} -08/30/2021 19:15:46 - INFO - __main__ - Step 33349: {'lr': 0.0004466638803526429, 'samples': 6403008, 'steps': 33348, 'loss/train': 1.400463342666626} -08/30/2021 19:15:46 - INFO - __main__ - Step 33350: {'lr': 0.0004466606039659322, 'samples': 6403200, 'steps': 33349, 'loss/train': 1.4251716136932373} -08/30/2021 19:15:46 - INFO - __main__ - Step 33351: {'lr': 0.0004466573274906092, 'samples': 6403392, 'steps': 33350, 'loss/train': 1.7673977613449097} -08/30/2021 19:15:47 - INFO - __main__ - Step 33352: {'lr': 0.0004466540509266754, 'samples': 6403584, 'steps': 33351, 'loss/train': 1.280025601387024} -08/30/2021 19:15:47 - INFO - __main__ - Step 33353: {'lr': 0.0004466507742741325, 'samples': 6403776, 'steps': 33352, 'loss/train': 3.522418975830078} -08/30/2021 19:15:47 - INFO - __main__ - Step 33354: {'lr': 0.0004466474975329816, 'samples': 6403968, 'steps': 33353, 'loss/train': 3.0891058444976807} -08/30/2021 19:15:49 - INFO - __main__ - Step 33355: {'lr': 0.0004466442207032244, 'samples': 6404160, 'steps': 33354, 'loss/train': 1.6727930307388306} -08/30/2021 19:15:49 - INFO - __main__ - Step 33356: {'lr': 0.00044664094378486243, 'samples': 6404352, 'steps': 33355, 'loss/train': 1.574659824371338} -08/30/2021 19:15:50 - INFO - __main__ - Step 33357: {'lr': 0.00044663766677789706, 'samples': 6404544, 'steps': 33356, 'loss/train': 1.6382181644439697} -08/30/2021 19:15:50 - INFO - __main__ - Step 33358: {'lr': 0.0004466343896823297, 'samples': 6404736, 'steps': 33357, 'loss/train': 1.435111403465271} -08/30/2021 19:15:50 - INFO - __main__ - Step 33359: {'lr': 0.000446631112498162, 'samples': 6404928, 'steps': 33358, 'loss/train': 1.0055221319198608} -08/30/2021 19:15:52 - INFO - __main__ - Step 33360: {'lr': 0.0004466278352253954, 'samples': 6405120, 'steps': 33359, 'loss/train': 1.7547920942306519} -08/30/2021 19:15:52 - INFO - __main__ - Step 33361: {'lr': 0.00044662455786403124, 'samples': 6405312, 'steps': 33360, 'loss/train': 1.5736093521118164} -08/30/2021 19:15:53 - INFO - __main__ - Step 33362: {'lr': 0.0004466212804140711, 'samples': 6405504, 'steps': 33361, 'loss/train': 0.19409291446208954} -08/30/2021 19:15:53 - INFO - __main__ - Step 33363: {'lr': 0.00044661800287551653, 'samples': 6405696, 'steps': 33362, 'loss/train': 0.8882451057434082} -08/30/2021 19:15:53 - INFO - __main__ - Step 33364: {'lr': 0.00044661472524836886, 'samples': 6405888, 'steps': 33363, 'loss/train': 1.423277497291565} -08/30/2021 19:15:55 - INFO - __main__ - Step 33365: {'lr': 0.00044661144753262963, 'samples': 6406080, 'steps': 33364, 'loss/train': 1.437907338142395} -08/30/2021 19:15:56 - INFO - __main__ - Step 33366: {'lr': 0.0004466081697283003, 'samples': 6406272, 'steps': 33365, 'loss/train': 2.14711856842041} -08/30/2021 19:15:56 - INFO - __main__ - Step 33367: {'lr': 0.00044660489183538237, 'samples': 6406464, 'steps': 33366, 'loss/train': 1.8020535707473755} -08/30/2021 19:15:57 - INFO - __main__ - Step 33368: {'lr': 0.0004466016138538773, 'samples': 6406656, 'steps': 33367, 'loss/train': 1.4772429466247559} -08/30/2021 19:15:57 - INFO - __main__ - Step 33369: {'lr': 0.0004465983357837866, 'samples': 6406848, 'steps': 33368, 'loss/train': 0.9149893522262573} -08/30/2021 19:15:57 - INFO - __main__ - Step 33370: {'lr': 0.00044659505762511176, 'samples': 6407040, 'steps': 33369, 'loss/train': 1.0663551092147827} -08/30/2021 19:15:59 - INFO - __main__ - Step 33371: {'lr': 0.00044659177937785417, 'samples': 6407232, 'steps': 33370, 'loss/train': 1.4070308208465576} -08/30/2021 19:15:59 - INFO - __main__ - Step 33372: {'lr': 0.0004465885010420154, 'samples': 6407424, 'steps': 33371, 'loss/train': 1.8669415712356567} -08/30/2021 19:16:00 - INFO - __main__ - Step 33373: {'lr': 0.0004465852226175968, 'samples': 6407616, 'steps': 33372, 'loss/train': 1.2759586572647095} -08/30/2021 19:16:00 - INFO - __main__ - Step 33374: {'lr': 0.00044658194410460004, 'samples': 6407808, 'steps': 33373, 'loss/train': 0.9852572083473206} -08/30/2021 19:16:00 - INFO - __main__ - Step 33375: {'lr': 0.0004465786655030264, 'samples': 6408000, 'steps': 33374, 'loss/train': 1.6221834421157837} -08/30/2021 19:16:02 - INFO - __main__ - Step 33376: {'lr': 0.00044657538681287746, 'samples': 6408192, 'steps': 33375, 'loss/train': 1.563546061515808} -08/30/2021 19:16:02 - INFO - __main__ - Step 33377: {'lr': 0.0004465721080341547, 'samples': 6408384, 'steps': 33376, 'loss/train': 1.5885995626449585} -08/30/2021 19:16:03 - INFO - __main__ - Step 33378: {'lr': 0.0004465688291668596, 'samples': 6408576, 'steps': 33377, 'loss/train': 1.658616304397583} -08/30/2021 19:16:03 - INFO - __main__ - Step 33379: {'lr': 0.00044656555021099363, 'samples': 6408768, 'steps': 33378, 'loss/train': 1.3255548477172852} -08/30/2021 19:16:03 - INFO - __main__ - Step 33380: {'lr': 0.00044656227116655824, 'samples': 6408960, 'steps': 33379, 'loss/train': 1.3153778314590454} -08/30/2021 19:16:05 - INFO - __main__ - Step 33381: {'lr': 0.00044655899203355486, 'samples': 6409152, 'steps': 33380, 'loss/train': 1.401679515838623} -08/30/2021 19:16:05 - INFO - __main__ - Step 33382: {'lr': 0.0004465557128119852, 'samples': 6409344, 'steps': 33381, 'loss/train': 1.3784312009811401} -08/30/2021 19:16:06 - INFO - __main__ - Step 33383: {'lr': 0.00044655243350185037, 'samples': 6409536, 'steps': 33382, 'loss/train': 1.7505137920379639} -08/30/2021 19:16:06 - INFO - __main__ - Step 33384: {'lr': 0.0004465491541031522, 'samples': 6409728, 'steps': 33383, 'loss/train': 1.6893738508224487} -08/30/2021 19:16:06 - INFO - __main__ - Step 33385: {'lr': 0.00044654587461589193, 'samples': 6409920, 'steps': 33384, 'loss/train': 1.365661859512329} -08/30/2021 19:16:08 - INFO - __main__ - Step 33386: {'lr': 0.0004465425950400711, 'samples': 6410112, 'steps': 33385, 'loss/train': 2.1446902751922607} -08/30/2021 19:16:08 - INFO - __main__ - Step 33387: {'lr': 0.00044653931537569125, 'samples': 6410304, 'steps': 33386, 'loss/train': 2.165961742401123} -08/30/2021 19:16:09 - INFO - __main__ - Step 33388: {'lr': 0.0004465360356227538, 'samples': 6410496, 'steps': 33387, 'loss/train': 1.543939232826233} -08/30/2021 19:16:09 - INFO - __main__ - Step 33389: {'lr': 0.0004465327557812603, 'samples': 6410688, 'steps': 33388, 'loss/train': 1.596062183380127} -08/30/2021 19:16:09 - INFO - __main__ - Step 33390: {'lr': 0.0004465294758512121, 'samples': 6410880, 'steps': 33389, 'loss/train': 1.463299036026001} -08/30/2021 19:16:11 - INFO - __main__ - Step 33391: {'lr': 0.0004465261958326108, 'samples': 6411072, 'steps': 33390, 'loss/train': 0.7451184391975403} -08/30/2021 19:16:11 - INFO - __main__ - Step 33392: {'lr': 0.0004465229157254578, 'samples': 6411264, 'steps': 33391, 'loss/train': 1.6218186616897583} -08/30/2021 19:16:12 - INFO - __main__ - Step 33393: {'lr': 0.0004465196355297546, 'samples': 6411456, 'steps': 33392, 'loss/train': 0.9780051708221436} -08/30/2021 19:16:12 - INFO - __main__ - Step 33394: {'lr': 0.0004465163552455027, 'samples': 6411648, 'steps': 33393, 'loss/train': 1.819261908531189} -08/30/2021 19:16:12 - INFO - __main__ - Step 33395: {'lr': 0.0004465130748727036, 'samples': 6411840, 'steps': 33394, 'loss/train': 2.0825252532958984} -08/30/2021 19:16:14 - INFO - __main__ - Step 33396: {'lr': 0.0004465097944113587, 'samples': 6412032, 'steps': 33395, 'loss/train': 1.670664668083191} -08/30/2021 19:16:14 - INFO - __main__ - Step 33397: {'lr': 0.00044650651386146954, 'samples': 6412224, 'steps': 33396, 'loss/train': 2.0088019371032715} -08/30/2021 19:16:15 - INFO - __main__ - Step 33398: {'lr': 0.00044650323322303757, 'samples': 6412416, 'steps': 33397, 'loss/train': 0.9385988116264343} -08/30/2021 19:16:15 - INFO - __main__ - Step 33399: {'lr': 0.0004464999524960642, 'samples': 6412608, 'steps': 33398, 'loss/train': 1.6312021017074585} -08/30/2021 19:16:15 - INFO - __main__ - Step 33400: {'lr': 0.0004464966716805511, 'samples': 6412800, 'steps': 33399, 'loss/train': 1.5122473239898682} -08/30/2021 19:16:17 - INFO - __main__ - Step 33401: {'lr': 0.0004464933907764996, 'samples': 6412992, 'steps': 33400, 'loss/train': 1.7289127111434937} -08/30/2021 19:16:17 - INFO - __main__ - Step 33402: {'lr': 0.0004464901097839112, 'samples': 6413184, 'steps': 33401, 'loss/train': 1.416804313659668} -08/30/2021 19:16:18 - INFO - __main__ - Step 33403: {'lr': 0.00044648682870278733, 'samples': 6413376, 'steps': 33402, 'loss/train': 1.2345597743988037} -08/30/2021 19:16:18 - INFO - __main__ - Step 33404: {'lr': 0.0004464835475331296, 'samples': 6413568, 'steps': 33403, 'loss/train': 1.0464625358581543} -08/30/2021 19:16:18 - INFO - __main__ - Step 33405: {'lr': 0.0004464802662749394, 'samples': 6413760, 'steps': 33404, 'loss/train': 1.4701182842254639} -08/30/2021 19:16:19 - INFO - __main__ - Step 33406: {'lr': 0.00044647698492821826, 'samples': 6413952, 'steps': 33405, 'loss/train': 1.5553449392318726} -08/30/2021 19:16:21 - INFO - __main__ - Step 33407: {'lr': 0.00044647370349296757, 'samples': 6414144, 'steps': 33406, 'loss/train': 2.0070667266845703} -08/30/2021 19:16:21 - INFO - __main__ - Step 33408: {'lr': 0.00044647042196918884, 'samples': 6414336, 'steps': 33407, 'loss/train': 1.4474754333496094} -08/30/2021 19:16:21 - INFO - __main__ - Step 33409: {'lr': 0.00044646714035688365, 'samples': 6414528, 'steps': 33408, 'loss/train': 1.617448091506958} -08/30/2021 19:16:22 - INFO - __main__ - Step 33410: {'lr': 0.00044646385865605335, 'samples': 6414720, 'steps': 33409, 'loss/train': 0.08607909083366394} -08/30/2021 19:16:22 - INFO - __main__ - Step 33411: {'lr': 0.0004464605768666995, 'samples': 6414912, 'steps': 33410, 'loss/train': 1.1770544052124023} -08/30/2021 19:16:22 - INFO - __main__ - Step 33412: {'lr': 0.0004464572949888235, 'samples': 6415104, 'steps': 33411, 'loss/train': 1.3189491033554077} -08/30/2021 19:16:24 - INFO - __main__ - Step 33413: {'lr': 0.0004464540130224268, 'samples': 6415296, 'steps': 33412, 'loss/train': 2.448939800262451} -08/30/2021 19:16:24 - INFO - __main__ - Step 33414: {'lr': 0.0004464507309675111, 'samples': 6415488, 'steps': 33413, 'loss/train': 0.8867089152336121} -08/30/2021 19:16:25 - INFO - __main__ - Step 33415: {'lr': 0.00044644744882407767, 'samples': 6415680, 'steps': 33414, 'loss/train': 1.3510990142822266} -08/30/2021 19:16:25 - INFO - __main__ - Step 33416: {'lr': 0.00044644416659212806, 'samples': 6415872, 'steps': 33415, 'loss/train': 1.515901803970337} -08/30/2021 19:16:25 - INFO - __main__ - Step 33417: {'lr': 0.00044644088427166375, 'samples': 6416064, 'steps': 33416, 'loss/train': 1.6699684858322144} -08/30/2021 19:16:27 - INFO - __main__ - Step 33418: {'lr': 0.00044643760186268615, 'samples': 6416256, 'steps': 33417, 'loss/train': 1.7504702806472778} -08/30/2021 19:16:28 - INFO - __main__ - Step 33419: {'lr': 0.00044643431936519683, 'samples': 6416448, 'steps': 33418, 'loss/train': 0.22187237441539764} -08/30/2021 19:16:28 - INFO - __main__ - Step 33420: {'lr': 0.00044643103677919726, 'samples': 6416640, 'steps': 33419, 'loss/train': 1.1697900295257568} -08/30/2021 19:16:29 - INFO - __main__ - Step 33421: {'lr': 0.00044642775410468896, 'samples': 6416832, 'steps': 33420, 'loss/train': 1.303484320640564} -08/30/2021 19:16:29 - INFO - __main__ - Step 33422: {'lr': 0.00044642447134167316, 'samples': 6417024, 'steps': 33421, 'loss/train': 1.6225663423538208} -08/30/2021 19:16:30 - INFO - __main__ - Step 33423: {'lr': 0.00044642118849015167, 'samples': 6417216, 'steps': 33422, 'loss/train': 1.4180470705032349} -08/30/2021 19:16:31 - INFO - __main__ - Step 33424: {'lr': 0.0004464179055501258, 'samples': 6417408, 'steps': 33423, 'loss/train': 1.0804719924926758} -08/30/2021 19:16:31 - INFO - __main__ - Step 33425: {'lr': 0.00044641462252159705, 'samples': 6417600, 'steps': 33424, 'loss/train': 1.3525092601776123} -08/30/2021 19:16:32 - INFO - __main__ - Step 33426: {'lr': 0.0004464113394045669, 'samples': 6417792, 'steps': 33425, 'loss/train': 1.0800803899765015} -08/30/2021 19:16:32 - INFO - __main__ - Step 33427: {'lr': 0.00044640805619903677, 'samples': 6417984, 'steps': 33426, 'loss/train': 1.8649523258209229} -08/30/2021 19:16:33 - INFO - __main__ - Step 33428: {'lr': 0.00044640477290500824, 'samples': 6418176, 'steps': 33427, 'loss/train': 1.5345628261566162} -08/30/2021 19:16:34 - INFO - __main__ - Step 33429: {'lr': 0.00044640148952248285, 'samples': 6418368, 'steps': 33428, 'loss/train': 1.6082801818847656} -08/30/2021 19:16:34 - INFO - __main__ - Step 33430: {'lr': 0.00044639820605146184, 'samples': 6418560, 'steps': 33429, 'loss/train': 0.3826752007007599} -08/30/2021 19:16:35 - INFO - __main__ - Step 33431: {'lr': 0.0004463949224919469, 'samples': 6418752, 'steps': 33430, 'loss/train': 1.5160101652145386} -08/30/2021 19:16:35 - INFO - __main__ - Step 33432: {'lr': 0.0004463916388439394, 'samples': 6418944, 'steps': 33431, 'loss/train': 1.416867733001709} -08/30/2021 19:16:37 - INFO - __main__ - Step 33433: {'lr': 0.00044638835510744094, 'samples': 6419136, 'steps': 33432, 'loss/train': 1.493934154510498} -08/30/2021 19:16:37 - INFO - __main__ - Step 33434: {'lr': 0.0004463850712824528, 'samples': 6419328, 'steps': 33433, 'loss/train': 1.8534473180770874} -08/30/2021 19:16:37 - INFO - __main__ - Step 33435: {'lr': 0.0004463817873689766, 'samples': 6419520, 'steps': 33434, 'loss/train': 0.8413693904876709} -08/30/2021 19:16:38 - INFO - __main__ - Step 33436: {'lr': 0.00044637850336701386, 'samples': 6419712, 'steps': 33435, 'loss/train': 1.0658906698226929} -08/30/2021 19:16:38 - INFO - __main__ - Step 33437: {'lr': 0.000446375219276566, 'samples': 6419904, 'steps': 33436, 'loss/train': 1.5574675798416138} -08/30/2021 19:16:40 - INFO - __main__ - Step 33438: {'lr': 0.0004463719350976344, 'samples': 6420096, 'steps': 33437, 'loss/train': 1.6721071004867554} -08/30/2021 19:16:40 - INFO - __main__ - Step 33439: {'lr': 0.0004463686508302207, 'samples': 6420288, 'steps': 33438, 'loss/train': 2.0010766983032227} -08/30/2021 19:16:41 - INFO - __main__ - Step 33440: {'lr': 0.00044636536647432636, 'samples': 6420480, 'steps': 33439, 'loss/train': 1.5309076309204102} -08/30/2021 19:16:41 - INFO - __main__ - Step 33441: {'lr': 0.00044636208202995277, 'samples': 6420672, 'steps': 33440, 'loss/train': 1.2251158952713013} -08/30/2021 19:16:41 - INFO - __main__ - Step 33442: {'lr': 0.0004463587974971014, 'samples': 6420864, 'steps': 33441, 'loss/train': 1.3289397954940796} -08/30/2021 19:16:43 - INFO - __main__ - Step 33443: {'lr': 0.0004463555128757739, 'samples': 6421056, 'steps': 33442, 'loss/train': 1.108396291732788} -08/30/2021 19:16:43 - INFO - __main__ - Step 33444: {'lr': 0.00044635222816597153, 'samples': 6421248, 'steps': 33443, 'loss/train': 1.6361125707626343} -08/30/2021 19:16:44 - INFO - __main__ - Step 33445: {'lr': 0.0004463489433676959, 'samples': 6421440, 'steps': 33444, 'loss/train': 1.3167794942855835} -08/30/2021 19:16:44 - INFO - __main__ - Step 33446: {'lr': 0.00044634565848094854, 'samples': 6421632, 'steps': 33445, 'loss/train': 1.4385465383529663} -08/30/2021 19:16:44 - INFO - __main__ - Step 33447: {'lr': 0.0004463423735057308, 'samples': 6421824, 'steps': 33446, 'loss/train': 1.1506036520004272} -08/30/2021 19:16:46 - INFO - __main__ - Step 33448: {'lr': 0.00044633908844204424, 'samples': 6422016, 'steps': 33447, 'loss/train': 2.2047119140625} -08/30/2021 19:16:46 - INFO - __main__ - Step 33449: {'lr': 0.0004463358032898903, 'samples': 6422208, 'steps': 33448, 'loss/train': 2.0550198554992676} -08/30/2021 19:16:47 - INFO - __main__ - Step 33450: {'lr': 0.00044633251804927044, 'samples': 6422400, 'steps': 33449, 'loss/train': 2.321042537689209} -08/30/2021 19:16:47 - INFO - __main__ - Step 33451: {'lr': 0.0004463292327201862, 'samples': 6422592, 'steps': 33450, 'loss/train': 1.3362419605255127} -08/30/2021 19:16:47 - INFO - __main__ - Step 33452: {'lr': 0.0004463259473026391, 'samples': 6422784, 'steps': 33451, 'loss/train': 1.324425458908081} -08/30/2021 19:16:48 - INFO - __main__ - Step 33453: {'lr': 0.0004463226617966305, 'samples': 6422976, 'steps': 33452, 'loss/train': 1.8268342018127441} -08/30/2021 19:16:49 - INFO - __main__ - Step 33454: {'lr': 0.00044631937620216196, 'samples': 6423168, 'steps': 33453, 'loss/train': 0.6967935562133789} -08/30/2021 19:16:50 - INFO - __main__ - Step 33455: {'lr': 0.00044631609051923494, 'samples': 6423360, 'steps': 33454, 'loss/train': 1.1998844146728516} -08/30/2021 19:16:50 - INFO - __main__ - Step 33456: {'lr': 0.00044631280474785086, 'samples': 6423552, 'steps': 33455, 'loss/train': 1.1822856664657593} -08/30/2021 19:16:50 - INFO - __main__ - Step 33457: {'lr': 0.0004463095188880113, 'samples': 6423744, 'steps': 33456, 'loss/train': 1.3683770895004272} -08/30/2021 19:16:51 - INFO - __main__ - Step 33458: {'lr': 0.00044630623293971775, 'samples': 6423936, 'steps': 33457, 'loss/train': 1.5302542448043823} -08/30/2021 19:16:52 - INFO - __main__ - Step 33459: {'lr': 0.0004463029469029716, 'samples': 6424128, 'steps': 33458, 'loss/train': 1.4877132177352905} -08/30/2021 19:16:53 - INFO - __main__ - Step 33460: {'lr': 0.0004462996607777743, 'samples': 6424320, 'steps': 33459, 'loss/train': 1.5018351078033447} -08/30/2021 19:16:53 - INFO - __main__ - Step 33461: {'lr': 0.00044629637456412754, 'samples': 6424512, 'steps': 33460, 'loss/train': 1.179540991783142} -08/30/2021 19:16:53 - INFO - __main__ - Step 33462: {'lr': 0.0004462930882620325, 'samples': 6424704, 'steps': 33461, 'loss/train': 1.7101011276245117} -08/30/2021 19:16:54 - INFO - __main__ - Step 33463: {'lr': 0.0004462898018714909, 'samples': 6424896, 'steps': 33462, 'loss/train': 1.0568920373916626} -08/30/2021 19:16:55 - INFO - __main__ - Step 33464: {'lr': 0.0004462865153925042, 'samples': 6425088, 'steps': 33463, 'loss/train': 1.4088925123214722} -08/30/2021 19:16:56 - INFO - __main__ - Step 33465: {'lr': 0.00044628322882507375, 'samples': 6425280, 'steps': 33464, 'loss/train': 1.9408656358718872} -08/30/2021 19:16:56 - INFO - __main__ - Step 33466: {'lr': 0.0004462799421692012, 'samples': 6425472, 'steps': 33465, 'loss/train': 1.1031192541122437} -08/30/2021 19:16:56 - INFO - __main__ - Step 33467: {'lr': 0.0004462766554248878, 'samples': 6425664, 'steps': 33466, 'loss/train': 1.4469138383865356} -08/30/2021 19:16:57 - INFO - __main__ - Step 33468: {'lr': 0.0004462733685921353, 'samples': 6425856, 'steps': 33467, 'loss/train': 1.2693172693252563} -08/30/2021 19:16:59 - INFO - __main__ - Step 33469: {'lr': 0.000446270081670945, 'samples': 6426048, 'steps': 33468, 'loss/train': 1.5170141458511353} -08/30/2021 19:17:00 - INFO - __main__ - Step 33470: {'lr': 0.0004462667946613184, 'samples': 6426240, 'steps': 33469, 'loss/train': 1.2980009317398071} -08/30/2021 19:17:00 - INFO - __main__ - Step 33471: {'lr': 0.00044626350756325707, 'samples': 6426432, 'steps': 33470, 'loss/train': 1.7524052858352661} -08/30/2021 19:17:00 - INFO - __main__ - Step 33472: {'lr': 0.0004462602203767624, 'samples': 6426624, 'steps': 33471, 'loss/train': 5.986457824707031} -08/30/2021 19:17:01 - INFO - __main__ - Step 33473: {'lr': 0.0004462569331018359, 'samples': 6426816, 'steps': 33472, 'loss/train': 5.9101128578186035} -08/30/2021 19:17:01 - INFO - __main__ - Step 33474: {'lr': 0.00044625364573847904, 'samples': 6427008, 'steps': 33473, 'loss/train': 1.7787965536117554} -08/30/2021 19:17:03 - INFO - __main__ - Step 33475: {'lr': 0.0004462503582866933, 'samples': 6427200, 'steps': 33474, 'loss/train': 1.9519734382629395} -08/30/2021 19:17:03 - INFO - __main__ - Step 33476: {'lr': 0.00044624707074648017, 'samples': 6427392, 'steps': 33475, 'loss/train': 1.2446976900100708} -08/30/2021 19:17:03 - INFO - __main__ - Step 33477: {'lr': 0.0004462437831178412, 'samples': 6427584, 'steps': 33476, 'loss/train': 1.5538004636764526} -08/30/2021 19:17:04 - INFO - __main__ - Step 33478: {'lr': 0.00044624049540077784, 'samples': 6427776, 'steps': 33477, 'loss/train': 1.4938383102416992} -08/30/2021 19:17:04 - INFO - __main__ - Step 33479: {'lr': 0.0004462372075952914, 'samples': 6427968, 'steps': 33478, 'loss/train': 1.6635462045669556} -08/30/2021 19:17:04 - INFO - __main__ - Step 33480: {'lr': 0.0004462339197013836, 'samples': 6428160, 'steps': 33479, 'loss/train': 1.6248817443847656} -08/30/2021 19:17:06 - INFO - __main__ - Step 33481: {'lr': 0.00044623063171905585, 'samples': 6428352, 'steps': 33480, 'loss/train': 1.0170185565948486} -08/30/2021 19:17:07 - INFO - __main__ - Step 33482: {'lr': 0.0004462273436483095, 'samples': 6428544, 'steps': 33481, 'loss/train': 1.661685585975647} -08/30/2021 19:17:07 - INFO - __main__ - Step 33483: {'lr': 0.00044622405548914627, 'samples': 6428736, 'steps': 33482, 'loss/train': 0.83110511302948} -08/30/2021 19:17:07 - INFO - __main__ - Step 33484: {'lr': 0.00044622076724156747, 'samples': 6428928, 'steps': 33483, 'loss/train': 1.1491162776947021} -08/30/2021 19:17:08 - INFO - __main__ - Step 33485: {'lr': 0.00044621747890557454, 'samples': 6429120, 'steps': 33484, 'loss/train': 0.08648316562175751} -08/30/2021 19:17:09 - INFO - __main__ - Step 33486: {'lr': 0.0004462141904811691, 'samples': 6429312, 'steps': 33485, 'loss/train': 1.4600337743759155} -08/30/2021 19:17:10 - INFO - __main__ - Step 33487: {'lr': 0.00044621090196835254, 'samples': 6429504, 'steps': 33486, 'loss/train': 2.0368728637695312} -08/30/2021 19:17:10 - INFO - __main__ - Step 33488: {'lr': 0.00044620761336712646, 'samples': 6429696, 'steps': 33487, 'loss/train': 2.0213589668273926} -08/30/2021 19:17:10 - INFO - __main__ - Step 33489: {'lr': 0.00044620432467749215, 'samples': 6429888, 'steps': 33488, 'loss/train': 1.6966632604599} -08/30/2021 19:17:11 - INFO - __main__ - Step 33490: {'lr': 0.0004462010358994513, 'samples': 6430080, 'steps': 33489, 'loss/train': 1.3306323289871216} -08/30/2021 19:17:12 - INFO - __main__ - Step 33491: {'lr': 0.0004461977470330052, 'samples': 6430272, 'steps': 33490, 'loss/train': 1.3611665964126587} -08/30/2021 19:17:13 - INFO - __main__ - Step 33492: {'lr': 0.00044619445807815545, 'samples': 6430464, 'steps': 33491, 'loss/train': 1.854926347732544} -08/30/2021 19:17:13 - INFO - __main__ - Step 33493: {'lr': 0.00044619116903490356, 'samples': 6430656, 'steps': 33492, 'loss/train': 0.38408511877059937} -08/30/2021 19:17:13 - INFO - __main__ - Step 33494: {'lr': 0.00044618787990325086, 'samples': 6430848, 'steps': 33493, 'loss/train': 1.6721330881118774} -08/30/2021 19:17:14 - INFO - __main__ - Step 33495: {'lr': 0.000446184590683199, 'samples': 6431040, 'steps': 33494, 'loss/train': 1.2868119478225708} -08/30/2021 19:17:15 - INFO - __main__ - Step 33496: {'lr': 0.00044618130137474935, 'samples': 6431232, 'steps': 33495, 'loss/train': 1.422435998916626} -08/30/2021 19:17:16 - INFO - __main__ - Step 33497: {'lr': 0.0004461780119779034, 'samples': 6431424, 'steps': 33496, 'loss/train': 1.496319055557251} -08/30/2021 19:17:16 - INFO - __main__ - Step 33498: {'lr': 0.0004461747224926628, 'samples': 6431616, 'steps': 33497, 'loss/train': 0.8715442419052124} -08/30/2021 19:17:16 - INFO - __main__ - Step 33499: {'lr': 0.0004461714329190288, 'samples': 6431808, 'steps': 33498, 'loss/train': 1.5960817337036133} -08/30/2021 19:17:17 - INFO - __main__ - Step 33500: {'lr': 0.00044616814325700293, 'samples': 6432000, 'steps': 33499, 'loss/train': 0.6516277194023132} -08/30/2021 19:17:18 - INFO - __main__ - Step 33501: {'lr': 0.0004461648535065869, 'samples': 6432192, 'steps': 33500, 'loss/train': 1.010624885559082} -08/30/2021 19:17:19 - INFO - __main__ - Step 33502: {'lr': 0.0004461615636677818, 'samples': 6432384, 'steps': 33501, 'loss/train': 1.2123264074325562} -08/30/2021 19:17:19 - INFO - __main__ - Step 33503: {'lr': 0.0004461582737405895, 'samples': 6432576, 'steps': 33502, 'loss/train': 1.5560311079025269} -08/30/2021 19:17:19 - INFO - __main__ - Step 33504: {'lr': 0.00044615498372501116, 'samples': 6432768, 'steps': 33503, 'loss/train': 1.3471797704696655} -08/30/2021 19:17:20 - INFO - __main__ - Step 33505: {'lr': 0.00044615169362104856, 'samples': 6432960, 'steps': 33504, 'loss/train': 1.5496647357940674} -08/30/2021 19:17:21 - INFO - __main__ - Step 33506: {'lr': 0.00044614840342870293, 'samples': 6433152, 'steps': 33505, 'loss/train': 1.0810092687606812} -08/30/2021 19:17:22 - INFO - __main__ - Step 33507: {'lr': 0.0004461451131479759, 'samples': 6433344, 'steps': 33506, 'loss/train': 1.672833800315857} -08/30/2021 19:17:22 - INFO - __main__ - Step 33508: {'lr': 0.0004461418227788689, 'samples': 6433536, 'steps': 33507, 'loss/train': 1.437759280204773} -08/30/2021 19:17:23 - INFO - __main__ - Step 33509: {'lr': 0.00044613853232138343, 'samples': 6433728, 'steps': 33508, 'loss/train': 1.7411867380142212} -08/30/2021 19:17:23 - INFO - __main__ - Step 33510: {'lr': 0.0004461352417755209, 'samples': 6433920, 'steps': 33509, 'loss/train': 1.44561767578125} -08/30/2021 19:17:23 - INFO - __main__ - Step 33511: {'lr': 0.0004461319511412829, 'samples': 6434112, 'steps': 33510, 'loss/train': 1.9419852495193481} -08/30/2021 19:17:25 - INFO - __main__ - Step 33512: {'lr': 0.00044612866041867093, 'samples': 6434304, 'steps': 33511, 'loss/train': 0.6615219712257385} -08/30/2021 19:17:26 - INFO - __main__ - Step 33513: {'lr': 0.0004461253696076863, 'samples': 6434496, 'steps': 33512, 'loss/train': 2.077902317047119} -08/30/2021 19:17:26 - INFO - __main__ - Step 33514: {'lr': 0.00044612207870833073, 'samples': 6434688, 'steps': 33513, 'loss/train': 0.9714586138725281} -08/30/2021 19:17:26 - INFO - __main__ - Step 33515: {'lr': 0.0004461187877206055, 'samples': 6434880, 'steps': 33514, 'loss/train': 1.8643016815185547} -08/30/2021 19:17:27 - INFO - __main__ - Step 33516: {'lr': 0.00044611549664451216, 'samples': 6435072, 'steps': 33515, 'loss/train': 1.7042568922042847} -08/30/2021 19:17:28 - INFO - __main__ - Step 33517: {'lr': 0.0004461122054800522, 'samples': 6435264, 'steps': 33516, 'loss/train': 1.6835029125213623} -08/30/2021 19:17:29 - INFO - __main__ - Step 33518: {'lr': 0.00044610891422722714, 'samples': 6435456, 'steps': 33517, 'loss/train': 1.140123963356018} -08/30/2021 19:17:29 - INFO - __main__ - Step 33519: {'lr': 0.00044610562288603846, 'samples': 6435648, 'steps': 33518, 'loss/train': 1.3658342361450195} -08/30/2021 19:17:29 - INFO - __main__ - Step 33520: {'lr': 0.00044610233145648756, 'samples': 6435840, 'steps': 33519, 'loss/train': 2.090968370437622} -08/30/2021 19:17:30 - INFO - __main__ - Step 33521: {'lr': 0.00044609903993857603, 'samples': 6436032, 'steps': 33520, 'loss/train': 1.7515610456466675} -08/30/2021 19:17:31 - INFO - __main__ - Step 33522: {'lr': 0.0004460957483323052, 'samples': 6436224, 'steps': 33521, 'loss/train': 2.3323111534118652} -08/30/2021 19:17:32 - INFO - __main__ - Step 33523: {'lr': 0.0004460924566376767, 'samples': 6436416, 'steps': 33522, 'loss/train': 1.9491584300994873} -08/30/2021 19:17:32 - INFO - __main__ - Step 33524: {'lr': 0.00044608916485469195, 'samples': 6436608, 'steps': 33523, 'loss/train': 0.9474073052406311} -08/30/2021 19:17:32 - INFO - __main__ - Step 33525: {'lr': 0.0004460858729833525, 'samples': 6436800, 'steps': 33524, 'loss/train': 1.5902125835418701} -08/30/2021 19:17:33 - INFO - __main__ - Step 33526: {'lr': 0.0004460825810236598, 'samples': 6436992, 'steps': 33525, 'loss/train': 1.3268276453018188} -08/30/2021 19:17:34 - INFO - __main__ - Step 33527: {'lr': 0.00044607928897561524, 'samples': 6437184, 'steps': 33526, 'loss/train': 1.4679911136627197} -08/30/2021 19:17:35 - INFO - __main__ - Step 33528: {'lr': 0.0004460759968392204, 'samples': 6437376, 'steps': 33527, 'loss/train': 1.366976261138916} -08/30/2021 19:17:35 - INFO - __main__ - Step 33529: {'lr': 0.0004460727046144768, 'samples': 6437568, 'steps': 33528, 'loss/train': 1.1873396635055542} -08/30/2021 19:17:36 - INFO - __main__ - Step 33530: {'lr': 0.00044606941230138574, 'samples': 6437760, 'steps': 33529, 'loss/train': 1.4000188112258911} -08/30/2021 19:17:36 - INFO - __main__ - Step 33531: {'lr': 0.0004460661198999489, 'samples': 6437952, 'steps': 33530, 'loss/train': 1.60287606716156} -08/30/2021 19:17:37 - INFO - __main__ - Step 33532: {'lr': 0.0004460628274101677, 'samples': 6438144, 'steps': 33531, 'loss/train': 1.2830095291137695} -08/30/2021 19:17:38 - INFO - __main__ - Step 33533: {'lr': 0.0004460595348320436, 'samples': 6438336, 'steps': 33532, 'loss/train': 1.4931893348693848} -08/30/2021 19:17:38 - INFO - __main__ - Step 33534: {'lr': 0.0004460562421655782, 'samples': 6438528, 'steps': 33533, 'loss/train': 1.1894075870513916} -08/30/2021 19:17:39 - INFO - __main__ - Step 33535: {'lr': 0.0004460529494107727, 'samples': 6438720, 'steps': 33534, 'loss/train': 1.116638422012329} -08/30/2021 19:17:39 - INFO - __main__ - Step 33536: {'lr': 0.00044604965656762884, 'samples': 6438912, 'steps': 33535, 'loss/train': 1.6395421028137207} -08/30/2021 19:17:40 - INFO - __main__ - Step 33537: {'lr': 0.0004460463636361481, 'samples': 6439104, 'steps': 33536, 'loss/train': 1.503105640411377} -08/30/2021 19:17:41 - INFO - __main__ - Step 33538: {'lr': 0.00044604307061633187, 'samples': 6439296, 'steps': 33537, 'loss/train': 1.4628092050552368} -08/30/2021 19:17:41 - INFO - __main__ - Step 33539: {'lr': 0.0004460397775081816, 'samples': 6439488, 'steps': 33538, 'loss/train': 0.7604972720146179} -08/30/2021 19:17:42 - INFO - __main__ - Step 33540: {'lr': 0.00044603648431169884, 'samples': 6439680, 'steps': 33539, 'loss/train': 1.6785184144973755} -08/30/2021 19:17:42 - INFO - __main__ - Step 33541: {'lr': 0.0004460331910268851, 'samples': 6439872, 'steps': 33540, 'loss/train': 1.0894722938537598} -08/30/2021 19:17:43 - INFO - __main__ - Step 33542: {'lr': 0.0004460298976537418, 'samples': 6440064, 'steps': 33541, 'loss/train': 1.0590217113494873} -08/30/2021 19:17:44 - INFO - __main__ - Step 33543: {'lr': 0.00044602660419227046, 'samples': 6440256, 'steps': 33542, 'loss/train': 1.2171657085418701} -08/30/2021 19:17:44 - INFO - __main__ - Step 33544: {'lr': 0.0004460233106424726, 'samples': 6440448, 'steps': 33543, 'loss/train': 2.1229300498962402} -08/30/2021 19:17:45 - INFO - __main__ - Step 33545: {'lr': 0.00044602001700434963, 'samples': 6440640, 'steps': 33544, 'loss/train': 1.7850686311721802} -08/30/2021 19:17:45 - INFO - __main__ - Step 33546: {'lr': 0.00044601672327790304, 'samples': 6440832, 'steps': 33545, 'loss/train': 1.6989439725875854} -08/30/2021 19:17:45 - INFO - __main__ - Step 33547: {'lr': 0.00044601342946313437, 'samples': 6441024, 'steps': 33546, 'loss/train': 1.5467450618743896} -08/30/2021 19:17:47 - INFO - __main__ - Step 33548: {'lr': 0.0004460101355600451, 'samples': 6441216, 'steps': 33547, 'loss/train': 1.662822961807251} -08/30/2021 19:17:47 - INFO - __main__ - Step 33549: {'lr': 0.0004460068415686366, 'samples': 6441408, 'steps': 33548, 'loss/train': 0.7413464784622192} -08/30/2021 19:17:48 - INFO - __main__ - Step 33550: {'lr': 0.0004460035474889105, 'samples': 6441600, 'steps': 33549, 'loss/train': 1.6940312385559082} -08/30/2021 19:17:48 - INFO - __main__ - Step 33551: {'lr': 0.00044600025332086824, 'samples': 6441792, 'steps': 33550, 'loss/train': 1.6477826833724976} -08/30/2021 19:17:48 - INFO - __main__ - Step 33552: {'lr': 0.0004459969590645113, 'samples': 6441984, 'steps': 33551, 'loss/train': 1.9770739078521729} -08/30/2021 19:17:50 - INFO - __main__ - Step 33553: {'lr': 0.000445993664719841, 'samples': 6442176, 'steps': 33552, 'loss/train': 1.5966130495071411} -08/30/2021 19:17:50 - INFO - __main__ - Step 33554: {'lr': 0.0004459903702868592, 'samples': 6442368, 'steps': 33553, 'loss/train': 1.5315237045288086} -08/30/2021 19:17:51 - INFO - __main__ - Step 33555: {'lr': 0.00044598707576556706, 'samples': 6442560, 'steps': 33554, 'loss/train': 1.59503173828125} -08/30/2021 19:17:51 - INFO - __main__ - Step 33556: {'lr': 0.00044598378115596614, 'samples': 6442752, 'steps': 33555, 'loss/train': 1.8892861604690552} -08/30/2021 19:17:51 - INFO - __main__ - Step 33557: {'lr': 0.000445980486458058, 'samples': 6442944, 'steps': 33556, 'loss/train': 1.628419041633606} -08/30/2021 19:17:53 - INFO - __main__ - Step 33558: {'lr': 0.0004459771916718441, 'samples': 6443136, 'steps': 33557, 'loss/train': 0.602741003036499} -08/30/2021 19:17:54 - INFO - __main__ - Step 33559: {'lr': 0.0004459738967973258, 'samples': 6443328, 'steps': 33558, 'loss/train': 0.1294114738702774} -08/30/2021 19:17:54 - INFO - __main__ - Step 33560: {'lr': 0.00044597060183450477, 'samples': 6443520, 'steps': 33559, 'loss/train': 1.6607118844985962} -08/30/2021 19:17:54 - INFO - __main__ - Step 33561: {'lr': 0.00044596730678338236, 'samples': 6443712, 'steps': 33560, 'loss/train': 1.4046095609664917} -08/30/2021 19:17:55 - INFO - __main__ - Step 33562: {'lr': 0.0004459640116439602, 'samples': 6443904, 'steps': 33561, 'loss/train': 1.2720739841461182} -08/30/2021 19:17:56 - INFO - __main__ - Step 33563: {'lr': 0.0004459607164162396, 'samples': 6444096, 'steps': 33562, 'loss/train': 0.976750373840332} -08/30/2021 19:17:57 - INFO - __main__ - Step 33564: {'lr': 0.00044595742110022216, 'samples': 6444288, 'steps': 33563, 'loss/train': 1.6367906332015991} -08/30/2021 19:17:57 - INFO - __main__ - Step 33565: {'lr': 0.00044595412569590934, 'samples': 6444480, 'steps': 33564, 'loss/train': 1.6431139707565308} -08/30/2021 19:17:57 - INFO - __main__ - Step 33566: {'lr': 0.0004459508302033025, 'samples': 6444672, 'steps': 33565, 'loss/train': 1.485739827156067} -08/30/2021 19:17:58 - INFO - __main__ - Step 33567: {'lr': 0.00044594753462240335, 'samples': 6444864, 'steps': 33566, 'loss/train': 1.5362398624420166} -08/30/2021 19:17:59 - INFO - __main__ - Step 33568: {'lr': 0.0004459442389532132, 'samples': 6445056, 'steps': 33567, 'loss/train': 0.3389038145542145} -08/30/2021 19:18:00 - INFO - __main__ - Step 33569: {'lr': 0.0004459409431957337, 'samples': 6445248, 'steps': 33568, 'loss/train': 1.1762274503707886} -08/30/2021 19:18:00 - INFO - __main__ - Step 33570: {'lr': 0.00044593764734996615, 'samples': 6445440, 'steps': 33569, 'loss/train': 1.5141596794128418} -08/30/2021 19:18:00 - INFO - __main__ - Step 33571: {'lr': 0.00044593435141591215, 'samples': 6445632, 'steps': 33570, 'loss/train': 1.363669514656067} -08/30/2021 19:18:01 - INFO - __main__ - Step 33572: {'lr': 0.00044593105539357313, 'samples': 6445824, 'steps': 33571, 'loss/train': 1.764335036277771} -08/30/2021 19:18:02 - INFO - __main__ - Step 33573: {'lr': 0.00044592775928295063, 'samples': 6446016, 'steps': 33572, 'loss/train': 1.2118182182312012} -08/30/2021 19:18:03 - INFO - __main__ - Step 33574: {'lr': 0.0004459244630840461, 'samples': 6446208, 'steps': 33573, 'loss/train': 1.42490553855896} -08/30/2021 19:18:03 - INFO - __main__ - Step 33575: {'lr': 0.000445921166796861, 'samples': 6446400, 'steps': 33574, 'loss/train': 1.322339653968811} -08/30/2021 19:18:03 - INFO - __main__ - Step 33576: {'lr': 0.00044591787042139684, 'samples': 6446592, 'steps': 33575, 'loss/train': 1.9720096588134766} -08/30/2021 19:18:04 - INFO - __main__ - Step 33577: {'lr': 0.0004459145739576552, 'samples': 6446784, 'steps': 33576, 'loss/train': 1.5571340322494507} -08/30/2021 19:18:04 - INFO - __main__ - Step 33578: {'lr': 0.0004459112774056374, 'samples': 6446976, 'steps': 33577, 'loss/train': 0.08507446944713593} -08/30/2021 19:18:06 - INFO - __main__ - Step 33579: {'lr': 0.000445907980765345, 'samples': 6447168, 'steps': 33578, 'loss/train': 0.137797549366951} -08/30/2021 19:18:07 - INFO - __main__ - Step 33580: {'lr': 0.00044590468403677954, 'samples': 6447360, 'steps': 33579, 'loss/train': 1.6683679819107056} -08/30/2021 19:18:07 - INFO - __main__ - Step 33581: {'lr': 0.00044590138721994243, 'samples': 6447552, 'steps': 33580, 'loss/train': 0.0656447559595108} -08/30/2021 19:18:08 - INFO - __main__ - Step 33582: {'lr': 0.00044589809031483517, 'samples': 6447744, 'steps': 33581, 'loss/train': 1.7217763662338257} -08/30/2021 19:18:08 - INFO - __main__ - Step 33583: {'lr': 0.0004458947933214592, 'samples': 6447936, 'steps': 33582, 'loss/train': 1.8664904832839966} -08/30/2021 19:18:09 - INFO - __main__ - Step 33584: {'lr': 0.0004458914962398162, 'samples': 6448128, 'steps': 33583, 'loss/train': 1.1735714673995972} -08/30/2021 19:18:10 - INFO - __main__ - Step 33585: {'lr': 0.0004458881990699074, 'samples': 6448320, 'steps': 33584, 'loss/train': 1.5449466705322266} -08/30/2021 19:18:10 - INFO - __main__ - Step 33586: {'lr': 0.00044588490181173435, 'samples': 6448512, 'steps': 33585, 'loss/train': 0.9304819107055664} -08/30/2021 19:18:10 - INFO - __main__ - Step 33587: {'lr': 0.0004458816044652987, 'samples': 6448704, 'steps': 33586, 'loss/train': 1.712382435798645} -08/30/2021 19:18:11 - INFO - __main__ - Step 33588: {'lr': 0.00044587830703060176, 'samples': 6448896, 'steps': 33587, 'loss/train': 1.574870228767395} -08/30/2021 19:18:12 - INFO - __main__ - Step 33589: {'lr': 0.00044587500950764514, 'samples': 6449088, 'steps': 33588, 'loss/train': 1.2343231439590454} -08/30/2021 19:18:13 - INFO - __main__ - Step 33590: {'lr': 0.0004458717118964302, 'samples': 6449280, 'steps': 33589, 'loss/train': 1.4308565855026245} -08/30/2021 19:18:13 - INFO - __main__ - Step 33591: {'lr': 0.0004458684141969585, 'samples': 6449472, 'steps': 33590, 'loss/train': 0.8971796631813049} -08/30/2021 19:18:14 - INFO - __main__ - Step 33592: {'lr': 0.0004458651164092315, 'samples': 6449664, 'steps': 33591, 'loss/train': 1.4396170377731323} -08/30/2021 19:18:14 - INFO - __main__ - Step 33593: {'lr': 0.00044586181853325076, 'samples': 6449856, 'steps': 33592, 'loss/train': 1.6373296976089478} -08/30/2021 19:18:15 - INFO - __main__ - Step 33594: {'lr': 0.0004458585205690177, 'samples': 6450048, 'steps': 33593, 'loss/train': 1.636523723602295} -08/30/2021 19:18:16 - INFO - __main__ - Step 33595: {'lr': 0.0004458552225165338, 'samples': 6450240, 'steps': 33594, 'loss/train': 1.4056764841079712} -08/30/2021 19:18:16 - INFO - __main__ - Step 33596: {'lr': 0.00044585192437580044, 'samples': 6450432, 'steps': 33595, 'loss/train': 1.401124119758606} -08/30/2021 19:18:17 - INFO - __main__ - Step 33597: {'lr': 0.0004458486261468194, 'samples': 6450624, 'steps': 33596, 'loss/train': 1.8220943212509155} -08/30/2021 19:18:17 - INFO - __main__ - Step 33598: {'lr': 0.0004458453278295919, 'samples': 6450816, 'steps': 33597, 'loss/train': 1.9699482917785645} -08/30/2021 19:18:18 - INFO - __main__ - Step 33599: {'lr': 0.00044584202942411956, 'samples': 6451008, 'steps': 33598, 'loss/train': 1.4828118085861206} -08/30/2021 19:18:19 - INFO - __main__ - Step 33600: {'lr': 0.00044583873093040376, 'samples': 6451200, 'steps': 33599, 'loss/train': 1.154546856880188} -08/30/2021 19:18:19 - INFO - __main__ - Step 33601: {'lr': 0.00044583543234844616, 'samples': 6451392, 'steps': 33600, 'loss/train': 1.019271731376648} -08/30/2021 19:18:20 - INFO - __main__ - Step 33602: {'lr': 0.00044583213367824806, 'samples': 6451584, 'steps': 33601, 'loss/train': 1.2273890972137451} -08/30/2021 19:18:20 - INFO - __main__ - Step 33603: {'lr': 0.00044582883491981097, 'samples': 6451776, 'steps': 33602, 'loss/train': 1.2579402923583984} -08/30/2021 19:18:21 - INFO - __main__ - Step 33604: {'lr': 0.0004458255360731365, 'samples': 6451968, 'steps': 33603, 'loss/train': 1.7824475765228271} -08/30/2021 19:18:22 - INFO - __main__ - Step 33605: {'lr': 0.00044582223713822606, 'samples': 6452160, 'steps': 33604, 'loss/train': 1.8708246946334839} -08/30/2021 19:18:22 - INFO - __main__ - Step 33606: {'lr': 0.0004458189381150811, 'samples': 6452352, 'steps': 33605, 'loss/train': 1.6141432523727417} -08/30/2021 19:18:23 - INFO - __main__ - Step 33607: {'lr': 0.00044581563900370326, 'samples': 6452544, 'steps': 33606, 'loss/train': 1.4116876125335693} -08/30/2021 19:18:23 - INFO - __main__ - Step 33608: {'lr': 0.0004458123398040938, 'samples': 6452736, 'steps': 33607, 'loss/train': 1.2242189645767212} -08/30/2021 19:18:25 - INFO - __main__ - Step 33609: {'lr': 0.0004458090405162544, 'samples': 6452928, 'steps': 33608, 'loss/train': 1.7578891515731812} -08/30/2021 19:18:25 - INFO - __main__ - Step 33610: {'lr': 0.0004458057411401864, 'samples': 6453120, 'steps': 33609, 'loss/train': 0.0835859552025795} -08/30/2021 19:18:25 - INFO - __main__ - Step 33611: {'lr': 0.00044580244167589136, 'samples': 6453312, 'steps': 33610, 'loss/train': 1.689874291419983} -08/30/2021 19:18:26 - INFO - __main__ - Step 33612: {'lr': 0.00044579914212337083, 'samples': 6453504, 'steps': 33611, 'loss/train': 1.5564651489257812} -08/30/2021 19:18:26 - INFO - __main__ - Step 33613: {'lr': 0.00044579584248262617, 'samples': 6453696, 'steps': 33612, 'loss/train': 1.5197362899780273} -08/30/2021 19:18:28 - INFO - __main__ - Step 33614: {'lr': 0.0004457925427536589, 'samples': 6453888, 'steps': 33613, 'loss/train': 1.3100367784500122} -08/30/2021 19:18:28 - INFO - __main__ - Step 33615: {'lr': 0.0004457892429364706, 'samples': 6454080, 'steps': 33614, 'loss/train': 1.5002819299697876} -08/30/2021 19:18:28 - INFO - __main__ - Step 33616: {'lr': 0.00044578594303106266, 'samples': 6454272, 'steps': 33615, 'loss/train': 1.2887840270996094} -08/30/2021 19:18:29 - INFO - __main__ - Step 33617: {'lr': 0.00044578264303743654, 'samples': 6454464, 'steps': 33616, 'loss/train': 1.5096867084503174} -08/30/2021 19:18:29 - INFO - __main__ - Step 33618: {'lr': 0.00044577934295559387, 'samples': 6454656, 'steps': 33617, 'loss/train': 0.6373361945152283} -08/30/2021 19:18:29 - INFO - __main__ - Step 33619: {'lr': 0.000445776042785536, 'samples': 6454848, 'steps': 33618, 'loss/train': 1.3112380504608154} -08/30/2021 19:18:31 - INFO - __main__ - Step 33620: {'lr': 0.00044577274252726454, 'samples': 6455040, 'steps': 33619, 'loss/train': 1.7142326831817627} -08/30/2021 19:18:31 - INFO - __main__ - Step 33621: {'lr': 0.00044576944218078075, 'samples': 6455232, 'steps': 33620, 'loss/train': 1.010748028755188} -08/30/2021 19:18:32 - INFO - __main__ - Step 33622: {'lr': 0.00044576614174608644, 'samples': 6455424, 'steps': 33621, 'loss/train': 1.9477105140686035} -08/30/2021 19:18:32 - INFO - __main__ - Step 33623: {'lr': 0.0004457628412231828, 'samples': 6455616, 'steps': 33622, 'loss/train': 0.5873215198516846} -08/30/2021 19:18:32 - INFO - __main__ - Step 33624: {'lr': 0.0004457595406120715, 'samples': 6455808, 'steps': 33623, 'loss/train': 1.3149832487106323} -08/30/2021 19:18:34 - INFO - __main__ - Step 33625: {'lr': 0.000445756239912754, 'samples': 6456000, 'steps': 33624, 'loss/train': 1.191064476966858} -08/30/2021 19:18:34 - INFO - __main__ - Step 33626: {'lr': 0.00044575293912523173, 'samples': 6456192, 'steps': 33625, 'loss/train': 1.6719938516616821} -08/30/2021 19:18:35 - INFO - __main__ - Step 33627: {'lr': 0.0004457496382495062, 'samples': 6456384, 'steps': 33626, 'loss/train': 1.5137373208999634} -08/30/2021 19:18:35 - INFO - __main__ - Step 33628: {'lr': 0.00044574633728557887, 'samples': 6456576, 'steps': 33627, 'loss/train': 1.7458797693252563} -08/30/2021 19:18:35 - INFO - __main__ - Step 33629: {'lr': 0.0004457430362334513, 'samples': 6456768, 'steps': 33628, 'loss/train': 1.588250994682312} -08/30/2021 19:18:37 - INFO - __main__ - Step 33630: {'lr': 0.00044573973509312494, 'samples': 6456960, 'steps': 33629, 'loss/train': 1.6230896711349487} -08/30/2021 19:18:37 - INFO - __main__ - Step 33631: {'lr': 0.00044573643386460127, 'samples': 6457152, 'steps': 33630, 'loss/train': 1.3803664445877075} -08/30/2021 19:18:38 - INFO - __main__ - Step 33632: {'lr': 0.00044573313254788176, 'samples': 6457344, 'steps': 33631, 'loss/train': 1.405279517173767} -08/30/2021 19:18:38 - INFO - __main__ - Step 33633: {'lr': 0.00044572983114296794, 'samples': 6457536, 'steps': 33632, 'loss/train': 1.3801747560501099} -08/30/2021 19:18:38 - INFO - __main__ - Step 33634: {'lr': 0.00044572652964986126, 'samples': 6457728, 'steps': 33633, 'loss/train': 1.7407443523406982} -08/30/2021 19:18:40 - INFO - __main__ - Step 33635: {'lr': 0.0004457232280685633, 'samples': 6457920, 'steps': 33634, 'loss/train': 1.8664658069610596} -08/30/2021 19:18:41 - INFO - __main__ - Step 33636: {'lr': 0.0004457199263990754, 'samples': 6458112, 'steps': 33635, 'loss/train': 1.5581839084625244} -08/30/2021 19:18:41 - INFO - __main__ - Step 33637: {'lr': 0.0004457166246413992, 'samples': 6458304, 'steps': 33636, 'loss/train': 1.475074291229248} -08/30/2021 19:18:42 - INFO - __main__ - Step 33638: {'lr': 0.000445713322795536, 'samples': 6458496, 'steps': 33637, 'loss/train': 2.033583164215088} -08/30/2021 19:18:42 - INFO - __main__ - Step 33639: {'lr': 0.0004457100208614875, 'samples': 6458688, 'steps': 33638, 'loss/train': 1.7355316877365112} -08/30/2021 19:18:43 - INFO - __main__ - Step 33640: {'lr': 0.00044570671883925497, 'samples': 6458880, 'steps': 33639, 'loss/train': 1.048525333404541} -08/30/2021 19:18:44 - INFO - __main__ - Step 33641: {'lr': 0.00044570341672884006, 'samples': 6459072, 'steps': 33640, 'loss/train': 1.741182804107666} -08/30/2021 19:18:44 - INFO - __main__ - Step 33642: {'lr': 0.0004457001145302443, 'samples': 6459264, 'steps': 33641, 'loss/train': 1.8247840404510498} -08/30/2021 19:18:45 - INFO - __main__ - Step 33643: {'lr': 0.00044569681224346897, 'samples': 6459456, 'steps': 33642, 'loss/train': 1.3121438026428223} -08/30/2021 19:18:45 - INFO - __main__ - Step 33644: {'lr': 0.0004456935098685158, 'samples': 6459648, 'steps': 33643, 'loss/train': 1.1755136251449585} -08/30/2021 19:18:46 - INFO - __main__ - Step 33645: {'lr': 0.000445690207405386, 'samples': 6459840, 'steps': 33644, 'loss/train': 1.9052174091339111} -08/30/2021 19:18:47 - INFO - __main__ - Step 33646: {'lr': 0.00044568690485408125, 'samples': 6460032, 'steps': 33645, 'loss/train': 2.1132073402404785} -08/30/2021 19:18:47 - INFO - __main__ - Step 33647: {'lr': 0.0004456836022146031, 'samples': 6460224, 'steps': 33646, 'loss/train': 1.7295184135437012} -08/30/2021 19:18:48 - INFO - __main__ - Step 33648: {'lr': 0.00044568029948695287, 'samples': 6460416, 'steps': 33647, 'loss/train': 1.062779188156128} -08/30/2021 19:18:48 - INFO - __main__ - Step 33649: {'lr': 0.0004456769966711321, 'samples': 6460608, 'steps': 33648, 'loss/train': 1.621753215789795} -08/30/2021 19:18:50 - INFO - __main__ - Step 33650: {'lr': 0.00044567369376714226, 'samples': 6460800, 'steps': 33649, 'loss/train': 1.470309853553772} -08/30/2021 19:18:50 - INFO - __main__ - Step 33651: {'lr': 0.00044567039077498497, 'samples': 6460992, 'steps': 33650, 'loss/train': 1.4786673784255981} -08/30/2021 19:18:50 - INFO - __main__ - Step 33652: {'lr': 0.00044566708769466155, 'samples': 6461184, 'steps': 33651, 'loss/train': 1.9077013731002808} -08/30/2021 19:18:51 - INFO - __main__ - Step 33653: {'lr': 0.00044566378452617363, 'samples': 6461376, 'steps': 33652, 'loss/train': 1.3045562505722046} -08/30/2021 19:18:51 - INFO - __main__ - Step 33654: {'lr': 0.0004456604812695226, 'samples': 6461568, 'steps': 33653, 'loss/train': 0.2149282991886139} -08/30/2021 19:18:51 - INFO - __main__ - Step 33655: {'lr': 0.0004456571779247099, 'samples': 6461760, 'steps': 33654, 'loss/train': 2.1666784286499023} -08/30/2021 19:18:53 - INFO - __main__ - Step 33656: {'lr': 0.0004456538744917372, 'samples': 6461952, 'steps': 33655, 'loss/train': 2.077083110809326} -08/30/2021 19:18:53 - INFO - __main__ - Step 33657: {'lr': 0.0004456505709706059, 'samples': 6462144, 'steps': 33656, 'loss/train': 1.508438229560852} -08/30/2021 19:18:54 - INFO - __main__ - Step 33658: {'lr': 0.0004456472673613174, 'samples': 6462336, 'steps': 33657, 'loss/train': 1.0288509130477905} -08/30/2021 19:18:54 - INFO - __main__ - Step 33659: {'lr': 0.00044564396366387327, 'samples': 6462528, 'steps': 33658, 'loss/train': 1.1481804847717285} -08/30/2021 19:18:55 - INFO - __main__ - Step 33660: {'lr': 0.000445640659878275, 'samples': 6462720, 'steps': 33659, 'loss/train': 1.3931019306182861} -08/30/2021 19:18:56 - INFO - __main__ - Step 33661: {'lr': 0.00044563735600452407, 'samples': 6462912, 'steps': 33660, 'loss/train': 1.7889535427093506} -08/30/2021 19:18:57 - INFO - __main__ - Step 33662: {'lr': 0.000445634052042622, 'samples': 6463104, 'steps': 33661, 'loss/train': 1.5299344062805176} -08/30/2021 19:18:57 - INFO - __main__ - Step 33663: {'lr': 0.00044563074799257015, 'samples': 6463296, 'steps': 33662, 'loss/train': 1.7181077003479004} -08/30/2021 19:18:57 - INFO - __main__ - Step 33664: {'lr': 0.0004456274438543702, 'samples': 6463488, 'steps': 33663, 'loss/train': 1.537021517753601} -08/30/2021 19:18:58 - INFO - __main__ - Step 33665: {'lr': 0.0004456241396280234, 'samples': 6463680, 'steps': 33664, 'loss/train': 1.6002298593521118} -08/30/2021 19:18:59 - INFO - __main__ - Step 33666: {'lr': 0.00044562083531353154, 'samples': 6463872, 'steps': 33665, 'loss/train': 1.5957136154174805} -08/30/2021 19:19:00 - INFO - __main__ - Step 33667: {'lr': 0.00044561753091089585, 'samples': 6464064, 'steps': 33666, 'loss/train': 1.194705843925476} -08/30/2021 19:19:00 - INFO - __main__ - Step 33668: {'lr': 0.00044561422642011794, 'samples': 6464256, 'steps': 33667, 'loss/train': 1.3724820613861084} -08/30/2021 19:19:01 - INFO - __main__ - Step 33669: {'lr': 0.00044561092184119933, 'samples': 6464448, 'steps': 33668, 'loss/train': 0.5602323412895203} -08/30/2021 19:19:01 - INFO - __main__ - Step 33670: {'lr': 0.00044560761717414143, 'samples': 6464640, 'steps': 33669, 'loss/train': 1.494260311126709} -08/30/2021 19:19:01 - INFO - __main__ - Step 33671: {'lr': 0.0004456043124189458, 'samples': 6464832, 'steps': 33670, 'loss/train': 2.1510260105133057} -08/30/2021 19:19:03 - INFO - __main__ - Step 33672: {'lr': 0.00044560100757561386, 'samples': 6465024, 'steps': 33671, 'loss/train': 1.2402567863464355} -08/30/2021 19:19:03 - INFO - __main__ - Step 33673: {'lr': 0.000445597702644147, 'samples': 6465216, 'steps': 33672, 'loss/train': 1.3177675008773804} -08/30/2021 19:19:03 - INFO - __main__ - Step 33674: {'lr': 0.000445594397624547, 'samples': 6465408, 'steps': 33673, 'loss/train': 1.3417434692382812} -08/30/2021 19:19:04 - INFO - __main__ - Step 33675: {'lr': 0.0004455910925168151, 'samples': 6465600, 'steps': 33674, 'loss/train': 0.6625871658325195} -08/30/2021 19:19:04 - INFO - __main__ - Step 33676: {'lr': 0.0004455877873209529, 'samples': 6465792, 'steps': 33675, 'loss/train': 1.4782607555389404} -08/30/2021 19:19:06 - INFO - __main__ - Step 33677: {'lr': 0.00044558448203696184, 'samples': 6465984, 'steps': 33676, 'loss/train': 1.2957102060317993} -08/30/2021 19:19:06 - INFO - __main__ - Step 33678: {'lr': 0.0004455811766648434, 'samples': 6466176, 'steps': 33677, 'loss/train': 1.493072748184204} -08/30/2021 19:19:06 - INFO - __main__ - Step 33679: {'lr': 0.0004455778712045992, 'samples': 6466368, 'steps': 33678, 'loss/train': 0.9289096593856812} -08/30/2021 19:19:07 - INFO - __main__ - Step 33680: {'lr': 0.0004455745656562306, 'samples': 6466560, 'steps': 33679, 'loss/train': 1.2810266017913818} -08/30/2021 19:19:07 - INFO - __main__ - Step 33681: {'lr': 0.000445571260019739, 'samples': 6466752, 'steps': 33680, 'loss/train': 1.046522855758667} -08/30/2021 19:19:09 - INFO - __main__ - Step 33682: {'lr': 0.00044556795429512617, 'samples': 6466944, 'steps': 33681, 'loss/train': 1.375369906425476} -08/30/2021 19:19:09 - INFO - __main__ - Step 33683: {'lr': 0.0004455646484823933, 'samples': 6467136, 'steps': 33682, 'loss/train': 1.3770354986190796} -08/30/2021 19:19:10 - INFO - __main__ - Step 33684: {'lr': 0.00044556134258154215, 'samples': 6467328, 'steps': 33683, 'loss/train': 1.6346420049667358} -08/30/2021 19:19:10 - INFO - __main__ - Step 33685: {'lr': 0.000445558036592574, 'samples': 6467520, 'steps': 33684, 'loss/train': 0.8800514340400696} -08/30/2021 19:19:10 - INFO - __main__ - Step 33686: {'lr': 0.0004455547305154904, 'samples': 6467712, 'steps': 33685, 'loss/train': 1.3120747804641724} -08/30/2021 19:19:13 - INFO - __main__ - Step 33687: {'lr': 0.00044555142435029284, 'samples': 6467904, 'steps': 33686, 'loss/train': 1.90951406955719} -08/30/2021 19:19:13 - INFO - __main__ - Step 33688: {'lr': 0.0004455481180969829, 'samples': 6468096, 'steps': 33687, 'loss/train': 1.4036403894424438} -08/30/2021 19:19:13 - INFO - __main__ - Step 33689: {'lr': 0.00044554481175556194, 'samples': 6468288, 'steps': 33688, 'loss/train': 1.8362884521484375} -08/30/2021 19:19:14 - INFO - __main__ - Step 33690: {'lr': 0.00044554150532603154, 'samples': 6468480, 'steps': 33689, 'loss/train': 1.3188564777374268} -08/30/2021 19:19:14 - INFO - __main__ - Step 33691: {'lr': 0.00044553819880839313, 'samples': 6468672, 'steps': 33690, 'loss/train': 0.12286171317100525} -08/30/2021 19:19:16 - INFO - __main__ - Step 33692: {'lr': 0.0004455348922026483, 'samples': 6468864, 'steps': 33691, 'loss/train': 1.4504883289337158} -08/30/2021 19:19:16 - INFO - __main__ - Step 33693: {'lr': 0.00044553158550879833, 'samples': 6469056, 'steps': 33692, 'loss/train': 0.966931939125061} -08/30/2021 19:19:17 - INFO - __main__ - Step 33694: {'lr': 0.00044552827872684493, 'samples': 6469248, 'steps': 33693, 'loss/train': 0.05195411294698715} -08/30/2021 19:19:17 - INFO - __main__ - Step 33695: {'lr': 0.00044552497185678953, 'samples': 6469440, 'steps': 33694, 'loss/train': 1.4305965900421143} -08/30/2021 19:19:17 - INFO - __main__ - Step 33696: {'lr': 0.00044552166489863354, 'samples': 6469632, 'steps': 33695, 'loss/train': 1.919219732284546} -08/30/2021 19:19:18 - INFO - __main__ - Step 33697: {'lr': 0.0004455183578523785, 'samples': 6469824, 'steps': 33696, 'loss/train': 0.6313751935958862} -08/30/2021 19:19:19 - INFO - __main__ - Step 33698: {'lr': 0.00044551505071802587, 'samples': 6470016, 'steps': 33697, 'loss/train': 1.5120868682861328} -08/30/2021 19:19:20 - INFO - __main__ - Step 33699: {'lr': 0.00044551174349557733, 'samples': 6470208, 'steps': 33698, 'loss/train': 1.5390487909317017} -08/30/2021 19:19:20 - INFO - __main__ - Step 33700: {'lr': 0.0004455084361850341, 'samples': 6470400, 'steps': 33699, 'loss/train': 1.6729403734207153} -08/30/2021 19:19:20 - INFO - __main__ - Step 33701: {'lr': 0.00044550512878639784, 'samples': 6470592, 'steps': 33700, 'loss/train': 2.4788177013397217} -08/30/2021 19:19:21 - INFO - __main__ - Step 33702: {'lr': 0.0004455018212996699, 'samples': 6470784, 'steps': 33701, 'loss/train': 1.4816921949386597} -08/30/2021 19:19:22 - INFO - __main__ - Step 33703: {'lr': 0.0004454985137248519, 'samples': 6470976, 'steps': 33702, 'loss/train': 1.4157847166061401} -08/30/2021 19:19:23 - INFO - __main__ - Step 33704: {'lr': 0.00044549520606194525, 'samples': 6471168, 'steps': 33703, 'loss/train': 1.1378756761550903} -08/30/2021 19:19:23 - INFO - __main__ - Step 33705: {'lr': 0.00044549189831095157, 'samples': 6471360, 'steps': 33704, 'loss/train': 1.4806702136993408} -08/30/2021 19:19:23 - INFO - __main__ - Step 33706: {'lr': 0.0004454885904718722, 'samples': 6471552, 'steps': 33705, 'loss/train': 0.7380875945091248} -08/30/2021 19:19:24 - INFO - __main__ - Step 33707: {'lr': 0.0004454852825447087, 'samples': 6471744, 'steps': 33706, 'loss/train': 1.4180727005004883} -08/30/2021 19:19:25 - INFO - __main__ - Step 33708: {'lr': 0.0004454819745294625, 'samples': 6471936, 'steps': 33707, 'loss/train': 0.8957964777946472} -08/30/2021 19:19:26 - INFO - __main__ - Step 33709: {'lr': 0.0004454786664261352, 'samples': 6472128, 'steps': 33708, 'loss/train': 1.1599117517471313} -08/30/2021 19:19:26 - INFO - __main__ - Step 33710: {'lr': 0.0004454753582347282, 'samples': 6472320, 'steps': 33709, 'loss/train': 1.262404203414917} -08/30/2021 19:19:26 - INFO - __main__ - Step 33711: {'lr': 0.00044547204995524305, 'samples': 6472512, 'steps': 33710, 'loss/train': 1.4879599809646606} -08/30/2021 19:19:27 - INFO - __main__ - Step 33712: {'lr': 0.00044546874158768115, 'samples': 6472704, 'steps': 33711, 'loss/train': 1.5151615142822266} -08/30/2021 19:19:28 - INFO - __main__ - Step 33713: {'lr': 0.00044546543313204415, 'samples': 6472896, 'steps': 33712, 'loss/train': 0.8803406953811646} -08/30/2021 19:19:29 - INFO - __main__ - Step 33714: {'lr': 0.00044546212458833334, 'samples': 6473088, 'steps': 33713, 'loss/train': 1.1372411251068115} -08/30/2021 19:19:29 - INFO - __main__ - Step 33715: {'lr': 0.00044545881595655035, 'samples': 6473280, 'steps': 33714, 'loss/train': 0.08176945894956589} -08/30/2021 19:19:29 - INFO - __main__ - Step 33716: {'lr': 0.00044545550723669664, 'samples': 6473472, 'steps': 33715, 'loss/train': 1.5716156959533691} -08/30/2021 19:19:30 - INFO - __main__ - Step 33717: {'lr': 0.00044545219842877373, 'samples': 6473664, 'steps': 33716, 'loss/train': 1.4744352102279663} -08/30/2021 19:19:31 - INFO - __main__ - Step 33718: {'lr': 0.000445448889532783, 'samples': 6473856, 'steps': 33717, 'loss/train': 1.3616046905517578} -08/30/2021 19:19:32 - INFO - __main__ - Step 33719: {'lr': 0.0004454455805487261, 'samples': 6474048, 'steps': 33718, 'loss/train': 1.614224910736084} -08/30/2021 19:19:32 - INFO - __main__ - Step 33720: {'lr': 0.0004454422714766043, 'samples': 6474240, 'steps': 33719, 'loss/train': 0.05675714835524559} -08/30/2021 19:19:32 - INFO - __main__ - Step 33721: {'lr': 0.00044543896231641935, 'samples': 6474432, 'steps': 33720, 'loss/train': 2.077928304672241} -08/30/2021 19:19:33 - INFO - __main__ - Step 33722: {'lr': 0.00044543565306817256, 'samples': 6474624, 'steps': 33721, 'loss/train': 1.4743558168411255} -08/30/2021 19:19:35 - INFO - __main__ - Step 33723: {'lr': 0.00044543234373186556, 'samples': 6474816, 'steps': 33722, 'loss/train': 1.5818597078323364} -08/30/2021 19:19:35 - INFO - __main__ - Step 33724: {'lr': 0.0004454290343074997, 'samples': 6475008, 'steps': 33723, 'loss/train': 1.5008740425109863} -08/30/2021 19:19:35 - INFO - __main__ - Step 33725: {'lr': 0.00044542572479507655, 'samples': 6475200, 'steps': 33724, 'loss/train': 1.813492774963379} -08/30/2021 19:19:36 - INFO - __main__ - Step 33726: {'lr': 0.00044542241519459757, 'samples': 6475392, 'steps': 33725, 'loss/train': 0.9517505764961243} -08/30/2021 19:19:36 - INFO - __main__ - Step 33727: {'lr': 0.0004454191055060643, 'samples': 6475584, 'steps': 33726, 'loss/train': 0.1324375718832016} -08/30/2021 19:19:36 - INFO - __main__ - Step 33728: {'lr': 0.00044541579572947814, 'samples': 6475776, 'steps': 33727, 'loss/train': 1.6306759119033813} -08/30/2021 19:19:38 - INFO - __main__ - Step 33729: {'lr': 0.0004454124858648407, 'samples': 6475968, 'steps': 33728, 'loss/train': 1.452009916305542} -08/30/2021 19:19:39 - INFO - __main__ - Step 33730: {'lr': 0.00044540917591215335, 'samples': 6476160, 'steps': 33729, 'loss/train': 1.190197229385376} -08/30/2021 19:19:39 - INFO - __main__ - Step 33731: {'lr': 0.0004454058658714177, 'samples': 6476352, 'steps': 33730, 'loss/train': 0.9651709198951721} -08/30/2021 19:19:40 - INFO - __main__ - Step 33732: {'lr': 0.0004454025557426351, 'samples': 6476544, 'steps': 33731, 'loss/train': 1.937745451927185} -08/30/2021 19:19:40 - INFO - __main__ - Step 33733: {'lr': 0.00044539924552580723, 'samples': 6476736, 'steps': 33732, 'loss/train': 0.1663772165775299} -08/30/2021 19:19:40 - INFO - __main__ - Step 33734: {'lr': 0.0004453959352209354, 'samples': 6476928, 'steps': 33733, 'loss/train': 0.07754461467266083} -08/30/2021 19:19:42 - INFO - __main__ - Step 33735: {'lr': 0.0004453926248280212, 'samples': 6477120, 'steps': 33734, 'loss/train': 0.19635151326656342} -08/30/2021 19:19:42 - INFO - __main__ - Step 33736: {'lr': 0.0004453893143470661, 'samples': 6477312, 'steps': 33735, 'loss/train': 1.0328118801116943} -08/30/2021 19:19:43 - INFO - __main__ - Step 33737: {'lr': 0.0004453860037780716, 'samples': 6477504, 'steps': 33736, 'loss/train': 1.5382918119430542} -08/30/2021 19:19:43 - INFO - __main__ - Step 33738: {'lr': 0.00044538269312103916, 'samples': 6477696, 'steps': 33737, 'loss/train': 1.445682406425476} -08/30/2021 19:19:43 - INFO - __main__ - Step 33739: {'lr': 0.00044537938237597033, 'samples': 6477888, 'steps': 33738, 'loss/train': 2.663958787918091} -08/30/2021 19:19:45 - INFO - __main__ - Step 33740: {'lr': 0.00044537607154286645, 'samples': 6478080, 'steps': 33739, 'loss/train': 1.6115236282348633} -08/30/2021 19:19:46 - INFO - __main__ - Step 33741: {'lr': 0.00044537276062172926, 'samples': 6478272, 'steps': 33740, 'loss/train': 1.5073665380477905} -08/30/2021 19:19:46 - INFO - __main__ - Step 33742: {'lr': 0.0004453694496125601, 'samples': 6478464, 'steps': 33741, 'loss/train': 1.6848793029785156} -08/30/2021 19:19:47 - INFO - __main__ - Step 33743: {'lr': 0.0004453661385153604, 'samples': 6478656, 'steps': 33742, 'loss/train': 1.5976946353912354} -08/30/2021 19:19:47 - INFO - __main__ - Step 33744: {'lr': 0.0004453628273301318, 'samples': 6478848, 'steps': 33743, 'loss/train': 1.7621325254440308} -08/30/2021 19:19:49 - INFO - __main__ - Step 33745: {'lr': 0.0004453595160568757, 'samples': 6479040, 'steps': 33744, 'loss/train': 1.7771892547607422} -08/30/2021 19:19:49 - INFO - __main__ - Step 33746: {'lr': 0.0004453562046955937, 'samples': 6479232, 'steps': 33745, 'loss/train': 1.5560173988342285} -08/30/2021 19:19:50 - INFO - __main__ - Step 33747: {'lr': 0.00044535289324628704, 'samples': 6479424, 'steps': 33746, 'loss/train': 1.5462055206298828} -08/30/2021 19:19:50 - INFO - __main__ - Step 33748: {'lr': 0.00044534958170895753, 'samples': 6479616, 'steps': 33747, 'loss/train': 1.2782315015792847} -08/30/2021 19:19:50 - INFO - __main__ - Step 33749: {'lr': 0.0004453462700836064, 'samples': 6479808, 'steps': 33748, 'loss/train': 1.7661064863204956} -08/30/2021 19:19:51 - INFO - __main__ - Step 33750: {'lr': 0.0004453429583702353, 'samples': 6480000, 'steps': 33749, 'loss/train': 1.7305666208267212} -08/30/2021 19:19:52 - INFO - __main__ - Step 33751: {'lr': 0.0004453396465688457, 'samples': 6480192, 'steps': 33750, 'loss/train': 1.7367297410964966} -08/30/2021 19:19:53 - INFO - __main__ - Step 33752: {'lr': 0.00044533633467943906, 'samples': 6480384, 'steps': 33751, 'loss/train': 1.937293291091919} -08/30/2021 19:19:53 - INFO - __main__ - Step 33753: {'lr': 0.00044533302270201693, 'samples': 6480576, 'steps': 33752, 'loss/train': 1.6584053039550781} -08/30/2021 19:19:53 - INFO - __main__ - Step 33754: {'lr': 0.00044532971063658067, 'samples': 6480768, 'steps': 33753, 'loss/train': 1.6454256772994995} -08/30/2021 19:19:54 - INFO - __main__ - Step 33755: {'lr': 0.00044532639848313187, 'samples': 6480960, 'steps': 33754, 'loss/train': 2.291076898574829} -08/30/2021 19:19:55 - INFO - __main__ - Step 33756: {'lr': 0.0004453230862416721, 'samples': 6481152, 'steps': 33755, 'loss/train': 1.3033268451690674} -08/30/2021 19:19:56 - INFO - __main__ - Step 33757: {'lr': 0.00044531977391220267, 'samples': 6481344, 'steps': 33756, 'loss/train': 1.6153513193130493} -08/30/2021 19:19:56 - INFO - __main__ - Step 33758: {'lr': 0.00044531646149472516, 'samples': 6481536, 'steps': 33757, 'loss/train': 1.5686980485916138} -08/30/2021 19:19:56 - INFO - __main__ - Step 33759: {'lr': 0.00044531314898924116, 'samples': 6481728, 'steps': 33758, 'loss/train': 1.573486089706421} -08/30/2021 19:19:57 - INFO - __main__ - Step 33760: {'lr': 0.00044530983639575193, 'samples': 6481920, 'steps': 33759, 'loss/train': 1.5041369199752808} -08/30/2021 19:19:57 - INFO - __main__ - Step 33761: {'lr': 0.00044530652371425916, 'samples': 6482112, 'steps': 33760, 'loss/train': 1.0164790153503418} -08/30/2021 19:19:58 - INFO - __main__ - Step 33762: {'lr': 0.00044530321094476434, 'samples': 6482304, 'steps': 33761, 'loss/train': 1.2703678607940674} -08/30/2021 19:19:59 - INFO - __main__ - Step 33763: {'lr': 0.0004452998980872689, 'samples': 6482496, 'steps': 33762, 'loss/train': 1.3127743005752563} -08/30/2021 19:19:59 - INFO - __main__ - Step 33764: {'lr': 0.0004452965851417743, 'samples': 6482688, 'steps': 33763, 'loss/train': 1.2908152341842651} -08/30/2021 19:20:00 - INFO - __main__ - Step 33765: {'lr': 0.000445293272108282, 'samples': 6482880, 'steps': 33764, 'loss/train': 1.3670977354049683} -08/30/2021 19:20:00 - INFO - __main__ - Step 33766: {'lr': 0.0004452899589867937, 'samples': 6483072, 'steps': 33765, 'loss/train': 0.9376664757728577} -08/30/2021 19:20:01 - INFO - __main__ - Step 33767: {'lr': 0.00044528664577731073, 'samples': 6483264, 'steps': 33766, 'loss/train': 1.3679068088531494} -08/30/2021 19:20:02 - INFO - __main__ - Step 33768: {'lr': 0.00044528333247983456, 'samples': 6483456, 'steps': 33767, 'loss/train': 1.1519654989242554} -08/30/2021 19:20:02 - INFO - __main__ - Step 33769: {'lr': 0.0004452800190943667, 'samples': 6483648, 'steps': 33768, 'loss/train': 1.5699752569198608} -08/30/2021 19:20:03 - INFO - __main__ - Step 33770: {'lr': 0.0004452767056209087, 'samples': 6483840, 'steps': 33769, 'loss/train': 1.7179687023162842} -08/30/2021 19:20:03 - INFO - __main__ - Step 33771: {'lr': 0.0004452733920594621, 'samples': 6484032, 'steps': 33770, 'loss/train': 1.6127049922943115} -08/30/2021 19:20:04 - INFO - __main__ - Step 33772: {'lr': 0.0004452700784100283, 'samples': 6484224, 'steps': 33771, 'loss/train': 1.8528072834014893} -08/30/2021 19:20:05 - INFO - __main__ - Step 33773: {'lr': 0.0004452667646726088, 'samples': 6484416, 'steps': 33772, 'loss/train': 1.8164608478546143} -08/30/2021 19:20:05 - INFO - __main__ - Step 33774: {'lr': 0.0004452634508472051, 'samples': 6484608, 'steps': 33773, 'loss/train': 1.3129944801330566} -08/30/2021 19:20:05 - INFO - __main__ - Step 33775: {'lr': 0.0004452601369338187, 'samples': 6484800, 'steps': 33774, 'loss/train': 1.7763618230819702} -08/30/2021 19:20:06 - INFO - __main__ - Step 33776: {'lr': 0.00044525682293245107, 'samples': 6484992, 'steps': 33775, 'loss/train': 1.6041359901428223} -08/30/2021 19:20:08 - INFO - __main__ - Step 33777: {'lr': 0.0004452535088431038, 'samples': 6485184, 'steps': 33776, 'loss/train': 1.4973009824752808} -08/30/2021 19:20:08 - INFO - __main__ - Step 33778: {'lr': 0.00044525019466577824, 'samples': 6485376, 'steps': 33777, 'loss/train': 1.0766139030456543} -08/30/2021 19:20:08 - INFO - __main__ - Step 33779: {'lr': 0.000445246880400476, 'samples': 6485568, 'steps': 33778, 'loss/train': 0.960921585559845} -08/30/2021 19:20:09 - INFO - __main__ - Step 33780: {'lr': 0.0004452435660471985, 'samples': 6485760, 'steps': 33779, 'loss/train': 1.4789167642593384} -08/30/2021 19:20:09 - INFO - __main__ - Step 33781: {'lr': 0.00044524025160594735, 'samples': 6485952, 'steps': 33780, 'loss/train': 1.0589964389801025} -08/30/2021 19:20:09 - INFO - __main__ - Step 33782: {'lr': 0.00044523693707672384, 'samples': 6486144, 'steps': 33781, 'loss/train': 0.41785523295402527} -08/30/2021 19:20:11 - INFO - __main__ - Step 33783: {'lr': 0.0004452336224595296, 'samples': 6486336, 'steps': 33782, 'loss/train': 0.31878143548965454} -08/30/2021 19:20:11 - INFO - __main__ - Step 33784: {'lr': 0.00044523030775436617, 'samples': 6486528, 'steps': 33783, 'loss/train': 1.0572500228881836} -08/30/2021 19:20:12 - INFO - __main__ - Step 33785: {'lr': 0.00044522699296123495, 'samples': 6486720, 'steps': 33784, 'loss/train': 1.9437154531478882} -08/30/2021 19:20:12 - INFO - __main__ - Step 33786: {'lr': 0.0004452236780801374, 'samples': 6486912, 'steps': 33785, 'loss/train': 0.8700249195098877} -08/30/2021 19:20:12 - INFO - __main__ - Step 33787: {'lr': 0.00044522036311107514, 'samples': 6487104, 'steps': 33786, 'loss/train': 1.5943043231964111} -08/30/2021 19:20:14 - INFO - __main__ - Step 33788: {'lr': 0.0004452170480540496, 'samples': 6487296, 'steps': 33787, 'loss/train': 1.2318328619003296} -08/30/2021 19:20:14 - INFO - __main__ - Step 33789: {'lr': 0.0004452137329090622, 'samples': 6487488, 'steps': 33788, 'loss/train': 1.3939425945281982} -08/30/2021 19:20:15 - INFO - __main__ - Step 33790: {'lr': 0.0004452104176761146, 'samples': 6487680, 'steps': 33789, 'loss/train': 0.7296445965766907} -08/30/2021 19:20:15 - INFO - __main__ - Step 33791: {'lr': 0.0004452071023552081, 'samples': 6487872, 'steps': 33790, 'loss/train': 1.9287878274917603} -08/30/2021 19:20:15 - INFO - __main__ - Step 33792: {'lr': 0.0004452037869463443, 'samples': 6488064, 'steps': 33791, 'loss/train': 1.9356757402420044} -08/30/2021 19:20:17 - INFO - __main__ - Step 33793: {'lr': 0.0004452004714495248, 'samples': 6488256, 'steps': 33792, 'loss/train': 1.3879512548446655} -08/30/2021 19:20:18 - INFO - __main__ - Step 33794: {'lr': 0.00044519715586475083, 'samples': 6488448, 'steps': 33793, 'loss/train': 1.3470523357391357} -08/30/2021 19:20:18 - INFO - __main__ - Step 33795: {'lr': 0.0004451938401920241, 'samples': 6488640, 'steps': 33794, 'loss/train': 1.2987070083618164} -08/30/2021 19:20:19 - INFO - __main__ - Step 33796: {'lr': 0.0004451905244313461, 'samples': 6488832, 'steps': 33795, 'loss/train': 1.2954049110412598} -08/30/2021 19:20:19 - INFO - __main__ - Step 33797: {'lr': 0.0004451872085827182, 'samples': 6489024, 'steps': 33796, 'loss/train': 1.325581669807434} -08/30/2021 19:20:21 - INFO - __main__ - Step 33798: {'lr': 0.000445183892646142, 'samples': 6489216, 'steps': 33797, 'loss/train': 1.8152703046798706} -08/30/2021 19:20:21 - INFO - __main__ - Step 33799: {'lr': 0.0004451805766216189, 'samples': 6489408, 'steps': 33798, 'loss/train': 1.5288186073303223} -08/30/2021 19:20:21 - INFO - __main__ - Step 33800: {'lr': 0.00044517726050915044, 'samples': 6489600, 'steps': 33799, 'loss/train': 0.8148971199989319} -08/30/2021 19:20:22 - INFO - __main__ - Step 33801: {'lr': 0.0004451739443087381, 'samples': 6489792, 'steps': 33800, 'loss/train': 1.640548825263977} -08/30/2021 19:20:22 - INFO - __main__ - Step 33802: {'lr': 0.0004451706280203834, 'samples': 6489984, 'steps': 33801, 'loss/train': 0.9394887685775757} -08/30/2021 19:20:22 - INFO - __main__ - Step 33803: {'lr': 0.0004451673116440879, 'samples': 6490176, 'steps': 33802, 'loss/train': 1.5112522840499878} -08/30/2021 19:20:24 - INFO - __main__ - Step 33804: {'lr': 0.00044516399517985296, 'samples': 6490368, 'steps': 33803, 'loss/train': 0.540610134601593} -08/30/2021 19:20:25 - INFO - __main__ - Step 33805: {'lr': 0.00044516067862768015, 'samples': 6490560, 'steps': 33804, 'loss/train': 1.5167460441589355} -08/30/2021 19:20:25 - INFO - __main__ - Step 33806: {'lr': 0.00044515736198757095, 'samples': 6490752, 'steps': 33805, 'loss/train': 1.2457060813903809} -08/30/2021 19:20:25 - INFO - __main__ - Step 33807: {'lr': 0.0004451540452595268, 'samples': 6490944, 'steps': 33806, 'loss/train': 1.23661470413208} -08/30/2021 19:20:26 - INFO - __main__ - Step 33808: {'lr': 0.0004451507284435494, 'samples': 6491136, 'steps': 33807, 'loss/train': 2.0407135486602783} -08/30/2021 19:20:27 - INFO - __main__ - Step 33809: {'lr': 0.00044514741153964, 'samples': 6491328, 'steps': 33808, 'loss/train': 1.6382018327713013} -08/30/2021 19:20:28 - INFO - __main__ - Step 33810: {'lr': 0.00044514409454780016, 'samples': 6491520, 'steps': 33809, 'loss/train': 1.1615650653839111} -08/30/2021 19:20:28 - INFO - __main__ - Step 33811: {'lr': 0.0004451407774680314, 'samples': 6491712, 'steps': 33810, 'loss/train': 1.409875750541687} -08/30/2021 19:20:28 - INFO - __main__ - Step 33812: {'lr': 0.0004451374603003353, 'samples': 6491904, 'steps': 33811, 'loss/train': 1.489293098449707} -08/30/2021 19:20:29 - INFO - __main__ - Step 33813: {'lr': 0.0004451341430447132, 'samples': 6492096, 'steps': 33812, 'loss/train': 1.573107123374939} -08/30/2021 19:20:30 - INFO - __main__ - Step 33814: {'lr': 0.0004451308257011667, 'samples': 6492288, 'steps': 33813, 'loss/train': 2.4382524490356445} -08/30/2021 19:20:31 - INFO - __main__ - Step 33815: {'lr': 0.00044512750826969724, 'samples': 6492480, 'steps': 33814, 'loss/train': 1.6215991973876953} -08/30/2021 19:20:31 - INFO - __main__ - Step 33816: {'lr': 0.0004451241907503063, 'samples': 6492672, 'steps': 33815, 'loss/train': 0.7824227213859558} -08/30/2021 19:20:31 - INFO - __main__ - Step 33817: {'lr': 0.0004451208731429954, 'samples': 6492864, 'steps': 33816, 'loss/train': 2.214453935623169} -08/30/2021 19:20:32 - INFO - __main__ - Step 33818: {'lr': 0.00044511755544776615, 'samples': 6493056, 'steps': 33817, 'loss/train': 1.2359373569488525} -08/30/2021 19:20:33 - INFO - __main__ - Step 33819: {'lr': 0.0004451142376646199, 'samples': 6493248, 'steps': 33818, 'loss/train': 1.2238761186599731} -08/30/2021 19:20:34 - INFO - __main__ - Step 33820: {'lr': 0.0004451109197935582, 'samples': 6493440, 'steps': 33819, 'loss/train': 1.313556432723999} -08/30/2021 19:20:34 - INFO - __main__ - Step 33821: {'lr': 0.0004451076018345824, 'samples': 6493632, 'steps': 33820, 'loss/train': 1.0907546281814575} -08/30/2021 19:20:34 - INFO - __main__ - Step 33822: {'lr': 0.0004451042837876943, 'samples': 6493824, 'steps': 33821, 'loss/train': 0.6498135924339294} -08/30/2021 19:20:35 - INFO - __main__ - Step 33823: {'lr': 0.00044510096565289513, 'samples': 6494016, 'steps': 33822, 'loss/train': 1.1190437078475952} -08/30/2021 19:20:35 - INFO - __main__ - Step 33824: {'lr': 0.0004450976474301865, 'samples': 6494208, 'steps': 33823, 'loss/train': 1.8094733953475952} -08/30/2021 19:20:37 - INFO - __main__ - Step 33825: {'lr': 0.0004450943291195698, 'samples': 6494400, 'steps': 33824, 'loss/train': 1.167904019355774} -08/30/2021 19:20:37 - INFO - __main__ - Step 33826: {'lr': 0.0004450910107210467, 'samples': 6494592, 'steps': 33825, 'loss/train': 1.4186716079711914} -08/30/2021 19:20:37 - INFO - __main__ - Step 33827: {'lr': 0.00044508769223461863, 'samples': 6494784, 'steps': 33826, 'loss/train': 1.2514773607254028} -08/30/2021 19:20:38 - INFO - __main__ - Step 33828: {'lr': 0.00044508437366028695, 'samples': 6494976, 'steps': 33827, 'loss/train': 1.443077564239502} -08/30/2021 19:20:38 - INFO - __main__ - Step 33829: {'lr': 0.00044508105499805337, 'samples': 6495168, 'steps': 33828, 'loss/train': 1.3630058765411377} -08/30/2021 19:20:40 - INFO - __main__ - Step 33830: {'lr': 0.0004450777362479192, 'samples': 6495360, 'steps': 33829, 'loss/train': 1.7333565950393677} -08/30/2021 19:20:41 - INFO - __main__ - Step 33831: {'lr': 0.000445074417409886, 'samples': 6495552, 'steps': 33830, 'loss/train': 0.054648514837026596} -08/30/2021 19:20:41 - INFO - __main__ - Step 33832: {'lr': 0.0004450710984839553, 'samples': 6495744, 'steps': 33831, 'loss/train': 0.23711515963077545} -08/30/2021 19:20:41 - INFO - __main__ - Step 33833: {'lr': 0.00044506777947012863, 'samples': 6495936, 'steps': 33832, 'loss/train': 1.3185186386108398} -08/30/2021 19:20:42 - INFO - __main__ - Step 33834: {'lr': 0.0004450644603684074, 'samples': 6496128, 'steps': 33833, 'loss/train': 1.3689053058624268} -08/30/2021 19:20:42 - INFO - __main__ - Step 33835: {'lr': 0.0004450611411787931, 'samples': 6496320, 'steps': 33834, 'loss/train': 0.941810131072998} -08/30/2021 19:20:43 - INFO - __main__ - Step 33836: {'lr': 0.0004450578219012873, 'samples': 6496512, 'steps': 33835, 'loss/train': 1.574400782585144} -08/30/2021 19:20:44 - INFO - __main__ - Step 33837: {'lr': 0.00044505450253589144, 'samples': 6496704, 'steps': 33836, 'loss/train': 1.5366309881210327} -08/30/2021 19:20:44 - INFO - __main__ - Step 33838: {'lr': 0.00044505118308260693, 'samples': 6496896, 'steps': 33837, 'loss/train': 1.4238420724868774} -08/30/2021 19:20:44 - INFO - __main__ - Step 33839: {'lr': 0.0004450478635414355, 'samples': 6497088, 'steps': 33838, 'loss/train': 1.624822974205017} -08/30/2021 19:20:45 - INFO - __main__ - Step 33840: {'lr': 0.0004450445439123785, 'samples': 6497280, 'steps': 33839, 'loss/train': 1.6758664846420288} -08/30/2021 19:20:47 - INFO - __main__ - Step 33841: {'lr': 0.0004450412241954374, 'samples': 6497472, 'steps': 33840, 'loss/train': 1.5433599948883057} -08/30/2021 19:20:47 - INFO - __main__ - Step 33842: {'lr': 0.00044503790439061374, 'samples': 6497664, 'steps': 33841, 'loss/train': 1.4497911930084229} -08/30/2021 19:20:48 - INFO - __main__ - Step 33843: {'lr': 0.000445034584497909, 'samples': 6497856, 'steps': 33842, 'loss/train': 1.3877265453338623} -08/30/2021 19:20:48 - INFO - __main__ - Step 33844: {'lr': 0.00044503126451732474, 'samples': 6498048, 'steps': 33843, 'loss/train': 1.2756401300430298} -08/30/2021 19:20:48 - INFO - __main__ - Step 33845: {'lr': 0.00044502794444886234, 'samples': 6498240, 'steps': 33844, 'loss/train': 1.6663813591003418} -08/30/2021 19:20:50 - INFO - __main__ - Step 33846: {'lr': 0.00044502462429252336, 'samples': 6498432, 'steps': 33845, 'loss/train': 1.2357209920883179} -08/30/2021 19:20:50 - INFO - __main__ - Step 33847: {'lr': 0.0004450213040483093, 'samples': 6498624, 'steps': 33846, 'loss/train': 1.3075966835021973} -08/30/2021 19:20:51 - INFO - __main__ - Step 33848: {'lr': 0.00044501798371622173, 'samples': 6498816, 'steps': 33847, 'loss/train': 1.6986846923828125} -08/30/2021 19:20:51 - INFO - __main__ - Step 33849: {'lr': 0.00044501466329626197, 'samples': 6499008, 'steps': 33848, 'loss/train': 0.8778390288352966} -08/30/2021 19:20:52 - INFO - __main__ - Step 33850: {'lr': 0.0004450113427884317, 'samples': 6499200, 'steps': 33849, 'loss/train': 1.942723274230957} -08/30/2021 19:20:53 - INFO - __main__ - Step 33851: {'lr': 0.00044500802219273224, 'samples': 6499392, 'steps': 33850, 'loss/train': 1.6642335653305054} -08/30/2021 19:20:53 - INFO - __main__ - Step 33852: {'lr': 0.00044500470150916514, 'samples': 6499584, 'steps': 33851, 'loss/train': 1.373314380645752} -08/30/2021 19:20:54 - INFO - __main__ - Step 33853: {'lr': 0.000445001380737732, 'samples': 6499776, 'steps': 33852, 'loss/train': 1.4638320207595825} -08/30/2021 19:20:54 - INFO - __main__ - Step 33854: {'lr': 0.0004449980598784343, 'samples': 6499968, 'steps': 33853, 'loss/train': 1.5324115753173828} -08/30/2021 19:20:54 - INFO - __main__ - Step 33855: {'lr': 0.0004449947389312734, 'samples': 6500160, 'steps': 33854, 'loss/train': 1.6708019971847534} -08/30/2021 19:20:56 - INFO - __main__ - Step 33856: {'lr': 0.00044499141789625086, 'samples': 6500352, 'steps': 33855, 'loss/train': 1.95577073097229} -08/30/2021 19:20:56 - INFO - __main__ - Step 33857: {'lr': 0.0004449880967733683, 'samples': 6500544, 'steps': 33856, 'loss/train': 1.1643824577331543} -08/30/2021 19:20:57 - INFO - __main__ - Step 33858: {'lr': 0.0004449847755626271, 'samples': 6500736, 'steps': 33857, 'loss/train': 1.5369292497634888} -08/30/2021 19:20:57 - INFO - __main__ - Step 33859: {'lr': 0.0004449814542640287, 'samples': 6500928, 'steps': 33858, 'loss/train': 1.41264009475708} -08/30/2021 19:20:57 - INFO - __main__ - Step 33860: {'lr': 0.0004449781328775746, 'samples': 6501120, 'steps': 33859, 'loss/train': 1.3092153072357178} -08/30/2021 19:20:58 - INFO - __main__ - Step 33861: {'lr': 0.0004449748114032665, 'samples': 6501312, 'steps': 33860, 'loss/train': 0.6003842949867249} -08/30/2021 19:20:59 - INFO - __main__ - Step 33862: {'lr': 0.00044497148984110567, 'samples': 6501504, 'steps': 33861, 'loss/train': 1.4862371683120728} -08/30/2021 19:21:00 - INFO - __main__ - Step 33863: {'lr': 0.00044496816819109377, 'samples': 6501696, 'steps': 33862, 'loss/train': 1.1522754430770874} -08/30/2021 19:21:00 - INFO - __main__ - Step 33864: {'lr': 0.0004449648464532322, 'samples': 6501888, 'steps': 33863, 'loss/train': 1.1018861532211304} -08/30/2021 19:21:00 - INFO - __main__ - Step 33865: {'lr': 0.0004449615246275225, 'samples': 6502080, 'steps': 33864, 'loss/train': 1.5629613399505615} -08/30/2021 19:21:01 - INFO - __main__ - Step 33866: {'lr': 0.000444958202713966, 'samples': 6502272, 'steps': 33865, 'loss/train': 1.4350067377090454} -08/30/2021 19:21:02 - INFO - __main__ - Step 33867: {'lr': 0.0004449548807125645, 'samples': 6502464, 'steps': 33866, 'loss/train': 0.46062156558036804} -08/30/2021 19:21:03 - INFO - __main__ - Step 33868: {'lr': 0.0004449515586233193, 'samples': 6502656, 'steps': 33867, 'loss/train': 1.584196925163269} -08/30/2021 19:21:03 - INFO - __main__ - Step 33869: {'lr': 0.0004449482364462319, 'samples': 6502848, 'steps': 33868, 'loss/train': 1.4910050630569458} -08/30/2021 19:21:04 - INFO - __main__ - Step 33870: {'lr': 0.0004449449141813039, 'samples': 6503040, 'steps': 33869, 'loss/train': 1.3369876146316528} -08/30/2021 19:21:04 - INFO - __main__ - Step 33871: {'lr': 0.00044494159182853667, 'samples': 6503232, 'steps': 33870, 'loss/train': 1.728448748588562} -08/30/2021 19:21:06 - INFO - __main__ - Step 33872: {'lr': 0.0004449382693879318, 'samples': 6503424, 'steps': 33871, 'loss/train': 1.382724404335022} -08/30/2021 19:21:06 - INFO - __main__ - Step 33873: {'lr': 0.0004449349468594908, 'samples': 6503616, 'steps': 33872, 'loss/train': 0.988279402256012} -08/30/2021 19:21:06 - INFO - __main__ - Step 33874: {'lr': 0.000444931624243215, 'samples': 6503808, 'steps': 33873, 'loss/train': 1.8086014986038208} -08/30/2021 19:21:07 - INFO - __main__ - Step 33875: {'lr': 0.0004449283015391061, 'samples': 6504000, 'steps': 33874, 'loss/train': 1.2181453704833984} -08/30/2021 19:21:07 - INFO - __main__ - Step 33876: {'lr': 0.0004449249787471655, 'samples': 6504192, 'steps': 33875, 'loss/train': 1.516812801361084} -08/30/2021 19:21:09 - INFO - __main__ - Step 33877: {'lr': 0.0004449216558673947, 'samples': 6504384, 'steps': 33876, 'loss/train': 1.0998013019561768} -08/30/2021 19:21:09 - INFO - __main__ - Step 33878: {'lr': 0.0004449183328997952, 'samples': 6504576, 'steps': 33877, 'loss/train': 0.8791530728340149} -08/30/2021 19:21:09 - INFO - __main__ - Step 33879: {'lr': 0.0004449150098443685, 'samples': 6504768, 'steps': 33878, 'loss/train': 2.1546788215637207} -08/30/2021 19:21:10 - INFO - __main__ - Step 33880: {'lr': 0.00044491168670111615, 'samples': 6504960, 'steps': 33879, 'loss/train': 0.9371464252471924} -08/30/2021 19:21:10 - INFO - __main__ - Step 33881: {'lr': 0.0004449083634700396, 'samples': 6505152, 'steps': 33880, 'loss/train': 1.1692291498184204} -08/30/2021 19:21:10 - INFO - __main__ - Step 33882: {'lr': 0.00044490504015114033, 'samples': 6505344, 'steps': 33881, 'loss/train': 1.299615502357483} -08/30/2021 19:21:12 - INFO - __main__ - Step 33883: {'lr': 0.0004449017167444198, 'samples': 6505536, 'steps': 33882, 'loss/train': 0.9115594625473022} -08/30/2021 19:21:12 - INFO - __main__ - Step 33884: {'lr': 0.0004448983932498797, 'samples': 6505728, 'steps': 33883, 'loss/train': 1.4423195123672485} -08/30/2021 19:21:13 - INFO - __main__ - Step 33885: {'lr': 0.00044489506966752127, 'samples': 6505920, 'steps': 33884, 'loss/train': 1.28299880027771} -08/30/2021 19:21:13 - INFO - __main__ - Step 33886: {'lr': 0.00044489174599734614, 'samples': 6506112, 'steps': 33885, 'loss/train': 1.0047564506530762} -08/30/2021 19:21:13 - INFO - __main__ - Step 33887: {'lr': 0.0004448884222393559, 'samples': 6506304, 'steps': 33886, 'loss/train': 1.4295834302902222} -08/30/2021 19:21:15 - INFO - __main__ - Step 33888: {'lr': 0.00044488509839355183, 'samples': 6506496, 'steps': 33887, 'loss/train': 1.3253395557403564} -08/30/2021 19:21:15 - INFO - __main__ - Step 33889: {'lr': 0.00044488177445993563, 'samples': 6506688, 'steps': 33888, 'loss/train': 0.05622369050979614} -08/30/2021 19:21:16 - INFO - __main__ - Step 33890: {'lr': 0.0004448784504385086, 'samples': 6506880, 'steps': 33889, 'loss/train': 1.813767433166504} -08/30/2021 19:21:16 - INFO - __main__ - Step 33891: {'lr': 0.0004448751263292724, 'samples': 6507072, 'steps': 33890, 'loss/train': 1.5589590072631836} -08/30/2021 19:21:17 - INFO - __main__ - Step 33892: {'lr': 0.0004448718021322285, 'samples': 6507264, 'steps': 33891, 'loss/train': 1.0483603477478027} -08/30/2021 19:21:19 - INFO - __main__ - Step 33893: {'lr': 0.0004448684778473784, 'samples': 6507456, 'steps': 33892, 'loss/train': 1.525713324546814} -08/30/2021 19:21:19 - INFO - __main__ - Step 33894: {'lr': 0.0004448651534747235, 'samples': 6507648, 'steps': 33893, 'loss/train': 0.850823700428009} -08/30/2021 19:21:20 - INFO - __main__ - Step 33895: {'lr': 0.0004448618290142654, 'samples': 6507840, 'steps': 33894, 'loss/train': 0.07434050738811493} -08/30/2021 19:21:20 - INFO - __main__ - Step 33896: {'lr': 0.0004448585044660055, 'samples': 6508032, 'steps': 33895, 'loss/train': 1.6688246726989746} -08/30/2021 19:21:20 - INFO - __main__ - Step 33897: {'lr': 0.0004448551798299455, 'samples': 6508224, 'steps': 33896, 'loss/train': 1.5972011089324951} -08/30/2021 19:21:22 - INFO - __main__ - Step 33898: {'lr': 0.00044485185510608665, 'samples': 6508416, 'steps': 33897, 'loss/train': 2.083176851272583} -08/30/2021 19:21:22 - INFO - __main__ - Step 33899: {'lr': 0.0004448485302944306, 'samples': 6508608, 'steps': 33898, 'loss/train': 1.6384687423706055} -08/30/2021 19:21:22 - INFO - __main__ - Step 33900: {'lr': 0.0004448452053949789, 'samples': 6508800, 'steps': 33899, 'loss/train': 1.5330208539962769} -08/30/2021 19:21:23 - INFO - __main__ - Step 33901: {'lr': 0.0004448418804077328, 'samples': 6508992, 'steps': 33900, 'loss/train': 1.2696808576583862} -08/30/2021 19:21:23 - INFO - __main__ - Step 33902: {'lr': 0.000444838555332694, 'samples': 6509184, 'steps': 33901, 'loss/train': 0.5143625140190125} -08/30/2021 19:21:25 - INFO - __main__ - Step 33903: {'lr': 0.000444835230169864, 'samples': 6509376, 'steps': 33902, 'loss/train': 1.4817063808441162} -08/30/2021 19:21:26 - INFO - __main__ - Step 33904: {'lr': 0.00044483190491924427, 'samples': 6509568, 'steps': 33903, 'loss/train': 1.420440673828125} -08/30/2021 19:21:26 - INFO - __main__ - Step 33905: {'lr': 0.0004448285795808362, 'samples': 6509760, 'steps': 33904, 'loss/train': 0.03294937685132027} -08/30/2021 19:21:26 - INFO - __main__ - Step 33906: {'lr': 0.00044482525415464144, 'samples': 6509952, 'steps': 33905, 'loss/train': 1.353139877319336} -08/30/2021 19:21:27 - INFO - __main__ - Step 33907: {'lr': 0.0004448219286406614, 'samples': 6510144, 'steps': 33906, 'loss/train': 1.360242247581482} -08/30/2021 19:21:27 - INFO - __main__ - Step 33908: {'lr': 0.00044481860303889766, 'samples': 6510336, 'steps': 33907, 'loss/train': 1.3502663373947144} -08/30/2021 19:21:27 - INFO - __main__ - Step 33909: {'lr': 0.0004448152773493516, 'samples': 6510528, 'steps': 33908, 'loss/train': 1.4947407245635986} -08/30/2021 19:21:29 - INFO - __main__ - Step 33910: {'lr': 0.0004448119515720248, 'samples': 6510720, 'steps': 33909, 'loss/train': 0.18104121088981628} -08/30/2021 19:21:29 - INFO - __main__ - Step 33911: {'lr': 0.0004448086257069187, 'samples': 6510912, 'steps': 33910, 'loss/train': 1.7081741094589233} -08/30/2021 19:21:30 - INFO - __main__ - Step 33912: {'lr': 0.00044480529975403496, 'samples': 6511104, 'steps': 33911, 'loss/train': 0.7345178127288818} -08/30/2021 19:21:30 - INFO - __main__ - Step 33913: {'lr': 0.00044480197371337484, 'samples': 6511296, 'steps': 33912, 'loss/train': 1.319288730621338} -08/30/2021 19:21:30 - INFO - __main__ - Step 33914: {'lr': 0.00044479864758494004, 'samples': 6511488, 'steps': 33913, 'loss/train': 1.6771048307418823} -08/30/2021 19:21:32 - INFO - __main__ - Step 33915: {'lr': 0.0004447953213687319, 'samples': 6511680, 'steps': 33914, 'loss/train': 1.0491857528686523} -08/30/2021 19:21:33 - INFO - __main__ - Step 33916: {'lr': 0.00044479199506475205, 'samples': 6511872, 'steps': 33915, 'loss/train': 1.7016457319259644} -08/30/2021 19:21:33 - INFO - __main__ - Step 33917: {'lr': 0.0004447886686730019, 'samples': 6512064, 'steps': 33916, 'loss/train': 1.3642207384109497} -08/30/2021 19:21:34 - INFO - __main__ - Step 33918: {'lr': 0.00044478534219348297, 'samples': 6512256, 'steps': 33917, 'loss/train': 1.7083402872085571} -08/30/2021 19:21:34 - INFO - __main__ - Step 33919: {'lr': 0.0004447820156261968, 'samples': 6512448, 'steps': 33918, 'loss/train': 0.025473570451140404} -08/30/2021 19:21:34 - INFO - __main__ - Step 33920: {'lr': 0.0004447786889711449, 'samples': 6512640, 'steps': 33919, 'loss/train': 1.494349718093872} -08/30/2021 19:21:36 - INFO - __main__ - Step 33921: {'lr': 0.00044477536222832867, 'samples': 6512832, 'steps': 33920, 'loss/train': 0.8877117037773132} -08/30/2021 19:21:36 - INFO - __main__ - Step 33922: {'lr': 0.0004447720353977497, 'samples': 6513024, 'steps': 33921, 'loss/train': 1.5002405643463135} -08/30/2021 19:21:36 - INFO - __main__ - Step 33923: {'lr': 0.0004447687084794094, 'samples': 6513216, 'steps': 33922, 'loss/train': 1.2252342700958252} -08/30/2021 19:21:37 - INFO - __main__ - Step 33924: {'lr': 0.00044476538147330934, 'samples': 6513408, 'steps': 33923, 'loss/train': 1.5719655752182007} -08/30/2021 19:21:37 - INFO - __main__ - Step 33925: {'lr': 0.00044476205437945105, 'samples': 6513600, 'steps': 33924, 'loss/train': 1.2667392492294312} -08/30/2021 19:21:38 - INFO - __main__ - Step 33926: {'lr': 0.0004447587271978359, 'samples': 6513792, 'steps': 33925, 'loss/train': 1.179510474205017} -08/30/2021 19:21:39 - INFO - __main__ - Step 33927: {'lr': 0.0004447553999284656, 'samples': 6513984, 'steps': 33926, 'loss/train': 1.2825231552124023} -08/30/2021 19:21:39 - INFO - __main__ - Step 33928: {'lr': 0.00044475207257134143, 'samples': 6514176, 'steps': 33927, 'loss/train': 0.1595047265291214} -08/30/2021 19:21:40 - INFO - __main__ - Step 33929: {'lr': 0.000444748745126465, 'samples': 6514368, 'steps': 33928, 'loss/train': 1.1425038576126099} -08/30/2021 19:21:40 - INFO - __main__ - Step 33930: {'lr': 0.0004447454175938378, 'samples': 6514560, 'steps': 33929, 'loss/train': 1.4913631677627563} -08/30/2021 19:21:40 - INFO - __main__ - Step 33931: {'lr': 0.00044474208997346133, 'samples': 6514752, 'steps': 33930, 'loss/train': 1.6583921909332275} -08/30/2021 19:21:42 - INFO - __main__ - Step 33932: {'lr': 0.00044473876226533703, 'samples': 6514944, 'steps': 33931, 'loss/train': 1.4317001104354858} -08/30/2021 19:21:43 - INFO - __main__ - Step 33933: {'lr': 0.0004447354344694665, 'samples': 6515136, 'steps': 33932, 'loss/train': 1.5071940422058105} -08/30/2021 19:21:43 - INFO - __main__ - Step 33934: {'lr': 0.0004447321065858512, 'samples': 6515328, 'steps': 33933, 'loss/train': 1.394973874092102} -08/30/2021 19:21:43 - INFO - __main__ - Step 33935: {'lr': 0.00044472877861449257, 'samples': 6515520, 'steps': 33934, 'loss/train': 1.2846614122390747} -08/30/2021 19:21:44 - INFO - __main__ - Step 33936: {'lr': 0.00044472545055539213, 'samples': 6515712, 'steps': 33935, 'loss/train': 1.419373631477356} -08/30/2021 19:21:45 - INFO - __main__ - Step 33937: {'lr': 0.00044472212240855155, 'samples': 6515904, 'steps': 33936, 'loss/train': 0.9835194945335388} -08/30/2021 19:21:46 - INFO - __main__ - Step 33938: {'lr': 0.0004447187941739721, 'samples': 6516096, 'steps': 33937, 'loss/train': 1.4644720554351807} -08/30/2021 19:21:46 - INFO - __main__ - Step 33939: {'lr': 0.00044471546585165536, 'samples': 6516288, 'steps': 33938, 'loss/train': 0.8359298706054688} -08/30/2021 19:21:46 - INFO - __main__ - Step 33940: {'lr': 0.0004447121374416028, 'samples': 6516480, 'steps': 33939, 'loss/train': 1.2722243070602417} -08/30/2021 19:21:47 - INFO - __main__ - Step 33941: {'lr': 0.000444708808943816, 'samples': 6516672, 'steps': 33940, 'loss/train': 1.3056972026824951} -08/30/2021 19:21:48 - INFO - __main__ - Step 33942: {'lr': 0.00044470548035829637, 'samples': 6516864, 'steps': 33941, 'loss/train': 1.6970505714416504} -08/30/2021 19:21:49 - INFO - __main__ - Step 33943: {'lr': 0.00044470215168504554, 'samples': 6517056, 'steps': 33942, 'loss/train': 1.3225524425506592} -08/30/2021 19:21:49 - INFO - __main__ - Step 33944: {'lr': 0.0004446988229240648, 'samples': 6517248, 'steps': 33943, 'loss/train': 1.0484739542007446} -08/30/2021 19:21:49 - INFO - __main__ - Step 33945: {'lr': 0.00044469549407535593, 'samples': 6517440, 'steps': 33944, 'loss/train': 1.7722183465957642} -08/30/2021 19:21:50 - INFO - __main__ - Step 33946: {'lr': 0.0004446921651389202, 'samples': 6517632, 'steps': 33945, 'loss/train': 1.5921233892440796} -08/30/2021 19:21:52 - INFO - __main__ - Step 33947: {'lr': 0.00044468883611475913, 'samples': 6517824, 'steps': 33946, 'loss/train': 0.10728372633457184} -08/30/2021 19:21:53 - INFO - __main__ - Step 33948: {'lr': 0.00044468550700287436, 'samples': 6518016, 'steps': 33947, 'loss/train': 0.5068848133087158} -08/30/2021 19:21:53 - INFO - __main__ - Step 33949: {'lr': 0.00044468217780326724, 'samples': 6518208, 'steps': 33948, 'loss/train': 1.8218778371810913} -08/30/2021 19:21:53 - INFO - __main__ - Step 33950: {'lr': 0.0004446788485159393, 'samples': 6518400, 'steps': 33949, 'loss/train': 0.08906268328428268} -08/30/2021 19:21:54 - INFO - __main__ - Step 33951: {'lr': 0.00044467551914089223, 'samples': 6518592, 'steps': 33950, 'loss/train': 0.2462569922208786} -08/30/2021 19:21:54 - INFO - __main__ - Step 33952: {'lr': 0.0004446721896781273, 'samples': 6518784, 'steps': 33951, 'loss/train': 1.1991685628890991} -08/30/2021 19:21:56 - INFO - __main__ - Step 33953: {'lr': 0.00044466886012764603, 'samples': 6518976, 'steps': 33952, 'loss/train': 1.5038806200027466} -08/30/2021 19:21:56 - INFO - __main__ - Step 33954: {'lr': 0.00044466553048944996, 'samples': 6519168, 'steps': 33953, 'loss/train': 1.138209342956543} -08/30/2021 19:21:56 - INFO - __main__ - Step 33955: {'lr': 0.0004446622007635407, 'samples': 6519360, 'steps': 33954, 'loss/train': 1.7388213872909546} -08/30/2021 19:21:57 - INFO - __main__ - Step 33956: {'lr': 0.0004446588709499196, 'samples': 6519552, 'steps': 33955, 'loss/train': 1.270929217338562} -08/30/2021 19:21:57 - INFO - __main__ - Step 33957: {'lr': 0.00044465554104858817, 'samples': 6519744, 'steps': 33956, 'loss/train': 0.06287913024425507} -08/30/2021 19:21:59 - INFO - __main__ - Step 33958: {'lr': 0.0004446522110595481, 'samples': 6519936, 'steps': 33957, 'loss/train': 0.047152016311883926} -08/30/2021 19:21:59 - INFO - __main__ - Step 33959: {'lr': 0.00044464888098280067, 'samples': 6520128, 'steps': 33958, 'loss/train': 1.2860584259033203} -08/30/2021 19:22:00 - INFO - __main__ - Step 33960: {'lr': 0.00044464555081834745, 'samples': 6520320, 'steps': 33959, 'loss/train': 1.2669841051101685} -08/30/2021 19:22:00 - INFO - __main__ - Step 33961: {'lr': 0.00044464222056618996, 'samples': 6520512, 'steps': 33960, 'loss/train': 1.0910521745681763} -08/30/2021 19:22:00 - INFO - __main__ - Step 33962: {'lr': 0.00044463889022632963, 'samples': 6520704, 'steps': 33961, 'loss/train': 2.0555191040039062} -08/30/2021 19:22:01 - INFO - __main__ - Step 33963: {'lr': 0.0004446355597987681, 'samples': 6520896, 'steps': 33962, 'loss/train': 1.3677674531936646} -08/30/2021 19:22:02 - INFO - __main__ - Step 33964: {'lr': 0.00044463222928350677, 'samples': 6521088, 'steps': 33963, 'loss/train': 0.23425672948360443} -08/30/2021 19:22:03 - INFO - __main__ - Step 33965: {'lr': 0.0004446288986805471, 'samples': 6521280, 'steps': 33964, 'loss/train': 1.3336637020111084} -08/30/2021 19:22:03 - INFO - __main__ - Step 33966: {'lr': 0.0004446255679898907, 'samples': 6521472, 'steps': 33965, 'loss/train': 1.368518590927124} -08/30/2021 19:22:03 - INFO - __main__ - Step 33967: {'lr': 0.000444622237211539, 'samples': 6521664, 'steps': 33966, 'loss/train': 0.08844552934169769} -08/30/2021 19:22:04 - INFO - __main__ - Step 33968: {'lr': 0.00044461890634549364, 'samples': 6521856, 'steps': 33967, 'loss/train': 1.519295334815979} -08/30/2021 19:22:06 - INFO - __main__ - Step 33969: {'lr': 0.00044461557539175587, 'samples': 6522048, 'steps': 33968, 'loss/train': 1.3855935335159302} -08/30/2021 19:22:06 - INFO - __main__ - Step 33970: {'lr': 0.0004446122443503274, 'samples': 6522240, 'steps': 33969, 'loss/train': 1.117292881011963} -08/30/2021 19:22:06 - INFO - __main__ - Step 33971: {'lr': 0.00044460891322120963, 'samples': 6522432, 'steps': 33970, 'loss/train': 0.1941833198070526} -08/30/2021 19:22:07 - INFO - __main__ - Step 33972: {'lr': 0.000444605582004404, 'samples': 6522624, 'steps': 33971, 'loss/train': 1.6087018251419067} -08/30/2021 19:22:07 - INFO - __main__ - Step 33973: {'lr': 0.0004446022506999122, 'samples': 6522816, 'steps': 33972, 'loss/train': 2.2581584453582764} -08/30/2021 19:22:08 - INFO - __main__ - Step 33974: {'lr': 0.0004445989193077356, 'samples': 6523008, 'steps': 33973, 'loss/train': 1.6441208124160767} -08/30/2021 19:22:09 - INFO - __main__ - Step 33975: {'lr': 0.0004445955878278758, 'samples': 6523200, 'steps': 33974, 'loss/train': 1.8568898439407349} -08/30/2021 19:22:09 - INFO - __main__ - Step 33976: {'lr': 0.00044459225626033413, 'samples': 6523392, 'steps': 33975, 'loss/train': 1.6220955848693848} -08/30/2021 19:22:10 - INFO - __main__ - Step 33977: {'lr': 0.00044458892460511225, 'samples': 6523584, 'steps': 33976, 'loss/train': 1.4792912006378174} -08/30/2021 19:22:10 - INFO - __main__ - Step 33978: {'lr': 0.0004445855928622116, 'samples': 6523776, 'steps': 33977, 'loss/train': 2.175816774368286} -08/30/2021 19:22:12 - INFO - __main__ - Step 33979: {'lr': 0.00044458226103163365, 'samples': 6523968, 'steps': 33978, 'loss/train': 1.5777018070220947} -08/30/2021 19:22:12 - INFO - __main__ - Step 33980: {'lr': 0.0004445789291133799, 'samples': 6524160, 'steps': 33979, 'loss/train': 1.580352544784546} -08/30/2021 19:22:12 - INFO - __main__ - Step 33981: {'lr': 0.0004445755971074519, 'samples': 6524352, 'steps': 33980, 'loss/train': 2.261376142501831} -08/30/2021 19:22:13 - INFO - __main__ - Step 33982: {'lr': 0.0004445722650138512, 'samples': 6524544, 'steps': 33981, 'loss/train': 1.8368432521820068} -08/30/2021 19:22:13 - INFO - __main__ - Step 33983: {'lr': 0.00044456893283257925, 'samples': 6524736, 'steps': 33982, 'loss/train': 1.5508798360824585} -08/30/2021 19:22:14 - INFO - __main__ - Step 33984: {'lr': 0.00044456560056363746, 'samples': 6524928, 'steps': 33983, 'loss/train': 0.5090582966804504} -08/30/2021 19:22:15 - INFO - __main__ - Step 33985: {'lr': 0.0004445622682070275, 'samples': 6525120, 'steps': 33984, 'loss/train': 0.8270739912986755} -08/30/2021 19:22:15 - INFO - __main__ - Step 33986: {'lr': 0.00044455893576275077, 'samples': 6525312, 'steps': 33985, 'loss/train': 1.4644569158554077} -08/30/2021 19:22:16 - INFO - __main__ - Step 33987: {'lr': 0.00044455560323080874, 'samples': 6525504, 'steps': 33986, 'loss/train': 1.3766546249389648} -08/30/2021 19:22:16 - INFO - __main__ - Step 33988: {'lr': 0.00044455227061120296, 'samples': 6525696, 'steps': 33987, 'loss/train': 1.5774089097976685} -08/30/2021 19:22:16 - INFO - __main__ - Step 33989: {'lr': 0.000444548937903935, 'samples': 6525888, 'steps': 33988, 'loss/train': 1.5354235172271729} -08/30/2021 19:22:18 - INFO - __main__ - Step 33990: {'lr': 0.0004445456051090062, 'samples': 6526080, 'steps': 33989, 'loss/train': 1.2000242471694946} -08/30/2021 19:22:18 - INFO - __main__ - Step 33991: {'lr': 0.0004445422722264182, 'samples': 6526272, 'steps': 33990, 'loss/train': 0.47508615255355835} -08/30/2021 19:22:19 - INFO - __main__ - Step 33992: {'lr': 0.0004445389392561724, 'samples': 6526464, 'steps': 33991, 'loss/train': 1.2503502368927002} -08/30/2021 19:22:19 - INFO - __main__ - Step 33993: {'lr': 0.0004445356061982704, 'samples': 6526656, 'steps': 33992, 'loss/train': 1.4229282140731812} -08/30/2021 19:22:19 - INFO - __main__ - Step 33994: {'lr': 0.0004445322730527137, 'samples': 6526848, 'steps': 33993, 'loss/train': 1.8668755292892456} -08/30/2021 19:22:21 - INFO - __main__ - Step 33995: {'lr': 0.0004445289398195037, 'samples': 6527040, 'steps': 33994, 'loss/train': 0.2902545630931854} -08/30/2021 19:22:22 - INFO - __main__ - Step 33996: {'lr': 0.000444525606498642, 'samples': 6527232, 'steps': 33995, 'loss/train': 1.4460036754608154} -08/30/2021 19:22:22 - INFO - __main__ - Step 33997: {'lr': 0.00044452227309013003, 'samples': 6527424, 'steps': 33996, 'loss/train': 1.8232755661010742} -08/30/2021 19:22:23 - INFO - __main__ - Step 33998: {'lr': 0.0004445189395939694, 'samples': 6527616, 'steps': 33997, 'loss/train': 1.5057605504989624} -08/30/2021 19:22:23 - INFO - __main__ - Step 33999: {'lr': 0.0004445156060101614, 'samples': 6527808, 'steps': 33998, 'loss/train': 1.542720913887024} -08/30/2021 19:22:23 - INFO - __main__ - Step 34000: {'lr': 0.0004445122723387077, 'samples': 6528000, 'steps': 33999, 'loss/train': 1.302803635597229} -08/30/2021 19:22:25 - INFO - __main__ - Step 34001: {'lr': 0.0004445089385796099, 'samples': 6528192, 'steps': 34000, 'loss/train': 0.2338247150182724} -08/30/2021 19:22:26 - INFO - __main__ - Step 34002: {'lr': 0.0004445056047328693, 'samples': 6528384, 'steps': 34001, 'loss/train': 0.7542929649353027} -08/30/2021 19:22:26 - INFO - __main__ - Step 34003: {'lr': 0.0004445022707984874, 'samples': 6528576, 'steps': 34002, 'loss/train': 1.3637045621871948} -08/30/2021 19:22:27 - INFO - __main__ - Step 34004: {'lr': 0.0004444989367764659, 'samples': 6528768, 'steps': 34003, 'loss/train': 1.511135458946228} -08/30/2021 19:22:27 - INFO - __main__ - Step 34005: {'lr': 0.0004444956026668061, 'samples': 6528960, 'steps': 34004, 'loss/train': 1.450154423713684} -08/30/2021 19:22:29 - INFO - __main__ - Step 34006: {'lr': 0.00044449226846950964, 'samples': 6529152, 'steps': 34005, 'loss/train': 1.5379148721694946} -08/30/2021 19:22:29 - INFO - __main__ - Step 34007: {'lr': 0.00044448893418457794, 'samples': 6529344, 'steps': 34006, 'loss/train': 1.2722413539886475} -08/30/2021 19:22:29 - INFO - __main__ - Step 34008: {'lr': 0.00044448559981201256, 'samples': 6529536, 'steps': 34007, 'loss/train': 0.3601374626159668} -08/30/2021 19:22:30 - INFO - __main__ - Step 34009: {'lr': 0.00044448226535181485, 'samples': 6529728, 'steps': 34008, 'loss/train': 0.41265320777893066} -08/30/2021 19:22:30 - INFO - __main__ - Step 34010: {'lr': 0.0004444789308039865, 'samples': 6529920, 'steps': 34009, 'loss/train': 1.9307525157928467} -08/30/2021 19:22:30 - INFO - __main__ - Step 34011: {'lr': 0.00044447559616852893, 'samples': 6530112, 'steps': 34010, 'loss/train': 2.2137908935546875} -08/30/2021 19:22:32 - INFO - __main__ - Step 34012: {'lr': 0.0004444722614454437, 'samples': 6530304, 'steps': 34011, 'loss/train': 1.3125523328781128} -08/30/2021 19:22:33 - INFO - __main__ - Step 34013: {'lr': 0.00044446892663473227, 'samples': 6530496, 'steps': 34012, 'loss/train': 1.557146668434143} -08/30/2021 19:22:33 - INFO - __main__ - Step 34014: {'lr': 0.0004444655917363961, 'samples': 6530688, 'steps': 34013, 'loss/train': 1.4590916633605957} -08/30/2021 19:22:33 - INFO - __main__ - Step 34015: {'lr': 0.00044446225675043684, 'samples': 6530880, 'steps': 34014, 'loss/train': 1.444432020187378} -08/30/2021 19:22:34 - INFO - __main__ - Step 34016: {'lr': 0.0004444589216768558, 'samples': 6531072, 'steps': 34015, 'loss/train': 1.8459526300430298} -08/30/2021 19:22:35 - INFO - __main__ - Step 34017: {'lr': 0.0004444555865156545, 'samples': 6531264, 'steps': 34016, 'loss/train': 0.11406456679105759} -08/30/2021 19:22:36 - INFO - __main__ - Step 34018: {'lr': 0.0004444522512668346, 'samples': 6531456, 'steps': 34017, 'loss/train': 1.6628382205963135} -08/30/2021 19:22:36 - INFO - __main__ - Step 34019: {'lr': 0.0004444489159303976, 'samples': 6531648, 'steps': 34018, 'loss/train': 1.4332411289215088} -08/30/2021 19:22:36 - INFO - __main__ - Step 34020: {'lr': 0.0004444455805063448, 'samples': 6531840, 'steps': 34019, 'loss/train': 0.9525831937789917} -08/30/2021 19:22:37 - INFO - __main__ - Step 34021: {'lr': 0.00044444224499467784, 'samples': 6532032, 'steps': 34020, 'loss/train': 1.7560033798217773} -08/30/2021 19:22:38 - INFO - __main__ - Step 34022: {'lr': 0.0004444389093953982, 'samples': 6532224, 'steps': 34021, 'loss/train': 1.7731221914291382} -08/30/2021 19:22:39 - INFO - __main__ - Step 34023: {'lr': 0.00044443557370850743, 'samples': 6532416, 'steps': 34022, 'loss/train': 1.5227303504943848} -08/30/2021 19:22:39 - INFO - __main__ - Step 34024: {'lr': 0.00044443223793400695, 'samples': 6532608, 'steps': 34023, 'loss/train': 5.8248372077941895} -08/30/2021 19:22:39 - INFO - __main__ - Step 34025: {'lr': 0.0004444289020718983, 'samples': 6532800, 'steps': 34024, 'loss/train': 1.6655195951461792} -08/30/2021 19:22:40 - INFO - __main__ - Step 34026: {'lr': 0.000444425566122183, 'samples': 6532992, 'steps': 34025, 'loss/train': 1.2167819738388062} -08/30/2021 19:22:42 - INFO - __main__ - Step 34027: {'lr': 0.0004444222300848626, 'samples': 6533184, 'steps': 34026, 'loss/train': 1.4032080173492432} -08/30/2021 19:22:42 - INFO - __main__ - Step 34028: {'lr': 0.00044441889395993844, 'samples': 6533376, 'steps': 34027, 'loss/train': 0.5165640711784363} -08/30/2021 19:22:42 - INFO - __main__ - Step 34029: {'lr': 0.00044441555774741215, 'samples': 6533568, 'steps': 34028, 'loss/train': 1.2656562328338623} -08/30/2021 19:22:43 - INFO - __main__ - Step 34030: {'lr': 0.00044441222144728525, 'samples': 6533760, 'steps': 34029, 'loss/train': 1.4361112117767334} -08/30/2021 19:22:43 - INFO - __main__ - Step 34031: {'lr': 0.00044440888505955926, 'samples': 6533952, 'steps': 34030, 'loss/train': 1.6054483652114868} -08/30/2021 19:22:45 - INFO - __main__ - Step 34032: {'lr': 0.00044440554858423553, 'samples': 6534144, 'steps': 34031, 'loss/train': 0.17834961414337158} -08/30/2021 19:22:45 - INFO - __main__ - Step 34033: {'lr': 0.0004444022120213157, 'samples': 6534336, 'steps': 34032, 'loss/train': 1.5666649341583252} -08/30/2021 19:22:45 - INFO - __main__ - Step 34034: {'lr': 0.00044439887537080116, 'samples': 6534528, 'steps': 34033, 'loss/train': 0.9417108297348022} -08/30/2021 19:22:46 - INFO - __main__ - Step 34035: {'lr': 0.00044439553863269356, 'samples': 6534720, 'steps': 34034, 'loss/train': 1.5861077308654785} -08/30/2021 19:22:46 - INFO - __main__ - Step 34036: {'lr': 0.00044439220180699434, 'samples': 6534912, 'steps': 34035, 'loss/train': 1.1958444118499756} -08/30/2021 19:22:47 - INFO - __main__ - Step 34037: {'lr': 0.00044438886489370493, 'samples': 6535104, 'steps': 34036, 'loss/train': 0.8025926351547241} -08/30/2021 19:22:48 - INFO - __main__ - Step 34038: {'lr': 0.00044438552789282694, 'samples': 6535296, 'steps': 34037, 'loss/train': 1.6437263488769531} -08/30/2021 19:22:49 - INFO - __main__ - Step 34039: {'lr': 0.00044438219080436184, 'samples': 6535488, 'steps': 34038, 'loss/train': 1.6665632724761963} -08/30/2021 19:22:49 - INFO - __main__ - Step 34040: {'lr': 0.0004443788536283111, 'samples': 6535680, 'steps': 34039, 'loss/train': 0.49048101902008057} -08/30/2021 19:22:49 - INFO - __main__ - Step 34041: {'lr': 0.0004443755163646762, 'samples': 6535872, 'steps': 34040, 'loss/train': 1.439178466796875} -08/30/2021 19:22:50 - INFO - __main__ - Step 34042: {'lr': 0.00044437217901345885, 'samples': 6536064, 'steps': 34041, 'loss/train': 1.6291260719299316} -08/30/2021 19:22:52 - INFO - __main__ - Step 34043: {'lr': 0.0004443688415746602, 'samples': 6536256, 'steps': 34042, 'loss/train': 0.7658398747444153} -08/30/2021 19:22:52 - INFO - __main__ - Step 34044: {'lr': 0.00044436550404828207, 'samples': 6536448, 'steps': 34043, 'loss/train': 1.4731136560440063} -08/30/2021 19:22:53 - INFO - __main__ - Step 34045: {'lr': 0.0004443621664343258, 'samples': 6536640, 'steps': 34044, 'loss/train': 1.4982048273086548} -08/30/2021 19:22:53 - INFO - __main__ - Step 34046: {'lr': 0.000444358828732793, 'samples': 6536832, 'steps': 34045, 'loss/train': 1.6950299739837646} -08/30/2021 19:22:53 - INFO - __main__ - Step 34047: {'lr': 0.000444355490943685, 'samples': 6537024, 'steps': 34046, 'loss/train': 0.6983802318572998} -08/30/2021 19:22:54 - INFO - __main__ - Step 34048: {'lr': 0.0004443521530670035, 'samples': 6537216, 'steps': 34047, 'loss/train': 1.171935796737671} -08/30/2021 19:22:55 - INFO - __main__ - Step 34049: {'lr': 0.00044434881510274995, 'samples': 6537408, 'steps': 34048, 'loss/train': 0.9457870125770569} -08/30/2021 19:22:56 - INFO - __main__ - Step 34050: {'lr': 0.00044434547705092574, 'samples': 6537600, 'steps': 34049, 'loss/train': 1.1059062480926514} -08/30/2021 19:22:56 - INFO - __main__ - Step 34051: {'lr': 0.0004443421389115325, 'samples': 6537792, 'steps': 34050, 'loss/train': 0.15285541117191315} -08/30/2021 19:22:57 - INFO - __main__ - Step 34052: {'lr': 0.00044433880068457166, 'samples': 6537984, 'steps': 34051, 'loss/train': 1.0612382888793945} -08/30/2021 19:22:57 - INFO - __main__ - Step 34053: {'lr': 0.0004443354623700447, 'samples': 6538176, 'steps': 34052, 'loss/train': 1.487714171409607} -08/30/2021 19:22:58 - INFO - __main__ - Step 34054: {'lr': 0.0004443321239679533, 'samples': 6538368, 'steps': 34053, 'loss/train': 0.6798129677772522} -08/30/2021 19:22:59 - INFO - __main__ - Step 34055: {'lr': 0.0004443287854782988, 'samples': 6538560, 'steps': 34054, 'loss/train': 1.1008055210113525} -08/30/2021 19:22:59 - INFO - __main__ - Step 34056: {'lr': 0.0004443254469010828, 'samples': 6538752, 'steps': 34055, 'loss/train': 1.6925904750823975} -08/30/2021 19:23:00 - INFO - __main__ - Step 34057: {'lr': 0.0004443221082363067, 'samples': 6538944, 'steps': 34056, 'loss/train': 1.514134407043457} -08/30/2021 19:23:00 - INFO - __main__ - Step 34058: {'lr': 0.000444318769483972, 'samples': 6539136, 'steps': 34057, 'loss/train': 1.9152193069458008} -08/30/2021 19:23:02 - INFO - __main__ - Step 34059: {'lr': 0.0004443154306440803, 'samples': 6539328, 'steps': 34058, 'loss/train': 1.9796053171157837} -08/30/2021 19:23:03 - INFO - __main__ - Step 34060: {'lr': 0.00044431209171663313, 'samples': 6539520, 'steps': 34059, 'loss/train': 0.25463294982910156} -08/30/2021 19:23:03 - INFO - __main__ - Step 34061: {'lr': 0.00044430875270163185, 'samples': 6539712, 'steps': 34060, 'loss/train': 1.1701732873916626} -08/30/2021 19:23:03 - INFO - __main__ - Step 34062: {'lr': 0.00044430541359907804, 'samples': 6539904, 'steps': 34061, 'loss/train': 1.5943013429641724} -08/30/2021 19:23:04 - INFO - __main__ - Step 34063: {'lr': 0.0004443020744089733, 'samples': 6540096, 'steps': 34062, 'loss/train': 1.3849632740020752} -08/30/2021 19:23:04 - INFO - __main__ - Step 34064: {'lr': 0.00044429873513131897, 'samples': 6540288, 'steps': 34063, 'loss/train': 1.2737693786621094} -08/30/2021 19:23:05 - INFO - __main__ - Step 34065: {'lr': 0.00044429539576611664, 'samples': 6540480, 'steps': 34064, 'loss/train': 2.0899105072021484} -08/30/2021 19:23:06 - INFO - __main__ - Step 34066: {'lr': 0.0004442920563133678, 'samples': 6540672, 'steps': 34065, 'loss/train': 1.907918930053711} -08/30/2021 19:23:06 - INFO - __main__ - Step 34067: {'lr': 0.000444288716773074, 'samples': 6540864, 'steps': 34066, 'loss/train': 1.8460075855255127} -08/30/2021 19:23:07 - INFO - __main__ - Step 34068: {'lr': 0.00044428537714523664, 'samples': 6541056, 'steps': 34067, 'loss/train': 1.53731107711792} -08/30/2021 19:23:07 - INFO - __main__ - Step 34069: {'lr': 0.00044428203742985734, 'samples': 6541248, 'steps': 34068, 'loss/train': 1.5715285539627075} -08/30/2021 19:23:09 - INFO - __main__ - Step 34070: {'lr': 0.0004442786976269375, 'samples': 6541440, 'steps': 34069, 'loss/train': 0.991809070110321} -08/30/2021 19:23:09 - INFO - __main__ - Step 34071: {'lr': 0.0004442753577364788, 'samples': 6541632, 'steps': 34070, 'loss/train': 1.6136173009872437} -08/30/2021 19:23:10 - INFO - __main__ - Step 34072: {'lr': 0.00044427201775848246, 'samples': 6541824, 'steps': 34071, 'loss/train': 1.2435650825500488} -08/30/2021 19:23:10 - INFO - __main__ - Step 34073: {'lr': 0.0004442686776929502, 'samples': 6542016, 'steps': 34072, 'loss/train': 2.152937412261963} -08/30/2021 19:23:10 - INFO - __main__ - Step 34074: {'lr': 0.0004442653375398835, 'samples': 6542208, 'steps': 34073, 'loss/train': 0.43778541684150696} -08/30/2021 19:23:12 - INFO - __main__ - Step 34075: {'lr': 0.0004442619972992838, 'samples': 6542400, 'steps': 34074, 'loss/train': 1.5430192947387695} -08/30/2021 19:23:12 - INFO - __main__ - Step 34076: {'lr': 0.00044425865697115266, 'samples': 6542592, 'steps': 34075, 'loss/train': 1.7967345714569092} -08/30/2021 19:23:13 - INFO - __main__ - Step 34077: {'lr': 0.00044425531655549157, 'samples': 6542784, 'steps': 34076, 'loss/train': 0.9645836353302002} -08/30/2021 19:23:13 - INFO - __main__ - Step 34078: {'lr': 0.0004442519760523021, 'samples': 6542976, 'steps': 34077, 'loss/train': 1.2653108835220337} -08/30/2021 19:23:13 - INFO - __main__ - Step 34079: {'lr': 0.00044424863546158554, 'samples': 6543168, 'steps': 34078, 'loss/train': 1.6694822311401367} -08/30/2021 19:23:14 - INFO - __main__ - Step 34080: {'lr': 0.00044424529478334364, 'samples': 6543360, 'steps': 34079, 'loss/train': 1.5284863710403442} -08/30/2021 19:23:16 - INFO - __main__ - Step 34081: {'lr': 0.0004442419540175778, 'samples': 6543552, 'steps': 34080, 'loss/train': 0.1475307047367096} -08/30/2021 19:23:16 - INFO - __main__ - Step 34082: {'lr': 0.0004442386131642895, 'samples': 6543744, 'steps': 34081, 'loss/train': 1.412103533744812} -08/30/2021 19:23:16 - INFO - __main__ - Step 34083: {'lr': 0.0004442352722234803, 'samples': 6543936, 'steps': 34082, 'loss/train': 1.4961471557617188} -08/30/2021 19:23:17 - INFO - __main__ - Step 34084: {'lr': 0.0004442319311951517, 'samples': 6544128, 'steps': 34083, 'loss/train': 1.8522720336914062} -08/30/2021 19:23:17 - INFO - __main__ - Step 34085: {'lr': 0.00044422859007930515, 'samples': 6544320, 'steps': 34084, 'loss/train': 1.3261008262634277} -08/30/2021 19:23:18 - INFO - __main__ - Step 34086: {'lr': 0.00044422524887594223, 'samples': 6544512, 'steps': 34085, 'loss/train': 0.7102405428886414} -08/30/2021 19:23:19 - INFO - __main__ - Step 34087: {'lr': 0.0004442219075850644, 'samples': 6544704, 'steps': 34086, 'loss/train': 1.4017736911773682} -08/30/2021 19:23:19 - INFO - __main__ - Step 34088: {'lr': 0.0004442185662066731, 'samples': 6544896, 'steps': 34087, 'loss/train': 0.9071478843688965} -08/30/2021 19:23:20 - INFO - __main__ - Step 34089: {'lr': 0.00044421522474077, 'samples': 6545088, 'steps': 34088, 'loss/train': 0.7296309471130371} -08/30/2021 19:23:20 - INFO - __main__ - Step 34090: {'lr': 0.0004442118831873565, 'samples': 6545280, 'steps': 34089, 'loss/train': 1.5598859786987305} -08/30/2021 19:23:21 - INFO - __main__ - Step 34091: {'lr': 0.00044420854154643413, 'samples': 6545472, 'steps': 34090, 'loss/train': 1.604191541671753} -08/30/2021 19:23:22 - INFO - __main__ - Step 34092: {'lr': 0.00044420519981800446, 'samples': 6545664, 'steps': 34091, 'loss/train': 1.550437331199646} -08/30/2021 19:23:22 - INFO - __main__ - Step 34093: {'lr': 0.0004442018580020688, 'samples': 6545856, 'steps': 34092, 'loss/train': 1.6765708923339844} -08/30/2021 19:23:23 - INFO - __main__ - Step 34094: {'lr': 0.0004441985160986288, 'samples': 6546048, 'steps': 34093, 'loss/train': 1.8748102188110352} -08/30/2021 19:23:23 - INFO - __main__ - Step 34095: {'lr': 0.00044419517410768594, 'samples': 6546240, 'steps': 34094, 'loss/train': 1.2102035284042358} -08/30/2021 19:23:24 - INFO - __main__ - Step 34096: {'lr': 0.0004441918320292418, 'samples': 6546432, 'steps': 34095, 'loss/train': 1.571191430091858} -08/30/2021 19:23:25 - INFO - __main__ - Step 34097: {'lr': 0.00044418848986329775, 'samples': 6546624, 'steps': 34096, 'loss/train': 1.576714277267456} -08/30/2021 19:23:25 - INFO - __main__ - Step 34098: {'lr': 0.0004441851476098554, 'samples': 6546816, 'steps': 34097, 'loss/train': 1.3400318622589111} -08/30/2021 19:23:26 - INFO - __main__ - Step 34099: {'lr': 0.0004441818052689162, 'samples': 6547008, 'steps': 34098, 'loss/train': 1.7222793102264404} -08/30/2021 19:23:26 - INFO - __main__ - Step 34100: {'lr': 0.0004441784628404817, 'samples': 6547200, 'steps': 34099, 'loss/train': 1.5035686492919922} -08/30/2021 19:23:27 - INFO - __main__ - Step 34101: {'lr': 0.0004441751203245533, 'samples': 6547392, 'steps': 34100, 'loss/train': 1.8330358266830444} -08/30/2021 19:23:28 - INFO - __main__ - Step 34102: {'lr': 0.0004441717777211327, 'samples': 6547584, 'steps': 34101, 'loss/train': 2.1723060607910156} -08/30/2021 19:23:28 - INFO - __main__ - Step 34103: {'lr': 0.00044416843503022126, 'samples': 6547776, 'steps': 34102, 'loss/train': 1.5225306749343872} -08/30/2021 19:23:29 - INFO - __main__ - Step 34104: {'lr': 0.00044416509225182044, 'samples': 6547968, 'steps': 34103, 'loss/train': 1.1453888416290283} -08/30/2021 19:23:29 - INFO - __main__ - Step 34105: {'lr': 0.0004441617493859319, 'samples': 6548160, 'steps': 34104, 'loss/train': 1.463390827178955} -08/30/2021 19:23:30 - INFO - __main__ - Step 34106: {'lr': 0.0004441584064325571, 'samples': 6548352, 'steps': 34105, 'loss/train': 1.5844244956970215} -08/30/2021 19:23:31 - INFO - __main__ - Step 34107: {'lr': 0.0004441550633916975, 'samples': 6548544, 'steps': 34106, 'loss/train': 1.9017499685287476} -08/30/2021 19:23:32 - INFO - __main__ - Step 34108: {'lr': 0.0004441517202633546, 'samples': 6548736, 'steps': 34107, 'loss/train': 1.7990669012069702} -08/30/2021 19:23:32 - INFO - __main__ - Step 34109: {'lr': 0.0004441483770475299, 'samples': 6548928, 'steps': 34108, 'loss/train': 1.2839605808258057} -08/30/2021 19:23:33 - INFO - __main__ - Step 34110: {'lr': 0.000444145033744225, 'samples': 6549120, 'steps': 34109, 'loss/train': 1.3546086549758911} -08/30/2021 19:23:33 - INFO - __main__ - Step 34111: {'lr': 0.0004441416903534413, 'samples': 6549312, 'steps': 34110, 'loss/train': 0.17416894435882568} -08/30/2021 19:23:35 - INFO - __main__ - Step 34112: {'lr': 0.00044413834687518034, 'samples': 6549504, 'steps': 34111, 'loss/train': 1.389888048171997} -08/30/2021 19:23:35 - INFO - __main__ - Step 34113: {'lr': 0.00044413500330944366, 'samples': 6549696, 'steps': 34112, 'loss/train': 1.502997636795044} -08/30/2021 19:23:36 - INFO - __main__ - Step 34114: {'lr': 0.00044413165965623275, 'samples': 6549888, 'steps': 34113, 'loss/train': 1.8994534015655518} -08/30/2021 19:23:36 - INFO - __main__ - Step 34115: {'lr': 0.00044412831591554916, 'samples': 6550080, 'steps': 34114, 'loss/train': 1.4599614143371582} -08/30/2021 19:23:36 - INFO - __main__ - Step 34116: {'lr': 0.0004441249720873942, 'samples': 6550272, 'steps': 34115, 'loss/train': 1.1991057395935059} -08/30/2021 19:23:37 - INFO - __main__ - Step 34117: {'lr': 0.00044412162817176966, 'samples': 6550464, 'steps': 34116, 'loss/train': 0.8302178382873535} -08/30/2021 19:23:38 - INFO - __main__ - Step 34118: {'lr': 0.00044411828416867684, 'samples': 6550656, 'steps': 34117, 'loss/train': 1.6284816265106201} -08/30/2021 19:23:39 - INFO - __main__ - Step 34119: {'lr': 0.00044411494007811736, 'samples': 6550848, 'steps': 34118, 'loss/train': 1.1236224174499512} -08/30/2021 19:23:39 - INFO - __main__ - Step 34120: {'lr': 0.00044411159590009263, 'samples': 6551040, 'steps': 34119, 'loss/train': 1.3370686769485474} -08/30/2021 19:23:40 - INFO - __main__ - Step 34121: {'lr': 0.0004441082516346043, 'samples': 6551232, 'steps': 34120, 'loss/train': 1.8110923767089844} -08/30/2021 19:23:40 - INFO - __main__ - Step 34122: {'lr': 0.0004441049072816537, 'samples': 6551424, 'steps': 34121, 'loss/train': 1.2732646465301514} -08/30/2021 19:23:41 - INFO - __main__ - Step 34123: {'lr': 0.0004441015628412425, 'samples': 6551616, 'steps': 34122, 'loss/train': 1.7347229719161987} -08/30/2021 19:23:42 - INFO - __main__ - Step 34124: {'lr': 0.0004440982183133721, 'samples': 6551808, 'steps': 34123, 'loss/train': 1.4055626392364502} -08/30/2021 19:23:42 - INFO - __main__ - Step 34125: {'lr': 0.00044409487369804395, 'samples': 6552000, 'steps': 34124, 'loss/train': 1.4072000980377197} -08/30/2021 19:23:43 - INFO - __main__ - Step 34126: {'lr': 0.00044409152899525973, 'samples': 6552192, 'steps': 34125, 'loss/train': 1.2079187631607056} -08/30/2021 19:23:43 - INFO - __main__ - Step 34127: {'lr': 0.00044408818420502085, 'samples': 6552384, 'steps': 34126, 'loss/train': 1.6269725561141968} -08/30/2021 19:23:45 - INFO - __main__ - Step 34128: {'lr': 0.00044408483932732886, 'samples': 6552576, 'steps': 34127, 'loss/train': 1.5361895561218262} -08/30/2021 19:23:45 - INFO - __main__ - Step 34129: {'lr': 0.00044408149436218523, 'samples': 6552768, 'steps': 34128, 'loss/train': 1.7371842861175537} -08/30/2021 19:23:45 - INFO - __main__ - Step 34130: {'lr': 0.00044407814930959137, 'samples': 6552960, 'steps': 34129, 'loss/train': 1.6486812829971313} -08/30/2021 19:23:46 - INFO - __main__ - Step 34131: {'lr': 0.000444074804169549, 'samples': 6553152, 'steps': 34130, 'loss/train': 2.4829702377319336} -08/30/2021 19:23:46 - INFO - __main__ - Step 34132: {'lr': 0.00044407145894205947, 'samples': 6553344, 'steps': 34131, 'loss/train': 0.819826066493988} -08/30/2021 19:23:48 - INFO - __main__ - Step 34133: {'lr': 0.0004440681136271244, 'samples': 6553536, 'steps': 34132, 'loss/train': 1.3111553192138672} -08/30/2021 19:23:48 - INFO - __main__ - Step 34134: {'lr': 0.0004440647682247452, 'samples': 6553728, 'steps': 34133, 'loss/train': 1.255419135093689} -08/30/2021 19:23:49 - INFO - __main__ - Step 34135: {'lr': 0.00044406142273492334, 'samples': 6553920, 'steps': 34134, 'loss/train': 1.1177340745925903} -08/30/2021 19:23:49 - INFO - __main__ - Step 34136: {'lr': 0.00044405807715766047, 'samples': 6554112, 'steps': 34135, 'loss/train': 1.4886301755905151} -08/30/2021 19:23:49 - INFO - __main__ - Step 34137: {'lr': 0.00044405473149295804, 'samples': 6554304, 'steps': 34136, 'loss/train': 1.3253486156463623} -08/30/2021 19:23:51 - INFO - __main__ - Step 34138: {'lr': 0.0004440513857408175, 'samples': 6554496, 'steps': 34137, 'loss/train': 1.618687391281128} -08/30/2021 19:23:51 - INFO - __main__ - Step 34139: {'lr': 0.0004440480399012404, 'samples': 6554688, 'steps': 34138, 'loss/train': 1.6538251638412476} -08/30/2021 19:23:52 - INFO - __main__ - Step 34140: {'lr': 0.00044404469397422823, 'samples': 6554880, 'steps': 34139, 'loss/train': 1.6019890308380127} -08/30/2021 19:23:52 - INFO - __main__ - Step 34141: {'lr': 0.00044404134795978257, 'samples': 6555072, 'steps': 34140, 'loss/train': 1.201795220375061} -08/30/2021 19:23:52 - INFO - __main__ - Step 34142: {'lr': 0.0004440380018579049, 'samples': 6555264, 'steps': 34141, 'loss/train': 1.527990460395813} -08/30/2021 19:23:54 - INFO - __main__ - Step 34143: {'lr': 0.00044403465566859656, 'samples': 6555456, 'steps': 34142, 'loss/train': 1.0799099206924438} -08/30/2021 19:23:54 - INFO - __main__ - Step 34144: {'lr': 0.0004440313093918593, 'samples': 6555648, 'steps': 34143, 'loss/train': 1.9859564304351807} -08/30/2021 19:23:55 - INFO - __main__ - Step 34145: {'lr': 0.00044402796302769453, 'samples': 6555840, 'steps': 34144, 'loss/train': 0.777617335319519} -08/30/2021 19:23:55 - INFO - __main__ - Step 34146: {'lr': 0.0004440246165761037, 'samples': 6556032, 'steps': 34145, 'loss/train': 1.4875977039337158} -08/30/2021 19:23:55 - INFO - __main__ - Step 34147: {'lr': 0.00044402127003708846, 'samples': 6556224, 'steps': 34146, 'loss/train': 1.2050319910049438} -08/30/2021 19:23:57 - INFO - __main__ - Step 34148: {'lr': 0.0004440179234106502, 'samples': 6556416, 'steps': 34147, 'loss/train': 1.2090332508087158} -08/30/2021 19:23:57 - INFO - __main__ - Step 34149: {'lr': 0.00044401457669679043, 'samples': 6556608, 'steps': 34148, 'loss/train': 0.9860490560531616} -08/30/2021 19:23:58 - INFO - __main__ - Step 34150: {'lr': 0.0004440112298955107, 'samples': 6556800, 'steps': 34149, 'loss/train': 2.4779458045959473} -08/30/2021 19:23:58 - INFO - __main__ - Step 34151: {'lr': 0.0004440078830068125, 'samples': 6556992, 'steps': 34150, 'loss/train': 1.4247993230819702} -08/30/2021 19:23:58 - INFO - __main__ - Step 34152: {'lr': 0.00044400453603069727, 'samples': 6557184, 'steps': 34151, 'loss/train': 0.5688244104385376} -08/30/2021 19:24:00 - INFO - __main__ - Step 34153: {'lr': 0.0004440011889671667, 'samples': 6557376, 'steps': 34152, 'loss/train': 1.5328048467636108} -08/30/2021 19:24:00 - INFO - __main__ - Step 34154: {'lr': 0.00044399784181622216, 'samples': 6557568, 'steps': 34153, 'loss/train': 2.024057626724243} -08/30/2021 19:24:01 - INFO - __main__ - Step 34155: {'lr': 0.0004439944945778651, 'samples': 6557760, 'steps': 34154, 'loss/train': 1.7221916913986206} -08/30/2021 19:24:01 - INFO - __main__ - Step 34156: {'lr': 0.0004439911472520972, 'samples': 6557952, 'steps': 34155, 'loss/train': 1.5092796087265015} -08/30/2021 19:24:01 - INFO - __main__ - Step 34157: {'lr': 0.0004439877998389199, 'samples': 6558144, 'steps': 34156, 'loss/train': 1.34806227684021} -08/30/2021 19:24:03 - INFO - __main__ - Step 34158: {'lr': 0.0004439844523383346, 'samples': 6558336, 'steps': 34157, 'loss/train': 1.026733160018921} -08/30/2021 19:24:04 - INFO - __main__ - Step 34159: {'lr': 0.000443981104750343, 'samples': 6558528, 'steps': 34158, 'loss/train': 1.7693021297454834} -08/30/2021 19:24:04 - INFO - __main__ - Step 34160: {'lr': 0.0004439777570749465, 'samples': 6558720, 'steps': 34159, 'loss/train': 1.5494612455368042} -08/30/2021 19:24:04 - INFO - __main__ - Step 34161: {'lr': 0.0004439744093121465, 'samples': 6558912, 'steps': 34160, 'loss/train': 0.18620210886001587} -08/30/2021 19:24:05 - INFO - __main__ - Step 34162: {'lr': 0.00044397106146194473, 'samples': 6559104, 'steps': 34161, 'loss/train': 1.3535797595977783} -08/30/2021 19:24:05 - INFO - __main__ - Step 34163: {'lr': 0.00044396771352434256, 'samples': 6559296, 'steps': 34162, 'loss/train': 1.4653098583221436} -08/30/2021 19:24:06 - INFO - __main__ - Step 34164: {'lr': 0.00044396436549934155, 'samples': 6559488, 'steps': 34163, 'loss/train': 1.4813244342803955} -08/30/2021 19:24:07 - INFO - __main__ - Step 34165: {'lr': 0.00044396101738694316, 'samples': 6559680, 'steps': 34164, 'loss/train': 1.4787218570709229} -08/30/2021 19:24:07 - INFO - __main__ - Step 34166: {'lr': 0.000443957669187149, 'samples': 6559872, 'steps': 34165, 'loss/train': 1.663667917251587} -08/30/2021 19:24:08 - INFO - __main__ - Step 34167: {'lr': 0.0004439543208999604, 'samples': 6560064, 'steps': 34166, 'loss/train': 1.3167599439620972} -08/30/2021 19:24:08 - INFO - __main__ - Step 34168: {'lr': 0.00044395097252537905, 'samples': 6560256, 'steps': 34167, 'loss/train': 1.2871379852294922} -08/30/2021 19:24:10 - INFO - __main__ - Step 34169: {'lr': 0.0004439476240634064, 'samples': 6560448, 'steps': 34168, 'loss/train': 1.1371201276779175} -08/30/2021 19:24:10 - INFO - __main__ - Step 34170: {'lr': 0.00044394427551404386, 'samples': 6560640, 'steps': 34169, 'loss/train': 1.474199652671814} -08/30/2021 19:24:11 - INFO - __main__ - Step 34171: {'lr': 0.00044394092687729305, 'samples': 6560832, 'steps': 34170, 'loss/train': 1.9667190313339233} -08/30/2021 19:24:11 - INFO - __main__ - Step 34172: {'lr': 0.0004439375781531555, 'samples': 6561024, 'steps': 34171, 'loss/train': 1.244231104850769} -08/30/2021 19:24:11 - INFO - __main__ - Step 34173: {'lr': 0.00044393422934163265, 'samples': 6561216, 'steps': 34172, 'loss/train': 1.9117591381072998} -08/30/2021 19:24:13 - INFO - __main__ - Step 34174: {'lr': 0.000443930880442726, 'samples': 6561408, 'steps': 34173, 'loss/train': 1.083193063735962} -08/30/2021 19:24:13 - INFO - __main__ - Step 34175: {'lr': 0.0004439275314564371, 'samples': 6561600, 'steps': 34174, 'loss/train': 1.7774274349212646} -08/30/2021 19:24:14 - INFO - __main__ - Step 34176: {'lr': 0.0004439241823827674, 'samples': 6561792, 'steps': 34175, 'loss/train': 1.2330737113952637} -08/30/2021 19:24:14 - INFO - __main__ - Step 34177: {'lr': 0.0004439208332217186, 'samples': 6561984, 'steps': 34176, 'loss/train': 1.119931936264038} -08/30/2021 19:24:14 - INFO - __main__ - Step 34178: {'lr': 0.00044391748397329194, 'samples': 6562176, 'steps': 34177, 'loss/train': 1.6856865882873535} -08/30/2021 19:24:16 - INFO - __main__ - Step 34179: {'lr': 0.0004439141346374891, 'samples': 6562368, 'steps': 34178, 'loss/train': 1.6810458898544312} -08/30/2021 19:24:17 - INFO - __main__ - Step 34180: {'lr': 0.0004439107852143115, 'samples': 6562560, 'steps': 34179, 'loss/train': 1.2703230381011963} -08/30/2021 19:24:17 - INFO - __main__ - Step 34181: {'lr': 0.0004439074357037607, 'samples': 6562752, 'steps': 34180, 'loss/train': 1.591692328453064} -08/30/2021 19:24:17 - INFO - __main__ - Step 34182: {'lr': 0.0004439040861058383, 'samples': 6562944, 'steps': 34181, 'loss/train': 1.7475205659866333} -08/30/2021 19:24:18 - INFO - __main__ - Step 34183: {'lr': 0.00044390073642054564, 'samples': 6563136, 'steps': 34182, 'loss/train': 0.2079470306634903} -08/30/2021 19:24:18 - INFO - __main__ - Step 34184: {'lr': 0.00044389738664788424, 'samples': 6563328, 'steps': 34183, 'loss/train': 0.30054929852485657} -08/30/2021 19:24:20 - INFO - __main__ - Step 34185: {'lr': 0.00044389403678785576, 'samples': 6563520, 'steps': 34184, 'loss/train': 1.2066550254821777} -08/30/2021 19:24:20 - INFO - __main__ - Step 34186: {'lr': 0.0004438906868404616, 'samples': 6563712, 'steps': 34185, 'loss/train': 1.898586630821228} -08/30/2021 19:24:21 - INFO - __main__ - Step 34187: {'lr': 0.00044388733680570324, 'samples': 6563904, 'steps': 34186, 'loss/train': 1.0105535984039307} -08/30/2021 19:24:21 - INFO - __main__ - Step 34188: {'lr': 0.00044388398668358234, 'samples': 6564096, 'steps': 34187, 'loss/train': 0.5083702206611633} -08/30/2021 19:24:21 - INFO - __main__ - Step 34189: {'lr': 0.00044388063647410016, 'samples': 6564288, 'steps': 34188, 'loss/train': 1.2549986839294434} -08/30/2021 19:24:22 - INFO - __main__ - Step 34190: {'lr': 0.00044387728617725845, 'samples': 6564480, 'steps': 34189, 'loss/train': 0.02863602340221405} -08/30/2021 19:24:23 - INFO - __main__ - Step 34191: {'lr': 0.0004438739357930586, 'samples': 6564672, 'steps': 34190, 'loss/train': 1.8983687162399292} -08/30/2021 19:24:24 - INFO - __main__ - Step 34192: {'lr': 0.00044387058532150217, 'samples': 6564864, 'steps': 34191, 'loss/train': 1.122631549835205} -08/30/2021 19:24:24 - INFO - __main__ - Step 34193: {'lr': 0.0004438672347625907, 'samples': 6565056, 'steps': 34192, 'loss/train': 1.2891201972961426} -08/30/2021 19:24:24 - INFO - __main__ - Step 34194: {'lr': 0.0004438638841163255, 'samples': 6565248, 'steps': 34193, 'loss/train': 1.9356719255447388} -08/30/2021 19:24:25 - INFO - __main__ - Step 34195: {'lr': 0.0004438605333827083, 'samples': 6565440, 'steps': 34194, 'loss/train': 1.4864017963409424} -08/30/2021 19:24:26 - INFO - __main__ - Step 34196: {'lr': 0.00044385718256174055, 'samples': 6565632, 'steps': 34195, 'loss/train': 1.7286392450332642} -08/30/2021 19:24:27 - INFO - __main__ - Step 34197: {'lr': 0.0004438538316534237, 'samples': 6565824, 'steps': 34196, 'loss/train': 1.7241981029510498} -08/30/2021 19:24:27 - INFO - __main__ - Step 34198: {'lr': 0.0004438504806577594, 'samples': 6566016, 'steps': 34197, 'loss/train': 1.3779321908950806} -08/30/2021 19:24:27 - INFO - __main__ - Step 34199: {'lr': 0.000443847129574749, 'samples': 6566208, 'steps': 34198, 'loss/train': 2.177377462387085} -08/30/2021 19:24:28 - INFO - __main__ - Step 34200: {'lr': 0.0004438437784043941, 'samples': 6566400, 'steps': 34199, 'loss/train': 0.8560999035835266} -08/30/2021 19:24:28 - INFO - __main__ - Step 34201: {'lr': 0.00044384042714669614, 'samples': 6566592, 'steps': 34200, 'loss/train': 1.8695520162582397} -08/30/2021 19:24:30 - INFO - __main__ - Step 34202: {'lr': 0.0004438370758016567, 'samples': 6566784, 'steps': 34201, 'loss/train': 1.9796277284622192} -08/30/2021 19:24:30 - INFO - __main__ - Step 34203: {'lr': 0.00044383372436927727, 'samples': 6566976, 'steps': 34202, 'loss/train': 1.2149608135223389} -08/30/2021 19:24:31 - INFO - __main__ - Step 34204: {'lr': 0.00044383037284955937, 'samples': 6567168, 'steps': 34203, 'loss/train': 0.474067747592926} -08/30/2021 19:24:31 - INFO - __main__ - Step 34205: {'lr': 0.00044382702124250444, 'samples': 6567360, 'steps': 34204, 'loss/train': 0.06754706054925919} -08/30/2021 19:24:31 - INFO - __main__ - Step 34206: {'lr': 0.0004438236695481141, 'samples': 6567552, 'steps': 34205, 'loss/train': 1.4249253273010254} -08/30/2021 19:24:33 - INFO - __main__ - Step 34207: {'lr': 0.00044382031776638974, 'samples': 6567744, 'steps': 34206, 'loss/train': 1.7205047607421875} -08/30/2021 19:24:33 - INFO - __main__ - Step 34208: {'lr': 0.000443816965897333, 'samples': 6567936, 'steps': 34207, 'loss/train': 1.0833297967910767} -08/30/2021 19:24:34 - INFO - __main__ - Step 34209: {'lr': 0.0004438136139409453, 'samples': 6568128, 'steps': 34208, 'loss/train': 2.3178319931030273} -08/30/2021 19:24:34 - INFO - __main__ - Step 34210: {'lr': 0.00044381026189722824, 'samples': 6568320, 'steps': 34209, 'loss/train': 1.1204833984375} -08/30/2021 19:24:34 - INFO - __main__ - Step 34211: {'lr': 0.0004438069097661832, 'samples': 6568512, 'steps': 34210, 'loss/train': 1.4572902917861938} -08/30/2021 19:24:36 - INFO - __main__ - Step 34212: {'lr': 0.0004438035575478118, 'samples': 6568704, 'steps': 34211, 'loss/train': 0.03854339197278023} -08/30/2021 19:24:37 - INFO - __main__ - Step 34213: {'lr': 0.0004438002052421154, 'samples': 6568896, 'steps': 34212, 'loss/train': 1.9920425415039062} -08/30/2021 19:24:37 - INFO - __main__ - Step 34214: {'lr': 0.00044379685284909575, 'samples': 6569088, 'steps': 34213, 'loss/train': 1.115020751953125} -08/30/2021 19:24:37 - INFO - __main__ - Step 34215: {'lr': 0.00044379350036875413, 'samples': 6569280, 'steps': 34214, 'loss/train': 1.7330234050750732} -08/30/2021 19:24:38 - INFO - __main__ - Step 34216: {'lr': 0.00044379014780109217, 'samples': 6569472, 'steps': 34215, 'loss/train': 0.030922777950763702} -08/30/2021 19:24:38 - INFO - __main__ - Step 34217: {'lr': 0.00044378679514611144, 'samples': 6569664, 'steps': 34216, 'loss/train': 0.03244650363922119} -08/30/2021 19:24:39 - INFO - __main__ - Step 34218: {'lr': 0.0004437834424038133, 'samples': 6569856, 'steps': 34217, 'loss/train': 1.6112648248672485} -08/30/2021 19:24:40 - INFO - __main__ - Step 34219: {'lr': 0.00044378008957419936, 'samples': 6570048, 'steps': 34218, 'loss/train': 1.5600571632385254} -08/30/2021 19:24:40 - INFO - __main__ - Step 34220: {'lr': 0.00044377673665727105, 'samples': 6570240, 'steps': 34219, 'loss/train': 1.6179169416427612} -08/30/2021 19:24:41 - INFO - __main__ - Step 34221: {'lr': 0.00044377338365303, 'samples': 6570432, 'steps': 34220, 'loss/train': 1.8349685668945312} -08/30/2021 19:24:41 - INFO - __main__ - Step 34222: {'lr': 0.00044377003056147757, 'samples': 6570624, 'steps': 34221, 'loss/train': 1.8525657653808594} -08/30/2021 19:24:43 - INFO - __main__ - Step 34223: {'lr': 0.00044376667738261545, 'samples': 6570816, 'steps': 34222, 'loss/train': 1.5012279748916626} -08/30/2021 19:24:44 - INFO - __main__ - Step 34224: {'lr': 0.000443763324116445, 'samples': 6571008, 'steps': 34223, 'loss/train': 1.5951707363128662} -08/30/2021 19:24:44 - INFO - __main__ - Step 34225: {'lr': 0.00044375997076296774, 'samples': 6571200, 'steps': 34224, 'loss/train': 1.2798352241516113} -08/30/2021 19:24:45 - INFO - __main__ - Step 34226: {'lr': 0.0004437566173221853, 'samples': 6571392, 'steps': 34225, 'loss/train': 0.09263995289802551} -08/30/2021 19:24:45 - INFO - __main__ - Step 34227: {'lr': 0.0004437532637940991, 'samples': 6571584, 'steps': 34226, 'loss/train': 1.4912067651748657} -08/30/2021 19:24:46 - INFO - __main__ - Step 34228: {'lr': 0.0004437499101787107, 'samples': 6571776, 'steps': 34227, 'loss/train': 1.5270442962646484} -08/30/2021 19:24:47 - INFO - __main__ - Step 34229: {'lr': 0.00044374655647602153, 'samples': 6571968, 'steps': 34228, 'loss/train': 0.8537130951881409} -08/30/2021 19:24:47 - INFO - __main__ - Step 34230: {'lr': 0.0004437432026860332, 'samples': 6572160, 'steps': 34229, 'loss/train': 1.00099515914917} -08/30/2021 19:24:48 - INFO - __main__ - Step 34231: {'lr': 0.00044373984880874705, 'samples': 6572352, 'steps': 34230, 'loss/train': 1.547523021697998} -08/30/2021 19:24:48 - INFO - __main__ - Step 34232: {'lr': 0.0004437364948441649, 'samples': 6572544, 'steps': 34231, 'loss/train': 0.5179018974304199} -08/30/2021 19:24:50 - INFO - __main__ - Step 34233: {'lr': 0.00044373314079228796, 'samples': 6572736, 'steps': 34232, 'loss/train': 1.007223129272461} -08/30/2021 19:24:50 - INFO - __main__ - Step 34234: {'lr': 0.0004437297866531179, 'samples': 6572928, 'steps': 34233, 'loss/train': 1.3493837118148804} -08/30/2021 19:24:50 - INFO - __main__ - Step 34235: {'lr': 0.0004437264324266561, 'samples': 6573120, 'steps': 34234, 'loss/train': 1.7975345849990845} -08/30/2021 19:24:51 - INFO - __main__ - Step 34236: {'lr': 0.00044372307811290425, 'samples': 6573312, 'steps': 34235, 'loss/train': 2.090087890625} -08/30/2021 19:24:51 - INFO - __main__ - Step 34237: {'lr': 0.00044371972371186374, 'samples': 6573504, 'steps': 34236, 'loss/train': 0.9617405533790588} -08/30/2021 19:24:52 - INFO - __main__ - Step 34238: {'lr': 0.0004437163692235361, 'samples': 6573696, 'steps': 34237, 'loss/train': 1.2290090322494507} -08/30/2021 19:24:53 - INFO - __main__ - Step 34239: {'lr': 0.0004437130146479229, 'samples': 6573888, 'steps': 34238, 'loss/train': 1.1606254577636719} -08/30/2021 19:24:53 - INFO - __main__ - Step 34240: {'lr': 0.00044370965998502554, 'samples': 6574080, 'steps': 34239, 'loss/train': 1.639793038368225} -08/30/2021 19:24:54 - INFO - __main__ - Step 34241: {'lr': 0.0004437063052348457, 'samples': 6574272, 'steps': 34240, 'loss/train': 0.46614667773246765} -08/30/2021 19:24:54 - INFO - __main__ - Step 34242: {'lr': 0.0004437029503973847, 'samples': 6574464, 'steps': 34241, 'loss/train': 0.9633070826530457} -08/30/2021 19:24:54 - INFO - __main__ - Step 34243: {'lr': 0.00044369959547264416, 'samples': 6574656, 'steps': 34242, 'loss/train': 1.1773043870925903} -08/30/2021 19:24:56 - INFO - __main__ - Step 34244: {'lr': 0.0004436962404606255, 'samples': 6574848, 'steps': 34243, 'loss/train': 1.3718786239624023} -08/30/2021 19:24:57 - INFO - __main__ - Step 34245: {'lr': 0.0004436928853613304, 'samples': 6575040, 'steps': 34244, 'loss/train': 1.1644132137298584} -08/30/2021 19:24:57 - INFO - __main__ - Step 34246: {'lr': 0.0004436895301747602, 'samples': 6575232, 'steps': 34245, 'loss/train': 0.13820725679397583} -08/30/2021 19:24:57 - INFO - __main__ - Step 34247: {'lr': 0.00044368617490091655, 'samples': 6575424, 'steps': 34246, 'loss/train': 1.9280463457107544} -08/30/2021 19:24:58 - INFO - __main__ - Step 34248: {'lr': 0.0004436828195398009, 'samples': 6575616, 'steps': 34247, 'loss/train': 1.2685279846191406} -08/30/2021 19:24:59 - INFO - __main__ - Step 34249: {'lr': 0.0004436794640914148, 'samples': 6575808, 'steps': 34248, 'loss/train': 1.8469264507293701} -08/30/2021 19:25:00 - INFO - __main__ - Step 34250: {'lr': 0.00044367610855575965, 'samples': 6576000, 'steps': 34249, 'loss/train': 1.165789008140564} -08/30/2021 19:25:00 - INFO - __main__ - Step 34251: {'lr': 0.00044367275293283705, 'samples': 6576192, 'steps': 34250, 'loss/train': 1.6584229469299316} -08/30/2021 19:25:00 - INFO - __main__ - Step 34252: {'lr': 0.00044366939722264843, 'samples': 6576384, 'steps': 34251, 'loss/train': 1.1459347009658813} -08/30/2021 19:25:01 - INFO - __main__ - Step 34253: {'lr': 0.00044366604142519547, 'samples': 6576576, 'steps': 34252, 'loss/train': 1.487842082977295} -08/30/2021 19:25:02 - INFO - __main__ - Step 34254: {'lr': 0.0004436626855404796, 'samples': 6576768, 'steps': 34253, 'loss/train': 1.770192265510559} -08/30/2021 19:25:03 - INFO - __main__ - Step 34255: {'lr': 0.0004436593295685022, 'samples': 6576960, 'steps': 34254, 'loss/train': 1.1421363353729248} -08/30/2021 19:25:03 - INFO - __main__ - Step 34256: {'lr': 0.00044365597350926495, 'samples': 6577152, 'steps': 34255, 'loss/train': 1.4245450496673584} -08/30/2021 19:25:03 - INFO - __main__ - Step 34257: {'lr': 0.0004436526173627693, 'samples': 6577344, 'steps': 34256, 'loss/train': 1.275696873664856} -08/30/2021 19:25:04 - INFO - __main__ - Step 34258: {'lr': 0.00044364926112901675, 'samples': 6577536, 'steps': 34257, 'loss/train': 1.6342436075210571} -08/30/2021 19:25:06 - INFO - __main__ - Step 34259: {'lr': 0.0004436459048080089, 'samples': 6577728, 'steps': 34258, 'loss/train': 1.5422656536102295} -08/30/2021 19:25:07 - INFO - __main__ - Step 34260: {'lr': 0.00044364254839974717, 'samples': 6577920, 'steps': 34259, 'loss/train': 1.8504722118377686} -08/30/2021 19:25:07 - INFO - __main__ - Step 34261: {'lr': 0.0004436391919042331, 'samples': 6578112, 'steps': 34260, 'loss/train': 1.1316170692443848} -08/30/2021 19:25:07 - INFO - __main__ - Step 34262: {'lr': 0.00044363583532146814, 'samples': 6578304, 'steps': 34261, 'loss/train': 1.1465259790420532} -08/30/2021 19:25:08 - INFO - __main__ - Step 34263: {'lr': 0.0004436324786514538, 'samples': 6578496, 'steps': 34262, 'loss/train': 1.1065312623977661} -08/30/2021 19:25:08 - INFO - __main__ - Step 34264: {'lr': 0.0004436291218941918, 'samples': 6578688, 'steps': 34263, 'loss/train': 2.729570150375366} -08/30/2021 19:25:08 - INFO - __main__ - Step 34265: {'lr': 0.00044362576504968344, 'samples': 6578880, 'steps': 34264, 'loss/train': 2.7487316131591797} -08/30/2021 19:25:10 - INFO - __main__ - Step 34266: {'lr': 0.0004436224081179303, 'samples': 6579072, 'steps': 34265, 'loss/train': 1.3740428686141968} -08/30/2021 19:25:10 - INFO - __main__ - Step 34267: {'lr': 0.00044361905109893397, 'samples': 6579264, 'steps': 34266, 'loss/train': 1.0996173620224} -08/30/2021 19:25:11 - INFO - __main__ - Step 34268: {'lr': 0.00044361569399269574, 'samples': 6579456, 'steps': 34267, 'loss/train': 1.31764817237854} -08/30/2021 19:25:11 - INFO - __main__ - Step 34269: {'lr': 0.0004436123367992174, 'samples': 6579648, 'steps': 34268, 'loss/train': 1.7479370832443237} -08/30/2021 19:25:11 - INFO - __main__ - Step 34270: {'lr': 0.0004436089795185003, 'samples': 6579840, 'steps': 34269, 'loss/train': 1.315965175628662} -08/30/2021 19:25:13 - INFO - __main__ - Step 34271: {'lr': 0.0004436056221505459, 'samples': 6580032, 'steps': 34270, 'loss/train': 1.4850128889083862} -08/30/2021 19:25:14 - INFO - __main__ - Step 34272: {'lr': 0.00044360226469535583, 'samples': 6580224, 'steps': 34271, 'loss/train': 1.6063331365585327} -08/30/2021 19:25:14 - INFO - __main__ - Step 34273: {'lr': 0.0004435989071529316, 'samples': 6580416, 'steps': 34272, 'loss/train': 1.93623685836792} -08/30/2021 19:25:14 - INFO - __main__ - Step 34274: {'lr': 0.0004435955495232746, 'samples': 6580608, 'steps': 34273, 'loss/train': 1.8147273063659668} -08/30/2021 19:25:15 - INFO - __main__ - Step 34275: {'lr': 0.00044359219180638656, 'samples': 6580800, 'steps': 34274, 'loss/train': 0.036472879350185394} -08/30/2021 19:25:15 - INFO - __main__ - Step 34276: {'lr': 0.0004435888340022688, 'samples': 6580992, 'steps': 34275, 'loss/train': 0.8034371137619019} -08/30/2021 19:25:15 - INFO - __main__ - Step 34277: {'lr': 0.0004435854761109229, 'samples': 6581184, 'steps': 34276, 'loss/train': 2.220669984817505} -08/30/2021 19:25:17 - INFO - __main__ - Step 34278: {'lr': 0.00044358211813235046, 'samples': 6581376, 'steps': 34277, 'loss/train': 1.5848262310028076} -08/30/2021 19:25:18 - INFO - __main__ - Step 34279: {'lr': 0.0004435787600665528, 'samples': 6581568, 'steps': 34278, 'loss/train': 0.13611367344856262} -08/30/2021 19:25:18 - INFO - __main__ - Step 34280: {'lr': 0.0004435754019135315, 'samples': 6581760, 'steps': 34279, 'loss/train': 1.5251275300979614} -08/30/2021 19:25:18 - INFO - __main__ - Step 34281: {'lr': 0.0004435720436732882, 'samples': 6581952, 'steps': 34280, 'loss/train': 0.6050376296043396} -08/30/2021 19:25:19 - INFO - __main__ - Step 34282: {'lr': 0.0004435686853458243, 'samples': 6582144, 'steps': 34281, 'loss/train': 1.4607545137405396} -08/30/2021 19:25:21 - INFO - __main__ - Step 34283: {'lr': 0.0004435653269311414, 'samples': 6582336, 'steps': 34282, 'loss/train': 1.279322624206543} -08/30/2021 19:25:21 - INFO - __main__ - Step 34284: {'lr': 0.00044356196842924086, 'samples': 6582528, 'steps': 34283, 'loss/train': 1.5130841732025146} -08/30/2021 19:25:21 - INFO - __main__ - Step 34285: {'lr': 0.0004435586098401243, 'samples': 6582720, 'steps': 34284, 'loss/train': 1.7569422721862793} -08/30/2021 19:25:22 - INFO - __main__ - Step 34286: {'lr': 0.00044355525116379326, 'samples': 6582912, 'steps': 34285, 'loss/train': 2.2513930797576904} -08/30/2021 19:25:22 - INFO - __main__ - Step 34287: {'lr': 0.00044355189240024917, 'samples': 6583104, 'steps': 34286, 'loss/train': 1.1448408365249634} -08/30/2021 19:25:24 - INFO - __main__ - Step 34288: {'lr': 0.00044354853354949353, 'samples': 6583296, 'steps': 34287, 'loss/train': 1.3231486082077026} -08/30/2021 19:25:24 - INFO - __main__ - Step 34289: {'lr': 0.000443545174611528, 'samples': 6583488, 'steps': 34288, 'loss/train': 1.7273366451263428} -08/30/2021 19:25:24 - INFO - __main__ - Step 34290: {'lr': 0.000443541815586354, 'samples': 6583680, 'steps': 34289, 'loss/train': 1.305019497871399} -08/30/2021 19:25:25 - INFO - __main__ - Step 34291: {'lr': 0.0004435384564739729, 'samples': 6583872, 'steps': 34290, 'loss/train': 1.125197172164917} -08/30/2021 19:25:25 - INFO - __main__ - Step 34292: {'lr': 0.00044353509727438657, 'samples': 6584064, 'steps': 34291, 'loss/train': 0.8574925065040588} -08/30/2021 19:25:27 - INFO - __main__ - Step 34293: {'lr': 0.00044353173798759616, 'samples': 6584256, 'steps': 34292, 'loss/train': 1.1615010499954224} -08/30/2021 19:25:27 - INFO - __main__ - Step 34294: {'lr': 0.0004435283786136034, 'samples': 6584448, 'steps': 34293, 'loss/train': 1.2592524290084839} -08/30/2021 19:25:27 - INFO - __main__ - Step 34295: {'lr': 0.0004435250191524097, 'samples': 6584640, 'steps': 34294, 'loss/train': 1.0597270727157593} -08/30/2021 19:25:28 - INFO - __main__ - Step 34296: {'lr': 0.0004435216596040167, 'samples': 6584832, 'steps': 34295, 'loss/train': 1.015820860862732} -08/30/2021 19:25:28 - INFO - __main__ - Step 34297: {'lr': 0.00044351829996842575, 'samples': 6585024, 'steps': 34296, 'loss/train': 1.4411613941192627} -08/30/2021 19:25:30 - INFO - __main__ - Step 34298: {'lr': 0.00044351494024563845, 'samples': 6585216, 'steps': 34297, 'loss/train': 1.0451772212982178} -08/30/2021 19:25:30 - INFO - __main__ - Step 34299: {'lr': 0.0004435115804356563, 'samples': 6585408, 'steps': 34298, 'loss/train': 1.1034191846847534} -08/30/2021 19:25:30 - INFO - __main__ - Step 34300: {'lr': 0.0004435082205384808, 'samples': 6585600, 'steps': 34299, 'loss/train': 1.4241681098937988} -08/30/2021 19:25:31 - INFO - __main__ - Step 34301: {'lr': 0.00044350486055411354, 'samples': 6585792, 'steps': 34300, 'loss/train': 1.849123477935791} -08/30/2021 19:25:31 - INFO - __main__ - Step 34302: {'lr': 0.000443501500482556, 'samples': 6585984, 'steps': 34301, 'loss/train': 1.3144383430480957} -08/30/2021 19:25:33 - INFO - __main__ - Step 34303: {'lr': 0.0004434981403238096, 'samples': 6586176, 'steps': 34302, 'loss/train': 1.4229683876037598} -08/30/2021 19:25:33 - INFO - __main__ - Step 34304: {'lr': 0.0004434947800778759, 'samples': 6586368, 'steps': 34303, 'loss/train': 1.4115080833435059} -08/30/2021 19:25:34 - INFO - __main__ - Step 34305: {'lr': 0.0004434914197447565, 'samples': 6586560, 'steps': 34304, 'loss/train': 1.8310561180114746} -08/30/2021 19:25:34 - INFO - __main__ - Step 34306: {'lr': 0.0004434880593244528, 'samples': 6586752, 'steps': 34305, 'loss/train': 1.541959524154663} -08/30/2021 19:25:34 - INFO - __main__ - Step 34307: {'lr': 0.0004434846988169664, 'samples': 6586944, 'steps': 34306, 'loss/train': 1.6055432558059692} -08/30/2021 19:25:35 - INFO - __main__ - Step 34308: {'lr': 0.0004434813382222989, 'samples': 6587136, 'steps': 34307, 'loss/train': 1.0402737855911255} -08/30/2021 19:25:36 - INFO - __main__ - Step 34309: {'lr': 0.0004434779775404515, 'samples': 6587328, 'steps': 34308, 'loss/train': 1.6550846099853516} -08/30/2021 19:25:37 - INFO - __main__ - Step 34310: {'lr': 0.000443474616771426, 'samples': 6587520, 'steps': 34309, 'loss/train': 1.699147343635559} -08/30/2021 19:25:37 - INFO - __main__ - Step 34311: {'lr': 0.00044347125591522377, 'samples': 6587712, 'steps': 34310, 'loss/train': 1.4277589321136475} -08/30/2021 19:25:37 - INFO - __main__ - Step 34312: {'lr': 0.00044346789497184643, 'samples': 6587904, 'steps': 34311, 'loss/train': 1.2638791799545288} -08/30/2021 19:25:38 - INFO - __main__ - Step 34313: {'lr': 0.0004434645339412954, 'samples': 6588096, 'steps': 34312, 'loss/train': 1.0181409120559692} -08/30/2021 19:25:39 - INFO - __main__ - Step 34314: {'lr': 0.0004434611728235722, 'samples': 6588288, 'steps': 34313, 'loss/train': 1.0525574684143066} -08/30/2021 19:25:40 - INFO - __main__ - Step 34315: {'lr': 0.0004434578116186785, 'samples': 6588480, 'steps': 34314, 'loss/train': 1.6535593271255493} -08/30/2021 19:25:40 - INFO - __main__ - Step 34316: {'lr': 0.00044345445032661565, 'samples': 6588672, 'steps': 34315, 'loss/train': 1.7786425352096558} -08/30/2021 19:25:40 - INFO - __main__ - Step 34317: {'lr': 0.0004434510889473852, 'samples': 6588864, 'steps': 34316, 'loss/train': 1.1568361520767212} -08/30/2021 19:25:41 - INFO - __main__ - Step 34318: {'lr': 0.00044344772748098867, 'samples': 6589056, 'steps': 34317, 'loss/train': 0.9997491240501404} -08/30/2021 19:25:42 - INFO - __main__ - Step 34319: {'lr': 0.00044344436592742755, 'samples': 6589248, 'steps': 34318, 'loss/train': 1.6291216611862183} -08/30/2021 19:25:43 - INFO - __main__ - Step 34320: {'lr': 0.0004434410042867034, 'samples': 6589440, 'steps': 34319, 'loss/train': 1.8541678190231323} -08/30/2021 19:25:43 - INFO - __main__ - Step 34321: {'lr': 0.0004434376425588178, 'samples': 6589632, 'steps': 34320, 'loss/train': 1.3037652969360352} -08/30/2021 19:25:43 - INFO - __main__ - Step 34322: {'lr': 0.00044343428074377207, 'samples': 6589824, 'steps': 34321, 'loss/train': 1.7471519708633423} -08/30/2021 19:25:44 - INFO - __main__ - Step 34323: {'lr': 0.0004434309188415679, 'samples': 6590016, 'steps': 34322, 'loss/train': 1.3369140625} -08/30/2021 19:25:45 - INFO - __main__ - Step 34324: {'lr': 0.0004434275568522067, 'samples': 6590208, 'steps': 34323, 'loss/train': 0.4033282995223999} -08/30/2021 19:25:46 - INFO - __main__ - Step 34325: {'lr': 0.0004434241947756901, 'samples': 6590400, 'steps': 34324, 'loss/train': 1.3243719339370728} -08/30/2021 19:25:46 - INFO - __main__ - Step 34326: {'lr': 0.0004434208326120195, 'samples': 6590592, 'steps': 34325, 'loss/train': 1.038028359413147} -08/30/2021 19:25:47 - INFO - __main__ - Step 34327: {'lr': 0.0004434174703611964, 'samples': 6590784, 'steps': 34326, 'loss/train': 0.9112753868103027} -08/30/2021 19:25:47 - INFO - __main__ - Step 34328: {'lr': 0.00044341410802322247, 'samples': 6590976, 'steps': 34327, 'loss/train': 1.6747767925262451} -08/30/2021 19:25:47 - INFO - __main__ - Step 34329: {'lr': 0.00044341074559809903, 'samples': 6591168, 'steps': 34328, 'loss/train': 1.0039563179016113} -08/30/2021 19:25:48 - INFO - __main__ - Step 34330: {'lr': 0.00044340738308582775, 'samples': 6591360, 'steps': 34329, 'loss/train': 0.03337034955620766} -08/30/2021 19:25:49 - INFO - __main__ - Step 34331: {'lr': 0.0004434040204864101, 'samples': 6591552, 'steps': 34330, 'loss/train': 1.483001470565796} -08/30/2021 19:25:50 - INFO - __main__ - Step 34332: {'lr': 0.00044340065779984757, 'samples': 6591744, 'steps': 34331, 'loss/train': 1.5729074478149414} -08/30/2021 19:25:50 - INFO - __main__ - Step 34333: {'lr': 0.0004433972950261417, 'samples': 6591936, 'steps': 34332, 'loss/train': 1.3920680284500122} -08/30/2021 19:25:50 - INFO - __main__ - Step 34334: {'lr': 0.00044339393216529394, 'samples': 6592128, 'steps': 34333, 'loss/train': 0.399932324886322} -08/30/2021 19:25:51 - INFO - __main__ - Step 34335: {'lr': 0.00044339056921730593, 'samples': 6592320, 'steps': 34334, 'loss/train': 1.3992620706558228} -08/30/2021 19:25:53 - INFO - __main__ - Step 34336: {'lr': 0.000443387206182179, 'samples': 6592512, 'steps': 34335, 'loss/train': 1.3509875535964966} -08/30/2021 19:25:53 - INFO - __main__ - Step 34337: {'lr': 0.0004433838430599149, 'samples': 6592704, 'steps': 34336, 'loss/train': 1.7384206056594849} -08/30/2021 19:25:54 - INFO - __main__ - Step 34338: {'lr': 0.000443380479850515, 'samples': 6592896, 'steps': 34337, 'loss/train': 1.2571719884872437} -08/30/2021 19:25:54 - INFO - __main__ - Step 34339: {'lr': 0.00044337711655398083, 'samples': 6593088, 'steps': 34338, 'loss/train': 1.735754132270813} -08/30/2021 19:25:54 - INFO - __main__ - Step 34340: {'lr': 0.00044337375317031393, 'samples': 6593280, 'steps': 34339, 'loss/train': 1.4142794609069824} -08/30/2021 19:25:56 - INFO - __main__ - Step 34341: {'lr': 0.0004433703896995157, 'samples': 6593472, 'steps': 34340, 'loss/train': 1.5877922773361206} -08/30/2021 19:25:56 - INFO - __main__ - Step 34342: {'lr': 0.0004433670261415879, 'samples': 6593664, 'steps': 34341, 'loss/train': 1.3526380062103271} -08/30/2021 19:25:57 - INFO - __main__ - Step 34343: {'lr': 0.0004433636624965318, 'samples': 6593856, 'steps': 34342, 'loss/train': 1.3758047819137573} -08/30/2021 19:25:57 - INFO - __main__ - Step 34344: {'lr': 0.0004433602987643491, 'samples': 6594048, 'steps': 34343, 'loss/train': 2.0959386825561523} -08/30/2021 19:25:57 - INFO - __main__ - Step 34345: {'lr': 0.00044335693494504115, 'samples': 6594240, 'steps': 34344, 'loss/train': 1.9930661916732788} -08/30/2021 19:25:59 - INFO - __main__ - Step 34346: {'lr': 0.00044335357103860964, 'samples': 6594432, 'steps': 34345, 'loss/train': 1.3216766119003296} -08/30/2021 19:25:59 - INFO - __main__ - Step 34347: {'lr': 0.0004433502070450559, 'samples': 6594624, 'steps': 34346, 'loss/train': 1.0442615747451782} -08/30/2021 19:25:59 - INFO - __main__ - Step 34348: {'lr': 0.0004433468429643816, 'samples': 6594816, 'steps': 34347, 'loss/train': 1.3631224632263184} -08/30/2021 19:26:00 - INFO - __main__ - Step 34349: {'lr': 0.00044334347879658817, 'samples': 6595008, 'steps': 34348, 'loss/train': 1.4799100160598755} -08/30/2021 19:26:00 - INFO - __main__ - Step 34350: {'lr': 0.0004433401145416771, 'samples': 6595200, 'steps': 34349, 'loss/train': 1.4209132194519043} -08/30/2021 19:26:01 - INFO - __main__ - Step 34351: {'lr': 0.00044333675019965, 'samples': 6595392, 'steps': 34350, 'loss/train': 0.5847344994544983} -08/30/2021 19:26:02 - INFO - __main__ - Step 34352: {'lr': 0.00044333338577050844, 'samples': 6595584, 'steps': 34351, 'loss/train': 0.5432370901107788} -08/30/2021 19:26:02 - INFO - __main__ - Step 34353: {'lr': 0.0004433300212542537, 'samples': 6595776, 'steps': 34352, 'loss/train': 1.5141524076461792} -08/30/2021 19:26:03 - INFO - __main__ - Step 34354: {'lr': 0.00044332665665088755, 'samples': 6595968, 'steps': 34353, 'loss/train': 0.999143660068512} -08/30/2021 19:26:03 - INFO - __main__ - Step 34355: {'lr': 0.00044332329196041133, 'samples': 6596160, 'steps': 34354, 'loss/train': 1.7645156383514404} -08/30/2021 19:26:03 - INFO - __main__ - Step 34356: {'lr': 0.0004433199271828267, 'samples': 6596352, 'steps': 34355, 'loss/train': 1.7707819938659668} -08/30/2021 19:26:05 - INFO - __main__ - Step 34357: {'lr': 0.0004433165623181349, 'samples': 6596544, 'steps': 34356, 'loss/train': 0.4831221103668213} -08/30/2021 19:26:05 - INFO - __main__ - Step 34358: {'lr': 0.0004433131973663378, 'samples': 6596736, 'steps': 34357, 'loss/train': 1.2558364868164062} -08/30/2021 19:26:06 - INFO - __main__ - Step 34359: {'lr': 0.0004433098323274367, 'samples': 6596928, 'steps': 34358, 'loss/train': 1.8244661092758179} -08/30/2021 19:26:06 - INFO - __main__ - Step 34360: {'lr': 0.00044330646720143317, 'samples': 6597120, 'steps': 34359, 'loss/train': 1.5290697813034058} -08/30/2021 19:26:06 - INFO - __main__ - Step 34361: {'lr': 0.0004433031019883288, 'samples': 6597312, 'steps': 34360, 'loss/train': 1.1753313541412354} -08/30/2021 19:26:08 - INFO - __main__ - Step 34362: {'lr': 0.00044329973668812497, 'samples': 6597504, 'steps': 34361, 'loss/train': 1.4041204452514648} -08/30/2021 19:26:08 - INFO - __main__ - Step 34363: {'lr': 0.00044329637130082324, 'samples': 6597696, 'steps': 34362, 'loss/train': 1.5539454221725464} -08/30/2021 19:26:09 - INFO - __main__ - Step 34364: {'lr': 0.00044329300582642516, 'samples': 6597888, 'steps': 34363, 'loss/train': 0.8712891936302185} -08/30/2021 19:26:09 - INFO - __main__ - Step 34365: {'lr': 0.0004432896402649323, 'samples': 6598080, 'steps': 34364, 'loss/train': 1.9170267581939697} -08/30/2021 19:26:09 - INFO - __main__ - Step 34366: {'lr': 0.0004432862746163461, 'samples': 6598272, 'steps': 34365, 'loss/train': 1.5498980283737183} -08/30/2021 19:26:11 - INFO - __main__ - Step 34367: {'lr': 0.000443282908880668, 'samples': 6598464, 'steps': 34366, 'loss/train': 1.7895435094833374} -08/30/2021 19:26:11 - INFO - __main__ - Step 34368: {'lr': 0.00044327954305789963, 'samples': 6598656, 'steps': 34367, 'loss/train': 1.296325922012329} -08/30/2021 19:26:12 - INFO - __main__ - Step 34369: {'lr': 0.0004432761771480426, 'samples': 6598848, 'steps': 34368, 'loss/train': 1.6100263595581055} -08/30/2021 19:26:12 - INFO - __main__ - Step 34370: {'lr': 0.0004432728111510982, 'samples': 6599040, 'steps': 34369, 'loss/train': 1.3352285623550415} -08/30/2021 19:26:12 - INFO - __main__ - Step 34371: {'lr': 0.000443269445067068, 'samples': 6599232, 'steps': 34370, 'loss/train': 1.4644743204116821} -08/30/2021 19:26:14 - INFO - __main__ - Step 34372: {'lr': 0.0004432660788959537, 'samples': 6599424, 'steps': 34371, 'loss/train': 0.0805610790848732} -08/30/2021 19:26:14 - INFO - __main__ - Step 34373: {'lr': 0.00044326271263775657, 'samples': 6599616, 'steps': 34372, 'loss/train': 1.8947086334228516} -08/30/2021 19:26:15 - INFO - __main__ - Step 34374: {'lr': 0.0004432593462924783, 'samples': 6599808, 'steps': 34373, 'loss/train': 1.1238963603973389} -08/30/2021 19:26:15 - INFO - __main__ - Step 34375: {'lr': 0.0004432559798601203, 'samples': 6600000, 'steps': 34374, 'loss/train': 0.7812830209732056} -08/30/2021 19:26:15 - INFO - __main__ - Step 34376: {'lr': 0.0004432526133406842, 'samples': 6600192, 'steps': 34375, 'loss/train': 0.54055255651474} -08/30/2021 19:26:17 - INFO - __main__ - Step 34377: {'lr': 0.0004432492467341715, 'samples': 6600384, 'steps': 34376, 'loss/train': 1.493737816810608} -08/30/2021 19:26:17 - INFO - __main__ - Step 34378: {'lr': 0.00044324588004058364, 'samples': 6600576, 'steps': 34377, 'loss/train': 1.344374179840088} -08/30/2021 19:26:18 - INFO - __main__ - Step 34379: {'lr': 0.00044324251325992214, 'samples': 6600768, 'steps': 34378, 'loss/train': 1.3997677564620972} -08/30/2021 19:26:18 - INFO - __main__ - Step 34380: {'lr': 0.0004432391463921885, 'samples': 6600960, 'steps': 34379, 'loss/train': 1.1257917881011963} -08/30/2021 19:26:18 - INFO - __main__ - Step 34381: {'lr': 0.00044323577943738437, 'samples': 6601152, 'steps': 34380, 'loss/train': 1.6540206670761108} -08/30/2021 19:26:20 - INFO - __main__ - Step 34382: {'lr': 0.00044323241239551113, 'samples': 6601344, 'steps': 34381, 'loss/train': 1.5172102451324463} -08/30/2021 19:26:20 - INFO - __main__ - Step 34383: {'lr': 0.0004432290452665704, 'samples': 6601536, 'steps': 34382, 'loss/train': 1.7449623346328735} -08/30/2021 19:26:21 - INFO - __main__ - Step 34384: {'lr': 0.00044322567805056356, 'samples': 6601728, 'steps': 34383, 'loss/train': 1.4433776140213013} -08/30/2021 19:26:21 - INFO - __main__ - Step 34385: {'lr': 0.00044322231074749225, 'samples': 6601920, 'steps': 34384, 'loss/train': 1.4767518043518066} -08/30/2021 19:26:21 - INFO - __main__ - Step 34386: {'lr': 0.0004432189433573579, 'samples': 6602112, 'steps': 34385, 'loss/train': 1.5803310871124268} -08/30/2021 19:26:22 - INFO - __main__ - Step 34387: {'lr': 0.00044321557588016214, 'samples': 6602304, 'steps': 34386, 'loss/train': 1.4494335651397705} -08/30/2021 19:26:23 - INFO - __main__ - Step 34388: {'lr': 0.0004432122083159065, 'samples': 6602496, 'steps': 34387, 'loss/train': 1.1938616037368774} -08/30/2021 19:26:24 - INFO - __main__ - Step 34389: {'lr': 0.0004432088406645922, 'samples': 6602688, 'steps': 34388, 'loss/train': 1.8994015455245972} -08/30/2021 19:26:24 - INFO - __main__ - Step 34390: {'lr': 0.00044320547292622114, 'samples': 6602880, 'steps': 34389, 'loss/train': 1.6787949800491333} -08/30/2021 19:26:25 - INFO - __main__ - Step 34391: {'lr': 0.0004432021051007946, 'samples': 6603072, 'steps': 34390, 'loss/train': 1.8606735467910767} -08/30/2021 19:26:25 - INFO - __main__ - Step 34392: {'lr': 0.00044319873718831425, 'samples': 6603264, 'steps': 34391, 'loss/train': 0.8606879115104675} -08/30/2021 19:26:27 - INFO - __main__ - Step 34393: {'lr': 0.00044319536918878156, 'samples': 6603456, 'steps': 34392, 'loss/train': 0.12102912366390228} -08/30/2021 19:26:27 - INFO - __main__ - Step 34394: {'lr': 0.00044319200110219794, 'samples': 6603648, 'steps': 34393, 'loss/train': 1.3255921602249146} -08/30/2021 19:26:28 - INFO - __main__ - Step 34395: {'lr': 0.000443188632928565, 'samples': 6603840, 'steps': 34394, 'loss/train': 2.069284200668335} -08/30/2021 19:26:28 - INFO - __main__ - Step 34396: {'lr': 0.0004431852646678842, 'samples': 6604032, 'steps': 34395, 'loss/train': 0.936872661113739} -08/30/2021 19:26:28 - INFO - __main__ - Step 34397: {'lr': 0.00044318189632015716, 'samples': 6604224, 'steps': 34396, 'loss/train': 1.3372077941894531} -08/30/2021 19:26:30 - INFO - __main__ - Step 34398: {'lr': 0.0004431785278853853, 'samples': 6604416, 'steps': 34397, 'loss/train': 1.3406580686569214} -08/30/2021 19:26:30 - INFO - __main__ - Step 34399: {'lr': 0.0004431751593635702, 'samples': 6604608, 'steps': 34398, 'loss/train': 1.3278084993362427} -08/30/2021 19:26:31 - INFO - __main__ - Step 34400: {'lr': 0.00044317179075471335, 'samples': 6604800, 'steps': 34399, 'loss/train': 0.38800692558288574} -08/30/2021 19:26:31 - INFO - __main__ - Step 34401: {'lr': 0.00044316842205881625, 'samples': 6604992, 'steps': 34400, 'loss/train': 1.2890698909759521} -08/30/2021 19:26:31 - INFO - __main__ - Step 34402: {'lr': 0.00044316505327588054, 'samples': 6605184, 'steps': 34401, 'loss/train': 0.9331830143928528} -08/30/2021 19:26:33 - INFO - __main__ - Step 34403: {'lr': 0.00044316168440590757, 'samples': 6605376, 'steps': 34402, 'loss/train': 1.6600427627563477} -08/30/2021 19:26:33 - INFO - __main__ - Step 34404: {'lr': 0.00044315831544889886, 'samples': 6605568, 'steps': 34403, 'loss/train': 1.3622405529022217} -08/30/2021 19:26:34 - INFO - __main__ - Step 34405: {'lr': 0.0004431549464048561, 'samples': 6605760, 'steps': 34404, 'loss/train': 1.027209997177124} -08/30/2021 19:26:34 - INFO - __main__ - Step 34406: {'lr': 0.0004431515772737806, 'samples': 6605952, 'steps': 34405, 'loss/train': 1.2644612789154053} -08/30/2021 19:26:34 - INFO - __main__ - Step 34407: {'lr': 0.000443148208055674, 'samples': 6606144, 'steps': 34406, 'loss/train': 1.3569592237472534} -08/30/2021 19:26:36 - INFO - __main__ - Step 34408: {'lr': 0.0004431448387505379, 'samples': 6606336, 'steps': 34407, 'loss/train': 1.3876062631607056} -08/30/2021 19:26:37 - INFO - __main__ - Step 34409: {'lr': 0.00044314146935837365, 'samples': 6606528, 'steps': 34408, 'loss/train': 1.5231746435165405} -08/30/2021 19:26:37 - INFO - __main__ - Step 34410: {'lr': 0.0004431380998791828, 'samples': 6606720, 'steps': 34409, 'loss/train': 1.3941922187805176} -08/30/2021 19:26:37 - INFO - __main__ - Step 34411: {'lr': 0.0004431347303129669, 'samples': 6606912, 'steps': 34410, 'loss/train': 0.9178640842437744} -08/30/2021 19:26:38 - INFO - __main__ - Step 34412: {'lr': 0.00044313136065972754, 'samples': 6607104, 'steps': 34411, 'loss/train': 0.030487028881907463} -08/30/2021 19:26:38 - INFO - __main__ - Step 34413: {'lr': 0.0004431279909194661, 'samples': 6607296, 'steps': 34412, 'loss/train': 1.2436041831970215} -08/30/2021 19:26:40 - INFO - __main__ - Step 34414: {'lr': 0.00044312462109218423, 'samples': 6607488, 'steps': 34413, 'loss/train': 1.8023035526275635} -08/30/2021 19:26:40 - INFO - __main__ - Step 34415: {'lr': 0.0004431212511778834, 'samples': 6607680, 'steps': 34414, 'loss/train': 1.4230846166610718} -08/30/2021 19:26:41 - INFO - __main__ - Step 34416: {'lr': 0.000443117881176565, 'samples': 6607872, 'steps': 34415, 'loss/train': 1.2220278978347778} -08/30/2021 19:26:41 - INFO - __main__ - Step 34417: {'lr': 0.00044311451108823075, 'samples': 6608064, 'steps': 34416, 'loss/train': 1.4115710258483887} -08/30/2021 19:26:41 - INFO - __main__ - Step 34418: {'lr': 0.00044311114091288205, 'samples': 6608256, 'steps': 34417, 'loss/train': 1.3294082880020142} -08/30/2021 19:26:43 - INFO - __main__ - Step 34419: {'lr': 0.0004431077706505205, 'samples': 6608448, 'steps': 34418, 'loss/train': 1.5514307022094727} -08/30/2021 19:26:43 - INFO - __main__ - Step 34420: {'lr': 0.0004431044003011475, 'samples': 6608640, 'steps': 34419, 'loss/train': 0.8480591177940369} -08/30/2021 19:26:43 - INFO - __main__ - Step 34421: {'lr': 0.00044310102986476463, 'samples': 6608832, 'steps': 34420, 'loss/train': 1.857121229171753} -08/30/2021 19:26:44 - INFO - __main__ - Step 34422: {'lr': 0.0004430976593413735, 'samples': 6609024, 'steps': 34421, 'loss/train': 1.5511581897735596} -08/30/2021 19:26:44 - INFO - __main__ - Step 34423: {'lr': 0.0004430942887309755, 'samples': 6609216, 'steps': 34422, 'loss/train': 1.3938441276550293} -08/30/2021 19:26:46 - INFO - __main__ - Step 34424: {'lr': 0.00044309091803357216, 'samples': 6609408, 'steps': 34423, 'loss/train': 1.754330039024353} -08/30/2021 19:26:46 - INFO - __main__ - Step 34425: {'lr': 0.0004430875472491651, 'samples': 6609600, 'steps': 34424, 'loss/train': 3.110199213027954} -08/30/2021 19:26:47 - INFO - __main__ - Step 34426: {'lr': 0.0004430841763777557, 'samples': 6609792, 'steps': 34425, 'loss/train': 1.2199982404708862} -08/30/2021 19:26:47 - INFO - __main__ - Step 34427: {'lr': 0.0004430808054193456, 'samples': 6609984, 'steps': 34426, 'loss/train': 1.3279060125350952} -08/30/2021 19:26:47 - INFO - __main__ - Step 34428: {'lr': 0.00044307743437393623, 'samples': 6610176, 'steps': 34427, 'loss/train': 1.2195956707000732} -08/30/2021 19:26:48 - INFO - __main__ - Step 34429: {'lr': 0.0004430740632415292, 'samples': 6610368, 'steps': 34428, 'loss/train': 1.2849218845367432} -08/30/2021 19:26:49 - INFO - __main__ - Step 34430: {'lr': 0.0004430706920221259, 'samples': 6610560, 'steps': 34429, 'loss/train': 0.079468734562397} -08/30/2021 19:26:50 - INFO - __main__ - Step 34431: {'lr': 0.00044306732071572796, 'samples': 6610752, 'steps': 34430, 'loss/train': 1.4782328605651855} -08/30/2021 19:26:50 - INFO - __main__ - Step 34432: {'lr': 0.00044306394932233694, 'samples': 6610944, 'steps': 34431, 'loss/train': 1.4525034427642822} -08/30/2021 19:26:50 - INFO - __main__ - Step 34433: {'lr': 0.0004430605778419542, 'samples': 6611136, 'steps': 34432, 'loss/train': 0.5215873718261719} -08/30/2021 19:26:51 - INFO - __main__ - Step 34434: {'lr': 0.00044305720627458136, 'samples': 6611328, 'steps': 34433, 'loss/train': 1.5125080347061157} -08/30/2021 19:26:52 - INFO - __main__ - Step 34435: {'lr': 0.00044305383462022, 'samples': 6611520, 'steps': 34434, 'loss/train': 0.8998143672943115} -08/30/2021 19:26:53 - INFO - __main__ - Step 34436: {'lr': 0.0004430504628788714, 'samples': 6611712, 'steps': 34435, 'loss/train': 1.93230402469635} -08/30/2021 19:26:53 - INFO - __main__ - Step 34437: {'lr': 0.0004430470910505373, 'samples': 6611904, 'steps': 34436, 'loss/train': 1.4839353561401367} -08/30/2021 19:26:53 - INFO - __main__ - Step 34438: {'lr': 0.00044304371913521926, 'samples': 6612096, 'steps': 34437, 'loss/train': 0.6594424247741699} -08/30/2021 19:26:54 - INFO - __main__ - Step 34439: {'lr': 0.0004430403471329186, 'samples': 6612288, 'steps': 34438, 'loss/train': 1.6658412218093872} -08/30/2021 19:26:55 - INFO - __main__ - Step 34440: {'lr': 0.0004430369750436369, 'samples': 6612480, 'steps': 34439, 'loss/train': 1.7098740339279175} -08/30/2021 19:26:56 - INFO - __main__ - Step 34441: {'lr': 0.0004430336028673758, 'samples': 6612672, 'steps': 34440, 'loss/train': 1.4242730140686035} -08/30/2021 19:26:56 - INFO - __main__ - Step 34442: {'lr': 0.00044303023060413677, 'samples': 6612864, 'steps': 34441, 'loss/train': 1.324416160583496} -08/30/2021 19:26:56 - INFO - __main__ - Step 34443: {'lr': 0.0004430268582539212, 'samples': 6613056, 'steps': 34442, 'loss/train': 1.3261427879333496} -08/30/2021 19:26:57 - INFO - __main__ - Step 34444: {'lr': 0.0004430234858167308, 'samples': 6613248, 'steps': 34443, 'loss/train': 1.37202787399292} -08/30/2021 19:26:59 - INFO - __main__ - Step 34445: {'lr': 0.000443020113292567, 'samples': 6613440, 'steps': 34444, 'loss/train': 1.631679892539978} -08/30/2021 19:26:59 - INFO - __main__ - Step 34446: {'lr': 0.0004430167406814312, 'samples': 6613632, 'steps': 34445, 'loss/train': 1.7860093116760254} -08/30/2021 19:26:59 - INFO - __main__ - Step 34447: {'lr': 0.0004430133679833251, 'samples': 6613824, 'steps': 34446, 'loss/train': 1.346189022064209} -08/30/2021 19:27:00 - INFO - __main__ - Step 34448: {'lr': 0.00044300999519825016, 'samples': 6614016, 'steps': 34447, 'loss/train': 1.6412649154663086} -08/30/2021 19:27:00 - INFO - __main__ - Step 34449: {'lr': 0.00044300662232620784, 'samples': 6614208, 'steps': 34448, 'loss/train': 1.8074865341186523} -08/30/2021 19:27:02 - INFO - __main__ - Step 34450: {'lr': 0.0004430032493671998, 'samples': 6614400, 'steps': 34449, 'loss/train': 0.7451086044311523} -08/30/2021 19:27:02 - INFO - __main__ - Step 34451: {'lr': 0.0004429998763212274, 'samples': 6614592, 'steps': 34450, 'loss/train': 1.337473750114441} -08/30/2021 19:27:03 - INFO - __main__ - Step 34452: {'lr': 0.00044299650318829233, 'samples': 6614784, 'steps': 34451, 'loss/train': 1.1569933891296387} -08/30/2021 19:27:03 - INFO - __main__ - Step 34453: {'lr': 0.0004429931299683959, 'samples': 6614976, 'steps': 34452, 'loss/train': 1.5492223501205444} -08/30/2021 19:27:03 - INFO - __main__ - Step 34454: {'lr': 0.0004429897566615398, 'samples': 6615168, 'steps': 34453, 'loss/train': 1.2494310140609741} -08/30/2021 19:27:04 - INFO - __main__ - Step 34455: {'lr': 0.0004429863832677255, 'samples': 6615360, 'steps': 34454, 'loss/train': 1.5201736688613892} -08/30/2021 19:27:05 - INFO - __main__ - Step 34456: {'lr': 0.0004429830097869545, 'samples': 6615552, 'steps': 34455, 'loss/train': 0.14513061940670013} -08/30/2021 19:27:06 - INFO - __main__ - Step 34457: {'lr': 0.0004429796362192283, 'samples': 6615744, 'steps': 34456, 'loss/train': 1.0094025135040283} -08/30/2021 19:27:06 - INFO - __main__ - Step 34458: {'lr': 0.0004429762625645485, 'samples': 6615936, 'steps': 34457, 'loss/train': 1.3376976251602173} -08/30/2021 19:27:06 - INFO - __main__ - Step 34459: {'lr': 0.0004429728888229166, 'samples': 6616128, 'steps': 34458, 'loss/train': 1.3319414854049683} -08/30/2021 19:27:07 - INFO - __main__ - Step 34460: {'lr': 0.000442969514994334, 'samples': 6616320, 'steps': 34459, 'loss/train': 1.7238891124725342} -08/30/2021 19:27:09 - INFO - __main__ - Step 34461: {'lr': 0.0004429661410788024, 'samples': 6616512, 'steps': 34460, 'loss/train': 1.6685853004455566} -08/30/2021 19:27:09 - INFO - __main__ - Step 34462: {'lr': 0.00044296276707632323, 'samples': 6616704, 'steps': 34461, 'loss/train': 1.4678622484207153} -08/30/2021 19:27:10 - INFO - __main__ - Step 34463: {'lr': 0.000442959392986898, 'samples': 6616896, 'steps': 34462, 'loss/train': 1.3602629899978638} -08/30/2021 19:27:10 - INFO - __main__ - Step 34464: {'lr': 0.0004429560188105282, 'samples': 6617088, 'steps': 34463, 'loss/train': 1.3855806589126587} -08/30/2021 19:27:10 - INFO - __main__ - Step 34465: {'lr': 0.00044295264454721544, 'samples': 6617280, 'steps': 34464, 'loss/train': 0.08018211275339127} -08/30/2021 19:27:11 - INFO - __main__ - Step 34466: {'lr': 0.0004429492701969612, 'samples': 6617472, 'steps': 34465, 'loss/train': 0.2471642941236496} -08/30/2021 19:27:12 - INFO - __main__ - Step 34467: {'lr': 0.00044294589575976696, 'samples': 6617664, 'steps': 34466, 'loss/train': 1.3627315759658813} -08/30/2021 19:27:13 - INFO - __main__ - Step 34468: {'lr': 0.00044294252123563434, 'samples': 6617856, 'steps': 34467, 'loss/train': 1.3598071336746216} -08/30/2021 19:27:13 - INFO - __main__ - Step 34469: {'lr': 0.00044293914662456475, 'samples': 6618048, 'steps': 34468, 'loss/train': 1.3098459243774414} -08/30/2021 19:27:13 - INFO - __main__ - Step 34470: {'lr': 0.00044293577192655977, 'samples': 6618240, 'steps': 34469, 'loss/train': 1.1171422004699707} -08/30/2021 19:27:14 - INFO - __main__ - Step 34471: {'lr': 0.0004429323971416209, 'samples': 6618432, 'steps': 34470, 'loss/train': 1.1799956560134888} -08/30/2021 19:27:15 - INFO - __main__ - Step 34472: {'lr': 0.0004429290222697497, 'samples': 6618624, 'steps': 34471, 'loss/train': 1.2923181056976318} -08/30/2021 19:27:16 - INFO - __main__ - Step 34473: {'lr': 0.0004429256473109476, 'samples': 6618816, 'steps': 34472, 'loss/train': 1.2467824220657349} -08/30/2021 19:27:16 - INFO - __main__ - Step 34474: {'lr': 0.0004429222722652162, 'samples': 6619008, 'steps': 34473, 'loss/train': 0.024378672242164612} -08/30/2021 19:27:17 - INFO - __main__ - Step 34475: {'lr': 0.0004429188971325571, 'samples': 6619200, 'steps': 34474, 'loss/train': 1.4998093843460083} -08/30/2021 19:27:17 - INFO - __main__ - Step 34476: {'lr': 0.00044291552191297155, 'samples': 6619392, 'steps': 34475, 'loss/train': 1.4220741987228394} -08/30/2021 19:27:17 - INFO - __main__ - Step 34477: {'lr': 0.0004429121466064614, 'samples': 6619584, 'steps': 34476, 'loss/train': 2.0970053672790527} -08/30/2021 19:27:19 - INFO - __main__ - Step 34478: {'lr': 0.0004429087712130279, 'samples': 6619776, 'steps': 34477, 'loss/train': 1.473771572113037} -08/30/2021 19:27:19 - INFO - __main__ - Step 34479: {'lr': 0.00044290539573267276, 'samples': 6619968, 'steps': 34478, 'loss/train': 1.2748184204101562} -08/30/2021 19:27:20 - INFO - __main__ - Step 34480: {'lr': 0.00044290202016539736, 'samples': 6620160, 'steps': 34479, 'loss/train': 1.4546483755111694} -08/30/2021 19:27:20 - INFO - __main__ - Step 34481: {'lr': 0.0004428986445112033, 'samples': 6620352, 'steps': 34480, 'loss/train': 1.1653300523757935} -08/30/2021 19:27:21 - INFO - __main__ - Step 34482: {'lr': 0.00044289526877009213, 'samples': 6620544, 'steps': 34481, 'loss/train': 1.4459903240203857} -08/30/2021 19:27:21 - INFO - __main__ - Step 34483: {'lr': 0.00044289189294206534, 'samples': 6620736, 'steps': 34482, 'loss/train': 1.0771769285202026} -08/30/2021 19:27:22 - INFO - __main__ - Step 34484: {'lr': 0.0004428885170271244, 'samples': 6620928, 'steps': 34483, 'loss/train': 1.309779405593872} -08/30/2021 19:27:23 - INFO - __main__ - Step 34485: {'lr': 0.0004428851410252709, 'samples': 6621120, 'steps': 34484, 'loss/train': 1.2912912368774414} -08/30/2021 19:27:23 - INFO - __main__ - Step 34486: {'lr': 0.0004428817649365063, 'samples': 6621312, 'steps': 34485, 'loss/train': 0.8086441159248352} -08/30/2021 19:27:24 - INFO - __main__ - Step 34487: {'lr': 0.0004428783887608321, 'samples': 6621504, 'steps': 34486, 'loss/train': 1.2254034280776978} -08/30/2021 19:27:24 - INFO - __main__ - Step 34488: {'lr': 0.00044287501249824996, 'samples': 6621696, 'steps': 34487, 'loss/train': 1.6118260622024536} -08/30/2021 19:27:26 - INFO - __main__ - Step 34489: {'lr': 0.0004428716361487613, 'samples': 6621888, 'steps': 34488, 'loss/train': 4.752957820892334} -08/30/2021 19:27:26 - INFO - __main__ - Step 34490: {'lr': 0.0004428682597123677, 'samples': 6622080, 'steps': 34489, 'loss/train': 0.2814444601535797} -08/30/2021 19:27:26 - INFO - __main__ - Step 34491: {'lr': 0.0004428648831890705, 'samples': 6622272, 'steps': 34490, 'loss/train': 1.516649603843689} -08/30/2021 19:27:27 - INFO - __main__ - Step 34492: {'lr': 0.0004428615065788715, 'samples': 6622464, 'steps': 34491, 'loss/train': 1.6049208641052246} -08/30/2021 19:27:27 - INFO - __main__ - Step 34493: {'lr': 0.00044285812988177197, 'samples': 6622656, 'steps': 34492, 'loss/train': 1.1035348176956177} -08/30/2021 19:27:29 - INFO - __main__ - Step 34494: {'lr': 0.0004428547530977736, 'samples': 6622848, 'steps': 34493, 'loss/train': 1.8791131973266602} -08/30/2021 19:27:29 - INFO - __main__ - Step 34495: {'lr': 0.0004428513762268779, 'samples': 6623040, 'steps': 34494, 'loss/train': 0.6788734793663025} -08/30/2021 19:27:29 - INFO - __main__ - Step 34496: {'lr': 0.00044284799926908627, 'samples': 6623232, 'steps': 34495, 'loss/train': 1.5275757312774658} -08/30/2021 19:27:30 - INFO - __main__ - Step 34497: {'lr': 0.0004428446222244004, 'samples': 6623424, 'steps': 34496, 'loss/train': 1.2486664056777954} -08/30/2021 19:27:30 - INFO - __main__ - Step 34498: {'lr': 0.0004428412450928216, 'samples': 6623616, 'steps': 34497, 'loss/train': 1.8646252155303955} -08/30/2021 19:27:32 - INFO - __main__ - Step 34499: {'lr': 0.00044283786787435156, 'samples': 6623808, 'steps': 34498, 'loss/train': 2.15881085395813} -08/30/2021 19:27:33 - INFO - __main__ - Step 34500: {'lr': 0.0004428344905689917, 'samples': 6624000, 'steps': 34499, 'loss/train': 1.4565550088882446} -08/30/2021 19:27:33 - INFO - __main__ - Step 34501: {'lr': 0.0004428311131767437, 'samples': 6624192, 'steps': 34500, 'loss/train': 1.437974452972412} -08/30/2021 19:27:33 - INFO - __main__ - Step 34502: {'lr': 0.0004428277356976089, 'samples': 6624384, 'steps': 34501, 'loss/train': 2.451415777206421} -08/30/2021 19:27:34 - INFO - __main__ - Step 34503: {'lr': 0.0004428243581315889, 'samples': 6624576, 'steps': 34502, 'loss/train': 1.4674867391586304} -08/30/2021 19:27:35 - INFO - __main__ - Step 34504: {'lr': 0.0004428209804786853, 'samples': 6624768, 'steps': 34503, 'loss/train': 0.14034180343151093} -08/30/2021 19:27:36 - INFO - __main__ - Step 34505: {'lr': 0.0004428176027388995, 'samples': 6624960, 'steps': 34504, 'loss/train': 1.5051461458206177} -08/30/2021 19:27:36 - INFO - __main__ - Step 34506: {'lr': 0.0004428142249122331, 'samples': 6625152, 'steps': 34505, 'loss/train': 1.3033932447433472} -08/30/2021 19:27:36 - INFO - __main__ - Step 34507: {'lr': 0.00044281084699868747, 'samples': 6625344, 'steps': 34506, 'loss/train': 1.6993290185928345} -08/30/2021 19:27:37 - INFO - __main__ - Step 34508: {'lr': 0.0004428074689982643, 'samples': 6625536, 'steps': 34507, 'loss/train': 1.1897045373916626} -08/30/2021 19:27:37 - INFO - __main__ - Step 34509: {'lr': 0.0004428040909109651, 'samples': 6625728, 'steps': 34508, 'loss/train': 1.6434334516525269} -08/30/2021 19:27:39 - INFO - __main__ - Step 34510: {'lr': 0.00044280071273679133, 'samples': 6625920, 'steps': 34509, 'loss/train': 0.6318305134773254} -08/30/2021 19:27:39 - INFO - __main__ - Step 34511: {'lr': 0.00044279733447574456, 'samples': 6626112, 'steps': 34510, 'loss/train': 1.4127222299575806} -08/30/2021 19:27:39 - INFO - __main__ - Step 34512: {'lr': 0.00044279395612782625, 'samples': 6626304, 'steps': 34511, 'loss/train': 1.2508999109268188} -08/30/2021 19:27:40 - INFO - __main__ - Step 34513: {'lr': 0.0004427905776930379, 'samples': 6626496, 'steps': 34512, 'loss/train': 1.570178508758545} -08/30/2021 19:27:40 - INFO - __main__ - Step 34514: {'lr': 0.0004427871991713812, 'samples': 6626688, 'steps': 34513, 'loss/train': 1.290770411491394} -08/30/2021 19:27:42 - INFO - __main__ - Step 34515: {'lr': 0.0004427838205628575, 'samples': 6626880, 'steps': 34514, 'loss/train': 1.4480304718017578} -08/30/2021 19:27:42 - INFO - __main__ - Step 34516: {'lr': 0.0004427804418674684, 'samples': 6627072, 'steps': 34515, 'loss/train': 1.6381162405014038} -08/30/2021 19:27:42 - INFO - __main__ - Step 34517: {'lr': 0.00044277706308521543, 'samples': 6627264, 'steps': 34516, 'loss/train': 1.5167180299758911} -08/30/2021 19:27:43 - INFO - __main__ - Step 34518: {'lr': 0.0004427736842161001, 'samples': 6627456, 'steps': 34517, 'loss/train': 1.8896290063858032} -08/30/2021 19:27:43 - INFO - __main__ - Step 34519: {'lr': 0.00044277030526012386, 'samples': 6627648, 'steps': 34518, 'loss/train': 1.2373080253601074} -08/30/2021 19:27:45 - INFO - __main__ - Step 34520: {'lr': 0.0004427669262172883, 'samples': 6627840, 'steps': 34519, 'loss/train': 1.4679688215255737} -08/30/2021 19:27:45 - INFO - __main__ - Step 34521: {'lr': 0.000442763547087595, 'samples': 6628032, 'steps': 34520, 'loss/train': 2.0088555812835693} -08/30/2021 19:27:46 - INFO - __main__ - Step 34522: {'lr': 0.00044276016787104535, 'samples': 6628224, 'steps': 34521, 'loss/train': 1.9846179485321045} -08/30/2021 19:27:46 - INFO - __main__ - Step 34523: {'lr': 0.000442756788567641, 'samples': 6628416, 'steps': 34522, 'loss/train': 0.6158360242843628} -08/30/2021 19:27:46 - INFO - __main__ - Step 34524: {'lr': 0.0004427534091773834, 'samples': 6628608, 'steps': 34523, 'loss/train': 1.708936333656311} -08/30/2021 19:27:48 - INFO - __main__ - Step 34525: {'lr': 0.00044275002970027403, 'samples': 6628800, 'steps': 34524, 'loss/train': 1.1619412899017334} -08/30/2021 19:27:49 - INFO - __main__ - Step 34526: {'lr': 0.00044274665013631457, 'samples': 6628992, 'steps': 34525, 'loss/train': 1.3224120140075684} -08/30/2021 19:27:49 - INFO - __main__ - Step 34527: {'lr': 0.0004427432704855064, 'samples': 6629184, 'steps': 34526, 'loss/train': 1.686940312385559} -08/30/2021 19:27:49 - INFO - __main__ - Step 34528: {'lr': 0.000442739890747851, 'samples': 6629376, 'steps': 34527, 'loss/train': 0.1830187737941742} -08/30/2021 19:27:50 - INFO - __main__ - Step 34529: {'lr': 0.0004427365109233502, 'samples': 6629568, 'steps': 34528, 'loss/train': 0.5719832181930542} -08/30/2021 19:27:50 - INFO - __main__ - Step 34530: {'lr': 0.00044273313101200507, 'samples': 6629760, 'steps': 34529, 'loss/train': 1.2203422784805298} -08/30/2021 19:27:51 - INFO - __main__ - Step 34531: {'lr': 0.00044272975101381754, 'samples': 6629952, 'steps': 34530, 'loss/train': 1.482810616493225} -08/30/2021 19:27:52 - INFO - __main__ - Step 34532: {'lr': 0.0004427263709287889, 'samples': 6630144, 'steps': 34531, 'loss/train': 1.3061579465866089} -08/30/2021 19:27:52 - INFO - __main__ - Step 34533: {'lr': 0.00044272299075692067, 'samples': 6630336, 'steps': 34532, 'loss/train': 1.6461799144744873} -08/30/2021 19:27:53 - INFO - __main__ - Step 34534: {'lr': 0.0004427196104982145, 'samples': 6630528, 'steps': 34533, 'loss/train': 1.2202532291412354} -08/30/2021 19:27:53 - INFO - __main__ - Step 34535: {'lr': 0.0004427162301526718, 'samples': 6630720, 'steps': 34534, 'loss/train': 1.492713451385498} -08/30/2021 19:27:54 - INFO - __main__ - Step 34536: {'lr': 0.0004427128497202941, 'samples': 6630912, 'steps': 34535, 'loss/train': 0.9139453768730164} -08/30/2021 19:27:55 - INFO - __main__ - Step 34537: {'lr': 0.00044270946920108305, 'samples': 6631104, 'steps': 34536, 'loss/train': 0.5907489061355591} -08/30/2021 19:27:55 - INFO - __main__ - Step 34538: {'lr': 0.00044270608859504006, 'samples': 6631296, 'steps': 34537, 'loss/train': 1.5253498554229736} -08/30/2021 19:27:56 - INFO - __main__ - Step 34539: {'lr': 0.0004427027079021667, 'samples': 6631488, 'steps': 34538, 'loss/train': 1.3501640558242798} -08/30/2021 19:27:56 - INFO - __main__ - Step 34540: {'lr': 0.0004426993271224645, 'samples': 6631680, 'steps': 34539, 'loss/train': 1.6406875848770142} -08/30/2021 19:27:57 - INFO - __main__ - Step 34541: {'lr': 0.0004426959462559349, 'samples': 6631872, 'steps': 34540, 'loss/train': 1.1325690746307373} -08/30/2021 19:27:58 - INFO - __main__ - Step 34542: {'lr': 0.0004426925653025795, 'samples': 6632064, 'steps': 34541, 'loss/train': 1.8664443492889404} -08/30/2021 19:27:58 - INFO - __main__ - Step 34543: {'lr': 0.0004426891842623998, 'samples': 6632256, 'steps': 34542, 'loss/train': 1.5031765699386597} -08/30/2021 19:27:58 - INFO - __main__ - Step 34544: {'lr': 0.0004426858031353973, 'samples': 6632448, 'steps': 34543, 'loss/train': 1.265485167503357} -08/30/2021 19:27:59 - INFO - __main__ - Step 34545: {'lr': 0.0004426824219215736, 'samples': 6632640, 'steps': 34544, 'loss/train': 1.4783307313919067} -08/30/2021 19:28:00 - INFO - __main__ - Step 34546: {'lr': 0.00044267904062093014, 'samples': 6632832, 'steps': 34545, 'loss/train': 0.8809460997581482} -08/30/2021 19:28:01 - INFO - __main__ - Step 34547: {'lr': 0.0004426756592334685, 'samples': 6633024, 'steps': 34546, 'loss/train': 1.5961167812347412} -08/30/2021 19:28:01 - INFO - __main__ - Step 34548: {'lr': 0.0004426722777591902, 'samples': 6633216, 'steps': 34547, 'loss/train': 0.769387423992157} -08/30/2021 19:28:01 - INFO - __main__ - Step 34549: {'lr': 0.00044266889619809665, 'samples': 6633408, 'steps': 34548, 'loss/train': 1.2212328910827637} -08/30/2021 19:28:02 - INFO - __main__ - Step 34550: {'lr': 0.00044266551455018953, 'samples': 6633600, 'steps': 34549, 'loss/train': 1.6502959728240967} -08/30/2021 19:28:04 - INFO - __main__ - Step 34551: {'lr': 0.0004426621328154703, 'samples': 6633792, 'steps': 34550, 'loss/train': 1.1621997356414795} -08/30/2021 19:28:04 - INFO - __main__ - Step 34552: {'lr': 0.0004426587509939405, 'samples': 6633984, 'steps': 34551, 'loss/train': 1.7934597730636597} -08/30/2021 19:28:04 - INFO - __main__ - Step 34553: {'lr': 0.0004426553690856016, 'samples': 6634176, 'steps': 34552, 'loss/train': 1.1838699579238892} -08/30/2021 19:28:05 - INFO - __main__ - Step 34554: {'lr': 0.0004426519870904552, 'samples': 6634368, 'steps': 34553, 'loss/train': 1.638792634010315} -08/30/2021 19:28:05 - INFO - __main__ - Step 34555: {'lr': 0.0004426486050085028, 'samples': 6634560, 'steps': 34554, 'loss/train': 2.1602914333343506} -08/30/2021 19:28:07 - INFO - __main__ - Step 34556: {'lr': 0.0004426452228397458, 'samples': 6634752, 'steps': 34555, 'loss/train': 1.1738427877426147} -08/30/2021 19:28:07 - INFO - __main__ - Step 34557: {'lr': 0.000442641840584186, 'samples': 6634944, 'steps': 34556, 'loss/train': 2.541248321533203} -08/30/2021 19:28:08 - INFO - __main__ - Step 34558: {'lr': 0.00044263845824182467, 'samples': 6635136, 'steps': 34557, 'loss/train': 1.4648534059524536} -08/30/2021 19:28:08 - INFO - __main__ - Step 34559: {'lr': 0.0004426350758126634, 'samples': 6635328, 'steps': 34558, 'loss/train': 2.1016812324523926} -08/30/2021 19:28:08 - INFO - __main__ - Step 34560: {'lr': 0.0004426316932967038, 'samples': 6635520, 'steps': 34559, 'loss/train': 1.349694013595581} -08/30/2021 19:28:10 - INFO - __main__ - Step 34561: {'lr': 0.0004426283106939473, 'samples': 6635712, 'steps': 34560, 'loss/train': 1.9669362306594849} -08/30/2021 19:28:10 - INFO - __main__ - Step 34562: {'lr': 0.00044262492800439547, 'samples': 6635904, 'steps': 34561, 'loss/train': 1.9280204772949219} -08/30/2021 19:28:11 - INFO - __main__ - Step 34563: {'lr': 0.00044262154522804986, 'samples': 6636096, 'steps': 34562, 'loss/train': 1.3438531160354614} -08/30/2021 19:28:11 - INFO - __main__ - Step 34564: {'lr': 0.00044261816236491186, 'samples': 6636288, 'steps': 34563, 'loss/train': 0.960212230682373} -08/30/2021 19:28:11 - INFO - __main__ - Step 34565: {'lr': 0.00044261477941498316, 'samples': 6636480, 'steps': 34564, 'loss/train': 1.8634120225906372} -08/30/2021 19:28:13 - INFO - __main__ - Step 34566: {'lr': 0.0004426113963782652, 'samples': 6636672, 'steps': 34565, 'loss/train': 1.4474068880081177} -08/30/2021 19:28:13 - INFO - __main__ - Step 34567: {'lr': 0.00044260801325475953, 'samples': 6636864, 'steps': 34566, 'loss/train': 1.5259560346603394} -08/30/2021 19:28:14 - INFO - __main__ - Step 34568: {'lr': 0.0004426046300444676, 'samples': 6637056, 'steps': 34567, 'loss/train': 1.513583779335022} -08/30/2021 19:28:14 - INFO - __main__ - Step 34569: {'lr': 0.000442601246747391, 'samples': 6637248, 'steps': 34568, 'loss/train': 0.9271699786186218} -08/30/2021 19:28:14 - INFO - __main__ - Step 34570: {'lr': 0.0004425978633635313, 'samples': 6637440, 'steps': 34569, 'loss/train': 1.5802444219589233} -08/30/2021 19:28:15 - INFO - __main__ - Step 34571: {'lr': 0.0004425944798928899, 'samples': 6637632, 'steps': 34570, 'loss/train': 0.8644600510597229} -08/30/2021 19:28:16 - INFO - __main__ - Step 34572: {'lr': 0.0004425910963354685, 'samples': 6637824, 'steps': 34571, 'loss/train': 1.5983903408050537} -08/30/2021 19:28:17 - INFO - __main__ - Step 34573: {'lr': 0.0004425877126912685, 'samples': 6638016, 'steps': 34572, 'loss/train': 1.1706236600875854} -08/30/2021 19:28:17 - INFO - __main__ - Step 34574: {'lr': 0.00044258432896029145, 'samples': 6638208, 'steps': 34573, 'loss/train': 1.072049617767334} -08/30/2021 19:28:17 - INFO - __main__ - Step 34575: {'lr': 0.00044258094514253876, 'samples': 6638400, 'steps': 34574, 'loss/train': 1.3613985776901245} -08/30/2021 19:28:18 - INFO - __main__ - Step 34576: {'lr': 0.00044257756123801216, 'samples': 6638592, 'steps': 34575, 'loss/train': 1.8122700452804565} -08/30/2021 19:28:19 - INFO - __main__ - Step 34577: {'lr': 0.0004425741772467131, 'samples': 6638784, 'steps': 34576, 'loss/train': 1.3815467357635498} -08/30/2021 19:28:20 - INFO - __main__ - Step 34578: {'lr': 0.0004425707931686431, 'samples': 6638976, 'steps': 34577, 'loss/train': 0.6512845754623413} -08/30/2021 19:28:20 - INFO - __main__ - Step 34579: {'lr': 0.00044256740900380364, 'samples': 6639168, 'steps': 34578, 'loss/train': 0.5899108648300171} -08/30/2021 19:28:20 - INFO - __main__ - Step 34580: {'lr': 0.0004425640247521963, 'samples': 6639360, 'steps': 34579, 'loss/train': 1.639444351196289} -08/30/2021 19:28:21 - INFO - __main__ - Step 34581: {'lr': 0.00044256064041382255, 'samples': 6639552, 'steps': 34580, 'loss/train': 1.121112585067749} -08/30/2021 19:28:22 - INFO - __main__ - Step 34582: {'lr': 0.0004425572559886839, 'samples': 6639744, 'steps': 34581, 'loss/train': 1.2499206066131592} -08/30/2021 19:28:23 - INFO - __main__ - Step 34583: {'lr': 0.00044255387147678206, 'samples': 6639936, 'steps': 34582, 'loss/train': 0.7356665134429932} -08/30/2021 19:28:23 - INFO - __main__ - Step 34584: {'lr': 0.0004425504868781183, 'samples': 6640128, 'steps': 34583, 'loss/train': 0.6532497406005859} -08/30/2021 19:28:24 - INFO - __main__ - Step 34585: {'lr': 0.0004425471021926943, 'samples': 6640320, 'steps': 34584, 'loss/train': 1.4160295724868774} -08/30/2021 19:28:24 - INFO - __main__ - Step 34586: {'lr': 0.0004425437174205115, 'samples': 6640512, 'steps': 34585, 'loss/train': 1.1702860593795776} -08/30/2021 19:28:26 - INFO - __main__ - Step 34587: {'lr': 0.00044254033256157154, 'samples': 6640704, 'steps': 34586, 'loss/train': 1.3929725885391235} -08/30/2021 19:28:26 - INFO - __main__ - Step 34588: {'lr': 0.0004425369476158759, 'samples': 6640896, 'steps': 34587, 'loss/train': 1.1652488708496094} -08/30/2021 19:28:26 - INFO - __main__ - Step 34589: {'lr': 0.000442533562583426, 'samples': 6641088, 'steps': 34588, 'loss/train': 1.1288782358169556} -08/30/2021 19:28:27 - INFO - __main__ - Step 34590: {'lr': 0.00044253017746422355, 'samples': 6641280, 'steps': 34589, 'loss/train': 1.6927356719970703} -08/30/2021 19:28:27 - INFO - __main__ - Step 34591: {'lr': 0.00044252679225826984, 'samples': 6641472, 'steps': 34590, 'loss/train': 2.002218246459961} -08/30/2021 19:28:28 - INFO - __main__ - Step 34592: {'lr': 0.0004425234069655666, 'samples': 6641664, 'steps': 34591, 'loss/train': 2.097356081008911} -08/30/2021 19:28:29 - INFO - __main__ - Step 34593: {'lr': 0.0004425200215861153, 'samples': 6641856, 'steps': 34592, 'loss/train': 1.1375408172607422} -08/30/2021 19:28:29 - INFO - __main__ - Step 34594: {'lr': 0.00044251663611991743, 'samples': 6642048, 'steps': 34593, 'loss/train': 1.5154321193695068} -08/30/2021 19:28:30 - INFO - __main__ - Step 34595: {'lr': 0.0004425132505669745, 'samples': 6642240, 'steps': 34594, 'loss/train': 1.4113093614578247} -08/30/2021 19:28:30 - INFO - __main__ - Step 34596: {'lr': 0.00044250986492728805, 'samples': 6642432, 'steps': 34595, 'loss/train': 2.0654656887054443} -08/30/2021 19:28:31 - INFO - __main__ - Step 34597: {'lr': 0.0004425064792008597, 'samples': 6642624, 'steps': 34596, 'loss/train': 1.338316798210144} -08/30/2021 19:28:32 - INFO - __main__ - Step 34598: {'lr': 0.0004425030933876909, 'samples': 6642816, 'steps': 34597, 'loss/train': 1.8056979179382324} -08/30/2021 19:28:32 - INFO - __main__ - Step 34599: {'lr': 0.0004424997074877831, 'samples': 6643008, 'steps': 34598, 'loss/train': 1.3419913053512573} -08/30/2021 19:28:33 - INFO - __main__ - Step 34600: {'lr': 0.00044249632150113806, 'samples': 6643200, 'steps': 34599, 'loss/train': 1.241982102394104} -08/30/2021 19:28:33 - INFO - __main__ - Step 34601: {'lr': 0.000442492935427757, 'samples': 6643392, 'steps': 34600, 'loss/train': 1.4011131525039673} -08/30/2021 19:28:33 - INFO - __main__ - Step 34602: {'lr': 0.00044248954926764164, 'samples': 6643584, 'steps': 34601, 'loss/train': 1.1405445337295532} -08/30/2021 19:28:35 - INFO - __main__ - Step 34603: {'lr': 0.0004424861630207935, 'samples': 6643776, 'steps': 34602, 'loss/train': 1.6157505512237549} -08/30/2021 19:28:35 - INFO - __main__ - Step 34604: {'lr': 0.00044248277668721396, 'samples': 6643968, 'steps': 34603, 'loss/train': 1.084503412246704} -08/30/2021 19:28:35 - INFO - __main__ - Step 34605: {'lr': 0.00044247939026690475, 'samples': 6644160, 'steps': 34604, 'loss/train': 1.842009425163269} -08/30/2021 19:28:36 - INFO - __main__ - Step 34606: {'lr': 0.0004424760037598673, 'samples': 6644352, 'steps': 34605, 'loss/train': 1.3989065885543823} -08/30/2021 19:28:36 - INFO - __main__ - Step 34607: {'lr': 0.00044247261716610307, 'samples': 6644544, 'steps': 34606, 'loss/train': 1.432049036026001} -08/30/2021 19:28:38 - INFO - __main__ - Step 34608: {'lr': 0.0004424692304856136, 'samples': 6644736, 'steps': 34607, 'loss/train': 1.508874773979187} -08/30/2021 19:28:39 - INFO - __main__ - Step 34609: {'lr': 0.0004424658437184006, 'samples': 6644928, 'steps': 34608, 'loss/train': 2.344315528869629} -08/30/2021 19:28:39 - INFO - __main__ - Step 34610: {'lr': 0.0004424624568644654, 'samples': 6645120, 'steps': 34609, 'loss/train': 1.7382147312164307} -08/30/2021 19:28:39 - INFO - __main__ - Step 34611: {'lr': 0.00044245906992380955, 'samples': 6645312, 'steps': 34610, 'loss/train': 1.5767616033554077} -08/30/2021 19:28:40 - INFO - __main__ - Step 34612: {'lr': 0.0004424556828964347, 'samples': 6645504, 'steps': 34611, 'loss/train': 1.6449493169784546} -08/30/2021 19:28:41 - INFO - __main__ - Step 34613: {'lr': 0.0004424522957823422, 'samples': 6645696, 'steps': 34612, 'loss/train': 1.6256276369094849} -08/30/2021 19:28:42 - INFO - __main__ - Step 34614: {'lr': 0.00044244890858153376, 'samples': 6645888, 'steps': 34613, 'loss/train': 0.7414907813072205} -08/30/2021 19:28:42 - INFO - __main__ - Step 34615: {'lr': 0.00044244552129401075, 'samples': 6646080, 'steps': 34614, 'loss/train': 1.420929193496704} -08/30/2021 19:28:43 - INFO - __main__ - Step 34616: {'lr': 0.0004424421339197747, 'samples': 6646272, 'steps': 34615, 'loss/train': 1.387358546257019} -08/30/2021 19:28:43 - INFO - __main__ - Step 34617: {'lr': 0.00044243874645882733, 'samples': 6646464, 'steps': 34616, 'loss/train': 1.2828692197799683} -08/30/2021 19:28:45 - INFO - __main__ - Step 34618: {'lr': 0.0004424353589111699, 'samples': 6646656, 'steps': 34617, 'loss/train': 1.1269830465316772} -08/30/2021 19:28:46 - INFO - __main__ - Step 34619: {'lr': 0.0004424319712768041, 'samples': 6646848, 'steps': 34618, 'loss/train': 0.9125427007675171} -08/30/2021 19:28:46 - INFO - __main__ - Step 34620: {'lr': 0.00044242858355573143, 'samples': 6647040, 'steps': 34619, 'loss/train': 0.7687682509422302} -08/30/2021 19:28:46 - INFO - __main__ - Step 34621: {'lr': 0.00044242519574795347, 'samples': 6647232, 'steps': 34620, 'loss/train': 0.03656759113073349} -08/30/2021 19:28:47 - INFO - __main__ - Step 34622: {'lr': 0.00044242180785347164, 'samples': 6647424, 'steps': 34621, 'loss/train': 0.030534954741597176} -08/30/2021 19:28:47 - INFO - __main__ - Step 34623: {'lr': 0.00044241841987228747, 'samples': 6647616, 'steps': 34622, 'loss/train': 1.1314226388931274} -08/30/2021 19:28:47 - INFO - __main__ - Step 34624: {'lr': 0.00044241503180440263, 'samples': 6647808, 'steps': 34623, 'loss/train': 1.2687695026397705} -08/30/2021 19:28:49 - INFO - __main__ - Step 34625: {'lr': 0.0004424116436498185, 'samples': 6648000, 'steps': 34624, 'loss/train': 0.9782544374465942} -08/30/2021 19:28:49 - INFO - __main__ - Step 34626: {'lr': 0.0004424082554085366, 'samples': 6648192, 'steps': 34625, 'loss/train': 1.5050990581512451} -08/30/2021 19:28:50 - INFO - __main__ - Step 34627: {'lr': 0.0004424048670805586, 'samples': 6648384, 'steps': 34626, 'loss/train': 1.2192565202713013} -08/30/2021 19:28:50 - INFO - __main__ - Step 34628: {'lr': 0.0004424014786658859, 'samples': 6648576, 'steps': 34627, 'loss/train': 0.9493632912635803} -08/30/2021 19:28:51 - INFO - __main__ - Step 34629: {'lr': 0.00044239809016452, 'samples': 6648768, 'steps': 34628, 'loss/train': 1.5128798484802246} -08/30/2021 19:28:52 - INFO - __main__ - Step 34630: {'lr': 0.00044239470157646254, 'samples': 6648960, 'steps': 34629, 'loss/train': 1.3421119451522827} -08/30/2021 19:28:53 - INFO - __main__ - Step 34631: {'lr': 0.000442391312901715, 'samples': 6649152, 'steps': 34630, 'loss/train': 1.1037216186523438} -08/30/2021 19:28:53 - INFO - __main__ - Step 34632: {'lr': 0.0004423879241402788, 'samples': 6649344, 'steps': 34631, 'loss/train': 1.7800251245498657} -08/30/2021 19:28:53 - INFO - __main__ - Step 34633: {'lr': 0.00044238453529215575, 'samples': 6649536, 'steps': 34632, 'loss/train': 1.9754528999328613} -08/30/2021 19:28:54 - INFO - __main__ - Step 34634: {'lr': 0.00044238114635734713, 'samples': 6649728, 'steps': 34633, 'loss/train': 1.574794888496399} -08/30/2021 19:28:54 - INFO - __main__ - Step 34635: {'lr': 0.0004423777573358545, 'samples': 6649920, 'steps': 34634, 'loss/train': 1.3289318084716797} -08/30/2021 19:28:56 - INFO - __main__ - Step 34636: {'lr': 0.0004423743682276794, 'samples': 6650112, 'steps': 34635, 'loss/train': 1.5770080089569092} -08/30/2021 19:28:56 - INFO - __main__ - Step 34637: {'lr': 0.0004423709790328235, 'samples': 6650304, 'steps': 34636, 'loss/train': 1.1990138292312622} -08/30/2021 19:28:57 - INFO - __main__ - Step 34638: {'lr': 0.0004423675897512881, 'samples': 6650496, 'steps': 34637, 'loss/train': 0.026132598519325256} -08/30/2021 19:28:57 - INFO - __main__ - Step 34639: {'lr': 0.0004423642003830748, 'samples': 6650688, 'steps': 34638, 'loss/train': 1.4408581256866455} -08/30/2021 19:28:57 - INFO - __main__ - Step 34640: {'lr': 0.00044236081092818527, 'samples': 6650880, 'steps': 34639, 'loss/train': 1.650970220565796} -08/30/2021 19:28:59 - INFO - __main__ - Step 34641: {'lr': 0.00044235742138662085, 'samples': 6651072, 'steps': 34640, 'loss/train': 2.1028692722320557} -08/30/2021 19:28:59 - INFO - __main__ - Step 34642: {'lr': 0.0004423540317583832, 'samples': 6651264, 'steps': 34641, 'loss/train': 2.193288564682007} -08/30/2021 19:28:59 - INFO - __main__ - Step 34643: {'lr': 0.00044235064204347377, 'samples': 6651456, 'steps': 34642, 'loss/train': 1.4730808734893799} -08/30/2021 19:29:00 - INFO - __main__ - Step 34644: {'lr': 0.0004423472522418941, 'samples': 6651648, 'steps': 34643, 'loss/train': 1.362569808959961} -08/30/2021 19:29:00 - INFO - __main__ - Step 34645: {'lr': 0.0004423438623536457, 'samples': 6651840, 'steps': 34644, 'loss/train': 1.7961080074310303} -08/30/2021 19:29:01 - INFO - __main__ - Step 34646: {'lr': 0.0004423404723787301, 'samples': 6652032, 'steps': 34645, 'loss/train': 1.3881537914276123} -08/30/2021 19:29:02 - INFO - __main__ - Step 34647: {'lr': 0.000442337082317149, 'samples': 6652224, 'steps': 34646, 'loss/train': 1.1188929080963135} -08/30/2021 19:29:02 - INFO - __main__ - Step 34648: {'lr': 0.0004423336921689036, 'samples': 6652416, 'steps': 34647, 'loss/train': 1.5280674695968628} -08/30/2021 19:29:03 - INFO - __main__ - Step 34649: {'lr': 0.0004423303019339957, 'samples': 6652608, 'steps': 34648, 'loss/train': 1.7794148921966553} -08/30/2021 19:29:03 - INFO - __main__ - Step 34650: {'lr': 0.0004423269116124267, 'samples': 6652800, 'steps': 34649, 'loss/train': 1.3994988203048706} -08/30/2021 19:29:04 - INFO - __main__ - Step 34651: {'lr': 0.0004423235212041982, 'samples': 6652992, 'steps': 34650, 'loss/train': 1.0937551259994507} -08/30/2021 19:29:05 - INFO - __main__ - Step 34652: {'lr': 0.00044232013070931165, 'samples': 6653184, 'steps': 34651, 'loss/train': 1.5449656248092651} -08/30/2021 19:29:06 - INFO - __main__ - Step 34653: {'lr': 0.00044231674012776864, 'samples': 6653376, 'steps': 34652, 'loss/train': 1.0204274654388428} -08/30/2021 19:29:06 - INFO - __main__ - Step 34654: {'lr': 0.0004423133494595707, 'samples': 6653568, 'steps': 34653, 'loss/train': 1.695006012916565} -08/30/2021 19:29:06 - INFO - __main__ - Step 34655: {'lr': 0.00044230995870471923, 'samples': 6653760, 'steps': 34654, 'loss/train': 1.1935582160949707} -08/30/2021 19:29:07 - INFO - __main__ - Step 34656: {'lr': 0.000442306567863216, 'samples': 6653952, 'steps': 34655, 'loss/train': 1.6298872232437134} -08/30/2021 19:29:08 - INFO - __main__ - Step 34657: {'lr': 0.00044230317693506226, 'samples': 6654144, 'steps': 34656, 'loss/train': 1.2420439720153809} -08/30/2021 19:29:09 - INFO - __main__ - Step 34658: {'lr': 0.00044229978592025975, 'samples': 6654336, 'steps': 34657, 'loss/train': 2.5009686946868896} -08/30/2021 19:29:09 - INFO - __main__ - Step 34659: {'lr': 0.00044229639481881, 'samples': 6654528, 'steps': 34658, 'loss/train': 1.510106086730957} -08/30/2021 19:29:10 - INFO - __main__ - Step 34660: {'lr': 0.00044229300363071434, 'samples': 6654720, 'steps': 34659, 'loss/train': 1.1639480590820312} -08/30/2021 19:29:10 - INFO - __main__ - Step 34661: {'lr': 0.0004422896123559744, 'samples': 6654912, 'steps': 34660, 'loss/train': 1.5406805276870728} -08/30/2021 19:29:12 - INFO - __main__ - Step 34662: {'lr': 0.00044228622099459183, 'samples': 6655104, 'steps': 34661, 'loss/train': 1.7438578605651855} -08/30/2021 19:29:12 - INFO - __main__ - Step 34663: {'lr': 0.000442282829546568, 'samples': 6655296, 'steps': 34662, 'loss/train': 1.529159426689148} -08/30/2021 19:29:13 - INFO - __main__ - Step 34664: {'lr': 0.00044227943801190454, 'samples': 6655488, 'steps': 34663, 'loss/train': 1.7015680074691772} -08/30/2021 19:29:13 - INFO - __main__ - Step 34665: {'lr': 0.0004422760463906029, 'samples': 6655680, 'steps': 34664, 'loss/train': 1.2366178035736084} -08/30/2021 19:29:13 - INFO - __main__ - Step 34666: {'lr': 0.00044227265468266464, 'samples': 6655872, 'steps': 34665, 'loss/train': 1.1760388612747192} -08/30/2021 19:29:15 - INFO - __main__ - Step 34667: {'lr': 0.0004422692628880913, 'samples': 6656064, 'steps': 34666, 'loss/train': 1.7349165678024292} -08/30/2021 19:29:16 - INFO - __main__ - Step 34668: {'lr': 0.00044226587100688436, 'samples': 6656256, 'steps': 34667, 'loss/train': 0.10080096125602722} -08/30/2021 19:29:16 - INFO - __main__ - Step 34669: {'lr': 0.0004422624790390454, 'samples': 6656448, 'steps': 34668, 'loss/train': 1.257863998413086} -08/30/2021 19:29:16 - INFO - __main__ - Step 34670: {'lr': 0.000442259086984576, 'samples': 6656640, 'steps': 34669, 'loss/train': 1.5491306781768799} -08/30/2021 19:29:17 - INFO - __main__ - Step 34671: {'lr': 0.00044225569484347753, 'samples': 6656832, 'steps': 34670, 'loss/train': 0.8068243861198425} -08/30/2021 19:29:17 - INFO - __main__ - Step 34672: {'lr': 0.00044225230261575165, 'samples': 6657024, 'steps': 34671, 'loss/train': 1.4714633226394653} -08/30/2021 19:29:19 - INFO - __main__ - Step 34673: {'lr': 0.00044224891030139986, 'samples': 6657216, 'steps': 34672, 'loss/train': 0.9917858242988586} -08/30/2021 19:29:19 - INFO - __main__ - Step 34674: {'lr': 0.0004422455179004237, 'samples': 6657408, 'steps': 34673, 'loss/train': 0.6558176279067993} -08/30/2021 19:29:20 - INFO - __main__ - Step 34675: {'lr': 0.00044224212541282463, 'samples': 6657600, 'steps': 34674, 'loss/train': 1.201133370399475} -08/30/2021 19:29:20 - INFO - __main__ - Step 34676: {'lr': 0.0004422387328386042, 'samples': 6657792, 'steps': 34675, 'loss/train': 1.5372264385223389} -08/30/2021 19:29:20 - INFO - __main__ - Step 34677: {'lr': 0.000442235340177764, 'samples': 6657984, 'steps': 34676, 'loss/train': 1.5975207090377808} -08/30/2021 19:29:22 - INFO - __main__ - Step 34678: {'lr': 0.00044223194743030556, 'samples': 6658176, 'steps': 34677, 'loss/train': 2.0032284259796143} -08/30/2021 19:29:22 - INFO - __main__ - Step 34679: {'lr': 0.00044222855459623034, 'samples': 6658368, 'steps': 34678, 'loss/train': 0.6564019322395325} -08/30/2021 19:29:23 - INFO - __main__ - Step 34680: {'lr': 0.00044222516167553985, 'samples': 6658560, 'steps': 34679, 'loss/train': 1.6180073022842407} -08/30/2021 19:29:23 - INFO - __main__ - Step 34681: {'lr': 0.0004422217686682357, 'samples': 6658752, 'steps': 34680, 'loss/train': 1.4621936082839966} -08/30/2021 19:29:23 - INFO - __main__ - Step 34682: {'lr': 0.00044221837557431945, 'samples': 6658944, 'steps': 34681, 'loss/train': 1.28822922706604} -08/30/2021 19:29:25 - INFO - __main__ - Step 34683: {'lr': 0.00044221498239379247, 'samples': 6659136, 'steps': 34682, 'loss/train': 0.9522958397865295} -08/30/2021 19:29:25 - INFO - __main__ - Step 34684: {'lr': 0.0004422115891266565, 'samples': 6659328, 'steps': 34683, 'loss/train': 1.7374886274337769} -08/30/2021 19:29:26 - INFO - __main__ - Step 34685: {'lr': 0.00044220819577291283, 'samples': 6659520, 'steps': 34684, 'loss/train': 0.7801975607872009} -08/30/2021 19:29:26 - INFO - __main__ - Step 34686: {'lr': 0.00044220480233256315, 'samples': 6659712, 'steps': 34685, 'loss/train': 1.4226176738739014} -08/30/2021 19:29:26 - INFO - __main__ - Step 34687: {'lr': 0.00044220140880560897, 'samples': 6659904, 'steps': 34686, 'loss/train': 1.1236802339553833} -08/30/2021 19:29:28 - INFO - __main__ - Step 34688: {'lr': 0.0004421980151920518, 'samples': 6660096, 'steps': 34687, 'loss/train': 1.602264165878296} -08/30/2021 19:29:28 - INFO - __main__ - Step 34689: {'lr': 0.00044219462149189313, 'samples': 6660288, 'steps': 34688, 'loss/train': 0.8838433027267456} -08/30/2021 19:29:29 - INFO - __main__ - Step 34690: {'lr': 0.0004421912277051346, 'samples': 6660480, 'steps': 34689, 'loss/train': 1.0139211416244507} -08/30/2021 19:29:29 - INFO - __main__ - Step 34691: {'lr': 0.00044218783383177763, 'samples': 6660672, 'steps': 34690, 'loss/train': 1.5555403232574463} -08/30/2021 19:29:29 - INFO - __main__ - Step 34692: {'lr': 0.00044218443987182384, 'samples': 6660864, 'steps': 34691, 'loss/train': 0.9847817420959473} -08/30/2021 19:29:31 - INFO - __main__ - Step 34693: {'lr': 0.0004421810458252746, 'samples': 6661056, 'steps': 34692, 'loss/train': 1.9286046028137207} -08/30/2021 19:29:32 - INFO - __main__ - Step 34694: {'lr': 0.00044217765169213166, 'samples': 6661248, 'steps': 34693, 'loss/train': 1.5308654308319092} -08/30/2021 19:29:32 - INFO - __main__ - Step 34695: {'lr': 0.00044217425747239636, 'samples': 6661440, 'steps': 34694, 'loss/train': 1.2886213064193726} -08/30/2021 19:29:32 - INFO - __main__ - Step 34696: {'lr': 0.00044217086316607033, 'samples': 6661632, 'steps': 34695, 'loss/train': 1.4247550964355469} -08/30/2021 19:29:33 - INFO - __main__ - Step 34697: {'lr': 0.00044216746877315504, 'samples': 6661824, 'steps': 34696, 'loss/train': 1.329972505569458} -08/30/2021 19:29:33 - INFO - __main__ - Step 34698: {'lr': 0.0004421640742936521, 'samples': 6662016, 'steps': 34697, 'loss/train': 1.5331666469573975} -08/30/2021 19:29:35 - INFO - __main__ - Step 34699: {'lr': 0.000442160679727563, 'samples': 6662208, 'steps': 34698, 'loss/train': 0.4324115812778473} -08/30/2021 19:29:35 - INFO - __main__ - Step 34700: {'lr': 0.0004421572850748893, 'samples': 6662400, 'steps': 34699, 'loss/train': 0.7966052293777466} -08/30/2021 19:29:36 - INFO - __main__ - Step 34701: {'lr': 0.00044215389033563235, 'samples': 6662592, 'steps': 34700, 'loss/train': 0.16638953983783722} -08/30/2021 19:29:36 - INFO - __main__ - Step 34702: {'lr': 0.00044215049550979394, 'samples': 6662784, 'steps': 34701, 'loss/train': 0.6518832445144653} -08/30/2021 19:29:36 - INFO - __main__ - Step 34703: {'lr': 0.0004421471005973755, 'samples': 6662976, 'steps': 34702, 'loss/train': 1.5585709810256958} -08/30/2021 19:29:38 - INFO - __main__ - Step 34704: {'lr': 0.0004421437055983785, 'samples': 6663168, 'steps': 34703, 'loss/train': 0.5413429737091064} -08/30/2021 19:29:38 - INFO - __main__ - Step 34705: {'lr': 0.0004421403105128045, 'samples': 6663360, 'steps': 34704, 'loss/train': 1.3705461025238037} -08/30/2021 19:29:39 - INFO - __main__ - Step 34706: {'lr': 0.00044213691534065503, 'samples': 6663552, 'steps': 34705, 'loss/train': 1.6387416124343872} -08/30/2021 19:29:39 - INFO - __main__ - Step 34707: {'lr': 0.0004421335200819316, 'samples': 6663744, 'steps': 34706, 'loss/train': 1.3581836223602295} -08/30/2021 19:29:39 - INFO - __main__ - Step 34708: {'lr': 0.00044213012473663584, 'samples': 6663936, 'steps': 34707, 'loss/train': 1.6423312425613403} -08/30/2021 19:29:41 - INFO - __main__ - Step 34709: {'lr': 0.0004421267293047692, 'samples': 6664128, 'steps': 34708, 'loss/train': 0.08500602096319199} -08/30/2021 19:29:41 - INFO - __main__ - Step 34710: {'lr': 0.0004421233337863332, 'samples': 6664320, 'steps': 34709, 'loss/train': 1.0537681579589844} -08/30/2021 19:29:42 - INFO - __main__ - Step 34711: {'lr': 0.0004421199381813293, 'samples': 6664512, 'steps': 34710, 'loss/train': 1.7350077629089355} -08/30/2021 19:29:42 - INFO - __main__ - Step 34712: {'lr': 0.0004421165424897593, 'samples': 6664704, 'steps': 34711, 'loss/train': 1.7634326219558716} -08/30/2021 19:29:42 - INFO - __main__ - Step 34713: {'lr': 0.00044211314671162446, 'samples': 6664896, 'steps': 34712, 'loss/train': 1.4969698190689087} -08/30/2021 19:29:45 - INFO - __main__ - Step 34714: {'lr': 0.0004421097508469264, 'samples': 6665088, 'steps': 34713, 'loss/train': 1.0224230289459229} -08/30/2021 19:29:45 - INFO - __main__ - Step 34715: {'lr': 0.0004421063548956666, 'samples': 6665280, 'steps': 34714, 'loss/train': 1.5540722608566284} -08/30/2021 19:29:45 - INFO - __main__ - Step 34716: {'lr': 0.0004421029588578468, 'samples': 6665472, 'steps': 34715, 'loss/train': 1.6547048091888428} -08/30/2021 19:29:46 - INFO - __main__ - Step 34717: {'lr': 0.00044209956273346816, 'samples': 6665664, 'steps': 34716, 'loss/train': 1.0293141603469849} -08/30/2021 19:29:46 - INFO - __main__ - Step 34718: {'lr': 0.0004420961665225326, 'samples': 6665856, 'steps': 34717, 'loss/train': 1.2696518898010254} -08/30/2021 19:29:46 - INFO - __main__ - Step 34719: {'lr': 0.0004420927702250414, 'samples': 6666048, 'steps': 34718, 'loss/train': 1.9864994287490845} -08/30/2021 19:29:48 - INFO - __main__ - Step 34720: {'lr': 0.00044208937384099614, 'samples': 6666240, 'steps': 34719, 'loss/train': 1.6231191158294678} -08/30/2021 19:29:49 - INFO - __main__ - Step 34721: {'lr': 0.0004420859773703985, 'samples': 6666432, 'steps': 34720, 'loss/train': 1.2206162214279175} -08/30/2021 19:29:49 - INFO - __main__ - Step 34722: {'lr': 0.0004420825808132497, 'samples': 6666624, 'steps': 34721, 'loss/train': 2.1539533138275146} -08/30/2021 19:29:49 - INFO - __main__ - Step 34723: {'lr': 0.0004420791841695515, 'samples': 6666816, 'steps': 34722, 'loss/train': 0.10320522636175156} -08/30/2021 19:29:50 - INFO - __main__ - Step 34724: {'lr': 0.00044207578743930544, 'samples': 6667008, 'steps': 34723, 'loss/train': 1.749796986579895} -08/30/2021 19:29:52 - INFO - __main__ - Step 34725: {'lr': 0.00044207239062251297, 'samples': 6667200, 'steps': 34724, 'loss/train': 1.0909737348556519} -08/30/2021 19:29:52 - INFO - __main__ - Step 34726: {'lr': 0.00044206899371917563, 'samples': 6667392, 'steps': 34725, 'loss/train': 1.5443371534347534} -08/30/2021 19:29:52 - INFO - __main__ - Step 34727: {'lr': 0.00044206559672929505, 'samples': 6667584, 'steps': 34726, 'loss/train': 0.7401970624923706} -08/30/2021 19:29:53 - INFO - __main__ - Step 34728: {'lr': 0.00044206219965287253, 'samples': 6667776, 'steps': 34727, 'loss/train': 0.5476230382919312} -08/30/2021 19:29:53 - INFO - __main__ - Step 34729: {'lr': 0.0004420588024899098, 'samples': 6667968, 'steps': 34728, 'loss/train': 1.7276771068572998} -08/30/2021 19:29:55 - INFO - __main__ - Step 34730: {'lr': 0.00044205540524040846, 'samples': 6668160, 'steps': 34729, 'loss/train': 1.187868356704712} -08/30/2021 19:29:55 - INFO - __main__ - Step 34731: {'lr': 0.0004420520079043698, 'samples': 6668352, 'steps': 34730, 'loss/train': 1.0180031061172485} -08/30/2021 19:29:55 - INFO - __main__ - Step 34732: {'lr': 0.00044204861048179544, 'samples': 6668544, 'steps': 34731, 'loss/train': 1.392545223236084} -08/30/2021 19:29:56 - INFO - __main__ - Step 34733: {'lr': 0.000442045212972687, 'samples': 6668736, 'steps': 34732, 'loss/train': 1.2085925340652466} -08/30/2021 19:29:56 - INFO - __main__ - Step 34734: {'lr': 0.00044204181537704594, 'samples': 6668928, 'steps': 34733, 'loss/train': 2.0333735942840576} -08/30/2021 19:29:58 - INFO - __main__ - Step 34735: {'lr': 0.0004420384176948738, 'samples': 6669120, 'steps': 34734, 'loss/train': 1.894636631011963} -08/30/2021 19:29:58 - INFO - __main__ - Step 34736: {'lr': 0.0004420350199261721, 'samples': 6669312, 'steps': 34735, 'loss/train': 1.0695494413375854} -08/30/2021 19:29:58 - INFO - __main__ - Step 34737: {'lr': 0.0004420316220709424, 'samples': 6669504, 'steps': 34736, 'loss/train': 0.819586455821991} -08/30/2021 19:29:59 - INFO - __main__ - Step 34738: {'lr': 0.0004420282241291862, 'samples': 6669696, 'steps': 34737, 'loss/train': 1.361747145652771} -08/30/2021 19:29:59 - INFO - __main__ - Step 34739: {'lr': 0.0004420248261009051, 'samples': 6669888, 'steps': 34738, 'loss/train': 1.8967548608779907} -08/30/2021 19:29:59 - INFO - __main__ - Step 34740: {'lr': 0.0004420214279861005, 'samples': 6670080, 'steps': 34739, 'loss/train': 1.2004952430725098} -08/30/2021 19:30:01 - INFO - __main__ - Step 34741: {'lr': 0.000442018029784774, 'samples': 6670272, 'steps': 34740, 'loss/train': 0.9303376078605652} -08/30/2021 19:30:01 - INFO - __main__ - Step 34742: {'lr': 0.00044201463149692725, 'samples': 6670464, 'steps': 34741, 'loss/train': 1.6795202493667603} -08/30/2021 19:30:02 - INFO - __main__ - Step 34743: {'lr': 0.0004420112331225616, 'samples': 6670656, 'steps': 34742, 'loss/train': 1.0386409759521484} -08/30/2021 19:30:02 - INFO - __main__ - Step 34744: {'lr': 0.0004420078346616786, 'samples': 6670848, 'steps': 34743, 'loss/train': 1.1938104629516602} -08/30/2021 19:30:02 - INFO - __main__ - Step 34745: {'lr': 0.00044200443611427985, 'samples': 6671040, 'steps': 34744, 'loss/train': 1.588404893875122} -08/30/2021 19:30:04 - INFO - __main__ - Step 34746: {'lr': 0.000442001037480367, 'samples': 6671232, 'steps': 34745, 'loss/train': 1.9168548583984375} -08/30/2021 19:30:05 - INFO - __main__ - Step 34747: {'lr': 0.0004419976387599413, 'samples': 6671424, 'steps': 34746, 'loss/train': 1.2247517108917236} -08/30/2021 19:30:05 - INFO - __main__ - Step 34748: {'lr': 0.0004419942399530045, 'samples': 6671616, 'steps': 34747, 'loss/train': 0.9280975461006165} -08/30/2021 19:30:05 - INFO - __main__ - Step 34749: {'lr': 0.000441990841059558, 'samples': 6671808, 'steps': 34748, 'loss/train': 0.09358397126197815} -08/30/2021 19:30:06 - INFO - __main__ - Step 34750: {'lr': 0.0004419874420796034, 'samples': 6672000, 'steps': 34749, 'loss/train': 0.6446064114570618} -08/30/2021 19:30:07 - INFO - __main__ - Step 34751: {'lr': 0.00044198404301314223, 'samples': 6672192, 'steps': 34750, 'loss/train': 0.6184068918228149} -08/30/2021 19:30:08 - INFO - __main__ - Step 34752: {'lr': 0.000441980643860176, 'samples': 6672384, 'steps': 34751, 'loss/train': 1.9865344762802124} -08/30/2021 19:30:08 - INFO - __main__ - Step 34753: {'lr': 0.0004419772446207063, 'samples': 6672576, 'steps': 34752, 'loss/train': 1.5299996137619019} -08/30/2021 19:30:08 - INFO - __main__ - Step 34754: {'lr': 0.0004419738452947346, 'samples': 6672768, 'steps': 34753, 'loss/train': 1.5365554094314575} -08/30/2021 19:30:09 - INFO - __main__ - Step 34755: {'lr': 0.00044197044588226245, 'samples': 6672960, 'steps': 34754, 'loss/train': 1.6013884544372559} -08/30/2021 19:30:09 - INFO - __main__ - Step 34756: {'lr': 0.00044196704638329134, 'samples': 6673152, 'steps': 34755, 'loss/train': 1.6902989149093628} -08/30/2021 19:30:10 - INFO - __main__ - Step 34757: {'lr': 0.00044196364679782284, 'samples': 6673344, 'steps': 34756, 'loss/train': 1.1759026050567627} -08/30/2021 19:30:11 - INFO - __main__ - Step 34758: {'lr': 0.00044196024712585854, 'samples': 6673536, 'steps': 34757, 'loss/train': 1.1638102531433105} -08/30/2021 19:30:11 - INFO - __main__ - Step 34759: {'lr': 0.0004419568473673999, 'samples': 6673728, 'steps': 34758, 'loss/train': 1.7615946531295776} -08/30/2021 19:30:12 - INFO - __main__ - Step 34760: {'lr': 0.00044195344752244844, 'samples': 6673920, 'steps': 34759, 'loss/train': 1.3740109205245972} -08/30/2021 19:30:12 - INFO - __main__ - Step 34761: {'lr': 0.0004419500475910057, 'samples': 6674112, 'steps': 34760, 'loss/train': 1.8068288564682007} -08/30/2021 19:30:14 - INFO - __main__ - Step 34762: {'lr': 0.0004419466475730732, 'samples': 6674304, 'steps': 34761, 'loss/train': 1.335292935371399} -08/30/2021 19:30:14 - INFO - __main__ - Step 34763: {'lr': 0.00044194324746865265, 'samples': 6674496, 'steps': 34762, 'loss/train': 1.5998960733413696} -08/30/2021 19:30:14 - INFO - __main__ - Step 34764: {'lr': 0.00044193984727774533, 'samples': 6674688, 'steps': 34763, 'loss/train': 1.4881980419158936} -08/30/2021 19:30:15 - INFO - __main__ - Step 34765: {'lr': 0.0004419364470003529, 'samples': 6674880, 'steps': 34764, 'loss/train': 0.8375330567359924} -08/30/2021 19:30:15 - INFO - __main__ - Step 34766: {'lr': 0.00044193304663647684, 'samples': 6675072, 'steps': 34765, 'loss/train': 1.299536943435669} -08/30/2021 19:30:17 - INFO - __main__ - Step 34767: {'lr': 0.00044192964618611875, 'samples': 6675264, 'steps': 34766, 'loss/train': 1.460287094116211} -08/30/2021 19:30:17 - INFO - __main__ - Step 34768: {'lr': 0.0004419262456492801, 'samples': 6675456, 'steps': 34767, 'loss/train': 1.5032386779785156} -08/30/2021 19:30:17 - INFO - __main__ - Step 34769: {'lr': 0.0004419228450259625, 'samples': 6675648, 'steps': 34768, 'loss/train': 1.292349934577942} -08/30/2021 19:30:18 - INFO - __main__ - Step 34770: {'lr': 0.00044191944431616734, 'samples': 6675840, 'steps': 34769, 'loss/train': 1.1969331502914429} -08/30/2021 19:30:18 - INFO - __main__ - Step 34771: {'lr': 0.0004419160435198963, 'samples': 6676032, 'steps': 34770, 'loss/train': 1.389635682106018} -08/30/2021 19:30:20 - INFO - __main__ - Step 34772: {'lr': 0.00044191264263715083, 'samples': 6676224, 'steps': 34771, 'loss/train': 1.2823338508605957} -08/30/2021 19:30:21 - INFO - __main__ - Step 34773: {'lr': 0.00044190924166793245, 'samples': 6676416, 'steps': 34772, 'loss/train': 1.0687317848205566} -08/30/2021 19:30:21 - INFO - __main__ - Step 34774: {'lr': 0.00044190584061224277, 'samples': 6676608, 'steps': 34773, 'loss/train': 0.6831493973731995} -08/30/2021 19:30:22 - INFO - __main__ - Step 34775: {'lr': 0.0004419024394700833, 'samples': 6676800, 'steps': 34774, 'loss/train': 1.4117400646209717} -08/30/2021 19:30:22 - INFO - __main__ - Step 34776: {'lr': 0.0004418990382414555, 'samples': 6676992, 'steps': 34775, 'loss/train': 1.9957515001296997} -08/30/2021 19:30:22 - INFO - __main__ - Step 34777: {'lr': 0.000441895636926361, 'samples': 6677184, 'steps': 34776, 'loss/train': 1.2460740804672241} -08/30/2021 19:30:24 - INFO - __main__ - Step 34778: {'lr': 0.0004418922355248013, 'samples': 6677376, 'steps': 34777, 'loss/train': 2.4083032608032227} -08/30/2021 19:30:24 - INFO - __main__ - Step 34779: {'lr': 0.00044188883403677783, 'samples': 6677568, 'steps': 34778, 'loss/train': 1.159144401550293} -08/30/2021 19:30:25 - INFO - __main__ - Step 34780: {'lr': 0.0004418854324622923, 'samples': 6677760, 'steps': 34779, 'loss/train': 0.7860084176063538} -08/30/2021 19:30:25 - INFO - __main__ - Step 34781: {'lr': 0.0004418820308013461, 'samples': 6677952, 'steps': 34780, 'loss/train': 0.6624705195426941} -08/30/2021 19:30:25 - INFO - __main__ - Step 34782: {'lr': 0.0004418786290539408, 'samples': 6678144, 'steps': 34781, 'loss/train': 1.468929409980774} -08/30/2021 19:30:27 - INFO - __main__ - Step 34783: {'lr': 0.000441875227220078, 'samples': 6678336, 'steps': 34782, 'loss/train': 1.6640392541885376} -08/30/2021 19:30:27 - INFO - __main__ - Step 34784: {'lr': 0.00044187182529975924, 'samples': 6678528, 'steps': 34783, 'loss/train': 1.5427321195602417} -08/30/2021 19:30:28 - INFO - __main__ - Step 34785: {'lr': 0.00044186842329298594, 'samples': 6678720, 'steps': 34784, 'loss/train': 1.402348518371582} -08/30/2021 19:30:28 - INFO - __main__ - Step 34786: {'lr': 0.0004418650211997596, 'samples': 6678912, 'steps': 34785, 'loss/train': 0.3444991707801819} -08/30/2021 19:30:28 - INFO - __main__ - Step 34787: {'lr': 0.00044186161902008193, 'samples': 6679104, 'steps': 34786, 'loss/train': 0.8967769742012024} -08/30/2021 19:30:30 - INFO - __main__ - Step 34788: {'lr': 0.0004418582167539544, 'samples': 6679296, 'steps': 34787, 'loss/train': 0.791840672492981} -08/30/2021 19:30:30 - INFO - __main__ - Step 34789: {'lr': 0.00044185481440137846, 'samples': 6679488, 'steps': 34788, 'loss/train': 1.4772237539291382} -08/30/2021 19:30:31 - INFO - __main__ - Step 34790: {'lr': 0.0004418514119623557, 'samples': 6679680, 'steps': 34789, 'loss/train': 1.569371223449707} -08/30/2021 19:30:31 - INFO - __main__ - Step 34791: {'lr': 0.00044184800943688774, 'samples': 6679872, 'steps': 34790, 'loss/train': 1.5514798164367676} -08/30/2021 19:30:31 - INFO - __main__ - Step 34792: {'lr': 0.00044184460682497595, 'samples': 6680064, 'steps': 34791, 'loss/train': 1.2580409049987793} -08/30/2021 19:30:33 - INFO - __main__ - Step 34793: {'lr': 0.00044184120412662196, 'samples': 6680256, 'steps': 34792, 'loss/train': 1.6579335927963257} -08/30/2021 19:30:34 - INFO - __main__ - Step 34794: {'lr': 0.00044183780134182725, 'samples': 6680448, 'steps': 34793, 'loss/train': 1.4819539785385132} -08/30/2021 19:30:34 - INFO - __main__ - Step 34795: {'lr': 0.0004418343984705935, 'samples': 6680640, 'steps': 34794, 'loss/train': 1.9057198762893677} -08/30/2021 19:30:34 - INFO - __main__ - Step 34796: {'lr': 0.000441830995512922, 'samples': 6680832, 'steps': 34795, 'loss/train': 1.8886874914169312} -08/30/2021 19:30:35 - INFO - __main__ - Step 34797: {'lr': 0.00044182759246881446, 'samples': 6681024, 'steps': 34796, 'loss/train': 0.026153258979320526} -08/30/2021 19:30:35 - INFO - __main__ - Step 34798: {'lr': 0.0004418241893382724, 'samples': 6681216, 'steps': 34797, 'loss/train': 1.4936158657073975} -08/30/2021 19:30:35 - INFO - __main__ - Step 34799: {'lr': 0.0004418207861212973, 'samples': 6681408, 'steps': 34798, 'loss/train': 1.608742594718933} -08/30/2021 19:30:37 - INFO - __main__ - Step 34800: {'lr': 0.0004418173828178906, 'samples': 6681600, 'steps': 34799, 'loss/train': 1.6500439643859863} -08/30/2021 19:30:37 - INFO - __main__ - Step 34801: {'lr': 0.0004418139794280541, 'samples': 6681792, 'steps': 34800, 'loss/train': 1.565674066543579} -08/30/2021 19:30:38 - INFO - __main__ - Step 34802: {'lr': 0.0004418105759517892, 'samples': 6681984, 'steps': 34801, 'loss/train': 1.2757917642593384} -08/30/2021 19:30:38 - INFO - __main__ - Step 34803: {'lr': 0.0004418071723890973, 'samples': 6682176, 'steps': 34802, 'loss/train': 1.5636024475097656} -08/30/2021 19:30:39 - INFO - __main__ - Step 34804: {'lr': 0.0004418037687399801, 'samples': 6682368, 'steps': 34803, 'loss/train': 0.6732167601585388} -08/30/2021 19:30:40 - INFO - __main__ - Step 34805: {'lr': 0.0004418003650044391, 'samples': 6682560, 'steps': 34804, 'loss/train': 1.4263074398040771} -08/30/2021 19:30:41 - INFO - __main__ - Step 34806: {'lr': 0.0004417969611824758, 'samples': 6682752, 'steps': 34805, 'loss/train': 1.2235455513000488} -08/30/2021 19:30:41 - INFO - __main__ - Step 34807: {'lr': 0.00044179355727409173, 'samples': 6682944, 'steps': 34806, 'loss/train': 1.2955653667449951} -08/30/2021 19:30:41 - INFO - __main__ - Step 34808: {'lr': 0.00044179015327928847, 'samples': 6683136, 'steps': 34807, 'loss/train': 1.1689554452896118} -08/30/2021 19:30:42 - INFO - __main__ - Step 34809: {'lr': 0.0004417867491980675, 'samples': 6683328, 'steps': 34808, 'loss/train': 1.5134466886520386} -08/30/2021 19:30:43 - INFO - __main__ - Step 34810: {'lr': 0.0004417833450304304, 'samples': 6683520, 'steps': 34809, 'loss/train': 1.5974912643432617} -08/30/2021 19:30:44 - INFO - __main__ - Step 34811: {'lr': 0.0004417799407763786, 'samples': 6683712, 'steps': 34810, 'loss/train': 0.7585117220878601} -08/30/2021 19:30:44 - INFO - __main__ - Step 34812: {'lr': 0.00044177653643591387, 'samples': 6683904, 'steps': 34811, 'loss/train': 1.289052963256836} -08/30/2021 19:30:44 - INFO - __main__ - Step 34813: {'lr': 0.00044177313200903745, 'samples': 6684096, 'steps': 34812, 'loss/train': 1.6717332601547241} -08/30/2021 19:30:45 - INFO - __main__ - Step 34814: {'lr': 0.0004417697274957511, 'samples': 6684288, 'steps': 34813, 'loss/train': 1.3906093835830688} -08/30/2021 19:30:46 - INFO - __main__ - Step 34815: {'lr': 0.0004417663228960562, 'samples': 6684480, 'steps': 34814, 'loss/train': 1.7551484107971191} -08/30/2021 19:30:47 - INFO - __main__ - Step 34816: {'lr': 0.0004417629182099545, 'samples': 6684672, 'steps': 34815, 'loss/train': 1.8394625186920166} -08/30/2021 19:30:47 - INFO - __main__ - Step 34817: {'lr': 0.00044175951343744725, 'samples': 6684864, 'steps': 34816, 'loss/train': 1.7801318168640137} -08/30/2021 19:30:47 - INFO - __main__ - Step 34818: {'lr': 0.0004417561085785362, 'samples': 6685056, 'steps': 34817, 'loss/train': 1.6029207706451416} -08/30/2021 19:30:48 - INFO - __main__ - Step 34819: {'lr': 0.0004417527036332227, 'samples': 6685248, 'steps': 34818, 'loss/train': 1.453639268875122} -08/30/2021 19:30:49 - INFO - __main__ - Step 34820: {'lr': 0.0004417492986015085, 'samples': 6685440, 'steps': 34819, 'loss/train': 1.3046061992645264} -08/30/2021 19:30:50 - INFO - __main__ - Step 34821: {'lr': 0.000441745893483395, 'samples': 6685632, 'steps': 34820, 'loss/train': 1.7073967456817627} -08/30/2021 19:30:50 - INFO - __main__ - Step 34822: {'lr': 0.00044174248827888376, 'samples': 6685824, 'steps': 34821, 'loss/train': 1.296985149383545} -08/30/2021 19:30:50 - INFO - __main__ - Step 34823: {'lr': 0.00044173908298797627, 'samples': 6686016, 'steps': 34822, 'loss/train': 1.2004714012145996} -08/30/2021 19:30:51 - INFO - __main__ - Step 34824: {'lr': 0.0004417356776106741, 'samples': 6686208, 'steps': 34823, 'loss/train': 1.5317583084106445} -08/30/2021 19:30:51 - INFO - __main__ - Step 34825: {'lr': 0.00044173227214697885, 'samples': 6686400, 'steps': 34824, 'loss/train': 1.8565694093704224} -08/30/2021 19:30:52 - INFO - __main__ - Step 34826: {'lr': 0.000441728866596892, 'samples': 6686592, 'steps': 34825, 'loss/train': 1.6611049175262451} -08/30/2021 19:30:53 - INFO - __main__ - Step 34827: {'lr': 0.00044172546096041504, 'samples': 6686784, 'steps': 34826, 'loss/train': 0.2876690626144409} -08/30/2021 19:30:53 - INFO - __main__ - Step 34828: {'lr': 0.0004417220552375496, 'samples': 6686976, 'steps': 34827, 'loss/train': 1.161854863166809} -08/30/2021 19:30:54 - INFO - __main__ - Step 34829: {'lr': 0.00044171864942829707, 'samples': 6687168, 'steps': 34828, 'loss/train': 1.7079987525939941} -08/30/2021 19:30:54 - INFO - __main__ - Step 34830: {'lr': 0.0004417152435326591, 'samples': 6687360, 'steps': 34829, 'loss/train': 1.3795909881591797} -08/30/2021 19:30:56 - INFO - __main__ - Step 34831: {'lr': 0.00044171183755063726, 'samples': 6687552, 'steps': 34830, 'loss/train': 1.8254364728927612} -08/30/2021 19:30:56 - INFO - __main__ - Step 34832: {'lr': 0.00044170843148223305, 'samples': 6687744, 'steps': 34831, 'loss/train': 1.633926510810852} -08/30/2021 19:30:57 - INFO - __main__ - Step 34833: {'lr': 0.0004417050253274479, 'samples': 6687936, 'steps': 34832, 'loss/train': 2.0371410846710205} -08/30/2021 19:30:57 - INFO - __main__ - Step 34834: {'lr': 0.00044170161908628345, 'samples': 6688128, 'steps': 34833, 'loss/train': 1.4808772802352905} -08/30/2021 19:30:58 - INFO - __main__ - Step 34835: {'lr': 0.0004416982127587412, 'samples': 6688320, 'steps': 34834, 'loss/train': 1.7261383533477783} -08/30/2021 19:30:59 - INFO - __main__ - Step 34836: {'lr': 0.00044169480634482274, 'samples': 6688512, 'steps': 34835, 'loss/train': 1.6901108026504517} -08/30/2021 19:30:59 - INFO - __main__ - Step 34837: {'lr': 0.0004416913998445294, 'samples': 6688704, 'steps': 34836, 'loss/train': 2.1727051734924316} -08/30/2021 19:31:00 - INFO - __main__ - Step 34838: {'lr': 0.000441687993257863, 'samples': 6688896, 'steps': 34837, 'loss/train': 1.5491070747375488} -08/30/2021 19:31:00 - INFO - __main__ - Step 34839: {'lr': 0.000441684586584825, 'samples': 6689088, 'steps': 34838, 'loss/train': 1.0219261646270752} -08/30/2021 19:31:01 - INFO - __main__ - Step 34840: {'lr': 0.0004416811798254168, 'samples': 6689280, 'steps': 34839, 'loss/train': 1.4175992012023926} -08/30/2021 19:31:02 - INFO - __main__ - Step 34841: {'lr': 0.00044167777297964006, 'samples': 6689472, 'steps': 34840, 'loss/train': 1.086851954460144} -08/30/2021 19:31:03 - INFO - __main__ - Step 34842: {'lr': 0.0004416743660474962, 'samples': 6689664, 'steps': 34841, 'loss/train': 1.172855257987976} -08/30/2021 19:31:03 - INFO - __main__ - Step 34843: {'lr': 0.0004416709590289869, 'samples': 6689856, 'steps': 34842, 'loss/train': 1.4749000072479248} -08/30/2021 19:31:04 - INFO - __main__ - Step 34844: {'lr': 0.00044166755192411364, 'samples': 6690048, 'steps': 34843, 'loss/train': 1.4386703968048096} -08/30/2021 19:31:04 - INFO - __main__ - Step 34845: {'lr': 0.00044166414473287784, 'samples': 6690240, 'steps': 34844, 'loss/train': 3.9213595390319824} -08/30/2021 19:31:04 - INFO - __main__ - Step 34846: {'lr': 0.0004416607374552812, 'samples': 6690432, 'steps': 34845, 'loss/train': 1.2432138919830322} -08/30/2021 19:31:06 - INFO - __main__ - Step 34847: {'lr': 0.00044165733009132524, 'samples': 6690624, 'steps': 34846, 'loss/train': 1.974619746208191} -08/30/2021 19:31:06 - INFO - __main__ - Step 34848: {'lr': 0.00044165392264101136, 'samples': 6690816, 'steps': 34847, 'loss/train': 2.2524802684783936} -08/30/2021 19:31:06 - INFO - __main__ - Step 34849: {'lr': 0.0004416505151043412, 'samples': 6691008, 'steps': 34848, 'loss/train': 1.4525641202926636} -08/30/2021 19:31:07 - INFO - __main__ - Step 34850: {'lr': 0.0004416471074813163, 'samples': 6691200, 'steps': 34849, 'loss/train': 1.4050114154815674} -08/30/2021 19:31:08 - INFO - __main__ - Step 34851: {'lr': 0.0004416436997719382, 'samples': 6691392, 'steps': 34850, 'loss/train': 1.9952603578567505} -08/30/2021 19:31:09 - INFO - __main__ - Step 34852: {'lr': 0.0004416402919762084, 'samples': 6691584, 'steps': 34851, 'loss/train': 1.2240517139434814} -08/30/2021 19:31:09 - INFO - __main__ - Step 34853: {'lr': 0.00044163688409412833, 'samples': 6691776, 'steps': 34852, 'loss/train': 1.0828030109405518} -08/30/2021 19:31:09 - INFO - __main__ - Step 34854: {'lr': 0.0004416334761256997, 'samples': 6691968, 'steps': 34853, 'loss/train': 1.1099767684936523} -08/30/2021 19:31:10 - INFO - __main__ - Step 34855: {'lr': 0.000441630068070924, 'samples': 6692160, 'steps': 34854, 'loss/train': 1.4822251796722412} -08/30/2021 19:31:10 - INFO - __main__ - Step 34856: {'lr': 0.0004416266599298028, 'samples': 6692352, 'steps': 34855, 'loss/train': 1.3974529504776} -08/30/2021 19:31:12 - INFO - __main__ - Step 34857: {'lr': 0.00044162325170233745, 'samples': 6692544, 'steps': 34856, 'loss/train': 1.701670527458191} -08/30/2021 19:31:12 - INFO - __main__ - Step 34858: {'lr': 0.00044161984338852967, 'samples': 6692736, 'steps': 34857, 'loss/train': 1.397925615310669} -08/30/2021 19:31:12 - INFO - __main__ - Step 34859: {'lr': 0.000441616434988381, 'samples': 6692928, 'steps': 34858, 'loss/train': 1.7587172985076904} -08/30/2021 19:31:13 - INFO - __main__ - Step 34860: {'lr': 0.00044161302650189295, 'samples': 6693120, 'steps': 34859, 'loss/train': 1.7492303848266602} -08/30/2021 19:31:13 - INFO - __main__ - Step 34861: {'lr': 0.00044160961792906694, 'samples': 6693312, 'steps': 34860, 'loss/train': 0.9920586943626404} -08/30/2021 19:31:15 - INFO - __main__ - Step 34862: {'lr': 0.00044160620926990456, 'samples': 6693504, 'steps': 34861, 'loss/train': 1.1697667837142944} -08/30/2021 19:31:15 - INFO - __main__ - Step 34863: {'lr': 0.0004416028005244075, 'samples': 6693696, 'steps': 34862, 'loss/train': 1.527687430381775} -08/30/2021 19:31:15 - INFO - __main__ - Step 34864: {'lr': 0.0004415993916925771, 'samples': 6693888, 'steps': 34863, 'loss/train': 1.2309246063232422} -08/30/2021 19:31:16 - INFO - __main__ - Step 34865: {'lr': 0.000441595982774415, 'samples': 6694080, 'steps': 34864, 'loss/train': 1.2404483556747437} -08/30/2021 19:31:16 - INFO - __main__ - Step 34866: {'lr': 0.00044159257376992267, 'samples': 6694272, 'steps': 34865, 'loss/train': 0.95048588514328} -08/30/2021 19:31:17 - INFO - __main__ - Step 34867: {'lr': 0.0004415891646791017, 'samples': 6694464, 'steps': 34866, 'loss/train': 1.4146426916122437} -08/30/2021 19:31:18 - INFO - __main__ - Step 34868: {'lr': 0.0004415857555019536, 'samples': 6694656, 'steps': 34867, 'loss/train': 1.2230663299560547} -08/30/2021 19:31:18 - INFO - __main__ - Step 34869: {'lr': 0.00044158234623847993, 'samples': 6694848, 'steps': 34868, 'loss/train': 1.3979012966156006} -08/30/2021 19:31:19 - INFO - __main__ - Step 34870: {'lr': 0.00044157893688868223, 'samples': 6695040, 'steps': 34869, 'loss/train': 1.5737814903259277} -08/30/2021 19:31:19 - INFO - __main__ - Step 34871: {'lr': 0.00044157552745256203, 'samples': 6695232, 'steps': 34870, 'loss/train': 1.2867834568023682} -08/30/2021 19:31:21 - INFO - __main__ - Step 34872: {'lr': 0.0004415721179301208, 'samples': 6695424, 'steps': 34871, 'loss/train': 1.8243038654327393} -08/30/2021 19:31:21 - INFO - __main__ - Step 34873: {'lr': 0.00044156870832136015, 'samples': 6695616, 'steps': 34872, 'loss/train': 1.4083529710769653} -08/30/2021 19:31:22 - INFO - __main__ - Step 34874: {'lr': 0.00044156529862628157, 'samples': 6695808, 'steps': 34873, 'loss/train': 1.1257758140563965} -08/30/2021 19:31:22 - INFO - __main__ - Step 34875: {'lr': 0.00044156188884488667, 'samples': 6696000, 'steps': 34874, 'loss/train': 0.5940538644790649} -08/30/2021 19:31:22 - INFO - __main__ - Step 34876: {'lr': 0.0004415584789771769, 'samples': 6696192, 'steps': 34875, 'loss/train': 1.5871161222457886} -08/30/2021 19:31:24 - INFO - __main__ - Step 34877: {'lr': 0.0004415550690231539, 'samples': 6696384, 'steps': 34876, 'loss/train': 1.7959715127944946} -08/30/2021 19:31:24 - INFO - __main__ - Step 34878: {'lr': 0.0004415516589828191, 'samples': 6696576, 'steps': 34877, 'loss/train': 1.8214266300201416} -08/30/2021 19:31:25 - INFO - __main__ - Step 34879: {'lr': 0.00044154824885617405, 'samples': 6696768, 'steps': 34878, 'loss/train': 1.333667278289795} -08/30/2021 19:31:25 - INFO - __main__ - Step 34880: {'lr': 0.0004415448386432204, 'samples': 6696960, 'steps': 34879, 'loss/train': 1.5091241598129272} -08/30/2021 19:31:25 - INFO - __main__ - Step 34881: {'lr': 0.00044154142834395947, 'samples': 6697152, 'steps': 34880, 'loss/train': 1.980600118637085} -08/30/2021 19:31:27 - INFO - __main__ - Step 34882: {'lr': 0.00044153801795839296, 'samples': 6697344, 'steps': 34881, 'loss/train': 1.2688275575637817} -08/30/2021 19:31:28 - INFO - __main__ - Step 34883: {'lr': 0.00044153460748652245, 'samples': 6697536, 'steps': 34882, 'loss/train': 1.6996781826019287} -08/30/2021 19:31:28 - INFO - __main__ - Step 34884: {'lr': 0.00044153119692834944, 'samples': 6697728, 'steps': 34883, 'loss/train': 1.1240493059158325} -08/30/2021 19:31:29 - INFO - __main__ - Step 34885: {'lr': 0.0004415277862838753, 'samples': 6697920, 'steps': 34884, 'loss/train': 1.2142804861068726} -08/30/2021 19:31:29 - INFO - __main__ - Step 34886: {'lr': 0.00044152437555310174, 'samples': 6698112, 'steps': 34885, 'loss/train': 1.9530127048492432} -08/30/2021 19:31:30 - INFO - __main__ - Step 34887: {'lr': 0.00044152096473603025, 'samples': 6698304, 'steps': 34886, 'loss/train': 1.6505686044692993} -08/30/2021 19:31:31 - INFO - __main__ - Step 34888: {'lr': 0.00044151755383266234, 'samples': 6698496, 'steps': 34887, 'loss/train': 1.431886076927185} -08/30/2021 19:31:31 - INFO - __main__ - Step 34889: {'lr': 0.0004415141428429997, 'samples': 6698688, 'steps': 34888, 'loss/train': 1.5804921388626099} -08/30/2021 19:31:32 - INFO - __main__ - Step 34890: {'lr': 0.0004415107317670436, 'samples': 6698880, 'steps': 34889, 'loss/train': 1.5146671533584595} -08/30/2021 19:31:32 - INFO - __main__ - Step 34891: {'lr': 0.0004415073206047958, 'samples': 6699072, 'steps': 34890, 'loss/train': 1.518310308456421} -08/30/2021 19:31:33 - INFO - __main__ - Step 34892: {'lr': 0.0004415039093562577, 'samples': 6699264, 'steps': 34891, 'loss/train': 0.8351407051086426} -08/30/2021 19:31:34 - INFO - __main__ - Step 34893: {'lr': 0.00044150049802143095, 'samples': 6699456, 'steps': 34892, 'loss/train': 0.9097894430160522} -08/30/2021 19:31:34 - INFO - __main__ - Step 34894: {'lr': 0.00044149708660031704, 'samples': 6699648, 'steps': 34893, 'loss/train': 1.442458987236023} -08/30/2021 19:31:35 - INFO - __main__ - Step 34895: {'lr': 0.0004414936750929174, 'samples': 6699840, 'steps': 34894, 'loss/train': 1.6313551664352417} -08/30/2021 19:31:35 - INFO - __main__ - Step 34896: {'lr': 0.0004414902634992338, 'samples': 6700032, 'steps': 34895, 'loss/train': 1.3373081684112549} -08/30/2021 19:31:35 - INFO - __main__ - Step 34897: {'lr': 0.0004414868518192675, 'samples': 6700224, 'steps': 34896, 'loss/train': 1.1038962602615356} -08/30/2021 19:31:37 - INFO - __main__ - Step 34898: {'lr': 0.0004414834400530203, 'samples': 6700416, 'steps': 34897, 'loss/train': 0.8443583250045776} -08/30/2021 19:31:37 - INFO - __main__ - Step 34899: {'lr': 0.00044148002820049354, 'samples': 6700608, 'steps': 34898, 'loss/train': 1.4998301267623901} -08/30/2021 19:31:37 - INFO - __main__ - Step 34900: {'lr': 0.00044147661626168887, 'samples': 6700800, 'steps': 34899, 'loss/train': 1.3775559663772583} -08/30/2021 19:31:38 - INFO - __main__ - Step 34901: {'lr': 0.0004414732042366078, 'samples': 6700992, 'steps': 34900, 'loss/train': 2.135401964187622} -08/30/2021 19:31:38 - INFO - __main__ - Step 34902: {'lr': 0.00044146979212525184, 'samples': 6701184, 'steps': 34901, 'loss/train': 1.555981993675232} -08/30/2021 19:31:40 - INFO - __main__ - Step 34903: {'lr': 0.0004414663799276225, 'samples': 6701376, 'steps': 34902, 'loss/train': 1.308225393295288} -08/30/2021 19:31:40 - INFO - __main__ - Step 34904: {'lr': 0.0004414629676437214, 'samples': 6701568, 'steps': 34903, 'loss/train': 1.3855127096176147} -08/30/2021 19:31:40 - INFO - __main__ - Step 34905: {'lr': 0.00044145955527355007, 'samples': 6701760, 'steps': 34904, 'loss/train': 1.6369949579238892} -08/30/2021 19:31:41 - INFO - __main__ - Step 34906: {'lr': 0.00044145614281711, 'samples': 6701952, 'steps': 34905, 'loss/train': 1.4939477443695068} -08/30/2021 19:31:41 - INFO - __main__ - Step 34907: {'lr': 0.00044145273027440275, 'samples': 6702144, 'steps': 34906, 'loss/train': 0.7918360233306885} -08/30/2021 19:31:43 - INFO - __main__ - Step 34908: {'lr': 0.0004414493176454298, 'samples': 6702336, 'steps': 34907, 'loss/train': 1.0705316066741943} -08/30/2021 19:31:43 - INFO - __main__ - Step 34909: {'lr': 0.0004414459049301929, 'samples': 6702528, 'steps': 34908, 'loss/train': 1.296346664428711} -08/30/2021 19:31:43 - INFO - __main__ - Step 34910: {'lr': 0.00044144249212869327, 'samples': 6702720, 'steps': 34909, 'loss/train': 1.7491952180862427} -08/30/2021 19:31:44 - INFO - __main__ - Step 34911: {'lr': 0.0004414390792409326, 'samples': 6702912, 'steps': 34910, 'loss/train': 1.4354376792907715} -08/30/2021 19:31:44 - INFO - __main__ - Step 34912: {'lr': 0.0004414356662669126, 'samples': 6703104, 'steps': 34911, 'loss/train': 1.414766788482666} -08/30/2021 19:31:46 - INFO - __main__ - Step 34913: {'lr': 0.0004414322532066345, 'samples': 6703296, 'steps': 34912, 'loss/train': 1.2923349142074585} -08/30/2021 19:31:46 - INFO - __main__ - Step 34914: {'lr': 0.0004414288400601, 'samples': 6703488, 'steps': 34913, 'loss/train': 1.2957944869995117} -08/30/2021 19:31:47 - INFO - __main__ - Step 34915: {'lr': 0.0004414254268273107, 'samples': 6703680, 'steps': 34914, 'loss/train': 1.2687324285507202} -08/30/2021 19:31:47 - INFO - __main__ - Step 34916: {'lr': 0.0004414220135082679, 'samples': 6703872, 'steps': 34915, 'loss/train': 1.5417463779449463} -08/30/2021 19:31:47 - INFO - __main__ - Step 34917: {'lr': 0.0004414186001029734, 'samples': 6704064, 'steps': 34916, 'loss/train': 2.081559896469116} -08/30/2021 19:31:49 - INFO - __main__ - Step 34918: {'lr': 0.00044141518661142864, 'samples': 6704256, 'steps': 34917, 'loss/train': 1.0758578777313232} -08/30/2021 19:31:49 - INFO - __main__ - Step 34919: {'lr': 0.0004414117730336351, 'samples': 6704448, 'steps': 34918, 'loss/train': 1.3303520679473877} -08/30/2021 19:31:50 - INFO - __main__ - Step 34920: {'lr': 0.0004414083593695944, 'samples': 6704640, 'steps': 34919, 'loss/train': 1.7778058052062988} -08/30/2021 19:31:50 - INFO - __main__ - Step 34921: {'lr': 0.0004414049456193081, 'samples': 6704832, 'steps': 34920, 'loss/train': 1.1302248239517212} -08/30/2021 19:31:50 - INFO - __main__ - Step 34922: {'lr': 0.00044140153178277765, 'samples': 6705024, 'steps': 34921, 'loss/train': 1.0757726430892944} -08/30/2021 19:31:51 - INFO - __main__ - Step 34923: {'lr': 0.0004413981178600046, 'samples': 6705216, 'steps': 34922, 'loss/train': 1.4501041173934937} -08/30/2021 19:31:52 - INFO - __main__ - Step 34924: {'lr': 0.00044139470385099047, 'samples': 6705408, 'steps': 34923, 'loss/train': 0.9826469421386719} -08/30/2021 19:31:53 - INFO - __main__ - Step 34925: {'lr': 0.0004413912897557369, 'samples': 6705600, 'steps': 34924, 'loss/train': 1.6712535619735718} -08/30/2021 19:31:53 - INFO - __main__ - Step 34926: {'lr': 0.0004413878755742454, 'samples': 6705792, 'steps': 34925, 'loss/train': 1.4016990661621094} -08/30/2021 19:31:53 - INFO - __main__ - Step 34927: {'lr': 0.00044138446130651736, 'samples': 6705984, 'steps': 34926, 'loss/train': 1.0843738317489624} -08/30/2021 19:31:54 - INFO - __main__ - Step 34928: {'lr': 0.00044138104695255455, 'samples': 6706176, 'steps': 34927, 'loss/train': 1.0599063634872437} -08/30/2021 19:31:55 - INFO - __main__ - Step 34929: {'lr': 0.00044137763251235837, 'samples': 6706368, 'steps': 34928, 'loss/train': 1.0353928804397583} -08/30/2021 19:31:56 - INFO - __main__ - Step 34930: {'lr': 0.0004413742179859304, 'samples': 6706560, 'steps': 34929, 'loss/train': 1.6535227298736572} -08/30/2021 19:31:56 - INFO - __main__ - Step 34931: {'lr': 0.00044137080337327205, 'samples': 6706752, 'steps': 34930, 'loss/train': 1.1370371580123901} -08/30/2021 19:31:56 - INFO - __main__ - Step 34932: {'lr': 0.000441367388674385, 'samples': 6706944, 'steps': 34931, 'loss/train': 1.3399639129638672} -08/30/2021 19:31:57 - INFO - __main__ - Step 34933: {'lr': 0.00044136397388927083, 'samples': 6707136, 'steps': 34932, 'loss/train': 1.2659764289855957} -08/30/2021 19:31:59 - INFO - __main__ - Step 34934: {'lr': 0.000441360559017931, 'samples': 6707328, 'steps': 34933, 'loss/train': 1.408302664756775} -08/30/2021 19:31:59 - INFO - __main__ - Step 34935: {'lr': 0.00044135714406036696, 'samples': 6707520, 'steps': 34934, 'loss/train': 0.8814275860786438} -08/30/2021 19:32:00 - INFO - __main__ - Step 34936: {'lr': 0.00044135372901658046, 'samples': 6707712, 'steps': 34935, 'loss/train': 1.4974032640457153} -08/30/2021 19:32:00 - INFO - __main__ - Step 34937: {'lr': 0.0004413503138865729, 'samples': 6707904, 'steps': 34936, 'loss/train': 1.4900633096694946} -08/30/2021 19:32:00 - INFO - __main__ - Step 34938: {'lr': 0.00044134689867034583, 'samples': 6708096, 'steps': 34937, 'loss/train': 1.1023952960968018} -08/30/2021 19:32:02 - INFO - __main__ - Step 34939: {'lr': 0.00044134348336790074, 'samples': 6708288, 'steps': 34938, 'loss/train': 1.4308836460113525} -08/30/2021 19:32:02 - INFO - __main__ - Step 34940: {'lr': 0.0004413400679792393, 'samples': 6708480, 'steps': 34939, 'loss/train': 1.3813395500183105} -08/30/2021 19:32:03 - INFO - __main__ - Step 34941: {'lr': 0.00044133665250436295, 'samples': 6708672, 'steps': 34940, 'loss/train': 1.0480033159255981} -08/30/2021 19:32:03 - INFO - __main__ - Step 34942: {'lr': 0.00044133323694327324, 'samples': 6708864, 'steps': 34941, 'loss/train': 1.8553470373153687} -08/30/2021 19:32:03 - INFO - __main__ - Step 34943: {'lr': 0.0004413298212959718, 'samples': 6709056, 'steps': 34942, 'loss/train': 0.9769366383552551} -08/30/2021 19:32:05 - INFO - __main__ - Step 34944: {'lr': 0.00044132640556246, 'samples': 6709248, 'steps': 34943, 'loss/train': 1.2747609615325928} -08/30/2021 19:32:05 - INFO - __main__ - Step 34945: {'lr': 0.00044132298974273955, 'samples': 6709440, 'steps': 34944, 'loss/train': 1.2658013105392456} -08/30/2021 19:32:06 - INFO - __main__ - Step 34946: {'lr': 0.00044131957383681186, 'samples': 6709632, 'steps': 34945, 'loss/train': 1.5538816452026367} -08/30/2021 19:32:06 - INFO - __main__ - Step 34947: {'lr': 0.0004413161578446785, 'samples': 6709824, 'steps': 34946, 'loss/train': 1.8017503023147583} -08/30/2021 19:32:07 - INFO - __main__ - Step 34948: {'lr': 0.00044131274176634113, 'samples': 6710016, 'steps': 34947, 'loss/train': 1.155334234237671} -08/30/2021 19:32:08 - INFO - __main__ - Step 34949: {'lr': 0.00044130932560180114, 'samples': 6710208, 'steps': 34948, 'loss/train': 0.075958751142025} -08/30/2021 19:32:09 - INFO - __main__ - Step 34950: {'lr': 0.0004413059093510601, 'samples': 6710400, 'steps': 34949, 'loss/train': 1.3488863706588745} -08/30/2021 19:32:09 - INFO - __main__ - Step 34951: {'lr': 0.00044130249301411957, 'samples': 6710592, 'steps': 34950, 'loss/train': 0.6622664928436279} -08/30/2021 19:32:09 - INFO - __main__ - Step 34952: {'lr': 0.0004412990765909811, 'samples': 6710784, 'steps': 34951, 'loss/train': 0.07370854169130325} -08/30/2021 19:32:10 - INFO - __main__ - Step 34953: {'lr': 0.0004412956600816462, 'samples': 6710976, 'steps': 34952, 'loss/train': 1.2174763679504395} -08/30/2021 19:32:10 - INFO - __main__ - Step 34954: {'lr': 0.00044129224348611644, 'samples': 6711168, 'steps': 34953, 'loss/train': 1.7220250368118286} -08/30/2021 19:32:12 - INFO - __main__ - Step 34955: {'lr': 0.0004412888268043934, 'samples': 6711360, 'steps': 34954, 'loss/train': 0.035442106425762177} -08/30/2021 19:32:12 - INFO - __main__ - Step 34956: {'lr': 0.0004412854100364785, 'samples': 6711552, 'steps': 34955, 'loss/train': 1.458470344543457} -08/30/2021 19:32:13 - INFO - __main__ - Step 34957: {'lr': 0.0004412819931823734, 'samples': 6711744, 'steps': 34956, 'loss/train': 1.0985313653945923} -08/30/2021 19:32:13 - INFO - __main__ - Step 34958: {'lr': 0.0004412785762420795, 'samples': 6711936, 'steps': 34957, 'loss/train': 1.5779829025268555} -08/30/2021 19:32:13 - INFO - __main__ - Step 34959: {'lr': 0.0004412751592155985, 'samples': 6712128, 'steps': 34958, 'loss/train': 1.0971028804779053} -08/30/2021 19:32:15 - INFO - __main__ - Step 34960: {'lr': 0.00044127174210293186, 'samples': 6712320, 'steps': 34959, 'loss/train': 1.132872223854065} -08/30/2021 19:32:15 - INFO - __main__ - Step 34961: {'lr': 0.0004412683249040811, 'samples': 6712512, 'steps': 34960, 'loss/train': 1.2651100158691406} -08/30/2021 19:32:16 - INFO - __main__ - Step 34962: {'lr': 0.0004412649076190478, 'samples': 6712704, 'steps': 34961, 'loss/train': 1.420601725578308} -08/30/2021 19:32:16 - INFO - __main__ - Step 34963: {'lr': 0.00044126149024783346, 'samples': 6712896, 'steps': 34962, 'loss/train': 1.4611116647720337} -08/30/2021 19:32:16 - INFO - __main__ - Step 34964: {'lr': 0.0004412580727904396, 'samples': 6713088, 'steps': 34963, 'loss/train': 1.36281418800354} -08/30/2021 19:32:18 - INFO - __main__ - Step 34965: {'lr': 0.0004412546552468679, 'samples': 6713280, 'steps': 34964, 'loss/train': 1.1717272996902466} -08/30/2021 19:32:18 - INFO - __main__ - Step 34966: {'lr': 0.00044125123761711975, 'samples': 6713472, 'steps': 34965, 'loss/train': 1.4397194385528564} -08/30/2021 19:32:19 - INFO - __main__ - Step 34967: {'lr': 0.00044124781990119677, 'samples': 6713664, 'steps': 34966, 'loss/train': 1.1725163459777832} -08/30/2021 19:32:19 - INFO - __main__ - Step 34968: {'lr': 0.0004412444020991004, 'samples': 6713856, 'steps': 34967, 'loss/train': 0.12758542597293854} -08/30/2021 19:32:19 - INFO - __main__ - Step 34969: {'lr': 0.0004412409842108324, 'samples': 6714048, 'steps': 34968, 'loss/train': 1.1853598356246948} -08/30/2021 19:32:21 - INFO - __main__ - Step 34970: {'lr': 0.0004412375662363941, 'samples': 6714240, 'steps': 34969, 'loss/train': 0.9862979650497437} -08/30/2021 19:32:21 - INFO - __main__ - Step 34971: {'lr': 0.00044123414817578705, 'samples': 6714432, 'steps': 34970, 'loss/train': 1.3713527917861938} -08/30/2021 19:32:22 - INFO - __main__ - Step 34972: {'lr': 0.00044123073002901286, 'samples': 6714624, 'steps': 34971, 'loss/train': 1.966863751411438} -08/30/2021 19:32:22 - INFO - __main__ - Step 34973: {'lr': 0.0004412273117960731, 'samples': 6714816, 'steps': 34972, 'loss/train': 1.3497530221939087} -08/30/2021 19:32:22 - INFO - __main__ - Step 34974: {'lr': 0.00044122389347696925, 'samples': 6715008, 'steps': 34973, 'loss/train': 1.4592618942260742} -08/30/2021 19:32:24 - INFO - __main__ - Step 34975: {'lr': 0.0004412204750717028, 'samples': 6715200, 'steps': 34974, 'loss/train': 1.2592018842697144} -08/30/2021 19:32:25 - INFO - __main__ - Step 34976: {'lr': 0.00044121705658027545, 'samples': 6715392, 'steps': 34975, 'loss/train': 0.8790485858917236} -08/30/2021 19:32:25 - INFO - __main__ - Step 34977: {'lr': 0.00044121363800268853, 'samples': 6715584, 'steps': 34976, 'loss/train': 1.33357572555542} -08/30/2021 19:32:25 - INFO - __main__ - Step 34978: {'lr': 0.0004412102193389438, 'samples': 6715776, 'steps': 34977, 'loss/train': 1.4491406679153442} -08/30/2021 19:32:26 - INFO - __main__ - Step 34979: {'lr': 0.0004412068005890427, 'samples': 6715968, 'steps': 34978, 'loss/train': 1.7957377433776855} -08/30/2021 19:32:26 - INFO - __main__ - Step 34980: {'lr': 0.0004412033817529867, 'samples': 6716160, 'steps': 34979, 'loss/train': 3.723341703414917} -08/30/2021 19:32:28 - INFO - __main__ - Step 34981: {'lr': 0.0004411999628307775, 'samples': 6716352, 'steps': 34980, 'loss/train': 2.0891482830047607} -08/30/2021 19:32:28 - INFO - __main__ - Step 34982: {'lr': 0.0004411965438224164, 'samples': 6716544, 'steps': 34981, 'loss/train': 2.0819387435913086} -08/30/2021 19:32:29 - INFO - __main__ - Step 34983: {'lr': 0.0004411931247279052, 'samples': 6716736, 'steps': 34982, 'loss/train': 1.2802892923355103} -08/30/2021 19:32:29 - INFO - __main__ - Step 34984: {'lr': 0.00044118970554724523, 'samples': 6716928, 'steps': 34983, 'loss/train': 0.2615245580673218} -08/30/2021 19:32:29 - INFO - __main__ - Step 34985: {'lr': 0.0004411862862804382, 'samples': 6717120, 'steps': 34984, 'loss/train': 1.3118356466293335} -08/30/2021 19:32:31 - INFO - __main__ - Step 34986: {'lr': 0.0004411828669274856, 'samples': 6717312, 'steps': 34985, 'loss/train': 0.8165215253829956} -08/30/2021 19:32:31 - INFO - __main__ - Step 34987: {'lr': 0.0004411794474883889, 'samples': 6717504, 'steps': 34986, 'loss/train': 1.1048524379730225} -08/30/2021 19:32:32 - INFO - __main__ - Step 34988: {'lr': 0.0004411760279631497, 'samples': 6717696, 'steps': 34987, 'loss/train': 1.797042727470398} -08/30/2021 19:32:32 - INFO - __main__ - Step 34989: {'lr': 0.0004411726083517696, 'samples': 6717888, 'steps': 34988, 'loss/train': 1.6182481050491333} -08/30/2021 19:32:32 - INFO - __main__ - Step 34990: {'lr': 0.00044116918865425004, 'samples': 6718080, 'steps': 34989, 'loss/train': 5.43362283706665} -08/30/2021 19:32:34 - INFO - __main__ - Step 34991: {'lr': 0.00044116576887059255, 'samples': 6718272, 'steps': 34990, 'loss/train': 1.5861461162567139} -08/30/2021 19:32:35 - INFO - __main__ - Step 34992: {'lr': 0.0004411623490007988, 'samples': 6718464, 'steps': 34991, 'loss/train': 1.012242078781128} -08/30/2021 19:32:35 - INFO - __main__ - Step 34993: {'lr': 0.0004411589290448701, 'samples': 6718656, 'steps': 34992, 'loss/train': 1.86570143699646} -08/30/2021 19:32:35 - INFO - __main__ - Step 34994: {'lr': 0.0004411555090028082, 'samples': 6718848, 'steps': 34993, 'loss/train': 1.142942190170288} -08/30/2021 19:32:36 - INFO - __main__ - Step 34995: {'lr': 0.00044115208887461464, 'samples': 6719040, 'steps': 34994, 'loss/train': 1.1457595825195312} -08/30/2021 19:32:37 - INFO - __main__ - Step 34996: {'lr': 0.00044114866866029086, 'samples': 6719232, 'steps': 34995, 'loss/train': 1.43965744972229} -08/30/2021 19:32:38 - INFO - __main__ - Step 34997: {'lr': 0.00044114524835983844, 'samples': 6719424, 'steps': 34996, 'loss/train': 1.3998771905899048} -08/30/2021 19:32:38 - INFO - __main__ - Step 34998: {'lr': 0.00044114182797325884, 'samples': 6719616, 'steps': 34997, 'loss/train': 1.418233871459961} -08/30/2021 19:32:38 - INFO - __main__ - Step 34999: {'lr': 0.0004411384075005538, 'samples': 6719808, 'steps': 34998, 'loss/train': 1.4251606464385986} -08/30/2021 19:32:39 - INFO - __main__ - Step 35000: {'lr': 0.0004411349869417247, 'samples': 6720000, 'steps': 34999, 'loss/train': 1.608568787574768} -08/30/2021 19:32:39 - INFO - __main__ - Step 35001: {'lr': 0.00044113156629677313, 'samples': 6720192, 'steps': 35000, 'loss/train': 1.2498257160186768} -08/30/2021 19:32:40 - INFO - __main__ - Step 35002: {'lr': 0.00044112814556570066, 'samples': 6720384, 'steps': 35001, 'loss/train': 1.1979851722717285} -08/30/2021 19:32:41 - INFO - __main__ - Step 35003: {'lr': 0.00044112472474850875, 'samples': 6720576, 'steps': 35002, 'loss/train': 1.4907722473144531} -08/30/2021 19:32:41 - INFO - __main__ - Step 35004: {'lr': 0.000441121303845199, 'samples': 6720768, 'steps': 35003, 'loss/train': 1.3451606035232544} -08/30/2021 19:32:42 - INFO - __main__ - Step 35005: {'lr': 0.0004411178828557729, 'samples': 6720960, 'steps': 35004, 'loss/train': 1.400999665260315} -08/30/2021 19:32:42 - INFO - __main__ - Step 35006: {'lr': 0.00044111446178023205, 'samples': 6721152, 'steps': 35005, 'loss/train': 1.5949101448059082} -08/30/2021 19:32:44 - INFO - __main__ - Step 35007: {'lr': 0.000441111040618578, 'samples': 6721344, 'steps': 35006, 'loss/train': 1.2730093002319336} -08/30/2021 19:32:44 - INFO - __main__ - Step 35008: {'lr': 0.0004411076193708122, 'samples': 6721536, 'steps': 35007, 'loss/train': 1.6350964307785034} -08/30/2021 19:32:45 - INFO - __main__ - Step 35009: {'lr': 0.00044110419803693635, 'samples': 6721728, 'steps': 35008, 'loss/train': 0.588362455368042} -08/30/2021 19:32:45 - INFO - __main__ - Step 35010: {'lr': 0.00044110077661695194, 'samples': 6721920, 'steps': 35009, 'loss/train': 0.6230650544166565} -08/30/2021 19:32:45 - INFO - __main__ - Step 35011: {'lr': 0.00044109735511086036, 'samples': 6722112, 'steps': 35010, 'loss/train': 0.5072710514068604} -08/30/2021 19:32:47 - INFO - __main__ - Step 35012: {'lr': 0.00044109393351866324, 'samples': 6722304, 'steps': 35011, 'loss/train': 1.3631649017333984} -08/30/2021 19:32:47 - INFO - __main__ - Step 35013: {'lr': 0.0004410905118403622, 'samples': 6722496, 'steps': 35012, 'loss/train': 2.4922847747802734} -08/30/2021 19:32:48 - INFO - __main__ - Step 35014: {'lr': 0.0004410870900759587, 'samples': 6722688, 'steps': 35013, 'loss/train': 1.4231981039047241} -08/30/2021 19:32:48 - INFO - __main__ - Step 35015: {'lr': 0.0004410836682254543, 'samples': 6722880, 'steps': 35014, 'loss/train': 1.2394388914108276} -08/30/2021 19:32:48 - INFO - __main__ - Step 35016: {'lr': 0.0004410802462888506, 'samples': 6723072, 'steps': 35015, 'loss/train': 1.2930346727371216} -08/30/2021 19:32:50 - INFO - __main__ - Step 35017: {'lr': 0.00044107682426614903, 'samples': 6723264, 'steps': 35016, 'loss/train': 1.2831521034240723} -08/30/2021 19:32:50 - INFO - __main__ - Step 35018: {'lr': 0.00044107340215735125, 'samples': 6723456, 'steps': 35017, 'loss/train': 0.6018421649932861} -08/30/2021 19:32:51 - INFO - __main__ - Step 35019: {'lr': 0.00044106997996245866, 'samples': 6723648, 'steps': 35018, 'loss/train': 1.442072868347168} -08/30/2021 19:32:51 - INFO - __main__ - Step 35020: {'lr': 0.000441066557681473, 'samples': 6723840, 'steps': 35019, 'loss/train': 1.624201774597168} -08/30/2021 19:32:51 - INFO - __main__ - Step 35021: {'lr': 0.00044106313531439565, 'samples': 6724032, 'steps': 35020, 'loss/train': 1.4344145059585571} -08/30/2021 19:32:53 - INFO - __main__ - Step 35022: {'lr': 0.00044105971286122816, 'samples': 6724224, 'steps': 35021, 'loss/train': 1.5966792106628418} -08/30/2021 19:32:53 - INFO - __main__ - Step 35023: {'lr': 0.00044105629032197214, 'samples': 6724416, 'steps': 35022, 'loss/train': 1.3417925834655762} -08/30/2021 19:32:54 - INFO - __main__ - Step 35024: {'lr': 0.0004410528676966291, 'samples': 6724608, 'steps': 35023, 'loss/train': 1.6505361795425415} -08/30/2021 19:32:54 - INFO - __main__ - Step 35025: {'lr': 0.00044104944498520054, 'samples': 6724800, 'steps': 35024, 'loss/train': 1.2967965602874756} -08/30/2021 19:32:54 - INFO - __main__ - Step 35026: {'lr': 0.00044104602218768805, 'samples': 6724992, 'steps': 35025, 'loss/train': 1.8254172801971436} -08/30/2021 19:32:56 - INFO - __main__ - Step 35027: {'lr': 0.0004410425993040933, 'samples': 6725184, 'steps': 35026, 'loss/train': 0.9522691369056702} -08/30/2021 19:32:56 - INFO - __main__ - Step 35028: {'lr': 0.0004410391763344176, 'samples': 6725376, 'steps': 35027, 'loss/train': 0.9665768146514893} -08/30/2021 19:32:57 - INFO - __main__ - Step 35029: {'lr': 0.00044103575327866264, 'samples': 6725568, 'steps': 35028, 'loss/train': 1.1050482988357544} -08/30/2021 19:32:57 - INFO - __main__ - Step 35030: {'lr': 0.0004410323301368299, 'samples': 6725760, 'steps': 35029, 'loss/train': 1.7607635259628296} -08/30/2021 19:32:57 - INFO - __main__ - Step 35031: {'lr': 0.0004410289069089209, 'samples': 6725952, 'steps': 35030, 'loss/train': 0.9335264563560486} -08/30/2021 19:32:59 - INFO - __main__ - Step 35032: {'lr': 0.0004410254835949372, 'samples': 6726144, 'steps': 35031, 'loss/train': 0.9821897745132446} -08/30/2021 19:32:59 - INFO - __main__ - Step 35033: {'lr': 0.00044102206019488045, 'samples': 6726336, 'steps': 35032, 'loss/train': 0.6056498289108276} -08/30/2021 19:33:00 - INFO - __main__ - Step 35034: {'lr': 0.00044101863670875207, 'samples': 6726528, 'steps': 35033, 'loss/train': 1.4131925106048584} -08/30/2021 19:33:00 - INFO - __main__ - Step 35035: {'lr': 0.0004410152131365536, 'samples': 6726720, 'steps': 35034, 'loss/train': 1.3641514778137207} -08/30/2021 19:33:00 - INFO - __main__ - Step 35036: {'lr': 0.00044101178947828667, 'samples': 6726912, 'steps': 35035, 'loss/train': 0.9625906944274902} -08/30/2021 19:33:01 - INFO - __main__ - Step 35037: {'lr': 0.0004410083657339528, 'samples': 6727104, 'steps': 35036, 'loss/train': 2.07183837890625} -08/30/2021 19:33:02 - INFO - __main__ - Step 35038: {'lr': 0.00044100494190355347, 'samples': 6727296, 'steps': 35037, 'loss/train': 0.5002424120903015} -08/30/2021 19:33:03 - INFO - __main__ - Step 35039: {'lr': 0.0004410015179870903, 'samples': 6727488, 'steps': 35038, 'loss/train': 1.127249836921692} -08/30/2021 19:33:03 - INFO - __main__ - Step 35040: {'lr': 0.0004409980939845647, 'samples': 6727680, 'steps': 35039, 'loss/train': 1.3199843168258667} -08/30/2021 19:33:03 - INFO - __main__ - Step 35041: {'lr': 0.00044099466989597837, 'samples': 6727872, 'steps': 35040, 'loss/train': 1.1282857656478882} -08/30/2021 19:33:04 - INFO - __main__ - Step 35042: {'lr': 0.00044099124572133283, 'samples': 6728064, 'steps': 35041, 'loss/train': 1.9509625434875488} -08/30/2021 19:33:06 - INFO - __main__ - Step 35043: {'lr': 0.00044098782146062955, 'samples': 6728256, 'steps': 35042, 'loss/train': 1.8122310638427734} -08/30/2021 19:33:06 - INFO - __main__ - Step 35044: {'lr': 0.00044098439711387006, 'samples': 6728448, 'steps': 35043, 'loss/train': 1.501436710357666} -08/30/2021 19:33:07 - INFO - __main__ - Step 35045: {'lr': 0.000440980972681056, 'samples': 6728640, 'steps': 35044, 'loss/train': 1.2846965789794922} -08/30/2021 19:33:07 - INFO - __main__ - Step 35046: {'lr': 0.0004409775481621888, 'samples': 6728832, 'steps': 35045, 'loss/train': 1.9868472814559937} -08/30/2021 19:33:07 - INFO - __main__ - Step 35047: {'lr': 0.0004409741235572701, 'samples': 6729024, 'steps': 35046, 'loss/train': 1.2437779903411865} -08/30/2021 19:33:09 - INFO - __main__ - Step 35048: {'lr': 0.0004409706988663015, 'samples': 6729216, 'steps': 35047, 'loss/train': 1.5886855125427246} -08/30/2021 19:33:09 - INFO - __main__ - Step 35049: {'lr': 0.00044096727408928426, 'samples': 6729408, 'steps': 35048, 'loss/train': 1.4767874479293823} -08/30/2021 19:33:10 - INFO - __main__ - Step 35050: {'lr': 0.0004409638492262202, 'samples': 6729600, 'steps': 35049, 'loss/train': 2.264859676361084} -08/30/2021 19:33:10 - INFO - __main__ - Step 35051: {'lr': 0.0004409604242771108, 'samples': 6729792, 'steps': 35050, 'loss/train': 1.2183133363723755} -08/30/2021 19:33:10 - INFO - __main__ - Step 35052: {'lr': 0.0004409569992419576, 'samples': 6729984, 'steps': 35051, 'loss/train': 1.7627239227294922} -08/30/2021 19:33:12 - INFO - __main__ - Step 35053: {'lr': 0.0004409535741207621, 'samples': 6730176, 'steps': 35052, 'loss/train': 1.620200514793396} -08/30/2021 19:33:12 - INFO - __main__ - Step 35054: {'lr': 0.00044095014891352584, 'samples': 6730368, 'steps': 35053, 'loss/train': 1.8186169862747192} -08/30/2021 19:33:12 - INFO - __main__ - Step 35055: {'lr': 0.0004409467236202505, 'samples': 6730560, 'steps': 35054, 'loss/train': 1.1668120622634888} -08/30/2021 19:33:13 - INFO - __main__ - Step 35056: {'lr': 0.0004409432982409374, 'samples': 6730752, 'steps': 35055, 'loss/train': 1.3651800155639648} -08/30/2021 19:33:13 - INFO - __main__ - Step 35057: {'lr': 0.0004409398727755882, 'samples': 6730944, 'steps': 35056, 'loss/train': 0.658411979675293} -08/30/2021 19:33:15 - INFO - __main__ - Step 35058: {'lr': 0.00044093644722420445, 'samples': 6731136, 'steps': 35057, 'loss/train': 1.2759971618652344} -08/30/2021 19:33:15 - INFO - __main__ - Step 35059: {'lr': 0.00044093302158678766, 'samples': 6731328, 'steps': 35058, 'loss/train': 1.3347318172454834} -08/30/2021 19:33:16 - INFO - __main__ - Step 35060: {'lr': 0.0004409295958633394, 'samples': 6731520, 'steps': 35059, 'loss/train': 0.04077564552426338} -08/30/2021 19:33:16 - INFO - __main__ - Step 35061: {'lr': 0.00044092617005386125, 'samples': 6731712, 'steps': 35060, 'loss/train': 0.03668401390314102} -08/30/2021 19:33:17 - INFO - __main__ - Step 35062: {'lr': 0.00044092274415835473, 'samples': 6731904, 'steps': 35061, 'loss/train': 1.5081043243408203} -08/30/2021 19:33:17 - INFO - __main__ - Step 35063: {'lr': 0.0004409193181768213, 'samples': 6732096, 'steps': 35062, 'loss/train': 1.809552550315857} -08/30/2021 19:33:18 - INFO - __main__ - Step 35064: {'lr': 0.00044091589210926266, 'samples': 6732288, 'steps': 35063, 'loss/train': 1.3295716047286987} -08/30/2021 19:33:19 - INFO - __main__ - Step 35065: {'lr': 0.00044091246595568025, 'samples': 6732480, 'steps': 35064, 'loss/train': 1.4741064310073853} -08/30/2021 19:33:19 - INFO - __main__ - Step 35066: {'lr': 0.00044090903971607555, 'samples': 6732672, 'steps': 35065, 'loss/train': 1.6967097520828247} -08/30/2021 19:33:20 - INFO - __main__ - Step 35067: {'lr': 0.0004409056133904502, 'samples': 6732864, 'steps': 35066, 'loss/train': 1.4284765720367432} -08/30/2021 19:33:20 - INFO - __main__ - Step 35068: {'lr': 0.00044090218697880577, 'samples': 6733056, 'steps': 35067, 'loss/train': 1.3743704557418823} -08/30/2021 19:33:21 - INFO - __main__ - Step 35069: {'lr': 0.0004408987604811437, 'samples': 6733248, 'steps': 35068, 'loss/train': 1.3716342449188232} -08/30/2021 19:33:22 - INFO - __main__ - Step 35070: {'lr': 0.00044089533389746573, 'samples': 6733440, 'steps': 35069, 'loss/train': 1.1787060499191284} -08/30/2021 19:33:22 - INFO - __main__ - Step 35071: {'lr': 0.00044089190722777316, 'samples': 6733632, 'steps': 35070, 'loss/train': 1.353332281112671} -08/30/2021 19:33:23 - INFO - __main__ - Step 35072: {'lr': 0.00044088848047206763, 'samples': 6733824, 'steps': 35071, 'loss/train': 1.9297947883605957} -08/30/2021 19:33:23 - INFO - __main__ - Step 35073: {'lr': 0.0004408850536303507, 'samples': 6734016, 'steps': 35072, 'loss/train': 1.4050127267837524} -08/30/2021 19:33:24 - INFO - __main__ - Step 35074: {'lr': 0.000440881626702624, 'samples': 6734208, 'steps': 35073, 'loss/train': 1.686198353767395} -08/30/2021 19:33:25 - INFO - __main__ - Step 35075: {'lr': 0.00044087819968888887, 'samples': 6734400, 'steps': 35074, 'loss/train': 1.3090829849243164} -08/30/2021 19:33:25 - INFO - __main__ - Step 35076: {'lr': 0.00044087477258914696, 'samples': 6734592, 'steps': 35075, 'loss/train': 1.817962884902954} -08/30/2021 19:33:25 - INFO - __main__ - Step 35077: {'lr': 0.00044087134540339996, 'samples': 6734784, 'steps': 35076, 'loss/train': 1.5255579948425293} -08/30/2021 19:33:26 - INFO - __main__ - Step 35078: {'lr': 0.00044086791813164916, 'samples': 6734976, 'steps': 35077, 'loss/train': 1.0958340167999268} -08/30/2021 19:33:27 - INFO - __main__ - Step 35079: {'lr': 0.00044086449077389636, 'samples': 6735168, 'steps': 35078, 'loss/train': 1.1610349416732788} -08/30/2021 19:33:28 - INFO - __main__ - Step 35080: {'lr': 0.0004408610633301428, 'samples': 6735360, 'steps': 35079, 'loss/train': 1.8730825185775757} -08/30/2021 19:33:28 - INFO - __main__ - Step 35081: {'lr': 0.00044085763580039027, 'samples': 6735552, 'steps': 35080, 'loss/train': 1.4571410417556763} -08/30/2021 19:33:29 - INFO - __main__ - Step 35082: {'lr': 0.0004408542081846402, 'samples': 6735744, 'steps': 35081, 'loss/train': 1.156598687171936} -08/30/2021 19:33:29 - INFO - __main__ - Step 35083: {'lr': 0.0004408507804828942, 'samples': 6735936, 'steps': 35082, 'loss/train': 0.732154130935669} -08/30/2021 19:33:29 - INFO - __main__ - Step 35084: {'lr': 0.00044084735269515375, 'samples': 6736128, 'steps': 35083, 'loss/train': 1.5006557703018188} -08/30/2021 19:33:31 - INFO - __main__ - Step 35085: {'lr': 0.0004408439248214205, 'samples': 6736320, 'steps': 35084, 'loss/train': 1.4012720584869385} -08/30/2021 19:33:31 - INFO - __main__ - Step 35086: {'lr': 0.00044084049686169584, 'samples': 6736512, 'steps': 35085, 'loss/train': 2.148707389831543} -08/30/2021 19:33:32 - INFO - __main__ - Step 35087: {'lr': 0.00044083706881598147, 'samples': 6736704, 'steps': 35086, 'loss/train': 1.2792222499847412} -08/30/2021 19:33:32 - INFO - __main__ - Step 35088: {'lr': 0.00044083364068427875, 'samples': 6736896, 'steps': 35087, 'loss/train': 0.6709632873535156} -08/30/2021 19:33:32 - INFO - __main__ - Step 35089: {'lr': 0.0004408302124665894, 'samples': 6737088, 'steps': 35088, 'loss/train': 1.5113765001296997} -08/30/2021 19:33:34 - INFO - __main__ - Step 35090: {'lr': 0.00044082678416291495, 'samples': 6737280, 'steps': 35089, 'loss/train': 0.6331438422203064} -08/30/2021 19:33:34 - INFO - __main__ - Step 35091: {'lr': 0.00044082335577325685, 'samples': 6737472, 'steps': 35090, 'loss/train': 1.594581127166748} -08/30/2021 19:33:34 - INFO - __main__ - Step 35092: {'lr': 0.0004408199272976167, 'samples': 6737664, 'steps': 35091, 'loss/train': 1.5178340673446655} -08/30/2021 19:33:35 - INFO - __main__ - Step 35093: {'lr': 0.00044081649873599604, 'samples': 6737856, 'steps': 35092, 'loss/train': 1.6615768671035767} -08/30/2021 19:33:35 - INFO - __main__ - Step 35094: {'lr': 0.0004408130700883964, 'samples': 6738048, 'steps': 35093, 'loss/train': 1.477236270904541} -08/30/2021 19:33:38 - INFO - __main__ - Step 35095: {'lr': 0.0004408096413548193, 'samples': 6738240, 'steps': 35094, 'loss/train': 0.9638330340385437} -08/30/2021 19:33:38 - INFO - __main__ - Step 35096: {'lr': 0.00044080621253526637, 'samples': 6738432, 'steps': 35095, 'loss/train': 0.21695414185523987} -08/30/2021 19:33:38 - INFO - __main__ - Step 35097: {'lr': 0.00044080278362973913, 'samples': 6738624, 'steps': 35096, 'loss/train': 0.15020699799060822} -08/30/2021 19:33:39 - INFO - __main__ - Step 35098: {'lr': 0.00044079935463823904, 'samples': 6738816, 'steps': 35097, 'loss/train': 1.3352291584014893} -08/30/2021 19:33:39 - INFO - __main__ - Step 35099: {'lr': 0.00044079592556076774, 'samples': 6739008, 'steps': 35098, 'loss/train': 1.5562607049942017} -08/30/2021 19:33:40 - INFO - __main__ - Step 35100: {'lr': 0.00044079249639732664, 'samples': 6739200, 'steps': 35099, 'loss/train': 1.4374668598175049} -08/30/2021 19:33:41 - INFO - __main__ - Step 35101: {'lr': 0.00044078906714791757, 'samples': 6739392, 'steps': 35100, 'loss/train': 0.06896452605724335} -08/30/2021 19:33:42 - INFO - __main__ - Step 35102: {'lr': 0.0004407856378125418, 'samples': 6739584, 'steps': 35101, 'loss/train': 1.990705966949463} -08/30/2021 19:33:42 - INFO - __main__ - Step 35103: {'lr': 0.00044078220839120086, 'samples': 6739776, 'steps': 35102, 'loss/train': 1.762894868850708} -08/30/2021 19:33:42 - INFO - __main__ - Step 35104: {'lr': 0.0004407787788838966, 'samples': 6739968, 'steps': 35103, 'loss/train': 1.6660062074661255} -08/30/2021 19:33:43 - INFO - __main__ - Step 35105: {'lr': 0.00044077534929063024, 'samples': 6740160, 'steps': 35104, 'loss/train': 1.545969843864441} -08/30/2021 19:33:44 - INFO - __main__ - Step 35106: {'lr': 0.00044077191961140337, 'samples': 6740352, 'steps': 35105, 'loss/train': 1.2282251119613647} -08/30/2021 19:33:45 - INFO - __main__ - Step 35107: {'lr': 0.00044076848984621775, 'samples': 6740544, 'steps': 35106, 'loss/train': 1.5219817161560059} -08/30/2021 19:33:45 - INFO - __main__ - Step 35108: {'lr': 0.00044076505999507474, 'samples': 6740736, 'steps': 35107, 'loss/train': 1.2070413827896118} -08/30/2021 19:33:45 - INFO - __main__ - Step 35109: {'lr': 0.00044076163005797597, 'samples': 6740928, 'steps': 35108, 'loss/train': 1.923166275024414} -08/30/2021 19:33:46 - INFO - __main__ - Step 35110: {'lr': 0.00044075820003492295, 'samples': 6741120, 'steps': 35109, 'loss/train': 1.5452156066894531} -08/30/2021 19:33:46 - INFO - __main__ - Step 35111: {'lr': 0.0004407547699259173, 'samples': 6741312, 'steps': 35110, 'loss/train': 2.220792770385742} -08/30/2021 19:33:48 - INFO - __main__ - Step 35112: {'lr': 0.0004407513397309604, 'samples': 6741504, 'steps': 35111, 'loss/train': 0.9561098217964172} -08/30/2021 19:33:48 - INFO - __main__ - Step 35113: {'lr': 0.0004407479094500539, 'samples': 6741696, 'steps': 35112, 'loss/train': 1.100181221961975} -08/30/2021 19:33:48 - INFO - __main__ - Step 35114: {'lr': 0.00044074447908319935, 'samples': 6741888, 'steps': 35113, 'loss/train': 1.4713833332061768} -08/30/2021 19:33:49 - INFO - __main__ - Step 35115: {'lr': 0.0004407410486303983, 'samples': 6742080, 'steps': 35114, 'loss/train': 1.253598690032959} -08/30/2021 19:33:49 - INFO - __main__ - Step 35116: {'lr': 0.0004407376180916522, 'samples': 6742272, 'steps': 35115, 'loss/train': 2.0496363639831543} -08/30/2021 19:33:50 - INFO - __main__ - Step 35117: {'lr': 0.0004407341874669627, 'samples': 6742464, 'steps': 35116, 'loss/train': 1.3307188749313354} -08/30/2021 19:33:51 - INFO - __main__ - Step 35118: {'lr': 0.00044073075675633134, 'samples': 6742656, 'steps': 35117, 'loss/train': 1.5264326333999634} -08/30/2021 19:33:51 - INFO - __main__ - Step 35119: {'lr': 0.0004407273259597597, 'samples': 6742848, 'steps': 35118, 'loss/train': 1.7594091892242432} -08/30/2021 19:33:52 - INFO - __main__ - Step 35120: {'lr': 0.0004407238950772492, 'samples': 6743040, 'steps': 35119, 'loss/train': 1.0203707218170166} -08/30/2021 19:33:52 - INFO - __main__ - Step 35121: {'lr': 0.00044072046410880143, 'samples': 6743232, 'steps': 35120, 'loss/train': 0.8387742042541504} -08/30/2021 19:33:53 - INFO - __main__ - Step 35122: {'lr': 0.000440717033054418, 'samples': 6743424, 'steps': 35121, 'loss/train': 1.977790117263794} -08/30/2021 19:33:54 - INFO - __main__ - Step 35123: {'lr': 0.0004407136019141005, 'samples': 6743616, 'steps': 35122, 'loss/train': 1.3198071718215942} -08/30/2021 19:33:54 - INFO - __main__ - Step 35124: {'lr': 0.0004407101706878502, 'samples': 6743808, 'steps': 35123, 'loss/train': 1.3572293519973755} -08/30/2021 19:33:55 - INFO - __main__ - Step 35125: {'lr': 0.000440706739375669, 'samples': 6744000, 'steps': 35124, 'loss/train': 1.7889180183410645} -08/30/2021 19:33:55 - INFO - __main__ - Step 35126: {'lr': 0.00044070330797755825, 'samples': 6744192, 'steps': 35125, 'loss/train': 1.328520655632019} -08/30/2021 19:33:57 - INFO - __main__ - Step 35127: {'lr': 0.0004406998764935195, 'samples': 6744384, 'steps': 35126, 'loss/train': 1.3321994543075562} -08/30/2021 19:33:57 - INFO - __main__ - Step 35128: {'lr': 0.0004406964449235544, 'samples': 6744576, 'steps': 35127, 'loss/train': 5.919016361236572} -08/30/2021 19:33:58 - INFO - __main__ - Step 35129: {'lr': 0.00044069301326766434, 'samples': 6744768, 'steps': 35128, 'loss/train': 5.838839054107666} -08/30/2021 19:33:58 - INFO - __main__ - Step 35130: {'lr': 0.00044068958152585104, 'samples': 6744960, 'steps': 35129, 'loss/train': 1.1469359397888184} -08/30/2021 19:33:59 - INFO - __main__ - Step 35131: {'lr': 0.00044068614969811586, 'samples': 6745152, 'steps': 35130, 'loss/train': 1.4037948846817017} -08/30/2021 19:33:59 - INFO - __main__ - Step 35132: {'lr': 0.0004406827177844605, 'samples': 6745344, 'steps': 35131, 'loss/train': 0.8167937994003296} -08/30/2021 19:34:01 - INFO - __main__ - Step 35133: {'lr': 0.00044067928578488645, 'samples': 6745536, 'steps': 35132, 'loss/train': 0.22708335518836975} -08/30/2021 19:34:01 - INFO - __main__ - Step 35134: {'lr': 0.0004406758536993952, 'samples': 6745728, 'steps': 35133, 'loss/train': 1.5980310440063477} -08/30/2021 19:34:01 - INFO - __main__ - Step 35135: {'lr': 0.00044067242152798843, 'samples': 6745920, 'steps': 35134, 'loss/train': 1.1887896060943604} -08/30/2021 19:34:02 - INFO - __main__ - Step 35136: {'lr': 0.00044066898927066757, 'samples': 6746112, 'steps': 35135, 'loss/train': 0.8095821738243103} -08/30/2021 19:34:02 - INFO - __main__ - Step 35137: {'lr': 0.0004406655569274342, 'samples': 6746304, 'steps': 35136, 'loss/train': 1.610980749130249} -08/30/2021 19:34:02 - INFO - __main__ - Step 35138: {'lr': 0.0004406621244982899, 'samples': 6746496, 'steps': 35137, 'loss/train': 1.263929843902588} -08/30/2021 19:34:04 - INFO - __main__ - Step 35139: {'lr': 0.00044065869198323614, 'samples': 6746688, 'steps': 35138, 'loss/train': 1.789681077003479} -08/30/2021 19:34:04 - INFO - __main__ - Step 35140: {'lr': 0.0004406552593822746, 'samples': 6746880, 'steps': 35139, 'loss/train': 1.6807105541229248} -08/30/2021 19:34:05 - INFO - __main__ - Step 35141: {'lr': 0.00044065182669540665, 'samples': 6747072, 'steps': 35140, 'loss/train': 1.8546452522277832} -08/30/2021 19:34:05 - INFO - __main__ - Step 35142: {'lr': 0.000440648393922634, 'samples': 6747264, 'steps': 35141, 'loss/train': 1.3173348903656006} -08/30/2021 19:34:07 - INFO - __main__ - Step 35143: {'lr': 0.0004406449610639581, 'samples': 6747456, 'steps': 35142, 'loss/train': 1.7653255462646484} -08/30/2021 19:34:07 - INFO - __main__ - Step 35144: {'lr': 0.0004406415281193805, 'samples': 6747648, 'steps': 35143, 'loss/train': 1.690947413444519} -08/30/2021 19:34:07 - INFO - __main__ - Step 35145: {'lr': 0.0004406380950889027, 'samples': 6747840, 'steps': 35144, 'loss/train': 0.0914091095328331} -08/30/2021 19:34:08 - INFO - __main__ - Step 35146: {'lr': 0.0004406346619725265, 'samples': 6748032, 'steps': 35145, 'loss/train': 2.2457568645477295} -08/30/2021 19:34:08 - INFO - __main__ - Step 35147: {'lr': 0.00044063122877025315, 'samples': 6748224, 'steps': 35146, 'loss/train': 0.06289371848106384} -08/30/2021 19:34:08 - INFO - __main__ - Step 35148: {'lr': 0.0004406277954820843, 'samples': 6748416, 'steps': 35147, 'loss/train': 1.475255012512207} -08/30/2021 19:34:10 - INFO - __main__ - Step 35149: {'lr': 0.0004406243621080216, 'samples': 6748608, 'steps': 35148, 'loss/train': 1.5640921592712402} -08/30/2021 19:34:10 - INFO - __main__ - Step 35150: {'lr': 0.00044062092864806634, 'samples': 6748800, 'steps': 35149, 'loss/train': 1.2072811126708984} -08/30/2021 19:34:11 - INFO - __main__ - Step 35151: {'lr': 0.00044061749510222037, 'samples': 6748992, 'steps': 35150, 'loss/train': 2.398737907409668} -08/30/2021 19:34:11 - INFO - __main__ - Step 35152: {'lr': 0.00044061406147048504, 'samples': 6749184, 'steps': 35151, 'loss/train': 1.7054141759872437} -08/30/2021 19:34:11 - INFO - __main__ - Step 35153: {'lr': 0.000440610627752862, 'samples': 6749376, 'steps': 35152, 'loss/train': 1.2718210220336914} -08/30/2021 19:34:13 - INFO - __main__ - Step 35154: {'lr': 0.00044060719394935265, 'samples': 6749568, 'steps': 35153, 'loss/train': 1.265812873840332} -08/30/2021 19:34:14 - INFO - __main__ - Step 35155: {'lr': 0.0004406037600599588, 'samples': 6749760, 'steps': 35154, 'loss/train': 1.229170560836792} -08/30/2021 19:34:14 - INFO - __main__ - Step 35156: {'lr': 0.0004406003260846817, 'samples': 6749952, 'steps': 35155, 'loss/train': 1.4863605499267578} -08/30/2021 19:34:15 - INFO - __main__ - Step 35157: {'lr': 0.0004405968920235231, 'samples': 6750144, 'steps': 35156, 'loss/train': 0.9780787229537964} -08/30/2021 19:34:15 - INFO - __main__ - Step 35158: {'lr': 0.0004405934578764845, 'samples': 6750336, 'steps': 35157, 'loss/train': 1.421268343925476} -08/30/2021 19:34:17 - INFO - __main__ - Step 35159: {'lr': 0.0004405900236435674, 'samples': 6750528, 'steps': 35158, 'loss/train': 1.925866961479187} -08/30/2021 19:34:17 - INFO - __main__ - Step 35160: {'lr': 0.00044058658932477336, 'samples': 6750720, 'steps': 35159, 'loss/train': 0.5766004323959351} -08/30/2021 19:34:18 - INFO - __main__ - Step 35161: {'lr': 0.0004405831549201039, 'samples': 6750912, 'steps': 35160, 'loss/train': 1.8874460458755493} -08/30/2021 19:34:18 - INFO - __main__ - Step 35162: {'lr': 0.0004405797204295607, 'samples': 6751104, 'steps': 35161, 'loss/train': 1.2231470346450806} -08/30/2021 19:34:18 - INFO - __main__ - Step 35163: {'lr': 0.0004405762858531451, 'samples': 6751296, 'steps': 35162, 'loss/train': 1.5750610828399658} -08/30/2021 19:34:20 - INFO - __main__ - Step 35164: {'lr': 0.00044057285119085887, 'samples': 6751488, 'steps': 35163, 'loss/train': 1.4553025960922241} -08/30/2021 19:34:20 - INFO - __main__ - Step 35165: {'lr': 0.0004405694164427035, 'samples': 6751680, 'steps': 35164, 'loss/train': 1.443730354309082} -08/30/2021 19:34:21 - INFO - __main__ - Step 35166: {'lr': 0.0004405659816086804, 'samples': 6751872, 'steps': 35165, 'loss/train': 1.6259300708770752} -08/30/2021 19:34:21 - INFO - __main__ - Step 35167: {'lr': 0.00044056254668879127, 'samples': 6752064, 'steps': 35166, 'loss/train': 2.0701069831848145} -08/30/2021 19:34:21 - INFO - __main__ - Step 35168: {'lr': 0.00044055911168303753, 'samples': 6752256, 'steps': 35167, 'loss/train': 2.03838849067688} -08/30/2021 19:34:22 - INFO - __main__ - Step 35169: {'lr': 0.00044055567659142083, 'samples': 6752448, 'steps': 35168, 'loss/train': 1.6455274820327759} -08/30/2021 19:34:23 - INFO - __main__ - Step 35170: {'lr': 0.0004405522414139427, 'samples': 6752640, 'steps': 35169, 'loss/train': 1.3178457021713257} -08/30/2021 19:34:24 - INFO - __main__ - Step 35171: {'lr': 0.0004405488061506047, 'samples': 6752832, 'steps': 35170, 'loss/train': 1.2635177373886108} -08/30/2021 19:34:24 - INFO - __main__ - Step 35172: {'lr': 0.0004405453708014082, 'samples': 6753024, 'steps': 35171, 'loss/train': 0.6742770075798035} -08/30/2021 19:34:24 - INFO - __main__ - Step 35173: {'lr': 0.00044054193536635503, 'samples': 6753216, 'steps': 35172, 'loss/train': 1.4755159616470337} -08/30/2021 19:34:25 - INFO - __main__ - Step 35174: {'lr': 0.00044053849984544653, 'samples': 6753408, 'steps': 35173, 'loss/train': 1.1763559579849243} -08/30/2021 19:34:26 - INFO - __main__ - Step 35175: {'lr': 0.0004405350642386844, 'samples': 6753600, 'steps': 35174, 'loss/train': 1.9033881425857544} -08/30/2021 19:34:27 - INFO - __main__ - Step 35176: {'lr': 0.00044053162854607004, 'samples': 6753792, 'steps': 35175, 'loss/train': 0.8928601145744324} -08/30/2021 19:34:27 - INFO - __main__ - Step 35177: {'lr': 0.0004405281927676051, 'samples': 6753984, 'steps': 35176, 'loss/train': 1.3737467527389526} -08/30/2021 19:34:28 - INFO - __main__ - Step 35178: {'lr': 0.0004405247569032911, 'samples': 6754176, 'steps': 35177, 'loss/train': 1.949627161026001} -08/30/2021 19:34:28 - INFO - __main__ - Step 35179: {'lr': 0.00044052132095312956, 'samples': 6754368, 'steps': 35178, 'loss/train': 1.8561934232711792} -08/30/2021 19:34:30 - INFO - __main__ - Step 35180: {'lr': 0.0004405178849171221, 'samples': 6754560, 'steps': 35179, 'loss/train': 0.24839358031749725} -08/30/2021 19:34:30 - INFO - __main__ - Step 35181: {'lr': 0.00044051444879527013, 'samples': 6754752, 'steps': 35180, 'loss/train': 0.61899334192276} -08/30/2021 19:34:31 - INFO - __main__ - Step 35182: {'lr': 0.00044051101258757544, 'samples': 6754944, 'steps': 35181, 'loss/train': 1.483779788017273} -08/30/2021 19:34:31 - INFO - __main__ - Step 35183: {'lr': 0.0004405075762940393, 'samples': 6755136, 'steps': 35182, 'loss/train': 0.9080450534820557} -08/30/2021 19:34:31 - INFO - __main__ - Step 35184: {'lr': 0.00044050413991466344, 'samples': 6755328, 'steps': 35183, 'loss/train': 1.2553569078445435} -08/30/2021 19:34:33 - INFO - __main__ - Step 35185: {'lr': 0.0004405007034494494, 'samples': 6755520, 'steps': 35184, 'loss/train': 2.0483922958374023} -08/30/2021 19:34:33 - INFO - __main__ - Step 35186: {'lr': 0.00044049726689839854, 'samples': 6755712, 'steps': 35185, 'loss/train': 0.9954208135604858} -08/30/2021 19:34:34 - INFO - __main__ - Step 35187: {'lr': 0.0004404938302615126, 'samples': 6755904, 'steps': 35186, 'loss/train': 1.5959469079971313} -08/30/2021 19:34:34 - INFO - __main__ - Step 35188: {'lr': 0.00044049039353879317, 'samples': 6756096, 'steps': 35187, 'loss/train': 1.2983096837997437} -08/30/2021 19:34:34 - INFO - __main__ - Step 35189: {'lr': 0.00044048695673024166, 'samples': 6756288, 'steps': 35188, 'loss/train': 1.1405982971191406} -08/30/2021 19:34:35 - INFO - __main__ - Step 35190: {'lr': 0.00044048351983585966, 'samples': 6756480, 'steps': 35189, 'loss/train': 4.97883939743042} -08/30/2021 19:34:36 - INFO - __main__ - Step 35191: {'lr': 0.00044048008285564865, 'samples': 6756672, 'steps': 35190, 'loss/train': 0.626621425151825} -08/30/2021 19:34:37 - INFO - __main__ - Step 35192: {'lr': 0.0004404766457896104, 'samples': 6756864, 'steps': 35191, 'loss/train': 1.7165340185165405} -08/30/2021 19:34:37 - INFO - __main__ - Step 35193: {'lr': 0.0004404732086377462, 'samples': 6757056, 'steps': 35192, 'loss/train': 1.673938274383545} -08/30/2021 19:34:37 - INFO - __main__ - Step 35194: {'lr': 0.00044046977140005774, 'samples': 6757248, 'steps': 35193, 'loss/train': 1.4433075189590454} -08/30/2021 19:34:38 - INFO - __main__ - Step 35195: {'lr': 0.00044046633407654657, 'samples': 6757440, 'steps': 35194, 'loss/train': 1.6284478902816772} -08/30/2021 19:34:39 - INFO - __main__ - Step 35196: {'lr': 0.0004404628966672142, 'samples': 6757632, 'steps': 35195, 'loss/train': 1.6464027166366577} -08/30/2021 19:34:40 - INFO - __main__ - Step 35197: {'lr': 0.0004404594591720622, 'samples': 6757824, 'steps': 35196, 'loss/train': 1.9045639038085938} -08/30/2021 19:34:40 - INFO - __main__ - Step 35198: {'lr': 0.00044045602159109207, 'samples': 6758016, 'steps': 35197, 'loss/train': 1.601232647895813} -08/30/2021 19:34:41 - INFO - __main__ - Step 35199: {'lr': 0.0004404525839243054, 'samples': 6758208, 'steps': 35198, 'loss/train': 1.32688307762146} -08/30/2021 19:34:41 - INFO - __main__ - Step 35200: {'lr': 0.00044044914617170374, 'samples': 6758400, 'steps': 35199, 'loss/train': 1.6576082706451416} -08/30/2021 19:34:42 - INFO - __main__ - Step 35201: {'lr': 0.00044044570833328865, 'samples': 6758592, 'steps': 35200, 'loss/train': 1.3306043148040771} -08/30/2021 19:34:43 - INFO - __main__ - Step 35202: {'lr': 0.00044044227040906166, 'samples': 6758784, 'steps': 35201, 'loss/train': 0.914250373840332} -08/30/2021 19:34:43 - INFO - __main__ - Step 35203: {'lr': 0.00044043883239902425, 'samples': 6758976, 'steps': 35202, 'loss/train': 2.131357431411743} -08/30/2021 19:34:44 - INFO - __main__ - Step 35204: {'lr': 0.00044043539430317814, 'samples': 6759168, 'steps': 35203, 'loss/train': 1.3784360885620117} -08/30/2021 19:34:44 - INFO - __main__ - Step 35205: {'lr': 0.00044043195612152475, 'samples': 6759360, 'steps': 35204, 'loss/train': 1.1162667274475098} -08/30/2021 19:34:46 - INFO - __main__ - Step 35206: {'lr': 0.0004404285178540657, 'samples': 6759552, 'steps': 35205, 'loss/train': 1.7808799743652344} -08/30/2021 19:34:46 - INFO - __main__ - Step 35207: {'lr': 0.0004404250795008024, 'samples': 6759744, 'steps': 35206, 'loss/train': 1.4750785827636719} -08/30/2021 19:34:47 - INFO - __main__ - Step 35208: {'lr': 0.00044042164106173655, 'samples': 6759936, 'steps': 35207, 'loss/train': 1.5423390865325928} -08/30/2021 19:34:47 - INFO - __main__ - Step 35209: {'lr': 0.00044041820253686964, 'samples': 6760128, 'steps': 35208, 'loss/train': 1.6783699989318848} -08/30/2021 19:34:47 - INFO - __main__ - Step 35210: {'lr': 0.0004404147639262032, 'samples': 6760320, 'steps': 35209, 'loss/train': 1.6512147188186646} -08/30/2021 19:34:49 - INFO - __main__ - Step 35211: {'lr': 0.00044041132522973885, 'samples': 6760512, 'steps': 35210, 'loss/train': 2.347942352294922} -08/30/2021 19:34:50 - INFO - __main__ - Step 35212: {'lr': 0.0004404078864474781, 'samples': 6760704, 'steps': 35211, 'loss/train': 1.5213650465011597} -08/30/2021 19:34:50 - INFO - __main__ - Step 35213: {'lr': 0.00044040444757942245, 'samples': 6760896, 'steps': 35212, 'loss/train': 0.9378730654716492} -08/30/2021 19:34:50 - INFO - __main__ - Step 35214: {'lr': 0.00044040100862557355, 'samples': 6761088, 'steps': 35213, 'loss/train': 0.8650201559066772} -08/30/2021 19:34:51 - INFO - __main__ - Step 35215: {'lr': 0.00044039756958593287, 'samples': 6761280, 'steps': 35214, 'loss/train': 1.0497382879257202} -08/30/2021 19:34:51 - INFO - __main__ - Step 35216: {'lr': 0.000440394130460502, 'samples': 6761472, 'steps': 35215, 'loss/train': 1.380338191986084} -08/30/2021 19:34:53 - INFO - __main__ - Step 35217: {'lr': 0.00044039069124928245, 'samples': 6761664, 'steps': 35216, 'loss/train': 0.4927540719509125} -08/30/2021 19:34:53 - INFO - __main__ - Step 35218: {'lr': 0.0004403872519522758, 'samples': 6761856, 'steps': 35217, 'loss/train': 1.8464901447296143} -08/30/2021 19:34:53 - INFO - __main__ - Step 35219: {'lr': 0.00044038381256948357, 'samples': 6762048, 'steps': 35218, 'loss/train': 1.7989280223846436} -08/30/2021 19:34:54 - INFO - __main__ - Step 35220: {'lr': 0.00044038037310090736, 'samples': 6762240, 'steps': 35219, 'loss/train': 1.262181043624878} -08/30/2021 19:34:54 - INFO - __main__ - Step 35221: {'lr': 0.00044037693354654863, 'samples': 6762432, 'steps': 35220, 'loss/train': 0.2169027179479599} -08/30/2021 19:34:55 - INFO - __main__ - Step 35222: {'lr': 0.0004403734939064091, 'samples': 6762624, 'steps': 35221, 'loss/train': 1.6021244525909424} -08/30/2021 19:34:56 - INFO - __main__ - Step 35223: {'lr': 0.00044037005418049016, 'samples': 6762816, 'steps': 35222, 'loss/train': 0.7446139454841614} -08/30/2021 19:34:56 - INFO - __main__ - Step 35224: {'lr': 0.00044036661436879334, 'samples': 6763008, 'steps': 35223, 'loss/train': 1.6979058980941772} -08/30/2021 19:34:57 - INFO - __main__ - Step 35225: {'lr': 0.00044036317447132035, 'samples': 6763200, 'steps': 35224, 'loss/train': 1.5907671451568604} -08/30/2021 19:34:57 - INFO - __main__ - Step 35226: {'lr': 0.00044035973448807266, 'samples': 6763392, 'steps': 35225, 'loss/train': 1.5446741580963135} -08/30/2021 19:34:57 - INFO - __main__ - Step 35227: {'lr': 0.00044035629441905173, 'samples': 6763584, 'steps': 35226, 'loss/train': 1.255882740020752} -08/30/2021 19:34:59 - INFO - __main__ - Step 35228: {'lr': 0.0004403528542642592, 'samples': 6763776, 'steps': 35227, 'loss/train': 1.9746030569076538} -08/30/2021 19:34:59 - INFO - __main__ - Step 35229: {'lr': 0.00044034941402369666, 'samples': 6763968, 'steps': 35228, 'loss/train': 0.7388115525245667} -08/30/2021 19:35:00 - INFO - __main__ - Step 35230: {'lr': 0.0004403459736973656, 'samples': 6764160, 'steps': 35229, 'loss/train': 1.0392111539840698} -08/30/2021 19:35:00 - INFO - __main__ - Step 35231: {'lr': 0.00044034253328526765, 'samples': 6764352, 'steps': 35230, 'loss/train': 1.14803946018219} -08/30/2021 19:35:00 - INFO - __main__ - Step 35232: {'lr': 0.00044033909278740416, 'samples': 6764544, 'steps': 35231, 'loss/train': 1.5649964809417725} -08/30/2021 19:35:02 - INFO - __main__ - Step 35233: {'lr': 0.0004403356522037769, 'samples': 6764736, 'steps': 35232, 'loss/train': 1.1752593517303467} -08/30/2021 19:35:02 - INFO - __main__ - Step 35234: {'lr': 0.00044033221153438727, 'samples': 6764928, 'steps': 35233, 'loss/train': 1.9982519149780273} -08/30/2021 19:35:03 - INFO - __main__ - Step 35235: {'lr': 0.00044032877077923696, 'samples': 6765120, 'steps': 35234, 'loss/train': 1.9026896953582764} -08/30/2021 19:35:03 - INFO - __main__ - Step 35236: {'lr': 0.0004403253299383274, 'samples': 6765312, 'steps': 35235, 'loss/train': 1.168999195098877} -08/30/2021 19:35:03 - INFO - __main__ - Step 35237: {'lr': 0.00044032188901166016, 'samples': 6765504, 'steps': 35236, 'loss/train': 1.1683205366134644} -08/30/2021 19:35:05 - INFO - __main__ - Step 35238: {'lr': 0.0004403184479992368, 'samples': 6765696, 'steps': 35237, 'loss/train': 2.364229917526245} -08/30/2021 19:35:05 - INFO - __main__ - Step 35239: {'lr': 0.000440315006901059, 'samples': 6765888, 'steps': 35238, 'loss/train': 1.3106727600097656} -08/30/2021 19:35:06 - INFO - __main__ - Step 35240: {'lr': 0.00044031156571712807, 'samples': 6766080, 'steps': 35239, 'loss/train': 1.5884283781051636} -08/30/2021 19:35:06 - INFO - __main__ - Step 35241: {'lr': 0.0004403081244474457, 'samples': 6766272, 'steps': 35240, 'loss/train': 1.3158551454544067} -08/30/2021 19:35:06 - INFO - __main__ - Step 35242: {'lr': 0.00044030468309201354, 'samples': 6766464, 'steps': 35241, 'loss/train': 1.2236522436141968} -08/30/2021 19:35:08 - INFO - __main__ - Step 35243: {'lr': 0.0004403012416508329, 'samples': 6766656, 'steps': 35242, 'loss/train': 1.473706603050232} -08/30/2021 19:35:09 - INFO - __main__ - Step 35244: {'lr': 0.00044029780012390553, 'samples': 6766848, 'steps': 35243, 'loss/train': 1.4110535383224487} -08/30/2021 19:35:09 - INFO - __main__ - Step 35245: {'lr': 0.0004402943585112329, 'samples': 6767040, 'steps': 35244, 'loss/train': 0.09369825571775436} -08/30/2021 19:35:09 - INFO - __main__ - Step 35246: {'lr': 0.0004402909168128165, 'samples': 6767232, 'steps': 35245, 'loss/train': 1.7193278074264526} -08/30/2021 19:35:10 - INFO - __main__ - Step 35247: {'lr': 0.00044028747502865794, 'samples': 6767424, 'steps': 35246, 'loss/train': 1.5147919654846191} -08/30/2021 19:35:11 - INFO - __main__ - Step 35248: {'lr': 0.0004402840331587589, 'samples': 6767616, 'steps': 35247, 'loss/train': 1.8174281120300293} -08/30/2021 19:35:12 - INFO - __main__ - Step 35249: {'lr': 0.0004402805912031207, 'samples': 6767808, 'steps': 35248, 'loss/train': 0.8487445712089539} -08/30/2021 19:35:12 - INFO - __main__ - Step 35250: {'lr': 0.0004402771491617451, 'samples': 6768000, 'steps': 35249, 'loss/train': 0.7927405834197998} -08/30/2021 19:35:12 - INFO - __main__ - Step 35251: {'lr': 0.0004402737070346335, 'samples': 6768192, 'steps': 35250, 'loss/train': 0.988335132598877} -08/30/2021 19:35:13 - INFO - __main__ - Step 35252: {'lr': 0.0004402702648217875, 'samples': 6768384, 'steps': 35251, 'loss/train': 1.369179129600525} -08/30/2021 19:35:13 - INFO - __main__ - Step 35253: {'lr': 0.00044026682252320864, 'samples': 6768576, 'steps': 35252, 'loss/train': 3.055659532546997} -08/30/2021 19:35:15 - INFO - __main__ - Step 35254: {'lr': 0.00044026338013889853, 'samples': 6768768, 'steps': 35253, 'loss/train': 1.8225443363189697} -08/30/2021 19:35:15 - INFO - __main__ - Step 35255: {'lr': 0.00044025993766885866, 'samples': 6768960, 'steps': 35254, 'loss/train': 1.828208565711975} -08/30/2021 19:35:16 - INFO - __main__ - Step 35256: {'lr': 0.00044025649511309064, 'samples': 6769152, 'steps': 35255, 'loss/train': 1.041124939918518} -08/30/2021 19:35:16 - INFO - __main__ - Step 35257: {'lr': 0.00044025305247159585, 'samples': 6769344, 'steps': 35256, 'loss/train': 1.5535945892333984} -08/30/2021 19:35:16 - INFO - __main__ - Step 35258: {'lr': 0.00044024960974437606, 'samples': 6769536, 'steps': 35257, 'loss/train': 0.07975805550813675} -08/30/2021 19:35:18 - INFO - __main__ - Step 35259: {'lr': 0.0004402461669314327, 'samples': 6769728, 'steps': 35258, 'loss/train': 1.6203875541687012} -08/30/2021 19:35:18 - INFO - __main__ - Step 35260: {'lr': 0.0004402427240327674, 'samples': 6769920, 'steps': 35259, 'loss/train': 1.3997536897659302} -08/30/2021 19:35:19 - INFO - __main__ - Step 35261: {'lr': 0.0004402392810483816, 'samples': 6770112, 'steps': 35260, 'loss/train': 1.4612407684326172} -08/30/2021 19:35:19 - INFO - __main__ - Step 35262: {'lr': 0.000440235837978277, 'samples': 6770304, 'steps': 35261, 'loss/train': 0.9268139600753784} -08/30/2021 19:35:20 - INFO - __main__ - Step 35263: {'lr': 0.00044023239482245504, 'samples': 6770496, 'steps': 35262, 'loss/train': 1.2010623216629028} -08/30/2021 19:35:21 - INFO - __main__ - Step 35264: {'lr': 0.0004402289515809172, 'samples': 6770688, 'steps': 35263, 'loss/train': 1.7011468410491943} -08/30/2021 19:35:22 - INFO - __main__ - Step 35265: {'lr': 0.00044022550825366526, 'samples': 6770880, 'steps': 35264, 'loss/train': 1.3645305633544922} -08/30/2021 19:35:22 - INFO - __main__ - Step 35266: {'lr': 0.0004402220648407006, 'samples': 6771072, 'steps': 35265, 'loss/train': 1.9016871452331543} -08/30/2021 19:35:22 - INFO - __main__ - Step 35267: {'lr': 0.00044021862134202485, 'samples': 6771264, 'steps': 35266, 'loss/train': 1.0431255102157593} -08/30/2021 19:35:23 - INFO - __main__ - Step 35268: {'lr': 0.00044021517775763943, 'samples': 6771456, 'steps': 35267, 'loss/train': 0.5561128258705139} -08/30/2021 19:35:25 - INFO - __main__ - Step 35269: {'lr': 0.00044021173408754604, 'samples': 6771648, 'steps': 35268, 'loss/train': 1.310693621635437} -08/30/2021 19:35:25 - INFO - __main__ - Step 35270: {'lr': 0.00044020829033174615, 'samples': 6771840, 'steps': 35269, 'loss/train': 1.2678537368774414} -08/30/2021 19:35:26 - INFO - __main__ - Step 35271: {'lr': 0.0004402048464902414, 'samples': 6772032, 'steps': 35270, 'loss/train': 0.8126941919326782} -08/30/2021 19:35:26 - INFO - __main__ - Step 35272: {'lr': 0.0004402014025630332, 'samples': 6772224, 'steps': 35271, 'loss/train': 1.036738395690918} -08/30/2021 19:35:26 - INFO - __main__ - Step 35273: {'lr': 0.00044019795855012325, 'samples': 6772416, 'steps': 35272, 'loss/train': 1.1602281332015991} -08/30/2021 19:35:27 - INFO - __main__ - Step 35274: {'lr': 0.00044019451445151305, 'samples': 6772608, 'steps': 35273, 'loss/train': 1.720868468284607} -08/30/2021 19:35:28 - INFO - __main__ - Step 35275: {'lr': 0.00044019107026720404, 'samples': 6772800, 'steps': 35274, 'loss/train': 1.3801974058151245} -08/30/2021 19:35:29 - INFO - __main__ - Step 35276: {'lr': 0.00044018762599719796, 'samples': 6772992, 'steps': 35275, 'loss/train': 1.4340863227844238} -08/30/2021 19:35:29 - INFO - __main__ - Step 35277: {'lr': 0.0004401841816414962, 'samples': 6773184, 'steps': 35276, 'loss/train': 1.6542479991912842} -08/30/2021 19:35:29 - INFO - __main__ - Step 35278: {'lr': 0.0004401807372001004, 'samples': 6773376, 'steps': 35277, 'loss/train': 0.8494566082954407} -08/30/2021 19:35:30 - INFO - __main__ - Step 35279: {'lr': 0.0004401772926730122, 'samples': 6773568, 'steps': 35278, 'loss/train': 1.38467276096344} -08/30/2021 19:35:31 - INFO - __main__ - Step 35280: {'lr': 0.0004401738480602329, 'samples': 6773760, 'steps': 35279, 'loss/train': 1.4366095066070557} -08/30/2021 19:35:32 - INFO - __main__ - Step 35281: {'lr': 0.0004401704033617643, 'samples': 6773952, 'steps': 35280, 'loss/train': 0.13203176856040955} -08/30/2021 19:35:32 - INFO - __main__ - Step 35282: {'lr': 0.0004401669585776078, 'samples': 6774144, 'steps': 35281, 'loss/train': 1.0327534675598145} -08/30/2021 19:35:33 - INFO - __main__ - Step 35283: {'lr': 0.000440163513707765, 'samples': 6774336, 'steps': 35282, 'loss/train': 1.26374351978302} -08/30/2021 19:35:33 - INFO - __main__ - Step 35284: {'lr': 0.00044016006875223745, 'samples': 6774528, 'steps': 35283, 'loss/train': 1.0519497394561768} -08/30/2021 19:35:35 - INFO - __main__ - Step 35285: {'lr': 0.00044015662371102676, 'samples': 6774720, 'steps': 35284, 'loss/train': 1.084066390991211} -08/30/2021 19:35:36 - INFO - __main__ - Step 35286: {'lr': 0.0004401531785841344, 'samples': 6774912, 'steps': 35285, 'loss/train': 2.0477452278137207} -08/30/2021 19:35:36 - INFO - __main__ - Step 35287: {'lr': 0.00044014973337156197, 'samples': 6775104, 'steps': 35286, 'loss/train': 1.5073790550231934} -08/30/2021 19:35:37 - INFO - __main__ - Step 35288: {'lr': 0.0004401462880733109, 'samples': 6775296, 'steps': 35287, 'loss/train': 0.7509042620658875} -08/30/2021 19:35:37 - INFO - __main__ - Step 35289: {'lr': 0.000440142842689383, 'samples': 6775488, 'steps': 35288, 'loss/train': 0.5955594778060913} -08/30/2021 19:35:37 - INFO - __main__ - Step 35290: {'lr': 0.00044013939721977957, 'samples': 6775680, 'steps': 35289, 'loss/train': 0.4908735156059265} -08/30/2021 19:35:38 - INFO - __main__ - Step 35291: {'lr': 0.0004401359516645023, 'samples': 6775872, 'steps': 35290, 'loss/train': 1.3419342041015625} -08/30/2021 19:35:39 - INFO - __main__ - Step 35292: {'lr': 0.0004401325060235527, 'samples': 6776064, 'steps': 35291, 'loss/train': 5.298120021820068} -08/30/2021 19:35:40 - INFO - __main__ - Step 35293: {'lr': 0.00044012906029693236, 'samples': 6776256, 'steps': 35292, 'loss/train': 1.2927677631378174} -08/30/2021 19:35:40 - INFO - __main__ - Step 35294: {'lr': 0.0004401256144846427, 'samples': 6776448, 'steps': 35293, 'loss/train': 1.2110918760299683} -08/30/2021 19:35:40 - INFO - __main__ - Step 35295: {'lr': 0.0004401221685866854, 'samples': 6776640, 'steps': 35294, 'loss/train': 2.1023428440093994} -08/30/2021 19:35:41 - INFO - __main__ - Step 35296: {'lr': 0.00044011872260306205, 'samples': 6776832, 'steps': 35295, 'loss/train': 1.1127710342407227} -08/30/2021 19:35:42 - INFO - __main__ - Step 35297: {'lr': 0.00044011527653377416, 'samples': 6777024, 'steps': 35296, 'loss/train': 1.0868569612503052} -08/30/2021 19:35:43 - INFO - __main__ - Step 35298: {'lr': 0.0004401118303788232, 'samples': 6777216, 'steps': 35297, 'loss/train': 1.801560640335083} -08/30/2021 19:35:43 - INFO - __main__ - Step 35299: {'lr': 0.00044010838413821075, 'samples': 6777408, 'steps': 35298, 'loss/train': 1.542335033416748} -08/30/2021 19:35:43 - INFO - __main__ - Step 35300: {'lr': 0.0004401049378119384, 'samples': 6777600, 'steps': 35299, 'loss/train': 0.08990535140037537} -08/30/2021 19:35:44 - INFO - __main__ - Step 35301: {'lr': 0.0004401014914000078, 'samples': 6777792, 'steps': 35300, 'loss/train': 0.26383742690086365} -08/30/2021 19:35:44 - INFO - __main__ - Step 35302: {'lr': 0.00044009804490242026, 'samples': 6777984, 'steps': 35301, 'loss/train': 1.709259033203125} -08/30/2021 19:35:46 - INFO - __main__ - Step 35303: {'lr': 0.00044009459831917755, 'samples': 6778176, 'steps': 35302, 'loss/train': 1.717235803604126} -08/30/2021 19:35:47 - INFO - __main__ - Step 35304: {'lr': 0.00044009115165028113, 'samples': 6778368, 'steps': 35303, 'loss/train': 0.8929498791694641} -08/30/2021 19:35:47 - INFO - __main__ - Step 35305: {'lr': 0.0004400877048957326, 'samples': 6778560, 'steps': 35304, 'loss/train': 1.6270958185195923} -08/30/2021 19:35:47 - INFO - __main__ - Step 35306: {'lr': 0.00044008425805553347, 'samples': 6778752, 'steps': 35305, 'loss/train': 1.4239238500595093} -08/30/2021 19:35:48 - INFO - __main__ - Step 35307: {'lr': 0.00044008081112968537, 'samples': 6778944, 'steps': 35306, 'loss/train': 1.2555062770843506} -08/30/2021 19:35:49 - INFO - __main__ - Step 35308: {'lr': 0.0004400773641181897, 'samples': 6779136, 'steps': 35307, 'loss/train': 1.2234728336334229} -08/30/2021 19:35:50 - INFO - __main__ - Step 35309: {'lr': 0.0004400739170210481, 'samples': 6779328, 'steps': 35308, 'loss/train': 1.640255093574524} -08/30/2021 19:35:50 - INFO - __main__ - Step 35310: {'lr': 0.00044007046983826213, 'samples': 6779520, 'steps': 35309, 'loss/train': 0.27572792768478394} -08/30/2021 19:35:51 - INFO - __main__ - Step 35311: {'lr': 0.0004400670225698333, 'samples': 6779712, 'steps': 35310, 'loss/train': 1.57471764087677} -08/30/2021 19:35:51 - INFO - __main__ - Step 35312: {'lr': 0.00044006357521576334, 'samples': 6779904, 'steps': 35311, 'loss/train': 1.2589054107666016} -08/30/2021 19:35:53 - INFO - __main__ - Step 35313: {'lr': 0.0004400601277760536, 'samples': 6780096, 'steps': 35312, 'loss/train': 2.064746618270874} -08/30/2021 19:35:53 - INFO - __main__ - Step 35314: {'lr': 0.0004400566802507057, 'samples': 6780288, 'steps': 35313, 'loss/train': 1.9095836877822876} -08/30/2021 19:35:53 - INFO - __main__ - Step 35315: {'lr': 0.0004400532326397211, 'samples': 6780480, 'steps': 35314, 'loss/train': 1.270258903503418} -08/30/2021 19:35:54 - INFO - __main__ - Step 35316: {'lr': 0.00044004978494310154, 'samples': 6780672, 'steps': 35315, 'loss/train': 1.4586715698242188} -08/30/2021 19:35:54 - INFO - __main__ - Step 35317: {'lr': 0.00044004633716084854, 'samples': 6780864, 'steps': 35316, 'loss/train': 2.2896289825439453} -08/30/2021 19:35:56 - INFO - __main__ - Step 35318: {'lr': 0.0004400428892929635, 'samples': 6781056, 'steps': 35317, 'loss/train': 1.3984524011611938} -08/30/2021 19:35:56 - INFO - __main__ - Step 35319: {'lr': 0.00044003944133944804, 'samples': 6781248, 'steps': 35318, 'loss/train': 1.5508476495742798} -08/30/2021 19:35:56 - INFO - __main__ - Step 35320: {'lr': 0.00044003599330030385, 'samples': 6781440, 'steps': 35319, 'loss/train': 1.4566360712051392} -08/30/2021 19:35:57 - INFO - __main__ - Step 35321: {'lr': 0.00044003254517553225, 'samples': 6781632, 'steps': 35320, 'loss/train': 1.2995983362197876} -08/30/2021 19:35:57 - INFO - __main__ - Step 35322: {'lr': 0.000440029096965135, 'samples': 6781824, 'steps': 35321, 'loss/train': 1.6833568811416626} -08/30/2021 19:35:58 - INFO - __main__ - Step 35323: {'lr': 0.0004400256486691135, 'samples': 6782016, 'steps': 35322, 'loss/train': 1.4694782495498657} -08/30/2021 19:35:59 - INFO - __main__ - Step 35324: {'lr': 0.0004400222002874695, 'samples': 6782208, 'steps': 35323, 'loss/train': 1.3471918106079102} -08/30/2021 19:36:00 - INFO - __main__ - Step 35325: {'lr': 0.0004400187518202043, 'samples': 6782400, 'steps': 35324, 'loss/train': 1.5700156688690186} -08/30/2021 19:36:00 - INFO - __main__ - Step 35326: {'lr': 0.00044001530326731966, 'samples': 6782592, 'steps': 35325, 'loss/train': 1.4041510820388794} -08/30/2021 19:36:00 - INFO - __main__ - Step 35327: {'lr': 0.00044001185462881707, 'samples': 6782784, 'steps': 35326, 'loss/train': 1.5778844356536865} -08/30/2021 19:36:01 - INFO - __main__ - Step 35328: {'lr': 0.000440008405904698, 'samples': 6782976, 'steps': 35327, 'loss/train': 1.3653637170791626} -08/30/2021 19:36:02 - INFO - __main__ - Step 35329: {'lr': 0.0004400049570949641, 'samples': 6783168, 'steps': 35328, 'loss/train': 1.2845649719238281} -08/30/2021 19:36:02 - INFO - __main__ - Step 35330: {'lr': 0.0004400015081996169, 'samples': 6783360, 'steps': 35329, 'loss/train': 1.058379888534546} -08/30/2021 19:36:03 - INFO - __main__ - Step 35331: {'lr': 0.000439998059218658, 'samples': 6783552, 'steps': 35330, 'loss/train': 1.6161878108978271} -08/30/2021 19:36:03 - INFO - __main__ - Step 35332: {'lr': 0.0004399946101520889, 'samples': 6783744, 'steps': 35331, 'loss/train': 0.4192153215408325} -08/30/2021 19:36:04 - INFO - __main__ - Step 35333: {'lr': 0.0004399911609999111, 'samples': 6783936, 'steps': 35332, 'loss/train': 1.5687097311019897} -08/30/2021 19:36:05 - INFO - __main__ - Step 35334: {'lr': 0.0004399877117621262, 'samples': 6784128, 'steps': 35333, 'loss/train': 1.4547446966171265} -08/30/2021 19:36:05 - INFO - __main__ - Step 35335: {'lr': 0.0004399842624387358, 'samples': 6784320, 'steps': 35334, 'loss/train': 1.9110000133514404} -08/30/2021 19:36:06 - INFO - __main__ - Step 35336: {'lr': 0.0004399808130297415, 'samples': 6784512, 'steps': 35335, 'loss/train': 1.5049439668655396} -08/30/2021 19:36:06 - INFO - __main__ - Step 35337: {'lr': 0.0004399773635351446, 'samples': 6784704, 'steps': 35336, 'loss/train': 1.6948868036270142} -08/30/2021 19:36:06 - INFO - __main__ - Step 35338: {'lr': 0.000439973913954947, 'samples': 6784896, 'steps': 35337, 'loss/train': 1.647794246673584} -08/30/2021 19:36:08 - INFO - __main__ - Step 35339: {'lr': 0.00043997046428915, 'samples': 6785088, 'steps': 35338, 'loss/train': 0.6966094374656677} -08/30/2021 19:36:08 - INFO - __main__ - Step 35340: {'lr': 0.00043996701453775526, 'samples': 6785280, 'steps': 35339, 'loss/train': 1.6490147113800049} -08/30/2021 19:36:09 - INFO - __main__ - Step 35341: {'lr': 0.0004399635647007643, 'samples': 6785472, 'steps': 35340, 'loss/train': 1.4258105754852295} -08/30/2021 19:36:09 - INFO - __main__ - Step 35342: {'lr': 0.00043996011477817875, 'samples': 6785664, 'steps': 35341, 'loss/train': 0.9135576486587524} -08/30/2021 19:36:10 - INFO - __main__ - Step 35343: {'lr': 0.0004399566647700001, 'samples': 6785856, 'steps': 35342, 'loss/train': 1.7830604314804077} -08/30/2021 19:36:12 - INFO - __main__ - Step 35344: {'lr': 0.00043995321467622984, 'samples': 6786048, 'steps': 35343, 'loss/train': 1.1424063444137573} -08/30/2021 19:36:12 - INFO - __main__ - Step 35345: {'lr': 0.00043994976449686964, 'samples': 6786240, 'steps': 35344, 'loss/train': 1.5647335052490234} -08/30/2021 19:36:12 - INFO - __main__ - Step 35346: {'lr': 0.000439946314231921, 'samples': 6786432, 'steps': 35345, 'loss/train': 0.2106710523366928} -08/30/2021 19:36:13 - INFO - __main__ - Step 35347: {'lr': 0.00043994286388138545, 'samples': 6786624, 'steps': 35346, 'loss/train': 1.7119828462600708} -08/30/2021 19:36:13 - INFO - __main__ - Step 35348: {'lr': 0.00043993941344526455, 'samples': 6786816, 'steps': 35347, 'loss/train': 1.407097578048706} -08/30/2021 19:36:14 - INFO - __main__ - Step 35349: {'lr': 0.00043993596292356, 'samples': 6787008, 'steps': 35348, 'loss/train': 1.2357357740402222} -08/30/2021 19:36:15 - INFO - __main__ - Step 35350: {'lr': 0.00043993251231627315, 'samples': 6787200, 'steps': 35349, 'loss/train': 1.7043943405151367} -08/30/2021 19:36:16 - INFO - __main__ - Step 35351: {'lr': 0.00043992906162340563, 'samples': 6787392, 'steps': 35350, 'loss/train': 1.9289575815200806} -08/30/2021 19:36:16 - INFO - __main__ - Step 35352: {'lr': 0.00043992561084495906, 'samples': 6787584, 'steps': 35351, 'loss/train': 2.431380033493042} -08/30/2021 19:36:16 - INFO - __main__ - Step 35353: {'lr': 0.0004399221599809349, 'samples': 6787776, 'steps': 35352, 'loss/train': 1.7876442670822144} -08/30/2021 19:36:17 - INFO - __main__ - Step 35354: {'lr': 0.0004399187090313348, 'samples': 6787968, 'steps': 35353, 'loss/train': 1.2761778831481934} -08/30/2021 19:36:19 - INFO - __main__ - Step 35355: {'lr': 0.00043991525799616017, 'samples': 6788160, 'steps': 35354, 'loss/train': 1.2068582773208618} -08/30/2021 19:36:19 - INFO - __main__ - Step 35356: {'lr': 0.0004399118068754127, 'samples': 6788352, 'steps': 35355, 'loss/train': 2.0843570232391357} -08/30/2021 19:36:20 - INFO - __main__ - Step 35357: {'lr': 0.0004399083556690939, 'samples': 6788544, 'steps': 35356, 'loss/train': 1.4274187088012695} -08/30/2021 19:36:20 - INFO - __main__ - Step 35358: {'lr': 0.0004399049043772053, 'samples': 6788736, 'steps': 35357, 'loss/train': 0.705751895904541} -08/30/2021 19:36:20 - INFO - __main__ - Step 35359: {'lr': 0.00043990145299974853, 'samples': 6788928, 'steps': 35358, 'loss/train': 1.1702861785888672} -08/30/2021 19:36:22 - INFO - __main__ - Step 35360: {'lr': 0.0004398980015367251, 'samples': 6789120, 'steps': 35359, 'loss/train': 1.231582760810852} -08/30/2021 19:36:22 - INFO - __main__ - Step 35361: {'lr': 0.00043989454998813655, 'samples': 6789312, 'steps': 35360, 'loss/train': 0.36591726541519165} -08/30/2021 19:36:23 - INFO - __main__ - Step 35362: {'lr': 0.00043989109835398444, 'samples': 6789504, 'steps': 35361, 'loss/train': 1.3209960460662842} -08/30/2021 19:36:23 - INFO - __main__ - Step 35363: {'lr': 0.0004398876466342703, 'samples': 6789696, 'steps': 35362, 'loss/train': 1.8163431882858276} -08/30/2021 19:36:24 - INFO - __main__ - Step 35364: {'lr': 0.0004398841948289958, 'samples': 6789888, 'steps': 35363, 'loss/train': 1.3110448122024536} -08/30/2021 19:36:24 - INFO - __main__ - Step 35365: {'lr': 0.0004398807429381623, 'samples': 6790080, 'steps': 35364, 'loss/train': 0.049749474972486496} -08/30/2021 19:36:26 - INFO - __main__ - Step 35366: {'lr': 0.0004398772909617715, 'samples': 6790272, 'steps': 35365, 'loss/train': 1.8331133127212524} -08/30/2021 19:36:27 - INFO - __main__ - Step 35367: {'lr': 0.00043987383889982495, 'samples': 6790464, 'steps': 35366, 'loss/train': 1.2132179737091064} -08/30/2021 19:36:27 - INFO - __main__ - Step 35368: {'lr': 0.00043987038675232415, 'samples': 6790656, 'steps': 35367, 'loss/train': 1.374467134475708} -08/30/2021 19:36:28 - INFO - __main__ - Step 35369: {'lr': 0.00043986693451927074, 'samples': 6790848, 'steps': 35368, 'loss/train': 0.34419572353363037} -08/30/2021 19:36:28 - INFO - __main__ - Step 35370: {'lr': 0.0004398634822006662, 'samples': 6791040, 'steps': 35369, 'loss/train': 0.25599876046180725} -08/30/2021 19:36:28 - INFO - __main__ - Step 35371: {'lr': 0.0004398600297965121, 'samples': 6791232, 'steps': 35370, 'loss/train': 1.0565998554229736} -08/30/2021 19:36:30 - INFO - __main__ - Step 35372: {'lr': 0.00043985657730680997, 'samples': 6791424, 'steps': 35371, 'loss/train': 1.3926738500595093} -08/30/2021 19:36:30 - INFO - __main__ - Step 35373: {'lr': 0.00043985312473156143, 'samples': 6791616, 'steps': 35372, 'loss/train': 1.0037105083465576} -08/30/2021 19:36:31 - INFO - __main__ - Step 35374: {'lr': 0.000439849672070768, 'samples': 6791808, 'steps': 35373, 'loss/train': 0.936872124671936} -08/30/2021 19:36:31 - INFO - __main__ - Step 35375: {'lr': 0.00043984621932443115, 'samples': 6792000, 'steps': 35374, 'loss/train': 1.5440009832382202} -08/30/2021 19:36:31 - INFO - __main__ - Step 35376: {'lr': 0.0004398427664925526, 'samples': 6792192, 'steps': 35375, 'loss/train': 1.294872760772705} -08/30/2021 19:36:32 - INFO - __main__ - Step 35377: {'lr': 0.0004398393135751338, 'samples': 6792384, 'steps': 35376, 'loss/train': 1.6850001811981201} -08/30/2021 19:36:33 - INFO - __main__ - Step 35378: {'lr': 0.0004398358605721764, 'samples': 6792576, 'steps': 35377, 'loss/train': 0.7377321720123291} -08/30/2021 19:36:34 - INFO - __main__ - Step 35379: {'lr': 0.00043983240748368186, 'samples': 6792768, 'steps': 35378, 'loss/train': 1.3044615983963013} -08/30/2021 19:36:34 - INFO - __main__ - Step 35380: {'lr': 0.0004398289543096518, 'samples': 6792960, 'steps': 35379, 'loss/train': 1.5079270601272583} -08/30/2021 19:36:34 - INFO - __main__ - Step 35381: {'lr': 0.0004398255010500877, 'samples': 6793152, 'steps': 35380, 'loss/train': 1.6334177255630493} -08/30/2021 19:36:35 - INFO - __main__ - Step 35382: {'lr': 0.00043982204770499114, 'samples': 6793344, 'steps': 35381, 'loss/train': 0.9073518514633179} -08/30/2021 19:36:36 - INFO - __main__ - Step 35383: {'lr': 0.0004398185942743637, 'samples': 6793536, 'steps': 35382, 'loss/train': 1.200181484222412} -08/30/2021 19:36:36 - INFO - __main__ - Step 35384: {'lr': 0.00043981514075820693, 'samples': 6793728, 'steps': 35383, 'loss/train': 0.6204242706298828} -08/30/2021 19:36:37 - INFO - __main__ - Step 35385: {'lr': 0.0004398116871565224, 'samples': 6793920, 'steps': 35384, 'loss/train': 0.8892233967781067} -08/30/2021 19:36:37 - INFO - __main__ - Step 35386: {'lr': 0.0004398082334693116, 'samples': 6794112, 'steps': 35385, 'loss/train': 1.8526052236557007} -08/30/2021 19:36:38 - INFO - __main__ - Step 35387: {'lr': 0.0004398047796965762, 'samples': 6794304, 'steps': 35386, 'loss/train': 1.7854810953140259} -08/30/2021 19:36:39 - INFO - __main__ - Step 35388: {'lr': 0.0004398013258383177, 'samples': 6794496, 'steps': 35387, 'loss/train': 1.622938632965088} -08/30/2021 19:36:40 - INFO - __main__ - Step 35389: {'lr': 0.0004397978718945377, 'samples': 6794688, 'steps': 35388, 'loss/train': 1.3173573017120361} -08/30/2021 19:36:40 - INFO - __main__ - Step 35390: {'lr': 0.0004397944178652376, 'samples': 6794880, 'steps': 35389, 'loss/train': 1.4173136949539185} -08/30/2021 19:36:40 - INFO - __main__ - Step 35391: {'lr': 0.0004397909637504191, 'samples': 6795072, 'steps': 35390, 'loss/train': 2.6413254737854004} -08/30/2021 19:36:41 - INFO - __main__ - Step 35392: {'lr': 0.00043978750955008374, 'samples': 6795264, 'steps': 35391, 'loss/train': 0.8653263449668884} -08/30/2021 19:36:42 - INFO - __main__ - Step 35393: {'lr': 0.00043978405526423305, 'samples': 6795456, 'steps': 35392, 'loss/train': 1.6237744092941284} -08/30/2021 19:36:43 - INFO - __main__ - Step 35394: {'lr': 0.0004397806008928686, 'samples': 6795648, 'steps': 35393, 'loss/train': 1.0248075723648071} -08/30/2021 19:36:43 - INFO - __main__ - Step 35395: {'lr': 0.00043977714643599194, 'samples': 6795840, 'steps': 35394, 'loss/train': 0.43009302020072937} -08/30/2021 19:36:44 - INFO - __main__ - Step 35396: {'lr': 0.0004397736918936046, 'samples': 6796032, 'steps': 35395, 'loss/train': 1.2525368928909302} -08/30/2021 19:36:44 - INFO - __main__ - Step 35397: {'lr': 0.0004397702372657082, 'samples': 6796224, 'steps': 35396, 'loss/train': 1.5758581161499023} -08/30/2021 19:36:45 - INFO - __main__ - Step 35398: {'lr': 0.00043976678255230417, 'samples': 6796416, 'steps': 35397, 'loss/train': 1.3603363037109375} -08/30/2021 19:36:46 - INFO - __main__ - Step 35399: {'lr': 0.0004397633277533942, 'samples': 6796608, 'steps': 35398, 'loss/train': 0.6953346729278564} -08/30/2021 19:36:46 - INFO - __main__ - Step 35400: {'lr': 0.0004397598728689799, 'samples': 6796800, 'steps': 35399, 'loss/train': 1.5138709545135498} -08/30/2021 19:36:47 - INFO - __main__ - Step 35401: {'lr': 0.0004397564178990626, 'samples': 6796992, 'steps': 35400, 'loss/train': 1.2172725200653076} -08/30/2021 19:36:47 - INFO - __main__ - Step 35402: {'lr': 0.0004397529628436441, 'samples': 6797184, 'steps': 35401, 'loss/train': 0.9983571767807007} -08/30/2021 19:36:49 - INFO - __main__ - Step 35403: {'lr': 0.0004397495077027258, 'samples': 6797376, 'steps': 35402, 'loss/train': 0.9644858241081238} -08/30/2021 19:36:49 - INFO - __main__ - Step 35404: {'lr': 0.0004397460524763093, 'samples': 6797568, 'steps': 35403, 'loss/train': 1.7141958475112915} -08/30/2021 19:36:49 - INFO - __main__ - Step 35405: {'lr': 0.00043974259716439613, 'samples': 6797760, 'steps': 35404, 'loss/train': 1.1593409776687622} -08/30/2021 19:36:50 - INFO - __main__ - Step 35406: {'lr': 0.0004397391417669878, 'samples': 6797952, 'steps': 35405, 'loss/train': 1.45179283618927} -08/30/2021 19:36:50 - INFO - __main__ - Step 35407: {'lr': 0.0004397356862840861, 'samples': 6798144, 'steps': 35406, 'loss/train': 1.4605265855789185} -08/30/2021 19:36:52 - INFO - __main__ - Step 35408: {'lr': 0.00043973223071569234, 'samples': 6798336, 'steps': 35407, 'loss/train': 1.7734060287475586} -08/30/2021 19:36:52 - INFO - __main__ - Step 35409: {'lr': 0.0004397287750618082, 'samples': 6798528, 'steps': 35408, 'loss/train': 0.7091401219367981} -08/30/2021 19:36:52 - INFO - __main__ - Step 35410: {'lr': 0.00043972531932243516, 'samples': 6798720, 'steps': 35409, 'loss/train': 2.148045063018799} -08/30/2021 19:36:53 - INFO - __main__ - Step 35411: {'lr': 0.00043972186349757484, 'samples': 6798912, 'steps': 35410, 'loss/train': 1.3229072093963623} -08/30/2021 19:36:53 - INFO - __main__ - Step 35412: {'lr': 0.0004397184075872288, 'samples': 6799104, 'steps': 35411, 'loss/train': 1.3060005903244019} -08/30/2021 19:36:53 - INFO - __main__ - Step 35413: {'lr': 0.0004397149515913985, 'samples': 6799296, 'steps': 35412, 'loss/train': 1.6305447816848755} -08/30/2021 19:36:55 - INFO - __main__ - Step 35414: {'lr': 0.0004397114955100856, 'samples': 6799488, 'steps': 35413, 'loss/train': 1.6426652669906616} -08/30/2021 19:36:56 - INFO - __main__ - Step 35415: {'lr': 0.00043970803934329167, 'samples': 6799680, 'steps': 35414, 'loss/train': 1.3134020566940308} -08/30/2021 19:36:56 - INFO - __main__ - Step 35416: {'lr': 0.00043970458309101825, 'samples': 6799872, 'steps': 35415, 'loss/train': 0.20792165398597717} -08/30/2021 19:36:57 - INFO - __main__ - Step 35417: {'lr': 0.0004397011267532668, 'samples': 6800064, 'steps': 35416, 'loss/train': 1.2112113237380981} -08/30/2021 19:36:57 - INFO - __main__ - Step 35418: {'lr': 0.00043969767033003894, 'samples': 6800256, 'steps': 35417, 'loss/train': 1.7336615324020386} -08/30/2021 19:36:58 - INFO - __main__ - Step 35419: {'lr': 0.0004396942138213363, 'samples': 6800448, 'steps': 35418, 'loss/train': 1.6246439218521118} -08/30/2021 19:36:59 - INFO - __main__ - Step 35420: {'lr': 0.00043969075722716033, 'samples': 6800640, 'steps': 35419, 'loss/train': 1.69806706905365} -08/30/2021 19:36:59 - INFO - __main__ - Step 35421: {'lr': 0.0004396873005475127, 'samples': 6800832, 'steps': 35420, 'loss/train': 1.445824384689331} -08/30/2021 19:37:00 - INFO - __main__ - Step 35422: {'lr': 0.00043968384378239477, 'samples': 6801024, 'steps': 35421, 'loss/train': 1.4318392276763916} -08/30/2021 19:37:00 - INFO - __main__ - Step 35423: {'lr': 0.00043968038693180834, 'samples': 6801216, 'steps': 35422, 'loss/train': 1.7666666507720947} -08/30/2021 19:37:02 - INFO - __main__ - Step 35424: {'lr': 0.00043967692999575484, 'samples': 6801408, 'steps': 35423, 'loss/train': 1.677564024925232} -08/30/2021 19:37:02 - INFO - __main__ - Step 35425: {'lr': 0.00043967347297423575, 'samples': 6801600, 'steps': 35424, 'loss/train': 0.8641349673271179} -08/30/2021 19:37:02 - INFO - __main__ - Step 35426: {'lr': 0.0004396700158672528, 'samples': 6801792, 'steps': 35425, 'loss/train': 2.300177574157715} -08/30/2021 19:37:03 - INFO - __main__ - Step 35427: {'lr': 0.0004396665586748075, 'samples': 6801984, 'steps': 35426, 'loss/train': 1.1048344373703003} -08/30/2021 19:37:03 - INFO - __main__ - Step 35428: {'lr': 0.0004396631013969013, 'samples': 6802176, 'steps': 35427, 'loss/train': 0.26490673422813416} -08/30/2021 19:37:05 - INFO - __main__ - Step 35429: {'lr': 0.0004396596440335359, 'samples': 6802368, 'steps': 35428, 'loss/train': 1.4350842237472534} -08/30/2021 19:37:05 - INFO - __main__ - Step 35430: {'lr': 0.00043965618658471276, 'samples': 6802560, 'steps': 35429, 'loss/train': 1.8680329322814941} -08/30/2021 19:37:05 - INFO - __main__ - Step 35431: {'lr': 0.0004396527290504334, 'samples': 6802752, 'steps': 35430, 'loss/train': 0.5671683549880981} -08/30/2021 19:37:06 - INFO - __main__ - Step 35432: {'lr': 0.00043964927143069955, 'samples': 6802944, 'steps': 35431, 'loss/train': 1.3406174182891846} -08/30/2021 19:37:06 - INFO - __main__ - Step 35433: {'lr': 0.0004396458137255126, 'samples': 6803136, 'steps': 35432, 'loss/train': 0.07098355144262314} -08/30/2021 19:37:07 - INFO - __main__ - Step 35434: {'lr': 0.0004396423559348742, 'samples': 6803328, 'steps': 35433, 'loss/train': 1.6706665754318237} -08/30/2021 19:37:08 - INFO - __main__ - Step 35435: {'lr': 0.0004396388980587859, 'samples': 6803520, 'steps': 35434, 'loss/train': 1.9187897443771362} -08/30/2021 19:37:08 - INFO - __main__ - Step 35436: {'lr': 0.0004396354400972492, 'samples': 6803712, 'steps': 35435, 'loss/train': 1.5230586528778076} -08/30/2021 19:37:09 - INFO - __main__ - Step 35437: {'lr': 0.0004396319820502657, 'samples': 6803904, 'steps': 35436, 'loss/train': 1.3035917282104492} -08/30/2021 19:37:09 - INFO - __main__ - Step 35438: {'lr': 0.000439628523917837, 'samples': 6804096, 'steps': 35437, 'loss/train': 1.4326589107513428} -08/30/2021 19:37:10 - INFO - __main__ - Step 35439: {'lr': 0.0004396250656999646, 'samples': 6804288, 'steps': 35438, 'loss/train': 1.3794828653335571} -08/30/2021 19:37:11 - INFO - __main__ - Step 35440: {'lr': 0.00043962160739665, 'samples': 6804480, 'steps': 35439, 'loss/train': 1.1045030355453491} -08/30/2021 19:37:11 - INFO - __main__ - Step 35441: {'lr': 0.0004396181490078949, 'samples': 6804672, 'steps': 35440, 'loss/train': 0.6782146096229553} -08/30/2021 19:37:12 - INFO - __main__ - Step 35442: {'lr': 0.0004396146905337008, 'samples': 6804864, 'steps': 35441, 'loss/train': 1.210057258605957} -08/30/2021 19:37:12 - INFO - __main__ - Step 35443: {'lr': 0.0004396112319740692, 'samples': 6805056, 'steps': 35442, 'loss/train': 1.6531317234039307} -08/30/2021 19:37:13 - INFO - __main__ - Step 35444: {'lr': 0.0004396077733290017, 'samples': 6805248, 'steps': 35443, 'loss/train': 1.5051201581954956} -08/30/2021 19:37:14 - INFO - __main__ - Step 35445: {'lr': 0.00043960431459849993, 'samples': 6805440, 'steps': 35444, 'loss/train': 1.4708025455474854} -08/30/2021 19:37:14 - INFO - __main__ - Step 35446: {'lr': 0.00043960085578256537, 'samples': 6805632, 'steps': 35445, 'loss/train': 1.2306946516036987} -08/30/2021 19:37:15 - INFO - __main__ - Step 35447: {'lr': 0.0004395973968811995, 'samples': 6805824, 'steps': 35446, 'loss/train': 1.0647679567337036} -08/30/2021 19:37:15 - INFO - __main__ - Step 35448: {'lr': 0.00043959393789440407, 'samples': 6806016, 'steps': 35447, 'loss/train': 1.2634668350219727} -08/30/2021 19:37:15 - INFO - __main__ - Step 35449: {'lr': 0.0004395904788221805, 'samples': 6806208, 'steps': 35448, 'loss/train': 1.3179101943969727} -08/30/2021 19:37:17 - INFO - __main__ - Step 35450: {'lr': 0.00043958701966453033, 'samples': 6806400, 'steps': 35449, 'loss/train': 1.3771743774414062} -08/30/2021 19:37:17 - INFO - __main__ - Step 35451: {'lr': 0.00043958356042145524, 'samples': 6806592, 'steps': 35450, 'loss/train': 1.5681291818618774} -08/30/2021 19:37:18 - INFO - __main__ - Step 35452: {'lr': 0.0004395801010929567, 'samples': 6806784, 'steps': 35451, 'loss/train': 1.4143986701965332} -08/30/2021 19:37:18 - INFO - __main__ - Step 35453: {'lr': 0.0004395766416790363, 'samples': 6806976, 'steps': 35452, 'loss/train': 1.2842624187469482} -08/30/2021 19:37:18 - INFO - __main__ - Step 35454: {'lr': 0.0004395731821796956, 'samples': 6807168, 'steps': 35453, 'loss/train': 1.5339900255203247} -08/30/2021 19:37:20 - INFO - __main__ - Step 35455: {'lr': 0.00043956972259493615, 'samples': 6807360, 'steps': 35454, 'loss/train': 1.3370405435562134} -08/30/2021 19:37:20 - INFO - __main__ - Step 35456: {'lr': 0.0004395662629247595, 'samples': 6807552, 'steps': 35455, 'loss/train': 1.2923717498779297} -08/30/2021 19:37:21 - INFO - __main__ - Step 35457: {'lr': 0.0004395628031691672, 'samples': 6807744, 'steps': 35456, 'loss/train': 0.9794766902923584} -08/30/2021 19:37:21 - INFO - __main__ - Step 35458: {'lr': 0.00043955934332816083, 'samples': 6807936, 'steps': 35457, 'loss/train': 1.4066797494888306} -08/30/2021 19:37:21 - INFO - __main__ - Step 35459: {'lr': 0.00043955588340174195, 'samples': 6808128, 'steps': 35458, 'loss/train': 1.0689204931259155} -08/30/2021 19:37:23 - INFO - __main__ - Step 35460: {'lr': 0.00043955242338991217, 'samples': 6808320, 'steps': 35459, 'loss/train': 1.3036293983459473} -08/30/2021 19:37:23 - INFO - __main__ - Step 35461: {'lr': 0.0004395489632926729, 'samples': 6808512, 'steps': 35460, 'loss/train': 1.0542709827423096} -08/30/2021 19:37:24 - INFO - __main__ - Step 35462: {'lr': 0.0004395455031100258, 'samples': 6808704, 'steps': 35461, 'loss/train': 1.4861023426055908} -08/30/2021 19:37:24 - INFO - __main__ - Step 35463: {'lr': 0.0004395420428419725, 'samples': 6808896, 'steps': 35462, 'loss/train': 0.8354753851890564} -08/30/2021 19:37:25 - INFO - __main__ - Step 35464: {'lr': 0.0004395385824885144, 'samples': 6809088, 'steps': 35463, 'loss/train': 1.276066780090332} -08/30/2021 19:37:27 - INFO - __main__ - Step 35465: {'lr': 0.0004395351220496532, 'samples': 6809280, 'steps': 35464, 'loss/train': 2.0710320472717285} -08/30/2021 19:37:27 - INFO - __main__ - Step 35466: {'lr': 0.00043953166152539035, 'samples': 6809472, 'steps': 35465, 'loss/train': 1.3038617372512817} -08/30/2021 19:37:27 - INFO - __main__ - Step 35467: {'lr': 0.00043952820091572753, 'samples': 6809664, 'steps': 35466, 'loss/train': 1.283642292022705} -08/30/2021 19:37:28 - INFO - __main__ - Step 35468: {'lr': 0.0004395247402206662, 'samples': 6809856, 'steps': 35467, 'loss/train': 1.750546932220459} -08/30/2021 19:37:28 - INFO - __main__ - Step 35469: {'lr': 0.0004395212794402079, 'samples': 6810048, 'steps': 35468, 'loss/train': 1.957651138305664} -08/30/2021 19:37:29 - INFO - __main__ - Step 35470: {'lr': 0.00043951781857435424, 'samples': 6810240, 'steps': 35469, 'loss/train': 1.3968238830566406} -08/30/2021 19:37:30 - INFO - __main__ - Step 35471: {'lr': 0.00043951435762310686, 'samples': 6810432, 'steps': 35470, 'loss/train': 1.20931875705719} -08/30/2021 19:37:30 - INFO - __main__ - Step 35472: {'lr': 0.0004395108965864671, 'samples': 6810624, 'steps': 35471, 'loss/train': 1.7945719957351685} -08/30/2021 19:37:31 - INFO - __main__ - Step 35473: {'lr': 0.00043950743546443676, 'samples': 6810816, 'steps': 35472, 'loss/train': 1.374839186668396} -08/30/2021 19:37:31 - INFO - __main__ - Step 35474: {'lr': 0.0004395039742570173, 'samples': 6811008, 'steps': 35473, 'loss/train': 1.3714797496795654} -08/30/2021 19:37:33 - INFO - __main__ - Step 35475: {'lr': 0.00043950051296421023, 'samples': 6811200, 'steps': 35474, 'loss/train': 1.2336626052856445} -08/30/2021 19:37:33 - INFO - __main__ - Step 35476: {'lr': 0.00043949705158601715, 'samples': 6811392, 'steps': 35475, 'loss/train': 0.9487754702568054} -08/30/2021 19:37:33 - INFO - __main__ - Step 35477: {'lr': 0.00043949359012243963, 'samples': 6811584, 'steps': 35476, 'loss/train': 0.9743692278862} -08/30/2021 19:37:34 - INFO - __main__ - Step 35478: {'lr': 0.00043949012857347924, 'samples': 6811776, 'steps': 35477, 'loss/train': 1.6047486066818237} -08/30/2021 19:37:34 - INFO - __main__ - Step 35479: {'lr': 0.0004394866669391375, 'samples': 6811968, 'steps': 35478, 'loss/train': 1.0453120470046997} -08/30/2021 19:37:36 - INFO - __main__ - Step 35480: {'lr': 0.00043948320521941596, 'samples': 6812160, 'steps': 35479, 'loss/train': 1.099510908126831} -08/30/2021 19:37:36 - INFO - __main__ - Step 35481: {'lr': 0.00043947974341431627, 'samples': 6812352, 'steps': 35480, 'loss/train': 1.6088054180145264} -08/30/2021 19:37:36 - INFO - __main__ - Step 35482: {'lr': 0.0004394762815238399, 'samples': 6812544, 'steps': 35481, 'loss/train': 1.281843662261963} -08/30/2021 19:37:37 - INFO - __main__ - Step 35483: {'lr': 0.00043947281954798844, 'samples': 6812736, 'steps': 35482, 'loss/train': 1.0731096267700195} -08/30/2021 19:37:37 - INFO - __main__ - Step 35484: {'lr': 0.0004394693574867635, 'samples': 6812928, 'steps': 35483, 'loss/train': 1.6933749914169312} -08/30/2021 19:37:37 - INFO - __main__ - Step 35485: {'lr': 0.0004394658953401666, 'samples': 6813120, 'steps': 35484, 'loss/train': 1.4031773805618286} -08/30/2021 19:37:39 - INFO - __main__ - Step 35486: {'lr': 0.0004394624331081992, 'samples': 6813312, 'steps': 35485, 'loss/train': 1.0322613716125488} -08/30/2021 19:37:39 - INFO - __main__ - Step 35487: {'lr': 0.00043945897079086295, 'samples': 6813504, 'steps': 35486, 'loss/train': 1.3490275144577026} -08/30/2021 19:37:40 - INFO - __main__ - Step 35488: {'lr': 0.00043945550838815953, 'samples': 6813696, 'steps': 35487, 'loss/train': 1.5497703552246094} -08/30/2021 19:37:40 - INFO - __main__ - Step 35489: {'lr': 0.00043945204590009027, 'samples': 6813888, 'steps': 35488, 'loss/train': 2.1221632957458496} -08/30/2021 19:37:40 - INFO - __main__ - Step 35490: {'lr': 0.0004394485833266569, 'samples': 6814080, 'steps': 35489, 'loss/train': 1.2926548719406128} -08/30/2021 19:37:42 - INFO - __main__ - Step 35491: {'lr': 0.0004394451206678609, 'samples': 6814272, 'steps': 35490, 'loss/train': 1.2890409231185913} -08/30/2021 19:37:42 - INFO - __main__ - Step 35492: {'lr': 0.00043944165792370385, 'samples': 6814464, 'steps': 35491, 'loss/train': 1.413093090057373} -08/30/2021 19:37:43 - INFO - __main__ - Step 35493: {'lr': 0.00043943819509418723, 'samples': 6814656, 'steps': 35492, 'loss/train': 1.5966626405715942} -08/30/2021 19:37:43 - INFO - __main__ - Step 35494: {'lr': 0.00043943473217931283, 'samples': 6814848, 'steps': 35493, 'loss/train': 1.3935346603393555} -08/30/2021 19:37:43 - INFO - __main__ - Step 35495: {'lr': 0.0004394312691790821, 'samples': 6815040, 'steps': 35494, 'loss/train': 1.2111256122589111} -08/30/2021 19:37:45 - INFO - __main__ - Step 35496: {'lr': 0.00043942780609349636, 'samples': 6815232, 'steps': 35495, 'loss/train': 1.3922882080078125} -08/30/2021 19:37:45 - INFO - __main__ - Step 35497: {'lr': 0.0004394243429225575, 'samples': 6815424, 'steps': 35496, 'loss/train': 1.4599941968917847} -08/30/2021 19:37:46 - INFO - __main__ - Step 35498: {'lr': 0.0004394208796662669, 'samples': 6815616, 'steps': 35497, 'loss/train': 1.6065566539764404} -08/30/2021 19:37:46 - INFO - __main__ - Step 35499: {'lr': 0.00043941741632462625, 'samples': 6815808, 'steps': 35498, 'loss/train': 1.4144123792648315} -08/30/2021 19:37:46 - INFO - __main__ - Step 35500: {'lr': 0.000439413952897637, 'samples': 6816000, 'steps': 35499, 'loss/train': 1.3598979711532593} -08/30/2021 19:37:48 - INFO - __main__ - Step 35501: {'lr': 0.0004394104893853007, 'samples': 6816192, 'steps': 35500, 'loss/train': 1.4200773239135742} -08/30/2021 19:37:49 - INFO - __main__ - Step 35502: {'lr': 0.00043940702578761906, 'samples': 6816384, 'steps': 35501, 'loss/train': 1.4697645902633667} -08/30/2021 19:37:49 - INFO - __main__ - Step 35503: {'lr': 0.00043940356210459344, 'samples': 6816576, 'steps': 35502, 'loss/train': 1.477472186088562} -08/30/2021 19:37:49 - INFO - __main__ - Step 35504: {'lr': 0.0004394000983362255, 'samples': 6816768, 'steps': 35503, 'loss/train': 1.402300477027893} -08/30/2021 19:37:50 - INFO - __main__ - Step 35505: {'lr': 0.0004393966344825168, 'samples': 6816960, 'steps': 35504, 'loss/train': 1.4279059171676636} -08/30/2021 19:37:51 - INFO - __main__ - Step 35506: {'lr': 0.00043939317054346894, 'samples': 6817152, 'steps': 35505, 'loss/train': 0.35592007637023926} -08/30/2021 19:37:52 - INFO - __main__ - Step 35507: {'lr': 0.00043938970651908346, 'samples': 6817344, 'steps': 35506, 'loss/train': 1.366572618484497} -08/30/2021 19:37:52 - INFO - __main__ - Step 35508: {'lr': 0.0004393862424093619, 'samples': 6817536, 'steps': 35507, 'loss/train': 0.6412873268127441} -08/30/2021 19:37:52 - INFO - __main__ - Step 35509: {'lr': 0.0004393827782143057, 'samples': 6817728, 'steps': 35508, 'loss/train': 1.8807237148284912} -08/30/2021 19:37:53 - INFO - __main__ - Step 35510: {'lr': 0.00043937931393391667, 'samples': 6817920, 'steps': 35509, 'loss/train': 0.8151328563690186} -08/30/2021 19:37:54 - INFO - __main__ - Step 35511: {'lr': 0.0004393758495681962, 'samples': 6818112, 'steps': 35510, 'loss/train': 1.8052244186401367} -08/30/2021 19:37:55 - INFO - __main__ - Step 35512: {'lr': 0.0004393723851171459, 'samples': 6818304, 'steps': 35511, 'loss/train': 1.8337180614471436} -08/30/2021 19:37:55 - INFO - __main__ - Step 35513: {'lr': 0.0004393689205807673, 'samples': 6818496, 'steps': 35512, 'loss/train': 1.5067464113235474} -08/30/2021 19:37:55 - INFO - __main__ - Step 35514: {'lr': 0.00043936545595906206, 'samples': 6818688, 'steps': 35513, 'loss/train': 4.344979286193848} -08/30/2021 19:37:56 - INFO - __main__ - Step 35515: {'lr': 0.00043936199125203156, 'samples': 6818880, 'steps': 35514, 'loss/train': 0.9031326770782471} -08/30/2021 19:37:57 - INFO - __main__ - Step 35516: {'lr': 0.00043935852645967755, 'samples': 6819072, 'steps': 35515, 'loss/train': 1.792057752609253} -08/30/2021 19:37:57 - INFO - __main__ - Step 35517: {'lr': 0.00043935506158200143, 'samples': 6819264, 'steps': 35516, 'loss/train': 1.351317286491394} -08/30/2021 19:37:58 - INFO - __main__ - Step 35518: {'lr': 0.000439351596619005, 'samples': 6819456, 'steps': 35517, 'loss/train': 1.123411774635315} -08/30/2021 19:37:58 - INFO - __main__ - Step 35519: {'lr': 0.00043934813157068956, 'samples': 6819648, 'steps': 35518, 'loss/train': 1.02517569065094} -08/30/2021 19:37:59 - INFO - __main__ - Step 35520: {'lr': 0.00043934466643705673, 'samples': 6819840, 'steps': 35519, 'loss/train': 0.5735183954238892} -08/30/2021 19:38:00 - INFO - __main__ - Step 35521: {'lr': 0.00043934120121810814, 'samples': 6820032, 'steps': 35520, 'loss/train': 1.282111644744873} -08/30/2021 19:38:01 - INFO - __main__ - Step 35522: {'lr': 0.0004393377359138454, 'samples': 6820224, 'steps': 35521, 'loss/train': 1.5309820175170898} -08/30/2021 19:38:01 - INFO - __main__ - Step 35523: {'lr': 0.00043933427052426986, 'samples': 6820416, 'steps': 35522, 'loss/train': 1.2699809074401855} -08/30/2021 19:38:02 - INFO - __main__ - Step 35524: {'lr': 0.00043933080504938337, 'samples': 6820608, 'steps': 35523, 'loss/train': 1.2430779933929443} -08/30/2021 19:38:02 - INFO - __main__ - Step 35525: {'lr': 0.00043932733948918724, 'samples': 6820800, 'steps': 35524, 'loss/train': 1.4439725875854492} -08/30/2021 19:38:03 - INFO - __main__ - Step 35526: {'lr': 0.0004393238738436832, 'samples': 6820992, 'steps': 35525, 'loss/train': 1.9710932970046997} -08/30/2021 19:38:04 - INFO - __main__ - Step 35527: {'lr': 0.00043932040811287264, 'samples': 6821184, 'steps': 35526, 'loss/train': 1.4086105823516846} -08/30/2021 19:38:04 - INFO - __main__ - Step 35528: {'lr': 0.0004393169422967573, 'samples': 6821376, 'steps': 35527, 'loss/train': 1.0004055500030518} -08/30/2021 19:38:05 - INFO - __main__ - Step 35529: {'lr': 0.0004393134763953387, 'samples': 6821568, 'steps': 35528, 'loss/train': 0.9425281286239624} -08/30/2021 19:38:05 - INFO - __main__ - Step 35530: {'lr': 0.00043931001040861835, 'samples': 6821760, 'steps': 35529, 'loss/train': 1.9139232635498047} -08/30/2021 19:38:06 - INFO - __main__ - Step 35531: {'lr': 0.00043930654433659775, 'samples': 6821952, 'steps': 35530, 'loss/train': 1.7550944089889526} -08/30/2021 19:38:07 - INFO - __main__ - Step 35532: {'lr': 0.0004393030781792787, 'samples': 6822144, 'steps': 35531, 'loss/train': 1.1504539251327515} -08/30/2021 19:38:07 - INFO - __main__ - Step 35533: {'lr': 0.00043929961193666246, 'samples': 6822336, 'steps': 35532, 'loss/train': 1.4087321758270264} -08/30/2021 19:38:08 - INFO - __main__ - Step 35534: {'lr': 0.0004392961456087508, 'samples': 6822528, 'steps': 35533, 'loss/train': 0.4733916223049164} -08/30/2021 19:38:08 - INFO - __main__ - Step 35535: {'lr': 0.00043929267919554516, 'samples': 6822720, 'steps': 35534, 'loss/train': 1.3361679315567017} -08/30/2021 19:38:08 - INFO - __main__ - Step 35536: {'lr': 0.00043928921269704725, 'samples': 6822912, 'steps': 35535, 'loss/train': 1.0247011184692383} -08/30/2021 19:38:10 - INFO - __main__ - Step 35537: {'lr': 0.00043928574611325845, 'samples': 6823104, 'steps': 35536, 'loss/train': 1.9099128246307373} -08/30/2021 19:38:10 - INFO - __main__ - Step 35538: {'lr': 0.00043928227944418046, 'samples': 6823296, 'steps': 35537, 'loss/train': 0.7634215354919434} -08/30/2021 19:38:11 - INFO - __main__ - Step 35539: {'lr': 0.00043927881268981484, 'samples': 6823488, 'steps': 35538, 'loss/train': 1.7309541702270508} -08/30/2021 19:38:11 - INFO - __main__ - Step 35540: {'lr': 0.00043927534585016305, 'samples': 6823680, 'steps': 35539, 'loss/train': 1.7048053741455078} -08/30/2021 19:38:11 - INFO - __main__ - Step 35541: {'lr': 0.0004392718789252267, 'samples': 6823872, 'steps': 35540, 'loss/train': 1.5013402700424194} -08/30/2021 19:38:13 - INFO - __main__ - Step 35542: {'lr': 0.0004392684119150074, 'samples': 6824064, 'steps': 35541, 'loss/train': 1.8228617906570435} -08/30/2021 19:38:13 - INFO - __main__ - Step 35543: {'lr': 0.0004392649448195066, 'samples': 6824256, 'steps': 35542, 'loss/train': 1.3826454877853394} -08/30/2021 19:38:14 - INFO - __main__ - Step 35544: {'lr': 0.000439261477638726, 'samples': 6824448, 'steps': 35543, 'loss/train': 1.5281010866165161} -08/30/2021 19:38:14 - INFO - __main__ - Step 35545: {'lr': 0.0004392580103726671, 'samples': 6824640, 'steps': 35544, 'loss/train': 2.0254573822021484} -08/30/2021 19:38:14 - INFO - __main__ - Step 35546: {'lr': 0.0004392545430213315, 'samples': 6824832, 'steps': 35545, 'loss/train': 1.2443621158599854} -08/30/2021 19:38:16 - INFO - __main__ - Step 35547: {'lr': 0.00043925107558472065, 'samples': 6825024, 'steps': 35546, 'loss/train': 0.5305963754653931} -08/30/2021 19:38:16 - INFO - __main__ - Step 35548: {'lr': 0.0004392476080628363, 'samples': 6825216, 'steps': 35547, 'loss/train': 0.9291126728057861} -08/30/2021 19:38:17 - INFO - __main__ - Step 35549: {'lr': 0.00043924414045567973, 'samples': 6825408, 'steps': 35548, 'loss/train': 1.429993748664856} -08/30/2021 19:38:17 - INFO - __main__ - Step 35550: {'lr': 0.00043924067276325274, 'samples': 6825600, 'steps': 35549, 'loss/train': 0.35420963168144226} -08/30/2021 19:38:18 - INFO - __main__ - Step 35551: {'lr': 0.0004392372049855569, 'samples': 6825792, 'steps': 35550, 'loss/train': 1.6251249313354492} -08/30/2021 19:38:19 - INFO - __main__ - Step 35552: {'lr': 0.0004392337371225936, 'samples': 6825984, 'steps': 35551, 'loss/train': 1.0503017902374268} -08/30/2021 19:38:19 - INFO - __main__ - Step 35553: {'lr': 0.0004392302691743645, 'samples': 6826176, 'steps': 35552, 'loss/train': 0.13708476722240448} -08/30/2021 19:38:20 - INFO - __main__ - Step 35554: {'lr': 0.0004392268011408712, 'samples': 6826368, 'steps': 35553, 'loss/train': 1.3462666273117065} -08/30/2021 19:38:20 - INFO - __main__ - Step 35555: {'lr': 0.0004392233330221152, 'samples': 6826560, 'steps': 35554, 'loss/train': 1.2558846473693848} -08/30/2021 19:38:21 - INFO - __main__ - Step 35556: {'lr': 0.0004392198648180981, 'samples': 6826752, 'steps': 35555, 'loss/train': 0.604512095451355} -08/30/2021 19:38:22 - INFO - __main__ - Step 35557: {'lr': 0.0004392163965288215, 'samples': 6826944, 'steps': 35556, 'loss/train': 1.3461673259735107} -08/30/2021 19:38:23 - INFO - __main__ - Step 35558: {'lr': 0.0004392129281542868, 'samples': 6827136, 'steps': 35557, 'loss/train': 1.3256924152374268} -08/30/2021 19:38:23 - INFO - __main__ - Step 35559: {'lr': 0.00043920945969449577, 'samples': 6827328, 'steps': 35558, 'loss/train': 1.069580078125} -08/30/2021 19:38:23 - INFO - __main__ - Step 35560: {'lr': 0.0004392059911494498, 'samples': 6827520, 'steps': 35559, 'loss/train': 1.2970229387283325} -08/30/2021 19:38:24 - INFO - __main__ - Step 35561: {'lr': 0.0004392025225191506, 'samples': 6827712, 'steps': 35560, 'loss/train': 1.1350421905517578} -08/30/2021 19:38:24 - INFO - __main__ - Step 35562: {'lr': 0.0004391990538035996, 'samples': 6827904, 'steps': 35561, 'loss/train': 1.411685585975647} -08/30/2021 19:38:26 - INFO - __main__ - Step 35563: {'lr': 0.00043919558500279845, 'samples': 6828096, 'steps': 35562, 'loss/train': 1.0079528093338013} -08/30/2021 19:38:26 - INFO - __main__ - Step 35564: {'lr': 0.0004391921161167487, 'samples': 6828288, 'steps': 35563, 'loss/train': 1.3235201835632324} -08/30/2021 19:38:26 - INFO - __main__ - Step 35565: {'lr': 0.00043918864714545194, 'samples': 6828480, 'steps': 35564, 'loss/train': 1.5277256965637207} -08/30/2021 19:38:27 - INFO - __main__ - Step 35566: {'lr': 0.00043918517808890964, 'samples': 6828672, 'steps': 35565, 'loss/train': 1.6159189939498901} -08/30/2021 19:38:27 - INFO - __main__ - Step 35567: {'lr': 0.0004391817089471234, 'samples': 6828864, 'steps': 35566, 'loss/train': 1.0270401239395142} -08/30/2021 19:38:29 - INFO - __main__ - Step 35568: {'lr': 0.0004391782397200949, 'samples': 6829056, 'steps': 35567, 'loss/train': 1.0426150560379028} -08/30/2021 19:38:29 - INFO - __main__ - Step 35569: {'lr': 0.0004391747704078255, 'samples': 6829248, 'steps': 35568, 'loss/train': 1.212659478187561} -08/30/2021 19:38:29 - INFO - __main__ - Step 35570: {'lr': 0.0004391713010103169, 'samples': 6829440, 'steps': 35569, 'loss/train': 1.590492844581604} -08/30/2021 19:38:30 - INFO - __main__ - Step 35571: {'lr': 0.0004391678315275706, 'samples': 6829632, 'steps': 35570, 'loss/train': 1.5762189626693726} -08/30/2021 19:38:30 - INFO - __main__ - Step 35572: {'lr': 0.00043916436195958825, 'samples': 6829824, 'steps': 35571, 'loss/train': 1.54468834400177} -08/30/2021 19:38:32 - INFO - __main__ - Step 35573: {'lr': 0.00043916089230637133, 'samples': 6830016, 'steps': 35572, 'loss/train': 1.7828104496002197} -08/30/2021 19:38:32 - INFO - __main__ - Step 35574: {'lr': 0.0004391574225679215, 'samples': 6830208, 'steps': 35573, 'loss/train': 1.7065386772155762} -08/30/2021 19:38:33 - INFO - __main__ - Step 35575: {'lr': 0.0004391539527442401, 'samples': 6830400, 'steps': 35574, 'loss/train': 0.7366040349006653} -08/30/2021 19:38:33 - INFO - __main__ - Step 35576: {'lr': 0.000439150482835329, 'samples': 6830592, 'steps': 35575, 'loss/train': 1.237656593322754} -08/30/2021 19:38:33 - INFO - __main__ - Step 35577: {'lr': 0.0004391470128411895, 'samples': 6830784, 'steps': 35576, 'loss/train': 1.1078851222991943} -08/30/2021 19:38:35 - INFO - __main__ - Step 35578: {'lr': 0.00043914354276182335, 'samples': 6830976, 'steps': 35577, 'loss/train': 1.0219086408615112} -08/30/2021 19:38:36 - INFO - __main__ - Step 35579: {'lr': 0.00043914007259723196, 'samples': 6831168, 'steps': 35578, 'loss/train': 1.4273958206176758} -08/30/2021 19:38:36 - INFO - __main__ - Step 35580: {'lr': 0.000439136602347417, 'samples': 6831360, 'steps': 35579, 'loss/train': 1.1936569213867188} -08/30/2021 19:38:36 - INFO - __main__ - Step 35581: {'lr': 0.00043913313201238017, 'samples': 6831552, 'steps': 35580, 'loss/train': 0.10602215677499771} -08/30/2021 19:38:37 - INFO - __main__ - Step 35582: {'lr': 0.00043912966159212263, 'samples': 6831744, 'steps': 35581, 'loss/train': 1.244699239730835} -08/30/2021 19:38:38 - INFO - __main__ - Step 35583: {'lr': 0.0004391261910866463, 'samples': 6831936, 'steps': 35582, 'loss/train': 1.4847512245178223} -08/30/2021 19:38:39 - INFO - __main__ - Step 35584: {'lr': 0.0004391227204959526, 'samples': 6832128, 'steps': 35583, 'loss/train': 1.280083179473877} -08/30/2021 19:38:39 - INFO - __main__ - Step 35585: {'lr': 0.00043911924982004315, 'samples': 6832320, 'steps': 35584, 'loss/train': 1.2352662086486816} -08/30/2021 19:38:40 - INFO - __main__ - Step 35586: {'lr': 0.0004391157790589195, 'samples': 6832512, 'steps': 35585, 'loss/train': 1.0446867942810059} -08/30/2021 19:38:40 - INFO - __main__ - Step 35587: {'lr': 0.00043911230821258313, 'samples': 6832704, 'steps': 35586, 'loss/train': 1.8367719650268555} -08/30/2021 19:38:41 - INFO - __main__ - Step 35588: {'lr': 0.00043910883728103575, 'samples': 6832896, 'steps': 35587, 'loss/train': 0.08733471482992172} -08/30/2021 19:38:42 - INFO - __main__ - Step 35589: {'lr': 0.0004391053662642788, 'samples': 6833088, 'steps': 35588, 'loss/train': 1.8498398065567017} -08/30/2021 19:38:42 - INFO - __main__ - Step 35590: {'lr': 0.00043910189516231386, 'samples': 6833280, 'steps': 35589, 'loss/train': 1.3803876638412476} -08/30/2021 19:38:43 - INFO - __main__ - Step 35591: {'lr': 0.00043909842397514255, 'samples': 6833472, 'steps': 35590, 'loss/train': 1.363560438156128} -08/30/2021 19:38:43 - INFO - __main__ - Step 35592: {'lr': 0.00043909495270276646, 'samples': 6833664, 'steps': 35591, 'loss/train': 1.172803282737732} -08/30/2021 19:38:45 - INFO - __main__ - Step 35593: {'lr': 0.00043909148134518703, 'samples': 6833856, 'steps': 35592, 'loss/train': 1.4856820106506348} -08/30/2021 19:38:45 - INFO - __main__ - Step 35594: {'lr': 0.0004390880099024059, 'samples': 6834048, 'steps': 35593, 'loss/train': 2.113456964492798} -08/30/2021 19:38:45 - INFO - __main__ - Step 35595: {'lr': 0.00043908453837442464, 'samples': 6834240, 'steps': 35594, 'loss/train': 1.9697480201721191} -08/30/2021 19:38:46 - INFO - __main__ - Step 35596: {'lr': 0.0004390810667612448, 'samples': 6834432, 'steps': 35595, 'loss/train': 1.910926103591919} -08/30/2021 19:38:46 - INFO - __main__ - Step 35597: {'lr': 0.00043907759506286797, 'samples': 6834624, 'steps': 35596, 'loss/train': 0.06204963102936745} -08/30/2021 19:38:47 - INFO - __main__ - Step 35598: {'lr': 0.00043907412327929575, 'samples': 6834816, 'steps': 35597, 'loss/train': 1.398746132850647} -08/30/2021 19:38:48 - INFO - __main__ - Step 35599: {'lr': 0.00043907065141052953, 'samples': 6835008, 'steps': 35598, 'loss/train': 1.45152747631073} -08/30/2021 19:38:48 - INFO - __main__ - Step 35600: {'lr': 0.00043906717945657104, 'samples': 6835200, 'steps': 35599, 'loss/train': 1.3819210529327393} -08/30/2021 19:38:49 - INFO - __main__ - Step 35601: {'lr': 0.00043906370741742185, 'samples': 6835392, 'steps': 35600, 'loss/train': 1.8691887855529785} -08/30/2021 19:38:49 - INFO - __main__ - Step 35602: {'lr': 0.0004390602352930834, 'samples': 6835584, 'steps': 35601, 'loss/train': 0.9794334173202515} -08/30/2021 19:38:49 - INFO - __main__ - Step 35603: {'lr': 0.00043905676308355734, 'samples': 6835776, 'steps': 35602, 'loss/train': 1.4168742895126343} -08/30/2021 19:38:51 - INFO - __main__ - Step 35604: {'lr': 0.00043905329078884527, 'samples': 6835968, 'steps': 35603, 'loss/train': 1.2644916772842407} -08/30/2021 19:38:52 - INFO - __main__ - Step 35605: {'lr': 0.00043904981840894863, 'samples': 6836160, 'steps': 35604, 'loss/train': 0.6998332738876343} -08/30/2021 19:38:52 - INFO - __main__ - Step 35606: {'lr': 0.0004390463459438691, 'samples': 6836352, 'steps': 35605, 'loss/train': 1.3609315156936646} -08/30/2021 19:38:52 - INFO - __main__ - Step 35607: {'lr': 0.0004390428733936082, 'samples': 6836544, 'steps': 35606, 'loss/train': 0.7326480150222778} -08/30/2021 19:38:53 - INFO - __main__ - Step 35608: {'lr': 0.0004390394007581675, 'samples': 6836736, 'steps': 35607, 'loss/train': 0.12532192468643188} -08/30/2021 19:38:55 - INFO - __main__ - Step 35609: {'lr': 0.00043903592803754856, 'samples': 6836928, 'steps': 35608, 'loss/train': 1.637898325920105} -08/30/2021 19:38:55 - INFO - __main__ - Step 35610: {'lr': 0.00043903245523175296, 'samples': 6837120, 'steps': 35609, 'loss/train': 0.8914738297462463} -08/30/2021 19:38:55 - INFO - __main__ - Step 35611: {'lr': 0.00043902898234078223, 'samples': 6837312, 'steps': 35610, 'loss/train': 1.0995962619781494} -08/30/2021 19:38:56 - INFO - __main__ - Step 35612: {'lr': 0.000439025509364638, 'samples': 6837504, 'steps': 35611, 'loss/train': 1.6563763618469238} -08/30/2021 19:38:56 - INFO - __main__ - Step 35613: {'lr': 0.0004390220363033217, 'samples': 6837696, 'steps': 35612, 'loss/train': 1.5935888290405273} -08/30/2021 19:38:57 - INFO - __main__ - Step 35614: {'lr': 0.0004390185631568351, 'samples': 6837888, 'steps': 35613, 'loss/train': 0.7934514880180359} -08/30/2021 19:38:58 - INFO - __main__ - Step 35615: {'lr': 0.00043901508992517956, 'samples': 6838080, 'steps': 35614, 'loss/train': 1.4886112213134766} -08/30/2021 19:38:58 - INFO - __main__ - Step 35616: {'lr': 0.0004390116166083568, 'samples': 6838272, 'steps': 35615, 'loss/train': 1.094867467880249} -08/30/2021 19:38:59 - INFO - __main__ - Step 35617: {'lr': 0.00043900814320636827, 'samples': 6838464, 'steps': 35616, 'loss/train': 1.63827383518219} -08/30/2021 19:38:59 - INFO - __main__ - Step 35618: {'lr': 0.00043900466971921563, 'samples': 6838656, 'steps': 35617, 'loss/train': 1.4104467630386353} -08/30/2021 19:39:01 - INFO - __main__ - Step 35619: {'lr': 0.00043900119614690043, 'samples': 6838848, 'steps': 35618, 'loss/train': 1.210228443145752} -08/30/2021 19:39:01 - INFO - __main__ - Step 35620: {'lr': 0.00043899772248942413, 'samples': 6839040, 'steps': 35619, 'loss/train': 1.6693419218063354} -08/30/2021 19:39:01 - INFO - __main__ - Step 35621: {'lr': 0.0004389942487467884, 'samples': 6839232, 'steps': 35620, 'loss/train': 1.3732359409332275} -08/30/2021 19:39:02 - INFO - __main__ - Step 35622: {'lr': 0.00043899077491899485, 'samples': 6839424, 'steps': 35621, 'loss/train': 0.9131094217300415} -08/30/2021 19:39:02 - INFO - __main__ - Step 35623: {'lr': 0.0004389873010060449, 'samples': 6839616, 'steps': 35622, 'loss/train': 1.4173331260681152} -08/30/2021 19:39:02 - INFO - __main__ - Step 35624: {'lr': 0.00043898382700794015, 'samples': 6839808, 'steps': 35623, 'loss/train': 0.9711362719535828} -08/30/2021 19:39:04 - INFO - __main__ - Step 35625: {'lr': 0.0004389803529246823, 'samples': 6840000, 'steps': 35624, 'loss/train': 1.642768144607544} -08/30/2021 19:39:05 - INFO - __main__ - Step 35626: {'lr': 0.00043897687875627277, 'samples': 6840192, 'steps': 35625, 'loss/train': 1.5010039806365967} -08/30/2021 19:39:05 - INFO - __main__ - Step 35627: {'lr': 0.00043897340450271317, 'samples': 6840384, 'steps': 35626, 'loss/train': 1.1777400970458984} -08/30/2021 19:39:05 - INFO - __main__ - Step 35628: {'lr': 0.0004389699301640051, 'samples': 6840576, 'steps': 35627, 'loss/train': 1.7789735794067383} -08/30/2021 19:39:06 - INFO - __main__ - Step 35629: {'lr': 0.00043896645574015004, 'samples': 6840768, 'steps': 35628, 'loss/train': 1.2212371826171875} -08/30/2021 19:39:07 - INFO - __main__ - Step 35630: {'lr': 0.00043896298123114965, 'samples': 6840960, 'steps': 35629, 'loss/train': 1.5458974838256836} -08/30/2021 19:39:08 - INFO - __main__ - Step 35631: {'lr': 0.00043895950663700546, 'samples': 6841152, 'steps': 35630, 'loss/train': 1.691313624382019} -08/30/2021 19:39:08 - INFO - __main__ - Step 35632: {'lr': 0.000438956031957719, 'samples': 6841344, 'steps': 35631, 'loss/train': 1.8477039337158203} -08/30/2021 19:39:09 - INFO - __main__ - Step 35633: {'lr': 0.0004389525571932919, 'samples': 6841536, 'steps': 35632, 'loss/train': 1.50918710231781} -08/30/2021 19:39:09 - INFO - __main__ - Step 35634: {'lr': 0.00043894908234372564, 'samples': 6841728, 'steps': 35633, 'loss/train': 1.189761996269226} -08/30/2021 19:39:10 - INFO - __main__ - Step 35635: {'lr': 0.0004389456074090219, 'samples': 6841920, 'steps': 35634, 'loss/train': 0.9537816643714905} -08/30/2021 19:39:11 - INFO - __main__ - Step 35636: {'lr': 0.0004389421323891822, 'samples': 6842112, 'steps': 35635, 'loss/train': 1.7430158853530884} -08/30/2021 19:39:11 - INFO - __main__ - Step 35637: {'lr': 0.000438938657284208, 'samples': 6842304, 'steps': 35636, 'loss/train': 0.8309873342514038} -08/30/2021 19:39:12 - INFO - __main__ - Step 35638: {'lr': 0.000438935182094101, 'samples': 6842496, 'steps': 35637, 'loss/train': 1.4525035619735718} -08/30/2021 19:39:12 - INFO - __main__ - Step 35639: {'lr': 0.0004389317068188628, 'samples': 6842688, 'steps': 35638, 'loss/train': 1.3033227920532227} -08/30/2021 19:39:13 - INFO - __main__ - Step 35640: {'lr': 0.0004389282314584948, 'samples': 6842880, 'steps': 35639, 'loss/train': 0.8959699273109436} -08/30/2021 19:39:14 - INFO - __main__ - Step 35641: {'lr': 0.0004389247560129987, 'samples': 6843072, 'steps': 35640, 'loss/train': 1.357480525970459} -08/30/2021 19:39:14 - INFO - __main__ - Step 35642: {'lr': 0.000438921280482376, 'samples': 6843264, 'steps': 35641, 'loss/train': 1.4794636964797974} -08/30/2021 19:39:15 - INFO - __main__ - Step 35643: {'lr': 0.00043891780486662825, 'samples': 6843456, 'steps': 35642, 'loss/train': 1.3781284093856812} -08/30/2021 19:39:15 - INFO - __main__ - Step 35644: {'lr': 0.00043891432916575714, 'samples': 6843648, 'steps': 35643, 'loss/train': 1.154592514038086} -08/30/2021 19:39:16 - INFO - __main__ - Step 35645: {'lr': 0.0004389108533797641, 'samples': 6843840, 'steps': 35644, 'loss/train': 0.9701963663101196} -08/30/2021 19:39:17 - INFO - __main__ - Step 35646: {'lr': 0.00043890737750865074, 'samples': 6844032, 'steps': 35645, 'loss/train': 3.0385804176330566} -08/30/2021 19:39:17 - INFO - __main__ - Step 35647: {'lr': 0.0004389039015524186, 'samples': 6844224, 'steps': 35646, 'loss/train': 1.477814793586731} -08/30/2021 19:39:17 - INFO - __main__ - Step 35648: {'lr': 0.0004389004255110693, 'samples': 6844416, 'steps': 35647, 'loss/train': 1.7936725616455078} -08/30/2021 19:39:18 - INFO - __main__ - Step 35649: {'lr': 0.0004388969493846044, 'samples': 6844608, 'steps': 35648, 'loss/train': 1.4018914699554443} -08/30/2021 19:39:18 - INFO - __main__ - Step 35650: {'lr': 0.00043889347317302543, 'samples': 6844800, 'steps': 35649, 'loss/train': 1.39692223072052} -08/30/2021 19:39:20 - INFO - __main__ - Step 35651: {'lr': 0.000438889996876334, 'samples': 6844992, 'steps': 35650, 'loss/train': 1.7134805917739868} -08/30/2021 19:39:20 - INFO - __main__ - Step 35652: {'lr': 0.00043888652049453163, 'samples': 6845184, 'steps': 35651, 'loss/train': 1.6207311153411865} -08/30/2021 19:39:20 - INFO - __main__ - Step 35653: {'lr': 0.0004388830440276199, 'samples': 6845376, 'steps': 35652, 'loss/train': 1.9511761665344238} -08/30/2021 19:39:21 - INFO - __main__ - Step 35654: {'lr': 0.0004388795674756004, 'samples': 6845568, 'steps': 35653, 'loss/train': 1.9038118124008179} -08/30/2021 19:39:21 - INFO - __main__ - Step 35655: {'lr': 0.0004388760908384747, 'samples': 6845760, 'steps': 35654, 'loss/train': 1.5171244144439697} -08/30/2021 19:39:23 - INFO - __main__ - Step 35656: {'lr': 0.00043887261411624433, 'samples': 6845952, 'steps': 35655, 'loss/train': 1.7236616611480713} -08/30/2021 19:39:23 - INFO - __main__ - Step 35657: {'lr': 0.00043886913730891087, 'samples': 6846144, 'steps': 35656, 'loss/train': 1.7457900047302246} -08/30/2021 19:39:24 - INFO - __main__ - Step 35658: {'lr': 0.00043886566041647593, 'samples': 6846336, 'steps': 35657, 'loss/train': 2.3147151470184326} -08/30/2021 19:39:24 - INFO - __main__ - Step 35659: {'lr': 0.000438862183438941, 'samples': 6846528, 'steps': 35658, 'loss/train': 1.4650671482086182} -08/30/2021 19:39:24 - INFO - __main__ - Step 35660: {'lr': 0.00043885870637630763, 'samples': 6846720, 'steps': 35659, 'loss/train': 1.3873176574707031} -08/30/2021 19:39:26 - INFO - __main__ - Step 35661: {'lr': 0.00043885522922857757, 'samples': 6846912, 'steps': 35660, 'loss/train': 1.3182965517044067} -08/30/2021 19:39:26 - INFO - __main__ - Step 35662: {'lr': 0.00043885175199575216, 'samples': 6847104, 'steps': 35661, 'loss/train': 1.821889877319336} -08/30/2021 19:39:27 - INFO - __main__ - Step 35663: {'lr': 0.00043884827467783303, 'samples': 6847296, 'steps': 35662, 'loss/train': 1.2539817094802856} -08/30/2021 19:39:27 - INFO - __main__ - Step 35664: {'lr': 0.00043884479727482193, 'samples': 6847488, 'steps': 35663, 'loss/train': 1.7631292343139648} -08/30/2021 19:39:27 - INFO - __main__ - Step 35665: {'lr': 0.00043884131978672014, 'samples': 6847680, 'steps': 35664, 'loss/train': 1.445492148399353} -08/30/2021 19:39:28 - INFO - __main__ - Step 35666: {'lr': 0.00043883784221352947, 'samples': 6847872, 'steps': 35665, 'loss/train': 1.5081000328063965} -08/30/2021 19:39:29 - INFO - __main__ - Step 35667: {'lr': 0.00043883436455525125, 'samples': 6848064, 'steps': 35666, 'loss/train': 1.2931530475616455} -08/30/2021 19:39:30 - INFO - __main__ - Step 35668: {'lr': 0.0004388308868118873, 'samples': 6848256, 'steps': 35667, 'loss/train': 1.7521008253097534} -08/30/2021 19:39:30 - INFO - __main__ - Step 35669: {'lr': 0.00043882740898343905, 'samples': 6848448, 'steps': 35668, 'loss/train': 1.2962530851364136} -08/30/2021 19:39:30 - INFO - __main__ - Step 35670: {'lr': 0.00043882393106990804, 'samples': 6848640, 'steps': 35669, 'loss/train': 1.1387592554092407} -08/30/2021 19:39:31 - INFO - __main__ - Step 35671: {'lr': 0.0004388204530712959, 'samples': 6848832, 'steps': 35670, 'loss/train': 1.1954197883605957} -08/30/2021 19:39:32 - INFO - __main__ - Step 35672: {'lr': 0.0004388169749876042, 'samples': 6849024, 'steps': 35671, 'loss/train': 1.3102842569351196} -08/30/2021 19:39:33 - INFO - __main__ - Step 35673: {'lr': 0.0004388134968188344, 'samples': 6849216, 'steps': 35672, 'loss/train': 1.5865390300750732} -08/30/2021 19:39:33 - INFO - __main__ - Step 35674: {'lr': 0.00043881001856498823, 'samples': 6849408, 'steps': 35673, 'loss/train': 0.9513254165649414} -08/30/2021 19:39:33 - INFO - __main__ - Step 35675: {'lr': 0.0004388065402260672, 'samples': 6849600, 'steps': 35674, 'loss/train': 1.3794844150543213} -08/30/2021 19:39:34 - INFO - __main__ - Step 35676: {'lr': 0.0004388030618020729, 'samples': 6849792, 'steps': 35675, 'loss/train': 1.8563107252120972} -08/30/2021 19:39:35 - INFO - __main__ - Step 35677: {'lr': 0.0004387995832930067, 'samples': 6849984, 'steps': 35676, 'loss/train': 1.1908576488494873} -08/30/2021 19:39:36 - INFO - __main__ - Step 35678: {'lr': 0.00043879610469887043, 'samples': 6850176, 'steps': 35677, 'loss/train': 0.9676467180252075} -08/30/2021 19:39:36 - INFO - __main__ - Step 35679: {'lr': 0.00043879262601966544, 'samples': 6850368, 'steps': 35678, 'loss/train': 1.0132702589035034} -08/30/2021 19:39:37 - INFO - __main__ - Step 35680: {'lr': 0.00043878914725539356, 'samples': 6850560, 'steps': 35679, 'loss/train': 1.7388083934783936} -08/30/2021 19:39:37 - INFO - __main__ - Step 35681: {'lr': 0.00043878566840605606, 'samples': 6850752, 'steps': 35680, 'loss/train': 1.4481080770492554} -08/30/2021 19:39:37 - INFO - __main__ - Step 35682: {'lr': 0.0004387821894716547, 'samples': 6850944, 'steps': 35681, 'loss/train': 1.6208693981170654} -08/30/2021 19:39:39 - INFO - __main__ - Step 35683: {'lr': 0.000438778710452191, 'samples': 6851136, 'steps': 35682, 'loss/train': 1.1175706386566162} -08/30/2021 19:39:40 - INFO - __main__ - Step 35684: {'lr': 0.00043877523134766664, 'samples': 6851328, 'steps': 35683, 'loss/train': 0.6959826946258545} -08/30/2021 19:39:40 - INFO - __main__ - Step 35685: {'lr': 0.0004387717521580829, 'samples': 6851520, 'steps': 35684, 'loss/train': 1.755468726158142} -08/30/2021 19:39:41 - INFO - __main__ - Step 35686: {'lr': 0.00043876827288344156, 'samples': 6851712, 'steps': 35685, 'loss/train': 1.4296605587005615} -08/30/2021 19:39:41 - INFO - __main__ - Step 35687: {'lr': 0.00043876479352374423, 'samples': 6851904, 'steps': 35686, 'loss/train': 0.0532398484647274} -08/30/2021 19:39:42 - INFO - __main__ - Step 35688: {'lr': 0.00043876131407899233, 'samples': 6852096, 'steps': 35687, 'loss/train': 1.791062593460083} -08/30/2021 19:39:43 - INFO - __main__ - Step 35689: {'lr': 0.00043875783454918753, 'samples': 6852288, 'steps': 35688, 'loss/train': 1.7844648361206055} -08/30/2021 19:39:43 - INFO - __main__ - Step 35690: {'lr': 0.00043875435493433135, 'samples': 6852480, 'steps': 35689, 'loss/train': 1.4128694534301758} -08/30/2021 19:39:44 - INFO - __main__ - Step 35691: {'lr': 0.00043875087523442537, 'samples': 6852672, 'steps': 35690, 'loss/train': 1.6357346773147583} -08/30/2021 19:39:44 - INFO - __main__ - Step 35692: {'lr': 0.0004387473954494712, 'samples': 6852864, 'steps': 35691, 'loss/train': 1.2960482835769653} -08/30/2021 19:39:45 - INFO - __main__ - Step 35693: {'lr': 0.00043874391557947027, 'samples': 6853056, 'steps': 35692, 'loss/train': 1.777909517288208} -08/30/2021 19:39:46 - INFO - __main__ - Step 35694: {'lr': 0.0004387404356244243, 'samples': 6853248, 'steps': 35693, 'loss/train': 1.472602128982544} -08/30/2021 19:39:46 - INFO - __main__ - Step 35695: {'lr': 0.0004387369555843348, 'samples': 6853440, 'steps': 35694, 'loss/train': 1.805136799812317} -08/30/2021 19:39:47 - INFO - __main__ - Step 35696: {'lr': 0.00043873347545920333, 'samples': 6853632, 'steps': 35695, 'loss/train': 1.1814404726028442} -08/30/2021 19:39:47 - INFO - __main__ - Step 35697: {'lr': 0.00043872999524903147, 'samples': 6853824, 'steps': 35696, 'loss/train': 1.2362682819366455} -08/30/2021 19:39:48 - INFO - __main__ - Step 35698: {'lr': 0.00043872651495382076, 'samples': 6854016, 'steps': 35697, 'loss/train': 1.357146978378296} -08/30/2021 19:39:49 - INFO - __main__ - Step 35699: {'lr': 0.00043872303457357287, 'samples': 6854208, 'steps': 35698, 'loss/train': 1.2132716178894043} -08/30/2021 19:39:49 - INFO - __main__ - Step 35700: {'lr': 0.0004387195541082892, 'samples': 6854400, 'steps': 35699, 'loss/train': 1.2962244749069214} -08/30/2021 19:39:50 - INFO - __main__ - Step 35701: {'lr': 0.0004387160735579715, 'samples': 6854592, 'steps': 35700, 'loss/train': 1.7019201517105103} -08/30/2021 19:39:50 - INFO - __main__ - Step 35702: {'lr': 0.0004387125929226212, 'samples': 6854784, 'steps': 35701, 'loss/train': 1.5078734159469604} -08/30/2021 19:39:51 - INFO - __main__ - Step 35703: {'lr': 0.00043870911220224, 'samples': 6854976, 'steps': 35702, 'loss/train': 0.39509594440460205} -08/30/2021 19:39:52 - INFO - __main__ - Step 35704: {'lr': 0.0004387056313968293, 'samples': 6855168, 'steps': 35703, 'loss/train': 1.2451130151748657} -08/30/2021 19:39:52 - INFO - __main__ - Step 35705: {'lr': 0.00043870215050639073, 'samples': 6855360, 'steps': 35704, 'loss/train': 1.6831550598144531} -08/30/2021 19:39:53 - INFO - __main__ - Step 35706: {'lr': 0.00043869866953092593, 'samples': 6855552, 'steps': 35705, 'loss/train': 1.6268436908721924} -08/30/2021 19:39:53 - INFO - __main__ - Step 35707: {'lr': 0.00043869518847043643, 'samples': 6855744, 'steps': 35706, 'loss/train': 1.4169487953186035} -08/30/2021 19:39:55 - INFO - __main__ - Step 35708: {'lr': 0.0004386917073249237, 'samples': 6855936, 'steps': 35707, 'loss/train': 0.739641547203064} -08/30/2021 19:39:56 - INFO - __main__ - Step 35709: {'lr': 0.00043868822609438953, 'samples': 6856128, 'steps': 35708, 'loss/train': 0.949308454990387} -08/30/2021 19:39:56 - INFO - __main__ - Step 35710: {'lr': 0.00043868474477883523, 'samples': 6856320, 'steps': 35709, 'loss/train': 0.5304680466651917} -08/30/2021 19:39:56 - INFO - __main__ - Step 35711: {'lr': 0.0004386812633782626, 'samples': 6856512, 'steps': 35710, 'loss/train': 0.6883789300918579} -08/30/2021 19:39:57 - INFO - __main__ - Step 35712: {'lr': 0.00043867778189267306, 'samples': 6856704, 'steps': 35711, 'loss/train': 3.0548501014709473} -08/30/2021 19:39:57 - INFO - __main__ - Step 35713: {'lr': 0.0004386743003220682, 'samples': 6856896, 'steps': 35712, 'loss/train': 0.6495181322097778} -08/30/2021 19:39:58 - INFO - __main__ - Step 35714: {'lr': 0.0004386708186664496, 'samples': 6857088, 'steps': 35713, 'loss/train': 1.6035770177841187} -08/30/2021 19:39:59 - INFO - __main__ - Step 35715: {'lr': 0.00043866733692581896, 'samples': 6857280, 'steps': 35714, 'loss/train': 1.4421180486679077} -08/30/2021 19:39:59 - INFO - __main__ - Step 35716: {'lr': 0.0004386638551001777, 'samples': 6857472, 'steps': 35715, 'loss/train': 1.022769570350647} -08/30/2021 19:39:59 - INFO - __main__ - Step 35717: {'lr': 0.00043866037318952735, 'samples': 6857664, 'steps': 35716, 'loss/train': 1.398125171661377} -08/30/2021 19:40:00 - INFO - __main__ - Step 35718: {'lr': 0.0004386568911938695, 'samples': 6857856, 'steps': 35717, 'loss/train': 1.2186522483825684} -08/30/2021 19:40:01 - INFO - __main__ - Step 35719: {'lr': 0.0004386534091132059, 'samples': 6858048, 'steps': 35718, 'loss/train': 1.1770780086517334} -08/30/2021 19:40:02 - INFO - __main__ - Step 35720: {'lr': 0.0004386499269475379, 'samples': 6858240, 'steps': 35719, 'loss/train': 1.588206171989441} -08/30/2021 19:40:02 - INFO - __main__ - Step 35721: {'lr': 0.00043864644469686717, 'samples': 6858432, 'steps': 35720, 'loss/train': 1.0388907194137573} -08/30/2021 19:40:02 - INFO - __main__ - Step 35722: {'lr': 0.0004386429623611953, 'samples': 6858624, 'steps': 35721, 'loss/train': 0.9350224733352661} -08/30/2021 19:40:03 - INFO - __main__ - Step 35723: {'lr': 0.0004386394799405238, 'samples': 6858816, 'steps': 35722, 'loss/train': 1.7079821825027466} -08/30/2021 19:40:05 - INFO - __main__ - Step 35724: {'lr': 0.00043863599743485416, 'samples': 6859008, 'steps': 35723, 'loss/train': 2.0020370483398438} -08/30/2021 19:40:05 - INFO - __main__ - Step 35725: {'lr': 0.0004386325148441882, 'samples': 6859200, 'steps': 35724, 'loss/train': 0.5875958800315857} -08/30/2021 19:40:06 - INFO - __main__ - Step 35726: {'lr': 0.00043862903216852723, 'samples': 6859392, 'steps': 35725, 'loss/train': 1.4427247047424316} -08/30/2021 19:40:06 - INFO - __main__ - Step 35727: {'lr': 0.00043862554940787303, 'samples': 6859584, 'steps': 35726, 'loss/train': 1.0599899291992188} -08/30/2021 19:40:07 - INFO - __main__ - Step 35728: {'lr': 0.000438622066562227, 'samples': 6859776, 'steps': 35727, 'loss/train': 0.7915924191474915} -08/30/2021 19:40:07 - INFO - __main__ - Step 35729: {'lr': 0.0004386185836315908, 'samples': 6859968, 'steps': 35728, 'loss/train': 1.872920036315918} -08/30/2021 19:40:08 - INFO - __main__ - Step 35730: {'lr': 0.0004386151006159659, 'samples': 6860160, 'steps': 35729, 'loss/train': 1.6561102867126465} -08/30/2021 19:40:09 - INFO - __main__ - Step 35731: {'lr': 0.00043861161751535406, 'samples': 6860352, 'steps': 35730, 'loss/train': 1.4359028339385986} -08/30/2021 19:40:09 - INFO - __main__ - Step 35732: {'lr': 0.0004386081343297567, 'samples': 6860544, 'steps': 35731, 'loss/train': 0.752839982509613} -08/30/2021 19:40:10 - INFO - __main__ - Step 35733: {'lr': 0.0004386046510591754, 'samples': 6860736, 'steps': 35732, 'loss/train': 1.461084246635437} -08/30/2021 19:40:10 - INFO - __main__ - Step 35734: {'lr': 0.0004386011677036118, 'samples': 6860928, 'steps': 35733, 'loss/train': 1.8140510320663452} -08/30/2021 19:40:12 - INFO - __main__ - Step 35735: {'lr': 0.00043859768426306737, 'samples': 6861120, 'steps': 35734, 'loss/train': 1.5535871982574463} -08/30/2021 19:40:13 - INFO - __main__ - Step 35736: {'lr': 0.00043859420073754377, 'samples': 6861312, 'steps': 35735, 'loss/train': 1.768283724784851} -08/30/2021 19:40:13 - INFO - __main__ - Step 35737: {'lr': 0.0004385907171270425, 'samples': 6861504, 'steps': 35736, 'loss/train': 1.4834998846054077} -08/30/2021 19:40:13 - INFO - __main__ - Step 35738: {'lr': 0.00043858723343156514, 'samples': 6861696, 'steps': 35737, 'loss/train': 0.43895164132118225} -08/30/2021 19:40:14 - INFO - __main__ - Step 35739: {'lr': 0.00043858374965111336, 'samples': 6861888, 'steps': 35738, 'loss/train': 1.659919023513794} -08/30/2021 19:40:15 - INFO - __main__ - Step 35740: {'lr': 0.00043858026578568864, 'samples': 6862080, 'steps': 35739, 'loss/train': 1.2154282331466675} -08/30/2021 19:40:16 - INFO - __main__ - Step 35741: {'lr': 0.00043857678183529256, 'samples': 6862272, 'steps': 35740, 'loss/train': 0.04095795005559921} -08/30/2021 19:40:16 - INFO - __main__ - Step 35742: {'lr': 0.0004385732977999266, 'samples': 6862464, 'steps': 35741, 'loss/train': 0.859963595867157} -08/30/2021 19:40:16 - INFO - __main__ - Step 35743: {'lr': 0.0004385698136795926, 'samples': 6862656, 'steps': 35742, 'loss/train': 1.576748013496399} -08/30/2021 19:40:17 - INFO - __main__ - Step 35744: {'lr': 0.00043856632947429175, 'samples': 6862848, 'steps': 35743, 'loss/train': 1.3742958307266235} -08/30/2021 19:40:18 - INFO - __main__ - Step 35745: {'lr': 0.00043856284518402594, 'samples': 6863040, 'steps': 35744, 'loss/train': 1.1338467597961426} -08/30/2021 19:40:19 - INFO - __main__ - Step 35746: {'lr': 0.00043855936080879667, 'samples': 6863232, 'steps': 35745, 'loss/train': 1.1429330110549927} -08/30/2021 19:40:19 - INFO - __main__ - Step 35747: {'lr': 0.0004385558763486053, 'samples': 6863424, 'steps': 35746, 'loss/train': 0.5309433937072754} -08/30/2021 19:40:19 - INFO - __main__ - Step 35748: {'lr': 0.00043855239180345376, 'samples': 6863616, 'steps': 35747, 'loss/train': 1.1584179401397705} -08/30/2021 19:40:20 - INFO - __main__ - Step 35749: {'lr': 0.00043854890717334326, 'samples': 6863808, 'steps': 35748, 'loss/train': 1.578368067741394} -08/30/2021 19:40:20 - INFO - __main__ - Step 35750: {'lr': 0.00043854542245827554, 'samples': 6864000, 'steps': 35749, 'loss/train': 2.151776075363159} -08/30/2021 19:40:22 - INFO - __main__ - Step 35751: {'lr': 0.00043854193765825223, 'samples': 6864192, 'steps': 35750, 'loss/train': 1.8846768140792847} -08/30/2021 19:40:22 - INFO - __main__ - Step 35752: {'lr': 0.00043853845277327485, 'samples': 6864384, 'steps': 35751, 'loss/train': 0.6006564497947693} -08/30/2021 19:40:22 - INFO - __main__ - Step 35753: {'lr': 0.0004385349678033449, 'samples': 6864576, 'steps': 35752, 'loss/train': 1.1803851127624512} -08/30/2021 19:40:23 - INFO - __main__ - Step 35754: {'lr': 0.000438531482748464, 'samples': 6864768, 'steps': 35753, 'loss/train': 1.5470081567764282} -08/30/2021 19:40:24 - INFO - __main__ - Step 35755: {'lr': 0.00043852799760863375, 'samples': 6864960, 'steps': 35754, 'loss/train': 1.0977510213851929} -08/30/2021 19:40:25 - INFO - __main__ - Step 35756: {'lr': 0.0004385245123838557, 'samples': 6865152, 'steps': 35755, 'loss/train': 0.8566994071006775} -08/30/2021 19:40:25 - INFO - __main__ - Step 35757: {'lr': 0.00043852102707413144, 'samples': 6865344, 'steps': 35756, 'loss/train': 1.259803295135498} -08/30/2021 19:40:25 - INFO - __main__ - Step 35758: {'lr': 0.00043851754167946244, 'samples': 6865536, 'steps': 35757, 'loss/train': 1.8018505573272705} -08/30/2021 19:40:26 - INFO - __main__ - Step 35759: {'lr': 0.00043851405619985037, 'samples': 6865728, 'steps': 35758, 'loss/train': 0.9264659285545349} -08/30/2021 19:40:26 - INFO - __main__ - Step 35760: {'lr': 0.00043851057063529675, 'samples': 6865920, 'steps': 35759, 'loss/train': 0.7205207347869873} -08/30/2021 19:40:28 - INFO - __main__ - Step 35761: {'lr': 0.00043850708498580326, 'samples': 6866112, 'steps': 35760, 'loss/train': 0.5752424001693726} -08/30/2021 19:40:29 - INFO - __main__ - Step 35762: {'lr': 0.00043850359925137126, 'samples': 6866304, 'steps': 35761, 'loss/train': 1.7855188846588135} -08/30/2021 19:40:29 - INFO - __main__ - Step 35763: {'lr': 0.0004385001134320026, 'samples': 6866496, 'steps': 35762, 'loss/train': 1.1552997827529907} -08/30/2021 19:40:30 - INFO - __main__ - Step 35764: {'lr': 0.0004384966275276986, 'samples': 6866688, 'steps': 35763, 'loss/train': 1.2471599578857422} -08/30/2021 19:40:30 - INFO - __main__ - Step 35765: {'lr': 0.00043849314153846094, 'samples': 6866880, 'steps': 35764, 'loss/train': 1.1940642595291138} -08/30/2021 19:40:30 - INFO - __main__ - Step 35766: {'lr': 0.0004384896554642912, 'samples': 6867072, 'steps': 35765, 'loss/train': 1.9924455881118774} -08/30/2021 19:40:31 - INFO - __main__ - Step 35767: {'lr': 0.00043848616930519094, 'samples': 6867264, 'steps': 35766, 'loss/train': 1.452562928199768} -08/30/2021 19:40:32 - INFO - __main__ - Step 35768: {'lr': 0.0004384826830611617, 'samples': 6867456, 'steps': 35767, 'loss/train': 1.4745227098464966} -08/30/2021 19:40:33 - INFO - __main__ - Step 35769: {'lr': 0.00043847919673220504, 'samples': 6867648, 'steps': 35768, 'loss/train': 2.126126289367676} -08/30/2021 19:40:33 - INFO - __main__ - Step 35770: {'lr': 0.00043847571031832257, 'samples': 6867840, 'steps': 35769, 'loss/train': 0.12559567391872406} -08/30/2021 19:40:33 - INFO - __main__ - Step 35771: {'lr': 0.0004384722238195159, 'samples': 6868032, 'steps': 35770, 'loss/train': 0.0725589394569397} -08/30/2021 19:40:34 - INFO - __main__ - Step 35772: {'lr': 0.0004384687372357865, 'samples': 6868224, 'steps': 35771, 'loss/train': 1.2416489124298096} -08/30/2021 19:40:35 - INFO - __main__ - Step 35773: {'lr': 0.000438465250567136, 'samples': 6868416, 'steps': 35772, 'loss/train': 1.4894640445709229} -08/30/2021 19:40:36 - INFO - __main__ - Step 35774: {'lr': 0.00043846176381356607, 'samples': 6868608, 'steps': 35773, 'loss/train': 0.7272209525108337} -08/30/2021 19:40:36 - INFO - __main__ - Step 35775: {'lr': 0.000438458276975078, 'samples': 6868800, 'steps': 35774, 'loss/train': 1.644163727760315} -08/30/2021 19:40:37 - INFO - __main__ - Step 35776: {'lr': 0.0004384547900516737, 'samples': 6868992, 'steps': 35775, 'loss/train': 1.6450856924057007} -08/30/2021 19:40:37 - INFO - __main__ - Step 35777: {'lr': 0.00043845130304335454, 'samples': 6869184, 'steps': 35776, 'loss/train': 1.7167104482650757} -08/30/2021 19:40:39 - INFO - __main__ - Step 35778: {'lr': 0.00043844781595012204, 'samples': 6869376, 'steps': 35777, 'loss/train': 1.3521348237991333} -08/30/2021 19:40:39 - INFO - __main__ - Step 35779: {'lr': 0.0004384443287719779, 'samples': 6869568, 'steps': 35778, 'loss/train': 1.14707612991333} -08/30/2021 19:40:39 - INFO - __main__ - Step 35780: {'lr': 0.0004384408415089237, 'samples': 6869760, 'steps': 35779, 'loss/train': 1.990094542503357} -08/30/2021 19:40:40 - INFO - __main__ - Step 35781: {'lr': 0.000438437354160961, 'samples': 6869952, 'steps': 35780, 'loss/train': 1.4677101373672485} -08/30/2021 19:40:40 - INFO - __main__ - Step 35782: {'lr': 0.00043843386672809127, 'samples': 6870144, 'steps': 35781, 'loss/train': 1.3196239471435547} -08/30/2021 19:40:42 - INFO - __main__ - Step 35783: {'lr': 0.00043843037921031616, 'samples': 6870336, 'steps': 35782, 'loss/train': 1.3968104124069214} -08/30/2021 19:40:42 - INFO - __main__ - Step 35784: {'lr': 0.00043842689160763723, 'samples': 6870528, 'steps': 35783, 'loss/train': 0.9303664565086365} -08/30/2021 19:40:43 - INFO - __main__ - Step 35785: {'lr': 0.00043842340392005605, 'samples': 6870720, 'steps': 35784, 'loss/train': 1.709263801574707} -08/30/2021 19:40:43 - INFO - __main__ - Step 35786: {'lr': 0.00043841991614757415, 'samples': 6870912, 'steps': 35785, 'loss/train': 1.9071567058563232} -08/30/2021 19:40:43 - INFO - __main__ - Step 35787: {'lr': 0.00043841642829019325, 'samples': 6871104, 'steps': 35786, 'loss/train': 1.302585244178772} -08/30/2021 19:40:45 - INFO - __main__ - Step 35788: {'lr': 0.00043841294034791466, 'samples': 6871296, 'steps': 35787, 'loss/train': 0.9638983011245728} -08/30/2021 19:40:46 - INFO - __main__ - Step 35789: {'lr': 0.0004384094523207403, 'samples': 6871488, 'steps': 35788, 'loss/train': 1.3495556116104126} -08/30/2021 19:40:46 - INFO - __main__ - Step 35790: {'lr': 0.0004384059642086714, 'samples': 6871680, 'steps': 35789, 'loss/train': 1.5559329986572266} -08/30/2021 19:40:47 - INFO - __main__ - Step 35791: {'lr': 0.00043840247601170966, 'samples': 6871872, 'steps': 35790, 'loss/train': 1.0083070993423462} -08/30/2021 19:40:47 - INFO - __main__ - Step 35792: {'lr': 0.0004383989877298568, 'samples': 6872064, 'steps': 35791, 'loss/train': 1.7565701007843018} -08/30/2021 19:40:47 - INFO - __main__ - Step 35793: {'lr': 0.0004383954993631142, 'samples': 6872256, 'steps': 35792, 'loss/train': 1.2921377420425415} -08/30/2021 19:40:49 - INFO - __main__ - Step 35794: {'lr': 0.0004383920109114835, 'samples': 6872448, 'steps': 35793, 'loss/train': 0.9689278602600098} -08/30/2021 19:40:49 - INFO - __main__ - Step 35795: {'lr': 0.00043838852237496626, 'samples': 6872640, 'steps': 35794, 'loss/train': 1.3755950927734375} -08/30/2021 19:40:50 - INFO - __main__ - Step 35796: {'lr': 0.000438385033753564, 'samples': 6872832, 'steps': 35795, 'loss/train': 1.233426570892334} -08/30/2021 19:40:50 - INFO - __main__ - Step 35797: {'lr': 0.00043838154504727847, 'samples': 6873024, 'steps': 35796, 'loss/train': 1.0053900480270386} -08/30/2021 19:40:50 - INFO - __main__ - Step 35798: {'lr': 0.00043837805625611105, 'samples': 6873216, 'steps': 35797, 'loss/train': 1.2939139604568481} -08/30/2021 19:40:52 - INFO - __main__ - Step 35799: {'lr': 0.0004383745673800634, 'samples': 6873408, 'steps': 35798, 'loss/train': 1.6685645580291748} -08/30/2021 19:40:53 - INFO - __main__ - Step 35800: {'lr': 0.000438371078419137, 'samples': 6873600, 'steps': 35799, 'loss/train': 1.132985234260559} -08/30/2021 19:40:53 - INFO - __main__ - Step 35801: {'lr': 0.00043836758937333366, 'samples': 6873792, 'steps': 35800, 'loss/train': 2.439655065536499} -08/30/2021 19:40:53 - INFO - __main__ - Step 35802: {'lr': 0.0004383641002426547, 'samples': 6873984, 'steps': 35801, 'loss/train': 1.5419939756393433} -08/30/2021 19:40:54 - INFO - __main__ - Step 35803: {'lr': 0.0004383606110271018, 'samples': 6874176, 'steps': 35802, 'loss/train': 0.8653266429901123} -08/30/2021 19:40:55 - INFO - __main__ - Step 35804: {'lr': 0.00043835712172667643, 'samples': 6874368, 'steps': 35803, 'loss/train': 1.158326506614685} -08/30/2021 19:40:55 - INFO - __main__ - Step 35805: {'lr': 0.00043835363234138037, 'samples': 6874560, 'steps': 35804, 'loss/train': 1.425804853439331} -08/30/2021 19:40:56 - INFO - __main__ - Step 35806: {'lr': 0.00043835014287121497, 'samples': 6874752, 'steps': 35805, 'loss/train': 1.483182668685913} -08/30/2021 19:40:56 - INFO - __main__ - Step 35807: {'lr': 0.00043834665331618196, 'samples': 6874944, 'steps': 35806, 'loss/train': 1.5690828561782837} -08/30/2021 19:40:56 - INFO - __main__ - Step 35808: {'lr': 0.00043834316367628287, 'samples': 6875136, 'steps': 35807, 'loss/train': 1.5251847505569458} -08/30/2021 19:40:57 - INFO - __main__ - Step 35809: {'lr': 0.0004383396739515192, 'samples': 6875328, 'steps': 35808, 'loss/train': 1.4956177473068237} -08/30/2021 19:40:58 - INFO - __main__ - Step 35810: {'lr': 0.00043833618414189265, 'samples': 6875520, 'steps': 35809, 'loss/train': 1.3618067502975464} -08/30/2021 19:40:59 - INFO - __main__ - Step 35811: {'lr': 0.0004383326942474046, 'samples': 6875712, 'steps': 35810, 'loss/train': 1.365071415901184} -08/30/2021 19:40:59 - INFO - __main__ - Step 35812: {'lr': 0.0004383292042680569, 'samples': 6875904, 'steps': 35811, 'loss/train': 1.2887581586837769} -08/30/2021 19:41:00 - INFO - __main__ - Step 35813: {'lr': 0.0004383257142038509, 'samples': 6876096, 'steps': 35812, 'loss/train': 0.8633568286895752} -08/30/2021 19:41:00 - INFO - __main__ - Step 35814: {'lr': 0.0004383222240547882, 'samples': 6876288, 'steps': 35813, 'loss/train': 1.455997109413147} -08/30/2021 19:41:02 - INFO - __main__ - Step 35815: {'lr': 0.00043831873382087043, 'samples': 6876480, 'steps': 35814, 'loss/train': 0.11450637131929398} -08/30/2021 19:41:02 - INFO - __main__ - Step 35816: {'lr': 0.0004383152435020992, 'samples': 6876672, 'steps': 35815, 'loss/train': 0.9193439483642578} -08/30/2021 19:41:03 - INFO - __main__ - Step 35817: {'lr': 0.0004383117530984759, 'samples': 6876864, 'steps': 35816, 'loss/train': 0.11300406605005264} -08/30/2021 19:41:03 - INFO - __main__ - Step 35818: {'lr': 0.0004383082626100024, 'samples': 6877056, 'steps': 35817, 'loss/train': 1.0652726888656616} -08/30/2021 19:41:03 - INFO - __main__ - Step 35819: {'lr': 0.00043830477203668, 'samples': 6877248, 'steps': 35818, 'loss/train': 1.4916833639144897} -08/30/2021 19:41:05 - INFO - __main__ - Step 35820: {'lr': 0.0004383012813785104, 'samples': 6877440, 'steps': 35819, 'loss/train': 0.8225932121276855} -08/30/2021 19:41:05 - INFO - __main__ - Step 35821: {'lr': 0.00043829779063549515, 'samples': 6877632, 'steps': 35820, 'loss/train': 1.8141981363296509} -08/30/2021 19:41:06 - INFO - __main__ - Step 35822: {'lr': 0.0004382942998076358, 'samples': 6877824, 'steps': 35821, 'loss/train': 0.8098313808441162} -08/30/2021 19:41:06 - INFO - __main__ - Step 35823: {'lr': 0.000438290808894934, 'samples': 6878016, 'steps': 35822, 'loss/train': 0.7846266031265259} -08/30/2021 19:41:07 - INFO - __main__ - Step 35824: {'lr': 0.0004382873178973912, 'samples': 6878208, 'steps': 35823, 'loss/train': 1.348767876625061} -08/30/2021 19:41:08 - INFO - __main__ - Step 35825: {'lr': 0.00043828382681500907, 'samples': 6878400, 'steps': 35824, 'loss/train': 1.2977933883666992} -08/30/2021 19:41:08 - INFO - __main__ - Step 35826: {'lr': 0.0004382803356477891, 'samples': 6878592, 'steps': 35825, 'loss/train': 1.1374726295471191} -08/30/2021 19:41:09 - INFO - __main__ - Step 35827: {'lr': 0.000438276844395733, 'samples': 6878784, 'steps': 35826, 'loss/train': 1.7101885080337524} -08/30/2021 19:41:09 - INFO - __main__ - Step 35828: {'lr': 0.0004382733530588422, 'samples': 6878976, 'steps': 35827, 'loss/train': 1.4890118837356567} -08/30/2021 19:41:09 - INFO - __main__ - Step 35829: {'lr': 0.00043826986163711835, 'samples': 6879168, 'steps': 35828, 'loss/train': 1.2416892051696777} -08/30/2021 19:41:10 - INFO - __main__ - Step 35830: {'lr': 0.000438266370130563, 'samples': 6879360, 'steps': 35829, 'loss/train': 1.267130970954895} -08/30/2021 19:41:11 - INFO - __main__ - Step 35831: {'lr': 0.0004382628785391778, 'samples': 6879552, 'steps': 35830, 'loss/train': 2.0122570991516113} -08/30/2021 19:41:12 - INFO - __main__ - Step 35832: {'lr': 0.00043825938686296417, 'samples': 6879744, 'steps': 35831, 'loss/train': 1.7289721965789795} -08/30/2021 19:41:12 - INFO - __main__ - Step 35833: {'lr': 0.00043825589510192376, 'samples': 6879936, 'steps': 35832, 'loss/train': 1.301513671875} -08/30/2021 19:41:12 - INFO - __main__ - Step 35834: {'lr': 0.0004382524032560582, 'samples': 6880128, 'steps': 35833, 'loss/train': 1.5454095602035522} -08/30/2021 19:41:13 - INFO - __main__ - Step 35835: {'lr': 0.000438248911325369, 'samples': 6880320, 'steps': 35834, 'loss/train': 1.5459630489349365} -08/30/2021 19:41:14 - INFO - __main__ - Step 35836: {'lr': 0.00043824541930985775, 'samples': 6880512, 'steps': 35835, 'loss/train': 1.6328880786895752} -08/30/2021 19:41:15 - INFO - __main__ - Step 35837: {'lr': 0.0004382419272095259, 'samples': 6880704, 'steps': 35836, 'loss/train': 1.4368534088134766} -08/30/2021 19:41:15 - INFO - __main__ - Step 35838: {'lr': 0.00043823843502437533, 'samples': 6880896, 'steps': 35837, 'loss/train': 0.6696494221687317} -08/30/2021 19:41:15 - INFO - __main__ - Step 35839: {'lr': 0.00043823494275440733, 'samples': 6881088, 'steps': 35838, 'loss/train': 1.1786456108093262} -08/30/2021 19:41:16 - INFO - __main__ - Step 35840: {'lr': 0.0004382314503996236, 'samples': 6881280, 'steps': 35839, 'loss/train': 0.8219661116600037} -08/30/2021 19:41:18 - INFO - __main__ - Step 35841: {'lr': 0.0004382279579600256, 'samples': 6881472, 'steps': 35840, 'loss/train': 1.1060184240341187} -08/30/2021 19:41:18 - INFO - __main__ - Step 35842: {'lr': 0.0004382244654356151, 'samples': 6881664, 'steps': 35841, 'loss/train': 0.7607479095458984} -08/30/2021 19:41:19 - INFO - __main__ - Step 35843: {'lr': 0.0004382209728263935, 'samples': 6881856, 'steps': 35842, 'loss/train': 1.6023942232131958} -08/30/2021 19:41:19 - INFO - __main__ - Step 35844: {'lr': 0.0004382174801323624, 'samples': 6882048, 'steps': 35843, 'loss/train': 0.7133591175079346} -08/30/2021 19:41:19 - INFO - __main__ - Step 35845: {'lr': 0.00043821398735352344, 'samples': 6882240, 'steps': 35844, 'loss/train': 1.059515118598938} -08/30/2021 19:41:20 - INFO - __main__ - Step 35846: {'lr': 0.0004382104944898782, 'samples': 6882432, 'steps': 35845, 'loss/train': 1.2639186382293701} -08/30/2021 19:41:21 - INFO - __main__ - Step 35847: {'lr': 0.00043820700154142825, 'samples': 6882624, 'steps': 35846, 'loss/train': 1.8837535381317139} -08/30/2021 19:41:22 - INFO - __main__ - Step 35848: {'lr': 0.00043820350850817504, 'samples': 6882816, 'steps': 35847, 'loss/train': 1.5463966131210327} -08/30/2021 19:41:22 - INFO - __main__ - Step 35849: {'lr': 0.00043820001539012025, 'samples': 6883008, 'steps': 35848, 'loss/train': 1.0958948135375977} -08/30/2021 19:41:23 - INFO - __main__ - Step 35850: {'lr': 0.00043819652218726545, 'samples': 6883200, 'steps': 35849, 'loss/train': 1.5311769247055054} -08/30/2021 19:41:23 - INFO - __main__ - Step 35851: {'lr': 0.0004381930288996122, 'samples': 6883392, 'steps': 35850, 'loss/train': 1.0675137042999268} -08/30/2021 19:41:25 - INFO - __main__ - Step 35852: {'lr': 0.0004381895355271621, 'samples': 6883584, 'steps': 35851, 'loss/train': 1.3081263303756714} -08/30/2021 19:41:25 - INFO - __main__ - Step 35853: {'lr': 0.00043818604206991664, 'samples': 6883776, 'steps': 35852, 'loss/train': 1.055031418800354} -08/30/2021 19:41:25 - INFO - __main__ - Step 35854: {'lr': 0.0004381825485278775, 'samples': 6883968, 'steps': 35853, 'loss/train': 1.10634183883667} -08/30/2021 19:41:26 - INFO - __main__ - Step 35855: {'lr': 0.00043817905490104613, 'samples': 6884160, 'steps': 35854, 'loss/train': 1.2523554563522339} -08/30/2021 19:41:26 - INFO - __main__ - Step 35856: {'lr': 0.00043817556118942426, 'samples': 6884352, 'steps': 35855, 'loss/train': 1.5465097427368164} -08/30/2021 19:41:28 - INFO - __main__ - Step 35857: {'lr': 0.0004381720673930134, 'samples': 6884544, 'steps': 35856, 'loss/train': 1.6932920217514038} -08/30/2021 19:41:29 - INFO - __main__ - Step 35858: {'lr': 0.00043816857351181503, 'samples': 6884736, 'steps': 35857, 'loss/train': 1.629940390586853} -08/30/2021 19:41:29 - INFO - __main__ - Step 35859: {'lr': 0.0004381650795458309, 'samples': 6884928, 'steps': 35858, 'loss/train': 1.8170835971832275} -08/30/2021 19:41:29 - INFO - __main__ - Step 35860: {'lr': 0.0004381615854950625, 'samples': 6885120, 'steps': 35859, 'loss/train': 1.8068844079971313} -08/30/2021 19:41:30 - INFO - __main__ - Step 35861: {'lr': 0.0004381580913595113, 'samples': 6885312, 'steps': 35860, 'loss/train': 3.2505946159362793} -08/30/2021 19:41:30 - INFO - __main__ - Step 35862: {'lr': 0.000438154597139179, 'samples': 6885504, 'steps': 35861, 'loss/train': 1.0914829969406128} -08/30/2021 19:41:31 - INFO - __main__ - Step 35863: {'lr': 0.0004381511028340671, 'samples': 6885696, 'steps': 35862, 'loss/train': 1.1033549308776855} -08/30/2021 19:41:32 - INFO - __main__ - Step 35864: {'lr': 0.0004381476084441773, 'samples': 6885888, 'steps': 35863, 'loss/train': 0.7790926694869995} -08/30/2021 19:41:32 - INFO - __main__ - Step 35865: {'lr': 0.00043814411396951103, 'samples': 6886080, 'steps': 35864, 'loss/train': 1.744763970375061} -08/30/2021 19:41:33 - INFO - __main__ - Step 35866: {'lr': 0.00043814061941007, 'samples': 6886272, 'steps': 35865, 'loss/train': 1.042218565940857} -08/30/2021 19:41:33 - INFO - __main__ - Step 35867: {'lr': 0.00043813712476585564, 'samples': 6886464, 'steps': 35866, 'loss/train': 1.3351562023162842} -08/30/2021 19:41:33 - INFO - __main__ - Step 35868: {'lr': 0.00043813363003686963, 'samples': 6886656, 'steps': 35867, 'loss/train': 1.7624542713165283} -08/30/2021 19:41:35 - INFO - __main__ - Step 35869: {'lr': 0.00043813013522311353, 'samples': 6886848, 'steps': 35868, 'loss/train': 1.4124177694320679} -08/30/2021 19:41:36 - INFO - __main__ - Step 35870: {'lr': 0.0004381266403245888, 'samples': 6887040, 'steps': 35869, 'loss/train': 2.866715669631958} -08/30/2021 19:41:36 - INFO - __main__ - Step 35871: {'lr': 0.00043812314534129716, 'samples': 6887232, 'steps': 35870, 'loss/train': 1.3953862190246582} -08/30/2021 19:41:36 - INFO - __main__ - Step 35872: {'lr': 0.0004381196502732402, 'samples': 6887424, 'steps': 35871, 'loss/train': 1.0986944437026978} -08/30/2021 19:41:37 - INFO - __main__ - Step 35873: {'lr': 0.00043811615512041934, 'samples': 6887616, 'steps': 35872, 'loss/train': 1.6316261291503906} -08/30/2021 19:41:37 - INFO - __main__ - Step 35874: {'lr': 0.00043811265988283625, 'samples': 6887808, 'steps': 35873, 'loss/train': 1.1859568357467651} -08/30/2021 19:41:39 - INFO - __main__ - Step 35875: {'lr': 0.00043810916456049257, 'samples': 6888000, 'steps': 35874, 'loss/train': 1.3458808660507202} -08/30/2021 19:41:39 - INFO - __main__ - Step 35876: {'lr': 0.00043810566915338965, 'samples': 6888192, 'steps': 35875, 'loss/train': 0.6165096759796143} -08/30/2021 19:41:40 - INFO - __main__ - Step 35877: {'lr': 0.0004381021736615294, 'samples': 6888384, 'steps': 35876, 'loss/train': 0.7613841891288757} -08/30/2021 19:41:40 - INFO - __main__ - Step 35878: {'lr': 0.0004380986780849131, 'samples': 6888576, 'steps': 35877, 'loss/train': 1.8748672008514404} -08/30/2021 19:41:40 - INFO - __main__ - Step 35879: {'lr': 0.0004380951824235425, 'samples': 6888768, 'steps': 35878, 'loss/train': 1.521654725074768} -08/30/2021 19:41:42 - INFO - __main__ - Step 35880: {'lr': 0.00043809168667741907, 'samples': 6888960, 'steps': 35879, 'loss/train': 1.4347739219665527} -08/30/2021 19:41:42 - INFO - __main__ - Step 35881: {'lr': 0.0004380881908465445, 'samples': 6889152, 'steps': 35880, 'loss/train': 1.4354737997055054} -08/30/2021 19:41:43 - INFO - __main__ - Step 35882: {'lr': 0.0004380846949309202, 'samples': 6889344, 'steps': 35881, 'loss/train': 1.3781572580337524} -08/30/2021 19:41:43 - INFO - __main__ - Step 35883: {'lr': 0.00043808119893054787, 'samples': 6889536, 'steps': 35882, 'loss/train': 1.5532004833221436} -08/30/2021 19:41:43 - INFO - __main__ - Step 35884: {'lr': 0.0004380777028454291, 'samples': 6889728, 'steps': 35883, 'loss/train': 0.8596472144126892} -08/30/2021 19:41:45 - INFO - __main__ - Step 35885: {'lr': 0.0004380742066755654, 'samples': 6889920, 'steps': 35884, 'loss/train': 1.613647699356079} -08/30/2021 19:41:46 - INFO - __main__ - Step 35886: {'lr': 0.0004380707104209583, 'samples': 6890112, 'steps': 35885, 'loss/train': 0.04353176802396774} -08/30/2021 19:41:46 - INFO - __main__ - Step 35887: {'lr': 0.0004380672140816095, 'samples': 6890304, 'steps': 35886, 'loss/train': 0.8171952962875366} -08/30/2021 19:41:46 - INFO - __main__ - Step 35888: {'lr': 0.0004380637176575205, 'samples': 6890496, 'steps': 35887, 'loss/train': 2.121934652328491} -08/30/2021 19:41:47 - INFO - __main__ - Step 35889: {'lr': 0.00043806022114869294, 'samples': 6890688, 'steps': 35888, 'loss/train': 1.5538878440856934} -08/30/2021 19:41:47 - INFO - __main__ - Step 35890: {'lr': 0.0004380567245551282, 'samples': 6890880, 'steps': 35889, 'loss/train': 1.1371572017669678} -08/30/2021 19:41:49 - INFO - __main__ - Step 35891: {'lr': 0.0004380532278768282, 'samples': 6891072, 'steps': 35890, 'loss/train': 1.6110029220581055} -08/30/2021 19:41:49 - INFO - __main__ - Step 35892: {'lr': 0.0004380497311137942, 'samples': 6891264, 'steps': 35891, 'loss/train': 1.6960369348526} -08/30/2021 19:41:49 - INFO - __main__ - Step 35893: {'lr': 0.00043804623426602784, 'samples': 6891456, 'steps': 35892, 'loss/train': 1.629783272743225} -08/30/2021 19:41:50 - INFO - __main__ - Step 35894: {'lr': 0.00043804273733353085, 'samples': 6891648, 'steps': 35893, 'loss/train': 1.7936067581176758} -08/30/2021 19:41:50 - INFO - __main__ - Step 35895: {'lr': 0.0004380392403163047, 'samples': 6891840, 'steps': 35894, 'loss/train': 1.4328663349151611} -08/30/2021 19:41:52 - INFO - __main__ - Step 35896: {'lr': 0.00043803574321435093, 'samples': 6892032, 'steps': 35895, 'loss/train': 1.5266427993774414} -08/30/2021 19:41:53 - INFO - __main__ - Step 35897: {'lr': 0.00043803224602767115, 'samples': 6892224, 'steps': 35896, 'loss/train': 1.4053335189819336} -08/30/2021 19:41:53 - INFO - __main__ - Step 35898: {'lr': 0.000438028748756267, 'samples': 6892416, 'steps': 35897, 'loss/train': 1.304561734199524} -08/30/2021 19:41:54 - INFO - __main__ - Step 35899: {'lr': 0.00043802525140013994, 'samples': 6892608, 'steps': 35898, 'loss/train': 1.5983912944793701} -08/30/2021 19:41:54 - INFO - __main__ - Step 35900: {'lr': 0.00043802175395929156, 'samples': 6892800, 'steps': 35899, 'loss/train': 1.329479694366455} -08/30/2021 19:41:55 - INFO - __main__ - Step 35901: {'lr': 0.00043801825643372363, 'samples': 6892992, 'steps': 35900, 'loss/train': 0.9093522429466248} -08/30/2021 19:41:56 - INFO - __main__ - Step 35902: {'lr': 0.00043801475882343743, 'samples': 6893184, 'steps': 35901, 'loss/train': 1.4933193922042847} -08/30/2021 19:41:56 - INFO - __main__ - Step 35903: {'lr': 0.0004380112611284347, 'samples': 6893376, 'steps': 35902, 'loss/train': 1.4038033485412598} -08/30/2021 19:41:57 - INFO - __main__ - Step 35904: {'lr': 0.00043800776334871705, 'samples': 6893568, 'steps': 35903, 'loss/train': 1.1220324039459229} -08/30/2021 19:41:57 - INFO - __main__ - Step 35905: {'lr': 0.000438004265484286, 'samples': 6893760, 'steps': 35904, 'loss/train': 1.3246674537658691} -08/30/2021 19:41:59 - INFO - __main__ - Step 35906: {'lr': 0.0004380007675351431, 'samples': 6893952, 'steps': 35905, 'loss/train': 1.105709195137024} -08/30/2021 19:41:59 - INFO - __main__ - Step 35907: {'lr': 0.00043799726950128997, 'samples': 6894144, 'steps': 35906, 'loss/train': 1.3028582334518433} -08/30/2021 19:42:00 - INFO - __main__ - Step 35908: {'lr': 0.0004379937713827282, 'samples': 6894336, 'steps': 35907, 'loss/train': 1.5036885738372803} -08/30/2021 19:42:00 - INFO - __main__ - Step 35909: {'lr': 0.0004379902731794593, 'samples': 6894528, 'steps': 35908, 'loss/train': 1.6185053586959839} -08/30/2021 19:42:00 - INFO - __main__ - Step 35910: {'lr': 0.00043798677489148487, 'samples': 6894720, 'steps': 35909, 'loss/train': 1.006392002105713} -08/30/2021 19:42:01 - INFO - __main__ - Step 35911: {'lr': 0.0004379832765188065, 'samples': 6894912, 'steps': 35910, 'loss/train': 1.156903624534607} -08/30/2021 19:42:01 - INFO - __main__ - Step 35912: {'lr': 0.00043797977806142585, 'samples': 6895104, 'steps': 35911, 'loss/train': 0.23539602756500244} -08/30/2021 19:42:03 - INFO - __main__ - Step 35913: {'lr': 0.0004379762795193443, 'samples': 6895296, 'steps': 35912, 'loss/train': 0.12552106380462646} -08/30/2021 19:42:03 - INFO - __main__ - Step 35914: {'lr': 0.0004379727808925636, 'samples': 6895488, 'steps': 35913, 'loss/train': 1.5842339992523193} -08/30/2021 19:42:04 - INFO - __main__ - Step 35915: {'lr': 0.00043796928218108527, 'samples': 6895680, 'steps': 35914, 'loss/train': 1.5486630201339722} -08/30/2021 19:42:04 - INFO - __main__ - Step 35916: {'lr': 0.0004379657833849109, 'samples': 6895872, 'steps': 35915, 'loss/train': 2.00393009185791} -08/30/2021 19:42:04 - INFO - __main__ - Step 35917: {'lr': 0.000437962284504042, 'samples': 6896064, 'steps': 35916, 'loss/train': 1.2316259145736694} -08/30/2021 19:42:06 - INFO - __main__ - Step 35918: {'lr': 0.00043795878553848025, 'samples': 6896256, 'steps': 35917, 'loss/train': 1.6356743574142456} -08/30/2021 19:42:06 - INFO - __main__ - Step 35919: {'lr': 0.0004379552864882271, 'samples': 6896448, 'steps': 35918, 'loss/train': 0.13809886574745178} -08/30/2021 19:42:07 - INFO - __main__ - Step 35920: {'lr': 0.00043795178735328425, 'samples': 6896640, 'steps': 35919, 'loss/train': 1.2755662202835083} -08/30/2021 19:42:07 - INFO - __main__ - Step 35921: {'lr': 0.0004379482881336532, 'samples': 6896832, 'steps': 35920, 'loss/train': 1.628170371055603} -08/30/2021 19:42:07 - INFO - __main__ - Step 35922: {'lr': 0.0004379447888293355, 'samples': 6897024, 'steps': 35921, 'loss/train': 1.4386086463928223} -08/30/2021 19:42:08 - INFO - __main__ - Step 35923: {'lr': 0.0004379412894403328, 'samples': 6897216, 'steps': 35922, 'loss/train': 1.5190057754516602} -08/30/2021 19:42:09 - INFO - __main__ - Step 35924: {'lr': 0.0004379377899666468, 'samples': 6897408, 'steps': 35923, 'loss/train': 1.868404746055603} -08/30/2021 19:42:10 - INFO - __main__ - Step 35925: {'lr': 0.0004379342904082788, 'samples': 6897600, 'steps': 35924, 'loss/train': 1.0146533250808716} -08/30/2021 19:42:10 - INFO - __main__ - Step 35926: {'lr': 0.00043793079076523053, 'samples': 6897792, 'steps': 35925, 'loss/train': 0.5593517422676086} -08/30/2021 19:42:10 - INFO - __main__ - Step 35927: {'lr': 0.0004379272910375035, 'samples': 6897984, 'steps': 35926, 'loss/train': 1.5626782178878784} -08/30/2021 19:42:11 - INFO - __main__ - Step 35928: {'lr': 0.0004379237912250994, 'samples': 6898176, 'steps': 35927, 'loss/train': 1.6108183860778809} -08/30/2021 19:42:12 - INFO - __main__ - Step 35929: {'lr': 0.0004379202913280197, 'samples': 6898368, 'steps': 35928, 'loss/train': 0.7381371259689331} -08/30/2021 19:42:13 - INFO - __main__ - Step 35930: {'lr': 0.0004379167913462661, 'samples': 6898560, 'steps': 35929, 'loss/train': 1.7457282543182373} -08/30/2021 19:42:13 - INFO - __main__ - Step 35931: {'lr': 0.00043791329127984004, 'samples': 6898752, 'steps': 35930, 'loss/train': 1.0831356048583984} -08/30/2021 19:42:13 - INFO - __main__ - Step 35932: {'lr': 0.0004379097911287431, 'samples': 6898944, 'steps': 35931, 'loss/train': 1.2513684034347534} -08/30/2021 19:42:14 - INFO - __main__ - Step 35933: {'lr': 0.000437906290892977, 'samples': 6899136, 'steps': 35932, 'loss/train': 1.300889253616333} -08/30/2021 19:42:16 - INFO - __main__ - Step 35934: {'lr': 0.00043790279057254314, 'samples': 6899328, 'steps': 35933, 'loss/train': 1.373547077178955} -08/30/2021 19:42:16 - INFO - __main__ - Step 35935: {'lr': 0.00043789929016744324, 'samples': 6899520, 'steps': 35934, 'loss/train': 1.266237497329712} -08/30/2021 19:42:16 - INFO - __main__ - Step 35936: {'lr': 0.0004378957896776787, 'samples': 6899712, 'steps': 35935, 'loss/train': 1.0654737949371338} -08/30/2021 19:42:17 - INFO - __main__ - Step 35937: {'lr': 0.0004378922891032514, 'samples': 6899904, 'steps': 35936, 'loss/train': 1.1746692657470703} -08/30/2021 19:42:17 - INFO - __main__ - Step 35938: {'lr': 0.0004378887884441626, 'samples': 6900096, 'steps': 35937, 'loss/train': 0.03163360059261322} -08/30/2021 19:42:17 - INFO - __main__ - Step 35939: {'lr': 0.000437885287700414, 'samples': 6900288, 'steps': 35938, 'loss/train': 1.0469541549682617} -08/30/2021 19:42:19 - INFO - __main__ - Step 35940: {'lr': 0.0004378817868720073, 'samples': 6900480, 'steps': 35939, 'loss/train': 1.2296102046966553} -08/30/2021 19:42:19 - INFO - __main__ - Step 35941: {'lr': 0.0004378782859589439, 'samples': 6900672, 'steps': 35940, 'loss/train': 1.4204121828079224} -08/30/2021 19:42:20 - INFO - __main__ - Step 35942: {'lr': 0.00043787478496122546, 'samples': 6900864, 'steps': 35941, 'loss/train': 1.2266864776611328} -08/30/2021 19:42:20 - INFO - __main__ - Step 35943: {'lr': 0.0004378712838788536, 'samples': 6901056, 'steps': 35942, 'loss/train': 1.0710322856903076} -08/30/2021 19:42:21 - INFO - __main__ - Step 35944: {'lr': 0.0004378677827118297, 'samples': 6901248, 'steps': 35943, 'loss/train': 1.3463505506515503} -08/30/2021 19:42:22 - INFO - __main__ - Step 35945: {'lr': 0.0004378642814601556, 'samples': 6901440, 'steps': 35944, 'loss/train': 1.977847695350647} -08/30/2021 19:42:23 - INFO - __main__ - Step 35946: {'lr': 0.0004378607801238327, 'samples': 6901632, 'steps': 35945, 'loss/train': 1.4442052841186523} -08/30/2021 19:42:23 - INFO - __main__ - Step 35947: {'lr': 0.00043785727870286265, 'samples': 6901824, 'steps': 35946, 'loss/train': 1.5053248405456543} -08/30/2021 19:42:23 - INFO - __main__ - Step 35948: {'lr': 0.00043785377719724697, 'samples': 6902016, 'steps': 35947, 'loss/train': 1.0368385314941406} -08/30/2021 19:42:24 - INFO - __main__ - Step 35949: {'lr': 0.0004378502756069873, 'samples': 6902208, 'steps': 35948, 'loss/train': 0.6296055912971497} -08/30/2021 19:42:26 - INFO - __main__ - Step 35950: {'lr': 0.0004378467739320852, 'samples': 6902400, 'steps': 35949, 'loss/train': 1.8616852760314941} -08/30/2021 19:42:26 - INFO - __main__ - Step 35951: {'lr': 0.0004378432721725422, 'samples': 6902592, 'steps': 35950, 'loss/train': 1.6548593044281006} -08/30/2021 19:42:27 - INFO - __main__ - Step 35952: {'lr': 0.00043783977032836, 'samples': 6902784, 'steps': 35951, 'loss/train': 1.3482282161712646} -08/30/2021 19:42:27 - INFO - __main__ - Step 35953: {'lr': 0.00043783626839954005, 'samples': 6902976, 'steps': 35952, 'loss/train': 1.2887263298034668} -08/30/2021 19:42:27 - INFO - __main__ - Step 35954: {'lr': 0.0004378327663860839, 'samples': 6903168, 'steps': 35953, 'loss/train': 1.7742043733596802} -08/30/2021 19:42:28 - INFO - __main__ - Step 35955: {'lr': 0.00043782926428799333, 'samples': 6903360, 'steps': 35954, 'loss/train': 1.4570260047912598} -08/30/2021 19:42:30 - INFO - __main__ - Step 35956: {'lr': 0.0004378257621052698, 'samples': 6903552, 'steps': 35955, 'loss/train': 0.19698043167591095} -08/30/2021 19:42:30 - INFO - __main__ - Step 35957: {'lr': 0.0004378222598379148, 'samples': 6903744, 'steps': 35956, 'loss/train': 1.0483758449554443} -08/30/2021 19:42:30 - INFO - __main__ - Step 35958: {'lr': 0.00043781875748593, 'samples': 6903936, 'steps': 35957, 'loss/train': 1.1234116554260254} -08/30/2021 19:42:31 - INFO - __main__ - Step 35959: {'lr': 0.000437815255049317, 'samples': 6904128, 'steps': 35958, 'loss/train': 1.541306495666504} -08/30/2021 19:42:31 - INFO - __main__ - Step 35960: {'lr': 0.0004378117525280773, 'samples': 6904320, 'steps': 35959, 'loss/train': 1.461466670036316} -08/30/2021 19:42:33 - INFO - __main__ - Step 35961: {'lr': 0.00043780824992221257, 'samples': 6904512, 'steps': 35960, 'loss/train': 1.5916260480880737} -08/30/2021 19:42:33 - INFO - __main__ - Step 35962: {'lr': 0.00043780474723172433, 'samples': 6904704, 'steps': 35961, 'loss/train': 1.4838563203811646} -08/30/2021 19:42:34 - INFO - __main__ - Step 35963: {'lr': 0.00043780124445661416, 'samples': 6904896, 'steps': 35962, 'loss/train': 0.2184886336326599} -08/30/2021 19:42:34 - INFO - __main__ - Step 35964: {'lr': 0.00043779774159688364, 'samples': 6905088, 'steps': 35963, 'loss/train': 1.4340686798095703} -08/30/2021 19:42:34 - INFO - __main__ - Step 35965: {'lr': 0.00043779423865253434, 'samples': 6905280, 'steps': 35964, 'loss/train': 1.2144970893859863} -08/30/2021 19:42:36 - INFO - __main__ - Step 35966: {'lr': 0.00043779073562356783, 'samples': 6905472, 'steps': 35965, 'loss/train': 1.4804232120513916} -08/30/2021 19:42:36 - INFO - __main__ - Step 35967: {'lr': 0.0004377872325099858, 'samples': 6905664, 'steps': 35966, 'loss/train': 1.1439294815063477} -08/30/2021 19:42:37 - INFO - __main__ - Step 35968: {'lr': 0.00043778372931178974, 'samples': 6905856, 'steps': 35967, 'loss/train': 1.7621876001358032} -08/30/2021 19:42:37 - INFO - __main__ - Step 35969: {'lr': 0.00043778022602898115, 'samples': 6906048, 'steps': 35968, 'loss/train': 2.0064849853515625} -08/30/2021 19:42:37 - INFO - __main__ - Step 35970: {'lr': 0.0004377767226615617, 'samples': 6906240, 'steps': 35969, 'loss/train': 1.1076551675796509} -08/30/2021 19:42:39 - INFO - __main__ - Step 35971: {'lr': 0.000437773219209533, 'samples': 6906432, 'steps': 35970, 'loss/train': 1.1933568716049194} -08/30/2021 19:42:39 - INFO - __main__ - Step 35972: {'lr': 0.00043776971567289656, 'samples': 6906624, 'steps': 35971, 'loss/train': 1.253467082977295} -08/30/2021 19:42:40 - INFO - __main__ - Step 35973: {'lr': 0.00043776621205165404, 'samples': 6906816, 'steps': 35972, 'loss/train': 0.8991245627403259} -08/30/2021 19:42:40 - INFO - __main__ - Step 35974: {'lr': 0.0004377627083458069, 'samples': 6907008, 'steps': 35973, 'loss/train': 1.5318894386291504} -08/30/2021 19:42:40 - INFO - __main__ - Step 35975: {'lr': 0.0004377592045553568, 'samples': 6907200, 'steps': 35974, 'loss/train': 1.268610954284668} -08/30/2021 19:42:41 - INFO - __main__ - Step 35976: {'lr': 0.00043775570068030524, 'samples': 6907392, 'steps': 35975, 'loss/train': 0.7990579605102539} -08/30/2021 19:42:42 - INFO - __main__ - Step 35977: {'lr': 0.0004377521967206539, 'samples': 6907584, 'steps': 35976, 'loss/train': 0.8548378944396973} -08/30/2021 19:42:43 - INFO - __main__ - Step 35978: {'lr': 0.00043774869267640436, 'samples': 6907776, 'steps': 35977, 'loss/train': 1.7069313526153564} -08/30/2021 19:42:43 - INFO - __main__ - Step 35979: {'lr': 0.0004377451885475581, 'samples': 6907968, 'steps': 35978, 'loss/train': 1.6038774251937866} -08/30/2021 19:42:43 - INFO - __main__ - Step 35980: {'lr': 0.0004377416843341168, 'samples': 6908160, 'steps': 35979, 'loss/train': 1.096545696258545} -08/30/2021 19:42:44 - INFO - __main__ - Step 35981: {'lr': 0.00043773818003608203, 'samples': 6908352, 'steps': 35980, 'loss/train': 1.547872543334961} -08/30/2021 19:42:45 - INFO - __main__ - Step 35982: {'lr': 0.00043773467565345523, 'samples': 6908544, 'steps': 35981, 'loss/train': 1.7717556953430176} -08/30/2021 19:42:46 - INFO - __main__ - Step 35983: {'lr': 0.0004377311711862381, 'samples': 6908736, 'steps': 35982, 'loss/train': 1.2803595066070557} -08/30/2021 19:42:46 - INFO - __main__ - Step 35984: {'lr': 0.0004377276666344322, 'samples': 6908928, 'steps': 35983, 'loss/train': 1.8664737939834595} -08/30/2021 19:42:46 - INFO - __main__ - Step 35985: {'lr': 0.00043772416199803924, 'samples': 6909120, 'steps': 35984, 'loss/train': 1.4957305192947388} -08/30/2021 19:42:47 - INFO - __main__ - Step 35986: {'lr': 0.00043772065727706053, 'samples': 6909312, 'steps': 35985, 'loss/train': 1.1382882595062256} -08/30/2021 19:42:48 - INFO - __main__ - Step 35987: {'lr': 0.0004377171524714978, 'samples': 6909504, 'steps': 35986, 'loss/train': 1.461427092552185} -08/30/2021 19:42:49 - INFO - __main__ - Step 35988: {'lr': 0.0004377136475813527, 'samples': 6909696, 'steps': 35987, 'loss/train': 1.9665017127990723} -08/30/2021 19:42:49 - INFO - __main__ - Step 35989: {'lr': 0.0004377101426066266, 'samples': 6909888, 'steps': 35988, 'loss/train': 1.9896049499511719} -08/30/2021 19:42:49 - INFO - __main__ - Step 35990: {'lr': 0.0004377066375473213, 'samples': 6910080, 'steps': 35989, 'loss/train': 1.1919983625411987} -08/30/2021 19:42:50 - INFO - __main__ - Step 35991: {'lr': 0.00043770313240343826, 'samples': 6910272, 'steps': 35990, 'loss/train': 1.751158595085144} -08/30/2021 19:42:51 - INFO - __main__ - Step 35992: {'lr': 0.00043769962717497916, 'samples': 6910464, 'steps': 35991, 'loss/train': 1.5254515409469604} -08/30/2021 19:42:52 - INFO - __main__ - Step 35993: {'lr': 0.0004376961218619454, 'samples': 6910656, 'steps': 35992, 'loss/train': 1.237084150314331} -08/30/2021 19:42:52 - INFO - __main__ - Step 35994: {'lr': 0.00043769261646433867, 'samples': 6910848, 'steps': 35993, 'loss/train': 1.1449388265609741} -08/30/2021 19:42:52 - INFO - __main__ - Step 35995: {'lr': 0.0004376891109821606, 'samples': 6911040, 'steps': 35994, 'loss/train': 1.532547950744629} -08/30/2021 19:42:53 - INFO - __main__ - Step 35996: {'lr': 0.0004376856054154127, 'samples': 6911232, 'steps': 35995, 'loss/train': 1.8205986022949219} -08/30/2021 19:42:54 - INFO - __main__ - Step 35997: {'lr': 0.00043768209976409645, 'samples': 6911424, 'steps': 35996, 'loss/train': 1.4493441581726074} -08/30/2021 19:42:55 - INFO - __main__ - Step 35998: {'lr': 0.0004376785940282137, 'samples': 6911616, 'steps': 35997, 'loss/train': 1.7962307929992676} -08/30/2021 19:42:55 - INFO - __main__ - Step 35999: {'lr': 0.0004376750882077658, 'samples': 6911808, 'steps': 35998, 'loss/train': 0.8227716684341431} -08/30/2021 19:42:55 - INFO - __main__ - Step 36000: {'lr': 0.0004376715823027544, 'samples': 6912000, 'steps': 35999, 'loss/train': 0.28827592730522156} -08/30/2021 19:42:56 - INFO - __main__ - Step 36001: {'lr': 0.0004376680763131811, 'samples': 6912192, 'steps': 36000, 'loss/train': 1.0225043296813965} -08/30/2021 19:42:57 - INFO - __main__ - Step 36002: {'lr': 0.0004376645702390475, 'samples': 6912384, 'steps': 36001, 'loss/train': 1.203527569770813} -08/30/2021 19:42:58 - INFO - __main__ - Step 36003: {'lr': 0.00043766106408035506, 'samples': 6912576, 'steps': 36002, 'loss/train': 1.2971988916397095} -08/30/2021 19:42:58 - INFO - __main__ - Step 36004: {'lr': 0.0004376575578371055, 'samples': 6912768, 'steps': 36003, 'loss/train': 1.5095651149749756} -08/30/2021 19:42:58 - INFO - __main__ - Step 36005: {'lr': 0.0004376540515093003, 'samples': 6912960, 'steps': 36004, 'loss/train': 0.9047927260398865} -08/30/2021 19:42:59 - INFO - __main__ - Step 36006: {'lr': 0.0004376505450969411, 'samples': 6913152, 'steps': 36005, 'loss/train': 1.8407281637191772} -08/30/2021 19:42:59 - INFO - __main__ - Step 36007: {'lr': 0.0004376470386000294, 'samples': 6913344, 'steps': 36006, 'loss/train': 1.3397948741912842} -08/30/2021 19:43:01 - INFO - __main__ - Step 36008: {'lr': 0.0004376435320185669, 'samples': 6913536, 'steps': 36007, 'loss/train': 1.3284211158752441} -08/30/2021 19:43:02 - INFO - __main__ - Step 36009: {'lr': 0.0004376400253525551, 'samples': 6913728, 'steps': 36008, 'loss/train': 0.869174063205719} -08/30/2021 19:43:02 - INFO - __main__ - Step 36010: {'lr': 0.0004376365186019956, 'samples': 6913920, 'steps': 36009, 'loss/train': 1.620209813117981} -08/30/2021 19:43:02 - INFO - __main__ - Step 36011: {'lr': 0.00043763301176689, 'samples': 6914112, 'steps': 36010, 'loss/train': 1.8468531370162964} -08/30/2021 19:43:03 - INFO - __main__ - Step 36012: {'lr': 0.0004376295048472399, 'samples': 6914304, 'steps': 36011, 'loss/train': 0.8346722722053528} -08/30/2021 19:43:04 - INFO - __main__ - Step 36013: {'lr': 0.0004376259978430468, 'samples': 6914496, 'steps': 36012, 'loss/train': 1.434913158416748} -08/30/2021 19:43:05 - INFO - __main__ - Step 36014: {'lr': 0.0004376224907543123, 'samples': 6914688, 'steps': 36013, 'loss/train': 0.7564408183097839} -08/30/2021 19:43:05 - INFO - __main__ - Step 36015: {'lr': 0.00043761898358103804, 'samples': 6914880, 'steps': 36014, 'loss/train': 1.110268235206604} -08/30/2021 19:43:05 - INFO - __main__ - Step 36016: {'lr': 0.0004376154763232255, 'samples': 6915072, 'steps': 36015, 'loss/train': 1.2822383642196655} -08/30/2021 19:43:06 - INFO - __main__ - Step 36017: {'lr': 0.0004376119689808764, 'samples': 6915264, 'steps': 36016, 'loss/train': 1.6770011186599731} -08/30/2021 19:43:08 - INFO - __main__ - Step 36018: {'lr': 0.00043760846155399216, 'samples': 6915456, 'steps': 36017, 'loss/train': 0.08690931648015976} -08/30/2021 19:43:08 - INFO - __main__ - Step 36019: {'lr': 0.0004376049540425745, 'samples': 6915648, 'steps': 36018, 'loss/train': 1.2932840585708618} -08/30/2021 19:43:08 - INFO - __main__ - Step 36020: {'lr': 0.0004376014464466249, 'samples': 6915840, 'steps': 36019, 'loss/train': 1.8744899034500122} -08/30/2021 19:43:09 - INFO - __main__ - Step 36021: {'lr': 0.0004375979387661451, 'samples': 6916032, 'steps': 36020, 'loss/train': 1.6647194623947144} -08/30/2021 19:43:09 - INFO - __main__ - Step 36022: {'lr': 0.0004375944310011364, 'samples': 6916224, 'steps': 36021, 'loss/train': 1.9740253686904907} -08/30/2021 19:43:11 - INFO - __main__ - Step 36023: {'lr': 0.00043759092315160064, 'samples': 6916416, 'steps': 36022, 'loss/train': 0.09651821851730347} -08/30/2021 19:43:11 - INFO - __main__ - Step 36024: {'lr': 0.00043758741521753925, 'samples': 6916608, 'steps': 36023, 'loss/train': 1.815151572227478} -08/30/2021 19:43:12 - INFO - __main__ - Step 36025: {'lr': 0.0004375839071989539, 'samples': 6916800, 'steps': 36024, 'loss/train': 1.6136376857757568} -08/30/2021 19:43:12 - INFO - __main__ - Step 36026: {'lr': 0.00043758039909584613, 'samples': 6916992, 'steps': 36025, 'loss/train': 1.468501329421997} -08/30/2021 19:43:12 - INFO - __main__ - Step 36027: {'lr': 0.0004375768909082175, 'samples': 6917184, 'steps': 36026, 'loss/train': 0.10584470629692078} -08/30/2021 19:43:13 - INFO - __main__ - Step 36028: {'lr': 0.0004375733826360697, 'samples': 6917376, 'steps': 36027, 'loss/train': 0.765294075012207} -08/30/2021 19:43:14 - INFO - __main__ - Step 36029: {'lr': 0.0004375698742794042, 'samples': 6917568, 'steps': 36028, 'loss/train': 5.794175148010254} -08/30/2021 19:43:15 - INFO - __main__ - Step 36030: {'lr': 0.0004375663658382225, 'samples': 6917760, 'steps': 36029, 'loss/train': 0.9114642143249512} -08/30/2021 19:43:15 - INFO - __main__ - Step 36031: {'lr': 0.0004375628573125264, 'samples': 6917952, 'steps': 36030, 'loss/train': 1.5143628120422363} -08/30/2021 19:43:15 - INFO - __main__ - Step 36032: {'lr': 0.0004375593487023174, 'samples': 6918144, 'steps': 36031, 'loss/train': 0.9707401990890503} -08/30/2021 19:43:16 - INFO - __main__ - Step 36033: {'lr': 0.00043755584000759696, 'samples': 6918336, 'steps': 36032, 'loss/train': 1.919002890586853} -08/30/2021 19:43:17 - INFO - __main__ - Step 36034: {'lr': 0.0004375523312283668, 'samples': 6918528, 'steps': 36033, 'loss/train': 1.9662377834320068} -08/30/2021 19:43:18 - INFO - __main__ - Step 36035: {'lr': 0.00043754882236462844, 'samples': 6918720, 'steps': 36034, 'loss/train': 1.7322356700897217} -08/30/2021 19:43:18 - INFO - __main__ - Step 36036: {'lr': 0.00043754531341638346, 'samples': 6918912, 'steps': 36035, 'loss/train': 1.3574854135513306} -08/30/2021 19:43:18 - INFO - __main__ - Step 36037: {'lr': 0.00043754180438363344, 'samples': 6919104, 'steps': 36036, 'loss/train': 1.8688459396362305} -08/30/2021 19:43:19 - INFO - __main__ - Step 36038: {'lr': 0.00043753829526638, 'samples': 6919296, 'steps': 36037, 'loss/train': 1.3560893535614014} -08/30/2021 19:43:20 - INFO - __main__ - Step 36039: {'lr': 0.0004375347860646247, 'samples': 6919488, 'steps': 36038, 'loss/train': 1.8518990278244019} -08/30/2021 19:43:21 - INFO - __main__ - Step 36040: {'lr': 0.00043753127677836917, 'samples': 6919680, 'steps': 36039, 'loss/train': 0.848493754863739} -08/30/2021 19:43:21 - INFO - __main__ - Step 36041: {'lr': 0.0004375277674076149, 'samples': 6919872, 'steps': 36040, 'loss/train': 1.4543474912643433} -08/30/2021 19:43:21 - INFO - __main__ - Step 36042: {'lr': 0.0004375242579523635, 'samples': 6920064, 'steps': 36041, 'loss/train': 2.002323627471924} -08/30/2021 19:43:22 - INFO - __main__ - Step 36043: {'lr': 0.0004375207484126166, 'samples': 6920256, 'steps': 36042, 'loss/train': 1.7686681747436523} -08/30/2021 19:43:22 - INFO - __main__ - Step 36044: {'lr': 0.0004375172387883757, 'samples': 6920448, 'steps': 36043, 'loss/train': 2.4521396160125732} -08/30/2021 19:43:24 - INFO - __main__ - Step 36045: {'lr': 0.00043751372907964247, 'samples': 6920640, 'steps': 36044, 'loss/train': 1.3211314678192139} -08/30/2021 19:43:24 - INFO - __main__ - Step 36046: {'lr': 0.00043751021928641845, 'samples': 6920832, 'steps': 36045, 'loss/train': 1.4622420072555542} -08/30/2021 19:43:24 - INFO - __main__ - Step 36047: {'lr': 0.0004375067094087051, 'samples': 6921024, 'steps': 36046, 'loss/train': 1.1819556951522827} -08/30/2021 19:43:25 - INFO - __main__ - Step 36048: {'lr': 0.0004375031994465042, 'samples': 6921216, 'steps': 36047, 'loss/train': 2.2134838104248047} -08/30/2021 19:43:25 - INFO - __main__ - Step 36049: {'lr': 0.00043749968939981734, 'samples': 6921408, 'steps': 36048, 'loss/train': 1.0158450603485107} -08/30/2021 19:43:27 - INFO - __main__ - Step 36050: {'lr': 0.0004374961792686459, 'samples': 6921600, 'steps': 36049, 'loss/train': 2.0458874702453613} -08/30/2021 19:43:27 - INFO - __main__ - Step 36051: {'lr': 0.00043749266905299155, 'samples': 6921792, 'steps': 36050, 'loss/train': 1.354964256286621} -08/30/2021 19:43:27 - INFO - __main__ - Step 36052: {'lr': 0.000437489158752856, 'samples': 6921984, 'steps': 36051, 'loss/train': 1.5432651042938232} -08/30/2021 19:43:28 - INFO - __main__ - Step 36053: {'lr': 0.00043748564836824065, 'samples': 6922176, 'steps': 36052, 'loss/train': 1.6794992685317993} -08/30/2021 19:43:28 - INFO - __main__ - Step 36054: {'lr': 0.0004374821378991473, 'samples': 6922368, 'steps': 36053, 'loss/train': 1.8025633096694946} -08/30/2021 19:43:30 - INFO - __main__ - Step 36055: {'lr': 0.0004374786273455772, 'samples': 6922560, 'steps': 36054, 'loss/train': 1.141648530960083} -08/30/2021 19:43:30 - INFO - __main__ - Step 36056: {'lr': 0.0004374751167075322, 'samples': 6922752, 'steps': 36055, 'loss/train': 1.8451446294784546} -08/30/2021 19:43:30 - INFO - __main__ - Step 36057: {'lr': 0.0004374716059850138, 'samples': 6922944, 'steps': 36056, 'loss/train': 1.531600832939148} -08/30/2021 19:43:31 - INFO - __main__ - Step 36058: {'lr': 0.0004374680951780236, 'samples': 6923136, 'steps': 36057, 'loss/train': 0.5976413488388062} -08/30/2021 19:43:31 - INFO - __main__ - Step 36059: {'lr': 0.00043746458428656324, 'samples': 6923328, 'steps': 36058, 'loss/train': 1.4780911207199097} -08/30/2021 19:43:33 - INFO - __main__ - Step 36060: {'lr': 0.00043746107331063414, 'samples': 6923520, 'steps': 36059, 'loss/train': 1.6300278902053833} -08/30/2021 19:43:33 - INFO - __main__ - Step 36061: {'lr': 0.000437457562250238, 'samples': 6923712, 'steps': 36060, 'loss/train': 0.7864250540733337} -08/30/2021 19:43:33 - INFO - __main__ - Step 36062: {'lr': 0.0004374540511053763, 'samples': 6923904, 'steps': 36061, 'loss/train': 1.363936424255371} -08/30/2021 19:43:34 - INFO - __main__ - Step 36063: {'lr': 0.00043745053987605075, 'samples': 6924096, 'steps': 36062, 'loss/train': 1.2985875606536865} -08/30/2021 19:43:34 - INFO - __main__ - Step 36064: {'lr': 0.00043744702856226295, 'samples': 6924288, 'steps': 36063, 'loss/train': 1.1848994493484497} -08/30/2021 19:43:36 - INFO - __main__ - Step 36065: {'lr': 0.0004374435171640144, 'samples': 6924480, 'steps': 36064, 'loss/train': 1.1395477056503296} -08/30/2021 19:43:37 - INFO - __main__ - Step 36066: {'lr': 0.0004374400056813066, 'samples': 6924672, 'steps': 36065, 'loss/train': 0.05058704689145088} -08/30/2021 19:43:37 - INFO - __main__ - Step 36067: {'lr': 0.0004374364941141413, 'samples': 6924864, 'steps': 36066, 'loss/train': 1.5755720138549805} -08/30/2021 19:43:37 - INFO - __main__ - Step 36068: {'lr': 0.00043743298246251994, 'samples': 6925056, 'steps': 36067, 'loss/train': 1.4239070415496826} -08/30/2021 19:43:38 - INFO - __main__ - Step 36069: {'lr': 0.00043742947072644424, 'samples': 6925248, 'steps': 36068, 'loss/train': 1.3607182502746582} -08/30/2021 19:43:39 - INFO - __main__ - Step 36070: {'lr': 0.0004374259589059157, 'samples': 6925440, 'steps': 36069, 'loss/train': 1.3380931615829468} -08/30/2021 19:43:40 - INFO - __main__ - Step 36071: {'lr': 0.0004374224470009359, 'samples': 6925632, 'steps': 36070, 'loss/train': 1.2803268432617188} -08/30/2021 19:43:40 - INFO - __main__ - Step 36072: {'lr': 0.00043741893501150644, 'samples': 6925824, 'steps': 36071, 'loss/train': 1.140285611152649} -08/30/2021 19:43:40 - INFO - __main__ - Step 36073: {'lr': 0.0004374154229376289, 'samples': 6926016, 'steps': 36072, 'loss/train': 1.416749119758606} -08/30/2021 19:43:41 - INFO - __main__ - Step 36074: {'lr': 0.00043741191077930486, 'samples': 6926208, 'steps': 36073, 'loss/train': 1.8557988405227661} -08/30/2021 19:43:42 - INFO - __main__ - Step 36075: {'lr': 0.00043740839853653594, 'samples': 6926400, 'steps': 36074, 'loss/train': 1.285251498222351} -08/30/2021 19:43:43 - INFO - __main__ - Step 36076: {'lr': 0.0004374048862093236, 'samples': 6926592, 'steps': 36075, 'loss/train': 1.213763952255249} -08/30/2021 19:43:43 - INFO - __main__ - Step 36077: {'lr': 0.00043740137379766954, 'samples': 6926784, 'steps': 36076, 'loss/train': 1.7948158979415894} -08/30/2021 19:43:43 - INFO - __main__ - Step 36078: {'lr': 0.0004373978613015753, 'samples': 6926976, 'steps': 36077, 'loss/train': 1.2927815914154053} -08/30/2021 19:43:44 - INFO - __main__ - Step 36079: {'lr': 0.00043739434872104257, 'samples': 6927168, 'steps': 36078, 'loss/train': 1.382166862487793} -08/30/2021 19:43:45 - INFO - __main__ - Step 36080: {'lr': 0.00043739083605607275, 'samples': 6927360, 'steps': 36079, 'loss/train': 0.3568832278251648} -08/30/2021 19:43:46 - INFO - __main__ - Step 36081: {'lr': 0.0004373873233066676, 'samples': 6927552, 'steps': 36080, 'loss/train': 1.6571969985961914} -08/30/2021 19:43:46 - INFO - __main__ - Step 36082: {'lr': 0.00043738381047282856, 'samples': 6927744, 'steps': 36081, 'loss/train': 1.4800221920013428} -08/30/2021 19:43:46 - INFO - __main__ - Step 36083: {'lr': 0.00043738029755455724, 'samples': 6927936, 'steps': 36082, 'loss/train': 1.482835054397583} -08/30/2021 19:43:47 - INFO - __main__ - Step 36084: {'lr': 0.00043737678455185524, 'samples': 6928128, 'steps': 36083, 'loss/train': 1.1489288806915283} -08/30/2021 19:43:47 - INFO - __main__ - Step 36085: {'lr': 0.0004373732714647242, 'samples': 6928320, 'steps': 36084, 'loss/train': 1.46577787399292} -08/30/2021 19:43:49 - INFO - __main__ - Step 36086: {'lr': 0.0004373697582931657, 'samples': 6928512, 'steps': 36085, 'loss/train': 0.9283316135406494} -08/30/2021 19:43:49 - INFO - __main__ - Step 36087: {'lr': 0.0004373662450371812, 'samples': 6928704, 'steps': 36086, 'loss/train': 1.5501642227172852} -08/30/2021 19:43:49 - INFO - __main__ - Step 36088: {'lr': 0.0004373627316967723, 'samples': 6928896, 'steps': 36087, 'loss/train': 1.4926953315734863} -08/30/2021 19:43:50 - INFO - __main__ - Step 36089: {'lr': 0.0004373592182719408, 'samples': 6929088, 'steps': 36088, 'loss/train': 1.7692233324050903} -08/30/2021 19:43:50 - INFO - __main__ - Step 36090: {'lr': 0.00043735570476268804, 'samples': 6929280, 'steps': 36089, 'loss/train': 0.8793413043022156} -08/30/2021 19:43:52 - INFO - __main__ - Step 36091: {'lr': 0.0004373521911690157, 'samples': 6929472, 'steps': 36090, 'loss/train': 1.1689447164535522} -08/30/2021 19:43:52 - INFO - __main__ - Step 36092: {'lr': 0.00043734867749092534, 'samples': 6929664, 'steps': 36091, 'loss/train': 1.890589952468872} -08/30/2021 19:43:53 - INFO - __main__ - Step 36093: {'lr': 0.0004373451637284186, 'samples': 6929856, 'steps': 36092, 'loss/train': 0.511699914932251} -08/30/2021 19:43:53 - INFO - __main__ - Step 36094: {'lr': 0.0004373416498814969, 'samples': 6930048, 'steps': 36093, 'loss/train': 1.3292160034179688} -08/30/2021 19:43:53 - INFO - __main__ - Step 36095: {'lr': 0.0004373381359501621, 'samples': 6930240, 'steps': 36094, 'loss/train': 1.3810791969299316} -08/30/2021 19:43:54 - INFO - __main__ - Step 36096: {'lr': 0.00043733462193441553, 'samples': 6930432, 'steps': 36095, 'loss/train': 0.6969497799873352} -08/30/2021 19:43:55 - INFO - __main__ - Step 36097: {'lr': 0.00043733110783425894, 'samples': 6930624, 'steps': 36096, 'loss/train': 1.5299763679504395} -08/30/2021 19:43:56 - INFO - __main__ - Step 36098: {'lr': 0.00043732759364969374, 'samples': 6930816, 'steps': 36097, 'loss/train': 1.5626649856567383} -08/30/2021 19:43:56 - INFO - __main__ - Step 36099: {'lr': 0.0004373240793807217, 'samples': 6931008, 'steps': 36098, 'loss/train': 1.3506392240524292} -08/30/2021 19:43:57 - INFO - __main__ - Step 36100: {'lr': 0.00043732056502734435, 'samples': 6931200, 'steps': 36099, 'loss/train': 1.5071520805358887} -08/30/2021 19:43:57 - INFO - __main__ - Step 36101: {'lr': 0.0004373170505895632, 'samples': 6931392, 'steps': 36100, 'loss/train': 0.1549835354089737} -08/30/2021 19:43:58 - INFO - __main__ - Step 36102: {'lr': 0.0004373135360673799, 'samples': 6931584, 'steps': 36101, 'loss/train': 1.5522302389144897} -08/30/2021 19:43:59 - INFO - __main__ - Step 36103: {'lr': 0.000437310021460796, 'samples': 6931776, 'steps': 36102, 'loss/train': 1.450844407081604} -08/30/2021 19:43:59 - INFO - __main__ - Step 36104: {'lr': 0.000437306506769813, 'samples': 6931968, 'steps': 36103, 'loss/train': 1.9918410778045654} -08/30/2021 19:44:00 - INFO - __main__ - Step 36105: {'lr': 0.0004373029919944327, 'samples': 6932160, 'steps': 36104, 'loss/train': 1.6261976957321167} -08/30/2021 19:44:00 - INFO - __main__ - Step 36106: {'lr': 0.00043729947713465653, 'samples': 6932352, 'steps': 36105, 'loss/train': 1.0425323247909546} -08/30/2021 19:44:01 - INFO - __main__ - Step 36107: {'lr': 0.00043729596219048607, 'samples': 6932544, 'steps': 36106, 'loss/train': 1.4196878671646118} -08/30/2021 19:44:02 - INFO - __main__ - Step 36108: {'lr': 0.000437292447161923, 'samples': 6932736, 'steps': 36107, 'loss/train': 1.3793174028396606} -08/30/2021 19:44:02 - INFO - __main__ - Step 36109: {'lr': 0.0004372889320489688, 'samples': 6932928, 'steps': 36108, 'loss/train': 0.8662286996841431} -08/30/2021 19:44:02 - INFO - __main__ - Step 36110: {'lr': 0.00043728541685162503, 'samples': 6933120, 'steps': 36109, 'loss/train': 1.8410738706588745} -08/30/2021 19:44:03 - INFO - __main__ - Step 36111: {'lr': 0.0004372819015698934, 'samples': 6933312, 'steps': 36110, 'loss/train': 0.6522652506828308} -08/30/2021 19:44:04 - INFO - __main__ - Step 36112: {'lr': 0.0004372783862037755, 'samples': 6933504, 'steps': 36111, 'loss/train': 1.6090412139892578} -08/30/2021 19:44:05 - INFO - __main__ - Step 36113: {'lr': 0.00043727487075327285, 'samples': 6933696, 'steps': 36112, 'loss/train': 1.2346184253692627} -08/30/2021 19:44:05 - INFO - __main__ - Step 36114: {'lr': 0.00043727135521838697, 'samples': 6933888, 'steps': 36113, 'loss/train': 1.940293312072754} -08/30/2021 19:44:05 - INFO - __main__ - Step 36115: {'lr': 0.00043726783959911953, 'samples': 6934080, 'steps': 36114, 'loss/train': 1.8155865669250488} -08/30/2021 19:44:06 - INFO - __main__ - Step 36116: {'lr': 0.00043726432389547205, 'samples': 6934272, 'steps': 36115, 'loss/train': 1.8422759771347046} -08/30/2021 19:44:08 - INFO - __main__ - Step 36117: {'lr': 0.00043726080810744616, 'samples': 6934464, 'steps': 36116, 'loss/train': 2.2651312351226807} -08/30/2021 19:44:08 - INFO - __main__ - Step 36118: {'lr': 0.0004372572922350435, 'samples': 6934656, 'steps': 36117, 'loss/train': 1.2567503452301025} -08/30/2021 19:44:09 - INFO - __main__ - Step 36119: {'lr': 0.0004372537762782656, 'samples': 6934848, 'steps': 36118, 'loss/train': 2.4502525329589844} -08/30/2021 19:44:09 - INFO - __main__ - Step 36120: {'lr': 0.00043725026023711395, 'samples': 6935040, 'steps': 36119, 'loss/train': 1.0960851907730103} -08/30/2021 19:44:09 - INFO - __main__ - Step 36121: {'lr': 0.0004372467441115903, 'samples': 6935232, 'steps': 36120, 'loss/train': 0.6183828115463257} -08/30/2021 19:44:11 - INFO - __main__ - Step 36122: {'lr': 0.00043724322790169613, 'samples': 6935424, 'steps': 36121, 'loss/train': 1.1075011491775513} -08/30/2021 19:44:12 - INFO - __main__ - Step 36123: {'lr': 0.00043723971160743305, 'samples': 6935616, 'steps': 36122, 'loss/train': 1.1525518894195557} -08/30/2021 19:44:12 - INFO - __main__ - Step 36124: {'lr': 0.00043723619522880266, 'samples': 6935808, 'steps': 36123, 'loss/train': 2.762505054473877} -08/30/2021 19:44:12 - INFO - __main__ - Step 36125: {'lr': 0.0004372326787658065, 'samples': 6936000, 'steps': 36124, 'loss/train': 1.3858706951141357} -08/30/2021 19:44:13 - INFO - __main__ - Step 36126: {'lr': 0.00043722916221844617, 'samples': 6936192, 'steps': 36125, 'loss/train': 1.8959014415740967} -08/30/2021 19:44:14 - INFO - __main__ - Step 36127: {'lr': 0.0004372256455867233, 'samples': 6936384, 'steps': 36126, 'loss/train': 0.088154137134552} -08/30/2021 19:44:14 - INFO - __main__ - Step 36128: {'lr': 0.0004372221288706394, 'samples': 6936576, 'steps': 36127, 'loss/train': 1.7600674629211426} -08/30/2021 19:44:15 - INFO - __main__ - Step 36129: {'lr': 0.0004372186120701962, 'samples': 6936768, 'steps': 36128, 'loss/train': 1.3942238092422485} -08/30/2021 19:44:15 - INFO - __main__ - Step 36130: {'lr': 0.00043721509518539507, 'samples': 6936960, 'steps': 36129, 'loss/train': 1.1062726974487305} -08/30/2021 19:44:15 - INFO - __main__ - Step 36131: {'lr': 0.0004372115782162378, 'samples': 6937152, 'steps': 36130, 'loss/train': 1.438301682472229} -08/30/2021 19:44:17 - INFO - __main__ - Step 36132: {'lr': 0.00043720806116272584, 'samples': 6937344, 'steps': 36131, 'loss/train': 1.54770028591156} -08/30/2021 19:44:17 - INFO - __main__ - Step 36133: {'lr': 0.00043720454402486076, 'samples': 6937536, 'steps': 36132, 'loss/train': 1.4610021114349365} -08/30/2021 19:44:18 - INFO - __main__ - Step 36134: {'lr': 0.00043720102680264427, 'samples': 6937728, 'steps': 36133, 'loss/train': 1.7238088846206665} -08/30/2021 19:44:18 - INFO - __main__ - Step 36135: {'lr': 0.0004371975094960778, 'samples': 6937920, 'steps': 36134, 'loss/train': 1.848029375076294} -08/30/2021 19:44:18 - INFO - __main__ - Step 36136: {'lr': 0.0004371939921051632, 'samples': 6938112, 'steps': 36135, 'loss/train': 1.175031304359436} -08/30/2021 19:44:19 - INFO - __main__ - Step 36137: {'lr': 0.00043719047462990174, 'samples': 6938304, 'steps': 36136, 'loss/train': 1.9913254976272583} -08/30/2021 19:44:20 - INFO - __main__ - Step 36138: {'lr': 0.0004371869570702952, 'samples': 6938496, 'steps': 36137, 'loss/train': 1.6899923086166382} -08/30/2021 19:44:21 - INFO - __main__ - Step 36139: {'lr': 0.0004371834394263451, 'samples': 6938688, 'steps': 36138, 'loss/train': 1.2530657052993774} -08/30/2021 19:44:21 - INFO - __main__ - Step 36140: {'lr': 0.000437179921698053, 'samples': 6938880, 'steps': 36139, 'loss/train': 1.5722675323486328} -08/30/2021 19:44:21 - INFO - __main__ - Step 36141: {'lr': 0.00043717640388542045, 'samples': 6939072, 'steps': 36140, 'loss/train': 1.606685996055603} -08/30/2021 19:44:22 - INFO - __main__ - Step 36142: {'lr': 0.00043717288598844916, 'samples': 6939264, 'steps': 36141, 'loss/train': 1.9109846353530884} -08/30/2021 19:44:23 - INFO - __main__ - Step 36143: {'lr': 0.0004371693680071407, 'samples': 6939456, 'steps': 36142, 'loss/train': 1.5546871423721313} -08/30/2021 19:44:24 - INFO - __main__ - Step 36144: {'lr': 0.00043716584994149657, 'samples': 6939648, 'steps': 36143, 'loss/train': 1.5325613021850586} -08/30/2021 19:44:24 - INFO - __main__ - Step 36145: {'lr': 0.0004371623317915184, 'samples': 6939840, 'steps': 36144, 'loss/train': 1.2303208112716675} -08/30/2021 19:44:24 - INFO - __main__ - Step 36146: {'lr': 0.00043715881355720776, 'samples': 6940032, 'steps': 36145, 'loss/train': 1.4710524082183838} -08/30/2021 19:44:25 - INFO - __main__ - Step 36147: {'lr': 0.0004371552952385663, 'samples': 6940224, 'steps': 36146, 'loss/train': 1.0660884380340576} -08/30/2021 19:44:26 - INFO - __main__ - Step 36148: {'lr': 0.00043715177683559546, 'samples': 6940416, 'steps': 36147, 'loss/train': 1.469367265701294} -08/30/2021 19:44:27 - INFO - __main__ - Step 36149: {'lr': 0.000437148258348297, 'samples': 6940608, 'steps': 36148, 'loss/train': 1.448828101158142} -08/30/2021 19:44:27 - INFO - __main__ - Step 36150: {'lr': 0.0004371447397766724, 'samples': 6940800, 'steps': 36149, 'loss/train': 1.3521138429641724} -08/30/2021 19:44:27 - INFO - __main__ - Step 36151: {'lr': 0.0004371412211207233, 'samples': 6940992, 'steps': 36150, 'loss/train': 1.6602424383163452} -08/30/2021 19:44:28 - INFO - __main__ - Step 36152: {'lr': 0.0004371377023804512, 'samples': 6941184, 'steps': 36151, 'loss/train': 1.3956000804901123} -08/30/2021 19:44:30 - INFO - __main__ - Step 36153: {'lr': 0.0004371341835558578, 'samples': 6941376, 'steps': 36152, 'loss/train': 1.2133311033248901} -08/30/2021 19:44:30 - INFO - __main__ - Step 36154: {'lr': 0.0004371306646469445, 'samples': 6941568, 'steps': 36153, 'loss/train': 0.9220306873321533} -08/30/2021 19:44:30 - INFO - __main__ - Step 36155: {'lr': 0.00043712714565371315, 'samples': 6941760, 'steps': 36154, 'loss/train': 1.729306697845459} -08/30/2021 19:44:31 - INFO - __main__ - Step 36156: {'lr': 0.0004371236265761651, 'samples': 6941952, 'steps': 36155, 'loss/train': 1.8302483558654785} -08/30/2021 19:44:31 - INFO - __main__ - Step 36157: {'lr': 0.0004371201074143021, 'samples': 6942144, 'steps': 36156, 'loss/train': 1.705064296722412} -08/30/2021 19:44:31 - INFO - __main__ - Step 36158: {'lr': 0.0004371165881681256, 'samples': 6942336, 'steps': 36157, 'loss/train': 1.1303297281265259} -08/30/2021 19:44:33 - INFO - __main__ - Step 36159: {'lr': 0.0004371130688376373, 'samples': 6942528, 'steps': 36158, 'loss/train': 1.4892210960388184} -08/30/2021 19:44:34 - INFO - __main__ - Step 36160: {'lr': 0.00043710954942283875, 'samples': 6942720, 'steps': 36159, 'loss/train': 1.5749467611312866} -08/30/2021 19:44:34 - INFO - __main__ - Step 36161: {'lr': 0.0004371060299237315, 'samples': 6942912, 'steps': 36160, 'loss/train': 1.079881191253662} -08/30/2021 19:44:34 - INFO - __main__ - Step 36162: {'lr': 0.00043710251034031713, 'samples': 6943104, 'steps': 36161, 'loss/train': 1.4332362413406372} -08/30/2021 19:44:35 - INFO - __main__ - Step 36163: {'lr': 0.0004370989906725973, 'samples': 6943296, 'steps': 36162, 'loss/train': 1.3096790313720703} -08/30/2021 19:44:36 - INFO - __main__ - Step 36164: {'lr': 0.00043709547092057356, 'samples': 6943488, 'steps': 36163, 'loss/train': 0.06760528683662415} -08/30/2021 19:44:37 - INFO - __main__ - Step 36165: {'lr': 0.00043709195108424746, 'samples': 6943680, 'steps': 36164, 'loss/train': 1.3607068061828613} -08/30/2021 19:44:37 - INFO - __main__ - Step 36166: {'lr': 0.0004370884311636206, 'samples': 6943872, 'steps': 36165, 'loss/train': 1.660696268081665} -08/30/2021 19:44:37 - INFO - __main__ - Step 36167: {'lr': 0.0004370849111586946, 'samples': 6944064, 'steps': 36166, 'loss/train': 1.7609360218048096} -08/30/2021 19:44:38 - INFO - __main__ - Step 36168: {'lr': 0.000437081391069471, 'samples': 6944256, 'steps': 36167, 'loss/train': 1.4726663827896118} -08/30/2021 19:44:38 - INFO - __main__ - Step 36169: {'lr': 0.0004370778708959514, 'samples': 6944448, 'steps': 36168, 'loss/train': 1.277608036994934} -08/30/2021 19:44:40 - INFO - __main__ - Step 36170: {'lr': 0.00043707435063813747, 'samples': 6944640, 'steps': 36169, 'loss/train': 1.2327027320861816} -08/30/2021 19:44:40 - INFO - __main__ - Step 36171: {'lr': 0.0004370708302960307, 'samples': 6944832, 'steps': 36170, 'loss/train': 0.8638128042221069} -08/30/2021 19:44:40 - INFO - __main__ - Step 36172: {'lr': 0.00043706730986963274, 'samples': 6945024, 'steps': 36171, 'loss/train': 1.5289987325668335} -08/30/2021 19:44:41 - INFO - __main__ - Step 36173: {'lr': 0.0004370637893589451, 'samples': 6945216, 'steps': 36172, 'loss/train': 1.1286712884902954} -08/30/2021 19:44:41 - INFO - __main__ - Step 36174: {'lr': 0.0004370602687639693, 'samples': 6945408, 'steps': 36173, 'loss/train': 1.2298859357833862} -08/30/2021 19:44:43 - INFO - __main__ - Step 36175: {'lr': 0.00043705674808470715, 'samples': 6945600, 'steps': 36174, 'loss/train': 1.3916815519332886} -08/30/2021 19:44:44 - INFO - __main__ - Step 36176: {'lr': 0.00043705322732116007, 'samples': 6945792, 'steps': 36175, 'loss/train': 1.8155173063278198} -08/30/2021 19:44:44 - INFO - __main__ - Step 36177: {'lr': 0.00043704970647332977, 'samples': 6945984, 'steps': 36176, 'loss/train': 1.2930392026901245} -08/30/2021 19:44:44 - INFO - __main__ - Step 36178: {'lr': 0.00043704618554121766, 'samples': 6946176, 'steps': 36177, 'loss/train': 1.5829293727874756} -08/30/2021 19:44:45 - INFO - __main__ - Step 36179: {'lr': 0.0004370426645248254, 'samples': 6946368, 'steps': 36178, 'loss/train': 0.9655218124389648} -08/30/2021 19:44:46 - INFO - __main__ - Step 36180: {'lr': 0.00043703914342415473, 'samples': 6946560, 'steps': 36179, 'loss/train': 1.4457999467849731} -08/30/2021 19:44:47 - INFO - __main__ - Step 36181: {'lr': 0.000437035622239207, 'samples': 6946752, 'steps': 36180, 'loss/train': 1.3025232553482056} -08/30/2021 19:44:47 - INFO - __main__ - Step 36182: {'lr': 0.00043703210096998396, 'samples': 6946944, 'steps': 36181, 'loss/train': 1.5481994152069092} -08/30/2021 19:44:47 - INFO - __main__ - Step 36183: {'lr': 0.00043702857961648713, 'samples': 6947136, 'steps': 36182, 'loss/train': 0.7084340453147888} -08/30/2021 19:44:48 - INFO - __main__ - Step 36184: {'lr': 0.0004370250581787181, 'samples': 6947328, 'steps': 36183, 'loss/train': 1.3375695943832397} -08/30/2021 19:44:49 - INFO - __main__ - Step 36185: {'lr': 0.00043702153665667846, 'samples': 6947520, 'steps': 36184, 'loss/train': 1.5599709749221802} -08/30/2021 19:44:50 - INFO - __main__ - Step 36186: {'lr': 0.0004370180150503698, 'samples': 6947712, 'steps': 36185, 'loss/train': 1.7210819721221924} -08/30/2021 19:44:50 - INFO - __main__ - Step 36187: {'lr': 0.0004370144933597938, 'samples': 6947904, 'steps': 36186, 'loss/train': 0.1739286184310913} -08/30/2021 19:44:51 - INFO - __main__ - Step 36188: {'lr': 0.00043701097158495186, 'samples': 6948096, 'steps': 36187, 'loss/train': 1.976375699043274} -08/30/2021 19:44:51 - INFO - __main__ - Step 36189: {'lr': 0.0004370074497258456, 'samples': 6948288, 'steps': 36188, 'loss/train': 1.0812376737594604} -08/30/2021 19:44:52 - INFO - __main__ - Step 36190: {'lr': 0.00043700392778247676, 'samples': 6948480, 'steps': 36189, 'loss/train': 0.06739005446434021} -08/30/2021 19:44:53 - INFO - __main__ - Step 36191: {'lr': 0.0004370004057548468, 'samples': 6948672, 'steps': 36190, 'loss/train': 1.254050850868225} -08/30/2021 19:44:53 - INFO - __main__ - Step 36192: {'lr': 0.0004369968836429574, 'samples': 6948864, 'steps': 36191, 'loss/train': 1.595575213432312} -08/30/2021 19:44:53 - INFO - __main__ - Step 36193: {'lr': 0.0004369933614468101, 'samples': 6949056, 'steps': 36192, 'loss/train': 1.0041005611419678} -08/30/2021 19:44:54 - INFO - __main__ - Step 36194: {'lr': 0.0004369898391664064, 'samples': 6949248, 'steps': 36193, 'loss/train': 0.678227424621582} -08/30/2021 19:44:54 - INFO - __main__ - Step 36195: {'lr': 0.000436986316801748, 'samples': 6949440, 'steps': 36194, 'loss/train': 1.6307750940322876} -08/30/2021 19:44:56 - INFO - __main__ - Step 36196: {'lr': 0.00043698279435283637, 'samples': 6949632, 'steps': 36195, 'loss/train': 1.4718012809753418} -08/30/2021 19:44:56 - INFO - __main__ - Step 36197: {'lr': 0.0004369792718196733, 'samples': 6949824, 'steps': 36196, 'loss/train': 1.6100915670394897} -08/30/2021 19:44:56 - INFO - __main__ - Step 36198: {'lr': 0.0004369757492022602, 'samples': 6950016, 'steps': 36197, 'loss/train': 0.9444458484649658} -08/30/2021 19:44:57 - INFO - __main__ - Step 36199: {'lr': 0.00043697222650059876, 'samples': 6950208, 'steps': 36198, 'loss/train': 1.5574300289154053} -08/30/2021 19:44:57 - INFO - __main__ - Step 36200: {'lr': 0.00043696870371469045, 'samples': 6950400, 'steps': 36199, 'loss/train': 1.7513478994369507} -08/30/2021 19:44:59 - INFO - __main__ - Step 36201: {'lr': 0.000436965180844537, 'samples': 6950592, 'steps': 36200, 'loss/train': 1.6801937818527222} -08/30/2021 19:44:59 - INFO - __main__ - Step 36202: {'lr': 0.00043696165789013986, 'samples': 6950784, 'steps': 36201, 'loss/train': 1.6791130304336548} -08/30/2021 19:45:00 - INFO - __main__ - Step 36203: {'lr': 0.0004369581348515007, 'samples': 6950976, 'steps': 36202, 'loss/train': 1.7950574159622192} -08/30/2021 19:45:00 - INFO - __main__ - Step 36204: {'lr': 0.00043695461172862113, 'samples': 6951168, 'steps': 36203, 'loss/train': 1.4765222072601318} -08/30/2021 19:45:00 - INFO - __main__ - Step 36205: {'lr': 0.0004369510885215026, 'samples': 6951360, 'steps': 36204, 'loss/train': 1.7500945329666138} -08/30/2021 19:45:02 - INFO - __main__ - Step 36206: {'lr': 0.0004369475652301469, 'samples': 6951552, 'steps': 36205, 'loss/train': 1.255204677581787} -08/30/2021 19:45:02 - INFO - __main__ - Step 36207: {'lr': 0.0004369440418545555, 'samples': 6951744, 'steps': 36206, 'loss/train': 1.4784289598464966} -08/30/2021 19:45:03 - INFO - __main__ - Step 36208: {'lr': 0.00043694051839472995, 'samples': 6951936, 'steps': 36207, 'loss/train': 1.869343638420105} -08/30/2021 19:45:03 - INFO - __main__ - Step 36209: {'lr': 0.00043693699485067186, 'samples': 6952128, 'steps': 36208, 'loss/train': 1.2865989208221436} -08/30/2021 19:45:03 - INFO - __main__ - Step 36210: {'lr': 0.0004369334712223829, 'samples': 6952320, 'steps': 36209, 'loss/train': 1.4650505781173706} -08/30/2021 19:45:05 - INFO - __main__ - Step 36211: {'lr': 0.0004369299475098646, 'samples': 6952512, 'steps': 36210, 'loss/train': 1.2392257452011108} -08/30/2021 19:45:05 - INFO - __main__ - Step 36212: {'lr': 0.00043692642371311854, 'samples': 6952704, 'steps': 36211, 'loss/train': 1.435381531715393} -08/30/2021 19:45:06 - INFO - __main__ - Step 36213: {'lr': 0.00043692289983214626, 'samples': 6952896, 'steps': 36212, 'loss/train': 1.03143310546875} -08/30/2021 19:45:06 - INFO - __main__ - Step 36214: {'lr': 0.0004369193758669495, 'samples': 6953088, 'steps': 36213, 'loss/train': 1.5595673322677612} -08/30/2021 19:45:06 - INFO - __main__ - Step 36215: {'lr': 0.0004369158518175297, 'samples': 6953280, 'steps': 36214, 'loss/train': 1.5154434442520142} -08/30/2021 19:45:07 - INFO - __main__ - Step 36216: {'lr': 0.00043691232768388856, 'samples': 6953472, 'steps': 36215, 'loss/train': 1.42335045337677} -08/30/2021 19:45:09 - INFO - __main__ - Step 36217: {'lr': 0.00043690880346602755, 'samples': 6953664, 'steps': 36216, 'loss/train': 1.2866326570510864} -08/30/2021 19:45:09 - INFO - __main__ - Step 36218: {'lr': 0.0004369052791639483, 'samples': 6953856, 'steps': 36217, 'loss/train': 1.5749741792678833} -08/30/2021 19:45:09 - INFO - __main__ - Step 36219: {'lr': 0.0004369017547776525, 'samples': 6954048, 'steps': 36218, 'loss/train': 1.0419127941131592} -08/30/2021 19:45:10 - INFO - __main__ - Step 36220: {'lr': 0.0004368982303071416, 'samples': 6954240, 'steps': 36219, 'loss/train': 0.9410125613212585} -08/30/2021 19:45:10 - INFO - __main__ - Step 36221: {'lr': 0.0004368947057524173, 'samples': 6954432, 'steps': 36220, 'loss/train': 0.1284305900335312} -08/30/2021 19:45:12 - INFO - __main__ - Step 36222: {'lr': 0.00043689118111348105, 'samples': 6954624, 'steps': 36221, 'loss/train': 1.5536609888076782} -08/30/2021 19:45:12 - INFO - __main__ - Step 36223: {'lr': 0.00043688765639033456, 'samples': 6954816, 'steps': 36222, 'loss/train': 0.5226022005081177} -08/30/2021 19:45:12 - INFO - __main__ - Step 36224: {'lr': 0.00043688413158297934, 'samples': 6955008, 'steps': 36223, 'loss/train': 1.2744625806808472} -08/30/2021 19:45:13 - INFO - __main__ - Step 36225: {'lr': 0.00043688060669141705, 'samples': 6955200, 'steps': 36224, 'loss/train': 1.3792767524719238} -08/30/2021 19:45:13 - INFO - __main__ - Step 36226: {'lr': 0.00043687708171564923, 'samples': 6955392, 'steps': 36225, 'loss/train': 1.159806489944458} -08/30/2021 19:45:15 - INFO - __main__ - Step 36227: {'lr': 0.00043687355665567745, 'samples': 6955584, 'steps': 36226, 'loss/train': 1.1828851699829102} -08/30/2021 19:45:16 - INFO - __main__ - Step 36228: {'lr': 0.0004368700315115034, 'samples': 6955776, 'steps': 36227, 'loss/train': 1.8451720476150513} -08/30/2021 19:45:16 - INFO - __main__ - Step 36229: {'lr': 0.00043686650628312854, 'samples': 6955968, 'steps': 36228, 'loss/train': 1.1378953456878662} -08/30/2021 19:45:16 - INFO - __main__ - Step 36230: {'lr': 0.00043686298097055456, 'samples': 6956160, 'steps': 36229, 'loss/train': 1.9758963584899902} -08/30/2021 19:45:17 - INFO - __main__ - Step 36231: {'lr': 0.0004368594555737829, 'samples': 6956352, 'steps': 36230, 'loss/train': 1.3730993270874023} -08/30/2021 19:45:18 - INFO - __main__ - Step 36232: {'lr': 0.0004368559300928153, 'samples': 6956544, 'steps': 36231, 'loss/train': 1.512043833732605} -08/30/2021 19:45:19 - INFO - __main__ - Step 36233: {'lr': 0.0004368524045276534, 'samples': 6956736, 'steps': 36232, 'loss/train': 1.282394289970398} -08/30/2021 19:45:19 - INFO - __main__ - Step 36234: {'lr': 0.00043684887887829863, 'samples': 6956928, 'steps': 36233, 'loss/train': 2.2907588481903076} -08/30/2021 19:45:19 - INFO - __main__ - Step 36235: {'lr': 0.0004368453531447526, 'samples': 6957120, 'steps': 36234, 'loss/train': 1.3599456548690796} -08/30/2021 19:45:20 - INFO - __main__ - Step 36236: {'lr': 0.00043684182732701694, 'samples': 6957312, 'steps': 36235, 'loss/train': 1.5863093137741089} -08/30/2021 19:45:21 - INFO - __main__ - Step 36237: {'lr': 0.00043683830142509327, 'samples': 6957504, 'steps': 36236, 'loss/train': 1.5000536441802979} -08/30/2021 19:45:22 - INFO - __main__ - Step 36238: {'lr': 0.00043683477543898314, 'samples': 6957696, 'steps': 36237, 'loss/train': 1.005483627319336} -08/30/2021 19:45:22 - INFO - __main__ - Step 36239: {'lr': 0.0004368312493686881, 'samples': 6957888, 'steps': 36238, 'loss/train': 0.786897599697113} -08/30/2021 19:45:23 - INFO - __main__ - Step 36240: {'lr': 0.0004368277232142098, 'samples': 6958080, 'steps': 36239, 'loss/train': 1.2815017700195312} -08/30/2021 19:45:23 - INFO - __main__ - Step 36241: {'lr': 0.00043682419697554985, 'samples': 6958272, 'steps': 36240, 'loss/train': 0.2626532316207886} -08/30/2021 19:45:25 - INFO - __main__ - Step 36242: {'lr': 0.0004368206706527098, 'samples': 6958464, 'steps': 36241, 'loss/train': 1.5950918197631836} -08/30/2021 19:45:26 - INFO - __main__ - Step 36243: {'lr': 0.00043681714424569117, 'samples': 6958656, 'steps': 36242, 'loss/train': 0.9098647832870483} -08/30/2021 19:45:26 - INFO - __main__ - Step 36244: {'lr': 0.0004368136177544957, 'samples': 6958848, 'steps': 36243, 'loss/train': 1.3512158393859863} -08/30/2021 19:45:26 - INFO - __main__ - Step 36245: {'lr': 0.00043681009117912484, 'samples': 6959040, 'steps': 36244, 'loss/train': 1.772580862045288} -08/30/2021 19:45:27 - INFO - __main__ - Step 36246: {'lr': 0.0004368065645195803, 'samples': 6959232, 'steps': 36245, 'loss/train': 1.6935904026031494} -08/30/2021 19:45:27 - INFO - __main__ - Step 36247: {'lr': 0.0004368030377758636, 'samples': 6959424, 'steps': 36246, 'loss/train': 1.2961620092391968} -08/30/2021 19:45:27 - INFO - __main__ - Step 36248: {'lr': 0.0004367995109479763, 'samples': 6959616, 'steps': 36247, 'loss/train': 1.5124505758285522} -08/30/2021 19:45:29 - INFO - __main__ - Step 36249: {'lr': 0.00043679598403592, 'samples': 6959808, 'steps': 36248, 'loss/train': 0.9172031283378601} -08/30/2021 19:45:29 - INFO - __main__ - Step 36250: {'lr': 0.00043679245703969627, 'samples': 6960000, 'steps': 36249, 'loss/train': 1.30707848072052} -08/30/2021 19:45:30 - INFO - __main__ - Step 36251: {'lr': 0.00043678892995930685, 'samples': 6960192, 'steps': 36250, 'loss/train': 1.4898329973220825} -08/30/2021 19:45:30 - INFO - __main__ - Step 36252: {'lr': 0.00043678540279475314, 'samples': 6960384, 'steps': 36251, 'loss/train': 1.596374750137329} -08/30/2021 19:45:30 - INFO - __main__ - Step 36253: {'lr': 0.0004367818755460369, 'samples': 6960576, 'steps': 36252, 'loss/train': 0.13209521770477295} -08/30/2021 19:45:32 - INFO - __main__ - Step 36254: {'lr': 0.00043677834821315956, 'samples': 6960768, 'steps': 36253, 'loss/train': 1.007800579071045} -08/30/2021 19:45:32 - INFO - __main__ - Step 36255: {'lr': 0.00043677482079612276, 'samples': 6960960, 'steps': 36254, 'loss/train': 1.576393961906433} -08/30/2021 19:45:33 - INFO - __main__ - Step 36256: {'lr': 0.00043677129329492814, 'samples': 6961152, 'steps': 36255, 'loss/train': 1.7132619619369507} -08/30/2021 19:45:33 - INFO - __main__ - Step 36257: {'lr': 0.00043676776570957725, 'samples': 6961344, 'steps': 36256, 'loss/train': 1.5446170568466187} -08/30/2021 19:45:33 - INFO - __main__ - Step 36258: {'lr': 0.0004367642380400717, 'samples': 6961536, 'steps': 36257, 'loss/train': 1.608413815498352} -08/30/2021 19:45:34 - INFO - __main__ - Step 36259: {'lr': 0.0004367607102864131, 'samples': 6961728, 'steps': 36258, 'loss/train': 1.252132534980774} -08/30/2021 19:45:35 - INFO - __main__ - Step 36260: {'lr': 0.00043675718244860296, 'samples': 6961920, 'steps': 36259, 'loss/train': 2.2234764099121094} -08/30/2021 19:45:36 - INFO - __main__ - Step 36261: {'lr': 0.00043675365452664286, 'samples': 6962112, 'steps': 36260, 'loss/train': 1.8667486906051636} -08/30/2021 19:45:36 - INFO - __main__ - Step 36262: {'lr': 0.0004367501265205345, 'samples': 6962304, 'steps': 36261, 'loss/train': 1.3845876455307007} -08/30/2021 19:45:36 - INFO - __main__ - Step 36263: {'lr': 0.0004367465984302794, 'samples': 6962496, 'steps': 36262, 'loss/train': 1.7512222528457642} -08/30/2021 19:45:37 - INFO - __main__ - Step 36264: {'lr': 0.0004367430702558792, 'samples': 6962688, 'steps': 36263, 'loss/train': 1.561260461807251} -08/30/2021 19:45:39 - INFO - __main__ - Step 36265: {'lr': 0.0004367395419973355, 'samples': 6962880, 'steps': 36264, 'loss/train': 1.352837324142456} -08/30/2021 19:45:39 - INFO - __main__ - Step 36266: {'lr': 0.00043673601365464975, 'samples': 6963072, 'steps': 36265, 'loss/train': 1.7692322731018066} -08/30/2021 19:45:39 - INFO - __main__ - Step 36267: {'lr': 0.00043673248522782364, 'samples': 6963264, 'steps': 36266, 'loss/train': 1.645789623260498} -08/30/2021 19:45:40 - INFO - __main__ - Step 36268: {'lr': 0.0004367289567168588, 'samples': 6963456, 'steps': 36267, 'loss/train': 0.10028726607561111} -08/30/2021 19:45:40 - INFO - __main__ - Step 36269: {'lr': 0.00043672542812175675, 'samples': 6963648, 'steps': 36268, 'loss/train': 0.47563982009887695} -08/30/2021 19:45:40 - INFO - __main__ - Step 36270: {'lr': 0.00043672189944251905, 'samples': 6963840, 'steps': 36269, 'loss/train': 1.2824796438217163} -08/30/2021 19:45:42 - INFO - __main__ - Step 36271: {'lr': 0.0004367183706791474, 'samples': 6964032, 'steps': 36270, 'loss/train': 1.4002498388290405} -08/30/2021 19:45:43 - INFO - __main__ - Step 36272: {'lr': 0.0004367148418316434, 'samples': 6964224, 'steps': 36271, 'loss/train': 1.5807998180389404} -08/30/2021 19:45:43 - INFO - __main__ - Step 36273: {'lr': 0.0004367113129000085, 'samples': 6964416, 'steps': 36272, 'loss/train': 1.772133708000183} -08/30/2021 19:45:43 - INFO - __main__ - Step 36274: {'lr': 0.00043670778388424434, 'samples': 6964608, 'steps': 36273, 'loss/train': 1.4267396926879883} -08/30/2021 19:45:44 - INFO - __main__ - Step 36275: {'lr': 0.00043670425478435263, 'samples': 6964800, 'steps': 36274, 'loss/train': 1.4207713603973389} -08/30/2021 19:45:45 - INFO - __main__ - Step 36276: {'lr': 0.00043670072560033474, 'samples': 6964992, 'steps': 36275, 'loss/train': 1.940977931022644} -08/30/2021 19:45:46 - INFO - __main__ - Step 36277: {'lr': 0.00043669719633219247, 'samples': 6965184, 'steps': 36276, 'loss/train': 1.104358434677124} -08/30/2021 19:45:46 - INFO - __main__ - Step 36278: {'lr': 0.0004366936669799273, 'samples': 6965376, 'steps': 36277, 'loss/train': 1.3936634063720703} -08/30/2021 19:45:46 - INFO - __main__ - Step 36279: {'lr': 0.0004366901375435408, 'samples': 6965568, 'steps': 36278, 'loss/train': 0.5173631310462952} -08/30/2021 19:45:47 - INFO - __main__ - Step 36280: {'lr': 0.0004366866080230347, 'samples': 6965760, 'steps': 36279, 'loss/train': 1.362754464149475} -08/30/2021 19:45:49 - INFO - __main__ - Step 36281: {'lr': 0.0004366830784184104, 'samples': 6965952, 'steps': 36280, 'loss/train': 0.9476340413093567} -08/30/2021 19:45:49 - INFO - __main__ - Step 36282: {'lr': 0.00043667954872966965, 'samples': 6966144, 'steps': 36281, 'loss/train': 1.6118483543395996} -08/30/2021 19:45:49 - INFO - __main__ - Step 36283: {'lr': 0.000436676018956814, 'samples': 6966336, 'steps': 36282, 'loss/train': 1.2911791801452637} -08/30/2021 19:45:50 - INFO - __main__ - Step 36284: {'lr': 0.0004366724890998449, 'samples': 6966528, 'steps': 36283, 'loss/train': 1.72792649269104} -08/30/2021 19:45:50 - INFO - __main__ - Step 36285: {'lr': 0.00043666895915876416, 'samples': 6966720, 'steps': 36284, 'loss/train': 1.0139909982681274} -08/30/2021 19:45:51 - INFO - __main__ - Step 36286: {'lr': 0.0004366654291335732, 'samples': 6966912, 'steps': 36285, 'loss/train': 2.0946671962738037} -08/30/2021 19:45:52 - INFO - __main__ - Step 36287: {'lr': 0.00043666189902427367, 'samples': 6967104, 'steps': 36286, 'loss/train': 1.5928480625152588} -08/30/2021 19:45:52 - INFO - __main__ - Step 36288: {'lr': 0.00043665836883086725, 'samples': 6967296, 'steps': 36287, 'loss/train': 1.501845359802246} -08/30/2021 19:45:53 - INFO - __main__ - Step 36289: {'lr': 0.0004366548385533554, 'samples': 6967488, 'steps': 36288, 'loss/train': 1.6620104312896729} -08/30/2021 19:45:53 - INFO - __main__ - Step 36290: {'lr': 0.0004366513081917398, 'samples': 6967680, 'steps': 36289, 'loss/train': 1.5876080989837646} -08/30/2021 19:45:54 - INFO - __main__ - Step 36291: {'lr': 0.00043664777774602196, 'samples': 6967872, 'steps': 36290, 'loss/train': 1.1251871585845947} -08/30/2021 19:45:55 - INFO - __main__ - Step 36292: {'lr': 0.00043664424721620354, 'samples': 6968064, 'steps': 36291, 'loss/train': 1.3264949321746826} -08/30/2021 19:45:55 - INFO - __main__ - Step 36293: {'lr': 0.00043664071660228605, 'samples': 6968256, 'steps': 36292, 'loss/train': 1.2746326923370361} -08/30/2021 19:45:56 - INFO - __main__ - Step 36294: {'lr': 0.00043663718590427117, 'samples': 6968448, 'steps': 36293, 'loss/train': 1.3966554403305054} -08/30/2021 19:45:56 - INFO - __main__ - Step 36295: {'lr': 0.0004366336551221605, 'samples': 6968640, 'steps': 36294, 'loss/train': 1.408300757408142} -08/30/2021 19:45:56 - INFO - __main__ - Step 36296: {'lr': 0.0004366301242559555, 'samples': 6968832, 'steps': 36295, 'loss/train': 1.7586427927017212} -08/30/2021 19:45:59 - INFO - __main__ - Step 36297: {'lr': 0.00043662659330565793, 'samples': 6969024, 'steps': 36296, 'loss/train': 0.875842273235321} -08/30/2021 19:45:59 - INFO - __main__ - Step 36298: {'lr': 0.00043662306227126917, 'samples': 6969216, 'steps': 36297, 'loss/train': 0.8898364305496216} -08/30/2021 19:45:59 - INFO - __main__ - Step 36299: {'lr': 0.00043661953115279104, 'samples': 6969408, 'steps': 36298, 'loss/train': 1.5504984855651855} -08/30/2021 19:46:00 - INFO - __main__ - Step 36300: {'lr': 0.000436615999950225, 'samples': 6969600, 'steps': 36299, 'loss/train': 0.1926325410604477} -08/30/2021 19:46:00 - INFO - __main__ - Step 36301: {'lr': 0.0004366124686635727, 'samples': 6969792, 'steps': 36300, 'loss/train': 2.0592730045318604} -08/30/2021 19:46:02 - INFO - __main__ - Step 36302: {'lr': 0.00043660893729283564, 'samples': 6969984, 'steps': 36301, 'loss/train': 1.6141204833984375} -08/30/2021 19:46:02 - INFO - __main__ - Step 36303: {'lr': 0.0004366054058380155, 'samples': 6970176, 'steps': 36302, 'loss/train': 1.7512975931167603} -08/30/2021 19:46:02 - INFO - __main__ - Step 36304: {'lr': 0.0004366018742991139, 'samples': 6970368, 'steps': 36303, 'loss/train': 0.26098498702049255} -08/30/2021 19:46:03 - INFO - __main__ - Step 36305: {'lr': 0.00043659834267613227, 'samples': 6970560, 'steps': 36304, 'loss/train': 1.9825482368469238} -08/30/2021 19:46:03 - INFO - __main__ - Step 36306: {'lr': 0.0004365948109690724, 'samples': 6970752, 'steps': 36305, 'loss/train': 1.3607426881790161} -08/30/2021 19:46:05 - INFO - __main__ - Step 36307: {'lr': 0.0004365912791779357, 'samples': 6970944, 'steps': 36306, 'loss/train': 1.9683040380477905} -08/30/2021 19:46:05 - INFO - __main__ - Step 36308: {'lr': 0.00043658774730272393, 'samples': 6971136, 'steps': 36307, 'loss/train': 1.0265824794769287} -08/30/2021 19:46:05 - INFO - __main__ - Step 36309: {'lr': 0.00043658421534343856, 'samples': 6971328, 'steps': 36308, 'loss/train': 1.1142578125} -08/30/2021 19:46:06 - INFO - __main__ - Step 36310: {'lr': 0.0004365806833000813, 'samples': 6971520, 'steps': 36309, 'loss/train': 1.6549283266067505} -08/30/2021 19:46:06 - INFO - __main__ - Step 36311: {'lr': 0.0004365771511726535, 'samples': 6971712, 'steps': 36310, 'loss/train': 1.6925839185714722} -08/30/2021 19:46:08 - INFO - __main__ - Step 36312: {'lr': 0.00043657361896115706, 'samples': 6971904, 'steps': 36311, 'loss/train': 1.011309266090393} -08/30/2021 19:46:08 - INFO - __main__ - Step 36313: {'lr': 0.0004365700866655934, 'samples': 6972096, 'steps': 36312, 'loss/train': 1.3822884559631348} -08/30/2021 19:46:09 - INFO - __main__ - Step 36314: {'lr': 0.00043656655428596407, 'samples': 6972288, 'steps': 36313, 'loss/train': 1.634024977684021} -08/30/2021 19:46:09 - INFO - __main__ - Step 36315: {'lr': 0.0004365630218222708, 'samples': 6972480, 'steps': 36314, 'loss/train': 1.1251134872436523} -08/30/2021 19:46:09 - INFO - __main__ - Step 36316: {'lr': 0.00043655948927451505, 'samples': 6972672, 'steps': 36315, 'loss/train': 1.1436549425125122} -08/30/2021 19:46:10 - INFO - __main__ - Step 36317: {'lr': 0.0004365559566426985, 'samples': 6972864, 'steps': 36316, 'loss/train': 0.9091794490814209} -08/30/2021 19:46:11 - INFO - __main__ - Step 36318: {'lr': 0.0004365524239268227, 'samples': 6973056, 'steps': 36317, 'loss/train': 1.8467167615890503} -08/30/2021 19:46:12 - INFO - __main__ - Step 36319: {'lr': 0.00043654889112688933, 'samples': 6973248, 'steps': 36318, 'loss/train': 1.1432421207427979} -08/30/2021 19:46:12 - INFO - __main__ - Step 36320: {'lr': 0.00043654535824289985, 'samples': 6973440, 'steps': 36319, 'loss/train': 1.821355938911438} -08/30/2021 19:46:12 - INFO - __main__ - Step 36321: {'lr': 0.0004365418252748559, 'samples': 6973632, 'steps': 36320, 'loss/train': 0.08417873829603195} -08/30/2021 19:46:13 - INFO - __main__ - Step 36322: {'lr': 0.0004365382922227591, 'samples': 6973824, 'steps': 36321, 'loss/train': 1.5863474607467651} -08/30/2021 19:46:14 - INFO - __main__ - Step 36323: {'lr': 0.000436534759086611, 'samples': 6974016, 'steps': 36322, 'loss/train': 0.971802830696106} -08/30/2021 19:46:15 - INFO - __main__ - Step 36324: {'lr': 0.00043653122586641323, 'samples': 6974208, 'steps': 36323, 'loss/train': 1.5479087829589844} -08/30/2021 19:46:15 - INFO - __main__ - Step 36325: {'lr': 0.0004365276925621674, 'samples': 6974400, 'steps': 36324, 'loss/train': 1.3704218864440918} -08/30/2021 19:46:16 - INFO - __main__ - Step 36326: {'lr': 0.0004365241591738751, 'samples': 6974592, 'steps': 36325, 'loss/train': 1.4487746953964233} -08/30/2021 19:46:16 - INFO - __main__ - Step 36327: {'lr': 0.0004365206257015378, 'samples': 6974784, 'steps': 36326, 'loss/train': 0.9230908751487732} -08/30/2021 19:46:18 - INFO - __main__ - Step 36328: {'lr': 0.0004365170921451572, 'samples': 6974976, 'steps': 36327, 'loss/train': 2.0408403873443604} -08/30/2021 19:46:18 - INFO - __main__ - Step 36329: {'lr': 0.00043651355850473495, 'samples': 6975168, 'steps': 36328, 'loss/train': 0.9604093432426453} -08/30/2021 19:46:18 - INFO - __main__ - Step 36330: {'lr': 0.0004365100247802725, 'samples': 6975360, 'steps': 36329, 'loss/train': 5.837498188018799} -08/30/2021 19:46:19 - INFO - __main__ - Step 36331: {'lr': 0.0004365064909717715, 'samples': 6975552, 'steps': 36330, 'loss/train': 1.7468425035476685} -08/30/2021 19:46:19 - INFO - __main__ - Step 36332: {'lr': 0.0004365029570792336, 'samples': 6975744, 'steps': 36331, 'loss/train': 1.1854568719863892} -08/30/2021 19:46:19 - INFO - __main__ - Step 36333: {'lr': 0.00043649942310266035, 'samples': 6975936, 'steps': 36332, 'loss/train': 1.463685393333435} -08/30/2021 19:46:21 - INFO - __main__ - Step 36334: {'lr': 0.00043649588904205326, 'samples': 6976128, 'steps': 36333, 'loss/train': 1.4908409118652344} -08/30/2021 19:46:21 - INFO - __main__ - Step 36335: {'lr': 0.0004364923548974141, 'samples': 6976320, 'steps': 36334, 'loss/train': 1.406709909439087} -08/30/2021 19:46:22 - INFO - __main__ - Step 36336: {'lr': 0.0004364888206687443, 'samples': 6976512, 'steps': 36335, 'loss/train': 1.4437986612319946} -08/30/2021 19:46:22 - INFO - __main__ - Step 36337: {'lr': 0.00043648528635604556, 'samples': 6976704, 'steps': 36336, 'loss/train': 1.535369634628296} -08/30/2021 19:46:22 - INFO - __main__ - Step 36338: {'lr': 0.00043648175195931937, 'samples': 6976896, 'steps': 36337, 'loss/train': 1.943576693534851} -08/30/2021 19:46:24 - INFO - __main__ - Step 36339: {'lr': 0.0004364782174785674, 'samples': 6977088, 'steps': 36338, 'loss/train': 1.0343637466430664} -08/30/2021 19:46:25 - INFO - __main__ - Step 36340: {'lr': 0.0004364746829137912, 'samples': 6977280, 'steps': 36339, 'loss/train': 1.1846541166305542} -08/30/2021 19:46:25 - INFO - __main__ - Step 36341: {'lr': 0.0004364711482649925, 'samples': 6977472, 'steps': 36340, 'loss/train': 1.517400860786438} -08/30/2021 19:46:26 - INFO - __main__ - Step 36342: {'lr': 0.00043646761353217266, 'samples': 6977664, 'steps': 36341, 'loss/train': 1.5300853252410889} -08/30/2021 19:46:26 - INFO - __main__ - Step 36343: {'lr': 0.0004364640787153334, 'samples': 6977856, 'steps': 36342, 'loss/train': 0.7770493626594543} -08/30/2021 19:46:27 - INFO - __main__ - Step 36344: {'lr': 0.0004364605438144764, 'samples': 6978048, 'steps': 36343, 'loss/train': 0.9535834789276123} -08/30/2021 19:46:28 - INFO - __main__ - Step 36345: {'lr': 0.000436457008829603, 'samples': 6978240, 'steps': 36344, 'loss/train': 1.6743377447128296} -08/30/2021 19:46:28 - INFO - __main__ - Step 36346: {'lr': 0.00043645347376071507, 'samples': 6978432, 'steps': 36345, 'loss/train': 1.1523141860961914} -08/30/2021 19:46:29 - INFO - __main__ - Step 36347: {'lr': 0.0004364499386078141, 'samples': 6978624, 'steps': 36346, 'loss/train': 1.6288502216339111} -08/30/2021 19:46:29 - INFO - __main__ - Step 36348: {'lr': 0.00043644640337090157, 'samples': 6978816, 'steps': 36347, 'loss/train': 1.502032995223999} -08/30/2021 19:46:29 - INFO - __main__ - Step 36349: {'lr': 0.0004364428680499792, 'samples': 6979008, 'steps': 36348, 'loss/train': 1.5496554374694824} -08/30/2021 19:46:31 - INFO - __main__ - Step 36350: {'lr': 0.0004364393326450486, 'samples': 6979200, 'steps': 36349, 'loss/train': 1.6158000230789185} -08/30/2021 19:46:31 - INFO - __main__ - Step 36351: {'lr': 0.00043643579715611124, 'samples': 6979392, 'steps': 36350, 'loss/train': 2.336977005004883} -08/30/2021 19:46:32 - INFO - __main__ - Step 36352: {'lr': 0.00043643226158316886, 'samples': 6979584, 'steps': 36351, 'loss/train': 2.0129332542419434} -08/30/2021 19:46:32 - INFO - __main__ - Step 36353: {'lr': 0.00043642872592622293, 'samples': 6979776, 'steps': 36352, 'loss/train': 1.4041097164154053} -08/30/2021 19:46:32 - INFO - __main__ - Step 36354: {'lr': 0.0004364251901852751, 'samples': 6979968, 'steps': 36353, 'loss/train': 0.8781626224517822} -08/30/2021 19:46:34 - INFO - __main__ - Step 36355: {'lr': 0.000436421654360327, 'samples': 6980160, 'steps': 36354, 'loss/train': 1.2388808727264404} -08/30/2021 19:46:34 - INFO - __main__ - Step 36356: {'lr': 0.00043641811845138016, 'samples': 6980352, 'steps': 36355, 'loss/train': 2.17956280708313} -08/30/2021 19:46:35 - INFO - __main__ - Step 36357: {'lr': 0.0004364145824584361, 'samples': 6980544, 'steps': 36356, 'loss/train': 1.1740961074829102} -08/30/2021 19:46:35 - INFO - __main__ - Step 36358: {'lr': 0.00043641104638149656, 'samples': 6980736, 'steps': 36357, 'loss/train': 1.27120041847229} -08/30/2021 19:46:35 - INFO - __main__ - Step 36359: {'lr': 0.00043640751022056316, 'samples': 6980928, 'steps': 36358, 'loss/train': 1.6762738227844238} -08/30/2021 19:46:37 - INFO - __main__ - Step 36360: {'lr': 0.00043640397397563737, 'samples': 6981120, 'steps': 36359, 'loss/train': 1.1005442142486572} -08/30/2021 19:46:37 - INFO - __main__ - Step 36361: {'lr': 0.00043640043764672077, 'samples': 6981312, 'steps': 36360, 'loss/train': 1.5166518688201904} -08/30/2021 19:46:38 - INFO - __main__ - Step 36362: {'lr': 0.00043639690123381503, 'samples': 6981504, 'steps': 36361, 'loss/train': 1.233532190322876} -08/30/2021 19:46:38 - INFO - __main__ - Step 36363: {'lr': 0.00043639336473692174, 'samples': 6981696, 'steps': 36362, 'loss/train': 1.1842894554138184} -08/30/2021 19:46:38 - INFO - __main__ - Step 36364: {'lr': 0.00043638982815604247, 'samples': 6981888, 'steps': 36363, 'loss/train': 1.7364468574523926} -08/30/2021 19:46:39 - INFO - __main__ - Step 36365: {'lr': 0.00043638629149117883, 'samples': 6982080, 'steps': 36364, 'loss/train': 1.4133139848709106} -08/30/2021 19:46:40 - INFO - __main__ - Step 36366: {'lr': 0.0004363827547423324, 'samples': 6982272, 'steps': 36365, 'loss/train': 1.4663580656051636} -08/30/2021 19:46:41 - INFO - __main__ - Step 36367: {'lr': 0.00043637921790950476, 'samples': 6982464, 'steps': 36366, 'loss/train': 0.044430457055568695} -08/30/2021 19:46:41 - INFO - __main__ - Step 36368: {'lr': 0.00043637568099269753, 'samples': 6982656, 'steps': 36367, 'loss/train': 1.4652724266052246} -08/30/2021 19:46:41 - INFO - __main__ - Step 36369: {'lr': 0.00043637214399191234, 'samples': 6982848, 'steps': 36368, 'loss/train': 1.1841883659362793} -08/30/2021 19:46:42 - INFO - __main__ - Step 36370: {'lr': 0.00043636860690715064, 'samples': 6983040, 'steps': 36369, 'loss/train': 1.732420802116394} -08/30/2021 19:46:43 - INFO - __main__ - Step 36371: {'lr': 0.00043636506973841424, 'samples': 6983232, 'steps': 36370, 'loss/train': 1.3470722436904907} -08/30/2021 19:46:44 - INFO - __main__ - Step 36372: {'lr': 0.00043636153248570453, 'samples': 6983424, 'steps': 36371, 'loss/train': 0.8544849753379822} -08/30/2021 19:46:44 - INFO - __main__ - Step 36373: {'lr': 0.0004363579951490232, 'samples': 6983616, 'steps': 36372, 'loss/train': 1.2581340074539185} -08/30/2021 19:46:44 - INFO - __main__ - Step 36374: {'lr': 0.0004363544577283718, 'samples': 6983808, 'steps': 36373, 'loss/train': 0.6959117650985718} -08/30/2021 19:46:45 - INFO - __main__ - Step 36375: {'lr': 0.0004363509202237521, 'samples': 6984000, 'steps': 36374, 'loss/train': 1.0700585842132568} -08/30/2021 19:46:46 - INFO - __main__ - Step 36376: {'lr': 0.0004363473826351654, 'samples': 6984192, 'steps': 36375, 'loss/train': 1.657585859298706} -08/30/2021 19:46:47 - INFO - __main__ - Step 36377: {'lr': 0.0004363438449626135, 'samples': 6984384, 'steps': 36376, 'loss/train': 1.5339055061340332} -08/30/2021 19:46:47 - INFO - __main__ - Step 36378: {'lr': 0.000436340307206098, 'samples': 6984576, 'steps': 36377, 'loss/train': 1.1779080629348755} -08/30/2021 19:46:47 - INFO - __main__ - Step 36379: {'lr': 0.00043633676936562026, 'samples': 6984768, 'steps': 36378, 'loss/train': 0.8532932996749878} -08/30/2021 19:46:48 - INFO - __main__ - Step 36380: {'lr': 0.0004363332314411822, 'samples': 6984960, 'steps': 36379, 'loss/train': 1.6608859300613403} -08/30/2021 19:46:49 - INFO - __main__ - Step 36381: {'lr': 0.0004363296934327852, 'samples': 6985152, 'steps': 36380, 'loss/train': 2.0106258392333984} -08/30/2021 19:46:50 - INFO - __main__ - Step 36382: {'lr': 0.00043632615534043096, 'samples': 6985344, 'steps': 36381, 'loss/train': 1.5246495008468628} -08/30/2021 19:46:50 - INFO - __main__ - Step 36383: {'lr': 0.00043632261716412097, 'samples': 6985536, 'steps': 36382, 'loss/train': 1.2977567911148071} -08/30/2021 19:46:50 - INFO - __main__ - Step 36384: {'lr': 0.0004363190789038569, 'samples': 6985728, 'steps': 36383, 'loss/train': 0.9314844608306885} -08/30/2021 19:46:51 - INFO - __main__ - Step 36385: {'lr': 0.0004363155405596404, 'samples': 6985920, 'steps': 36384, 'loss/train': 1.174365758895874} -08/30/2021 19:46:52 - INFO - __main__ - Step 36386: {'lr': 0.00043631200213147296, 'samples': 6986112, 'steps': 36385, 'loss/train': 1.2470765113830566} -08/30/2021 19:46:52 - INFO - __main__ - Step 36387: {'lr': 0.0004363084636193561, 'samples': 6986304, 'steps': 36386, 'loss/train': 1.5699836015701294} -08/30/2021 19:46:53 - INFO - __main__ - Step 36388: {'lr': 0.0004363049250232917, 'samples': 6986496, 'steps': 36387, 'loss/train': 1.5065574645996094} -08/30/2021 19:46:53 - INFO - __main__ - Step 36389: {'lr': 0.000436301386343281, 'samples': 6986688, 'steps': 36388, 'loss/train': 0.9250494837760925} -08/30/2021 19:46:54 - INFO - __main__ - Step 36390: {'lr': 0.0004362978475793259, 'samples': 6986880, 'steps': 36389, 'loss/train': 1.5851961374282837} -08/30/2021 19:46:56 - INFO - __main__ - Step 36391: {'lr': 0.00043629430873142773, 'samples': 6987072, 'steps': 36390, 'loss/train': 0.9763813018798828} -08/30/2021 19:46:56 - INFO - __main__ - Step 36392: {'lr': 0.00043629076979958837, 'samples': 6987264, 'steps': 36391, 'loss/train': 1.4903507232666016} -08/30/2021 19:46:56 - INFO - __main__ - Step 36393: {'lr': 0.00043628723078380916, 'samples': 6987456, 'steps': 36392, 'loss/train': 1.2402701377868652} -08/30/2021 19:46:57 - INFO - __main__ - Step 36394: {'lr': 0.0004362836916840919, 'samples': 6987648, 'steps': 36393, 'loss/train': 1.290327787399292} -08/30/2021 19:46:57 - INFO - __main__ - Step 36395: {'lr': 0.00043628015250043794, 'samples': 6987840, 'steps': 36394, 'loss/train': 1.3989843130111694} -08/30/2021 19:46:59 - INFO - __main__ - Step 36396: {'lr': 0.00043627661323284914, 'samples': 6988032, 'steps': 36395, 'loss/train': 1.5493284463882446} -08/30/2021 19:46:59 - INFO - __main__ - Step 36397: {'lr': 0.00043627307388132693, 'samples': 6988224, 'steps': 36396, 'loss/train': 1.6801135540008545} -08/30/2021 19:46:59 - INFO - __main__ - Step 36398: {'lr': 0.0004362695344458729, 'samples': 6988416, 'steps': 36397, 'loss/train': 1.5184098482131958} -08/30/2021 19:47:00 - INFO - __main__ - Step 36399: {'lr': 0.00043626599492648877, 'samples': 6988608, 'steps': 36398, 'loss/train': 1.9017716646194458} -08/30/2021 19:47:00 - INFO - __main__ - Step 36400: {'lr': 0.000436262455323176, 'samples': 6988800, 'steps': 36399, 'loss/train': 1.036109209060669} -08/30/2021 19:47:02 - INFO - __main__ - Step 36401: {'lr': 0.0004362589156359363, 'samples': 6988992, 'steps': 36400, 'loss/train': 1.6708488464355469} -08/30/2021 19:47:02 - INFO - __main__ - Step 36402: {'lr': 0.00043625537586477114, 'samples': 6989184, 'steps': 36401, 'loss/train': 1.72758150100708} -08/30/2021 19:47:03 - INFO - __main__ - Step 36403: {'lr': 0.00043625183600968224, 'samples': 6989376, 'steps': 36402, 'loss/train': 1.4736424684524536} -08/30/2021 19:47:03 - INFO - __main__ - Step 36404: {'lr': 0.00043624829607067105, 'samples': 6989568, 'steps': 36403, 'loss/train': 1.1701653003692627} -08/30/2021 19:47:03 - INFO - __main__ - Step 36405: {'lr': 0.0004362447560477394, 'samples': 6989760, 'steps': 36404, 'loss/train': 0.028951827436685562} -08/30/2021 19:47:04 - INFO - __main__ - Step 36406: {'lr': 0.0004362412159408886, 'samples': 6989952, 'steps': 36405, 'loss/train': 1.3001972436904907} -08/30/2021 19:47:04 - INFO - __main__ - Step 36407: {'lr': 0.0004362376757501205, 'samples': 6990144, 'steps': 36406, 'loss/train': 1.716759204864502} -08/30/2021 19:47:06 - INFO - __main__ - Step 36408: {'lr': 0.00043623413547543645, 'samples': 6990336, 'steps': 36407, 'loss/train': 0.8372818827629089} -08/30/2021 19:47:06 - INFO - __main__ - Step 36409: {'lr': 0.00043623059511683826, 'samples': 6990528, 'steps': 36408, 'loss/train': 0.8395217061042786} -08/30/2021 19:47:06 - INFO - __main__ - Step 36410: {'lr': 0.0004362270546743274, 'samples': 6990720, 'steps': 36409, 'loss/train': 0.4687364399433136} -08/30/2021 19:47:07 - INFO - __main__ - Step 36411: {'lr': 0.0004362235141479055, 'samples': 6990912, 'steps': 36410, 'loss/train': 1.0184953212738037} -08/30/2021 19:47:07 - INFO - __main__ - Step 36412: {'lr': 0.0004362199735375742, 'samples': 6991104, 'steps': 36411, 'loss/train': 1.4308748245239258} -08/30/2021 19:47:09 - INFO - __main__ - Step 36413: {'lr': 0.000436216432843335, 'samples': 6991296, 'steps': 36412, 'loss/train': 1.4313554763793945} -08/30/2021 19:47:09 - INFO - __main__ - Step 36414: {'lr': 0.00043621289206518957, 'samples': 6991488, 'steps': 36413, 'loss/train': 1.0186474323272705} -08/30/2021 19:47:09 - INFO - __main__ - Step 36415: {'lr': 0.00043620935120313955, 'samples': 6991680, 'steps': 36414, 'loss/train': 0.6312722563743591} -08/30/2021 19:47:10 - INFO - __main__ - Step 36416: {'lr': 0.0004362058102571864, 'samples': 6991872, 'steps': 36415, 'loss/train': 0.806549608707428} -08/30/2021 19:47:10 - INFO - __main__ - Step 36417: {'lr': 0.00043620226922733174, 'samples': 6992064, 'steps': 36416, 'loss/train': 1.9578888416290283} -08/30/2021 19:47:12 - INFO - __main__ - Step 36418: {'lr': 0.0004361987281135773, 'samples': 6992256, 'steps': 36417, 'loss/train': 1.956422209739685} -08/30/2021 19:47:12 - INFO - __main__ - Step 36419: {'lr': 0.00043619518691592453, 'samples': 6992448, 'steps': 36418, 'loss/train': 0.8095663189888} -08/30/2021 19:47:12 - INFO - __main__ - Step 36420: {'lr': 0.00043619164563437506, 'samples': 6992640, 'steps': 36419, 'loss/train': 1.6983819007873535} -08/30/2021 19:47:13 - INFO - __main__ - Step 36421: {'lr': 0.0004361881042689306, 'samples': 6992832, 'steps': 36420, 'loss/train': 1.4028847217559814} -08/30/2021 19:47:13 - INFO - __main__ - Step 36422: {'lr': 0.00043618456281959263, 'samples': 6993024, 'steps': 36421, 'loss/train': 1.512710452079773} -08/30/2021 19:47:15 - INFO - __main__ - Step 36423: {'lr': 0.0004361810212863627, 'samples': 6993216, 'steps': 36422, 'loss/train': 1.3518368005752563} -08/30/2021 19:47:15 - INFO - __main__ - Step 36424: {'lr': 0.0004361774796692425, 'samples': 6993408, 'steps': 36423, 'loss/train': 0.9979020357131958} -08/30/2021 19:47:15 - INFO - __main__ - Step 36425: {'lr': 0.00043617393796823367, 'samples': 6993600, 'steps': 36424, 'loss/train': 1.237671136856079} -08/30/2021 19:47:16 - INFO - __main__ - Step 36426: {'lr': 0.00043617039618333765, 'samples': 6993792, 'steps': 36425, 'loss/train': 1.2507598400115967} -08/30/2021 19:47:16 - INFO - __main__ - Step 36427: {'lr': 0.00043616685431455615, 'samples': 6993984, 'steps': 36426, 'loss/train': 1.2287665605545044} -08/30/2021 19:47:18 - INFO - __main__ - Step 36428: {'lr': 0.0004361633123618908, 'samples': 6994176, 'steps': 36427, 'loss/train': 1.2938023805618286} -08/30/2021 19:47:19 - INFO - __main__ - Step 36429: {'lr': 0.00043615977032534305, 'samples': 6994368, 'steps': 36428, 'loss/train': 1.3939820528030396} -08/30/2021 19:47:19 - INFO - __main__ - Step 36430: {'lr': 0.00043615622820491464, 'samples': 6994560, 'steps': 36429, 'loss/train': 1.091234564781189} -08/30/2021 19:47:19 - INFO - __main__ - Step 36431: {'lr': 0.00043615268600060705, 'samples': 6994752, 'steps': 36430, 'loss/train': 0.9800477623939514} -08/30/2021 19:47:20 - INFO - __main__ - Step 36432: {'lr': 0.000436149143712422, 'samples': 6994944, 'steps': 36431, 'loss/train': 0.08381208777427673} -08/30/2021 19:47:21 - INFO - __main__ - Step 36433: {'lr': 0.0004361456013403609, 'samples': 6995136, 'steps': 36432, 'loss/train': 1.5640465021133423} -08/30/2021 19:47:21 - INFO - __main__ - Step 36434: {'lr': 0.00043614205888442553, 'samples': 6995328, 'steps': 36433, 'loss/train': 1.1764110326766968} -08/30/2021 19:47:22 - INFO - __main__ - Step 36435: {'lr': 0.00043613851634461743, 'samples': 6995520, 'steps': 36434, 'loss/train': 1.5034747123718262} -08/30/2021 19:47:22 - INFO - __main__ - Step 36436: {'lr': 0.00043613497372093827, 'samples': 6995712, 'steps': 36435, 'loss/train': 1.010730504989624} -08/30/2021 19:47:22 - INFO - __main__ - Step 36437: {'lr': 0.0004361314310133894, 'samples': 6995904, 'steps': 36436, 'loss/train': 1.4037946462631226} -08/30/2021 19:47:24 - INFO - __main__ - Step 36438: {'lr': 0.00043612788822197266, 'samples': 6996096, 'steps': 36437, 'loss/train': 1.5880666971206665} -08/30/2021 19:47:24 - INFO - __main__ - Step 36439: {'lr': 0.0004361243453466896, 'samples': 6996288, 'steps': 36438, 'loss/train': 0.5422747731208801} -08/30/2021 19:47:25 - INFO - __main__ - Step 36440: {'lr': 0.0004361208023875417, 'samples': 6996480, 'steps': 36439, 'loss/train': 2.4194462299346924} -08/30/2021 19:47:25 - INFO - __main__ - Step 36441: {'lr': 0.00043611725934453074, 'samples': 6996672, 'steps': 36440, 'loss/train': 1.7073898315429688} -08/30/2021 19:47:25 - INFO - __main__ - Step 36442: {'lr': 0.00043611371621765817, 'samples': 6996864, 'steps': 36441, 'loss/train': 1.4313596487045288} -08/30/2021 19:47:27 - INFO - __main__ - Step 36443: {'lr': 0.0004361101730069256, 'samples': 6997056, 'steps': 36442, 'loss/train': 1.48096764087677} -08/30/2021 19:47:27 - INFO - __main__ - Step 36444: {'lr': 0.00043610662971233465, 'samples': 6997248, 'steps': 36443, 'loss/train': 1.0268685817718506} -08/30/2021 19:47:28 - INFO - __main__ - Step 36445: {'lr': 0.00043610308633388695, 'samples': 6997440, 'steps': 36444, 'loss/train': 1.5223705768585205} -08/30/2021 19:47:28 - INFO - __main__ - Step 36446: {'lr': 0.0004360995428715841, 'samples': 6997632, 'steps': 36445, 'loss/train': 1.1339970827102661} -08/30/2021 19:47:28 - INFO - __main__ - Step 36447: {'lr': 0.00043609599932542764, 'samples': 6997824, 'steps': 36446, 'loss/train': 1.1776108741760254} -08/30/2021 19:47:29 - INFO - __main__ - Step 36448: {'lr': 0.00043609245569541924, 'samples': 6998016, 'steps': 36447, 'loss/train': 1.4329923391342163} -08/30/2021 19:47:31 - INFO - __main__ - Step 36449: {'lr': 0.00043608891198156037, 'samples': 6998208, 'steps': 36448, 'loss/train': 0.9501417875289917} -08/30/2021 19:47:31 - INFO - __main__ - Step 36450: {'lr': 0.0004360853681838528, 'samples': 6998400, 'steps': 36449, 'loss/train': 1.625877022743225} -08/30/2021 19:47:31 - INFO - __main__ - Step 36451: {'lr': 0.0004360818243022979, 'samples': 6998592, 'steps': 36450, 'loss/train': 0.9098576903343201} -08/30/2021 19:47:32 - INFO - __main__ - Step 36452: {'lr': 0.00043607828033689753, 'samples': 6998784, 'steps': 36451, 'loss/train': 1.3731720447540283} -08/30/2021 19:47:32 - INFO - __main__ - Step 36453: {'lr': 0.000436074736287653, 'samples': 6998976, 'steps': 36452, 'loss/train': 1.8267905712127686} -08/30/2021 19:47:34 - INFO - __main__ - Step 36454: {'lr': 0.00043607119215456625, 'samples': 6999168, 'steps': 36453, 'loss/train': 1.9684451818466187} -08/30/2021 19:47:34 - INFO - __main__ - Step 36455: {'lr': 0.00043606764793763865, 'samples': 6999360, 'steps': 36454, 'loss/train': 1.4963877201080322} -08/30/2021 19:47:34 - INFO - __main__ - Step 36456: {'lr': 0.00043606410363687177, 'samples': 6999552, 'steps': 36455, 'loss/train': 0.8276395201683044} -08/30/2021 19:47:35 - INFO - __main__ - Step 36457: {'lr': 0.00043606055925226727, 'samples': 6999744, 'steps': 36456, 'loss/train': 1.0844939947128296} -08/30/2021 19:47:35 - INFO - __main__ - Step 36458: {'lr': 0.0004360570147838269, 'samples': 6999936, 'steps': 36457, 'loss/train': 0.823511004447937} -08/30/2021 19:47:37 - INFO - __main__ - Step 36459: {'lr': 0.00043605347023155193, 'samples': 7000128, 'steps': 36458, 'loss/train': 1.3540081977844238} -08/30/2021 19:47:37 - INFO - __main__ - Step 36460: {'lr': 0.0004360499255954442, 'samples': 7000320, 'steps': 36459, 'loss/train': 1.195165753364563} -08/30/2021 19:47:37 - INFO - __main__ - Step 36461: {'lr': 0.0004360463808755053, 'samples': 7000512, 'steps': 36460, 'loss/train': 0.6927940845489502} -08/30/2021 19:47:38 - INFO - __main__ - Step 36462: {'lr': 0.00043604283607173673, 'samples': 7000704, 'steps': 36461, 'loss/train': 1.1124961376190186} -08/30/2021 19:47:38 - INFO - __main__ - Step 36463: {'lr': 0.0004360392911841401, 'samples': 7000896, 'steps': 36462, 'loss/train': 1.461443305015564} -08/30/2021 19:47:40 - INFO - __main__ - Step 36464: {'lr': 0.0004360357462127171, 'samples': 7001088, 'steps': 36463, 'loss/train': 1.238618016242981} -08/30/2021 19:47:40 - INFO - __main__ - Step 36465: {'lr': 0.0004360322011574692, 'samples': 7001280, 'steps': 36464, 'loss/train': 0.5723713636398315} -08/30/2021 19:47:41 - INFO - __main__ - Step 36466: {'lr': 0.00043602865601839817, 'samples': 7001472, 'steps': 36465, 'loss/train': 1.0349533557891846} -08/30/2021 19:47:41 - INFO - __main__ - Step 36467: {'lr': 0.00043602511079550535, 'samples': 7001664, 'steps': 36466, 'loss/train': 0.8309263586997986} -08/30/2021 19:47:41 - INFO - __main__ - Step 36468: {'lr': 0.0004360215654887926, 'samples': 7001856, 'steps': 36467, 'loss/train': 1.879464030265808} -08/30/2021 19:47:42 - INFO - __main__ - Step 36469: {'lr': 0.0004360180200982613, 'samples': 7002048, 'steps': 36468, 'loss/train': 1.3553422689437866} -08/30/2021 19:47:43 - INFO - __main__ - Step 36470: {'lr': 0.00043601447462391317, 'samples': 7002240, 'steps': 36469, 'loss/train': 0.9028359055519104} -08/30/2021 19:47:44 - INFO - __main__ - Step 36471: {'lr': 0.00043601092906574986, 'samples': 7002432, 'steps': 36470, 'loss/train': 1.421359658241272} -08/30/2021 19:47:44 - INFO - __main__ - Step 36472: {'lr': 0.0004360073834237729, 'samples': 7002624, 'steps': 36471, 'loss/train': 1.6730273962020874} -08/30/2021 19:47:44 - INFO - __main__ - Step 36473: {'lr': 0.0004360038376979838, 'samples': 7002816, 'steps': 36472, 'loss/train': 1.1096608638763428} -08/30/2021 19:47:45 - INFO - __main__ - Step 36474: {'lr': 0.0004360002918883843, 'samples': 7003008, 'steps': 36473, 'loss/train': 5.877317905426025} -08/30/2021 19:47:46 - INFO - __main__ - Step 36475: {'lr': 0.00043599674599497593, 'samples': 7003200, 'steps': 36474, 'loss/train': 1.6931506395339966} -08/30/2021 19:47:47 - INFO - __main__ - Step 36476: {'lr': 0.00043599320001776025, 'samples': 7003392, 'steps': 36475, 'loss/train': 1.4531265497207642} -08/30/2021 19:47:47 - INFO - __main__ - Step 36477: {'lr': 0.00043598965395673893, 'samples': 7003584, 'steps': 36476, 'loss/train': 1.1867077350616455} -08/30/2021 19:47:47 - INFO - __main__ - Step 36478: {'lr': 0.0004359861078119136, 'samples': 7003776, 'steps': 36477, 'loss/train': 1.9284695386886597} -08/30/2021 19:47:48 - INFO - __main__ - Step 36479: {'lr': 0.00043598256158328575, 'samples': 7003968, 'steps': 36478, 'loss/train': 1.6126198768615723} -08/30/2021 19:47:48 - INFO - __main__ - Step 36480: {'lr': 0.00043597901527085703, 'samples': 7004160, 'steps': 36479, 'loss/train': 1.5148154497146606} -08/30/2021 19:47:50 - INFO - __main__ - Step 36481: {'lr': 0.000435975468874629, 'samples': 7004352, 'steps': 36480, 'loss/train': 2.088822841644287} -08/30/2021 19:47:50 - INFO - __main__ - Step 36482: {'lr': 0.00043597192239460336, 'samples': 7004544, 'steps': 36481, 'loss/train': 1.85660982131958} -08/30/2021 19:47:50 - INFO - __main__ - Step 36483: {'lr': 0.00043596837583078165, 'samples': 7004736, 'steps': 36482, 'loss/train': 0.9900230765342712} -08/30/2021 19:47:51 - INFO - __main__ - Step 36484: {'lr': 0.0004359648291831654, 'samples': 7004928, 'steps': 36483, 'loss/train': 1.157524824142456} -08/30/2021 19:47:51 - INFO - __main__ - Step 36485: {'lr': 0.0004359612824517563, 'samples': 7005120, 'steps': 36484, 'loss/train': 1.1578923463821411} -08/30/2021 19:47:53 - INFO - __main__ - Step 36486: {'lr': 0.0004359577356365559, 'samples': 7005312, 'steps': 36485, 'loss/train': 1.3362678289413452} -08/30/2021 19:47:53 - INFO - __main__ - Step 36487: {'lr': 0.00043595418873756584, 'samples': 7005504, 'steps': 36486, 'loss/train': 0.8806517720222473} -08/30/2021 19:47:53 - INFO - __main__ - Step 36488: {'lr': 0.0004359506417547876, 'samples': 7005696, 'steps': 36487, 'loss/train': 0.6454231142997742} -08/30/2021 19:47:54 - INFO - __main__ - Step 36489: {'lr': 0.000435947094688223, 'samples': 7005888, 'steps': 36488, 'loss/train': 1.2656669616699219} -08/30/2021 19:47:54 - INFO - __main__ - Step 36490: {'lr': 0.0004359435475378735, 'samples': 7006080, 'steps': 36489, 'loss/train': 1.606446623802185} -08/30/2021 19:47:55 - INFO - __main__ - Step 36491: {'lr': 0.0004359400003037406, 'samples': 7006272, 'steps': 36490, 'loss/train': 2.6311333179473877} -08/30/2021 19:47:56 - INFO - __main__ - Step 36492: {'lr': 0.0004359364529858261, 'samples': 7006464, 'steps': 36491, 'loss/train': 1.030823826789856} -08/30/2021 19:47:56 - INFO - __main__ - Step 36493: {'lr': 0.00043593290558413143, 'samples': 7006656, 'steps': 36492, 'loss/train': 1.479521632194519} -08/30/2021 19:47:57 - INFO - __main__ - Step 36494: {'lr': 0.0004359293580986583, 'samples': 7006848, 'steps': 36493, 'loss/train': 1.374276876449585} -08/30/2021 19:47:57 - INFO - __main__ - Step 36495: {'lr': 0.0004359258105294083, 'samples': 7007040, 'steps': 36494, 'loss/train': 1.6317195892333984} -08/30/2021 19:47:58 - INFO - __main__ - Step 36496: {'lr': 0.0004359222628763829, 'samples': 7007232, 'steps': 36495, 'loss/train': 6.169818878173828} -08/30/2021 19:47:59 - INFO - __main__ - Step 36497: {'lr': 0.0004359187151395839, 'samples': 7007424, 'steps': 36496, 'loss/train': 1.41305410861969} -08/30/2021 19:47:59 - INFO - __main__ - Step 36498: {'lr': 0.0004359151673190127, 'samples': 7007616, 'steps': 36497, 'loss/train': 1.8294190168380737} -08/30/2021 19:48:00 - INFO - __main__ - Step 36499: {'lr': 0.0004359116194146711, 'samples': 7007808, 'steps': 36498, 'loss/train': 1.3524771928787231} -08/30/2021 19:48:00 - INFO - __main__ - Step 36500: {'lr': 0.0004359080714265605, 'samples': 7008000, 'steps': 36499, 'loss/train': 1.275800108909607} -08/30/2021 19:48:02 - INFO - __main__ - Step 36501: {'lr': 0.00043590452335468265, 'samples': 7008192, 'steps': 36500, 'loss/train': 1.5451632738113403} -08/30/2021 19:48:03 - INFO - __main__ - Step 36502: {'lr': 0.00043590097519903917, 'samples': 7008384, 'steps': 36501, 'loss/train': 1.144112467765808} -08/30/2021 19:48:03 - INFO - __main__ - Step 36503: {'lr': 0.0004358974269596314, 'samples': 7008576, 'steps': 36502, 'loss/train': 1.904725193977356} -08/30/2021 19:48:04 - INFO - __main__ - Step 36504: {'lr': 0.00043589387863646125, 'samples': 7008768, 'steps': 36503, 'loss/train': 0.38427162170410156} -08/30/2021 19:48:04 - INFO - __main__ - Step 36505: {'lr': 0.0004358903302295301, 'samples': 7008960, 'steps': 36504, 'loss/train': 1.152559757232666} -08/30/2021 19:48:05 - INFO - __main__ - Step 36506: {'lr': 0.0004358867817388397, 'samples': 7009152, 'steps': 36505, 'loss/train': 0.5000024437904358} -08/30/2021 19:48:06 - INFO - __main__ - Step 36507: {'lr': 0.0004358832331643916, 'samples': 7009344, 'steps': 36506, 'loss/train': 1.2807445526123047} -08/30/2021 19:48:06 - INFO - __main__ - Step 36508: {'lr': 0.0004358796845061873, 'samples': 7009536, 'steps': 36507, 'loss/train': 1.509907841682434} -08/30/2021 19:48:06 - INFO - __main__ - Step 36509: {'lr': 0.00043587613576422855, 'samples': 7009728, 'steps': 36508, 'loss/train': 1.8179283142089844} -08/30/2021 19:48:07 - INFO - __main__ - Step 36510: {'lr': 0.00043587258693851685, 'samples': 7009920, 'steps': 36509, 'loss/train': 1.31987726688385} -08/30/2021 19:48:08 - INFO - __main__ - Step 36511: {'lr': 0.0004358690380290539, 'samples': 7010112, 'steps': 36510, 'loss/train': 1.4994300603866577} -08/30/2021 19:48:09 - INFO - __main__ - Step 36512: {'lr': 0.00043586548903584113, 'samples': 7010304, 'steps': 36511, 'loss/train': 2.2657501697540283} -08/30/2021 19:48:09 - INFO - __main__ - Step 36513: {'lr': 0.0004358619399588802, 'samples': 7010496, 'steps': 36512, 'loss/train': 1.943145513534546} -08/30/2021 19:48:09 - INFO - __main__ - Step 36514: {'lr': 0.0004358583907981729, 'samples': 7010688, 'steps': 36513, 'loss/train': 0.41833555698394775} -08/30/2021 19:48:10 - INFO - __main__ - Step 36515: {'lr': 0.0004358548415537206, 'samples': 7010880, 'steps': 36514, 'loss/train': 1.337725043296814} -08/30/2021 19:48:10 - INFO - __main__ - Step 36516: {'lr': 0.000435851292225525, 'samples': 7011072, 'steps': 36515, 'loss/train': 1.452592372894287} -08/30/2021 19:48:12 - INFO - __main__ - Step 36517: {'lr': 0.0004358477428135876, 'samples': 7011264, 'steps': 36516, 'loss/train': 1.5251343250274658} -08/30/2021 19:48:12 - INFO - __main__ - Step 36518: {'lr': 0.00043584419331791014, 'samples': 7011456, 'steps': 36517, 'loss/train': 1.6350144147872925} -08/30/2021 19:48:12 - INFO - __main__ - Step 36519: {'lr': 0.0004358406437384942, 'samples': 7011648, 'steps': 36518, 'loss/train': 1.236351490020752} -08/30/2021 19:48:13 - INFO - __main__ - Step 36520: {'lr': 0.0004358370940753412, 'samples': 7011840, 'steps': 36519, 'loss/train': 1.3332247734069824} -08/30/2021 19:48:13 - INFO - __main__ - Step 36521: {'lr': 0.000435833544328453, 'samples': 7012032, 'steps': 36520, 'loss/train': 1.3820645809173584} -08/30/2021 19:48:15 - INFO - __main__ - Step 36522: {'lr': 0.00043582999449783103, 'samples': 7012224, 'steps': 36521, 'loss/train': 1.4637681245803833} -08/30/2021 19:48:15 - INFO - __main__ - Step 36523: {'lr': 0.0004358264445834769, 'samples': 7012416, 'steps': 36522, 'loss/train': 1.278749942779541} -08/30/2021 19:48:16 - INFO - __main__ - Step 36524: {'lr': 0.00043582289458539224, 'samples': 7012608, 'steps': 36523, 'loss/train': 0.8776615262031555} -08/30/2021 19:48:16 - INFO - __main__ - Step 36525: {'lr': 0.00043581934450357876, 'samples': 7012800, 'steps': 36524, 'loss/train': 1.9267964363098145} -08/30/2021 19:48:16 - INFO - __main__ - Step 36526: {'lr': 0.0004358157943380379, 'samples': 7012992, 'steps': 36525, 'loss/train': 2.7304790019989014} -08/30/2021 19:48:18 - INFO - __main__ - Step 36527: {'lr': 0.00043581224408877116, 'samples': 7013184, 'steps': 36526, 'loss/train': 1.2880278825759888} -08/30/2021 19:48:18 - INFO - __main__ - Step 36528: {'lr': 0.00043580869375578046, 'samples': 7013376, 'steps': 36527, 'loss/train': 5.815019607543945} -08/30/2021 19:48:19 - INFO - __main__ - Step 36529: {'lr': 0.00043580514333906717, 'samples': 7013568, 'steps': 36528, 'loss/train': 1.5183874368667603} -08/30/2021 19:48:19 - INFO - __main__ - Step 36530: {'lr': 0.000435801592838633, 'samples': 7013760, 'steps': 36529, 'loss/train': 1.5846532583236694} -08/30/2021 19:48:19 - INFO - __main__ - Step 36531: {'lr': 0.0004357980422544794, 'samples': 7013952, 'steps': 36530, 'loss/train': 1.8552756309509277} -08/30/2021 19:48:20 - INFO - __main__ - Step 36532: {'lr': 0.00043579449158660815, 'samples': 7014144, 'steps': 36531, 'loss/train': 1.71445631980896} -08/30/2021 19:48:21 - INFO - __main__ - Step 36533: {'lr': 0.0004357909408350208, 'samples': 7014336, 'steps': 36532, 'loss/train': 1.38188636302948} -08/30/2021 19:48:22 - INFO - __main__ - Step 36534: {'lr': 0.00043578738999971886, 'samples': 7014528, 'steps': 36533, 'loss/train': 2.012483835220337} -08/30/2021 19:48:22 - INFO - __main__ - Step 36535: {'lr': 0.000435783839080704, 'samples': 7014720, 'steps': 36534, 'loss/train': 0.05404497683048248} -08/30/2021 19:48:22 - INFO - __main__ - Step 36536: {'lr': 0.00043578028807797774, 'samples': 7014912, 'steps': 36535, 'loss/train': 1.4148170948028564} -08/30/2021 19:48:23 - INFO - __main__ - Step 36537: {'lr': 0.0004357767369915419, 'samples': 7015104, 'steps': 36536, 'loss/train': 2.089134693145752} -08/30/2021 19:48:24 - INFO - __main__ - Step 36538: {'lr': 0.0004357731858213978, 'samples': 7015296, 'steps': 36537, 'loss/train': 1.2578330039978027} -08/30/2021 19:48:25 - INFO - __main__ - Step 36539: {'lr': 0.0004357696345675472, 'samples': 7015488, 'steps': 36538, 'loss/train': 1.3099653720855713} -08/30/2021 19:48:25 - INFO - __main__ - Step 36540: {'lr': 0.00043576608322999167, 'samples': 7015680, 'steps': 36539, 'loss/train': 1.617466688156128} -08/30/2021 19:48:25 - INFO - __main__ - Step 36541: {'lr': 0.0004357625318087328, 'samples': 7015872, 'steps': 36540, 'loss/train': 1.8089059591293335} -08/30/2021 19:48:26 - INFO - __main__ - Step 36542: {'lr': 0.00043575898030377225, 'samples': 7016064, 'steps': 36541, 'loss/train': 2.036715269088745} -08/30/2021 19:48:27 - INFO - __main__ - Step 36543: {'lr': 0.00043575542871511155, 'samples': 7016256, 'steps': 36542, 'loss/train': 1.4833344221115112} -08/30/2021 19:48:28 - INFO - __main__ - Step 36544: {'lr': 0.00043575187704275234, 'samples': 7016448, 'steps': 36543, 'loss/train': 1.2527631521224976} -08/30/2021 19:48:28 - INFO - __main__ - Step 36545: {'lr': 0.0004357483252866961, 'samples': 7016640, 'steps': 36544, 'loss/train': 2.0547447204589844} -08/30/2021 19:48:28 - INFO - __main__ - Step 36546: {'lr': 0.00043574477344694463, 'samples': 7016832, 'steps': 36545, 'loss/train': 1.2601391077041626} -08/30/2021 19:48:29 - INFO - __main__ - Step 36547: {'lr': 0.0004357412215234994, 'samples': 7017024, 'steps': 36546, 'loss/train': 1.3062084913253784} -08/30/2021 19:48:31 - INFO - __main__ - Step 36548: {'lr': 0.00043573766951636206, 'samples': 7017216, 'steps': 36547, 'loss/train': 1.1554791927337646} -08/30/2021 19:48:31 - INFO - __main__ - Step 36549: {'lr': 0.00043573411742553415, 'samples': 7017408, 'steps': 36548, 'loss/train': 1.0076406002044678} -08/30/2021 19:48:32 - INFO - __main__ - Step 36550: {'lr': 0.0004357305652510174, 'samples': 7017600, 'steps': 36549, 'loss/train': 2.242140769958496} -08/30/2021 19:48:32 - INFO - __main__ - Step 36551: {'lr': 0.00043572701299281327, 'samples': 7017792, 'steps': 36550, 'loss/train': 0.660279393196106} -08/30/2021 19:48:32 - INFO - __main__ - Step 36552: {'lr': 0.0004357234606509234, 'samples': 7017984, 'steps': 36551, 'loss/train': 1.575362205505371} -08/30/2021 19:48:33 - INFO - __main__ - Step 36553: {'lr': 0.00043571990822534936, 'samples': 7018176, 'steps': 36552, 'loss/train': 3.932896137237549} -08/30/2021 19:48:35 - INFO - __main__ - Step 36554: {'lr': 0.00043571635571609287, 'samples': 7018368, 'steps': 36553, 'loss/train': 1.0440348386764526} -08/30/2021 19:48:35 - INFO - __main__ - Step 36555: {'lr': 0.00043571280312315543, 'samples': 7018560, 'steps': 36554, 'loss/train': 1.1563599109649658} -08/30/2021 19:48:35 - INFO - __main__ - Step 36556: {'lr': 0.0004357092504465386, 'samples': 7018752, 'steps': 36555, 'loss/train': 1.3621444702148438} -08/30/2021 19:48:36 - INFO - __main__ - Step 36557: {'lr': 0.00043570569768624416, 'samples': 7018944, 'steps': 36556, 'loss/train': 1.2782279253005981} -08/30/2021 19:48:36 - INFO - __main__ - Step 36558: {'lr': 0.00043570214484227353, 'samples': 7019136, 'steps': 36557, 'loss/train': 1.4263688325881958} -08/30/2021 19:48:38 - INFO - __main__ - Step 36559: {'lr': 0.00043569859191462847, 'samples': 7019328, 'steps': 36558, 'loss/train': 1.3615001440048218} -08/30/2021 19:48:38 - INFO - __main__ - Step 36560: {'lr': 0.0004356950389033104, 'samples': 7019520, 'steps': 36559, 'loss/train': 1.5760283470153809} -08/30/2021 19:48:38 - INFO - __main__ - Step 36561: {'lr': 0.0004356914858083211, 'samples': 7019712, 'steps': 36560, 'loss/train': 1.891967535018921} -08/30/2021 19:48:39 - INFO - __main__ - Step 36562: {'lr': 0.00043568793262966195, 'samples': 7019904, 'steps': 36561, 'loss/train': 1.246058464050293} -08/30/2021 19:48:39 - INFO - __main__ - Step 36563: {'lr': 0.00043568437936733473, 'samples': 7020096, 'steps': 36562, 'loss/train': 1.5230660438537598} -08/30/2021 19:48:41 - INFO - __main__ - Step 36564: {'lr': 0.0004356808260213411, 'samples': 7020288, 'steps': 36563, 'loss/train': 1.6539273262023926} -08/30/2021 19:48:41 - INFO - __main__ - Step 36565: {'lr': 0.00043567727259168244, 'samples': 7020480, 'steps': 36564, 'loss/train': 1.2522408962249756} -08/30/2021 19:48:41 - INFO - __main__ - Step 36566: {'lr': 0.0004356737190783605, 'samples': 7020672, 'steps': 36565, 'loss/train': 1.108936071395874} -08/30/2021 19:48:42 - INFO - __main__ - Step 36567: {'lr': 0.00043567016548137685, 'samples': 7020864, 'steps': 36566, 'loss/train': 1.2651119232177734} -08/30/2021 19:48:42 - INFO - __main__ - Step 36568: {'lr': 0.00043566661180073304, 'samples': 7021056, 'steps': 36567, 'loss/train': 1.0394198894500732} -08/30/2021 19:48:44 - INFO - __main__ - Step 36569: {'lr': 0.00043566305803643073, 'samples': 7021248, 'steps': 36568, 'loss/train': 1.6034506559371948} -08/30/2021 19:48:44 - INFO - __main__ - Step 36570: {'lr': 0.00043565950418847154, 'samples': 7021440, 'steps': 36569, 'loss/train': 2.1219236850738525} -08/30/2021 19:48:44 - INFO - __main__ - Step 36571: {'lr': 0.00043565595025685705, 'samples': 7021632, 'steps': 36570, 'loss/train': 1.7575101852416992} -08/30/2021 19:48:45 - INFO - __main__ - Step 36572: {'lr': 0.0004356523962415889, 'samples': 7021824, 'steps': 36571, 'loss/train': 2.0594255924224854} -08/30/2021 19:48:45 - INFO - __main__ - Step 36573: {'lr': 0.00043564884214266855, 'samples': 7022016, 'steps': 36572, 'loss/train': 1.5242760181427002} -08/30/2021 19:48:47 - INFO - __main__ - Step 36574: {'lr': 0.00043564528796009774, 'samples': 7022208, 'steps': 36573, 'loss/train': 1.4918831586837769} -08/30/2021 19:48:47 - INFO - __main__ - Step 36575: {'lr': 0.00043564173369387807, 'samples': 7022400, 'steps': 36574, 'loss/train': 1.3450161218643188} -08/30/2021 19:48:47 - INFO - __main__ - Step 36576: {'lr': 0.00043563817934401107, 'samples': 7022592, 'steps': 36575, 'loss/train': 1.106136441230774} -08/30/2021 19:48:48 - INFO - __main__ - Step 36577: {'lr': 0.0004356346249104983, 'samples': 7022784, 'steps': 36576, 'loss/train': 1.150787591934204} -08/30/2021 19:48:48 - INFO - __main__ - Step 36578: {'lr': 0.0004356310703933415, 'samples': 7022976, 'steps': 36577, 'loss/train': 1.2052197456359863} -08/30/2021 19:48:50 - INFO - __main__ - Step 36579: {'lr': 0.00043562751579254215, 'samples': 7023168, 'steps': 36578, 'loss/train': 2.0636699199676514} -08/30/2021 19:48:50 - INFO - __main__ - Step 36580: {'lr': 0.00043562396110810196, 'samples': 7023360, 'steps': 36579, 'loss/train': 1.325165033340454} -08/30/2021 19:48:50 - INFO - __main__ - Step 36581: {'lr': 0.00043562040634002245, 'samples': 7023552, 'steps': 36580, 'loss/train': 1.8251488208770752} -08/30/2021 19:48:51 - INFO - __main__ - Step 36582: {'lr': 0.0004356168514883053, 'samples': 7023744, 'steps': 36581, 'loss/train': 1.6045143604278564} -08/30/2021 19:48:51 - INFO - __main__ - Step 36583: {'lr': 0.000435613296552952, 'samples': 7023936, 'steps': 36582, 'loss/train': 1.722639560699463} -08/30/2021 19:48:53 - INFO - __main__ - Step 36584: {'lr': 0.0004356097415339643, 'samples': 7024128, 'steps': 36583, 'loss/train': 1.5015318393707275} -08/30/2021 19:48:53 - INFO - __main__ - Step 36585: {'lr': 0.0004356061864313436, 'samples': 7024320, 'steps': 36584, 'loss/train': 0.8369975090026855} -08/30/2021 19:48:54 - INFO - __main__ - Step 36586: {'lr': 0.0004356026312450917, 'samples': 7024512, 'steps': 36585, 'loss/train': 1.0878782272338867} -08/30/2021 19:48:54 - INFO - __main__ - Step 36587: {'lr': 0.00043559907597521007, 'samples': 7024704, 'steps': 36586, 'loss/train': 0.20002266764640808} -08/30/2021 19:48:54 - INFO - __main__ - Step 36588: {'lr': 0.00043559552062170037, 'samples': 7024896, 'steps': 36587, 'loss/train': 1.7895675897598267} -08/30/2021 19:48:56 - INFO - __main__ - Step 36589: {'lr': 0.00043559196518456425, 'samples': 7025088, 'steps': 36588, 'loss/train': 1.6089807748794556} -08/30/2021 19:48:56 - INFO - __main__ - Step 36590: {'lr': 0.0004355884096638032, 'samples': 7025280, 'steps': 36589, 'loss/train': 1.6458605527877808} -08/30/2021 19:48:57 - INFO - __main__ - Step 36591: {'lr': 0.0004355848540594188, 'samples': 7025472, 'steps': 36590, 'loss/train': 1.2729971408843994} -08/30/2021 19:48:57 - INFO - __main__ - Step 36592: {'lr': 0.00043558129837141285, 'samples': 7025664, 'steps': 36591, 'loss/train': 1.5198731422424316} -08/30/2021 19:48:57 - INFO - __main__ - Step 36593: {'lr': 0.0004355777425997868, 'samples': 7025856, 'steps': 36592, 'loss/train': 1.761038899421692} -08/30/2021 19:48:59 - INFO - __main__ - Step 36594: {'lr': 0.0004355741867445423, 'samples': 7026048, 'steps': 36593, 'loss/train': 1.2411330938339233} -08/30/2021 19:48:59 - INFO - __main__ - Step 36595: {'lr': 0.00043557063080568094, 'samples': 7026240, 'steps': 36594, 'loss/train': 1.5074400901794434} -08/30/2021 19:49:00 - INFO - __main__ - Step 36596: {'lr': 0.00043556707478320425, 'samples': 7026432, 'steps': 36595, 'loss/train': 1.2042975425720215} -08/30/2021 19:49:00 - INFO - __main__ - Step 36597: {'lr': 0.000435563518677114, 'samples': 7026624, 'steps': 36596, 'loss/train': 1.2453397512435913} -08/30/2021 19:49:01 - INFO - __main__ - Step 36598: {'lr': 0.00043555996248741157, 'samples': 7026816, 'steps': 36597, 'loss/train': 1.4067848920822144} -08/30/2021 19:49:01 - INFO - __main__ - Step 36599: {'lr': 0.00043555640621409874, 'samples': 7027008, 'steps': 36598, 'loss/train': 0.9534721374511719} -08/30/2021 19:49:03 - INFO - __main__ - Step 36600: {'lr': 0.000435552849857177, 'samples': 7027200, 'steps': 36599, 'loss/train': 1.4208219051361084} -08/30/2021 19:49:03 - INFO - __main__ - Step 36601: {'lr': 0.0004355492934166481, 'samples': 7027392, 'steps': 36600, 'loss/train': 0.06765236705541611} -08/30/2021 19:49:03 - INFO - __main__ - Step 36602: {'lr': 0.00043554573689251355, 'samples': 7027584, 'steps': 36601, 'loss/train': 1.4174158573150635} -08/30/2021 19:49:04 - INFO - __main__ - Step 36603: {'lr': 0.00043554218028477493, 'samples': 7027776, 'steps': 36602, 'loss/train': 1.5248489379882812} -08/30/2021 19:49:04 - INFO - __main__ - Step 36604: {'lr': 0.0004355386235934339, 'samples': 7027968, 'steps': 36603, 'loss/train': 1.6492342948913574} -08/30/2021 19:49:05 - INFO - __main__ - Step 36605: {'lr': 0.0004355350668184919, 'samples': 7028160, 'steps': 36604, 'loss/train': 1.1743378639221191} -08/30/2021 19:49:06 - INFO - __main__ - Step 36606: {'lr': 0.0004355315099599508, 'samples': 7028352, 'steps': 36605, 'loss/train': 0.7627246379852295} -08/30/2021 19:49:06 - INFO - __main__ - Step 36607: {'lr': 0.000435527953017812, 'samples': 7028544, 'steps': 36606, 'loss/train': 1.5173484086990356} -08/30/2021 19:49:07 - INFO - __main__ - Step 36608: {'lr': 0.00043552439599207714, 'samples': 7028736, 'steps': 36607, 'loss/train': 1.3291195631027222} -08/30/2021 19:49:07 - INFO - __main__ - Step 36609: {'lr': 0.00043552083888274794, 'samples': 7028928, 'steps': 36608, 'loss/train': 2.4523611068725586} -08/30/2021 19:49:09 - INFO - __main__ - Step 36610: {'lr': 0.00043551728168982583, 'samples': 7029120, 'steps': 36609, 'loss/train': 1.1981136798858643} -08/30/2021 19:49:09 - INFO - __main__ - Step 36611: {'lr': 0.0004355137244133126, 'samples': 7029312, 'steps': 36610, 'loss/train': 1.184779167175293} -08/30/2021 19:49:10 - INFO - __main__ - Step 36612: {'lr': 0.00043551016705320965, 'samples': 7029504, 'steps': 36611, 'loss/train': 1.491159200668335} -08/30/2021 19:49:10 - INFO - __main__ - Step 36613: {'lr': 0.00043550660960951874, 'samples': 7029696, 'steps': 36612, 'loss/train': 0.6981892585754395} -08/30/2021 19:49:10 - INFO - __main__ - Step 36614: {'lr': 0.0004355030520822414, 'samples': 7029888, 'steps': 36613, 'loss/train': 1.2497870922088623} -08/30/2021 19:49:12 - INFO - __main__ - Step 36615: {'lr': 0.00043549949447137915, 'samples': 7030080, 'steps': 36614, 'loss/train': 1.1743836402893066} -08/30/2021 19:49:12 - INFO - __main__ - Step 36616: {'lr': 0.00043549593677693385, 'samples': 7030272, 'steps': 36615, 'loss/train': 1.3580169677734375} -08/30/2021 19:49:13 - INFO - __main__ - Step 36617: {'lr': 0.0004354923789989068, 'samples': 7030464, 'steps': 36616, 'loss/train': 1.4517509937286377} -08/30/2021 19:49:13 - INFO - __main__ - Step 36618: {'lr': 0.0004354888211372998, 'samples': 7030656, 'steps': 36617, 'loss/train': 0.4366558790206909} -08/30/2021 19:49:13 - INFO - __main__ - Step 36619: {'lr': 0.0004354852631921145, 'samples': 7030848, 'steps': 36618, 'loss/train': 1.0512324571609497} -08/30/2021 19:49:15 - INFO - __main__ - Step 36620: {'lr': 0.0004354817051633523, 'samples': 7031040, 'steps': 36619, 'loss/train': 1.2595950365066528} -08/30/2021 19:49:15 - INFO - __main__ - Step 36621: {'lr': 0.00043547814705101486, 'samples': 7031232, 'steps': 36620, 'loss/train': 2.4898011684417725} -08/30/2021 19:49:16 - INFO - __main__ - Step 36622: {'lr': 0.00043547458885510393, 'samples': 7031424, 'steps': 36621, 'loss/train': 1.334200143814087} -08/30/2021 19:49:16 - INFO - __main__ - Step 36623: {'lr': 0.00043547103057562097, 'samples': 7031616, 'steps': 36622, 'loss/train': 1.209738850593567} -08/30/2021 19:49:16 - INFO - __main__ - Step 36624: {'lr': 0.00043546747221256764, 'samples': 7031808, 'steps': 36623, 'loss/train': 3.094558000564575} -08/30/2021 19:49:17 - INFO - __main__ - Step 36625: {'lr': 0.00043546391376594553, 'samples': 7032000, 'steps': 36624, 'loss/train': 1.9644629955291748} -08/30/2021 19:49:18 - INFO - __main__ - Step 36626: {'lr': 0.0004354603552357562, 'samples': 7032192, 'steps': 36625, 'loss/train': 1.131923794746399} -08/30/2021 19:49:19 - INFO - __main__ - Step 36627: {'lr': 0.0004354567966220013, 'samples': 7032384, 'steps': 36626, 'loss/train': 1.3133677244186401} -08/30/2021 19:49:19 - INFO - __main__ - Step 36628: {'lr': 0.0004354532379246825, 'samples': 7032576, 'steps': 36627, 'loss/train': 1.3306858539581299} -08/30/2021 19:49:19 - INFO - __main__ - Step 36629: {'lr': 0.0004354496791438013, 'samples': 7032768, 'steps': 36628, 'loss/train': 1.0869311094284058} -08/30/2021 19:49:20 - INFO - __main__ - Step 36630: {'lr': 0.0004354461202793593, 'samples': 7032960, 'steps': 36629, 'loss/train': 1.7309787273406982} -08/30/2021 19:49:21 - INFO - __main__ - Step 36631: {'lr': 0.00043544256133135815, 'samples': 7033152, 'steps': 36630, 'loss/train': 0.3938276767730713} -08/30/2021 19:49:22 - INFO - __main__ - Step 36632: {'lr': 0.0004354390022997995, 'samples': 7033344, 'steps': 36631, 'loss/train': 1.2225375175476074} -08/30/2021 19:49:22 - INFO - __main__ - Step 36633: {'lr': 0.0004354354431846848, 'samples': 7033536, 'steps': 36632, 'loss/train': 1.5289702415466309} -08/30/2021 19:49:22 - INFO - __main__ - Step 36634: {'lr': 0.00043543188398601586, 'samples': 7033728, 'steps': 36633, 'loss/train': 1.410776138305664} -08/30/2021 19:49:23 - INFO - __main__ - Step 36635: {'lr': 0.00043542832470379415, 'samples': 7033920, 'steps': 36634, 'loss/train': 0.9819300174713135} -08/30/2021 19:49:24 - INFO - __main__ - Step 36636: {'lr': 0.0004354247653380212, 'samples': 7034112, 'steps': 36635, 'loss/train': 0.7413052916526794} -08/30/2021 19:49:25 - INFO - __main__ - Step 36637: {'lr': 0.00043542120588869885, 'samples': 7034304, 'steps': 36636, 'loss/train': 1.367821216583252} -08/30/2021 19:49:25 - INFO - __main__ - Step 36638: {'lr': 0.0004354176463558284, 'samples': 7034496, 'steps': 36637, 'loss/train': 1.754111647605896} -08/30/2021 19:49:25 - INFO - __main__ - Step 36639: {'lr': 0.00043541408673941173, 'samples': 7034688, 'steps': 36638, 'loss/train': 1.5507147312164307} -08/30/2021 19:49:26 - INFO - __main__ - Step 36640: {'lr': 0.00043541052703945034, 'samples': 7034880, 'steps': 36639, 'loss/train': 1.081290602684021} -08/30/2021 19:49:28 - INFO - __main__ - Step 36641: {'lr': 0.0004354069672559458, 'samples': 7035072, 'steps': 36640, 'loss/train': 1.4214664697647095} -08/30/2021 19:49:28 - INFO - __main__ - Step 36642: {'lr': 0.0004354034073888997, 'samples': 7035264, 'steps': 36641, 'loss/train': 0.8091091513633728} -08/30/2021 19:49:29 - INFO - __main__ - Step 36643: {'lr': 0.00043539984743831375, 'samples': 7035456, 'steps': 36642, 'loss/train': 0.8957213759422302} -08/30/2021 19:49:29 - INFO - __main__ - Step 36644: {'lr': 0.0004353962874041895, 'samples': 7035648, 'steps': 36643, 'loss/train': 0.9911098480224609} -08/30/2021 19:49:29 - INFO - __main__ - Step 36645: {'lr': 0.0004353927272865285, 'samples': 7035840, 'steps': 36644, 'loss/train': 1.4371337890625} -08/30/2021 19:49:30 - INFO - __main__ - Step 36646: {'lr': 0.0004353891670853324, 'samples': 7036032, 'steps': 36645, 'loss/train': 2.2173895835876465} -08/30/2021 19:49:30 - INFO - __main__ - Step 36647: {'lr': 0.00043538560680060287, 'samples': 7036224, 'steps': 36646, 'loss/train': 1.6057382822036743} -08/30/2021 19:49:32 - INFO - __main__ - Step 36648: {'lr': 0.00043538204643234137, 'samples': 7036416, 'steps': 36647, 'loss/train': 1.1364264488220215} -08/30/2021 19:49:32 - INFO - __main__ - Step 36649: {'lr': 0.0004353784859805496, 'samples': 7036608, 'steps': 36648, 'loss/train': 1.198661208152771} -08/30/2021 19:49:33 - INFO - __main__ - Step 36650: {'lr': 0.00043537492544522917, 'samples': 7036800, 'steps': 36649, 'loss/train': 1.7976967096328735} -08/30/2021 19:49:33 - INFO - __main__ - Step 36651: {'lr': 0.0004353713648263816, 'samples': 7036992, 'steps': 36650, 'loss/train': 1.2448914051055908} -08/30/2021 19:49:33 - INFO - __main__ - Step 36652: {'lr': 0.00043536780412400857, 'samples': 7037184, 'steps': 36651, 'loss/train': 1.5411320924758911} -08/30/2021 19:49:35 - INFO - __main__ - Step 36653: {'lr': 0.0004353642433381117, 'samples': 7037376, 'steps': 36652, 'loss/train': 1.1788196563720703} -08/30/2021 19:49:35 - INFO - __main__ - Step 36654: {'lr': 0.00043536068246869254, 'samples': 7037568, 'steps': 36653, 'loss/train': 1.728651762008667} -08/30/2021 19:49:36 - INFO - __main__ - Step 36655: {'lr': 0.00043535712151575274, 'samples': 7037760, 'steps': 36654, 'loss/train': 1.6517583131790161} -08/30/2021 19:49:36 - INFO - __main__ - Step 36656: {'lr': 0.00043535356047929387, 'samples': 7037952, 'steps': 36655, 'loss/train': 1.6122596263885498} -08/30/2021 19:49:36 - INFO - __main__ - Step 36657: {'lr': 0.0004353499993593176, 'samples': 7038144, 'steps': 36656, 'loss/train': 1.6522592306137085} -08/30/2021 19:49:38 - INFO - __main__ - Step 36658: {'lr': 0.0004353464381558254, 'samples': 7038336, 'steps': 36657, 'loss/train': 1.2207783460617065} -08/30/2021 19:49:38 - INFO - __main__ - Step 36659: {'lr': 0.00043534287686881895, 'samples': 7038528, 'steps': 36658, 'loss/train': 1.5376250743865967} -08/30/2021 19:49:39 - INFO - __main__ - Step 36660: {'lr': 0.00043533931549829993, 'samples': 7038720, 'steps': 36659, 'loss/train': 0.8740956783294678} -08/30/2021 19:49:39 - INFO - __main__ - Step 36661: {'lr': 0.00043533575404426986, 'samples': 7038912, 'steps': 36660, 'loss/train': 1.4214528799057007} -08/30/2021 19:49:39 - INFO - __main__ - Step 36662: {'lr': 0.0004353321925067303, 'samples': 7039104, 'steps': 36661, 'loss/train': 1.2832437753677368} -08/30/2021 19:49:41 - INFO - __main__ - Step 36663: {'lr': 0.0004353286308856829, 'samples': 7039296, 'steps': 36662, 'loss/train': 0.044129423797130585} -08/30/2021 19:49:42 - INFO - __main__ - Step 36664: {'lr': 0.00043532506918112933, 'samples': 7039488, 'steps': 36663, 'loss/train': 1.424027442932129} -08/30/2021 19:49:42 - INFO - __main__ - Step 36665: {'lr': 0.0004353215073930712, 'samples': 7039680, 'steps': 36664, 'loss/train': 1.690145492553711} -08/30/2021 19:49:43 - INFO - __main__ - Step 36666: {'lr': 0.00043531794552150994, 'samples': 7039872, 'steps': 36665, 'loss/train': 0.25014355778694153} -08/30/2021 19:49:43 - INFO - __main__ - Step 36667: {'lr': 0.0004353143835664474, 'samples': 7040064, 'steps': 36666, 'loss/train': 0.4051026403903961} -08/30/2021 19:49:44 - INFO - __main__ - Step 36668: {'lr': 0.00043531082152788495, 'samples': 7040256, 'steps': 36667, 'loss/train': 0.6898967027664185} -08/30/2021 19:49:45 - INFO - __main__ - Step 36669: {'lr': 0.0004353072594058243, 'samples': 7040448, 'steps': 36668, 'loss/train': 1.3379818201065063} -08/30/2021 19:49:45 - INFO - __main__ - Step 36670: {'lr': 0.0004353036972002671, 'samples': 7040640, 'steps': 36669, 'loss/train': 1.7584658861160278} -08/30/2021 19:49:46 - INFO - __main__ - Step 36671: {'lr': 0.00043530013491121497, 'samples': 7040832, 'steps': 36670, 'loss/train': 1.6686280965805054} -08/30/2021 19:49:46 - INFO - __main__ - Step 36672: {'lr': 0.00043529657253866936, 'samples': 7041024, 'steps': 36671, 'loss/train': 1.2137001752853394} -08/30/2021 19:49:47 - INFO - __main__ - Step 36673: {'lr': 0.000435293010082632, 'samples': 7041216, 'steps': 36672, 'loss/train': 1.3776910305023193} -08/30/2021 19:49:48 - INFO - __main__ - Step 36674: {'lr': 0.0004352894475431045, 'samples': 7041408, 'steps': 36673, 'loss/train': 1.8339715003967285} -08/30/2021 19:49:48 - INFO - __main__ - Step 36675: {'lr': 0.0004352858849200885, 'samples': 7041600, 'steps': 36674, 'loss/train': 0.048947595059871674} -08/30/2021 19:49:49 - INFO - __main__ - Step 36676: {'lr': 0.0004352823222135854, 'samples': 7041792, 'steps': 36675, 'loss/train': 1.431644320487976} -08/30/2021 19:49:49 - INFO - __main__ - Step 36677: {'lr': 0.00043527875942359697, 'samples': 7041984, 'steps': 36676, 'loss/train': 1.2802859544754028} -08/30/2021 19:49:50 - INFO - __main__ - Step 36678: {'lr': 0.0004352751965501248, 'samples': 7042176, 'steps': 36677, 'loss/train': 1.8463026285171509} -08/30/2021 19:49:51 - INFO - __main__ - Step 36679: {'lr': 0.0004352716335931706, 'samples': 7042368, 'steps': 36678, 'loss/train': 1.1140857934951782} -08/30/2021 19:49:51 - INFO - __main__ - Step 36680: {'lr': 0.0004352680705527357, 'samples': 7042560, 'steps': 36679, 'loss/train': 1.790854811668396} -08/30/2021 19:49:52 - INFO - __main__ - Step 36681: {'lr': 0.00043526450742882193, 'samples': 7042752, 'steps': 36680, 'loss/train': 1.316838264465332} -08/30/2021 19:49:52 - INFO - __main__ - Step 36682: {'lr': 0.0004352609442214309, 'samples': 7042944, 'steps': 36681, 'loss/train': 1.2183455228805542} -08/30/2021 19:49:54 - INFO - __main__ - Step 36683: {'lr': 0.00043525738093056404, 'samples': 7043136, 'steps': 36682, 'loss/train': 1.3153342008590698} -08/30/2021 19:49:54 - INFO - __main__ - Step 36684: {'lr': 0.0004352538175562231, 'samples': 7043328, 'steps': 36683, 'loss/train': 1.073585867881775} -08/30/2021 19:49:55 - INFO - __main__ - Step 36685: {'lr': 0.00043525025409840967, 'samples': 7043520, 'steps': 36684, 'loss/train': 0.9450781941413879} -08/30/2021 19:49:55 - INFO - __main__ - Step 36686: {'lr': 0.00043524669055712534, 'samples': 7043712, 'steps': 36685, 'loss/train': 1.3040051460266113} -08/30/2021 19:49:55 - INFO - __main__ - Step 36687: {'lr': 0.00043524312693237166, 'samples': 7043904, 'steps': 36686, 'loss/train': 1.2252814769744873} -08/30/2021 19:49:56 - INFO - __main__ - Step 36688: {'lr': 0.0004352395632241504, 'samples': 7044096, 'steps': 36687, 'loss/train': 0.060605812817811966} -08/30/2021 19:49:58 - INFO - __main__ - Step 36689: {'lr': 0.00043523599943246297, 'samples': 7044288, 'steps': 36688, 'loss/train': 0.7352709770202637} -08/30/2021 19:49:58 - INFO - __main__ - Step 36690: {'lr': 0.00043523243555731094, 'samples': 7044480, 'steps': 36689, 'loss/train': 1.1972976922988892} -08/30/2021 19:49:58 - INFO - __main__ - Step 36691: {'lr': 0.00043522887159869617, 'samples': 7044672, 'steps': 36690, 'loss/train': 1.4369250535964966} -08/30/2021 19:49:59 - INFO - __main__ - Step 36692: {'lr': 0.00043522530755662017, 'samples': 7044864, 'steps': 36691, 'loss/train': 1.1358816623687744} -08/30/2021 19:49:59 - INFO - __main__ - Step 36693: {'lr': 0.00043522174343108445, 'samples': 7045056, 'steps': 36692, 'loss/train': 0.2358015775680542} -08/30/2021 19:49:59 - INFO - __main__ - Step 36694: {'lr': 0.00043521817922209064, 'samples': 7045248, 'steps': 36693, 'loss/train': 0.2850950062274933} -08/30/2021 19:50:01 - INFO - __main__ - Step 36695: {'lr': 0.00043521461492964037, 'samples': 7045440, 'steps': 36694, 'loss/train': 1.0765414237976074} -08/30/2021 19:50:02 - INFO - __main__ - Step 36696: {'lr': 0.00043521105055373526, 'samples': 7045632, 'steps': 36695, 'loss/train': 1.4708921909332275} -08/30/2021 19:50:02 - INFO - __main__ - Step 36697: {'lr': 0.000435207486094377, 'samples': 7045824, 'steps': 36696, 'loss/train': 1.1216543912887573} -08/30/2021 19:50:02 - INFO - __main__ - Step 36698: {'lr': 0.00043520392155156694, 'samples': 7046016, 'steps': 36697, 'loss/train': 1.6061737537384033} -08/30/2021 19:50:03 - INFO - __main__ - Step 36699: {'lr': 0.000435200356925307, 'samples': 7046208, 'steps': 36698, 'loss/train': 1.096311092376709} -08/30/2021 19:50:03 - INFO - __main__ - Step 36700: {'lr': 0.0004351967922155986, 'samples': 7046400, 'steps': 36699, 'loss/train': 1.0611648559570312} -08/30/2021 19:50:05 - INFO - __main__ - Step 36701: {'lr': 0.0004351932274224434, 'samples': 7046592, 'steps': 36700, 'loss/train': 1.1511927843093872} -08/30/2021 19:50:05 - INFO - __main__ - Step 36702: {'lr': 0.0004351896625458429, 'samples': 7046784, 'steps': 36701, 'loss/train': 1.3228759765625} -08/30/2021 19:50:05 - INFO - __main__ - Step 36703: {'lr': 0.0004351860975857989, 'samples': 7046976, 'steps': 36702, 'loss/train': 1.0734847784042358} -08/30/2021 19:50:06 - INFO - __main__ - Step 36704: {'lr': 0.00043518253254231276, 'samples': 7047168, 'steps': 36703, 'loss/train': 1.5056232213974} -08/30/2021 19:50:06 - INFO - __main__ - Step 36705: {'lr': 0.00043517896741538634, 'samples': 7047360, 'steps': 36704, 'loss/train': 1.000693678855896} -08/30/2021 19:50:08 - INFO - __main__ - Step 36706: {'lr': 0.0004351754022050212, 'samples': 7047552, 'steps': 36705, 'loss/train': 1.2989751100540161} -08/30/2021 19:50:08 - INFO - __main__ - Step 36707: {'lr': 0.00043517183691121875, 'samples': 7047744, 'steps': 36706, 'loss/train': 1.2257020473480225} -08/30/2021 19:50:09 - INFO - __main__ - Step 36708: {'lr': 0.00043516827153398073, 'samples': 7047936, 'steps': 36707, 'loss/train': 1.4511054754257202} -08/30/2021 19:50:09 - INFO - __main__ - Step 36709: {'lr': 0.0004351647060733088, 'samples': 7048128, 'steps': 36708, 'loss/train': 1.8234800100326538} -08/30/2021 19:50:09 - INFO - __main__ - Step 36710: {'lr': 0.00043516114052920453, 'samples': 7048320, 'steps': 36709, 'loss/train': 1.5382531881332397} -08/30/2021 19:50:11 - INFO - __main__ - Step 36711: {'lr': 0.00043515757490166944, 'samples': 7048512, 'steps': 36710, 'loss/train': 1.3825267553329468} -08/30/2021 19:50:11 - INFO - __main__ - Step 36712: {'lr': 0.00043515400919070526, 'samples': 7048704, 'steps': 36711, 'loss/train': 0.8438291549682617} -08/30/2021 19:50:12 - INFO - __main__ - Step 36713: {'lr': 0.0004351504433963135, 'samples': 7048896, 'steps': 36712, 'loss/train': 1.3279600143432617} -08/30/2021 19:50:12 - INFO - __main__ - Step 36714: {'lr': 0.0004351468775184959, 'samples': 7049088, 'steps': 36713, 'loss/train': 1.023358702659607} -08/30/2021 19:50:12 - INFO - __main__ - Step 36715: {'lr': 0.0004351433115572538, 'samples': 7049280, 'steps': 36714, 'loss/train': 1.5246587991714478} -08/30/2021 19:50:14 - INFO - __main__ - Step 36716: {'lr': 0.00043513974551258913, 'samples': 7049472, 'steps': 36715, 'loss/train': 1.4114965200424194} -08/30/2021 19:50:14 - INFO - __main__ - Step 36717: {'lr': 0.00043513617938450327, 'samples': 7049664, 'steps': 36716, 'loss/train': 1.702172040939331} -08/30/2021 19:50:15 - INFO - __main__ - Step 36718: {'lr': 0.00043513261317299797, 'samples': 7049856, 'steps': 36717, 'loss/train': 0.9815688729286194} -08/30/2021 19:50:15 - INFO - __main__ - Step 36719: {'lr': 0.00043512904687807475, 'samples': 7050048, 'steps': 36718, 'loss/train': 1.148401141166687} -08/30/2021 19:50:15 - INFO - __main__ - Step 36720: {'lr': 0.00043512548049973523, 'samples': 7050240, 'steps': 36719, 'loss/train': 0.8587327003479004} -08/30/2021 19:50:17 - INFO - __main__ - Step 36721: {'lr': 0.00043512191403798095, 'samples': 7050432, 'steps': 36720, 'loss/train': 1.6336232423782349} -08/30/2021 19:50:18 - INFO - __main__ - Step 36722: {'lr': 0.0004351183474928137, 'samples': 7050624, 'steps': 36721, 'loss/train': 1.1510086059570312} -08/30/2021 19:50:18 - INFO - __main__ - Step 36723: {'lr': 0.00043511478086423493, 'samples': 7050816, 'steps': 36722, 'loss/train': 1.3894286155700684} -08/30/2021 19:50:19 - INFO - __main__ - Step 36724: {'lr': 0.0004351112141522463, 'samples': 7051008, 'steps': 36723, 'loss/train': 1.3885177373886108} -08/30/2021 19:50:19 - INFO - __main__ - Step 36725: {'lr': 0.00043510764735684945, 'samples': 7051200, 'steps': 36724, 'loss/train': 1.2266805171966553} -08/30/2021 19:50:20 - INFO - __main__ - Step 36726: {'lr': 0.0004351040804780459, 'samples': 7051392, 'steps': 36725, 'loss/train': 1.6934620141983032} -08/30/2021 19:50:21 - INFO - __main__ - Step 36727: {'lr': 0.00043510051351583733, 'samples': 7051584, 'steps': 36726, 'loss/train': 1.350189447402954} -08/30/2021 19:50:21 - INFO - __main__ - Step 36728: {'lr': 0.0004350969464702254, 'samples': 7051776, 'steps': 36727, 'loss/train': 1.2746144533157349} -08/30/2021 19:50:22 - INFO - __main__ - Step 36729: {'lr': 0.0004350933793412115, 'samples': 7051968, 'steps': 36728, 'loss/train': 1.035346269607544} -08/30/2021 19:50:22 - INFO - __main__ - Step 36730: {'lr': 0.00043508981212879737, 'samples': 7052160, 'steps': 36729, 'loss/train': 1.4221863746643066} -08/30/2021 19:50:22 - INFO - __main__ - Step 36731: {'lr': 0.0004350862448329848, 'samples': 7052352, 'steps': 36730, 'loss/train': 1.3501044511795044} -08/30/2021 19:50:24 - INFO - __main__ - Step 36732: {'lr': 0.00043508267745377504, 'samples': 7052544, 'steps': 36731, 'loss/train': 1.5294417142868042} -08/30/2021 19:50:24 - INFO - __main__ - Step 36733: {'lr': 0.00043507910999117003, 'samples': 7052736, 'steps': 36732, 'loss/train': 1.114034652709961} -08/30/2021 19:50:25 - INFO - __main__ - Step 36734: {'lr': 0.00043507554244517113, 'samples': 7052928, 'steps': 36733, 'loss/train': 1.204210638999939} -08/30/2021 19:50:25 - INFO - __main__ - Step 36735: {'lr': 0.0004350719748157801, 'samples': 7053120, 'steps': 36734, 'loss/train': 1.4735853672027588} -08/30/2021 19:50:25 - INFO - __main__ - Step 36736: {'lr': 0.00043506840710299844, 'samples': 7053312, 'steps': 36735, 'loss/train': 0.8844746947288513} -08/30/2021 19:50:27 - INFO - __main__ - Step 36737: {'lr': 0.00043506483930682785, 'samples': 7053504, 'steps': 36736, 'loss/train': 1.420186161994934} -08/30/2021 19:50:27 - INFO - __main__ - Step 36738: {'lr': 0.0004350612714272699, 'samples': 7053696, 'steps': 36737, 'loss/train': 1.5141267776489258} -08/30/2021 19:50:28 - INFO - __main__ - Step 36739: {'lr': 0.0004350577034643262, 'samples': 7053888, 'steps': 36738, 'loss/train': 1.4006013870239258} -08/30/2021 19:50:28 - INFO - __main__ - Step 36740: {'lr': 0.0004350541354179983, 'samples': 7054080, 'steps': 36739, 'loss/train': 1.53284752368927} -08/30/2021 19:50:28 - INFO - __main__ - Step 36741: {'lr': 0.00043505056728828794, 'samples': 7054272, 'steps': 36740, 'loss/train': 0.5731781721115112} -08/30/2021 19:50:30 - INFO - __main__ - Step 36742: {'lr': 0.0004350469990751966, 'samples': 7054464, 'steps': 36741, 'loss/train': 1.130262017250061} -08/30/2021 19:50:30 - INFO - __main__ - Step 36743: {'lr': 0.000435043430778726, 'samples': 7054656, 'steps': 36742, 'loss/train': 2.417330265045166} -08/30/2021 19:50:31 - INFO - __main__ - Step 36744: {'lr': 0.00043503986239887765, 'samples': 7054848, 'steps': 36743, 'loss/train': 1.7894667387008667} -08/30/2021 19:50:31 - INFO - __main__ - Step 36745: {'lr': 0.0004350362939356532, 'samples': 7055040, 'steps': 36744, 'loss/train': 1.0532146692276} -08/30/2021 19:50:31 - INFO - __main__ - Step 36746: {'lr': 0.00043503272538905423, 'samples': 7055232, 'steps': 36745, 'loss/train': 1.0075383186340332} -08/30/2021 19:50:33 - INFO - __main__ - Step 36747: {'lr': 0.0004350291567590824, 'samples': 7055424, 'steps': 36746, 'loss/train': 1.5667258501052856} -08/30/2021 19:50:33 - INFO - __main__ - Step 36748: {'lr': 0.00043502558804573924, 'samples': 7055616, 'steps': 36747, 'loss/train': 1.3375009298324585} -08/30/2021 19:50:34 - INFO - __main__ - Step 36749: {'lr': 0.0004350220192490264, 'samples': 7055808, 'steps': 36748, 'loss/train': 1.066444993019104} -08/30/2021 19:50:34 - INFO - __main__ - Step 36750: {'lr': 0.00043501845036894555, 'samples': 7056000, 'steps': 36749, 'loss/train': 1.5496065616607666} -08/30/2021 19:50:34 - INFO - __main__ - Step 36751: {'lr': 0.00043501488140549824, 'samples': 7056192, 'steps': 36750, 'loss/train': 1.5164856910705566} -08/30/2021 19:50:36 - INFO - __main__ - Step 36752: {'lr': 0.000435011312358686, 'samples': 7056384, 'steps': 36751, 'loss/train': 1.5143030881881714} -08/30/2021 19:50:36 - INFO - __main__ - Step 36753: {'lr': 0.0004350077432285106, 'samples': 7056576, 'steps': 36752, 'loss/train': 1.4826269149780273} -08/30/2021 19:50:37 - INFO - __main__ - Step 36754: {'lr': 0.0004350041740149735, 'samples': 7056768, 'steps': 36753, 'loss/train': 1.3413727283477783} -08/30/2021 19:50:37 - INFO - __main__ - Step 36755: {'lr': 0.00043500060471807645, 'samples': 7056960, 'steps': 36754, 'loss/train': 1.3902397155761719} -08/30/2021 19:50:37 - INFO - __main__ - Step 36756: {'lr': 0.000434997035337821, 'samples': 7057152, 'steps': 36755, 'loss/train': 1.5261427164077759} -08/30/2021 19:50:38 - INFO - __main__ - Step 36757: {'lr': 0.0004349934658742086, 'samples': 7057344, 'steps': 36756, 'loss/train': 1.793416142463684} -08/30/2021 19:50:39 - INFO - __main__ - Step 36758: {'lr': 0.00043498989632724105, 'samples': 7057536, 'steps': 36757, 'loss/train': 0.07235637307167053} -08/30/2021 19:50:40 - INFO - __main__ - Step 36759: {'lr': 0.00043498632669692, 'samples': 7057728, 'steps': 36758, 'loss/train': 1.0857549905776978} -08/30/2021 19:50:40 - INFO - __main__ - Step 36760: {'lr': 0.0004349827569832469, 'samples': 7057920, 'steps': 36759, 'loss/train': 1.811194896697998} -08/30/2021 19:50:41 - INFO - __main__ - Step 36761: {'lr': 0.00043497918718622344, 'samples': 7058112, 'steps': 36760, 'loss/train': 1.170149326324463} -08/30/2021 19:50:41 - INFO - __main__ - Step 36762: {'lr': 0.0004349756173058512, 'samples': 7058304, 'steps': 36761, 'loss/train': 1.4687120914459229} -08/30/2021 19:50:43 - INFO - __main__ - Step 36763: {'lr': 0.0004349720473421318, 'samples': 7058496, 'steps': 36762, 'loss/train': 1.5276732444763184} -08/30/2021 19:50:43 - INFO - __main__ - Step 36764: {'lr': 0.00043496847729506685, 'samples': 7058688, 'steps': 36763, 'loss/train': 1.513434648513794} -08/30/2021 19:50:43 - INFO - __main__ - Step 36765: {'lr': 0.000434964907164658, 'samples': 7058880, 'steps': 36764, 'loss/train': 0.8090911507606506} -08/30/2021 19:50:44 - INFO - __main__ - Step 36766: {'lr': 0.0004349613369509067, 'samples': 7059072, 'steps': 36765, 'loss/train': 1.393768072128296} -08/30/2021 19:50:44 - INFO - __main__ - Step 36767: {'lr': 0.0004349577666538148, 'samples': 7059264, 'steps': 36766, 'loss/train': 1.1167211532592773} -08/30/2021 19:50:46 - INFO - __main__ - Step 36768: {'lr': 0.0004349541962733837, 'samples': 7059456, 'steps': 36767, 'loss/train': 1.119260549545288} -08/30/2021 19:50:46 - INFO - __main__ - Step 36769: {'lr': 0.0004349506258096152, 'samples': 7059648, 'steps': 36768, 'loss/train': 1.2865499258041382} -08/30/2021 19:50:46 - INFO - __main__ - Step 36770: {'lr': 0.00043494705526251064, 'samples': 7059840, 'steps': 36769, 'loss/train': 1.5907214879989624} -08/30/2021 19:50:47 - INFO - __main__ - Step 36771: {'lr': 0.00043494348463207197, 'samples': 7060032, 'steps': 36770, 'loss/train': 1.2490900754928589} -08/30/2021 19:50:47 - INFO - __main__ - Step 36772: {'lr': 0.0004349399139183005, 'samples': 7060224, 'steps': 36771, 'loss/train': 1.3989109992980957} -08/30/2021 19:50:50 - INFO - __main__ - Step 36773: {'lr': 0.000434936343121198, 'samples': 7060416, 'steps': 36772, 'loss/train': 0.5802854895591736} -08/30/2021 19:50:50 - INFO - __main__ - Step 36774: {'lr': 0.000434932772240766, 'samples': 7060608, 'steps': 36773, 'loss/train': 2.3337364196777344} -08/30/2021 19:50:50 - INFO - __main__ - Step 36775: {'lr': 0.0004349292012770062, 'samples': 7060800, 'steps': 36774, 'loss/train': 1.7584441900253296} -08/30/2021 19:50:51 - INFO - __main__ - Step 36776: {'lr': 0.00043492563022992013, 'samples': 7060992, 'steps': 36775, 'loss/train': 0.41401219367980957} -08/30/2021 19:50:51 - INFO - __main__ - Step 36777: {'lr': 0.00043492205909950943, 'samples': 7061184, 'steps': 36776, 'loss/train': 1.0634077787399292} -08/30/2021 19:50:52 - INFO - __main__ - Step 36778: {'lr': 0.0004349184878857757, 'samples': 7061376, 'steps': 36777, 'loss/train': 0.6090685725212097} -08/30/2021 19:50:53 - INFO - __main__ - Step 36779: {'lr': 0.0004349149165887205, 'samples': 7061568, 'steps': 36778, 'loss/train': 2.570732593536377} -08/30/2021 19:50:53 - INFO - __main__ - Step 36780: {'lr': 0.0004349113452083456, 'samples': 7061760, 'steps': 36779, 'loss/train': 1.5769164562225342} -08/30/2021 19:50:54 - INFO - __main__ - Step 36781: {'lr': 0.00043490777374465244, 'samples': 7061952, 'steps': 36780, 'loss/train': 1.5659064054489136} -08/30/2021 19:50:54 - INFO - __main__ - Step 36782: {'lr': 0.0004349042021976427, 'samples': 7062144, 'steps': 36781, 'loss/train': 1.8731383085250854} -08/30/2021 19:50:55 - INFO - __main__ - Step 36783: {'lr': 0.000434900630567318, 'samples': 7062336, 'steps': 36782, 'loss/train': 1.11239492893219} -08/30/2021 19:50:56 - INFO - __main__ - Step 36784: {'lr': 0.00043489705885367986, 'samples': 7062528, 'steps': 36783, 'loss/train': 1.7922813892364502} -08/30/2021 19:50:56 - INFO - __main__ - Step 36785: {'lr': 0.00043489348705673, 'samples': 7062720, 'steps': 36784, 'loss/train': 1.6734100580215454} -08/30/2021 19:50:57 - INFO - __main__ - Step 36786: {'lr': 0.00043488991517647, 'samples': 7062912, 'steps': 36785, 'loss/train': 1.780049443244934} -08/30/2021 19:50:57 - INFO - __main__ - Step 36787: {'lr': 0.00043488634321290146, 'samples': 7063104, 'steps': 36786, 'loss/train': 1.3812592029571533} -08/30/2021 19:50:57 - INFO - __main__ - Step 36788: {'lr': 0.000434882771166026, 'samples': 7063296, 'steps': 36787, 'loss/train': 1.7514374256134033} -08/30/2021 19:50:58 - INFO - __main__ - Step 36789: {'lr': 0.00043487919903584515, 'samples': 7063488, 'steps': 36788, 'loss/train': 1.6486750841140747} -08/30/2021 19:51:00 - INFO - __main__ - Step 36790: {'lr': 0.00043487562682236066, 'samples': 7063680, 'steps': 36789, 'loss/train': 1.6784473657608032} -08/30/2021 19:51:00 - INFO - __main__ - Step 36791: {'lr': 0.000434872054525574, 'samples': 7063872, 'steps': 36790, 'loss/train': 1.5071698427200317} -08/30/2021 19:51:01 - INFO - __main__ - Step 36792: {'lr': 0.00043486848214548693, 'samples': 7064064, 'steps': 36791, 'loss/train': 0.7901178002357483} -08/30/2021 19:51:01 - INFO - __main__ - Step 36793: {'lr': 0.0004348649096821009, 'samples': 7064256, 'steps': 36792, 'loss/train': 1.458463191986084} -08/30/2021 19:51:01 - INFO - __main__ - Step 36794: {'lr': 0.0004348613371354176, 'samples': 7064448, 'steps': 36793, 'loss/train': 2.257478952407837} -08/30/2021 19:51:04 - INFO - __main__ - Step 36795: {'lr': 0.0004348577645054387, 'samples': 7064640, 'steps': 36794, 'loss/train': 0.14407555758953094} -08/30/2021 19:51:04 - INFO - __main__ - Step 36796: {'lr': 0.0004348541917921657, 'samples': 7064832, 'steps': 36795, 'loss/train': 1.0325839519500732} -08/30/2021 19:51:04 - INFO - __main__ - Step 36797: {'lr': 0.0004348506189956002, 'samples': 7065024, 'steps': 36796, 'loss/train': 1.8709971904754639} -08/30/2021 19:51:05 - INFO - __main__ - Step 36798: {'lr': 0.0004348470461157439, 'samples': 7065216, 'steps': 36797, 'loss/train': 1.183646321296692} -08/30/2021 19:51:05 - INFO - __main__ - Step 36799: {'lr': 0.0004348434731525984, 'samples': 7065408, 'steps': 36798, 'loss/train': 1.7938910722732544} -08/30/2021 19:51:05 - INFO - __main__ - Step 36800: {'lr': 0.00043483990010616524, 'samples': 7065600, 'steps': 36799, 'loss/train': 1.2465991973876953} -08/30/2021 19:51:07 - INFO - __main__ - Step 36801: {'lr': 0.00043483632697644616, 'samples': 7065792, 'steps': 36800, 'loss/train': 0.11328092962503433} -08/30/2021 19:51:08 - INFO - __main__ - Step 36802: {'lr': 0.00043483275376344257, 'samples': 7065984, 'steps': 36801, 'loss/train': 1.626562237739563} -08/30/2021 19:51:08 - INFO - __main__ - Step 36803: {'lr': 0.00043482918046715627, 'samples': 7066176, 'steps': 36802, 'loss/train': 0.9440440535545349} -08/30/2021 19:51:08 - INFO - __main__ - Step 36804: {'lr': 0.00043482560708758876, 'samples': 7066368, 'steps': 36803, 'loss/train': 1.7031415700912476} -08/30/2021 19:51:09 - INFO - __main__ - Step 36805: {'lr': 0.0004348220336247417, 'samples': 7066560, 'steps': 36804, 'loss/train': 1.7413356304168701} -08/30/2021 19:51:09 - INFO - __main__ - Step 36806: {'lr': 0.0004348184600786167, 'samples': 7066752, 'steps': 36805, 'loss/train': 1.2216918468475342} -08/30/2021 19:51:10 - INFO - __main__ - Step 36807: {'lr': 0.0004348148864492153, 'samples': 7066944, 'steps': 36806, 'loss/train': 1.392309546470642} -08/30/2021 19:51:11 - INFO - __main__ - Step 36808: {'lr': 0.00043481131273653926, 'samples': 7067136, 'steps': 36807, 'loss/train': 0.5392890572547913} -08/30/2021 19:51:11 - INFO - __main__ - Step 36809: {'lr': 0.00043480773894059, 'samples': 7067328, 'steps': 36808, 'loss/train': 1.9753751754760742} -08/30/2021 19:51:12 - INFO - __main__ - Step 36810: {'lr': 0.0004348041650613692, 'samples': 7067520, 'steps': 36809, 'loss/train': 1.767722249031067} -08/30/2021 19:51:12 - INFO - __main__ - Step 36811: {'lr': 0.0004348005910988786, 'samples': 7067712, 'steps': 36810, 'loss/train': 1.9477856159210205} -08/30/2021 19:51:14 - INFO - __main__ - Step 36812: {'lr': 0.0004347970170531197, 'samples': 7067904, 'steps': 36811, 'loss/train': 3.1116228103637695} -08/30/2021 19:51:14 - INFO - __main__ - Step 36813: {'lr': 0.000434793442924094, 'samples': 7068096, 'steps': 36812, 'loss/train': 1.2393287420272827} -08/30/2021 19:51:14 - INFO - __main__ - Step 36814: {'lr': 0.0004347898687118033, 'samples': 7068288, 'steps': 36813, 'loss/train': 1.3419828414916992} -08/30/2021 19:51:15 - INFO - __main__ - Step 36815: {'lr': 0.0004347862944162492, 'samples': 7068480, 'steps': 36814, 'loss/train': 1.2952697277069092} -08/30/2021 19:51:15 - INFO - __main__ - Step 36816: {'lr': 0.00043478272003743315, 'samples': 7068672, 'steps': 36815, 'loss/train': 1.283370852470398} -08/30/2021 19:51:17 - INFO - __main__ - Step 36817: {'lr': 0.0004347791455753569, 'samples': 7068864, 'steps': 36816, 'loss/train': 2.282930374145508} -08/30/2021 19:51:17 - INFO - __main__ - Step 36818: {'lr': 0.00043477557103002197, 'samples': 7069056, 'steps': 36817, 'loss/train': 1.0517560243606567} -08/30/2021 19:51:17 - INFO - __main__ - Step 36819: {'lr': 0.00043477199640143004, 'samples': 7069248, 'steps': 36818, 'loss/train': 1.9354766607284546} -08/30/2021 19:51:18 - INFO - __main__ - Step 36820: {'lr': 0.00043476842168958276, 'samples': 7069440, 'steps': 36819, 'loss/train': 1.3237605094909668} -08/30/2021 19:51:18 - INFO - __main__ - Step 36821: {'lr': 0.0004347648468944816, 'samples': 7069632, 'steps': 36820, 'loss/train': 2.9693386554718018} -08/30/2021 19:51:20 - INFO - __main__ - Step 36822: {'lr': 0.0004347612720161283, 'samples': 7069824, 'steps': 36821, 'loss/train': 1.0591917037963867} -08/30/2021 19:51:20 - INFO - __main__ - Step 36823: {'lr': 0.00043475769705452437, 'samples': 7070016, 'steps': 36822, 'loss/train': 0.6354339122772217} -08/30/2021 19:51:20 - INFO - __main__ - Step 36824: {'lr': 0.00043475412200967155, 'samples': 7070208, 'steps': 36823, 'loss/train': 0.27789032459259033} -08/30/2021 19:51:21 - INFO - __main__ - Step 36825: {'lr': 0.00043475054688157136, 'samples': 7070400, 'steps': 36824, 'loss/train': 1.7641217708587646} -08/30/2021 19:51:21 - INFO - __main__ - Step 36826: {'lr': 0.00043474697167022536, 'samples': 7070592, 'steps': 36825, 'loss/train': 1.9912052154541016} -08/30/2021 19:51:22 - INFO - __main__ - Step 36827: {'lr': 0.0004347433963756353, 'samples': 7070784, 'steps': 36826, 'loss/train': 1.850598692893982} -08/30/2021 19:51:23 - INFO - __main__ - Step 36828: {'lr': 0.0004347398209978027, 'samples': 7070976, 'steps': 36827, 'loss/train': 1.684794306755066} -08/30/2021 19:51:23 - INFO - __main__ - Step 36829: {'lr': 0.0004347362455367292, 'samples': 7071168, 'steps': 36828, 'loss/train': 1.0775448083877563} -08/30/2021 19:51:24 - INFO - __main__ - Step 36830: {'lr': 0.0004347326699924163, 'samples': 7071360, 'steps': 36829, 'loss/train': 0.7445506453514099} -08/30/2021 19:51:24 - INFO - __main__ - Step 36831: {'lr': 0.0004347290943648658, 'samples': 7071552, 'steps': 36830, 'loss/train': 1.5281739234924316} -08/30/2021 19:51:24 - INFO - __main__ - Step 36832: {'lr': 0.00043472551865407917, 'samples': 7071744, 'steps': 36831, 'loss/train': 1.7025636434555054} -08/30/2021 19:51:27 - INFO - __main__ - Step 36833: {'lr': 0.0004347219428600581, 'samples': 7071936, 'steps': 36832, 'loss/train': 1.5944740772247314} -08/30/2021 19:51:27 - INFO - __main__ - Step 36834: {'lr': 0.0004347183669828042, 'samples': 7072128, 'steps': 36833, 'loss/train': 1.6958502531051636} -08/30/2021 19:51:27 - INFO - __main__ - Step 36835: {'lr': 0.00043471479102231904, 'samples': 7072320, 'steps': 36834, 'loss/train': 1.7756755352020264} -08/30/2021 19:51:28 - INFO - __main__ - Step 36836: {'lr': 0.0004347112149786042, 'samples': 7072512, 'steps': 36835, 'loss/train': 1.0302866697311401} -08/30/2021 19:51:28 - INFO - __main__ - Step 36837: {'lr': 0.0004347076388516614, 'samples': 7072704, 'steps': 36836, 'loss/train': 2.2028441429138184} -08/30/2021 19:51:29 - INFO - __main__ - Step 36838: {'lr': 0.00043470406264149215, 'samples': 7072896, 'steps': 36837, 'loss/train': 1.542486310005188} -08/30/2021 19:51:30 - INFO - __main__ - Step 36839: {'lr': 0.00043470048634809813, 'samples': 7073088, 'steps': 36838, 'loss/train': 1.6159751415252686} -08/30/2021 19:51:30 - INFO - __main__ - Step 36840: {'lr': 0.00043469690997148086, 'samples': 7073280, 'steps': 36839, 'loss/train': 1.5094271898269653} -08/30/2021 19:51:31 - INFO - __main__ - Step 36841: {'lr': 0.00043469333351164207, 'samples': 7073472, 'steps': 36840, 'loss/train': 1.7073278427124023} -08/30/2021 19:51:31 - INFO - __main__ - Step 36842: {'lr': 0.0004346897569685833, 'samples': 7073664, 'steps': 36841, 'loss/train': 1.5118752717971802} -08/30/2021 19:51:31 - INFO - __main__ - Step 36843: {'lr': 0.00043468618034230613, 'samples': 7073856, 'steps': 36842, 'loss/train': 1.497745394706726} -08/30/2021 19:51:33 - INFO - __main__ - Step 36844: {'lr': 0.00043468260363281234, 'samples': 7074048, 'steps': 36843, 'loss/train': 1.622791051864624} -08/30/2021 19:51:34 - INFO - __main__ - Step 36845: {'lr': 0.0004346790268401033, 'samples': 7074240, 'steps': 36844, 'loss/train': 0.13512659072875977} -08/30/2021 19:51:34 - INFO - __main__ - Step 36846: {'lr': 0.00043467544996418075, 'samples': 7074432, 'steps': 36845, 'loss/train': 1.831268310546875} -08/30/2021 19:51:34 - INFO - __main__ - Step 36847: {'lr': 0.0004346718730050463, 'samples': 7074624, 'steps': 36846, 'loss/train': 1.5660496950149536} -08/30/2021 19:51:35 - INFO - __main__ - Step 36848: {'lr': 0.0004346682959627016, 'samples': 7074816, 'steps': 36847, 'loss/train': 1.698951244354248} -08/30/2021 19:51:35 - INFO - __main__ - Step 36849: {'lr': 0.0004346647188371482, 'samples': 7075008, 'steps': 36848, 'loss/train': 1.3131630420684814} -08/30/2021 19:51:37 - INFO - __main__ - Step 36850: {'lr': 0.00043466114162838765, 'samples': 7075200, 'steps': 36849, 'loss/train': 1.89736807346344} -08/30/2021 19:51:37 - INFO - __main__ - Step 36851: {'lr': 0.00043465756433642175, 'samples': 7075392, 'steps': 36850, 'loss/train': 1.7006425857543945} -08/30/2021 19:51:37 - INFO - __main__ - Step 36852: {'lr': 0.0004346539869612519, 'samples': 7075584, 'steps': 36851, 'loss/train': 1.5596452951431274} -08/30/2021 19:51:38 - INFO - __main__ - Step 36853: {'lr': 0.0004346504095028799, 'samples': 7075776, 'steps': 36852, 'loss/train': 0.6171156764030457} -08/30/2021 19:51:38 - INFO - __main__ - Step 36854: {'lr': 0.00043464683196130726, 'samples': 7075968, 'steps': 36853, 'loss/train': 1.4701935052871704} -08/30/2021 19:51:38 - INFO - __main__ - Step 36855: {'lr': 0.00043464325433653563, 'samples': 7076160, 'steps': 36854, 'loss/train': 0.6239742636680603} -08/30/2021 19:51:40 - INFO - __main__ - Step 36856: {'lr': 0.0004346396766285665, 'samples': 7076352, 'steps': 36855, 'loss/train': 1.4213045835494995} -08/30/2021 19:51:40 - INFO - __main__ - Step 36857: {'lr': 0.0004346360988374016, 'samples': 7076544, 'steps': 36856, 'loss/train': 0.8447583913803101} -08/30/2021 19:51:41 - INFO - __main__ - Step 36858: {'lr': 0.0004346325209630426, 'samples': 7076736, 'steps': 36857, 'loss/train': 1.7020998001098633} -08/30/2021 19:51:41 - INFO - __main__ - Step 36859: {'lr': 0.00043462894300549097, 'samples': 7076928, 'steps': 36858, 'loss/train': 1.4927747249603271} -08/30/2021 19:51:42 - INFO - __main__ - Step 36860: {'lr': 0.0004346253649647485, 'samples': 7077120, 'steps': 36859, 'loss/train': 1.1809659004211426} -08/30/2021 19:51:43 - INFO - __main__ - Step 36861: {'lr': 0.00043462178684081657, 'samples': 7077312, 'steps': 36860, 'loss/train': 1.1880556344985962} -08/30/2021 19:51:43 - INFO - __main__ - Step 36862: {'lr': 0.00043461820863369697, 'samples': 7077504, 'steps': 36861, 'loss/train': 0.9868214726448059} -08/30/2021 19:51:44 - INFO - __main__ - Step 36863: {'lr': 0.0004346146303433912, 'samples': 7077696, 'steps': 36862, 'loss/train': 1.9891897439956665} -08/30/2021 19:51:44 - INFO - __main__ - Step 36864: {'lr': 0.00043461105196990093, 'samples': 7077888, 'steps': 36863, 'loss/train': 1.4800950288772583} -08/30/2021 19:51:44 - INFO - __main__ - Step 36865: {'lr': 0.0004346074735132278, 'samples': 7078080, 'steps': 36864, 'loss/train': 1.5107578039169312} -08/30/2021 19:51:46 - INFO - __main__ - Step 36866: {'lr': 0.0004346038949733734, 'samples': 7078272, 'steps': 36865, 'loss/train': 0.944397509098053} -08/30/2021 19:51:46 - INFO - __main__ - Step 36867: {'lr': 0.0004346003163503393, 'samples': 7078464, 'steps': 36866, 'loss/train': 1.6311485767364502} -08/30/2021 19:51:47 - INFO - __main__ - Step 36868: {'lr': 0.00043459673764412713, 'samples': 7078656, 'steps': 36867, 'loss/train': 1.911833643913269} -08/30/2021 19:51:47 - INFO - __main__ - Step 36869: {'lr': 0.0004345931588547386, 'samples': 7078848, 'steps': 36868, 'loss/train': 0.20603567361831665} -08/30/2021 19:51:47 - INFO - __main__ - Step 36870: {'lr': 0.00043458957998217517, 'samples': 7079040, 'steps': 36869, 'loss/train': 0.93301922082901} -08/30/2021 19:51:49 - INFO - __main__ - Step 36871: {'lr': 0.0004345860010264385, 'samples': 7079232, 'steps': 36870, 'loss/train': 1.9856507778167725} -08/30/2021 19:51:49 - INFO - __main__ - Step 36872: {'lr': 0.00043458242198753035, 'samples': 7079424, 'steps': 36871, 'loss/train': 0.7868944406509399} -08/30/2021 19:51:50 - INFO - __main__ - Step 36873: {'lr': 0.00043457884286545216, 'samples': 7079616, 'steps': 36872, 'loss/train': 1.3528791666030884} -08/30/2021 19:51:50 - INFO - __main__ - Step 36874: {'lr': 0.0004345752636602055, 'samples': 7079808, 'steps': 36873, 'loss/train': 1.4041922092437744} -08/30/2021 19:51:50 - INFO - __main__ - Step 36875: {'lr': 0.00043457168437179217, 'samples': 7080000, 'steps': 36874, 'loss/train': 1.0192317962646484} -08/30/2021 19:51:52 - INFO - __main__ - Step 36876: {'lr': 0.00043456810500021363, 'samples': 7080192, 'steps': 36875, 'loss/train': 1.3907181024551392} -08/30/2021 19:51:53 - INFO - __main__ - Step 36877: {'lr': 0.00043456452554547153, 'samples': 7080384, 'steps': 36876, 'loss/train': 1.4760247468948364} -08/30/2021 19:51:53 - INFO - __main__ - Step 36878: {'lr': 0.0004345609460075676, 'samples': 7080576, 'steps': 36877, 'loss/train': 1.4130911827087402} -08/30/2021 19:51:54 - INFO - __main__ - Step 36879: {'lr': 0.00043455736638650335, 'samples': 7080768, 'steps': 36878, 'loss/train': 0.7857569456100464} -08/30/2021 19:51:54 - INFO - __main__ - Step 36880: {'lr': 0.0004345537866822803, 'samples': 7080960, 'steps': 36879, 'loss/train': 1.0793346166610718} -08/30/2021 19:51:55 - INFO - __main__ - Step 36881: {'lr': 0.0004345502068949002, 'samples': 7081152, 'steps': 36880, 'loss/train': 1.303871512413025} -08/30/2021 19:51:56 - INFO - __main__ - Step 36882: {'lr': 0.0004345466270243646, 'samples': 7081344, 'steps': 36881, 'loss/train': 1.7368212938308716} -08/30/2021 19:51:56 - INFO - __main__ - Step 36883: {'lr': 0.0004345430470706753, 'samples': 7081536, 'steps': 36882, 'loss/train': 1.3319361209869385} -08/30/2021 19:51:57 - INFO - __main__ - Step 36884: {'lr': 0.00043453946703383354, 'samples': 7081728, 'steps': 36883, 'loss/train': 1.3173316717147827} -08/30/2021 19:51:57 - INFO - __main__ - Step 36885: {'lr': 0.00043453588691384125, 'samples': 7081920, 'steps': 36884, 'loss/train': 1.3831349611282349} -08/30/2021 19:51:57 - INFO - __main__ - Step 36886: {'lr': 0.0004345323067106999, 'samples': 7082112, 'steps': 36885, 'loss/train': 2.2285733222961426} -08/30/2021 19:51:59 - INFO - __main__ - Step 36887: {'lr': 0.00043452872642441124, 'samples': 7082304, 'steps': 36886, 'loss/train': 1.0684077739715576} -08/30/2021 19:52:00 - INFO - __main__ - Step 36888: {'lr': 0.0004345251460549766, 'samples': 7082496, 'steps': 36887, 'loss/train': 1.6257017850875854} -08/30/2021 19:52:00 - INFO - __main__ - Step 36889: {'lr': 0.0004345215656023979, 'samples': 7082688, 'steps': 36888, 'loss/train': 0.5881924629211426} -08/30/2021 19:52:00 - INFO - __main__ - Step 36890: {'lr': 0.0004345179850666766, 'samples': 7082880, 'steps': 36889, 'loss/train': 1.4926257133483887} -08/30/2021 19:52:01 - INFO - __main__ - Step 36891: {'lr': 0.0004345144044478144, 'samples': 7083072, 'steps': 36890, 'loss/train': 1.6564733982086182} -08/30/2021 19:52:02 - INFO - __main__ - Step 36892: {'lr': 0.0004345108237458128, 'samples': 7083264, 'steps': 36891, 'loss/train': 1.6903613805770874} -08/30/2021 19:52:03 - INFO - __main__ - Step 36893: {'lr': 0.00043450724296067344, 'samples': 7083456, 'steps': 36892, 'loss/train': 0.7877649664878845} -08/30/2021 19:52:03 - INFO - __main__ - Step 36894: {'lr': 0.00043450366209239803, 'samples': 7083648, 'steps': 36893, 'loss/train': 1.5424647331237793} -08/30/2021 19:52:03 - INFO - __main__ - Step 36895: {'lr': 0.0004345000811409881, 'samples': 7083840, 'steps': 36894, 'loss/train': 1.7291079759597778} -08/30/2021 19:52:04 - INFO - __main__ - Step 36896: {'lr': 0.0004344965001064453, 'samples': 7084032, 'steps': 36895, 'loss/train': 2.0265002250671387} -08/30/2021 19:52:05 - INFO - __main__ - Step 36897: {'lr': 0.0004344929189887712, 'samples': 7084224, 'steps': 36896, 'loss/train': 1.2669568061828613} -08/30/2021 19:52:06 - INFO - __main__ - Step 36898: {'lr': 0.0004344893377879674, 'samples': 7084416, 'steps': 36897, 'loss/train': 1.0824276208877563} -08/30/2021 19:52:06 - INFO - __main__ - Step 36899: {'lr': 0.00043448575650403555, 'samples': 7084608, 'steps': 36898, 'loss/train': 1.5803066492080688} -08/30/2021 19:52:06 - INFO - __main__ - Step 36900: {'lr': 0.00043448217513697727, 'samples': 7084800, 'steps': 36899, 'loss/train': 1.8659253120422363} -08/30/2021 19:52:07 - INFO - __main__ - Step 36901: {'lr': 0.0004344785936867942, 'samples': 7084992, 'steps': 36900, 'loss/train': 1.3426913022994995} -08/30/2021 19:52:09 - INFO - __main__ - Step 36902: {'lr': 0.00043447501215348794, 'samples': 7085184, 'steps': 36901, 'loss/train': 1.2634861469268799} -08/30/2021 19:52:10 - INFO - __main__ - Step 36903: {'lr': 0.00043447143053706007, 'samples': 7085376, 'steps': 36902, 'loss/train': 1.5066152811050415} -08/30/2021 19:52:10 - INFO - __main__ - Step 36904: {'lr': 0.00043446784883751223, 'samples': 7085568, 'steps': 36903, 'loss/train': 1.6530123949050903} -08/30/2021 19:52:10 - INFO - __main__ - Step 36905: {'lr': 0.000434464267054846, 'samples': 7085760, 'steps': 36904, 'loss/train': 0.7644088268280029} -08/30/2021 19:52:11 - INFO - __main__ - Step 36906: {'lr': 0.000434460685189063, 'samples': 7085952, 'steps': 36905, 'loss/train': 1.1632622480392456} -08/30/2021 19:52:11 - INFO - __main__ - Step 36907: {'lr': 0.0004344571032401649, 'samples': 7086144, 'steps': 36906, 'loss/train': 1.4312840700149536} -08/30/2021 19:52:12 - INFO - __main__ - Step 36908: {'lr': 0.0004344535212081533, 'samples': 7086336, 'steps': 36907, 'loss/train': 0.15583209693431854} -08/30/2021 19:52:13 - INFO - __main__ - Step 36909: {'lr': 0.0004344499390930298, 'samples': 7086528, 'steps': 36908, 'loss/train': 1.5124632120132446} -08/30/2021 19:52:13 - INFO - __main__ - Step 36910: {'lr': 0.0004344463568947959, 'samples': 7086720, 'steps': 36909, 'loss/train': 1.3383314609527588} -08/30/2021 19:52:14 - INFO - __main__ - Step 36911: {'lr': 0.0004344427746134534, 'samples': 7086912, 'steps': 36910, 'loss/train': 0.69477778673172} -08/30/2021 19:52:14 - INFO - __main__ - Step 36912: {'lr': 0.0004344391922490037, 'samples': 7087104, 'steps': 36911, 'loss/train': 1.7162814140319824} -08/30/2021 19:52:16 - INFO - __main__ - Step 36913: {'lr': 0.0004344356098014487, 'samples': 7087296, 'steps': 36912, 'loss/train': 1.2389296293258667} -08/30/2021 19:52:16 - INFO - __main__ - Step 36914: {'lr': 0.0004344320272707898, 'samples': 7087488, 'steps': 36913, 'loss/train': 1.6162362098693848} -08/30/2021 19:52:17 - INFO - __main__ - Step 36915: {'lr': 0.0004344284446570287, 'samples': 7087680, 'steps': 36914, 'loss/train': 0.20172248780727386} -08/30/2021 19:52:17 - INFO - __main__ - Step 36916: {'lr': 0.00043442486196016697, 'samples': 7087872, 'steps': 36915, 'loss/train': 1.0644278526306152} -08/30/2021 19:52:17 - INFO - __main__ - Step 36917: {'lr': 0.00043442127918020624, 'samples': 7088064, 'steps': 36916, 'loss/train': 1.3371798992156982} -08/30/2021 19:52:18 - INFO - __main__ - Step 36918: {'lr': 0.00043441769631714813, 'samples': 7088256, 'steps': 36917, 'loss/train': 1.6196606159210205} -08/30/2021 19:52:19 - INFO - __main__ - Step 36919: {'lr': 0.0004344141133709943, 'samples': 7088448, 'steps': 36918, 'loss/train': 1.281686544418335} -08/30/2021 19:52:20 - INFO - __main__ - Step 36920: {'lr': 0.00043441053034174625, 'samples': 7088640, 'steps': 36919, 'loss/train': 2.353680372238159} -08/30/2021 19:52:20 - INFO - __main__ - Step 36921: {'lr': 0.00043440694722940567, 'samples': 7088832, 'steps': 36920, 'loss/train': 1.623010277748108} -08/30/2021 19:52:20 - INFO - __main__ - Step 36922: {'lr': 0.00043440336403397417, 'samples': 7089024, 'steps': 36921, 'loss/train': 1.7530802488327026} -08/30/2021 19:52:21 - INFO - __main__ - Step 36923: {'lr': 0.00043439978075545337, 'samples': 7089216, 'steps': 36922, 'loss/train': 1.8340357542037964} -08/30/2021 19:52:22 - INFO - __main__ - Step 36924: {'lr': 0.0004343961973938449, 'samples': 7089408, 'steps': 36923, 'loss/train': 2.0118818283081055} -08/30/2021 19:52:22 - INFO - __main__ - Step 36925: {'lr': 0.00043439261394915033, 'samples': 7089600, 'steps': 36924, 'loss/train': 1.7424439191818237} -08/30/2021 19:52:23 - INFO - __main__ - Step 36926: {'lr': 0.0004343890304213713, 'samples': 7089792, 'steps': 36925, 'loss/train': 1.5566686391830444} -08/30/2021 19:52:23 - INFO - __main__ - Step 36927: {'lr': 0.0004343854468105094, 'samples': 7089984, 'steps': 36926, 'loss/train': 1.6069055795669556} -08/30/2021 19:52:23 - INFO - __main__ - Step 36928: {'lr': 0.00043438186311656624, 'samples': 7090176, 'steps': 36927, 'loss/train': 1.2824548482894897} -08/30/2021 19:52:25 - INFO - __main__ - Step 36929: {'lr': 0.0004343782793395435, 'samples': 7090368, 'steps': 36928, 'loss/train': 0.23958955705165863} -08/30/2021 19:52:25 - INFO - __main__ - Step 36930: {'lr': 0.00043437469547944277, 'samples': 7090560, 'steps': 36929, 'loss/train': 0.9688027501106262} -08/30/2021 19:52:26 - INFO - __main__ - Step 36931: {'lr': 0.0004343711115362656, 'samples': 7090752, 'steps': 36930, 'loss/train': 2.1543033123016357} -08/30/2021 19:52:26 - INFO - __main__ - Step 36932: {'lr': 0.00043436752751001365, 'samples': 7090944, 'steps': 36931, 'loss/train': 1.5060359239578247} -08/30/2021 19:52:26 - INFO - __main__ - Step 36933: {'lr': 0.0004343639434006885, 'samples': 7091136, 'steps': 36932, 'loss/train': 0.7337257862091064} -08/30/2021 19:52:28 - INFO - __main__ - Step 36934: {'lr': 0.00043436035920829186, 'samples': 7091328, 'steps': 36933, 'loss/train': 1.5979710817337036} -08/30/2021 19:52:29 - INFO - __main__ - Step 36935: {'lr': 0.0004343567749328253, 'samples': 7091520, 'steps': 36934, 'loss/train': 1.3218986988067627} -08/30/2021 19:52:29 - INFO - __main__ - Step 36936: {'lr': 0.00043435319057429046, 'samples': 7091712, 'steps': 36935, 'loss/train': 1.294980525970459} -08/30/2021 19:52:29 - INFO - __main__ - Step 36937: {'lr': 0.0004343496061326888, 'samples': 7091904, 'steps': 36936, 'loss/train': 1.5687510967254639} -08/30/2021 19:52:30 - INFO - __main__ - Step 36938: {'lr': 0.0004343460216080221, 'samples': 7092096, 'steps': 36937, 'loss/train': 1.8208032846450806} -08/30/2021 19:52:30 - INFO - __main__ - Step 36939: {'lr': 0.00043434243700029196, 'samples': 7092288, 'steps': 36938, 'loss/train': 2.672553062438965} -08/30/2021 19:52:32 - INFO - __main__ - Step 36940: {'lr': 0.0004343388523095, 'samples': 7092480, 'steps': 36939, 'loss/train': 1.633872628211975} -08/30/2021 19:52:32 - INFO - __main__ - Step 36941: {'lr': 0.00043433526753564766, 'samples': 7092672, 'steps': 36940, 'loss/train': 1.6166070699691772} -08/30/2021 19:52:33 - INFO - __main__ - Step 36942: {'lr': 0.00043433168267873677, 'samples': 7092864, 'steps': 36941, 'loss/train': 1.5333166122436523} -08/30/2021 19:52:33 - INFO - __main__ - Step 36943: {'lr': 0.0004343280977387689, 'samples': 7093056, 'steps': 36942, 'loss/train': 1.033284306526184} -08/30/2021 19:52:33 - INFO - __main__ - Step 36944: {'lr': 0.0004343245127157456, 'samples': 7093248, 'steps': 36943, 'loss/train': 2.024367332458496} -08/30/2021 19:52:35 - INFO - __main__ - Step 36945: {'lr': 0.0004343209276096686, 'samples': 7093440, 'steps': 36944, 'loss/train': 1.439671516418457} -08/30/2021 19:52:35 - INFO - __main__ - Step 36946: {'lr': 0.00043431734242053933, 'samples': 7093632, 'steps': 36945, 'loss/train': 1.2868527173995972} -08/30/2021 19:52:36 - INFO - __main__ - Step 36947: {'lr': 0.0004343137571483595, 'samples': 7093824, 'steps': 36946, 'loss/train': 1.385898232460022} -08/30/2021 19:52:36 - INFO - __main__ - Step 36948: {'lr': 0.00043431017179313075, 'samples': 7094016, 'steps': 36947, 'loss/train': 1.1743888854980469} -08/30/2021 19:52:36 - INFO - __main__ - Step 36949: {'lr': 0.0004343065863548548, 'samples': 7094208, 'steps': 36948, 'loss/train': 1.4184134006500244} -08/30/2021 19:52:38 - INFO - __main__ - Step 36950: {'lr': 0.000434303000833533, 'samples': 7094400, 'steps': 36949, 'loss/train': 1.347912073135376} -08/30/2021 19:52:38 - INFO - __main__ - Step 36951: {'lr': 0.00043429941522916715, 'samples': 7094592, 'steps': 36950, 'loss/train': 0.6524996757507324} -08/30/2021 19:52:39 - INFO - __main__ - Step 36952: {'lr': 0.0004342958295417588, 'samples': 7094784, 'steps': 36951, 'loss/train': 2.1537210941314697} -08/30/2021 19:52:39 - INFO - __main__ - Step 36953: {'lr': 0.00043429224377130964, 'samples': 7094976, 'steps': 36952, 'loss/train': 1.3659676313400269} -08/30/2021 19:52:39 - INFO - __main__ - Step 36954: {'lr': 0.00043428865791782126, 'samples': 7095168, 'steps': 36953, 'loss/train': 1.3667595386505127} -08/30/2021 19:52:41 - INFO - __main__ - Step 36955: {'lr': 0.0004342850719812952, 'samples': 7095360, 'steps': 36954, 'loss/train': 1.1743696928024292} -08/30/2021 19:52:41 - INFO - __main__ - Step 36956: {'lr': 0.00043428148596173316, 'samples': 7095552, 'steps': 36955, 'loss/train': 1.2689417600631714} -08/30/2021 19:52:42 - INFO - __main__ - Step 36957: {'lr': 0.00043427789985913675, 'samples': 7095744, 'steps': 36956, 'loss/train': 1.1221024990081787} -08/30/2021 19:52:42 - INFO - __main__ - Step 36958: {'lr': 0.00043427431367350753, 'samples': 7095936, 'steps': 36957, 'loss/train': 1.446897268295288} -08/30/2021 19:52:42 - INFO - __main__ - Step 36959: {'lr': 0.0004342707274048472, 'samples': 7096128, 'steps': 36958, 'loss/train': 1.893778920173645} -08/30/2021 19:52:44 - INFO - __main__ - Step 36960: {'lr': 0.0004342671410531572, 'samples': 7096320, 'steps': 36959, 'loss/train': 1.1127581596374512} -08/30/2021 19:52:44 - INFO - __main__ - Step 36961: {'lr': 0.00043426355461843934, 'samples': 7096512, 'steps': 36960, 'loss/train': 1.0507432222366333} -08/30/2021 19:52:45 - INFO - __main__ - Step 36962: {'lr': 0.00043425996810069525, 'samples': 7096704, 'steps': 36961, 'loss/train': 0.758385956287384} -08/30/2021 19:52:45 - INFO - __main__ - Step 36963: {'lr': 0.0004342563814999264, 'samples': 7096896, 'steps': 36962, 'loss/train': 1.7164360284805298} -08/30/2021 19:52:45 - INFO - __main__ - Step 36964: {'lr': 0.0004342527948161344, 'samples': 7097088, 'steps': 36963, 'loss/train': 1.39939284324646} -08/30/2021 19:52:46 - INFO - __main__ - Step 36965: {'lr': 0.000434249208049321, 'samples': 7097280, 'steps': 36964, 'loss/train': 1.573245882987976} -08/30/2021 19:52:47 - INFO - __main__ - Step 36966: {'lr': 0.0004342456211994877, 'samples': 7097472, 'steps': 36965, 'loss/train': 0.9394899010658264} -08/30/2021 19:52:48 - INFO - __main__ - Step 36967: {'lr': 0.00043424203426663623, 'samples': 7097664, 'steps': 36966, 'loss/train': 0.26969125866889954} -08/30/2021 19:52:48 - INFO - __main__ - Step 36968: {'lr': 0.0004342384472507681, 'samples': 7097856, 'steps': 36967, 'loss/train': 1.4364887475967407} -08/30/2021 19:52:48 - INFO - __main__ - Step 36969: {'lr': 0.00043423486015188497, 'samples': 7098048, 'steps': 36968, 'loss/train': 1.5569854974746704} -08/30/2021 19:52:49 - INFO - __main__ - Step 36970: {'lr': 0.00043423127296998845, 'samples': 7098240, 'steps': 36969, 'loss/train': 1.4173226356506348} -08/30/2021 19:52:50 - INFO - __main__ - Step 36971: {'lr': 0.0004342276857050802, 'samples': 7098432, 'steps': 36970, 'loss/train': 1.9105315208435059} -08/30/2021 19:52:51 - INFO - __main__ - Step 36972: {'lr': 0.00043422409835716175, 'samples': 7098624, 'steps': 36971, 'loss/train': 2.0277769565582275} -08/30/2021 19:52:51 - INFO - __main__ - Step 36973: {'lr': 0.00043422051092623483, 'samples': 7098816, 'steps': 36972, 'loss/train': 1.1386018991470337} -08/30/2021 19:52:51 - INFO - __main__ - Step 36974: {'lr': 0.0004342169234123009, 'samples': 7099008, 'steps': 36973, 'loss/train': 1.489443063735962} -08/30/2021 19:52:52 - INFO - __main__ - Step 36975: {'lr': 0.0004342133358153617, 'samples': 7099200, 'steps': 36974, 'loss/train': 1.8622065782546997} -08/30/2021 19:52:53 - INFO - __main__ - Step 36976: {'lr': 0.0004342097481354189, 'samples': 7099392, 'steps': 36975, 'loss/train': 1.5048037767410278} -08/30/2021 19:52:54 - INFO - __main__ - Step 36977: {'lr': 0.00043420616037247395, 'samples': 7099584, 'steps': 36976, 'loss/train': 1.5004308223724365} -08/30/2021 19:52:54 - INFO - __main__ - Step 36978: {'lr': 0.0004342025725265285, 'samples': 7099776, 'steps': 36977, 'loss/train': 1.0251719951629639} -08/30/2021 19:52:54 - INFO - __main__ - Step 36979: {'lr': 0.00043419898459758435, 'samples': 7099968, 'steps': 36978, 'loss/train': 1.5730838775634766} -08/30/2021 19:52:55 - INFO - __main__ - Step 36980: {'lr': 0.00043419539658564286, 'samples': 7100160, 'steps': 36979, 'loss/train': 1.404199481010437} -08/30/2021 19:52:56 - INFO - __main__ - Step 36981: {'lr': 0.0004341918084907058, 'samples': 7100352, 'steps': 36980, 'loss/train': 1.177692174911499} -08/30/2021 19:52:57 - INFO - __main__ - Step 36982: {'lr': 0.0004341882203127747, 'samples': 7100544, 'steps': 36981, 'loss/train': 1.64198899269104} -08/30/2021 19:52:57 - INFO - __main__ - Step 36983: {'lr': 0.00043418463205185134, 'samples': 7100736, 'steps': 36982, 'loss/train': 1.1643450260162354} -08/30/2021 19:52:57 - INFO - __main__ - Step 36984: {'lr': 0.0004341810437079372, 'samples': 7100928, 'steps': 36983, 'loss/train': 1.3584672212600708} -08/30/2021 19:52:58 - INFO - __main__ - Step 36985: {'lr': 0.0004341774552810339, 'samples': 7101120, 'steps': 36984, 'loss/train': 1.108555555343628} -08/30/2021 19:52:59 - INFO - __main__ - Step 36986: {'lr': 0.0004341738667711431, 'samples': 7101312, 'steps': 36985, 'loss/train': 1.617867350578308} -08/30/2021 19:53:00 - INFO - __main__ - Step 36987: {'lr': 0.0004341702781782664, 'samples': 7101504, 'steps': 36986, 'loss/train': 1.32652747631073} -08/30/2021 19:53:00 - INFO - __main__ - Step 36988: {'lr': 0.00043416668950240536, 'samples': 7101696, 'steps': 36987, 'loss/train': 1.2426902055740356} -08/30/2021 19:53:00 - INFO - __main__ - Step 36989: {'lr': 0.0004341631007435617, 'samples': 7101888, 'steps': 36988, 'loss/train': 0.7134483456611633} -08/30/2021 19:53:01 - INFO - __main__ - Step 36990: {'lr': 0.00043415951190173697, 'samples': 7102080, 'steps': 36989, 'loss/train': 1.0421174764633179} -08/30/2021 19:53:02 - INFO - __main__ - Step 36991: {'lr': 0.00043415592297693276, 'samples': 7102272, 'steps': 36990, 'loss/train': 1.1955801248550415} -08/30/2021 19:53:03 - INFO - __main__ - Step 36992: {'lr': 0.00043415233396915077, 'samples': 7102464, 'steps': 36991, 'loss/train': 1.566650629043579} -08/30/2021 19:53:03 - INFO - __main__ - Step 36993: {'lr': 0.0004341487448783926, 'samples': 7102656, 'steps': 36992, 'loss/train': 1.7085177898406982} -08/30/2021 19:53:03 - INFO - __main__ - Step 36994: {'lr': 0.00043414515570465987, 'samples': 7102848, 'steps': 36993, 'loss/train': 1.1849037408828735} -08/30/2021 19:53:04 - INFO - __main__ - Step 36995: {'lr': 0.0004341415664479541, 'samples': 7103040, 'steps': 36994, 'loss/train': 1.8075555562973022} -08/30/2021 19:53:04 - INFO - __main__ - Step 36996: {'lr': 0.00043413797710827707, 'samples': 7103232, 'steps': 36995, 'loss/train': 1.0284196138381958} -08/30/2021 19:53:06 - INFO - __main__ - Step 36997: {'lr': 0.00043413438768563026, 'samples': 7103424, 'steps': 36996, 'loss/train': 1.2237123250961304} -08/30/2021 19:53:07 - INFO - __main__ - Step 36998: {'lr': 0.0004341307981800153, 'samples': 7103616, 'steps': 36997, 'loss/train': 1.5749413967132568} -08/30/2021 19:53:07 - INFO - __main__ - Step 36999: {'lr': 0.0004341272085914339, 'samples': 7103808, 'steps': 36998, 'loss/train': 1.7321717739105225} -08/30/2021 19:53:07 - INFO - __main__ - Step 37000: {'lr': 0.00043412361891988763, 'samples': 7104000, 'steps': 36999, 'loss/train': 1.539825439453125} -08/30/2021 19:53:08 - INFO - __main__ - Step 37001: {'lr': 0.0004341200291653781, 'samples': 7104192, 'steps': 37000, 'loss/train': 0.8989658951759338} -08/30/2021 19:53:09 - INFO - __main__ - Step 37002: {'lr': 0.00043411643932790686, 'samples': 7104384, 'steps': 37001, 'loss/train': 1.5800189971923828} -08/30/2021 19:53:10 - INFO - __main__ - Step 37003: {'lr': 0.0004341128494074756, 'samples': 7104576, 'steps': 37002, 'loss/train': 1.349951148033142} -08/30/2021 19:53:10 - INFO - __main__ - Step 37004: {'lr': 0.00043410925940408595, 'samples': 7104768, 'steps': 37003, 'loss/train': 0.2885541021823883} -08/30/2021 19:53:10 - INFO - __main__ - Step 37005: {'lr': 0.00043410566931773953, 'samples': 7104960, 'steps': 37004, 'loss/train': 1.5363378524780273} -08/30/2021 19:53:11 - INFO - __main__ - Step 37006: {'lr': 0.000434102079148438, 'samples': 7105152, 'steps': 37005, 'loss/train': 1.4845151901245117} -08/30/2021 19:53:12 - INFO - __main__ - Step 37007: {'lr': 0.0004340984888961828, 'samples': 7105344, 'steps': 37006, 'loss/train': 1.6094889640808105} -08/30/2021 19:53:13 - INFO - __main__ - Step 37008: {'lr': 0.00043409489856097573, 'samples': 7105536, 'steps': 37007, 'loss/train': 1.469128966331482} -08/30/2021 19:53:13 - INFO - __main__ - Step 37009: {'lr': 0.0004340913081428183, 'samples': 7105728, 'steps': 37008, 'loss/train': 1.7176958322525024} -08/30/2021 19:53:14 - INFO - __main__ - Step 37010: {'lr': 0.00043408771764171216, 'samples': 7105920, 'steps': 37009, 'loss/train': 1.3295246362686157} -08/30/2021 19:53:14 - INFO - __main__ - Step 37011: {'lr': 0.000434084127057659, 'samples': 7106112, 'steps': 37010, 'loss/train': 0.6916934847831726} -08/30/2021 19:53:14 - INFO - __main__ - Step 37012: {'lr': 0.0004340805363906603, 'samples': 7106304, 'steps': 37011, 'loss/train': 1.2902816534042358} -08/30/2021 19:53:16 - INFO - __main__ - Step 37013: {'lr': 0.00043407694564071773, 'samples': 7106496, 'steps': 37012, 'loss/train': 0.057550281286239624} -08/30/2021 19:53:16 - INFO - __main__ - Step 37014: {'lr': 0.00043407335480783306, 'samples': 7106688, 'steps': 37013, 'loss/train': 0.858756422996521} -08/30/2021 19:53:17 - INFO - __main__ - Step 37015: {'lr': 0.0004340697638920077, 'samples': 7106880, 'steps': 37014, 'loss/train': 1.4779387712478638} -08/30/2021 19:53:17 - INFO - __main__ - Step 37016: {'lr': 0.0004340661728932433, 'samples': 7107072, 'steps': 37015, 'loss/train': 1.6564719676971436} -08/30/2021 19:53:17 - INFO - __main__ - Step 37017: {'lr': 0.0004340625818115416, 'samples': 7107264, 'steps': 37016, 'loss/train': 1.3332830667495728} -08/30/2021 19:53:18 - INFO - __main__ - Step 37018: {'lr': 0.00043405899064690405, 'samples': 7107456, 'steps': 37017, 'loss/train': 1.2354892492294312} -08/30/2021 19:53:19 - INFO - __main__ - Step 37019: {'lr': 0.0004340553993993325, 'samples': 7107648, 'steps': 37018, 'loss/train': 1.2463513612747192} -08/30/2021 19:53:20 - INFO - __main__ - Step 37020: {'lr': 0.0004340518080688283, 'samples': 7107840, 'steps': 37019, 'loss/train': 1.396854281425476} -08/30/2021 19:53:20 - INFO - __main__ - Step 37021: {'lr': 0.0004340482166553932, 'samples': 7108032, 'steps': 37020, 'loss/train': 1.6890665292739868} -08/30/2021 19:53:20 - INFO - __main__ - Step 37022: {'lr': 0.0004340446251590289, 'samples': 7108224, 'steps': 37021, 'loss/train': 1.6288957595825195} -08/30/2021 19:53:21 - INFO - __main__ - Step 37023: {'lr': 0.00043404103357973684, 'samples': 7108416, 'steps': 37022, 'loss/train': 1.4945032596588135} -08/30/2021 19:53:22 - INFO - __main__ - Step 37024: {'lr': 0.0004340374419175188, 'samples': 7108608, 'steps': 37023, 'loss/train': 1.2181408405303955} -08/30/2021 19:53:23 - INFO - __main__ - Step 37025: {'lr': 0.0004340338501723763, 'samples': 7108800, 'steps': 37024, 'loss/train': 1.5541753768920898} -08/30/2021 19:53:23 - INFO - __main__ - Step 37026: {'lr': 0.00043403025834431097, 'samples': 7108992, 'steps': 37025, 'loss/train': 1.6661155223846436} -08/30/2021 19:53:23 - INFO - __main__ - Step 37027: {'lr': 0.00043402666643332444, 'samples': 7109184, 'steps': 37026, 'loss/train': 1.4981967210769653} -08/30/2021 19:53:24 - INFO - __main__ - Step 37028: {'lr': 0.00043402307443941835, 'samples': 7109376, 'steps': 37027, 'loss/train': 1.227504014968872} -08/30/2021 19:53:25 - INFO - __main__ - Step 37029: {'lr': 0.00043401948236259437, 'samples': 7109568, 'steps': 37028, 'loss/train': 1.4776465892791748} -08/30/2021 19:53:26 - INFO - __main__ - Step 37030: {'lr': 0.000434015890202854, 'samples': 7109760, 'steps': 37029, 'loss/train': 1.3422006368637085} -08/30/2021 19:53:26 - INFO - __main__ - Step 37031: {'lr': 0.0004340122979601989, 'samples': 7109952, 'steps': 37030, 'loss/train': 1.5140113830566406} -08/30/2021 19:53:26 - INFO - __main__ - Step 37032: {'lr': 0.0004340087056346307, 'samples': 7110144, 'steps': 37031, 'loss/train': 1.6615102291107178} -08/30/2021 19:53:27 - INFO - __main__ - Step 37033: {'lr': 0.000434005113226151, 'samples': 7110336, 'steps': 37032, 'loss/train': 1.2792826890945435} -08/30/2021 19:53:28 - INFO - __main__ - Step 37034: {'lr': 0.0004340015207347614, 'samples': 7110528, 'steps': 37033, 'loss/train': 1.2476483583450317} -08/30/2021 19:53:29 - INFO - __main__ - Step 37035: {'lr': 0.0004339979281604636, 'samples': 7110720, 'steps': 37034, 'loss/train': 1.4508005380630493} -08/30/2021 19:53:29 - INFO - __main__ - Step 37036: {'lr': 0.00043399433550325917, 'samples': 7110912, 'steps': 37035, 'loss/train': 1.631337285041809} -08/30/2021 19:53:29 - INFO - __main__ - Step 37037: {'lr': 0.00043399074276314974, 'samples': 7111104, 'steps': 37036, 'loss/train': 1.7164074182510376} -08/30/2021 19:53:30 - INFO - __main__ - Step 37038: {'lr': 0.00043398714994013696, 'samples': 7111296, 'steps': 37037, 'loss/train': 1.6832025051116943} -08/30/2021 19:53:31 - INFO - __main__ - Step 37039: {'lr': 0.00043398355703422233, 'samples': 7111488, 'steps': 37038, 'loss/train': 0.34106573462486267} -08/30/2021 19:53:32 - INFO - __main__ - Step 37040: {'lr': 0.0004339799640454076, 'samples': 7111680, 'steps': 37039, 'loss/train': 1.8033214807510376} -08/30/2021 19:53:32 - INFO - __main__ - Step 37041: {'lr': 0.00043397637097369434, 'samples': 7111872, 'steps': 37040, 'loss/train': 1.70357346534729} -08/30/2021 19:53:32 - INFO - __main__ - Step 37042: {'lr': 0.0004339727778190842, 'samples': 7112064, 'steps': 37041, 'loss/train': 1.618456482887268} -08/30/2021 19:53:33 - INFO - __main__ - Step 37043: {'lr': 0.0004339691845815786, 'samples': 7112256, 'steps': 37042, 'loss/train': 1.5284024477005005} -08/30/2021 19:53:33 - INFO - __main__ - Step 37044: {'lr': 0.0004339655912611795, 'samples': 7112448, 'steps': 37043, 'loss/train': 1.093475341796875} -08/30/2021 19:53:34 - INFO - __main__ - Step 37045: {'lr': 0.00043396199785788824, 'samples': 7112640, 'steps': 37044, 'loss/train': 1.6510095596313477} -08/30/2021 19:53:35 - INFO - __main__ - Step 37046: {'lr': 0.00043395840437170666, 'samples': 7112832, 'steps': 37045, 'loss/train': 1.233132243156433} -08/30/2021 19:53:35 - INFO - __main__ - Step 37047: {'lr': 0.00043395481080263614, 'samples': 7113024, 'steps': 37046, 'loss/train': 1.533531665802002} -08/30/2021 19:53:36 - INFO - __main__ - Step 37048: {'lr': 0.0004339512171506785, 'samples': 7113216, 'steps': 37047, 'loss/train': 1.6453118324279785} -08/30/2021 19:53:36 - INFO - __main__ - Step 37049: {'lr': 0.0004339476234158352, 'samples': 7113408, 'steps': 37048, 'loss/train': 1.7882049083709717} -08/30/2021 19:53:38 - INFO - __main__ - Step 37050: {'lr': 0.00043394402959810795, 'samples': 7113600, 'steps': 37049, 'loss/train': 1.091997504234314} -08/30/2021 19:53:38 - INFO - __main__ - Step 37051: {'lr': 0.00043394043569749843, 'samples': 7113792, 'steps': 37050, 'loss/train': 1.4180865287780762} -08/30/2021 19:53:39 - INFO - __main__ - Step 37052: {'lr': 0.00043393684171400817, 'samples': 7113984, 'steps': 37051, 'loss/train': 1.5587260723114014} -08/30/2021 19:53:39 - INFO - __main__ - Step 37053: {'lr': 0.00043393324764763873, 'samples': 7114176, 'steps': 37052, 'loss/train': 0.796995222568512} -08/30/2021 19:53:40 - INFO - __main__ - Step 37054: {'lr': 0.0004339296534983919, 'samples': 7114368, 'steps': 37053, 'loss/train': 0.9326147437095642} -08/30/2021 19:53:41 - INFO - __main__ - Step 37055: {'lr': 0.00043392605926626914, 'samples': 7114560, 'steps': 37054, 'loss/train': 0.9415121078491211} -08/30/2021 19:53:41 - INFO - __main__ - Step 37056: {'lr': 0.0004339224649512722, 'samples': 7114752, 'steps': 37055, 'loss/train': 1.4428216218948364} -08/30/2021 19:53:42 - INFO - __main__ - Step 37057: {'lr': 0.00043391887055340263, 'samples': 7114944, 'steps': 37056, 'loss/train': 1.523805856704712} -08/30/2021 19:53:42 - INFO - __main__ - Step 37058: {'lr': 0.000433915276072662, 'samples': 7115136, 'steps': 37057, 'loss/train': 1.5136395692825317} -08/30/2021 19:53:43 - INFO - __main__ - Step 37059: {'lr': 0.00043391168150905203, 'samples': 7115328, 'steps': 37058, 'loss/train': 1.1078822612762451} -08/30/2021 19:53:44 - INFO - __main__ - Step 37060: {'lr': 0.0004339080868625743, 'samples': 7115520, 'steps': 37059, 'loss/train': 0.41612711548805237} -08/30/2021 19:53:45 - INFO - __main__ - Step 37061: {'lr': 0.00043390449213323037, 'samples': 7115712, 'steps': 37060, 'loss/train': 1.3532260656356812} -08/30/2021 19:53:45 - INFO - __main__ - Step 37062: {'lr': 0.000433900897321022, 'samples': 7115904, 'steps': 37061, 'loss/train': 1.4750059843063354} -08/30/2021 19:53:46 - INFO - __main__ - Step 37063: {'lr': 0.0004338973024259506, 'samples': 7116096, 'steps': 37062, 'loss/train': 1.4050695896148682} -08/30/2021 19:53:46 - INFO - __main__ - Step 37064: {'lr': 0.00043389370744801806, 'samples': 7116288, 'steps': 37063, 'loss/train': 1.2933963537216187} -08/30/2021 19:53:48 - INFO - __main__ - Step 37065: {'lr': 0.00043389011238722575, 'samples': 7116480, 'steps': 37064, 'loss/train': 1.612127423286438} -08/30/2021 19:53:48 - INFO - __main__ - Step 37066: {'lr': 0.0004338865172435754, 'samples': 7116672, 'steps': 37065, 'loss/train': 1.811689853668213} -08/30/2021 19:53:48 - INFO - __main__ - Step 37067: {'lr': 0.00043388292201706867, 'samples': 7116864, 'steps': 37066, 'loss/train': 1.3822399377822876} -08/30/2021 19:53:49 - INFO - __main__ - Step 37068: {'lr': 0.0004338793267077071, 'samples': 7117056, 'steps': 37067, 'loss/train': 0.1393483281135559} -08/30/2021 19:53:49 - INFO - __main__ - Step 37069: {'lr': 0.0004338757313154923, 'samples': 7117248, 'steps': 37068, 'loss/train': 1.6364192962646484} -08/30/2021 19:53:50 - INFO - __main__ - Step 37070: {'lr': 0.000433872135840426, 'samples': 7117440, 'steps': 37069, 'loss/train': 1.6288944482803345} -08/30/2021 19:53:51 - INFO - __main__ - Step 37071: {'lr': 0.00043386854028250977, 'samples': 7117632, 'steps': 37070, 'loss/train': 1.01338529586792} -08/30/2021 19:53:51 - INFO - __main__ - Step 37072: {'lr': 0.00043386494464174515, 'samples': 7117824, 'steps': 37071, 'loss/train': 1.7017862796783447} -08/30/2021 19:53:52 - INFO - __main__ - Step 37073: {'lr': 0.0004338613489181338, 'samples': 7118016, 'steps': 37072, 'loss/train': 1.5734326839447021} -08/30/2021 19:53:52 - INFO - __main__ - Step 37074: {'lr': 0.00043385775311167746, 'samples': 7118208, 'steps': 37073, 'loss/train': 1.0885738134384155} -08/30/2021 19:53:52 - INFO - __main__ - Step 37075: {'lr': 0.00043385415722237765, 'samples': 7118400, 'steps': 37074, 'loss/train': 1.5801478624343872} -08/30/2021 19:53:54 - INFO - __main__ - Step 37076: {'lr': 0.0004338505612502359, 'samples': 7118592, 'steps': 37075, 'loss/train': 0.5208668112754822} -08/30/2021 19:53:54 - INFO - __main__ - Step 37077: {'lr': 0.000433846965195254, 'samples': 7118784, 'steps': 37076, 'loss/train': 1.3963780403137207} -08/30/2021 19:53:55 - INFO - __main__ - Step 37078: {'lr': 0.00043384336905743343, 'samples': 7118976, 'steps': 37077, 'loss/train': 1.4589495658874512} -08/30/2021 19:53:55 - INFO - __main__ - Step 37079: {'lr': 0.0004338397728367759, 'samples': 7119168, 'steps': 37078, 'loss/train': 1.3546909093856812} -08/30/2021 19:53:55 - INFO - __main__ - Step 37080: {'lr': 0.000433836176533283, 'samples': 7119360, 'steps': 37079, 'loss/train': 0.8696184158325195} -08/30/2021 19:53:57 - INFO - __main__ - Step 37081: {'lr': 0.0004338325801469564, 'samples': 7119552, 'steps': 37080, 'loss/train': 0.8663526177406311} -08/30/2021 19:53:57 - INFO - __main__ - Step 37082: {'lr': 0.00043382898367779767, 'samples': 7119744, 'steps': 37081, 'loss/train': 1.0161995887756348} -08/30/2021 19:53:58 - INFO - __main__ - Step 37083: {'lr': 0.00043382538712580845, 'samples': 7119936, 'steps': 37082, 'loss/train': 1.668605923652649} -08/30/2021 19:53:58 - INFO - __main__ - Step 37084: {'lr': 0.00043382179049099024, 'samples': 7120128, 'steps': 37083, 'loss/train': 0.6745041608810425} -08/30/2021 19:53:58 - INFO - __main__ - Step 37085: {'lr': 0.00043381819377334485, 'samples': 7120320, 'steps': 37084, 'loss/train': 1.7028006315231323} -08/30/2021 19:54:00 - INFO - __main__ - Step 37086: {'lr': 0.00043381459697287383, 'samples': 7120512, 'steps': 37085, 'loss/train': 1.6769983768463135} -08/30/2021 19:54:00 - INFO - __main__ - Step 37087: {'lr': 0.0004338110000895787, 'samples': 7120704, 'steps': 37086, 'loss/train': 1.716045618057251} -08/30/2021 19:54:01 - INFO - __main__ - Step 37088: {'lr': 0.00043380740312346135, 'samples': 7120896, 'steps': 37087, 'loss/train': 1.728021264076233} -08/30/2021 19:54:01 - INFO - __main__ - Step 37089: {'lr': 0.00043380380607452307, 'samples': 7121088, 'steps': 37088, 'loss/train': 2.275291919708252} -08/30/2021 19:54:01 - INFO - __main__ - Step 37090: {'lr': 0.0004338002089427657, 'samples': 7121280, 'steps': 37089, 'loss/train': 1.7778035402297974} -08/30/2021 19:54:03 - INFO - __main__ - Step 37091: {'lr': 0.00043379661172819075, 'samples': 7121472, 'steps': 37090, 'loss/train': 1.234944224357605} -08/30/2021 19:54:04 - INFO - __main__ - Step 37092: {'lr': 0.0004337930144307999, 'samples': 7121664, 'steps': 37091, 'loss/train': 1.5676524639129639} -08/30/2021 19:54:04 - INFO - __main__ - Step 37093: {'lr': 0.0004337894170505947, 'samples': 7121856, 'steps': 37092, 'loss/train': 1.1639885902404785} -08/30/2021 19:54:04 - INFO - __main__ - Step 37094: {'lr': 0.0004337858195875769, 'samples': 7122048, 'steps': 37093, 'loss/train': 0.280882865190506} -08/30/2021 19:54:05 - INFO - __main__ - Step 37095: {'lr': 0.00043378222204174807, 'samples': 7122240, 'steps': 37094, 'loss/train': 1.2138230800628662} -08/30/2021 19:54:06 - INFO - __main__ - Step 37096: {'lr': 0.0004337786244131097, 'samples': 7122432, 'steps': 37095, 'loss/train': 1.653456449508667} -08/30/2021 19:54:07 - INFO - __main__ - Step 37097: {'lr': 0.00043377502670166357, 'samples': 7122624, 'steps': 37096, 'loss/train': 1.5132277011871338} -08/30/2021 19:54:07 - INFO - __main__ - Step 37098: {'lr': 0.0004337714289074113, 'samples': 7122816, 'steps': 37097, 'loss/train': 0.9573349952697754} -08/30/2021 19:54:07 - INFO - __main__ - Step 37099: {'lr': 0.0004337678310303544, 'samples': 7123008, 'steps': 37098, 'loss/train': 1.622782588005066} -08/30/2021 19:54:08 - INFO - __main__ - Step 37100: {'lr': 0.00043376423307049455, 'samples': 7123200, 'steps': 37099, 'loss/train': 0.9316123723983765} -08/30/2021 19:54:10 - INFO - __main__ - Step 37101: {'lr': 0.00043376063502783337, 'samples': 7123392, 'steps': 37100, 'loss/train': 1.652148962020874} -08/30/2021 19:54:10 - INFO - __main__ - Step 37102: {'lr': 0.00043375703690237254, 'samples': 7123584, 'steps': 37101, 'loss/train': 1.684349775314331} -08/30/2021 19:54:11 - INFO - __main__ - Step 37103: {'lr': 0.0004337534386941135, 'samples': 7123776, 'steps': 37102, 'loss/train': 1.8276478052139282} -08/30/2021 19:54:11 - INFO - __main__ - Step 37104: {'lr': 0.00043374984040305816, 'samples': 7123968, 'steps': 37103, 'loss/train': 1.924911618232727} -08/30/2021 19:54:11 - INFO - __main__ - Step 37105: {'lr': 0.00043374624202920786, 'samples': 7124160, 'steps': 37104, 'loss/train': 1.290555715560913} -08/30/2021 19:54:13 - INFO - __main__ - Step 37106: {'lr': 0.0004337426435725644, 'samples': 7124352, 'steps': 37105, 'loss/train': 2.033660411834717} -08/30/2021 19:54:14 - INFO - __main__ - Step 37107: {'lr': 0.00043373904503312934, 'samples': 7124544, 'steps': 37106, 'loss/train': 1.5066791772842407} -08/30/2021 19:54:14 - INFO - __main__ - Step 37108: {'lr': 0.0004337354464109042, 'samples': 7124736, 'steps': 37107, 'loss/train': 0.9907783269882202} -08/30/2021 19:54:14 - INFO - __main__ - Step 37109: {'lr': 0.0004337318477058908, 'samples': 7124928, 'steps': 37108, 'loss/train': 1.429274320602417} -08/30/2021 19:54:15 - INFO - __main__ - Step 37110: {'lr': 0.0004337282489180907, 'samples': 7125120, 'steps': 37109, 'loss/train': 1.2618458271026611} -08/30/2021 19:54:15 - INFO - __main__ - Step 37111: {'lr': 0.0004337246500475054, 'samples': 7125312, 'steps': 37110, 'loss/train': 1.6446267366409302} -08/30/2021 19:54:16 - INFO - __main__ - Step 37112: {'lr': 0.0004337210510941366, 'samples': 7125504, 'steps': 37111, 'loss/train': 0.05694969743490219} -08/30/2021 19:54:17 - INFO - __main__ - Step 37113: {'lr': 0.000433717452057986, 'samples': 7125696, 'steps': 37112, 'loss/train': 1.4984523057937622} -08/30/2021 19:54:17 - INFO - __main__ - Step 37114: {'lr': 0.00043371385293905517, 'samples': 7125888, 'steps': 37113, 'loss/train': 1.72265625} -08/30/2021 19:54:18 - INFO - __main__ - Step 37115: {'lr': 0.0004337102537373456, 'samples': 7126080, 'steps': 37114, 'loss/train': 1.5365489721298218} -08/30/2021 19:54:18 - INFO - __main__ - Step 37116: {'lr': 0.0004337066544528591, 'samples': 7126272, 'steps': 37115, 'loss/train': 1.3277665376663208} -08/30/2021 19:54:19 - INFO - __main__ - Step 37117: {'lr': 0.00043370305508559723, 'samples': 7126464, 'steps': 37116, 'loss/train': 1.1964889764785767} -08/30/2021 19:54:20 - INFO - __main__ - Step 37118: {'lr': 0.00043369945563556157, 'samples': 7126656, 'steps': 37117, 'loss/train': 1.2485020160675049} -08/30/2021 19:54:20 - INFO - __main__ - Step 37119: {'lr': 0.00043369585610275374, 'samples': 7126848, 'steps': 37118, 'loss/train': 1.522022008895874} -08/30/2021 19:54:21 - INFO - __main__ - Step 37120: {'lr': 0.0004336922564871755, 'samples': 7127040, 'steps': 37119, 'loss/train': 1.2104867696762085} -08/30/2021 19:54:21 - INFO - __main__ - Step 37121: {'lr': 0.00043368865678882824, 'samples': 7127232, 'steps': 37120, 'loss/train': 0.8421387076377869} -08/30/2021 19:54:23 - INFO - __main__ - Step 37122: {'lr': 0.00043368505700771377, 'samples': 7127424, 'steps': 37121, 'loss/train': 1.1219406127929688} -08/30/2021 19:54:23 - INFO - __main__ - Step 37123: {'lr': 0.00043368145714383364, 'samples': 7127616, 'steps': 37122, 'loss/train': 1.9347363710403442} -08/30/2021 19:54:24 - INFO - __main__ - Step 37124: {'lr': 0.00043367785719718947, 'samples': 7127808, 'steps': 37123, 'loss/train': 1.542358160018921} -08/30/2021 19:54:24 - INFO - __main__ - Step 37125: {'lr': 0.0004336742571677829, 'samples': 7128000, 'steps': 37124, 'loss/train': 0.1368544101715088} -08/30/2021 19:54:24 - INFO - __main__ - Step 37126: {'lr': 0.00043367065705561547, 'samples': 7128192, 'steps': 37125, 'loss/train': 1.227088451385498} -08/30/2021 19:54:25 - INFO - __main__ - Step 37127: {'lr': 0.00043366705686068895, 'samples': 7128384, 'steps': 37126, 'loss/train': 1.4763684272766113} -08/30/2021 19:54:26 - INFO - __main__ - Step 37128: {'lr': 0.0004336634565830049, 'samples': 7128576, 'steps': 37127, 'loss/train': 0.3037351667881012} -08/30/2021 19:54:27 - INFO - __main__ - Step 37129: {'lr': 0.0004336598562225649, 'samples': 7128768, 'steps': 37128, 'loss/train': 0.9881518483161926} -08/30/2021 19:54:27 - INFO - __main__ - Step 37130: {'lr': 0.00043365625577937065, 'samples': 7128960, 'steps': 37129, 'loss/train': 0.9750529527664185} -08/30/2021 19:54:27 - INFO - __main__ - Step 37131: {'lr': 0.00043365265525342365, 'samples': 7129152, 'steps': 37130, 'loss/train': 1.4949061870574951} -08/30/2021 19:54:28 - INFO - __main__ - Step 37132: {'lr': 0.00043364905464472563, 'samples': 7129344, 'steps': 37131, 'loss/train': 1.2265797853469849} -08/30/2021 19:54:29 - INFO - __main__ - Step 37133: {'lr': 0.0004336454539532782, 'samples': 7129536, 'steps': 37132, 'loss/train': 1.5571553707122803} -08/30/2021 19:54:30 - INFO - __main__ - Step 37134: {'lr': 0.00043364185317908296, 'samples': 7129728, 'steps': 37133, 'loss/train': 0.9152698516845703} -08/30/2021 19:54:30 - INFO - __main__ - Step 37135: {'lr': 0.0004336382523221415, 'samples': 7129920, 'steps': 37134, 'loss/train': 1.4276806116104126} -08/30/2021 19:54:30 - INFO - __main__ - Step 37136: {'lr': 0.0004336346513824555, 'samples': 7130112, 'steps': 37135, 'loss/train': 1.975346326828003} -08/30/2021 19:54:31 - INFO - __main__ - Step 37137: {'lr': 0.0004336310503600266, 'samples': 7130304, 'steps': 37136, 'loss/train': 2.117755889892578} -08/30/2021 19:54:32 - INFO - __main__ - Step 37138: {'lr': 0.0004336274492548563, 'samples': 7130496, 'steps': 37137, 'loss/train': 1.3216679096221924} -08/30/2021 19:54:33 - INFO - __main__ - Step 37139: {'lr': 0.0004336238480669463, 'samples': 7130688, 'steps': 37138, 'loss/train': 1.5789737701416016} -08/30/2021 19:54:33 - INFO - __main__ - Step 37140: {'lr': 0.0004336202467962983, 'samples': 7130880, 'steps': 37139, 'loss/train': 1.8885977268218994} -08/30/2021 19:54:34 - INFO - __main__ - Step 37141: {'lr': 0.0004336166454429139, 'samples': 7131072, 'steps': 37140, 'loss/train': 1.868220567703247} -08/30/2021 19:54:34 - INFO - __main__ - Step 37142: {'lr': 0.0004336130440067946, 'samples': 7131264, 'steps': 37141, 'loss/train': 1.0575519800186157} -08/30/2021 19:54:35 - INFO - __main__ - Step 37143: {'lr': 0.000433609442487942, 'samples': 7131456, 'steps': 37142, 'loss/train': 1.2918672561645508} -08/30/2021 19:54:36 - INFO - __main__ - Step 37144: {'lr': 0.00043360584088635804, 'samples': 7131648, 'steps': 37143, 'loss/train': 2.4049482345581055} -08/30/2021 19:54:36 - INFO - __main__ - Step 37145: {'lr': 0.0004336022392020439, 'samples': 7131840, 'steps': 37144, 'loss/train': 1.272507905960083} -08/30/2021 19:54:37 - INFO - __main__ - Step 37146: {'lr': 0.0004335986374350015, 'samples': 7132032, 'steps': 37145, 'loss/train': 0.7864501476287842} -08/30/2021 19:54:37 - INFO - __main__ - Step 37147: {'lr': 0.00043359503558523246, 'samples': 7132224, 'steps': 37146, 'loss/train': 1.36385977268219} -08/30/2021 19:54:38 - INFO - __main__ - Step 37148: {'lr': 0.0004335914336527382, 'samples': 7132416, 'steps': 37147, 'loss/train': 1.7500404119491577} -08/30/2021 19:54:39 - INFO - __main__ - Step 37149: {'lr': 0.0004335878316375206, 'samples': 7132608, 'steps': 37148, 'loss/train': 1.0112521648406982} -08/30/2021 19:54:39 - INFO - __main__ - Step 37150: {'lr': 0.0004335842295395811, 'samples': 7132800, 'steps': 37149, 'loss/train': 0.23985888063907623} -08/30/2021 19:54:40 - INFO - __main__ - Step 37151: {'lr': 0.0004335806273589214, 'samples': 7132992, 'steps': 37150, 'loss/train': 1.2631280422210693} -08/30/2021 19:54:40 - INFO - __main__ - Step 37152: {'lr': 0.0004335770250955431, 'samples': 7133184, 'steps': 37151, 'loss/train': 1.8199909925460815} -08/30/2021 19:54:42 - INFO - __main__ - Step 37153: {'lr': 0.0004335734227494478, 'samples': 7133376, 'steps': 37152, 'loss/train': 1.0068362951278687} -08/30/2021 19:54:42 - INFO - __main__ - Step 37154: {'lr': 0.0004335698203206372, 'samples': 7133568, 'steps': 37153, 'loss/train': 1.2943278551101685} -08/30/2021 19:54:42 - INFO - __main__ - Step 37155: {'lr': 0.00043356621780911273, 'samples': 7133760, 'steps': 37154, 'loss/train': 1.223723292350769} -08/30/2021 19:54:43 - INFO - __main__ - Step 37156: {'lr': 0.0004335626152148763, 'samples': 7133952, 'steps': 37155, 'loss/train': 0.8880375623703003} -08/30/2021 19:54:43 - INFO - __main__ - Step 37157: {'lr': 0.0004335590125379293, 'samples': 7134144, 'steps': 37156, 'loss/train': 1.708461046218872} -08/30/2021 19:54:44 - INFO - __main__ - Step 37158: {'lr': 0.00043355540977827356, 'samples': 7134336, 'steps': 37157, 'loss/train': 1.7664451599121094} -08/30/2021 19:54:46 - INFO - __main__ - Step 37159: {'lr': 0.0004335518069359105, 'samples': 7134528, 'steps': 37158, 'loss/train': 1.7524760961532593} -08/30/2021 19:54:46 - INFO - __main__ - Step 37160: {'lr': 0.0004335482040108418, 'samples': 7134720, 'steps': 37159, 'loss/train': 1.235119342803955} -08/30/2021 19:54:47 - INFO - __main__ - Step 37161: {'lr': 0.00043354460100306915, 'samples': 7134912, 'steps': 37160, 'loss/train': 1.0423471927642822} -08/30/2021 19:54:47 - INFO - __main__ - Step 37162: {'lr': 0.00043354099791259414, 'samples': 7135104, 'steps': 37161, 'loss/train': 1.8361793756484985} -08/30/2021 19:54:47 - INFO - __main__ - Step 37163: {'lr': 0.00043353739473941846, 'samples': 7135296, 'steps': 37162, 'loss/train': 2.021512985229492} -08/30/2021 19:54:49 - INFO - __main__ - Step 37164: {'lr': 0.0004335337914835435, 'samples': 7135488, 'steps': 37163, 'loss/train': 1.564961552619934} -08/30/2021 19:54:49 - INFO - __main__ - Step 37165: {'lr': 0.0004335301881449711, 'samples': 7135680, 'steps': 37164, 'loss/train': 0.5492373704910278} -08/30/2021 19:54:50 - INFO - __main__ - Step 37166: {'lr': 0.00043352658472370294, 'samples': 7135872, 'steps': 37165, 'loss/train': 1.3987257480621338} -08/30/2021 19:54:50 - INFO - __main__ - Step 37167: {'lr': 0.00043352298121974043, 'samples': 7136064, 'steps': 37166, 'loss/train': 1.5350240468978882} -08/30/2021 19:54:50 - INFO - __main__ - Step 37168: {'lr': 0.00043351937763308533, 'samples': 7136256, 'steps': 37167, 'loss/train': 1.6532922983169556} -08/30/2021 19:54:52 - INFO - __main__ - Step 37169: {'lr': 0.0004335157739637392, 'samples': 7136448, 'steps': 37168, 'loss/train': 1.6544990539550781} -08/30/2021 19:54:52 - INFO - __main__ - Step 37170: {'lr': 0.0004335121702117038, 'samples': 7136640, 'steps': 37169, 'loss/train': 1.416341781616211} -08/30/2021 19:54:53 - INFO - __main__ - Step 37171: {'lr': 0.0004335085663769805, 'samples': 7136832, 'steps': 37170, 'loss/train': 0.6026067733764648} -08/30/2021 19:54:53 - INFO - __main__ - Step 37172: {'lr': 0.00043350496245957116, 'samples': 7137024, 'steps': 37171, 'loss/train': 2.3104517459869385} -08/30/2021 19:54:54 - INFO - __main__ - Step 37173: {'lr': 0.00043350135845947725, 'samples': 7137216, 'steps': 37172, 'loss/train': 1.5542380809783936} -08/30/2021 19:54:55 - INFO - __main__ - Step 37174: {'lr': 0.00043349775437670046, 'samples': 7137408, 'steps': 37173, 'loss/train': 1.3513115644454956} -08/30/2021 19:54:56 - INFO - __main__ - Step 37175: {'lr': 0.0004334941502112425, 'samples': 7137600, 'steps': 37174, 'loss/train': 0.10398662090301514} -08/30/2021 19:54:56 - INFO - __main__ - Step 37176: {'lr': 0.0004334905459631049, 'samples': 7137792, 'steps': 37175, 'loss/train': 0.24205230176448822} -08/30/2021 19:54:57 - INFO - __main__ - Step 37177: {'lr': 0.0004334869416322892, 'samples': 7137984, 'steps': 37176, 'loss/train': 1.1347286701202393} -08/30/2021 19:54:57 - INFO - __main__ - Step 37178: {'lr': 0.0004334833372187972, 'samples': 7138176, 'steps': 37177, 'loss/train': 0.954086184501648} -08/30/2021 19:54:58 - INFO - __main__ - Step 37179: {'lr': 0.0004334797327226304, 'samples': 7138368, 'steps': 37178, 'loss/train': 1.5092992782592773} -08/30/2021 19:54:59 - INFO - __main__ - Step 37180: {'lr': 0.00043347612814379047, 'samples': 7138560, 'steps': 37179, 'loss/train': 1.203762173652649} -08/30/2021 19:54:59 - INFO - __main__ - Step 37181: {'lr': 0.000433472523482279, 'samples': 7138752, 'steps': 37180, 'loss/train': 1.647207498550415} -08/30/2021 19:55:00 - INFO - __main__ - Step 37182: {'lr': 0.0004334689187380977, 'samples': 7138944, 'steps': 37181, 'loss/train': 1.4049173593521118} -08/30/2021 19:55:00 - INFO - __main__ - Step 37183: {'lr': 0.0004334653139112481, 'samples': 7139136, 'steps': 37182, 'loss/train': 1.3880038261413574} -08/30/2021 19:55:00 - INFO - __main__ - Step 37184: {'lr': 0.0004334617090017319, 'samples': 7139328, 'steps': 37183, 'loss/train': 1.5641449689865112} -08/30/2021 19:55:02 - INFO - __main__ - Step 37185: {'lr': 0.0004334581040095506, 'samples': 7139520, 'steps': 37184, 'loss/train': 1.4881904125213623} -08/30/2021 19:55:02 - INFO - __main__ - Step 37186: {'lr': 0.00043345449893470594, 'samples': 7139712, 'steps': 37185, 'loss/train': 1.1744705438613892} -08/30/2021 19:55:03 - INFO - __main__ - Step 37187: {'lr': 0.00043345089377719954, 'samples': 7139904, 'steps': 37186, 'loss/train': 1.065626859664917} -08/30/2021 19:55:03 - INFO - __main__ - Step 37188: {'lr': 0.00043344728853703297, 'samples': 7140096, 'steps': 37187, 'loss/train': 1.326798677444458} -08/30/2021 19:55:03 - INFO - __main__ - Step 37189: {'lr': 0.0004334436832142079, 'samples': 7140288, 'steps': 37188, 'loss/train': 1.3048057556152344} -08/30/2021 19:55:06 - INFO - __main__ - Step 37190: {'lr': 0.000433440077808726, 'samples': 7140480, 'steps': 37189, 'loss/train': 1.572681188583374} -08/30/2021 19:55:06 - INFO - __main__ - Step 37191: {'lr': 0.00043343647232058877, 'samples': 7140672, 'steps': 37190, 'loss/train': 1.8363094329833984} -08/30/2021 19:55:07 - INFO - __main__ - Step 37192: {'lr': 0.0004334328667497979, 'samples': 7140864, 'steps': 37191, 'loss/train': 2.047091245651245} -08/30/2021 19:55:07 - INFO - __main__ - Step 37193: {'lr': 0.00043342926109635497, 'samples': 7141056, 'steps': 37192, 'loss/train': 0.43282344937324524} -08/30/2021 19:55:07 - INFO - __main__ - Step 37194: {'lr': 0.0004334256553602617, 'samples': 7141248, 'steps': 37193, 'loss/train': 2.75614857673645} -08/30/2021 19:55:08 - INFO - __main__ - Step 37195: {'lr': 0.00043342204954151963, 'samples': 7141440, 'steps': 37194, 'loss/train': 1.511721134185791} -08/30/2021 19:55:08 - INFO - __main__ - Step 37196: {'lr': 0.00043341844364013047, 'samples': 7141632, 'steps': 37195, 'loss/train': 1.2944092750549316} -08/30/2021 19:55:10 - INFO - __main__ - Step 37197: {'lr': 0.00043341483765609566, 'samples': 7141824, 'steps': 37196, 'loss/train': 1.5528048276901245} -08/30/2021 19:55:10 - INFO - __main__ - Step 37198: {'lr': 0.0004334112315894171, 'samples': 7142016, 'steps': 37197, 'loss/train': 0.17207683622837067} -08/30/2021 19:55:10 - INFO - __main__ - Step 37199: {'lr': 0.00043340762544009627, 'samples': 7142208, 'steps': 37198, 'loss/train': 1.4666324853897095} -08/30/2021 19:55:11 - INFO - __main__ - Step 37200: {'lr': 0.0004334040192081347, 'samples': 7142400, 'steps': 37199, 'loss/train': 1.9627348184585571} -08/30/2021 19:55:11 - INFO - __main__ - Step 37201: {'lr': 0.00043340041289353416, 'samples': 7142592, 'steps': 37200, 'loss/train': 1.0309817790985107} -08/30/2021 19:55:13 - INFO - __main__ - Step 37202: {'lr': 0.0004333968064962962, 'samples': 7142784, 'steps': 37201, 'loss/train': 1.6099499464035034} -08/30/2021 19:55:14 - INFO - __main__ - Step 37203: {'lr': 0.00043339320001642244, 'samples': 7142976, 'steps': 37202, 'loss/train': 1.5217416286468506} -08/30/2021 19:55:14 - INFO - __main__ - Step 37204: {'lr': 0.0004333895934539146, 'samples': 7143168, 'steps': 37203, 'loss/train': 2.3480777740478516} -08/30/2021 19:55:15 - INFO - __main__ - Step 37205: {'lr': 0.00043338598680877423, 'samples': 7143360, 'steps': 37204, 'loss/train': 1.8372015953063965} -08/30/2021 19:55:15 - INFO - __main__ - Step 37206: {'lr': 0.00043338238008100297, 'samples': 7143552, 'steps': 37205, 'loss/train': 1.8181730508804321} -08/30/2021 19:55:15 - INFO - __main__ - Step 37207: {'lr': 0.0004333787732706024, 'samples': 7143744, 'steps': 37206, 'loss/train': 1.7918623685836792} -08/30/2021 19:55:16 - INFO - __main__ - Step 37208: {'lr': 0.00043337516637757416, 'samples': 7143936, 'steps': 37207, 'loss/train': 1.2571052312850952} -08/30/2021 19:55:17 - INFO - __main__ - Step 37209: {'lr': 0.00043337155940191996, 'samples': 7144128, 'steps': 37208, 'loss/train': 1.115092158317566} -08/30/2021 19:55:18 - INFO - __main__ - Step 37210: {'lr': 0.0004333679523436413, 'samples': 7144320, 'steps': 37209, 'loss/train': 1.2502648830413818} -08/30/2021 19:55:18 - INFO - __main__ - Step 37211: {'lr': 0.0004333643452027399, 'samples': 7144512, 'steps': 37210, 'loss/train': 0.840894877910614} -08/30/2021 19:55:18 - INFO - __main__ - Step 37212: {'lr': 0.00043336073797921743, 'samples': 7144704, 'steps': 37211, 'loss/train': 0.8375406861305237} -08/30/2021 19:55:19 - INFO - __main__ - Step 37213: {'lr': 0.0004333571306730754, 'samples': 7144896, 'steps': 37212, 'loss/train': 1.2654939889907837} -08/30/2021 19:55:19 - INFO - __main__ - Step 37214: {'lr': 0.00043335352328431544, 'samples': 7145088, 'steps': 37213, 'loss/train': 0.24022336304187775} -08/30/2021 19:55:21 - INFO - __main__ - Step 37215: {'lr': 0.00043334991581293924, 'samples': 7145280, 'steps': 37214, 'loss/train': 1.8620597124099731} -08/30/2021 19:55:21 - INFO - __main__ - Step 37216: {'lr': 0.0004333463082589484, 'samples': 7145472, 'steps': 37215, 'loss/train': 1.8533010482788086} -08/30/2021 19:55:22 - INFO - __main__ - Step 37217: {'lr': 0.0004333427006223445, 'samples': 7145664, 'steps': 37216, 'loss/train': 1.8302745819091797} -08/30/2021 19:55:22 - INFO - __main__ - Step 37218: {'lr': 0.00043333909290312923, 'samples': 7145856, 'steps': 37217, 'loss/train': 1.461767554283142} -08/30/2021 19:55:22 - INFO - __main__ - Step 37219: {'lr': 0.00043333548510130426, 'samples': 7146048, 'steps': 37218, 'loss/train': 1.3717758655548096} -08/30/2021 19:55:24 - INFO - __main__ - Step 37220: {'lr': 0.00043333187721687104, 'samples': 7146240, 'steps': 37219, 'loss/train': 1.4820228815078735} -08/30/2021 19:55:24 - INFO - __main__ - Step 37221: {'lr': 0.0004333282692498314, 'samples': 7146432, 'steps': 37220, 'loss/train': 1.2022372484207153} -08/30/2021 19:55:25 - INFO - __main__ - Step 37222: {'lr': 0.00043332466120018685, 'samples': 7146624, 'steps': 37221, 'loss/train': 1.107514500617981} -08/30/2021 19:55:25 - INFO - __main__ - Step 37223: {'lr': 0.000433321053067939, 'samples': 7146816, 'steps': 37222, 'loss/train': 1.4988950490951538} -08/30/2021 19:55:25 - INFO - __main__ - Step 37224: {'lr': 0.00043331744485308954, 'samples': 7147008, 'steps': 37223, 'loss/train': 1.3260629177093506} -08/30/2021 19:55:27 - INFO - __main__ - Step 37225: {'lr': 0.00043331383655564003, 'samples': 7147200, 'steps': 37224, 'loss/train': 1.2078348398208618} -08/30/2021 19:55:27 - INFO - __main__ - Step 37226: {'lr': 0.0004333102281755922, 'samples': 7147392, 'steps': 37225, 'loss/train': 1.2126277685165405} -08/30/2021 19:55:28 - INFO - __main__ - Step 37227: {'lr': 0.0004333066197129475, 'samples': 7147584, 'steps': 37226, 'loss/train': 1.4857620000839233} -08/30/2021 19:55:28 - INFO - __main__ - Step 37228: {'lr': 0.00043330301116770777, 'samples': 7147776, 'steps': 37227, 'loss/train': 0.8882859945297241} -08/30/2021 19:55:29 - INFO - __main__ - Step 37229: {'lr': 0.0004332994025398745, 'samples': 7147968, 'steps': 37228, 'loss/train': 1.3623707294464111} -08/30/2021 19:55:30 - INFO - __main__ - Step 37230: {'lr': 0.0004332957938294493, 'samples': 7148160, 'steps': 37229, 'loss/train': 1.6523367166519165} -08/30/2021 19:55:31 - INFO - __main__ - Step 37231: {'lr': 0.0004332921850364339, 'samples': 7148352, 'steps': 37230, 'loss/train': 0.6934989094734192} -08/30/2021 19:55:31 - INFO - __main__ - Step 37232: {'lr': 0.00043328857616082986, 'samples': 7148544, 'steps': 37231, 'loss/train': 1.1358364820480347} -08/30/2021 19:55:31 - INFO - __main__ - Step 37233: {'lr': 0.0004332849672026388, 'samples': 7148736, 'steps': 37232, 'loss/train': 1.2381203174591064} -08/30/2021 19:55:32 - INFO - __main__ - Step 37234: {'lr': 0.0004332813581618624, 'samples': 7148928, 'steps': 37233, 'loss/train': 1.1748789548873901} -08/30/2021 19:55:32 - INFO - __main__ - Step 37235: {'lr': 0.00043327774903850226, 'samples': 7149120, 'steps': 37234, 'loss/train': 1.7189126014709473} -08/30/2021 19:55:33 - INFO - __main__ - Step 37236: {'lr': 0.0004332741398325599, 'samples': 7149312, 'steps': 37235, 'loss/train': 0.944999635219574} -08/30/2021 19:55:34 - INFO - __main__ - Step 37237: {'lr': 0.00043327053054403707, 'samples': 7149504, 'steps': 37236, 'loss/train': 0.4593856930732727} -08/30/2021 19:55:34 - INFO - __main__ - Step 37238: {'lr': 0.0004332669211729354, 'samples': 7149696, 'steps': 37237, 'loss/train': 1.4445148706436157} -08/30/2021 19:55:35 - INFO - __main__ - Step 37239: {'lr': 0.00043326331171925656, 'samples': 7149888, 'steps': 37238, 'loss/train': 1.6017992496490479} -08/30/2021 19:55:35 - INFO - __main__ - Step 37240: {'lr': 0.000433259702183002, 'samples': 7150080, 'steps': 37239, 'loss/train': 0.5682351589202881} -08/30/2021 19:55:36 - INFO - __main__ - Step 37241: {'lr': 0.0004332560925641734, 'samples': 7150272, 'steps': 37240, 'loss/train': 1.3645657300949097} -08/30/2021 19:55:37 - INFO - __main__ - Step 37242: {'lr': 0.0004332524828627725, 'samples': 7150464, 'steps': 37241, 'loss/train': 1.4339689016342163} -08/30/2021 19:55:37 - INFO - __main__ - Step 37243: {'lr': 0.0004332488730788009, 'samples': 7150656, 'steps': 37242, 'loss/train': 1.087787389755249} -08/30/2021 19:55:38 - INFO - __main__ - Step 37244: {'lr': 0.0004332452632122601, 'samples': 7150848, 'steps': 37243, 'loss/train': 1.5928938388824463} -08/30/2021 19:55:38 - INFO - __main__ - Step 37245: {'lr': 0.0004332416532631519, 'samples': 7151040, 'steps': 37244, 'loss/train': 0.34386229515075684} -08/30/2021 19:55:40 - INFO - __main__ - Step 37246: {'lr': 0.00043323804323147777, 'samples': 7151232, 'steps': 37245, 'loss/train': 1.358180284500122} -08/30/2021 19:55:40 - INFO - __main__ - Step 37247: {'lr': 0.0004332344331172394, 'samples': 7151424, 'steps': 37246, 'loss/train': 1.5665887594223022} -08/30/2021 19:55:41 - INFO - __main__ - Step 37248: {'lr': 0.0004332308229204385, 'samples': 7151616, 'steps': 37247, 'loss/train': 1.357224941253662} -08/30/2021 19:55:41 - INFO - __main__ - Step 37249: {'lr': 0.00043322721264107657, 'samples': 7151808, 'steps': 37248, 'loss/train': 1.1494323015213013} -08/30/2021 19:55:41 - INFO - __main__ - Step 37250: {'lr': 0.00043322360227915526, 'samples': 7152000, 'steps': 37249, 'loss/train': 0.16026242077350616} -08/30/2021 19:55:43 - INFO - __main__ - Step 37251: {'lr': 0.0004332199918346763, 'samples': 7152192, 'steps': 37250, 'loss/train': 0.15770988166332245} -08/30/2021 19:55:43 - INFO - __main__ - Step 37252: {'lr': 0.00043321638130764116, 'samples': 7152384, 'steps': 37251, 'loss/train': 1.315923810005188} -08/30/2021 19:55:44 - INFO - __main__ - Step 37253: {'lr': 0.00043321277069805153, 'samples': 7152576, 'steps': 37252, 'loss/train': 0.7792982459068298} -08/30/2021 19:55:44 - INFO - __main__ - Step 37254: {'lr': 0.0004332091600059091, 'samples': 7152768, 'steps': 37253, 'loss/train': 1.541377067565918} -08/30/2021 19:55:44 - INFO - __main__ - Step 37255: {'lr': 0.00043320554923121545, 'samples': 7152960, 'steps': 37254, 'loss/train': 1.4678643941879272} -08/30/2021 19:55:45 - INFO - __main__ - Step 37256: {'lr': 0.0004332019383739722, 'samples': 7153152, 'steps': 37255, 'loss/train': 1.4669246673583984} -08/30/2021 19:55:47 - INFO - __main__ - Step 37257: {'lr': 0.000433198327434181, 'samples': 7153344, 'steps': 37256, 'loss/train': 1.6319292783737183} -08/30/2021 19:55:47 - INFO - __main__ - Step 37258: {'lr': 0.0004331947164118434, 'samples': 7153536, 'steps': 37257, 'loss/train': 1.3833212852478027} -08/30/2021 19:55:47 - INFO - __main__ - Step 37259: {'lr': 0.00043319110530696116, 'samples': 7153728, 'steps': 37258, 'loss/train': 1.1719000339508057} -08/30/2021 19:55:48 - INFO - __main__ - Step 37260: {'lr': 0.00043318749411953584, 'samples': 7153920, 'steps': 37259, 'loss/train': 1.6889448165893555} -08/30/2021 19:55:48 - INFO - __main__ - Step 37261: {'lr': 0.000433183882849569, 'samples': 7154112, 'steps': 37260, 'loss/train': 1.5338735580444336} -08/30/2021 19:55:49 - INFO - __main__ - Step 37262: {'lr': 0.0004331802714970624, 'samples': 7154304, 'steps': 37261, 'loss/train': 1.3940200805664062} -08/30/2021 19:55:50 - INFO - __main__ - Step 37263: {'lr': 0.0004331766600620175, 'samples': 7154496, 'steps': 37262, 'loss/train': 1.5051100254058838} -08/30/2021 19:55:50 - INFO - __main__ - Step 37264: {'lr': 0.00043317304854443607, 'samples': 7154688, 'steps': 37263, 'loss/train': 1.626781940460205} -08/30/2021 19:55:51 - INFO - __main__ - Step 37265: {'lr': 0.0004331694369443197, 'samples': 7154880, 'steps': 37264, 'loss/train': 1.3269175291061401} -08/30/2021 19:55:51 - INFO - __main__ - Step 37266: {'lr': 0.00043316582526167004, 'samples': 7155072, 'steps': 37265, 'loss/train': 1.393304467201233} -08/30/2021 19:55:53 - INFO - __main__ - Step 37267: {'lr': 0.0004331622134964887, 'samples': 7155264, 'steps': 37266, 'loss/train': 1.2010682821273804} -08/30/2021 19:55:53 - INFO - __main__ - Step 37268: {'lr': 0.0004331586016487772, 'samples': 7155456, 'steps': 37267, 'loss/train': 0.3664584457874298} -08/30/2021 19:55:53 - INFO - __main__ - Step 37269: {'lr': 0.00043315498971853726, 'samples': 7155648, 'steps': 37268, 'loss/train': 0.09463349729776382} -08/30/2021 19:55:54 - INFO - __main__ - Step 37270: {'lr': 0.0004331513777057706, 'samples': 7155840, 'steps': 37269, 'loss/train': 1.4243720769882202} -08/30/2021 19:55:54 - INFO - __main__ - Step 37271: {'lr': 0.00043314776561047865, 'samples': 7156032, 'steps': 37270, 'loss/train': 1.5816227197647095} -08/30/2021 19:55:56 - INFO - __main__ - Step 37272: {'lr': 0.0004331441534326632, 'samples': 7156224, 'steps': 37271, 'loss/train': 1.6990299224853516} -08/30/2021 19:55:56 - INFO - __main__ - Step 37273: {'lr': 0.0004331405411723258, 'samples': 7156416, 'steps': 37272, 'loss/train': 1.6356576681137085} -08/30/2021 19:55:57 - INFO - __main__ - Step 37274: {'lr': 0.0004331369288294681, 'samples': 7156608, 'steps': 37273, 'loss/train': 1.199906587600708} -08/30/2021 19:55:57 - INFO - __main__ - Step 37275: {'lr': 0.0004331333164040918, 'samples': 7156800, 'steps': 37274, 'loss/train': 1.1874136924743652} -08/30/2021 19:55:58 - INFO - __main__ - Step 37276: {'lr': 0.0004331297038961984, 'samples': 7156992, 'steps': 37275, 'loss/train': 1.125455379486084} -08/30/2021 19:55:59 - INFO - __main__ - Step 37277: {'lr': 0.00043312609130578963, 'samples': 7157184, 'steps': 37276, 'loss/train': 1.2430005073547363} -08/30/2021 19:56:00 - INFO - __main__ - Step 37278: {'lr': 0.000433122478632867, 'samples': 7157376, 'steps': 37277, 'loss/train': 0.1170068085193634} -08/30/2021 19:56:00 - INFO - __main__ - Step 37279: {'lr': 0.0004331188658774322, 'samples': 7157568, 'steps': 37278, 'loss/train': 1.7714715003967285} -08/30/2021 19:56:00 - INFO - __main__ - Step 37280: {'lr': 0.00043311525303948685, 'samples': 7157760, 'steps': 37279, 'loss/train': 0.8312937617301941} -08/30/2021 19:56:01 - INFO - __main__ - Step 37281: {'lr': 0.0004331116401190327, 'samples': 7157952, 'steps': 37280, 'loss/train': 1.6909489631652832} -08/30/2021 19:56:02 - INFO - __main__ - Step 37282: {'lr': 0.0004331080271160712, 'samples': 7158144, 'steps': 37281, 'loss/train': 1.5297600030899048} -08/30/2021 19:56:03 - INFO - __main__ - Step 37283: {'lr': 0.00043310441403060404, 'samples': 7158336, 'steps': 37282, 'loss/train': 1.5976977348327637} -08/30/2021 19:56:03 - INFO - __main__ - Step 37284: {'lr': 0.00043310080086263284, 'samples': 7158528, 'steps': 37283, 'loss/train': 1.4269418716430664} -08/30/2021 19:56:03 - INFO - __main__ - Step 37285: {'lr': 0.0004330971876121593, 'samples': 7158720, 'steps': 37284, 'loss/train': 1.2697572708129883} -08/30/2021 19:56:04 - INFO - __main__ - Step 37286: {'lr': 0.0004330935742791849, 'samples': 7158912, 'steps': 37285, 'loss/train': 1.423542857170105} -08/30/2021 19:56:06 - INFO - __main__ - Step 37287: {'lr': 0.00043308996086371146, 'samples': 7159104, 'steps': 37286, 'loss/train': 2.171774387359619} -08/30/2021 19:56:06 - INFO - __main__ - Step 37288: {'lr': 0.0004330863473657405, 'samples': 7159296, 'steps': 37287, 'loss/train': 1.756593942642212} -08/30/2021 19:56:07 - INFO - __main__ - Step 37289: {'lr': 0.00043308273378527364, 'samples': 7159488, 'steps': 37288, 'loss/train': 1.410674810409546} -08/30/2021 19:56:07 - INFO - __main__ - Step 37290: {'lr': 0.00043307912012231255, 'samples': 7159680, 'steps': 37289, 'loss/train': 1.7248365879058838} -08/30/2021 19:56:07 - INFO - __main__ - Step 37291: {'lr': 0.0004330755063768588, 'samples': 7159872, 'steps': 37290, 'loss/train': 0.11255665123462677} -08/30/2021 19:56:08 - INFO - __main__ - Step 37292: {'lr': 0.000433071892548914, 'samples': 7160064, 'steps': 37291, 'loss/train': 0.06722675263881683} -08/30/2021 19:56:08 - INFO - __main__ - Step 37293: {'lr': 0.00043306827863847985, 'samples': 7160256, 'steps': 37292, 'loss/train': 1.6550936698913574} -08/30/2021 19:56:10 - INFO - __main__ - Step 37294: {'lr': 0.00043306466464555803, 'samples': 7160448, 'steps': 37293, 'loss/train': 0.29456886649131775} -08/30/2021 19:56:10 - INFO - __main__ - Step 37295: {'lr': 0.0004330610505701501, 'samples': 7160640, 'steps': 37294, 'loss/train': 1.5085599422454834} -08/30/2021 19:56:11 - INFO - __main__ - Step 37296: {'lr': 0.00043305743641225766, 'samples': 7160832, 'steps': 37295, 'loss/train': 1.5765646696090698} -08/30/2021 19:56:11 - INFO - __main__ - Step 37297: {'lr': 0.00043305382217188225, 'samples': 7161024, 'steps': 37296, 'loss/train': 1.4817980527877808} -08/30/2021 19:56:11 - INFO - __main__ - Step 37298: {'lr': 0.0004330502078490258, 'samples': 7161216, 'steps': 37297, 'loss/train': 1.6245449781417847} -08/30/2021 19:56:13 - INFO - __main__ - Step 37299: {'lr': 0.0004330465934436896, 'samples': 7161408, 'steps': 37298, 'loss/train': 1.7996934652328491} -08/30/2021 19:56:13 - INFO - __main__ - Step 37300: {'lr': 0.00043304297895587553, 'samples': 7161600, 'steps': 37299, 'loss/train': 1.0784474611282349} -08/30/2021 19:56:14 - INFO - __main__ - Step 37301: {'lr': 0.0004330393643855851, 'samples': 7161792, 'steps': 37300, 'loss/train': 1.261918067932129} -08/30/2021 19:56:14 - INFO - __main__ - Step 37302: {'lr': 0.0004330357497328199, 'samples': 7161984, 'steps': 37301, 'loss/train': 1.263678789138794} -08/30/2021 19:56:14 - INFO - __main__ - Step 37303: {'lr': 0.00043303213499758166, 'samples': 7162176, 'steps': 37302, 'loss/train': 1.6204594373703003} -08/30/2021 19:56:16 - INFO - __main__ - Step 37304: {'lr': 0.00043302852017987196, 'samples': 7162368, 'steps': 37303, 'loss/train': 1.5933401584625244} -08/30/2021 19:56:17 - INFO - __main__ - Step 37305: {'lr': 0.0004330249052796924, 'samples': 7162560, 'steps': 37304, 'loss/train': 0.846378743648529} -08/30/2021 19:56:17 - INFO - __main__ - Step 37306: {'lr': 0.0004330212902970447, 'samples': 7162752, 'steps': 37305, 'loss/train': 1.3449466228485107} -08/30/2021 19:56:17 - INFO - __main__ - Step 37307: {'lr': 0.0004330176752319304, 'samples': 7162944, 'steps': 37306, 'loss/train': 1.298366904258728} -08/30/2021 19:56:18 - INFO - __main__ - Step 37308: {'lr': 0.0004330140600843512, 'samples': 7163136, 'steps': 37307, 'loss/train': 0.14137066900730133} -08/30/2021 19:56:18 - INFO - __main__ - Step 37309: {'lr': 0.0004330104448543086, 'samples': 7163328, 'steps': 37308, 'loss/train': 1.425593376159668} -08/30/2021 19:56:20 - INFO - __main__ - Step 37310: {'lr': 0.0004330068295418044, 'samples': 7163520, 'steps': 37309, 'loss/train': 1.1895626783370972} -08/30/2021 19:56:20 - INFO - __main__ - Step 37311: {'lr': 0.0004330032141468401, 'samples': 7163712, 'steps': 37310, 'loss/train': 1.4988731145858765} -08/30/2021 19:56:20 - INFO - __main__ - Step 37312: {'lr': 0.0004329995986694174, 'samples': 7163904, 'steps': 37311, 'loss/train': 1.6009279489517212} -08/30/2021 19:56:21 - INFO - __main__ - Step 37313: {'lr': 0.00043299598310953793, 'samples': 7164096, 'steps': 37312, 'loss/train': 1.7883325815200806} -08/30/2021 19:56:21 - INFO - __main__ - Step 37314: {'lr': 0.0004329923674672032, 'samples': 7164288, 'steps': 37313, 'loss/train': 1.531451940536499} -08/30/2021 19:56:23 - INFO - __main__ - Step 37315: {'lr': 0.00043298875174241504, 'samples': 7164480, 'steps': 37314, 'loss/train': 1.3104544878005981} -08/30/2021 19:56:23 - INFO - __main__ - Step 37316: {'lr': 0.00043298513593517483, 'samples': 7164672, 'steps': 37315, 'loss/train': 1.6571338176727295} -08/30/2021 19:56:24 - INFO - __main__ - Step 37317: {'lr': 0.0004329815200454845, 'samples': 7164864, 'steps': 37316, 'loss/train': 0.07107654958963394} -08/30/2021 19:56:24 - INFO - __main__ - Step 37318: {'lr': 0.00043297790407334545, 'samples': 7165056, 'steps': 37317, 'loss/train': 1.0674660205841064} -08/30/2021 19:56:24 - INFO - __main__ - Step 37319: {'lr': 0.0004329742880187594, 'samples': 7165248, 'steps': 37318, 'loss/train': 1.6088038682937622} -08/30/2021 19:56:26 - INFO - __main__ - Step 37320: {'lr': 0.0004329706718817279, 'samples': 7165440, 'steps': 37319, 'loss/train': 1.5619314908981323} -08/30/2021 19:56:27 - INFO - __main__ - Step 37321: {'lr': 0.00043296705566225267, 'samples': 7165632, 'steps': 37320, 'loss/train': 1.4305415153503418} -08/30/2021 19:56:27 - INFO - __main__ - Step 37322: {'lr': 0.00043296343936033535, 'samples': 7165824, 'steps': 37321, 'loss/train': 1.6878626346588135} -08/30/2021 19:56:27 - INFO - __main__ - Step 37323: {'lr': 0.0004329598229759775, 'samples': 7166016, 'steps': 37322, 'loss/train': 1.2063426971435547} -08/30/2021 19:56:28 - INFO - __main__ - Step 37324: {'lr': 0.00043295620650918076, 'samples': 7166208, 'steps': 37323, 'loss/train': 0.07216602563858032} -08/30/2021 19:56:28 - INFO - __main__ - Step 37325: {'lr': 0.0004329525899599468, 'samples': 7166400, 'steps': 37324, 'loss/train': 0.3446216881275177} -08/30/2021 19:56:30 - INFO - __main__ - Step 37326: {'lr': 0.0004329489733282772, 'samples': 7166592, 'steps': 37325, 'loss/train': 0.14824801683425903} -08/30/2021 19:56:30 - INFO - __main__ - Step 37327: {'lr': 0.0004329453566141737, 'samples': 7166784, 'steps': 37326, 'loss/train': 1.5553874969482422} -08/30/2021 19:56:31 - INFO - __main__ - Step 37328: {'lr': 0.00043294173981763776, 'samples': 7166976, 'steps': 37327, 'loss/train': 1.5382400751113892} -08/30/2021 19:56:31 - INFO - __main__ - Step 37329: {'lr': 0.00043293812293867113, 'samples': 7167168, 'steps': 37328, 'loss/train': 1.0531420707702637} -08/30/2021 19:56:31 - INFO - __main__ - Step 37330: {'lr': 0.0004329345059772754, 'samples': 7167360, 'steps': 37329, 'loss/train': 1.4449208974838257} -08/30/2021 19:56:33 - INFO - __main__ - Step 37331: {'lr': 0.0004329308889334522, 'samples': 7167552, 'steps': 37330, 'loss/train': 1.391638159751892} -08/30/2021 19:56:33 - INFO - __main__ - Step 37332: {'lr': 0.00043292727180720315, 'samples': 7167744, 'steps': 37331, 'loss/train': 1.972778558731079} -08/30/2021 19:56:34 - INFO - __main__ - Step 37333: {'lr': 0.0004329236545985299, 'samples': 7167936, 'steps': 37332, 'loss/train': 1.0132642984390259} -08/30/2021 19:56:34 - INFO - __main__ - Step 37334: {'lr': 0.000432920037307434, 'samples': 7168128, 'steps': 37333, 'loss/train': 1.914176106452942} -08/30/2021 19:56:34 - INFO - __main__ - Step 37335: {'lr': 0.00043291641993391727, 'samples': 7168320, 'steps': 37334, 'loss/train': 1.3197611570358276} -08/30/2021 19:56:36 - INFO - __main__ - Step 37336: {'lr': 0.0004329128024779812, 'samples': 7168512, 'steps': 37335, 'loss/train': 0.8799515962600708} -08/30/2021 19:56:37 - INFO - __main__ - Step 37337: {'lr': 0.0004329091849396274, 'samples': 7168704, 'steps': 37336, 'loss/train': 1.0617070198059082} -08/30/2021 19:56:37 - INFO - __main__ - Step 37338: {'lr': 0.00043290556731885756, 'samples': 7168896, 'steps': 37337, 'loss/train': 1.0679913759231567} -08/30/2021 19:56:37 - INFO - __main__ - Step 37339: {'lr': 0.0004329019496156733, 'samples': 7169088, 'steps': 37338, 'loss/train': 0.05821027234196663} -08/30/2021 19:56:38 - INFO - __main__ - Step 37340: {'lr': 0.0004328983318300763, 'samples': 7169280, 'steps': 37339, 'loss/train': 0.5832203030586243} -08/30/2021 19:56:39 - INFO - __main__ - Step 37341: {'lr': 0.00043289471396206803, 'samples': 7169472, 'steps': 37340, 'loss/train': 2.432037830352783} -08/30/2021 19:56:40 - INFO - __main__ - Step 37342: {'lr': 0.0004328910960116503, 'samples': 7169664, 'steps': 37341, 'loss/train': 1.2108513116836548} -08/30/2021 19:56:40 - INFO - __main__ - Step 37343: {'lr': 0.00043288747797882467, 'samples': 7169856, 'steps': 37342, 'loss/train': 1.0174715518951416} -08/30/2021 19:56:40 - INFO - __main__ - Step 37344: {'lr': 0.00043288385986359266, 'samples': 7170048, 'steps': 37343, 'loss/train': 1.4958276748657227} -08/30/2021 19:56:41 - INFO - __main__ - Step 37345: {'lr': 0.00043288024166595614, 'samples': 7170240, 'steps': 37344, 'loss/train': 1.271643042564392} -08/30/2021 19:56:41 - INFO - __main__ - Step 37346: {'lr': 0.00043287662338591657, 'samples': 7170432, 'steps': 37345, 'loss/train': 1.5020782947540283} -08/30/2021 19:56:43 - INFO - __main__ - Step 37347: {'lr': 0.0004328730050234756, 'samples': 7170624, 'steps': 37346, 'loss/train': 1.7531085014343262} -08/30/2021 19:56:43 - INFO - __main__ - Step 37348: {'lr': 0.00043286938657863483, 'samples': 7170816, 'steps': 37347, 'loss/train': 1.0881903171539307} -08/30/2021 19:56:43 - INFO - __main__ - Step 37349: {'lr': 0.00043286576805139597, 'samples': 7171008, 'steps': 37348, 'loss/train': 1.3239662647247314} -08/30/2021 19:56:44 - INFO - __main__ - Step 37350: {'lr': 0.0004328621494417606, 'samples': 7171200, 'steps': 37349, 'loss/train': 1.359250783920288} -08/30/2021 19:56:44 - INFO - __main__ - Step 37351: {'lr': 0.0004328585307497304, 'samples': 7171392, 'steps': 37350, 'loss/train': 1.7430981397628784} -08/30/2021 19:56:44 - INFO - __main__ - Step 37352: {'lr': 0.00043285491197530694, 'samples': 7171584, 'steps': 37351, 'loss/train': 1.6985012292861938} -08/30/2021 19:56:46 - INFO - __main__ - Step 37353: {'lr': 0.00043285129311849193, 'samples': 7171776, 'steps': 37352, 'loss/train': 0.9445045590400696} -08/30/2021 19:56:46 - INFO - __main__ - Step 37354: {'lr': 0.0004328476741792869, 'samples': 7171968, 'steps': 37353, 'loss/train': 0.12586896121501923} -08/30/2021 19:56:47 - INFO - __main__ - Step 37355: {'lr': 0.00043284405515769356, 'samples': 7172160, 'steps': 37354, 'loss/train': 1.033687710762024} -08/30/2021 19:56:47 - INFO - __main__ - Step 37356: {'lr': 0.00043284043605371346, 'samples': 7172352, 'steps': 37355, 'loss/train': 1.3645912408828735} -08/30/2021 19:56:49 - INFO - __main__ - Step 37357: {'lr': 0.0004328368168673483, 'samples': 7172544, 'steps': 37356, 'loss/train': 1.8850632905960083} -08/30/2021 19:56:49 - INFO - __main__ - Step 37358: {'lr': 0.00043283319759859974, 'samples': 7172736, 'steps': 37357, 'loss/train': 1.6752790212631226} -08/30/2021 19:56:49 - INFO - __main__ - Step 37359: {'lr': 0.0004328295782474693, 'samples': 7172928, 'steps': 37358, 'loss/train': 1.166944980621338} -08/30/2021 19:56:50 - INFO - __main__ - Step 37360: {'lr': 0.0004328259588139587, 'samples': 7173120, 'steps': 37359, 'loss/train': 1.457136869430542} -08/30/2021 19:56:50 - INFO - __main__ - Step 37361: {'lr': 0.0004328223392980696, 'samples': 7173312, 'steps': 37360, 'loss/train': 2.1077630519866943} -08/30/2021 19:56:50 - INFO - __main__ - Step 37362: {'lr': 0.00043281871969980346, 'samples': 7173504, 'steps': 37361, 'loss/train': 1.880540370941162} -08/30/2021 19:56:52 - INFO - __main__ - Step 37363: {'lr': 0.00043281510001916214, 'samples': 7173696, 'steps': 37362, 'loss/train': 2.121408224105835} -08/30/2021 19:56:52 - INFO - __main__ - Step 37364: {'lr': 0.0004328114802561471, 'samples': 7173888, 'steps': 37363, 'loss/train': 1.6379472017288208} -08/30/2021 19:56:53 - INFO - __main__ - Step 37365: {'lr': 0.00043280786041076006, 'samples': 7174080, 'steps': 37364, 'loss/train': 1.5812128782272339} -08/30/2021 19:56:53 - INFO - __main__ - Step 37366: {'lr': 0.0004328042404830026, 'samples': 7174272, 'steps': 37365, 'loss/train': 1.535988450050354} -08/30/2021 19:56:53 - INFO - __main__ - Step 37367: {'lr': 0.0004328006204728763, 'samples': 7174464, 'steps': 37366, 'loss/train': 1.198941946029663} -08/30/2021 19:56:55 - INFO - __main__ - Step 37368: {'lr': 0.00043279700038038296, 'samples': 7174656, 'steps': 37367, 'loss/train': 1.422837257385254} -08/30/2021 19:56:55 - INFO - __main__ - Step 37369: {'lr': 0.0004327933802055241, 'samples': 7174848, 'steps': 37368, 'loss/train': 1.2558835744857788} -08/30/2021 19:56:56 - INFO - __main__ - Step 37370: {'lr': 0.0004327897599483013, 'samples': 7175040, 'steps': 37369, 'loss/train': 1.3162193298339844} -08/30/2021 19:56:56 - INFO - __main__ - Step 37371: {'lr': 0.00043278613960871624, 'samples': 7175232, 'steps': 37370, 'loss/train': 1.0559483766555786} -08/30/2021 19:56:56 - INFO - __main__ - Step 37372: {'lr': 0.00043278251918677066, 'samples': 7175424, 'steps': 37371, 'loss/train': 0.9671065807342529} -08/30/2021 19:56:58 - INFO - __main__ - Step 37373: {'lr': 0.00043277889868246605, 'samples': 7175616, 'steps': 37372, 'loss/train': 1.4900364875793457} -08/30/2021 19:56:59 - INFO - __main__ - Step 37374: {'lr': 0.0004327752780958041, 'samples': 7175808, 'steps': 37373, 'loss/train': 0.9577486515045166} -08/30/2021 19:56:59 - INFO - __main__ - Step 37375: {'lr': 0.0004327716574267864, 'samples': 7176000, 'steps': 37374, 'loss/train': 2.4016902446746826} -08/30/2021 19:56:59 - INFO - __main__ - Step 37376: {'lr': 0.00043276803667541465, 'samples': 7176192, 'steps': 37375, 'loss/train': 1.3319861888885498} -08/30/2021 19:57:00 - INFO - __main__ - Step 37377: {'lr': 0.0004327644158416905, 'samples': 7176384, 'steps': 37376, 'loss/train': 1.5461835861206055} -08/30/2021 19:57:02 - INFO - __main__ - Step 37378: {'lr': 0.0004327607949256154, 'samples': 7176576, 'steps': 37377, 'loss/train': 0.04532282054424286} -08/30/2021 19:57:02 - INFO - __main__ - Step 37379: {'lr': 0.00043275717392719115, 'samples': 7176768, 'steps': 37378, 'loss/train': 1.0498652458190918} -08/30/2021 19:57:02 - INFO - __main__ - Step 37380: {'lr': 0.0004327535528464194, 'samples': 7176960, 'steps': 37379, 'loss/train': 0.8886426091194153} -08/30/2021 19:57:03 - INFO - __main__ - Step 37381: {'lr': 0.0004327499316833016, 'samples': 7177152, 'steps': 37380, 'loss/train': 1.3985416889190674} -08/30/2021 19:57:03 - INFO - __main__ - Step 37382: {'lr': 0.0004327463104378395, 'samples': 7177344, 'steps': 37381, 'loss/train': 1.2480146884918213} -08/30/2021 19:57:05 - INFO - __main__ - Step 37383: {'lr': 0.0004327426891100349, 'samples': 7177536, 'steps': 37382, 'loss/train': 1.7824444770812988} -08/30/2021 19:57:06 - INFO - __main__ - Step 37384: {'lr': 0.0004327390676998891, 'samples': 7177728, 'steps': 37383, 'loss/train': 1.5549664497375488} -08/30/2021 19:57:06 - INFO - __main__ - Step 37385: {'lr': 0.000432735446207404, 'samples': 7177920, 'steps': 37384, 'loss/train': 1.207931637763977} -08/30/2021 19:57:06 - INFO - __main__ - Step 37386: {'lr': 0.0004327318246325811, 'samples': 7178112, 'steps': 37385, 'loss/train': 1.0678645372390747} -08/30/2021 19:57:07 - INFO - __main__ - Step 37387: {'lr': 0.000432728202975422, 'samples': 7178304, 'steps': 37386, 'loss/train': 0.37636715173721313} -08/30/2021 19:57:07 - INFO - __main__ - Step 37388: {'lr': 0.0004327245812359285, 'samples': 7178496, 'steps': 37387, 'loss/train': 0.088512122631073} -08/30/2021 19:57:09 - INFO - __main__ - Step 37389: {'lr': 0.000432720959414102, 'samples': 7178688, 'steps': 37388, 'loss/train': 1.6997284889221191} -08/30/2021 19:57:09 - INFO - __main__ - Step 37390: {'lr': 0.00043271733750994436, 'samples': 7178880, 'steps': 37389, 'loss/train': 1.2147971391677856} -08/30/2021 19:57:10 - INFO - __main__ - Step 37391: {'lr': 0.00043271371552345704, 'samples': 7179072, 'steps': 37390, 'loss/train': 1.3436174392700195} -08/30/2021 19:57:10 - INFO - __main__ - Step 37392: {'lr': 0.00043271009345464175, 'samples': 7179264, 'steps': 37391, 'loss/train': 0.6908589601516724} -08/30/2021 19:57:10 - INFO - __main__ - Step 37393: {'lr': 0.0004327064713035002, 'samples': 7179456, 'steps': 37392, 'loss/train': 1.4388829469680786} -08/30/2021 19:57:12 - INFO - __main__ - Step 37394: {'lr': 0.00043270284907003377, 'samples': 7179648, 'steps': 37393, 'loss/train': 1.4150233268737793} -08/30/2021 19:57:12 - INFO - __main__ - Step 37395: {'lr': 0.0004326992267542443, 'samples': 7179840, 'steps': 37394, 'loss/train': 1.4888242483139038} -08/30/2021 19:57:13 - INFO - __main__ - Step 37396: {'lr': 0.0004326956043561335, 'samples': 7180032, 'steps': 37395, 'loss/train': 1.0283443927764893} -08/30/2021 19:57:13 - INFO - __main__ - Step 37397: {'lr': 0.0004326919818757028, 'samples': 7180224, 'steps': 37396, 'loss/train': 3.0277960300445557} -08/30/2021 19:57:14 - INFO - __main__ - Step 37398: {'lr': 0.00043268835931295393, 'samples': 7180416, 'steps': 37397, 'loss/train': 0.054287899285554886} -08/30/2021 19:57:14 - INFO - __main__ - Step 37399: {'lr': 0.00043268473666788844, 'samples': 7180608, 'steps': 37398, 'loss/train': 1.6503711938858032} -08/30/2021 19:57:15 - INFO - __main__ - Step 37400: {'lr': 0.0004326811139405081, 'samples': 7180800, 'steps': 37399, 'loss/train': 1.7558388710021973} -08/30/2021 19:57:16 - INFO - __main__ - Step 37401: {'lr': 0.0004326774911308145, 'samples': 7180992, 'steps': 37400, 'loss/train': 1.7582695484161377} -08/30/2021 19:57:16 - INFO - __main__ - Step 37402: {'lr': 0.00043267386823880904, 'samples': 7181184, 'steps': 37401, 'loss/train': 1.6344903707504272} -08/30/2021 19:57:16 - INFO - __main__ - Step 37403: {'lr': 0.00043267024526449374, 'samples': 7181376, 'steps': 37402, 'loss/train': 1.507318377494812} -08/30/2021 19:57:17 - INFO - __main__ - Step 37404: {'lr': 0.00043266662220787003, 'samples': 7181568, 'steps': 37403, 'loss/train': 1.3364880084991455} -08/30/2021 19:57:18 - INFO - __main__ - Step 37405: {'lr': 0.0004326629990689395, 'samples': 7181760, 'steps': 37404, 'loss/train': 1.3650082349777222} -08/30/2021 19:57:19 - INFO - __main__ - Step 37406: {'lr': 0.0004326593758477039, 'samples': 7181952, 'steps': 37405, 'loss/train': 0.8217769265174866} -08/30/2021 19:57:19 - INFO - __main__ - Step 37407: {'lr': 0.0004326557525441648, 'samples': 7182144, 'steps': 37406, 'loss/train': 1.3236083984375} -08/30/2021 19:57:19 - INFO - __main__ - Step 37408: {'lr': 0.00043265212915832374, 'samples': 7182336, 'steps': 37407, 'loss/train': 1.3377635478973389} -08/30/2021 19:57:20 - INFO - __main__ - Step 37409: {'lr': 0.00043264850569018254, 'samples': 7182528, 'steps': 37408, 'loss/train': 1.2040746212005615} -08/30/2021 19:57:21 - INFO - __main__ - Step 37410: {'lr': 0.00043264488213974275, 'samples': 7182720, 'steps': 37409, 'loss/train': 1.322455883026123} -08/30/2021 19:57:22 - INFO - __main__ - Step 37411: {'lr': 0.000432641258507006, 'samples': 7182912, 'steps': 37410, 'loss/train': 1.3514970541000366} -08/30/2021 19:57:22 - INFO - __main__ - Step 37412: {'lr': 0.0004326376347919738, 'samples': 7183104, 'steps': 37411, 'loss/train': 0.9499925374984741} -08/30/2021 19:57:22 - INFO - __main__ - Step 37413: {'lr': 0.00043263401099464805, 'samples': 7183296, 'steps': 37412, 'loss/train': 1.6077375411987305} -08/30/2021 19:57:23 - INFO - __main__ - Step 37414: {'lr': 0.00043263038711503017, 'samples': 7183488, 'steps': 37413, 'loss/train': 1.4592623710632324} -08/30/2021 19:57:24 - INFO - __main__ - Step 37415: {'lr': 0.00043262676315312183, 'samples': 7183680, 'steps': 37414, 'loss/train': 1.508489966392517} -08/30/2021 19:57:25 - INFO - __main__ - Step 37416: {'lr': 0.0004326231391089247, 'samples': 7183872, 'steps': 37415, 'loss/train': 1.2562161684036255} -08/30/2021 19:57:25 - INFO - __main__ - Step 37417: {'lr': 0.00043261951498244045, 'samples': 7184064, 'steps': 37416, 'loss/train': 1.4437053203582764} -08/30/2021 19:57:25 - INFO - __main__ - Step 37418: {'lr': 0.0004326158907736706, 'samples': 7184256, 'steps': 37417, 'loss/train': 1.0420544147491455} -08/30/2021 19:57:26 - INFO - __main__ - Step 37419: {'lr': 0.00043261226648261687, 'samples': 7184448, 'steps': 37418, 'loss/train': 1.6170576810836792} -08/30/2021 19:57:27 - INFO - __main__ - Step 37420: {'lr': 0.0004326086421092809, 'samples': 7184640, 'steps': 37419, 'loss/train': 1.7398796081542969} -08/30/2021 19:57:28 - INFO - __main__ - Step 37421: {'lr': 0.00043260501765366425, 'samples': 7184832, 'steps': 37420, 'loss/train': 1.1298325061798096} -08/30/2021 19:57:28 - INFO - __main__ - Step 37422: {'lr': 0.00043260139311576863, 'samples': 7185024, 'steps': 37421, 'loss/train': 0.9653279185295105} -08/30/2021 19:57:28 - INFO - __main__ - Step 37423: {'lr': 0.0004325977684955956, 'samples': 7185216, 'steps': 37422, 'loss/train': 1.33500075340271} -08/30/2021 19:57:29 - INFO - __main__ - Step 37424: {'lr': 0.0004325941437931469, 'samples': 7185408, 'steps': 37423, 'loss/train': 1.562026023864746} -08/30/2021 19:57:30 - INFO - __main__ - Step 37425: {'lr': 0.0004325905190084241, 'samples': 7185600, 'steps': 37424, 'loss/train': 1.6564122438430786} -08/30/2021 19:57:31 - INFO - __main__ - Step 37426: {'lr': 0.00043258689414142875, 'samples': 7185792, 'steps': 37425, 'loss/train': 1.2570436000823975} -08/30/2021 19:57:31 - INFO - __main__ - Step 37427: {'lr': 0.0004325832691921626, 'samples': 7185984, 'steps': 37426, 'loss/train': 1.313199520111084} -08/30/2021 19:57:31 - INFO - __main__ - Step 37428: {'lr': 0.00043257964416062723, 'samples': 7186176, 'steps': 37427, 'loss/train': 1.1498758792877197} -08/30/2021 19:57:32 - INFO - __main__ - Step 37429: {'lr': 0.0004325760190468243, 'samples': 7186368, 'steps': 37428, 'loss/train': 1.528903603553772} -08/30/2021 19:57:33 - INFO - __main__ - Step 37430: {'lr': 0.0004325723938507555, 'samples': 7186560, 'steps': 37429, 'loss/train': 1.7303169965744019} -08/30/2021 19:57:34 - INFO - __main__ - Step 37431: {'lr': 0.0004325687685724223, 'samples': 7186752, 'steps': 37430, 'loss/train': 1.217275857925415} -08/30/2021 19:57:34 - INFO - __main__ - Step 37432: {'lr': 0.0004325651432118265, 'samples': 7186944, 'steps': 37431, 'loss/train': 1.6117987632751465} -08/30/2021 19:57:34 - INFO - __main__ - Step 37433: {'lr': 0.00043256151776896955, 'samples': 7187136, 'steps': 37432, 'loss/train': 0.9703555703163147} -08/30/2021 19:57:35 - INFO - __main__ - Step 37434: {'lr': 0.0004325578922438533, 'samples': 7187328, 'steps': 37433, 'loss/train': 1.4213981628417969} -08/30/2021 19:57:37 - INFO - __main__ - Step 37435: {'lr': 0.0004325542666364793, 'samples': 7187520, 'steps': 37434, 'loss/train': 1.5709381103515625} -08/30/2021 19:57:37 - INFO - __main__ - Step 37436: {'lr': 0.00043255064094684917, 'samples': 7187712, 'steps': 37435, 'loss/train': 1.619301199913025} -08/30/2021 19:57:38 - INFO - __main__ - Step 37437: {'lr': 0.0004325470151749644, 'samples': 7187904, 'steps': 37436, 'loss/train': 1.691413402557373} -08/30/2021 19:57:38 - INFO - __main__ - Step 37438: {'lr': 0.00043254338932082696, 'samples': 7188096, 'steps': 37437, 'loss/train': 1.849639892578125} -08/30/2021 19:57:38 - INFO - __main__ - Step 37439: {'lr': 0.00043253976338443814, 'samples': 7188288, 'steps': 37438, 'loss/train': 1.6818939447402954} -08/30/2021 19:57:40 - INFO - __main__ - Step 37440: {'lr': 0.00043253613736579975, 'samples': 7188480, 'steps': 37439, 'loss/train': 1.8714663982391357} -08/30/2021 19:57:40 - INFO - __main__ - Step 37441: {'lr': 0.0004325325112649134, 'samples': 7188672, 'steps': 37440, 'loss/train': 0.05223394185304642} -08/30/2021 19:57:41 - INFO - __main__ - Step 37442: {'lr': 0.00043252888508178066, 'samples': 7188864, 'steps': 37441, 'loss/train': 1.535318374633789} -08/30/2021 19:57:41 - INFO - __main__ - Step 37443: {'lr': 0.0004325252588164033, 'samples': 7189056, 'steps': 37442, 'loss/train': 1.324577808380127} -08/30/2021 19:57:41 - INFO - __main__ - Step 37444: {'lr': 0.00043252163246878286, 'samples': 7189248, 'steps': 37443, 'loss/train': 1.3996564149856567} -08/30/2021 19:57:43 - INFO - __main__ - Step 37445: {'lr': 0.000432518006038921, 'samples': 7189440, 'steps': 37444, 'loss/train': 1.14308762550354} -08/30/2021 19:57:43 - INFO - __main__ - Step 37446: {'lr': 0.00043251437952681926, 'samples': 7189632, 'steps': 37445, 'loss/train': 0.6676692366600037} -08/30/2021 19:57:44 - INFO - __main__ - Step 37447: {'lr': 0.0004325107529324795, 'samples': 7189824, 'steps': 37446, 'loss/train': 1.4937154054641724} -08/30/2021 19:57:44 - INFO - __main__ - Step 37448: {'lr': 0.0004325071262559031, 'samples': 7190016, 'steps': 37447, 'loss/train': 1.6540510654449463} -08/30/2021 19:57:44 - INFO - __main__ - Step 37449: {'lr': 0.00043250349949709184, 'samples': 7190208, 'steps': 37448, 'loss/train': 1.3088397979736328} -08/30/2021 19:57:45 - INFO - __main__ - Step 37450: {'lr': 0.0004324998726560473, 'samples': 7190400, 'steps': 37449, 'loss/train': 0.5380183458328247} -08/30/2021 19:57:46 - INFO - __main__ - Step 37451: {'lr': 0.0004324962457327712, 'samples': 7190592, 'steps': 37450, 'loss/train': 1.4496593475341797} -08/30/2021 19:57:47 - INFO - __main__ - Step 37452: {'lr': 0.00043249261872726504, 'samples': 7190784, 'steps': 37451, 'loss/train': 1.0326513051986694} -08/30/2021 19:57:47 - INFO - __main__ - Step 37453: {'lr': 0.0004324889916395305, 'samples': 7190976, 'steps': 37452, 'loss/train': 2.254138946533203} -08/30/2021 19:57:47 - INFO - __main__ - Step 37454: {'lr': 0.0004324853644695693, 'samples': 7191168, 'steps': 37453, 'loss/train': 1.4218182563781738} -08/30/2021 19:57:48 - INFO - __main__ - Step 37455: {'lr': 0.000432481737217383, 'samples': 7191360, 'steps': 37454, 'loss/train': 1.4825137853622437} -08/30/2021 19:57:49 - INFO - __main__ - Step 37456: {'lr': 0.0004324781098829732, 'samples': 7191552, 'steps': 37455, 'loss/train': 0.029197394847869873} -08/30/2021 19:57:50 - INFO - __main__ - Step 37457: {'lr': 0.0004324744824663417, 'samples': 7191744, 'steps': 37456, 'loss/train': 1.437658429145813} -08/30/2021 19:57:50 - INFO - __main__ - Step 37458: {'lr': 0.00043247085496748983, 'samples': 7191936, 'steps': 37457, 'loss/train': 0.9503560662269592} -08/30/2021 19:57:50 - INFO - __main__ - Step 37459: {'lr': 0.0004324672273864195, 'samples': 7192128, 'steps': 37458, 'loss/train': 1.532064437866211} -08/30/2021 19:57:51 - INFO - __main__ - Step 37460: {'lr': 0.00043246359972313233, 'samples': 7192320, 'steps': 37459, 'loss/train': 1.625966191291809} -08/30/2021 19:57:52 - INFO - __main__ - Step 37461: {'lr': 0.0004324599719776298, 'samples': 7192512, 'steps': 37460, 'loss/train': 1.7297823429107666} -08/30/2021 19:57:53 - INFO - __main__ - Step 37462: {'lr': 0.00043245634414991365, 'samples': 7192704, 'steps': 37461, 'loss/train': 1.6629902124404907} -08/30/2021 19:57:53 - INFO - __main__ - Step 37463: {'lr': 0.0004324527162399854, 'samples': 7192896, 'steps': 37462, 'loss/train': 1.5064109563827515} -08/30/2021 19:57:53 - INFO - __main__ - Step 37464: {'lr': 0.0004324490882478469, 'samples': 7193088, 'steps': 37463, 'loss/train': 1.5163710117340088} -08/30/2021 19:57:54 - INFO - __main__ - Step 37465: {'lr': 0.0004324454601734995, 'samples': 7193280, 'steps': 37464, 'loss/train': 0.9994857907295227} -08/30/2021 19:57:55 - INFO - __main__ - Step 37466: {'lr': 0.0004324418320169451, 'samples': 7193472, 'steps': 37465, 'loss/train': 1.6675835847854614} -08/30/2021 19:57:56 - INFO - __main__ - Step 37467: {'lr': 0.00043243820377818524, 'samples': 7193664, 'steps': 37466, 'loss/train': 1.3926085233688354} -08/30/2021 19:57:56 - INFO - __main__ - Step 37468: {'lr': 0.0004324345754572215, 'samples': 7193856, 'steps': 37467, 'loss/train': 1.9959787130355835} -08/30/2021 19:57:56 - INFO - __main__ - Step 37469: {'lr': 0.00043243094705405554, 'samples': 7194048, 'steps': 37468, 'loss/train': 0.8023901581764221} -08/30/2021 19:57:57 - INFO - __main__ - Step 37470: {'lr': 0.0004324273185686891, 'samples': 7194240, 'steps': 37469, 'loss/train': 1.7683916091918945} -08/30/2021 19:57:58 - INFO - __main__ - Step 37471: {'lr': 0.00043242369000112365, 'samples': 7194432, 'steps': 37470, 'loss/train': 1.9535781145095825} -08/30/2021 19:57:59 - INFO - __main__ - Step 37472: {'lr': 0.00043242006135136093, 'samples': 7194624, 'steps': 37471, 'loss/train': 1.5709192752838135} -08/30/2021 19:57:59 - INFO - __main__ - Step 37473: {'lr': 0.00043241643261940246, 'samples': 7194816, 'steps': 37472, 'loss/train': 1.2576907873153687} -08/30/2021 19:58:00 - INFO - __main__ - Step 37474: {'lr': 0.00043241280380525003, 'samples': 7195008, 'steps': 37473, 'loss/train': 1.5616741180419922} -08/30/2021 19:58:00 - INFO - __main__ - Step 37475: {'lr': 0.0004324091749089052, 'samples': 7195200, 'steps': 37474, 'loss/train': 1.4544329643249512} -08/30/2021 19:58:00 - INFO - __main__ - Step 37476: {'lr': 0.0004324055459303696, 'samples': 7195392, 'steps': 37475, 'loss/train': 2.2143774032592773} -08/30/2021 19:58:02 - INFO - __main__ - Step 37477: {'lr': 0.00043240191686964494, 'samples': 7195584, 'steps': 37476, 'loss/train': 1.9346952438354492} -08/30/2021 19:58:02 - INFO - __main__ - Step 37478: {'lr': 0.00043239828772673276, 'samples': 7195776, 'steps': 37477, 'loss/train': 1.6234220266342163} -08/30/2021 19:58:03 - INFO - __main__ - Step 37479: {'lr': 0.0004323946585016347, 'samples': 7195968, 'steps': 37478, 'loss/train': 1.0614049434661865} -08/30/2021 19:58:03 - INFO - __main__ - Step 37480: {'lr': 0.00043239102919435235, 'samples': 7196160, 'steps': 37479, 'loss/train': 1.4087451696395874} -08/30/2021 19:58:03 - INFO - __main__ - Step 37481: {'lr': 0.0004323873998048875, 'samples': 7196352, 'steps': 37480, 'loss/train': 1.5892679691314697} -08/30/2021 19:58:05 - INFO - __main__ - Step 37482: {'lr': 0.00043238377033324175, 'samples': 7196544, 'steps': 37481, 'loss/train': 2.275916337966919} -08/30/2021 19:58:06 - INFO - __main__ - Step 37483: {'lr': 0.00043238014077941656, 'samples': 7196736, 'steps': 37482, 'loss/train': 1.1161500215530396} -08/30/2021 19:58:06 - INFO - __main__ - Step 37484: {'lr': 0.00043237651114341383, 'samples': 7196928, 'steps': 37483, 'loss/train': 1.7871931791305542} -08/30/2021 19:58:07 - INFO - __main__ - Step 37485: {'lr': 0.00043237288142523503, 'samples': 7197120, 'steps': 37484, 'loss/train': 1.4332817792892456} -08/30/2021 19:58:07 - INFO - __main__ - Step 37486: {'lr': 0.00043236925162488173, 'samples': 7197312, 'steps': 37485, 'loss/train': 1.6623674631118774} -08/30/2021 19:58:07 - INFO - __main__ - Step 37487: {'lr': 0.0004323656217423557, 'samples': 7197504, 'steps': 37486, 'loss/train': 1.1692649126052856} -08/30/2021 19:58:09 - INFO - __main__ - Step 37488: {'lr': 0.00043236199177765856, 'samples': 7197696, 'steps': 37487, 'loss/train': 1.9744224548339844} -08/30/2021 19:58:10 - INFO - __main__ - Step 37489: {'lr': 0.0004323583617307919, 'samples': 7197888, 'steps': 37488, 'loss/train': 1.7935391664505005} -08/30/2021 19:58:10 - INFO - __main__ - Step 37490: {'lr': 0.00043235473160175745, 'samples': 7198080, 'steps': 37489, 'loss/train': 1.656412124633789} -08/30/2021 19:58:10 - INFO - __main__ - Step 37491: {'lr': 0.0004323511013905567, 'samples': 7198272, 'steps': 37490, 'loss/train': 1.7821305990219116} -08/30/2021 19:58:11 - INFO - __main__ - Step 37492: {'lr': 0.0004323474710971913, 'samples': 7198464, 'steps': 37491, 'loss/train': 0.2615404725074768} -08/30/2021 19:58:12 - INFO - __main__ - Step 37493: {'lr': 0.0004323438407216631, 'samples': 7198656, 'steps': 37492, 'loss/train': 1.3712270259857178} -08/30/2021 19:58:13 - INFO - __main__ - Step 37494: {'lr': 0.0004323402102639734, 'samples': 7198848, 'steps': 37493, 'loss/train': 1.5318272113800049} -08/30/2021 19:58:13 - INFO - __main__ - Step 37495: {'lr': 0.00043233657972412414, 'samples': 7199040, 'steps': 37494, 'loss/train': 1.8162832260131836} -08/30/2021 19:58:13 - INFO - __main__ - Step 37496: {'lr': 0.00043233294910211684, 'samples': 7199232, 'steps': 37495, 'loss/train': 0.6068657636642456} -08/30/2021 19:58:14 - INFO - __main__ - Step 37497: {'lr': 0.0004323293183979531, 'samples': 7199424, 'steps': 37496, 'loss/train': 1.4310290813446045} -08/30/2021 19:58:15 - INFO - __main__ - Step 37498: {'lr': 0.0004323256876116345, 'samples': 7199616, 'steps': 37497, 'loss/train': 1.5072999000549316} -08/30/2021 19:58:16 - INFO - __main__ - Step 37499: {'lr': 0.0004323220567431628, 'samples': 7199808, 'steps': 37498, 'loss/train': 1.1527888774871826} -08/30/2021 19:58:16 - INFO - __main__ - Step 37500: {'lr': 0.0004323184257925397, 'samples': 7200000, 'steps': 37499, 'loss/train': 1.0558773279190063} -08/30/2021 19:58:16 - INFO - __main__ - Step 37501: {'lr': 0.0004323147947597667, 'samples': 7200192, 'steps': 37500, 'loss/train': 1.4937289953231812} -08/30/2021 19:58:17 - INFO - __main__ - Step 37502: {'lr': 0.00043231116364484534, 'samples': 7200384, 'steps': 37501, 'loss/train': 1.1834146976470947} -08/30/2021 19:58:18 - INFO - __main__ - Step 37503: {'lr': 0.00043230753244777743, 'samples': 7200576, 'steps': 37502, 'loss/train': 1.7812247276306152} -08/30/2021 19:58:19 - INFO - __main__ - Step 37504: {'lr': 0.00043230390116856467, 'samples': 7200768, 'steps': 37503, 'loss/train': 0.9910949468612671} -08/30/2021 19:58:19 - INFO - __main__ - Step 37505: {'lr': 0.00043230026980720847, 'samples': 7200960, 'steps': 37504, 'loss/train': 0.27721384167671204} -08/30/2021 19:58:19 - INFO - __main__ - Step 37506: {'lr': 0.00043229663836371056, 'samples': 7201152, 'steps': 37505, 'loss/train': 1.6516259908676147} -08/30/2021 19:58:20 - INFO - __main__ - Step 37507: {'lr': 0.0004322930068380727, 'samples': 7201344, 'steps': 37506, 'loss/train': 1.2754383087158203} -08/30/2021 19:58:20 - INFO - __main__ - Step 37508: {'lr': 0.00043228937523029636, 'samples': 7201536, 'steps': 37507, 'loss/train': 1.1058402061462402} -08/30/2021 19:58:21 - INFO - __main__ - Step 37509: {'lr': 0.00043228574354038326, 'samples': 7201728, 'steps': 37508, 'loss/train': 1.912397027015686} -08/30/2021 19:58:22 - INFO - __main__ - Step 37510: {'lr': 0.00043228211176833496, 'samples': 7201920, 'steps': 37509, 'loss/train': 1.2819210290908813} -08/30/2021 19:58:22 - INFO - __main__ - Step 37511: {'lr': 0.00043227847991415326, 'samples': 7202112, 'steps': 37510, 'loss/train': 1.7909189462661743} -08/30/2021 19:58:23 - INFO - __main__ - Step 37512: {'lr': 0.00043227484797783965, 'samples': 7202304, 'steps': 37511, 'loss/train': 1.4759891033172607} -08/30/2021 19:58:23 - INFO - __main__ - Step 37513: {'lr': 0.0004322712159593958, 'samples': 7202496, 'steps': 37512, 'loss/train': 1.4428958892822266} -08/30/2021 19:58:25 - INFO - __main__ - Step 37514: {'lr': 0.0004322675838588234, 'samples': 7202688, 'steps': 37513, 'loss/train': 1.2655271291732788} -08/30/2021 19:58:25 - INFO - __main__ - Step 37515: {'lr': 0.0004322639516761239, 'samples': 7202880, 'steps': 37514, 'loss/train': 1.7687451839447021} -08/30/2021 19:58:25 - INFO - __main__ - Step 37516: {'lr': 0.0004322603194112992, 'samples': 7203072, 'steps': 37515, 'loss/train': 1.3810795545578003} -08/30/2021 19:58:26 - INFO - __main__ - Step 37517: {'lr': 0.00043225668706435073, 'samples': 7203264, 'steps': 37516, 'loss/train': 1.9673357009887695} -08/30/2021 19:58:26 - INFO - __main__ - Step 37518: {'lr': 0.0004322530546352803, 'samples': 7203456, 'steps': 37517, 'loss/train': 1.2577698230743408} -08/30/2021 19:58:28 - INFO - __main__ - Step 37519: {'lr': 0.0004322494221240894, 'samples': 7203648, 'steps': 37518, 'loss/train': 1.4642664194107056} -08/30/2021 19:58:28 - INFO - __main__ - Step 37520: {'lr': 0.0004322457895307797, 'samples': 7203840, 'steps': 37519, 'loss/train': 0.9526332020759583} -08/30/2021 19:58:29 - INFO - __main__ - Step 37521: {'lr': 0.00043224215685535287, 'samples': 7204032, 'steps': 37520, 'loss/train': 1.2903285026550293} -08/30/2021 19:58:29 - INFO - __main__ - Step 37522: {'lr': 0.0004322385240978106, 'samples': 7204224, 'steps': 37521, 'loss/train': 1.4051399230957031} -08/30/2021 19:58:29 - INFO - __main__ - Step 37523: {'lr': 0.0004322348912581544, 'samples': 7204416, 'steps': 37522, 'loss/train': 1.049926996231079} -08/30/2021 19:58:31 - INFO - __main__ - Step 37524: {'lr': 0.000432231258336386, 'samples': 7204608, 'steps': 37523, 'loss/train': 1.4273812770843506} -08/30/2021 19:58:31 - INFO - __main__ - Step 37525: {'lr': 0.000432227625332507, 'samples': 7204800, 'steps': 37524, 'loss/train': 0.8716246485710144} -08/30/2021 19:58:32 - INFO - __main__ - Step 37526: {'lr': 0.000432223992246519, 'samples': 7204992, 'steps': 37525, 'loss/train': 1.1482375860214233} -08/30/2021 19:58:32 - INFO - __main__ - Step 37527: {'lr': 0.0004322203590784237, 'samples': 7205184, 'steps': 37526, 'loss/train': 1.5492173433303833} -08/30/2021 19:58:32 - INFO - __main__ - Step 37528: {'lr': 0.0004322167258282228, 'samples': 7205376, 'steps': 37527, 'loss/train': 1.2992923259735107} -08/30/2021 19:58:33 - INFO - __main__ - Step 37529: {'lr': 0.0004322130924959178, 'samples': 7205568, 'steps': 37528, 'loss/train': 1.7902179956436157} -08/30/2021 19:58:34 - INFO - __main__ - Step 37530: {'lr': 0.0004322094590815104, 'samples': 7205760, 'steps': 37529, 'loss/train': 1.3195284605026245} -08/30/2021 19:58:34 - INFO - __main__ - Step 37531: {'lr': 0.00043220582558500223, 'samples': 7205952, 'steps': 37530, 'loss/train': 1.6612164974212646} -08/30/2021 19:58:35 - INFO - __main__ - Step 37532: {'lr': 0.00043220219200639485, 'samples': 7206144, 'steps': 37531, 'loss/train': 1.0602866411209106} -08/30/2021 19:58:35 - INFO - __main__ - Step 37533: {'lr': 0.00043219855834569006, 'samples': 7206336, 'steps': 37532, 'loss/train': 1.4278581142425537} -08/30/2021 19:58:36 - INFO - __main__ - Step 37534: {'lr': 0.00043219492460288937, 'samples': 7206528, 'steps': 37533, 'loss/train': 0.9774312973022461} -08/30/2021 19:58:37 - INFO - __main__ - Step 37535: {'lr': 0.00043219129077799447, 'samples': 7206720, 'steps': 37534, 'loss/train': 1.0480772256851196} -08/30/2021 19:58:37 - INFO - __main__ - Step 37536: {'lr': 0.000432187656871007, 'samples': 7206912, 'steps': 37535, 'loss/train': 1.4655450582504272} -08/30/2021 19:58:38 - INFO - __main__ - Step 37537: {'lr': 0.0004321840228819286, 'samples': 7207104, 'steps': 37536, 'loss/train': 1.4091171026229858} -08/30/2021 19:58:38 - INFO - __main__ - Step 37538: {'lr': 0.0004321803888107608, 'samples': 7207296, 'steps': 37537, 'loss/train': 1.4877434968948364} -08/30/2021 19:58:39 - INFO - __main__ - Step 37539: {'lr': 0.0004321767546575054, 'samples': 7207488, 'steps': 37538, 'loss/train': 1.3915910720825195} -08/30/2021 19:58:40 - INFO - __main__ - Step 37540: {'lr': 0.000432173120422164, 'samples': 7207680, 'steps': 37539, 'loss/train': 1.5611861944198608} -08/30/2021 19:58:40 - INFO - __main__ - Step 37541: {'lr': 0.00043216948610473816, 'samples': 7207872, 'steps': 37540, 'loss/train': 2.035835027694702} -08/30/2021 19:58:41 - INFO - __main__ - Step 37542: {'lr': 0.0004321658517052296, 'samples': 7208064, 'steps': 37541, 'loss/train': 1.3971617221832275} -08/30/2021 19:58:41 - INFO - __main__ - Step 37543: {'lr': 0.00043216221722363983, 'samples': 7208256, 'steps': 37542, 'loss/train': 1.233750343322754} -08/30/2021 19:58:42 - INFO - __main__ - Step 37544: {'lr': 0.00043215858265997065, 'samples': 7208448, 'steps': 37543, 'loss/train': 1.4952385425567627} -08/30/2021 19:58:44 - INFO - __main__ - Step 37545: {'lr': 0.0004321549480142236, 'samples': 7208640, 'steps': 37544, 'loss/train': 0.9079849720001221} -08/30/2021 19:58:44 - INFO - __main__ - Step 37546: {'lr': 0.0004321513132864003, 'samples': 7208832, 'steps': 37545, 'loss/train': 1.5006433725357056} -08/30/2021 19:58:45 - INFO - __main__ - Step 37547: {'lr': 0.0004321476784765025, 'samples': 7209024, 'steps': 37546, 'loss/train': 2.069721221923828} -08/30/2021 19:58:45 - INFO - __main__ - Step 37548: {'lr': 0.00043214404358453174, 'samples': 7209216, 'steps': 37547, 'loss/train': 1.0978617668151855} -08/30/2021 19:58:45 - INFO - __main__ - Step 37549: {'lr': 0.0004321404086104897, 'samples': 7209408, 'steps': 37548, 'loss/train': 1.4166901111602783} -08/30/2021 19:58:46 - INFO - __main__ - Step 37550: {'lr': 0.00043213677355437795, 'samples': 7209600, 'steps': 37549, 'loss/train': 2.1366448402404785} -08/30/2021 19:58:47 - INFO - __main__ - Step 37551: {'lr': 0.0004321331384161983, 'samples': 7209792, 'steps': 37550, 'loss/train': 1.1152297258377075} -08/30/2021 19:58:47 - INFO - __main__ - Step 37552: {'lr': 0.00043212950319595215, 'samples': 7209984, 'steps': 37551, 'loss/train': 1.4170417785644531} -08/30/2021 19:58:48 - INFO - __main__ - Step 37553: {'lr': 0.0004321258678936413, 'samples': 7210176, 'steps': 37552, 'loss/train': 1.6036512851715088} -08/30/2021 19:58:48 - INFO - __main__ - Step 37554: {'lr': 0.00043212223250926727, 'samples': 7210368, 'steps': 37553, 'loss/train': 0.7793318629264832} -08/30/2021 19:58:49 - INFO - __main__ - Step 37555: {'lr': 0.00043211859704283184, 'samples': 7210560, 'steps': 37554, 'loss/train': 0.17542804777622223} -08/30/2021 19:58:50 - INFO - __main__ - Step 37556: {'lr': 0.0004321149614943366, 'samples': 7210752, 'steps': 37555, 'loss/train': 0.9032306671142578} -08/30/2021 19:58:50 - INFO - __main__ - Step 37557: {'lr': 0.0004321113258637832, 'samples': 7210944, 'steps': 37556, 'loss/train': 1.3906383514404297} -08/30/2021 19:58:51 - INFO - __main__ - Step 37558: {'lr': 0.0004321076901511731, 'samples': 7211136, 'steps': 37557, 'loss/train': 1.1014204025268555} -08/30/2021 19:58:51 - INFO - __main__ - Step 37559: {'lr': 0.0004321040543565082, 'samples': 7211328, 'steps': 37558, 'loss/train': 1.4682289361953735} -08/30/2021 19:58:51 - INFO - __main__ - Step 37560: {'lr': 0.00043210041847979003, 'samples': 7211520, 'steps': 37559, 'loss/train': 1.8109159469604492} -08/30/2021 19:58:53 - INFO - __main__ - Step 37561: {'lr': 0.0004320967825210202, 'samples': 7211712, 'steps': 37560, 'loss/train': 1.3364187479019165} -08/30/2021 19:58:53 - INFO - __main__ - Step 37562: {'lr': 0.00043209314648020035, 'samples': 7211904, 'steps': 37561, 'loss/train': 1.6465651988983154} -08/30/2021 19:58:54 - INFO - __main__ - Step 37563: {'lr': 0.0004320895103573321, 'samples': 7212096, 'steps': 37562, 'loss/train': 2.1376163959503174} -08/30/2021 19:58:54 - INFO - __main__ - Step 37564: {'lr': 0.00043208587415241725, 'samples': 7212288, 'steps': 37563, 'loss/train': 1.2642743587493896} -08/30/2021 19:58:54 - INFO - __main__ - Step 37565: {'lr': 0.00043208223786545723, 'samples': 7212480, 'steps': 37564, 'loss/train': 1.5711627006530762} -08/30/2021 19:58:55 - INFO - __main__ - Step 37566: {'lr': 0.0004320786014964538, 'samples': 7212672, 'steps': 37565, 'loss/train': 1.5496430397033691} -08/30/2021 19:58:56 - INFO - __main__ - Step 37567: {'lr': 0.0004320749650454085, 'samples': 7212864, 'steps': 37566, 'loss/train': 1.6033724546432495} -08/30/2021 19:58:57 - INFO - __main__ - Step 37568: {'lr': 0.0004320713285123231, 'samples': 7213056, 'steps': 37567, 'loss/train': 1.73569917678833} -08/30/2021 19:58:57 - INFO - __main__ - Step 37569: {'lr': 0.0004320676918971991, 'samples': 7213248, 'steps': 37568, 'loss/train': 1.4966765642166138} -08/30/2021 19:58:57 - INFO - __main__ - Step 37570: {'lr': 0.00043206405520003824, 'samples': 7213440, 'steps': 37569, 'loss/train': 1.7415043115615845} -08/30/2021 19:58:58 - INFO - __main__ - Step 37571: {'lr': 0.00043206041842084214, 'samples': 7213632, 'steps': 37570, 'loss/train': 1.3438230752944946} -08/30/2021 19:58:59 - INFO - __main__ - Step 37572: {'lr': 0.00043205678155961244, 'samples': 7213824, 'steps': 37571, 'loss/train': 1.7384071350097656} -08/30/2021 19:59:00 - INFO - __main__ - Step 37573: {'lr': 0.0004320531446163507, 'samples': 7214016, 'steps': 37572, 'loss/train': 1.6909834146499634} -08/30/2021 19:59:00 - INFO - __main__ - Step 37574: {'lr': 0.00043204950759105865, 'samples': 7214208, 'steps': 37573, 'loss/train': 1.6572736501693726} -08/30/2021 19:59:00 - INFO - __main__ - Step 37575: {'lr': 0.0004320458704837379, 'samples': 7214400, 'steps': 37574, 'loss/train': 1.727827548980713} -08/30/2021 19:59:01 - INFO - __main__ - Step 37576: {'lr': 0.00043204223329439015, 'samples': 7214592, 'steps': 37575, 'loss/train': 1.2690116167068481} -08/30/2021 19:59:02 - INFO - __main__ - Step 37577: {'lr': 0.00043203859602301695, 'samples': 7214784, 'steps': 37576, 'loss/train': 1.1359823942184448} -08/30/2021 19:59:03 - INFO - __main__ - Step 37578: {'lr': 0.00043203495866961996, 'samples': 7214976, 'steps': 37577, 'loss/train': 1.6740102767944336} -08/30/2021 19:59:03 - INFO - __main__ - Step 37579: {'lr': 0.00043203132123420074, 'samples': 7215168, 'steps': 37578, 'loss/train': 1.6285802125930786} -08/30/2021 19:59:03 - INFO - __main__ - Step 37580: {'lr': 0.00043202768371676113, 'samples': 7215360, 'steps': 37579, 'loss/train': 1.6305042505264282} -08/30/2021 19:59:04 - INFO - __main__ - Step 37581: {'lr': 0.0004320240461173026, 'samples': 7215552, 'steps': 37580, 'loss/train': 1.7473945617675781} -08/30/2021 19:59:05 - INFO - __main__ - Step 37582: {'lr': 0.00043202040843582685, 'samples': 7215744, 'steps': 37581, 'loss/train': 1.7889299392700195} -08/30/2021 19:59:06 - INFO - __main__ - Step 37583: {'lr': 0.00043201677067233554, 'samples': 7215936, 'steps': 37582, 'loss/train': 1.1004011631011963} -08/30/2021 19:59:06 - INFO - __main__ - Step 37584: {'lr': 0.00043201313282683024, 'samples': 7216128, 'steps': 37583, 'loss/train': 1.7682527303695679} -08/30/2021 19:59:06 - INFO - __main__ - Step 37585: {'lr': 0.0004320094948993127, 'samples': 7216320, 'steps': 37584, 'loss/train': 1.712681770324707} -08/30/2021 19:59:07 - INFO - __main__ - Step 37586: {'lr': 0.00043200585688978445, 'samples': 7216512, 'steps': 37585, 'loss/train': 1.4677200317382812} -08/30/2021 19:59:08 - INFO - __main__ - Step 37587: {'lr': 0.00043200221879824706, 'samples': 7216704, 'steps': 37586, 'loss/train': 1.5668485164642334} -08/30/2021 19:59:09 - INFO - __main__ - Step 37588: {'lr': 0.0004319985806247024, 'samples': 7216896, 'steps': 37587, 'loss/train': 1.33074152469635} -08/30/2021 19:59:09 - INFO - __main__ - Step 37589: {'lr': 0.00043199494236915206, 'samples': 7217088, 'steps': 37588, 'loss/train': 1.2112542390823364} -08/30/2021 19:59:09 - INFO - __main__ - Step 37590: {'lr': 0.0004319913040315975, 'samples': 7217280, 'steps': 37589, 'loss/train': 1.16719388961792} -08/30/2021 19:59:10 - INFO - __main__ - Step 37591: {'lr': 0.00043198766561204047, 'samples': 7217472, 'steps': 37590, 'loss/train': 1.869739294052124} -08/30/2021 19:59:10 - INFO - __main__ - Step 37592: {'lr': 0.0004319840271104826, 'samples': 7217664, 'steps': 37591, 'loss/train': 0.04509987309575081} -08/30/2021 19:59:12 - INFO - __main__ - Step 37593: {'lr': 0.0004319803885269256, 'samples': 7217856, 'steps': 37592, 'loss/train': 1.1683651208877563} -08/30/2021 19:59:12 - INFO - __main__ - Step 37594: {'lr': 0.0004319767498613709, 'samples': 7218048, 'steps': 37593, 'loss/train': 1.0008716583251953} -08/30/2021 19:59:13 - INFO - __main__ - Step 37595: {'lr': 0.00043197311111382045, 'samples': 7218240, 'steps': 37594, 'loss/train': 1.6956290006637573} -08/30/2021 19:59:13 - INFO - __main__ - Step 37596: {'lr': 0.00043196947228427564, 'samples': 7218432, 'steps': 37595, 'loss/train': 1.082789421081543} -08/30/2021 19:59:14 - INFO - __main__ - Step 37597: {'lr': 0.0004319658333727382, 'samples': 7218624, 'steps': 37596, 'loss/train': 1.2129055261611938} -08/30/2021 19:59:15 - INFO - __main__ - Step 37598: {'lr': 0.0004319621943792098, 'samples': 7218816, 'steps': 37597, 'loss/train': 0.16011081635951996} -08/30/2021 19:59:15 - INFO - __main__ - Step 37599: {'lr': 0.000431958555303692, 'samples': 7219008, 'steps': 37598, 'loss/train': 2.258772134780884} -08/30/2021 19:59:16 - INFO - __main__ - Step 37600: {'lr': 0.00043195491614618655, 'samples': 7219200, 'steps': 37599, 'loss/train': 1.2972426414489746} -08/30/2021 19:59:16 - INFO - __main__ - Step 37601: {'lr': 0.00043195127690669486, 'samples': 7219392, 'steps': 37600, 'loss/train': 0.4891473948955536} -08/30/2021 19:59:16 - INFO - __main__ - Step 37602: {'lr': 0.00043194763758521896, 'samples': 7219584, 'steps': 37601, 'loss/train': 1.3949825763702393} -08/30/2021 19:59:18 - INFO - __main__ - Step 37603: {'lr': 0.00043194399818176013, 'samples': 7219776, 'steps': 37602, 'loss/train': 1.4770081043243408} -08/30/2021 19:59:19 - INFO - __main__ - Step 37604: {'lr': 0.00043194035869632017, 'samples': 7219968, 'steps': 37603, 'loss/train': 0.296678364276886} -08/30/2021 19:59:19 - INFO - __main__ - Step 37605: {'lr': 0.00043193671912890064, 'samples': 7220160, 'steps': 37604, 'loss/train': 1.6438281536102295} -08/30/2021 19:59:19 - INFO - __main__ - Step 37606: {'lr': 0.0004319330794795033, 'samples': 7220352, 'steps': 37605, 'loss/train': 0.17355850338935852} -08/30/2021 19:59:20 - INFO - __main__ - Step 37607: {'lr': 0.0004319294397481297, 'samples': 7220544, 'steps': 37606, 'loss/train': 0.6790974736213684} -08/30/2021 19:59:21 - INFO - __main__ - Step 37608: {'lr': 0.0004319257999347815, 'samples': 7220736, 'steps': 37607, 'loss/train': 0.651013970375061} -08/30/2021 19:59:22 - INFO - __main__ - Step 37609: {'lr': 0.0004319221600394603, 'samples': 7220928, 'steps': 37608, 'loss/train': 1.365445613861084} -08/30/2021 19:59:22 - INFO - __main__ - Step 37610: {'lr': 0.0004319185200621678, 'samples': 7221120, 'steps': 37609, 'loss/train': 0.05014752224087715} -08/30/2021 19:59:23 - INFO - __main__ - Step 37611: {'lr': 0.0004319148800029057, 'samples': 7221312, 'steps': 37610, 'loss/train': 1.3334579467773438} -08/30/2021 19:59:23 - INFO - __main__ - Step 37612: {'lr': 0.0004319112398616755, 'samples': 7221504, 'steps': 37611, 'loss/train': 1.457069754600525} -08/30/2021 19:59:24 - INFO - __main__ - Step 37613: {'lr': 0.00043190759963847894, 'samples': 7221696, 'steps': 37612, 'loss/train': 1.3781859874725342} -08/30/2021 19:59:25 - INFO - __main__ - Step 37614: {'lr': 0.00043190395933331757, 'samples': 7221888, 'steps': 37613, 'loss/train': 1.5307385921478271} -08/30/2021 19:59:25 - INFO - __main__ - Step 37615: {'lr': 0.00043190031894619306, 'samples': 7222080, 'steps': 37614, 'loss/train': 1.5736502408981323} -08/30/2021 19:59:26 - INFO - __main__ - Step 37616: {'lr': 0.0004318966784771071, 'samples': 7222272, 'steps': 37615, 'loss/train': 1.6792057752609253} -08/30/2021 19:59:26 - INFO - __main__ - Step 37617: {'lr': 0.00043189303792606136, 'samples': 7222464, 'steps': 37616, 'loss/train': 1.4793416261672974} -08/30/2021 19:59:26 - INFO - __main__ - Step 37618: {'lr': 0.0004318893972930574, 'samples': 7222656, 'steps': 37617, 'loss/train': 1.5910242795944214} -08/30/2021 19:59:28 - INFO - __main__ - Step 37619: {'lr': 0.00043188575657809685, 'samples': 7222848, 'steps': 37618, 'loss/train': 1.156327486038208} -08/30/2021 19:59:29 - INFO - __main__ - Step 37620: {'lr': 0.00043188211578118143, 'samples': 7223040, 'steps': 37619, 'loss/train': 1.646649956703186} -08/30/2021 19:59:29 - INFO - __main__ - Step 37621: {'lr': 0.0004318784749023127, 'samples': 7223232, 'steps': 37620, 'loss/train': 1.2390806674957275} -08/30/2021 19:59:29 - INFO - __main__ - Step 37622: {'lr': 0.0004318748339414923, 'samples': 7223424, 'steps': 37621, 'loss/train': 2.3212947845458984} -08/30/2021 19:59:30 - INFO - __main__ - Step 37623: {'lr': 0.000431871192898722, 'samples': 7223616, 'steps': 37622, 'loss/train': 1.117757797241211} -08/30/2021 19:59:31 - INFO - __main__ - Step 37624: {'lr': 0.0004318675517740033, 'samples': 7223808, 'steps': 37623, 'loss/train': 1.309813380241394} -08/30/2021 19:59:32 - INFO - __main__ - Step 37625: {'lr': 0.0004318639105673379, 'samples': 7224000, 'steps': 37624, 'loss/train': 1.8009846210479736} -08/30/2021 19:59:32 - INFO - __main__ - Step 37626: {'lr': 0.00043186026927872736, 'samples': 7224192, 'steps': 37625, 'loss/train': 0.9139742255210876} -08/30/2021 19:59:32 - INFO - __main__ - Step 37627: {'lr': 0.0004318566279081735, 'samples': 7224384, 'steps': 37626, 'loss/train': 1.024888277053833} -08/30/2021 19:59:33 - INFO - __main__ - Step 37628: {'lr': 0.0004318529864556777, 'samples': 7224576, 'steps': 37627, 'loss/train': 0.9063631892204285} -08/30/2021 19:59:34 - INFO - __main__ - Step 37629: {'lr': 0.0004318493449212419, 'samples': 7224768, 'steps': 37628, 'loss/train': 1.1232155561447144} -08/30/2021 19:59:35 - INFO - __main__ - Step 37630: {'lr': 0.00043184570330486756, 'samples': 7224960, 'steps': 37629, 'loss/train': 1.5673871040344238} -08/30/2021 19:59:35 - INFO - __main__ - Step 37631: {'lr': 0.0004318420616065563, 'samples': 7225152, 'steps': 37630, 'loss/train': 1.8563885688781738} -08/30/2021 19:59:35 - INFO - __main__ - Step 37632: {'lr': 0.0004318384198263099, 'samples': 7225344, 'steps': 37631, 'loss/train': 1.389448642730713} -08/30/2021 19:59:36 - INFO - __main__ - Step 37633: {'lr': 0.0004318347779641298, 'samples': 7225536, 'steps': 37632, 'loss/train': 0.9539344906806946} -08/30/2021 19:59:36 - INFO - __main__ - Step 37634: {'lr': 0.00043183113602001777, 'samples': 7225728, 'steps': 37633, 'loss/train': 0.7564384937286377} -08/30/2021 19:59:38 - INFO - __main__ - Step 37635: {'lr': 0.0004318274939939755, 'samples': 7225920, 'steps': 37634, 'loss/train': 1.7145167589187622} -08/30/2021 19:59:38 - INFO - __main__ - Step 37636: {'lr': 0.00043182385188600457, 'samples': 7226112, 'steps': 37635, 'loss/train': 0.7960317730903625} -08/30/2021 19:59:38 - INFO - __main__ - Step 37637: {'lr': 0.0004318202096961066, 'samples': 7226304, 'steps': 37636, 'loss/train': 1.4038528203964233} -08/30/2021 19:59:39 - INFO - __main__ - Step 37638: {'lr': 0.0004318165674242832, 'samples': 7226496, 'steps': 37637, 'loss/train': 1.1525098085403442} -08/30/2021 19:59:39 - INFO - __main__ - Step 37639: {'lr': 0.0004318129250705361, 'samples': 7226688, 'steps': 37638, 'loss/train': 1.8547435998916626} -08/30/2021 19:59:41 - INFO - __main__ - Step 37640: {'lr': 0.0004318092826348669, 'samples': 7226880, 'steps': 37639, 'loss/train': 1.3831381797790527} -08/30/2021 19:59:41 - INFO - __main__ - Step 37641: {'lr': 0.0004318056401172772, 'samples': 7227072, 'steps': 37640, 'loss/train': 1.096973180770874} -08/30/2021 19:59:42 - INFO - __main__ - Step 37642: {'lr': 0.0004318019975177688, 'samples': 7227264, 'steps': 37641, 'loss/train': 1.2614604234695435} -08/30/2021 19:59:42 - INFO - __main__ - Step 37643: {'lr': 0.0004317983548363431, 'samples': 7227456, 'steps': 37642, 'loss/train': 1.274519920349121} -08/30/2021 19:59:42 - INFO - __main__ - Step 37644: {'lr': 0.0004317947120730019, 'samples': 7227648, 'steps': 37643, 'loss/train': 1.0516068935394287} -08/30/2021 19:59:44 - INFO - __main__ - Step 37645: {'lr': 0.0004317910692277469, 'samples': 7227840, 'steps': 37644, 'loss/train': 1.3844913244247437} -08/30/2021 19:59:44 - INFO - __main__ - Step 37646: {'lr': 0.0004317874263005795, 'samples': 7228032, 'steps': 37645, 'loss/train': 0.9391219615936279} -08/30/2021 19:59:45 - INFO - __main__ - Step 37647: {'lr': 0.0004317837832915016, 'samples': 7228224, 'steps': 37646, 'loss/train': 1.628291368484497} -08/30/2021 19:59:45 - INFO - __main__ - Step 37648: {'lr': 0.0004317801402005147, 'samples': 7228416, 'steps': 37647, 'loss/train': 1.0557103157043457} -08/30/2021 19:59:45 - INFO - __main__ - Step 37649: {'lr': 0.00043177649702762043, 'samples': 7228608, 'steps': 37648, 'loss/train': 1.723480224609375} -08/30/2021 19:59:46 - INFO - __main__ - Step 37650: {'lr': 0.0004317728537728206, 'samples': 7228800, 'steps': 37649, 'loss/train': 1.3076304197311401} -08/30/2021 19:59:48 - INFO - __main__ - Step 37651: {'lr': 0.0004317692104361166, 'samples': 7228992, 'steps': 37650, 'loss/train': 1.1958271265029907} -08/30/2021 19:59:48 - INFO - __main__ - Step 37652: {'lr': 0.0004317655670175102, 'samples': 7229184, 'steps': 37651, 'loss/train': 1.4377630949020386} -08/30/2021 19:59:49 - INFO - __main__ - Step 37653: {'lr': 0.0004317619235170032, 'samples': 7229376, 'steps': 37652, 'loss/train': 0.5691970586776733} -08/30/2021 19:59:49 - INFO - __main__ - Step 37654: {'lr': 0.00043175827993459696, 'samples': 7229568, 'steps': 37653, 'loss/train': 0.05685167387127876} -08/30/2021 19:59:49 - INFO - __main__ - Step 37655: {'lr': 0.0004317546362702932, 'samples': 7229760, 'steps': 37654, 'loss/train': 1.6861059665679932} -08/30/2021 19:59:51 - INFO - __main__ - Step 37656: {'lr': 0.0004317509925240937, 'samples': 7229952, 'steps': 37655, 'loss/train': 1.8072127103805542} -08/30/2021 19:59:52 - INFO - __main__ - Step 37657: {'lr': 0.00043174734869599993, 'samples': 7230144, 'steps': 37656, 'loss/train': 1.6896204948425293} -08/30/2021 19:59:52 - INFO - __main__ - Step 37658: {'lr': 0.0004317437047860137, 'samples': 7230336, 'steps': 37657, 'loss/train': 1.2762514352798462} -08/30/2021 19:59:53 - INFO - __main__ - Step 37659: {'lr': 0.0004317400607941364, 'samples': 7230528, 'steps': 37658, 'loss/train': 3.2795166969299316} -08/30/2021 19:59:53 - INFO - __main__ - Step 37660: {'lr': 0.00043173641672037, 'samples': 7230720, 'steps': 37659, 'loss/train': 1.296006202697754} -08/30/2021 19:59:53 - INFO - __main__ - Step 37661: {'lr': 0.00043173277256471586, 'samples': 7230912, 'steps': 37660, 'loss/train': 1.295522689819336} -08/30/2021 19:59:55 - INFO - __main__ - Step 37662: {'lr': 0.0004317291283271758, 'samples': 7231104, 'steps': 37661, 'loss/train': 0.0589936301112175} -08/30/2021 19:59:55 - INFO - __main__ - Step 37663: {'lr': 0.0004317254840077514, 'samples': 7231296, 'steps': 37662, 'loss/train': 1.808688759803772} -08/30/2021 19:59:55 - INFO - __main__ - Step 37664: {'lr': 0.0004317218396064443, 'samples': 7231488, 'steps': 37663, 'loss/train': 1.4146373271942139} -08/30/2021 19:59:56 - INFO - __main__ - Step 37665: {'lr': 0.00043171819512325614, 'samples': 7231680, 'steps': 37664, 'loss/train': 1.7586722373962402} -08/30/2021 19:59:56 - INFO - __main__ - Step 37666: {'lr': 0.00043171455055818854, 'samples': 7231872, 'steps': 37665, 'loss/train': 3.4197332859039307} -08/30/2021 19:59:58 - INFO - __main__ - Step 37667: {'lr': 0.0004317109059112432, 'samples': 7232064, 'steps': 37666, 'loss/train': 0.9519919753074646} -08/30/2021 19:59:58 - INFO - __main__ - Step 37668: {'lr': 0.00043170726118242164, 'samples': 7232256, 'steps': 37667, 'loss/train': 1.6871439218521118} -08/30/2021 19:59:58 - INFO - __main__ - Step 37669: {'lr': 0.0004317036163717257, 'samples': 7232448, 'steps': 37668, 'loss/train': 1.7556183338165283} -08/30/2021 19:59:59 - INFO - __main__ - Step 37670: {'lr': 0.0004316999714791569, 'samples': 7232640, 'steps': 37669, 'loss/train': 1.513393759727478} -08/30/2021 19:59:59 - INFO - __main__ - Step 37671: {'lr': 0.0004316963265047169, 'samples': 7232832, 'steps': 37670, 'loss/train': 3.277825117111206} -08/30/2021 20:00:01 - INFO - __main__ - Step 37672: {'lr': 0.00043169268144840726, 'samples': 7233024, 'steps': 37671, 'loss/train': 0.6956737637519836} -08/30/2021 20:00:01 - INFO - __main__ - Step 37673: {'lr': 0.0004316890363102298, 'samples': 7233216, 'steps': 37672, 'loss/train': 1.0515555143356323} -08/30/2021 20:00:01 - INFO - __main__ - Step 37674: {'lr': 0.000431685391090186, 'samples': 7233408, 'steps': 37673, 'loss/train': 0.7952166199684143} -08/30/2021 20:00:02 - INFO - __main__ - Step 37675: {'lr': 0.00043168174578827755, 'samples': 7233600, 'steps': 37674, 'loss/train': 1.5562384128570557} -08/30/2021 20:00:02 - INFO - __main__ - Step 37676: {'lr': 0.00043167810040450617, 'samples': 7233792, 'steps': 37675, 'loss/train': 1.666055679321289} -08/30/2021 20:00:02 - INFO - __main__ - Step 37677: {'lr': 0.00043167445493887347, 'samples': 7233984, 'steps': 37676, 'loss/train': 2.1080710887908936} -08/30/2021 20:00:04 - INFO - __main__ - Step 37678: {'lr': 0.000431670809391381, 'samples': 7234176, 'steps': 37677, 'loss/train': 1.3906583786010742} -08/30/2021 20:00:04 - INFO - __main__ - Step 37679: {'lr': 0.00043166716376203047, 'samples': 7234368, 'steps': 37678, 'loss/train': 1.8267698287963867} -08/30/2021 20:00:05 - INFO - __main__ - Step 37680: {'lr': 0.0004316635180508235, 'samples': 7234560, 'steps': 37679, 'loss/train': 1.3839911222457886} -08/30/2021 20:00:05 - INFO - __main__ - Step 37681: {'lr': 0.0004316598722577618, 'samples': 7234752, 'steps': 37680, 'loss/train': 1.4439574480056763} -08/30/2021 20:00:05 - INFO - __main__ - Step 37682: {'lr': 0.000431656226382847, 'samples': 7234944, 'steps': 37681, 'loss/train': 2.007516622543335} -08/30/2021 20:00:07 - INFO - __main__ - Step 37683: {'lr': 0.00043165258042608055, 'samples': 7235136, 'steps': 37682, 'loss/train': 1.4240386486053467} -08/30/2021 20:00:08 - INFO - __main__ - Step 37684: {'lr': 0.0004316489343874644, 'samples': 7235328, 'steps': 37683, 'loss/train': 3.268465518951416} -08/30/2021 20:00:08 - INFO - __main__ - Step 37685: {'lr': 0.000431645288267, 'samples': 7235520, 'steps': 37684, 'loss/train': 2.1904873847961426} -08/30/2021 20:00:08 - INFO - __main__ - Step 37686: {'lr': 0.00043164164206468904, 'samples': 7235712, 'steps': 37685, 'loss/train': 1.0899049043655396} -08/30/2021 20:00:09 - INFO - __main__ - Step 37687: {'lr': 0.00043163799578053313, 'samples': 7235904, 'steps': 37686, 'loss/train': 1.3167779445648193} -08/30/2021 20:00:10 - INFO - __main__ - Step 37688: {'lr': 0.00043163434941453395, 'samples': 7236096, 'steps': 37687, 'loss/train': 1.7515298128128052} -08/30/2021 20:00:11 - INFO - __main__ - Step 37689: {'lr': 0.00043163070296669317, 'samples': 7236288, 'steps': 37688, 'loss/train': 1.6320736408233643} -08/30/2021 20:00:11 - INFO - __main__ - Step 37690: {'lr': 0.00043162705643701236, 'samples': 7236480, 'steps': 37689, 'loss/train': 1.1585415601730347} -08/30/2021 20:00:11 - INFO - __main__ - Step 37691: {'lr': 0.00043162340982549327, 'samples': 7236672, 'steps': 37690, 'loss/train': 1.2465486526489258} -08/30/2021 20:00:12 - INFO - __main__ - Step 37692: {'lr': 0.00043161976313213735, 'samples': 7236864, 'steps': 37691, 'loss/train': 0.7220036387443542} -08/30/2021 20:00:13 - INFO - __main__ - Step 37693: {'lr': 0.0004316161163569465, 'samples': 7237056, 'steps': 37692, 'loss/train': 1.8642101287841797} -08/30/2021 20:00:14 - INFO - __main__ - Step 37694: {'lr': 0.0004316124694999222, 'samples': 7237248, 'steps': 37693, 'loss/train': 1.3861749172210693} -08/30/2021 20:00:14 - INFO - __main__ - Step 37695: {'lr': 0.000431608822561066, 'samples': 7237440, 'steps': 37694, 'loss/train': 1.209458589553833} -08/30/2021 20:00:14 - INFO - __main__ - Step 37696: {'lr': 0.0004316051755403798, 'samples': 7237632, 'steps': 37695, 'loss/train': 1.4119212627410889} -08/30/2021 20:00:15 - INFO - __main__ - Step 37697: {'lr': 0.000431601528437865, 'samples': 7237824, 'steps': 37696, 'loss/train': 0.8251736760139465} -08/30/2021 20:00:16 - INFO - __main__ - Step 37698: {'lr': 0.00043159788125352353, 'samples': 7238016, 'steps': 37697, 'loss/train': 0.3981972932815552} -08/30/2021 20:00:17 - INFO - __main__ - Step 37699: {'lr': 0.0004315942339873567, 'samples': 7238208, 'steps': 37698, 'loss/train': 1.198006510734558} -08/30/2021 20:00:17 - INFO - __main__ - Step 37700: {'lr': 0.00043159058663936635, 'samples': 7238400, 'steps': 37699, 'loss/train': 1.1396652460098267} -08/30/2021 20:00:17 - INFO - __main__ - Step 37701: {'lr': 0.0004315869392095542, 'samples': 7238592, 'steps': 37700, 'loss/train': 1.6370837688446045} -08/30/2021 20:00:18 - INFO - __main__ - Step 37702: {'lr': 0.0004315832916979216, 'samples': 7238784, 'steps': 37701, 'loss/train': 1.0754244327545166} -08/30/2021 20:00:19 - INFO - __main__ - Step 37703: {'lr': 0.00043157964410447047, 'samples': 7238976, 'steps': 37702, 'loss/train': 1.0226269960403442} -08/30/2021 20:00:20 - INFO - __main__ - Step 37704: {'lr': 0.0004315759964292023, 'samples': 7239168, 'steps': 37703, 'loss/train': 1.6114041805267334} -08/30/2021 20:00:20 - INFO - __main__ - Step 37705: {'lr': 0.0004315723486721188, 'samples': 7239360, 'steps': 37704, 'loss/train': 1.4619520902633667} -08/30/2021 20:00:20 - INFO - __main__ - Step 37706: {'lr': 0.00043156870083322166, 'samples': 7239552, 'steps': 37705, 'loss/train': 1.3416861295700073} -08/30/2021 20:00:21 - INFO - __main__ - Step 37707: {'lr': 0.00043156505291251234, 'samples': 7239744, 'steps': 37706, 'loss/train': 1.5742803812026978} -08/30/2021 20:00:23 - INFO - __main__ - Step 37708: {'lr': 0.00043156140490999275, 'samples': 7239936, 'steps': 37707, 'loss/train': 1.2783983945846558} -08/30/2021 20:00:23 - INFO - __main__ - Step 37709: {'lr': 0.0004315577568256643, 'samples': 7240128, 'steps': 37708, 'loss/train': 1.647295594215393} -08/30/2021 20:00:23 - INFO - __main__ - Step 37710: {'lr': 0.0004315541086595288, 'samples': 7240320, 'steps': 37709, 'loss/train': 0.6494789123535156} -08/30/2021 20:00:24 - INFO - __main__ - Step 37711: {'lr': 0.00043155046041158776, 'samples': 7240512, 'steps': 37710, 'loss/train': 1.8711117506027222} -08/30/2021 20:00:24 - INFO - __main__ - Step 37712: {'lr': 0.0004315468120818429, 'samples': 7240704, 'steps': 37711, 'loss/train': 1.697899341583252} -08/30/2021 20:00:24 - INFO - __main__ - Step 37713: {'lr': 0.0004315431636702959, 'samples': 7240896, 'steps': 37712, 'loss/train': 1.2972338199615479} -08/30/2021 20:00:26 - INFO - __main__ - Step 37714: {'lr': 0.00043153951517694824, 'samples': 7241088, 'steps': 37713, 'loss/train': 1.4324350357055664} -08/30/2021 20:00:26 - INFO - __main__ - Step 37715: {'lr': 0.0004315358666018018, 'samples': 7241280, 'steps': 37714, 'loss/train': 1.8348197937011719} -08/30/2021 20:00:27 - INFO - __main__ - Step 37716: {'lr': 0.00043153221794485795, 'samples': 7241472, 'steps': 37715, 'loss/train': 2.153360605239868} -08/30/2021 20:00:27 - INFO - __main__ - Step 37717: {'lr': 0.0004315285692061186, 'samples': 7241664, 'steps': 37716, 'loss/train': 1.7202860116958618} -08/30/2021 20:00:28 - INFO - __main__ - Step 37718: {'lr': 0.00043152492038558526, 'samples': 7241856, 'steps': 37717, 'loss/train': 1.7653424739837646} -08/30/2021 20:00:29 - INFO - __main__ - Step 37719: {'lr': 0.00043152127148325957, 'samples': 7242048, 'steps': 37718, 'loss/train': 0.4958634078502655} -08/30/2021 20:00:30 - INFO - __main__ - Step 37720: {'lr': 0.00043151762249914324, 'samples': 7242240, 'steps': 37719, 'loss/train': 1.39985191822052} -08/30/2021 20:00:30 - INFO - __main__ - Step 37721: {'lr': 0.00043151397343323784, 'samples': 7242432, 'steps': 37720, 'loss/train': 2.093074083328247} -08/30/2021 20:00:30 - INFO - __main__ - Step 37722: {'lr': 0.00043151032428554505, 'samples': 7242624, 'steps': 37721, 'loss/train': 1.455536127090454} -08/30/2021 20:00:31 - INFO - __main__ - Step 37723: {'lr': 0.0004315066750560665, 'samples': 7242816, 'steps': 37722, 'loss/train': 1.557468295097351} -08/30/2021 20:00:32 - INFO - __main__ - Step 37724: {'lr': 0.0004315030257448038, 'samples': 7243008, 'steps': 37723, 'loss/train': 1.5150514841079712} -08/30/2021 20:00:33 - INFO - __main__ - Step 37725: {'lr': 0.00043149937635175874, 'samples': 7243200, 'steps': 37724, 'loss/train': 1.359570026397705} -08/30/2021 20:00:33 - INFO - __main__ - Step 37726: {'lr': 0.0004314957268769328, 'samples': 7243392, 'steps': 37725, 'loss/train': 1.3170517683029175} -08/30/2021 20:00:33 - INFO - __main__ - Step 37727: {'lr': 0.00043149207732032767, 'samples': 7243584, 'steps': 37726, 'loss/train': 1.7453690767288208} -08/30/2021 20:00:34 - INFO - __main__ - Step 37728: {'lr': 0.00043148842768194503, 'samples': 7243776, 'steps': 37727, 'loss/train': 1.6623790264129639} -08/30/2021 20:00:35 - INFO - __main__ - Step 37729: {'lr': 0.0004314847779617865, 'samples': 7243968, 'steps': 37728, 'loss/train': 0.448483943939209} -08/30/2021 20:00:36 - INFO - __main__ - Step 37730: {'lr': 0.00043148112815985377, 'samples': 7244160, 'steps': 37729, 'loss/train': 1.305484652519226} -08/30/2021 20:00:36 - INFO - __main__ - Step 37731: {'lr': 0.0004314774782761484, 'samples': 7244352, 'steps': 37730, 'loss/train': 0.3110705316066742} -08/30/2021 20:00:36 - INFO - __main__ - Step 37732: {'lr': 0.00043147382831067204, 'samples': 7244544, 'steps': 37731, 'loss/train': 1.6531836986541748} -08/30/2021 20:00:37 - INFO - __main__ - Step 37733: {'lr': 0.0004314701782634264, 'samples': 7244736, 'steps': 37732, 'loss/train': 1.6658873558044434} -08/30/2021 20:00:38 - INFO - __main__ - Step 37734: {'lr': 0.0004314665281344132, 'samples': 7244928, 'steps': 37733, 'loss/train': 1.7653268575668335} -08/30/2021 20:00:39 - INFO - __main__ - Step 37735: {'lr': 0.0004314628779236339, 'samples': 7245120, 'steps': 37734, 'loss/train': 1.4686462879180908} -08/30/2021 20:00:39 - INFO - __main__ - Step 37736: {'lr': 0.00043145922763109017, 'samples': 7245312, 'steps': 37735, 'loss/train': 1.2351796627044678} -08/30/2021 20:00:40 - INFO - __main__ - Step 37737: {'lr': 0.0004314555772567838, 'samples': 7245504, 'steps': 37736, 'loss/train': 0.5019418001174927} -08/30/2021 20:00:40 - INFO - __main__ - Step 37738: {'lr': 0.0004314519268007163, 'samples': 7245696, 'steps': 37737, 'loss/train': 1.318006157875061} -08/30/2021 20:00:41 - INFO - __main__ - Step 37739: {'lr': 0.00043144827626288943, 'samples': 7245888, 'steps': 37738, 'loss/train': 1.523842453956604} -08/30/2021 20:00:42 - INFO - __main__ - Step 37740: {'lr': 0.00043144462564330464, 'samples': 7246080, 'steps': 37739, 'loss/train': 1.5707664489746094} -08/30/2021 20:00:42 - INFO - __main__ - Step 37741: {'lr': 0.0004314409749419638, 'samples': 7246272, 'steps': 37740, 'loss/train': 1.3167386054992676} -08/30/2021 20:00:43 - INFO - __main__ - Step 37742: {'lr': 0.00043143732415886843, 'samples': 7246464, 'steps': 37741, 'loss/train': 1.1945606470108032} -08/30/2021 20:00:43 - INFO - __main__ - Step 37743: {'lr': 0.0004314336732940202, 'samples': 7246656, 'steps': 37742, 'loss/train': 1.58213210105896} -08/30/2021 20:00:43 - INFO - __main__ - Step 37744: {'lr': 0.0004314300223474208, 'samples': 7246848, 'steps': 37743, 'loss/train': 1.0002487897872925} -08/30/2021 20:00:45 - INFO - __main__ - Step 37745: {'lr': 0.0004314263713190718, 'samples': 7247040, 'steps': 37744, 'loss/train': 1.4598662853240967} -08/30/2021 20:00:45 - INFO - __main__ - Step 37746: {'lr': 0.00043142272020897486, 'samples': 7247232, 'steps': 37745, 'loss/train': 1.5184264183044434} -08/30/2021 20:00:46 - INFO - __main__ - Step 37747: {'lr': 0.0004314190690171317, 'samples': 7247424, 'steps': 37746, 'loss/train': 1.203436255455017} -08/30/2021 20:00:46 - INFO - __main__ - Step 37748: {'lr': 0.0004314154177435438, 'samples': 7247616, 'steps': 37747, 'loss/train': 1.6650391817092896} -08/30/2021 20:00:46 - INFO - __main__ - Step 37749: {'lr': 0.000431411766388213, 'samples': 7247808, 'steps': 37748, 'loss/train': 1.3178043365478516} -08/30/2021 20:00:48 - INFO - __main__ - Step 37750: {'lr': 0.0004314081149511409, 'samples': 7248000, 'steps': 37749, 'loss/train': 1.464530348777771} -08/30/2021 20:00:48 - INFO - __main__ - Step 37751: {'lr': 0.00043140446343232895, 'samples': 7248192, 'steps': 37750, 'loss/train': 1.2500584125518799} -08/30/2021 20:00:49 - INFO - __main__ - Step 37752: {'lr': 0.000431400811831779, 'samples': 7248384, 'steps': 37751, 'loss/train': 1.2512109279632568} -08/30/2021 20:00:49 - INFO - __main__ - Step 37753: {'lr': 0.0004313971601494927, 'samples': 7248576, 'steps': 37752, 'loss/train': 1.548935055732727} -08/30/2021 20:00:49 - INFO - __main__ - Step 37754: {'lr': 0.0004313935083854716, 'samples': 7248768, 'steps': 37753, 'loss/train': 1.5450690984725952} -08/30/2021 20:00:51 - INFO - __main__ - Step 37755: {'lr': 0.0004313898565397174, 'samples': 7248960, 'steps': 37754, 'loss/train': 0.1970173716545105} -08/30/2021 20:00:52 - INFO - __main__ - Step 37756: {'lr': 0.00043138620461223175, 'samples': 7249152, 'steps': 37755, 'loss/train': 1.8051140308380127} -08/30/2021 20:00:52 - INFO - __main__ - Step 37757: {'lr': 0.00043138255260301625, 'samples': 7249344, 'steps': 37756, 'loss/train': 1.5002102851867676} -08/30/2021 20:00:52 - INFO - __main__ - Step 37758: {'lr': 0.0004313789005120725, 'samples': 7249536, 'steps': 37757, 'loss/train': 1.4088208675384521} -08/30/2021 20:00:53 - INFO - __main__ - Step 37759: {'lr': 0.00043137524833940233, 'samples': 7249728, 'steps': 37758, 'loss/train': 1.7270442247390747} -08/30/2021 20:00:55 - INFO - __main__ - Step 37760: {'lr': 0.0004313715960850072, 'samples': 7249920, 'steps': 37759, 'loss/train': 2.1317856311798096} -08/30/2021 20:00:55 - INFO - __main__ - Step 37761: {'lr': 0.00043136794374888887, 'samples': 7250112, 'steps': 37760, 'loss/train': 1.4589859247207642} -08/30/2021 20:00:56 - INFO - __main__ - Step 37762: {'lr': 0.0004313642913310489, 'samples': 7250304, 'steps': 37761, 'loss/train': 1.3985317945480347} -08/30/2021 20:00:56 - INFO - __main__ - Step 37763: {'lr': 0.00043136063883148905, 'samples': 7250496, 'steps': 37762, 'loss/train': 1.383558988571167} -08/30/2021 20:00:56 - INFO - __main__ - Step 37764: {'lr': 0.00043135698625021093, 'samples': 7250688, 'steps': 37763, 'loss/train': 1.6549559831619263} -08/30/2021 20:00:58 - INFO - __main__ - Step 37765: {'lr': 0.000431353333587216, 'samples': 7250880, 'steps': 37764, 'loss/train': 1.2775039672851562} -08/30/2021 20:00:58 - INFO - __main__ - Step 37766: {'lr': 0.00043134968084250616, 'samples': 7251072, 'steps': 37765, 'loss/train': 1.4158092737197876} -08/30/2021 20:00:59 - INFO - __main__ - Step 37767: {'lr': 0.00043134602801608293, 'samples': 7251264, 'steps': 37766, 'loss/train': 1.577428936958313} -08/30/2021 20:00:59 - INFO - __main__ - Step 37768: {'lr': 0.00043134237510794794, 'samples': 7251456, 'steps': 37767, 'loss/train': 2.0538487434387207} -08/30/2021 20:00:59 - INFO - __main__ - Step 37769: {'lr': 0.0004313387221181029, 'samples': 7251648, 'steps': 37768, 'loss/train': 1.7513422966003418} -08/30/2021 20:01:01 - INFO - __main__ - Step 37770: {'lr': 0.0004313350690465495, 'samples': 7251840, 'steps': 37769, 'loss/train': 1.4537458419799805} -08/30/2021 20:01:01 - INFO - __main__ - Step 37771: {'lr': 0.00043133141589328923, 'samples': 7252032, 'steps': 37770, 'loss/train': 0.7458590865135193} -08/30/2021 20:01:02 - INFO - __main__ - Step 37772: {'lr': 0.0004313277626583239, 'samples': 7252224, 'steps': 37771, 'loss/train': 1.2735846042633057} -08/30/2021 20:01:02 - INFO - __main__ - Step 37773: {'lr': 0.000431324109341655, 'samples': 7252416, 'steps': 37772, 'loss/train': 0.7350367307662964} -08/30/2021 20:01:02 - INFO - __main__ - Step 37774: {'lr': 0.0004313204559432842, 'samples': 7252608, 'steps': 37773, 'loss/train': 1.2383387088775635} -08/30/2021 20:01:04 - INFO - __main__ - Step 37775: {'lr': 0.0004313168024632133, 'samples': 7252800, 'steps': 37774, 'loss/train': 0.5584983825683594} -08/30/2021 20:01:04 - INFO - __main__ - Step 37776: {'lr': 0.00043131314890144386, 'samples': 7252992, 'steps': 37775, 'loss/train': 1.2908673286437988} -08/30/2021 20:01:05 - INFO - __main__ - Step 37777: {'lr': 0.0004313094952579775, 'samples': 7253184, 'steps': 37776, 'loss/train': 1.3741708993911743} -08/30/2021 20:01:05 - INFO - __main__ - Step 37778: {'lr': 0.0004313058415328158, 'samples': 7253376, 'steps': 37777, 'loss/train': 0.317062109708786} -08/30/2021 20:01:05 - INFO - __main__ - Step 37779: {'lr': 0.00043130218772596053, 'samples': 7253568, 'steps': 37778, 'loss/train': 1.5649075508117676} -08/30/2021 20:01:07 - INFO - __main__ - Step 37780: {'lr': 0.00043129853383741334, 'samples': 7253760, 'steps': 37779, 'loss/train': 0.6254189610481262} -08/30/2021 20:01:08 - INFO - __main__ - Step 37781: {'lr': 0.00043129487986717574, 'samples': 7253952, 'steps': 37780, 'loss/train': 2.1937649250030518} -08/30/2021 20:01:08 - INFO - __main__ - Step 37782: {'lr': 0.00043129122581524957, 'samples': 7254144, 'steps': 37781, 'loss/train': 1.481724739074707} -08/30/2021 20:01:09 - INFO - __main__ - Step 37783: {'lr': 0.0004312875716816363, 'samples': 7254336, 'steps': 37782, 'loss/train': 1.017342448234558} -08/30/2021 20:01:09 - INFO - __main__ - Step 37784: {'lr': 0.0004312839174663377, 'samples': 7254528, 'steps': 37783, 'loss/train': 1.4106327295303345} -08/30/2021 20:01:09 - INFO - __main__ - Step 37785: {'lr': 0.0004312802631693553, 'samples': 7254720, 'steps': 37784, 'loss/train': 0.6265113353729248} -08/30/2021 20:01:10 - INFO - __main__ - Step 37786: {'lr': 0.00043127660879069084, 'samples': 7254912, 'steps': 37785, 'loss/train': 0.5277948975563049} -08/30/2021 20:01:11 - INFO - __main__ - Step 37787: {'lr': 0.00043127295433034594, 'samples': 7255104, 'steps': 37786, 'loss/train': 1.2199138402938843} -08/30/2021 20:01:12 - INFO - __main__ - Step 37788: {'lr': 0.00043126929978832217, 'samples': 7255296, 'steps': 37787, 'loss/train': 0.05714753642678261} -08/30/2021 20:01:12 - INFO - __main__ - Step 37789: {'lr': 0.00043126564516462134, 'samples': 7255488, 'steps': 37788, 'loss/train': 0.993311882019043} -08/30/2021 20:01:12 - INFO - __main__ - Step 37790: {'lr': 0.000431261990459245, 'samples': 7255680, 'steps': 37789, 'loss/train': 4.479589939117432} -08/30/2021 20:01:13 - INFO - __main__ - Step 37791: {'lr': 0.0004312583356721948, 'samples': 7255872, 'steps': 37790, 'loss/train': 1.38930082321167} -08/30/2021 20:01:14 - INFO - __main__ - Step 37792: {'lr': 0.0004312546808034724, 'samples': 7256064, 'steps': 37791, 'loss/train': 1.716701865196228} -08/30/2021 20:01:15 - INFO - __main__ - Step 37793: {'lr': 0.0004312510258530794, 'samples': 7256256, 'steps': 37792, 'loss/train': 1.6482864618301392} -08/30/2021 20:01:15 - INFO - __main__ - Step 37794: {'lr': 0.0004312473708210175, 'samples': 7256448, 'steps': 37793, 'loss/train': 0.8659932017326355} -08/30/2021 20:01:15 - INFO - __main__ - Step 37795: {'lr': 0.0004312437157072884, 'samples': 7256640, 'steps': 37794, 'loss/train': 1.498479962348938} -08/30/2021 20:01:16 - INFO - __main__ - Step 37796: {'lr': 0.00043124006051189356, 'samples': 7256832, 'steps': 37795, 'loss/train': 1.50589919090271} -08/30/2021 20:01:17 - INFO - __main__ - Step 37797: {'lr': 0.0004312364052348348, 'samples': 7257024, 'steps': 37796, 'loss/train': 1.1998440027236938} -08/30/2021 20:01:18 - INFO - __main__ - Step 37798: {'lr': 0.0004312327498761137, 'samples': 7257216, 'steps': 37797, 'loss/train': 1.165573239326477} -08/30/2021 20:01:18 - INFO - __main__ - Step 37799: {'lr': 0.000431229094435732, 'samples': 7257408, 'steps': 37798, 'loss/train': 1.298769235610962} -08/30/2021 20:01:18 - INFO - __main__ - Step 37800: {'lr': 0.0004312254389136911, 'samples': 7257600, 'steps': 37799, 'loss/train': 1.6393367052078247} -08/30/2021 20:01:19 - INFO - __main__ - Step 37801: {'lr': 0.00043122178330999296, 'samples': 7257792, 'steps': 37800, 'loss/train': 1.7565828561782837} -08/30/2021 20:01:20 - INFO - __main__ - Step 37802: {'lr': 0.0004312181276246391, 'samples': 7257984, 'steps': 37801, 'loss/train': 1.5882149934768677} -08/30/2021 20:01:21 - INFO - __main__ - Step 37803: {'lr': 0.00043121447185763106, 'samples': 7258176, 'steps': 37802, 'loss/train': 1.6342334747314453} -08/30/2021 20:01:21 - INFO - __main__ - Step 37804: {'lr': 0.0004312108160089706, 'samples': 7258368, 'steps': 37803, 'loss/train': 1.569624900817871} -08/30/2021 20:01:21 - INFO - __main__ - Step 37805: {'lr': 0.00043120716007865933, 'samples': 7258560, 'steps': 37804, 'loss/train': 0.5727700591087341} -08/30/2021 20:01:22 - INFO - __main__ - Step 37806: {'lr': 0.0004312035040666989, 'samples': 7258752, 'steps': 37805, 'loss/train': 1.0620774030685425} -08/30/2021 20:01:23 - INFO - __main__ - Step 37807: {'lr': 0.000431199847973091, 'samples': 7258944, 'steps': 37806, 'loss/train': 1.3332579135894775} -08/30/2021 20:01:24 - INFO - __main__ - Step 37808: {'lr': 0.0004311961917978372, 'samples': 7259136, 'steps': 37807, 'loss/train': 1.697693943977356} -08/30/2021 20:01:24 - INFO - __main__ - Step 37809: {'lr': 0.0004311925355409393, 'samples': 7259328, 'steps': 37808, 'loss/train': 1.5940006971359253} -08/30/2021 20:01:24 - INFO - __main__ - Step 37810: {'lr': 0.00043118887920239876, 'samples': 7259520, 'steps': 37809, 'loss/train': 1.4617135524749756} -08/30/2021 20:01:25 - INFO - __main__ - Step 37811: {'lr': 0.00043118522278221726, 'samples': 7259712, 'steps': 37810, 'loss/train': 1.3778870105743408} -08/30/2021 20:01:27 - INFO - __main__ - Step 37812: {'lr': 0.0004311815662803966, 'samples': 7259904, 'steps': 37811, 'loss/train': 2.3793747425079346} -08/30/2021 20:01:27 - INFO - __main__ - Step 37813: {'lr': 0.00043117790969693826, 'samples': 7260096, 'steps': 37812, 'loss/train': 1.7134493589401245} -08/30/2021 20:01:27 - INFO - __main__ - Step 37814: {'lr': 0.00043117425303184395, 'samples': 7260288, 'steps': 37813, 'loss/train': 1.6078107357025146} -08/30/2021 20:01:28 - INFO - __main__ - Step 37815: {'lr': 0.0004311705962851153, 'samples': 7260480, 'steps': 37814, 'loss/train': 1.257380485534668} -08/30/2021 20:01:28 - INFO - __main__ - Step 37816: {'lr': 0.000431166939456754, 'samples': 7260672, 'steps': 37815, 'loss/train': 1.3523883819580078} -08/30/2021 20:01:30 - INFO - __main__ - Step 37817: {'lr': 0.0004311632825467617, 'samples': 7260864, 'steps': 37816, 'loss/train': 0.7073904275894165} -08/30/2021 20:01:30 - INFO - __main__ - Step 37818: {'lr': 0.00043115962555514, 'samples': 7261056, 'steps': 37817, 'loss/train': 1.1123647689819336} -08/30/2021 20:01:31 - INFO - __main__ - Step 37819: {'lr': 0.0004311559684818905, 'samples': 7261248, 'steps': 37818, 'loss/train': 1.449662685394287} -08/30/2021 20:01:31 - INFO - __main__ - Step 37820: {'lr': 0.000431152311327015, 'samples': 7261440, 'steps': 37819, 'loss/train': 0.5699060559272766} -08/30/2021 20:01:31 - INFO - __main__ - Step 37821: {'lr': 0.00043114865409051505, 'samples': 7261632, 'steps': 37820, 'loss/train': 1.3527705669403076} -08/30/2021 20:01:33 - INFO - __main__ - Step 37822: {'lr': 0.0004311449967723923, 'samples': 7261824, 'steps': 37821, 'loss/train': 1.5606176853179932} -08/30/2021 20:01:33 - INFO - __main__ - Step 37823: {'lr': 0.00043114133937264843, 'samples': 7262016, 'steps': 37822, 'loss/train': 1.5322378873825073} -08/30/2021 20:01:34 - INFO - __main__ - Step 37824: {'lr': 0.000431137681891285, 'samples': 7262208, 'steps': 37823, 'loss/train': 0.664175808429718} -08/30/2021 20:01:34 - INFO - __main__ - Step 37825: {'lr': 0.0004311340243283038, 'samples': 7262400, 'steps': 37824, 'loss/train': 0.0782211422920227} -08/30/2021 20:01:34 - INFO - __main__ - Step 37826: {'lr': 0.0004311303666837064, 'samples': 7262592, 'steps': 37825, 'loss/train': 1.404437780380249} -08/30/2021 20:01:35 - INFO - __main__ - Step 37827: {'lr': 0.0004311267089574944, 'samples': 7262784, 'steps': 37826, 'loss/train': 0.18977566063404083} -08/30/2021 20:01:36 - INFO - __main__ - Step 37828: {'lr': 0.00043112305114966957, 'samples': 7262976, 'steps': 37827, 'loss/train': 2.391573190689087} -08/30/2021 20:01:37 - INFO - __main__ - Step 37829: {'lr': 0.0004311193932602334, 'samples': 7263168, 'steps': 37828, 'loss/train': 1.4405546188354492} -08/30/2021 20:01:37 - INFO - __main__ - Step 37830: {'lr': 0.0004311157352891877, 'samples': 7263360, 'steps': 37829, 'loss/train': 1.7260751724243164} -08/30/2021 20:01:37 - INFO - __main__ - Step 37831: {'lr': 0.000431112077236534, 'samples': 7263552, 'steps': 37830, 'loss/train': 1.29401433467865} -08/30/2021 20:01:38 - INFO - __main__ - Step 37832: {'lr': 0.0004311084191022741, 'samples': 7263744, 'steps': 37831, 'loss/train': 1.2429078817367554} -08/30/2021 20:01:39 - INFO - __main__ - Step 37833: {'lr': 0.00043110476088640935, 'samples': 7263936, 'steps': 37832, 'loss/train': 1.2765179872512817} -08/30/2021 20:01:39 - INFO - __main__ - Step 37834: {'lr': 0.00043110110258894177, 'samples': 7264128, 'steps': 37833, 'loss/train': 2.3622725009918213} -08/30/2021 20:01:40 - INFO - __main__ - Step 37835: {'lr': 0.00043109744420987274, 'samples': 7264320, 'steps': 37834, 'loss/train': 1.2294102907180786} -08/30/2021 20:01:40 - INFO - __main__ - Step 37836: {'lr': 0.000431093785749204, 'samples': 7264512, 'steps': 37835, 'loss/train': 1.6432852745056152} -08/30/2021 20:01:40 - INFO - __main__ - Step 37837: {'lr': 0.00043109012720693717, 'samples': 7264704, 'steps': 37836, 'loss/train': 1.603135108947754} -08/30/2021 20:01:42 - INFO - __main__ - Step 37838: {'lr': 0.000431086468583074, 'samples': 7264896, 'steps': 37837, 'loss/train': 1.3908874988555908} -08/30/2021 20:01:43 - INFO - __main__ - Step 37839: {'lr': 0.00043108280987761593, 'samples': 7265088, 'steps': 37838, 'loss/train': 0.3412628173828125} -08/30/2021 20:01:43 - INFO - __main__ - Step 37840: {'lr': 0.0004310791510905649, 'samples': 7265280, 'steps': 37839, 'loss/train': 1.7199853658676147} -08/30/2021 20:01:43 - INFO - __main__ - Step 37841: {'lr': 0.00043107549222192235, 'samples': 7265472, 'steps': 37840, 'loss/train': 1.634230136871338} -08/30/2021 20:01:44 - INFO - __main__ - Step 37842: {'lr': 0.0004310718332716899, 'samples': 7265664, 'steps': 37841, 'loss/train': 1.3085078001022339} -08/30/2021 20:01:45 - INFO - __main__ - Step 37843: {'lr': 0.00043106817423986933, 'samples': 7265856, 'steps': 37842, 'loss/train': 1.3753633499145508} -08/30/2021 20:01:46 - INFO - __main__ - Step 37844: {'lr': 0.00043106451512646226, 'samples': 7266048, 'steps': 37843, 'loss/train': 1.5045685768127441} -08/30/2021 20:01:46 - INFO - __main__ - Step 37845: {'lr': 0.00043106085593147027, 'samples': 7266240, 'steps': 37844, 'loss/train': 1.0204722881317139} -08/30/2021 20:01:46 - INFO - __main__ - Step 37846: {'lr': 0.00043105719665489505, 'samples': 7266432, 'steps': 37845, 'loss/train': 1.5937714576721191} -08/30/2021 20:01:47 - INFO - __main__ - Step 37847: {'lr': 0.0004310535372967383, 'samples': 7266624, 'steps': 37846, 'loss/train': 1.3426986932754517} -08/30/2021 20:01:48 - INFO - __main__ - Step 37848: {'lr': 0.0004310498778570016, 'samples': 7266816, 'steps': 37847, 'loss/train': 1.5222175121307373} -08/30/2021 20:01:49 - INFO - __main__ - Step 37849: {'lr': 0.0004310462183356866, 'samples': 7267008, 'steps': 37848, 'loss/train': 1.5410236120224} -08/30/2021 20:01:49 - INFO - __main__ - Step 37850: {'lr': 0.00043104255873279497, 'samples': 7267200, 'steps': 37849, 'loss/train': 0.9960685968399048} -08/30/2021 20:01:49 - INFO - __main__ - Step 37851: {'lr': 0.00043103889904832837, 'samples': 7267392, 'steps': 37850, 'loss/train': 1.3453502655029297} -08/30/2021 20:01:50 - INFO - __main__ - Step 37852: {'lr': 0.0004310352392822884, 'samples': 7267584, 'steps': 37851, 'loss/train': 1.0611807107925415} -08/30/2021 20:01:51 - INFO - __main__ - Step 37853: {'lr': 0.00043103157943467674, 'samples': 7267776, 'steps': 37852, 'loss/train': 1.4241032600402832} -08/30/2021 20:01:52 - INFO - __main__ - Step 37854: {'lr': 0.00043102791950549513, 'samples': 7267968, 'steps': 37853, 'loss/train': 1.404571533203125} -08/30/2021 20:01:52 - INFO - __main__ - Step 37855: {'lr': 0.00043102425949474504, 'samples': 7268160, 'steps': 37854, 'loss/train': 1.0707902908325195} -08/30/2021 20:01:53 - INFO - __main__ - Step 37856: {'lr': 0.00043102059940242825, 'samples': 7268352, 'steps': 37855, 'loss/train': 1.2622687816619873} -08/30/2021 20:01:53 - INFO - __main__ - Step 37857: {'lr': 0.0004310169392285464, 'samples': 7268544, 'steps': 37856, 'loss/train': 1.3767515420913696} -08/30/2021 20:01:53 - INFO - __main__ - Step 37858: {'lr': 0.0004310132789731011, 'samples': 7268736, 'steps': 37857, 'loss/train': 1.4821090698242188} -08/30/2021 20:01:56 - INFO - __main__ - Step 37859: {'lr': 0.000431009618636094, 'samples': 7268928, 'steps': 37858, 'loss/train': 0.06676900386810303} -08/30/2021 20:01:57 - INFO - __main__ - Step 37860: {'lr': 0.00043100595821752674, 'samples': 7269120, 'steps': 37859, 'loss/train': 1.4708852767944336} -08/30/2021 20:01:57 - INFO - __main__ - Step 37861: {'lr': 0.00043100229771740096, 'samples': 7269312, 'steps': 37860, 'loss/train': 1.5063320398330688} -08/30/2021 20:01:57 - INFO - __main__ - Step 37862: {'lr': 0.0004309986371357184, 'samples': 7269504, 'steps': 37861, 'loss/train': 1.0035943984985352} -08/30/2021 20:01:58 - INFO - __main__ - Step 37863: {'lr': 0.00043099497647248065, 'samples': 7269696, 'steps': 37862, 'loss/train': 1.7991957664489746} -08/30/2021 20:01:58 - INFO - __main__ - Step 37864: {'lr': 0.00043099131572768936, 'samples': 7269888, 'steps': 37863, 'loss/train': 1.7775837182998657} -08/30/2021 20:01:58 - INFO - __main__ - Step 37865: {'lr': 0.00043098765490134607, 'samples': 7270080, 'steps': 37864, 'loss/train': 1.0462443828582764} -08/30/2021 20:01:59 - INFO - __main__ - Step 37866: {'lr': 0.00043098399399345267, 'samples': 7270272, 'steps': 37865, 'loss/train': 2.1398673057556152} -08/30/2021 20:02:00 - INFO - __main__ - Step 37867: {'lr': 0.0004309803330040106, 'samples': 7270464, 'steps': 37866, 'loss/train': 5.814516067504883} -08/30/2021 20:02:01 - INFO - __main__ - Step 37868: {'lr': 0.0004309766719330216, 'samples': 7270656, 'steps': 37867, 'loss/train': 0.6848388910293579} -08/30/2021 20:02:01 - INFO - __main__ - Step 37869: {'lr': 0.00043097301078048736, 'samples': 7270848, 'steps': 37868, 'loss/train': 1.5420037508010864} -08/30/2021 20:02:02 - INFO - __main__ - Step 37870: {'lr': 0.00043096934954640935, 'samples': 7271040, 'steps': 37869, 'loss/train': 1.61904776096344} -08/30/2021 20:02:02 - INFO - __main__ - Step 37871: {'lr': 0.0004309656882307894, 'samples': 7271232, 'steps': 37870, 'loss/train': 0.18017643690109253} -08/30/2021 20:02:02 - INFO - __main__ - Step 37872: {'lr': 0.0004309620268336292, 'samples': 7271424, 'steps': 37871, 'loss/train': 0.8786585330963135} -08/30/2021 20:02:04 - INFO - __main__ - Step 37873: {'lr': 0.0004309583653549302, 'samples': 7271616, 'steps': 37872, 'loss/train': 1.290591835975647} -08/30/2021 20:02:05 - INFO - __main__ - Step 37874: {'lr': 0.0004309547037946941, 'samples': 7271808, 'steps': 37873, 'loss/train': 1.7790499925613403} -08/30/2021 20:02:05 - INFO - __main__ - Step 37875: {'lr': 0.0004309510421529227, 'samples': 7272000, 'steps': 37874, 'loss/train': 1.4028468132019043} -08/30/2021 20:02:05 - INFO - __main__ - Step 37876: {'lr': 0.00043094738042961754, 'samples': 7272192, 'steps': 37875, 'loss/train': 1.6830459833145142} -08/30/2021 20:02:06 - INFO - __main__ - Step 37877: {'lr': 0.0004309437186247803, 'samples': 7272384, 'steps': 37876, 'loss/train': 1.4887789487838745} -08/30/2021 20:02:07 - INFO - __main__ - Step 37878: {'lr': 0.00043094005673841257, 'samples': 7272576, 'steps': 37877, 'loss/train': 0.8011658191680908} -08/30/2021 20:02:08 - INFO - __main__ - Step 37879: {'lr': 0.00043093639477051606, 'samples': 7272768, 'steps': 37878, 'loss/train': 1.5701242685317993} -08/30/2021 20:02:08 - INFO - __main__ - Step 37880: {'lr': 0.0004309327327210923, 'samples': 7272960, 'steps': 37879, 'loss/train': 1.2994638681411743} -08/30/2021 20:02:08 - INFO - __main__ - Step 37881: {'lr': 0.00043092907059014325, 'samples': 7273152, 'steps': 37880, 'loss/train': 1.2492634057998657} -08/30/2021 20:02:09 - INFO - __main__ - Step 37882: {'lr': 0.00043092540837767025, 'samples': 7273344, 'steps': 37881, 'loss/train': 1.1876689195632935} -08/30/2021 20:02:10 - INFO - __main__ - Step 37883: {'lr': 0.000430921746083675, 'samples': 7273536, 'steps': 37882, 'loss/train': 1.6326980590820312} -08/30/2021 20:02:11 - INFO - __main__ - Step 37884: {'lr': 0.00043091808370815935, 'samples': 7273728, 'steps': 37883, 'loss/train': 1.6195087432861328} -08/30/2021 20:02:11 - INFO - __main__ - Step 37885: {'lr': 0.0004309144212511246, 'samples': 7273920, 'steps': 37884, 'loss/train': 1.1608182191848755} -08/30/2021 20:02:11 - INFO - __main__ - Step 37886: {'lr': 0.00043091075871257275, 'samples': 7274112, 'steps': 37885, 'loss/train': 1.5530043840408325} -08/30/2021 20:02:12 - INFO - __main__ - Step 37887: {'lr': 0.0004309070960925052, 'samples': 7274304, 'steps': 37886, 'loss/train': 1.4360982179641724} -08/30/2021 20:02:13 - INFO - __main__ - Step 37888: {'lr': 0.0004309034333909238, 'samples': 7274496, 'steps': 37887, 'loss/train': 2.7442939281463623} -08/30/2021 20:02:14 - INFO - __main__ - Step 37889: {'lr': 0.0004308997706078301, 'samples': 7274688, 'steps': 37888, 'loss/train': 0.9758208394050598} -08/30/2021 20:02:14 - INFO - __main__ - Step 37890: {'lr': 0.00043089610774322575, 'samples': 7274880, 'steps': 37889, 'loss/train': 0.5293806195259094} -08/30/2021 20:02:15 - INFO - __main__ - Step 37891: {'lr': 0.00043089244479711233, 'samples': 7275072, 'steps': 37890, 'loss/train': 1.2836235761642456} -08/30/2021 20:02:15 - INFO - __main__ - Step 37892: {'lr': 0.00043088878176949163, 'samples': 7275264, 'steps': 37891, 'loss/train': 1.7117257118225098} -08/30/2021 20:02:16 - INFO - __main__ - Step 37893: {'lr': 0.0004308851186603652, 'samples': 7275456, 'steps': 37892, 'loss/train': 1.4861423969268799} -08/30/2021 20:02:17 - INFO - __main__ - Step 37894: {'lr': 0.0004308814554697348, 'samples': 7275648, 'steps': 37893, 'loss/train': 1.29928719997406} -08/30/2021 20:02:17 - INFO - __main__ - Step 37895: {'lr': 0.0004308777921976019, 'samples': 7275840, 'steps': 37894, 'loss/train': 0.8017020225524902} -08/30/2021 20:02:18 - INFO - __main__ - Step 37896: {'lr': 0.00043087412884396835, 'samples': 7276032, 'steps': 37895, 'loss/train': 1.224180817604065} -08/30/2021 20:02:18 - INFO - __main__ - Step 37897: {'lr': 0.0004308704654088357, 'samples': 7276224, 'steps': 37896, 'loss/train': 1.6390975713729858} -08/30/2021 20:02:18 - INFO - __main__ - Step 37898: {'lr': 0.00043086680189220554, 'samples': 7276416, 'steps': 37897, 'loss/train': 1.4691028594970703} -08/30/2021 20:02:20 - INFO - __main__ - Step 37899: {'lr': 0.00043086313829407966, 'samples': 7276608, 'steps': 37898, 'loss/train': 1.4377100467681885} -08/30/2021 20:02:20 - INFO - __main__ - Step 37900: {'lr': 0.0004308594746144596, 'samples': 7276800, 'steps': 37899, 'loss/train': 1.1837940216064453} -08/30/2021 20:02:21 - INFO - __main__ - Step 37901: {'lr': 0.0004308558108533471, 'samples': 7276992, 'steps': 37900, 'loss/train': 1.5996122360229492} -08/30/2021 20:02:21 - INFO - __main__ - Step 37902: {'lr': 0.0004308521470107437, 'samples': 7277184, 'steps': 37901, 'loss/train': 1.0837979316711426} -08/30/2021 20:02:21 - INFO - __main__ - Step 37903: {'lr': 0.00043084848308665115, 'samples': 7277376, 'steps': 37902, 'loss/train': 1.2540404796600342} -08/30/2021 20:02:23 - INFO - __main__ - Step 37904: {'lr': 0.00043084481908107103, 'samples': 7277568, 'steps': 37903, 'loss/train': 1.5019642114639282} -08/30/2021 20:02:24 - INFO - __main__ - Step 37905: {'lr': 0.00043084115499400505, 'samples': 7277760, 'steps': 37904, 'loss/train': 1.501989722251892} -08/30/2021 20:02:24 - INFO - __main__ - Step 37906: {'lr': 0.0004308374908254549, 'samples': 7277952, 'steps': 37905, 'loss/train': 1.6943483352661133} -08/30/2021 20:02:24 - INFO - __main__ - Step 37907: {'lr': 0.000430833826575422, 'samples': 7278144, 'steps': 37906, 'loss/train': 1.894102931022644} -08/30/2021 20:02:25 - INFO - __main__ - Step 37908: {'lr': 0.0004308301622439083, 'samples': 7278336, 'steps': 37907, 'loss/train': 0.05945177748799324} -08/30/2021 20:02:25 - INFO - __main__ - Step 37909: {'lr': 0.0004308264978309153, 'samples': 7278528, 'steps': 37908, 'loss/train': 0.5095059275627136} -08/30/2021 20:02:27 - INFO - __main__ - Step 37910: {'lr': 0.0004308228333364447, 'samples': 7278720, 'steps': 37909, 'loss/train': 1.611308217048645} -08/30/2021 20:02:27 - INFO - __main__ - Step 37911: {'lr': 0.000430819168760498, 'samples': 7278912, 'steps': 37910, 'loss/train': 0.7591837048530579} -08/30/2021 20:02:27 - INFO - __main__ - Step 37912: {'lr': 0.0004308155041030771, 'samples': 7279104, 'steps': 37911, 'loss/train': 1.6226508617401123} -08/30/2021 20:02:28 - INFO - __main__ - Step 37913: {'lr': 0.00043081183936418343, 'samples': 7279296, 'steps': 37912, 'loss/train': 0.12308230251073837} -08/30/2021 20:02:28 - INFO - __main__ - Step 37914: {'lr': 0.0004308081745438188, 'samples': 7279488, 'steps': 37913, 'loss/train': 1.0532708168029785} -08/30/2021 20:02:30 - INFO - __main__ - Step 37915: {'lr': 0.00043080450964198483, 'samples': 7279680, 'steps': 37914, 'loss/train': 1.7810993194580078} -08/30/2021 20:02:31 - INFO - __main__ - Step 37916: {'lr': 0.00043080084465868307, 'samples': 7279872, 'steps': 37915, 'loss/train': 1.8623061180114746} -08/30/2021 20:02:31 - INFO - __main__ - Step 37917: {'lr': 0.0004307971795939152, 'samples': 7280064, 'steps': 37916, 'loss/train': 1.3737930059432983} -08/30/2021 20:02:31 - INFO - __main__ - Step 37918: {'lr': 0.000430793514447683, 'samples': 7280256, 'steps': 37917, 'loss/train': 1.1269421577453613} -08/30/2021 20:02:32 - INFO - __main__ - Step 37919: {'lr': 0.000430789849219988, 'samples': 7280448, 'steps': 37918, 'loss/train': 0.9433661103248596} -08/30/2021 20:02:32 - INFO - __main__ - Step 37920: {'lr': 0.0004307861839108319, 'samples': 7280640, 'steps': 37919, 'loss/train': 1.3293336629867554} -08/30/2021 20:02:34 - INFO - __main__ - Step 37921: {'lr': 0.00043078251852021634, 'samples': 7280832, 'steps': 37920, 'loss/train': 1.1722218990325928} -08/30/2021 20:02:34 - INFO - __main__ - Step 37922: {'lr': 0.0004307788530481429, 'samples': 7281024, 'steps': 37921, 'loss/train': 1.3880480527877808} -08/30/2021 20:02:34 - INFO - __main__ - Step 37923: {'lr': 0.00043077518749461336, 'samples': 7281216, 'steps': 37922, 'loss/train': 0.8215358853340149} -08/30/2021 20:02:35 - INFO - __main__ - Step 37924: {'lr': 0.00043077152185962933, 'samples': 7281408, 'steps': 37923, 'loss/train': 2.0082170963287354} -08/30/2021 20:02:35 - INFO - __main__ - Step 37925: {'lr': 0.00043076785614319234, 'samples': 7281600, 'steps': 37924, 'loss/train': 1.9002224206924438} -08/30/2021 20:02:37 - INFO - __main__ - Step 37926: {'lr': 0.0004307641903453042, 'samples': 7281792, 'steps': 37925, 'loss/train': 1.3372080326080322} -08/30/2021 20:02:38 - INFO - __main__ - Step 37927: {'lr': 0.00043076052446596656, 'samples': 7281984, 'steps': 37926, 'loss/train': 0.9769525527954102} -08/30/2021 20:02:38 - INFO - __main__ - Step 37928: {'lr': 0.000430756858505181, 'samples': 7282176, 'steps': 37927, 'loss/train': 2.007188320159912} -08/30/2021 20:02:39 - INFO - __main__ - Step 37929: {'lr': 0.00043075319246294914, 'samples': 7282368, 'steps': 37928, 'loss/train': 2.086503267288208} -08/30/2021 20:02:39 - INFO - __main__ - Step 37930: {'lr': 0.0004307495263392727, 'samples': 7282560, 'steps': 37929, 'loss/train': 1.3345279693603516} -08/30/2021 20:02:40 - INFO - __main__ - Step 37931: {'lr': 0.00043074586013415337, 'samples': 7282752, 'steps': 37930, 'loss/train': 0.8397785425186157} -08/30/2021 20:02:41 - INFO - __main__ - Step 37932: {'lr': 0.0004307421938475926, 'samples': 7282944, 'steps': 37931, 'loss/train': 1.3382477760314941} -08/30/2021 20:02:41 - INFO - __main__ - Step 37933: {'lr': 0.0004307385274795923, 'samples': 7283136, 'steps': 37932, 'loss/train': 1.1909817457199097} -08/30/2021 20:02:42 - INFO - __main__ - Step 37934: {'lr': 0.000430734861030154, 'samples': 7283328, 'steps': 37933, 'loss/train': 1.8692418336868286} -08/30/2021 20:02:42 - INFO - __main__ - Step 37935: {'lr': 0.0004307311944992793, 'samples': 7283520, 'steps': 37934, 'loss/train': 1.2709850072860718} -08/30/2021 20:02:44 - INFO - __main__ - Step 37936: {'lr': 0.00043072752788697003, 'samples': 7283712, 'steps': 37935, 'loss/train': 0.8929647207260132} -08/30/2021 20:02:44 - INFO - __main__ - Step 37937: {'lr': 0.0004307238611932276, 'samples': 7283904, 'steps': 37936, 'loss/train': 1.7575852870941162} -08/30/2021 20:02:44 - INFO - __main__ - Step 37938: {'lr': 0.00043072019441805386, 'samples': 7284096, 'steps': 37937, 'loss/train': 1.7067137956619263} -08/30/2021 20:02:45 - INFO - __main__ - Step 37939: {'lr': 0.00043071652756145035, 'samples': 7284288, 'steps': 37938, 'loss/train': 1.6471831798553467} -08/30/2021 20:02:45 - INFO - __main__ - Step 37940: {'lr': 0.0004307128606234188, 'samples': 7284480, 'steps': 37939, 'loss/train': 1.3572616577148438} -08/30/2021 20:02:45 - INFO - __main__ - Step 37941: {'lr': 0.00043070919360396076, 'samples': 7284672, 'steps': 37940, 'loss/train': 1.5423264503479004} -08/30/2021 20:02:47 - INFO - __main__ - Step 37942: {'lr': 0.00043070552650307804, 'samples': 7284864, 'steps': 37941, 'loss/train': 1.6752439737319946} -08/30/2021 20:02:47 - INFO - __main__ - Step 37943: {'lr': 0.0004307018593207721, 'samples': 7285056, 'steps': 37942, 'loss/train': 1.6285309791564941} -08/30/2021 20:02:48 - INFO - __main__ - Step 37944: {'lr': 0.0004306981920570447, 'samples': 7285248, 'steps': 37943, 'loss/train': 1.3542191982269287} -08/30/2021 20:02:48 - INFO - __main__ - Step 37945: {'lr': 0.00043069452471189765, 'samples': 7285440, 'steps': 37944, 'loss/train': 2.0343024730682373} -08/30/2021 20:02:49 - INFO - __main__ - Step 37946: {'lr': 0.00043069085728533225, 'samples': 7285632, 'steps': 37945, 'loss/train': 0.996588408946991} -08/30/2021 20:02:50 - INFO - __main__ - Step 37947: {'lr': 0.0004306871897773504, 'samples': 7285824, 'steps': 37946, 'loss/train': 1.0571370124816895} -08/30/2021 20:02:51 - INFO - __main__ - Step 37948: {'lr': 0.0004306835221879537, 'samples': 7286016, 'steps': 37947, 'loss/train': 2.371856689453125} -08/30/2021 20:02:51 - INFO - __main__ - Step 37949: {'lr': 0.00043067985451714373, 'samples': 7286208, 'steps': 37948, 'loss/train': 1.525660514831543} -08/30/2021 20:02:51 - INFO - __main__ - Step 37950: {'lr': 0.0004306761867649223, 'samples': 7286400, 'steps': 37949, 'loss/train': 1.173021674156189} -08/30/2021 20:02:52 - INFO - __main__ - Step 37951: {'lr': 0.0004306725189312909, 'samples': 7286592, 'steps': 37950, 'loss/train': 1.0360796451568604} -08/30/2021 20:02:53 - INFO - __main__ - Step 37952: {'lr': 0.00043066885101625133, 'samples': 7286784, 'steps': 37951, 'loss/train': 1.4797992706298828} -08/30/2021 20:02:54 - INFO - __main__ - Step 37953: {'lr': 0.00043066518301980504, 'samples': 7286976, 'steps': 37952, 'loss/train': 1.709488868713379} -08/30/2021 20:02:54 - INFO - __main__ - Step 37954: {'lr': 0.00043066151494195387, 'samples': 7287168, 'steps': 37953, 'loss/train': 1.8373823165893555} -08/30/2021 20:02:55 - INFO - __main__ - Step 37955: {'lr': 0.00043065784678269944, 'samples': 7287360, 'steps': 37954, 'loss/train': 1.8149770498275757} -08/30/2021 20:02:55 - INFO - __main__ - Step 37956: {'lr': 0.00043065417854204333, 'samples': 7287552, 'steps': 37955, 'loss/train': 1.3321179151535034} -08/30/2021 20:02:56 - INFO - __main__ - Step 37957: {'lr': 0.0004306505102199872, 'samples': 7287744, 'steps': 37956, 'loss/train': 1.5129896402359009} -08/30/2021 20:02:57 - INFO - __main__ - Step 37958: {'lr': 0.0004306468418165328, 'samples': 7287936, 'steps': 37957, 'loss/train': 1.294215440750122} -08/30/2021 20:02:57 - INFO - __main__ - Step 37959: {'lr': 0.0004306431733316817, 'samples': 7288128, 'steps': 37958, 'loss/train': 1.1099672317504883} -08/30/2021 20:02:58 - INFO - __main__ - Step 37960: {'lr': 0.00043063950476543563, 'samples': 7288320, 'steps': 37959, 'loss/train': 1.4662171602249146} -08/30/2021 20:02:58 - INFO - __main__ - Step 37961: {'lr': 0.0004306358361177961, 'samples': 7288512, 'steps': 37960, 'loss/train': 1.893613338470459} -08/30/2021 20:02:59 - INFO - __main__ - Step 37962: {'lr': 0.00043063216738876487, 'samples': 7288704, 'steps': 37961, 'loss/train': 0.6625356674194336} -08/30/2021 20:03:00 - INFO - __main__ - Step 37963: {'lr': 0.0004306284985783436, 'samples': 7288896, 'steps': 37962, 'loss/train': 1.7436747550964355} -08/30/2021 20:03:00 - INFO - __main__ - Step 37964: {'lr': 0.00043062482968653394, 'samples': 7289088, 'steps': 37963, 'loss/train': 1.6192299127578735} -08/30/2021 20:03:01 - INFO - __main__ - Step 37965: {'lr': 0.00043062116071333745, 'samples': 7289280, 'steps': 37964, 'loss/train': 1.397481918334961} -08/30/2021 20:03:01 - INFO - __main__ - Step 37966: {'lr': 0.0004306174916587559, 'samples': 7289472, 'steps': 37965, 'loss/train': 2.117974042892456} -08/30/2021 20:03:02 - INFO - __main__ - Step 37967: {'lr': 0.0004306138225227909, 'samples': 7289664, 'steps': 37966, 'loss/train': 1.8756572008132935} -08/30/2021 20:03:03 - INFO - __main__ - Step 37968: {'lr': 0.0004306101533054441, 'samples': 7289856, 'steps': 37967, 'loss/train': 0.8081443905830383} -08/30/2021 20:03:03 - INFO - __main__ - Step 37969: {'lr': 0.0004306064840067171, 'samples': 7290048, 'steps': 37968, 'loss/train': 1.2252280712127686} -08/30/2021 20:03:04 - INFO - __main__ - Step 37970: {'lr': 0.00043060281462661165, 'samples': 7290240, 'steps': 37969, 'loss/train': 1.2962955236434937} -08/30/2021 20:03:04 - INFO - __main__ - Step 37971: {'lr': 0.0004305991451651293, 'samples': 7290432, 'steps': 37970, 'loss/train': 1.7549068927764893} -08/30/2021 20:03:04 - INFO - __main__ - Step 37972: {'lr': 0.00043059547562227185, 'samples': 7290624, 'steps': 37971, 'loss/train': 1.2480435371398926} -08/30/2021 20:03:06 - INFO - __main__ - Step 37973: {'lr': 0.0004305918059980408, 'samples': 7290816, 'steps': 37972, 'loss/train': 0.8773108124732971} -08/30/2021 20:03:07 - INFO - __main__ - Step 37974: {'lr': 0.00043058813629243787, 'samples': 7291008, 'steps': 37973, 'loss/train': 1.6526979207992554} -08/30/2021 20:03:07 - INFO - __main__ - Step 37975: {'lr': 0.0004305844665054648, 'samples': 7291200, 'steps': 37974, 'loss/train': 0.11428213864564896} -08/30/2021 20:03:07 - INFO - __main__ - Step 37976: {'lr': 0.00043058079663712304, 'samples': 7291392, 'steps': 37975, 'loss/train': 0.05056499317288399} -08/30/2021 20:03:08 - INFO - __main__ - Step 37977: {'lr': 0.00043057712668741443, 'samples': 7291584, 'steps': 37976, 'loss/train': 0.5404082536697388} -08/30/2021 20:03:08 - INFO - __main__ - Step 37978: {'lr': 0.0004305734566563405, 'samples': 7291776, 'steps': 37977, 'loss/train': 1.5344116687774658} -08/30/2021 20:03:10 - INFO - __main__ - Step 37979: {'lr': 0.000430569786543903, 'samples': 7291968, 'steps': 37978, 'loss/train': 0.616824209690094} -08/30/2021 20:03:11 - INFO - __main__ - Step 37980: {'lr': 0.00043056611635010355, 'samples': 7292160, 'steps': 37979, 'loss/train': 1.741088628768921} -08/30/2021 20:03:11 - INFO - __main__ - Step 37981: {'lr': 0.00043056244607494375, 'samples': 7292352, 'steps': 37980, 'loss/train': 1.4914863109588623} -08/30/2021 20:03:11 - INFO - __main__ - Step 37982: {'lr': 0.0004305587757184254, 'samples': 7292544, 'steps': 37981, 'loss/train': 0.07795705646276474} -08/30/2021 20:03:12 - INFO - __main__ - Step 37983: {'lr': 0.0004305551052805499, 'samples': 7292736, 'steps': 37982, 'loss/train': 0.9139474034309387} -08/30/2021 20:03:13 - INFO - __main__ - Step 37984: {'lr': 0.0004305514347613191, 'samples': 7292928, 'steps': 37983, 'loss/train': 1.4218533039093018} -08/30/2021 20:03:14 - INFO - __main__ - Step 37985: {'lr': 0.0004305477641607347, 'samples': 7293120, 'steps': 37984, 'loss/train': 1.732502818107605} -08/30/2021 20:03:14 - INFO - __main__ - Step 37986: {'lr': 0.0004305440934787982, 'samples': 7293312, 'steps': 37985, 'loss/train': 1.4697660207748413} -08/30/2021 20:03:14 - INFO - __main__ - Step 37987: {'lr': 0.0004305404227155113, 'samples': 7293504, 'steps': 37986, 'loss/train': 0.8130356669425964} -08/30/2021 20:03:15 - INFO - __main__ - Step 37988: {'lr': 0.0004305367518708757, 'samples': 7293696, 'steps': 37987, 'loss/train': 1.533135175704956} -08/30/2021 20:03:17 - INFO - __main__ - Step 37989: {'lr': 0.000430533080944893, 'samples': 7293888, 'steps': 37988, 'loss/train': 1.0704238414764404} -08/30/2021 20:03:17 - INFO - __main__ - Step 37990: {'lr': 0.00043052940993756493, 'samples': 7294080, 'steps': 37989, 'loss/train': 1.513957142829895} -08/30/2021 20:03:17 - INFO - __main__ - Step 37991: {'lr': 0.00043052573884889305, 'samples': 7294272, 'steps': 37990, 'loss/train': 0.9590299725532532} -08/30/2021 20:03:18 - INFO - __main__ - Step 37992: {'lr': 0.00043052206767887907, 'samples': 7294464, 'steps': 37991, 'loss/train': 1.0240545272827148} -08/30/2021 20:03:18 - INFO - __main__ - Step 37993: {'lr': 0.00043051839642752466, 'samples': 7294656, 'steps': 37992, 'loss/train': 0.6313053965568542} -08/30/2021 20:03:18 - INFO - __main__ - Step 37994: {'lr': 0.00043051472509483135, 'samples': 7294848, 'steps': 37993, 'loss/train': 2.0285911560058594} -08/30/2021 20:03:19 - INFO - __main__ - Step 37995: {'lr': 0.00043051105368080103, 'samples': 7295040, 'steps': 37994, 'loss/train': 3.0165655612945557} -08/30/2021 20:03:20 - INFO - __main__ - Step 37996: {'lr': 0.00043050738218543505, 'samples': 7295232, 'steps': 37995, 'loss/train': 0.8663383722305298} -08/30/2021 20:03:21 - INFO - __main__ - Step 37997: {'lr': 0.00043050371060873537, 'samples': 7295424, 'steps': 37996, 'loss/train': 1.5373209714889526} -08/30/2021 20:03:21 - INFO - __main__ - Step 37998: {'lr': 0.00043050003895070345, 'samples': 7295616, 'steps': 37997, 'loss/train': 1.8453495502471924} -08/30/2021 20:03:22 - INFO - __main__ - Step 37999: {'lr': 0.000430496367211341, 'samples': 7295808, 'steps': 37998, 'loss/train': 1.5784364938735962} -08/30/2021 20:03:22 - INFO - __main__ - Step 38000: {'lr': 0.00043049269539064967, 'samples': 7296000, 'steps': 37999, 'loss/train': 1.7386360168457031} -08/30/2021 20:03:24 - INFO - __main__ - Step 38001: {'lr': 0.0004304890234886311, 'samples': 7296192, 'steps': 38000, 'loss/train': 1.4180324077606201} -08/30/2021 20:03:24 - INFO - __main__ - Step 38002: {'lr': 0.000430485351505287, 'samples': 7296384, 'steps': 38001, 'loss/train': 1.0759921073913574} -08/30/2021 20:03:25 - INFO - __main__ - Step 38003: {'lr': 0.000430481679440619, 'samples': 7296576, 'steps': 38002, 'loss/train': 1.434752106666565} -08/30/2021 20:03:25 - INFO - __main__ - Step 38004: {'lr': 0.0004304780072946287, 'samples': 7296768, 'steps': 38003, 'loss/train': 0.1043323203921318} -08/30/2021 20:03:25 - INFO - __main__ - Step 38005: {'lr': 0.00043047433506731783, 'samples': 7296960, 'steps': 38004, 'loss/train': 1.4746665954589844} -08/30/2021 20:03:27 - INFO - __main__ - Step 38006: {'lr': 0.00043047066275868795, 'samples': 7297152, 'steps': 38005, 'loss/train': 1.7519036531448364} -08/30/2021 20:03:27 - INFO - __main__ - Step 38007: {'lr': 0.0004304669903687408, 'samples': 7297344, 'steps': 38006, 'loss/train': 0.8012483716011047} -08/30/2021 20:03:28 - INFO - __main__ - Step 38008: {'lr': 0.000430463317897478, 'samples': 7297536, 'steps': 38007, 'loss/train': 1.7156062126159668} -08/30/2021 20:03:28 - INFO - __main__ - Step 38009: {'lr': 0.0004304596453449012, 'samples': 7297728, 'steps': 38008, 'loss/train': 2.0242068767547607} -08/30/2021 20:03:28 - INFO - __main__ - Step 38010: {'lr': 0.0004304559727110121, 'samples': 7297920, 'steps': 38009, 'loss/train': 2.1348319053649902} -08/30/2021 20:03:29 - INFO - __main__ - Step 38011: {'lr': 0.0004304522999958124, 'samples': 7298112, 'steps': 38010, 'loss/train': 1.8222863674163818} -08/30/2021 20:03:30 - INFO - __main__ - Step 38012: {'lr': 0.00043044862719930356, 'samples': 7298304, 'steps': 38011, 'loss/train': 1.3840633630752563} -08/30/2021 20:03:31 - INFO - __main__ - Step 38013: {'lr': 0.0004304449543214874, 'samples': 7298496, 'steps': 38012, 'loss/train': 1.9130126237869263} -08/30/2021 20:03:31 - INFO - __main__ - Step 38014: {'lr': 0.0004304412813623655, 'samples': 7298688, 'steps': 38013, 'loss/train': 1.882386326789856} -08/30/2021 20:03:32 - INFO - __main__ - Step 38015: {'lr': 0.0004304376083219396, 'samples': 7298880, 'steps': 38014, 'loss/train': 0.8804007768630981} -08/30/2021 20:03:32 - INFO - __main__ - Step 38016: {'lr': 0.00043043393520021125, 'samples': 7299072, 'steps': 38015, 'loss/train': 0.13883128762245178} -08/30/2021 20:03:33 - INFO - __main__ - Step 38017: {'lr': 0.0004304302619971822, 'samples': 7299264, 'steps': 38016, 'loss/train': 1.70297110080719} -08/30/2021 20:03:34 - INFO - __main__ - Step 38018: {'lr': 0.000430426588712854, 'samples': 7299456, 'steps': 38017, 'loss/train': 1.4282335042953491} -08/30/2021 20:03:34 - INFO - __main__ - Step 38019: {'lr': 0.0004304229153472283, 'samples': 7299648, 'steps': 38018, 'loss/train': 1.3424490690231323} -08/30/2021 20:03:35 - INFO - __main__ - Step 38020: {'lr': 0.0004304192419003069, 'samples': 7299840, 'steps': 38019, 'loss/train': 1.3992161750793457} -08/30/2021 20:03:35 - INFO - __main__ - Step 38021: {'lr': 0.0004304155683720914, 'samples': 7300032, 'steps': 38020, 'loss/train': 1.5418304204940796} -08/30/2021 20:03:37 - INFO - __main__ - Step 38022: {'lr': 0.0004304118947625835, 'samples': 7300224, 'steps': 38021, 'loss/train': 0.09601171314716339} -08/30/2021 20:03:37 - INFO - __main__ - Step 38023: {'lr': 0.00043040822107178465, 'samples': 7300416, 'steps': 38022, 'loss/train': 1.2730473279953003} -08/30/2021 20:03:37 - INFO - __main__ - Step 38024: {'lr': 0.0004304045472996966, 'samples': 7300608, 'steps': 38023, 'loss/train': 1.0747939348220825} -08/30/2021 20:03:38 - INFO - __main__ - Step 38025: {'lr': 0.0004304008734463212, 'samples': 7300800, 'steps': 38024, 'loss/train': 1.6828967332839966} -08/30/2021 20:03:38 - INFO - __main__ - Step 38026: {'lr': 0.00043039719951165986, 'samples': 7300992, 'steps': 38025, 'loss/train': 2.090561866760254} -08/30/2021 20:03:39 - INFO - __main__ - Step 38027: {'lr': 0.0004303935254957143, 'samples': 7301184, 'steps': 38026, 'loss/train': 1.8977477550506592} -08/30/2021 20:03:40 - INFO - __main__ - Step 38028: {'lr': 0.0004303898513984863, 'samples': 7301376, 'steps': 38027, 'loss/train': 1.4088269472122192} -08/30/2021 20:03:40 - INFO - __main__ - Step 38029: {'lr': 0.0004303861772199773, 'samples': 7301568, 'steps': 38028, 'loss/train': 1.0330966711044312} -08/30/2021 20:03:41 - INFO - __main__ - Step 38030: {'lr': 0.00043038250296018916, 'samples': 7301760, 'steps': 38029, 'loss/train': 1.5588605403900146} -08/30/2021 20:03:41 - INFO - __main__ - Step 38031: {'lr': 0.00043037882861912344, 'samples': 7301952, 'steps': 38030, 'loss/train': 0.5695727467536926} -08/30/2021 20:03:43 - INFO - __main__ - Step 38032: {'lr': 0.00043037515419678174, 'samples': 7302144, 'steps': 38031, 'loss/train': 1.294374704360962} -08/30/2021 20:03:44 - INFO - __main__ - Step 38033: {'lr': 0.0004303714796931658, 'samples': 7302336, 'steps': 38032, 'loss/train': 0.7637272477149963} -08/30/2021 20:03:44 - INFO - __main__ - Step 38034: {'lr': 0.0004303678051082773, 'samples': 7302528, 'steps': 38033, 'loss/train': 1.7364870309829712} -08/30/2021 20:03:44 - INFO - __main__ - Step 38035: {'lr': 0.00043036413044211786, 'samples': 7302720, 'steps': 38034, 'loss/train': 1.1784203052520752} -08/30/2021 20:03:45 - INFO - __main__ - Step 38036: {'lr': 0.0004303604556946891, 'samples': 7302912, 'steps': 38035, 'loss/train': 1.5858491659164429} -08/30/2021 20:03:46 - INFO - __main__ - Step 38037: {'lr': 0.00043035678086599265, 'samples': 7303104, 'steps': 38036, 'loss/train': 0.9570990800857544} -08/30/2021 20:03:46 - INFO - __main__ - Step 38038: {'lr': 0.00043035310595603026, 'samples': 7303296, 'steps': 38037, 'loss/train': 0.3596562147140503} -08/30/2021 20:03:47 - INFO - __main__ - Step 38039: {'lr': 0.00043034943096480357, 'samples': 7303488, 'steps': 38038, 'loss/train': 1.8890827894210815} -08/30/2021 20:03:47 - INFO - __main__ - Step 38040: {'lr': 0.0004303457558923142, 'samples': 7303680, 'steps': 38039, 'loss/train': 1.600340485572815} -08/30/2021 20:03:47 - INFO - __main__ - Step 38041: {'lr': 0.00043034208073856374, 'samples': 7303872, 'steps': 38040, 'loss/train': 0.49670132994651794} -08/30/2021 20:03:48 - INFO - __main__ - Step 38042: {'lr': 0.000430338405503554, 'samples': 7304064, 'steps': 38041, 'loss/train': 1.7882537841796875} -08/30/2021 20:03:49 - INFO - __main__ - Step 38043: {'lr': 0.00043033473018728655, 'samples': 7304256, 'steps': 38042, 'loss/train': 1.536326289176941} -08/30/2021 20:03:50 - INFO - __main__ - Step 38044: {'lr': 0.00043033105478976306, 'samples': 7304448, 'steps': 38043, 'loss/train': 1.5883727073669434} -08/30/2021 20:03:50 - INFO - __main__ - Step 38045: {'lr': 0.00043032737931098517, 'samples': 7304640, 'steps': 38044, 'loss/train': 1.8947027921676636} -08/30/2021 20:03:51 - INFO - __main__ - Step 38046: {'lr': 0.0004303237037509545, 'samples': 7304832, 'steps': 38045, 'loss/train': 0.8449161052703857} -08/30/2021 20:03:51 - INFO - __main__ - Step 38047: {'lr': 0.0004303200281096727, 'samples': 7305024, 'steps': 38046, 'loss/train': 1.590850591659546} -08/30/2021 20:03:52 - INFO - __main__ - Step 38048: {'lr': 0.00043031635238714163, 'samples': 7305216, 'steps': 38047, 'loss/train': 1.472548007965088} -08/30/2021 20:03:53 - INFO - __main__ - Step 38049: {'lr': 0.00043031267658336276, 'samples': 7305408, 'steps': 38048, 'loss/train': 1.02083158493042} -08/30/2021 20:03:53 - INFO - __main__ - Step 38050: {'lr': 0.00043030900069833774, 'samples': 7305600, 'steps': 38049, 'loss/train': 1.3275349140167236} -08/30/2021 20:03:54 - INFO - __main__ - Step 38051: {'lr': 0.0004303053247320683, 'samples': 7305792, 'steps': 38050, 'loss/train': 1.6457797288894653} -08/30/2021 20:03:54 - INFO - __main__ - Step 38052: {'lr': 0.000430301648684556, 'samples': 7305984, 'steps': 38051, 'loss/train': 1.064283013343811} -08/30/2021 20:03:55 - INFO - __main__ - Step 38053: {'lr': 0.0004302979725558026, 'samples': 7306176, 'steps': 38052, 'loss/train': 1.4403722286224365} -08/30/2021 20:03:56 - INFO - __main__ - Step 38054: {'lr': 0.0004302942963458097, 'samples': 7306368, 'steps': 38053, 'loss/train': 1.52396559715271} -08/30/2021 20:03:56 - INFO - __main__ - Step 38055: {'lr': 0.00043029062005457897, 'samples': 7306560, 'steps': 38054, 'loss/train': 1.647038221359253} -08/30/2021 20:03:57 - INFO - __main__ - Step 38056: {'lr': 0.00043028694368211216, 'samples': 7306752, 'steps': 38055, 'loss/train': 1.6798739433288574} -08/30/2021 20:03:57 - INFO - __main__ - Step 38057: {'lr': 0.00043028326722841073, 'samples': 7306944, 'steps': 38056, 'loss/train': 1.427933692932129} -08/30/2021 20:03:59 - INFO - __main__ - Step 38058: {'lr': 0.00043027959069347644, 'samples': 7307136, 'steps': 38057, 'loss/train': 1.5558427572250366} -08/30/2021 20:03:59 - INFO - __main__ - Step 38059: {'lr': 0.00043027591407731106, 'samples': 7307328, 'steps': 38058, 'loss/train': 0.9162428379058838} -08/30/2021 20:03:59 - INFO - __main__ - Step 38060: {'lr': 0.000430272237379916, 'samples': 7307520, 'steps': 38059, 'loss/train': 1.9274269342422485} -08/30/2021 20:04:00 - INFO - __main__ - Step 38061: {'lr': 0.00043026856060129307, 'samples': 7307712, 'steps': 38060, 'loss/train': 1.641619086265564} -08/30/2021 20:04:00 - INFO - __main__ - Step 38062: {'lr': 0.00043026488374144404, 'samples': 7307904, 'steps': 38061, 'loss/train': 1.0995973348617554} -08/30/2021 20:04:01 - INFO - __main__ - Step 38063: {'lr': 0.00043026120680037026, 'samples': 7308096, 'steps': 38062, 'loss/train': 1.8768608570098877} -08/30/2021 20:04:02 - INFO - __main__ - Step 38064: {'lr': 0.00043025752977807365, 'samples': 7308288, 'steps': 38063, 'loss/train': 1.5482667684555054} -08/30/2021 20:04:02 - INFO - __main__ - Step 38065: {'lr': 0.00043025385267455576, 'samples': 7308480, 'steps': 38064, 'loss/train': 1.600582242012024} -08/30/2021 20:04:03 - INFO - __main__ - Step 38066: {'lr': 0.0004302501754898183, 'samples': 7308672, 'steps': 38065, 'loss/train': 1.2704813480377197} -08/30/2021 20:04:03 - INFO - __main__ - Step 38067: {'lr': 0.00043024649822386284, 'samples': 7308864, 'steps': 38066, 'loss/train': 1.2843825817108154} -08/30/2021 20:04:04 - INFO - __main__ - Step 38068: {'lr': 0.00043024282087669106, 'samples': 7309056, 'steps': 38067, 'loss/train': 1.643200159072876} -08/30/2021 20:04:05 - INFO - __main__ - Step 38069: {'lr': 0.0004302391434483048, 'samples': 7309248, 'steps': 38068, 'loss/train': 1.4084856510162354} -08/30/2021 20:04:05 - INFO - __main__ - Step 38070: {'lr': 0.00043023546593870543, 'samples': 7309440, 'steps': 38069, 'loss/train': 1.260197639465332} -08/30/2021 20:04:05 - INFO - __main__ - Step 38071: {'lr': 0.00043023178834789477, 'samples': 7309632, 'steps': 38070, 'loss/train': 1.0648444890975952} -08/30/2021 20:04:06 - INFO - __main__ - Step 38072: {'lr': 0.0004302281106758745, 'samples': 7309824, 'steps': 38071, 'loss/train': 1.3773057460784912} -08/30/2021 20:04:07 - INFO - __main__ - Step 38073: {'lr': 0.00043022443292264613, 'samples': 7310016, 'steps': 38072, 'loss/train': 2.071263313293457} -08/30/2021 20:04:08 - INFO - __main__ - Step 38074: {'lr': 0.00043022075508821145, 'samples': 7310208, 'steps': 38073, 'loss/train': 1.4826546907424927} -08/30/2021 20:04:08 - INFO - __main__ - Step 38075: {'lr': 0.0004302170771725721, 'samples': 7310400, 'steps': 38074, 'loss/train': 1.163777470588684} -08/30/2021 20:04:09 - INFO - __main__ - Step 38076: {'lr': 0.0004302133991757297, 'samples': 7310592, 'steps': 38075, 'loss/train': 1.8173130750656128} -08/30/2021 20:04:09 - INFO - __main__ - Step 38077: {'lr': 0.000430209721097686, 'samples': 7310784, 'steps': 38076, 'loss/train': 1.3335477113723755} -08/30/2021 20:04:11 - INFO - __main__ - Step 38078: {'lr': 0.00043020604293844244, 'samples': 7310976, 'steps': 38077, 'loss/train': 1.1913659572601318} -08/30/2021 20:04:11 - INFO - __main__ - Step 38079: {'lr': 0.0004302023646980009, 'samples': 7311168, 'steps': 38078, 'loss/train': 1.4555636644363403} -08/30/2021 20:04:11 - INFO - __main__ - Step 38080: {'lr': 0.00043019868637636294, 'samples': 7311360, 'steps': 38079, 'loss/train': 1.7773770093917847} -08/30/2021 20:04:12 - INFO - __main__ - Step 38081: {'lr': 0.0004301950079735302, 'samples': 7311552, 'steps': 38080, 'loss/train': 1.149129033088684} -08/30/2021 20:04:12 - INFO - __main__ - Step 38082: {'lr': 0.00043019132948950443, 'samples': 7311744, 'steps': 38081, 'loss/train': 3.0543625354766846} -08/30/2021 20:04:12 - INFO - __main__ - Step 38083: {'lr': 0.0004301876509242872, 'samples': 7311936, 'steps': 38082, 'loss/train': 1.4620031118392944} -08/30/2021 20:04:13 - INFO - __main__ - Step 38084: {'lr': 0.0004301839722778802, 'samples': 7312128, 'steps': 38083, 'loss/train': 1.4417636394500732} -08/30/2021 20:04:14 - INFO - __main__ - Step 38085: {'lr': 0.0004301802935502851, 'samples': 7312320, 'steps': 38084, 'loss/train': 1.1092498302459717} -08/30/2021 20:04:15 - INFO - __main__ - Step 38086: {'lr': 0.00043017661474150347, 'samples': 7312512, 'steps': 38085, 'loss/train': 1.0917634963989258} -08/30/2021 20:04:15 - INFO - __main__ - Step 38087: {'lr': 0.0004301729358515371, 'samples': 7312704, 'steps': 38086, 'loss/train': 1.238690972328186} -08/30/2021 20:04:15 - INFO - __main__ - Step 38088: {'lr': 0.00043016925688038756, 'samples': 7312896, 'steps': 38087, 'loss/train': 1.6434701681137085} -08/30/2021 20:04:16 - INFO - __main__ - Step 38089: {'lr': 0.00043016557782805655, 'samples': 7313088, 'steps': 38088, 'loss/train': 1.3235447406768799} -08/30/2021 20:04:18 - INFO - __main__ - Step 38090: {'lr': 0.0004301618986945457, 'samples': 7313280, 'steps': 38089, 'loss/train': 0.9472088813781738} -08/30/2021 20:04:18 - INFO - __main__ - Step 38091: {'lr': 0.0004301582194798567, 'samples': 7313472, 'steps': 38090, 'loss/train': 1.320418357849121} -08/30/2021 20:04:19 - INFO - __main__ - Step 38092: {'lr': 0.00043015454018399115, 'samples': 7313664, 'steps': 38091, 'loss/train': 1.4500608444213867} -08/30/2021 20:04:19 - INFO - __main__ - Step 38093: {'lr': 0.00043015086080695075, 'samples': 7313856, 'steps': 38092, 'loss/train': 2.2782180309295654} -08/30/2021 20:04:19 - INFO - __main__ - Step 38094: {'lr': 0.0004301471813487372, 'samples': 7314048, 'steps': 38093, 'loss/train': 1.544771671295166} -08/30/2021 20:04:21 - INFO - __main__ - Step 38095: {'lr': 0.00043014350180935207, 'samples': 7314240, 'steps': 38094, 'loss/train': 1.32065749168396} -08/30/2021 20:04:21 - INFO - __main__ - Step 38096: {'lr': 0.0004301398221887971, 'samples': 7314432, 'steps': 38095, 'loss/train': 1.8495428562164307} -08/30/2021 20:04:22 - INFO - __main__ - Step 38097: {'lr': 0.0004301361424870739, 'samples': 7314624, 'steps': 38096, 'loss/train': 0.18316933512687683} -08/30/2021 20:04:22 - INFO - __main__ - Step 38098: {'lr': 0.00043013246270418406, 'samples': 7314816, 'steps': 38097, 'loss/train': 2.0615177154541016} -08/30/2021 20:04:22 - INFO - __main__ - Step 38099: {'lr': 0.00043012878284012936, 'samples': 7315008, 'steps': 38098, 'loss/train': 1.0804531574249268} -08/30/2021 20:04:23 - INFO - __main__ - Step 38100: {'lr': 0.0004301251028949114, 'samples': 7315200, 'steps': 38099, 'loss/train': 1.241612195968628} -08/30/2021 20:04:24 - INFO - __main__ - Step 38101: {'lr': 0.00043012142286853185, 'samples': 7315392, 'steps': 38100, 'loss/train': 1.2666245698928833} -08/30/2021 20:04:25 - INFO - __main__ - Step 38102: {'lr': 0.00043011774276099235, 'samples': 7315584, 'steps': 38101, 'loss/train': 1.3013263940811157} -08/30/2021 20:04:25 - INFO - __main__ - Step 38103: {'lr': 0.0004301140625722946, 'samples': 7315776, 'steps': 38102, 'loss/train': 1.5301237106323242} -08/30/2021 20:04:26 - INFO - __main__ - Step 38104: {'lr': 0.0004301103823024403, 'samples': 7315968, 'steps': 38103, 'loss/train': 1.8450559377670288} -08/30/2021 20:04:26 - INFO - __main__ - Step 38105: {'lr': 0.0004301067019514309, 'samples': 7316160, 'steps': 38104, 'loss/train': 1.2126245498657227} -08/30/2021 20:04:27 - INFO - __main__ - Step 38106: {'lr': 0.0004301030215192683, 'samples': 7316352, 'steps': 38105, 'loss/train': 1.06794011592865} -08/30/2021 20:04:28 - INFO - __main__ - Step 38107: {'lr': 0.00043009934100595403, 'samples': 7316544, 'steps': 38106, 'loss/train': 1.2656378746032715} -08/30/2021 20:04:28 - INFO - __main__ - Step 38108: {'lr': 0.00043009566041148973, 'samples': 7316736, 'steps': 38107, 'loss/train': 1.358382225036621} -08/30/2021 20:04:28 - INFO - __main__ - Step 38109: {'lr': 0.0004300919797358772, 'samples': 7316928, 'steps': 38108, 'loss/train': 1.4306318759918213} -08/30/2021 20:04:29 - INFO - __main__ - Step 38110: {'lr': 0.00043008829897911796, 'samples': 7317120, 'steps': 38109, 'loss/train': 1.4010542631149292} -08/30/2021 20:04:30 - INFO - __main__ - Step 38111: {'lr': 0.0004300846181412137, 'samples': 7317312, 'steps': 38110, 'loss/train': 1.4865506887435913} -08/30/2021 20:04:31 - INFO - __main__ - Step 38112: {'lr': 0.00043008093722216603, 'samples': 7317504, 'steps': 38111, 'loss/train': 1.0639395713806152} -08/30/2021 20:04:31 - INFO - __main__ - Step 38113: {'lr': 0.00043007725622197675, 'samples': 7317696, 'steps': 38112, 'loss/train': 1.9150346517562866} -08/30/2021 20:04:32 - INFO - __main__ - Step 38114: {'lr': 0.0004300735751406474, 'samples': 7317888, 'steps': 38113, 'loss/train': 2.0976529121398926} -08/30/2021 20:04:32 - INFO - __main__ - Step 38115: {'lr': 0.00043006989397817967, 'samples': 7318080, 'steps': 38114, 'loss/train': 1.4350019693374634} -08/30/2021 20:04:32 - INFO - __main__ - Step 38116: {'lr': 0.00043006621273457523, 'samples': 7318272, 'steps': 38115, 'loss/train': 1.3051835298538208} -08/30/2021 20:04:34 - INFO - __main__ - Step 38117: {'lr': 0.0004300625314098358, 'samples': 7318464, 'steps': 38116, 'loss/train': 0.10825788229703903} -08/30/2021 20:04:34 - INFO - __main__ - Step 38118: {'lr': 0.0004300588500039629, 'samples': 7318656, 'steps': 38117, 'loss/train': 5.947971343994141} -08/30/2021 20:04:35 - INFO - __main__ - Step 38119: {'lr': 0.0004300551685169583, 'samples': 7318848, 'steps': 38118, 'loss/train': 1.714760184288025} -08/30/2021 20:04:35 - INFO - __main__ - Step 38120: {'lr': 0.0004300514869488236, 'samples': 7319040, 'steps': 38119, 'loss/train': 1.7870771884918213} -08/30/2021 20:04:35 - INFO - __main__ - Step 38121: {'lr': 0.00043004780529956046, 'samples': 7319232, 'steps': 38120, 'loss/train': 1.267866849899292} -08/30/2021 20:04:37 - INFO - __main__ - Step 38122: {'lr': 0.00043004412356917055, 'samples': 7319424, 'steps': 38121, 'loss/train': 1.9728401899337769} -08/30/2021 20:04:37 - INFO - __main__ - Step 38123: {'lr': 0.0004300404417576556, 'samples': 7319616, 'steps': 38122, 'loss/train': 1.5835316181182861} -08/30/2021 20:04:38 - INFO - __main__ - Step 38124: {'lr': 0.00043003675986501717, 'samples': 7319808, 'steps': 38123, 'loss/train': 1.705342173576355} -08/30/2021 20:04:38 - INFO - __main__ - Step 38125: {'lr': 0.00043003307789125694, 'samples': 7320000, 'steps': 38124, 'loss/train': 1.744152545928955} -08/30/2021 20:04:39 - INFO - __main__ - Step 38126: {'lr': 0.0004300293958363766, 'samples': 7320192, 'steps': 38125, 'loss/train': 1.6485809087753296} -08/30/2021 20:04:40 - INFO - __main__ - Step 38127: {'lr': 0.00043002571370037777, 'samples': 7320384, 'steps': 38126, 'loss/train': 2.0750226974487305} -08/30/2021 20:04:41 - INFO - __main__ - Step 38128: {'lr': 0.00043002203148326213, 'samples': 7320576, 'steps': 38127, 'loss/train': 1.4557346105575562} -08/30/2021 20:04:41 - INFO - __main__ - Step 38129: {'lr': 0.0004300183491850314, 'samples': 7320768, 'steps': 38128, 'loss/train': 1.4113519191741943} -08/30/2021 20:04:41 - INFO - __main__ - Step 38130: {'lr': 0.0004300146668056871, 'samples': 7320960, 'steps': 38129, 'loss/train': 1.333693027496338} -08/30/2021 20:04:42 - INFO - __main__ - Step 38131: {'lr': 0.00043001098434523107, 'samples': 7321152, 'steps': 38130, 'loss/train': 1.1593481302261353} -08/30/2021 20:04:42 - INFO - __main__ - Step 38132: {'lr': 0.0004300073018036648, 'samples': 7321344, 'steps': 38131, 'loss/train': 0.5571146011352539} -08/30/2021 20:04:44 - INFO - __main__ - Step 38133: {'lr': 0.00043000361918099, 'samples': 7321536, 'steps': 38132, 'loss/train': 1.232261300086975} -08/30/2021 20:04:44 - INFO - __main__ - Step 38134: {'lr': 0.00042999993647720836, 'samples': 7321728, 'steps': 38133, 'loss/train': 0.06851159036159515} -08/30/2021 20:04:45 - INFO - __main__ - Step 38135: {'lr': 0.0004299962536923215, 'samples': 7321920, 'steps': 38134, 'loss/train': 1.6765235662460327} -08/30/2021 20:04:45 - INFO - __main__ - Step 38136: {'lr': 0.0004299925708263312, 'samples': 7322112, 'steps': 38135, 'loss/train': 1.6706408262252808} -08/30/2021 20:04:45 - INFO - __main__ - Step 38137: {'lr': 0.00042998888787923895, 'samples': 7322304, 'steps': 38136, 'loss/train': 1.7377032041549683} -08/30/2021 20:04:47 - INFO - __main__ - Step 38138: {'lr': 0.0004299852048510465, 'samples': 7322496, 'steps': 38137, 'loss/train': 1.678581953048706} -08/30/2021 20:04:47 - INFO - __main__ - Step 38139: {'lr': 0.00042998152174175555, 'samples': 7322688, 'steps': 38138, 'loss/train': 1.3767420053482056} -08/30/2021 20:04:48 - INFO - __main__ - Step 38140: {'lr': 0.0004299778385513676, 'samples': 7322880, 'steps': 38139, 'loss/train': 1.274703860282898} -08/30/2021 20:04:48 - INFO - __main__ - Step 38141: {'lr': 0.0004299741552798845, 'samples': 7323072, 'steps': 38140, 'loss/train': 1.2292976379394531} -08/30/2021 20:04:48 - INFO - __main__ - Step 38142: {'lr': 0.0004299704719273078, 'samples': 7323264, 'steps': 38141, 'loss/train': 1.185442566871643} -08/30/2021 20:04:49 - INFO - __main__ - Step 38143: {'lr': 0.00042996678849363914, 'samples': 7323456, 'steps': 38142, 'loss/train': 1.057015299797058} -08/30/2021 20:04:51 - INFO - __main__ - Step 38144: {'lr': 0.00042996310497888025, 'samples': 7323648, 'steps': 38143, 'loss/train': 1.5116634368896484} -08/30/2021 20:04:51 - INFO - __main__ - Step 38145: {'lr': 0.00042995942138303274, 'samples': 7323840, 'steps': 38144, 'loss/train': 1.4529461860656738} -08/30/2021 20:04:52 - INFO - __main__ - Step 38146: {'lr': 0.0004299557377060983, 'samples': 7324032, 'steps': 38145, 'loss/train': 1.35940682888031} -08/30/2021 20:04:52 - INFO - __main__ - Step 38147: {'lr': 0.00042995205394807864, 'samples': 7324224, 'steps': 38146, 'loss/train': 1.5660464763641357} -08/30/2021 20:04:52 - INFO - __main__ - Step 38148: {'lr': 0.00042994837010897524, 'samples': 7324416, 'steps': 38147, 'loss/train': 1.2501001358032227} -08/30/2021 20:04:55 - INFO - __main__ - Step 38149: {'lr': 0.00042994468618879, 'samples': 7324608, 'steps': 38148, 'loss/train': 1.6698060035705566} -08/30/2021 20:04:55 - INFO - __main__ - Step 38150: {'lr': 0.0004299410021875244, 'samples': 7324800, 'steps': 38149, 'loss/train': 0.5998290181159973} -08/30/2021 20:04:55 - INFO - __main__ - Step 38151: {'lr': 0.00042993731810518025, 'samples': 7324992, 'steps': 38150, 'loss/train': 0.5505896806716919} -08/30/2021 20:04:56 - INFO - __main__ - Step 38152: {'lr': 0.00042993363394175897, 'samples': 7325184, 'steps': 38151, 'loss/train': 1.2739479541778564} -08/30/2021 20:04:56 - INFO - __main__ - Step 38153: {'lr': 0.0004299299496972625, 'samples': 7325376, 'steps': 38152, 'loss/train': 0.7034235596656799} -08/30/2021 20:04:57 - INFO - __main__ - Step 38154: {'lr': 0.0004299262653716923, 'samples': 7325568, 'steps': 38153, 'loss/train': 1.1546645164489746} -08/30/2021 20:04:58 - INFO - __main__ - Step 38155: {'lr': 0.0004299225809650501, 'samples': 7325760, 'steps': 38154, 'loss/train': 1.1841838359832764} -08/30/2021 20:04:58 - INFO - __main__ - Step 38156: {'lr': 0.0004299188964773376, 'samples': 7325952, 'steps': 38155, 'loss/train': 1.0835820436477661} -08/30/2021 20:04:59 - INFO - __main__ - Step 38157: {'lr': 0.0004299152119085564, 'samples': 7326144, 'steps': 38156, 'loss/train': 1.6562628746032715} -08/30/2021 20:04:59 - INFO - __main__ - Step 38158: {'lr': 0.0004299115272587082, 'samples': 7326336, 'steps': 38157, 'loss/train': 0.6394487023353577} -08/30/2021 20:05:00 - INFO - __main__ - Step 38159: {'lr': 0.0004299078425277947, 'samples': 7326528, 'steps': 38158, 'loss/train': 1.6423875093460083} -08/30/2021 20:05:01 - INFO - __main__ - Step 38160: {'lr': 0.00042990415771581734, 'samples': 7326720, 'steps': 38159, 'loss/train': 1.2092241048812866} -08/30/2021 20:05:02 - INFO - __main__ - Step 38161: {'lr': 0.0004299004728227781, 'samples': 7326912, 'steps': 38160, 'loss/train': 1.6938648223876953} -08/30/2021 20:05:02 - INFO - __main__ - Step 38162: {'lr': 0.0004298967878486784, 'samples': 7327104, 'steps': 38161, 'loss/train': 2.016425371170044} -08/30/2021 20:05:02 - INFO - __main__ - Step 38163: {'lr': 0.00042989310279352, 'samples': 7327296, 'steps': 38162, 'loss/train': 1.2421073913574219} -08/30/2021 20:05:03 - INFO - __main__ - Step 38164: {'lr': 0.0004298894176573046, 'samples': 7327488, 'steps': 38163, 'loss/train': 0.059755463153123856} -08/30/2021 20:05:03 - INFO - __main__ - Step 38165: {'lr': 0.0004298857324400337, 'samples': 7327680, 'steps': 38164, 'loss/train': 1.375670075416565} -08/30/2021 20:05:05 - INFO - __main__ - Step 38166: {'lr': 0.0004298820471417091, 'samples': 7327872, 'steps': 38165, 'loss/train': 1.4727246761322021} -08/30/2021 20:05:05 - INFO - __main__ - Step 38167: {'lr': 0.00042987836176233246, 'samples': 7328064, 'steps': 38166, 'loss/train': 0.7216182947158813} -08/30/2021 20:05:05 - INFO - __main__ - Step 38168: {'lr': 0.0004298746763019054, 'samples': 7328256, 'steps': 38167, 'loss/train': 1.4980967044830322} -08/30/2021 20:05:06 - INFO - __main__ - Step 38169: {'lr': 0.0004298709907604296, 'samples': 7328448, 'steps': 38168, 'loss/train': 0.632712721824646} -08/30/2021 20:05:06 - INFO - __main__ - Step 38170: {'lr': 0.0004298673051379066, 'samples': 7328640, 'steps': 38169, 'loss/train': 0.4579286277294159} -08/30/2021 20:05:08 - INFO - __main__ - Step 38171: {'lr': 0.0004298636194343383, 'samples': 7328832, 'steps': 38170, 'loss/train': 1.649490475654602} -08/30/2021 20:05:08 - INFO - __main__ - Step 38172: {'lr': 0.0004298599336497262, 'samples': 7329024, 'steps': 38171, 'loss/train': 1.2945585250854492} -08/30/2021 20:05:08 - INFO - __main__ - Step 38173: {'lr': 0.00042985624778407196, 'samples': 7329216, 'steps': 38172, 'loss/train': 2.015388011932373} -08/30/2021 20:05:09 - INFO - __main__ - Step 38174: {'lr': 0.00042985256183737723, 'samples': 7329408, 'steps': 38173, 'loss/train': 1.3931941986083984} -08/30/2021 20:05:09 - INFO - __main__ - Step 38175: {'lr': 0.00042984887580964376, 'samples': 7329600, 'steps': 38174, 'loss/train': 1.5762046575546265} -08/30/2021 20:05:11 - INFO - __main__ - Step 38176: {'lr': 0.00042984518970087316, 'samples': 7329792, 'steps': 38175, 'loss/train': 1.447563886642456} -08/30/2021 20:05:11 - INFO - __main__ - Step 38177: {'lr': 0.0004298415035110671, 'samples': 7329984, 'steps': 38176, 'loss/train': 0.9451384544372559} -08/30/2021 20:05:11 - INFO - __main__ - Step 38178: {'lr': 0.00042983781724022723, 'samples': 7330176, 'steps': 38177, 'loss/train': 1.563511848449707} -08/30/2021 20:05:12 - INFO - __main__ - Step 38179: {'lr': 0.0004298341308883552, 'samples': 7330368, 'steps': 38178, 'loss/train': 1.2556973695755005} -08/30/2021 20:05:12 - INFO - __main__ - Step 38180: {'lr': 0.0004298304444554527, 'samples': 7330560, 'steps': 38179, 'loss/train': 1.8115509748458862} -08/30/2021 20:05:14 - INFO - __main__ - Step 38181: {'lr': 0.00042982675794152135, 'samples': 7330752, 'steps': 38180, 'loss/train': 1.5163209438323975} -08/30/2021 20:05:14 - INFO - __main__ - Step 38182: {'lr': 0.0004298230713465629, 'samples': 7330944, 'steps': 38181, 'loss/train': 3.8600540161132812} -08/30/2021 20:05:15 - INFO - __main__ - Step 38183: {'lr': 0.00042981938467057893, 'samples': 7331136, 'steps': 38182, 'loss/train': 0.09460396319627762} -08/30/2021 20:05:15 - INFO - __main__ - Step 38184: {'lr': 0.0004298156979135711, 'samples': 7331328, 'steps': 38183, 'loss/train': 1.7542532682418823} -08/30/2021 20:05:15 - INFO - __main__ - Step 38185: {'lr': 0.000429812011075541, 'samples': 7331520, 'steps': 38184, 'loss/train': 1.335465431213379} -08/30/2021 20:05:16 - INFO - __main__ - Step 38186: {'lr': 0.0004298083241564905, 'samples': 7331712, 'steps': 38185, 'loss/train': 0.14262399077415466} -08/30/2021 20:05:18 - INFO - __main__ - Step 38187: {'lr': 0.00042980463715642115, 'samples': 7331904, 'steps': 38186, 'loss/train': 1.7476221323013306} -08/30/2021 20:05:18 - INFO - __main__ - Step 38188: {'lr': 0.0004298009500753346, 'samples': 7332096, 'steps': 38187, 'loss/train': 1.2012053728103638} -08/30/2021 20:05:19 - INFO - __main__ - Step 38189: {'lr': 0.00042979726291323246, 'samples': 7332288, 'steps': 38188, 'loss/train': 0.08518649637699127} -08/30/2021 20:05:19 - INFO - __main__ - Step 38190: {'lr': 0.00042979357567011643, 'samples': 7332480, 'steps': 38189, 'loss/train': 1.461737036705017} -08/30/2021 20:05:19 - INFO - __main__ - Step 38191: {'lr': 0.0004297898883459883, 'samples': 7332672, 'steps': 38190, 'loss/train': 1.0762619972229004} -08/30/2021 20:05:20 - INFO - __main__ - Step 38192: {'lr': 0.00042978620094084955, 'samples': 7332864, 'steps': 38191, 'loss/train': 1.7315171957015991} -08/30/2021 20:05:21 - INFO - __main__ - Step 38193: {'lr': 0.00042978251345470185, 'samples': 7333056, 'steps': 38192, 'loss/train': 0.8061356544494629} -08/30/2021 20:05:22 - INFO - __main__ - Step 38194: {'lr': 0.000429778825887547, 'samples': 7333248, 'steps': 38193, 'loss/train': 1.8283162117004395} -08/30/2021 20:05:22 - INFO - __main__ - Step 38195: {'lr': 0.00042977513823938665, 'samples': 7333440, 'steps': 38194, 'loss/train': 0.6713355779647827} -08/30/2021 20:05:22 - INFO - __main__ - Step 38196: {'lr': 0.00042977145051022224, 'samples': 7333632, 'steps': 38195, 'loss/train': 2.2314579486846924} -08/30/2021 20:05:23 - INFO - __main__ - Step 38197: {'lr': 0.0004297677627000557, 'samples': 7333824, 'steps': 38196, 'loss/train': 1.8773198127746582} -08/30/2021 20:05:24 - INFO - __main__ - Step 38198: {'lr': 0.0004297640748088886, 'samples': 7334016, 'steps': 38197, 'loss/train': 1.4580886363983154} -08/30/2021 20:05:25 - INFO - __main__ - Step 38199: {'lr': 0.0004297603868367225, 'samples': 7334208, 'steps': 38198, 'loss/train': 1.021130084991455} -08/30/2021 20:05:25 - INFO - __main__ - Step 38200: {'lr': 0.00042975669878355917, 'samples': 7334400, 'steps': 38199, 'loss/train': 0.9159539937973022} -08/30/2021 20:05:25 - INFO - __main__ - Step 38201: {'lr': 0.00042975301064940026, 'samples': 7334592, 'steps': 38200, 'loss/train': 1.5189489126205444} -08/30/2021 20:05:26 - INFO - __main__ - Step 38202: {'lr': 0.00042974932243424743, 'samples': 7334784, 'steps': 38201, 'loss/train': 1.0034737586975098} -08/30/2021 20:05:28 - INFO - __main__ - Step 38203: {'lr': 0.0004297456341381023, 'samples': 7334976, 'steps': 38202, 'loss/train': 1.9908865690231323} -08/30/2021 20:05:28 - INFO - __main__ - Step 38204: {'lr': 0.0004297419457609666, 'samples': 7335168, 'steps': 38203, 'loss/train': 1.3665775060653687} -08/30/2021 20:05:28 - INFO - __main__ - Step 38205: {'lr': 0.0004297382573028419, 'samples': 7335360, 'steps': 38204, 'loss/train': 1.351920485496521} -08/30/2021 20:05:29 - INFO - __main__ - Step 38206: {'lr': 0.0004297345687637299, 'samples': 7335552, 'steps': 38205, 'loss/train': 1.8134219646453857} -08/30/2021 20:05:29 - INFO - __main__ - Step 38207: {'lr': 0.00042973088014363237, 'samples': 7335744, 'steps': 38206, 'loss/train': 1.4496570825576782} -08/30/2021 20:05:30 - INFO - __main__ - Step 38208: {'lr': 0.0004297271914425508, 'samples': 7335936, 'steps': 38207, 'loss/train': 1.2204450368881226} -08/30/2021 20:05:31 - INFO - __main__ - Step 38209: {'lr': 0.00042972350266048693, 'samples': 7336128, 'steps': 38208, 'loss/train': 1.5176422595977783} -08/30/2021 20:05:31 - INFO - __main__ - Step 38210: {'lr': 0.0004297198137974425, 'samples': 7336320, 'steps': 38209, 'loss/train': 1.4744043350219727} -08/30/2021 20:05:32 - INFO - __main__ - Step 38211: {'lr': 0.00042971612485341896, 'samples': 7336512, 'steps': 38210, 'loss/train': 1.7286087274551392} -08/30/2021 20:05:32 - INFO - __main__ - Step 38212: {'lr': 0.00042971243582841823, 'samples': 7336704, 'steps': 38211, 'loss/train': 1.5018001794815063} -08/30/2021 20:05:33 - INFO - __main__ - Step 38213: {'lr': 0.0004297087467224418, 'samples': 7336896, 'steps': 38212, 'loss/train': 1.4578546285629272} -08/30/2021 20:05:34 - INFO - __main__ - Step 38214: {'lr': 0.0004297050575354914, 'samples': 7337088, 'steps': 38213, 'loss/train': 1.1368920803070068} -08/30/2021 20:05:35 - INFO - __main__ - Step 38215: {'lr': 0.0004297013682675687, 'samples': 7337280, 'steps': 38214, 'loss/train': 0.7339975237846375} -08/30/2021 20:05:35 - INFO - __main__ - Step 38216: {'lr': 0.0004296976789186753, 'samples': 7337472, 'steps': 38215, 'loss/train': 1.039969801902771} -08/30/2021 20:05:35 - INFO - __main__ - Step 38217: {'lr': 0.00042969398948881286, 'samples': 7337664, 'steps': 38216, 'loss/train': 1.5827642679214478} -08/30/2021 20:05:36 - INFO - __main__ - Step 38218: {'lr': 0.00042969029997798314, 'samples': 7337856, 'steps': 38217, 'loss/train': 0.9548296332359314} -08/30/2021 20:05:37 - INFO - __main__ - Step 38219: {'lr': 0.00042968661038618775, 'samples': 7338048, 'steps': 38218, 'loss/train': 0.9502847194671631} -08/30/2021 20:05:38 - INFO - __main__ - Step 38220: {'lr': 0.0004296829207134283, 'samples': 7338240, 'steps': 38219, 'loss/train': 1.522841453552246} -08/30/2021 20:05:38 - INFO - __main__ - Step 38221: {'lr': 0.0004296792309597065, 'samples': 7338432, 'steps': 38220, 'loss/train': 2.252483367919922} -08/30/2021 20:05:38 - INFO - __main__ - Step 38222: {'lr': 0.00042967554112502404, 'samples': 7338624, 'steps': 38221, 'loss/train': 1.893862247467041} -08/30/2021 20:05:39 - INFO - __main__ - Step 38223: {'lr': 0.00042967185120938256, 'samples': 7338816, 'steps': 38222, 'loss/train': 1.1537975072860718} -08/30/2021 20:05:40 - INFO - __main__ - Step 38224: {'lr': 0.00042966816121278365, 'samples': 7339008, 'steps': 38223, 'loss/train': 1.4714430570602417} -08/30/2021 20:05:41 - INFO - __main__ - Step 38225: {'lr': 0.0004296644711352291, 'samples': 7339200, 'steps': 38224, 'loss/train': 0.22892123460769653} -08/30/2021 20:05:41 - INFO - __main__ - Step 38226: {'lr': 0.0004296607809767205, 'samples': 7339392, 'steps': 38225, 'loss/train': 1.49606192111969} -08/30/2021 20:05:41 - INFO - __main__ - Step 38227: {'lr': 0.00042965709073725957, 'samples': 7339584, 'steps': 38226, 'loss/train': 1.4638125896453857} -08/30/2021 20:05:42 - INFO - __main__ - Step 38228: {'lr': 0.00042965340041684785, 'samples': 7339776, 'steps': 38227, 'loss/train': 1.256641149520874} -08/30/2021 20:05:42 - INFO - __main__ - Step 38229: {'lr': 0.00042964971001548715, 'samples': 7339968, 'steps': 38228, 'loss/train': 1.588843584060669} -08/30/2021 20:05:43 - INFO - __main__ - Step 38230: {'lr': 0.00042964601953317895, 'samples': 7340160, 'steps': 38229, 'loss/train': 1.417837381362915} -08/30/2021 20:05:44 - INFO - __main__ - Step 38231: {'lr': 0.0004296423289699252, 'samples': 7340352, 'steps': 38230, 'loss/train': 1.3788716793060303} -08/30/2021 20:05:44 - INFO - __main__ - Step 38232: {'lr': 0.00042963863832572727, 'samples': 7340544, 'steps': 38231, 'loss/train': 1.118288516998291} -08/30/2021 20:05:45 - INFO - __main__ - Step 38233: {'lr': 0.0004296349476005869, 'samples': 7340736, 'steps': 38232, 'loss/train': 1.4372879266738892} -08/30/2021 20:05:45 - INFO - __main__ - Step 38234: {'lr': 0.0004296312567945059, 'samples': 7340928, 'steps': 38233, 'loss/train': 1.1061968803405762} -08/30/2021 20:05:47 - INFO - __main__ - Step 38235: {'lr': 0.0004296275659074858, 'samples': 7341120, 'steps': 38234, 'loss/train': 1.413161039352417} -08/30/2021 20:05:47 - INFO - __main__ - Step 38236: {'lr': 0.00042962387493952823, 'samples': 7341312, 'steps': 38235, 'loss/train': 1.414198398590088} -08/30/2021 20:05:48 - INFO - __main__ - Step 38237: {'lr': 0.00042962018389063495, 'samples': 7341504, 'steps': 38236, 'loss/train': 0.4985870122909546} -08/30/2021 20:05:48 - INFO - __main__ - Step 38238: {'lr': 0.0004296164927608076, 'samples': 7341696, 'steps': 38237, 'loss/train': 1.5697894096374512} -08/30/2021 20:05:48 - INFO - __main__ - Step 38239: {'lr': 0.00042961280155004786, 'samples': 7341888, 'steps': 38238, 'loss/train': 1.022641897201538} -08/30/2021 20:05:50 - INFO - __main__ - Step 38240: {'lr': 0.0004296091102583573, 'samples': 7342080, 'steps': 38239, 'loss/train': 0.495064914226532} -08/30/2021 20:05:50 - INFO - __main__ - Step 38241: {'lr': 0.0004296054188857377, 'samples': 7342272, 'steps': 38240, 'loss/train': 0.7581716179847717} -08/30/2021 20:05:50 - INFO - __main__ - Step 38242: {'lr': 0.0004296017274321906, 'samples': 7342464, 'steps': 38241, 'loss/train': 1.1975090503692627} -08/30/2021 20:05:51 - INFO - __main__ - Step 38243: {'lr': 0.0004295980358977178, 'samples': 7342656, 'steps': 38242, 'loss/train': 1.9184114933013916} -08/30/2021 20:05:51 - INFO - __main__ - Step 38244: {'lr': 0.0004295943442823209, 'samples': 7342848, 'steps': 38243, 'loss/train': 1.3504652976989746} -08/30/2021 20:05:53 - INFO - __main__ - Step 38245: {'lr': 0.0004295906525860015, 'samples': 7343040, 'steps': 38244, 'loss/train': 1.0900636911392212} -08/30/2021 20:05:53 - INFO - __main__ - Step 38246: {'lr': 0.00042958696080876136, 'samples': 7343232, 'steps': 38245, 'loss/train': 1.3474056720733643} -08/30/2021 20:05:53 - INFO - __main__ - Step 38247: {'lr': 0.00042958326895060206, 'samples': 7343424, 'steps': 38246, 'loss/train': 1.1300328969955444} -08/30/2021 20:05:54 - INFO - __main__ - Step 38248: {'lr': 0.0004295795770115254, 'samples': 7343616, 'steps': 38247, 'loss/train': 0.5504335165023804} -08/30/2021 20:05:54 - INFO - __main__ - Step 38249: {'lr': 0.0004295758849915329, 'samples': 7343808, 'steps': 38248, 'loss/train': 1.278775691986084} -08/30/2021 20:05:56 - INFO - __main__ - Step 38250: {'lr': 0.00042957219289062635, 'samples': 7344000, 'steps': 38249, 'loss/train': 1.3333531618118286} -08/30/2021 20:05:56 - INFO - __main__ - Step 38251: {'lr': 0.0004295685007088072, 'samples': 7344192, 'steps': 38250, 'loss/train': 1.7198967933654785} -08/30/2021 20:05:57 - INFO - __main__ - Step 38252: {'lr': 0.00042956480844607734, 'samples': 7344384, 'steps': 38251, 'loss/train': 1.3209530115127563} -08/30/2021 20:05:57 - INFO - __main__ - Step 38253: {'lr': 0.00042956111610243833, 'samples': 7344576, 'steps': 38252, 'loss/train': 1.4080396890640259} -08/30/2021 20:05:57 - INFO - __main__ - Step 38254: {'lr': 0.0004295574236778919, 'samples': 7344768, 'steps': 38253, 'loss/train': 1.213220477104187} -08/30/2021 20:05:59 - INFO - __main__ - Step 38255: {'lr': 0.00042955373117243954, 'samples': 7344960, 'steps': 38254, 'loss/train': 1.8991073369979858} -08/30/2021 20:06:00 - INFO - __main__ - Step 38256: {'lr': 0.0004295500385860832, 'samples': 7345152, 'steps': 38255, 'loss/train': 1.8520393371582031} -08/30/2021 20:06:00 - INFO - __main__ - Step 38257: {'lr': 0.0004295463459188243, 'samples': 7345344, 'steps': 38256, 'loss/train': 1.1536933183670044} -08/30/2021 20:06:01 - INFO - __main__ - Step 38258: {'lr': 0.00042954265317066457, 'samples': 7345536, 'steps': 38257, 'loss/train': 1.7650787830352783} -08/30/2021 20:06:01 - INFO - __main__ - Step 38259: {'lr': 0.0004295389603416057, 'samples': 7345728, 'steps': 38258, 'loss/train': 1.3722585439682007} -08/30/2021 20:06:02 - INFO - __main__ - Step 38260: {'lr': 0.0004295352674316494, 'samples': 7345920, 'steps': 38259, 'loss/train': 0.08418068289756775} -08/30/2021 20:06:03 - INFO - __main__ - Step 38261: {'lr': 0.0004295315744407972, 'samples': 7346112, 'steps': 38260, 'loss/train': 1.8569375276565552} -08/30/2021 20:06:03 - INFO - __main__ - Step 38262: {'lr': 0.0004295278813690509, 'samples': 7346304, 'steps': 38261, 'loss/train': 1.8080946207046509} -08/30/2021 20:06:04 - INFO - __main__ - Step 38263: {'lr': 0.0004295241882164121, 'samples': 7346496, 'steps': 38262, 'loss/train': 0.0890379324555397} -08/30/2021 20:06:04 - INFO - __main__ - Step 38264: {'lr': 0.0004295204949828825, 'samples': 7346688, 'steps': 38263, 'loss/train': 1.5070195198059082} -08/30/2021 20:06:04 - INFO - __main__ - Step 38265: {'lr': 0.0004295168016684636, 'samples': 7346880, 'steps': 38264, 'loss/train': 1.324474573135376} -08/30/2021 20:06:06 - INFO - __main__ - Step 38266: {'lr': 0.0004295131082731574, 'samples': 7347072, 'steps': 38265, 'loss/train': 1.471064805984497} -08/30/2021 20:06:07 - INFO - __main__ - Step 38267: {'lr': 0.0004295094147969652, 'samples': 7347264, 'steps': 38266, 'loss/train': 1.5266824960708618} -08/30/2021 20:06:07 - INFO - __main__ - Step 38268: {'lr': 0.0004295057212398889, 'samples': 7347456, 'steps': 38267, 'loss/train': 1.4947975873947144} -08/30/2021 20:06:07 - INFO - __main__ - Step 38269: {'lr': 0.00042950202760193003, 'samples': 7347648, 'steps': 38268, 'loss/train': 0.7710279822349548} -08/30/2021 20:06:08 - INFO - __main__ - Step 38270: {'lr': 0.0004294983338830904, 'samples': 7347840, 'steps': 38269, 'loss/train': 0.06871286779642105} -08/30/2021 20:06:09 - INFO - __main__ - Step 38271: {'lr': 0.0004294946400833716, 'samples': 7348032, 'steps': 38270, 'loss/train': 1.5208311080932617} -08/30/2021 20:06:10 - INFO - __main__ - Step 38272: {'lr': 0.0004294909462027752, 'samples': 7348224, 'steps': 38271, 'loss/train': 0.9921095371246338} -08/30/2021 20:06:10 - INFO - __main__ - Step 38273: {'lr': 0.000429487252241303, 'samples': 7348416, 'steps': 38272, 'loss/train': 1.6964455842971802} -08/30/2021 20:06:10 - INFO - __main__ - Step 38274: {'lr': 0.00042948355819895655, 'samples': 7348608, 'steps': 38273, 'loss/train': 0.6870641708374023} -08/30/2021 20:06:11 - INFO - __main__ - Step 38275: {'lr': 0.0004294798640757377, 'samples': 7348800, 'steps': 38274, 'loss/train': 1.894271731376648} -08/30/2021 20:06:12 - INFO - __main__ - Step 38276: {'lr': 0.00042947616987164787, 'samples': 7348992, 'steps': 38275, 'loss/train': 1.4293462038040161} -08/30/2021 20:06:13 - INFO - __main__ - Step 38277: {'lr': 0.00042947247558668887, 'samples': 7349184, 'steps': 38276, 'loss/train': 1.2104756832122803} -08/30/2021 20:06:13 - INFO - __main__ - Step 38278: {'lr': 0.00042946878122086243, 'samples': 7349376, 'steps': 38277, 'loss/train': 2.1625611782073975} -08/30/2021 20:06:13 - INFO - __main__ - Step 38279: {'lr': 0.00042946508677417007, 'samples': 7349568, 'steps': 38278, 'loss/train': 0.9601813554763794} -08/30/2021 20:06:14 - INFO - __main__ - Step 38280: {'lr': 0.0004294613922466135, 'samples': 7349760, 'steps': 38279, 'loss/train': 1.3848577737808228} -08/30/2021 20:06:15 - INFO - __main__ - Step 38281: {'lr': 0.0004294576976381944, 'samples': 7349952, 'steps': 38280, 'loss/train': 1.0251612663269043} -08/30/2021 20:06:15 - INFO - __main__ - Step 38282: {'lr': 0.00042945400294891445, 'samples': 7350144, 'steps': 38281, 'loss/train': 0.4659092426300049} -08/30/2021 20:06:16 - INFO - __main__ - Step 38283: {'lr': 0.0004294503081787753, 'samples': 7350336, 'steps': 38282, 'loss/train': 1.0270302295684814} -08/30/2021 20:06:16 - INFO - __main__ - Step 38284: {'lr': 0.0004294466133277786, 'samples': 7350528, 'steps': 38283, 'loss/train': 1.0008982419967651} -08/30/2021 20:06:17 - INFO - __main__ - Step 38285: {'lr': 0.00042944291839592597, 'samples': 7350720, 'steps': 38284, 'loss/train': 1.7949819564819336} -08/30/2021 20:06:19 - INFO - __main__ - Step 38286: {'lr': 0.0004294392233832192, 'samples': 7350912, 'steps': 38285, 'loss/train': 1.3292067050933838} -08/30/2021 20:06:19 - INFO - __main__ - Step 38287: {'lr': 0.0004294355282896599, 'samples': 7351104, 'steps': 38286, 'loss/train': 1.497835397720337} -08/30/2021 20:06:19 - INFO - __main__ - Step 38288: {'lr': 0.00042943183311524967, 'samples': 7351296, 'steps': 38287, 'loss/train': 1.17180597782135} -08/30/2021 20:06:20 - INFO - __main__ - Step 38289: {'lr': 0.0004294281378599902, 'samples': 7351488, 'steps': 38288, 'loss/train': 0.8179500102996826} -08/30/2021 20:06:20 - INFO - __main__ - Step 38290: {'lr': 0.00042942444252388323, 'samples': 7351680, 'steps': 38289, 'loss/train': 1.8279922008514404} -08/30/2021 20:06:21 - INFO - __main__ - Step 38291: {'lr': 0.0004294207471069304, 'samples': 7351872, 'steps': 38290, 'loss/train': 0.3865101933479309} -08/30/2021 20:06:22 - INFO - __main__ - Step 38292: {'lr': 0.0004294170516091332, 'samples': 7352064, 'steps': 38291, 'loss/train': 0.199554905295372} -08/30/2021 20:06:23 - INFO - __main__ - Step 38293: {'lr': 0.0004294133560304936, 'samples': 7352256, 'steps': 38292, 'loss/train': 0.6022427082061768} -08/30/2021 20:06:23 - INFO - __main__ - Step 38294: {'lr': 0.00042940966037101314, 'samples': 7352448, 'steps': 38293, 'loss/train': 0.4879750609397888} -08/30/2021 20:06:23 - INFO - __main__ - Step 38295: {'lr': 0.00042940596463069336, 'samples': 7352640, 'steps': 38294, 'loss/train': 1.4816641807556152} -08/30/2021 20:06:24 - INFO - __main__ - Step 38296: {'lr': 0.00042940226880953605, 'samples': 7352832, 'steps': 38295, 'loss/train': 0.8066173195838928} -08/30/2021 20:06:25 - INFO - __main__ - Step 38297: {'lr': 0.0004293985729075428, 'samples': 7353024, 'steps': 38296, 'loss/train': 1.0941252708435059} -08/30/2021 20:06:26 - INFO - __main__ - Step 38298: {'lr': 0.00042939487692471534, 'samples': 7353216, 'steps': 38297, 'loss/train': 1.3860887289047241} -08/30/2021 20:06:26 - INFO - __main__ - Step 38299: {'lr': 0.0004293911808610554, 'samples': 7353408, 'steps': 38298, 'loss/train': 1.9408745765686035} -08/30/2021 20:06:27 - INFO - __main__ - Step 38300: {'lr': 0.0004293874847165645, 'samples': 7353600, 'steps': 38299, 'loss/train': 2.1356542110443115} -08/30/2021 20:06:27 - INFO - __main__ - Step 38301: {'lr': 0.0004293837884912444, 'samples': 7353792, 'steps': 38300, 'loss/train': 1.271031379699707} -08/30/2021 20:06:27 - INFO - __main__ - Step 38302: {'lr': 0.00042938009218509667, 'samples': 7353984, 'steps': 38301, 'loss/train': 0.039873361587524414} -08/30/2021 20:06:29 - INFO - __main__ - Step 38303: {'lr': 0.00042937639579812304, 'samples': 7354176, 'steps': 38302, 'loss/train': 1.24366295337677} -08/30/2021 20:06:29 - INFO - __main__ - Step 38304: {'lr': 0.0004293726993303252, 'samples': 7354368, 'steps': 38303, 'loss/train': 1.8782334327697754} -08/30/2021 20:06:30 - INFO - __main__ - Step 38305: {'lr': 0.0004293690027817048, 'samples': 7354560, 'steps': 38304, 'loss/train': 1.8164504766464233} -08/30/2021 20:06:30 - INFO - __main__ - Step 38306: {'lr': 0.00042936530615226355, 'samples': 7354752, 'steps': 38305, 'loss/train': 1.1669104099273682} -08/30/2021 20:06:30 - INFO - __main__ - Step 38307: {'lr': 0.00042936160944200295, 'samples': 7354944, 'steps': 38306, 'loss/train': 0.7284160256385803} -08/30/2021 20:06:32 - INFO - __main__ - Step 38308: {'lr': 0.00042935791265092483, 'samples': 7355136, 'steps': 38307, 'loss/train': 1.7641724348068237} -08/30/2021 20:06:33 - INFO - __main__ - Step 38309: {'lr': 0.0004293542157790308, 'samples': 7355328, 'steps': 38308, 'loss/train': 1.6868990659713745} -08/30/2021 20:06:33 - INFO - __main__ - Step 38310: {'lr': 0.00042935051882632245, 'samples': 7355520, 'steps': 38309, 'loss/train': 1.474240779876709} -08/30/2021 20:06:34 - INFO - __main__ - Step 38311: {'lr': 0.0004293468217928017, 'samples': 7355712, 'steps': 38310, 'loss/train': 1.1536802053451538} -08/30/2021 20:06:34 - INFO - __main__ - Step 38312: {'lr': 0.0004293431246784699, 'samples': 7355904, 'steps': 38311, 'loss/train': 1.35757315158844} -08/30/2021 20:06:34 - INFO - __main__ - Step 38313: {'lr': 0.0004293394274833289, 'samples': 7356096, 'steps': 38312, 'loss/train': 2.712996006011963} -08/30/2021 20:06:36 - INFO - __main__ - Step 38314: {'lr': 0.0004293357302073804, 'samples': 7356288, 'steps': 38313, 'loss/train': 1.4420884847640991} -08/30/2021 20:06:37 - INFO - __main__ - Step 38315: {'lr': 0.00042933203285062585, 'samples': 7356480, 'steps': 38314, 'loss/train': 0.03965742886066437} -08/30/2021 20:06:37 - INFO - __main__ - Step 38316: {'lr': 0.00042932833541306704, 'samples': 7356672, 'steps': 38315, 'loss/train': 0.05863025411963463} -08/30/2021 20:06:37 - INFO - __main__ - Step 38317: {'lr': 0.0004293246378947058, 'samples': 7356864, 'steps': 38316, 'loss/train': 1.2256696224212646} -08/30/2021 20:06:38 - INFO - __main__ - Step 38318: {'lr': 0.00042932094029554354, 'samples': 7357056, 'steps': 38317, 'loss/train': 1.7070883512496948} -08/30/2021 20:06:38 - INFO - __main__ - Step 38319: {'lr': 0.00042931724261558205, 'samples': 7357248, 'steps': 38318, 'loss/train': 1.1679096221923828} -08/30/2021 20:06:40 - INFO - __main__ - Step 38320: {'lr': 0.000429313544854823, 'samples': 7357440, 'steps': 38319, 'loss/train': 2.084946393966675} -08/30/2021 20:06:40 - INFO - __main__ - Step 38321: {'lr': 0.00042930984701326796, 'samples': 7357632, 'steps': 38320, 'loss/train': 0.9213653802871704} -08/30/2021 20:06:41 - INFO - __main__ - Step 38322: {'lr': 0.0004293061490909187, 'samples': 7357824, 'steps': 38321, 'loss/train': 2.204930305480957} -08/30/2021 20:06:41 - INFO - __main__ - Step 38323: {'lr': 0.0004293024510877769, 'samples': 7358016, 'steps': 38322, 'loss/train': 1.5008680820465088} -08/30/2021 20:06:41 - INFO - __main__ - Step 38324: {'lr': 0.00042929875300384417, 'samples': 7358208, 'steps': 38323, 'loss/train': 1.2555770874023438} -08/30/2021 20:06:43 - INFO - __main__ - Step 38325: {'lr': 0.0004292950548391222, 'samples': 7358400, 'steps': 38324, 'loss/train': 1.0517908334732056} -08/30/2021 20:06:43 - INFO - __main__ - Step 38326: {'lr': 0.00042929135659361265, 'samples': 7358592, 'steps': 38325, 'loss/train': 1.4341306686401367} -08/30/2021 20:06:44 - INFO - __main__ - Step 38327: {'lr': 0.0004292876582673171, 'samples': 7358784, 'steps': 38326, 'loss/train': 1.5242656469345093} -08/30/2021 20:06:44 - INFO - __main__ - Step 38328: {'lr': 0.0004292839598602374, 'samples': 7358976, 'steps': 38327, 'loss/train': 1.540467381477356} -08/30/2021 20:06:44 - INFO - __main__ - Step 38329: {'lr': 0.000429280261372375, 'samples': 7359168, 'steps': 38328, 'loss/train': 1.4473063945770264} -08/30/2021 20:06:46 - INFO - __main__ - Step 38330: {'lr': 0.00042927656280373176, 'samples': 7359360, 'steps': 38329, 'loss/train': 1.760880470275879} -08/30/2021 20:06:47 - INFO - __main__ - Step 38331: {'lr': 0.00042927286415430933, 'samples': 7359552, 'steps': 38330, 'loss/train': 1.310583233833313} -08/30/2021 20:06:47 - INFO - __main__ - Step 38332: {'lr': 0.0004292691654241092, 'samples': 7359744, 'steps': 38331, 'loss/train': 1.4204710721969604} -08/30/2021 20:06:47 - INFO - __main__ - Step 38333: {'lr': 0.00042926546661313313, 'samples': 7359936, 'steps': 38332, 'loss/train': 1.2705073356628418} -08/30/2021 20:06:48 - INFO - __main__ - Step 38334: {'lr': 0.00042926176772138295, 'samples': 7360128, 'steps': 38333, 'loss/train': 1.5802440643310547} -08/30/2021 20:06:49 - INFO - __main__ - Step 38335: {'lr': 0.0004292580687488601, 'samples': 7360320, 'steps': 38334, 'loss/train': 0.784907341003418} -08/30/2021 20:06:50 - INFO - __main__ - Step 38336: {'lr': 0.0004292543696955663, 'samples': 7360512, 'steps': 38335, 'loss/train': 1.3498750925064087} -08/30/2021 20:06:50 - INFO - __main__ - Step 38337: {'lr': 0.00042925067056150324, 'samples': 7360704, 'steps': 38336, 'loss/train': 1.0025606155395508} -08/30/2021 20:06:50 - INFO - __main__ - Step 38338: {'lr': 0.0004292469713466727, 'samples': 7360896, 'steps': 38337, 'loss/train': 1.865934133529663} -08/30/2021 20:06:51 - INFO - __main__ - Step 38339: {'lr': 0.00042924327205107616, 'samples': 7361088, 'steps': 38338, 'loss/train': 1.722361445426941} -08/30/2021 20:06:52 - INFO - __main__ - Step 38340: {'lr': 0.00042923957267471536, 'samples': 7361280, 'steps': 38339, 'loss/train': 1.7274144887924194} -08/30/2021 20:06:53 - INFO - __main__ - Step 38341: {'lr': 0.000429235873217592, 'samples': 7361472, 'steps': 38340, 'loss/train': 1.5452969074249268} -08/30/2021 20:06:53 - INFO - __main__ - Step 38342: {'lr': 0.0004292321736797077, 'samples': 7361664, 'steps': 38341, 'loss/train': 0.16172029078006744} -08/30/2021 20:06:53 - INFO - __main__ - Step 38343: {'lr': 0.0004292284740610642, 'samples': 7361856, 'steps': 38342, 'loss/train': 1.1055632829666138} -08/30/2021 20:06:54 - INFO - __main__ - Step 38344: {'lr': 0.0004292247743616631, 'samples': 7362048, 'steps': 38343, 'loss/train': 1.6674665212631226} -08/30/2021 20:06:54 - INFO - __main__ - Step 38345: {'lr': 0.00042922107458150604, 'samples': 7362240, 'steps': 38344, 'loss/train': 1.0714342594146729} -08/30/2021 20:06:55 - INFO - __main__ - Step 38346: {'lr': 0.00042921737472059474, 'samples': 7362432, 'steps': 38345, 'loss/train': 0.8256217837333679} -08/30/2021 20:06:56 - INFO - __main__ - Step 38347: {'lr': 0.0004292136747789309, 'samples': 7362624, 'steps': 38346, 'loss/train': 1.4083000421524048} -08/30/2021 20:06:56 - INFO - __main__ - Step 38348: {'lr': 0.00042920997475651607, 'samples': 7362816, 'steps': 38347, 'loss/train': 1.5473214387893677} -08/30/2021 20:06:57 - INFO - __main__ - Step 38349: {'lr': 0.00042920627465335205, 'samples': 7363008, 'steps': 38348, 'loss/train': 1.6063055992126465} -08/30/2021 20:06:57 - INFO - __main__ - Step 38350: {'lr': 0.00042920257446944044, 'samples': 7363200, 'steps': 38349, 'loss/train': 1.1227517127990723} -08/30/2021 20:06:59 - INFO - __main__ - Step 38351: {'lr': 0.0004291988742047829, 'samples': 7363392, 'steps': 38350, 'loss/train': 1.6076951026916504} -08/30/2021 20:06:59 - INFO - __main__ - Step 38352: {'lr': 0.0004291951738593811, 'samples': 7363584, 'steps': 38351, 'loss/train': 1.4710899591445923} -08/30/2021 20:06:59 - INFO - __main__ - Step 38353: {'lr': 0.0004291914734332367, 'samples': 7363776, 'steps': 38352, 'loss/train': 1.488527536392212} -08/30/2021 20:07:00 - INFO - __main__ - Step 38354: {'lr': 0.0004291877729263515, 'samples': 7363968, 'steps': 38353, 'loss/train': 0.05705566331744194} -08/30/2021 20:07:00 - INFO - __main__ - Step 38355: {'lr': 0.0004291840723387269, 'samples': 7364160, 'steps': 38354, 'loss/train': 1.9111604690551758} -08/30/2021 20:07:02 - INFO - __main__ - Step 38356: {'lr': 0.0004291803716703648, 'samples': 7364352, 'steps': 38355, 'loss/train': 1.3006529808044434} -08/30/2021 20:07:02 - INFO - __main__ - Step 38357: {'lr': 0.0004291766709212668, 'samples': 7364544, 'steps': 38356, 'loss/train': 1.4822531938552856} -08/30/2021 20:07:02 - INFO - __main__ - Step 38358: {'lr': 0.00042917297009143455, 'samples': 7364736, 'steps': 38357, 'loss/train': 1.4925570487976074} -08/30/2021 20:07:03 - INFO - __main__ - Step 38359: {'lr': 0.00042916926918086973, 'samples': 7364928, 'steps': 38358, 'loss/train': 1.2138392925262451} -08/30/2021 20:07:03 - INFO - __main__ - Step 38360: {'lr': 0.000429165568189574, 'samples': 7365120, 'steps': 38359, 'loss/train': 1.5441910028457642} -08/30/2021 20:07:05 - INFO - __main__ - Step 38361: {'lr': 0.000429161867117549, 'samples': 7365312, 'steps': 38360, 'loss/train': 1.702162265777588} -08/30/2021 20:07:06 - INFO - __main__ - Step 38362: {'lr': 0.0004291581659647965, 'samples': 7365504, 'steps': 38361, 'loss/train': 1.0644760131835938} -08/30/2021 20:07:06 - INFO - __main__ - Step 38363: {'lr': 0.00042915446473131805, 'samples': 7365696, 'steps': 38362, 'loss/train': 1.857157826423645} -08/30/2021 20:07:06 - INFO - __main__ - Step 38364: {'lr': 0.0004291507634171153, 'samples': 7365888, 'steps': 38363, 'loss/train': 1.570695161819458} -08/30/2021 20:07:07 - INFO - __main__ - Step 38365: {'lr': 0.0004291470620221901, 'samples': 7366080, 'steps': 38364, 'loss/train': 1.4484847784042358} -08/30/2021 20:07:08 - INFO - __main__ - Step 38366: {'lr': 0.0004291433605465439, 'samples': 7366272, 'steps': 38365, 'loss/train': 1.6458383798599243} -08/30/2021 20:07:09 - INFO - __main__ - Step 38367: {'lr': 0.00042913965899017855, 'samples': 7366464, 'steps': 38366, 'loss/train': 1.7018097639083862} -08/30/2021 20:07:09 - INFO - __main__ - Step 38368: {'lr': 0.0004291359573530956, 'samples': 7366656, 'steps': 38367, 'loss/train': 0.5052033066749573} -08/30/2021 20:07:09 - INFO - __main__ - Step 38369: {'lr': 0.0004291322556352967, 'samples': 7366848, 'steps': 38368, 'loss/train': 1.6005996465682983} -08/30/2021 20:07:10 - INFO - __main__ - Step 38370: {'lr': 0.00042912855383678365, 'samples': 7367040, 'steps': 38369, 'loss/train': 1.4237728118896484} -08/30/2021 20:07:10 - INFO - __main__ - Step 38371: {'lr': 0.000429124851957558, 'samples': 7367232, 'steps': 38370, 'loss/train': 1.1759494543075562} -08/30/2021 20:07:12 - INFO - __main__ - Step 38372: {'lr': 0.0004291211499976214, 'samples': 7367424, 'steps': 38371, 'loss/train': 0.0802549198269844} -08/30/2021 20:07:12 - INFO - __main__ - Step 38373: {'lr': 0.0004291174479569757, 'samples': 7367616, 'steps': 38372, 'loss/train': 0.9666499495506287} -08/30/2021 20:07:12 - INFO - __main__ - Step 38374: {'lr': 0.00042911374583562233, 'samples': 7367808, 'steps': 38373, 'loss/train': 1.8338737487792969} -08/30/2021 20:07:13 - INFO - __main__ - Step 38375: {'lr': 0.0004291100436335631, 'samples': 7368000, 'steps': 38374, 'loss/train': 1.7034742832183838} -08/30/2021 20:07:13 - INFO - __main__ - Step 38376: {'lr': 0.00042910634135079963, 'samples': 7368192, 'steps': 38375, 'loss/train': 1.0884268283843994} -08/30/2021 20:07:15 - INFO - __main__ - Step 38377: {'lr': 0.00042910263898733364, 'samples': 7368384, 'steps': 38376, 'loss/train': 1.3782685995101929} -08/30/2021 20:07:15 - INFO - __main__ - Step 38378: {'lr': 0.0004290989365431668, 'samples': 7368576, 'steps': 38377, 'loss/train': 1.3031351566314697} -08/30/2021 20:07:16 - INFO - __main__ - Step 38379: {'lr': 0.0004290952340183007, 'samples': 7368768, 'steps': 38378, 'loss/train': 1.3178495168685913} -08/30/2021 20:07:16 - INFO - __main__ - Step 38380: {'lr': 0.00042909153141273705, 'samples': 7368960, 'steps': 38379, 'loss/train': 1.0316145420074463} -08/30/2021 20:07:16 - INFO - __main__ - Step 38381: {'lr': 0.0004290878287264775, 'samples': 7369152, 'steps': 38380, 'loss/train': 1.0927937030792236} -08/30/2021 20:07:17 - INFO - __main__ - Step 38382: {'lr': 0.0004290841259595237, 'samples': 7369344, 'steps': 38381, 'loss/train': 0.21168382465839386} -08/30/2021 20:07:18 - INFO - __main__ - Step 38383: {'lr': 0.00042908042311187744, 'samples': 7369536, 'steps': 38382, 'loss/train': 0.2850779891014099} -08/30/2021 20:07:19 - INFO - __main__ - Step 38384: {'lr': 0.00042907672018354027, 'samples': 7369728, 'steps': 38383, 'loss/train': 1.570150375366211} -08/30/2021 20:07:19 - INFO - __main__ - Step 38385: {'lr': 0.00042907301717451396, 'samples': 7369920, 'steps': 38384, 'loss/train': 1.4802727699279785} -08/30/2021 20:07:19 - INFO - __main__ - Step 38386: {'lr': 0.0004290693140848, 'samples': 7370112, 'steps': 38385, 'loss/train': 1.4690767526626587} -08/30/2021 20:07:20 - INFO - __main__ - Step 38387: {'lr': 0.0004290656109144003, 'samples': 7370304, 'steps': 38386, 'loss/train': 1.6843456029891968} -08/30/2021 20:07:21 - INFO - __main__ - Step 38388: {'lr': 0.0004290619076633163, 'samples': 7370496, 'steps': 38387, 'loss/train': 1.4054378271102905} -08/30/2021 20:07:22 - INFO - __main__ - Step 38389: {'lr': 0.0004290582043315498, 'samples': 7370688, 'steps': 38388, 'loss/train': 2.0691275596618652} -08/30/2021 20:07:22 - INFO - __main__ - Step 38390: {'lr': 0.0004290545009191024, 'samples': 7370880, 'steps': 38389, 'loss/train': 1.850519061088562} -08/30/2021 20:07:23 - INFO - __main__ - Step 38391: {'lr': 0.0004290507974259759, 'samples': 7371072, 'steps': 38390, 'loss/train': 1.5354053974151611} -08/30/2021 20:07:23 - INFO - __main__ - Step 38392: {'lr': 0.0004290470938521718, 'samples': 7371264, 'steps': 38391, 'loss/train': 1.6896512508392334} -08/30/2021 20:07:24 - INFO - __main__ - Step 38393: {'lr': 0.0004290433901976918, 'samples': 7371456, 'steps': 38392, 'loss/train': 1.3803422451019287} -08/30/2021 20:07:25 - INFO - __main__ - Step 38394: {'lr': 0.0004290396864625377, 'samples': 7371648, 'steps': 38393, 'loss/train': 1.3532553911209106} -08/30/2021 20:07:25 - INFO - __main__ - Step 38395: {'lr': 0.000429035982646711, 'samples': 7371840, 'steps': 38394, 'loss/train': 1.0663450956344604} -08/30/2021 20:07:25 - INFO - __main__ - Step 38396: {'lr': 0.0004290322787502135, 'samples': 7372032, 'steps': 38395, 'loss/train': 1.366197109222412} -08/30/2021 20:07:26 - INFO - __main__ - Step 38397: {'lr': 0.0004290285747730468, 'samples': 7372224, 'steps': 38396, 'loss/train': 1.0420398712158203} -08/30/2021 20:07:27 - INFO - __main__ - Step 38398: {'lr': 0.00042902487071521257, 'samples': 7372416, 'steps': 38397, 'loss/train': 1.5380035638809204} -08/30/2021 20:07:28 - INFO - __main__ - Step 38399: {'lr': 0.0004290211665767125, 'samples': 7372608, 'steps': 38398, 'loss/train': 1.3863297700881958} -08/30/2021 20:07:28 - INFO - __main__ - Step 38400: {'lr': 0.00042901746235754837, 'samples': 7372800, 'steps': 38399, 'loss/train': 5.894840717315674} -08/30/2021 20:07:29 - INFO - __main__ - Step 38401: {'lr': 0.0004290137580577216, 'samples': 7372992, 'steps': 38400, 'loss/train': 1.3483859300613403} -08/30/2021 20:07:29 - INFO - __main__ - Step 38402: {'lr': 0.000429010053677234, 'samples': 7373184, 'steps': 38401, 'loss/train': 1.3598942756652832} -08/30/2021 20:07:29 - INFO - __main__ - Step 38403: {'lr': 0.00042900634921608726, 'samples': 7373376, 'steps': 38402, 'loss/train': 1.2021913528442383} -08/30/2021 20:07:31 - INFO - __main__ - Step 38404: {'lr': 0.0004290026446742831, 'samples': 7373568, 'steps': 38403, 'loss/train': 1.045536756515503} -08/30/2021 20:07:32 - INFO - __main__ - Step 38405: {'lr': 0.00042899894005182294, 'samples': 7373760, 'steps': 38404, 'loss/train': 1.710484266281128} -08/30/2021 20:07:32 - INFO - __main__ - Step 38406: {'lr': 0.0004289952353487088, 'samples': 7373952, 'steps': 38405, 'loss/train': 1.2518749237060547} -08/30/2021 20:07:32 - INFO - __main__ - Step 38407: {'lr': 0.000428991530564942, 'samples': 7374144, 'steps': 38406, 'loss/train': 1.3863412141799927} -08/30/2021 20:07:33 - INFO - __main__ - Step 38408: {'lr': 0.00042898782570052453, 'samples': 7374336, 'steps': 38407, 'loss/train': 1.3660690784454346} -08/30/2021 20:07:33 - INFO - __main__ - Step 38409: {'lr': 0.0004289841207554578, 'samples': 7374528, 'steps': 38408, 'loss/train': 1.8012281656265259} -08/30/2021 20:07:34 - INFO - __main__ - Step 38410: {'lr': 0.00042898041572974363, 'samples': 7374720, 'steps': 38409, 'loss/train': 0.05124419555068016} -08/30/2021 20:07:35 - INFO - __main__ - Step 38411: {'lr': 0.0004289767106233836, 'samples': 7374912, 'steps': 38410, 'loss/train': 1.5511677265167236} -08/30/2021 20:07:35 - INFO - __main__ - Step 38412: {'lr': 0.0004289730054363795, 'samples': 7375104, 'steps': 38411, 'loss/train': 1.6404657363891602} -08/30/2021 20:07:36 - INFO - __main__ - Step 38413: {'lr': 0.00042896930016873293, 'samples': 7375296, 'steps': 38412, 'loss/train': 0.4600420296192169} -08/30/2021 20:07:36 - INFO - __main__ - Step 38414: {'lr': 0.0004289655948204455, 'samples': 7375488, 'steps': 38413, 'loss/train': 1.2763087749481201} -08/30/2021 20:07:38 - INFO - __main__ - Step 38415: {'lr': 0.00042896188939151893, 'samples': 7375680, 'steps': 38414, 'loss/train': 0.8128842115402222} -08/30/2021 20:07:38 - INFO - __main__ - Step 38416: {'lr': 0.00042895818388195497, 'samples': 7375872, 'steps': 38415, 'loss/train': 1.8555107116699219} -08/30/2021 20:07:38 - INFO - __main__ - Step 38417: {'lr': 0.00042895447829175516, 'samples': 7376064, 'steps': 38416, 'loss/train': 0.6345165967941284} -08/30/2021 20:07:39 - INFO - __main__ - Step 38418: {'lr': 0.00042895077262092117, 'samples': 7376256, 'steps': 38417, 'loss/train': 1.8651283979415894} -08/30/2021 20:07:39 - INFO - __main__ - Step 38419: {'lr': 0.00042894706686945485, 'samples': 7376448, 'steps': 38418, 'loss/train': 0.7478687763214111} -08/30/2021 20:07:39 - INFO - __main__ - Step 38420: {'lr': 0.00042894336103735766, 'samples': 7376640, 'steps': 38419, 'loss/train': 2.884406805038452} -08/30/2021 20:07:41 - INFO - __main__ - Step 38421: {'lr': 0.0004289396551246313, 'samples': 7376832, 'steps': 38420, 'loss/train': 1.53440260887146} -08/30/2021 20:07:42 - INFO - __main__ - Step 38422: {'lr': 0.0004289359491312776, 'samples': 7377024, 'steps': 38421, 'loss/train': 1.1233142614364624} -08/30/2021 20:07:42 - INFO - __main__ - Step 38423: {'lr': 0.00042893224305729806, 'samples': 7377216, 'steps': 38422, 'loss/train': 1.0973279476165771} -08/30/2021 20:07:43 - INFO - __main__ - Step 38424: {'lr': 0.0004289285369026944, 'samples': 7377408, 'steps': 38423, 'loss/train': 1.3954734802246094} -08/30/2021 20:07:43 - INFO - __main__ - Step 38425: {'lr': 0.00042892483066746836, 'samples': 7377600, 'steps': 38424, 'loss/train': 2.1326191425323486} -08/30/2021 20:07:44 - INFO - __main__ - Step 38426: {'lr': 0.0004289211243516216, 'samples': 7377792, 'steps': 38425, 'loss/train': 1.6857160329818726} -08/30/2021 20:07:45 - INFO - __main__ - Step 38427: {'lr': 0.0004289174179551556, 'samples': 7377984, 'steps': 38426, 'loss/train': 1.6702098846435547} -08/30/2021 20:07:45 - INFO - __main__ - Step 38428: {'lr': 0.0004289137114780722, 'samples': 7378176, 'steps': 38427, 'loss/train': 1.3359206914901733} -08/30/2021 20:07:46 - INFO - __main__ - Step 38429: {'lr': 0.00042891000492037315, 'samples': 7378368, 'steps': 38428, 'loss/train': 1.6277127265930176} -08/30/2021 20:07:46 - INFO - __main__ - Step 38430: {'lr': 0.00042890629828205997, 'samples': 7378560, 'steps': 38429, 'loss/train': 0.9746399521827698} -08/30/2021 20:07:47 - INFO - __main__ - Step 38431: {'lr': 0.0004289025915631343, 'samples': 7378752, 'steps': 38430, 'loss/train': 1.7930362224578857} -08/30/2021 20:07:48 - INFO - __main__ - Step 38432: {'lr': 0.00042889888476359793, 'samples': 7378944, 'steps': 38431, 'loss/train': 1.0633318424224854} -08/30/2021 20:07:48 - INFO - __main__ - Step 38433: {'lr': 0.0004288951778834525, 'samples': 7379136, 'steps': 38432, 'loss/train': 1.75481116771698} -08/30/2021 20:07:49 - INFO - __main__ - Step 38434: {'lr': 0.00042889147092269964, 'samples': 7379328, 'steps': 38433, 'loss/train': 1.6086457967758179} -08/30/2021 20:07:49 - INFO - __main__ - Step 38435: {'lr': 0.0004288877638813411, 'samples': 7379520, 'steps': 38434, 'loss/train': 1.5156124830245972} -08/30/2021 20:07:51 - INFO - __main__ - Step 38436: {'lr': 0.00042888405675937843, 'samples': 7379712, 'steps': 38435, 'loss/train': 1.480774998664856} -08/30/2021 20:07:51 - INFO - __main__ - Step 38437: {'lr': 0.00042888034955681337, 'samples': 7379904, 'steps': 38436, 'loss/train': 1.2685781717300415} -08/30/2021 20:07:52 - INFO - __main__ - Step 38438: {'lr': 0.0004288766422736476, 'samples': 7380096, 'steps': 38437, 'loss/train': 1.4384146928787231} -08/30/2021 20:07:52 - INFO - __main__ - Step 38439: {'lr': 0.00042887293490988276, 'samples': 7380288, 'steps': 38438, 'loss/train': 1.7205339670181274} -08/30/2021 20:07:52 - INFO - __main__ - Step 38440: {'lr': 0.00042886922746552056, 'samples': 7380480, 'steps': 38439, 'loss/train': 0.03151669725775719} -08/30/2021 20:07:53 - INFO - __main__ - Step 38441: {'lr': 0.0004288655199405626, 'samples': 7380672, 'steps': 38440, 'loss/train': 1.7208235263824463} -08/30/2021 20:07:54 - INFO - __main__ - Step 38442: {'lr': 0.00042886181233501067, 'samples': 7380864, 'steps': 38441, 'loss/train': 1.6233160495758057} -08/30/2021 20:07:55 - INFO - __main__ - Step 38443: {'lr': 0.00042885810464886635, 'samples': 7381056, 'steps': 38442, 'loss/train': 1.3776395320892334} -08/30/2021 20:07:55 - INFO - __main__ - Step 38444: {'lr': 0.0004288543968821312, 'samples': 7381248, 'steps': 38443, 'loss/train': 1.6801183223724365} -08/30/2021 20:07:55 - INFO - __main__ - Step 38445: {'lr': 0.00042885068903480717, 'samples': 7381440, 'steps': 38444, 'loss/train': 1.5177701711654663} -08/30/2021 20:07:56 - INFO - __main__ - Step 38446: {'lr': 0.00042884698110689574, 'samples': 7381632, 'steps': 38445, 'loss/train': 1.238015055656433} -08/30/2021 20:07:58 - INFO - __main__ - Step 38447: {'lr': 0.00042884327309839865, 'samples': 7381824, 'steps': 38446, 'loss/train': 0.98250412940979} -08/30/2021 20:07:58 - INFO - __main__ - Step 38448: {'lr': 0.0004288395650093174, 'samples': 7382016, 'steps': 38447, 'loss/train': 1.351719856262207} -08/30/2021 20:07:59 - INFO - __main__ - Step 38449: {'lr': 0.000428835856839654, 'samples': 7382208, 'steps': 38448, 'loss/train': 1.6364364624023438} -08/30/2021 20:07:59 - INFO - __main__ - Step 38450: {'lr': 0.0004288321485894098, 'samples': 7382400, 'steps': 38449, 'loss/train': 1.087575912475586} -08/30/2021 20:07:59 - INFO - __main__ - Step 38451: {'lr': 0.0004288284402585866, 'samples': 7382592, 'steps': 38450, 'loss/train': 1.4363609552383423} -08/30/2021 20:08:00 - INFO - __main__ - Step 38452: {'lr': 0.0004288247318471861, 'samples': 7382784, 'steps': 38451, 'loss/train': 1.2984539270401} -08/30/2021 20:08:01 - INFO - __main__ - Step 38453: {'lr': 0.0004288210233552099, 'samples': 7382976, 'steps': 38452, 'loss/train': 0.6166121959686279} -08/30/2021 20:08:02 - INFO - __main__ - Step 38454: {'lr': 0.00042881731478265975, 'samples': 7383168, 'steps': 38453, 'loss/train': 1.294426679611206} -08/30/2021 20:08:02 - INFO - __main__ - Step 38455: {'lr': 0.00042881360612953724, 'samples': 7383360, 'steps': 38454, 'loss/train': 1.5295624732971191} -08/30/2021 20:08:03 - INFO - __main__ - Step 38456: {'lr': 0.0004288098973958441, 'samples': 7383552, 'steps': 38455, 'loss/train': 0.06265326589345932} -08/30/2021 20:08:03 - INFO - __main__ - Step 38457: {'lr': 0.000428806188581582, 'samples': 7383744, 'steps': 38456, 'loss/train': 0.11087145656347275} -08/30/2021 20:08:04 - INFO - __main__ - Step 38458: {'lr': 0.00042880247968675255, 'samples': 7383936, 'steps': 38457, 'loss/train': 1.7792470455169678} -08/30/2021 20:08:05 - INFO - __main__ - Step 38459: {'lr': 0.00042879877071135746, 'samples': 7384128, 'steps': 38458, 'loss/train': 1.6664425134658813} -08/30/2021 20:08:05 - INFO - __main__ - Step 38460: {'lr': 0.0004287950616553984, 'samples': 7384320, 'steps': 38459, 'loss/train': 1.4453438520431519} -08/30/2021 20:08:05 - INFO - __main__ - Step 38461: {'lr': 0.0004287913525188771, 'samples': 7384512, 'steps': 38460, 'loss/train': 1.2469711303710938} -08/30/2021 20:08:06 - INFO - __main__ - Step 38462: {'lr': 0.0004287876433017951, 'samples': 7384704, 'steps': 38461, 'loss/train': 1.9227299690246582} -08/30/2021 20:08:07 - INFO - __main__ - Step 38463: {'lr': 0.0004287839340041542, 'samples': 7384896, 'steps': 38462, 'loss/train': 1.9891043901443481} -08/30/2021 20:08:08 - INFO - __main__ - Step 38464: {'lr': 0.000428780224625956, 'samples': 7385088, 'steps': 38463, 'loss/train': 1.535179853439331} -08/30/2021 20:08:08 - INFO - __main__ - Step 38465: {'lr': 0.00042877651516720215, 'samples': 7385280, 'steps': 38464, 'loss/train': 1.1087923049926758} -08/30/2021 20:08:08 - INFO - __main__ - Step 38466: {'lr': 0.0004287728056278944, 'samples': 7385472, 'steps': 38465, 'loss/train': 0.8257372379302979} -08/30/2021 20:08:09 - INFO - __main__ - Step 38467: {'lr': 0.00042876909600803444, 'samples': 7385664, 'steps': 38466, 'loss/train': 1.8143433332443237} -08/30/2021 20:08:10 - INFO - __main__ - Step 38468: {'lr': 0.00042876538630762386, 'samples': 7385856, 'steps': 38467, 'loss/train': 1.3907827138900757} -08/30/2021 20:08:11 - INFO - __main__ - Step 38469: {'lr': 0.00042876167652666433, 'samples': 7386048, 'steps': 38468, 'loss/train': 1.5649192333221436} -08/30/2021 20:08:11 - INFO - __main__ - Step 38470: {'lr': 0.0004287579666651575, 'samples': 7386240, 'steps': 38469, 'loss/train': 1.6606879234313965} -08/30/2021 20:08:12 - INFO - __main__ - Step 38471: {'lr': 0.00042875425672310506, 'samples': 7386432, 'steps': 38470, 'loss/train': 1.539514183998108} -08/30/2021 20:08:12 - INFO - __main__ - Step 38472: {'lr': 0.00042875054670050885, 'samples': 7386624, 'steps': 38471, 'loss/train': 1.4509732723236084} -08/30/2021 20:08:14 - INFO - __main__ - Step 38473: {'lr': 0.00042874683659737035, 'samples': 7386816, 'steps': 38472, 'loss/train': 1.0951043367385864} -08/30/2021 20:08:15 - INFO - __main__ - Step 38474: {'lr': 0.0004287431264136913, 'samples': 7387008, 'steps': 38473, 'loss/train': 1.0203770399093628} -08/30/2021 20:08:15 - INFO - __main__ - Step 38475: {'lr': 0.0004287394161494733, 'samples': 7387200, 'steps': 38474, 'loss/train': 1.8917231559753418} -08/30/2021 20:08:16 - INFO - __main__ - Step 38476: {'lr': 0.0004287357058047181, 'samples': 7387392, 'steps': 38475, 'loss/train': 2.1725013256073} -08/30/2021 20:08:16 - INFO - __main__ - Step 38477: {'lr': 0.00042873199537942733, 'samples': 7387584, 'steps': 38476, 'loss/train': 1.5604864358901978} -08/30/2021 20:08:16 - INFO - __main__ - Step 38478: {'lr': 0.0004287282848736027, 'samples': 7387776, 'steps': 38477, 'loss/train': 0.026956936344504356} -08/30/2021 20:08:18 - INFO - __main__ - Step 38479: {'lr': 0.00042872457428724586, 'samples': 7387968, 'steps': 38478, 'loss/train': 1.6910027265548706} -08/30/2021 20:08:18 - INFO - __main__ - Step 38480: {'lr': 0.00042872086362035844, 'samples': 7388160, 'steps': 38479, 'loss/train': 1.4944396018981934} -08/30/2021 20:08:18 - INFO - __main__ - Step 38481: {'lr': 0.00042871715287294223, 'samples': 7388352, 'steps': 38480, 'loss/train': 1.3934500217437744} -08/30/2021 20:08:19 - INFO - __main__ - Step 38482: {'lr': 0.00042871344204499886, 'samples': 7388544, 'steps': 38481, 'loss/train': 0.8657522201538086} -08/30/2021 20:08:19 - INFO - __main__ - Step 38483: {'lr': 0.0004287097311365299, 'samples': 7388736, 'steps': 38482, 'loss/train': 1.3216339349746704} -08/30/2021 20:08:21 - INFO - __main__ - Step 38484: {'lr': 0.00042870602014753707, 'samples': 7388928, 'steps': 38483, 'loss/train': 1.3031517267227173} -08/30/2021 20:08:21 - INFO - __main__ - Step 38485: {'lr': 0.0004287023090780221, 'samples': 7389120, 'steps': 38484, 'loss/train': 1.4127449989318848} -08/30/2021 20:08:21 - INFO - __main__ - Step 38486: {'lr': 0.0004286985979279866, 'samples': 7389312, 'steps': 38485, 'loss/train': 1.0331435203552246} -08/30/2021 20:08:22 - INFO - __main__ - Step 38487: {'lr': 0.0004286948866974323, 'samples': 7389504, 'steps': 38486, 'loss/train': 2.846611976623535} -08/30/2021 20:08:22 - INFO - __main__ - Step 38488: {'lr': 0.0004286911753863608, 'samples': 7389696, 'steps': 38487, 'loss/train': 1.4545589685440063} -08/30/2021 20:08:24 - INFO - __main__ - Step 38489: {'lr': 0.0004286874639947739, 'samples': 7389888, 'steps': 38488, 'loss/train': 0.8318132758140564} -08/30/2021 20:08:24 - INFO - __main__ - Step 38490: {'lr': 0.0004286837525226731, 'samples': 7390080, 'steps': 38489, 'loss/train': 1.4098542928695679} -08/30/2021 20:08:24 - INFO - __main__ - Step 38491: {'lr': 0.0004286800409700602, 'samples': 7390272, 'steps': 38490, 'loss/train': 1.7316874265670776} -08/30/2021 20:08:25 - INFO - __main__ - Step 38492: {'lr': 0.0004286763293369369, 'samples': 7390464, 'steps': 38491, 'loss/train': 1.665035367012024} -08/30/2021 20:08:25 - INFO - __main__ - Step 38493: {'lr': 0.00042867261762330466, 'samples': 7390656, 'steps': 38492, 'loss/train': 1.579277515411377} -08/30/2021 20:08:25 - INFO - __main__ - Step 38494: {'lr': 0.0004286689058291654, 'samples': 7390848, 'steps': 38493, 'loss/train': 1.2257510423660278} -08/30/2021 20:08:27 - INFO - __main__ - Step 38495: {'lr': 0.00042866519395452063, 'samples': 7391040, 'steps': 38494, 'loss/train': 1.256990671157837} -08/30/2021 20:08:27 - INFO - __main__ - Step 38496: {'lr': 0.00042866148199937216, 'samples': 7391232, 'steps': 38495, 'loss/train': 1.0256305932998657} -08/30/2021 20:08:28 - INFO - __main__ - Step 38497: {'lr': 0.00042865776996372146, 'samples': 7391424, 'steps': 38496, 'loss/train': 0.6763159036636353} -08/30/2021 20:08:28 - INFO - __main__ - Step 38498: {'lr': 0.00042865405784757037, 'samples': 7391616, 'steps': 38497, 'loss/train': 1.5458842515945435} -08/30/2021 20:08:29 - INFO - __main__ - Step 38499: {'lr': 0.0004286503456509206, 'samples': 7391808, 'steps': 38498, 'loss/train': 1.0726215839385986} -08/30/2021 20:08:30 - INFO - __main__ - Step 38500: {'lr': 0.0004286466333737737, 'samples': 7392000, 'steps': 38499, 'loss/train': 1.5382964611053467} -08/30/2021 20:08:30 - INFO - __main__ - Step 38501: {'lr': 0.00042864292101613133, 'samples': 7392192, 'steps': 38500, 'loss/train': 1.2885104417800903} -08/30/2021 20:08:31 - INFO - __main__ - Step 38502: {'lr': 0.0004286392085779953, 'samples': 7392384, 'steps': 38501, 'loss/train': 1.8463127613067627} -08/30/2021 20:08:31 - INFO - __main__ - Step 38503: {'lr': 0.00042863549605936716, 'samples': 7392576, 'steps': 38502, 'loss/train': 0.9789907932281494} -08/30/2021 20:08:31 - INFO - __main__ - Step 38504: {'lr': 0.00042863178346024856, 'samples': 7392768, 'steps': 38503, 'loss/train': 1.4179446697235107} -08/30/2021 20:08:33 - INFO - __main__ - Step 38505: {'lr': 0.00042862807078064124, 'samples': 7392960, 'steps': 38504, 'loss/train': 0.829459547996521} -08/30/2021 20:08:34 - INFO - __main__ - Step 38506: {'lr': 0.00042862435802054703, 'samples': 7393152, 'steps': 38505, 'loss/train': 0.11938699334859848} -08/30/2021 20:08:34 - INFO - __main__ - Step 38507: {'lr': 0.00042862064517996723, 'samples': 7393344, 'steps': 38506, 'loss/train': 1.2859399318695068} -08/30/2021 20:08:34 - INFO - __main__ - Step 38508: {'lr': 0.00042861693225890385, 'samples': 7393536, 'steps': 38507, 'loss/train': 1.0238215923309326} -08/30/2021 20:08:35 - INFO - __main__ - Step 38509: {'lr': 0.0004286132192573584, 'samples': 7393728, 'steps': 38508, 'loss/train': 2.307140827178955} -08/30/2021 20:08:36 - INFO - __main__ - Step 38510: {'lr': 0.0004286095061753326, 'samples': 7393920, 'steps': 38509, 'loss/train': 1.4286121129989624} -08/30/2021 20:08:37 - INFO - __main__ - Step 38511: {'lr': 0.0004286057930128281, 'samples': 7394112, 'steps': 38510, 'loss/train': 1.5474827289581299} -08/30/2021 20:08:37 - INFO - __main__ - Step 38512: {'lr': 0.00042860207976984664, 'samples': 7394304, 'steps': 38511, 'loss/train': 0.9539635181427002} -08/30/2021 20:08:38 - INFO - __main__ - Step 38513: {'lr': 0.00042859836644638976, 'samples': 7394496, 'steps': 38512, 'loss/train': 0.13185752928256989} -08/30/2021 20:08:38 - INFO - __main__ - Step 38514: {'lr': 0.00042859465304245927, 'samples': 7394688, 'steps': 38513, 'loss/train': 1.589725375175476} -08/30/2021 20:08:39 - INFO - __main__ - Step 38515: {'lr': 0.00042859093955805675, 'samples': 7394880, 'steps': 38514, 'loss/train': 1.4439661502838135} -08/30/2021 20:08:40 - INFO - __main__ - Step 38516: {'lr': 0.0004285872259931839, 'samples': 7395072, 'steps': 38515, 'loss/train': 0.9839127063751221} -08/30/2021 20:08:40 - INFO - __main__ - Step 38517: {'lr': 0.00042858351234784244, 'samples': 7395264, 'steps': 38516, 'loss/train': 1.1193145513534546} -08/30/2021 20:08:41 - INFO - __main__ - Step 38518: {'lr': 0.000428579798622034, 'samples': 7395456, 'steps': 38517, 'loss/train': 1.6708089113235474} -08/30/2021 20:08:41 - INFO - __main__ - Step 38519: {'lr': 0.0004285760848157603, 'samples': 7395648, 'steps': 38518, 'loss/train': 1.71746027469635} -08/30/2021 20:08:42 - INFO - __main__ - Step 38520: {'lr': 0.00042857237092902285, 'samples': 7395840, 'steps': 38519, 'loss/train': 1.389754056930542} -08/30/2021 20:08:43 - INFO - __main__ - Step 38521: {'lr': 0.0004285686569618235, 'samples': 7396032, 'steps': 38520, 'loss/train': 1.28855299949646} -08/30/2021 20:08:43 - INFO - __main__ - Step 38522: {'lr': 0.0004285649429141639, 'samples': 7396224, 'steps': 38521, 'loss/train': 1.0698468685150146} -08/30/2021 20:08:43 - INFO - __main__ - Step 38523: {'lr': 0.00042856122878604566, 'samples': 7396416, 'steps': 38522, 'loss/train': 1.6809558868408203} -08/30/2021 20:08:44 - INFO - __main__ - Step 38524: {'lr': 0.0004285575145774705, 'samples': 7396608, 'steps': 38523, 'loss/train': 1.2037886381149292} -08/30/2021 20:08:46 - INFO - __main__ - Step 38525: {'lr': 0.00042855380028844004, 'samples': 7396800, 'steps': 38524, 'loss/train': 1.1967549324035645} -08/30/2021 20:08:46 - INFO - __main__ - Step 38526: {'lr': 0.00042855008591895607, 'samples': 7396992, 'steps': 38525, 'loss/train': 1.2843049764633179} -08/30/2021 20:08:47 - INFO - __main__ - Step 38527: {'lr': 0.00042854637146902007, 'samples': 7397184, 'steps': 38526, 'loss/train': 1.729673981666565} -08/30/2021 20:08:47 - INFO - __main__ - Step 38528: {'lr': 0.00042854265693863394, 'samples': 7397376, 'steps': 38527, 'loss/train': 1.2778013944625854} -08/30/2021 20:08:47 - INFO - __main__ - Step 38529: {'lr': 0.00042853894232779924, 'samples': 7397568, 'steps': 38528, 'loss/train': 1.6214121580123901} -08/30/2021 20:08:48 - INFO - __main__ - Step 38530: {'lr': 0.00042853522763651767, 'samples': 7397760, 'steps': 38529, 'loss/train': 1.3370741605758667} -08/30/2021 20:08:49 - INFO - __main__ - Step 38531: {'lr': 0.00042853151286479074, 'samples': 7397952, 'steps': 38530, 'loss/train': 1.225573182106018} -08/30/2021 20:08:50 - INFO - __main__ - Step 38532: {'lr': 0.0004285277980126204, 'samples': 7398144, 'steps': 38531, 'loss/train': 1.3735125064849854} -08/30/2021 20:08:50 - INFO - __main__ - Step 38533: {'lr': 0.0004285240830800081, 'samples': 7398336, 'steps': 38532, 'loss/train': 1.0428873300552368} -08/30/2021 20:08:51 - INFO - __main__ - Step 38534: {'lr': 0.00042852036806695565, 'samples': 7398528, 'steps': 38533, 'loss/train': 1.1194499731063843} -08/30/2021 20:08:51 - INFO - __main__ - Step 38535: {'lr': 0.0004285166529734647, 'samples': 7398720, 'steps': 38534, 'loss/train': 0.12767842411994934} -08/30/2021 20:08:53 - INFO - __main__ - Step 38536: {'lr': 0.0004285129377995369, 'samples': 7398912, 'steps': 38535, 'loss/train': 0.9758719801902771} -08/30/2021 20:08:53 - INFO - __main__ - Step 38537: {'lr': 0.0004285092225451739, 'samples': 7399104, 'steps': 38536, 'loss/train': 0.6560772061347961} -08/30/2021 20:08:53 - INFO - __main__ - Step 38538: {'lr': 0.0004285055072103774, 'samples': 7399296, 'steps': 38537, 'loss/train': 0.06396327912807465} -08/30/2021 20:08:54 - INFO - __main__ - Step 38539: {'lr': 0.00042850179179514906, 'samples': 7399488, 'steps': 38538, 'loss/train': 0.8640857338905334} -08/30/2021 20:08:54 - INFO - __main__ - Step 38540: {'lr': 0.00042849807629949057, 'samples': 7399680, 'steps': 38539, 'loss/train': 1.4904595613479614} -08/30/2021 20:08:56 - INFO - __main__ - Step 38541: {'lr': 0.0004284943607234036, 'samples': 7399872, 'steps': 38540, 'loss/train': 0.756790041923523} -08/30/2021 20:08:56 - INFO - __main__ - Step 38542: {'lr': 0.00042849064506688984, 'samples': 7400064, 'steps': 38541, 'loss/train': 1.6215373277664185} -08/30/2021 20:08:56 - INFO - __main__ - Step 38543: {'lr': 0.00042848692932995094, 'samples': 7400256, 'steps': 38542, 'loss/train': 1.2473387718200684} -08/30/2021 20:08:57 - INFO - __main__ - Step 38544: {'lr': 0.0004284832135125886, 'samples': 7400448, 'steps': 38543, 'loss/train': 1.1544280052185059} -08/30/2021 20:08:57 - INFO - __main__ - Step 38545: {'lr': 0.0004284794976148044, 'samples': 7400640, 'steps': 38544, 'loss/train': 0.5333156585693359} -08/30/2021 20:08:59 - INFO - __main__ - Step 38546: {'lr': 0.00042847578163660016, 'samples': 7400832, 'steps': 38545, 'loss/train': 1.554076075553894} -08/30/2021 20:08:59 - INFO - __main__ - Step 38547: {'lr': 0.0004284720655779775, 'samples': 7401024, 'steps': 38546, 'loss/train': 1.4622931480407715} -08/30/2021 20:09:00 - INFO - __main__ - Step 38548: {'lr': 0.00042846834943893806, 'samples': 7401216, 'steps': 38547, 'loss/train': 1.4342594146728516} -08/30/2021 20:09:00 - INFO - __main__ - Step 38549: {'lr': 0.0004284646332194836, 'samples': 7401408, 'steps': 38548, 'loss/train': 0.026467587798833847} -08/30/2021 20:09:00 - INFO - __main__ - Step 38550: {'lr': 0.0004284609169196156, 'samples': 7401600, 'steps': 38549, 'loss/train': 4.960337162017822} -08/30/2021 20:09:01 - INFO - __main__ - Step 38551: {'lr': 0.000428457200539336, 'samples': 7401792, 'steps': 38550, 'loss/train': 1.6371339559555054} -08/30/2021 20:09:01 - INFO - __main__ - Step 38552: {'lr': 0.0004284534840786463, 'samples': 7401984, 'steps': 38551, 'loss/train': 2.3429114818573} -08/30/2021 20:09:03 - INFO - __main__ - Step 38553: {'lr': 0.0004284497675375482, 'samples': 7402176, 'steps': 38552, 'loss/train': 1.4956729412078857} -08/30/2021 20:09:03 - INFO - __main__ - Step 38554: {'lr': 0.0004284460509160433, 'samples': 7402368, 'steps': 38553, 'loss/train': 1.6276262998580933} -08/30/2021 20:09:03 - INFO - __main__ - Step 38555: {'lr': 0.0004284423342141335, 'samples': 7402560, 'steps': 38554, 'loss/train': 1.6214299201965332} -08/30/2021 20:09:04 - INFO - __main__ - Step 38556: {'lr': 0.0004284386174318202, 'samples': 7402752, 'steps': 38555, 'loss/train': 1.9098286628723145} -08/30/2021 20:09:04 - INFO - __main__ - Step 38557: {'lr': 0.00042843490056910534, 'samples': 7402944, 'steps': 38556, 'loss/train': 1.6006876230239868} -08/30/2021 20:09:06 - INFO - __main__ - Step 38558: {'lr': 0.00042843118362599045, 'samples': 7403136, 'steps': 38557, 'loss/train': 1.0018879175186157} -08/30/2021 20:09:06 - INFO - __main__ - Step 38559: {'lr': 0.0004284274666024772, 'samples': 7403328, 'steps': 38558, 'loss/train': 0.9748728275299072} -08/30/2021 20:09:06 - INFO - __main__ - Step 38560: {'lr': 0.0004284237494985672, 'samples': 7403520, 'steps': 38559, 'loss/train': 1.503739356994629} -08/30/2021 20:09:07 - INFO - __main__ - Step 38561: {'lr': 0.0004284200323142623, 'samples': 7403712, 'steps': 38560, 'loss/train': 1.3755677938461304} -08/30/2021 20:09:07 - INFO - __main__ - Step 38562: {'lr': 0.0004284163150495641, 'samples': 7403904, 'steps': 38561, 'loss/train': 1.1172332763671875} -08/30/2021 20:09:08 - INFO - __main__ - Step 38563: {'lr': 0.00042841259770447427, 'samples': 7404096, 'steps': 38562, 'loss/train': 1.1763057708740234} -08/30/2021 20:09:09 - INFO - __main__ - Step 38564: {'lr': 0.00042840888027899436, 'samples': 7404288, 'steps': 38563, 'loss/train': 0.8469580411911011} -08/30/2021 20:09:09 - INFO - __main__ - Step 38565: {'lr': 0.0004284051627731263, 'samples': 7404480, 'steps': 38564, 'loss/train': 1.3201395273208618} -08/30/2021 20:09:10 - INFO - __main__ - Step 38566: {'lr': 0.0004284014451868716, 'samples': 7404672, 'steps': 38565, 'loss/train': 0.761022686958313} -08/30/2021 20:09:10 - INFO - __main__ - Step 38567: {'lr': 0.0004283977275202319, 'samples': 7404864, 'steps': 38566, 'loss/train': 1.4326833486557007} -08/30/2021 20:09:12 - INFO - __main__ - Step 38568: {'lr': 0.00042839400977320895, 'samples': 7405056, 'steps': 38567, 'loss/train': 0.9958623647689819} -08/30/2021 20:09:13 - INFO - __main__ - Step 38569: {'lr': 0.00042839029194580446, 'samples': 7405248, 'steps': 38568, 'loss/train': 1.4541212320327759} -08/30/2021 20:09:13 - INFO - __main__ - Step 38570: {'lr': 0.0004283865740380201, 'samples': 7405440, 'steps': 38569, 'loss/train': 1.0612595081329346} -08/30/2021 20:09:13 - INFO - __main__ - Step 38571: {'lr': 0.0004283828560498574, 'samples': 7405632, 'steps': 38570, 'loss/train': 4.319080829620361} -08/30/2021 20:09:14 - INFO - __main__ - Step 38572: {'lr': 0.0004283791379813181, 'samples': 7405824, 'steps': 38571, 'loss/train': 4.791377544403076} -08/30/2021 20:09:14 - INFO - __main__ - Step 38573: {'lr': 0.000428375419832404, 'samples': 7406016, 'steps': 38572, 'loss/train': 2.282837152481079} -08/30/2021 20:09:16 - INFO - __main__ - Step 38574: {'lr': 0.0004283717016031167, 'samples': 7406208, 'steps': 38573, 'loss/train': 2.021578788757324} -08/30/2021 20:09:16 - INFO - __main__ - Step 38575: {'lr': 0.0004283679832934578, 'samples': 7406400, 'steps': 38574, 'loss/train': 1.5614449977874756} -08/30/2021 20:09:16 - INFO - __main__ - Step 38576: {'lr': 0.0004283642649034291, 'samples': 7406592, 'steps': 38575, 'loss/train': 1.622318148612976} -08/30/2021 20:09:17 - INFO - __main__ - Step 38577: {'lr': 0.00042836054643303226, 'samples': 7406784, 'steps': 38576, 'loss/train': 0.8903332948684692} -08/30/2021 20:09:17 - INFO - __main__ - Step 38578: {'lr': 0.0004283568278822688, 'samples': 7406976, 'steps': 38577, 'loss/train': 1.5244050025939941} -08/30/2021 20:09:19 - INFO - __main__ - Step 38579: {'lr': 0.0004283531092511405, 'samples': 7407168, 'steps': 38578, 'loss/train': 2.0325591564178467} -08/30/2021 20:09:19 - INFO - __main__ - Step 38580: {'lr': 0.0004283493905396491, 'samples': 7407360, 'steps': 38579, 'loss/train': 1.0972278118133545} -08/30/2021 20:09:20 - INFO - __main__ - Step 38581: {'lr': 0.00042834567174779623, 'samples': 7407552, 'steps': 38580, 'loss/train': 1.1752090454101562} -08/30/2021 20:09:20 - INFO - __main__ - Step 38582: {'lr': 0.00042834195287558356, 'samples': 7407744, 'steps': 38581, 'loss/train': 1.4278823137283325} -08/30/2021 20:09:20 - INFO - __main__ - Step 38583: {'lr': 0.00042833823392301264, 'samples': 7407936, 'steps': 38582, 'loss/train': 1.79173743724823} -08/30/2021 20:09:23 - INFO - __main__ - Step 38584: {'lr': 0.00042833451489008537, 'samples': 7408128, 'steps': 38583, 'loss/train': 0.21683377027511597} -08/30/2021 20:09:23 - INFO - __main__ - Step 38585: {'lr': 0.00042833079577680327, 'samples': 7408320, 'steps': 38584, 'loss/train': 1.5409005880355835} -08/30/2021 20:09:24 - INFO - __main__ - Step 38586: {'lr': 0.0004283270765831682, 'samples': 7408512, 'steps': 38585, 'loss/train': 1.4707132577896118} -08/30/2021 20:09:24 - INFO - __main__ - Step 38587: {'lr': 0.00042832335730918147, 'samples': 7408704, 'steps': 38586, 'loss/train': 0.1335688829421997} -08/30/2021 20:09:24 - INFO - __main__ - Step 38588: {'lr': 0.0004283196379548451, 'samples': 7408896, 'steps': 38587, 'loss/train': 0.10015653073787689} -08/30/2021 20:09:25 - INFO - __main__ - Step 38589: {'lr': 0.0004283159185201607, 'samples': 7409088, 'steps': 38588, 'loss/train': 1.6177349090576172} -08/30/2021 20:09:26 - INFO - __main__ - Step 38590: {'lr': 0.00042831219900512984, 'samples': 7409280, 'steps': 38589, 'loss/train': 0.554823637008667} -08/30/2021 20:09:27 - INFO - __main__ - Step 38591: {'lr': 0.0004283084794097543, 'samples': 7409472, 'steps': 38590, 'loss/train': 2.556117296218872} -08/30/2021 20:09:27 - INFO - __main__ - Step 38592: {'lr': 0.00042830475973403573, 'samples': 7409664, 'steps': 38591, 'loss/train': 1.9750686883926392} -08/30/2021 20:09:28 - INFO - __main__ - Step 38593: {'lr': 0.0004283010399779757, 'samples': 7409856, 'steps': 38592, 'loss/train': 2.290078639984131} -08/30/2021 20:09:28 - INFO - __main__ - Step 38594: {'lr': 0.000428297320141576, 'samples': 7410048, 'steps': 38593, 'loss/train': 1.5426976680755615} -08/30/2021 20:09:29 - INFO - __main__ - Step 38595: {'lr': 0.0004282936002248383, 'samples': 7410240, 'steps': 38594, 'loss/train': 1.6319833993911743} -08/30/2021 20:09:30 - INFO - __main__ - Step 38596: {'lr': 0.00042828988022776426, 'samples': 7410432, 'steps': 38595, 'loss/train': 1.6357815265655518} -08/30/2021 20:09:30 - INFO - __main__ - Step 38597: {'lr': 0.00042828616015035554, 'samples': 7410624, 'steps': 38596, 'loss/train': 1.467668890953064} -08/30/2021 20:09:31 - INFO - __main__ - Step 38598: {'lr': 0.00042828243999261384, 'samples': 7410816, 'steps': 38597, 'loss/train': 1.3639193773269653} -08/30/2021 20:09:31 - INFO - __main__ - Step 38599: {'lr': 0.0004282787197545408, 'samples': 7411008, 'steps': 38598, 'loss/train': 1.701872706413269} -08/30/2021 20:09:33 - INFO - __main__ - Step 38600: {'lr': 0.00042827499943613815, 'samples': 7411200, 'steps': 38599, 'loss/train': 1.4856274127960205} -08/30/2021 20:09:33 - INFO - __main__ - Step 38601: {'lr': 0.00042827127903740747, 'samples': 7411392, 'steps': 38600, 'loss/train': 2.1299808025360107} -08/30/2021 20:09:34 - INFO - __main__ - Step 38602: {'lr': 0.00042826755855835053, 'samples': 7411584, 'steps': 38601, 'loss/train': 1.2858208417892456} -08/30/2021 20:09:34 - INFO - __main__ - Step 38603: {'lr': 0.00042826383799896906, 'samples': 7411776, 'steps': 38602, 'loss/train': 1.8762195110321045} -08/30/2021 20:09:35 - INFO - __main__ - Step 38604: {'lr': 0.0004282601173592646, 'samples': 7411968, 'steps': 38603, 'loss/train': 1.772971510887146} -08/30/2021 20:09:35 - INFO - __main__ - Step 38605: {'lr': 0.0004282563966392389, 'samples': 7412160, 'steps': 38604, 'loss/train': 0.21396401524543762} -08/30/2021 20:09:37 - INFO - __main__ - Step 38606: {'lr': 0.00042825267583889354, 'samples': 7412352, 'steps': 38605, 'loss/train': 0.1161898598074913} -08/30/2021 20:09:38 - INFO - __main__ - Step 38607: {'lr': 0.00042824895495823033, 'samples': 7412544, 'steps': 38606, 'loss/train': 1.6667474508285522} -08/30/2021 20:09:38 - INFO - __main__ - Step 38608: {'lr': 0.0004282452339972509, 'samples': 7412736, 'steps': 38607, 'loss/train': 2.1116271018981934} -08/30/2021 20:09:38 - INFO - __main__ - Step 38609: {'lr': 0.00042824151295595695, 'samples': 7412928, 'steps': 38608, 'loss/train': 1.9374371767044067} -08/30/2021 20:09:39 - INFO - __main__ - Step 38610: {'lr': 0.0004282377918343501, 'samples': 7413120, 'steps': 38609, 'loss/train': 0.6436307430267334} -08/30/2021 20:09:39 - INFO - __main__ - Step 38611: {'lr': 0.00042823407063243197, 'samples': 7413312, 'steps': 38610, 'loss/train': 0.5573675036430359} -08/30/2021 20:09:41 - INFO - __main__ - Step 38612: {'lr': 0.0004282303493502044, 'samples': 7413504, 'steps': 38611, 'loss/train': 1.6397336721420288} -08/30/2021 20:09:41 - INFO - __main__ - Step 38613: {'lr': 0.000428226627987669, 'samples': 7413696, 'steps': 38612, 'loss/train': 1.955654501914978} -08/30/2021 20:09:41 - INFO - __main__ - Step 38614: {'lr': 0.0004282229065448273, 'samples': 7413888, 'steps': 38613, 'loss/train': 1.315771460533142} -08/30/2021 20:09:42 - INFO - __main__ - Step 38615: {'lr': 0.0004282191850216812, 'samples': 7414080, 'steps': 38614, 'loss/train': 1.478628396987915} -08/30/2021 20:09:42 - INFO - __main__ - Step 38616: {'lr': 0.00042821546341823236, 'samples': 7414272, 'steps': 38615, 'loss/train': 1.2186205387115479} -08/30/2021 20:09:44 - INFO - __main__ - Step 38617: {'lr': 0.0004282117417344823, 'samples': 7414464, 'steps': 38616, 'loss/train': 2.0446653366088867} -08/30/2021 20:09:44 - INFO - __main__ - Step 38618: {'lr': 0.00042820801997043277, 'samples': 7414656, 'steps': 38617, 'loss/train': 1.4565842151641846} -08/30/2021 20:09:45 - INFO - __main__ - Step 38619: {'lr': 0.0004282042981260855, 'samples': 7414848, 'steps': 38618, 'loss/train': 1.7942994832992554} -08/30/2021 20:09:45 - INFO - __main__ - Step 38620: {'lr': 0.00042820057620144214, 'samples': 7415040, 'steps': 38619, 'loss/train': 1.426952838897705} -08/30/2021 20:09:45 - INFO - __main__ - Step 38621: {'lr': 0.00042819685419650427, 'samples': 7415232, 'steps': 38620, 'loss/train': 2.0606207847595215} -08/30/2021 20:09:47 - INFO - __main__ - Step 38622: {'lr': 0.0004281931321112737, 'samples': 7415424, 'steps': 38621, 'loss/train': 1.652417778968811} -08/30/2021 20:09:47 - INFO - __main__ - Step 38623: {'lr': 0.0004281894099457521, 'samples': 7415616, 'steps': 38622, 'loss/train': 0.8534078598022461} -08/30/2021 20:09:48 - INFO - __main__ - Step 38624: {'lr': 0.00042818568769994103, 'samples': 7415808, 'steps': 38623, 'loss/train': 1.6389437913894653} -08/30/2021 20:09:48 - INFO - __main__ - Step 38625: {'lr': 0.00042818196537384225, 'samples': 7416000, 'steps': 38624, 'loss/train': 1.456589698791504} -08/30/2021 20:09:48 - INFO - __main__ - Step 38626: {'lr': 0.0004281782429674574, 'samples': 7416192, 'steps': 38625, 'loss/train': 1.4333062171936035} -08/30/2021 20:09:50 - INFO - __main__ - Step 38627: {'lr': 0.0004281745204807882, 'samples': 7416384, 'steps': 38626, 'loss/train': 0.43587514758110046} -08/30/2021 20:09:50 - INFO - __main__ - Step 38628: {'lr': 0.00042817079791383636, 'samples': 7416576, 'steps': 38627, 'loss/train': 2.1891889572143555} -08/30/2021 20:09:51 - INFO - __main__ - Step 38629: {'lr': 0.00042816707526660346, 'samples': 7416768, 'steps': 38628, 'loss/train': 1.2977513074874878} -08/30/2021 20:09:51 - INFO - __main__ - Step 38630: {'lr': 0.00042816335253909125, 'samples': 7416960, 'steps': 38629, 'loss/train': 1.475739598274231} -08/30/2021 20:09:51 - INFO - __main__ - Step 38631: {'lr': 0.00042815962973130134, 'samples': 7417152, 'steps': 38630, 'loss/train': 1.857330083847046} -08/30/2021 20:09:53 - INFO - __main__ - Step 38632: {'lr': 0.00042815590684323554, 'samples': 7417344, 'steps': 38631, 'loss/train': 1.4106769561767578} -08/30/2021 20:09:53 - INFO - __main__ - Step 38633: {'lr': 0.00042815218387489535, 'samples': 7417536, 'steps': 38632, 'loss/train': 1.4453449249267578} -08/30/2021 20:09:54 - INFO - __main__ - Step 38634: {'lr': 0.00042814846082628256, 'samples': 7417728, 'steps': 38633, 'loss/train': 1.7522774934768677} -08/30/2021 20:09:54 - INFO - __main__ - Step 38635: {'lr': 0.0004281447376973988, 'samples': 7417920, 'steps': 38634, 'loss/train': 1.7621123790740967} -08/30/2021 20:09:54 - INFO - __main__ - Step 38636: {'lr': 0.00042814101448824583, 'samples': 7418112, 'steps': 38635, 'loss/train': 1.2906841039657593} -08/30/2021 20:09:56 - INFO - __main__ - Step 38637: {'lr': 0.0004281372911988253, 'samples': 7418304, 'steps': 38636, 'loss/train': 0.8466001152992249} -08/30/2021 20:09:57 - INFO - __main__ - Step 38638: {'lr': 0.0004281335678291387, 'samples': 7418496, 'steps': 38637, 'loss/train': 1.6220788955688477} -08/30/2021 20:09:57 - INFO - __main__ - Step 38639: {'lr': 0.000428129844379188, 'samples': 7418688, 'steps': 38638, 'loss/train': 1.6182951927185059} -08/30/2021 20:09:58 - INFO - __main__ - Step 38640: {'lr': 0.0004281261208489747, 'samples': 7418880, 'steps': 38639, 'loss/train': 1.4365603923797607} -08/30/2021 20:09:58 - INFO - __main__ - Step 38641: {'lr': 0.0004281223972385004, 'samples': 7419072, 'steps': 38640, 'loss/train': 1.4633879661560059} -08/30/2021 20:09:58 - INFO - __main__ - Step 38642: {'lr': 0.00042811867354776705, 'samples': 7419264, 'steps': 38641, 'loss/train': 1.6247738599777222} -08/30/2021 20:10:00 - INFO - __main__ - Step 38643: {'lr': 0.0004281149497767761, 'samples': 7419456, 'steps': 38642, 'loss/train': 0.5863242745399475} -08/30/2021 20:10:01 - INFO - __main__ - Step 38644: {'lr': 0.00042811122592552943, 'samples': 7419648, 'steps': 38643, 'loss/train': 1.9961851835250854} -08/30/2021 20:10:01 - INFO - __main__ - Step 38645: {'lr': 0.0004281075019940285, 'samples': 7419840, 'steps': 38644, 'loss/train': 1.3115507364273071} -08/30/2021 20:10:01 - INFO - __main__ - Step 38646: {'lr': 0.00042810377798227506, 'samples': 7420032, 'steps': 38645, 'loss/train': 1.6012402772903442} -08/30/2021 20:10:02 - INFO - __main__ - Step 38647: {'lr': 0.00042810005389027077, 'samples': 7420224, 'steps': 38646, 'loss/train': 1.3315033912658691} -08/30/2021 20:10:03 - INFO - __main__ - Step 38648: {'lr': 0.0004280963297180174, 'samples': 7420416, 'steps': 38647, 'loss/train': 1.3940638303756714} -08/30/2021 20:10:04 - INFO - __main__ - Step 38649: {'lr': 0.0004280926054655165, 'samples': 7420608, 'steps': 38648, 'loss/train': 1.7996569871902466} -08/30/2021 20:10:04 - INFO - __main__ - Step 38650: {'lr': 0.00042808888113277, 'samples': 7420800, 'steps': 38649, 'loss/train': 1.0887048244476318} -08/30/2021 20:10:04 - INFO - __main__ - Step 38651: {'lr': 0.0004280851567197792, 'samples': 7420992, 'steps': 38650, 'loss/train': 1.5012034177780151} -08/30/2021 20:10:05 - INFO - __main__ - Step 38652: {'lr': 0.0004280814322265461, 'samples': 7421184, 'steps': 38651, 'loss/train': 1.7306108474731445} -08/30/2021 20:10:06 - INFO - __main__ - Step 38653: {'lr': 0.00042807770765307217, 'samples': 7421376, 'steps': 38652, 'loss/train': 1.6279971599578857} -08/30/2021 20:10:07 - INFO - __main__ - Step 38654: {'lr': 0.00042807398299935927, 'samples': 7421568, 'steps': 38653, 'loss/train': 1.1435880661010742} -08/30/2021 20:10:07 - INFO - __main__ - Step 38655: {'lr': 0.0004280702582654089, 'samples': 7421760, 'steps': 38654, 'loss/train': 1.231977939605713} -08/30/2021 20:10:08 - INFO - __main__ - Step 38656: {'lr': 0.00042806653345122287, 'samples': 7421952, 'steps': 38655, 'loss/train': 1.288036823272705} -08/30/2021 20:10:08 - INFO - __main__ - Step 38657: {'lr': 0.0004280628085568028, 'samples': 7422144, 'steps': 38656, 'loss/train': 0.7506770491600037} -08/30/2021 20:10:09 - INFO - __main__ - Step 38658: {'lr': 0.0004280590835821503, 'samples': 7422336, 'steps': 38657, 'loss/train': 0.6064561605453491} -08/30/2021 20:10:10 - INFO - __main__ - Step 38659: {'lr': 0.0004280553585272672, 'samples': 7422528, 'steps': 38658, 'loss/train': 1.281550407409668} -08/30/2021 20:10:10 - INFO - __main__ - Step 38660: {'lr': 0.0004280516333921551, 'samples': 7422720, 'steps': 38659, 'loss/train': 1.726662039756775} -08/30/2021 20:10:11 - INFO - __main__ - Step 38661: {'lr': 0.00042804790817681574, 'samples': 7422912, 'steps': 38660, 'loss/train': 1.4874367713928223} -08/30/2021 20:10:11 - INFO - __main__ - Step 38662: {'lr': 0.0004280441828812506, 'samples': 7423104, 'steps': 38661, 'loss/train': 1.0482029914855957} -08/30/2021 20:10:11 - INFO - __main__ - Step 38663: {'lr': 0.0004280404575054616, 'samples': 7423296, 'steps': 38662, 'loss/train': 1.4116946458816528} -08/30/2021 20:10:13 - INFO - __main__ - Step 38664: {'lr': 0.00042803673204945027, 'samples': 7423488, 'steps': 38663, 'loss/train': 2.0071163177490234} -08/30/2021 20:10:13 - INFO - __main__ - Step 38665: {'lr': 0.0004280330065132184, 'samples': 7423680, 'steps': 38664, 'loss/train': 1.448816180229187} -08/30/2021 20:10:14 - INFO - __main__ - Step 38666: {'lr': 0.0004280292808967675, 'samples': 7423872, 'steps': 38665, 'loss/train': 0.9995388388633728} -08/30/2021 20:10:14 - INFO - __main__ - Step 38667: {'lr': 0.00042802555520009945, 'samples': 7424064, 'steps': 38666, 'loss/train': 1.0025697946548462} -08/30/2021 20:10:14 - INFO - __main__ - Step 38668: {'lr': 0.00042802182942321576, 'samples': 7424256, 'steps': 38667, 'loss/train': 1.261796236038208} -08/30/2021 20:10:16 - INFO - __main__ - Step 38669: {'lr': 0.0004280181035661182, 'samples': 7424448, 'steps': 38668, 'loss/train': 2.285823106765747} -08/30/2021 20:10:16 - INFO - __main__ - Step 38670: {'lr': 0.0004280143776288085, 'samples': 7424640, 'steps': 38669, 'loss/train': 1.179396152496338} -08/30/2021 20:10:17 - INFO - __main__ - Step 38671: {'lr': 0.00042801065161128814, 'samples': 7424832, 'steps': 38670, 'loss/train': 1.3689016103744507} -08/30/2021 20:10:17 - INFO - __main__ - Step 38672: {'lr': 0.000428006925513559, 'samples': 7425024, 'steps': 38671, 'loss/train': 1.0872362852096558} -08/30/2021 20:10:17 - INFO - __main__ - Step 38673: {'lr': 0.0004280031993356227, 'samples': 7425216, 'steps': 38672, 'loss/train': 1.3017916679382324} -08/30/2021 20:10:19 - INFO - __main__ - Step 38674: {'lr': 0.00042799947307748087, 'samples': 7425408, 'steps': 38673, 'loss/train': 1.8740603923797607} -08/30/2021 20:10:20 - INFO - __main__ - Step 38675: {'lr': 0.0004279957467391353, 'samples': 7425600, 'steps': 38674, 'loss/train': 1.3275476694107056} -08/30/2021 20:10:20 - INFO - __main__ - Step 38676: {'lr': 0.0004279920203205875, 'samples': 7425792, 'steps': 38675, 'loss/train': 0.6729128956794739} -08/30/2021 20:10:20 - INFO - __main__ - Step 38677: {'lr': 0.0004279882938218393, 'samples': 7425984, 'steps': 38676, 'loss/train': 1.571664571762085} -08/30/2021 20:10:21 - INFO - __main__ - Step 38678: {'lr': 0.00042798456724289227, 'samples': 7426176, 'steps': 38677, 'loss/train': 1.4537087678909302} -08/30/2021 20:10:22 - INFO - __main__ - Step 38679: {'lr': 0.0004279808405837482, 'samples': 7426368, 'steps': 38678, 'loss/train': 0.09544751048088074} -08/30/2021 20:10:23 - INFO - __main__ - Step 38680: {'lr': 0.00042797711384440863, 'samples': 7426560, 'steps': 38679, 'loss/train': 1.1798216104507446} -08/30/2021 20:10:23 - INFO - __main__ - Step 38681: {'lr': 0.0004279733870248754, 'samples': 7426752, 'steps': 38680, 'loss/train': 1.4335826635360718} -08/30/2021 20:10:23 - INFO - __main__ - Step 38682: {'lr': 0.00042796966012515007, 'samples': 7426944, 'steps': 38681, 'loss/train': 1.7576112747192383} -08/30/2021 20:10:24 - INFO - __main__ - Step 38683: {'lr': 0.00042796593314523435, 'samples': 7427136, 'steps': 38682, 'loss/train': 1.6155834197998047} -08/30/2021 20:10:25 - INFO - __main__ - Step 38684: {'lr': 0.0004279622060851299, 'samples': 7427328, 'steps': 38683, 'loss/train': 1.3129968643188477} -08/30/2021 20:10:26 - INFO - __main__ - Step 38685: {'lr': 0.0004279584789448385, 'samples': 7427520, 'steps': 38684, 'loss/train': 1.273803949356079} -08/30/2021 20:10:26 - INFO - __main__ - Step 38686: {'lr': 0.0004279547517243617, 'samples': 7427712, 'steps': 38685, 'loss/train': 1.3160357475280762} -08/30/2021 20:10:27 - INFO - __main__ - Step 38687: {'lr': 0.00042795102442370127, 'samples': 7427904, 'steps': 38686, 'loss/train': 1.5185521841049194} -08/30/2021 20:10:27 - INFO - __main__ - Step 38688: {'lr': 0.0004279472970428588, 'samples': 7428096, 'steps': 38687, 'loss/train': 1.4837063550949097} -08/30/2021 20:10:27 - INFO - __main__ - Step 38689: {'lr': 0.0004279435695818361, 'samples': 7428288, 'steps': 38688, 'loss/train': 0.05492337793111801} -08/30/2021 20:10:30 - INFO - __main__ - Step 38690: {'lr': 0.00042793984204063477, 'samples': 7428480, 'steps': 38689, 'loss/train': 1.6588153839111328} -08/30/2021 20:10:30 - INFO - __main__ - Step 38691: {'lr': 0.0004279361144192565, 'samples': 7428672, 'steps': 38690, 'loss/train': 0.08101096004247665} -08/30/2021 20:10:31 - INFO - __main__ - Step 38692: {'lr': 0.00042793238671770285, 'samples': 7428864, 'steps': 38691, 'loss/train': 1.7580540180206299} -08/30/2021 20:10:31 - INFO - __main__ - Step 38693: {'lr': 0.0004279286589359757, 'samples': 7429056, 'steps': 38692, 'loss/train': 0.9432997107505798} -08/30/2021 20:10:31 - INFO - __main__ - Step 38694: {'lr': 0.00042792493107407666, 'samples': 7429248, 'steps': 38693, 'loss/train': 0.04007983207702637} -08/30/2021 20:10:32 - INFO - __main__ - Step 38695: {'lr': 0.0004279212031320073, 'samples': 7429440, 'steps': 38694, 'loss/train': 1.4492865800857544} -08/30/2021 20:10:33 - INFO - __main__ - Step 38696: {'lr': 0.00042791747510976955, 'samples': 7429632, 'steps': 38695, 'loss/train': 1.645767331123352} -08/30/2021 20:10:34 - INFO - __main__ - Step 38697: {'lr': 0.0004279137470073648, 'samples': 7429824, 'steps': 38696, 'loss/train': 1.941857099533081} -08/30/2021 20:10:34 - INFO - __main__ - Step 38698: {'lr': 0.00042791001882479485, 'samples': 7430016, 'steps': 38697, 'loss/train': 1.4204496145248413} -08/30/2021 20:10:34 - INFO - __main__ - Step 38699: {'lr': 0.0004279062905620614, 'samples': 7430208, 'steps': 38698, 'loss/train': 1.3363687992095947} -08/30/2021 20:10:35 - INFO - __main__ - Step 38700: {'lr': 0.0004279025622191662, 'samples': 7430400, 'steps': 38699, 'loss/train': 1.0146483182907104} -08/30/2021 20:10:36 - INFO - __main__ - Step 38701: {'lr': 0.00042789883379611084, 'samples': 7430592, 'steps': 38700, 'loss/train': 1.5381847620010376} -08/30/2021 20:10:37 - INFO - __main__ - Step 38702: {'lr': 0.000427895105292897, 'samples': 7430784, 'steps': 38701, 'loss/train': 1.6289020776748657} -08/30/2021 20:10:37 - INFO - __main__ - Step 38703: {'lr': 0.00042789137670952627, 'samples': 7430976, 'steps': 38702, 'loss/train': 1.2194492816925049} -08/30/2021 20:10:37 - INFO - __main__ - Step 38704: {'lr': 0.00042788764804600055, 'samples': 7431168, 'steps': 38703, 'loss/train': 1.3122613430023193} -08/30/2021 20:10:38 - INFO - __main__ - Step 38705: {'lr': 0.0004278839193023214, 'samples': 7431360, 'steps': 38704, 'loss/train': 0.5256453156471252} -08/30/2021 20:10:38 - INFO - __main__ - Step 38706: {'lr': 0.0004278801904784904, 'samples': 7431552, 'steps': 38705, 'loss/train': 1.7385294437408447} -08/30/2021 20:10:40 - INFO - __main__ - Step 38707: {'lr': 0.00042787646157450946, 'samples': 7431744, 'steps': 38706, 'loss/train': 0.43294215202331543} -08/30/2021 20:10:40 - INFO - __main__ - Step 38708: {'lr': 0.00042787273259038, 'samples': 7431936, 'steps': 38707, 'loss/train': 1.0498179197311401} -08/30/2021 20:10:40 - INFO - __main__ - Step 38709: {'lr': 0.00042786900352610393, 'samples': 7432128, 'steps': 38708, 'loss/train': 0.6126086711883545} -08/30/2021 20:10:41 - INFO - __main__ - Step 38710: {'lr': 0.0004278652743816828, 'samples': 7432320, 'steps': 38709, 'loss/train': 1.7270009517669678} -08/30/2021 20:10:41 - INFO - __main__ - Step 38711: {'lr': 0.00042786154515711826, 'samples': 7432512, 'steps': 38710, 'loss/train': 1.660953402519226} -08/30/2021 20:10:43 - INFO - __main__ - Step 38712: {'lr': 0.0004278578158524121, 'samples': 7432704, 'steps': 38711, 'loss/train': 0.07817649096250534} -08/30/2021 20:10:43 - INFO - __main__ - Step 38713: {'lr': 0.00042785408646756594, 'samples': 7432896, 'steps': 38712, 'loss/train': 0.9201869964599609} -08/30/2021 20:10:43 - INFO - __main__ - Step 38714: {'lr': 0.0004278503570025816, 'samples': 7433088, 'steps': 38713, 'loss/train': 1.5371040105819702} -08/30/2021 20:10:44 - INFO - __main__ - Step 38715: {'lr': 0.0004278466274574605, 'samples': 7433280, 'steps': 38714, 'loss/train': 1.8116850852966309} -08/30/2021 20:10:44 - INFO - __main__ - Step 38716: {'lr': 0.0004278428978322044, 'samples': 7433472, 'steps': 38715, 'loss/train': 1.53053879737854} -08/30/2021 20:10:46 - INFO - __main__ - Step 38717: {'lr': 0.00042783916812681516, 'samples': 7433664, 'steps': 38716, 'loss/train': 1.78085458278656} -08/30/2021 20:10:46 - INFO - __main__ - Step 38718: {'lr': 0.0004278354383412943, 'samples': 7433856, 'steps': 38717, 'loss/train': 1.4068180322647095} -08/30/2021 20:10:46 - INFO - __main__ - Step 38719: {'lr': 0.0004278317084756435, 'samples': 7434048, 'steps': 38718, 'loss/train': 1.5187715291976929} -08/30/2021 20:10:47 - INFO - __main__ - Step 38720: {'lr': 0.00042782797852986454, 'samples': 7434240, 'steps': 38719, 'loss/train': 1.3090986013412476} -08/30/2021 20:10:47 - INFO - __main__ - Step 38721: {'lr': 0.00042782424850395894, 'samples': 7434432, 'steps': 38720, 'loss/train': 1.1511976718902588} -08/30/2021 20:10:49 - INFO - __main__ - Step 38722: {'lr': 0.00042782051839792857, 'samples': 7434624, 'steps': 38721, 'loss/train': 1.9558556079864502} -08/30/2021 20:10:49 - INFO - __main__ - Step 38723: {'lr': 0.000427816788211775, 'samples': 7434816, 'steps': 38722, 'loss/train': 0.044451870024204254} -08/30/2021 20:10:50 - INFO - __main__ - Step 38724: {'lr': 0.00042781305794549994, 'samples': 7435008, 'steps': 38723, 'loss/train': 1.308264136314392} -08/30/2021 20:10:50 - INFO - __main__ - Step 38725: {'lr': 0.00042780932759910504, 'samples': 7435200, 'steps': 38724, 'loss/train': 1.4418635368347168} -08/30/2021 20:10:50 - INFO - __main__ - Step 38726: {'lr': 0.00042780559717259194, 'samples': 7435392, 'steps': 38725, 'loss/train': 1.03141450881958} -08/30/2021 20:10:52 - INFO - __main__ - Step 38727: {'lr': 0.0004278018666659624, 'samples': 7435584, 'steps': 38726, 'loss/train': 1.353161096572876} -08/30/2021 20:10:52 - INFO - __main__ - Step 38728: {'lr': 0.0004277981360792182, 'samples': 7435776, 'steps': 38727, 'loss/train': 1.473778247833252} -08/30/2021 20:10:53 - INFO - __main__ - Step 38729: {'lr': 0.0004277944054123608, 'samples': 7435968, 'steps': 38728, 'loss/train': 0.8205475211143494} -08/30/2021 20:10:53 - INFO - __main__ - Step 38730: {'lr': 0.000427790674665392, 'samples': 7436160, 'steps': 38729, 'loss/train': 1.5710917711257935} -08/30/2021 20:10:53 - INFO - __main__ - Step 38731: {'lr': 0.00042778694383831354, 'samples': 7436352, 'steps': 38730, 'loss/train': 1.616429090499878} -08/30/2021 20:10:55 - INFO - __main__ - Step 38732: {'lr': 0.0004277832129311269, 'samples': 7436544, 'steps': 38731, 'loss/train': 1.319718837738037} -08/30/2021 20:10:55 - INFO - __main__ - Step 38733: {'lr': 0.000427779481943834, 'samples': 7436736, 'steps': 38732, 'loss/train': 1.6281687021255493} -08/30/2021 20:10:56 - INFO - __main__ - Step 38734: {'lr': 0.0004277757508764363, 'samples': 7436928, 'steps': 38733, 'loss/train': 1.7237601280212402} -08/30/2021 20:10:56 - INFO - __main__ - Step 38735: {'lr': 0.00042777201972893564, 'samples': 7437120, 'steps': 38734, 'loss/train': 1.6055048704147339} -08/30/2021 20:10:56 - INFO - __main__ - Step 38736: {'lr': 0.00042776828850133364, 'samples': 7437312, 'steps': 38735, 'loss/train': 1.5065596103668213} -08/30/2021 20:10:57 - INFO - __main__ - Step 38737: {'lr': 0.0004277645571936321, 'samples': 7437504, 'steps': 38736, 'loss/train': 1.191209316253662} -08/30/2021 20:10:58 - INFO - __main__ - Step 38738: {'lr': 0.0004277608258058324, 'samples': 7437696, 'steps': 38737, 'loss/train': 1.4561070203781128} -08/30/2021 20:10:59 - INFO - __main__ - Step 38739: {'lr': 0.00042775709433793657, 'samples': 7437888, 'steps': 38738, 'loss/train': 1.4625935554504395} -08/30/2021 20:10:59 - INFO - __main__ - Step 38740: {'lr': 0.0004277533627899461, 'samples': 7438080, 'steps': 38739, 'loss/train': 1.3131028413772583} -08/30/2021 20:10:59 - INFO - __main__ - Step 38741: {'lr': 0.00042774963116186274, 'samples': 7438272, 'steps': 38740, 'loss/train': 1.5198599100112915} -08/30/2021 20:11:00 - INFO - __main__ - Step 38742: {'lr': 0.000427745899453688, 'samples': 7438464, 'steps': 38741, 'loss/train': 0.0744587630033493} -08/30/2021 20:11:01 - INFO - __main__ - Step 38743: {'lr': 0.00042774216766542386, 'samples': 7438656, 'steps': 38742, 'loss/train': 1.6099133491516113} -08/30/2021 20:11:02 - INFO - __main__ - Step 38744: {'lr': 0.0004277384357970717, 'samples': 7438848, 'steps': 38743, 'loss/train': 1.8320605754852295} -08/30/2021 20:11:02 - INFO - __main__ - Step 38745: {'lr': 0.00042773470384863344, 'samples': 7439040, 'steps': 38744, 'loss/train': 0.9649897813796997} -08/30/2021 20:11:03 - INFO - __main__ - Step 38746: {'lr': 0.0004277309718201107, 'samples': 7439232, 'steps': 38745, 'loss/train': 2.1139719486236572} -08/30/2021 20:11:03 - INFO - __main__ - Step 38747: {'lr': 0.000427727239711505, 'samples': 7439424, 'steps': 38746, 'loss/train': 1.3948806524276733} -08/30/2021 20:11:05 - INFO - __main__ - Step 38748: {'lr': 0.00042772350752281823, 'samples': 7439616, 'steps': 38747, 'loss/train': 1.5157158374786377} -08/30/2021 20:11:06 - INFO - __main__ - Step 38749: {'lr': 0.000427719775254052, 'samples': 7439808, 'steps': 38748, 'loss/train': 1.089264988899231} -08/30/2021 20:11:06 - INFO - __main__ - Step 38750: {'lr': 0.00042771604290520795, 'samples': 7440000, 'steps': 38749, 'loss/train': 1.44356369972229} -08/30/2021 20:11:06 - INFO - __main__ - Step 38751: {'lr': 0.00042771231047628776, 'samples': 7440192, 'steps': 38750, 'loss/train': 1.9884164333343506} -08/30/2021 20:11:08 - INFO - __main__ - Step 38752: {'lr': 0.0004277085779672932, 'samples': 7440384, 'steps': 38751, 'loss/train': 0.7363114953041077} -08/30/2021 20:11:08 - INFO - __main__ - Step 38753: {'lr': 0.0004277048453782259, 'samples': 7440576, 'steps': 38752, 'loss/train': 1.1619985103607178} -08/30/2021 20:11:09 - INFO - __main__ - Step 38754: {'lr': 0.0004277011127090875, 'samples': 7440768, 'steps': 38753, 'loss/train': 1.361302375793457} -08/30/2021 20:11:09 - INFO - __main__ - Step 38755: {'lr': 0.0004276973799598798, 'samples': 7440960, 'steps': 38754, 'loss/train': 1.1801483631134033} -08/30/2021 20:11:09 - INFO - __main__ - Step 38756: {'lr': 0.0004276936471306043, 'samples': 7441152, 'steps': 38755, 'loss/train': 1.3994168043136597} -08/30/2021 20:11:11 - INFO - __main__ - Step 38757: {'lr': 0.00042768991422126285, 'samples': 7441344, 'steps': 38756, 'loss/train': 1.5156992673873901} -08/30/2021 20:11:12 - INFO - __main__ - Step 38758: {'lr': 0.00042768618123185703, 'samples': 7441536, 'steps': 38757, 'loss/train': 0.6526063680648804} -08/30/2021 20:11:12 - INFO - __main__ - Step 38759: {'lr': 0.00042768244816238863, 'samples': 7441728, 'steps': 38758, 'loss/train': 1.3877465724945068} -08/30/2021 20:11:12 - INFO - __main__ - Step 38760: {'lr': 0.00042767871501285916, 'samples': 7441920, 'steps': 38759, 'loss/train': 1.3566300868988037} -08/30/2021 20:11:13 - INFO - __main__ - Step 38761: {'lr': 0.00042767498178327047, 'samples': 7442112, 'steps': 38760, 'loss/train': 1.9401377439498901} -08/30/2021 20:11:13 - INFO - __main__ - Step 38762: {'lr': 0.00042767124847362413, 'samples': 7442304, 'steps': 38761, 'loss/train': 1.9453312158584595} -08/30/2021 20:11:15 - INFO - __main__ - Step 38763: {'lr': 0.00042766751508392187, 'samples': 7442496, 'steps': 38762, 'loss/train': 1.4461653232574463} -08/30/2021 20:11:15 - INFO - __main__ - Step 38764: {'lr': 0.00042766378161416543, 'samples': 7442688, 'steps': 38763, 'loss/train': 1.3366578817367554} -08/30/2021 20:11:15 - INFO - __main__ - Step 38765: {'lr': 0.00042766004806435643, 'samples': 7442880, 'steps': 38764, 'loss/train': 1.4643217325210571} -08/30/2021 20:11:16 - INFO - __main__ - Step 38766: {'lr': 0.0004276563144344965, 'samples': 7443072, 'steps': 38765, 'loss/train': 0.7589820623397827} -08/30/2021 20:11:16 - INFO - __main__ - Step 38767: {'lr': 0.00042765258072458733, 'samples': 7443264, 'steps': 38766, 'loss/train': 1.4181276559829712} -08/30/2021 20:11:18 - INFO - __main__ - Step 38768: {'lr': 0.00042764884693463075, 'samples': 7443456, 'steps': 38767, 'loss/train': 1.443307638168335} -08/30/2021 20:11:18 - INFO - __main__ - Step 38769: {'lr': 0.0004276451130646283, 'samples': 7443648, 'steps': 38768, 'loss/train': 1.3338168859481812} -08/30/2021 20:11:18 - INFO - __main__ - Step 38770: {'lr': 0.0004276413791145817, 'samples': 7443840, 'steps': 38769, 'loss/train': 1.2715299129486084} -08/30/2021 20:11:19 - INFO - __main__ - Step 38771: {'lr': 0.00042763764508449263, 'samples': 7444032, 'steps': 38770, 'loss/train': 1.8022055625915527} -08/30/2021 20:11:19 - INFO - __main__ - Step 38772: {'lr': 0.0004276339109743628, 'samples': 7444224, 'steps': 38771, 'loss/train': 1.31218421459198} -08/30/2021 20:11:20 - INFO - __main__ - Step 38773: {'lr': 0.0004276301767841939, 'samples': 7444416, 'steps': 38772, 'loss/train': 2.7003791332244873} -08/30/2021 20:11:21 - INFO - __main__ - Step 38774: {'lr': 0.00042762644251398755, 'samples': 7444608, 'steps': 38773, 'loss/train': 1.368554949760437} -08/30/2021 20:11:21 - INFO - __main__ - Step 38775: {'lr': 0.0004276227081637454, 'samples': 7444800, 'steps': 38774, 'loss/train': 1.202033519744873} -08/30/2021 20:11:22 - INFO - __main__ - Step 38776: {'lr': 0.00042761897373346923, 'samples': 7444992, 'steps': 38775, 'loss/train': 1.1454054117202759} -08/30/2021 20:11:22 - INFO - __main__ - Step 38777: {'lr': 0.0004276152392231608, 'samples': 7445184, 'steps': 38776, 'loss/train': 1.5549793243408203} -08/30/2021 20:11:22 - INFO - __main__ - Step 38778: {'lr': 0.00042761150463282164, 'samples': 7445376, 'steps': 38777, 'loss/train': 1.290086269378662} -08/30/2021 20:11:24 - INFO - __main__ - Step 38779: {'lr': 0.0004276077699624534, 'samples': 7445568, 'steps': 38778, 'loss/train': 1.5495622158050537} -08/30/2021 20:11:25 - INFO - __main__ - Step 38780: {'lr': 0.0004276040352120578, 'samples': 7445760, 'steps': 38779, 'loss/train': 1.4970108270645142} -08/30/2021 20:11:25 - INFO - __main__ - Step 38781: {'lr': 0.0004276003003816367, 'samples': 7445952, 'steps': 38780, 'loss/train': 1.9532743692398071} -08/30/2021 20:11:25 - INFO - __main__ - Step 38782: {'lr': 0.0004275965654711916, 'samples': 7446144, 'steps': 38781, 'loss/train': 1.3598995208740234} -08/30/2021 20:11:26 - INFO - __main__ - Step 38783: {'lr': 0.0004275928304807242, 'samples': 7446336, 'steps': 38782, 'loss/train': 1.4608898162841797} -08/30/2021 20:11:27 - INFO - __main__ - Step 38784: {'lr': 0.0004275890954102362, 'samples': 7446528, 'steps': 38783, 'loss/train': 1.734776258468628} -08/30/2021 20:11:28 - INFO - __main__ - Step 38785: {'lr': 0.0004275853602597294, 'samples': 7446720, 'steps': 38784, 'loss/train': 1.3762632608413696} -08/30/2021 20:11:28 - INFO - __main__ - Step 38786: {'lr': 0.00042758162502920527, 'samples': 7446912, 'steps': 38785, 'loss/train': 0.9701852798461914} -08/30/2021 20:11:28 - INFO - __main__ - Step 38787: {'lr': 0.0004275778897186656, 'samples': 7447104, 'steps': 38786, 'loss/train': 1.4358216524124146} -08/30/2021 20:11:29 - INFO - __main__ - Step 38788: {'lr': 0.0004275741543281121, 'samples': 7447296, 'steps': 38787, 'loss/train': 1.4445950984954834} -08/30/2021 20:11:30 - INFO - __main__ - Step 38789: {'lr': 0.0004275704188575464, 'samples': 7447488, 'steps': 38788, 'loss/train': 0.5505427718162537} -08/30/2021 20:11:31 - INFO - __main__ - Step 38790: {'lr': 0.00042756668330697024, 'samples': 7447680, 'steps': 38789, 'loss/train': 0.9554463624954224} -08/30/2021 20:11:31 - INFO - __main__ - Step 38791: {'lr': 0.00042756294767638527, 'samples': 7447872, 'steps': 38790, 'loss/train': 1.079748511314392} -08/30/2021 20:11:31 - INFO - __main__ - Step 38792: {'lr': 0.00042755921196579316, 'samples': 7448064, 'steps': 38791, 'loss/train': 1.6538499593734741} -08/30/2021 20:11:32 - INFO - __main__ - Step 38793: {'lr': 0.0004275554761751956, 'samples': 7448256, 'steps': 38792, 'loss/train': 0.8024705648422241} -08/30/2021 20:11:34 - INFO - __main__ - Step 38794: {'lr': 0.0004275517403045943, 'samples': 7448448, 'steps': 38793, 'loss/train': 1.7083035707473755} -08/30/2021 20:11:34 - INFO - __main__ - Step 38795: {'lr': 0.000427548004353991, 'samples': 7448640, 'steps': 38794, 'loss/train': 1.5873737335205078} -08/30/2021 20:11:34 - INFO - __main__ - Step 38796: {'lr': 0.00042754426832338724, 'samples': 7448832, 'steps': 38795, 'loss/train': 0.06725167483091354} -08/30/2021 20:11:35 - INFO - __main__ - Step 38797: {'lr': 0.00042754053221278476, 'samples': 7449024, 'steps': 38796, 'loss/train': 0.6868668794631958} -08/30/2021 20:11:35 - INFO - __main__ - Step 38798: {'lr': 0.0004275367960221853, 'samples': 7449216, 'steps': 38797, 'loss/train': 0.6166905164718628} -08/30/2021 20:11:37 - INFO - __main__ - Step 38799: {'lr': 0.0004275330597515904, 'samples': 7449408, 'steps': 38798, 'loss/train': 1.342469573020935} -08/30/2021 20:11:38 - INFO - __main__ - Step 38800: {'lr': 0.00042752932340100195, 'samples': 7449600, 'steps': 38799, 'loss/train': 1.7195112705230713} -08/30/2021 20:11:38 - INFO - __main__ - Step 38801: {'lr': 0.00042752558697042143, 'samples': 7449792, 'steps': 38800, 'loss/train': 1.3047715425491333} -08/30/2021 20:11:38 - INFO - __main__ - Step 38802: {'lr': 0.0004275218504598507, 'samples': 7449984, 'steps': 38801, 'loss/train': 1.9004665613174438} -08/30/2021 20:11:39 - INFO - __main__ - Step 38803: {'lr': 0.0004275181138692914, 'samples': 7450176, 'steps': 38802, 'loss/train': 1.2620739936828613} -08/30/2021 20:11:40 - INFO - __main__ - Step 38804: {'lr': 0.0004275143771987451, 'samples': 7450368, 'steps': 38803, 'loss/train': 1.871267318725586} -08/30/2021 20:11:41 - INFO - __main__ - Step 38805: {'lr': 0.00042751064044821354, 'samples': 7450560, 'steps': 38804, 'loss/train': 1.3852405548095703} -08/30/2021 20:11:41 - INFO - __main__ - Step 38806: {'lr': 0.0004275069036176985, 'samples': 7450752, 'steps': 38805, 'loss/train': 1.641545295715332} -08/30/2021 20:11:41 - INFO - __main__ - Step 38807: {'lr': 0.0004275031667072015, 'samples': 7450944, 'steps': 38806, 'loss/train': 1.673424482345581} -08/30/2021 20:11:42 - INFO - __main__ - Step 38808: {'lr': 0.0004274994297167244, 'samples': 7451136, 'steps': 38807, 'loss/train': 1.533370018005371} -08/30/2021 20:11:42 - INFO - __main__ - Step 38809: {'lr': 0.00042749569264626875, 'samples': 7451328, 'steps': 38808, 'loss/train': 0.7603945732116699} -08/30/2021 20:11:44 - INFO - __main__ - Step 38810: {'lr': 0.0004274919554958363, 'samples': 7451520, 'steps': 38809, 'loss/train': 1.2478253841400146} -08/30/2021 20:11:44 - INFO - __main__ - Step 38811: {'lr': 0.00042748821826542875, 'samples': 7451712, 'steps': 38810, 'loss/train': 0.049417704343795776} -08/30/2021 20:11:45 - INFO - __main__ - Step 38812: {'lr': 0.00042748448095504765, 'samples': 7451904, 'steps': 38811, 'loss/train': 2.2108635902404785} -08/30/2021 20:11:45 - INFO - __main__ - Step 38813: {'lr': 0.0004274807435646948, 'samples': 7452096, 'steps': 38812, 'loss/train': 3.019526720046997} -08/30/2021 20:11:45 - INFO - __main__ - Step 38814: {'lr': 0.0004274770060943719, 'samples': 7452288, 'steps': 38813, 'loss/train': 0.995280921459198} -08/30/2021 20:11:47 - INFO - __main__ - Step 38815: {'lr': 0.00042747326854408063, 'samples': 7452480, 'steps': 38814, 'loss/train': 1.0013155937194824} -08/30/2021 20:11:47 - INFO - __main__ - Step 38816: {'lr': 0.00042746953091382254, 'samples': 7452672, 'steps': 38815, 'loss/train': 1.4817057847976685} -08/30/2021 20:11:47 - INFO - __main__ - Step 38817: {'lr': 0.00042746579320359956, 'samples': 7452864, 'steps': 38816, 'loss/train': 1.8496936559677124} -08/30/2021 20:11:48 - INFO - __main__ - Step 38818: {'lr': 0.00042746205541341315, 'samples': 7453056, 'steps': 38817, 'loss/train': 1.0554754734039307} -08/30/2021 20:11:48 - INFO - __main__ - Step 38819: {'lr': 0.0004274583175432651, 'samples': 7453248, 'steps': 38818, 'loss/train': 1.0900686979293823} -08/30/2021 20:11:50 - INFO - __main__ - Step 38820: {'lr': 0.000427454579593157, 'samples': 7453440, 'steps': 38819, 'loss/train': 0.7323368191719055} -08/30/2021 20:11:50 - INFO - __main__ - Step 38821: {'lr': 0.00042745084156309065, 'samples': 7453632, 'steps': 38820, 'loss/train': 1.5207645893096924} -08/30/2021 20:11:51 - INFO - __main__ - Step 38822: {'lr': 0.00042744710345306774, 'samples': 7453824, 'steps': 38821, 'loss/train': 1.7052807807922363} -08/30/2021 20:11:51 - INFO - __main__ - Step 38823: {'lr': 0.00042744336526308986, 'samples': 7454016, 'steps': 38822, 'loss/train': 1.7357161045074463} -08/30/2021 20:11:51 - INFO - __main__ - Step 38824: {'lr': 0.0004274396269931587, 'samples': 7454208, 'steps': 38823, 'loss/train': 5.671684741973877} -08/30/2021 20:11:52 - INFO - __main__ - Step 38825: {'lr': 0.0004274358886432761, 'samples': 7454400, 'steps': 38824, 'loss/train': 1.1085503101348877} -08/30/2021 20:11:53 - INFO - __main__ - Step 38826: {'lr': 0.0004274321502134435, 'samples': 7454592, 'steps': 38825, 'loss/train': 0.936346173286438} -08/30/2021 20:11:54 - INFO - __main__ - Step 38827: {'lr': 0.00042742841170366274, 'samples': 7454784, 'steps': 38826, 'loss/train': 1.3706201314926147} -08/30/2021 20:11:54 - INFO - __main__ - Step 38828: {'lr': 0.0004274246731139355, 'samples': 7454976, 'steps': 38827, 'loss/train': 1.6990272998809814} -08/30/2021 20:11:54 - INFO - __main__ - Step 38829: {'lr': 0.0004274209344442634, 'samples': 7455168, 'steps': 38828, 'loss/train': 1.3024113178253174} -08/30/2021 20:11:55 - INFO - __main__ - Step 38830: {'lr': 0.00042741719569464834, 'samples': 7455360, 'steps': 38829, 'loss/train': 1.5719633102416992} -08/30/2021 20:11:56 - INFO - __main__ - Step 38831: {'lr': 0.0004274134568650916, 'samples': 7455552, 'steps': 38830, 'loss/train': 1.2164031267166138} -08/30/2021 20:11:57 - INFO - __main__ - Step 38832: {'lr': 0.00042740971795559527, 'samples': 7455744, 'steps': 38831, 'loss/train': 1.5107475519180298} -08/30/2021 20:11:57 - INFO - __main__ - Step 38833: {'lr': 0.00042740597896616075, 'samples': 7455936, 'steps': 38832, 'loss/train': 1.4301981925964355} -08/30/2021 20:11:57 - INFO - __main__ - Step 38834: {'lr': 0.00042740223989678984, 'samples': 7456128, 'steps': 38833, 'loss/train': 1.6313468217849731} -08/30/2021 20:11:58 - INFO - __main__ - Step 38835: {'lr': 0.0004273985007474842, 'samples': 7456320, 'steps': 38834, 'loss/train': 1.4326335191726685} -08/30/2021 20:11:59 - INFO - __main__ - Step 38836: {'lr': 0.00042739476151824565, 'samples': 7456512, 'steps': 38835, 'loss/train': 1.4646745920181274} -08/30/2021 20:12:00 - INFO - __main__ - Step 38837: {'lr': 0.00042739102220907567, 'samples': 7456704, 'steps': 38836, 'loss/train': 1.492846131324768} -08/30/2021 20:12:00 - INFO - __main__ - Step 38838: {'lr': 0.000427387282819976, 'samples': 7456896, 'steps': 38837, 'loss/train': 0.743320643901825} -08/30/2021 20:12:00 - INFO - __main__ - Step 38839: {'lr': 0.0004273835433509484, 'samples': 7457088, 'steps': 38838, 'loss/train': 0.8244975805282593} -08/30/2021 20:12:01 - INFO - __main__ - Step 38840: {'lr': 0.0004273798038019945, 'samples': 7457280, 'steps': 38839, 'loss/train': 1.8393313884735107} -08/30/2021 20:12:02 - INFO - __main__ - Step 38841: {'lr': 0.000427376064173116, 'samples': 7457472, 'steps': 38840, 'loss/train': 1.638372778892517} -08/30/2021 20:12:03 - INFO - __main__ - Step 38842: {'lr': 0.0004273723244643146, 'samples': 7457664, 'steps': 38841, 'loss/train': 1.1974339485168457} -08/30/2021 20:12:03 - INFO - __main__ - Step 38843: {'lr': 0.000427368584675592, 'samples': 7457856, 'steps': 38842, 'loss/train': 1.6608766317367554} -08/30/2021 20:12:03 - INFO - __main__ - Step 38844: {'lr': 0.0004273648448069498, 'samples': 7458048, 'steps': 38843, 'loss/train': 1.576238751411438} -08/30/2021 20:12:04 - INFO - __main__ - Step 38845: {'lr': 0.00042736110485838973, 'samples': 7458240, 'steps': 38844, 'loss/train': 1.5806571245193481} -08/30/2021 20:12:06 - INFO - __main__ - Step 38846: {'lr': 0.0004273573648299135, 'samples': 7458432, 'steps': 38845, 'loss/train': 1.2291008234024048} -08/30/2021 20:12:06 - INFO - __main__ - Step 38847: {'lr': 0.0004273536247215227, 'samples': 7458624, 'steps': 38846, 'loss/train': 1.3920701742172241} -08/30/2021 20:12:06 - INFO - __main__ - Step 38848: {'lr': 0.00042734988453321923, 'samples': 7458816, 'steps': 38847, 'loss/train': 1.7615653276443481} -08/30/2021 20:12:07 - INFO - __main__ - Step 38849: {'lr': 0.0004273461442650046, 'samples': 7459008, 'steps': 38848, 'loss/train': 1.2972995042800903} -08/30/2021 20:12:07 - INFO - __main__ - Step 38850: {'lr': 0.0004273424039168805, 'samples': 7459200, 'steps': 38849, 'loss/train': 0.03974912688136101} -08/30/2021 20:12:07 - INFO - __main__ - Step 38851: {'lr': 0.00042733866348884864, 'samples': 7459392, 'steps': 38850, 'loss/train': 2.0268895626068115} -08/30/2021 20:12:08 - INFO - __main__ - Step 38852: {'lr': 0.0004273349229809108, 'samples': 7459584, 'steps': 38851, 'loss/train': 1.621764063835144} -08/30/2021 20:12:09 - INFO - __main__ - Step 38853: {'lr': 0.00042733118239306845, 'samples': 7459776, 'steps': 38852, 'loss/train': 0.741858184337616} -08/30/2021 20:12:10 - INFO - __main__ - Step 38854: {'lr': 0.0004273274417253235, 'samples': 7459968, 'steps': 38853, 'loss/train': 1.4695534706115723} -08/30/2021 20:12:10 - INFO - __main__ - Step 38855: {'lr': 0.00042732370097767756, 'samples': 7460160, 'steps': 38854, 'loss/train': 1.8754863739013672} -08/30/2021 20:12:10 - INFO - __main__ - Step 38856: {'lr': 0.0004273199601501322, 'samples': 7460352, 'steps': 38855, 'loss/train': 0.3878907263278961} -08/30/2021 20:12:11 - INFO - __main__ - Step 38857: {'lr': 0.0004273162192426893, 'samples': 7460544, 'steps': 38856, 'loss/train': 1.5242090225219727} -08/30/2021 20:12:13 - INFO - __main__ - Step 38858: {'lr': 0.00042731247825535037, 'samples': 7460736, 'steps': 38857, 'loss/train': 1.4300408363342285} -08/30/2021 20:12:13 - INFO - __main__ - Step 38859: {'lr': 0.00042730873718811724, 'samples': 7460928, 'steps': 38858, 'loss/train': 5.811954021453857} -08/30/2021 20:12:14 - INFO - __main__ - Step 38860: {'lr': 0.0004273049960409915, 'samples': 7461120, 'steps': 38859, 'loss/train': 1.892176866531372} -08/30/2021 20:12:14 - INFO - __main__ - Step 38861: {'lr': 0.00042730125481397487, 'samples': 7461312, 'steps': 38860, 'loss/train': 1.5292850732803345} -08/30/2021 20:12:14 - INFO - __main__ - Step 38862: {'lr': 0.00042729751350706905, 'samples': 7461504, 'steps': 38861, 'loss/train': 0.8005544543266296} -08/30/2021 20:12:16 - INFO - __main__ - Step 38863: {'lr': 0.00042729377212027557, 'samples': 7461696, 'steps': 38862, 'loss/train': 1.3388922214508057} -08/30/2021 20:12:16 - INFO - __main__ - Step 38864: {'lr': 0.0004272900306535964, 'samples': 7461888, 'steps': 38863, 'loss/train': 1.8581312894821167} -08/30/2021 20:12:17 - INFO - __main__ - Step 38865: {'lr': 0.00042728628910703305, 'samples': 7462080, 'steps': 38864, 'loss/train': 1.4440981149673462} -08/30/2021 20:12:17 - INFO - __main__ - Step 38866: {'lr': 0.0004272825474805872, 'samples': 7462272, 'steps': 38865, 'loss/train': 1.6697527170181274} -08/30/2021 20:12:17 - INFO - __main__ - Step 38867: {'lr': 0.0004272788057742606, 'samples': 7462464, 'steps': 38866, 'loss/train': 0.9913666844367981} -08/30/2021 20:12:19 - INFO - __main__ - Step 38868: {'lr': 0.0004272750639880549, 'samples': 7462656, 'steps': 38867, 'loss/train': 1.2427674531936646} -08/30/2021 20:12:19 - INFO - __main__ - Step 38869: {'lr': 0.0004272713221219718, 'samples': 7462848, 'steps': 38868, 'loss/train': 1.768541932106018} -08/30/2021 20:12:20 - INFO - __main__ - Step 38870: {'lr': 0.00042726758017601297, 'samples': 7463040, 'steps': 38869, 'loss/train': 1.740482211112976} -08/30/2021 20:12:20 - INFO - __main__ - Step 38871: {'lr': 0.00042726383815018006, 'samples': 7463232, 'steps': 38870, 'loss/train': 1.0954400300979614} -08/30/2021 20:12:20 - INFO - __main__ - Step 38872: {'lr': 0.00042726009604447484, 'samples': 7463424, 'steps': 38871, 'loss/train': 1.7786637544631958} -08/30/2021 20:12:22 - INFO - __main__ - Step 38873: {'lr': 0.00042725635385889893, 'samples': 7463616, 'steps': 38872, 'loss/train': 1.2100390195846558} -08/30/2021 20:12:22 - INFO - __main__ - Step 38874: {'lr': 0.0004272526115934541, 'samples': 7463808, 'steps': 38873, 'loss/train': 2.9023475646972656} -08/30/2021 20:12:23 - INFO - __main__ - Step 38875: {'lr': 0.0004272488692481419, 'samples': 7464000, 'steps': 38874, 'loss/train': 1.4789249897003174} -08/30/2021 20:12:23 - INFO - __main__ - Step 38876: {'lr': 0.00042724512682296416, 'samples': 7464192, 'steps': 38875, 'loss/train': 1.707767128944397} -08/30/2021 20:12:23 - INFO - __main__ - Step 38877: {'lr': 0.00042724138431792245, 'samples': 7464384, 'steps': 38876, 'loss/train': 1.9130243062973022} -08/30/2021 20:12:25 - INFO - __main__ - Step 38878: {'lr': 0.0004272376417330186, 'samples': 7464576, 'steps': 38877, 'loss/train': 1.606658697128296} -08/30/2021 20:12:25 - INFO - __main__ - Step 38879: {'lr': 0.00042723389906825415, 'samples': 7464768, 'steps': 38878, 'loss/train': 1.967221975326538} -08/30/2021 20:12:26 - INFO - __main__ - Step 38880: {'lr': 0.0004272301563236308, 'samples': 7464960, 'steps': 38879, 'loss/train': 1.6439955234527588} -08/30/2021 20:12:26 - INFO - __main__ - Step 38881: {'lr': 0.0004272264134991503, 'samples': 7465152, 'steps': 38880, 'loss/train': 1.4029533863067627} -08/30/2021 20:12:26 - INFO - __main__ - Step 38882: {'lr': 0.0004272226705948143, 'samples': 7465344, 'steps': 38881, 'loss/train': 1.0242358446121216} -08/30/2021 20:12:27 - INFO - __main__ - Step 38883: {'lr': 0.00042721892761062453, 'samples': 7465536, 'steps': 38882, 'loss/train': 1.760402798652649} -08/30/2021 20:12:28 - INFO - __main__ - Step 38884: {'lr': 0.00042721518454658265, 'samples': 7465728, 'steps': 38883, 'loss/train': 1.1447868347167969} -08/30/2021 20:12:29 - INFO - __main__ - Step 38885: {'lr': 0.0004272114414026903, 'samples': 7465920, 'steps': 38884, 'loss/train': 1.2751240730285645} -08/30/2021 20:12:29 - INFO - __main__ - Step 38886: {'lr': 0.00042720769817894926, 'samples': 7466112, 'steps': 38885, 'loss/train': 1.0240662097930908} -08/30/2021 20:12:29 - INFO - __main__ - Step 38887: {'lr': 0.00042720395487536115, 'samples': 7466304, 'steps': 38886, 'loss/train': 1.2464112043380737} -08/30/2021 20:12:30 - INFO - __main__ - Step 38888: {'lr': 0.0004272002114919277, 'samples': 7466496, 'steps': 38887, 'loss/train': 2.1759443283081055} -08/30/2021 20:12:31 - INFO - __main__ - Step 38889: {'lr': 0.0004271964680286505, 'samples': 7466688, 'steps': 38888, 'loss/train': 1.3713324069976807} -08/30/2021 20:12:32 - INFO - __main__ - Step 38890: {'lr': 0.00042719272448553137, 'samples': 7466880, 'steps': 38889, 'loss/train': 1.3767149448394775} -08/30/2021 20:12:32 - INFO - __main__ - Step 38891: {'lr': 0.00042718898086257183, 'samples': 7467072, 'steps': 38890, 'loss/train': 1.054800271987915} -08/30/2021 20:12:33 - INFO - __main__ - Step 38892: {'lr': 0.0004271852371597738, 'samples': 7467264, 'steps': 38891, 'loss/train': 1.1322903633117676} -08/30/2021 20:12:33 - INFO - __main__ - Step 38893: {'lr': 0.00042718149337713873, 'samples': 7467456, 'steps': 38892, 'loss/train': 1.3412657976150513} -08/30/2021 20:12:35 - INFO - __main__ - Step 38894: {'lr': 0.0004271777495146685, 'samples': 7467648, 'steps': 38893, 'loss/train': 1.7502262592315674} -08/30/2021 20:12:35 - INFO - __main__ - Step 38895: {'lr': 0.00042717400557236467, 'samples': 7467840, 'steps': 38894, 'loss/train': 1.6785212755203247} -08/30/2021 20:12:35 - INFO - __main__ - Step 38896: {'lr': 0.000427170261550229, 'samples': 7468032, 'steps': 38895, 'loss/train': 0.10268183797597885} -08/30/2021 20:12:36 - INFO - __main__ - Step 38897: {'lr': 0.0004271665174482631, 'samples': 7468224, 'steps': 38896, 'loss/train': 1.6445964574813843} -08/30/2021 20:12:36 - INFO - __main__ - Step 38898: {'lr': 0.0004271627732664687, 'samples': 7468416, 'steps': 38897, 'loss/train': 1.277680516242981} -08/30/2021 20:12:36 - INFO - __main__ - Step 38899: {'lr': 0.0004271590290048475, 'samples': 7468608, 'steps': 38898, 'loss/train': 1.1523408889770508} -08/30/2021 20:12:38 - INFO - __main__ - Step 38900: {'lr': 0.00042715528466340117, 'samples': 7468800, 'steps': 38899, 'loss/train': 1.2972526550292969} -08/30/2021 20:12:39 - INFO - __main__ - Step 38901: {'lr': 0.00042715154024213143, 'samples': 7468992, 'steps': 38900, 'loss/train': 1.7928061485290527} -08/30/2021 20:12:39 - INFO - __main__ - Step 38902: {'lr': 0.0004271477957410399, 'samples': 7469184, 'steps': 38901, 'loss/train': 1.1343905925750732} -08/30/2021 20:12:39 - INFO - __main__ - Step 38903: {'lr': 0.00042714405116012834, 'samples': 7469376, 'steps': 38902, 'loss/train': 1.207249402999878} -08/30/2021 20:12:40 - INFO - __main__ - Step 38904: {'lr': 0.0004271403064993984, 'samples': 7469568, 'steps': 38903, 'loss/train': 1.5169848203659058} -08/30/2021 20:12:41 - INFO - __main__ - Step 38905: {'lr': 0.00042713656175885173, 'samples': 7469760, 'steps': 38904, 'loss/train': 1.6788558959960938} -08/30/2021 20:12:41 - INFO - __main__ - Step 38906: {'lr': 0.00042713281693849015, 'samples': 7469952, 'steps': 38905, 'loss/train': 1.1194159984588623} -08/30/2021 20:12:42 - INFO - __main__ - Step 38907: {'lr': 0.0004271290720383152, 'samples': 7470144, 'steps': 38906, 'loss/train': 1.097764253616333} -08/30/2021 20:12:42 - INFO - __main__ - Step 38908: {'lr': 0.00042712532705832865, 'samples': 7470336, 'steps': 38907, 'loss/train': 2.204711675643921} -08/30/2021 20:12:43 - INFO - __main__ - Step 38909: {'lr': 0.0004271215819985321, 'samples': 7470528, 'steps': 38908, 'loss/train': 2.249115467071533} -08/30/2021 20:12:45 - INFO - __main__ - Step 38910: {'lr': 0.0004271178368589273, 'samples': 7470720, 'steps': 38909, 'loss/train': 1.112189769744873} -08/30/2021 20:12:45 - INFO - __main__ - Step 38911: {'lr': 0.000427114091639516, 'samples': 7470912, 'steps': 38910, 'loss/train': 1.3625484704971313} -08/30/2021 20:12:45 - INFO - __main__ - Step 38912: {'lr': 0.0004271103463402998, 'samples': 7471104, 'steps': 38911, 'loss/train': 1.3684254884719849} -08/30/2021 20:12:46 - INFO - __main__ - Step 38913: {'lr': 0.0004271066009612804, 'samples': 7471296, 'steps': 38912, 'loss/train': 1.8041632175445557} -08/30/2021 20:12:46 - INFO - __main__ - Step 38914: {'lr': 0.0004271028555024594, 'samples': 7471488, 'steps': 38913, 'loss/train': 1.4527479410171509} -08/30/2021 20:12:48 - INFO - __main__ - Step 38915: {'lr': 0.0004270991099638387, 'samples': 7471680, 'steps': 38914, 'loss/train': 1.4462686777114868} -08/30/2021 20:12:48 - INFO - __main__ - Step 38916: {'lr': 0.0004270953643454199, 'samples': 7471872, 'steps': 38915, 'loss/train': 1.3754023313522339} -08/30/2021 20:12:48 - INFO - __main__ - Step 38917: {'lr': 0.0004270916186472046, 'samples': 7472064, 'steps': 38916, 'loss/train': 1.425809621810913} -08/30/2021 20:12:49 - INFO - __main__ - Step 38918: {'lr': 0.0004270878728691946, 'samples': 7472256, 'steps': 38917, 'loss/train': 2.0539333820343018} -08/30/2021 20:12:49 - INFO - __main__ - Step 38919: {'lr': 0.00042708412701139147, 'samples': 7472448, 'steps': 38918, 'loss/train': 1.4504209756851196} -08/30/2021 20:12:50 - INFO - __main__ - Step 38920: {'lr': 0.000427080381073797, 'samples': 7472640, 'steps': 38919, 'loss/train': 2.1193222999572754} -08/30/2021 20:12:51 - INFO - __main__ - Step 38921: {'lr': 0.00042707663505641287, 'samples': 7472832, 'steps': 38920, 'loss/train': 1.7147212028503418} -08/30/2021 20:12:51 - INFO - __main__ - Step 38922: {'lr': 0.00042707288895924066, 'samples': 7473024, 'steps': 38921, 'loss/train': 1.0057674646377563} -08/30/2021 20:12:52 - INFO - __main__ - Step 38923: {'lr': 0.0004270691427822823, 'samples': 7473216, 'steps': 38922, 'loss/train': 1.7988524436950684} -08/30/2021 20:12:52 - INFO - __main__ - Step 38924: {'lr': 0.0004270653965255391, 'samples': 7473408, 'steps': 38923, 'loss/train': 1.2420998811721802} -08/30/2021 20:12:53 - INFO - __main__ - Step 38925: {'lr': 0.0004270616501890131, 'samples': 7473600, 'steps': 38924, 'loss/train': 1.2856082916259766} -08/30/2021 20:12:54 - INFO - __main__ - Step 38926: {'lr': 0.0004270579037727058, 'samples': 7473792, 'steps': 38925, 'loss/train': 1.660669207572937} -08/30/2021 20:12:54 - INFO - __main__ - Step 38927: {'lr': 0.000427054157276619, 'samples': 7473984, 'steps': 38926, 'loss/train': 1.3976815938949585} -08/30/2021 20:12:55 - INFO - __main__ - Step 38928: {'lr': 0.00042705041070075433, 'samples': 7474176, 'steps': 38927, 'loss/train': 0.8167530298233032} -08/30/2021 20:12:55 - INFO - __main__ - Step 38929: {'lr': 0.00042704666404511343, 'samples': 7474368, 'steps': 38928, 'loss/train': 1.8932794332504272} -08/30/2021 20:12:55 - INFO - __main__ - Step 38930: {'lr': 0.000427042917309698, 'samples': 7474560, 'steps': 38929, 'loss/train': 1.473808765411377} -08/30/2021 20:12:58 - INFO - __main__ - Step 38931: {'lr': 0.00042703917049450983, 'samples': 7474752, 'steps': 38930, 'loss/train': 1.594633936882019} -08/30/2021 20:12:58 - INFO - __main__ - Step 38932: {'lr': 0.0004270354235995505, 'samples': 7474944, 'steps': 38931, 'loss/train': 0.06461476534605026} -08/30/2021 20:12:59 - INFO - __main__ - Step 38933: {'lr': 0.0004270316766248218, 'samples': 7475136, 'steps': 38932, 'loss/train': 1.381054162979126} -08/30/2021 20:12:59 - INFO - __main__ - Step 38934: {'lr': 0.0004270279295703253, 'samples': 7475328, 'steps': 38933, 'loss/train': 2.11806058883667} -08/30/2021 20:12:59 - INFO - __main__ - Step 38935: {'lr': 0.00042702418243606275, 'samples': 7475520, 'steps': 38934, 'loss/train': 1.3243941068649292} -08/30/2021 20:13:00 - INFO - __main__ - Step 38936: {'lr': 0.00042702043522203594, 'samples': 7475712, 'steps': 38935, 'loss/train': 0.5328168272972107} -08/30/2021 20:13:00 - INFO - __main__ - Step 38937: {'lr': 0.00042701668792824633, 'samples': 7475904, 'steps': 38936, 'loss/train': 0.41878703236579895} -08/30/2021 20:13:01 - INFO - __main__ - Step 38938: {'lr': 0.00042701294055469576, 'samples': 7476096, 'steps': 38937, 'loss/train': 0.9047747254371643} -08/30/2021 20:13:02 - INFO - __main__ - Step 38939: {'lr': 0.0004270091931013859, 'samples': 7476288, 'steps': 38938, 'loss/train': 1.2436997890472412} -08/30/2021 20:13:02 - INFO - __main__ - Step 38940: {'lr': 0.00042700544556831846, 'samples': 7476480, 'steps': 38939, 'loss/train': 1.4766095876693726} -08/30/2021 20:13:03 - INFO - __main__ - Step 38941: {'lr': 0.00042700169795549504, 'samples': 7476672, 'steps': 38940, 'loss/train': 1.43293035030365} -08/30/2021 20:13:03 - INFO - __main__ - Step 38942: {'lr': 0.00042699795026291743, 'samples': 7476864, 'steps': 38941, 'loss/train': 2.0445070266723633} -08/30/2021 20:13:04 - INFO - __main__ - Step 38943: {'lr': 0.0004269942024905872, 'samples': 7477056, 'steps': 38942, 'loss/train': 0.8253125548362732} -08/30/2021 20:13:05 - INFO - __main__ - Step 38944: {'lr': 0.00042699045463850623, 'samples': 7477248, 'steps': 38943, 'loss/train': 1.3244879245758057} -08/30/2021 20:13:05 - INFO - __main__ - Step 38945: {'lr': 0.000426986706706676, 'samples': 7477440, 'steps': 38944, 'loss/train': 0.7600665092468262} -08/30/2021 20:13:06 - INFO - __main__ - Step 38946: {'lr': 0.00042698295869509836, 'samples': 7477632, 'steps': 38945, 'loss/train': 1.1268936395645142} -08/30/2021 20:13:06 - INFO - __main__ - Step 38947: {'lr': 0.0004269792106037749, 'samples': 7477824, 'steps': 38946, 'loss/train': 0.8434619307518005} -08/30/2021 20:13:07 - INFO - __main__ - Step 38948: {'lr': 0.0004269754624327073, 'samples': 7478016, 'steps': 38947, 'loss/train': 1.2072659730911255} -08/30/2021 20:13:08 - INFO - __main__ - Step 38949: {'lr': 0.0004269717141818973, 'samples': 7478208, 'steps': 38948, 'loss/train': 2.111098527908325} -08/30/2021 20:13:08 - INFO - __main__ - Step 38950: {'lr': 0.0004269679658513466, 'samples': 7478400, 'steps': 38949, 'loss/train': 1.4043744802474976} -08/30/2021 20:13:08 - INFO - __main__ - Step 38951: {'lr': 0.00042696421744105686, 'samples': 7478592, 'steps': 38950, 'loss/train': 1.335856556892395} -08/30/2021 20:13:09 - INFO - __main__ - Step 38952: {'lr': 0.0004269604689510298, 'samples': 7478784, 'steps': 38951, 'loss/train': 1.4491199254989624} -08/30/2021 20:13:10 - INFO - __main__ - Step 38953: {'lr': 0.0004269567203812671, 'samples': 7478976, 'steps': 38952, 'loss/train': 1.7880336046218872} -08/30/2021 20:13:11 - INFO - __main__ - Step 38954: {'lr': 0.00042695297173177033, 'samples': 7479168, 'steps': 38953, 'loss/train': 2.1866867542266846} -08/30/2021 20:13:11 - INFO - __main__ - Step 38955: {'lr': 0.0004269492230025413, 'samples': 7479360, 'steps': 38954, 'loss/train': 1.1974194049835205} -08/30/2021 20:13:11 - INFO - __main__ - Step 38956: {'lr': 0.0004269454741935818, 'samples': 7479552, 'steps': 38955, 'loss/train': 1.2394767999649048} -08/30/2021 20:13:12 - INFO - __main__ - Step 38957: {'lr': 0.00042694172530489326, 'samples': 7479744, 'steps': 38956, 'loss/train': 1.0012314319610596} -08/30/2021 20:13:13 - INFO - __main__ - Step 38958: {'lr': 0.00042693797633647755, 'samples': 7479936, 'steps': 38957, 'loss/train': 1.2408217191696167} -08/30/2021 20:13:14 - INFO - __main__ - Step 38959: {'lr': 0.00042693422728833644, 'samples': 7480128, 'steps': 38958, 'loss/train': 1.2148038148880005} -08/30/2021 20:13:14 - INFO - __main__ - Step 38960: {'lr': 0.00042693047816047135, 'samples': 7480320, 'steps': 38959, 'loss/train': 0.929209291934967} -08/30/2021 20:13:14 - INFO - __main__ - Step 38961: {'lr': 0.0004269267289528842, 'samples': 7480512, 'steps': 38960, 'loss/train': 1.593306064605713} -08/30/2021 20:13:15 - INFO - __main__ - Step 38962: {'lr': 0.00042692297966557657, 'samples': 7480704, 'steps': 38961, 'loss/train': 1.6138441562652588} -08/30/2021 20:13:18 - INFO - __main__ - Step 38963: {'lr': 0.0004269192302985502, 'samples': 7480896, 'steps': 38962, 'loss/train': 1.0217334032058716} -08/30/2021 20:13:18 - INFO - __main__ - Step 38964: {'lr': 0.00042691548085180666, 'samples': 7481088, 'steps': 38963, 'loss/train': 1.1979821920394897} -08/30/2021 20:13:18 - INFO - __main__ - Step 38965: {'lr': 0.00042691173132534775, 'samples': 7481280, 'steps': 38964, 'loss/train': 1.181747317314148} -08/30/2021 20:13:19 - INFO - __main__ - Step 38966: {'lr': 0.0004269079817191752, 'samples': 7481472, 'steps': 38965, 'loss/train': 0.7483606934547424} -08/30/2021 20:13:19 - INFO - __main__ - Step 38967: {'lr': 0.00042690423203329067, 'samples': 7481664, 'steps': 38966, 'loss/train': 1.322017788887024} -08/30/2021 20:13:19 - INFO - __main__ - Step 38968: {'lr': 0.0004269004822676958, 'samples': 7481856, 'steps': 38967, 'loss/train': 1.121822476387024} -08/30/2021 20:13:21 - INFO - __main__ - Step 38969: {'lr': 0.0004268967324223922, 'samples': 7482048, 'steps': 38968, 'loss/train': 1.158146858215332} -08/30/2021 20:13:21 - INFO - __main__ - Step 38970: {'lr': 0.00042689298249738185, 'samples': 7482240, 'steps': 38969, 'loss/train': 1.3048549890518188} -08/30/2021 20:13:22 - INFO - __main__ - Step 38971: {'lr': 0.00042688923249266614, 'samples': 7482432, 'steps': 38970, 'loss/train': 1.3903834819793701} -08/30/2021 20:13:22 - INFO - __main__ - Step 38972: {'lr': 0.00042688548240824687, 'samples': 7482624, 'steps': 38971, 'loss/train': 1.5594826936721802} -08/30/2021 20:13:22 - INFO - __main__ - Step 38973: {'lr': 0.00042688173224412573, 'samples': 7482816, 'steps': 38972, 'loss/train': 1.3469113111495972} -08/30/2021 20:13:24 - INFO - __main__ - Step 38974: {'lr': 0.00042687798200030446, 'samples': 7483008, 'steps': 38973, 'loss/train': 0.8241060376167297} -08/30/2021 20:13:24 - INFO - __main__ - Step 38975: {'lr': 0.00042687423167678463, 'samples': 7483200, 'steps': 38974, 'loss/train': 1.3494739532470703} -08/30/2021 20:13:25 - INFO - __main__ - Step 38976: {'lr': 0.0004268704812735681, 'samples': 7483392, 'steps': 38975, 'loss/train': 1.4919968843460083} -08/30/2021 20:13:25 - INFO - __main__ - Step 38977: {'lr': 0.00042686673079065637, 'samples': 7483584, 'steps': 38976, 'loss/train': 1.9727466106414795} -08/30/2021 20:13:25 - INFO - __main__ - Step 38978: {'lr': 0.00042686298022805126, 'samples': 7483776, 'steps': 38977, 'loss/train': 1.2541768550872803} -08/30/2021 20:13:26 - INFO - __main__ - Step 38979: {'lr': 0.0004268592295857544, 'samples': 7483968, 'steps': 38978, 'loss/train': 1.2378605604171753} -08/30/2021 20:13:27 - INFO - __main__ - Step 38980: {'lr': 0.0004268554788637675, 'samples': 7484160, 'steps': 38979, 'loss/train': 1.3495855331420898} -08/30/2021 20:13:28 - INFO - __main__ - Step 38981: {'lr': 0.0004268517280620923, 'samples': 7484352, 'steps': 38980, 'loss/train': 1.540118932723999} -08/30/2021 20:13:28 - INFO - __main__ - Step 38982: {'lr': 0.0004268479771807303, 'samples': 7484544, 'steps': 38981, 'loss/train': 0.09688853472471237} -08/30/2021 20:13:28 - INFO - __main__ - Step 38983: {'lr': 0.00042684422621968346, 'samples': 7484736, 'steps': 38982, 'loss/train': 1.5230143070220947} -08/30/2021 20:13:29 - INFO - __main__ - Step 38984: {'lr': 0.0004268404751789533, 'samples': 7484928, 'steps': 38983, 'loss/train': 1.1378527879714966} -08/30/2021 20:13:30 - INFO - __main__ - Step 38985: {'lr': 0.0004268367240585416, 'samples': 7485120, 'steps': 38984, 'loss/train': 1.434148907661438} -08/30/2021 20:13:31 - INFO - __main__ - Step 38986: {'lr': 0.0004268329728584499, 'samples': 7485312, 'steps': 38985, 'loss/train': 0.058183636516332626} -08/30/2021 20:13:31 - INFO - __main__ - Step 38987: {'lr': 0.0004268292215786801, 'samples': 7485504, 'steps': 38986, 'loss/train': 1.881852626800537} -08/30/2021 20:13:32 - INFO - __main__ - Step 38988: {'lr': 0.0004268254702192337, 'samples': 7485696, 'steps': 38987, 'loss/train': 1.5401113033294678} -08/30/2021 20:13:32 - INFO - __main__ - Step 38989: {'lr': 0.00042682171878011255, 'samples': 7485888, 'steps': 38988, 'loss/train': 0.6354928016662598} -08/30/2021 20:13:34 - INFO - __main__ - Step 38990: {'lr': 0.00042681796726131815, 'samples': 7486080, 'steps': 38989, 'loss/train': 1.691983938217163} -08/30/2021 20:13:34 - INFO - __main__ - Step 38991: {'lr': 0.0004268142156628524, 'samples': 7486272, 'steps': 38990, 'loss/train': 1.2542545795440674} -08/30/2021 20:13:34 - INFO - __main__ - Step 38992: {'lr': 0.00042681046398471693, 'samples': 7486464, 'steps': 38991, 'loss/train': 1.1526399850845337} -08/30/2021 20:13:35 - INFO - __main__ - Step 38993: {'lr': 0.00042680671222691325, 'samples': 7486656, 'steps': 38992, 'loss/train': 2.0675790309906006} -08/30/2021 20:13:35 - INFO - __main__ - Step 38994: {'lr': 0.0004268029603894433, 'samples': 7486848, 'steps': 38993, 'loss/train': 1.9092001914978027} -08/30/2021 20:13:37 - INFO - __main__ - Step 38995: {'lr': 0.00042679920847230865, 'samples': 7487040, 'steps': 38994, 'loss/train': 1.5690864324569702} -08/30/2021 20:13:37 - INFO - __main__ - Step 38996: {'lr': 0.000426795456475511, 'samples': 7487232, 'steps': 38995, 'loss/train': 1.309863805770874} -08/30/2021 20:13:37 - INFO - __main__ - Step 38997: {'lr': 0.00042679170439905204, 'samples': 7487424, 'steps': 38996, 'loss/train': 1.4097307920455933} -08/30/2021 20:13:38 - INFO - __main__ - Step 38998: {'lr': 0.0004267879522429334, 'samples': 7487616, 'steps': 38997, 'loss/train': 0.8415262699127197} -08/30/2021 20:13:38 - INFO - __main__ - Step 38999: {'lr': 0.00042678420000715687, 'samples': 7487808, 'steps': 38998, 'loss/train': 1.4544283151626587} -08/30/2021 20:13:40 - INFO - __main__ - Step 39000: {'lr': 0.0004267804476917242, 'samples': 7488000, 'steps': 38999, 'loss/train': 1.2814282178878784} -08/30/2021 20:13:40 - INFO - __main__ - Step 39001: {'lr': 0.00042677669529663686, 'samples': 7488192, 'steps': 39000, 'loss/train': 1.3801774978637695} -08/30/2021 20:13:40 - INFO - __main__ - Step 39002: {'lr': 0.0004267729428218968, 'samples': 7488384, 'steps': 39001, 'loss/train': 1.5354958772659302} -08/30/2021 20:13:41 - INFO - __main__ - Step 39003: {'lr': 0.0004267691902675055, 'samples': 7488576, 'steps': 39002, 'loss/train': 1.7666679620742798} -08/30/2021 20:13:41 - INFO - __main__ - Step 39004: {'lr': 0.0004267654376334647, 'samples': 7488768, 'steps': 39003, 'loss/train': 1.3279566764831543} -08/30/2021 20:13:41 - INFO - __main__ - Step 39005: {'lr': 0.00042676168491977617, 'samples': 7488960, 'steps': 39004, 'loss/train': 1.5926154851913452} -08/30/2021 20:13:43 - INFO - __main__ - Step 39006: {'lr': 0.00042675793212644156, 'samples': 7489152, 'steps': 39005, 'loss/train': 1.590686321258545} -08/30/2021 20:13:43 - INFO - __main__ - Step 39007: {'lr': 0.00042675417925346255, 'samples': 7489344, 'steps': 39006, 'loss/train': 2.3390822410583496} -08/30/2021 20:13:44 - INFO - __main__ - Step 39008: {'lr': 0.0004267504263008408, 'samples': 7489536, 'steps': 39007, 'loss/train': 1.6897366046905518} -08/30/2021 20:13:44 - INFO - __main__ - Step 39009: {'lr': 0.0004267466732685781, 'samples': 7489728, 'steps': 39008, 'loss/train': 1.3430382013320923} -08/30/2021 20:13:44 - INFO - __main__ - Step 39010: {'lr': 0.000426742920156676, 'samples': 7489920, 'steps': 39009, 'loss/train': 1.7711538076400757} -08/30/2021 20:13:46 - INFO - __main__ - Step 39011: {'lr': 0.00042673916696513625, 'samples': 7490112, 'steps': 39010, 'loss/train': 1.4898557662963867} -08/30/2021 20:13:46 - INFO - __main__ - Step 39012: {'lr': 0.0004267354136939607, 'samples': 7490304, 'steps': 39011, 'loss/train': 1.4680469036102295} -08/30/2021 20:13:47 - INFO - __main__ - Step 39013: {'lr': 0.0004267316603431508, 'samples': 7490496, 'steps': 39012, 'loss/train': 1.5781192779541016} -08/30/2021 20:13:47 - INFO - __main__ - Step 39014: {'lr': 0.00042672790691270835, 'samples': 7490688, 'steps': 39013, 'loss/train': 1.2442946434020996} -08/30/2021 20:13:48 - INFO - __main__ - Step 39015: {'lr': 0.00042672415340263507, 'samples': 7490880, 'steps': 39014, 'loss/train': 1.6976791620254517} -08/30/2021 20:13:49 - INFO - __main__ - Step 39016: {'lr': 0.00042672039981293255, 'samples': 7491072, 'steps': 39015, 'loss/train': 1.614533543586731} -08/30/2021 20:13:50 - INFO - __main__ - Step 39017: {'lr': 0.0004267166461436025, 'samples': 7491264, 'steps': 39016, 'loss/train': 1.3815348148345947} -08/30/2021 20:13:50 - INFO - __main__ - Step 39018: {'lr': 0.0004267128923946468, 'samples': 7491456, 'steps': 39017, 'loss/train': 1.6059067249298096} -08/30/2021 20:13:51 - INFO - __main__ - Step 39019: {'lr': 0.00042670913856606693, 'samples': 7491648, 'steps': 39018, 'loss/train': 1.1394164562225342} -08/30/2021 20:13:51 - INFO - __main__ - Step 39020: {'lr': 0.0004267053846578646, 'samples': 7491840, 'steps': 39019, 'loss/train': 1.4777863025665283} -08/30/2021 20:13:52 - INFO - __main__ - Step 39021: {'lr': 0.00042670163067004156, 'samples': 7492032, 'steps': 39020, 'loss/train': 1.1149781942367554} -08/30/2021 20:13:53 - INFO - __main__ - Step 39022: {'lr': 0.00042669787660259956, 'samples': 7492224, 'steps': 39021, 'loss/train': 0.8894286155700684} -08/30/2021 20:13:53 - INFO - __main__ - Step 39023: {'lr': 0.0004266941224555402, 'samples': 7492416, 'steps': 39022, 'loss/train': 2.54011869430542} -08/30/2021 20:13:54 - INFO - __main__ - Step 39024: {'lr': 0.0004266903682288652, 'samples': 7492608, 'steps': 39023, 'loss/train': 1.3905818462371826} -08/30/2021 20:13:54 - INFO - __main__ - Step 39025: {'lr': 0.00042668661392257626, 'samples': 7492800, 'steps': 39024, 'loss/train': 1.6680063009262085} -08/30/2021 20:13:56 - INFO - __main__ - Step 39026: {'lr': 0.00042668285953667497, 'samples': 7492992, 'steps': 39025, 'loss/train': 1.1222834587097168} -08/30/2021 20:13:56 - INFO - __main__ - Step 39027: {'lr': 0.0004266791050711632, 'samples': 7493184, 'steps': 39026, 'loss/train': 1.3310561180114746} -08/30/2021 20:13:56 - INFO - __main__ - Step 39028: {'lr': 0.0004266753505260425, 'samples': 7493376, 'steps': 39027, 'loss/train': 1.7979142665863037} -08/30/2021 20:13:57 - INFO - __main__ - Step 39029: {'lr': 0.00042667159590131467, 'samples': 7493568, 'steps': 39028, 'loss/train': 1.5943289995193481} -08/30/2021 20:13:57 - INFO - __main__ - Step 39030: {'lr': 0.0004266678411969813, 'samples': 7493760, 'steps': 39029, 'loss/train': 1.3485994338989258} -08/30/2021 20:13:59 - INFO - __main__ - Step 39031: {'lr': 0.0004266640864130441, 'samples': 7493952, 'steps': 39030, 'loss/train': 1.3079279661178589} -08/30/2021 20:13:59 - INFO - __main__ - Step 39032: {'lr': 0.00042666033154950485, 'samples': 7494144, 'steps': 39031, 'loss/train': 1.6716195344924927} -08/30/2021 20:13:59 - INFO - __main__ - Step 39033: {'lr': 0.00042665657660636517, 'samples': 7494336, 'steps': 39032, 'loss/train': 1.573898196220398} -08/30/2021 20:14:00 - INFO - __main__ - Step 39034: {'lr': 0.0004266528215836267, 'samples': 7494528, 'steps': 39033, 'loss/train': 1.597040057182312} -08/30/2021 20:14:00 - INFO - __main__ - Step 39035: {'lr': 0.0004266490664812913, 'samples': 7494720, 'steps': 39034, 'loss/train': 1.586173176765442} -08/30/2021 20:14:01 - INFO - __main__ - Step 39036: {'lr': 0.00042664531129936044, 'samples': 7494912, 'steps': 39035, 'loss/train': 1.112544298171997} -08/30/2021 20:14:02 - INFO - __main__ - Step 39037: {'lr': 0.00042664155603783606, 'samples': 7495104, 'steps': 39036, 'loss/train': 1.3590707778930664} -08/30/2021 20:14:03 - INFO - __main__ - Step 39038: {'lr': 0.00042663780069671965, 'samples': 7495296, 'steps': 39037, 'loss/train': 2.1780588626861572} -08/30/2021 20:14:03 - INFO - __main__ - Step 39039: {'lr': 0.00042663404527601293, 'samples': 7495488, 'steps': 39038, 'loss/train': 0.46188870072364807} -08/30/2021 20:14:03 - INFO - __main__ - Step 39040: {'lr': 0.00042663028977571774, 'samples': 7495680, 'steps': 39039, 'loss/train': 1.2312473058700562} -08/30/2021 20:14:04 - INFO - __main__ - Step 39041: {'lr': 0.0004266265341958355, 'samples': 7495872, 'steps': 39040, 'loss/train': 1.8984804153442383} -08/30/2021 20:14:05 - INFO - __main__ - Step 39042: {'lr': 0.0004266227785363682, 'samples': 7496064, 'steps': 39041, 'loss/train': 1.8092193603515625} -08/30/2021 20:14:05 - INFO - __main__ - Step 39043: {'lr': 0.0004266190227973174, 'samples': 7496256, 'steps': 39042, 'loss/train': 1.4890114068984985} -08/30/2021 20:14:06 - INFO - __main__ - Step 39044: {'lr': 0.00042661526697868475, 'samples': 7496448, 'steps': 39043, 'loss/train': 0.5905696153640747} -08/30/2021 20:14:06 - INFO - __main__ - Step 39045: {'lr': 0.000426611511080472, 'samples': 7496640, 'steps': 39044, 'loss/train': 1.751371145248413} -08/30/2021 20:14:06 - INFO - __main__ - Step 39046: {'lr': 0.0004266077551026809, 'samples': 7496832, 'steps': 39045, 'loss/train': 1.410527229309082} -08/30/2021 20:14:08 - INFO - __main__ - Step 39047: {'lr': 0.000426603999045313, 'samples': 7497024, 'steps': 39046, 'loss/train': 1.6472623348236084} -08/30/2021 20:14:09 - INFO - __main__ - Step 39048: {'lr': 0.00042660024290837003, 'samples': 7497216, 'steps': 39047, 'loss/train': 0.04206864535808563} -08/30/2021 20:14:09 - INFO - __main__ - Step 39049: {'lr': 0.00042659648669185376, 'samples': 7497408, 'steps': 39048, 'loss/train': 1.561629056930542} -08/30/2021 20:14:09 - INFO - __main__ - Step 39050: {'lr': 0.0004265927303957658, 'samples': 7497600, 'steps': 39049, 'loss/train': 1.5536412000656128} -08/30/2021 20:14:10 - INFO - __main__ - Step 39051: {'lr': 0.0004265889740201079, 'samples': 7497792, 'steps': 39050, 'loss/train': 1.8471053838729858} -08/30/2021 20:14:10 - INFO - __main__ - Step 39052: {'lr': 0.0004265852175648818, 'samples': 7497984, 'steps': 39051, 'loss/train': 1.4708019495010376} -08/30/2021 20:14:12 - INFO - __main__ - Step 39053: {'lr': 0.00042658146103008904, 'samples': 7498176, 'steps': 39052, 'loss/train': 1.2126667499542236} -08/30/2021 20:14:13 - INFO - __main__ - Step 39054: {'lr': 0.0004265777044157314, 'samples': 7498368, 'steps': 39053, 'loss/train': 1.099593162536621} -08/30/2021 20:14:13 - INFO - __main__ - Step 39055: {'lr': 0.0004265739477218106, 'samples': 7498560, 'steps': 39054, 'loss/train': 1.913072943687439} -08/30/2021 20:14:13 - INFO - __main__ - Step 39056: {'lr': 0.0004265701909483283, 'samples': 7498752, 'steps': 39055, 'loss/train': 1.4912137985229492} -08/30/2021 20:14:14 - INFO - __main__ - Step 39057: {'lr': 0.0004265664340952862, 'samples': 7498944, 'steps': 39056, 'loss/train': 1.2456638813018799} -08/30/2021 20:14:15 - INFO - __main__ - Step 39058: {'lr': 0.00042656267716268596, 'samples': 7499136, 'steps': 39057, 'loss/train': 0.7144192457199097} -08/30/2021 20:14:16 - INFO - __main__ - Step 39059: {'lr': 0.00042655892015052945, 'samples': 7499328, 'steps': 39058, 'loss/train': 1.4376308917999268} -08/30/2021 20:14:16 - INFO - __main__ - Step 39060: {'lr': 0.00042655516305881803, 'samples': 7499520, 'steps': 39059, 'loss/train': 1.449514389038086} -08/30/2021 20:14:16 - INFO - __main__ - Step 39061: {'lr': 0.00042655140588755366, 'samples': 7499712, 'steps': 39060, 'loss/train': 1.37236750125885} -08/30/2021 20:14:17 - INFO - __main__ - Step 39062: {'lr': 0.0004265476486367379, 'samples': 7499904, 'steps': 39061, 'loss/train': 1.8755433559417725} -08/30/2021 20:14:17 - INFO - __main__ - Step 39063: {'lr': 0.00042654389130637255, 'samples': 7500096, 'steps': 39062, 'loss/train': 1.4207885265350342} -08/30/2021 20:14:19 - INFO - __main__ - Step 39064: {'lr': 0.0004265401338964592, 'samples': 7500288, 'steps': 39063, 'loss/train': 1.5218433141708374} -08/30/2021 20:14:19 - INFO - __main__ - Step 39065: {'lr': 0.0004265363764069997, 'samples': 7500480, 'steps': 39064, 'loss/train': 1.3951611518859863} -08/30/2021 20:14:20 - INFO - __main__ - Step 39066: {'lr': 0.0004265326188379955, 'samples': 7500672, 'steps': 39065, 'loss/train': 1.4596272706985474} -08/30/2021 20:14:20 - INFO - __main__ - Step 39067: {'lr': 0.00042652886118944844, 'samples': 7500864, 'steps': 39066, 'loss/train': 1.3833550214767456} -08/30/2021 20:14:20 - INFO - __main__ - Step 39068: {'lr': 0.0004265251034613603, 'samples': 7501056, 'steps': 39067, 'loss/train': 1.3588005304336548} -08/30/2021 20:14:22 - INFO - __main__ - Step 39069: {'lr': 0.0004265213456537326, 'samples': 7501248, 'steps': 39068, 'loss/train': 1.6298719644546509} -08/30/2021 20:14:23 - INFO - __main__ - Step 39070: {'lr': 0.0004265175877665671, 'samples': 7501440, 'steps': 39069, 'loss/train': 1.5082911252975464} -08/30/2021 20:14:23 - INFO - __main__ - Step 39071: {'lr': 0.0004265138297998655, 'samples': 7501632, 'steps': 39070, 'loss/train': 1.578966498374939} -08/30/2021 20:14:23 - INFO - __main__ - Step 39072: {'lr': 0.0004265100717536295, 'samples': 7501824, 'steps': 39071, 'loss/train': 0.1390034556388855} -08/30/2021 20:14:24 - INFO - __main__ - Step 39073: {'lr': 0.0004265063136278608, 'samples': 7502016, 'steps': 39072, 'loss/train': 0.05011961981654167} -08/30/2021 20:14:26 - INFO - __main__ - Step 39074: {'lr': 0.00042650255542256107, 'samples': 7502208, 'steps': 39073, 'loss/train': 1.4226551055908203} -08/30/2021 20:14:26 - INFO - __main__ - Step 39075: {'lr': 0.000426498797137732, 'samples': 7502400, 'steps': 39074, 'loss/train': 1.2472825050354004} -08/30/2021 20:14:27 - INFO - __main__ - Step 39076: {'lr': 0.00042649503877337523, 'samples': 7502592, 'steps': 39075, 'loss/train': 2.1044628620147705} -08/30/2021 20:14:27 - INFO - __main__ - Step 39077: {'lr': 0.0004264912803294926, 'samples': 7502784, 'steps': 39076, 'loss/train': 1.8073034286499023} -08/30/2021 20:14:27 - INFO - __main__ - Step 39078: {'lr': 0.0004264875218060857, 'samples': 7502976, 'steps': 39077, 'loss/train': 1.684946894645691} -08/30/2021 20:14:29 - INFO - __main__ - Step 39079: {'lr': 0.00042648376320315634, 'samples': 7503168, 'steps': 39078, 'loss/train': 1.5687719583511353} -08/30/2021 20:14:29 - INFO - __main__ - Step 39080: {'lr': 0.000426480004520706, 'samples': 7503360, 'steps': 39079, 'loss/train': 0.0665900930762291} -08/30/2021 20:14:29 - INFO - __main__ - Step 39081: {'lr': 0.00042647624575873656, 'samples': 7503552, 'steps': 39080, 'loss/train': 1.672710657119751} -08/30/2021 20:14:30 - INFO - __main__ - Step 39082: {'lr': 0.0004264724869172496, 'samples': 7503744, 'steps': 39081, 'loss/train': 1.476485013961792} -08/30/2021 20:14:30 - INFO - __main__ - Step 39083: {'lr': 0.00042646872799624694, 'samples': 7503936, 'steps': 39082, 'loss/train': 1.4662269353866577} -08/30/2021 20:14:32 - INFO - __main__ - Step 39084: {'lr': 0.00042646496899573005, 'samples': 7504128, 'steps': 39083, 'loss/train': 1.0886486768722534} -08/30/2021 20:14:32 - INFO - __main__ - Step 39085: {'lr': 0.0004264612099157009, 'samples': 7504320, 'steps': 39084, 'loss/train': 1.6391215324401855} -08/30/2021 20:14:32 - INFO - __main__ - Step 39086: {'lr': 0.00042645745075616106, 'samples': 7504512, 'steps': 39085, 'loss/train': 1.3249776363372803} -08/30/2021 20:14:33 - INFO - __main__ - Step 39087: {'lr': 0.0004264536915171121, 'samples': 7504704, 'steps': 39086, 'loss/train': 0.7305589318275452} -08/30/2021 20:14:33 - INFO - __main__ - Step 39088: {'lr': 0.0004264499321985559, 'samples': 7504896, 'steps': 39087, 'loss/train': 1.3197695016860962} -08/30/2021 20:14:35 - INFO - __main__ - Step 39089: {'lr': 0.0004264461728004941, 'samples': 7505088, 'steps': 39088, 'loss/train': 0.15367215871810913} -08/30/2021 20:14:35 - INFO - __main__ - Step 39090: {'lr': 0.0004264424133229283, 'samples': 7505280, 'steps': 39089, 'loss/train': 1.4112424850463867} -08/30/2021 20:14:35 - INFO - __main__ - Step 39091: {'lr': 0.0004264386537658603, 'samples': 7505472, 'steps': 39090, 'loss/train': 1.0174434185028076} -08/30/2021 20:14:36 - INFO - __main__ - Step 39092: {'lr': 0.0004264348941292919, 'samples': 7505664, 'steps': 39091, 'loss/train': 0.962507426738739} -08/30/2021 20:14:36 - INFO - __main__ - Step 39093: {'lr': 0.0004264311344132245, 'samples': 7505856, 'steps': 39092, 'loss/train': 1.2160069942474365} -08/30/2021 20:14:37 - INFO - __main__ - Step 39094: {'lr': 0.00042642737461766003, 'samples': 7506048, 'steps': 39093, 'loss/train': 1.3217370510101318} -08/30/2021 20:14:38 - INFO - __main__ - Step 39095: {'lr': 0.0004264236147426, 'samples': 7506240, 'steps': 39094, 'loss/train': 1.3808517456054688} -08/30/2021 20:14:39 - INFO - __main__ - Step 39096: {'lr': 0.0004264198547880464, 'samples': 7506432, 'steps': 39095, 'loss/train': 1.059320092201233} -08/30/2021 20:14:39 - INFO - __main__ - Step 39097: {'lr': 0.00042641609475400054, 'samples': 7506624, 'steps': 39096, 'loss/train': 1.7606483697891235} -08/30/2021 20:14:39 - INFO - __main__ - Step 39098: {'lr': 0.0004264123346404644, 'samples': 7506816, 'steps': 39097, 'loss/train': 1.3320167064666748} -08/30/2021 20:14:40 - INFO - __main__ - Step 39099: {'lr': 0.0004264085744474396, 'samples': 7507008, 'steps': 39098, 'loss/train': 1.9074100255966187} -08/30/2021 20:14:41 - INFO - __main__ - Step 39100: {'lr': 0.0004264048141749278, 'samples': 7507200, 'steps': 39099, 'loss/train': 1.4979037046432495} -08/30/2021 20:14:42 - INFO - __main__ - Step 39101: {'lr': 0.00042640105382293073, 'samples': 7507392, 'steps': 39100, 'loss/train': 0.907530665397644} -08/30/2021 20:14:42 - INFO - __main__ - Step 39102: {'lr': 0.00042639729339145004, 'samples': 7507584, 'steps': 39101, 'loss/train': 0.15617690980434418} -08/30/2021 20:14:43 - INFO - __main__ - Step 39103: {'lr': 0.0004263935328804874, 'samples': 7507776, 'steps': 39102, 'loss/train': 0.2130056768655777} -08/30/2021 20:14:43 - INFO - __main__ - Step 39104: {'lr': 0.0004263897722900447, 'samples': 7507968, 'steps': 39103, 'loss/train': 1.9279919862747192} -08/30/2021 20:14:43 - INFO - __main__ - Step 39105: {'lr': 0.0004263860116201234, 'samples': 7508160, 'steps': 39104, 'loss/train': 1.8019262552261353} -08/30/2021 20:14:45 - INFO - __main__ - Step 39106: {'lr': 0.00042638225087072523, 'samples': 7508352, 'steps': 39105, 'loss/train': 1.7949875593185425} -08/30/2021 20:14:45 - INFO - __main__ - Step 39107: {'lr': 0.00042637849004185203, 'samples': 7508544, 'steps': 39106, 'loss/train': 1.3953295946121216} -08/30/2021 20:14:46 - INFO - __main__ - Step 39108: {'lr': 0.0004263747291335054, 'samples': 7508736, 'steps': 39107, 'loss/train': 1.1228476762771606} -08/30/2021 20:14:46 - INFO - __main__ - Step 39109: {'lr': 0.00042637096814568696, 'samples': 7508928, 'steps': 39108, 'loss/train': 1.1814470291137695} -08/30/2021 20:14:46 - INFO - __main__ - Step 39110: {'lr': 0.0004263672070783986, 'samples': 7509120, 'steps': 39109, 'loss/train': 1.302478551864624} -08/30/2021 20:14:48 - INFO - __main__ - Step 39111: {'lr': 0.0004263634459316418, 'samples': 7509312, 'steps': 39110, 'loss/train': 1.102424144744873} -08/30/2021 20:14:48 - INFO - __main__ - Step 39112: {'lr': 0.0004263596847054184, 'samples': 7509504, 'steps': 39111, 'loss/train': 1.7552907466888428} -08/30/2021 20:14:49 - INFO - __main__ - Step 39113: {'lr': 0.00042635592339973006, 'samples': 7509696, 'steps': 39112, 'loss/train': 1.0346333980560303} -08/30/2021 20:14:49 - INFO - __main__ - Step 39114: {'lr': 0.00042635216201457836, 'samples': 7509888, 'steps': 39113, 'loss/train': 1.3420451879501343} -08/30/2021 20:14:49 - INFO - __main__ - Step 39115: {'lr': 0.00042634840054996527, 'samples': 7510080, 'steps': 39114, 'loss/train': 2.001659631729126} -08/30/2021 20:14:50 - INFO - __main__ - Step 39116: {'lr': 0.00042634463900589214, 'samples': 7510272, 'steps': 39115, 'loss/train': 1.4357761144638062} -08/30/2021 20:14:51 - INFO - __main__ - Step 39117: {'lr': 0.0004263408773823609, 'samples': 7510464, 'steps': 39116, 'loss/train': 0.5859894752502441} -08/30/2021 20:14:51 - INFO - __main__ - Step 39118: {'lr': 0.00042633711567937325, 'samples': 7510656, 'steps': 39117, 'loss/train': 1.568800449371338} -08/30/2021 20:14:52 - INFO - __main__ - Step 39119: {'lr': 0.00042633335389693073, 'samples': 7510848, 'steps': 39118, 'loss/train': 1.540902018547058} -08/30/2021 20:14:52 - INFO - __main__ - Step 39120: {'lr': 0.0004263295920350352, 'samples': 7511040, 'steps': 39119, 'loss/train': 1.9303350448608398} -08/30/2021 20:14:52 - INFO - __main__ - Step 39121: {'lr': 0.0004263258300936882, 'samples': 7511232, 'steps': 39120, 'loss/train': 1.1475542783737183} -08/30/2021 20:14:54 - INFO - __main__ - Step 39122: {'lr': 0.00042632206807289154, 'samples': 7511424, 'steps': 39121, 'loss/train': 1.180432677268982} -08/30/2021 20:14:55 - INFO - __main__ - Step 39123: {'lr': 0.00042631830597264687, 'samples': 7511616, 'steps': 39122, 'loss/train': 1.460362195968628} -08/30/2021 20:14:55 - INFO - __main__ - Step 39124: {'lr': 0.0004263145437929559, 'samples': 7511808, 'steps': 39123, 'loss/train': 0.7202699184417725} -08/30/2021 20:14:55 - INFO - __main__ - Step 39125: {'lr': 0.0004263107815338203, 'samples': 7512000, 'steps': 39124, 'loss/train': 1.0189943313598633} -08/30/2021 20:14:56 - INFO - __main__ - Step 39126: {'lr': 0.00042630701919524176, 'samples': 7512192, 'steps': 39125, 'loss/train': 2.0857889652252197} -08/30/2021 20:14:58 - INFO - __main__ - Step 39127: {'lr': 0.00042630325677722204, 'samples': 7512384, 'steps': 39126, 'loss/train': 0.7416525483131409} -08/30/2021 20:14:58 - INFO - __main__ - Step 39128: {'lr': 0.0004262994942797628, 'samples': 7512576, 'steps': 39127, 'loss/train': 1.3737872838974} -08/30/2021 20:14:59 - INFO - __main__ - Step 39129: {'lr': 0.0004262957317028657, 'samples': 7512768, 'steps': 39128, 'loss/train': 1.5676079988479614} -08/30/2021 20:14:59 - INFO - __main__ - Step 39130: {'lr': 0.00042629196904653245, 'samples': 7512960, 'steps': 39129, 'loss/train': 0.9293034076690674} -08/30/2021 20:14:59 - INFO - __main__ - Step 39131: {'lr': 0.00042628820631076484, 'samples': 7513152, 'steps': 39130, 'loss/train': 0.6962493062019348} -08/30/2021 20:15:00 - INFO - __main__ - Step 39132: {'lr': 0.0004262844434955644, 'samples': 7513344, 'steps': 39131, 'loss/train': 1.7585588693618774} -08/30/2021 20:15:02 - INFO - __main__ - Step 39133: {'lr': 0.00042628068060093294, 'samples': 7513536, 'steps': 39132, 'loss/train': 1.7021483182907104} -08/30/2021 20:15:02 - INFO - __main__ - Step 39134: {'lr': 0.0004262769176268722, 'samples': 7513728, 'steps': 39133, 'loss/train': 1.4474977254867554} -08/30/2021 20:15:02 - INFO - __main__ - Step 39135: {'lr': 0.0004262731545733837, 'samples': 7513920, 'steps': 39134, 'loss/train': 1.8324302434921265} -08/30/2021 20:15:03 - INFO - __main__ - Step 39136: {'lr': 0.0004262693914404692, 'samples': 7514112, 'steps': 39135, 'loss/train': 1.6235870122909546} -08/30/2021 20:15:03 - INFO - __main__ - Step 39137: {'lr': 0.0004262656282281305, 'samples': 7514304, 'steps': 39136, 'loss/train': 1.699751615524292} -08/30/2021 20:15:05 - INFO - __main__ - Step 39138: {'lr': 0.0004262618649363692, 'samples': 7514496, 'steps': 39137, 'loss/train': 3.4799325466156006} -08/30/2021 20:15:05 - INFO - __main__ - Step 39139: {'lr': 0.0004262581015651871, 'samples': 7514688, 'steps': 39138, 'loss/train': 1.3937004804611206} -08/30/2021 20:15:06 - INFO - __main__ - Step 39140: {'lr': 0.0004262543381145857, 'samples': 7514880, 'steps': 39139, 'loss/train': 1.8962650299072266} -08/30/2021 20:15:06 - INFO - __main__ - Step 39141: {'lr': 0.0004262505745845669, 'samples': 7515072, 'steps': 39140, 'loss/train': 0.09406972676515579} -08/30/2021 20:15:06 - INFO - __main__ - Step 39142: {'lr': 0.0004262468109751323, 'samples': 7515264, 'steps': 39141, 'loss/train': 2.190310001373291} -08/30/2021 20:15:08 - INFO - __main__ - Step 39143: {'lr': 0.0004262430472862836, 'samples': 7515456, 'steps': 39142, 'loss/train': 1.079997181892395} -08/30/2021 20:15:08 - INFO - __main__ - Step 39144: {'lr': 0.00042623928351802245, 'samples': 7515648, 'steps': 39143, 'loss/train': 1.3742101192474365} -08/30/2021 20:15:09 - INFO - __main__ - Step 39145: {'lr': 0.00042623551967035066, 'samples': 7515840, 'steps': 39144, 'loss/train': 1.6789116859436035} -08/30/2021 20:15:09 - INFO - __main__ - Step 39146: {'lr': 0.0004262317557432699, 'samples': 7516032, 'steps': 39145, 'loss/train': 2.3123044967651367} -08/30/2021 20:15:09 - INFO - __main__ - Step 39147: {'lr': 0.0004262279917367817, 'samples': 7516224, 'steps': 39146, 'loss/train': 1.5434142351150513} -08/30/2021 20:15:10 - INFO - __main__ - Step 39148: {'lr': 0.00042622422765088805, 'samples': 7516416, 'steps': 39147, 'loss/train': 1.468110203742981} -08/30/2021 20:15:11 - INFO - __main__ - Step 39149: {'lr': 0.00042622046348559034, 'samples': 7516608, 'steps': 39148, 'loss/train': 1.066454291343689} -08/30/2021 20:15:12 - INFO - __main__ - Step 39150: {'lr': 0.00042621669924089044, 'samples': 7516800, 'steps': 39149, 'loss/train': 1.9181402921676636} -08/30/2021 20:15:12 - INFO - __main__ - Step 39151: {'lr': 0.00042621293491679007, 'samples': 7516992, 'steps': 39150, 'loss/train': 1.5696115493774414} -08/30/2021 20:15:12 - INFO - __main__ - Step 39152: {'lr': 0.00042620917051329086, 'samples': 7517184, 'steps': 39151, 'loss/train': 1.254530668258667} -08/30/2021 20:15:13 - INFO - __main__ - Step 39153: {'lr': 0.0004262054060303945, 'samples': 7517376, 'steps': 39152, 'loss/train': 1.6173115968704224} -08/30/2021 20:15:14 - INFO - __main__ - Step 39154: {'lr': 0.00042620164146810267, 'samples': 7517568, 'steps': 39153, 'loss/train': 1.3876872062683105} -08/30/2021 20:15:15 - INFO - __main__ - Step 39155: {'lr': 0.0004261978768264172, 'samples': 7517760, 'steps': 39154, 'loss/train': 1.2458218336105347} -08/30/2021 20:15:15 - INFO - __main__ - Step 39156: {'lr': 0.00042619411210533957, 'samples': 7517952, 'steps': 39155, 'loss/train': 1.3571326732635498} -08/30/2021 20:15:15 - INFO - __main__ - Step 39157: {'lr': 0.00042619034730487167, 'samples': 7518144, 'steps': 39156, 'loss/train': 0.08076008409261703} -08/30/2021 20:15:16 - INFO - __main__ - Step 39158: {'lr': 0.00042618658242501507, 'samples': 7518336, 'steps': 39157, 'loss/train': 1.8906840085983276} -08/30/2021 20:15:17 - INFO - __main__ - Step 39159: {'lr': 0.0004261828174657716, 'samples': 7518528, 'steps': 39158, 'loss/train': 0.06880287081003189} -08/30/2021 20:15:18 - INFO - __main__ - Step 39160: {'lr': 0.0004261790524271427, 'samples': 7518720, 'steps': 39159, 'loss/train': 1.4318112134933472} -08/30/2021 20:15:18 - INFO - __main__ - Step 39161: {'lr': 0.00042617528730913036, 'samples': 7518912, 'steps': 39160, 'loss/train': 1.2938989400863647} -08/30/2021 20:15:19 - INFO - __main__ - Step 39162: {'lr': 0.00042617152211173615, 'samples': 7519104, 'steps': 39161, 'loss/train': 1.4352787733078003} -08/30/2021 20:15:19 - INFO - __main__ - Step 39163: {'lr': 0.0004261677568349618, 'samples': 7519296, 'steps': 39162, 'loss/train': 1.2439548969268799} -08/30/2021 20:15:20 - INFO - __main__ - Step 39164: {'lr': 0.0004261639914788089, 'samples': 7519488, 'steps': 39163, 'loss/train': 1.2463551759719849} -08/30/2021 20:15:21 - INFO - __main__ - Step 39165: {'lr': 0.0004261602260432792, 'samples': 7519680, 'steps': 39164, 'loss/train': 1.2323464155197144} -08/30/2021 20:15:21 - INFO - __main__ - Step 39166: {'lr': 0.0004261564605283745, 'samples': 7519872, 'steps': 39165, 'loss/train': 1.5970195531845093} -08/30/2021 20:15:22 - INFO - __main__ - Step 39167: {'lr': 0.0004261526949340965, 'samples': 7520064, 'steps': 39166, 'loss/train': 1.86358642578125} -08/30/2021 20:15:22 - INFO - __main__ - Step 39168: {'lr': 0.0004261489292604467, 'samples': 7520256, 'steps': 39167, 'loss/train': 1.248688817024231} -08/30/2021 20:15:23 - INFO - __main__ - Step 39169: {'lr': 0.0004261451635074269, 'samples': 7520448, 'steps': 39168, 'loss/train': 1.2779831886291504} -08/30/2021 20:15:24 - INFO - __main__ - Step 39170: {'lr': 0.0004261413976750388, 'samples': 7520640, 'steps': 39169, 'loss/train': 1.563864827156067} -08/30/2021 20:15:24 - INFO - __main__ - Step 39171: {'lr': 0.00042613763176328415, 'samples': 7520832, 'steps': 39170, 'loss/train': 1.3924736976623535} -08/30/2021 20:15:24 - INFO - __main__ - Step 39172: {'lr': 0.00042613386577216455, 'samples': 7521024, 'steps': 39171, 'loss/train': 1.9655263423919678} -08/30/2021 20:15:25 - INFO - __main__ - Step 39173: {'lr': 0.0004261300997016818, 'samples': 7521216, 'steps': 39172, 'loss/train': 0.9479031562805176} -08/30/2021 20:15:26 - INFO - __main__ - Step 39174: {'lr': 0.0004261263335518375, 'samples': 7521408, 'steps': 39173, 'loss/train': 1.9122108221054077} -08/30/2021 20:15:27 - INFO - __main__ - Step 39175: {'lr': 0.00042612256732263345, 'samples': 7521600, 'steps': 39174, 'loss/train': 1.4972925186157227} -08/30/2021 20:15:27 - INFO - __main__ - Step 39176: {'lr': 0.0004261188010140712, 'samples': 7521792, 'steps': 39175, 'loss/train': 1.7078129053115845} -08/30/2021 20:15:27 - INFO - __main__ - Step 39177: {'lr': 0.00042611503462615266, 'samples': 7521984, 'steps': 39176, 'loss/train': 1.2863445281982422} -08/30/2021 20:15:28 - INFO - __main__ - Step 39178: {'lr': 0.0004261112681588793, 'samples': 7522176, 'steps': 39177, 'loss/train': 1.2235257625579834} -08/30/2021 20:15:30 - INFO - __main__ - Step 39179: {'lr': 0.000426107501612253, 'samples': 7522368, 'steps': 39178, 'loss/train': 2.2244679927825928} -08/30/2021 20:15:31 - INFO - __main__ - Step 39180: {'lr': 0.0004261037349862753, 'samples': 7522560, 'steps': 39179, 'loss/train': 1.0812623500823975} -08/30/2021 20:15:31 - INFO - __main__ - Step 39181: {'lr': 0.000426099968280948, 'samples': 7522752, 'steps': 39180, 'loss/train': 0.9474536180496216} -08/30/2021 20:15:31 - INFO - __main__ - Step 39182: {'lr': 0.00042609620149627284, 'samples': 7522944, 'steps': 39181, 'loss/train': 1.2128833532333374} -08/30/2021 20:15:32 - INFO - __main__ - Step 39183: {'lr': 0.00042609243463225134, 'samples': 7523136, 'steps': 39182, 'loss/train': 1.0542069673538208} -08/30/2021 20:15:32 - INFO - __main__ - Step 39184: {'lr': 0.00042608866768888533, 'samples': 7523328, 'steps': 39183, 'loss/train': 1.7255816459655762} -08/30/2021 20:15:34 - INFO - __main__ - Step 39185: {'lr': 0.0004260849006661765, 'samples': 7523520, 'steps': 39184, 'loss/train': 0.14229607582092285} -08/30/2021 20:15:34 - INFO - __main__ - Step 39186: {'lr': 0.0004260811335641266, 'samples': 7523712, 'steps': 39185, 'loss/train': 1.5025449991226196} -08/30/2021 20:15:34 - INFO - __main__ - Step 39187: {'lr': 0.0004260773663827372, 'samples': 7523904, 'steps': 39186, 'loss/train': 1.7135591506958008} -08/30/2021 20:15:35 - INFO - __main__ - Step 39188: {'lr': 0.00042607359912201004, 'samples': 7524096, 'steps': 39187, 'loss/train': 5.811387062072754} -08/30/2021 20:15:35 - INFO - __main__ - Step 39189: {'lr': 0.0004260698317819468, 'samples': 7524288, 'steps': 39188, 'loss/train': 1.4644395112991333} -08/30/2021 20:15:35 - INFO - __main__ - Step 39190: {'lr': 0.00042606606436254926, 'samples': 7524480, 'steps': 39189, 'loss/train': 1.6314276456832886} -08/30/2021 20:15:37 - INFO - __main__ - Step 39191: {'lr': 0.000426062296863819, 'samples': 7524672, 'steps': 39190, 'loss/train': 1.338916301727295} -08/30/2021 20:15:38 - INFO - __main__ - Step 39192: {'lr': 0.00042605852928575796, 'samples': 7524864, 'steps': 39191, 'loss/train': 1.9953043460845947} -08/30/2021 20:15:38 - INFO - __main__ - Step 39193: {'lr': 0.00042605476162836756, 'samples': 7525056, 'steps': 39192, 'loss/train': 1.5283734798431396} -08/30/2021 20:15:38 - INFO - __main__ - Step 39194: {'lr': 0.00042605099389164957, 'samples': 7525248, 'steps': 39193, 'loss/train': 1.6781046390533447} -08/30/2021 20:15:39 - INFO - __main__ - Step 39195: {'lr': 0.00042604722607560575, 'samples': 7525440, 'steps': 39194, 'loss/train': 1.2429226636886597} -08/30/2021 20:15:40 - INFO - __main__ - Step 39196: {'lr': 0.0004260434581802377, 'samples': 7525632, 'steps': 39195, 'loss/train': 1.4645442962646484} -08/30/2021 20:15:41 - INFO - __main__ - Step 39197: {'lr': 0.0004260396902055473, 'samples': 7525824, 'steps': 39196, 'loss/train': 0.0686180517077446} -08/30/2021 20:15:41 - INFO - __main__ - Step 39198: {'lr': 0.0004260359221515361, 'samples': 7526016, 'steps': 39197, 'loss/train': 1.7838993072509766} -08/30/2021 20:15:41 - INFO - __main__ - Step 39199: {'lr': 0.0004260321540182057, 'samples': 7526208, 'steps': 39198, 'loss/train': 1.4074504375457764} -08/30/2021 20:15:42 - INFO - __main__ - Step 39200: {'lr': 0.00042602838580555814, 'samples': 7526400, 'steps': 39199, 'loss/train': 1.5589021444320679} -08/30/2021 20:15:43 - INFO - __main__ - Step 39201: {'lr': 0.0004260246175135948, 'samples': 7526592, 'steps': 39200, 'loss/train': 1.4375873804092407} -08/30/2021 20:15:44 - INFO - __main__ - Step 39202: {'lr': 0.00042602084914231743, 'samples': 7526784, 'steps': 39201, 'loss/train': 1.554763913154602} -08/30/2021 20:15:44 - INFO - __main__ - Step 39203: {'lr': 0.0004260170806917278, 'samples': 7526976, 'steps': 39202, 'loss/train': 1.6370964050292969} -08/30/2021 20:15:45 - INFO - __main__ - Step 39204: {'lr': 0.0004260133121618276, 'samples': 7527168, 'steps': 39203, 'loss/train': 1.733738899230957} -08/30/2021 20:15:45 - INFO - __main__ - Step 39205: {'lr': 0.0004260095435526186, 'samples': 7527360, 'steps': 39204, 'loss/train': 1.4207985401153564} -08/30/2021 20:15:46 - INFO - __main__ - Step 39206: {'lr': 0.0004260057748641024, 'samples': 7527552, 'steps': 39205, 'loss/train': 0.0773579478263855} -08/30/2021 20:15:47 - INFO - __main__ - Step 39207: {'lr': 0.00042600200609628063, 'samples': 7527744, 'steps': 39206, 'loss/train': 1.6099849939346313} -08/30/2021 20:15:47 - INFO - __main__ - Step 39208: {'lr': 0.0004259982372491551, 'samples': 7527936, 'steps': 39207, 'loss/train': 1.5052069425582886} -08/30/2021 20:15:48 - INFO - __main__ - Step 39209: {'lr': 0.00042599446832272746, 'samples': 7528128, 'steps': 39208, 'loss/train': 1.2605875730514526} -08/30/2021 20:15:48 - INFO - __main__ - Step 39210: {'lr': 0.0004259906993169995, 'samples': 7528320, 'steps': 39209, 'loss/train': 1.5393530130386353} -08/30/2021 20:15:49 - INFO - __main__ - Step 39211: {'lr': 0.00042598693023197283, 'samples': 7528512, 'steps': 39210, 'loss/train': 1.4948527812957764} -08/30/2021 20:15:50 - INFO - __main__ - Step 39212: {'lr': 0.00042598316106764913, 'samples': 7528704, 'steps': 39211, 'loss/train': 0.7949560880661011} -08/30/2021 20:15:50 - INFO - __main__ - Step 39213: {'lr': 0.0004259793918240302, 'samples': 7528896, 'steps': 39212, 'loss/train': 2.4645466804504395} -08/30/2021 20:15:50 - INFO - __main__ - Step 39214: {'lr': 0.00042597562250111753, 'samples': 7529088, 'steps': 39213, 'loss/train': 1.5193893909454346} -08/30/2021 20:15:51 - INFO - __main__ - Step 39215: {'lr': 0.00042597185309891305, 'samples': 7529280, 'steps': 39214, 'loss/train': 1.2662200927734375} -08/30/2021 20:15:51 - INFO - __main__ - Step 39216: {'lr': 0.0004259680836174184, 'samples': 7529472, 'steps': 39215, 'loss/train': 1.31745445728302} -08/30/2021 20:15:53 - INFO - __main__ - Step 39217: {'lr': 0.0004259643140566352, 'samples': 7529664, 'steps': 39216, 'loss/train': 1.2903964519500732} -08/30/2021 20:15:53 - INFO - __main__ - Step 39218: {'lr': 0.0004259605444165652, 'samples': 7529856, 'steps': 39217, 'loss/train': 1.7505873441696167} -08/30/2021 20:15:54 - INFO - __main__ - Step 39219: {'lr': 0.0004259567746972101, 'samples': 7530048, 'steps': 39218, 'loss/train': 1.378353476524353} -08/30/2021 20:15:54 - INFO - __main__ - Step 39220: {'lr': 0.00042595300489857164, 'samples': 7530240, 'steps': 39219, 'loss/train': 1.2656008005142212} -08/30/2021 20:15:54 - INFO - __main__ - Step 39221: {'lr': 0.0004259492350206514, 'samples': 7530432, 'steps': 39220, 'loss/train': 1.7456952333450317} -08/30/2021 20:15:56 - INFO - __main__ - Step 39222: {'lr': 0.00042594546506345124, 'samples': 7530624, 'steps': 39221, 'loss/train': 1.2530466318130493} -08/30/2021 20:15:56 - INFO - __main__ - Step 39223: {'lr': 0.00042594169502697265, 'samples': 7530816, 'steps': 39222, 'loss/train': 1.15249502658844} -08/30/2021 20:15:57 - INFO - __main__ - Step 39224: {'lr': 0.00042593792491121753, 'samples': 7531008, 'steps': 39223, 'loss/train': 0.8006893396377563} -08/30/2021 20:15:57 - INFO - __main__ - Step 39225: {'lr': 0.00042593415471618744, 'samples': 7531200, 'steps': 39224, 'loss/train': 1.5839146375656128} -08/30/2021 20:15:57 - INFO - __main__ - Step 39226: {'lr': 0.0004259303844418841, 'samples': 7531392, 'steps': 39225, 'loss/train': 1.3223596811294556} -08/30/2021 20:15:59 - INFO - __main__ - Step 39227: {'lr': 0.00042592661408830937, 'samples': 7531584, 'steps': 39226, 'loss/train': 1.6665972471237183} -08/30/2021 20:16:00 - INFO - __main__ - Step 39228: {'lr': 0.00042592284365546474, 'samples': 7531776, 'steps': 39227, 'loss/train': 1.773131251335144} -08/30/2021 20:16:00 - INFO - __main__ - Step 39229: {'lr': 0.00042591907314335197, 'samples': 7531968, 'steps': 39228, 'loss/train': 1.867200255393982} -08/30/2021 20:16:00 - INFO - __main__ - Step 39230: {'lr': 0.00042591530255197286, 'samples': 7532160, 'steps': 39229, 'loss/train': 1.3140276670455933} -08/30/2021 20:16:01 - INFO - __main__ - Step 39231: {'lr': 0.00042591153188132903, 'samples': 7532352, 'steps': 39230, 'loss/train': 1.2540984153747559} -08/30/2021 20:16:01 - INFO - __main__ - Step 39232: {'lr': 0.00042590776113142216, 'samples': 7532544, 'steps': 39231, 'loss/train': 1.1593823432922363} -08/30/2021 20:16:02 - INFO - __main__ - Step 39233: {'lr': 0.00042590399030225393, 'samples': 7532736, 'steps': 39232, 'loss/train': 0.9333450198173523} -08/30/2021 20:16:03 - INFO - __main__ - Step 39234: {'lr': 0.0004259002193938261, 'samples': 7532928, 'steps': 39233, 'loss/train': 1.2447391748428345} -08/30/2021 20:16:03 - INFO - __main__ - Step 39235: {'lr': 0.0004258964484061403, 'samples': 7533120, 'steps': 39234, 'loss/train': 1.5167738199234009} -08/30/2021 20:16:04 - INFO - __main__ - Step 39236: {'lr': 0.00042589267733919833, 'samples': 7533312, 'steps': 39235, 'loss/train': 1.5196619033813477} -08/30/2021 20:16:04 - INFO - __main__ - Step 39237: {'lr': 0.0004258889061930018, 'samples': 7533504, 'steps': 39236, 'loss/train': 1.4889049530029297} -08/30/2021 20:16:06 - INFO - __main__ - Step 39238: {'lr': 0.0004258851349675524, 'samples': 7533696, 'steps': 39237, 'loss/train': 1.5146186351776123} -08/30/2021 20:16:07 - INFO - __main__ - Step 39239: {'lr': 0.00042588136366285197, 'samples': 7533888, 'steps': 39238, 'loss/train': 1.1814444065093994} -08/30/2021 20:16:07 - INFO - __main__ - Step 39240: {'lr': 0.0004258775922789021, 'samples': 7534080, 'steps': 39239, 'loss/train': 1.5750893354415894} -08/30/2021 20:16:07 - INFO - __main__ - Step 39241: {'lr': 0.0004258738208157045, 'samples': 7534272, 'steps': 39240, 'loss/train': 1.8444780111312866} -08/30/2021 20:16:08 - INFO - __main__ - Step 39242: {'lr': 0.0004258700492732608, 'samples': 7534464, 'steps': 39241, 'loss/train': 1.6651300191879272} -08/30/2021 20:16:08 - INFO - __main__ - Step 39243: {'lr': 0.0004258662776515728, 'samples': 7534656, 'steps': 39242, 'loss/train': 1.331242322921753} -08/30/2021 20:16:10 - INFO - __main__ - Step 39244: {'lr': 0.00042586250595064216, 'samples': 7534848, 'steps': 39243, 'loss/train': 0.8905333280563354} -08/30/2021 20:16:11 - INFO - __main__ - Step 39245: {'lr': 0.0004258587341704706, 'samples': 7535040, 'steps': 39244, 'loss/train': 2.15775465965271} -08/30/2021 20:16:11 - INFO - __main__ - Step 39246: {'lr': 0.00042585496231105986, 'samples': 7535232, 'steps': 39245, 'loss/train': 1.777660846710205} -08/30/2021 20:16:11 - INFO - __main__ - Step 39247: {'lr': 0.00042585119037241156, 'samples': 7535424, 'steps': 39246, 'loss/train': 2.3965721130371094} -08/30/2021 20:16:12 - INFO - __main__ - Step 39248: {'lr': 0.00042584741835452743, 'samples': 7535616, 'steps': 39247, 'loss/train': 1.7814289331436157} -08/30/2021 20:16:13 - INFO - __main__ - Step 39249: {'lr': 0.0004258436462574091, 'samples': 7535808, 'steps': 39248, 'loss/train': 0.7484597563743591} -08/30/2021 20:16:14 - INFO - __main__ - Step 39250: {'lr': 0.0004258398740810584, 'samples': 7536000, 'steps': 39249, 'loss/train': 1.218285322189331} -08/30/2021 20:16:14 - INFO - __main__ - Step 39251: {'lr': 0.00042583610182547694, 'samples': 7536192, 'steps': 39250, 'loss/train': 1.0163325071334839} -08/30/2021 20:16:14 - INFO - __main__ - Step 39252: {'lr': 0.0004258323294906665, 'samples': 7536384, 'steps': 39251, 'loss/train': 1.140373706817627} -08/30/2021 20:16:15 - INFO - __main__ - Step 39253: {'lr': 0.00042582855707662864, 'samples': 7536576, 'steps': 39252, 'loss/train': 1.8493263721466064} -08/30/2021 20:16:16 - INFO - __main__ - Step 39254: {'lr': 0.00042582478458336523, 'samples': 7536768, 'steps': 39253, 'loss/train': 0.8339062333106995} -08/30/2021 20:16:17 - INFO - __main__ - Step 39255: {'lr': 0.00042582101201087786, 'samples': 7536960, 'steps': 39254, 'loss/train': 1.7238658666610718} -08/30/2021 20:16:17 - INFO - __main__ - Step 39256: {'lr': 0.00042581723935916817, 'samples': 7537152, 'steps': 39255, 'loss/train': 1.4438048601150513} -08/30/2021 20:16:17 - INFO - __main__ - Step 39257: {'lr': 0.00042581346662823804, 'samples': 7537344, 'steps': 39256, 'loss/train': 1.309090495109558} -08/30/2021 20:16:18 - INFO - __main__ - Step 39258: {'lr': 0.00042580969381808906, 'samples': 7537536, 'steps': 39257, 'loss/train': 2.51485013961792} -08/30/2021 20:16:19 - INFO - __main__ - Step 39259: {'lr': 0.00042580592092872295, 'samples': 7537728, 'steps': 39258, 'loss/train': 0.9091335535049438} -08/30/2021 20:16:20 - INFO - __main__ - Step 39260: {'lr': 0.0004258021479601414, 'samples': 7537920, 'steps': 39259, 'loss/train': 2.7244107723236084} -08/30/2021 20:16:20 - INFO - __main__ - Step 39261: {'lr': 0.0004257983749123461, 'samples': 7538112, 'steps': 39260, 'loss/train': 1.6110857725143433} -08/30/2021 20:16:20 - INFO - __main__ - Step 39262: {'lr': 0.00042579460178533875, 'samples': 7538304, 'steps': 39261, 'loss/train': 1.5759211778640747} -08/30/2021 20:16:21 - INFO - __main__ - Step 39263: {'lr': 0.0004257908285791211, 'samples': 7538496, 'steps': 39262, 'loss/train': 1.3688291311264038} -08/30/2021 20:16:21 - INFO - __main__ - Step 39264: {'lr': 0.00042578705529369476, 'samples': 7538688, 'steps': 39263, 'loss/train': 2.0688281059265137} -08/30/2021 20:16:23 - INFO - __main__ - Step 39265: {'lr': 0.00042578328192906153, 'samples': 7538880, 'steps': 39264, 'loss/train': 1.6296072006225586} -08/30/2021 20:16:23 - INFO - __main__ - Step 39266: {'lr': 0.00042577950848522305, 'samples': 7539072, 'steps': 39265, 'loss/train': 1.6873074769973755} -08/30/2021 20:16:23 - INFO - __main__ - Step 39267: {'lr': 0.0004257757349621811, 'samples': 7539264, 'steps': 39266, 'loss/train': 1.5894533395767212} -08/30/2021 20:16:24 - INFO - __main__ - Step 39268: {'lr': 0.0004257719613599372, 'samples': 7539456, 'steps': 39267, 'loss/train': 1.077060341835022} -08/30/2021 20:16:24 - INFO - __main__ - Step 39269: {'lr': 0.0004257681876784932, 'samples': 7539648, 'steps': 39268, 'loss/train': 1.9370777606964111} -08/30/2021 20:16:25 - INFO - __main__ - Step 39270: {'lr': 0.0004257644139178508, 'samples': 7539840, 'steps': 39269, 'loss/train': 1.8108786344528198} -08/30/2021 20:16:26 - INFO - __main__ - Step 39271: {'lr': 0.0004257606400780117, 'samples': 7540032, 'steps': 39270, 'loss/train': 1.5082741975784302} -08/30/2021 20:16:26 - INFO - __main__ - Step 39272: {'lr': 0.0004257568661589775, 'samples': 7540224, 'steps': 39271, 'loss/train': 1.2383904457092285} -08/30/2021 20:16:27 - INFO - __main__ - Step 39273: {'lr': 0.00042575309216074997, 'samples': 7540416, 'steps': 39272, 'loss/train': 1.8964496850967407} -08/30/2021 20:16:27 - INFO - __main__ - Step 39274: {'lr': 0.00042574931808333095, 'samples': 7540608, 'steps': 39273, 'loss/train': 1.383758306503296} -08/30/2021 20:16:28 - INFO - __main__ - Step 39275: {'lr': 0.0004257455439267218, 'samples': 7540800, 'steps': 39274, 'loss/train': 1.560986042022705} -08/30/2021 20:16:29 - INFO - __main__ - Step 39276: {'lr': 0.00042574176969092454, 'samples': 7540992, 'steps': 39275, 'loss/train': 1.3361958265304565} -08/30/2021 20:16:29 - INFO - __main__ - Step 39277: {'lr': 0.0004257379953759407, 'samples': 7541184, 'steps': 39276, 'loss/train': 1.5455554723739624} -08/30/2021 20:16:30 - INFO - __main__ - Step 39278: {'lr': 0.00042573422098177204, 'samples': 7541376, 'steps': 39277, 'loss/train': 1.0981570482254028} -08/30/2021 20:16:30 - INFO - __main__ - Step 39279: {'lr': 0.0004257304465084203, 'samples': 7541568, 'steps': 39278, 'loss/train': 1.1934826374053955} -08/30/2021 20:16:32 - INFO - __main__ - Step 39280: {'lr': 0.0004257266719558871, 'samples': 7541760, 'steps': 39279, 'loss/train': 1.4602062702178955} -08/30/2021 20:16:32 - INFO - __main__ - Step 39281: {'lr': 0.0004257228973241741, 'samples': 7541952, 'steps': 39280, 'loss/train': 1.2158236503601074} -08/30/2021 20:16:32 - INFO - __main__ - Step 39282: {'lr': 0.00042571912261328315, 'samples': 7542144, 'steps': 39281, 'loss/train': 1.546975016593933} -08/30/2021 20:16:33 - INFO - __main__ - Step 39283: {'lr': 0.00042571534782321593, 'samples': 7542336, 'steps': 39282, 'loss/train': 1.710975170135498} -08/30/2021 20:16:33 - INFO - __main__ - Step 39284: {'lr': 0.000425711572953974, 'samples': 7542528, 'steps': 39283, 'loss/train': 0.4806158244609833} -08/30/2021 20:16:35 - INFO - __main__ - Step 39285: {'lr': 0.00042570779800555914, 'samples': 7542720, 'steps': 39284, 'loss/train': 1.3156388998031616} -08/30/2021 20:16:35 - INFO - __main__ - Step 39286: {'lr': 0.00042570402297797304, 'samples': 7542912, 'steps': 39285, 'loss/train': 1.1073112487792969} -08/30/2021 20:16:35 - INFO - __main__ - Step 39287: {'lr': 0.0004257002478712175, 'samples': 7543104, 'steps': 39286, 'loss/train': 0.7631056904792786} -08/30/2021 20:16:36 - INFO - __main__ - Step 39288: {'lr': 0.0004256964726852941, 'samples': 7543296, 'steps': 39287, 'loss/train': 1.4516005516052246} -08/30/2021 20:16:36 - INFO - __main__ - Step 39289: {'lr': 0.0004256926974202046, 'samples': 7543488, 'steps': 39288, 'loss/train': 1.4791836738586426} -08/30/2021 20:16:38 - INFO - __main__ - Step 39290: {'lr': 0.00042568892207595066, 'samples': 7543680, 'steps': 39289, 'loss/train': 1.9839260578155518} -08/30/2021 20:16:38 - INFO - __main__ - Step 39291: {'lr': 0.000425685146652534, 'samples': 7543872, 'steps': 39290, 'loss/train': 0.5053918957710266} -08/30/2021 20:16:39 - INFO - __main__ - Step 39292: {'lr': 0.00042568137114995633, 'samples': 7544064, 'steps': 39291, 'loss/train': 1.3245831727981567} -08/30/2021 20:16:39 - INFO - __main__ - Step 39293: {'lr': 0.00042567759556821937, 'samples': 7544256, 'steps': 39292, 'loss/train': 0.08145341277122498} -08/30/2021 20:16:39 - INFO - __main__ - Step 39294: {'lr': 0.00042567381990732476, 'samples': 7544448, 'steps': 39293, 'loss/train': 0.670648992061615} -08/30/2021 20:16:41 - INFO - __main__ - Step 39295: {'lr': 0.0004256700441672743, 'samples': 7544640, 'steps': 39294, 'loss/train': 1.8403757810592651} -08/30/2021 20:16:42 - INFO - __main__ - Step 39296: {'lr': 0.0004256662683480695, 'samples': 7544832, 'steps': 39295, 'loss/train': 1.3670477867126465} -08/30/2021 20:16:42 - INFO - __main__ - Step 39297: {'lr': 0.00042566249244971235, 'samples': 7545024, 'steps': 39296, 'loss/train': 1.0663715600967407} -08/30/2021 20:16:43 - INFO - __main__ - Step 39298: {'lr': 0.0004256587164722043, 'samples': 7545216, 'steps': 39297, 'loss/train': 1.6513261795043945} -08/30/2021 20:16:43 - INFO - __main__ - Step 39299: {'lr': 0.0004256549404155471, 'samples': 7545408, 'steps': 39298, 'loss/train': 2.644193410873413} -08/30/2021 20:16:44 - INFO - __main__ - Step 39300: {'lr': 0.0004256511642797426, 'samples': 7545600, 'steps': 39299, 'loss/train': 1.4818652868270874} -08/30/2021 20:16:45 - INFO - __main__ - Step 39301: {'lr': 0.0004256473880647923, 'samples': 7545792, 'steps': 39300, 'loss/train': 1.6008274555206299} -08/30/2021 20:16:45 - INFO - __main__ - Step 39302: {'lr': 0.0004256436117706981, 'samples': 7545984, 'steps': 39301, 'loss/train': 1.086125135421753} -08/30/2021 20:16:46 - INFO - __main__ - Step 39303: {'lr': 0.0004256398353974615, 'samples': 7546176, 'steps': 39302, 'loss/train': 1.7928388118743896} -08/30/2021 20:16:46 - INFO - __main__ - Step 39304: {'lr': 0.00042563605894508434, 'samples': 7546368, 'steps': 39303, 'loss/train': 1.5981634855270386} -08/30/2021 20:16:46 - INFO - __main__ - Step 39305: {'lr': 0.00042563228241356834, 'samples': 7546560, 'steps': 39304, 'loss/train': 1.6829520463943481} -08/30/2021 20:16:48 - INFO - __main__ - Step 39306: {'lr': 0.000425628505802915, 'samples': 7546752, 'steps': 39305, 'loss/train': 1.738876461982727} -08/30/2021 20:16:48 - INFO - __main__ - Step 39307: {'lr': 0.0004256247291131263, 'samples': 7546944, 'steps': 39306, 'loss/train': 1.655989408493042} -08/30/2021 20:16:49 - INFO - __main__ - Step 39308: {'lr': 0.00042562095234420375, 'samples': 7547136, 'steps': 39307, 'loss/train': 1.2943518161773682} -08/30/2021 20:16:49 - INFO - __main__ - Step 39309: {'lr': 0.00042561717549614907, 'samples': 7547328, 'steps': 39308, 'loss/train': 0.30530333518981934} -08/30/2021 20:16:49 - INFO - __main__ - Step 39310: {'lr': 0.0004256133985689641, 'samples': 7547520, 'steps': 39309, 'loss/train': 1.379294753074646} -08/30/2021 20:16:51 - INFO - __main__ - Step 39311: {'lr': 0.0004256096215626504, 'samples': 7547712, 'steps': 39310, 'loss/train': 1.431809425354004} -08/30/2021 20:16:51 - INFO - __main__ - Step 39312: {'lr': 0.0004256058444772097, 'samples': 7547904, 'steps': 39311, 'loss/train': 1.136567234992981} -08/30/2021 20:16:52 - INFO - __main__ - Step 39313: {'lr': 0.0004256020673126437, 'samples': 7548096, 'steps': 39312, 'loss/train': 0.739686131477356} -08/30/2021 20:16:52 - INFO - __main__ - Step 39314: {'lr': 0.0004255982900689541, 'samples': 7548288, 'steps': 39313, 'loss/train': 1.1690136194229126} -08/30/2021 20:16:52 - INFO - __main__ - Step 39315: {'lr': 0.0004255945127461427, 'samples': 7548480, 'steps': 39314, 'loss/train': 0.05878067389130592} -08/30/2021 20:16:54 - INFO - __main__ - Step 39316: {'lr': 0.00042559073534421114, 'samples': 7548672, 'steps': 39315, 'loss/train': 1.8100237846374512} -08/30/2021 20:16:54 - INFO - __main__ - Step 39317: {'lr': 0.00042558695786316106, 'samples': 7548864, 'steps': 39316, 'loss/train': 1.430045485496521} -08/30/2021 20:16:55 - INFO - __main__ - Step 39318: {'lr': 0.00042558318030299415, 'samples': 7549056, 'steps': 39317, 'loss/train': 1.5092629194259644} -08/30/2021 20:16:55 - INFO - __main__ - Step 39319: {'lr': 0.0004255794026637122, 'samples': 7549248, 'steps': 39318, 'loss/train': 0.06414658576250076} -08/30/2021 20:16:55 - INFO - __main__ - Step 39320: {'lr': 0.0004255756249453169, 'samples': 7549440, 'steps': 39319, 'loss/train': 1.1893595457077026} -08/30/2021 20:16:57 - INFO - __main__ - Step 39321: {'lr': 0.00042557184714780993, 'samples': 7549632, 'steps': 39320, 'loss/train': 1.2197809219360352} -08/30/2021 20:16:57 - INFO - __main__ - Step 39322: {'lr': 0.000425568069271193, 'samples': 7549824, 'steps': 39321, 'loss/train': 0.46699976921081543} -08/30/2021 20:16:58 - INFO - __main__ - Step 39323: {'lr': 0.00042556429131546775, 'samples': 7550016, 'steps': 39322, 'loss/train': 2.1314680576324463} -08/30/2021 20:16:58 - INFO - __main__ - Step 39324: {'lr': 0.000425560513280636, 'samples': 7550208, 'steps': 39323, 'loss/train': 1.6722991466522217} -08/30/2021 20:16:58 - INFO - __main__ - Step 39325: {'lr': 0.00042555673516669933, 'samples': 7550400, 'steps': 39324, 'loss/train': 1.047684907913208} -08/30/2021 20:17:00 - INFO - __main__ - Step 39326: {'lr': 0.0004255529569736596, 'samples': 7550592, 'steps': 39325, 'loss/train': 2.393691301345825} -08/30/2021 20:17:00 - INFO - __main__ - Step 39327: {'lr': 0.0004255491787015183, 'samples': 7550784, 'steps': 39326, 'loss/train': 1.661149024963379} -08/30/2021 20:17:01 - INFO - __main__ - Step 39328: {'lr': 0.0004255454003502774, 'samples': 7550976, 'steps': 39327, 'loss/train': 1.659741759300232} -08/30/2021 20:17:01 - INFO - __main__ - Step 39329: {'lr': 0.0004255416219199384, 'samples': 7551168, 'steps': 39328, 'loss/train': 1.645760416984558} -08/30/2021 20:17:01 - INFO - __main__ - Step 39330: {'lr': 0.0004255378434105029, 'samples': 7551360, 'steps': 39329, 'loss/train': 1.4031420946121216} -08/30/2021 20:17:03 - INFO - __main__ - Step 39331: {'lr': 0.00042553406482197297, 'samples': 7551552, 'steps': 39330, 'loss/train': 1.3567979335784912} -08/30/2021 20:17:03 - INFO - __main__ - Step 39332: {'lr': 0.00042553028615434997, 'samples': 7551744, 'steps': 39331, 'loss/train': 1.6148399114608765} -08/30/2021 20:17:04 - INFO - __main__ - Step 39333: {'lr': 0.0004255265074076358, 'samples': 7551936, 'steps': 39332, 'loss/train': 0.9594143629074097} -08/30/2021 20:17:04 - INFO - __main__ - Step 39334: {'lr': 0.00042552272858183203, 'samples': 7552128, 'steps': 39333, 'loss/train': 0.033706679940223694} -08/30/2021 20:17:04 - INFO - __main__ - Step 39335: {'lr': 0.0004255189496769405, 'samples': 7552320, 'steps': 39334, 'loss/train': 1.1487500667572021} -08/30/2021 20:17:06 - INFO - __main__ - Step 39336: {'lr': 0.00042551517069296276, 'samples': 7552512, 'steps': 39335, 'loss/train': 1.7795332670211792} -08/30/2021 20:17:07 - INFO - __main__ - Step 39337: {'lr': 0.00042551139162990065, 'samples': 7552704, 'steps': 39336, 'loss/train': 1.3000907897949219} -08/30/2021 20:17:07 - INFO - __main__ - Step 39338: {'lr': 0.0004255076124877558, 'samples': 7552896, 'steps': 39337, 'loss/train': 0.12005091458559036} -08/30/2021 20:17:07 - INFO - __main__ - Step 39339: {'lr': 0.0004255038332665299, 'samples': 7553088, 'steps': 39338, 'loss/train': 1.580047607421875} -08/30/2021 20:17:08 - INFO - __main__ - Step 39340: {'lr': 0.0004255000539662247, 'samples': 7553280, 'steps': 39339, 'loss/train': 1.6727694272994995} -08/30/2021 20:17:08 - INFO - __main__ - Step 39341: {'lr': 0.0004254962745868419, 'samples': 7553472, 'steps': 39340, 'loss/train': 1.2373043298721313} -08/30/2021 20:17:09 - INFO - __main__ - Step 39342: {'lr': 0.00042549249512838325, 'samples': 7553664, 'steps': 39341, 'loss/train': 1.2816848754882812} -08/30/2021 20:17:10 - INFO - __main__ - Step 39343: {'lr': 0.00042548871559085026, 'samples': 7553856, 'steps': 39342, 'loss/train': 0.9505172371864319} -08/30/2021 20:17:10 - INFO - __main__ - Step 39344: {'lr': 0.0004254849359742449, 'samples': 7554048, 'steps': 39343, 'loss/train': 0.4994402527809143} -08/30/2021 20:17:11 - INFO - __main__ - Step 39345: {'lr': 0.0004254811562785686, 'samples': 7554240, 'steps': 39344, 'loss/train': 1.2361412048339844} -08/30/2021 20:17:11 - INFO - __main__ - Step 39346: {'lr': 0.00042547737650382324, 'samples': 7554432, 'steps': 39345, 'loss/train': 1.553163766860962} -08/30/2021 20:17:13 - INFO - __main__ - Step 39347: {'lr': 0.0004254735966500105, 'samples': 7554624, 'steps': 39346, 'loss/train': 0.9998989701271057} -08/30/2021 20:17:14 - INFO - __main__ - Step 39348: {'lr': 0.00042546981671713206, 'samples': 7554816, 'steps': 39347, 'loss/train': 1.6435304880142212} -08/30/2021 20:17:14 - INFO - __main__ - Step 39349: {'lr': 0.0004254660367051896, 'samples': 7555008, 'steps': 39348, 'loss/train': 1.8735414743423462} -08/30/2021 20:17:14 - INFO - __main__ - Step 39350: {'lr': 0.0004254622566141849, 'samples': 7555200, 'steps': 39349, 'loss/train': 1.5143274068832397} -08/30/2021 20:17:15 - INFO - __main__ - Step 39351: {'lr': 0.0004254584764441196, 'samples': 7555392, 'steps': 39350, 'loss/train': 1.3694311380386353} -08/30/2021 20:17:16 - INFO - __main__ - Step 39352: {'lr': 0.00042545469619499545, 'samples': 7555584, 'steps': 39351, 'loss/train': 0.5295366048812866} -08/30/2021 20:17:16 - INFO - __main__ - Step 39353: {'lr': 0.00042545091586681404, 'samples': 7555776, 'steps': 39352, 'loss/train': 1.4884425401687622} -08/30/2021 20:17:17 - INFO - __main__ - Step 39354: {'lr': 0.0004254471354595772, 'samples': 7555968, 'steps': 39353, 'loss/train': 1.6351653337478638} -08/30/2021 20:17:17 - INFO - __main__ - Step 39355: {'lr': 0.0004254433549732866, 'samples': 7556160, 'steps': 39354, 'loss/train': 1.3009556531906128} -08/30/2021 20:17:18 - INFO - __main__ - Step 39356: {'lr': 0.0004254395744079439, 'samples': 7556352, 'steps': 39355, 'loss/train': 0.8656249642372131} -08/30/2021 20:17:19 - INFO - __main__ - Step 39357: {'lr': 0.0004254357937635509, 'samples': 7556544, 'steps': 39356, 'loss/train': 1.461314082145691} -08/30/2021 20:17:20 - INFO - __main__ - Step 39358: {'lr': 0.00042543201304010914, 'samples': 7556736, 'steps': 39357, 'loss/train': 1.8331661224365234} -08/30/2021 20:17:20 - INFO - __main__ - Step 39359: {'lr': 0.0004254282322376205, 'samples': 7556928, 'steps': 39358, 'loss/train': 1.5330111980438232} -08/30/2021 20:17:20 - INFO - __main__ - Step 39360: {'lr': 0.0004254244513560866, 'samples': 7557120, 'steps': 39359, 'loss/train': 1.3315730094909668} -08/30/2021 20:17:21 - INFO - __main__ - Step 39361: {'lr': 0.00042542067039550916, 'samples': 7557312, 'steps': 39360, 'loss/train': 1.5101749897003174} -08/30/2021 20:17:22 - INFO - __main__ - Step 39362: {'lr': 0.00042541688935588984, 'samples': 7557504, 'steps': 39361, 'loss/train': 1.3210201263427734} -08/30/2021 20:17:23 - INFO - __main__ - Step 39363: {'lr': 0.00042541310823723035, 'samples': 7557696, 'steps': 39362, 'loss/train': 1.3677185773849487} -08/30/2021 20:17:23 - INFO - __main__ - Step 39364: {'lr': 0.00042540932703953246, 'samples': 7557888, 'steps': 39363, 'loss/train': 1.2405917644500732} -08/30/2021 20:17:23 - INFO - __main__ - Step 39365: {'lr': 0.00042540554576279776, 'samples': 7558080, 'steps': 39364, 'loss/train': 0.6681594848632812} -08/30/2021 20:17:24 - INFO - __main__ - Step 39366: {'lr': 0.0004254017644070282, 'samples': 7558272, 'steps': 39365, 'loss/train': 0.9929782152175903} -08/30/2021 20:17:24 - INFO - __main__ - Step 39367: {'lr': 0.0004253979829722251, 'samples': 7558464, 'steps': 39366, 'loss/train': 0.08690003305673599} -08/30/2021 20:17:26 - INFO - __main__ - Step 39368: {'lr': 0.00042539420145839055, 'samples': 7558656, 'steps': 39367, 'loss/train': 1.2248239517211914} -08/30/2021 20:17:26 - INFO - __main__ - Step 39369: {'lr': 0.00042539041986552596, 'samples': 7558848, 'steps': 39368, 'loss/train': 1.0808542966842651} -08/30/2021 20:17:26 - INFO - __main__ - Step 39370: {'lr': 0.00042538663819363323, 'samples': 7559040, 'steps': 39369, 'loss/train': 3.869018793106079} -08/30/2021 20:17:27 - INFO - __main__ - Step 39371: {'lr': 0.000425382856442714, 'samples': 7559232, 'steps': 39370, 'loss/train': 0.8527717590332031} -08/30/2021 20:17:27 - INFO - __main__ - Step 39372: {'lr': 0.0004253790746127699, 'samples': 7559424, 'steps': 39371, 'loss/train': 1.0129683017730713} -08/30/2021 20:17:29 - INFO - __main__ - Step 39373: {'lr': 0.0004253752927038027, 'samples': 7559616, 'steps': 39372, 'loss/train': 0.922639012336731} -08/30/2021 20:17:29 - INFO - __main__ - Step 39374: {'lr': 0.0004253715107158141, 'samples': 7559808, 'steps': 39373, 'loss/train': 1.7660993337631226} -08/30/2021 20:17:29 - INFO - __main__ - Step 39375: {'lr': 0.0004253677286488058, 'samples': 7560000, 'steps': 39374, 'loss/train': 1.4221876859664917} -08/30/2021 20:17:30 - INFO - __main__ - Step 39376: {'lr': 0.00042536394650277953, 'samples': 7560192, 'steps': 39375, 'loss/train': 1.4791922569274902} -08/30/2021 20:17:30 - INFO - __main__ - Step 39377: {'lr': 0.000425360164277737, 'samples': 7560384, 'steps': 39376, 'loss/train': 1.7833961248397827} -08/30/2021 20:17:32 - INFO - __main__ - Step 39378: {'lr': 0.00042535638197367984, 'samples': 7560576, 'steps': 39377, 'loss/train': 1.848827600479126} -08/30/2021 20:17:32 - INFO - __main__ - Step 39379: {'lr': 0.0004253525995906098, 'samples': 7560768, 'steps': 39378, 'loss/train': 1.3308979272842407} -08/30/2021 20:17:32 - INFO - __main__ - Step 39380: {'lr': 0.00042534881712852856, 'samples': 7560960, 'steps': 39379, 'loss/train': 0.5071209073066711} -08/30/2021 20:17:33 - INFO - __main__ - Step 39381: {'lr': 0.0004253450345874379, 'samples': 7561152, 'steps': 39380, 'loss/train': 0.22713203728199005} -08/30/2021 20:17:33 - INFO - __main__ - Step 39382: {'lr': 0.00042534125196733955, 'samples': 7561344, 'steps': 39381, 'loss/train': 1.9108912944793701} -08/30/2021 20:17:35 - INFO - __main__ - Step 39383: {'lr': 0.000425337469268235, 'samples': 7561536, 'steps': 39382, 'loss/train': 1.2672617435455322} -08/30/2021 20:17:35 - INFO - __main__ - Step 39384: {'lr': 0.00042533368649012615, 'samples': 7561728, 'steps': 39383, 'loss/train': 1.6363317966461182} -08/30/2021 20:17:35 - INFO - __main__ - Step 39385: {'lr': 0.0004253299036330146, 'samples': 7561920, 'steps': 39384, 'loss/train': 0.5283082127571106} -08/30/2021 20:17:36 - INFO - __main__ - Step 39386: {'lr': 0.00042532612069690214, 'samples': 7562112, 'steps': 39385, 'loss/train': 1.4869177341461182} -08/30/2021 20:17:36 - INFO - __main__ - Step 39387: {'lr': 0.0004253223376817904, 'samples': 7562304, 'steps': 39386, 'loss/train': 1.831048607826233} -08/30/2021 20:17:38 - INFO - __main__ - Step 39388: {'lr': 0.0004253185545876812, 'samples': 7562496, 'steps': 39387, 'loss/train': 1.0880411863327026} -08/30/2021 20:17:38 - INFO - __main__ - Step 39389: {'lr': 0.0004253147714145761, 'samples': 7562688, 'steps': 39388, 'loss/train': 1.1887985467910767} -08/30/2021 20:17:39 - INFO - __main__ - Step 39390: {'lr': 0.00042531098816247695, 'samples': 7562880, 'steps': 39389, 'loss/train': 1.5237889289855957} -08/30/2021 20:17:39 - INFO - __main__ - Step 39391: {'lr': 0.00042530720483138524, 'samples': 7563072, 'steps': 39390, 'loss/train': 1.3814122676849365} -08/30/2021 20:17:39 - INFO - __main__ - Step 39392: {'lr': 0.00042530342142130283, 'samples': 7563264, 'steps': 39391, 'loss/train': 1.1057311296463013} -08/30/2021 20:17:40 - INFO - __main__ - Step 39393: {'lr': 0.0004252996379322315, 'samples': 7563456, 'steps': 39392, 'loss/train': 1.0700563192367554} -08/30/2021 20:17:41 - INFO - __main__ - Step 39394: {'lr': 0.0004252958543641728, 'samples': 7563648, 'steps': 39393, 'loss/train': 1.4636409282684326} -08/30/2021 20:17:42 - INFO - __main__ - Step 39395: {'lr': 0.0004252920707171285, 'samples': 7563840, 'steps': 39394, 'loss/train': 1.658215880393982} -08/30/2021 20:17:42 - INFO - __main__ - Step 39396: {'lr': 0.00042528828699110033, 'samples': 7564032, 'steps': 39395, 'loss/train': 1.7424261569976807} -08/30/2021 20:17:42 - INFO - __main__ - Step 39397: {'lr': 0.0004252845031860899, 'samples': 7564224, 'steps': 39396, 'loss/train': 1.0661591291427612} -08/30/2021 20:17:43 - INFO - __main__ - Step 39398: {'lr': 0.000425280719302099, 'samples': 7564416, 'steps': 39397, 'loss/train': 1.4587175846099854} -08/30/2021 20:17:44 - INFO - __main__ - Step 39399: {'lr': 0.0004252769353391294, 'samples': 7564608, 'steps': 39398, 'loss/train': 0.7495118975639343} -08/30/2021 20:17:45 - INFO - __main__ - Step 39400: {'lr': 0.00042527315129718257, 'samples': 7564800, 'steps': 39399, 'loss/train': 0.42761915922164917} -08/30/2021 20:17:45 - INFO - __main__ - Step 39401: {'lr': 0.00042526936717626046, 'samples': 7564992, 'steps': 39400, 'loss/train': 1.2316175699234009} -08/30/2021 20:17:45 - INFO - __main__ - Step 39402: {'lr': 0.00042526558297636464, 'samples': 7565184, 'steps': 39401, 'loss/train': 1.448720097541809} -08/30/2021 20:17:46 - INFO - __main__ - Step 39403: {'lr': 0.0004252617986974969, 'samples': 7565376, 'steps': 39402, 'loss/train': 1.3910382986068726} -08/30/2021 20:17:48 - INFO - __main__ - Step 39404: {'lr': 0.00042525801433965883, 'samples': 7565568, 'steps': 39403, 'loss/train': 1.7211908102035522} -08/30/2021 20:17:48 - INFO - __main__ - Step 39405: {'lr': 0.00042525422990285225, 'samples': 7565760, 'steps': 39404, 'loss/train': 1.9738531112670898} -08/30/2021 20:17:48 - INFO - __main__ - Step 39406: {'lr': 0.0004252504453870788, 'samples': 7565952, 'steps': 39405, 'loss/train': 1.6185775995254517} -08/30/2021 20:17:49 - INFO - __main__ - Step 39407: {'lr': 0.0004252466607923402, 'samples': 7566144, 'steps': 39406, 'loss/train': 1.0970726013183594} -08/30/2021 20:17:49 - INFO - __main__ - Step 39408: {'lr': 0.0004252428761186382, 'samples': 7566336, 'steps': 39407, 'loss/train': 1.7352116107940674} -08/30/2021 20:17:50 - INFO - __main__ - Step 39409: {'lr': 0.0004252390913659744, 'samples': 7566528, 'steps': 39408, 'loss/train': 1.5175449848175049} -08/30/2021 20:17:51 - INFO - __main__ - Step 39410: {'lr': 0.0004252353065343506, 'samples': 7566720, 'steps': 39409, 'loss/train': 1.4668569564819336} -08/30/2021 20:17:51 - INFO - __main__ - Step 39411: {'lr': 0.0004252315216237684, 'samples': 7566912, 'steps': 39410, 'loss/train': 1.9068946838378906} -08/30/2021 20:17:52 - INFO - __main__ - Step 39412: {'lr': 0.00042522773663422977, 'samples': 7567104, 'steps': 39411, 'loss/train': 1.8970649242401123} -08/30/2021 20:17:52 - INFO - __main__ - Step 39413: {'lr': 0.000425223951565736, 'samples': 7567296, 'steps': 39412, 'loss/train': 0.7986385822296143} -08/30/2021 20:17:53 - INFO - __main__ - Step 39414: {'lr': 0.0004252201664182892, 'samples': 7567488, 'steps': 39413, 'loss/train': 1.1627320051193237} -08/30/2021 20:17:54 - INFO - __main__ - Step 39415: {'lr': 0.0004252163811918909, 'samples': 7567680, 'steps': 39414, 'loss/train': 1.0643250942230225} -08/30/2021 20:17:54 - INFO - __main__ - Step 39416: {'lr': 0.00042521259588654264, 'samples': 7567872, 'steps': 39415, 'loss/train': 0.5217099785804749} -08/30/2021 20:17:55 - INFO - __main__ - Step 39417: {'lr': 0.00042520881050224637, 'samples': 7568064, 'steps': 39416, 'loss/train': 1.5016180276870728} -08/30/2021 20:17:55 - INFO - __main__ - Step 39418: {'lr': 0.0004252050250390037, 'samples': 7568256, 'steps': 39417, 'loss/train': 1.5426591634750366} -08/30/2021 20:17:55 - INFO - __main__ - Step 39419: {'lr': 0.0004252012394968164, 'samples': 7568448, 'steps': 39418, 'loss/train': 0.9755098223686218} -08/30/2021 20:17:57 - INFO - __main__ - Step 39420: {'lr': 0.0004251974538756861, 'samples': 7568640, 'steps': 39419, 'loss/train': 1.761231780052185} -08/30/2021 20:17:57 - INFO - __main__ - Step 39421: {'lr': 0.00042519366817561453, 'samples': 7568832, 'steps': 39420, 'loss/train': 1.431688666343689} -08/30/2021 20:17:58 - INFO - __main__ - Step 39422: {'lr': 0.0004251898823966034, 'samples': 7569024, 'steps': 39421, 'loss/train': 1.2372949123382568} -08/30/2021 20:17:58 - INFO - __main__ - Step 39423: {'lr': 0.00042518609653865444, 'samples': 7569216, 'steps': 39422, 'loss/train': 2.4636294841766357} -08/30/2021 20:18:00 - INFO - __main__ - Step 39424: {'lr': 0.00042518231060176926, 'samples': 7569408, 'steps': 39423, 'loss/train': 1.4081465005874634} -08/30/2021 20:18:00 - INFO - __main__ - Step 39425: {'lr': 0.00042517852458594967, 'samples': 7569600, 'steps': 39424, 'loss/train': 1.8521902561187744} -08/30/2021 20:18:01 - INFO - __main__ - Step 39426: {'lr': 0.00042517473849119734, 'samples': 7569792, 'steps': 39425, 'loss/train': 1.607431411743164} -08/30/2021 20:18:01 - INFO - __main__ - Step 39427: {'lr': 0.000425170952317514, 'samples': 7569984, 'steps': 39426, 'loss/train': 1.3722666501998901} -08/30/2021 20:18:02 - INFO - __main__ - Step 39428: {'lr': 0.0004251671660649013, 'samples': 7570176, 'steps': 39427, 'loss/train': 0.19016487896442413} -08/30/2021 20:18:02 - INFO - __main__ - Step 39429: {'lr': 0.000425163379733361, 'samples': 7570368, 'steps': 39428, 'loss/train': 1.5978096723556519} -08/30/2021 20:18:03 - INFO - __main__ - Step 39430: {'lr': 0.00042515959332289476, 'samples': 7570560, 'steps': 39429, 'loss/train': 0.8655191659927368} -08/30/2021 20:18:04 - INFO - __main__ - Step 39431: {'lr': 0.0004251558068335043, 'samples': 7570752, 'steps': 39430, 'loss/train': 1.6447068452835083} -08/30/2021 20:18:04 - INFO - __main__ - Step 39432: {'lr': 0.00042515202026519136, 'samples': 7570944, 'steps': 39431, 'loss/train': 1.4137521982192993} -08/30/2021 20:18:04 - INFO - __main__ - Step 39433: {'lr': 0.00042514823361795764, 'samples': 7571136, 'steps': 39432, 'loss/train': 1.389886736869812} -08/30/2021 20:18:05 - INFO - __main__ - Step 39434: {'lr': 0.0004251444468918048, 'samples': 7571328, 'steps': 39433, 'loss/train': 1.359593152999878} -08/30/2021 20:18:06 - INFO - __main__ - Step 39435: {'lr': 0.0004251406600867346, 'samples': 7571520, 'steps': 39434, 'loss/train': 1.7458051443099976} -08/30/2021 20:18:07 - INFO - __main__ - Step 39436: {'lr': 0.00042513687320274866, 'samples': 7571712, 'steps': 39435, 'loss/train': 0.9783296585083008} -08/30/2021 20:18:07 - INFO - __main__ - Step 39437: {'lr': 0.0004251330862398488, 'samples': 7571904, 'steps': 39436, 'loss/train': 1.424580454826355} -08/30/2021 20:18:07 - INFO - __main__ - Step 39438: {'lr': 0.0004251292991980367, 'samples': 7572096, 'steps': 39437, 'loss/train': 1.449739933013916} -08/30/2021 20:18:08 - INFO - __main__ - Step 39439: {'lr': 0.000425125512077314, 'samples': 7572288, 'steps': 39438, 'loss/train': 1.382744550704956} -08/30/2021 20:18:10 - INFO - __main__ - Step 39440: {'lr': 0.00042512172487768244, 'samples': 7572480, 'steps': 39439, 'loss/train': 1.4800609350204468} -08/30/2021 20:18:10 - INFO - __main__ - Step 39441: {'lr': 0.00042511793759914375, 'samples': 7572672, 'steps': 39440, 'loss/train': 1.0243180990219116} -08/30/2021 20:18:10 - INFO - __main__ - Step 39442: {'lr': 0.0004251141502416996, 'samples': 7572864, 'steps': 39441, 'loss/train': 1.5579551458358765} -08/30/2021 20:18:11 - INFO - __main__ - Step 39443: {'lr': 0.0004251103628053517, 'samples': 7573056, 'steps': 39442, 'loss/train': 1.1759260892868042} -08/30/2021 20:18:11 - INFO - __main__ - Step 39444: {'lr': 0.0004251065752901018, 'samples': 7573248, 'steps': 39443, 'loss/train': 0.05363607034087181} -08/30/2021 20:18:11 - INFO - __main__ - Step 39445: {'lr': 0.0004251027876959516, 'samples': 7573440, 'steps': 39444, 'loss/train': 1.4465770721435547} -08/30/2021 20:18:13 - INFO - __main__ - Step 39446: {'lr': 0.0004250990000229028, 'samples': 7573632, 'steps': 39445, 'loss/train': 1.134953260421753} -08/30/2021 20:18:14 - INFO - __main__ - Step 39447: {'lr': 0.00042509521227095706, 'samples': 7573824, 'steps': 39446, 'loss/train': 1.4134520292282104} -08/30/2021 20:18:14 - INFO - __main__ - Step 39448: {'lr': 0.0004250914244401161, 'samples': 7574016, 'steps': 39447, 'loss/train': 1.6693947315216064} -08/30/2021 20:18:14 - INFO - __main__ - Step 39449: {'lr': 0.00042508763653038167, 'samples': 7574208, 'steps': 39448, 'loss/train': 1.1682648658752441} -08/30/2021 20:18:15 - INFO - __main__ - Step 39450: {'lr': 0.0004250838485417554, 'samples': 7574400, 'steps': 39449, 'loss/train': 1.0540648698806763} -08/30/2021 20:18:17 - INFO - __main__ - Step 39451: {'lr': 0.00042508006047423916, 'samples': 7574592, 'steps': 39450, 'loss/train': 1.8485313653945923} -08/30/2021 20:18:17 - INFO - __main__ - Step 39452: {'lr': 0.0004250762723278344, 'samples': 7574784, 'steps': 39451, 'loss/train': 0.808741569519043} -08/30/2021 20:18:18 - INFO - __main__ - Step 39453: {'lr': 0.00042507248410254307, 'samples': 7574976, 'steps': 39452, 'loss/train': 1.4375113248825073} -08/30/2021 20:18:18 - INFO - __main__ - Step 39454: {'lr': 0.0004250686957983668, 'samples': 7575168, 'steps': 39453, 'loss/train': 1.6407214403152466} -08/30/2021 20:18:18 - INFO - __main__ - Step 39455: {'lr': 0.00042506490741530724, 'samples': 7575360, 'steps': 39454, 'loss/train': 1.4404360055923462} -08/30/2021 20:18:20 - INFO - __main__ - Step 39456: {'lr': 0.00042506111895336616, 'samples': 7575552, 'steps': 39455, 'loss/train': 1.480907917022705} -08/30/2021 20:18:21 - INFO - __main__ - Step 39457: {'lr': 0.00042505733041254526, 'samples': 7575744, 'steps': 39456, 'loss/train': 0.9219895601272583} -08/30/2021 20:18:21 - INFO - __main__ - Step 39458: {'lr': 0.00042505354179284615, 'samples': 7575936, 'steps': 39457, 'loss/train': 1.2193272113800049} -08/30/2021 20:18:21 - INFO - __main__ - Step 39459: {'lr': 0.00042504975309427064, 'samples': 7576128, 'steps': 39458, 'loss/train': 0.9388018250465393} -08/30/2021 20:18:22 - INFO - __main__ - Step 39460: {'lr': 0.0004250459643168204, 'samples': 7576320, 'steps': 39459, 'loss/train': 1.744175672531128} -08/30/2021 20:18:22 - INFO - __main__ - Step 39461: {'lr': 0.0004250421754604972, 'samples': 7576512, 'steps': 39460, 'loss/train': 1.3544243574142456} -08/30/2021 20:18:24 - INFO - __main__ - Step 39462: {'lr': 0.0004250383865253027, 'samples': 7576704, 'steps': 39461, 'loss/train': 0.6414830088615417} -08/30/2021 20:18:24 - INFO - __main__ - Step 39463: {'lr': 0.00042503459751123854, 'samples': 7576896, 'steps': 39462, 'loss/train': 1.3449714183807373} -08/30/2021 20:18:24 - INFO - __main__ - Step 39464: {'lr': 0.00042503080841830654, 'samples': 7577088, 'steps': 39463, 'loss/train': 1.4991395473480225} -08/30/2021 20:18:25 - INFO - __main__ - Step 39465: {'lr': 0.0004250270192465083, 'samples': 7577280, 'steps': 39464, 'loss/train': 0.6795907616615295} -08/30/2021 20:18:25 - INFO - __main__ - Step 39466: {'lr': 0.0004250232299958456, 'samples': 7577472, 'steps': 39465, 'loss/train': 1.0619497299194336} -08/30/2021 20:18:28 - INFO - __main__ - Step 39467: {'lr': 0.0004250194406663203, 'samples': 7577664, 'steps': 39466, 'loss/train': 0.04803982749581337} -08/30/2021 20:18:28 - INFO - __main__ - Step 39468: {'lr': 0.00042501565125793375, 'samples': 7577856, 'steps': 39467, 'loss/train': 0.48896893858909607} -08/30/2021 20:18:28 - INFO - __main__ - Step 39469: {'lr': 0.0004250118617706879, 'samples': 7578048, 'steps': 39468, 'loss/train': 0.471354603767395} -08/30/2021 20:18:29 - INFO - __main__ - Step 39470: {'lr': 0.0004250080722045844, 'samples': 7578240, 'steps': 39469, 'loss/train': 0.4417729675769806} -08/30/2021 20:18:29 - INFO - __main__ - Step 39471: {'lr': 0.000425004282559625, 'samples': 7578432, 'steps': 39470, 'loss/train': 1.9594004154205322} -08/30/2021 20:18:29 - INFO - __main__ - Step 39472: {'lr': 0.0004250004928358113, 'samples': 7578624, 'steps': 39471, 'loss/train': 1.3119771480560303} -08/30/2021 20:18:31 - INFO - __main__ - Step 39473: {'lr': 0.0004249967030331451, 'samples': 7578816, 'steps': 39472, 'loss/train': 1.843422532081604} -08/30/2021 20:18:31 - INFO - __main__ - Step 39474: {'lr': 0.0004249929131516281, 'samples': 7579008, 'steps': 39473, 'loss/train': 1.687857985496521} -08/30/2021 20:18:32 - INFO - __main__ - Step 39475: {'lr': 0.00042498912319126206, 'samples': 7579200, 'steps': 39474, 'loss/train': 1.562577486038208} -08/30/2021 20:18:32 - INFO - __main__ - Step 39476: {'lr': 0.00042498533315204855, 'samples': 7579392, 'steps': 39475, 'loss/train': 0.8977767825126648} -08/30/2021 20:18:32 - INFO - __main__ - Step 39477: {'lr': 0.0004249815430339894, 'samples': 7579584, 'steps': 39476, 'loss/train': 1.6779088973999023} -08/30/2021 20:18:34 - INFO - __main__ - Step 39478: {'lr': 0.0004249777528370862, 'samples': 7579776, 'steps': 39477, 'loss/train': 1.6529103517532349} -08/30/2021 20:18:34 - INFO - __main__ - Step 39479: {'lr': 0.00042497396256134073, 'samples': 7579968, 'steps': 39478, 'loss/train': 1.3054628372192383} -08/30/2021 20:18:35 - INFO - __main__ - Step 39480: {'lr': 0.0004249701722067547, 'samples': 7580160, 'steps': 39479, 'loss/train': 0.9560337662696838} -08/30/2021 20:18:35 - INFO - __main__ - Step 39481: {'lr': 0.0004249663817733298, 'samples': 7580352, 'steps': 39480, 'loss/train': 1.0896540880203247} -08/30/2021 20:18:36 - INFO - __main__ - Step 39482: {'lr': 0.00042496259126106786, 'samples': 7580544, 'steps': 39481, 'loss/train': 1.1687583923339844} -08/30/2021 20:18:36 - INFO - __main__ - Step 39483: {'lr': 0.0004249588006699704, 'samples': 7580736, 'steps': 39482, 'loss/train': 0.2920774817466736} -08/30/2021 20:18:37 - INFO - __main__ - Step 39484: {'lr': 0.0004249550100000392, 'samples': 7580928, 'steps': 39483, 'loss/train': 1.023453712463379} -08/30/2021 20:18:38 - INFO - __main__ - Step 39485: {'lr': 0.0004249512192512759, 'samples': 7581120, 'steps': 39484, 'loss/train': 1.498961329460144} -08/30/2021 20:18:38 - INFO - __main__ - Step 39486: {'lr': 0.0004249474284236824, 'samples': 7581312, 'steps': 39485, 'loss/train': 1.3543148040771484} -08/30/2021 20:18:39 - INFO - __main__ - Step 39487: {'lr': 0.0004249436375172602, 'samples': 7581504, 'steps': 39486, 'loss/train': 5.647855281829834} -08/30/2021 20:18:39 - INFO - __main__ - Step 39488: {'lr': 0.0004249398465320111, 'samples': 7581696, 'steps': 39487, 'loss/train': 1.8692651987075806} -08/30/2021 20:18:41 - INFO - __main__ - Step 39489: {'lr': 0.0004249360554679369, 'samples': 7581888, 'steps': 39488, 'loss/train': 1.686635136604309} -08/30/2021 20:18:41 - INFO - __main__ - Step 39490: {'lr': 0.00042493226432503917, 'samples': 7582080, 'steps': 39489, 'loss/train': 1.572129726409912} -08/30/2021 20:18:42 - INFO - __main__ - Step 39491: {'lr': 0.00042492847310331963, 'samples': 7582272, 'steps': 39490, 'loss/train': 1.2694830894470215} -08/30/2021 20:18:42 - INFO - __main__ - Step 39492: {'lr': 0.00042492468180278, 'samples': 7582464, 'steps': 39491, 'loss/train': 1.402726650238037} -08/30/2021 20:18:42 - INFO - __main__ - Step 39493: {'lr': 0.000424920890423422, 'samples': 7582656, 'steps': 39492, 'loss/train': 1.7928509712219238} -08/30/2021 20:18:43 - INFO - __main__ - Step 39494: {'lr': 0.0004249170989652474, 'samples': 7582848, 'steps': 39493, 'loss/train': 1.0122957229614258} -08/30/2021 20:18:44 - INFO - __main__ - Step 39495: {'lr': 0.00042491330742825783, 'samples': 7583040, 'steps': 39494, 'loss/train': 0.059469517320394516} -08/30/2021 20:18:45 - INFO - __main__ - Step 39496: {'lr': 0.0004249095158124551, 'samples': 7583232, 'steps': 39495, 'loss/train': 1.5529097318649292} -08/30/2021 20:18:45 - INFO - __main__ - Step 39497: {'lr': 0.0004249057241178407, 'samples': 7583424, 'steps': 39496, 'loss/train': 1.6514521837234497} -08/30/2021 20:18:45 - INFO - __main__ - Step 39498: {'lr': 0.00042490193234441656, 'samples': 7583616, 'steps': 39497, 'loss/train': 1.4907827377319336} -08/30/2021 20:18:46 - INFO - __main__ - Step 39499: {'lr': 0.00042489814049218434, 'samples': 7583808, 'steps': 39498, 'loss/train': 1.4580267667770386} -08/30/2021 20:18:46 - INFO - __main__ - Step 39500: {'lr': 0.00042489434856114565, 'samples': 7584000, 'steps': 39499, 'loss/train': 1.9874862432479858} -08/30/2021 20:18:47 - INFO - __main__ - Step 39501: {'lr': 0.00042489055655130226, 'samples': 7584192, 'steps': 39500, 'loss/train': 1.38264000415802} -08/30/2021 20:18:48 - INFO - __main__ - Step 39502: {'lr': 0.00042488676446265596, 'samples': 7584384, 'steps': 39501, 'loss/train': 1.1394124031066895} -08/30/2021 20:18:48 - INFO - __main__ - Step 39503: {'lr': 0.00042488297229520834, 'samples': 7584576, 'steps': 39502, 'loss/train': 1.03812575340271} -08/30/2021 20:18:49 - INFO - __main__ - Step 39504: {'lr': 0.00042487918004896117, 'samples': 7584768, 'steps': 39503, 'loss/train': 0.8285332322120667} -08/30/2021 20:18:49 - INFO - __main__ - Step 39505: {'lr': 0.0004248753877239161, 'samples': 7584960, 'steps': 39504, 'loss/train': 1.6451088190078735} -08/30/2021 20:18:50 - INFO - __main__ - Step 39506: {'lr': 0.0004248715953200749, 'samples': 7585152, 'steps': 39505, 'loss/train': 1.5462449789047241} -08/30/2021 20:18:51 - INFO - __main__ - Step 39507: {'lr': 0.00042486780283743927, 'samples': 7585344, 'steps': 39506, 'loss/train': 1.0202428102493286} -08/30/2021 20:18:51 - INFO - __main__ - Step 39508: {'lr': 0.00042486401027601084, 'samples': 7585536, 'steps': 39507, 'loss/train': 0.9145278930664062} -08/30/2021 20:18:52 - INFO - __main__ - Step 39509: {'lr': 0.0004248602176357915, 'samples': 7585728, 'steps': 39508, 'loss/train': 1.6860967874526978} -08/30/2021 20:18:52 - INFO - __main__ - Step 39510: {'lr': 0.0004248564249167828, 'samples': 7585920, 'steps': 39509, 'loss/train': 1.3073070049285889} -08/30/2021 20:18:54 - INFO - __main__ - Step 39511: {'lr': 0.00042485263211898647, 'samples': 7586112, 'steps': 39510, 'loss/train': 0.9959359765052795} -08/30/2021 20:18:54 - INFO - __main__ - Step 39512: {'lr': 0.00042484883924240427, 'samples': 7586304, 'steps': 39511, 'loss/train': 0.91527259349823} -08/30/2021 20:18:55 - INFO - __main__ - Step 39513: {'lr': 0.0004248450462870378, 'samples': 7586496, 'steps': 39512, 'loss/train': 1.3920543193817139} -08/30/2021 20:18:55 - INFO - __main__ - Step 39514: {'lr': 0.0004248412532528889, 'samples': 7586688, 'steps': 39513, 'loss/train': 1.7589521408081055} -08/30/2021 20:18:55 - INFO - __main__ - Step 39515: {'lr': 0.00042483746013995924, 'samples': 7586880, 'steps': 39514, 'loss/train': 1.122774600982666} -08/30/2021 20:18:57 - INFO - __main__ - Step 39516: {'lr': 0.00042483366694825054, 'samples': 7587072, 'steps': 39515, 'loss/train': 1.2255520820617676} -08/30/2021 20:18:57 - INFO - __main__ - Step 39517: {'lr': 0.0004248298736777645, 'samples': 7587264, 'steps': 39516, 'loss/train': 1.5675015449523926} -08/30/2021 20:18:58 - INFO - __main__ - Step 39518: {'lr': 0.00042482608032850275, 'samples': 7587456, 'steps': 39517, 'loss/train': 1.147222876548767} -08/30/2021 20:18:58 - INFO - __main__ - Step 39519: {'lr': 0.0004248222869004671, 'samples': 7587648, 'steps': 39518, 'loss/train': 1.7895618677139282} -08/30/2021 20:18:58 - INFO - __main__ - Step 39520: {'lr': 0.0004248184933936592, 'samples': 7587840, 'steps': 39519, 'loss/train': 1.3324826955795288} -08/30/2021 20:19:00 - INFO - __main__ - Step 39521: {'lr': 0.0004248146998080808, 'samples': 7588032, 'steps': 39520, 'loss/train': 1.1157089471817017} -08/30/2021 20:19:00 - INFO - __main__ - Step 39522: {'lr': 0.00042481090614373364, 'samples': 7588224, 'steps': 39521, 'loss/train': 1.195725917816162} -08/30/2021 20:19:01 - INFO - __main__ - Step 39523: {'lr': 0.00042480711240061933, 'samples': 7588416, 'steps': 39522, 'loss/train': 1.6636579036712646} -08/30/2021 20:19:01 - INFO - __main__ - Step 39524: {'lr': 0.0004248033185787397, 'samples': 7588608, 'steps': 39523, 'loss/train': 2.113940954208374} -08/30/2021 20:19:01 - INFO - __main__ - Step 39525: {'lr': 0.00042479952467809623, 'samples': 7588800, 'steps': 39524, 'loss/train': 0.8742247223854065} -08/30/2021 20:19:02 - INFO - __main__ - Step 39526: {'lr': 0.00042479573069869095, 'samples': 7588992, 'steps': 39525, 'loss/train': 1.3103822469711304} -08/30/2021 20:19:03 - INFO - __main__ - Step 39527: {'lr': 0.0004247919366405253, 'samples': 7589184, 'steps': 39526, 'loss/train': 0.8090722560882568} -08/30/2021 20:19:04 - INFO - __main__ - Step 39528: {'lr': 0.0004247881425036012, 'samples': 7589376, 'steps': 39527, 'loss/train': 1.4750295877456665} -08/30/2021 20:19:04 - INFO - __main__ - Step 39529: {'lr': 0.00042478434828792025, 'samples': 7589568, 'steps': 39528, 'loss/train': 1.0613157749176025} -08/30/2021 20:19:04 - INFO - __main__ - Step 39530: {'lr': 0.00042478055399348415, 'samples': 7589760, 'steps': 39529, 'loss/train': 1.7844194173812866} -08/30/2021 20:19:05 - INFO - __main__ - Step 39531: {'lr': 0.0004247767596202946, 'samples': 7589952, 'steps': 39530, 'loss/train': 1.3964990377426147} -08/30/2021 20:19:06 - INFO - __main__ - Step 39532: {'lr': 0.00042477296516835335, 'samples': 7590144, 'steps': 39531, 'loss/train': 1.268181324005127} -08/30/2021 20:19:07 - INFO - __main__ - Step 39533: {'lr': 0.00042476917063766207, 'samples': 7590336, 'steps': 39532, 'loss/train': 2.2163519859313965} -08/30/2021 20:19:07 - INFO - __main__ - Step 39534: {'lr': 0.0004247653760282225, 'samples': 7590528, 'steps': 39533, 'loss/train': 1.7320178747177124} -08/30/2021 20:19:08 - INFO - __main__ - Step 39535: {'lr': 0.0004247615813400364, 'samples': 7590720, 'steps': 39534, 'loss/train': 1.2027949094772339} -08/30/2021 20:19:08 - INFO - __main__ - Step 39536: {'lr': 0.0004247577865731055, 'samples': 7590912, 'steps': 39535, 'loss/train': 0.5038268566131592} -08/30/2021 20:19:09 - INFO - __main__ - Step 39537: {'lr': 0.00042475399172743134, 'samples': 7591104, 'steps': 39536, 'loss/train': 1.6581089496612549} -08/30/2021 20:19:10 - INFO - __main__ - Step 39538: {'lr': 0.0004247501968030157, 'samples': 7591296, 'steps': 39537, 'loss/train': 1.2676939964294434} -08/30/2021 20:19:10 - INFO - __main__ - Step 39539: {'lr': 0.00042474640179986035, 'samples': 7591488, 'steps': 39538, 'loss/train': 0.9572631120681763} -08/30/2021 20:19:10 - INFO - __main__ - Step 39540: {'lr': 0.00042474260671796697, 'samples': 7591680, 'steps': 39539, 'loss/train': 1.9065203666687012} -08/30/2021 20:19:11 - INFO - __main__ - Step 39541: {'lr': 0.0004247388115573373, 'samples': 7591872, 'steps': 39540, 'loss/train': 1.538730263710022} -08/30/2021 20:19:12 - INFO - __main__ - Step 39542: {'lr': 0.00042473501631797294, 'samples': 7592064, 'steps': 39541, 'loss/train': 0.1999540627002716} -08/30/2021 20:19:13 - INFO - __main__ - Step 39543: {'lr': 0.0004247312209998758, 'samples': 7592256, 'steps': 39542, 'loss/train': 1.7726805210113525} -08/30/2021 20:19:13 - INFO - __main__ - Step 39544: {'lr': 0.00042472742560304734, 'samples': 7592448, 'steps': 39543, 'loss/train': 1.321663737297058} -08/30/2021 20:19:13 - INFO - __main__ - Step 39545: {'lr': 0.00042472363012748947, 'samples': 7592640, 'steps': 39544, 'loss/train': 1.5099347829818726} -08/30/2021 20:19:14 - INFO - __main__ - Step 39546: {'lr': 0.00042471983457320384, 'samples': 7592832, 'steps': 39545, 'loss/train': 1.6786268949508667} -08/30/2021 20:19:16 - INFO - __main__ - Step 39547: {'lr': 0.00042471603894019206, 'samples': 7593024, 'steps': 39546, 'loss/train': 1.2953327894210815} -08/30/2021 20:19:16 - INFO - __main__ - Step 39548: {'lr': 0.00042471224322845603, 'samples': 7593216, 'steps': 39547, 'loss/train': 0.9177379608154297} -08/30/2021 20:19:16 - INFO - __main__ - Step 39549: {'lr': 0.00042470844743799734, 'samples': 7593408, 'steps': 39548, 'loss/train': 0.6467287540435791} -08/30/2021 20:19:17 - INFO - __main__ - Step 39550: {'lr': 0.00042470465156881765, 'samples': 7593600, 'steps': 39549, 'loss/train': 1.0442194938659668} -08/30/2021 20:19:17 - INFO - __main__ - Step 39551: {'lr': 0.00042470085562091887, 'samples': 7593792, 'steps': 39550, 'loss/train': 1.3773002624511719} -08/30/2021 20:19:19 - INFO - __main__ - Step 39552: {'lr': 0.0004246970595943025, 'samples': 7593984, 'steps': 39551, 'loss/train': 0.7412907481193542} -08/30/2021 20:19:19 - INFO - __main__ - Step 39553: {'lr': 0.0004246932634889703, 'samples': 7594176, 'steps': 39552, 'loss/train': 1.5008081197738647} -08/30/2021 20:19:20 - INFO - __main__ - Step 39554: {'lr': 0.00042468946730492404, 'samples': 7594368, 'steps': 39553, 'loss/train': 1.4761254787445068} -08/30/2021 20:19:20 - INFO - __main__ - Step 39555: {'lr': 0.00042468567104216536, 'samples': 7594560, 'steps': 39554, 'loss/train': 1.5336171388626099} -08/30/2021 20:19:20 - INFO - __main__ - Step 39556: {'lr': 0.0004246818747006961, 'samples': 7594752, 'steps': 39555, 'loss/train': 1.179232120513916} -08/30/2021 20:19:22 - INFO - __main__ - Step 39557: {'lr': 0.00042467807828051787, 'samples': 7594944, 'steps': 39556, 'loss/train': 1.318572759628296} -08/30/2021 20:19:22 - INFO - __main__ - Step 39558: {'lr': 0.0004246742817816323, 'samples': 7595136, 'steps': 39557, 'loss/train': 1.4071831703186035} -08/30/2021 20:19:23 - INFO - __main__ - Step 39559: {'lr': 0.00042467048520404126, 'samples': 7595328, 'steps': 39558, 'loss/train': 1.3430149555206299} -08/30/2021 20:19:23 - INFO - __main__ - Step 39560: {'lr': 0.00042466668854774636, 'samples': 7595520, 'steps': 39559, 'loss/train': 1.8356088399887085} -08/30/2021 20:19:23 - INFO - __main__ - Step 39561: {'lr': 0.00042466289181274943, 'samples': 7595712, 'steps': 39560, 'loss/train': 0.9999196529388428} -08/30/2021 20:19:26 - INFO - __main__ - Step 39562: {'lr': 0.00042465909499905206, 'samples': 7595904, 'steps': 39561, 'loss/train': 1.8007441759109497} -08/30/2021 20:19:26 - INFO - __main__ - Step 39563: {'lr': 0.0004246552981066559, 'samples': 7596096, 'steps': 39562, 'loss/train': 1.6961530447006226} -08/30/2021 20:19:26 - INFO - __main__ - Step 39564: {'lr': 0.0004246515011355629, 'samples': 7596288, 'steps': 39563, 'loss/train': 1.6991370916366577} -08/30/2021 20:19:27 - INFO - __main__ - Step 39565: {'lr': 0.0004246477040857746, 'samples': 7596480, 'steps': 39564, 'loss/train': 1.9942409992218018} -08/30/2021 20:19:27 - INFO - __main__ - Step 39566: {'lr': 0.0004246439069572926, 'samples': 7596672, 'steps': 39565, 'loss/train': 1.7631640434265137} -08/30/2021 20:19:27 - INFO - __main__ - Step 39567: {'lr': 0.00042464010975011893, 'samples': 7596864, 'steps': 39566, 'loss/train': 1.181044578552246} -08/30/2021 20:19:29 - INFO - __main__ - Step 39568: {'lr': 0.00042463631246425504, 'samples': 7597056, 'steps': 39567, 'loss/train': 0.8439130187034607} -08/30/2021 20:19:29 - INFO - __main__ - Step 39569: {'lr': 0.0004246325150997027, 'samples': 7597248, 'steps': 39568, 'loss/train': 1.4189765453338623} -08/30/2021 20:19:30 - INFO - __main__ - Step 39570: {'lr': 0.0004246287176564637, 'samples': 7597440, 'steps': 39569, 'loss/train': 1.715533971786499} -08/30/2021 20:19:30 - INFO - __main__ - Step 39571: {'lr': 0.0004246249201345397, 'samples': 7597632, 'steps': 39570, 'loss/train': 1.205657720565796} -08/30/2021 20:19:30 - INFO - __main__ - Step 39572: {'lr': 0.0004246211225339323, 'samples': 7597824, 'steps': 39571, 'loss/train': 1.4443302154541016} -08/30/2021 20:19:32 - INFO - __main__ - Step 39573: {'lr': 0.0004246173248546434, 'samples': 7598016, 'steps': 39572, 'loss/train': 1.4024207592010498} -08/30/2021 20:19:32 - INFO - __main__ - Step 39574: {'lr': 0.0004246135270966747, 'samples': 7598208, 'steps': 39573, 'loss/train': 1.9255534410476685} -08/30/2021 20:19:33 - INFO - __main__ - Step 39575: {'lr': 0.00042460972926002774, 'samples': 7598400, 'steps': 39574, 'loss/train': 1.9846572875976562} -08/30/2021 20:19:33 - INFO - __main__ - Step 39576: {'lr': 0.00042460593134470426, 'samples': 7598592, 'steps': 39575, 'loss/train': 0.5578235983848572} -08/30/2021 20:19:34 - INFO - __main__ - Step 39577: {'lr': 0.0004246021333507062, 'samples': 7598784, 'steps': 39576, 'loss/train': 1.2485721111297607} -08/30/2021 20:19:35 - INFO - __main__ - Step 39578: {'lr': 0.00042459833527803503, 'samples': 7598976, 'steps': 39577, 'loss/train': 1.5933971405029297} -08/30/2021 20:19:36 - INFO - __main__ - Step 39579: {'lr': 0.00042459453712669255, 'samples': 7599168, 'steps': 39578, 'loss/train': 1.4226523637771606} -08/30/2021 20:19:36 - INFO - __main__ - Step 39580: {'lr': 0.0004245907388966804, 'samples': 7599360, 'steps': 39579, 'loss/train': 1.3121119737625122} -08/30/2021 20:19:36 - INFO - __main__ - Step 39581: {'lr': 0.0004245869405880005, 'samples': 7599552, 'steps': 39580, 'loss/train': 1.4871419668197632} -08/30/2021 20:19:37 - INFO - __main__ - Step 39582: {'lr': 0.0004245831422006543, 'samples': 7599744, 'steps': 39581, 'loss/train': 1.8283289670944214} -08/30/2021 20:19:39 - INFO - __main__ - Step 39583: {'lr': 0.0004245793437346437, 'samples': 7599936, 'steps': 39582, 'loss/train': 1.5888737440109253} -08/30/2021 20:19:39 - INFO - __main__ - Step 39584: {'lr': 0.0004245755451899703, 'samples': 7600128, 'steps': 39583, 'loss/train': 1.085365653038025} -08/30/2021 20:19:39 - INFO - __main__ - Step 39585: {'lr': 0.0004245717465666359, 'samples': 7600320, 'steps': 39584, 'loss/train': 0.13444222509860992} -08/30/2021 20:19:40 - INFO - __main__ - Step 39586: {'lr': 0.0004245679478646421, 'samples': 7600512, 'steps': 39585, 'loss/train': 1.1106112003326416} -08/30/2021 20:19:40 - INFO - __main__ - Step 39587: {'lr': 0.00042456414908399075, 'samples': 7600704, 'steps': 39586, 'loss/train': 1.6339653730392456} -08/30/2021 20:19:42 - INFO - __main__ - Step 39588: {'lr': 0.00042456035022468344, 'samples': 7600896, 'steps': 39587, 'loss/train': 2.0127503871917725} -08/30/2021 20:19:42 - INFO - __main__ - Step 39589: {'lr': 0.0004245565512867219, 'samples': 7601088, 'steps': 39588, 'loss/train': 1.4844590425491333} -08/30/2021 20:19:43 - INFO - __main__ - Step 39590: {'lr': 0.000424552752270108, 'samples': 7601280, 'steps': 39589, 'loss/train': 0.3811574876308441} -08/30/2021 20:19:43 - INFO - __main__ - Step 39591: {'lr': 0.0004245489531748432, 'samples': 7601472, 'steps': 39590, 'loss/train': 1.7608567476272583} -08/30/2021 20:19:43 - INFO - __main__ - Step 39592: {'lr': 0.00042454515400092944, 'samples': 7601664, 'steps': 39591, 'loss/train': 5.242020606994629} -08/30/2021 20:19:44 - INFO - __main__ - Step 39593: {'lr': 0.00042454135474836817, 'samples': 7601856, 'steps': 39592, 'loss/train': 1.218087077140808} -08/30/2021 20:19:45 - INFO - __main__ - Step 39594: {'lr': 0.0004245375554171613, 'samples': 7602048, 'steps': 39593, 'loss/train': 0.9052404165267944} -08/30/2021 20:19:46 - INFO - __main__ - Step 39595: {'lr': 0.00042453375600731057, 'samples': 7602240, 'steps': 39594, 'loss/train': 1.5481382608413696} -08/30/2021 20:19:46 - INFO - __main__ - Step 39596: {'lr': 0.00042452995651881764, 'samples': 7602432, 'steps': 39595, 'loss/train': 1.738535761833191} -08/30/2021 20:19:46 - INFO - __main__ - Step 39597: {'lr': 0.0004245261569516842, 'samples': 7602624, 'steps': 39596, 'loss/train': 0.7275892496109009} -08/30/2021 20:19:47 - INFO - __main__ - Step 39598: {'lr': 0.00042452235730591195, 'samples': 7602816, 'steps': 39597, 'loss/train': 1.4351816177368164} -08/30/2021 20:19:48 - INFO - __main__ - Step 39599: {'lr': 0.00042451855758150254, 'samples': 7603008, 'steps': 39598, 'loss/train': 0.7411654591560364} -08/30/2021 20:19:49 - INFO - __main__ - Step 39600: {'lr': 0.00042451475777845784, 'samples': 7603200, 'steps': 39599, 'loss/train': 1.7640950679779053} -08/30/2021 20:19:49 - INFO - __main__ - Step 39601: {'lr': 0.00042451095789677943, 'samples': 7603392, 'steps': 39600, 'loss/train': 1.423945665359497} -08/30/2021 20:19:49 - INFO - __main__ - Step 39602: {'lr': 0.0004245071579364691, 'samples': 7603584, 'steps': 39601, 'loss/train': 1.0180280208587646} -08/30/2021 20:19:50 - INFO - __main__ - Step 39603: {'lr': 0.0004245033578975286, 'samples': 7603776, 'steps': 39602, 'loss/train': 1.0098040103912354} -08/30/2021 20:19:51 - INFO - __main__ - Step 39604: {'lr': 0.00042449955777995954, 'samples': 7603968, 'steps': 39603, 'loss/train': 1.530120849609375} -08/30/2021 20:19:52 - INFO - __main__ - Step 39605: {'lr': 0.0004244957575837636, 'samples': 7604160, 'steps': 39604, 'loss/train': 1.3768794536590576} -08/30/2021 20:19:52 - INFO - __main__ - Step 39606: {'lr': 0.00042449195730894266, 'samples': 7604352, 'steps': 39605, 'loss/train': 1.3495783805847168} -08/30/2021 20:19:53 - INFO - __main__ - Step 39607: {'lr': 0.00042448815695549823, 'samples': 7604544, 'steps': 39606, 'loss/train': 1.0748873949050903} -08/30/2021 20:19:53 - INFO - __main__ - Step 39608: {'lr': 0.00042448435652343223, 'samples': 7604736, 'steps': 39607, 'loss/train': 0.28193408250808716} -08/30/2021 20:19:53 - INFO - __main__ - Step 39609: {'lr': 0.0004244805560127463, 'samples': 7604928, 'steps': 39608, 'loss/train': 1.3490265607833862} -08/30/2021 20:19:55 - INFO - __main__ - Step 39610: {'lr': 0.00042447675542344203, 'samples': 7605120, 'steps': 39609, 'loss/train': 1.0516595840454102} -08/30/2021 20:19:55 - INFO - __main__ - Step 39611: {'lr': 0.0004244729547555213, 'samples': 7605312, 'steps': 39610, 'loss/train': 1.6864597797393799} -08/30/2021 20:19:56 - INFO - __main__ - Step 39612: {'lr': 0.00042446915400898565, 'samples': 7605504, 'steps': 39611, 'loss/train': 1.721461296081543} -08/30/2021 20:19:56 - INFO - __main__ - Step 39613: {'lr': 0.00042446535318383695, 'samples': 7605696, 'steps': 39612, 'loss/train': 1.4178909063339233} -08/30/2021 20:19:56 - INFO - __main__ - Step 39614: {'lr': 0.00042446155228007687, 'samples': 7605888, 'steps': 39613, 'loss/train': 1.7122137546539307} -08/30/2021 20:19:58 - INFO - __main__ - Step 39615: {'lr': 0.0004244577512977071, 'samples': 7606080, 'steps': 39614, 'loss/train': 2.324068307876587} -08/30/2021 20:19:59 - INFO - __main__ - Step 39616: {'lr': 0.00042445395023672935, 'samples': 7606272, 'steps': 39615, 'loss/train': 1.7929363250732422} -08/30/2021 20:19:59 - INFO - __main__ - Step 39617: {'lr': 0.0004244501490971454, 'samples': 7606464, 'steps': 39616, 'loss/train': 1.9229449033737183} -08/30/2021 20:19:59 - INFO - __main__ - Step 39618: {'lr': 0.0004244463478789568, 'samples': 7606656, 'steps': 39617, 'loss/train': 0.8985770344734192} -08/30/2021 20:20:00 - INFO - __main__ - Step 39619: {'lr': 0.0004244425465821654, 'samples': 7606848, 'steps': 39618, 'loss/train': 1.1737024784088135} -08/30/2021 20:20:00 - INFO - __main__ - Step 39620: {'lr': 0.0004244387452067729, 'samples': 7607040, 'steps': 39619, 'loss/train': 0.37495139241218567} -08/30/2021 20:20:02 - INFO - __main__ - Step 39621: {'lr': 0.000424434943752781, 'samples': 7607232, 'steps': 39620, 'loss/train': 1.5510468482971191} -08/30/2021 20:20:02 - INFO - __main__ - Step 39622: {'lr': 0.0004244311422201914, 'samples': 7607424, 'steps': 39621, 'loss/train': 1.1349774599075317} -08/30/2021 20:20:03 - INFO - __main__ - Step 39623: {'lr': 0.0004244273406090058, 'samples': 7607616, 'steps': 39622, 'loss/train': 1.3849761486053467} -08/30/2021 20:20:03 - INFO - __main__ - Step 39624: {'lr': 0.000424423538919226, 'samples': 7607808, 'steps': 39623, 'loss/train': 1.084895133972168} -08/30/2021 20:20:03 - INFO - __main__ - Step 39625: {'lr': 0.0004244197371508536, 'samples': 7608000, 'steps': 39624, 'loss/train': 2.32084059715271} -08/30/2021 20:20:05 - INFO - __main__ - Step 39626: {'lr': 0.00042441593530389025, 'samples': 7608192, 'steps': 39625, 'loss/train': 1.5204460620880127} -08/30/2021 20:20:05 - INFO - __main__ - Step 39627: {'lr': 0.0004244121333783379, 'samples': 7608384, 'steps': 39626, 'loss/train': 1.4676190614700317} -08/30/2021 20:20:06 - INFO - __main__ - Step 39628: {'lr': 0.0004244083313741981, 'samples': 7608576, 'steps': 39627, 'loss/train': 1.4633153676986694} -08/30/2021 20:20:06 - INFO - __main__ - Step 39629: {'lr': 0.0004244045292914726, 'samples': 7608768, 'steps': 39628, 'loss/train': 1.313714861869812} -08/30/2021 20:20:06 - INFO - __main__ - Step 39630: {'lr': 0.00042440072713016317, 'samples': 7608960, 'steps': 39629, 'loss/train': 1.387855052947998} -08/30/2021 20:20:08 - INFO - __main__ - Step 39631: {'lr': 0.00042439692489027136, 'samples': 7609152, 'steps': 39630, 'loss/train': 1.3798304796218872} -08/30/2021 20:20:08 - INFO - __main__ - Step 39632: {'lr': 0.000424393122571799, 'samples': 7609344, 'steps': 39631, 'loss/train': 1.1280311346054077} -08/30/2021 20:20:09 - INFO - __main__ - Step 39633: {'lr': 0.00042438932017474783, 'samples': 7609536, 'steps': 39632, 'loss/train': 1.1781045198440552} -08/30/2021 20:20:09 - INFO - __main__ - Step 39634: {'lr': 0.0004243855176991195, 'samples': 7609728, 'steps': 39633, 'loss/train': 1.705105185508728} -08/30/2021 20:20:09 - INFO - __main__ - Step 39635: {'lr': 0.0004243817151449158, 'samples': 7609920, 'steps': 39634, 'loss/train': 1.374541163444519} -08/30/2021 20:20:11 - INFO - __main__ - Step 39636: {'lr': 0.0004243779125121383, 'samples': 7610112, 'steps': 39635, 'loss/train': 1.4222357273101807} -08/30/2021 20:20:11 - INFO - __main__ - Step 39637: {'lr': 0.00042437410980078894, 'samples': 7610304, 'steps': 39636, 'loss/train': 1.373152732849121} -08/30/2021 20:20:12 - INFO - __main__ - Step 39638: {'lr': 0.0004243703070108692, 'samples': 7610496, 'steps': 39637, 'loss/train': 1.3218297958374023} -08/30/2021 20:20:12 - INFO - __main__ - Step 39639: {'lr': 0.00042436650414238086, 'samples': 7610688, 'steps': 39638, 'loss/train': 0.9254968762397766} -08/30/2021 20:20:12 - INFO - __main__ - Step 39640: {'lr': 0.0004243627011953257, 'samples': 7610880, 'steps': 39639, 'loss/train': 1.0002259016036987} -08/30/2021 20:20:14 - INFO - __main__ - Step 39641: {'lr': 0.0004243588981697054, 'samples': 7611072, 'steps': 39640, 'loss/train': 1.3645919561386108} -08/30/2021 20:20:14 - INFO - __main__ - Step 39642: {'lr': 0.0004243550950655217, 'samples': 7611264, 'steps': 39641, 'loss/train': 2.0988473892211914} -08/30/2021 20:20:15 - INFO - __main__ - Step 39643: {'lr': 0.00042435129188277625, 'samples': 7611456, 'steps': 39642, 'loss/train': 1.6015135049819946} -08/30/2021 20:20:15 - INFO - __main__ - Step 39644: {'lr': 0.0004243474886214708, 'samples': 7611648, 'steps': 39643, 'loss/train': 1.3720701932907104} -08/30/2021 20:20:15 - INFO - __main__ - Step 39645: {'lr': 0.0004243436852816071, 'samples': 7611840, 'steps': 39644, 'loss/train': 1.2842869758605957} -08/30/2021 20:20:17 - INFO - __main__ - Step 39646: {'lr': 0.0004243398818631868, 'samples': 7612032, 'steps': 39645, 'loss/train': 1.5468418598175049} -08/30/2021 20:20:17 - INFO - __main__ - Step 39647: {'lr': 0.0004243360783662116, 'samples': 7612224, 'steps': 39646, 'loss/train': 0.5295102000236511} -08/30/2021 20:20:18 - INFO - __main__ - Step 39648: {'lr': 0.0004243322747906833, 'samples': 7612416, 'steps': 39647, 'loss/train': 0.30289480090141296} -08/30/2021 20:20:18 - INFO - __main__ - Step 39649: {'lr': 0.00042432847113660355, 'samples': 7612608, 'steps': 39648, 'loss/train': 0.9014484286308289} -08/30/2021 20:20:18 - INFO - __main__ - Step 39650: {'lr': 0.0004243246674039741, 'samples': 7612800, 'steps': 39649, 'loss/train': 1.8353095054626465} -08/30/2021 20:20:20 - INFO - __main__ - Step 39651: {'lr': 0.00042432086359279667, 'samples': 7612992, 'steps': 39650, 'loss/train': 1.4529352188110352} -08/30/2021 20:20:20 - INFO - __main__ - Step 39652: {'lr': 0.0004243170597030729, 'samples': 7613184, 'steps': 39651, 'loss/train': 1.6424646377563477} -08/30/2021 20:20:21 - INFO - __main__ - Step 39653: {'lr': 0.0004243132557348045, 'samples': 7613376, 'steps': 39652, 'loss/train': 1.0673192739486694} -08/30/2021 20:20:21 - INFO - __main__ - Step 39654: {'lr': 0.00042430945168799326, 'samples': 7613568, 'steps': 39653, 'loss/train': 1.2372204065322876} -08/30/2021 20:20:21 - INFO - __main__ - Step 39655: {'lr': 0.000424305647562641, 'samples': 7613760, 'steps': 39654, 'loss/train': 0.9994213581085205} -08/30/2021 20:20:23 - INFO - __main__ - Step 39656: {'lr': 0.00042430184335874924, 'samples': 7613952, 'steps': 39655, 'loss/train': 1.098544955253601} -08/30/2021 20:20:23 - INFO - __main__ - Step 39657: {'lr': 0.0004242980390763197, 'samples': 7614144, 'steps': 39656, 'loss/train': 1.1567517518997192} -08/30/2021 20:20:24 - INFO - __main__ - Step 39658: {'lr': 0.0004242942347153542, 'samples': 7614336, 'steps': 39657, 'loss/train': 1.428024411201477} -08/30/2021 20:20:24 - INFO - __main__ - Step 39659: {'lr': 0.00042429043027585435, 'samples': 7614528, 'steps': 39658, 'loss/train': 1.4090584516525269} -08/30/2021 20:20:24 - INFO - __main__ - Step 39660: {'lr': 0.000424286625757822, 'samples': 7614720, 'steps': 39659, 'loss/train': 1.344565510749817} -08/30/2021 20:20:25 - INFO - __main__ - Step 39661: {'lr': 0.00042428282116125873, 'samples': 7614912, 'steps': 39660, 'loss/train': 1.4870916604995728} -08/30/2021 20:20:26 - INFO - __main__ - Step 39662: {'lr': 0.0004242790164861663, 'samples': 7615104, 'steps': 39661, 'loss/train': 1.3315699100494385} -08/30/2021 20:20:27 - INFO - __main__ - Step 39663: {'lr': 0.0004242752117325465, 'samples': 7615296, 'steps': 39662, 'loss/train': 1.230576515197754} -08/30/2021 20:20:27 - INFO - __main__ - Step 39664: {'lr': 0.000424271406900401, 'samples': 7615488, 'steps': 39663, 'loss/train': 0.9211643934249878} -08/30/2021 20:20:27 - INFO - __main__ - Step 39665: {'lr': 0.0004242676019897314, 'samples': 7615680, 'steps': 39664, 'loss/train': 1.0158231258392334} -08/30/2021 20:20:28 - INFO - __main__ - Step 39666: {'lr': 0.00042426379700053954, 'samples': 7615872, 'steps': 39665, 'loss/train': 1.5026607513427734} -08/30/2021 20:20:29 - INFO - __main__ - Step 39667: {'lr': 0.00042425999193282713, 'samples': 7616064, 'steps': 39666, 'loss/train': 1.8173192739486694} -08/30/2021 20:20:30 - INFO - __main__ - Step 39668: {'lr': 0.0004242561867865958, 'samples': 7616256, 'steps': 39667, 'loss/train': 1.5084888935089111} -08/30/2021 20:20:30 - INFO - __main__ - Step 39669: {'lr': 0.0004242523815618473, 'samples': 7616448, 'steps': 39668, 'loss/train': 1.3154528141021729} -08/30/2021 20:20:31 - INFO - __main__ - Step 39670: {'lr': 0.0004242485762585835, 'samples': 7616640, 'steps': 39669, 'loss/train': 1.3291431665420532} -08/30/2021 20:20:31 - INFO - __main__ - Step 39671: {'lr': 0.0004242447708768059, 'samples': 7616832, 'steps': 39670, 'loss/train': 1.6188416481018066} -08/30/2021 20:20:33 - INFO - __main__ - Step 39672: {'lr': 0.0004242409654165163, 'samples': 7617024, 'steps': 39671, 'loss/train': 1.55584716796875} -08/30/2021 20:20:33 - INFO - __main__ - Step 39673: {'lr': 0.00042423715987771637, 'samples': 7617216, 'steps': 39672, 'loss/train': 1.708908200263977} -08/30/2021 20:20:34 - INFO - __main__ - Step 39674: {'lr': 0.0004242333542604079, 'samples': 7617408, 'steps': 39673, 'loss/train': 1.2755793333053589} -08/30/2021 20:20:34 - INFO - __main__ - Step 39675: {'lr': 0.0004242295485645926, 'samples': 7617600, 'steps': 39674, 'loss/train': 1.422940969467163} -08/30/2021 20:20:34 - INFO - __main__ - Step 39676: {'lr': 0.0004242257427902721, 'samples': 7617792, 'steps': 39675, 'loss/train': 1.6290698051452637} -08/30/2021 20:20:36 - INFO - __main__ - Step 39677: {'lr': 0.00042422193693744827, 'samples': 7617984, 'steps': 39676, 'loss/train': 1.594285249710083} -08/30/2021 20:20:36 - INFO - __main__ - Step 39678: {'lr': 0.0004242181310061226, 'samples': 7618176, 'steps': 39677, 'loss/train': 2.1580467224121094} -08/30/2021 20:20:37 - INFO - __main__ - Step 39679: {'lr': 0.000424214324996297, 'samples': 7618368, 'steps': 39678, 'loss/train': 1.8396358489990234} -08/30/2021 20:20:37 - INFO - __main__ - Step 39680: {'lr': 0.000424210518907973, 'samples': 7618560, 'steps': 39679, 'loss/train': 1.3235629796981812} -08/30/2021 20:20:37 - INFO - __main__ - Step 39681: {'lr': 0.0004242067127411525, 'samples': 7618752, 'steps': 39680, 'loss/train': 1.2612700462341309} -08/30/2021 20:20:39 - INFO - __main__ - Step 39682: {'lr': 0.0004242029064958372, 'samples': 7618944, 'steps': 39681, 'loss/train': 1.8453831672668457} -08/30/2021 20:20:40 - INFO - __main__ - Step 39683: {'lr': 0.0004241991001720287, 'samples': 7619136, 'steps': 39682, 'loss/train': 1.2175443172454834} -08/30/2021 20:20:40 - INFO - __main__ - Step 39684: {'lr': 0.00042419529376972885, 'samples': 7619328, 'steps': 39683, 'loss/train': 1.4574471712112427} -08/30/2021 20:20:40 - INFO - __main__ - Step 39685: {'lr': 0.0004241914872889392, 'samples': 7619520, 'steps': 39684, 'loss/train': 1.4367091655731201} -08/30/2021 20:20:41 - INFO - __main__ - Step 39686: {'lr': 0.00042418768072966163, 'samples': 7619712, 'steps': 39685, 'loss/train': 1.7369105815887451} -08/30/2021 20:20:41 - INFO - __main__ - Step 39687: {'lr': 0.0004241838740918977, 'samples': 7619904, 'steps': 39686, 'loss/train': 2.5677261352539062} -08/30/2021 20:20:43 - INFO - __main__ - Step 39688: {'lr': 0.00042418006737564924, 'samples': 7620096, 'steps': 39687, 'loss/train': 1.3622618913650513} -08/30/2021 20:20:43 - INFO - __main__ - Step 39689: {'lr': 0.0004241762605809179, 'samples': 7620288, 'steps': 39688, 'loss/train': 1.7934119701385498} -08/30/2021 20:20:44 - INFO - __main__ - Step 39690: {'lr': 0.00042417245370770547, 'samples': 7620480, 'steps': 39689, 'loss/train': 1.4852654933929443} -08/30/2021 20:20:44 - INFO - __main__ - Step 39691: {'lr': 0.00042416864675601365, 'samples': 7620672, 'steps': 39690, 'loss/train': 2.3179264068603516} -08/30/2021 20:20:44 - INFO - __main__ - Step 39692: {'lr': 0.0004241648397258441, 'samples': 7620864, 'steps': 39691, 'loss/train': 1.2021403312683105} -08/30/2021 20:20:46 - INFO - __main__ - Step 39693: {'lr': 0.0004241610326171985, 'samples': 7621056, 'steps': 39692, 'loss/train': 1.3357957601547241} -08/30/2021 20:20:46 - INFO - __main__ - Step 39694: {'lr': 0.0004241572254300786, 'samples': 7621248, 'steps': 39693, 'loss/train': 1.3742859363555908} -08/30/2021 20:20:47 - INFO - __main__ - Step 39695: {'lr': 0.00042415341816448625, 'samples': 7621440, 'steps': 39694, 'loss/train': 0.7203447222709656} -08/30/2021 20:20:47 - INFO - __main__ - Step 39696: {'lr': 0.000424149610820423, 'samples': 7621632, 'steps': 39695, 'loss/train': 1.7883760929107666} -08/30/2021 20:20:47 - INFO - __main__ - Step 39697: {'lr': 0.00042414580339789065, 'samples': 7621824, 'steps': 39696, 'loss/train': 1.5429047346115112} -08/30/2021 20:20:49 - INFO - __main__ - Step 39698: {'lr': 0.00042414199589689084, 'samples': 7622016, 'steps': 39697, 'loss/train': 1.3451834917068481} -08/30/2021 20:20:49 - INFO - __main__ - Step 39699: {'lr': 0.0004241381883174254, 'samples': 7622208, 'steps': 39698, 'loss/train': 1.063746452331543} -08/30/2021 20:20:49 - INFO - __main__ - Step 39700: {'lr': 0.00042413438065949595, 'samples': 7622400, 'steps': 39699, 'loss/train': 1.5426853895187378} -08/30/2021 20:20:50 - INFO - __main__ - Step 39701: {'lr': 0.0004241305729231042, 'samples': 7622592, 'steps': 39700, 'loss/train': 1.979162573814392} -08/30/2021 20:20:50 - INFO - __main__ - Step 39702: {'lr': 0.00042412676510825197, 'samples': 7622784, 'steps': 39701, 'loss/train': 1.1119879484176636} -08/30/2021 20:20:52 - INFO - __main__ - Step 39703: {'lr': 0.00042412295721494086, 'samples': 7622976, 'steps': 39702, 'loss/train': 0.3166111707687378} -08/30/2021 20:20:52 - INFO - __main__ - Step 39704: {'lr': 0.00042411914924317265, 'samples': 7623168, 'steps': 39703, 'loss/train': 1.8205727338790894} -08/30/2021 20:20:53 - INFO - __main__ - Step 39705: {'lr': 0.00042411534119294903, 'samples': 7623360, 'steps': 39704, 'loss/train': 0.08558724820613861} -08/30/2021 20:20:53 - INFO - __main__ - Step 39706: {'lr': 0.0004241115330642717, 'samples': 7623552, 'steps': 39705, 'loss/train': 1.253430724143982} -08/30/2021 20:20:53 - INFO - __main__ - Step 39707: {'lr': 0.0004241077248571424, 'samples': 7623744, 'steps': 39706, 'loss/train': 1.7641167640686035} -08/30/2021 20:20:54 - INFO - __main__ - Step 39708: {'lr': 0.0004241039165715629, 'samples': 7623936, 'steps': 39707, 'loss/train': 1.6174490451812744} -08/30/2021 20:20:55 - INFO - __main__ - Step 39709: {'lr': 0.00042410010820753485, 'samples': 7624128, 'steps': 39708, 'loss/train': 1.50947904586792} -08/30/2021 20:20:56 - INFO - __main__ - Step 39710: {'lr': 0.00042409629976505994, 'samples': 7624320, 'steps': 39709, 'loss/train': 2.0942623615264893} -08/30/2021 20:20:56 - INFO - __main__ - Step 39711: {'lr': 0.00042409249124414, 'samples': 7624512, 'steps': 39710, 'loss/train': 1.424556851387024} -08/30/2021 20:20:57 - INFO - __main__ - Step 39712: {'lr': 0.00042408868264477657, 'samples': 7624704, 'steps': 39711, 'loss/train': 1.8498318195343018} -08/30/2021 20:20:57 - INFO - __main__ - Step 39713: {'lr': 0.00042408487396697147, 'samples': 7624896, 'steps': 39712, 'loss/train': 1.6383851766586304} -08/30/2021 20:20:58 - INFO - __main__ - Step 39714: {'lr': 0.0004240810652107265, 'samples': 7625088, 'steps': 39713, 'loss/train': 1.579742431640625} -08/30/2021 20:20:59 - INFO - __main__ - Step 39715: {'lr': 0.0004240772563760432, 'samples': 7625280, 'steps': 39714, 'loss/train': 1.310516119003296} -08/30/2021 20:20:59 - INFO - __main__ - Step 39716: {'lr': 0.00042407344746292345, 'samples': 7625472, 'steps': 39715, 'loss/train': 2.0912563800811768} -08/30/2021 20:21:00 - INFO - __main__ - Step 39717: {'lr': 0.00042406963847136883, 'samples': 7625664, 'steps': 39716, 'loss/train': 1.6308954954147339} -08/30/2021 20:21:00 - INFO - __main__ - Step 39718: {'lr': 0.0004240658294013812, 'samples': 7625856, 'steps': 39717, 'loss/train': 1.8312853574752808} -08/30/2021 20:21:01 - INFO - __main__ - Step 39719: {'lr': 0.00042406202025296213, 'samples': 7626048, 'steps': 39718, 'loss/train': 1.6745630502700806} -08/30/2021 20:21:02 - INFO - __main__ - Step 39720: {'lr': 0.00042405821102611336, 'samples': 7626240, 'steps': 39719, 'loss/train': 1.1348166465759277} -08/30/2021 20:21:02 - INFO - __main__ - Step 39721: {'lr': 0.0004240544017208367, 'samples': 7626432, 'steps': 39720, 'loss/train': 1.1951721906661987} -08/30/2021 20:21:03 - INFO - __main__ - Step 39722: {'lr': 0.0004240505923371338, 'samples': 7626624, 'steps': 39721, 'loss/train': 1.2257647514343262} -08/30/2021 20:21:03 - INFO - __main__ - Step 39723: {'lr': 0.0004240467828750064, 'samples': 7626816, 'steps': 39722, 'loss/train': 1.4201858043670654} -08/30/2021 20:21:05 - INFO - __main__ - Step 39724: {'lr': 0.0004240429733344562, 'samples': 7627008, 'steps': 39723, 'loss/train': 1.5598580837249756} -08/30/2021 20:21:06 - INFO - __main__ - Step 39725: {'lr': 0.0004240391637154849, 'samples': 7627200, 'steps': 39724, 'loss/train': 0.9043325781822205} -08/30/2021 20:21:06 - INFO - __main__ - Step 39726: {'lr': 0.0004240353540180942, 'samples': 7627392, 'steps': 39725, 'loss/train': 1.3059759140014648} -08/30/2021 20:21:06 - INFO - __main__ - Step 39727: {'lr': 0.00042403154424228596, 'samples': 7627584, 'steps': 39726, 'loss/train': 2.4985077381134033} -08/30/2021 20:21:07 - INFO - __main__ - Step 39728: {'lr': 0.00042402773438806175, 'samples': 7627776, 'steps': 39727, 'loss/train': 2.4102859497070312} -08/30/2021 20:21:07 - INFO - __main__ - Step 39729: {'lr': 0.00042402392445542333, 'samples': 7627968, 'steps': 39728, 'loss/train': 1.0131531953811646} -08/30/2021 20:21:07 - INFO - __main__ - Step 39730: {'lr': 0.0004240201144443724, 'samples': 7628160, 'steps': 39729, 'loss/train': 0.4219430685043335} -08/30/2021 20:21:09 - INFO - __main__ - Step 39731: {'lr': 0.00042401630435491073, 'samples': 7628352, 'steps': 39730, 'loss/train': 1.3452719449996948} -08/30/2021 20:21:10 - INFO - __main__ - Step 39732: {'lr': 0.00042401249418703996, 'samples': 7628544, 'steps': 39731, 'loss/train': 1.2301236391067505} -08/30/2021 20:21:10 - INFO - __main__ - Step 39733: {'lr': 0.00042400868394076185, 'samples': 7628736, 'steps': 39732, 'loss/train': 1.7061527967453003} -08/30/2021 20:21:10 - INFO - __main__ - Step 39734: {'lr': 0.0004240048736160781, 'samples': 7628928, 'steps': 39733, 'loss/train': 1.0829201936721802} -08/30/2021 20:21:11 - INFO - __main__ - Step 39735: {'lr': 0.0004240010632129905, 'samples': 7629120, 'steps': 39734, 'loss/train': 1.6662555932998657} -08/30/2021 20:21:12 - INFO - __main__ - Step 39736: {'lr': 0.00042399725273150056, 'samples': 7629312, 'steps': 39735, 'loss/train': 1.4515132904052734} -08/30/2021 20:21:13 - INFO - __main__ - Step 39737: {'lr': 0.0004239934421716103, 'samples': 7629504, 'steps': 39736, 'loss/train': 0.6121734976768494} -08/30/2021 20:21:13 - INFO - __main__ - Step 39738: {'lr': 0.00042398963153332124, 'samples': 7629696, 'steps': 39737, 'loss/train': 0.9485858678817749} -08/30/2021 20:21:13 - INFO - __main__ - Step 39739: {'lr': 0.00042398582081663513, 'samples': 7629888, 'steps': 39738, 'loss/train': 1.646243691444397} -08/30/2021 20:21:14 - INFO - __main__ - Step 39740: {'lr': 0.0004239820100215537, 'samples': 7630080, 'steps': 39739, 'loss/train': 1.9203139543533325} -08/30/2021 20:21:14 - INFO - __main__ - Step 39741: {'lr': 0.00042397819914807855, 'samples': 7630272, 'steps': 39740, 'loss/train': 0.053706929087638855} -08/30/2021 20:21:15 - INFO - __main__ - Step 39742: {'lr': 0.00042397438819621164, 'samples': 7630464, 'steps': 39741, 'loss/train': 1.4636296033859253} -08/30/2021 20:21:16 - INFO - __main__ - Step 39743: {'lr': 0.0004239705771659545, 'samples': 7630656, 'steps': 39742, 'loss/train': 1.2163830995559692} -08/30/2021 20:21:16 - INFO - __main__ - Step 39744: {'lr': 0.000423966766057309, 'samples': 7630848, 'steps': 39743, 'loss/train': 1.6223723888397217} -08/30/2021 20:21:16 - INFO - __main__ - Step 39745: {'lr': 0.00042396295487027666, 'samples': 7631040, 'steps': 39744, 'loss/train': 1.0613372325897217} -08/30/2021 20:21:17 - INFO - __main__ - Step 39746: {'lr': 0.0004239591436048593, 'samples': 7631232, 'steps': 39745, 'loss/train': 1.5498744249343872} -08/30/2021 20:21:19 - INFO - __main__ - Step 39747: {'lr': 0.0004239553322610586, 'samples': 7631424, 'steps': 39746, 'loss/train': 1.68617582321167} -08/30/2021 20:21:19 - INFO - __main__ - Step 39748: {'lr': 0.0004239515208388764, 'samples': 7631616, 'steps': 39747, 'loss/train': 1.2268978357315063} -08/30/2021 20:21:20 - INFO - __main__ - Step 39749: {'lr': 0.00042394770933831425, 'samples': 7631808, 'steps': 39748, 'loss/train': 1.8943700790405273} -08/30/2021 20:21:20 - INFO - __main__ - Step 39750: {'lr': 0.00042394389775937403, 'samples': 7632000, 'steps': 39749, 'loss/train': 1.6310123205184937} -08/30/2021 20:21:20 - INFO - __main__ - Step 39751: {'lr': 0.0004239400861020574, 'samples': 7632192, 'steps': 39750, 'loss/train': 2.052149534225464} -08/30/2021 20:21:21 - INFO - __main__ - Step 39752: {'lr': 0.00042393627436636597, 'samples': 7632384, 'steps': 39751, 'loss/train': 1.577345609664917} -08/30/2021 20:21:23 - INFO - __main__ - Step 39753: {'lr': 0.0004239324625523015, 'samples': 7632576, 'steps': 39752, 'loss/train': 1.107822299003601} -08/30/2021 20:21:24 - INFO - __main__ - Step 39754: {'lr': 0.00042392865065986573, 'samples': 7632768, 'steps': 39753, 'loss/train': 1.2555097341537476} -08/30/2021 20:21:24 - INFO - __main__ - Step 39755: {'lr': 0.00042392483868906053, 'samples': 7632960, 'steps': 39754, 'loss/train': 1.6713358163833618} -08/30/2021 20:21:24 - INFO - __main__ - Step 39756: {'lr': 0.0004239210266398874, 'samples': 7633152, 'steps': 39755, 'loss/train': 0.10498946160078049} -08/30/2021 20:21:25 - INFO - __main__ - Step 39757: {'lr': 0.0004239172145123481, 'samples': 7633344, 'steps': 39756, 'loss/train': 1.5836464166641235} -08/30/2021 20:21:25 - INFO - __main__ - Step 39758: {'lr': 0.0004239134023064445, 'samples': 7633536, 'steps': 39757, 'loss/train': 1.675431728363037} -08/30/2021 20:21:25 - INFO - __main__ - Step 39759: {'lr': 0.0004239095900221781, 'samples': 7633728, 'steps': 39758, 'loss/train': 0.0664868876338005} -08/30/2021 20:21:27 - INFO - __main__ - Step 39760: {'lr': 0.00042390577765955077, 'samples': 7633920, 'steps': 39759, 'loss/train': 1.6064023971557617} -08/30/2021 20:21:27 - INFO - __main__ - Step 39761: {'lr': 0.00042390196521856417, 'samples': 7634112, 'steps': 39760, 'loss/train': 1.6149566173553467} -08/30/2021 20:21:28 - INFO - __main__ - Step 39762: {'lr': 0.00042389815269922005, 'samples': 7634304, 'steps': 39761, 'loss/train': 1.4950525760650635} -08/30/2021 20:21:28 - INFO - __main__ - Step 39763: {'lr': 0.0004238943401015201, 'samples': 7634496, 'steps': 39762, 'loss/train': 1.5462342500686646} -08/30/2021 20:21:28 - INFO - __main__ - Step 39764: {'lr': 0.0004238905274254661, 'samples': 7634688, 'steps': 39763, 'loss/train': 1.8067632913589478} -08/30/2021 20:21:30 - INFO - __main__ - Step 39765: {'lr': 0.0004238867146710596, 'samples': 7634880, 'steps': 39764, 'loss/train': 2.1296796798706055} -08/30/2021 20:21:30 - INFO - __main__ - Step 39766: {'lr': 0.0004238829018383025, 'samples': 7635072, 'steps': 39765, 'loss/train': 1.5659006834030151} -08/30/2021 20:21:31 - INFO - __main__ - Step 39767: {'lr': 0.0004238790889271964, 'samples': 7635264, 'steps': 39766, 'loss/train': 1.9521446228027344} -08/30/2021 20:21:31 - INFO - __main__ - Step 39768: {'lr': 0.0004238752759377431, 'samples': 7635456, 'steps': 39767, 'loss/train': 1.5365787744522095} -08/30/2021 20:21:31 - INFO - __main__ - Step 39769: {'lr': 0.0004238714628699443, 'samples': 7635648, 'steps': 39768, 'loss/train': 1.3166062831878662} -08/30/2021 20:21:33 - INFO - __main__ - Step 39770: {'lr': 0.00042386764972380164, 'samples': 7635840, 'steps': 39769, 'loss/train': 1.8102490901947021} -08/30/2021 20:21:33 - INFO - __main__ - Step 39771: {'lr': 0.00042386383649931693, 'samples': 7636032, 'steps': 39770, 'loss/train': 1.4819411039352417} -08/30/2021 20:21:33 - INFO - __main__ - Step 39772: {'lr': 0.00042386002319649184, 'samples': 7636224, 'steps': 39771, 'loss/train': 1.9187854528427124} -08/30/2021 20:21:34 - INFO - __main__ - Step 39773: {'lr': 0.0004238562098153281, 'samples': 7636416, 'steps': 39772, 'loss/train': 1.5359846353530884} -08/30/2021 20:21:34 - INFO - __main__ - Step 39774: {'lr': 0.0004238523963558275, 'samples': 7636608, 'steps': 39773, 'loss/train': 1.1927670240402222} -08/30/2021 20:21:35 - INFO - __main__ - Step 39775: {'lr': 0.0004238485828179917, 'samples': 7636800, 'steps': 39774, 'loss/train': 1.3483922481536865} -08/30/2021 20:21:36 - INFO - __main__ - Step 39776: {'lr': 0.00042384476920182234, 'samples': 7636992, 'steps': 39775, 'loss/train': 1.1310625076293945} -08/30/2021 20:21:37 - INFO - __main__ - Step 39777: {'lr': 0.0004238409555073212, 'samples': 7637184, 'steps': 39776, 'loss/train': 1.4612566232681274} -08/30/2021 20:21:37 - INFO - __main__ - Step 39778: {'lr': 0.00042383714173449007, 'samples': 7637376, 'steps': 39777, 'loss/train': 1.555152416229248} -08/30/2021 20:21:37 - INFO - __main__ - Step 39779: {'lr': 0.00042383332788333055, 'samples': 7637568, 'steps': 39778, 'loss/train': 1.5594398975372314} -08/30/2021 20:21:38 - INFO - __main__ - Step 39780: {'lr': 0.0004238295139538445, 'samples': 7637760, 'steps': 39779, 'loss/train': 1.8967844247817993} -08/30/2021 20:21:39 - INFO - __main__ - Step 39781: {'lr': 0.0004238256999460335, 'samples': 7637952, 'steps': 39780, 'loss/train': 1.8482410907745361} -08/30/2021 20:21:40 - INFO - __main__ - Step 39782: {'lr': 0.00042382188585989933, 'samples': 7638144, 'steps': 39781, 'loss/train': 1.0997345447540283} -08/30/2021 20:21:40 - INFO - __main__ - Step 39783: {'lr': 0.0004238180716954436, 'samples': 7638336, 'steps': 39782, 'loss/train': 1.8072947263717651} -08/30/2021 20:21:40 - INFO - __main__ - Step 39784: {'lr': 0.0004238142574526683, 'samples': 7638528, 'steps': 39783, 'loss/train': 1.4344013929367065} -08/30/2021 20:21:41 - INFO - __main__ - Step 39785: {'lr': 0.0004238104431315749, 'samples': 7638720, 'steps': 39784, 'loss/train': 1.0944627523422241} -08/30/2021 20:21:42 - INFO - __main__ - Step 39786: {'lr': 0.00042380662873216517, 'samples': 7638912, 'steps': 39785, 'loss/train': 1.6362626552581787} -08/30/2021 20:21:43 - INFO - __main__ - Step 39787: {'lr': 0.00042380281425444087, 'samples': 7639104, 'steps': 39786, 'loss/train': 1.4634677171707153} -08/30/2021 20:21:43 - INFO - __main__ - Step 39788: {'lr': 0.0004237989996984037, 'samples': 7639296, 'steps': 39787, 'loss/train': 1.2802988290786743} -08/30/2021 20:21:43 - INFO - __main__ - Step 39789: {'lr': 0.0004237951850640555, 'samples': 7639488, 'steps': 39788, 'loss/train': 1.3769564628601074} -08/30/2021 20:21:44 - INFO - __main__ - Step 39790: {'lr': 0.0004237913703513977, 'samples': 7639680, 'steps': 39789, 'loss/train': 1.6763055324554443} -08/30/2021 20:21:45 - INFO - __main__ - Step 39791: {'lr': 0.00042378755556043225, 'samples': 7639872, 'steps': 39790, 'loss/train': 1.154290795326233} -08/30/2021 20:21:46 - INFO - __main__ - Step 39792: {'lr': 0.0004237837406911608, 'samples': 7640064, 'steps': 39791, 'loss/train': 1.4609167575836182} -08/30/2021 20:21:46 - INFO - __main__ - Step 39793: {'lr': 0.00042377992574358514, 'samples': 7640256, 'steps': 39792, 'loss/train': 1.802790880203247} -08/30/2021 20:21:47 - INFO - __main__ - Step 39794: {'lr': 0.0004237761107177068, 'samples': 7640448, 'steps': 39793, 'loss/train': 1.6666299104690552} -08/30/2021 20:21:47 - INFO - __main__ - Step 39795: {'lr': 0.00042377229561352774, 'samples': 7640640, 'steps': 39794, 'loss/train': 1.34855055809021} -08/30/2021 20:21:47 - INFO - __main__ - Step 39796: {'lr': 0.00042376848043104953, 'samples': 7640832, 'steps': 39795, 'loss/train': 1.399302363395691} -08/30/2021 20:21:49 - INFO - __main__ - Step 39797: {'lr': 0.00042376466517027387, 'samples': 7641024, 'steps': 39796, 'loss/train': 0.7730812430381775} -08/30/2021 20:21:49 - INFO - __main__ - Step 39798: {'lr': 0.00042376084983120266, 'samples': 7641216, 'steps': 39797, 'loss/train': 1.2225711345672607} -08/30/2021 20:21:50 - INFO - __main__ - Step 39799: {'lr': 0.0004237570344138374, 'samples': 7641408, 'steps': 39798, 'loss/train': 1.5387535095214844} -08/30/2021 20:21:50 - INFO - __main__ - Step 39800: {'lr': 0.00042375321891818, 'samples': 7641600, 'steps': 39799, 'loss/train': 1.4773350954055786} -08/30/2021 20:21:50 - INFO - __main__ - Step 39801: {'lr': 0.00042374940334423194, 'samples': 7641792, 'steps': 39800, 'loss/train': 0.9736891984939575} -08/30/2021 20:21:52 - INFO - __main__ - Step 39802: {'lr': 0.00042374558769199517, 'samples': 7641984, 'steps': 39801, 'loss/train': 0.5339415669441223} -08/30/2021 20:21:53 - INFO - __main__ - Step 39803: {'lr': 0.0004237417719614713, 'samples': 7642176, 'steps': 39802, 'loss/train': 1.0176312923431396} -08/30/2021 20:21:53 - INFO - __main__ - Step 39804: {'lr': 0.000423737956152662, 'samples': 7642368, 'steps': 39803, 'loss/train': 1.7241501808166504} -08/30/2021 20:21:53 - INFO - __main__ - Step 39805: {'lr': 0.0004237341402655692, 'samples': 7642560, 'steps': 39804, 'loss/train': 1.385020136833191} -08/30/2021 20:21:54 - INFO - __main__ - Step 39806: {'lr': 0.00042373032430019443, 'samples': 7642752, 'steps': 39805, 'loss/train': 1.0439468622207642} -08/30/2021 20:21:54 - INFO - __main__ - Step 39807: {'lr': 0.00042372650825653937, 'samples': 7642944, 'steps': 39806, 'loss/train': 1.5732402801513672} -08/30/2021 20:21:56 - INFO - __main__ - Step 39808: {'lr': 0.0004237226921346059, 'samples': 7643136, 'steps': 39807, 'loss/train': 2.7936289310455322} -08/30/2021 20:21:57 - INFO - __main__ - Step 39809: {'lr': 0.0004237188759343956, 'samples': 7643328, 'steps': 39808, 'loss/train': 1.8445457220077515} -08/30/2021 20:21:57 - INFO - __main__ - Step 39810: {'lr': 0.0004237150596559103, 'samples': 7643520, 'steps': 39809, 'loss/train': 0.8576852083206177} -08/30/2021 20:21:57 - INFO - __main__ - Step 39811: {'lr': 0.00042371124329915167, 'samples': 7643712, 'steps': 39810, 'loss/train': 1.330367088317871} -08/30/2021 20:21:58 - INFO - __main__ - Step 39812: {'lr': 0.0004237074268641215, 'samples': 7643904, 'steps': 39811, 'loss/train': 1.4323655366897583} -08/30/2021 20:21:59 - INFO - __main__ - Step 39813: {'lr': 0.00042370361035082136, 'samples': 7644096, 'steps': 39812, 'loss/train': 1.3146483898162842} -08/30/2021 20:22:00 - INFO - __main__ - Step 39814: {'lr': 0.000423699793759253, 'samples': 7644288, 'steps': 39813, 'loss/train': 1.748504877090454} -08/30/2021 20:22:00 - INFO - __main__ - Step 39815: {'lr': 0.0004236959770894183, 'samples': 7644480, 'steps': 39814, 'loss/train': 1.4523926973342896} -08/30/2021 20:22:00 - INFO - __main__ - Step 39816: {'lr': 0.00042369216034131887, 'samples': 7644672, 'steps': 39815, 'loss/train': 1.234877347946167} -08/30/2021 20:22:01 - INFO - __main__ - Step 39817: {'lr': 0.0004236883435149564, 'samples': 7644864, 'steps': 39816, 'loss/train': 1.5407646894454956} -08/30/2021 20:22:01 - INFO - __main__ - Step 39818: {'lr': 0.0004236845266103327, 'samples': 7645056, 'steps': 39817, 'loss/train': 1.4343197345733643} -08/30/2021 20:22:02 - INFO - __main__ - Step 39819: {'lr': 0.00042368070962744937, 'samples': 7645248, 'steps': 39818, 'loss/train': 0.7413326501846313} -08/30/2021 20:22:03 - INFO - __main__ - Step 39820: {'lr': 0.0004236768925663082, 'samples': 7645440, 'steps': 39819, 'loss/train': 1.5835468769073486} -08/30/2021 20:22:03 - INFO - __main__ - Step 39821: {'lr': 0.0004236730754269109, 'samples': 7645632, 'steps': 39820, 'loss/train': 1.2382744550704956} -08/30/2021 20:22:04 - INFO - __main__ - Step 39822: {'lr': 0.00042366925820925915, 'samples': 7645824, 'steps': 39821, 'loss/train': 1.099984049797058} -08/30/2021 20:22:04 - INFO - __main__ - Step 39823: {'lr': 0.0004236654409133548, 'samples': 7646016, 'steps': 39822, 'loss/train': 0.7239627838134766} -08/30/2021 20:22:06 - INFO - __main__ - Step 39824: {'lr': 0.0004236616235391995, 'samples': 7646208, 'steps': 39823, 'loss/train': 1.9253596067428589} -08/30/2021 20:22:06 - INFO - __main__ - Step 39825: {'lr': 0.0004236578060867949, 'samples': 7646400, 'steps': 39824, 'loss/train': 1.6039097309112549} -08/30/2021 20:22:07 - INFO - __main__ - Step 39826: {'lr': 0.0004236539885561427, 'samples': 7646592, 'steps': 39825, 'loss/train': 0.11956195533275604} -08/30/2021 20:22:07 - INFO - __main__ - Step 39827: {'lr': 0.0004236501709472448, 'samples': 7646784, 'steps': 39826, 'loss/train': 1.5506343841552734} -08/30/2021 20:22:07 - INFO - __main__ - Step 39828: {'lr': 0.00042364635326010277, 'samples': 7646976, 'steps': 39827, 'loss/train': 1.3428919315338135} -08/30/2021 20:22:08 - INFO - __main__ - Step 39829: {'lr': 0.0004236425354947183, 'samples': 7647168, 'steps': 39828, 'loss/train': 1.362579345703125} -08/30/2021 20:22:09 - INFO - __main__ - Step 39830: {'lr': 0.0004236387176510933, 'samples': 7647360, 'steps': 39829, 'loss/train': 2.4064180850982666} -08/30/2021 20:22:10 - INFO - __main__ - Step 39831: {'lr': 0.00042363489972922937, 'samples': 7647552, 'steps': 39830, 'loss/train': 1.4314252138137817} -08/30/2021 20:22:10 - INFO - __main__ - Step 39832: {'lr': 0.00042363108172912824, 'samples': 7647744, 'steps': 39831, 'loss/train': 1.1759506464004517} -08/30/2021 20:22:10 - INFO - __main__ - Step 39833: {'lr': 0.0004236272636507915, 'samples': 7647936, 'steps': 39832, 'loss/train': 1.8201500177383423} -08/30/2021 20:22:11 - INFO - __main__ - Step 39834: {'lr': 0.0004236234454942211, 'samples': 7648128, 'steps': 39833, 'loss/train': 1.2150834798812866} -08/30/2021 20:22:12 - INFO - __main__ - Step 39835: {'lr': 0.0004236196272594186, 'samples': 7648320, 'steps': 39834, 'loss/train': 3.5438666343688965} -08/30/2021 20:22:13 - INFO - __main__ - Step 39836: {'lr': 0.00042361580894638586, 'samples': 7648512, 'steps': 39835, 'loss/train': 1.3479591608047485} -08/30/2021 20:22:13 - INFO - __main__ - Step 39837: {'lr': 0.0004236119905551244, 'samples': 7648704, 'steps': 39836, 'loss/train': 1.3892861604690552} -08/30/2021 20:22:13 - INFO - __main__ - Step 39838: {'lr': 0.0004236081720856362, 'samples': 7648896, 'steps': 39837, 'loss/train': 1.6087465286254883} -08/30/2021 20:22:14 - INFO - __main__ - Step 39839: {'lr': 0.0004236043535379227, 'samples': 7649088, 'steps': 39838, 'loss/train': 1.2033506631851196} -08/30/2021 20:22:15 - INFO - __main__ - Step 39840: {'lr': 0.0004236005349119858, 'samples': 7649280, 'steps': 39839, 'loss/train': 1.4677839279174805} -08/30/2021 20:22:16 - INFO - __main__ - Step 39841: {'lr': 0.0004235967162078272, 'samples': 7649472, 'steps': 39840, 'loss/train': 1.2253412008285522} -08/30/2021 20:22:16 - INFO - __main__ - Step 39842: {'lr': 0.0004235928974254486, 'samples': 7649664, 'steps': 39841, 'loss/train': 1.2615032196044922} -08/30/2021 20:22:16 - INFO - __main__ - Step 39843: {'lr': 0.00042358907856485166, 'samples': 7649856, 'steps': 39842, 'loss/train': 1.5576845407485962} -08/30/2021 20:22:17 - INFO - __main__ - Step 39844: {'lr': 0.0004235852596260382, 'samples': 7650048, 'steps': 39843, 'loss/train': 1.876056432723999} -08/30/2021 20:22:17 - INFO - __main__ - Step 39845: {'lr': 0.0004235814406090099, 'samples': 7650240, 'steps': 39844, 'loss/train': 1.249107003211975} -08/30/2021 20:22:19 - INFO - __main__ - Step 39846: {'lr': 0.0004235776215137686, 'samples': 7650432, 'steps': 39845, 'loss/train': 1.5645771026611328} -08/30/2021 20:22:19 - INFO - __main__ - Step 39847: {'lr': 0.0004235738023403157, 'samples': 7650624, 'steps': 39846, 'loss/train': 1.2951265573501587} -08/30/2021 20:22:20 - INFO - __main__ - Step 39848: {'lr': 0.00042356998308865323, 'samples': 7650816, 'steps': 39847, 'loss/train': 1.1508517265319824} -08/30/2021 20:22:20 - INFO - __main__ - Step 39849: {'lr': 0.00042356616375878274, 'samples': 7651008, 'steps': 39848, 'loss/train': 1.85157310962677} -08/30/2021 20:22:20 - INFO - __main__ - Step 39850: {'lr': 0.00042356234435070604, 'samples': 7651200, 'steps': 39849, 'loss/train': 3.2641148567199707} -08/30/2021 20:22:22 - INFO - __main__ - Step 39851: {'lr': 0.0004235585248644249, 'samples': 7651392, 'steps': 39850, 'loss/train': 1.4653106927871704} -08/30/2021 20:22:22 - INFO - __main__ - Step 39852: {'lr': 0.0004235547052999409, 'samples': 7651584, 'steps': 39851, 'loss/train': 0.9225090146064758} -08/30/2021 20:22:23 - INFO - __main__ - Step 39853: {'lr': 0.00042355088565725584, 'samples': 7651776, 'steps': 39852, 'loss/train': 1.5941897630691528} -08/30/2021 20:22:23 - INFO - __main__ - Step 39854: {'lr': 0.0004235470659363714, 'samples': 7651968, 'steps': 39853, 'loss/train': 1.9329582452774048} -08/30/2021 20:22:23 - INFO - __main__ - Step 39855: {'lr': 0.0004235432461372894, 'samples': 7652160, 'steps': 39854, 'loss/train': 1.5335501432418823} -08/30/2021 20:22:26 - INFO - __main__ - Step 39856: {'lr': 0.0004235394262600114, 'samples': 7652352, 'steps': 39855, 'loss/train': 2.1897225379943848} -08/30/2021 20:22:26 - INFO - __main__ - Step 39857: {'lr': 0.0004235356063045393, 'samples': 7652544, 'steps': 39856, 'loss/train': 1.5117830038070679} -08/30/2021 20:22:27 - INFO - __main__ - Step 39858: {'lr': 0.0004235317862708747, 'samples': 7652736, 'steps': 39857, 'loss/train': 1.3249950408935547} -08/30/2021 20:22:27 - INFO - __main__ - Step 39859: {'lr': 0.00042352796615901937, 'samples': 7652928, 'steps': 39858, 'loss/train': 2.392627239227295} -08/30/2021 20:22:27 - INFO - __main__ - Step 39860: {'lr': 0.000423524145968975, 'samples': 7653120, 'steps': 39859, 'loss/train': 2.405303716659546} -08/30/2021 20:22:28 - INFO - __main__ - Step 39861: {'lr': 0.00042352032570074327, 'samples': 7653312, 'steps': 39860, 'loss/train': 3.2477967739105225} -08/30/2021 20:22:28 - INFO - __main__ - Step 39862: {'lr': 0.00042351650535432607, 'samples': 7653504, 'steps': 39861, 'loss/train': 0.34251442551612854} -08/30/2021 20:22:28 - INFO - __main__ - Step 39863: {'lr': 0.00042351268492972494, 'samples': 7653696, 'steps': 39862, 'loss/train': 0.23484422266483307} -08/30/2021 20:22:29 - INFO - __main__ - Step 39864: {'lr': 0.0004235088644269417, 'samples': 7653888, 'steps': 39863, 'loss/train': 1.8007278442382812} -08/30/2021 20:22:30 - INFO - __main__ - Step 39865: {'lr': 0.00042350504384597803, 'samples': 7654080, 'steps': 39864, 'loss/train': 6.510688304901123} -08/30/2021 20:22:30 - INFO - __main__ - Step 39866: {'lr': 0.0004235012231868357, 'samples': 7654272, 'steps': 39865, 'loss/train': 1.8088299036026} -08/30/2021 20:22:31 - INFO - __main__ - Step 39867: {'lr': 0.0004234974024495163, 'samples': 7654464, 'steps': 39866, 'loss/train': 2.0929627418518066} -08/30/2021 20:22:31 - INFO - __main__ - Step 39868: {'lr': 0.00042349358163402175, 'samples': 7654656, 'steps': 39867, 'loss/train': 1.964975118637085} -08/30/2021 20:22:32 - INFO - __main__ - Step 39869: {'lr': 0.0004234897607403536, 'samples': 7654848, 'steps': 39868, 'loss/train': 1.8140032291412354} -08/30/2021 20:22:33 - INFO - __main__ - Step 39870: {'lr': 0.0004234859397685137, 'samples': 7655040, 'steps': 39869, 'loss/train': 0.901826024055481} -08/30/2021 20:22:34 - INFO - __main__ - Step 39871: {'lr': 0.0004234821187185036, 'samples': 7655232, 'steps': 39870, 'loss/train': 1.8299572467803955} -08/30/2021 20:22:34 - INFO - __main__ - Step 39872: {'lr': 0.0004234782975903253, 'samples': 7655424, 'steps': 39871, 'loss/train': 1.7122297286987305} -08/30/2021 20:22:35 - INFO - __main__ - Step 39873: {'lr': 0.00042347447638398024, 'samples': 7655616, 'steps': 39872, 'loss/train': 1.5269038677215576} -08/30/2021 20:22:35 - INFO - __main__ - Step 39874: {'lr': 0.00042347065509947023, 'samples': 7655808, 'steps': 39873, 'loss/train': 1.7298256158828735} -08/30/2021 20:22:36 - INFO - __main__ - Step 39875: {'lr': 0.0004234668337367971, 'samples': 7656000, 'steps': 39874, 'loss/train': 2.083935260772705} -08/30/2021 20:22:37 - INFO - __main__ - Step 39876: {'lr': 0.0004234630122959625, 'samples': 7656192, 'steps': 39875, 'loss/train': 1.4115592241287231} -08/30/2021 20:22:37 - INFO - __main__ - Step 39877: {'lr': 0.0004234591907769681, 'samples': 7656384, 'steps': 39876, 'loss/train': 2.0594301223754883} -08/30/2021 20:22:38 - INFO - __main__ - Step 39878: {'lr': 0.0004234553691798156, 'samples': 7656576, 'steps': 39877, 'loss/train': 2.1799516677856445} -08/30/2021 20:22:38 - INFO - __main__ - Step 39879: {'lr': 0.000423451547504507, 'samples': 7656768, 'steps': 39878, 'loss/train': 1.482926845550537} -08/30/2021 20:22:39 - INFO - __main__ - Step 39880: {'lr': 0.0004234477257510436, 'samples': 7656960, 'steps': 39879, 'loss/train': 1.8995473384857178} -08/30/2021 20:22:40 - INFO - __main__ - Step 39881: {'lr': 0.00042344390391942745, 'samples': 7657152, 'steps': 39880, 'loss/train': 0.5500131249427795} -08/30/2021 20:22:40 - INFO - __main__ - Step 39882: {'lr': 0.0004234400820096601, 'samples': 7657344, 'steps': 39881, 'loss/train': 1.4850785732269287} -08/30/2021 20:22:41 - INFO - __main__ - Step 39883: {'lr': 0.0004234362600217433, 'samples': 7657536, 'steps': 39882, 'loss/train': 1.2737517356872559} -08/30/2021 20:22:41 - INFO - __main__ - Step 39884: {'lr': 0.0004234324379556789, 'samples': 7657728, 'steps': 39883, 'loss/train': 2.354860305786133} -08/30/2021 20:22:42 - INFO - __main__ - Step 39885: {'lr': 0.0004234286158114684, 'samples': 7657920, 'steps': 39884, 'loss/train': 1.7381205558776855} -08/30/2021 20:22:43 - INFO - __main__ - Step 39886: {'lr': 0.0004234247935891137, 'samples': 7658112, 'steps': 39885, 'loss/train': 1.4401222467422485} -08/30/2021 20:22:43 - INFO - __main__ - Step 39887: {'lr': 0.00042342097128861647, 'samples': 7658304, 'steps': 39886, 'loss/train': 1.9009616374969482} -08/30/2021 20:22:44 - INFO - __main__ - Step 39888: {'lr': 0.0004234171489099784, 'samples': 7658496, 'steps': 39887, 'loss/train': 1.29734206199646} -08/30/2021 20:22:44 - INFO - __main__ - Step 39889: {'lr': 0.00042341332645320126, 'samples': 7658688, 'steps': 39888, 'loss/train': 2.1100194454193115} -08/30/2021 20:22:46 - INFO - __main__ - Step 39890: {'lr': 0.0004234095039182867, 'samples': 7658880, 'steps': 39889, 'loss/train': 2.002281427383423} -08/30/2021 20:22:46 - INFO - __main__ - Step 39891: {'lr': 0.00042340568130523653, 'samples': 7659072, 'steps': 39890, 'loss/train': 1.6675454378128052} -08/30/2021 20:22:46 - INFO - __main__ - Step 39892: {'lr': 0.0004234018586140525, 'samples': 7659264, 'steps': 39891, 'loss/train': 1.6324392557144165} -08/30/2021 20:22:47 - INFO - __main__ - Step 39893: {'lr': 0.00042339803584473626, 'samples': 7659456, 'steps': 39892, 'loss/train': 1.6695985794067383} -08/30/2021 20:22:47 - INFO - __main__ - Step 39894: {'lr': 0.0004233942129972894, 'samples': 7659648, 'steps': 39893, 'loss/train': 0.17922604084014893} -08/30/2021 20:22:49 - INFO - __main__ - Step 39895: {'lr': 0.00042339039007171386, 'samples': 7659840, 'steps': 39894, 'loss/train': 1.1587668657302856} -08/30/2021 20:22:49 - INFO - __main__ - Step 39896: {'lr': 0.00042338656706801135, 'samples': 7660032, 'steps': 39895, 'loss/train': 1.8000980615615845} -08/30/2021 20:22:49 - INFO - __main__ - Step 39897: {'lr': 0.00042338274398618346, 'samples': 7660224, 'steps': 39896, 'loss/train': 1.6434587240219116} -08/30/2021 20:22:50 - INFO - __main__ - Step 39898: {'lr': 0.000423378920826232, 'samples': 7660416, 'steps': 39897, 'loss/train': 1.6689329147338867} -08/30/2021 20:22:50 - INFO - __main__ - Step 39899: {'lr': 0.0004233750975881587, 'samples': 7660608, 'steps': 39898, 'loss/train': 1.5078701972961426} -08/30/2021 20:22:50 - INFO - __main__ - Step 39900: {'lr': 0.0004233712742719652, 'samples': 7660800, 'steps': 39899, 'loss/train': 1.9081040620803833} -08/30/2021 20:22:52 - INFO - __main__ - Step 39901: {'lr': 0.0004233674508776533, 'samples': 7660992, 'steps': 39900, 'loss/train': 2.3875625133514404} -08/30/2021 20:22:52 - INFO - __main__ - Step 39902: {'lr': 0.00042336362740522473, 'samples': 7661184, 'steps': 39901, 'loss/train': 1.2209930419921875} -08/30/2021 20:22:53 - INFO - __main__ - Step 39903: {'lr': 0.0004233598038546812, 'samples': 7661376, 'steps': 39902, 'loss/train': 1.5918796062469482} -08/30/2021 20:22:53 - INFO - __main__ - Step 39904: {'lr': 0.0004233559802260244, 'samples': 7661568, 'steps': 39903, 'loss/train': 1.8165403604507446} -08/30/2021 20:22:53 - INFO - __main__ - Step 39905: {'lr': 0.000423352156519256, 'samples': 7661760, 'steps': 39904, 'loss/train': 1.0334722995758057} -08/30/2021 20:22:55 - INFO - __main__ - Step 39906: {'lr': 0.0004233483327343779, 'samples': 7661952, 'steps': 39905, 'loss/train': 1.5503871440887451} -08/30/2021 20:22:55 - INFO - __main__ - Step 39907: {'lr': 0.0004233445088713916, 'samples': 7662144, 'steps': 39906, 'loss/train': 1.7237764596939087} -08/30/2021 20:22:56 - INFO - __main__ - Step 39908: {'lr': 0.000423340684930299, 'samples': 7662336, 'steps': 39907, 'loss/train': 1.325069785118103} -08/30/2021 20:22:56 - INFO - __main__ - Step 39909: {'lr': 0.0004233368609111018, 'samples': 7662528, 'steps': 39908, 'loss/train': 1.6507238149642944} -08/30/2021 20:22:56 - INFO - __main__ - Step 39910: {'lr': 0.00042333303681380165, 'samples': 7662720, 'steps': 39909, 'loss/train': 1.624729871749878} -08/30/2021 20:22:58 - INFO - __main__ - Step 39911: {'lr': 0.0004233292126384003, 'samples': 7662912, 'steps': 39910, 'loss/train': 1.3100122213363647} -08/30/2021 20:22:58 - INFO - __main__ - Step 39912: {'lr': 0.00042332538838489955, 'samples': 7663104, 'steps': 39911, 'loss/train': 0.9684287905693054} -08/30/2021 20:22:58 - INFO - __main__ - Step 39913: {'lr': 0.0004233215640533009, 'samples': 7663296, 'steps': 39912, 'loss/train': 2.1299078464508057} -08/30/2021 20:22:59 - INFO - __main__ - Step 39914: {'lr': 0.0004233177396436064, 'samples': 7663488, 'steps': 39913, 'loss/train': 1.3713035583496094} -08/30/2021 20:22:59 - INFO - __main__ - Step 39915: {'lr': 0.00042331391515581753, 'samples': 7663680, 'steps': 39914, 'loss/train': 1.481816053390503} -08/30/2021 20:23:01 - INFO - __main__ - Step 39916: {'lr': 0.00042331009058993604, 'samples': 7663872, 'steps': 39915, 'loss/train': 0.8788862228393555} -08/30/2021 20:23:01 - INFO - __main__ - Step 39917: {'lr': 0.00042330626594596374, 'samples': 7664064, 'steps': 39916, 'loss/train': 1.7196238040924072} -08/30/2021 20:23:01 - INFO - __main__ - Step 39918: {'lr': 0.00042330244122390227, 'samples': 7664256, 'steps': 39917, 'loss/train': 1.3474643230438232} -08/30/2021 20:23:02 - INFO - __main__ - Step 39919: {'lr': 0.00042329861642375347, 'samples': 7664448, 'steps': 39918, 'loss/train': 1.5671926736831665} -08/30/2021 20:23:02 - INFO - __main__ - Step 39920: {'lr': 0.00042329479154551897, 'samples': 7664640, 'steps': 39919, 'loss/train': 1.7457983493804932} -08/30/2021 20:23:05 - INFO - __main__ - Step 39921: {'lr': 0.0004232909665892005, 'samples': 7664832, 'steps': 39920, 'loss/train': 1.34580659866333} -08/30/2021 20:23:05 - INFO - __main__ - Step 39922: {'lr': 0.00042328714155479973, 'samples': 7665024, 'steps': 39921, 'loss/train': 1.4555563926696777} -08/30/2021 20:23:05 - INFO - __main__ - Step 39923: {'lr': 0.0004232833164423185, 'samples': 7665216, 'steps': 39922, 'loss/train': 1.605604887008667} -08/30/2021 20:23:06 - INFO - __main__ - Step 39924: {'lr': 0.00042327949125175844, 'samples': 7665408, 'steps': 39923, 'loss/train': 1.1793478727340698} -08/30/2021 20:23:06 - INFO - __main__ - Step 39925: {'lr': 0.0004232756659831214, 'samples': 7665600, 'steps': 39924, 'loss/train': 1.2907603979110718} -08/30/2021 20:23:06 - INFO - __main__ - Step 39926: {'lr': 0.000423271840636409, 'samples': 7665792, 'steps': 39925, 'loss/train': 1.2843084335327148} -08/30/2021 20:23:08 - INFO - __main__ - Step 39927: {'lr': 0.00042326801521162295, 'samples': 7665984, 'steps': 39926, 'loss/train': 1.4443492889404297} -08/30/2021 20:23:08 - INFO - __main__ - Step 39928: {'lr': 0.000423264189708765, 'samples': 7666176, 'steps': 39927, 'loss/train': 1.5435090065002441} -08/30/2021 20:23:09 - INFO - __main__ - Step 39929: {'lr': 0.0004232603641278369, 'samples': 7666368, 'steps': 39928, 'loss/train': 1.5917209386825562} -08/30/2021 20:23:09 - INFO - __main__ - Step 39930: {'lr': 0.00042325653846884037, 'samples': 7666560, 'steps': 39929, 'loss/train': 1.4119353294372559} -08/30/2021 20:23:09 - INFO - __main__ - Step 39931: {'lr': 0.00042325271273177707, 'samples': 7666752, 'steps': 39930, 'loss/train': 0.9169667959213257} -08/30/2021 20:23:11 - INFO - __main__ - Step 39932: {'lr': 0.0004232488869166488, 'samples': 7666944, 'steps': 39931, 'loss/train': 1.5057662725448608} -08/30/2021 20:23:11 - INFO - __main__ - Step 39933: {'lr': 0.0004232450610234573, 'samples': 7667136, 'steps': 39932, 'loss/train': 1.2545952796936035} -08/30/2021 20:23:12 - INFO - __main__ - Step 39934: {'lr': 0.00042324123505220414, 'samples': 7667328, 'steps': 39933, 'loss/train': 1.3745766878128052} -08/30/2021 20:23:12 - INFO - __main__ - Step 39935: {'lr': 0.0004232374090028912, 'samples': 7667520, 'steps': 39934, 'loss/train': 1.1821707487106323} -08/30/2021 20:23:12 - INFO - __main__ - Step 39936: {'lr': 0.00042323358287552017, 'samples': 7667712, 'steps': 39935, 'loss/train': 2.2497944831848145} -08/30/2021 20:23:14 - INFO - __main__ - Step 39937: {'lr': 0.0004232297566700928, 'samples': 7667904, 'steps': 39936, 'loss/train': 1.1231679916381836} -08/30/2021 20:23:15 - INFO - __main__ - Step 39938: {'lr': 0.00042322593038661074, 'samples': 7668096, 'steps': 39937, 'loss/train': 1.443115472793579} -08/30/2021 20:23:15 - INFO - __main__ - Step 39939: {'lr': 0.0004232221040250758, 'samples': 7668288, 'steps': 39938, 'loss/train': 1.262053370475769} -08/30/2021 20:23:15 - INFO - __main__ - Step 39940: {'lr': 0.00042321827758548953, 'samples': 7668480, 'steps': 39939, 'loss/train': 1.3323216438293457} -08/30/2021 20:23:16 - INFO - __main__ - Step 39941: {'lr': 0.00042321445106785385, 'samples': 7668672, 'steps': 39940, 'loss/train': 1.4669933319091797} -08/30/2021 20:23:17 - INFO - __main__ - Step 39942: {'lr': 0.0004232106244721704, 'samples': 7668864, 'steps': 39941, 'loss/train': 1.7182587385177612} -08/30/2021 20:23:17 - INFO - __main__ - Step 39943: {'lr': 0.0004232067977984409, 'samples': 7669056, 'steps': 39942, 'loss/train': 1.418216586112976} -08/30/2021 20:23:18 - INFO - __main__ - Step 39944: {'lr': 0.0004232029710466671, 'samples': 7669248, 'steps': 39943, 'loss/train': 1.1714415550231934} -08/30/2021 20:23:18 - INFO - __main__ - Step 39945: {'lr': 0.00042319914421685067, 'samples': 7669440, 'steps': 39944, 'loss/train': 2.1570920944213867} -08/30/2021 20:23:19 - INFO - __main__ - Step 39946: {'lr': 0.0004231953173089935, 'samples': 7669632, 'steps': 39945, 'loss/train': 1.5293985605239868} -08/30/2021 20:23:20 - INFO - __main__ - Step 39947: {'lr': 0.00042319149032309713, 'samples': 7669824, 'steps': 39946, 'loss/train': 1.2032697200775146} -08/30/2021 20:23:20 - INFO - __main__ - Step 39948: {'lr': 0.00042318766325916336, 'samples': 7670016, 'steps': 39947, 'loss/train': 1.647952914237976} -08/30/2021 20:23:21 - INFO - __main__ - Step 39949: {'lr': 0.00042318383611719386, 'samples': 7670208, 'steps': 39948, 'loss/train': 1.2331401109695435} -08/30/2021 20:23:21 - INFO - __main__ - Step 39950: {'lr': 0.00042318000889719044, 'samples': 7670400, 'steps': 39949, 'loss/train': 0.0455939918756485} -08/30/2021 20:23:22 - INFO - __main__ - Step 39951: {'lr': 0.0004231761815991547, 'samples': 7670592, 'steps': 39950, 'loss/train': 1.5954842567443848} -08/30/2021 20:23:22 - INFO - __main__ - Step 39952: {'lr': 0.0004231723542230885, 'samples': 7670784, 'steps': 39951, 'loss/train': 1.6678485870361328} -08/30/2021 20:23:23 - INFO - __main__ - Step 39953: {'lr': 0.0004231685267689935, 'samples': 7670976, 'steps': 39952, 'loss/train': 1.9941524267196655} -08/30/2021 20:23:24 - INFO - __main__ - Step 39954: {'lr': 0.0004231646992368715, 'samples': 7671168, 'steps': 39953, 'loss/train': 1.7930129766464233} -08/30/2021 20:23:24 - INFO - __main__ - Step 39955: {'lr': 0.00042316087162672415, 'samples': 7671360, 'steps': 39954, 'loss/train': 1.3292405605316162} -08/30/2021 20:23:24 - INFO - __main__ - Step 39956: {'lr': 0.0004231570439385531, 'samples': 7671552, 'steps': 39955, 'loss/train': 1.0995622873306274} -08/30/2021 20:23:25 - INFO - __main__ - Step 39957: {'lr': 0.0004231532161723602, 'samples': 7671744, 'steps': 39956, 'loss/train': 1.0264662504196167} -08/30/2021 20:23:26 - INFO - __main__ - Step 39958: {'lr': 0.0004231493883281471, 'samples': 7671936, 'steps': 39957, 'loss/train': 2.15161395072937} -08/30/2021 20:23:27 - INFO - __main__ - Step 39959: {'lr': 0.00042314556040591567, 'samples': 7672128, 'steps': 39958, 'loss/train': 2.17378568649292} -08/30/2021 20:23:27 - INFO - __main__ - Step 39960: {'lr': 0.0004231417324056674, 'samples': 7672320, 'steps': 39959, 'loss/train': 1.5137709379196167} -08/30/2021 20:23:27 - INFO - __main__ - Step 39961: {'lr': 0.00042313790432740416, 'samples': 7672512, 'steps': 39960, 'loss/train': 1.715969204902649} -08/30/2021 20:23:28 - INFO - __main__ - Step 39962: {'lr': 0.00042313407617112765, 'samples': 7672704, 'steps': 39961, 'loss/train': 1.2451519966125488} -08/30/2021 20:23:29 - INFO - __main__ - Step 39963: {'lr': 0.00042313024793683965, 'samples': 7672896, 'steps': 39962, 'loss/train': 1.930191159248352} -08/30/2021 20:23:30 - INFO - __main__ - Step 39964: {'lr': 0.0004231264196245418, 'samples': 7673088, 'steps': 39963, 'loss/train': 1.4040091037750244} -08/30/2021 20:23:30 - INFO - __main__ - Step 39965: {'lr': 0.00042312259123423584, 'samples': 7673280, 'steps': 39964, 'loss/train': 1.5934674739837646} -08/30/2021 20:23:30 - INFO - __main__ - Step 39966: {'lr': 0.00042311876276592355, 'samples': 7673472, 'steps': 39965, 'loss/train': 1.616688847541809} -08/30/2021 20:23:31 - INFO - __main__ - Step 39967: {'lr': 0.00042311493421960656, 'samples': 7673664, 'steps': 39966, 'loss/train': 0.9064227938652039} -08/30/2021 20:23:32 - INFO - __main__ - Step 39968: {'lr': 0.0004231111055952867, 'samples': 7673856, 'steps': 39967, 'loss/train': 1.3322641849517822} -08/30/2021 20:23:33 - INFO - __main__ - Step 39969: {'lr': 0.00042310727689296563, 'samples': 7674048, 'steps': 39968, 'loss/train': 1.5939640998840332} -08/30/2021 20:23:33 - INFO - __main__ - Step 39970: {'lr': 0.0004231034481126451, 'samples': 7674240, 'steps': 39969, 'loss/train': 1.2966455221176147} -08/30/2021 20:23:33 - INFO - __main__ - Step 39971: {'lr': 0.0004230996192543268, 'samples': 7674432, 'steps': 39970, 'loss/train': 0.8900102376937866} -08/30/2021 20:23:34 - INFO - __main__ - Step 39972: {'lr': 0.0004230957903180125, 'samples': 7674624, 'steps': 39971, 'loss/train': 1.0530837774276733} -08/30/2021 20:23:36 - INFO - __main__ - Step 39973: {'lr': 0.00042309196130370396, 'samples': 7674816, 'steps': 39972, 'loss/train': 2.0230767726898193} -08/30/2021 20:23:37 - INFO - __main__ - Step 39974: {'lr': 0.00042308813221140275, 'samples': 7675008, 'steps': 39973, 'loss/train': 1.1553943157196045} -08/30/2021 20:23:37 - INFO - __main__ - Step 39975: {'lr': 0.00042308430304111076, 'samples': 7675200, 'steps': 39974, 'loss/train': 0.8316280245780945} -08/30/2021 20:23:37 - INFO - __main__ - Step 39976: {'lr': 0.00042308047379282967, 'samples': 7675392, 'steps': 39975, 'loss/train': 1.8400486707687378} -08/30/2021 20:23:38 - INFO - __main__ - Step 39977: {'lr': 0.00042307664446656116, 'samples': 7675584, 'steps': 39976, 'loss/train': 1.4745255708694458} -08/30/2021 20:23:38 - INFO - __main__ - Step 39978: {'lr': 0.000423072815062307, 'samples': 7675776, 'steps': 39977, 'loss/train': 1.0939977169036865} -08/30/2021 20:23:39 - INFO - __main__ - Step 39979: {'lr': 0.0004230689855800689, 'samples': 7675968, 'steps': 39978, 'loss/train': 1.5234830379486084} -08/30/2021 20:23:40 - INFO - __main__ - Step 39980: {'lr': 0.0004230651560198486, 'samples': 7676160, 'steps': 39979, 'loss/train': 1.273972988128662} -08/30/2021 20:23:40 - INFO - __main__ - Step 39981: {'lr': 0.0004230613263816478, 'samples': 7676352, 'steps': 39980, 'loss/train': 1.3743761777877808} -08/30/2021 20:23:40 - INFO - __main__ - Step 39982: {'lr': 0.0004230574966654682, 'samples': 7676544, 'steps': 39981, 'loss/train': 1.2279105186462402} -08/30/2021 20:23:41 - INFO - __main__ - Step 39983: {'lr': 0.0004230536668713116, 'samples': 7676736, 'steps': 39982, 'loss/train': 1.8766906261444092} -08/30/2021 20:23:42 - INFO - __main__ - Step 39984: {'lr': 0.00042304983699917965, 'samples': 7676928, 'steps': 39983, 'loss/train': 1.9027396440505981} -08/30/2021 20:23:43 - INFO - __main__ - Step 39985: {'lr': 0.00042304600704907416, 'samples': 7677120, 'steps': 39984, 'loss/train': 1.3698922395706177} -08/30/2021 20:23:43 - INFO - __main__ - Step 39986: {'lr': 0.0004230421770209968, 'samples': 7677312, 'steps': 39985, 'loss/train': 0.8721058964729309} -08/30/2021 20:23:43 - INFO - __main__ - Step 39987: {'lr': 0.0004230383469149493, 'samples': 7677504, 'steps': 39986, 'loss/train': 1.796926498413086} -08/30/2021 20:23:44 - INFO - __main__ - Step 39988: {'lr': 0.0004230345167309334, 'samples': 7677696, 'steps': 39987, 'loss/train': 2.138378381729126} -08/30/2021 20:23:45 - INFO - __main__ - Step 39989: {'lr': 0.00042303068646895077, 'samples': 7677888, 'steps': 39988, 'loss/train': 1.626409649848938} -08/30/2021 20:23:46 - INFO - __main__ - Step 39990: {'lr': 0.0004230268561290032, 'samples': 7678080, 'steps': 39989, 'loss/train': 1.6420769691467285} -08/30/2021 20:23:46 - INFO - __main__ - Step 39991: {'lr': 0.0004230230257110924, 'samples': 7678272, 'steps': 39990, 'loss/train': 1.2929669618606567} -08/30/2021 20:23:46 - INFO - __main__ - Step 39992: {'lr': 0.00042301919521522014, 'samples': 7678464, 'steps': 39991, 'loss/train': 1.5793284177780151} -08/30/2021 20:23:47 - INFO - __main__ - Step 39993: {'lr': 0.0004230153646413881, 'samples': 7678656, 'steps': 39992, 'loss/train': 1.4071989059448242} -08/30/2021 20:23:48 - INFO - __main__ - Step 39994: {'lr': 0.000423011533989598, 'samples': 7678848, 'steps': 39993, 'loss/train': 1.5328775644302368} -08/30/2021 20:23:49 - INFO - __main__ - Step 39995: {'lr': 0.0004230077032598515, 'samples': 7679040, 'steps': 39994, 'loss/train': 1.4727871417999268} -08/30/2021 20:23:49 - INFO - __main__ - Step 39996: {'lr': 0.00042300387245215043, 'samples': 7679232, 'steps': 39995, 'loss/train': 1.583439826965332} -08/30/2021 20:23:49 - INFO - __main__ - Step 39997: {'lr': 0.00042300004156649654, 'samples': 7679424, 'steps': 39996, 'loss/train': 1.5471478700637817} -08/30/2021 20:23:50 - INFO - __main__ - Step 39998: {'lr': 0.0004229962106028914, 'samples': 7679616, 'steps': 39997, 'loss/train': 1.212770700454712} -08/30/2021 20:23:52 - INFO - __main__ - Step 39999: {'lr': 0.0004229923795613369, 'samples': 7679808, 'steps': 39998, 'loss/train': 1.3915947675704956} -08/30/2021 20:23:52 - INFO - __main__ - Step 40000: {'lr': 0.00042298854844183476, 'samples': 7680000, 'steps': 39999, 'loss/train': 1.4365646839141846} -08/30/2021 20:23:52 - INFO - __main__ - Step 40001: {'lr': 0.0004229847172443866, 'samples': 7680192, 'steps': 40000, 'loss/train': 1.7908278703689575} -08/30/2021 20:23:53 - INFO - __main__ - Step 40002: {'lr': 0.0004229808859689941, 'samples': 7680384, 'steps': 40001, 'loss/train': 1.0729361772537231} -08/30/2021 20:23:53 - INFO - __main__ - Step 40003: {'lr': 0.0004229770546156592, 'samples': 7680576, 'steps': 40002, 'loss/train': 0.7916885614395142} -08/30/2021 20:23:53 - INFO - __main__ - Step 40004: {'lr': 0.00042297322318438345, 'samples': 7680768, 'steps': 40003, 'loss/train': 1.9215587377548218} -08/30/2021 20:23:55 - INFO - __main__ - Step 40005: {'lr': 0.0004229693916751687, 'samples': 7680960, 'steps': 40004, 'loss/train': 1.7415010929107666} -08/30/2021 20:23:56 - INFO - __main__ - Step 40006: {'lr': 0.00042296556008801663, 'samples': 7681152, 'steps': 40005, 'loss/train': 1.1243678331375122} -08/30/2021 20:23:56 - INFO - __main__ - Step 40007: {'lr': 0.0004229617284229289, 'samples': 7681344, 'steps': 40006, 'loss/train': 1.5198845863342285} -08/30/2021 20:23:56 - INFO - __main__ - Step 40008: {'lr': 0.00042295789667990726, 'samples': 7681536, 'steps': 40007, 'loss/train': 0.33052346110343933} -08/30/2021 20:23:57 - INFO - __main__ - Step 40009: {'lr': 0.00042295406485895346, 'samples': 7681728, 'steps': 40008, 'loss/train': 1.6835016012191772} -08/30/2021 20:23:58 - INFO - __main__ - Step 40010: {'lr': 0.0004229502329600692, 'samples': 7681920, 'steps': 40009, 'loss/train': 1.5930639505386353} -08/30/2021 20:23:59 - INFO - __main__ - Step 40011: {'lr': 0.0004229464009832563, 'samples': 7682112, 'steps': 40010, 'loss/train': 0.7433944344520569} -08/30/2021 20:23:59 - INFO - __main__ - Step 40012: {'lr': 0.0004229425689285163, 'samples': 7682304, 'steps': 40011, 'loss/train': 1.4278309345245361} -08/30/2021 20:23:59 - INFO - __main__ - Step 40013: {'lr': 0.00042293873679585125, 'samples': 7682496, 'steps': 40012, 'loss/train': 1.2927014827728271} -08/30/2021 20:24:00 - INFO - __main__ - Step 40014: {'lr': 0.00042293490458526257, 'samples': 7682688, 'steps': 40013, 'loss/train': 1.5832417011260986} -08/30/2021 20:24:02 - INFO - __main__ - Step 40015: {'lr': 0.0004229310722967521, 'samples': 7682880, 'steps': 40014, 'loss/train': 1.4748404026031494} -08/30/2021 20:24:02 - INFO - __main__ - Step 40016: {'lr': 0.00042292723993032157, 'samples': 7683072, 'steps': 40015, 'loss/train': 1.4790807962417603} -08/30/2021 20:24:03 - INFO - __main__ - Step 40017: {'lr': 0.0004229234074859726, 'samples': 7683264, 'steps': 40016, 'loss/train': 1.6112967729568481} -08/30/2021 20:24:03 - INFO - __main__ - Step 40018: {'lr': 0.00042291957496370713, 'samples': 7683456, 'steps': 40017, 'loss/train': 0.19286830723285675} -08/30/2021 20:24:03 - INFO - __main__ - Step 40019: {'lr': 0.0004229157423635267, 'samples': 7683648, 'steps': 40018, 'loss/train': 1.9733043909072876} -08/30/2021 20:24:05 - INFO - __main__ - Step 40020: {'lr': 0.00042291190968543315, 'samples': 7683840, 'steps': 40019, 'loss/train': 1.6683762073516846} -08/30/2021 20:24:06 - INFO - __main__ - Step 40021: {'lr': 0.0004229080769294281, 'samples': 7684032, 'steps': 40020, 'loss/train': 1.3969764709472656} -08/30/2021 20:24:06 - INFO - __main__ - Step 40022: {'lr': 0.00042290424409551343, 'samples': 7684224, 'steps': 40021, 'loss/train': 0.3898797333240509} -08/30/2021 20:24:06 - INFO - __main__ - Step 40023: {'lr': 0.0004229004111836907, 'samples': 7684416, 'steps': 40022, 'loss/train': 0.12853480875492096} -08/30/2021 20:24:07 - INFO - __main__ - Step 40024: {'lr': 0.0004228965781939617, 'samples': 7684608, 'steps': 40023, 'loss/train': 1.3174782991409302} -08/30/2021 20:24:07 - INFO - __main__ - Step 40025: {'lr': 0.00042289274512632817, 'samples': 7684800, 'steps': 40024, 'loss/train': 1.428648829460144} -08/30/2021 20:24:09 - INFO - __main__ - Step 40026: {'lr': 0.00042288891198079194, 'samples': 7684992, 'steps': 40025, 'loss/train': 1.0943942070007324} -08/30/2021 20:24:10 - INFO - __main__ - Step 40027: {'lr': 0.00042288507875735455, 'samples': 7685184, 'steps': 40026, 'loss/train': 0.9271484613418579} -08/30/2021 20:24:10 - INFO - __main__ - Step 40028: {'lr': 0.0004228812454560178, 'samples': 7685376, 'steps': 40027, 'loss/train': 1.2065141201019287} -08/30/2021 20:24:10 - INFO - __main__ - Step 40029: {'lr': 0.0004228774120767835, 'samples': 7685568, 'steps': 40028, 'loss/train': 1.2031065225601196} -08/30/2021 20:24:11 - INFO - __main__ - Step 40030: {'lr': 0.00042287357861965326, 'samples': 7685760, 'steps': 40029, 'loss/train': 0.0939389318227768} -08/30/2021 20:24:12 - INFO - __main__ - Step 40031: {'lr': 0.00042286974508462885, 'samples': 7685952, 'steps': 40030, 'loss/train': 0.4339176416397095} -08/30/2021 20:24:13 - INFO - __main__ - Step 40032: {'lr': 0.000422865911471712, 'samples': 7686144, 'steps': 40031, 'loss/train': 1.5876401662826538} -08/30/2021 20:24:13 - INFO - __main__ - Step 40033: {'lr': 0.00042286207778090447, 'samples': 7686336, 'steps': 40032, 'loss/train': 1.6221156120300293} -08/30/2021 20:24:13 - INFO - __main__ - Step 40034: {'lr': 0.00042285824401220787, 'samples': 7686528, 'steps': 40033, 'loss/train': 1.4964542388916016} -08/30/2021 20:24:14 - INFO - __main__ - Step 40035: {'lr': 0.0004228544101656241, 'samples': 7686720, 'steps': 40034, 'loss/train': 1.556596279144287} -08/30/2021 20:24:15 - INFO - __main__ - Step 40036: {'lr': 0.00042285057624115473, 'samples': 7686912, 'steps': 40035, 'loss/train': 1.0824153423309326} -08/30/2021 20:24:16 - INFO - __main__ - Step 40037: {'lr': 0.0004228467422388016, 'samples': 7687104, 'steps': 40036, 'loss/train': 1.5320526361465454} -08/30/2021 20:24:16 - INFO - __main__ - Step 40038: {'lr': 0.0004228429081585664, 'samples': 7687296, 'steps': 40037, 'loss/train': 1.1062607765197754} -08/30/2021 20:24:16 - INFO - __main__ - Step 40039: {'lr': 0.00042283907400045084, 'samples': 7687488, 'steps': 40038, 'loss/train': 0.6215230226516724} -08/30/2021 20:24:17 - INFO - __main__ - Step 40040: {'lr': 0.0004228352397644567, 'samples': 7687680, 'steps': 40039, 'loss/train': 1.4788440465927124} -08/30/2021 20:24:17 - INFO - __main__ - Step 40041: {'lr': 0.0004228314054505856, 'samples': 7687872, 'steps': 40040, 'loss/train': 1.5475090742111206} -08/30/2021 20:24:19 - INFO - __main__ - Step 40042: {'lr': 0.0004228275710588394, 'samples': 7688064, 'steps': 40041, 'loss/train': 1.282443881034851} -08/30/2021 20:24:19 - INFO - __main__ - Step 40043: {'lr': 0.0004228237365892197, 'samples': 7688256, 'steps': 40042, 'loss/train': 1.4643335342407227} -08/30/2021 20:24:19 - INFO - __main__ - Step 40044: {'lr': 0.00042281990204172837, 'samples': 7688448, 'steps': 40043, 'loss/train': 0.9389199018478394} -08/30/2021 20:24:20 - INFO - __main__ - Step 40045: {'lr': 0.000422816067416367, 'samples': 7688640, 'steps': 40044, 'loss/train': 1.473731279373169} -08/30/2021 20:24:20 - INFO - __main__ - Step 40046: {'lr': 0.00042281223271313734, 'samples': 7688832, 'steps': 40045, 'loss/train': 0.9742891192436218} -08/30/2021 20:24:22 - INFO - __main__ - Step 40047: {'lr': 0.0004228083979320412, 'samples': 7689024, 'steps': 40046, 'loss/train': 1.7017384767532349} -08/30/2021 20:24:22 - INFO - __main__ - Step 40048: {'lr': 0.00042280456307308034, 'samples': 7689216, 'steps': 40047, 'loss/train': 1.0361615419387817} -08/30/2021 20:24:22 - INFO - __main__ - Step 40049: {'lr': 0.0004228007281362563, 'samples': 7689408, 'steps': 40048, 'loss/train': 1.1506147384643555} -08/30/2021 20:24:23 - INFO - __main__ - Step 40050: {'lr': 0.0004227968931215709, 'samples': 7689600, 'steps': 40049, 'loss/train': 1.2911769151687622} -08/30/2021 20:24:23 - INFO - __main__ - Step 40051: {'lr': 0.000422793058029026, 'samples': 7689792, 'steps': 40050, 'loss/train': 1.5743813514709473} -08/30/2021 20:24:25 - INFO - __main__ - Step 40052: {'lr': 0.0004227892228586231, 'samples': 7689984, 'steps': 40051, 'loss/train': 1.305594563484192} -08/30/2021 20:24:25 - INFO - __main__ - Step 40053: {'lr': 0.0004227853876103641, 'samples': 7690176, 'steps': 40052, 'loss/train': 1.4357455968856812} -08/30/2021 20:24:26 - INFO - __main__ - Step 40054: {'lr': 0.0004227815522842507, 'samples': 7690368, 'steps': 40053, 'loss/train': 1.4548953771591187} -08/30/2021 20:24:26 - INFO - __main__ - Step 40055: {'lr': 0.00042277771688028457, 'samples': 7690560, 'steps': 40054, 'loss/train': 1.394719123840332} -08/30/2021 20:24:26 - INFO - __main__ - Step 40056: {'lr': 0.0004227738813984675, 'samples': 7690752, 'steps': 40055, 'loss/train': 1.5078915357589722} -08/30/2021 20:24:28 - INFO - __main__ - Step 40057: {'lr': 0.00042277004583880106, 'samples': 7690944, 'steps': 40056, 'loss/train': 1.3259233236312866} -08/30/2021 20:24:28 - INFO - __main__ - Step 40058: {'lr': 0.00042276621020128724, 'samples': 7691136, 'steps': 40057, 'loss/train': 1.6630440950393677} -08/30/2021 20:24:29 - INFO - __main__ - Step 40059: {'lr': 0.0004227623744859276, 'samples': 7691328, 'steps': 40058, 'loss/train': 1.198193073272705} -08/30/2021 20:24:29 - INFO - __main__ - Step 40060: {'lr': 0.0004227585386927239, 'samples': 7691520, 'steps': 40059, 'loss/train': 1.3635294437408447} -08/30/2021 20:24:29 - INFO - __main__ - Step 40061: {'lr': 0.0004227547028216778, 'samples': 7691712, 'steps': 40060, 'loss/train': 1.105837106704712} -08/30/2021 20:24:30 - INFO - __main__ - Step 40062: {'lr': 0.00042275086687279116, 'samples': 7691904, 'steps': 40061, 'loss/train': 1.3114802837371826} -08/30/2021 20:24:31 - INFO - __main__ - Step 40063: {'lr': 0.0004227470308460657, 'samples': 7692096, 'steps': 40062, 'loss/train': 1.6279492378234863} -08/30/2021 20:24:32 - INFO - __main__ - Step 40064: {'lr': 0.000422743194741503, 'samples': 7692288, 'steps': 40063, 'loss/train': 1.8441680669784546} -08/30/2021 20:24:32 - INFO - __main__ - Step 40065: {'lr': 0.00042273935855910487, 'samples': 7692480, 'steps': 40064, 'loss/train': 1.5744364261627197} -08/30/2021 20:24:32 - INFO - __main__ - Step 40066: {'lr': 0.00042273552229887313, 'samples': 7692672, 'steps': 40065, 'loss/train': 1.5886642932891846} -08/30/2021 20:24:33 - INFO - __main__ - Step 40067: {'lr': 0.00042273168596080934, 'samples': 7692864, 'steps': 40066, 'loss/train': 1.115769386291504} -08/30/2021 20:24:34 - INFO - __main__ - Step 40068: {'lr': 0.0004227278495449154, 'samples': 7693056, 'steps': 40067, 'loss/train': 0.4387758672237396} -08/30/2021 20:24:34 - INFO - __main__ - Step 40069: {'lr': 0.0004227240130511929, 'samples': 7693248, 'steps': 40068, 'loss/train': 1.2347543239593506} -08/30/2021 20:24:35 - INFO - __main__ - Step 40070: {'lr': 0.0004227201764796437, 'samples': 7693440, 'steps': 40069, 'loss/train': 1.8556299209594727} -08/30/2021 20:24:35 - INFO - __main__ - Step 40071: {'lr': 0.00042271633983026935, 'samples': 7693632, 'steps': 40070, 'loss/train': 1.4767194986343384} -08/30/2021 20:24:36 - INFO - __main__ - Step 40072: {'lr': 0.00042271250310307174, 'samples': 7693824, 'steps': 40071, 'loss/train': 1.3978941440582275} -08/30/2021 20:24:37 - INFO - __main__ - Step 40073: {'lr': 0.0004227086662980525, 'samples': 7694016, 'steps': 40072, 'loss/train': 1.6440999507904053} -08/30/2021 20:24:38 - INFO - __main__ - Step 40074: {'lr': 0.00042270482941521347, 'samples': 7694208, 'steps': 40073, 'loss/train': 1.8462797403335571} -08/30/2021 20:24:38 - INFO - __main__ - Step 40075: {'lr': 0.0004227009924545563, 'samples': 7694400, 'steps': 40074, 'loss/train': 1.6532827615737915} -08/30/2021 20:24:38 - INFO - __main__ - Step 40076: {'lr': 0.00042269715541608265, 'samples': 7694592, 'steps': 40075, 'loss/train': 1.437268614768982} -08/30/2021 20:24:39 - INFO - __main__ - Step 40077: {'lr': 0.0004226933182997944, 'samples': 7694784, 'steps': 40076, 'loss/train': 1.716097354888916} -08/30/2021 20:24:40 - INFO - __main__ - Step 40078: {'lr': 0.00042268948110569317, 'samples': 7694976, 'steps': 40077, 'loss/train': 1.6675812005996704} -08/30/2021 20:24:41 - INFO - __main__ - Step 40079: {'lr': 0.00042268564383378073, 'samples': 7695168, 'steps': 40078, 'loss/train': 1.4932663440704346} -08/30/2021 20:24:41 - INFO - __main__ - Step 40080: {'lr': 0.00042268180648405884, 'samples': 7695360, 'steps': 40079, 'loss/train': 1.8863270282745361} -08/30/2021 20:24:41 - INFO - __main__ - Step 40081: {'lr': 0.00042267796905652924, 'samples': 7695552, 'steps': 40080, 'loss/train': 1.533851146697998} -08/30/2021 20:24:42 - INFO - __main__ - Step 40082: {'lr': 0.0004226741315511935, 'samples': 7695744, 'steps': 40081, 'loss/train': 0.9106437563896179} -08/30/2021 20:24:44 - INFO - __main__ - Step 40083: {'lr': 0.00042267029396805345, 'samples': 7695936, 'steps': 40082, 'loss/train': 0.22785265743732452} -08/30/2021 20:24:44 - INFO - __main__ - Step 40084: {'lr': 0.0004226664563071109, 'samples': 7696128, 'steps': 40083, 'loss/train': 1.4615514278411865} -08/30/2021 20:24:45 - INFO - __main__ - Step 40085: {'lr': 0.0004226626185683675, 'samples': 7696320, 'steps': 40084, 'loss/train': 1.8035987615585327} -08/30/2021 20:24:45 - INFO - __main__ - Step 40086: {'lr': 0.00042265878075182497, 'samples': 7696512, 'steps': 40085, 'loss/train': 1.7350702285766602} -08/30/2021 20:24:45 - INFO - __main__ - Step 40087: {'lr': 0.0004226549428574851, 'samples': 7696704, 'steps': 40086, 'loss/train': 1.4968773126602173} -08/30/2021 20:24:46 - INFO - __main__ - Step 40088: {'lr': 0.0004226511048853495, 'samples': 7696896, 'steps': 40087, 'loss/train': 1.630066156387329} -08/30/2021 20:24:47 - INFO - __main__ - Step 40089: {'lr': 0.00042264726683542, 'samples': 7697088, 'steps': 40088, 'loss/train': 1.514136791229248} -08/30/2021 20:24:48 - INFO - __main__ - Step 40090: {'lr': 0.00042264342870769835, 'samples': 7697280, 'steps': 40089, 'loss/train': 1.4384431838989258} -08/30/2021 20:24:48 - INFO - __main__ - Step 40091: {'lr': 0.0004226395905021862, 'samples': 7697472, 'steps': 40090, 'loss/train': 3.484011650085449} -08/30/2021 20:24:49 - INFO - __main__ - Step 40092: {'lr': 0.0004226357522188853, 'samples': 7697664, 'steps': 40091, 'loss/train': 1.4920129776000977} -08/30/2021 20:24:49 - INFO - __main__ - Step 40093: {'lr': 0.0004226319138577974, 'samples': 7697856, 'steps': 40092, 'loss/train': 1.2493542432785034} -08/30/2021 20:24:50 - INFO - __main__ - Step 40094: {'lr': 0.0004226280754189243, 'samples': 7698048, 'steps': 40093, 'loss/train': 1.2865017652511597} -08/30/2021 20:24:51 - INFO - __main__ - Step 40095: {'lr': 0.0004226242369022676, 'samples': 7698240, 'steps': 40094, 'loss/train': 1.741750955581665} -08/30/2021 20:24:51 - INFO - __main__ - Step 40096: {'lr': 0.00042262039830782906, 'samples': 7698432, 'steps': 40095, 'loss/train': 0.4658586084842682} -08/30/2021 20:24:51 - INFO - __main__ - Step 40097: {'lr': 0.00042261655963561043, 'samples': 7698624, 'steps': 40096, 'loss/train': 1.557449460029602} -08/30/2021 20:24:52 - INFO - __main__ - Step 40098: {'lr': 0.0004226127208856134, 'samples': 7698816, 'steps': 40097, 'loss/train': 1.4780389070510864} -08/30/2021 20:24:53 - INFO - __main__ - Step 40099: {'lr': 0.0004226088820578399, 'samples': 7699008, 'steps': 40098, 'loss/train': 0.8832118511199951} -08/30/2021 20:24:54 - INFO - __main__ - Step 40100: {'lr': 0.00042260504315229136, 'samples': 7699200, 'steps': 40099, 'loss/train': 1.1463679075241089} -08/30/2021 20:24:54 - INFO - __main__ - Step 40101: {'lr': 0.00042260120416896975, 'samples': 7699392, 'steps': 40100, 'loss/train': 1.1320773363113403} -08/30/2021 20:24:54 - INFO - __main__ - Step 40102: {'lr': 0.0004225973651078766, 'samples': 7699584, 'steps': 40101, 'loss/train': 1.163228988647461} -08/30/2021 20:24:55 - INFO - __main__ - Step 40103: {'lr': 0.0004225935259690138, 'samples': 7699776, 'steps': 40102, 'loss/train': 1.7681277990341187} -08/30/2021 20:24:57 - INFO - __main__ - Step 40104: {'lr': 0.00042258968675238295, 'samples': 7699968, 'steps': 40103, 'loss/train': 1.5688971281051636} -08/30/2021 20:24:57 - INFO - __main__ - Step 40105: {'lr': 0.00042258584745798595, 'samples': 7700160, 'steps': 40104, 'loss/train': 1.2291992902755737} -08/30/2021 20:24:57 - INFO - __main__ - Step 40106: {'lr': 0.00042258200808582434, 'samples': 7700352, 'steps': 40105, 'loss/train': 1.602418303489685} -08/30/2021 20:24:58 - INFO - __main__ - Step 40107: {'lr': 0.00042257816863590006, 'samples': 7700544, 'steps': 40106, 'loss/train': 1.0369330644607544} -08/30/2021 20:24:58 - INFO - __main__ - Step 40108: {'lr': 0.0004225743291082146, 'samples': 7700736, 'steps': 40107, 'loss/train': 1.5382561683654785} -08/30/2021 20:24:59 - INFO - __main__ - Step 40109: {'lr': 0.0004225704895027699, 'samples': 7700928, 'steps': 40108, 'loss/train': 0.04080049693584442} -08/30/2021 20:25:00 - INFO - __main__ - Step 40110: {'lr': 0.0004225666498195675, 'samples': 7701120, 'steps': 40109, 'loss/train': 0.5043378472328186} -08/30/2021 20:25:01 - INFO - __main__ - Step 40111: {'lr': 0.0004225628100586093, 'samples': 7701312, 'steps': 40110, 'loss/train': 1.935161828994751} -08/30/2021 20:25:01 - INFO - __main__ - Step 40112: {'lr': 0.00042255897021989695, 'samples': 7701504, 'steps': 40111, 'loss/train': 1.0228524208068848} -08/30/2021 20:25:01 - INFO - __main__ - Step 40113: {'lr': 0.0004225551303034322, 'samples': 7701696, 'steps': 40112, 'loss/train': 1.6141903400421143} -08/30/2021 20:25:02 - INFO - __main__ - Step 40114: {'lr': 0.00042255129030921673, 'samples': 7701888, 'steps': 40113, 'loss/train': 1.0793025493621826} -08/30/2021 20:25:03 - INFO - __main__ - Step 40115: {'lr': 0.0004225474502372524, 'samples': 7702080, 'steps': 40114, 'loss/train': 1.5178107023239136} -08/30/2021 20:25:04 - INFO - __main__ - Step 40116: {'lr': 0.00042254361008754076, 'samples': 7702272, 'steps': 40115, 'loss/train': 1.3765003681182861} -08/30/2021 20:25:04 - INFO - __main__ - Step 40117: {'lr': 0.0004225397698600837, 'samples': 7702464, 'steps': 40116, 'loss/train': 2.1357617378234863} -08/30/2021 20:25:05 - INFO - __main__ - Step 40118: {'lr': 0.0004225359295548828, 'samples': 7702656, 'steps': 40117, 'loss/train': 0.9446281790733337} -08/30/2021 20:25:05 - INFO - __main__ - Step 40119: {'lr': 0.0004225320891719399, 'samples': 7702848, 'steps': 40118, 'loss/train': 1.4856083393096924} -08/30/2021 20:25:07 - INFO - __main__ - Step 40120: {'lr': 0.0004225282487112567, 'samples': 7703040, 'steps': 40119, 'loss/train': 1.324765682220459} -08/30/2021 20:25:07 - INFO - __main__ - Step 40121: {'lr': 0.000422524408172835, 'samples': 7703232, 'steps': 40120, 'loss/train': 2.013789415359497} -08/30/2021 20:25:08 - INFO - __main__ - Step 40122: {'lr': 0.0004225205675566765, 'samples': 7703424, 'steps': 40121, 'loss/train': 1.408373475074768} -08/30/2021 20:25:08 - INFO - __main__ - Step 40123: {'lr': 0.00042251672686278275, 'samples': 7703616, 'steps': 40122, 'loss/train': 1.0368902683258057} -08/30/2021 20:25:08 - INFO - __main__ - Step 40124: {'lr': 0.0004225128860911557, 'samples': 7703808, 'steps': 40123, 'loss/train': 1.0282988548278809} -08/30/2021 20:25:09 - INFO - __main__ - Step 40125: {'lr': 0.00042250904524179697, 'samples': 7704000, 'steps': 40124, 'loss/train': 1.749969244003296} -08/30/2021 20:25:10 - INFO - __main__ - Step 40126: {'lr': 0.00042250520431470827, 'samples': 7704192, 'steps': 40125, 'loss/train': 0.07141036540269852} -08/30/2021 20:25:11 - INFO - __main__ - Step 40127: {'lr': 0.00042250136330989154, 'samples': 7704384, 'steps': 40126, 'loss/train': 1.5025092363357544} -08/30/2021 20:25:11 - INFO - __main__ - Step 40128: {'lr': 0.00042249752222734826, 'samples': 7704576, 'steps': 40127, 'loss/train': 1.748719573020935} -08/30/2021 20:25:12 - INFO - __main__ - Step 40129: {'lr': 0.0004224936810670803, 'samples': 7704768, 'steps': 40128, 'loss/train': 1.230688214302063} -08/30/2021 20:25:12 - INFO - __main__ - Step 40130: {'lr': 0.0004224898398290893, 'samples': 7704960, 'steps': 40129, 'loss/train': 1.589765191078186} -08/30/2021 20:25:13 - INFO - __main__ - Step 40131: {'lr': 0.0004224859985133771, 'samples': 7705152, 'steps': 40130, 'loss/train': 0.2544907331466675} -08/30/2021 20:25:14 - INFO - __main__ - Step 40132: {'lr': 0.0004224821571199453, 'samples': 7705344, 'steps': 40131, 'loss/train': 1.3932286500930786} -08/30/2021 20:25:14 - INFO - __main__ - Step 40133: {'lr': 0.0004224783156487958, 'samples': 7705536, 'steps': 40132, 'loss/train': 1.7468143701553345} -08/30/2021 20:25:15 - INFO - __main__ - Step 40134: {'lr': 0.0004224744740999302, 'samples': 7705728, 'steps': 40133, 'loss/train': 1.5016592741012573} -08/30/2021 20:25:15 - INFO - __main__ - Step 40135: {'lr': 0.0004224706324733502, 'samples': 7705920, 'steps': 40134, 'loss/train': 1.1475318670272827} -08/30/2021 20:25:17 - INFO - __main__ - Step 40136: {'lr': 0.00042246679076905763, 'samples': 7706112, 'steps': 40135, 'loss/train': 1.443509578704834} -08/30/2021 20:25:17 - INFO - __main__ - Step 40137: {'lr': 0.00042246294898705416, 'samples': 7706304, 'steps': 40136, 'loss/train': 1.1780893802642822} -08/30/2021 20:25:18 - INFO - __main__ - Step 40138: {'lr': 0.0004224591071273416, 'samples': 7706496, 'steps': 40137, 'loss/train': 1.2799158096313477} -08/30/2021 20:25:18 - INFO - __main__ - Step 40139: {'lr': 0.00042245526518992164, 'samples': 7706688, 'steps': 40138, 'loss/train': 1.420188069343567} -08/30/2021 20:25:18 - INFO - __main__ - Step 40140: {'lr': 0.0004224514231747959, 'samples': 7706880, 'steps': 40139, 'loss/train': 1.156541109085083} -08/30/2021 20:25:19 - INFO - __main__ - Step 40141: {'lr': 0.00042244758108196635, 'samples': 7707072, 'steps': 40140, 'loss/train': 1.3181376457214355} -08/30/2021 20:25:20 - INFO - __main__ - Step 40142: {'lr': 0.00042244373891143453, 'samples': 7707264, 'steps': 40141, 'loss/train': 1.780436635017395} -08/30/2021 20:25:21 - INFO - __main__ - Step 40143: {'lr': 0.00042243989666320217, 'samples': 7707456, 'steps': 40142, 'loss/train': 0.983108401298523} -08/30/2021 20:25:21 - INFO - __main__ - Step 40144: {'lr': 0.00042243605433727106, 'samples': 7707648, 'steps': 40143, 'loss/train': 2.8953497409820557} -08/30/2021 20:25:21 - INFO - __main__ - Step 40145: {'lr': 0.0004224322119336429, 'samples': 7707840, 'steps': 40144, 'loss/train': 1.4392122030258179} -08/30/2021 20:25:22 - INFO - __main__ - Step 40146: {'lr': 0.0004224283694523195, 'samples': 7708032, 'steps': 40145, 'loss/train': 1.4808763265609741} -08/30/2021 20:25:23 - INFO - __main__ - Step 40147: {'lr': 0.0004224245268933025, 'samples': 7708224, 'steps': 40146, 'loss/train': 1.6406389474868774} -08/30/2021 20:25:24 - INFO - __main__ - Step 40148: {'lr': 0.0004224206842565937, 'samples': 7708416, 'steps': 40147, 'loss/train': 1.9504764080047607} -08/30/2021 20:25:24 - INFO - __main__ - Step 40149: {'lr': 0.0004224168415421948, 'samples': 7708608, 'steps': 40148, 'loss/train': 1.5916428565979004} -08/30/2021 20:25:24 - INFO - __main__ - Step 40150: {'lr': 0.0004224129987501075, 'samples': 7708800, 'steps': 40149, 'loss/train': 1.1741554737091064} -08/30/2021 20:25:25 - INFO - __main__ - Step 40151: {'lr': 0.0004224091558803337, 'samples': 7708992, 'steps': 40150, 'loss/train': 1.4782854318618774} -08/30/2021 20:25:26 - INFO - __main__ - Step 40152: {'lr': 0.0004224053129328748, 'samples': 7709184, 'steps': 40151, 'loss/train': 1.6107507944107056} -08/30/2021 20:25:27 - INFO - __main__ - Step 40153: {'lr': 0.0004224014699077329, 'samples': 7709376, 'steps': 40152, 'loss/train': 1.3659883737564087} -08/30/2021 20:25:27 - INFO - __main__ - Step 40154: {'lr': 0.00042239762680490944, 'samples': 7709568, 'steps': 40153, 'loss/train': 1.8823963403701782} -08/30/2021 20:25:27 - INFO - __main__ - Step 40155: {'lr': 0.00042239378362440627, 'samples': 7709760, 'steps': 40154, 'loss/train': 1.9861246347427368} -08/30/2021 20:25:28 - INFO - __main__ - Step 40156: {'lr': 0.0004223899403662251, 'samples': 7709952, 'steps': 40155, 'loss/train': 1.3641180992126465} -08/30/2021 20:25:29 - INFO - __main__ - Step 40157: {'lr': 0.0004223860970303678, 'samples': 7710144, 'steps': 40156, 'loss/train': 0.8633911609649658} -08/30/2021 20:25:29 - INFO - __main__ - Step 40158: {'lr': 0.00042238225361683593, 'samples': 7710336, 'steps': 40157, 'loss/train': 1.4306128025054932} -08/30/2021 20:25:30 - INFO - __main__ - Step 40159: {'lr': 0.00042237841012563126, 'samples': 7710528, 'steps': 40158, 'loss/train': 1.4161688089370728} -08/30/2021 20:25:30 - INFO - __main__ - Step 40160: {'lr': 0.00042237456655675555, 'samples': 7710720, 'steps': 40159, 'loss/train': 0.8530848622322083} -08/30/2021 20:25:31 - INFO - __main__ - Step 40161: {'lr': 0.0004223707229102105, 'samples': 7710912, 'steps': 40160, 'loss/train': 1.4616531133651733} -08/30/2021 20:25:32 - INFO - __main__ - Step 40162: {'lr': 0.0004223668791859979, 'samples': 7711104, 'steps': 40161, 'loss/train': 1.4830741882324219} -08/30/2021 20:25:32 - INFO - __main__ - Step 40163: {'lr': 0.00042236303538411934, 'samples': 7711296, 'steps': 40162, 'loss/train': 1.6665172576904297} -08/30/2021 20:25:33 - INFO - __main__ - Step 40164: {'lr': 0.0004223591915045768, 'samples': 7711488, 'steps': 40163, 'loss/train': 1.1709684133529663} -08/30/2021 20:25:33 - INFO - __main__ - Step 40165: {'lr': 0.0004223553475473718, 'samples': 7711680, 'steps': 40164, 'loss/train': 1.786667823791504} -08/30/2021 20:25:33 - INFO - __main__ - Step 40166: {'lr': 0.00042235150351250617, 'samples': 7711872, 'steps': 40165, 'loss/train': 0.9781188368797302} -08/30/2021 20:25:34 - INFO - __main__ - Step 40167: {'lr': 0.00042234765939998156, 'samples': 7712064, 'steps': 40166, 'loss/train': 1.8463987112045288} -08/30/2021 20:25:36 - INFO - __main__ - Step 40168: {'lr': 0.00042234381520979983, 'samples': 7712256, 'steps': 40167, 'loss/train': 1.7644538879394531} -08/30/2021 20:25:36 - INFO - __main__ - Step 40169: {'lr': 0.0004223399709419625, 'samples': 7712448, 'steps': 40168, 'loss/train': 1.6409869194030762} -08/30/2021 20:25:36 - INFO - __main__ - Step 40170: {'lr': 0.0004223361265964716, 'samples': 7712640, 'steps': 40169, 'loss/train': 1.7242861986160278} -08/30/2021 20:25:37 - INFO - __main__ - Step 40171: {'lr': 0.0004223322821733286, 'samples': 7712832, 'steps': 40170, 'loss/train': 1.6220542192459106} -08/30/2021 20:25:37 - INFO - __main__ - Step 40172: {'lr': 0.0004223284376725354, 'samples': 7713024, 'steps': 40171, 'loss/train': 1.19353187084198} -08/30/2021 20:25:39 - INFO - __main__ - Step 40173: {'lr': 0.00042232459309409355, 'samples': 7713216, 'steps': 40172, 'loss/train': 0.06970373541116714} -08/30/2021 20:25:39 - INFO - __main__ - Step 40174: {'lr': 0.00042232074843800494, 'samples': 7713408, 'steps': 40173, 'loss/train': 1.3166005611419678} -08/30/2021 20:25:40 - INFO - __main__ - Step 40175: {'lr': 0.00042231690370427135, 'samples': 7713600, 'steps': 40174, 'loss/train': 1.6356009244918823} -08/30/2021 20:25:40 - INFO - __main__ - Step 40176: {'lr': 0.00042231305889289437, 'samples': 7713792, 'steps': 40175, 'loss/train': 1.422113060951233} -08/30/2021 20:25:41 - INFO - __main__ - Step 40177: {'lr': 0.00042230921400387576, 'samples': 7713984, 'steps': 40176, 'loss/train': 1.337374210357666} -08/30/2021 20:25:41 - INFO - __main__ - Step 40178: {'lr': 0.0004223053690372173, 'samples': 7714176, 'steps': 40177, 'loss/train': 1.1246124505996704} -08/30/2021 20:25:42 - INFO - __main__ - Step 40179: {'lr': 0.00042230152399292065, 'samples': 7714368, 'steps': 40178, 'loss/train': 1.218896508216858} -08/30/2021 20:25:43 - INFO - __main__ - Step 40180: {'lr': 0.00042229767887098766, 'samples': 7714560, 'steps': 40179, 'loss/train': 0.061578940600156784} -08/30/2021 20:25:43 - INFO - __main__ - Step 40181: {'lr': 0.00042229383367142, 'samples': 7714752, 'steps': 40180, 'loss/train': 1.214537501335144} -08/30/2021 20:25:44 - INFO - __main__ - Step 40182: {'lr': 0.0004222899883942194, 'samples': 7714944, 'steps': 40181, 'loss/train': 1.0074496269226074} -08/30/2021 20:25:44 - INFO - __main__ - Step 40183: {'lr': 0.0004222861430393875, 'samples': 7715136, 'steps': 40182, 'loss/train': 2.0966055393218994} -08/30/2021 20:25:45 - INFO - __main__ - Step 40184: {'lr': 0.0004222822976069262, 'samples': 7715328, 'steps': 40183, 'loss/train': 1.9399789571762085} -08/30/2021 20:25:46 - INFO - __main__ - Step 40185: {'lr': 0.0004222784520968371, 'samples': 7715520, 'steps': 40184, 'loss/train': 1.4649888277053833} -08/30/2021 20:25:46 - INFO - __main__ - Step 40186: {'lr': 0.0004222746065091221, 'samples': 7715712, 'steps': 40185, 'loss/train': 1.5618942975997925} -08/30/2021 20:25:47 - INFO - __main__ - Step 40187: {'lr': 0.0004222707608437827, 'samples': 7715904, 'steps': 40186, 'loss/train': 0.6976447105407715} -08/30/2021 20:25:47 - INFO - __main__ - Step 40188: {'lr': 0.00042226691510082083, 'samples': 7716096, 'steps': 40187, 'loss/train': 1.6354740858078003} -08/30/2021 20:25:49 - INFO - __main__ - Step 40189: {'lr': 0.0004222630692802381, 'samples': 7716288, 'steps': 40188, 'loss/train': 1.2968591451644897} -08/30/2021 20:25:50 - INFO - __main__ - Step 40190: {'lr': 0.00042225922338203625, 'samples': 7716480, 'steps': 40189, 'loss/train': 1.4233076572418213} -08/30/2021 20:25:50 - INFO - __main__ - Step 40191: {'lr': 0.00042225537740621713, 'samples': 7716672, 'steps': 40190, 'loss/train': 0.5747855305671692} -08/30/2021 20:25:50 - INFO - __main__ - Step 40192: {'lr': 0.00042225153135278236, 'samples': 7716864, 'steps': 40191, 'loss/train': 1.2353590726852417} -08/30/2021 20:25:51 - INFO - __main__ - Step 40193: {'lr': 0.00042224768522173374, 'samples': 7717056, 'steps': 40192, 'loss/train': 1.044938564300537} -08/30/2021 20:25:51 - INFO - __main__ - Step 40194: {'lr': 0.00042224383901307293, 'samples': 7717248, 'steps': 40193, 'loss/train': 1.9550994634628296} -08/30/2021 20:25:53 - INFO - __main__ - Step 40195: {'lr': 0.0004222399927268018, 'samples': 7717440, 'steps': 40194, 'loss/train': 2.1724047660827637} -08/30/2021 20:25:53 - INFO - __main__ - Step 40196: {'lr': 0.0004222361463629218, 'samples': 7717632, 'steps': 40195, 'loss/train': 0.1256076693534851} -08/30/2021 20:25:54 - INFO - __main__ - Step 40197: {'lr': 0.00042223229992143505, 'samples': 7717824, 'steps': 40196, 'loss/train': 1.5086017847061157} -08/30/2021 20:25:54 - INFO - __main__ - Step 40198: {'lr': 0.00042222845340234293, 'samples': 7718016, 'steps': 40197, 'loss/train': 1.4065885543823242} -08/30/2021 20:25:54 - INFO - __main__ - Step 40199: {'lr': 0.00042222460680564747, 'samples': 7718208, 'steps': 40198, 'loss/train': 1.6255756616592407} -08/30/2021 20:25:55 - INFO - __main__ - Step 40200: {'lr': 0.0004222207601313501, 'samples': 7718400, 'steps': 40199, 'loss/train': 1.2395771741867065} -08/30/2021 20:25:56 - INFO - __main__ - Step 40201: {'lr': 0.00042221691337945285, 'samples': 7718592, 'steps': 40200, 'loss/train': 1.7549831867218018} -08/30/2021 20:25:57 - INFO - __main__ - Step 40202: {'lr': 0.0004222130665499573, 'samples': 7718784, 'steps': 40201, 'loss/train': 1.170562744140625} -08/30/2021 20:25:57 - INFO - __main__ - Step 40203: {'lr': 0.0004222092196428651, 'samples': 7718976, 'steps': 40202, 'loss/train': 1.9099899530410767} -08/30/2021 20:25:57 - INFO - __main__ - Step 40204: {'lr': 0.0004222053726581782, 'samples': 7719168, 'steps': 40203, 'loss/train': 1.7395405769348145} -08/30/2021 20:25:58 - INFO - __main__ - Step 40205: {'lr': 0.0004222015255958981, 'samples': 7719360, 'steps': 40204, 'loss/train': 1.62998628616333} -08/30/2021 20:25:59 - INFO - __main__ - Step 40206: {'lr': 0.0004221976784560267, 'samples': 7719552, 'steps': 40205, 'loss/train': 2.335939645767212} -08/30/2021 20:26:00 - INFO - __main__ - Step 40207: {'lr': 0.0004221938312385657, 'samples': 7719744, 'steps': 40206, 'loss/train': 1.6312938928604126} -08/30/2021 20:26:00 - INFO - __main__ - Step 40208: {'lr': 0.00042218998394351684, 'samples': 7719936, 'steps': 40207, 'loss/train': 0.9350178837776184} -08/30/2021 20:26:01 - INFO - __main__ - Step 40209: {'lr': 0.0004221861365708818, 'samples': 7720128, 'steps': 40208, 'loss/train': 1.3486769199371338} -08/30/2021 20:26:01 - INFO - __main__ - Step 40210: {'lr': 0.0004221822891206623, 'samples': 7720320, 'steps': 40209, 'loss/train': 1.4945238828659058} -08/30/2021 20:26:02 - INFO - __main__ - Step 40211: {'lr': 0.00042217844159286015, 'samples': 7720512, 'steps': 40210, 'loss/train': 1.356119155883789} -08/30/2021 20:26:03 - INFO - __main__ - Step 40212: {'lr': 0.00042217459398747703, 'samples': 7720704, 'steps': 40211, 'loss/train': 1.0561883449554443} -08/30/2021 20:26:03 - INFO - __main__ - Step 40213: {'lr': 0.0004221707463045148, 'samples': 7720896, 'steps': 40212, 'loss/train': 1.2845380306243896} -08/30/2021 20:26:04 - INFO - __main__ - Step 40214: {'lr': 0.0004221668985439749, 'samples': 7721088, 'steps': 40213, 'loss/train': 1.4505268335342407} -08/30/2021 20:26:04 - INFO - __main__ - Step 40215: {'lr': 0.00042216305070585946, 'samples': 7721280, 'steps': 40214, 'loss/train': 1.356143832206726} -08/30/2021 20:26:06 - INFO - __main__ - Step 40216: {'lr': 0.00042215920279016993, 'samples': 7721472, 'steps': 40215, 'loss/train': 1.7022701501846313} -08/30/2021 20:26:06 - INFO - __main__ - Step 40217: {'lr': 0.00042215535479690807, 'samples': 7721664, 'steps': 40216, 'loss/train': 1.1661900281906128} -08/30/2021 20:26:06 - INFO - __main__ - Step 40218: {'lr': 0.0004221515067260757, 'samples': 7721856, 'steps': 40217, 'loss/train': 1.6053369045257568} -08/30/2021 20:26:07 - INFO - __main__ - Step 40219: {'lr': 0.0004221476585776745, 'samples': 7722048, 'steps': 40218, 'loss/train': 0.9795981645584106} -08/30/2021 20:26:07 - INFO - __main__ - Step 40220: {'lr': 0.00042214381035170624, 'samples': 7722240, 'steps': 40219, 'loss/train': 1.2027286291122437} -08/30/2021 20:26:07 - INFO - __main__ - Step 40221: {'lr': 0.0004221399620481726, 'samples': 7722432, 'steps': 40220, 'loss/train': 1.3306986093521118} -08/30/2021 20:26:09 - INFO - __main__ - Step 40222: {'lr': 0.00042213611366707547, 'samples': 7722624, 'steps': 40221, 'loss/train': 1.4610397815704346} -08/30/2021 20:26:09 - INFO - __main__ - Step 40223: {'lr': 0.0004221322652084163, 'samples': 7722816, 'steps': 40222, 'loss/train': 1.5459133386611938} -08/30/2021 20:26:10 - INFO - __main__ - Step 40224: {'lr': 0.0004221284166721971, 'samples': 7723008, 'steps': 40223, 'loss/train': 1.3988077640533447} -08/30/2021 20:26:10 - INFO - __main__ - Step 40225: {'lr': 0.00042212456805841944, 'samples': 7723200, 'steps': 40224, 'loss/train': 1.1661248207092285} -08/30/2021 20:26:10 - INFO - __main__ - Step 40226: {'lr': 0.00042212071936708506, 'samples': 7723392, 'steps': 40225, 'loss/train': 1.7283368110656738} -08/30/2021 20:26:12 - INFO - __main__ - Step 40227: {'lr': 0.0004221168705981958, 'samples': 7723584, 'steps': 40226, 'loss/train': 1.7759498357772827} -08/30/2021 20:26:12 - INFO - __main__ - Step 40228: {'lr': 0.00042211302175175334, 'samples': 7723776, 'steps': 40227, 'loss/train': 1.4242711067199707} -08/30/2021 20:26:13 - INFO - __main__ - Step 40229: {'lr': 0.0004221091728277595, 'samples': 7723968, 'steps': 40228, 'loss/train': 1.1733466386795044} -08/30/2021 20:26:13 - INFO - __main__ - Step 40230: {'lr': 0.0004221053238262158, 'samples': 7724160, 'steps': 40229, 'loss/train': 1.3824355602264404} -08/30/2021 20:26:13 - INFO - __main__ - Step 40231: {'lr': 0.0004221014747471241, 'samples': 7724352, 'steps': 40230, 'loss/train': 1.3102034330368042} -08/30/2021 20:26:15 - INFO - __main__ - Step 40232: {'lr': 0.0004220976255904861, 'samples': 7724544, 'steps': 40231, 'loss/train': 2.7779786586761475} -08/30/2021 20:26:15 - INFO - __main__ - Step 40233: {'lr': 0.00042209377635630364, 'samples': 7724736, 'steps': 40232, 'loss/train': 1.4527312517166138} -08/30/2021 20:26:16 - INFO - __main__ - Step 40234: {'lr': 0.00042208992704457837, 'samples': 7724928, 'steps': 40233, 'loss/train': 1.3883405923843384} -08/30/2021 20:26:16 - INFO - __main__ - Step 40235: {'lr': 0.00042208607765531204, 'samples': 7725120, 'steps': 40234, 'loss/train': 0.9999542832374573} -08/30/2021 20:26:16 - INFO - __main__ - Step 40236: {'lr': 0.00042208222818850634, 'samples': 7725312, 'steps': 40235, 'loss/train': 1.4538649320602417} -08/30/2021 20:26:18 - INFO - __main__ - Step 40237: {'lr': 0.0004220783786441631, 'samples': 7725504, 'steps': 40236, 'loss/train': 2.277010917663574} -08/30/2021 20:26:19 - INFO - __main__ - Step 40238: {'lr': 0.0004220745290222839, 'samples': 7725696, 'steps': 40237, 'loss/train': 1.5419234037399292} -08/30/2021 20:26:19 - INFO - __main__ - Step 40239: {'lr': 0.00042207067932287066, 'samples': 7725888, 'steps': 40238, 'loss/train': 0.10715563595294952} -08/30/2021 20:26:19 - INFO - __main__ - Step 40240: {'lr': 0.00042206682954592503, 'samples': 7726080, 'steps': 40239, 'loss/train': 1.7700825929641724} -08/30/2021 20:26:20 - INFO - __main__ - Step 40241: {'lr': 0.0004220629796914487, 'samples': 7726272, 'steps': 40240, 'loss/train': 1.2869728803634644} -08/30/2021 20:26:21 - INFO - __main__ - Step 40242: {'lr': 0.00042205912975944344, 'samples': 7726464, 'steps': 40241, 'loss/train': 1.4915441274642944} -08/30/2021 20:26:22 - INFO - __main__ - Step 40243: {'lr': 0.00042205527974991096, 'samples': 7726656, 'steps': 40242, 'loss/train': 1.5039814710617065} -08/30/2021 20:26:22 - INFO - __main__ - Step 40244: {'lr': 0.00042205142966285315, 'samples': 7726848, 'steps': 40243, 'loss/train': 1.6874818801879883} -08/30/2021 20:26:22 - INFO - __main__ - Step 40245: {'lr': 0.0004220475794982716, 'samples': 7727040, 'steps': 40244, 'loss/train': 1.5026730298995972} -08/30/2021 20:26:23 - INFO - __main__ - Step 40246: {'lr': 0.00042204372925616797, 'samples': 7727232, 'steps': 40245, 'loss/train': 1.845436453819275} -08/30/2021 20:26:25 - INFO - __main__ - Step 40247: {'lr': 0.0004220398789365441, 'samples': 7727424, 'steps': 40246, 'loss/train': 1.6923195123672485} -08/30/2021 20:26:25 - INFO - __main__ - Step 40248: {'lr': 0.0004220360285394017, 'samples': 7727616, 'steps': 40247, 'loss/train': 1.8158271312713623} -08/30/2021 20:26:25 - INFO - __main__ - Step 40249: {'lr': 0.0004220321780647426, 'samples': 7727808, 'steps': 40248, 'loss/train': 1.2127046585083008} -08/30/2021 20:26:26 - INFO - __main__ - Step 40250: {'lr': 0.00042202832751256846, 'samples': 7728000, 'steps': 40249, 'loss/train': 1.5437755584716797} -08/30/2021 20:26:26 - INFO - __main__ - Step 40251: {'lr': 0.0004220244768828809, 'samples': 7728192, 'steps': 40250, 'loss/train': 1.290106177330017} -08/30/2021 20:26:27 - INFO - __main__ - Step 40252: {'lr': 0.0004220206261756819, 'samples': 7728384, 'steps': 40251, 'loss/train': 1.5362416505813599} -08/30/2021 20:26:28 - INFO - __main__ - Step 40253: {'lr': 0.00042201677539097294, 'samples': 7728576, 'steps': 40252, 'loss/train': 1.6931043863296509} -08/30/2021 20:26:28 - INFO - __main__ - Step 40254: {'lr': 0.00042201292452875595, 'samples': 7728768, 'steps': 40253, 'loss/train': 1.2157080173492432} -08/30/2021 20:26:29 - INFO - __main__ - Step 40255: {'lr': 0.00042200907358903264, 'samples': 7728960, 'steps': 40254, 'loss/train': 1.0430796146392822} -08/30/2021 20:26:29 - INFO - __main__ - Step 40256: {'lr': 0.0004220052225718046, 'samples': 7729152, 'steps': 40255, 'loss/train': 0.3433298170566559} -08/30/2021 20:26:31 - INFO - __main__ - Step 40257: {'lr': 0.0004220013714770737, 'samples': 7729344, 'steps': 40256, 'loss/train': 1.6203621625900269} -08/30/2021 20:26:31 - INFO - __main__ - Step 40258: {'lr': 0.0004219975203048416, 'samples': 7729536, 'steps': 40257, 'loss/train': 1.6242464780807495} -08/30/2021 20:26:31 - INFO - __main__ - Step 40259: {'lr': 0.0004219936690551101, 'samples': 7729728, 'steps': 40258, 'loss/train': 1.542497992515564} -08/30/2021 20:26:32 - INFO - __main__ - Step 40260: {'lr': 0.0004219898177278809, 'samples': 7729920, 'steps': 40259, 'loss/train': 1.1110448837280273} -08/30/2021 20:26:32 - INFO - __main__ - Step 40261: {'lr': 0.00042198596632315576, 'samples': 7730112, 'steps': 40260, 'loss/train': 1.1610714197158813} -08/30/2021 20:26:32 - INFO - __main__ - Step 40262: {'lr': 0.0004219821148409364, 'samples': 7730304, 'steps': 40261, 'loss/train': 0.886784553527832} -08/30/2021 20:26:34 - INFO - __main__ - Step 40263: {'lr': 0.00042197826328122456, 'samples': 7730496, 'steps': 40262, 'loss/train': 1.809583067893982} -08/30/2021 20:26:34 - INFO - __main__ - Step 40264: {'lr': 0.00042197441164402197, 'samples': 7730688, 'steps': 40263, 'loss/train': 0.9538978338241577} -08/30/2021 20:26:35 - INFO - __main__ - Step 40265: {'lr': 0.0004219705599293303, 'samples': 7730880, 'steps': 40264, 'loss/train': 1.320407509803772} -08/30/2021 20:26:35 - INFO - __main__ - Step 40266: {'lr': 0.00042196670813715137, 'samples': 7731072, 'steps': 40265, 'loss/train': 1.3191862106323242} -08/30/2021 20:26:35 - INFO - __main__ - Step 40267: {'lr': 0.0004219628562674869, 'samples': 7731264, 'steps': 40266, 'loss/train': 1.5166136026382446} -08/30/2021 20:26:37 - INFO - __main__ - Step 40268: {'lr': 0.00042195900432033865, 'samples': 7731456, 'steps': 40267, 'loss/train': 1.1742010116577148} -08/30/2021 20:26:38 - INFO - __main__ - Step 40269: {'lr': 0.00042195515229570833, 'samples': 7731648, 'steps': 40268, 'loss/train': 2.4226460456848145} -08/30/2021 20:26:38 - INFO - __main__ - Step 40270: {'lr': 0.0004219513001935976, 'samples': 7731840, 'steps': 40269, 'loss/train': 0.08580461144447327} -08/30/2021 20:26:38 - INFO - __main__ - Step 40271: {'lr': 0.00042194744801400837, 'samples': 7732032, 'steps': 40270, 'loss/train': 1.444115400314331} -08/30/2021 20:26:39 - INFO - __main__ - Step 40272: {'lr': 0.0004219435957569422, 'samples': 7732224, 'steps': 40271, 'loss/train': 1.6173263788223267} -08/30/2021 20:26:40 - INFO - __main__ - Step 40273: {'lr': 0.0004219397434224009, 'samples': 7732416, 'steps': 40272, 'loss/train': 1.2772033214569092} -08/30/2021 20:26:41 - INFO - __main__ - Step 40274: {'lr': 0.0004219358910103862, 'samples': 7732608, 'steps': 40273, 'loss/train': 1.7011590003967285} -08/30/2021 20:26:41 - INFO - __main__ - Step 40275: {'lr': 0.00042193203852089993, 'samples': 7732800, 'steps': 40274, 'loss/train': 1.663090705871582} -08/30/2021 20:26:41 - INFO - __main__ - Step 40276: {'lr': 0.00042192818595394367, 'samples': 7732992, 'steps': 40275, 'loss/train': 1.5258194208145142} -08/30/2021 20:26:42 - INFO - __main__ - Step 40277: {'lr': 0.00042192433330951926, 'samples': 7733184, 'steps': 40276, 'loss/train': 1.3969306945800781} -08/30/2021 20:26:42 - INFO - __main__ - Step 40278: {'lr': 0.00042192048058762834, 'samples': 7733376, 'steps': 40277, 'loss/train': 1.6105679273605347} -08/30/2021 20:26:44 - INFO - __main__ - Step 40279: {'lr': 0.00042191662778827275, 'samples': 7733568, 'steps': 40278, 'loss/train': 1.8405061960220337} -08/30/2021 20:26:44 - INFO - __main__ - Step 40280: {'lr': 0.0004219127749114541, 'samples': 7733760, 'steps': 40279, 'loss/train': 1.2166024446487427} -08/30/2021 20:26:45 - INFO - __main__ - Step 40281: {'lr': 0.00042190892195717426, 'samples': 7733952, 'steps': 40280, 'loss/train': 0.11395849287509918} -08/30/2021 20:26:45 - INFO - __main__ - Step 40282: {'lr': 0.000421905068925435, 'samples': 7734144, 'steps': 40281, 'loss/train': 0.8582900166511536} -08/30/2021 20:26:45 - INFO - __main__ - Step 40283: {'lr': 0.00042190121581623784, 'samples': 7734336, 'steps': 40282, 'loss/train': 0.1202424168586731} -08/30/2021 20:26:47 - INFO - __main__ - Step 40284: {'lr': 0.0004218973626295847, 'samples': 7734528, 'steps': 40283, 'loss/train': 0.883367657661438} -08/30/2021 20:26:47 - INFO - __main__ - Step 40285: {'lr': 0.0004218935093654772, 'samples': 7734720, 'steps': 40284, 'loss/train': 1.707689881324768} -08/30/2021 20:26:48 - INFO - __main__ - Step 40286: {'lr': 0.00042188965602391726, 'samples': 7734912, 'steps': 40285, 'loss/train': 1.4564054012298584} -08/30/2021 20:26:48 - INFO - __main__ - Step 40287: {'lr': 0.0004218858026049064, 'samples': 7735104, 'steps': 40286, 'loss/train': 1.4280130863189697} -08/30/2021 20:26:48 - INFO - __main__ - Step 40288: {'lr': 0.00042188194910844644, 'samples': 7735296, 'steps': 40287, 'loss/train': 0.8406389355659485} -08/30/2021 20:26:50 - INFO - __main__ - Step 40289: {'lr': 0.0004218780955345392, 'samples': 7735488, 'steps': 40288, 'loss/train': 1.1888542175292969} -08/30/2021 20:26:50 - INFO - __main__ - Step 40290: {'lr': 0.0004218742418831863, 'samples': 7735680, 'steps': 40289, 'loss/train': 1.2641905546188354} -08/30/2021 20:26:50 - INFO - __main__ - Step 40291: {'lr': 0.0004218703881543895, 'samples': 7735872, 'steps': 40290, 'loss/train': 1.9486578702926636} -08/30/2021 20:26:51 - INFO - __main__ - Step 40292: {'lr': 0.0004218665343481506, 'samples': 7736064, 'steps': 40291, 'loss/train': 1.593509554862976} -08/30/2021 20:26:51 - INFO - __main__ - Step 40293: {'lr': 0.00042186268046447124, 'samples': 7736256, 'steps': 40292, 'loss/train': 1.459471344947815} -08/30/2021 20:26:53 - INFO - __main__ - Step 40294: {'lr': 0.0004218588265033533, 'samples': 7736448, 'steps': 40293, 'loss/train': 1.3312150239944458} -08/30/2021 20:26:53 - INFO - __main__ - Step 40295: {'lr': 0.0004218549724647983, 'samples': 7736640, 'steps': 40294, 'loss/train': 1.2679634094238281} -08/30/2021 20:26:54 - INFO - __main__ - Step 40296: {'lr': 0.0004218511183488082, 'samples': 7736832, 'steps': 40295, 'loss/train': 1.7948038578033447} -08/30/2021 20:26:54 - INFO - __main__ - Step 40297: {'lr': 0.00042184726415538457, 'samples': 7737024, 'steps': 40296, 'loss/train': 0.22260817885398865} -08/30/2021 20:26:54 - INFO - __main__ - Step 40298: {'lr': 0.00042184340988452924, 'samples': 7737216, 'steps': 40297, 'loss/train': 0.058078914880752563} -08/30/2021 20:26:55 - INFO - __main__ - Step 40299: {'lr': 0.00042183955553624393, 'samples': 7737408, 'steps': 40298, 'loss/train': 3.3233203887939453} -08/30/2021 20:26:57 - INFO - __main__ - Step 40300: {'lr': 0.0004218357011105304, 'samples': 7737600, 'steps': 40299, 'loss/train': 1.1314195394515991} -08/30/2021 20:26:58 - INFO - __main__ - Step 40301: {'lr': 0.00042183184660739027, 'samples': 7737792, 'steps': 40300, 'loss/train': 1.8569934368133545} -08/30/2021 20:26:58 - INFO - __main__ - Step 40302: {'lr': 0.00042182799202682543, 'samples': 7737984, 'steps': 40301, 'loss/train': 1.2081995010375977} -08/30/2021 20:26:58 - INFO - __main__ - Step 40303: {'lr': 0.0004218241373688375, 'samples': 7738176, 'steps': 40302, 'loss/train': 1.2449356317520142} -08/30/2021 20:26:59 - INFO - __main__ - Step 40304: {'lr': 0.0004218202826334283, 'samples': 7738368, 'steps': 40303, 'loss/train': 1.396825909614563} -08/30/2021 20:27:00 - INFO - __main__ - Step 40305: {'lr': 0.0004218164278205995, 'samples': 7738560, 'steps': 40304, 'loss/train': 0.2743162512779236} -08/30/2021 20:27:01 - INFO - __main__ - Step 40306: {'lr': 0.00042181257293035293, 'samples': 7738752, 'steps': 40305, 'loss/train': 1.203744888305664} -08/30/2021 20:27:01 - INFO - __main__ - Step 40307: {'lr': 0.00042180871796269025, 'samples': 7738944, 'steps': 40306, 'loss/train': 1.3717964887619019} -08/30/2021 20:27:01 - INFO - __main__ - Step 40308: {'lr': 0.00042180486291761314, 'samples': 7739136, 'steps': 40307, 'loss/train': 1.3883644342422485} -08/30/2021 20:27:02 - INFO - __main__ - Step 40309: {'lr': 0.0004218010077951235, 'samples': 7739328, 'steps': 40308, 'loss/train': 1.1176751852035522} -08/30/2021 20:27:03 - INFO - __main__ - Step 40310: {'lr': 0.00042179715259522293, 'samples': 7739520, 'steps': 40309, 'loss/train': 1.3393816947937012} -08/30/2021 20:27:04 - INFO - __main__ - Step 40311: {'lr': 0.00042179329731791324, 'samples': 7739712, 'steps': 40310, 'loss/train': 1.5139739513397217} -08/30/2021 20:27:04 - INFO - __main__ - Step 40312: {'lr': 0.0004217894419631961, 'samples': 7739904, 'steps': 40311, 'loss/train': 1.3634111881256104} -08/30/2021 20:27:04 - INFO - __main__ - Step 40313: {'lr': 0.00042178558653107337, 'samples': 7740096, 'steps': 40312, 'loss/train': 1.403426170349121} -08/30/2021 20:27:05 - INFO - __main__ - Step 40314: {'lr': 0.0004217817310215466, 'samples': 7740288, 'steps': 40313, 'loss/train': 1.4507509469985962} -08/30/2021 20:27:05 - INFO - __main__ - Step 40315: {'lr': 0.00042177787543461767, 'samples': 7740480, 'steps': 40314, 'loss/train': 1.1985925436019897} -08/30/2021 20:27:07 - INFO - __main__ - Step 40316: {'lr': 0.0004217740197702883, 'samples': 7740672, 'steps': 40315, 'loss/train': 1.3934478759765625} -08/30/2021 20:27:07 - INFO - __main__ - Step 40317: {'lr': 0.00042177016402856023, 'samples': 7740864, 'steps': 40316, 'loss/train': 1.6885063648223877} -08/30/2021 20:27:07 - INFO - __main__ - Step 40318: {'lr': 0.00042176630820943515, 'samples': 7741056, 'steps': 40317, 'loss/train': 1.5838969945907593} -08/30/2021 20:27:08 - INFO - __main__ - Step 40319: {'lr': 0.0004217624523129148, 'samples': 7741248, 'steps': 40318, 'loss/train': 1.466996431350708} -08/30/2021 20:27:08 - INFO - __main__ - Step 40320: {'lr': 0.0004217585963390009, 'samples': 7741440, 'steps': 40319, 'loss/train': 1.7655426263809204} -08/30/2021 20:27:10 - INFO - __main__ - Step 40321: {'lr': 0.00042175474028769534, 'samples': 7741632, 'steps': 40320, 'loss/train': 1.281391978263855} -08/30/2021 20:27:10 - INFO - __main__ - Step 40322: {'lr': 0.00042175088415899963, 'samples': 7741824, 'steps': 40321, 'loss/train': 0.9976521730422974} -08/30/2021 20:27:11 - INFO - __main__ - Step 40323: {'lr': 0.00042174702795291574, 'samples': 7742016, 'steps': 40322, 'loss/train': 1.610156536102295} -08/30/2021 20:27:11 - INFO - __main__ - Step 40324: {'lr': 0.0004217431716694452, 'samples': 7742208, 'steps': 40323, 'loss/train': 1.3683069944381714} -08/30/2021 20:27:11 - INFO - __main__ - Step 40325: {'lr': 0.00042173931530858986, 'samples': 7742400, 'steps': 40324, 'loss/train': 1.3470276594161987} -08/30/2021 20:27:12 - INFO - __main__ - Step 40326: {'lr': 0.00042173545887035145, 'samples': 7742592, 'steps': 40325, 'loss/train': 2.7673308849334717} -08/30/2021 20:27:13 - INFO - __main__ - Step 40327: {'lr': 0.0004217316023547317, 'samples': 7742784, 'steps': 40326, 'loss/train': 1.4720513820648193} -08/30/2021 20:27:14 - INFO - __main__ - Step 40328: {'lr': 0.00042172774576173226, 'samples': 7742976, 'steps': 40327, 'loss/train': 1.5200849771499634} -08/30/2021 20:27:14 - INFO - __main__ - Step 40329: {'lr': 0.00042172388909135505, 'samples': 7743168, 'steps': 40328, 'loss/train': 1.0162831544876099} -08/30/2021 20:27:14 - INFO - __main__ - Step 40330: {'lr': 0.0004217200323436017, 'samples': 7743360, 'steps': 40329, 'loss/train': 1.2907416820526123} -08/30/2021 20:27:15 - INFO - __main__ - Step 40331: {'lr': 0.00042171617551847387, 'samples': 7743552, 'steps': 40330, 'loss/train': 1.3495899438858032} -08/30/2021 20:27:16 - INFO - __main__ - Step 40332: {'lr': 0.0004217123186159735, 'samples': 7743744, 'steps': 40331, 'loss/train': 1.6993693113327026} -08/30/2021 20:27:17 - INFO - __main__ - Step 40333: {'lr': 0.0004217084616361021, 'samples': 7743936, 'steps': 40332, 'loss/train': 1.6641629934310913} -08/30/2021 20:27:17 - INFO - __main__ - Step 40334: {'lr': 0.0004217046045788615, 'samples': 7744128, 'steps': 40333, 'loss/train': 0.5669681429862976} -08/30/2021 20:27:17 - INFO - __main__ - Step 40335: {'lr': 0.0004217007474442535, 'samples': 7744320, 'steps': 40334, 'loss/train': 1.3328664302825928} -08/30/2021 20:27:18 - INFO - __main__ - Step 40336: {'lr': 0.00042169689023227987, 'samples': 7744512, 'steps': 40335, 'loss/train': 1.328505516052246} -08/30/2021 20:27:19 - INFO - __main__ - Step 40337: {'lr': 0.00042169303294294216, 'samples': 7744704, 'steps': 40336, 'loss/train': 1.4756109714508057} -08/30/2021 20:27:20 - INFO - __main__ - Step 40338: {'lr': 0.0004216891755762423, 'samples': 7744896, 'steps': 40337, 'loss/train': 1.2971888780593872} -08/30/2021 20:27:20 - INFO - __main__ - Step 40339: {'lr': 0.00042168531813218193, 'samples': 7745088, 'steps': 40338, 'loss/train': 1.5193443298339844} -08/30/2021 20:27:20 - INFO - __main__ - Step 40340: {'lr': 0.0004216814606107627, 'samples': 7745280, 'steps': 40339, 'loss/train': 1.5263233184814453} -08/30/2021 20:27:21 - INFO - __main__ - Step 40341: {'lr': 0.00042167760301198656, 'samples': 7745472, 'steps': 40340, 'loss/train': 1.0317834615707397} -08/30/2021 20:27:22 - INFO - __main__ - Step 40342: {'lr': 0.0004216737453358551, 'samples': 7745664, 'steps': 40341, 'loss/train': 1.6369235515594482} -08/30/2021 20:27:22 - INFO - __main__ - Step 40343: {'lr': 0.00042166988758237013, 'samples': 7745856, 'steps': 40342, 'loss/train': 1.9898678064346313} -08/30/2021 20:27:23 - INFO - __main__ - Step 40344: {'lr': 0.00042166602975153333, 'samples': 7746048, 'steps': 40343, 'loss/train': 0.6933454275131226} -08/30/2021 20:27:23 - INFO - __main__ - Step 40345: {'lr': 0.0004216621718433465, 'samples': 7746240, 'steps': 40344, 'loss/train': 1.4344582557678223} -08/30/2021 20:27:23 - INFO - __main__ - Step 40346: {'lr': 0.0004216583138578113, 'samples': 7746432, 'steps': 40345, 'loss/train': 1.5408536195755005} -08/30/2021 20:27:24 - INFO - __main__ - Step 40347: {'lr': 0.00042165445579492956, 'samples': 7746624, 'steps': 40346, 'loss/train': 1.0205566883087158} -08/30/2021 20:27:25 - INFO - __main__ - Step 40348: {'lr': 0.00042165059765470294, 'samples': 7746816, 'steps': 40347, 'loss/train': 0.20116294920444489} -08/30/2021 20:27:26 - INFO - __main__ - Step 40349: {'lr': 0.0004216467394371333, 'samples': 7747008, 'steps': 40348, 'loss/train': 1.8667646646499634} -08/30/2021 20:27:26 - INFO - __main__ - Step 40350: {'lr': 0.00042164288114222213, 'samples': 7747200, 'steps': 40349, 'loss/train': 0.07593879848718643} -08/30/2021 20:27:27 - INFO - __main__ - Step 40351: {'lr': 0.0004216390227699714, 'samples': 7747392, 'steps': 40350, 'loss/train': 1.6598784923553467} -08/30/2021 20:27:27 - INFO - __main__ - Step 40352: {'lr': 0.0004216351643203828, 'samples': 7747584, 'steps': 40351, 'loss/train': 1.124419093132019} -08/30/2021 20:27:28 - INFO - __main__ - Step 40353: {'lr': 0.000421631305793458, 'samples': 7747776, 'steps': 40352, 'loss/train': 1.5605723857879639} -08/30/2021 20:27:29 - INFO - __main__ - Step 40354: {'lr': 0.00042162744718919875, 'samples': 7747968, 'steps': 40353, 'loss/train': 1.3406190872192383} -08/30/2021 20:27:29 - INFO - __main__ - Step 40355: {'lr': 0.0004216235885076069, 'samples': 7748160, 'steps': 40354, 'loss/train': 0.9849457740783691} -08/30/2021 20:27:29 - INFO - __main__ - Step 40356: {'lr': 0.00042161972974868415, 'samples': 7748352, 'steps': 40355, 'loss/train': 1.4419806003570557} -08/30/2021 20:27:30 - INFO - __main__ - Step 40357: {'lr': 0.00042161587091243215, 'samples': 7748544, 'steps': 40356, 'loss/train': 1.6206034421920776} -08/30/2021 20:27:32 - INFO - __main__ - Step 40358: {'lr': 0.00042161201199885257, 'samples': 7748736, 'steps': 40357, 'loss/train': 1.4444661140441895} -08/30/2021 20:27:32 - INFO - __main__ - Step 40359: {'lr': 0.0004216081530079474, 'samples': 7748928, 'steps': 40358, 'loss/train': 0.3225405812263489} -08/30/2021 20:27:33 - INFO - __main__ - Step 40360: {'lr': 0.0004216042939397182, 'samples': 7749120, 'steps': 40359, 'loss/train': 1.5831632614135742} -08/30/2021 20:27:33 - INFO - __main__ - Step 40361: {'lr': 0.00042160043479416676, 'samples': 7749312, 'steps': 40360, 'loss/train': 1.3057969808578491} -08/30/2021 20:27:33 - INFO - __main__ - Step 40362: {'lr': 0.00042159657557129483, 'samples': 7749504, 'steps': 40361, 'loss/train': 1.74065101146698} -08/30/2021 20:27:35 - INFO - __main__ - Step 40363: {'lr': 0.0004215927162711041, 'samples': 7749696, 'steps': 40362, 'loss/train': 2.012923002243042} -08/30/2021 20:27:36 - INFO - __main__ - Step 40364: {'lr': 0.00042158885689359637, 'samples': 7749888, 'steps': 40363, 'loss/train': 1.2692090272903442} -08/30/2021 20:27:36 - INFO - __main__ - Step 40365: {'lr': 0.0004215849974387733, 'samples': 7750080, 'steps': 40364, 'loss/train': 0.5138596296310425} -08/30/2021 20:27:36 - INFO - __main__ - Step 40366: {'lr': 0.0004215811379066367, 'samples': 7750272, 'steps': 40365, 'loss/train': 1.9462394714355469} -08/30/2021 20:27:37 - INFO - __main__ - Step 40367: {'lr': 0.00042157727829718827, 'samples': 7750464, 'steps': 40366, 'loss/train': 1.1545941829681396} -08/30/2021 20:27:38 - INFO - __main__ - Step 40368: {'lr': 0.00042157341861042986, 'samples': 7750656, 'steps': 40367, 'loss/train': 1.166222095489502} -08/30/2021 20:27:39 - INFO - __main__ - Step 40369: {'lr': 0.00042156955884636307, 'samples': 7750848, 'steps': 40368, 'loss/train': 1.1601929664611816} -08/30/2021 20:27:39 - INFO - __main__ - Step 40370: {'lr': 0.0004215656990049896, 'samples': 7751040, 'steps': 40369, 'loss/train': 0.9019650816917419} -08/30/2021 20:27:39 - INFO - __main__ - Step 40371: {'lr': 0.0004215618390863114, 'samples': 7751232, 'steps': 40370, 'loss/train': 0.5609971880912781} -08/30/2021 20:27:40 - INFO - __main__ - Step 40372: {'lr': 0.00042155797909033, 'samples': 7751424, 'steps': 40371, 'loss/train': 1.0752054452896118} -08/30/2021 20:27:42 - INFO - __main__ - Step 40373: {'lr': 0.00042155411901704723, 'samples': 7751616, 'steps': 40372, 'loss/train': 1.7423181533813477} -08/30/2021 20:27:42 - INFO - __main__ - Step 40374: {'lr': 0.0004215502588664648, 'samples': 7751808, 'steps': 40373, 'loss/train': 1.6888480186462402} -08/30/2021 20:27:42 - INFO - __main__ - Step 40375: {'lr': 0.0004215463986385845, 'samples': 7752000, 'steps': 40374, 'loss/train': 0.9067996144294739} -08/30/2021 20:27:43 - INFO - __main__ - Step 40376: {'lr': 0.0004215425383334081, 'samples': 7752192, 'steps': 40375, 'loss/train': 0.1130153089761734} -08/30/2021 20:27:43 - INFO - __main__ - Step 40377: {'lr': 0.00042153867795093714, 'samples': 7752384, 'steps': 40376, 'loss/train': 1.697483777999878} -08/30/2021 20:27:45 - INFO - __main__ - Step 40378: {'lr': 0.0004215348174911736, 'samples': 7752576, 'steps': 40377, 'loss/train': 1.3804517984390259} -08/30/2021 20:27:45 - INFO - __main__ - Step 40379: {'lr': 0.0004215309569541191, 'samples': 7752768, 'steps': 40378, 'loss/train': 1.7700001001358032} -08/30/2021 20:27:45 - INFO - __main__ - Step 40380: {'lr': 0.00042152709633977545, 'samples': 7752960, 'steps': 40379, 'loss/train': 0.9675085544586182} -08/30/2021 20:27:46 - INFO - __main__ - Step 40381: {'lr': 0.0004215232356481442, 'samples': 7753152, 'steps': 40380, 'loss/train': 1.470218539237976} -08/30/2021 20:27:46 - INFO - __main__ - Step 40382: {'lr': 0.0004215193748792273, 'samples': 7753344, 'steps': 40381, 'loss/train': 0.9617518782615662} -08/30/2021 20:27:46 - INFO - __main__ - Step 40383: {'lr': 0.00042151551403302645, 'samples': 7753536, 'steps': 40382, 'loss/train': 2.5395267009735107} -08/30/2021 20:27:48 - INFO - __main__ - Step 40384: {'lr': 0.00042151165310954335, 'samples': 7753728, 'steps': 40383, 'loss/train': 1.0392248630523682} -08/30/2021 20:27:48 - INFO - __main__ - Step 40385: {'lr': 0.0004215077921087798, 'samples': 7753920, 'steps': 40384, 'loss/train': 1.2678207159042358} -08/30/2021 20:27:49 - INFO - __main__ - Step 40386: {'lr': 0.00042150393103073736, 'samples': 7754112, 'steps': 40385, 'loss/train': 1.7337491512298584} -08/30/2021 20:27:49 - INFO - __main__ - Step 40387: {'lr': 0.00042150006987541795, 'samples': 7754304, 'steps': 40386, 'loss/train': 1.4797840118408203} -08/30/2021 20:27:49 - INFO - __main__ - Step 40388: {'lr': 0.0004214962086428232, 'samples': 7754496, 'steps': 40387, 'loss/train': 1.6027675867080688} -08/30/2021 20:27:51 - INFO - __main__ - Step 40389: {'lr': 0.00042149234733295497, 'samples': 7754688, 'steps': 40388, 'loss/train': 1.48690664768219} -08/30/2021 20:27:52 - INFO - __main__ - Step 40390: {'lr': 0.00042148848594581503, 'samples': 7754880, 'steps': 40389, 'loss/train': 0.8856250643730164} -08/30/2021 20:27:52 - INFO - __main__ - Step 40391: {'lr': 0.00042148462448140487, 'samples': 7755072, 'steps': 40390, 'loss/train': 1.2726149559020996} -08/30/2021 20:27:52 - INFO - __main__ - Step 40392: {'lr': 0.0004214807629397264, 'samples': 7755264, 'steps': 40391, 'loss/train': 1.0841002464294434} -08/30/2021 20:27:53 - INFO - __main__ - Step 40393: {'lr': 0.00042147690132078136, 'samples': 7755456, 'steps': 40392, 'loss/train': 0.5488522052764893} -08/30/2021 20:27:54 - INFO - __main__ - Step 40394: {'lr': 0.0004214730396245715, 'samples': 7755648, 'steps': 40393, 'loss/train': 1.7260538339614868} -08/30/2021 20:27:55 - INFO - __main__ - Step 40395: {'lr': 0.0004214691778510985, 'samples': 7755840, 'steps': 40394, 'loss/train': 1.1251493692398071} -08/30/2021 20:27:55 - INFO - __main__ - Step 40396: {'lr': 0.0004214653160003642, 'samples': 7756032, 'steps': 40395, 'loss/train': 1.223690152168274} -08/30/2021 20:27:55 - INFO - __main__ - Step 40397: {'lr': 0.00042146145407237023, 'samples': 7756224, 'steps': 40396, 'loss/train': 1.7771278619766235} -08/30/2021 20:27:56 - INFO - __main__ - Step 40398: {'lr': 0.00042145759206711834, 'samples': 7756416, 'steps': 40397, 'loss/train': 1.2685621976852417} -08/30/2021 20:27:57 - INFO - __main__ - Step 40399: {'lr': 0.0004214537299846104, 'samples': 7756608, 'steps': 40398, 'loss/train': 1.491264820098877} -08/30/2021 20:27:58 - INFO - __main__ - Step 40400: {'lr': 0.00042144986782484796, 'samples': 7756800, 'steps': 40399, 'loss/train': 0.7894092798233032} -08/30/2021 20:27:58 - INFO - __main__ - Step 40401: {'lr': 0.00042144600558783284, 'samples': 7756992, 'steps': 40400, 'loss/train': 1.8036856651306152} -08/30/2021 20:27:58 - INFO - __main__ - Step 40402: {'lr': 0.0004214421432735669, 'samples': 7757184, 'steps': 40401, 'loss/train': 1.860939621925354} -08/30/2021 20:27:59 - INFO - __main__ - Step 40403: {'lr': 0.0004214382808820517, 'samples': 7757376, 'steps': 40402, 'loss/train': 1.1518206596374512} -08/30/2021 20:28:00 - INFO - __main__ - Step 40404: {'lr': 0.0004214344184132891, 'samples': 7757568, 'steps': 40403, 'loss/train': 1.4019520282745361} -08/30/2021 20:28:01 - INFO - __main__ - Step 40405: {'lr': 0.0004214305558672808, 'samples': 7757760, 'steps': 40404, 'loss/train': 1.6815168857574463} -08/30/2021 20:28:01 - INFO - __main__ - Step 40406: {'lr': 0.0004214266932440285, 'samples': 7757952, 'steps': 40405, 'loss/train': 1.1195424795150757} -08/30/2021 20:28:01 - INFO - __main__ - Step 40407: {'lr': 0.000421422830543534, 'samples': 7758144, 'steps': 40406, 'loss/train': 1.978991985321045} -08/30/2021 20:28:02 - INFO - __main__ - Step 40408: {'lr': 0.00042141896776579904, 'samples': 7758336, 'steps': 40407, 'loss/train': 1.7775918245315552} -08/30/2021 20:28:02 - INFO - __main__ - Step 40409: {'lr': 0.0004214151049108252, 'samples': 7758528, 'steps': 40408, 'loss/train': 1.9017950296401978} -08/30/2021 20:28:04 - INFO - __main__ - Step 40410: {'lr': 0.00042141124197861456, 'samples': 7758720, 'steps': 40409, 'loss/train': 1.5890322923660278} -08/30/2021 20:28:05 - INFO - __main__ - Step 40411: {'lr': 0.0004214073789691686, 'samples': 7758912, 'steps': 40410, 'loss/train': 1.2397980690002441} -08/30/2021 20:28:05 - INFO - __main__ - Step 40412: {'lr': 0.00042140351588248906, 'samples': 7759104, 'steps': 40411, 'loss/train': 1.108689546585083} -08/30/2021 20:28:05 - INFO - __main__ - Step 40413: {'lr': 0.00042139965271857774, 'samples': 7759296, 'steps': 40412, 'loss/train': 1.601515293121338} -08/30/2021 20:28:06 - INFO - __main__ - Step 40414: {'lr': 0.0004213957894774364, 'samples': 7759488, 'steps': 40413, 'loss/train': 1.6199307441711426} -08/30/2021 20:28:07 - INFO - __main__ - Step 40415: {'lr': 0.0004213919261590667, 'samples': 7759680, 'steps': 40414, 'loss/train': 1.2000441551208496} -08/30/2021 20:28:08 - INFO - __main__ - Step 40416: {'lr': 0.0004213880627634705, 'samples': 7759872, 'steps': 40415, 'loss/train': 1.3455394506454468} -08/30/2021 20:28:08 - INFO - __main__ - Step 40417: {'lr': 0.0004213841992906496, 'samples': 7760064, 'steps': 40416, 'loss/train': 1.445949673652649} -08/30/2021 20:28:08 - INFO - __main__ - Step 40418: {'lr': 0.0004213803357406055, 'samples': 7760256, 'steps': 40417, 'loss/train': 3.0253524780273438} -08/30/2021 20:28:09 - INFO - __main__ - Step 40419: {'lr': 0.00042137647211334007, 'samples': 7760448, 'steps': 40418, 'loss/train': 1.703039288520813} -08/30/2021 20:28:10 - INFO - __main__ - Step 40420: {'lr': 0.000421372608408855, 'samples': 7760640, 'steps': 40419, 'loss/train': 1.0548624992370605} -08/30/2021 20:28:11 - INFO - __main__ - Step 40421: {'lr': 0.0004213687446271522, 'samples': 7760832, 'steps': 40420, 'loss/train': 0.630613386631012} -08/30/2021 20:28:11 - INFO - __main__ - Step 40422: {'lr': 0.0004213648807682332, 'samples': 7761024, 'steps': 40421, 'loss/train': 1.1315127611160278} -08/30/2021 20:28:12 - INFO - __main__ - Step 40423: {'lr': 0.00042136101683209993, 'samples': 7761216, 'steps': 40422, 'loss/train': 0.7948915958404541} -08/30/2021 20:28:12 - INFO - __main__ - Step 40424: {'lr': 0.00042135715281875393, 'samples': 7761408, 'steps': 40423, 'loss/train': 1.3141162395477295} -08/30/2021 20:28:13 - INFO - __main__ - Step 40425: {'lr': 0.000421353288728197, 'samples': 7761600, 'steps': 40424, 'loss/train': 1.365285873413086} -08/30/2021 20:28:14 - INFO - __main__ - Step 40426: {'lr': 0.00042134942456043104, 'samples': 7761792, 'steps': 40425, 'loss/train': 1.4979889392852783} -08/30/2021 20:28:14 - INFO - __main__ - Step 40427: {'lr': 0.00042134556031545755, 'samples': 7761984, 'steps': 40426, 'loss/train': 1.6646672487258911} -08/30/2021 20:28:15 - INFO - __main__ - Step 40428: {'lr': 0.0004213416959932785, 'samples': 7762176, 'steps': 40427, 'loss/train': 1.4719834327697754} -08/30/2021 20:28:15 - INFO - __main__ - Step 40429: {'lr': 0.0004213378315938955, 'samples': 7762368, 'steps': 40428, 'loss/train': 1.4625318050384521} -08/30/2021 20:28:16 - INFO - __main__ - Step 40430: {'lr': 0.0004213339671173103, 'samples': 7762560, 'steps': 40429, 'loss/train': 1.7609469890594482} -08/30/2021 20:28:17 - INFO - __main__ - Step 40431: {'lr': 0.00042133010256352466, 'samples': 7762752, 'steps': 40430, 'loss/train': 1.342767357826233} -08/30/2021 20:28:17 - INFO - __main__ - Step 40432: {'lr': 0.00042132623793254034, 'samples': 7762944, 'steps': 40431, 'loss/train': 1.5123486518859863} -08/30/2021 20:28:17 - INFO - __main__ - Step 40433: {'lr': 0.0004213223732243591, 'samples': 7763136, 'steps': 40432, 'loss/train': 1.015679955482483} -08/30/2021 20:28:18 - INFO - __main__ - Step 40434: {'lr': 0.00042131850843898255, 'samples': 7763328, 'steps': 40433, 'loss/train': 1.6167149543762207} -08/30/2021 20:28:19 - INFO - __main__ - Step 40435: {'lr': 0.0004213146435764126, 'samples': 7763520, 'steps': 40434, 'loss/train': 1.1222697496414185} -08/30/2021 20:28:20 - INFO - __main__ - Step 40436: {'lr': 0.00042131077863665086, 'samples': 7763712, 'steps': 40435, 'loss/train': 1.3205466270446777} -08/30/2021 20:28:20 - INFO - __main__ - Step 40437: {'lr': 0.00042130691361969914, 'samples': 7763904, 'steps': 40436, 'loss/train': 1.8007813692092896} -08/30/2021 20:28:20 - INFO - __main__ - Step 40438: {'lr': 0.00042130304852555916, 'samples': 7764096, 'steps': 40437, 'loss/train': 1.0469818115234375} -08/30/2021 20:28:21 - INFO - __main__ - Step 40439: {'lr': 0.00042129918335423265, 'samples': 7764288, 'steps': 40438, 'loss/train': 1.7245885133743286} -08/30/2021 20:28:21 - INFO - __main__ - Step 40440: {'lr': 0.0004212953181057214, 'samples': 7764480, 'steps': 40439, 'loss/train': 0.9249213933944702} -08/30/2021 20:28:23 - INFO - __main__ - Step 40441: {'lr': 0.0004212914527800272, 'samples': 7764672, 'steps': 40440, 'loss/train': 1.673649787902832} -08/30/2021 20:28:23 - INFO - __main__ - Step 40442: {'lr': 0.0004212875873771516, 'samples': 7764864, 'steps': 40441, 'loss/train': 1.8173637390136719} -08/30/2021 20:28:23 - INFO - __main__ - Step 40443: {'lr': 0.0004212837218970965, 'samples': 7765056, 'steps': 40442, 'loss/train': 1.2666174173355103} -08/30/2021 20:28:24 - INFO - __main__ - Step 40444: {'lr': 0.00042127985633986365, 'samples': 7765248, 'steps': 40443, 'loss/train': 1.8080965280532837} -08/30/2021 20:28:24 - INFO - __main__ - Step 40445: {'lr': 0.0004212759907054546, 'samples': 7765440, 'steps': 40444, 'loss/train': 0.9029436111450195} -08/30/2021 20:28:26 - INFO - __main__ - Step 40446: {'lr': 0.00042127212499387136, 'samples': 7765632, 'steps': 40445, 'loss/train': 1.9689255952835083} -08/30/2021 20:28:26 - INFO - __main__ - Step 40447: {'lr': 0.0004212682592051155, 'samples': 7765824, 'steps': 40446, 'loss/train': 0.8188783526420593} -08/30/2021 20:28:26 - INFO - __main__ - Step 40448: {'lr': 0.0004212643933391888, 'samples': 7766016, 'steps': 40447, 'loss/train': 1.0567514896392822} -08/30/2021 20:28:27 - INFO - __main__ - Step 40449: {'lr': 0.000421260527396093, 'samples': 7766208, 'steps': 40448, 'loss/train': 1.8368842601776123} -08/30/2021 20:28:27 - INFO - __main__ - Step 40450: {'lr': 0.0004212566613758299, 'samples': 7766400, 'steps': 40449, 'loss/train': 1.2382378578186035} -08/30/2021 20:28:28 - INFO - __main__ - Step 40451: {'lr': 0.00042125279527840124, 'samples': 7766592, 'steps': 40450, 'loss/train': 1.1999740600585938} -08/30/2021 20:28:29 - INFO - __main__ - Step 40452: {'lr': 0.0004212489291038085, 'samples': 7766784, 'steps': 40451, 'loss/train': 1.3785598278045654} -08/30/2021 20:28:29 - INFO - __main__ - Step 40453: {'lr': 0.0004212450628520538, 'samples': 7766976, 'steps': 40452, 'loss/train': 1.0922719240188599} -08/30/2021 20:28:30 - INFO - __main__ - Step 40454: {'lr': 0.0004212411965231387, 'samples': 7767168, 'steps': 40453, 'loss/train': 0.7920715808868408} -08/30/2021 20:28:30 - INFO - __main__ - Step 40455: {'lr': 0.0004212373301170649, 'samples': 7767360, 'steps': 40454, 'loss/train': 1.383434772491455} -08/30/2021 20:28:32 - INFO - __main__ - Step 40456: {'lr': 0.00042123346363383426, 'samples': 7767552, 'steps': 40455, 'loss/train': 1.9311542510986328} -08/30/2021 20:28:32 - INFO - __main__ - Step 40457: {'lr': 0.0004212295970734484, 'samples': 7767744, 'steps': 40456, 'loss/train': 1.3312681913375854} -08/30/2021 20:28:33 - INFO - __main__ - Step 40458: {'lr': 0.00042122573043590925, 'samples': 7767936, 'steps': 40457, 'loss/train': 1.8653721809387207} -08/30/2021 20:28:33 - INFO - __main__ - Step 40459: {'lr': 0.0004212218637212183, 'samples': 7768128, 'steps': 40458, 'loss/train': 1.610128402709961} -08/30/2021 20:28:33 - INFO - __main__ - Step 40460: {'lr': 0.00042121799692937747, 'samples': 7768320, 'steps': 40459, 'loss/train': 1.544898271560669} -08/30/2021 20:28:34 - INFO - __main__ - Step 40461: {'lr': 0.00042121413006038845, 'samples': 7768512, 'steps': 40460, 'loss/train': 0.045086152851581573} -08/30/2021 20:28:34 - INFO - __main__ - Step 40462: {'lr': 0.000421210263114253, 'samples': 7768704, 'steps': 40461, 'loss/train': 0.26992398500442505} -08/30/2021 20:28:36 - INFO - __main__ - Step 40463: {'lr': 0.00042120639609097277, 'samples': 7768896, 'steps': 40462, 'loss/train': 1.440134048461914} -08/30/2021 20:28:36 - INFO - __main__ - Step 40464: {'lr': 0.0004212025289905497, 'samples': 7769088, 'steps': 40463, 'loss/train': 1.5344254970550537} -08/30/2021 20:28:36 - INFO - __main__ - Step 40465: {'lr': 0.0004211986618129854, 'samples': 7769280, 'steps': 40464, 'loss/train': 1.4416701793670654} -08/30/2021 20:28:37 - INFO - __main__ - Step 40466: {'lr': 0.00042119479455828153, 'samples': 7769472, 'steps': 40465, 'loss/train': 1.1182299852371216} -08/30/2021 20:28:37 - INFO - __main__ - Step 40467: {'lr': 0.00042119092722644, 'samples': 7769664, 'steps': 40466, 'loss/train': 1.1801046133041382} -08/30/2021 20:28:39 - INFO - __main__ - Step 40468: {'lr': 0.0004211870598174624, 'samples': 7769856, 'steps': 40467, 'loss/train': 1.793915867805481} -08/30/2021 20:28:40 - INFO - __main__ - Step 40469: {'lr': 0.0004211831923313506, 'samples': 7770048, 'steps': 40468, 'loss/train': 0.9394699931144714} -08/30/2021 20:28:40 - INFO - __main__ - Step 40470: {'lr': 0.0004211793247681064, 'samples': 7770240, 'steps': 40469, 'loss/train': 1.645469307899475} -08/30/2021 20:28:40 - INFO - __main__ - Step 40471: {'lr': 0.0004211754571277313, 'samples': 7770432, 'steps': 40470, 'loss/train': 1.4317232370376587} -08/30/2021 20:28:41 - INFO - __main__ - Step 40472: {'lr': 0.0004211715894102272, 'samples': 7770624, 'steps': 40471, 'loss/train': 2.090947389602661} -08/30/2021 20:28:42 - INFO - __main__ - Step 40473: {'lr': 0.00042116772161559585, 'samples': 7770816, 'steps': 40472, 'loss/train': 1.602316975593567} -08/30/2021 20:28:43 - INFO - __main__ - Step 40474: {'lr': 0.0004211638537438389, 'samples': 7771008, 'steps': 40473, 'loss/train': 1.196723461151123} -08/30/2021 20:28:43 - INFO - __main__ - Step 40475: {'lr': 0.0004211599857949583, 'samples': 7771200, 'steps': 40474, 'loss/train': 1.0629518032073975} -08/30/2021 20:28:44 - INFO - __main__ - Step 40476: {'lr': 0.00042115611776895556, 'samples': 7771392, 'steps': 40475, 'loss/train': 1.3481874465942383} -08/30/2021 20:28:44 - INFO - __main__ - Step 40477: {'lr': 0.00042115224966583255, 'samples': 7771584, 'steps': 40476, 'loss/train': 1.5721675157546997} -08/30/2021 20:28:44 - INFO - __main__ - Step 40478: {'lr': 0.00042114838148559093, 'samples': 7771776, 'steps': 40477, 'loss/train': 1.6162680387496948} -08/30/2021 20:28:46 - INFO - __main__ - Step 40479: {'lr': 0.0004211445132282325, 'samples': 7771968, 'steps': 40478, 'loss/train': 2.3836116790771484} -08/30/2021 20:28:46 - INFO - __main__ - Step 40480: {'lr': 0.000421140644893759, 'samples': 7772160, 'steps': 40479, 'loss/train': 0.700352132320404} -08/30/2021 20:28:47 - INFO - __main__ - Step 40481: {'lr': 0.0004211367764821722, 'samples': 7772352, 'steps': 40480, 'loss/train': 1.353203296661377} -08/30/2021 20:28:47 - INFO - __main__ - Step 40482: {'lr': 0.00042113290799347376, 'samples': 7772544, 'steps': 40481, 'loss/train': 1.2763320207595825} -08/30/2021 20:28:47 - INFO - __main__ - Step 40483: {'lr': 0.00042112903942766546, 'samples': 7772736, 'steps': 40482, 'loss/train': 1.6155753135681152} -08/30/2021 20:28:49 - INFO - __main__ - Step 40484: {'lr': 0.00042112517078474914, 'samples': 7772928, 'steps': 40483, 'loss/train': 1.287023901939392} -08/30/2021 20:28:49 - INFO - __main__ - Step 40485: {'lr': 0.0004211213020647264, 'samples': 7773120, 'steps': 40484, 'loss/train': 0.597719132900238} -08/30/2021 20:28:50 - INFO - __main__ - Step 40486: {'lr': 0.00042111743326759903, 'samples': 7773312, 'steps': 40485, 'loss/train': 1.7989550828933716} -08/30/2021 20:28:50 - INFO - __main__ - Step 40487: {'lr': 0.00042111356439336877, 'samples': 7773504, 'steps': 40486, 'loss/train': 1.4463798999786377} -08/30/2021 20:28:50 - INFO - __main__ - Step 40488: {'lr': 0.0004211096954420375, 'samples': 7773696, 'steps': 40487, 'loss/train': 1.395016074180603} -08/30/2021 20:28:52 - INFO - __main__ - Step 40489: {'lr': 0.0004211058264136067, 'samples': 7773888, 'steps': 40488, 'loss/train': 1.35060715675354} -08/30/2021 20:28:52 - INFO - __main__ - Step 40490: {'lr': 0.0004211019573080783, 'samples': 7774080, 'steps': 40489, 'loss/train': 1.1428407430648804} -08/30/2021 20:28:53 - INFO - __main__ - Step 40491: {'lr': 0.00042109808812545405, 'samples': 7774272, 'steps': 40490, 'loss/train': 1.4952999353408813} -08/30/2021 20:28:53 - INFO - __main__ - Step 40492: {'lr': 0.0004210942188657356, 'samples': 7774464, 'steps': 40491, 'loss/train': 0.39101436734199524} -08/30/2021 20:28:53 - INFO - __main__ - Step 40493: {'lr': 0.00042109034952892473, 'samples': 7774656, 'steps': 40492, 'loss/train': 0.9900166988372803} -08/30/2021 20:28:55 - INFO - __main__ - Step 40494: {'lr': 0.00042108648011502314, 'samples': 7774848, 'steps': 40493, 'loss/train': 1.4828351736068726} -08/30/2021 20:28:55 - INFO - __main__ - Step 40495: {'lr': 0.00042108261062403276, 'samples': 7775040, 'steps': 40494, 'loss/train': 1.9816858768463135} -08/30/2021 20:28:55 - INFO - __main__ - Step 40496: {'lr': 0.00042107874105595507, 'samples': 7775232, 'steps': 40495, 'loss/train': 1.195799469947815} -08/30/2021 20:28:56 - INFO - __main__ - Step 40497: {'lr': 0.00042107487141079206, 'samples': 7775424, 'steps': 40496, 'loss/train': 0.9438231587409973} -08/30/2021 20:28:56 - INFO - __main__ - Step 40498: {'lr': 0.00042107100168854516, 'samples': 7775616, 'steps': 40497, 'loss/train': 1.4688013792037964} -08/30/2021 20:28:57 - INFO - __main__ - Step 40499: {'lr': 0.00042106713188921647, 'samples': 7775808, 'steps': 40498, 'loss/train': 1.4553735256195068} -08/30/2021 20:28:59 - INFO - __main__ - Step 40500: {'lr': 0.00042106326201280756, 'samples': 7776000, 'steps': 40499, 'loss/train': 0.4389041066169739} -08/30/2021 20:28:59 - INFO - __main__ - Step 40501: {'lr': 0.0004210593920593201, 'samples': 7776192, 'steps': 40500, 'loss/train': 1.2959622144699097} -08/30/2021 20:29:00 - INFO - __main__ - Step 40502: {'lr': 0.000421055522028756, 'samples': 7776384, 'steps': 40501, 'loss/train': 1.405869960784912} -08/30/2021 20:29:00 - INFO - __main__ - Step 40503: {'lr': 0.00042105165192111684, 'samples': 7776576, 'steps': 40502, 'loss/train': 1.3999860286712646} -08/30/2021 20:29:01 - INFO - __main__ - Step 40504: {'lr': 0.00042104778173640453, 'samples': 7776768, 'steps': 40503, 'loss/train': 1.0617791414260864} -08/30/2021 20:29:01 - INFO - __main__ - Step 40505: {'lr': 0.0004210439114746206, 'samples': 7776960, 'steps': 40504, 'loss/train': 0.5073390007019043} -08/30/2021 20:29:01 - INFO - __main__ - Step 40506: {'lr': 0.00042104004113576707, 'samples': 7777152, 'steps': 40505, 'loss/train': 0.43421733379364014} -08/30/2021 20:29:03 - INFO - __main__ - Step 40507: {'lr': 0.00042103617071984544, 'samples': 7777344, 'steps': 40506, 'loss/train': 0.43527668714523315} -08/30/2021 20:29:03 - INFO - __main__ - Step 40508: {'lr': 0.00042103230022685765, 'samples': 7777536, 'steps': 40507, 'loss/train': 1.2526508569717407} -08/30/2021 20:29:04 - INFO - __main__ - Step 40509: {'lr': 0.0004210284296568052, 'samples': 7777728, 'steps': 40508, 'loss/train': 1.5543291568756104} -08/30/2021 20:29:04 - INFO - __main__ - Step 40510: {'lr': 0.0004210245590096901, 'samples': 7777920, 'steps': 40509, 'loss/train': 1.6170828342437744} -08/30/2021 20:29:04 - INFO - __main__ - Step 40511: {'lr': 0.000421020688285514, 'samples': 7778112, 'steps': 40510, 'loss/train': 1.6495461463928223} -08/30/2021 20:29:06 - INFO - __main__ - Step 40512: {'lr': 0.0004210168174842785, 'samples': 7778304, 'steps': 40511, 'loss/train': 1.6361174583435059} -08/30/2021 20:29:06 - INFO - __main__ - Step 40513: {'lr': 0.00042101294660598556, 'samples': 7778496, 'steps': 40512, 'loss/train': 1.4974020719528198} -08/30/2021 20:29:07 - INFO - __main__ - Step 40514: {'lr': 0.0004210090756506367, 'samples': 7778688, 'steps': 40513, 'loss/train': 1.6260173320770264} -08/30/2021 20:29:07 - INFO - __main__ - Step 40515: {'lr': 0.0004210052046182339, 'samples': 7778880, 'steps': 40514, 'loss/train': 1.3380181789398193} -08/30/2021 20:29:07 - INFO - __main__ - Step 40516: {'lr': 0.0004210013335087787, 'samples': 7779072, 'steps': 40515, 'loss/train': 1.1280826330184937} -08/30/2021 20:29:09 - INFO - __main__ - Step 40517: {'lr': 0.000420997462322273, 'samples': 7779264, 'steps': 40516, 'loss/train': 1.1551539897918701} -08/30/2021 20:29:10 - INFO - __main__ - Step 40518: {'lr': 0.00042099359105871856, 'samples': 7779456, 'steps': 40517, 'loss/train': 2.428903341293335} -08/30/2021 20:29:10 - INFO - __main__ - Step 40519: {'lr': 0.00042098971971811695, 'samples': 7779648, 'steps': 40518, 'loss/train': 0.9138599634170532} -08/30/2021 20:29:10 - INFO - __main__ - Step 40520: {'lr': 0.00042098584830047004, 'samples': 7779840, 'steps': 40519, 'loss/train': 1.2494220733642578} -08/30/2021 20:29:11 - INFO - __main__ - Step 40521: {'lr': 0.00042098197680577956, 'samples': 7780032, 'steps': 40520, 'loss/train': 1.0672250986099243} -08/30/2021 20:29:13 - INFO - __main__ - Step 40522: {'lr': 0.00042097810523404714, 'samples': 7780224, 'steps': 40521, 'loss/train': 1.3310288190841675} -08/30/2021 20:29:13 - INFO - __main__ - Step 40523: {'lr': 0.0004209742335852747, 'samples': 7780416, 'steps': 40522, 'loss/train': 1.6031845808029175} -08/30/2021 20:29:14 - INFO - __main__ - Step 40524: {'lr': 0.0004209703618594639, 'samples': 7780608, 'steps': 40523, 'loss/train': 1.6723653078079224} -08/30/2021 20:29:14 - INFO - __main__ - Step 40525: {'lr': 0.00042096649005661654, 'samples': 7780800, 'steps': 40524, 'loss/train': 1.7833189964294434} -08/30/2021 20:29:14 - INFO - __main__ - Step 40526: {'lr': 0.00042096261817673423, 'samples': 7780992, 'steps': 40525, 'loss/train': 1.3080673217773438} -08/30/2021 20:29:16 - INFO - __main__ - Step 40527: {'lr': 0.0004209587462198189, 'samples': 7781184, 'steps': 40526, 'loss/train': 1.0665901899337769} -08/30/2021 20:29:16 - INFO - __main__ - Step 40528: {'lr': 0.0004209548741858721, 'samples': 7781376, 'steps': 40527, 'loss/train': 1.4239306449890137} -08/30/2021 20:29:17 - INFO - __main__ - Step 40529: {'lr': 0.00042095100207489573, 'samples': 7781568, 'steps': 40528, 'loss/train': 1.3944056034088135} -08/30/2021 20:29:17 - INFO - __main__ - Step 40530: {'lr': 0.0004209471298868914, 'samples': 7781760, 'steps': 40529, 'loss/train': 1.9133447408676147} -08/30/2021 20:29:17 - INFO - __main__ - Step 40531: {'lr': 0.00042094325762186103, 'samples': 7781952, 'steps': 40530, 'loss/train': 2.0818612575531006} -08/30/2021 20:29:18 - INFO - __main__ - Step 40532: {'lr': 0.0004209393852798062, 'samples': 7782144, 'steps': 40531, 'loss/train': 1.2844743728637695} -08/30/2021 20:29:19 - INFO - __main__ - Step 40533: {'lr': 0.00042093551286072887, 'samples': 7782336, 'steps': 40532, 'loss/train': 1.804255723953247} -08/30/2021 20:29:20 - INFO - __main__ - Step 40534: {'lr': 0.00042093164036463045, 'samples': 7782528, 'steps': 40533, 'loss/train': 1.6033272743225098} -08/30/2021 20:29:20 - INFO - __main__ - Step 40535: {'lr': 0.0004209277677915129, 'samples': 7782720, 'steps': 40534, 'loss/train': 0.6958231329917908} -08/30/2021 20:29:21 - INFO - __main__ - Step 40536: {'lr': 0.000420923895141378, 'samples': 7782912, 'steps': 40535, 'loss/train': 1.510439157485962} -08/30/2021 20:29:21 - INFO - __main__ - Step 40537: {'lr': 0.0004209200224142274, 'samples': 7783104, 'steps': 40536, 'loss/train': 1.6485573053359985} -08/30/2021 20:29:22 - INFO - __main__ - Step 40538: {'lr': 0.0004209161496100629, 'samples': 7783296, 'steps': 40537, 'loss/train': 1.9332777261734009} -08/30/2021 20:29:23 - INFO - __main__ - Step 40539: {'lr': 0.00042091227672888624, 'samples': 7783488, 'steps': 40538, 'loss/train': 1.284566879272461} -08/30/2021 20:29:23 - INFO - __main__ - Step 40540: {'lr': 0.00042090840377069906, 'samples': 7783680, 'steps': 40539, 'loss/train': 1.3033260107040405} -08/30/2021 20:29:24 - INFO - __main__ - Step 40541: {'lr': 0.00042090453073550323, 'samples': 7783872, 'steps': 40540, 'loss/train': 1.5416302680969238} -08/30/2021 20:29:24 - INFO - __main__ - Step 40542: {'lr': 0.0004209006576233004, 'samples': 7784064, 'steps': 40541, 'loss/train': 1.5478184223175049} -08/30/2021 20:29:26 - INFO - __main__ - Step 40543: {'lr': 0.0004208967844340925, 'samples': 7784256, 'steps': 40542, 'loss/train': 1.293800950050354} -08/30/2021 20:29:26 - INFO - __main__ - Step 40544: {'lr': 0.0004208929111678811, 'samples': 7784448, 'steps': 40543, 'loss/train': 1.3689665794372559} -08/30/2021 20:29:26 - INFO - __main__ - Step 40545: {'lr': 0.0004208890378246679, 'samples': 7784640, 'steps': 40544, 'loss/train': 0.8256595134735107} -08/30/2021 20:29:27 - INFO - __main__ - Step 40546: {'lr': 0.00042088516440445486, 'samples': 7784832, 'steps': 40545, 'loss/train': 1.716766357421875} -08/30/2021 20:29:27 - INFO - __main__ - Step 40547: {'lr': 0.0004208812909072435, 'samples': 7785024, 'steps': 40546, 'loss/train': 1.1976085901260376} -08/30/2021 20:29:28 - INFO - __main__ - Step 40548: {'lr': 0.00042087741733303575, 'samples': 7785216, 'steps': 40547, 'loss/train': 1.2565360069274902} -08/30/2021 20:29:29 - INFO - __main__ - Step 40549: {'lr': 0.00042087354368183316, 'samples': 7785408, 'steps': 40548, 'loss/train': 1.0759553909301758} -08/30/2021 20:29:29 - INFO - __main__ - Step 40550: {'lr': 0.00042086966995363774, 'samples': 7785600, 'steps': 40549, 'loss/train': 1.431450366973877} -08/30/2021 20:29:30 - INFO - __main__ - Step 40551: {'lr': 0.000420865796148451, 'samples': 7785792, 'steps': 40550, 'loss/train': 1.3393325805664062} -08/30/2021 20:29:30 - INFO - __main__ - Step 40552: {'lr': 0.00042086192226627476, 'samples': 7785984, 'steps': 40551, 'loss/train': 1.5410536527633667} -08/30/2021 20:29:31 - INFO - __main__ - Step 40553: {'lr': 0.00042085804830711084, 'samples': 7786176, 'steps': 40552, 'loss/train': 1.4146901369094849} -08/30/2021 20:29:32 - INFO - __main__ - Step 40554: {'lr': 0.00042085417427096085, 'samples': 7786368, 'steps': 40553, 'loss/train': 0.5668691396713257} -08/30/2021 20:29:32 - INFO - __main__ - Step 40555: {'lr': 0.0004208503001578266, 'samples': 7786560, 'steps': 40554, 'loss/train': 1.485809087753296} -08/30/2021 20:29:33 - INFO - __main__ - Step 40556: {'lr': 0.00042084642596770984, 'samples': 7786752, 'steps': 40555, 'loss/train': 0.9962664246559143} -08/30/2021 20:29:33 - INFO - __main__ - Step 40557: {'lr': 0.0004208425517006124, 'samples': 7786944, 'steps': 40556, 'loss/train': 1.43374502658844} -08/30/2021 20:29:35 - INFO - __main__ - Step 40558: {'lr': 0.0004208386773565359, 'samples': 7787136, 'steps': 40557, 'loss/train': 1.6456314325332642} -08/30/2021 20:29:35 - INFO - __main__ - Step 40559: {'lr': 0.0004208348029354821, 'samples': 7787328, 'steps': 40558, 'loss/train': 1.6254279613494873} -08/30/2021 20:29:35 - INFO - __main__ - Step 40560: {'lr': 0.00042083092843745275, 'samples': 7787520, 'steps': 40559, 'loss/train': 1.1712114810943604} -08/30/2021 20:29:36 - INFO - __main__ - Step 40561: {'lr': 0.0004208270538624497, 'samples': 7787712, 'steps': 40560, 'loss/train': 1.325748085975647} -08/30/2021 20:29:36 - INFO - __main__ - Step 40562: {'lr': 0.00042082317921047455, 'samples': 7787904, 'steps': 40561, 'loss/train': 0.9385061264038086} -08/30/2021 20:29:37 - INFO - __main__ - Step 40563: {'lr': 0.0004208193044815291, 'samples': 7788096, 'steps': 40562, 'loss/train': 1.8918570280075073} -08/30/2021 20:29:38 - INFO - __main__ - Step 40564: {'lr': 0.0004208154296756152, 'samples': 7788288, 'steps': 40563, 'loss/train': 1.2039144039154053} -08/30/2021 20:29:38 - INFO - __main__ - Step 40565: {'lr': 0.0004208115547927345, 'samples': 7788480, 'steps': 40564, 'loss/train': 1.1967377662658691} -08/30/2021 20:29:39 - INFO - __main__ - Step 40566: {'lr': 0.0004208076798328886, 'samples': 7788672, 'steps': 40565, 'loss/train': 1.9980802536010742} -08/30/2021 20:29:39 - INFO - __main__ - Step 40567: {'lr': 0.00042080380479607947, 'samples': 7788864, 'steps': 40566, 'loss/train': 1.5531868934631348} -08/30/2021 20:29:40 - INFO - __main__ - Step 40568: {'lr': 0.00042079992968230886, 'samples': 7789056, 'steps': 40567, 'loss/train': 1.3410086631774902} -08/30/2021 20:29:41 - INFO - __main__ - Step 40569: {'lr': 0.0004207960544915784, 'samples': 7789248, 'steps': 40568, 'loss/train': 1.0361840724945068} -08/30/2021 20:29:41 - INFO - __main__ - Step 40570: {'lr': 0.0004207921792238898, 'samples': 7789440, 'steps': 40569, 'loss/train': 1.177603840827942} -08/30/2021 20:29:42 - INFO - __main__ - Step 40571: {'lr': 0.0004207883038792449, 'samples': 7789632, 'steps': 40570, 'loss/train': 1.1117411851882935} -08/30/2021 20:29:42 - INFO - __main__ - Step 40572: {'lr': 0.0004207844284576455, 'samples': 7789824, 'steps': 40571, 'loss/train': 1.6639740467071533} -08/30/2021 20:29:44 - INFO - __main__ - Step 40573: {'lr': 0.0004207805529590932, 'samples': 7790016, 'steps': 40572, 'loss/train': 1.3262563943862915} -08/30/2021 20:29:44 - INFO - __main__ - Step 40574: {'lr': 0.0004207766773835899, 'samples': 7790208, 'steps': 40573, 'loss/train': 0.8548374176025391} -08/30/2021 20:29:45 - INFO - __main__ - Step 40575: {'lr': 0.0004207728017311372, 'samples': 7790400, 'steps': 40574, 'loss/train': 1.327256679534912} -08/30/2021 20:29:45 - INFO - __main__ - Step 40576: {'lr': 0.0004207689260017369, 'samples': 7790592, 'steps': 40575, 'loss/train': 1.304694652557373} -08/30/2021 20:29:46 - INFO - __main__ - Step 40577: {'lr': 0.0004207650501953908, 'samples': 7790784, 'steps': 40576, 'loss/train': 1.0193008184432983} -08/30/2021 20:29:47 - INFO - __main__ - Step 40578: {'lr': 0.0004207611743121006, 'samples': 7790976, 'steps': 40577, 'loss/train': 1.682633876800537} -08/30/2021 20:29:48 - INFO - __main__ - Step 40579: {'lr': 0.00042075729835186807, 'samples': 7791168, 'steps': 40578, 'loss/train': 1.562943458557129} -08/30/2021 20:29:48 - INFO - __main__ - Step 40580: {'lr': 0.0004207534223146948, 'samples': 7791360, 'steps': 40579, 'loss/train': 1.6095415353775024} -08/30/2021 20:29:48 - INFO - __main__ - Step 40581: {'lr': 0.0004207495462005828, 'samples': 7791552, 'steps': 40580, 'loss/train': 1.4702998399734497} -08/30/2021 20:29:49 - INFO - __main__ - Step 40582: {'lr': 0.0004207456700095337, 'samples': 7791744, 'steps': 40581, 'loss/train': 0.8661431074142456} -08/30/2021 20:29:50 - INFO - __main__ - Step 40583: {'lr': 0.0004207417937415492, 'samples': 7791936, 'steps': 40582, 'loss/train': 1.81490957736969} -08/30/2021 20:29:51 - INFO - __main__ - Step 40584: {'lr': 0.000420737917396631, 'samples': 7792128, 'steps': 40583, 'loss/train': 1.5431385040283203} -08/30/2021 20:29:51 - INFO - __main__ - Step 40585: {'lr': 0.00042073404097478105, 'samples': 7792320, 'steps': 40584, 'loss/train': 1.380693793296814} -08/30/2021 20:29:51 - INFO - __main__ - Step 40586: {'lr': 0.000420730164476001, 'samples': 7792512, 'steps': 40585, 'loss/train': 1.7884832620620728} -08/30/2021 20:29:52 - INFO - __main__ - Step 40587: {'lr': 0.00042072628790029243, 'samples': 7792704, 'steps': 40586, 'loss/train': 1.7218916416168213} -08/30/2021 20:29:52 - INFO - __main__ - Step 40588: {'lr': 0.0004207224112476573, 'samples': 7792896, 'steps': 40587, 'loss/train': 1.5347225666046143} -08/30/2021 20:29:53 - INFO - __main__ - Step 40589: {'lr': 0.0004207185345180973, 'samples': 7793088, 'steps': 40588, 'loss/train': 1.5618696212768555} -08/30/2021 20:29:54 - INFO - __main__ - Step 40590: {'lr': 0.00042071465771161416, 'samples': 7793280, 'steps': 40589, 'loss/train': 2.105295419692993} -08/30/2021 20:29:54 - INFO - __main__ - Step 40591: {'lr': 0.0004207107808282097, 'samples': 7793472, 'steps': 40590, 'loss/train': 1.6732038259506226} -08/30/2021 20:29:54 - INFO - __main__ - Step 40592: {'lr': 0.00042070690386788545, 'samples': 7793664, 'steps': 40591, 'loss/train': 1.551571011543274} -08/30/2021 20:29:55 - INFO - __main__ - Step 40593: {'lr': 0.0004207030268306434, 'samples': 7793856, 'steps': 40592, 'loss/train': 1.283904790878296} -08/30/2021 20:29:56 - INFO - __main__ - Step 40594: {'lr': 0.00042069914971648516, 'samples': 7794048, 'steps': 40593, 'loss/train': 1.5216953754425049} -08/30/2021 20:29:57 - INFO - __main__ - Step 40595: {'lr': 0.0004206952725254125, 'samples': 7794240, 'steps': 40594, 'loss/train': 1.1923627853393555} -08/30/2021 20:29:57 - INFO - __main__ - Step 40596: {'lr': 0.00042069139525742727, 'samples': 7794432, 'steps': 40595, 'loss/train': 0.9968594908714294} -08/30/2021 20:29:57 - INFO - __main__ - Step 40597: {'lr': 0.000420687517912531, 'samples': 7794624, 'steps': 40596, 'loss/train': 1.4605414867401123} -08/30/2021 20:29:58 - INFO - __main__ - Step 40598: {'lr': 0.0004206836404907257, 'samples': 7794816, 'steps': 40597, 'loss/train': 0.6130566000938416} -08/30/2021 20:29:59 - INFO - __main__ - Step 40599: {'lr': 0.0004206797629920129, 'samples': 7795008, 'steps': 40598, 'loss/train': 1.4869836568832397} -08/30/2021 20:30:00 - INFO - __main__ - Step 40600: {'lr': 0.0004206758854163945, 'samples': 7795200, 'steps': 40599, 'loss/train': 1.494636058807373} -08/30/2021 20:30:00 - INFO - __main__ - Step 40601: {'lr': 0.00042067200776387215, 'samples': 7795392, 'steps': 40600, 'loss/train': 1.434457540512085} -08/30/2021 20:30:00 - INFO - __main__ - Step 40602: {'lr': 0.0004206681300344476, 'samples': 7795584, 'steps': 40601, 'loss/train': 1.4297521114349365} -08/30/2021 20:30:01 - INFO - __main__ - Step 40603: {'lr': 0.0004206642522281227, 'samples': 7795776, 'steps': 40602, 'loss/train': 1.6480880975723267} -08/30/2021 20:30:02 - INFO - __main__ - Step 40604: {'lr': 0.000420660374344899, 'samples': 7795968, 'steps': 40603, 'loss/train': 0.9270496964454651} -08/30/2021 20:30:03 - INFO - __main__ - Step 40605: {'lr': 0.00042065649638477843, 'samples': 7796160, 'steps': 40604, 'loss/train': 1.1310598850250244} -08/30/2021 20:30:03 - INFO - __main__ - Step 40606: {'lr': 0.0004206526183477627, 'samples': 7796352, 'steps': 40605, 'loss/train': 1.1386243104934692} -08/30/2021 20:30:03 - INFO - __main__ - Step 40607: {'lr': 0.0004206487402338535, 'samples': 7796544, 'steps': 40606, 'loss/train': 0.95960533618927} -08/30/2021 20:30:04 - INFO - __main__ - Step 40608: {'lr': 0.00042064486204305263, 'samples': 7796736, 'steps': 40607, 'loss/train': 1.4682912826538086} -08/30/2021 20:30:05 - INFO - __main__ - Step 40609: {'lr': 0.0004206409837753618, 'samples': 7796928, 'steps': 40608, 'loss/train': 1.5144367218017578} -08/30/2021 20:30:06 - INFO - __main__ - Step 40610: {'lr': 0.00042063710543078283, 'samples': 7797120, 'steps': 40609, 'loss/train': 1.1375278234481812} -08/30/2021 20:30:06 - INFO - __main__ - Step 40611: {'lr': 0.00042063322700931733, 'samples': 7797312, 'steps': 40610, 'loss/train': 1.7519469261169434} -08/30/2021 20:30:07 - INFO - __main__ - Step 40612: {'lr': 0.0004206293485109672, 'samples': 7797504, 'steps': 40611, 'loss/train': 1.4417210817337036} -08/30/2021 20:30:07 - INFO - __main__ - Step 40613: {'lr': 0.0004206254699357341, 'samples': 7797696, 'steps': 40612, 'loss/train': 1.1510708332061768} -08/30/2021 20:30:07 - INFO - __main__ - Step 40614: {'lr': 0.00042062159128361976, 'samples': 7797888, 'steps': 40613, 'loss/train': 0.03064132109284401} -08/30/2021 20:30:09 - INFO - __main__ - Step 40615: {'lr': 0.000420617712554626, 'samples': 7798080, 'steps': 40614, 'loss/train': 1.5406118631362915} -08/30/2021 20:30:09 - INFO - __main__ - Step 40616: {'lr': 0.0004206138337487545, 'samples': 7798272, 'steps': 40615, 'loss/train': 1.668717622756958} -08/30/2021 20:30:10 - INFO - __main__ - Step 40617: {'lr': 0.0004206099548660071, 'samples': 7798464, 'steps': 40616, 'loss/train': 1.5844056606292725} -08/30/2021 20:30:10 - INFO - __main__ - Step 40618: {'lr': 0.00042060607590638547, 'samples': 7798656, 'steps': 40617, 'loss/train': 1.5757007598876953} -08/30/2021 20:30:10 - INFO - __main__ - Step 40619: {'lr': 0.00042060219686989133, 'samples': 7798848, 'steps': 40618, 'loss/train': 1.5157809257507324} -08/30/2021 20:30:12 - INFO - __main__ - Step 40620: {'lr': 0.00042059831775652644, 'samples': 7799040, 'steps': 40619, 'loss/train': 1.8588722944259644} -08/30/2021 20:30:12 - INFO - __main__ - Step 40621: {'lr': 0.00042059443856629265, 'samples': 7799232, 'steps': 40620, 'loss/train': 0.05576677620410919} -08/30/2021 20:30:13 - INFO - __main__ - Step 40622: {'lr': 0.00042059055929919163, 'samples': 7799424, 'steps': 40621, 'loss/train': 2.0204005241394043} -08/30/2021 20:30:13 - INFO - __main__ - Step 40623: {'lr': 0.00042058667995522513, 'samples': 7799616, 'steps': 40622, 'loss/train': 0.38546594977378845} -08/30/2021 20:30:13 - INFO - __main__ - Step 40624: {'lr': 0.0004205828005343949, 'samples': 7799808, 'steps': 40623, 'loss/train': 1.2320804595947266} -08/30/2021 20:30:14 - INFO - __main__ - Step 40625: {'lr': 0.00042057892103670275, 'samples': 7800000, 'steps': 40624, 'loss/train': 1.3380446434020996} -08/30/2021 20:30:16 - INFO - __main__ - Step 40626: {'lr': 0.0004205750414621503, 'samples': 7800192, 'steps': 40625, 'loss/train': 1.481024146080017} -08/30/2021 20:30:16 - INFO - __main__ - Step 40627: {'lr': 0.0004205711618107394, 'samples': 7800384, 'steps': 40626, 'loss/train': 1.230425238609314} -08/30/2021 20:30:17 - INFO - __main__ - Step 40628: {'lr': 0.00042056728208247175, 'samples': 7800576, 'steps': 40627, 'loss/train': 0.9796714782714844} -08/30/2021 20:30:17 - INFO - __main__ - Step 40629: {'lr': 0.0004205634022773491, 'samples': 7800768, 'steps': 40628, 'loss/train': 1.3274792432785034} -08/30/2021 20:30:17 - INFO - __main__ - Step 40630: {'lr': 0.0004205595223953732, 'samples': 7800960, 'steps': 40629, 'loss/train': 1.756373405456543} -08/30/2021 20:30:19 - INFO - __main__ - Step 40631: {'lr': 0.0004205556424365459, 'samples': 7801152, 'steps': 40630, 'loss/train': 0.5165131092071533} -08/30/2021 20:30:19 - INFO - __main__ - Step 40632: {'lr': 0.0004205517624008688, 'samples': 7801344, 'steps': 40631, 'loss/train': 1.3324552774429321} -08/30/2021 20:30:20 - INFO - __main__ - Step 40633: {'lr': 0.00042054788228834374, 'samples': 7801536, 'steps': 40632, 'loss/train': 1.2723091840744019} -08/30/2021 20:30:20 - INFO - __main__ - Step 40634: {'lr': 0.0004205440020989724, 'samples': 7801728, 'steps': 40633, 'loss/train': 1.8608767986297607} -08/30/2021 20:30:20 - INFO - __main__ - Step 40635: {'lr': 0.0004205401218327565, 'samples': 7801920, 'steps': 40634, 'loss/train': 0.1952928751707077} -08/30/2021 20:30:22 - INFO - __main__ - Step 40636: {'lr': 0.0004205362414896979, 'samples': 7802112, 'steps': 40635, 'loss/train': 1.4910147190093994} -08/30/2021 20:30:22 - INFO - __main__ - Step 40637: {'lr': 0.0004205323610697984, 'samples': 7802304, 'steps': 40636, 'loss/train': 1.6579813957214355} -08/30/2021 20:30:23 - INFO - __main__ - Step 40638: {'lr': 0.0004205284805730596, 'samples': 7802496, 'steps': 40637, 'loss/train': 1.6472336053848267} -08/30/2021 20:30:23 - INFO - __main__ - Step 40639: {'lr': 0.00042052459999948323, 'samples': 7802688, 'steps': 40638, 'loss/train': 1.7449266910552979} -08/30/2021 20:30:23 - INFO - __main__ - Step 40640: {'lr': 0.00042052071934907116, 'samples': 7802880, 'steps': 40639, 'loss/train': 1.3850665092468262} -08/30/2021 20:30:25 - INFO - __main__ - Step 40641: {'lr': 0.00042051683862182504, 'samples': 7803072, 'steps': 40640, 'loss/train': 1.5129368305206299} -08/30/2021 20:30:25 - INFO - __main__ - Step 40642: {'lr': 0.0004205129578177467, 'samples': 7803264, 'steps': 40641, 'loss/train': 1.6151237487792969} -08/30/2021 20:30:26 - INFO - __main__ - Step 40643: {'lr': 0.0004205090769368379, 'samples': 7803456, 'steps': 40642, 'loss/train': 1.2536816596984863} -08/30/2021 20:30:26 - INFO - __main__ - Step 40644: {'lr': 0.00042050519597910024, 'samples': 7803648, 'steps': 40643, 'loss/train': 1.6010931730270386} -08/30/2021 20:30:26 - INFO - __main__ - Step 40645: {'lr': 0.00042050131494453567, 'samples': 7803840, 'steps': 40644, 'loss/train': 1.305932641029358} -08/30/2021 20:30:28 - INFO - __main__ - Step 40646: {'lr': 0.00042049743383314577, 'samples': 7804032, 'steps': 40645, 'loss/train': 1.2957103252410889} -08/30/2021 20:30:28 - INFO - __main__ - Step 40647: {'lr': 0.0004204935526449324, 'samples': 7804224, 'steps': 40646, 'loss/train': 1.4285246133804321} -08/30/2021 20:30:28 - INFO - __main__ - Step 40648: {'lr': 0.0004204896713798972, 'samples': 7804416, 'steps': 40647, 'loss/train': 1.6725188493728638} -08/30/2021 20:30:29 - INFO - __main__ - Step 40649: {'lr': 0.00042048579003804205, 'samples': 7804608, 'steps': 40648, 'loss/train': 1.425777792930603} -08/30/2021 20:30:29 - INFO - __main__ - Step 40650: {'lr': 0.00042048190861936866, 'samples': 7804800, 'steps': 40649, 'loss/train': 1.3483316898345947} -08/30/2021 20:30:29 - INFO - __main__ - Step 40651: {'lr': 0.0004204780271238786, 'samples': 7804992, 'steps': 40650, 'loss/train': 1.0939075946807861} -08/30/2021 20:30:31 - INFO - __main__ - Step 40652: {'lr': 0.00042047414555157394, 'samples': 7805184, 'steps': 40651, 'loss/train': 1.7882989645004272} -08/30/2021 20:30:31 - INFO - __main__ - Step 40653: {'lr': 0.0004204702639024562, 'samples': 7805376, 'steps': 40652, 'loss/train': 1.6279653310775757} -08/30/2021 20:30:32 - INFO - __main__ - Step 40654: {'lr': 0.00042046638217652717, 'samples': 7805568, 'steps': 40653, 'loss/train': 1.6124012470245361} -08/30/2021 20:30:32 - INFO - __main__ - Step 40655: {'lr': 0.00042046250037378865, 'samples': 7805760, 'steps': 40654, 'loss/train': 2.157416820526123} -08/30/2021 20:30:33 - INFO - __main__ - Step 40656: {'lr': 0.0004204586184942423, 'samples': 7805952, 'steps': 40655, 'loss/train': 1.045082926750183} -08/30/2021 20:30:34 - INFO - __main__ - Step 40657: {'lr': 0.00042045473653789004, 'samples': 7806144, 'steps': 40656, 'loss/train': 0.9390610456466675} -08/30/2021 20:30:34 - INFO - __main__ - Step 40658: {'lr': 0.00042045085450473336, 'samples': 7806336, 'steps': 40657, 'loss/train': 0.6429643630981445} -08/30/2021 20:30:35 - INFO - __main__ - Step 40659: {'lr': 0.00042044697239477423, 'samples': 7806528, 'steps': 40658, 'loss/train': 0.7809738516807556} -08/30/2021 20:30:35 - INFO - __main__ - Step 40660: {'lr': 0.00042044309020801434, 'samples': 7806720, 'steps': 40659, 'loss/train': 1.6725441217422485} -08/30/2021 20:30:35 - INFO - __main__ - Step 40661: {'lr': 0.00042043920794445543, 'samples': 7806912, 'steps': 40660, 'loss/train': 1.09107506275177} -08/30/2021 20:30:37 - INFO - __main__ - Step 40662: {'lr': 0.0004204353256040992, 'samples': 7807104, 'steps': 40661, 'loss/train': 0.2506924569606781} -08/30/2021 20:30:38 - INFO - __main__ - Step 40663: {'lr': 0.0004204314431869475, 'samples': 7807296, 'steps': 40662, 'loss/train': 1.3914165496826172} -08/30/2021 20:30:38 - INFO - __main__ - Step 40664: {'lr': 0.0004204275606930019, 'samples': 7807488, 'steps': 40663, 'loss/train': 0.08640512824058533} -08/30/2021 20:30:38 - INFO - __main__ - Step 40665: {'lr': 0.00042042367812226446, 'samples': 7807680, 'steps': 40664, 'loss/train': 1.6619248390197754} -08/30/2021 20:30:39 - INFO - __main__ - Step 40666: {'lr': 0.00042041979547473665, 'samples': 7807872, 'steps': 40665, 'loss/train': 1.1679056882858276} -08/30/2021 20:30:40 - INFO - __main__ - Step 40667: {'lr': 0.0004204159127504202, 'samples': 7808064, 'steps': 40666, 'loss/train': 1.5541876554489136} -08/30/2021 20:30:41 - INFO - __main__ - Step 40668: {'lr': 0.0004204120299493171, 'samples': 7808256, 'steps': 40667, 'loss/train': 1.4965434074401855} -08/30/2021 20:30:41 - INFO - __main__ - Step 40669: {'lr': 0.0004204081470714289, 'samples': 7808448, 'steps': 40668, 'loss/train': 2.0811808109283447} -08/30/2021 20:30:41 - INFO - __main__ - Step 40670: {'lr': 0.00042040426411675747, 'samples': 7808640, 'steps': 40669, 'loss/train': 1.2840136289596558} -08/30/2021 20:30:42 - INFO - __main__ - Step 40671: {'lr': 0.0004204003810853045, 'samples': 7808832, 'steps': 40670, 'loss/train': 1.9235584735870361} -08/30/2021 20:30:43 - INFO - __main__ - Step 40672: {'lr': 0.00042039649797707176, 'samples': 7809024, 'steps': 40671, 'loss/train': 1.5719984769821167} -08/30/2021 20:30:44 - INFO - __main__ - Step 40673: {'lr': 0.0004203926147920609, 'samples': 7809216, 'steps': 40672, 'loss/train': 1.508525013923645} -08/30/2021 20:30:44 - INFO - __main__ - Step 40674: {'lr': 0.0004203887315302739, 'samples': 7809408, 'steps': 40673, 'loss/train': 1.892645239830017} -08/30/2021 20:30:44 - INFO - __main__ - Step 40675: {'lr': 0.0004203848481917122, 'samples': 7809600, 'steps': 40674, 'loss/train': 1.736484408378601} -08/30/2021 20:30:45 - INFO - __main__ - Step 40676: {'lr': 0.00042038096477637786, 'samples': 7809792, 'steps': 40675, 'loss/train': 0.9497137069702148} -08/30/2021 20:30:46 - INFO - __main__ - Step 40677: {'lr': 0.00042037708128427243, 'samples': 7809984, 'steps': 40676, 'loss/train': 1.9614101648330688} -08/30/2021 20:30:47 - INFO - __main__ - Step 40678: {'lr': 0.00042037319771539775, 'samples': 7810176, 'steps': 40677, 'loss/train': 1.2367404699325562} -08/30/2021 20:30:47 - INFO - __main__ - Step 40679: {'lr': 0.00042036931406975547, 'samples': 7810368, 'steps': 40678, 'loss/train': 1.1385862827301025} -08/30/2021 20:30:48 - INFO - __main__ - Step 40680: {'lr': 0.0004203654303473474, 'samples': 7810560, 'steps': 40679, 'loss/train': 1.5016164779663086} -08/30/2021 20:30:48 - INFO - __main__ - Step 40681: {'lr': 0.0004203615465481754, 'samples': 7810752, 'steps': 40680, 'loss/train': 2.079608678817749} -08/30/2021 20:30:48 - INFO - __main__ - Step 40682: {'lr': 0.0004203576626722411, 'samples': 7810944, 'steps': 40681, 'loss/train': 1.6436620950698853} -08/30/2021 20:30:50 - INFO - __main__ - Step 40683: {'lr': 0.00042035377871954614, 'samples': 7811136, 'steps': 40682, 'loss/train': 1.5468770265579224} -08/30/2021 20:30:51 - INFO - __main__ - Step 40684: {'lr': 0.00042034989469009245, 'samples': 7811328, 'steps': 40683, 'loss/train': 1.3297398090362549} -08/30/2021 20:30:51 - INFO - __main__ - Step 40685: {'lr': 0.0004203460105838818, 'samples': 7811520, 'steps': 40684, 'loss/train': 1.8256430625915527} -08/30/2021 20:30:52 - INFO - __main__ - Step 40686: {'lr': 0.00042034212640091587, 'samples': 7811712, 'steps': 40685, 'loss/train': 1.199657917022705} -08/30/2021 20:30:52 - INFO - __main__ - Step 40687: {'lr': 0.00042033824214119633, 'samples': 7811904, 'steps': 40686, 'loss/train': 2.0564515590667725} -08/30/2021 20:30:53 - INFO - __main__ - Step 40688: {'lr': 0.00042033435780472494, 'samples': 7812096, 'steps': 40687, 'loss/train': 1.097558856010437} -08/30/2021 20:30:54 - INFO - __main__ - Step 40689: {'lr': 0.00042033047339150363, 'samples': 7812288, 'steps': 40688, 'loss/train': 1.2923438549041748} -08/30/2021 20:30:54 - INFO - __main__ - Step 40690: {'lr': 0.00042032658890153404, 'samples': 7812480, 'steps': 40689, 'loss/train': 1.314319372177124} -08/30/2021 20:30:55 - INFO - __main__ - Step 40691: {'lr': 0.0004203227043348179, 'samples': 7812672, 'steps': 40690, 'loss/train': 1.4398634433746338} -08/30/2021 20:30:55 - INFO - __main__ - Step 40692: {'lr': 0.000420318819691357, 'samples': 7812864, 'steps': 40691, 'loss/train': 1.1700912714004517} -08/30/2021 20:30:57 - INFO - __main__ - Step 40693: {'lr': 0.00042031493497115304, 'samples': 7813056, 'steps': 40692, 'loss/train': 1.6856290102005005} -08/30/2021 20:30:57 - INFO - __main__ - Step 40694: {'lr': 0.0004203110501742078, 'samples': 7813248, 'steps': 40693, 'loss/train': 1.530055046081543} -08/30/2021 20:30:57 - INFO - __main__ - Step 40695: {'lr': 0.00042030716530052297, 'samples': 7813440, 'steps': 40694, 'loss/train': 1.0971704721450806} -08/30/2021 20:30:58 - INFO - __main__ - Step 40696: {'lr': 0.00042030328035010047, 'samples': 7813632, 'steps': 40695, 'loss/train': 1.4052329063415527} -08/30/2021 20:30:58 - INFO - __main__ - Step 40697: {'lr': 0.0004202993953229418, 'samples': 7813824, 'steps': 40696, 'loss/train': 1.1811143159866333} -08/30/2021 20:30:58 - INFO - __main__ - Step 40698: {'lr': 0.000420295510219049, 'samples': 7814016, 'steps': 40697, 'loss/train': 1.4804872274398804} -08/30/2021 20:31:00 - INFO - __main__ - Step 40699: {'lr': 0.00042029162503842357, 'samples': 7814208, 'steps': 40698, 'loss/train': 1.4191936254501343} -08/30/2021 20:31:01 - INFO - __main__ - Step 40700: {'lr': 0.0004202877397810674, 'samples': 7814400, 'steps': 40699, 'loss/train': 1.951290249824524} -08/30/2021 20:31:01 - INFO - __main__ - Step 40701: {'lr': 0.0004202838544469822, 'samples': 7814592, 'steps': 40700, 'loss/train': 1.3045618534088135} -08/30/2021 20:31:01 - INFO - __main__ - Step 40702: {'lr': 0.00042027996903616974, 'samples': 7814784, 'steps': 40701, 'loss/train': 1.5571815967559814} -08/30/2021 20:31:02 - INFO - __main__ - Step 40703: {'lr': 0.0004202760835486317, 'samples': 7814976, 'steps': 40702, 'loss/train': 1.5170612335205078} -08/30/2021 20:31:03 - INFO - __main__ - Step 40704: {'lr': 0.00042027219798436996, 'samples': 7815168, 'steps': 40703, 'loss/train': 0.7151506543159485} -08/30/2021 20:31:04 - INFO - __main__ - Step 40705: {'lr': 0.00042026831234338614, 'samples': 7815360, 'steps': 40704, 'loss/train': 0.5749585628509521} -08/30/2021 20:31:04 - INFO - __main__ - Step 40706: {'lr': 0.0004202644266256821, 'samples': 7815552, 'steps': 40705, 'loss/train': 1.3966641426086426} -08/30/2021 20:31:04 - INFO - __main__ - Step 40707: {'lr': 0.00042026054083125943, 'samples': 7815744, 'steps': 40706, 'loss/train': 1.345969796180725} -08/30/2021 20:31:05 - INFO - __main__ - Step 40708: {'lr': 0.0004202566549601201, 'samples': 7815936, 'steps': 40707, 'loss/train': 1.4172412157058716} -08/30/2021 20:31:06 - INFO - __main__ - Step 40709: {'lr': 0.00042025276901226573, 'samples': 7816128, 'steps': 40708, 'loss/train': 1.7815989255905151} -08/30/2021 20:31:07 - INFO - __main__ - Step 40710: {'lr': 0.00042024888298769806, 'samples': 7816320, 'steps': 40709, 'loss/train': 1.5435044765472412} -08/30/2021 20:31:07 - INFO - __main__ - Step 40711: {'lr': 0.0004202449968864188, 'samples': 7816512, 'steps': 40710, 'loss/train': 1.2542626857757568} -08/30/2021 20:31:07 - INFO - __main__ - Step 40712: {'lr': 0.00042024111070842985, 'samples': 7816704, 'steps': 40711, 'loss/train': 1.5079811811447144} -08/30/2021 20:31:08 - INFO - __main__ - Step 40713: {'lr': 0.0004202372244537329, 'samples': 7816896, 'steps': 40712, 'loss/train': 1.2696741819381714} -08/30/2021 20:31:09 - INFO - __main__ - Step 40714: {'lr': 0.00042023333812232967, 'samples': 7817088, 'steps': 40713, 'loss/train': 1.3684004545211792} -08/30/2021 20:31:10 - INFO - __main__ - Step 40715: {'lr': 0.0004202294517142219, 'samples': 7817280, 'steps': 40714, 'loss/train': 1.5804187059402466} -08/30/2021 20:31:10 - INFO - __main__ - Step 40716: {'lr': 0.0004202255652294114, 'samples': 7817472, 'steps': 40715, 'loss/train': 1.6122698783874512} -08/30/2021 20:31:10 - INFO - __main__ - Step 40717: {'lr': 0.00042022167866789985, 'samples': 7817664, 'steps': 40716, 'loss/train': 1.394217610359192} -08/30/2021 20:31:11 - INFO - __main__ - Step 40718: {'lr': 0.00042021779202968903, 'samples': 7817856, 'steps': 40717, 'loss/train': 1.4484519958496094} -08/30/2021 20:31:12 - INFO - __main__ - Step 40719: {'lr': 0.0004202139053147808, 'samples': 7818048, 'steps': 40718, 'loss/train': 1.6146900653839111} -08/30/2021 20:31:13 - INFO - __main__ - Step 40720: {'lr': 0.0004202100185231767, 'samples': 7818240, 'steps': 40719, 'loss/train': 1.3560950756072998} -08/30/2021 20:31:13 - INFO - __main__ - Step 40721: {'lr': 0.00042020613165487863, 'samples': 7818432, 'steps': 40720, 'loss/train': 1.5143665075302124} -08/30/2021 20:31:13 - INFO - __main__ - Step 40722: {'lr': 0.0004202022447098883, 'samples': 7818624, 'steps': 40721, 'loss/train': 1.448867917060852} -08/30/2021 20:31:14 - INFO - __main__ - Step 40723: {'lr': 0.00042019835768820744, 'samples': 7818816, 'steps': 40722, 'loss/train': 0.8615542650222778} -08/30/2021 20:31:14 - INFO - __main__ - Step 40724: {'lr': 0.00042019447058983786, 'samples': 7819008, 'steps': 40723, 'loss/train': 1.5015555620193481} -08/30/2021 20:31:15 - INFO - __main__ - Step 40725: {'lr': 0.0004201905834147813, 'samples': 7819200, 'steps': 40724, 'loss/train': 1.515428066253662} -08/30/2021 20:31:16 - INFO - __main__ - Step 40726: {'lr': 0.0004201866961630395, 'samples': 7819392, 'steps': 40725, 'loss/train': 1.4868468046188354} -08/30/2021 20:31:16 - INFO - __main__ - Step 40727: {'lr': 0.00042018280883461415, 'samples': 7819584, 'steps': 40726, 'loss/train': 1.3024789094924927} -08/30/2021 20:31:17 - INFO - __main__ - Step 40728: {'lr': 0.000420178921429507, 'samples': 7819776, 'steps': 40727, 'loss/train': 2.0891103744506836} -08/30/2021 20:31:17 - INFO - __main__ - Step 40729: {'lr': 0.00042017503394771997, 'samples': 7819968, 'steps': 40728, 'loss/train': 1.2729058265686035} -08/30/2021 20:31:19 - INFO - __main__ - Step 40730: {'lr': 0.00042017114638925456, 'samples': 7820160, 'steps': 40729, 'loss/train': 1.5011334419250488} -08/30/2021 20:31:19 - INFO - __main__ - Step 40731: {'lr': 0.00042016725875411274, 'samples': 7820352, 'steps': 40730, 'loss/train': 1.2995166778564453} -08/30/2021 20:31:19 - INFO - __main__ - Step 40732: {'lr': 0.0004201633710422962, 'samples': 7820544, 'steps': 40731, 'loss/train': 2.2093710899353027} -08/30/2021 20:31:20 - INFO - __main__ - Step 40733: {'lr': 0.0004201594832538067, 'samples': 7820736, 'steps': 40732, 'loss/train': 0.3605997860431671} -08/30/2021 20:31:20 - INFO - __main__ - Step 40734: {'lr': 0.0004201555953886459, 'samples': 7820928, 'steps': 40733, 'loss/train': 1.5841865539550781} -08/30/2021 20:31:22 - INFO - __main__ - Step 40735: {'lr': 0.00042015170744681566, 'samples': 7821120, 'steps': 40734, 'loss/train': 1.6072136163711548} -08/30/2021 20:31:23 - INFO - __main__ - Step 40736: {'lr': 0.00042014781942831757, 'samples': 7821312, 'steps': 40735, 'loss/train': 1.4822163581848145} -08/30/2021 20:31:23 - INFO - __main__ - Step 40737: {'lr': 0.00042014393133315366, 'samples': 7821504, 'steps': 40736, 'loss/train': 1.812747597694397} -08/30/2021 20:31:23 - INFO - __main__ - Step 40738: {'lr': 0.00042014004316132537, 'samples': 7821696, 'steps': 40737, 'loss/train': 1.6188654899597168} -08/30/2021 20:31:24 - INFO - __main__ - Step 40739: {'lr': 0.0004201361549128347, 'samples': 7821888, 'steps': 40738, 'loss/train': 0.8519554138183594} -08/30/2021 20:31:25 - INFO - __main__ - Step 40740: {'lr': 0.00042013226658768333, 'samples': 7822080, 'steps': 40739, 'loss/train': 0.8235333561897278} -08/30/2021 20:31:26 - INFO - __main__ - Step 40741: {'lr': 0.0004201283781858729, 'samples': 7822272, 'steps': 40740, 'loss/train': 1.0463306903839111} -08/30/2021 20:31:26 - INFO - __main__ - Step 40742: {'lr': 0.00042012448970740523, 'samples': 7822464, 'steps': 40741, 'loss/train': 1.7897881269454956} -08/30/2021 20:31:26 - INFO - __main__ - Step 40743: {'lr': 0.00042012060115228215, 'samples': 7822656, 'steps': 40742, 'loss/train': 1.5615816116333008} -08/30/2021 20:31:27 - INFO - __main__ - Step 40744: {'lr': 0.0004201167125205054, 'samples': 7822848, 'steps': 40743, 'loss/train': 1.391696810722351} -08/30/2021 20:31:28 - INFO - __main__ - Step 40745: {'lr': 0.0004201128238120766, 'samples': 7823040, 'steps': 40744, 'loss/train': 1.45644211769104} -08/30/2021 20:31:29 - INFO - __main__ - Step 40746: {'lr': 0.00042010893502699765, 'samples': 7823232, 'steps': 40745, 'loss/train': 1.5940656661987305} -08/30/2021 20:31:29 - INFO - __main__ - Step 40747: {'lr': 0.0004201050461652702, 'samples': 7823424, 'steps': 40746, 'loss/train': 1.6794425249099731} -08/30/2021 20:31:30 - INFO - __main__ - Step 40748: {'lr': 0.00042010115722689603, 'samples': 7823616, 'steps': 40747, 'loss/train': 1.3612704277038574} -08/30/2021 20:31:30 - INFO - __main__ - Step 40749: {'lr': 0.0004200972682118769, 'samples': 7823808, 'steps': 40748, 'loss/train': 3.4012866020202637} -08/30/2021 20:31:30 - INFO - __main__ - Step 40750: {'lr': 0.0004200933791202146, 'samples': 7824000, 'steps': 40749, 'loss/train': 1.6295348405838013} -08/30/2021 20:31:32 - INFO - __main__ - Step 40751: {'lr': 0.0004200894899519108, 'samples': 7824192, 'steps': 40750, 'loss/train': 0.8933557271957397} -08/30/2021 20:31:32 - INFO - __main__ - Step 40752: {'lr': 0.00042008560070696735, 'samples': 7824384, 'steps': 40751, 'loss/train': 0.6759853959083557} -08/30/2021 20:31:33 - INFO - __main__ - Step 40753: {'lr': 0.000420081711385386, 'samples': 7824576, 'steps': 40752, 'loss/train': 1.4800009727478027} -08/30/2021 20:31:33 - INFO - __main__ - Step 40754: {'lr': 0.00042007782198716836, 'samples': 7824768, 'steps': 40753, 'loss/train': 0.784487247467041} -08/30/2021 20:31:33 - INFO - __main__ - Step 40755: {'lr': 0.0004200739325123163, 'samples': 7824960, 'steps': 40754, 'loss/train': 1.2747842073440552} -08/30/2021 20:31:35 - INFO - __main__ - Step 40756: {'lr': 0.0004200700429608315, 'samples': 7825152, 'steps': 40755, 'loss/train': 1.3847298622131348} -08/30/2021 20:31:35 - INFO - __main__ - Step 40757: {'lr': 0.00042006615333271585, 'samples': 7825344, 'steps': 40756, 'loss/train': 2.2461814880371094} -08/30/2021 20:31:36 - INFO - __main__ - Step 40758: {'lr': 0.000420062263627971, 'samples': 7825536, 'steps': 40757, 'loss/train': 1.123727560043335} -08/30/2021 20:31:36 - INFO - __main__ - Step 40759: {'lr': 0.0004200583738465987, 'samples': 7825728, 'steps': 40758, 'loss/train': 1.3890599012374878} -08/30/2021 20:31:36 - INFO - __main__ - Step 40760: {'lr': 0.00042005448398860077, 'samples': 7825920, 'steps': 40759, 'loss/train': 1.6194686889648438} -08/30/2021 20:31:38 - INFO - __main__ - Step 40761: {'lr': 0.00042005059405397885, 'samples': 7826112, 'steps': 40760, 'loss/train': 1.5006707906723022} -08/30/2021 20:31:38 - INFO - __main__ - Step 40762: {'lr': 0.00042004670404273474, 'samples': 7826304, 'steps': 40761, 'loss/train': 1.7742111682891846} -08/30/2021 20:31:39 - INFO - __main__ - Step 40763: {'lr': 0.0004200428139548703, 'samples': 7826496, 'steps': 40762, 'loss/train': 1.2751787900924683} -08/30/2021 20:31:39 - INFO - __main__ - Step 40764: {'lr': 0.0004200389237903871, 'samples': 7826688, 'steps': 40763, 'loss/train': 1.3245795965194702} -08/30/2021 20:31:39 - INFO - __main__ - Step 40765: {'lr': 0.000420035033549287, 'samples': 7826880, 'steps': 40764, 'loss/train': 1.836117148399353} -08/30/2021 20:31:41 - INFO - __main__ - Step 40766: {'lr': 0.0004200311432315718, 'samples': 7827072, 'steps': 40765, 'loss/train': 1.620129942893982} -08/30/2021 20:31:41 - INFO - __main__ - Step 40767: {'lr': 0.0004200272528372432, 'samples': 7827264, 'steps': 40766, 'loss/train': 1.4418184757232666} -08/30/2021 20:31:42 - INFO - __main__ - Step 40768: {'lr': 0.0004200233623663028, 'samples': 7827456, 'steps': 40767, 'loss/train': 0.97811359167099} -08/30/2021 20:31:42 - INFO - __main__ - Step 40769: {'lr': 0.0004200194718187527, 'samples': 7827648, 'steps': 40768, 'loss/train': 1.4465548992156982} -08/30/2021 20:31:42 - INFO - __main__ - Step 40770: {'lr': 0.0004200155811945943, 'samples': 7827840, 'steps': 40769, 'loss/train': 1.631633996963501} -08/30/2021 20:31:43 - INFO - __main__ - Step 40771: {'lr': 0.0004200116904938295, 'samples': 7828032, 'steps': 40770, 'loss/train': 1.412317156791687} -08/30/2021 20:31:44 - INFO - __main__ - Step 40772: {'lr': 0.00042000779971646007, 'samples': 7828224, 'steps': 40771, 'loss/train': 0.9450168013572693} -08/30/2021 20:31:45 - INFO - __main__ - Step 40773: {'lr': 0.00042000390886248783, 'samples': 7828416, 'steps': 40772, 'loss/train': 1.4411104917526245} -08/30/2021 20:31:45 - INFO - __main__ - Step 40774: {'lr': 0.0004200000179319144, 'samples': 7828608, 'steps': 40773, 'loss/train': 1.274450659751892} -08/30/2021 20:31:46 - INFO - __main__ - Step 40775: {'lr': 0.0004199961269247416, 'samples': 7828800, 'steps': 40774, 'loss/train': 1.3851836919784546} -08/30/2021 20:31:46 - INFO - __main__ - Step 40776: {'lr': 0.0004199922358409711, 'samples': 7828992, 'steps': 40775, 'loss/train': 1.1934096813201904} -08/30/2021 20:31:47 - INFO - __main__ - Step 40777: {'lr': 0.0004199883446806048, 'samples': 7829184, 'steps': 40776, 'loss/train': 1.3191113471984863} -08/30/2021 20:31:48 - INFO - __main__ - Step 40778: {'lr': 0.0004199844534436443, 'samples': 7829376, 'steps': 40777, 'loss/train': 1.5529453754425049} -08/30/2021 20:31:48 - INFO - __main__ - Step 40779: {'lr': 0.0004199805621300915, 'samples': 7829568, 'steps': 40778, 'loss/train': 1.5645092725753784} -08/30/2021 20:31:49 - INFO - __main__ - Step 40780: {'lr': 0.0004199766707399481, 'samples': 7829760, 'steps': 40779, 'loss/train': 1.0841411352157593} -08/30/2021 20:31:49 - INFO - __main__ - Step 40781: {'lr': 0.0004199727792732158, 'samples': 7829952, 'steps': 40780, 'loss/train': 0.8259776830673218} -08/30/2021 20:31:50 - INFO - __main__ - Step 40782: {'lr': 0.0004199688877298964, 'samples': 7830144, 'steps': 40781, 'loss/train': 0.651124894618988} -08/30/2021 20:31:51 - INFO - __main__ - Step 40783: {'lr': 0.00041996499610999163, 'samples': 7830336, 'steps': 40782, 'loss/train': 1.0718125104904175} -08/30/2021 20:31:51 - INFO - __main__ - Step 40784: {'lr': 0.00041996110441350323, 'samples': 7830528, 'steps': 40783, 'loss/train': 1.4192897081375122} -08/30/2021 20:31:51 - INFO - __main__ - Step 40785: {'lr': 0.000419957212640433, 'samples': 7830720, 'steps': 40784, 'loss/train': 0.5693715214729309} -08/30/2021 20:31:52 - INFO - __main__ - Step 40786: {'lr': 0.0004199533207907827, 'samples': 7830912, 'steps': 40785, 'loss/train': 1.3015637397766113} -08/30/2021 20:31:53 - INFO - __main__ - Step 40787: {'lr': 0.00041994942886455403, 'samples': 7831104, 'steps': 40786, 'loss/train': 1.9497350454330444} -08/30/2021 20:31:54 - INFO - __main__ - Step 40788: {'lr': 0.00041994553686174876, 'samples': 7831296, 'steps': 40787, 'loss/train': 1.1419200897216797} -08/30/2021 20:31:54 - INFO - __main__ - Step 40789: {'lr': 0.0004199416447823686, 'samples': 7831488, 'steps': 40788, 'loss/train': 1.3467382192611694} -08/30/2021 20:31:54 - INFO - __main__ - Step 40790: {'lr': 0.0004199377526264154, 'samples': 7831680, 'steps': 40789, 'loss/train': 1.7472642660140991} -08/30/2021 20:31:55 - INFO - __main__ - Step 40791: {'lr': 0.00041993386039389095, 'samples': 7831872, 'steps': 40790, 'loss/train': 1.4851189851760864} -08/30/2021 20:31:57 - INFO - __main__ - Step 40792: {'lr': 0.0004199299680847969, 'samples': 7832064, 'steps': 40791, 'loss/train': 1.480136513710022} -08/30/2021 20:31:57 - INFO - __main__ - Step 40793: {'lr': 0.000419926075699135, 'samples': 7832256, 'steps': 40792, 'loss/train': 1.2308827638626099} -08/30/2021 20:31:58 - INFO - __main__ - Step 40794: {'lr': 0.000419922183236907, 'samples': 7832448, 'steps': 40793, 'loss/train': 2.031688690185547} -08/30/2021 20:31:58 - INFO - __main__ - Step 40795: {'lr': 0.0004199182906981147, 'samples': 7832640, 'steps': 40794, 'loss/train': 1.254698395729065} -08/30/2021 20:31:58 - INFO - __main__ - Step 40796: {'lr': 0.00041991439808275986, 'samples': 7832832, 'steps': 40795, 'loss/train': 1.4454256296157837} -08/30/2021 20:32:00 - INFO - __main__ - Step 40797: {'lr': 0.0004199105053908442, 'samples': 7833024, 'steps': 40796, 'loss/train': 1.0112686157226562} -08/30/2021 20:32:00 - INFO - __main__ - Step 40798: {'lr': 0.0004199066126223695, 'samples': 7833216, 'steps': 40797, 'loss/train': 1.6412845849990845} -08/30/2021 20:32:01 - INFO - __main__ - Step 40799: {'lr': 0.0004199027197773375, 'samples': 7833408, 'steps': 40798, 'loss/train': 1.3444037437438965} -08/30/2021 20:32:01 - INFO - __main__ - Step 40800: {'lr': 0.00041989882685575, 'samples': 7833600, 'steps': 40799, 'loss/train': 1.5402215719223022} -08/30/2021 20:32:01 - INFO - __main__ - Step 40801: {'lr': 0.0004198949338576086, 'samples': 7833792, 'steps': 40800, 'loss/train': 0.43507120013237} -08/30/2021 20:32:03 - INFO - __main__ - Step 40802: {'lr': 0.0004198910407829152, 'samples': 7833984, 'steps': 40801, 'loss/train': 1.6014635562896729} -08/30/2021 20:32:03 - INFO - __main__ - Step 40803: {'lr': 0.00041988714763167156, 'samples': 7834176, 'steps': 40802, 'loss/train': 1.6347209215164185} -08/30/2021 20:32:04 - INFO - __main__ - Step 40804: {'lr': 0.00041988325440387944, 'samples': 7834368, 'steps': 40803, 'loss/train': 1.5274289846420288} -08/30/2021 20:32:04 - INFO - __main__ - Step 40805: {'lr': 0.00041987936109954047, 'samples': 7834560, 'steps': 40804, 'loss/train': 0.7356760501861572} -08/30/2021 20:32:04 - INFO - __main__ - Step 40806: {'lr': 0.0004198754677186565, 'samples': 7834752, 'steps': 40805, 'loss/train': 1.103785753250122} -08/30/2021 20:32:05 - INFO - __main__ - Step 40807: {'lr': 0.0004198715742612292, 'samples': 7834944, 'steps': 40806, 'loss/train': 0.7137376666069031} -08/30/2021 20:32:07 - INFO - __main__ - Step 40808: {'lr': 0.0004198676807272605, 'samples': 7835136, 'steps': 40807, 'loss/train': 1.6436622142791748} -08/30/2021 20:32:07 - INFO - __main__ - Step 40809: {'lr': 0.000419863787116752, 'samples': 7835328, 'steps': 40808, 'loss/train': 2.2599761486053467} -08/30/2021 20:32:08 - INFO - __main__ - Step 40810: {'lr': 0.0004198598934297055, 'samples': 7835520, 'steps': 40809, 'loss/train': 1.6801259517669678} -08/30/2021 20:32:08 - INFO - __main__ - Step 40811: {'lr': 0.00041985599966612273, 'samples': 7835712, 'steps': 40810, 'loss/train': 1.842291235923767} -08/30/2021 20:32:08 - INFO - __main__ - Step 40812: {'lr': 0.0004198521058260055, 'samples': 7835904, 'steps': 40811, 'loss/train': 1.2753660678863525} -08/30/2021 20:32:10 - INFO - __main__ - Step 40813: {'lr': 0.0004198482119093555, 'samples': 7836096, 'steps': 40812, 'loss/train': 0.14927802979946136} -08/30/2021 20:32:11 - INFO - __main__ - Step 40814: {'lr': 0.00041984431791617456, 'samples': 7836288, 'steps': 40813, 'loss/train': 1.5204445123672485} -08/30/2021 20:32:11 - INFO - __main__ - Step 40815: {'lr': 0.0004198404238464644, 'samples': 7836480, 'steps': 40814, 'loss/train': 1.2533056735992432} -08/30/2021 20:32:11 - INFO - __main__ - Step 40816: {'lr': 0.0004198365297002267, 'samples': 7836672, 'steps': 40815, 'loss/train': 1.3474946022033691} -08/30/2021 20:32:12 - INFO - __main__ - Step 40817: {'lr': 0.0004198326354774633, 'samples': 7836864, 'steps': 40816, 'loss/train': 0.9882884621620178} -08/30/2021 20:32:13 - INFO - __main__ - Step 40818: {'lr': 0.00041982874117817593, 'samples': 7837056, 'steps': 40817, 'loss/train': 1.624408483505249} -08/30/2021 20:32:14 - INFO - __main__ - Step 40819: {'lr': 0.00041982484680236636, 'samples': 7837248, 'steps': 40818, 'loss/train': 1.7785921096801758} -08/30/2021 20:32:14 - INFO - __main__ - Step 40820: {'lr': 0.00041982095235003634, 'samples': 7837440, 'steps': 40819, 'loss/train': 0.9864234328269958} -08/30/2021 20:32:14 - INFO - __main__ - Step 40821: {'lr': 0.0004198170578211877, 'samples': 7837632, 'steps': 40820, 'loss/train': 0.7419716119766235} -08/30/2021 20:32:15 - INFO - __main__ - Step 40822: {'lr': 0.000419813163215822, 'samples': 7837824, 'steps': 40821, 'loss/train': 1.6487023830413818} -08/30/2021 20:32:15 - INFO - __main__ - Step 40823: {'lr': 0.0004198092685339411, 'samples': 7838016, 'steps': 40822, 'loss/train': 1.6824064254760742} -08/30/2021 20:32:17 - INFO - __main__ - Step 40824: {'lr': 0.00041980537377554685, 'samples': 7838208, 'steps': 40823, 'loss/train': 1.3728519678115845} -08/30/2021 20:32:17 - INFO - __main__ - Step 40825: {'lr': 0.00041980147894064086, 'samples': 7838400, 'steps': 40824, 'loss/train': 0.7681717872619629} -08/30/2021 20:32:17 - INFO - __main__ - Step 40826: {'lr': 0.00041979758402922496, 'samples': 7838592, 'steps': 40825, 'loss/train': 0.15895843505859375} -08/30/2021 20:32:18 - INFO - __main__ - Step 40827: {'lr': 0.00041979368904130086, 'samples': 7838784, 'steps': 40826, 'loss/train': 1.4759423732757568} -08/30/2021 20:32:18 - INFO - __main__ - Step 40828: {'lr': 0.00041978979397687047, 'samples': 7838976, 'steps': 40827, 'loss/train': 1.4417155981063843} -08/30/2021 20:32:20 - INFO - __main__ - Step 40829: {'lr': 0.00041978589883593525, 'samples': 7839168, 'steps': 40828, 'loss/train': 0.963193416595459} -08/30/2021 20:32:20 - INFO - __main__ - Step 40830: {'lr': 0.0004197820036184972, 'samples': 7839360, 'steps': 40829, 'loss/train': 1.3285272121429443} -08/30/2021 20:32:21 - INFO - __main__ - Step 40831: {'lr': 0.000419778108324558, 'samples': 7839552, 'steps': 40830, 'loss/train': 2.3227992057800293} -08/30/2021 20:32:21 - INFO - __main__ - Step 40832: {'lr': 0.00041977421295411944, 'samples': 7839744, 'steps': 40831, 'loss/train': 2.025751829147339} -08/30/2021 20:32:21 - INFO - __main__ - Step 40833: {'lr': 0.00041977031750718317, 'samples': 7839936, 'steps': 40832, 'loss/train': 1.7972112894058228} -08/30/2021 20:32:22 - INFO - __main__ - Step 40834: {'lr': 0.000419766421983751, 'samples': 7840128, 'steps': 40833, 'loss/train': 1.7379446029663086} -08/30/2021 20:32:23 - INFO - __main__ - Step 40835: {'lr': 0.00041976252638382483, 'samples': 7840320, 'steps': 40834, 'loss/train': 1.588943600654602} -08/30/2021 20:32:24 - INFO - __main__ - Step 40836: {'lr': 0.00041975863070740617, 'samples': 7840512, 'steps': 40835, 'loss/train': 1.5860025882720947} -08/30/2021 20:32:24 - INFO - __main__ - Step 40837: {'lr': 0.0004197547349544969, 'samples': 7840704, 'steps': 40836, 'loss/train': 1.605682134628296} -08/30/2021 20:32:25 - INFO - __main__ - Step 40838: {'lr': 0.0004197508391250988, 'samples': 7840896, 'steps': 40837, 'loss/train': 1.5250840187072754} -08/30/2021 20:32:25 - INFO - __main__ - Step 40839: {'lr': 0.0004197469432192136, 'samples': 7841088, 'steps': 40838, 'loss/train': 1.4490379095077515} -08/30/2021 20:32:26 - INFO - __main__ - Step 40840: {'lr': 0.000419743047236843, 'samples': 7841280, 'steps': 40839, 'loss/train': 1.5496867895126343} -08/30/2021 20:32:27 - INFO - __main__ - Step 40841: {'lr': 0.00041973915117798883, 'samples': 7841472, 'steps': 40840, 'loss/train': 1.083207607269287} -08/30/2021 20:32:27 - INFO - __main__ - Step 40842: {'lr': 0.0004197352550426528, 'samples': 7841664, 'steps': 40841, 'loss/train': 1.5124861001968384} -08/30/2021 20:32:28 - INFO - __main__ - Step 40843: {'lr': 0.0004197313588308367, 'samples': 7841856, 'steps': 40842, 'loss/train': 1.3684998750686646} -08/30/2021 20:32:28 - INFO - __main__ - Step 40844: {'lr': 0.0004197274625425423, 'samples': 7842048, 'steps': 40843, 'loss/train': 1.7779576778411865} -08/30/2021 20:32:30 - INFO - __main__ - Step 40845: {'lr': 0.0004197235661777713, 'samples': 7842240, 'steps': 40844, 'loss/train': 1.5463695526123047} -08/30/2021 20:32:30 - INFO - __main__ - Step 40846: {'lr': 0.00041971966973652545, 'samples': 7842432, 'steps': 40845, 'loss/train': 0.9762404561042786} -08/30/2021 20:32:31 - INFO - __main__ - Step 40847: {'lr': 0.00041971577321880656, 'samples': 7842624, 'steps': 40846, 'loss/train': 1.8867933750152588} -08/30/2021 20:32:31 - INFO - __main__ - Step 40848: {'lr': 0.00041971187662461634, 'samples': 7842816, 'steps': 40847, 'loss/train': 1.183830976486206} -08/30/2021 20:32:31 - INFO - __main__ - Step 40849: {'lr': 0.0004197079799539566, 'samples': 7843008, 'steps': 40848, 'loss/train': 1.3238204717636108} -08/30/2021 20:32:33 - INFO - __main__ - Step 40850: {'lr': 0.0004197040832068291, 'samples': 7843200, 'steps': 40849, 'loss/train': 1.2573596239089966} -08/30/2021 20:32:33 - INFO - __main__ - Step 40851: {'lr': 0.00041970018638323546, 'samples': 7843392, 'steps': 40850, 'loss/train': 1.4237372875213623} -08/30/2021 20:32:34 - INFO - __main__ - Step 40852: {'lr': 0.00041969628948317756, 'samples': 7843584, 'steps': 40851, 'loss/train': 0.417272686958313} -08/30/2021 20:32:34 - INFO - __main__ - Step 40853: {'lr': 0.00041969239250665716, 'samples': 7843776, 'steps': 40852, 'loss/train': 1.62783944606781} -08/30/2021 20:32:34 - INFO - __main__ - Step 40854: {'lr': 0.000419688495453676, 'samples': 7843968, 'steps': 40853, 'loss/train': 1.5535670518875122} -08/30/2021 20:32:35 - INFO - __main__ - Step 40855: {'lr': 0.0004196845983242358, 'samples': 7844160, 'steps': 40854, 'loss/train': 0.938503623008728} -08/30/2021 20:32:36 - INFO - __main__ - Step 40856: {'lr': 0.0004196807011183383, 'samples': 7844352, 'steps': 40855, 'loss/train': 1.6601595878601074} -08/30/2021 20:32:37 - INFO - __main__ - Step 40857: {'lr': 0.00041967680383598536, 'samples': 7844544, 'steps': 40856, 'loss/train': 1.7420214414596558} -08/30/2021 20:32:37 - INFO - __main__ - Step 40858: {'lr': 0.00041967290647717864, 'samples': 7844736, 'steps': 40857, 'loss/train': 1.5125513076782227} -08/30/2021 20:32:37 - INFO - __main__ - Step 40859: {'lr': 0.00041966900904191995, 'samples': 7844928, 'steps': 40858, 'loss/train': 1.4889695644378662} -08/30/2021 20:32:38 - INFO - __main__ - Step 40860: {'lr': 0.000419665111530211, 'samples': 7845120, 'steps': 40859, 'loss/train': 2.4015071392059326} -08/30/2021 20:32:39 - INFO - __main__ - Step 40861: {'lr': 0.00041966121394205357, 'samples': 7845312, 'steps': 40860, 'loss/train': 1.2893686294555664} -08/30/2021 20:32:40 - INFO - __main__ - Step 40862: {'lr': 0.0004196573162774494, 'samples': 7845504, 'steps': 40861, 'loss/train': 1.5658608675003052} -08/30/2021 20:32:40 - INFO - __main__ - Step 40863: {'lr': 0.0004196534185364003, 'samples': 7845696, 'steps': 40862, 'loss/train': 1.632365107536316} -08/30/2021 20:32:40 - INFO - __main__ - Step 40864: {'lr': 0.00041964952071890795, 'samples': 7845888, 'steps': 40863, 'loss/train': 1.7567949295043945} -08/30/2021 20:32:41 - INFO - __main__ - Step 40865: {'lr': 0.00041964562282497417, 'samples': 7846080, 'steps': 40864, 'loss/train': 3.308375358581543} -08/30/2021 20:32:42 - INFO - __main__ - Step 40866: {'lr': 0.0004196417248546006, 'samples': 7846272, 'steps': 40865, 'loss/train': 1.10386323928833} -08/30/2021 20:32:43 - INFO - __main__ - Step 40867: {'lr': 0.0004196378268077893, 'samples': 7846464, 'steps': 40866, 'loss/train': 1.3081706762313843} -08/30/2021 20:32:43 - INFO - __main__ - Step 40868: {'lr': 0.00041963392868454163, 'samples': 7846656, 'steps': 40867, 'loss/train': 1.3719993829727173} -08/30/2021 20:32:44 - INFO - __main__ - Step 40869: {'lr': 0.0004196300304848596, 'samples': 7846848, 'steps': 40868, 'loss/train': 1.3687745332717896} -08/30/2021 20:32:44 - INFO - __main__ - Step 40870: {'lr': 0.00041962613220874486, 'samples': 7847040, 'steps': 40869, 'loss/train': 2.1709072589874268} -08/30/2021 20:32:45 - INFO - __main__ - Step 40871: {'lr': 0.0004196222338561992, 'samples': 7847232, 'steps': 40870, 'loss/train': 0.800399899482727} -08/30/2021 20:32:46 - INFO - __main__ - Step 40872: {'lr': 0.0004196183354272244, 'samples': 7847424, 'steps': 40871, 'loss/train': 1.1716111898422241} -08/30/2021 20:32:46 - INFO - __main__ - Step 40873: {'lr': 0.00041961443692182214, 'samples': 7847616, 'steps': 40872, 'loss/train': 1.7098530530929565} -08/30/2021 20:32:47 - INFO - __main__ - Step 40874: {'lr': 0.00041961053833999433, 'samples': 7847808, 'steps': 40873, 'loss/train': 1.7292158603668213} -08/30/2021 20:32:47 - INFO - __main__ - Step 40875: {'lr': 0.00041960663968174263, 'samples': 7848000, 'steps': 40874, 'loss/train': 1.6533483266830444} -08/30/2021 20:32:47 - INFO - __main__ - Step 40876: {'lr': 0.0004196027409470687, 'samples': 7848192, 'steps': 40875, 'loss/train': 1.117339849472046} -08/30/2021 20:32:49 - INFO - __main__ - Step 40877: {'lr': 0.00041959884213597443, 'samples': 7848384, 'steps': 40876, 'loss/train': 1.6889264583587646} -08/30/2021 20:32:49 - INFO - __main__ - Step 40878: {'lr': 0.0004195949432484615, 'samples': 7848576, 'steps': 40877, 'loss/train': 2.027769088745117} -08/30/2021 20:32:50 - INFO - __main__ - Step 40879: {'lr': 0.00041959104428453175, 'samples': 7848768, 'steps': 40878, 'loss/train': 1.3049023151397705} -08/30/2021 20:32:50 - INFO - __main__ - Step 40880: {'lr': 0.000419587145244187, 'samples': 7848960, 'steps': 40879, 'loss/train': 1.8736363649368286} -08/30/2021 20:32:50 - INFO - __main__ - Step 40881: {'lr': 0.0004195832461274288, 'samples': 7849152, 'steps': 40880, 'loss/train': 1.5118097066879272} -08/30/2021 20:32:52 - INFO - __main__ - Step 40882: {'lr': 0.00041957934693425894, 'samples': 7849344, 'steps': 40881, 'loss/train': 1.5298237800598145} -08/30/2021 20:32:52 - INFO - __main__ - Step 40883: {'lr': 0.0004195754476646793, 'samples': 7849536, 'steps': 40882, 'loss/train': 1.593651533126831} -08/30/2021 20:32:53 - INFO - __main__ - Step 40884: {'lr': 0.0004195715483186916, 'samples': 7849728, 'steps': 40883, 'loss/train': 1.6793041229248047} -08/30/2021 20:32:53 - INFO - __main__ - Step 40885: {'lr': 0.00041956764889629756, 'samples': 7849920, 'steps': 40884, 'loss/train': 2.224100351333618} -08/30/2021 20:32:53 - INFO - __main__ - Step 40886: {'lr': 0.000419563749397499, 'samples': 7850112, 'steps': 40885, 'loss/train': 1.3643192052841187} -08/30/2021 20:32:54 - INFO - __main__ - Step 40887: {'lr': 0.00041955984982229756, 'samples': 7850304, 'steps': 40886, 'loss/train': 1.7641876935958862} -08/30/2021 20:32:55 - INFO - __main__ - Step 40888: {'lr': 0.0004195559501706951, 'samples': 7850496, 'steps': 40887, 'loss/train': 0.14660528302192688} -08/30/2021 20:32:56 - INFO - __main__ - Step 40889: {'lr': 0.0004195520504426933, 'samples': 7850688, 'steps': 40888, 'loss/train': 1.8347421884536743} -08/30/2021 20:32:56 - INFO - __main__ - Step 40890: {'lr': 0.000419548150638294, 'samples': 7850880, 'steps': 40889, 'loss/train': 1.368322491645813} -08/30/2021 20:32:56 - INFO - __main__ - Step 40891: {'lr': 0.0004195442507574989, 'samples': 7851072, 'steps': 40890, 'loss/train': 1.2386257648468018} -08/30/2021 20:32:57 - INFO - __main__ - Step 40892: {'lr': 0.00041954035080030985, 'samples': 7851264, 'steps': 40891, 'loss/train': 0.9416026473045349} -08/30/2021 20:32:58 - INFO - __main__ - Step 40893: {'lr': 0.0004195364507667284, 'samples': 7851456, 'steps': 40892, 'loss/train': 1.2902321815490723} -08/30/2021 20:32:59 - INFO - __main__ - Step 40894: {'lr': 0.0004195325506567566, 'samples': 7851648, 'steps': 40893, 'loss/train': 0.7052925825119019} -08/30/2021 20:32:59 - INFO - __main__ - Step 40895: {'lr': 0.00041952865047039604, 'samples': 7851840, 'steps': 40894, 'loss/train': 0.9954533576965332} -08/30/2021 20:32:59 - INFO - __main__ - Step 40896: {'lr': 0.00041952475020764834, 'samples': 7852032, 'steps': 40895, 'loss/train': 1.9334520101547241} -08/30/2021 20:33:00 - INFO - __main__ - Step 40897: {'lr': 0.00041952084986851546, 'samples': 7852224, 'steps': 40896, 'loss/train': 1.5377235412597656} -08/30/2021 20:33:02 - INFO - __main__ - Step 40898: {'lr': 0.0004195169494529991, 'samples': 7852416, 'steps': 40897, 'loss/train': 1.4728283882141113} -08/30/2021 20:33:02 - INFO - __main__ - Step 40899: {'lr': 0.0004195130489611011, 'samples': 7852608, 'steps': 40898, 'loss/train': 1.4611942768096924} -08/30/2021 20:33:03 - INFO - __main__ - Step 40900: {'lr': 0.0004195091483928231, 'samples': 7852800, 'steps': 40899, 'loss/train': 1.3139704465866089} -08/30/2021 20:33:03 - INFO - __main__ - Step 40901: {'lr': 0.0004195052477481669, 'samples': 7852992, 'steps': 40900, 'loss/train': 1.336854100227356} -08/30/2021 20:33:03 - INFO - __main__ - Step 40902: {'lr': 0.00041950134702713415, 'samples': 7853184, 'steps': 40901, 'loss/train': 0.6940378546714783} -08/30/2021 20:33:05 - INFO - __main__ - Step 40903: {'lr': 0.0004194974462297268, 'samples': 7853376, 'steps': 40902, 'loss/train': 0.768294632434845} -08/30/2021 20:33:06 - INFO - __main__ - Step 40904: {'lr': 0.00041949354535594655, 'samples': 7853568, 'steps': 40903, 'loss/train': 1.3073195219039917} -08/30/2021 20:33:06 - INFO - __main__ - Step 40905: {'lr': 0.000419489644405795, 'samples': 7853760, 'steps': 40904, 'loss/train': 1.103238821029663} -08/30/2021 20:33:06 - INFO - __main__ - Step 40906: {'lr': 0.00041948574337927414, 'samples': 7853952, 'steps': 40905, 'loss/train': 1.9622260332107544} -08/30/2021 20:33:07 - INFO - __main__ - Step 40907: {'lr': 0.0004194818422763856, 'samples': 7854144, 'steps': 40906, 'loss/train': 0.5710344314575195} -08/30/2021 20:33:07 - INFO - __main__ - Step 40908: {'lr': 0.00041947794109713113, 'samples': 7854336, 'steps': 40907, 'loss/train': 0.06249542161822319} -08/30/2021 20:33:09 - INFO - __main__ - Step 40909: {'lr': 0.0004194740398415125, 'samples': 7854528, 'steps': 40908, 'loss/train': 1.1699984073638916} -08/30/2021 20:33:09 - INFO - __main__ - Step 40910: {'lr': 0.00041947013850953156, 'samples': 7854720, 'steps': 40909, 'loss/train': 1.4442816972732544} -08/30/2021 20:33:09 - INFO - __main__ - Step 40911: {'lr': 0.00041946623710118993, 'samples': 7854912, 'steps': 40910, 'loss/train': 1.077022671699524} -08/30/2021 20:33:10 - INFO - __main__ - Step 40912: {'lr': 0.0004194623356164894, 'samples': 7855104, 'steps': 40911, 'loss/train': 1.2743233442306519} -08/30/2021 20:33:10 - INFO - __main__ - Step 40913: {'lr': 0.0004194584340554318, 'samples': 7855296, 'steps': 40912, 'loss/train': 1.6945490837097168} -08/30/2021 20:33:12 - INFO - __main__ - Step 40914: {'lr': 0.0004194545324180188, 'samples': 7855488, 'steps': 40913, 'loss/train': 1.3466601371765137} -08/30/2021 20:33:12 - INFO - __main__ - Step 40915: {'lr': 0.00041945063070425226, 'samples': 7855680, 'steps': 40914, 'loss/train': 1.2468785047531128} -08/30/2021 20:33:13 - INFO - __main__ - Step 40916: {'lr': 0.0004194467289141339, 'samples': 7855872, 'steps': 40915, 'loss/train': 1.5406134128570557} -08/30/2021 20:33:13 - INFO - __main__ - Step 40917: {'lr': 0.00041944282704766534, 'samples': 7856064, 'steps': 40916, 'loss/train': 0.8024212718009949} -08/30/2021 20:33:13 - INFO - __main__ - Step 40918: {'lr': 0.0004194389251048486, 'samples': 7856256, 'steps': 40917, 'loss/train': 1.2845203876495361} -08/30/2021 20:33:15 - INFO - __main__ - Step 40919: {'lr': 0.00041943502308568523, 'samples': 7856448, 'steps': 40918, 'loss/train': 0.3970642685890198} -08/30/2021 20:33:15 - INFO - __main__ - Step 40920: {'lr': 0.000419431120990177, 'samples': 7856640, 'steps': 40919, 'loss/train': 1.4084731340408325} -08/30/2021 20:33:16 - INFO - __main__ - Step 40921: {'lr': 0.0004194272188183258, 'samples': 7856832, 'steps': 40920, 'loss/train': 1.4735500812530518} -08/30/2021 20:33:16 - INFO - __main__ - Step 40922: {'lr': 0.0004194233165701333, 'samples': 7857024, 'steps': 40921, 'loss/train': 1.3554116487503052} -08/30/2021 20:33:16 - INFO - __main__ - Step 40923: {'lr': 0.0004194194142456013, 'samples': 7857216, 'steps': 40922, 'loss/train': 1.3129101991653442} -08/30/2021 20:33:18 - INFO - __main__ - Step 40924: {'lr': 0.00041941551184473144, 'samples': 7857408, 'steps': 40923, 'loss/train': 1.389233946800232} -08/30/2021 20:33:18 - INFO - __main__ - Step 40925: {'lr': 0.0004194116093675256, 'samples': 7857600, 'steps': 40924, 'loss/train': 1.1665074825286865} -08/30/2021 20:33:19 - INFO - __main__ - Step 40926: {'lr': 0.0004194077068139855, 'samples': 7857792, 'steps': 40925, 'loss/train': 1.9135937690734863} -08/30/2021 20:33:19 - INFO - __main__ - Step 40927: {'lr': 0.00041940380418411296, 'samples': 7857984, 'steps': 40926, 'loss/train': 1.7282769680023193} -08/30/2021 20:33:19 - INFO - __main__ - Step 40928: {'lr': 0.00041939990147790956, 'samples': 7858176, 'steps': 40927, 'loss/train': 0.7967919707298279} -08/30/2021 20:33:20 - INFO - __main__ - Step 40929: {'lr': 0.00041939599869537724, 'samples': 7858368, 'steps': 40928, 'loss/train': 1.0501060485839844} -08/30/2021 20:33:21 - INFO - __main__ - Step 40930: {'lr': 0.00041939209583651774, 'samples': 7858560, 'steps': 40929, 'loss/train': 1.4101780652999878} -08/30/2021 20:33:22 - INFO - __main__ - Step 40931: {'lr': 0.0004193881929013327, 'samples': 7858752, 'steps': 40930, 'loss/train': 1.2091023921966553} -08/30/2021 20:33:22 - INFO - __main__ - Step 40932: {'lr': 0.00041938428988982403, 'samples': 7858944, 'steps': 40931, 'loss/train': 1.4088445901870728} -08/30/2021 20:33:22 - INFO - __main__ - Step 40933: {'lr': 0.00041938038680199333, 'samples': 7859136, 'steps': 40932, 'loss/train': 1.4141396284103394} -08/30/2021 20:33:23 - INFO - __main__ - Step 40934: {'lr': 0.0004193764836378425, 'samples': 7859328, 'steps': 40933, 'loss/train': 1.4904959201812744} -08/30/2021 20:33:24 - INFO - __main__ - Step 40935: {'lr': 0.0004193725803973732, 'samples': 7859520, 'steps': 40934, 'loss/train': 1.1050435304641724} -08/30/2021 20:33:25 - INFO - __main__ - Step 40936: {'lr': 0.0004193686770805873, 'samples': 7859712, 'steps': 40935, 'loss/train': 1.6410069465637207} -08/30/2021 20:33:25 - INFO - __main__ - Step 40937: {'lr': 0.00041936477368748645, 'samples': 7859904, 'steps': 40936, 'loss/train': 1.3336771726608276} -08/30/2021 20:33:26 - INFO - __main__ - Step 40938: {'lr': 0.00041936087021807243, 'samples': 7860096, 'steps': 40937, 'loss/train': 0.07436837255954742} -08/30/2021 20:33:26 - INFO - __main__ - Step 40939: {'lr': 0.000419356966672347, 'samples': 7860288, 'steps': 40938, 'loss/train': 0.44961774349212646} -08/30/2021 20:33:27 - INFO - __main__ - Step 40940: {'lr': 0.00041935306305031195, 'samples': 7860480, 'steps': 40939, 'loss/train': 1.4658244848251343} -08/30/2021 20:33:28 - INFO - __main__ - Step 40941: {'lr': 0.000419349159351969, 'samples': 7860672, 'steps': 40940, 'loss/train': 1.6728591918945312} -08/30/2021 20:33:28 - INFO - __main__ - Step 40942: {'lr': 0.00041934525557732005, 'samples': 7860864, 'steps': 40941, 'loss/train': 1.8563625812530518} -08/30/2021 20:33:29 - INFO - __main__ - Step 40943: {'lr': 0.00041934135172636667, 'samples': 7861056, 'steps': 40942, 'loss/train': 0.6185595989227295} -08/30/2021 20:33:29 - INFO - __main__ - Step 40944: {'lr': 0.00041933744779911066, 'samples': 7861248, 'steps': 40943, 'loss/train': 1.0351604223251343} -08/30/2021 20:33:30 - INFO - __main__ - Step 40945: {'lr': 0.00041933354379555376, 'samples': 7861440, 'steps': 40944, 'loss/train': 0.8298118114471436} -08/30/2021 20:33:31 - INFO - __main__ - Step 40946: {'lr': 0.00041932963971569786, 'samples': 7861632, 'steps': 40945, 'loss/train': 1.2659929990768433} -08/30/2021 20:33:31 - INFO - __main__ - Step 40947: {'lr': 0.0004193257355595446, 'samples': 7861824, 'steps': 40946, 'loss/train': 1.6088361740112305} -08/30/2021 20:33:32 - INFO - __main__ - Step 40948: {'lr': 0.00041932183132709587, 'samples': 7862016, 'steps': 40947, 'loss/train': 1.2395412921905518} -08/30/2021 20:33:32 - INFO - __main__ - Step 40949: {'lr': 0.00041931792701835325, 'samples': 7862208, 'steps': 40948, 'loss/train': 0.9507985711097717} -08/30/2021 20:33:34 - INFO - __main__ - Step 40950: {'lr': 0.00041931402263331856, 'samples': 7862400, 'steps': 40949, 'loss/train': 1.495686650276184} -08/30/2021 20:33:34 - INFO - __main__ - Step 40951: {'lr': 0.0004193101181719936, 'samples': 7862592, 'steps': 40950, 'loss/train': 1.3619741201400757} -08/30/2021 20:33:35 - INFO - __main__ - Step 40952: {'lr': 0.00041930621363438014, 'samples': 7862784, 'steps': 40951, 'loss/train': 1.8789520263671875} -08/30/2021 20:33:35 - INFO - __main__ - Step 40953: {'lr': 0.0004193023090204799, 'samples': 7862976, 'steps': 40952, 'loss/train': 2.3328163623809814} -08/30/2021 20:33:36 - INFO - __main__ - Step 40954: {'lr': 0.0004192984043302947, 'samples': 7863168, 'steps': 40953, 'loss/train': 1.0303049087524414} -08/30/2021 20:33:36 - INFO - __main__ - Step 40955: {'lr': 0.00041929449956382625, 'samples': 7863360, 'steps': 40954, 'loss/train': 1.4737156629562378} -08/30/2021 20:33:38 - INFO - __main__ - Step 40956: {'lr': 0.0004192905947210762, 'samples': 7863552, 'steps': 40955, 'loss/train': 1.62615966796875} -08/30/2021 20:33:39 - INFO - __main__ - Step 40957: {'lr': 0.00041928668980204653, 'samples': 7863744, 'steps': 40956, 'loss/train': 1.65840744972229} -08/30/2021 20:33:39 - INFO - __main__ - Step 40958: {'lr': 0.00041928278480673884, 'samples': 7863936, 'steps': 40957, 'loss/train': 1.5239286422729492} -08/30/2021 20:33:39 - INFO - __main__ - Step 40959: {'lr': 0.00041927887973515493, 'samples': 7864128, 'steps': 40958, 'loss/train': 1.4872782230377197} -08/30/2021 20:33:40 - INFO - __main__ - Step 40960: {'lr': 0.0004192749745872966, 'samples': 7864320, 'steps': 40959, 'loss/train': 4.225166320800781} -08/30/2021 20:33:40 - INFO - __main__ - Step 40961: {'lr': 0.00041927106936316563, 'samples': 7864512, 'steps': 40960, 'loss/train': 1.5450806617736816} -08/30/2021 20:33:41 - INFO - __main__ - Step 40962: {'lr': 0.00041926716406276367, 'samples': 7864704, 'steps': 40961, 'loss/train': 2.4315237998962402} -08/30/2021 20:33:42 - INFO - __main__ - Step 40963: {'lr': 0.00041926325868609247, 'samples': 7864896, 'steps': 40962, 'loss/train': 1.53387451171875} -08/30/2021 20:33:42 - INFO - __main__ - Step 40964: {'lr': 0.0004192593532331539, 'samples': 7865088, 'steps': 40963, 'loss/train': 1.7144404649734497} -08/30/2021 20:33:43 - INFO - __main__ - Step 40965: {'lr': 0.00041925544770394976, 'samples': 7865280, 'steps': 40964, 'loss/train': 1.5886229276657104} -08/30/2021 20:33:43 - INFO - __main__ - Step 40966: {'lr': 0.0004192515420984816, 'samples': 7865472, 'steps': 40965, 'loss/train': 2.5931015014648438} -08/30/2021 20:33:43 - INFO - __main__ - Step 40967: {'lr': 0.0004192476364167514, 'samples': 7865664, 'steps': 40966, 'loss/train': 1.7479819059371948} -08/30/2021 20:33:45 - INFO - __main__ - Step 40968: {'lr': 0.0004192437306587608, 'samples': 7865856, 'steps': 40967, 'loss/train': 1.5609920024871826} -08/30/2021 20:33:45 - INFO - __main__ - Step 40969: {'lr': 0.0004192398248245116, 'samples': 7866048, 'steps': 40968, 'loss/train': 1.842596411705017} -08/30/2021 20:33:46 - INFO - __main__ - Step 40970: {'lr': 0.00041923591891400555, 'samples': 7866240, 'steps': 40969, 'loss/train': 1.1909911632537842} -08/30/2021 20:33:46 - INFO - __main__ - Step 40971: {'lr': 0.00041923201292724436, 'samples': 7866432, 'steps': 40970, 'loss/train': 1.5168083906173706} -08/30/2021 20:33:46 - INFO - __main__ - Step 40972: {'lr': 0.00041922810686422987, 'samples': 7866624, 'steps': 40971, 'loss/train': 1.8781682252883911} -08/30/2021 20:33:48 - INFO - __main__ - Step 40973: {'lr': 0.00041922420072496383, 'samples': 7866816, 'steps': 40972, 'loss/train': 1.786932110786438} -08/30/2021 20:33:48 - INFO - __main__ - Step 40974: {'lr': 0.00041922029450944785, 'samples': 7867008, 'steps': 40973, 'loss/train': 1.4572707414627075} -08/30/2021 20:33:49 - INFO - __main__ - Step 40975: {'lr': 0.000419216388217684, 'samples': 7867200, 'steps': 40974, 'loss/train': 1.5855839252471924} -08/30/2021 20:33:49 - INFO - __main__ - Step 40976: {'lr': 0.00041921248184967374, 'samples': 7867392, 'steps': 40975, 'loss/train': 1.5981673002243042} -08/30/2021 20:33:49 - INFO - __main__ - Step 40977: {'lr': 0.000419208575405419, 'samples': 7867584, 'steps': 40976, 'loss/train': 2.135380506515503} -08/30/2021 20:33:51 - INFO - __main__ - Step 40978: {'lr': 0.00041920466888492147, 'samples': 7867776, 'steps': 40977, 'loss/train': 1.3703010082244873} -08/30/2021 20:33:52 - INFO - __main__ - Step 40979: {'lr': 0.00041920076228818293, 'samples': 7867968, 'steps': 40978, 'loss/train': 1.575701355934143} -08/30/2021 20:33:52 - INFO - __main__ - Step 40980: {'lr': 0.0004191968556152051, 'samples': 7868160, 'steps': 40979, 'loss/train': 2.3708324432373047} -08/30/2021 20:33:52 - INFO - __main__ - Step 40981: {'lr': 0.0004191929488659898, 'samples': 7868352, 'steps': 40980, 'loss/train': 1.5656780004501343} -08/30/2021 20:33:53 - INFO - __main__ - Step 40982: {'lr': 0.00041918904204053874, 'samples': 7868544, 'steps': 40981, 'loss/train': 1.12666654586792} -08/30/2021 20:33:53 - INFO - __main__ - Step 40983: {'lr': 0.0004191851351388538, 'samples': 7868736, 'steps': 40982, 'loss/train': 1.218644142150879} -08/30/2021 20:33:54 - INFO - __main__ - Step 40984: {'lr': 0.0004191812281609366, 'samples': 7868928, 'steps': 40983, 'loss/train': 1.4286248683929443} -08/30/2021 20:33:55 - INFO - __main__ - Step 40985: {'lr': 0.00041917732110678896, 'samples': 7869120, 'steps': 40984, 'loss/train': 1.8776036500930786} -08/30/2021 20:33:55 - INFO - __main__ - Step 40986: {'lr': 0.0004191734139764126, 'samples': 7869312, 'steps': 40985, 'loss/train': 1.6581599712371826} -08/30/2021 20:33:56 - INFO - __main__ - Step 40987: {'lr': 0.00041916950676980933, 'samples': 7869504, 'steps': 40986, 'loss/train': 2.2027676105499268} -08/30/2021 20:33:56 - INFO - __main__ - Step 40988: {'lr': 0.0004191655994869809, 'samples': 7869696, 'steps': 40987, 'loss/train': 1.9761977195739746} -08/30/2021 20:33:57 - INFO - __main__ - Step 40989: {'lr': 0.000419161692127929, 'samples': 7869888, 'steps': 40988, 'loss/train': 1.248308539390564} -08/30/2021 20:33:58 - INFO - __main__ - Step 40990: {'lr': 0.00041915778469265555, 'samples': 7870080, 'steps': 40989, 'loss/train': 1.5555769205093384} -08/30/2021 20:33:58 - INFO - __main__ - Step 40991: {'lr': 0.0004191538771811621, 'samples': 7870272, 'steps': 40990, 'loss/train': 1.1149226427078247} -08/30/2021 20:33:59 - INFO - __main__ - Step 40992: {'lr': 0.00041914996959345057, 'samples': 7870464, 'steps': 40991, 'loss/train': 1.4795925617218018} -08/30/2021 20:33:59 - INFO - __main__ - Step 40993: {'lr': 0.0004191460619295227, 'samples': 7870656, 'steps': 40992, 'loss/train': 1.583585500717163} -08/30/2021 20:34:01 - INFO - __main__ - Step 40994: {'lr': 0.0004191421541893802, 'samples': 7870848, 'steps': 40993, 'loss/train': 1.6287332773208618} -08/30/2021 20:34:01 - INFO - __main__ - Step 40995: {'lr': 0.0004191382463730249, 'samples': 7871040, 'steps': 40994, 'loss/train': 1.6534956693649292} -08/30/2021 20:34:01 - INFO - __main__ - Step 40996: {'lr': 0.00041913433848045844, 'samples': 7871232, 'steps': 40995, 'loss/train': 1.4942495822906494} -08/30/2021 20:34:02 - INFO - __main__ - Step 40997: {'lr': 0.00041913043051168276, 'samples': 7871424, 'steps': 40996, 'loss/train': 0.5345218777656555} -08/30/2021 20:34:02 - INFO - __main__ - Step 40998: {'lr': 0.00041912652246669943, 'samples': 7871616, 'steps': 40997, 'loss/train': 0.9556570649147034} -08/30/2021 20:34:04 - INFO - __main__ - Step 40999: {'lr': 0.0004191226143455103, 'samples': 7871808, 'steps': 40998, 'loss/train': 2.0120275020599365} -08/30/2021 20:34:04 - INFO - __main__ - Step 41000: {'lr': 0.00041911870614811715, 'samples': 7872000, 'steps': 40999, 'loss/train': 1.7070958614349365} -08/30/2021 20:34:05 - INFO - __main__ - Step 41001: {'lr': 0.00041911479787452177, 'samples': 7872192, 'steps': 41000, 'loss/train': 1.471051573753357} -08/30/2021 20:34:05 - INFO - __main__ - Step 41002: {'lr': 0.0004191108895247258, 'samples': 7872384, 'steps': 41001, 'loss/train': 1.1451913118362427} -08/30/2021 20:34:05 - INFO - __main__ - Step 41003: {'lr': 0.00041910698109873116, 'samples': 7872576, 'steps': 41002, 'loss/train': 1.0168237686157227} -08/30/2021 20:34:07 - INFO - __main__ - Step 41004: {'lr': 0.0004191030725965394, 'samples': 7872768, 'steps': 41003, 'loss/train': 0.10557163506746292} -08/30/2021 20:34:07 - INFO - __main__ - Step 41005: {'lr': 0.00041909916401815245, 'samples': 7872960, 'steps': 41004, 'loss/train': 1.5996288061141968} -08/30/2021 20:34:08 - INFO - __main__ - Step 41006: {'lr': 0.00041909525536357206, 'samples': 7873152, 'steps': 41005, 'loss/train': 1.5740998983383179} -08/30/2021 20:34:08 - INFO - __main__ - Step 41007: {'lr': 0.0004190913466327999, 'samples': 7873344, 'steps': 41006, 'loss/train': 0.0771162211894989} -08/30/2021 20:34:08 - INFO - __main__ - Step 41008: {'lr': 0.00041908743782583793, 'samples': 7873536, 'steps': 41007, 'loss/train': 1.7025703191757202} -08/30/2021 20:34:11 - INFO - __main__ - Step 41009: {'lr': 0.00041908352894268766, 'samples': 7873728, 'steps': 41008, 'loss/train': 1.8158495426177979} -08/30/2021 20:34:11 - INFO - __main__ - Step 41010: {'lr': 0.00041907961998335094, 'samples': 7873920, 'steps': 41009, 'loss/train': 1.762906789779663} -08/30/2021 20:34:12 - INFO - __main__ - Step 41011: {'lr': 0.0004190757109478296, 'samples': 7874112, 'steps': 41010, 'loss/train': 1.8688335418701172} -08/30/2021 20:34:12 - INFO - __main__ - Step 41012: {'lr': 0.00041907180183612525, 'samples': 7874304, 'steps': 41011, 'loss/train': 1.7534507513046265} -08/30/2021 20:34:12 - INFO - __main__ - Step 41013: {'lr': 0.00041906789264823985, 'samples': 7874496, 'steps': 41012, 'loss/train': 0.09809020161628723} -08/30/2021 20:34:14 - INFO - __main__ - Step 41014: {'lr': 0.00041906398338417504, 'samples': 7874688, 'steps': 41013, 'loss/train': 1.5099958181381226} -08/30/2021 20:34:14 - INFO - __main__ - Step 41015: {'lr': 0.00041906007404393273, 'samples': 7874880, 'steps': 41014, 'loss/train': 1.496046781539917} -08/30/2021 20:34:15 - INFO - __main__ - Step 41016: {'lr': 0.0004190561646275144, 'samples': 7875072, 'steps': 41015, 'loss/train': 1.1792261600494385} -08/30/2021 20:34:15 - INFO - __main__ - Step 41017: {'lr': 0.0004190522551349221, 'samples': 7875264, 'steps': 41016, 'loss/train': 1.4963449239730835} -08/30/2021 20:34:15 - INFO - __main__ - Step 41018: {'lr': 0.00041904834556615733, 'samples': 7875456, 'steps': 41017, 'loss/train': 1.59846031665802} -08/30/2021 20:34:17 - INFO - __main__ - Step 41019: {'lr': 0.000419044435921222, 'samples': 7875648, 'steps': 41018, 'loss/train': 1.589135766029358} -08/30/2021 20:34:17 - INFO - __main__ - Step 41020: {'lr': 0.0004190405262001179, 'samples': 7875840, 'steps': 41019, 'loss/train': 1.3507919311523438} -08/30/2021 20:34:18 - INFO - __main__ - Step 41021: {'lr': 0.00041903661640284675, 'samples': 7876032, 'steps': 41020, 'loss/train': 1.435124158859253} -08/30/2021 20:34:18 - INFO - __main__ - Step 41022: {'lr': 0.0004190327065294104, 'samples': 7876224, 'steps': 41021, 'loss/train': 1.5862599611282349} -08/30/2021 20:34:18 - INFO - __main__ - Step 41023: {'lr': 0.00041902879657981036, 'samples': 7876416, 'steps': 41022, 'loss/train': 1.248430848121643} -08/30/2021 20:34:20 - INFO - __main__ - Step 41024: {'lr': 0.00041902488655404864, 'samples': 7876608, 'steps': 41023, 'loss/train': 1.1055865287780762} -08/30/2021 20:34:20 - INFO - __main__ - Step 41025: {'lr': 0.0004190209764521269, 'samples': 7876800, 'steps': 41024, 'loss/train': 1.3772032260894775} -08/30/2021 20:34:20 - INFO - __main__ - Step 41026: {'lr': 0.0004190170662740469, 'samples': 7876992, 'steps': 41025, 'loss/train': 1.45427405834198} -08/30/2021 20:34:21 - INFO - __main__ - Step 41027: {'lr': 0.0004190131560198104, 'samples': 7877184, 'steps': 41026, 'loss/train': 1.41404390335083} -08/30/2021 20:34:21 - INFO - __main__ - Step 41028: {'lr': 0.00041900924568941925, 'samples': 7877376, 'steps': 41027, 'loss/train': 1.3327659368515015} -08/30/2021 20:34:21 - INFO - __main__ - Step 41029: {'lr': 0.0004190053352828751, 'samples': 7877568, 'steps': 41028, 'loss/train': 1.8245478868484497} -08/30/2021 20:34:23 - INFO - __main__ - Step 41030: {'lr': 0.00041900142480017974, 'samples': 7877760, 'steps': 41029, 'loss/train': 0.3308565616607666} -08/30/2021 20:34:23 - INFO - __main__ - Step 41031: {'lr': 0.0004189975142413349, 'samples': 7877952, 'steps': 41030, 'loss/train': 1.8376173973083496} -08/30/2021 20:34:24 - INFO - __main__ - Step 41032: {'lr': 0.00041899360360634247, 'samples': 7878144, 'steps': 41031, 'loss/train': 1.2415484189987183} -08/30/2021 20:34:24 - INFO - __main__ - Step 41033: {'lr': 0.0004189896928952041, 'samples': 7878336, 'steps': 41032, 'loss/train': 1.8353732824325562} -08/30/2021 20:34:24 - INFO - __main__ - Step 41034: {'lr': 0.0004189857821079216, 'samples': 7878528, 'steps': 41033, 'loss/train': 1.7956066131591797} -08/30/2021 20:34:26 - INFO - __main__ - Step 41035: {'lr': 0.0004189818712444967, 'samples': 7878720, 'steps': 41034, 'loss/train': 1.1152185201644897} -08/30/2021 20:34:26 - INFO - __main__ - Step 41036: {'lr': 0.0004189779603049312, 'samples': 7878912, 'steps': 41035, 'loss/train': 0.5350671410560608} -08/30/2021 20:34:27 - INFO - __main__ - Step 41037: {'lr': 0.0004189740492892268, 'samples': 7879104, 'steps': 41036, 'loss/train': 1.9817450046539307} -08/30/2021 20:34:27 - INFO - __main__ - Step 41038: {'lr': 0.0004189701381973853, 'samples': 7879296, 'steps': 41037, 'loss/train': 1.8521685600280762} -08/30/2021 20:34:27 - INFO - __main__ - Step 41039: {'lr': 0.00041896622702940846, 'samples': 7879488, 'steps': 41038, 'loss/train': 0.6891412734985352} -08/30/2021 20:34:29 - INFO - __main__ - Step 41040: {'lr': 0.0004189623157852981, 'samples': 7879680, 'steps': 41039, 'loss/train': 1.5992757081985474} -08/30/2021 20:34:30 - INFO - __main__ - Step 41041: {'lr': 0.0004189584044650559, 'samples': 7879872, 'steps': 41040, 'loss/train': 0.8640210032463074} -08/30/2021 20:34:30 - INFO - __main__ - Step 41042: {'lr': 0.0004189544930686837, 'samples': 7880064, 'steps': 41041, 'loss/train': 2.5475447177886963} -08/30/2021 20:34:30 - INFO - __main__ - Step 41043: {'lr': 0.0004189505815961831, 'samples': 7880256, 'steps': 41042, 'loss/train': 1.4506341218948364} -08/30/2021 20:34:31 - INFO - __main__ - Step 41044: {'lr': 0.000418946670047556, 'samples': 7880448, 'steps': 41043, 'loss/train': 1.0487667322158813} -08/30/2021 20:34:32 - INFO - __main__ - Step 41045: {'lr': 0.0004189427584228042, 'samples': 7880640, 'steps': 41044, 'loss/train': 1.7175081968307495} -08/30/2021 20:34:33 - INFO - __main__ - Step 41046: {'lr': 0.0004189388467219294, 'samples': 7880832, 'steps': 41045, 'loss/train': 1.326883316040039} -08/30/2021 20:34:33 - INFO - __main__ - Step 41047: {'lr': 0.0004189349349449333, 'samples': 7881024, 'steps': 41046, 'loss/train': 2.106649875640869} -08/30/2021 20:34:33 - INFO - __main__ - Step 41048: {'lr': 0.00041893102309181773, 'samples': 7881216, 'steps': 41047, 'loss/train': 1.4961119890213013} -08/30/2021 20:34:34 - INFO - __main__ - Step 41049: {'lr': 0.00041892711116258454, 'samples': 7881408, 'steps': 41048, 'loss/train': 1.5439482927322388} -08/30/2021 20:34:35 - INFO - __main__ - Step 41050: {'lr': 0.00041892319915723533, 'samples': 7881600, 'steps': 41049, 'loss/train': 3.664855718612671} -08/30/2021 20:34:36 - INFO - __main__ - Step 41051: {'lr': 0.0004189192870757719, 'samples': 7881792, 'steps': 41050, 'loss/train': 0.9282266497612} -08/30/2021 20:34:36 - INFO - __main__ - Step 41052: {'lr': 0.0004189153749181961, 'samples': 7881984, 'steps': 41051, 'loss/train': 1.2515292167663574} -08/30/2021 20:34:36 - INFO - __main__ - Step 41053: {'lr': 0.00041891146268450963, 'samples': 7882176, 'steps': 41052, 'loss/train': 0.8474591970443726} -08/30/2021 20:34:37 - INFO - __main__ - Step 41054: {'lr': 0.0004189075503747142, 'samples': 7882368, 'steps': 41053, 'loss/train': 1.5076950788497925} -08/30/2021 20:34:37 - INFO - __main__ - Step 41055: {'lr': 0.0004189036379888117, 'samples': 7882560, 'steps': 41054, 'loss/train': 1.2326934337615967} -08/30/2021 20:34:38 - INFO - __main__ - Step 41056: {'lr': 0.00041889972552680387, 'samples': 7882752, 'steps': 41055, 'loss/train': 1.9456889629364014} -08/30/2021 20:34:39 - INFO - __main__ - Step 41057: {'lr': 0.0004188958129886924, 'samples': 7882944, 'steps': 41056, 'loss/train': 2.0564045906066895} -08/30/2021 20:34:39 - INFO - __main__ - Step 41058: {'lr': 0.000418891900374479, 'samples': 7883136, 'steps': 41057, 'loss/train': 1.8548705577850342} -08/30/2021 20:34:40 - INFO - __main__ - Step 41059: {'lr': 0.0004188879876841656, 'samples': 7883328, 'steps': 41058, 'loss/train': 1.7685585021972656} -08/30/2021 20:34:40 - INFO - __main__ - Step 41060: {'lr': 0.0004188840749177538, 'samples': 7883520, 'steps': 41059, 'loss/train': 0.6381027698516846} -08/30/2021 20:34:42 - INFO - __main__ - Step 41061: {'lr': 0.0004188801620752455, 'samples': 7883712, 'steps': 41060, 'loss/train': 1.7532620429992676} -08/30/2021 20:34:42 - INFO - __main__ - Step 41062: {'lr': 0.00041887624915664247, 'samples': 7883904, 'steps': 41061, 'loss/train': 1.5054994821548462} -08/30/2021 20:34:43 - INFO - __main__ - Step 41063: {'lr': 0.0004188723361619463, 'samples': 7884096, 'steps': 41062, 'loss/train': 1.0998432636260986} -08/30/2021 20:34:43 - INFO - __main__ - Step 41064: {'lr': 0.0004188684230911589, 'samples': 7884288, 'steps': 41063, 'loss/train': 1.6960923671722412} -08/30/2021 20:34:43 - INFO - __main__ - Step 41065: {'lr': 0.00041886450994428197, 'samples': 7884480, 'steps': 41064, 'loss/train': 1.6947439908981323} -08/30/2021 20:34:45 - INFO - __main__ - Step 41066: {'lr': 0.0004188605967213174, 'samples': 7884672, 'steps': 41065, 'loss/train': 1.2996693849563599} -08/30/2021 20:34:45 - INFO - __main__ - Step 41067: {'lr': 0.0004188566834222667, 'samples': 7884864, 'steps': 41066, 'loss/train': 1.9593781232833862} -08/30/2021 20:34:46 - INFO - __main__ - Step 41068: {'lr': 0.00041885277004713185, 'samples': 7885056, 'steps': 41067, 'loss/train': 1.4899647235870361} -08/30/2021 20:34:46 - INFO - __main__ - Step 41069: {'lr': 0.0004188488565959146, 'samples': 7885248, 'steps': 41068, 'loss/train': 1.6581939458847046} -08/30/2021 20:34:46 - INFO - __main__ - Step 41070: {'lr': 0.0004188449430686166, 'samples': 7885440, 'steps': 41069, 'loss/train': 1.0358103513717651} -08/30/2021 20:34:48 - INFO - __main__ - Step 41071: {'lr': 0.00041884102946523964, 'samples': 7885632, 'steps': 41070, 'loss/train': 1.515663981437683} -08/30/2021 20:34:48 - INFO - __main__ - Step 41072: {'lr': 0.0004188371157857856, 'samples': 7885824, 'steps': 41071, 'loss/train': 1.427071213722229} -08/30/2021 20:34:49 - INFO - __main__ - Step 41073: {'lr': 0.0004188332020302561, 'samples': 7886016, 'steps': 41072, 'loss/train': 2.385524034500122} -08/30/2021 20:34:49 - INFO - __main__ - Step 41074: {'lr': 0.000418829288198653, 'samples': 7886208, 'steps': 41073, 'loss/train': 1.531606912612915} -08/30/2021 20:34:49 - INFO - __main__ - Step 41075: {'lr': 0.00041882537429097804, 'samples': 7886400, 'steps': 41074, 'loss/train': 1.4643745422363281} -08/30/2021 20:34:51 - INFO - __main__ - Step 41076: {'lr': 0.00041882146030723297, 'samples': 7886592, 'steps': 41075, 'loss/train': 1.5161347389221191} -08/30/2021 20:34:51 - INFO - __main__ - Step 41077: {'lr': 0.0004188175462474195, 'samples': 7886784, 'steps': 41076, 'loss/train': 1.3104255199432373} -08/30/2021 20:34:52 - INFO - __main__ - Step 41078: {'lr': 0.0004188136321115395, 'samples': 7886976, 'steps': 41077, 'loss/train': 1.5040000677108765} -08/30/2021 20:34:52 - INFO - __main__ - Step 41079: {'lr': 0.00041880971789959466, 'samples': 7887168, 'steps': 41078, 'loss/train': 1.5095070600509644} -08/30/2021 20:34:52 - INFO - __main__ - Step 41080: {'lr': 0.0004188058036115868, 'samples': 7887360, 'steps': 41079, 'loss/train': 1.3772051334381104} -08/30/2021 20:34:54 - INFO - __main__ - Step 41081: {'lr': 0.0004188018892475176, 'samples': 7887552, 'steps': 41080, 'loss/train': 1.5810112953186035} -08/30/2021 20:34:55 - INFO - __main__ - Step 41082: {'lr': 0.0004187979748073889, 'samples': 7887744, 'steps': 41081, 'loss/train': 1.3758090734481812} -08/30/2021 20:34:55 - INFO - __main__ - Step 41083: {'lr': 0.0004187940602912024, 'samples': 7887936, 'steps': 41082, 'loss/train': 0.6491727232933044} -08/30/2021 20:34:55 - INFO - __main__ - Step 41084: {'lr': 0.00041879014569895994, 'samples': 7888128, 'steps': 41083, 'loss/train': 1.2365748882293701} -08/30/2021 20:34:56 - INFO - __main__ - Step 41085: {'lr': 0.0004187862310306633, 'samples': 7888320, 'steps': 41084, 'loss/train': 1.220784306526184} -08/30/2021 20:34:56 - INFO - __main__ - Step 41086: {'lr': 0.00041878231628631406, 'samples': 7888512, 'steps': 41085, 'loss/train': 0.9743812084197998} -08/30/2021 20:34:58 - INFO - __main__ - Step 41087: {'lr': 0.0004187784014659142, 'samples': 7888704, 'steps': 41086, 'loss/train': 0.9892066717147827} -08/30/2021 20:34:58 - INFO - __main__ - Step 41088: {'lr': 0.0004187744865694654, 'samples': 7888896, 'steps': 41087, 'loss/train': 1.1738516092300415} -08/30/2021 20:34:59 - INFO - __main__ - Step 41089: {'lr': 0.0004187705715969694, 'samples': 7889088, 'steps': 41088, 'loss/train': 1.317478895187378} -08/30/2021 20:34:59 - INFO - __main__ - Step 41090: {'lr': 0.0004187666565484279, 'samples': 7889280, 'steps': 41089, 'loss/train': 1.4726805686950684} -08/30/2021 20:34:59 - INFO - __main__ - Step 41091: {'lr': 0.0004187627414238428, 'samples': 7889472, 'steps': 41090, 'loss/train': 1.7937759160995483} -08/30/2021 20:35:01 - INFO - __main__ - Step 41092: {'lr': 0.0004187588262232159, 'samples': 7889664, 'steps': 41091, 'loss/train': 1.5622119903564453} -08/30/2021 20:35:01 - INFO - __main__ - Step 41093: {'lr': 0.00041875491094654885, 'samples': 7889856, 'steps': 41092, 'loss/train': 2.9122872352600098} -08/30/2021 20:35:02 - INFO - __main__ - Step 41094: {'lr': 0.0004187509955938434, 'samples': 7890048, 'steps': 41093, 'loss/train': 1.279302954673767} -08/30/2021 20:35:02 - INFO - __main__ - Step 41095: {'lr': 0.0004187470801651013, 'samples': 7890240, 'steps': 41094, 'loss/train': 1.1253182888031006} -08/30/2021 20:35:02 - INFO - __main__ - Step 41096: {'lr': 0.0004187431646603245, 'samples': 7890432, 'steps': 41095, 'loss/train': 1.3879632949829102} -08/30/2021 20:35:04 - INFO - __main__ - Step 41097: {'lr': 0.0004187392490795146, 'samples': 7890624, 'steps': 41096, 'loss/train': 1.0568162202835083} -08/30/2021 20:35:04 - INFO - __main__ - Step 41098: {'lr': 0.00041873533342267336, 'samples': 7890816, 'steps': 41097, 'loss/train': 0.3235325813293457} -08/30/2021 20:35:05 - INFO - __main__ - Step 41099: {'lr': 0.0004187314176898026, 'samples': 7891008, 'steps': 41098, 'loss/train': 2.0620148181915283} -08/30/2021 20:35:05 - INFO - __main__ - Step 41100: {'lr': 0.000418727501880904, 'samples': 7891200, 'steps': 41099, 'loss/train': 1.509527325630188} -08/30/2021 20:35:05 - INFO - __main__ - Step 41101: {'lr': 0.00041872358599597947, 'samples': 7891392, 'steps': 41100, 'loss/train': 1.011954426765442} -08/30/2021 20:35:07 - INFO - __main__ - Step 41102: {'lr': 0.00041871967003503073, 'samples': 7891584, 'steps': 41101, 'loss/train': 1.260717749595642} -08/30/2021 20:35:07 - INFO - __main__ - Step 41103: {'lr': 0.00041871575399805947, 'samples': 7891776, 'steps': 41102, 'loss/train': 0.8088870644569397} -08/30/2021 20:35:08 - INFO - __main__ - Step 41104: {'lr': 0.0004187118378850674, 'samples': 7891968, 'steps': 41103, 'loss/train': 1.5420666933059692} -08/30/2021 20:35:08 - INFO - __main__ - Step 41105: {'lr': 0.00041870792169605654, 'samples': 7892160, 'steps': 41104, 'loss/train': 2.1212775707244873} -08/30/2021 20:35:08 - INFO - __main__ - Step 41106: {'lr': 0.0004187040054310284, 'samples': 7892352, 'steps': 41105, 'loss/train': 1.63030207157135} -08/30/2021 20:35:10 - INFO - __main__ - Step 41107: {'lr': 0.0004187000890899848, 'samples': 7892544, 'steps': 41106, 'loss/train': 1.4593793153762817} -08/30/2021 20:35:11 - INFO - __main__ - Step 41108: {'lr': 0.0004186961726729276, 'samples': 7892736, 'steps': 41107, 'loss/train': 1.0815961360931396} -08/30/2021 20:35:11 - INFO - __main__ - Step 41109: {'lr': 0.0004186922561798585, 'samples': 7892928, 'steps': 41108, 'loss/train': 1.1557074785232544} -08/30/2021 20:35:12 - INFO - __main__ - Step 41110: {'lr': 0.00041868833961077935, 'samples': 7893120, 'steps': 41109, 'loss/train': 1.4992958307266235} -08/30/2021 20:35:12 - INFO - __main__ - Step 41111: {'lr': 0.0004186844229656917, 'samples': 7893312, 'steps': 41110, 'loss/train': 1.2947490215301514} -08/30/2021 20:35:12 - INFO - __main__ - Step 41112: {'lr': 0.0004186805062445975, 'samples': 7893504, 'steps': 41111, 'loss/train': 1.4569388628005981} -08/30/2021 20:35:13 - INFO - __main__ - Step 41113: {'lr': 0.00041867658944749856, 'samples': 7893696, 'steps': 41112, 'loss/train': 0.7800092697143555} -08/30/2021 20:35:14 - INFO - __main__ - Step 41114: {'lr': 0.00041867267257439644, 'samples': 7893888, 'steps': 41113, 'loss/train': 0.17996972799301147} -08/30/2021 20:35:15 - INFO - __main__ - Step 41115: {'lr': 0.00041866875562529305, 'samples': 7894080, 'steps': 41114, 'loss/train': 1.33939528465271} -08/30/2021 20:35:15 - INFO - __main__ - Step 41116: {'lr': 0.0004186648386001901, 'samples': 7894272, 'steps': 41115, 'loss/train': 0.7180574536323547} -08/30/2021 20:35:15 - INFO - __main__ - Step 41117: {'lr': 0.0004186609214990894, 'samples': 7894464, 'steps': 41116, 'loss/train': 2.001742362976074} -08/30/2021 20:35:16 - INFO - __main__ - Step 41118: {'lr': 0.0004186570043219927, 'samples': 7894656, 'steps': 41117, 'loss/train': 2.100369453430176} -08/30/2021 20:35:18 - INFO - __main__ - Step 41119: {'lr': 0.0004186530870689017, 'samples': 7894848, 'steps': 41118, 'loss/train': 1.9339611530303955} -08/30/2021 20:35:18 - INFO - __main__ - Step 41120: {'lr': 0.00041864916973981833, 'samples': 7895040, 'steps': 41119, 'loss/train': 1.5928391218185425} -08/30/2021 20:35:19 - INFO - __main__ - Step 41121: {'lr': 0.0004186452523347442, 'samples': 7895232, 'steps': 41120, 'loss/train': 1.2443376779556274} -08/30/2021 20:35:19 - INFO - __main__ - Step 41122: {'lr': 0.00041864133485368106, 'samples': 7895424, 'steps': 41121, 'loss/train': 1.0927437543869019} -08/30/2021 20:35:19 - INFO - __main__ - Step 41123: {'lr': 0.0004186374172966308, 'samples': 7895616, 'steps': 41122, 'loss/train': 1.3871151208877563} -08/30/2021 20:35:21 - INFO - __main__ - Step 41124: {'lr': 0.0004186334996635951, 'samples': 7895808, 'steps': 41123, 'loss/train': 1.2048654556274414} -08/30/2021 20:35:21 - INFO - __main__ - Step 41125: {'lr': 0.00041862958195457574, 'samples': 7896000, 'steps': 41124, 'loss/train': 1.8102298974990845} -08/30/2021 20:35:22 - INFO - __main__ - Step 41126: {'lr': 0.0004186256641695745, 'samples': 7896192, 'steps': 41125, 'loss/train': 1.4453532695770264} -08/30/2021 20:35:22 - INFO - __main__ - Step 41127: {'lr': 0.00041862174630859315, 'samples': 7896384, 'steps': 41126, 'loss/train': 1.3289623260498047} -08/30/2021 20:35:22 - INFO - __main__ - Step 41128: {'lr': 0.0004186178283716334, 'samples': 7896576, 'steps': 41127, 'loss/train': 1.6302162408828735} -08/30/2021 20:35:24 - INFO - __main__ - Step 41129: {'lr': 0.0004186139103586971, 'samples': 7896768, 'steps': 41128, 'loss/train': 0.8472530245780945} -08/30/2021 20:35:24 - INFO - __main__ - Step 41130: {'lr': 0.00041860999226978605, 'samples': 7896960, 'steps': 41129, 'loss/train': 1.3820165395736694} -08/30/2021 20:35:25 - INFO - __main__ - Step 41131: {'lr': 0.0004186060741049018, 'samples': 7897152, 'steps': 41130, 'loss/train': 1.2151693105697632} -08/30/2021 20:35:25 - INFO - __main__ - Step 41132: {'lr': 0.00041860215586404624, 'samples': 7897344, 'steps': 41131, 'loss/train': 1.4448633193969727} -08/30/2021 20:35:25 - INFO - __main__ - Step 41133: {'lr': 0.00041859823754722127, 'samples': 7897536, 'steps': 41132, 'loss/train': 1.6656172275543213} -08/30/2021 20:35:27 - INFO - __main__ - Step 41134: {'lr': 0.00041859431915442847, 'samples': 7897728, 'steps': 41133, 'loss/train': 1.26059889793396} -08/30/2021 20:35:28 - INFO - __main__ - Step 41135: {'lr': 0.0004185904006856697, 'samples': 7897920, 'steps': 41134, 'loss/train': 2.2405757904052734} -08/30/2021 20:35:28 - INFO - __main__ - Step 41136: {'lr': 0.0004185864821409467, 'samples': 7898112, 'steps': 41135, 'loss/train': 1.5884689092636108} -08/30/2021 20:35:28 - INFO - __main__ - Step 41137: {'lr': 0.00041858256352026124, 'samples': 7898304, 'steps': 41136, 'loss/train': 1.6267186403274536} -08/30/2021 20:35:29 - INFO - __main__ - Step 41138: {'lr': 0.0004185786448236151, 'samples': 7898496, 'steps': 41137, 'loss/train': 0.18343879282474518} -08/30/2021 20:35:30 - INFO - __main__ - Step 41139: {'lr': 0.0004185747260510099, 'samples': 7898688, 'steps': 41138, 'loss/train': 1.2509409189224243} -08/30/2021 20:35:30 - INFO - __main__ - Step 41140: {'lr': 0.0004185708072024476, 'samples': 7898880, 'steps': 41139, 'loss/train': 1.298266053199768} -08/30/2021 20:35:31 - INFO - __main__ - Step 41141: {'lr': 0.0004185668882779299, 'samples': 7899072, 'steps': 41140, 'loss/train': 1.5813754796981812} -08/30/2021 20:35:31 - INFO - __main__ - Step 41142: {'lr': 0.00041856296927745857, 'samples': 7899264, 'steps': 41141, 'loss/train': 1.2210720777511597} -08/30/2021 20:35:32 - INFO - __main__ - Step 41143: {'lr': 0.00041855905020103543, 'samples': 7899456, 'steps': 41142, 'loss/train': 1.44577956199646} -08/30/2021 20:35:33 - INFO - __main__ - Step 41144: {'lr': 0.00041855513104866203, 'samples': 7899648, 'steps': 41143, 'loss/train': 1.6004148721694946} -08/30/2021 20:35:33 - INFO - __main__ - Step 41145: {'lr': 0.00041855121182034037, 'samples': 7899840, 'steps': 41144, 'loss/train': 1.6002393960952759} -08/30/2021 20:35:34 - INFO - __main__ - Step 41146: {'lr': 0.00041854729251607214, 'samples': 7900032, 'steps': 41145, 'loss/train': 1.4809231758117676} -08/30/2021 20:35:34 - INFO - __main__ - Step 41147: {'lr': 0.00041854337313585913, 'samples': 7900224, 'steps': 41146, 'loss/train': 1.6612613201141357} -08/30/2021 20:35:35 - INFO - __main__ - Step 41148: {'lr': 0.000418539453679703, 'samples': 7900416, 'steps': 41147, 'loss/train': 1.6361193656921387} -08/30/2021 20:35:35 - INFO - __main__ - Step 41149: {'lr': 0.0004185355341476057, 'samples': 7900608, 'steps': 41148, 'loss/train': 0.9765746593475342} -08/30/2021 20:35:36 - INFO - __main__ - Step 41150: {'lr': 0.00041853161453956885, 'samples': 7900800, 'steps': 41149, 'loss/train': 1.0844651460647583} -08/30/2021 20:35:37 - INFO - __main__ - Step 41151: {'lr': 0.0004185276948555942, 'samples': 7900992, 'steps': 41150, 'loss/train': 0.9594156742095947} -08/30/2021 20:35:37 - INFO - __main__ - Step 41152: {'lr': 0.0004185237750956836, 'samples': 7901184, 'steps': 41151, 'loss/train': 1.0592890977859497} -08/30/2021 20:35:37 - INFO - __main__ - Step 41153: {'lr': 0.0004185198552598388, 'samples': 7901376, 'steps': 41152, 'loss/train': 1.8063973188400269} -08/30/2021 20:35:38 - INFO - __main__ - Step 41154: {'lr': 0.00041851593534806154, 'samples': 7901568, 'steps': 41153, 'loss/train': 1.9475303888320923} -08/30/2021 20:35:39 - INFO - __main__ - Step 41155: {'lr': 0.0004185120153603536, 'samples': 7901760, 'steps': 41154, 'loss/train': 1.7926287651062012} -08/30/2021 20:35:40 - INFO - __main__ - Step 41156: {'lr': 0.0004185080952967168, 'samples': 7901952, 'steps': 41155, 'loss/train': 1.501604676246643} -08/30/2021 20:35:40 - INFO - __main__ - Step 41157: {'lr': 0.00041850417515715277, 'samples': 7902144, 'steps': 41156, 'loss/train': 1.3695975542068481} -08/30/2021 20:35:40 - INFO - __main__ - Step 41158: {'lr': 0.00041850025494166346, 'samples': 7902336, 'steps': 41157, 'loss/train': 1.0999211072921753} -08/30/2021 20:35:41 - INFO - __main__ - Step 41159: {'lr': 0.0004184963346502504, 'samples': 7902528, 'steps': 41158, 'loss/train': 1.0254195928573608} -08/30/2021 20:35:42 - INFO - __main__ - Step 41160: {'lr': 0.00041849241428291555, 'samples': 7902720, 'steps': 41159, 'loss/train': 1.5622034072875977} -08/30/2021 20:35:43 - INFO - __main__ - Step 41161: {'lr': 0.00041848849383966063, 'samples': 7902912, 'steps': 41160, 'loss/train': 1.7479673624038696} -08/30/2021 20:35:43 - INFO - __main__ - Step 41162: {'lr': 0.0004184845733204874, 'samples': 7903104, 'steps': 41161, 'loss/train': 1.334159016609192} -08/30/2021 20:35:43 - INFO - __main__ - Step 41163: {'lr': 0.00041848065272539765, 'samples': 7903296, 'steps': 41162, 'loss/train': 1.4729894399642944} -08/30/2021 20:35:44 - INFO - __main__ - Step 41164: {'lr': 0.00041847673205439305, 'samples': 7903488, 'steps': 41163, 'loss/train': 1.6320799589157104} -08/30/2021 20:35:46 - INFO - __main__ - Step 41165: {'lr': 0.0004184728113074755, 'samples': 7903680, 'steps': 41164, 'loss/train': 1.4478167295455933} -08/30/2021 20:35:46 - INFO - __main__ - Step 41166: {'lr': 0.00041846889048464665, 'samples': 7903872, 'steps': 41165, 'loss/train': 1.0429561138153076} -08/30/2021 20:35:46 - INFO - __main__ - Step 41167: {'lr': 0.0004184649695859083, 'samples': 7904064, 'steps': 41166, 'loss/train': 1.8019750118255615} -08/30/2021 20:35:47 - INFO - __main__ - Step 41168: {'lr': 0.00041846104861126233, 'samples': 7904256, 'steps': 41167, 'loss/train': 1.6707919836044312} -08/30/2021 20:35:47 - INFO - __main__ - Step 41169: {'lr': 0.0004184571275607103, 'samples': 7904448, 'steps': 41168, 'loss/train': 1.258258581161499} -08/30/2021 20:35:49 - INFO - __main__ - Step 41170: {'lr': 0.0004184532064342542, 'samples': 7904640, 'steps': 41169, 'loss/train': 1.4854133129119873} -08/30/2021 20:35:49 - INFO - __main__ - Step 41171: {'lr': 0.0004184492852318956, 'samples': 7904832, 'steps': 41170, 'loss/train': 1.4144489765167236} -08/30/2021 20:35:49 - INFO - __main__ - Step 41172: {'lr': 0.00041844536395363636, 'samples': 7905024, 'steps': 41171, 'loss/train': 1.8512024879455566} -08/30/2021 20:35:50 - INFO - __main__ - Step 41173: {'lr': 0.00041844144259947825, 'samples': 7905216, 'steps': 41172, 'loss/train': 1.0345797538757324} -08/30/2021 20:35:50 - INFO - __main__ - Step 41174: {'lr': 0.000418437521169423, 'samples': 7905408, 'steps': 41173, 'loss/train': 1.175742268562317} -08/30/2021 20:35:52 - INFO - __main__ - Step 41175: {'lr': 0.0004184335996634725, 'samples': 7905600, 'steps': 41174, 'loss/train': 1.855373501777649} -08/30/2021 20:35:52 - INFO - __main__ - Step 41176: {'lr': 0.00041842967808162834, 'samples': 7905792, 'steps': 41175, 'loss/train': 1.1694527864456177} -08/30/2021 20:35:52 - INFO - __main__ - Step 41177: {'lr': 0.0004184257564238924, 'samples': 7905984, 'steps': 41176, 'loss/train': 1.225437045097351} -08/30/2021 20:35:53 - INFO - __main__ - Step 41178: {'lr': 0.0004184218346902663, 'samples': 7906176, 'steps': 41177, 'loss/train': 1.5754886865615845} -08/30/2021 20:35:53 - INFO - __main__ - Step 41179: {'lr': 0.00041841791288075203, 'samples': 7906368, 'steps': 41178, 'loss/train': 1.413666009902954} -08/30/2021 20:35:53 - INFO - __main__ - Step 41180: {'lr': 0.0004184139909953513, 'samples': 7906560, 'steps': 41179, 'loss/train': 1.5631316900253296} -08/30/2021 20:35:55 - INFO - __main__ - Step 41181: {'lr': 0.0004184100690340657, 'samples': 7906752, 'steps': 41180, 'loss/train': 1.9184987545013428} -08/30/2021 20:35:56 - INFO - __main__ - Step 41182: {'lr': 0.00041840614699689715, 'samples': 7906944, 'steps': 41181, 'loss/train': 1.3525869846343994} -08/30/2021 20:35:56 - INFO - __main__ - Step 41183: {'lr': 0.00041840222488384745, 'samples': 7907136, 'steps': 41182, 'loss/train': 1.8391982316970825} -08/30/2021 20:35:57 - INFO - __main__ - Step 41184: {'lr': 0.00041839830269491823, 'samples': 7907328, 'steps': 41183, 'loss/train': 1.794416069984436} -08/30/2021 20:35:57 - INFO - __main__ - Step 41185: {'lr': 0.0004183943804301114, 'samples': 7907520, 'steps': 41184, 'loss/train': 0.9707196950912476} -08/30/2021 20:35:58 - INFO - __main__ - Step 41186: {'lr': 0.0004183904580894287, 'samples': 7907712, 'steps': 41185, 'loss/train': 1.2880208492279053} -08/30/2021 20:35:59 - INFO - __main__ - Step 41187: {'lr': 0.0004183865356728717, 'samples': 7907904, 'steps': 41186, 'loss/train': 1.4405531883239746} -08/30/2021 20:35:59 - INFO - __main__ - Step 41188: {'lr': 0.0004183826131804424, 'samples': 7908096, 'steps': 41187, 'loss/train': 1.4917259216308594} -08/30/2021 20:36:00 - INFO - __main__ - Step 41189: {'lr': 0.0004183786906121425, 'samples': 7908288, 'steps': 41188, 'loss/train': 1.5126454830169678} -08/30/2021 20:36:00 - INFO - __main__ - Step 41190: {'lr': 0.0004183747679679738, 'samples': 7908480, 'steps': 41189, 'loss/train': 1.4933738708496094} -08/30/2021 20:36:01 - INFO - __main__ - Step 41191: {'lr': 0.000418370845247938, 'samples': 7908672, 'steps': 41190, 'loss/train': 1.5166252851486206} -08/30/2021 20:36:02 - INFO - __main__ - Step 41192: {'lr': 0.0004183669224520369, 'samples': 7908864, 'steps': 41191, 'loss/train': 1.0033994913101196} -08/30/2021 20:36:02 - INFO - __main__ - Step 41193: {'lr': 0.00041836299958027226, 'samples': 7909056, 'steps': 41192, 'loss/train': 1.684597373008728} -08/30/2021 20:36:03 - INFO - __main__ - Step 41194: {'lr': 0.00041835907663264585, 'samples': 7909248, 'steps': 41193, 'loss/train': 1.4224045276641846} -08/30/2021 20:36:03 - INFO - __main__ - Step 41195: {'lr': 0.0004183551536091594, 'samples': 7909440, 'steps': 41194, 'loss/train': 1.156130313873291} -08/30/2021 20:36:05 - INFO - __main__ - Step 41196: {'lr': 0.00041835123050981476, 'samples': 7909632, 'steps': 41195, 'loss/train': 1.3038029670715332} -08/30/2021 20:36:05 - INFO - __main__ - Step 41197: {'lr': 0.00041834730733461366, 'samples': 7909824, 'steps': 41196, 'loss/train': 1.849747896194458} -08/30/2021 20:36:05 - INFO - __main__ - Step 41198: {'lr': 0.0004183433840835578, 'samples': 7910016, 'steps': 41197, 'loss/train': 1.677782416343689} -08/30/2021 20:36:06 - INFO - __main__ - Step 41199: {'lr': 0.0004183394607566491, 'samples': 7910208, 'steps': 41198, 'loss/train': 1.5658795833587646} -08/30/2021 20:36:06 - INFO - __main__ - Step 41200: {'lr': 0.0004183355373538892, 'samples': 7910400, 'steps': 41199, 'loss/train': 1.3178255558013916} -08/30/2021 20:36:07 - INFO - __main__ - Step 41201: {'lr': 0.00041833161387527985, 'samples': 7910592, 'steps': 41200, 'loss/train': 2.0289249420166016} -08/30/2021 20:36:08 - INFO - __main__ - Step 41202: {'lr': 0.0004183276903208228, 'samples': 7910784, 'steps': 41201, 'loss/train': 1.6866228580474854} -08/30/2021 20:36:08 - INFO - __main__ - Step 41203: {'lr': 0.0004183237666905201, 'samples': 7910976, 'steps': 41202, 'loss/train': 2.2124955654144287} -08/30/2021 20:36:09 - INFO - __main__ - Step 41204: {'lr': 0.0004183198429843732, 'samples': 7911168, 'steps': 41203, 'loss/train': 1.5908187627792358} -08/30/2021 20:36:09 - INFO - __main__ - Step 41205: {'lr': 0.00041831591920238396, 'samples': 7911360, 'steps': 41204, 'loss/train': 1.152055025100708} -08/30/2021 20:36:09 - INFO - __main__ - Step 41206: {'lr': 0.0004183119953445542, 'samples': 7911552, 'steps': 41205, 'loss/train': 1.8606780767440796} -08/30/2021 20:36:11 - INFO - __main__ - Step 41207: {'lr': 0.00041830807141088566, 'samples': 7911744, 'steps': 41206, 'loss/train': 1.3945108652114868} -08/30/2021 20:36:11 - INFO - __main__ - Step 41208: {'lr': 0.0004183041474013801, 'samples': 7911936, 'steps': 41207, 'loss/train': 1.9925767183303833} -08/30/2021 20:36:12 - INFO - __main__ - Step 41209: {'lr': 0.00041830022331603925, 'samples': 7912128, 'steps': 41208, 'loss/train': 1.4634283781051636} -08/30/2021 20:36:12 - INFO - __main__ - Step 41210: {'lr': 0.000418296299154865, 'samples': 7912320, 'steps': 41209, 'loss/train': 0.9838194847106934} -08/30/2021 20:36:13 - INFO - __main__ - Step 41211: {'lr': 0.000418292374917859, 'samples': 7912512, 'steps': 41210, 'loss/train': 0.11574981361627579} -08/30/2021 20:36:14 - INFO - __main__ - Step 41212: {'lr': 0.00041828845060502297, 'samples': 7912704, 'steps': 41211, 'loss/train': 1.3025445938110352} -08/30/2021 20:36:14 - INFO - __main__ - Step 41213: {'lr': 0.00041828452621635884, 'samples': 7912896, 'steps': 41212, 'loss/train': 1.4020315408706665} -08/30/2021 20:36:15 - INFO - __main__ - Step 41214: {'lr': 0.0004182806017518682, 'samples': 7913088, 'steps': 41213, 'loss/train': 1.5939383506774902} -08/30/2021 20:36:15 - INFO - __main__ - Step 41215: {'lr': 0.00041827667721155303, 'samples': 7913280, 'steps': 41214, 'loss/train': 1.310970425605774} -08/30/2021 20:36:16 - INFO - __main__ - Step 41216: {'lr': 0.000418272752595415, 'samples': 7913472, 'steps': 41215, 'loss/train': 1.8270729780197144} -08/30/2021 20:36:17 - INFO - __main__ - Step 41217: {'lr': 0.00041826882790345577, 'samples': 7913664, 'steps': 41216, 'loss/train': 1.6407090425491333} -08/30/2021 20:36:18 - INFO - __main__ - Step 41218: {'lr': 0.00041826490313567725, 'samples': 7913856, 'steps': 41217, 'loss/train': 1.4719997644424438} -08/30/2021 20:36:18 - INFO - __main__ - Step 41219: {'lr': 0.0004182609782920812, 'samples': 7914048, 'steps': 41218, 'loss/train': 1.364977240562439} -08/30/2021 20:36:18 - INFO - __main__ - Step 41220: {'lr': 0.0004182570533726693, 'samples': 7914240, 'steps': 41219, 'loss/train': 1.3081600666046143} -08/30/2021 20:36:19 - INFO - __main__ - Step 41221: {'lr': 0.00041825312837744333, 'samples': 7914432, 'steps': 41220, 'loss/train': 1.5823677778244019} -08/30/2021 20:36:19 - INFO - __main__ - Step 41222: {'lr': 0.00041824920330640517, 'samples': 7914624, 'steps': 41221, 'loss/train': 1.9655245542526245} -08/30/2021 20:36:21 - INFO - __main__ - Step 41223: {'lr': 0.0004182452781595565, 'samples': 7914816, 'steps': 41222, 'loss/train': 1.5999000072479248} -08/30/2021 20:36:21 - INFO - __main__ - Step 41224: {'lr': 0.0004182413529368991, 'samples': 7915008, 'steps': 41223, 'loss/train': 1.6796811819076538} -08/30/2021 20:36:21 - INFO - __main__ - Step 41225: {'lr': 0.0004182374276384347, 'samples': 7915200, 'steps': 41224, 'loss/train': 1.036651372909546} -08/30/2021 20:36:22 - INFO - __main__ - Step 41226: {'lr': 0.0004182335022641651, 'samples': 7915392, 'steps': 41225, 'loss/train': 0.069374680519104} -08/30/2021 20:36:22 - INFO - __main__ - Step 41227: {'lr': 0.00041822957681409215, 'samples': 7915584, 'steps': 41226, 'loss/train': 1.2115402221679688} -08/30/2021 20:36:24 - INFO - __main__ - Step 41228: {'lr': 0.00041822565128821757, 'samples': 7915776, 'steps': 41227, 'loss/train': 2.117685079574585} -08/30/2021 20:36:24 - INFO - __main__ - Step 41229: {'lr': 0.00041822172568654306, 'samples': 7915968, 'steps': 41228, 'loss/train': 1.4366461038589478} -08/30/2021 20:36:24 - INFO - __main__ - Step 41230: {'lr': 0.0004182178000090704, 'samples': 7916160, 'steps': 41229, 'loss/train': 1.3132134675979614} -08/30/2021 20:36:25 - INFO - __main__ - Step 41231: {'lr': 0.0004182138742558015, 'samples': 7916352, 'steps': 41230, 'loss/train': 1.5946420431137085} -08/30/2021 20:36:25 - INFO - __main__ - Step 41232: {'lr': 0.00041820994842673787, 'samples': 7916544, 'steps': 41231, 'loss/train': 1.184988021850586} -08/30/2021 20:36:27 - INFO - __main__ - Step 41233: {'lr': 0.00041820602252188156, 'samples': 7916736, 'steps': 41232, 'loss/train': 1.5236599445343018} -08/30/2021 20:36:27 - INFO - __main__ - Step 41234: {'lr': 0.00041820209654123416, 'samples': 7916928, 'steps': 41233, 'loss/train': 0.06497249752283096} -08/30/2021 20:36:28 - INFO - __main__ - Step 41235: {'lr': 0.00041819817048479745, 'samples': 7917120, 'steps': 41234, 'loss/train': 2.5339417457580566} -08/30/2021 20:36:28 - INFO - __main__ - Step 41236: {'lr': 0.0004181942443525734, 'samples': 7917312, 'steps': 41235, 'loss/train': 1.3345385789871216} -08/30/2021 20:36:28 - INFO - __main__ - Step 41237: {'lr': 0.00041819031814456346, 'samples': 7917504, 'steps': 41236, 'loss/train': 1.2078496217727661} -08/30/2021 20:36:29 - INFO - __main__ - Step 41238: {'lr': 0.0004181863918607696, 'samples': 7917696, 'steps': 41237, 'loss/train': 2.0453271865844727} -08/30/2021 20:36:31 - INFO - __main__ - Step 41239: {'lr': 0.00041818246550119354, 'samples': 7917888, 'steps': 41238, 'loss/train': 0.9403941035270691} -08/30/2021 20:36:31 - INFO - __main__ - Step 41240: {'lr': 0.00041817853906583706, 'samples': 7918080, 'steps': 41239, 'loss/train': 1.2611885070800781} -08/30/2021 20:36:31 - INFO - __main__ - Step 41241: {'lr': 0.000418174612554702, 'samples': 7918272, 'steps': 41240, 'loss/train': 1.3527159690856934} -08/30/2021 20:36:32 - INFO - __main__ - Step 41242: {'lr': 0.00041817068596778994, 'samples': 7918464, 'steps': 41241, 'loss/train': 1.6246562004089355} -08/30/2021 20:36:32 - INFO - __main__ - Step 41243: {'lr': 0.0004181667593051028, 'samples': 7918656, 'steps': 41242, 'loss/train': 1.3783191442489624} -08/30/2021 20:36:34 - INFO - __main__ - Step 41244: {'lr': 0.0004181628325666424, 'samples': 7918848, 'steps': 41243, 'loss/train': 1.810223937034607} -08/30/2021 20:36:34 - INFO - __main__ - Step 41245: {'lr': 0.0004181589057524103, 'samples': 7919040, 'steps': 41244, 'loss/train': 1.1112293004989624} -08/30/2021 20:36:35 - INFO - __main__ - Step 41246: {'lr': 0.0004181549788624085, 'samples': 7919232, 'steps': 41245, 'loss/train': 1.631000280380249} -08/30/2021 20:36:35 - INFO - __main__ - Step 41247: {'lr': 0.0004181510518966386, 'samples': 7919424, 'steps': 41246, 'loss/train': 1.891631007194519} -08/30/2021 20:36:35 - INFO - __main__ - Step 41248: {'lr': 0.00041814712485510245, 'samples': 7919616, 'steps': 41247, 'loss/train': 1.438342809677124} -08/30/2021 20:36:36 - INFO - __main__ - Step 41249: {'lr': 0.0004181431977378017, 'samples': 7919808, 'steps': 41248, 'loss/train': 1.6112282276153564} -08/30/2021 20:36:37 - INFO - __main__ - Step 41250: {'lr': 0.00041813927054473835, 'samples': 7920000, 'steps': 41249, 'loss/train': 1.4170291423797607} -08/30/2021 20:36:38 - INFO - __main__ - Step 41251: {'lr': 0.000418135343275914, 'samples': 7920192, 'steps': 41250, 'loss/train': 1.076360821723938} -08/30/2021 20:36:38 - INFO - __main__ - Step 41252: {'lr': 0.0004181314159313305, 'samples': 7920384, 'steps': 41251, 'loss/train': 1.6936711072921753} -08/30/2021 20:36:38 - INFO - __main__ - Step 41253: {'lr': 0.0004181274885109895, 'samples': 7920576, 'steps': 41252, 'loss/train': 1.1377519369125366} -08/30/2021 20:36:39 - INFO - __main__ - Step 41254: {'lr': 0.0004181235610148929, 'samples': 7920768, 'steps': 41253, 'loss/train': 1.7415578365325928} -08/30/2021 20:36:40 - INFO - __main__ - Step 41255: {'lr': 0.0004181196334430424, 'samples': 7920960, 'steps': 41254, 'loss/train': 1.8357971906661987} -08/30/2021 20:36:41 - INFO - __main__ - Step 41256: {'lr': 0.00041811570579543977, 'samples': 7921152, 'steps': 41255, 'loss/train': 1.1603772640228271} -08/30/2021 20:36:41 - INFO - __main__ - Step 41257: {'lr': 0.0004181117780720868, 'samples': 7921344, 'steps': 41256, 'loss/train': 1.2881780862808228} -08/30/2021 20:36:41 - INFO - __main__ - Step 41258: {'lr': 0.00041810785027298524, 'samples': 7921536, 'steps': 41257, 'loss/train': 1.499526023864746} -08/30/2021 20:36:42 - INFO - __main__ - Step 41259: {'lr': 0.00041810392239813695, 'samples': 7921728, 'steps': 41258, 'loss/train': 1.756121277809143} -08/30/2021 20:36:43 - INFO - __main__ - Step 41260: {'lr': 0.00041809999444754353, 'samples': 7921920, 'steps': 41259, 'loss/train': 1.7205058336257935} -08/30/2021 20:36:44 - INFO - __main__ - Step 41261: {'lr': 0.0004180960664212069, 'samples': 7922112, 'steps': 41260, 'loss/train': 1.3784785270690918} -08/30/2021 20:36:44 - INFO - __main__ - Step 41262: {'lr': 0.00041809213831912884, 'samples': 7922304, 'steps': 41261, 'loss/train': 1.8103562593460083} -08/30/2021 20:36:44 - INFO - __main__ - Step 41263: {'lr': 0.0004180882101413109, 'samples': 7922496, 'steps': 41262, 'loss/train': 1.4028496742248535} -08/30/2021 20:36:45 - INFO - __main__ - Step 41264: {'lr': 0.00041808428188775515, 'samples': 7922688, 'steps': 41263, 'loss/train': 1.2405023574829102} -08/30/2021 20:36:45 - INFO - __main__ - Step 41265: {'lr': 0.0004180803535584632, 'samples': 7922880, 'steps': 41264, 'loss/train': 1.0862245559692383} -08/30/2021 20:36:47 - INFO - __main__ - Step 41266: {'lr': 0.0004180764251534368, 'samples': 7923072, 'steps': 41265, 'loss/train': 0.8103510141372681} -08/30/2021 20:36:47 - INFO - __main__ - Step 41267: {'lr': 0.0004180724966726778, 'samples': 7923264, 'steps': 41266, 'loss/train': 0.6353318095207214} -08/30/2021 20:36:47 - INFO - __main__ - Step 41268: {'lr': 0.00041806856811618784, 'samples': 7923456, 'steps': 41267, 'loss/train': 1.0904096364974976} -08/30/2021 20:36:48 - INFO - __main__ - Step 41269: {'lr': 0.00041806463948396876, 'samples': 7923648, 'steps': 41268, 'loss/train': 0.03769872710108757} -08/30/2021 20:36:48 - INFO - __main__ - Step 41270: {'lr': 0.0004180607107760225, 'samples': 7923840, 'steps': 41269, 'loss/train': 1.3871409893035889} -08/30/2021 20:36:50 - INFO - __main__ - Step 41271: {'lr': 0.0004180567819923505, 'samples': 7924032, 'steps': 41270, 'loss/train': 1.689682126045227} -08/30/2021 20:36:51 - INFO - __main__ - Step 41272: {'lr': 0.0004180528531329548, 'samples': 7924224, 'steps': 41271, 'loss/train': 1.1208053827285767} -08/30/2021 20:36:51 - INFO - __main__ - Step 41273: {'lr': 0.00041804892419783715, 'samples': 7924416, 'steps': 41272, 'loss/train': 1.3321681022644043} -08/30/2021 20:36:51 - INFO - __main__ - Step 41274: {'lr': 0.0004180449951869991, 'samples': 7924608, 'steps': 41273, 'loss/train': 2.166050672531128} -08/30/2021 20:36:52 - INFO - __main__ - Step 41275: {'lr': 0.00041804106610044263, 'samples': 7924800, 'steps': 41274, 'loss/train': 1.4557514190673828} -08/30/2021 20:36:52 - INFO - __main__ - Step 41276: {'lr': 0.00041803713693816947, 'samples': 7924992, 'steps': 41275, 'loss/train': 1.561365008354187} -08/30/2021 20:36:53 - INFO - __main__ - Step 41277: {'lr': 0.0004180332077001814, 'samples': 7925184, 'steps': 41276, 'loss/train': 1.3182331323623657} -08/30/2021 20:36:54 - INFO - __main__ - Step 41278: {'lr': 0.0004180292783864801, 'samples': 7925376, 'steps': 41277, 'loss/train': 0.9406395554542542} -08/30/2021 20:36:54 - INFO - __main__ - Step 41279: {'lr': 0.00041802534899706734, 'samples': 7925568, 'steps': 41278, 'loss/train': 1.492274522781372} -08/30/2021 20:36:55 - INFO - __main__ - Step 41280: {'lr': 0.0004180214195319451, 'samples': 7925760, 'steps': 41279, 'loss/train': 0.9967102408409119} -08/30/2021 20:36:55 - INFO - __main__ - Step 41281: {'lr': 0.00041801748999111487, 'samples': 7925952, 'steps': 41280, 'loss/train': 3.0506930351257324} -08/30/2021 20:36:57 - INFO - __main__ - Step 41282: {'lr': 0.0004180135603745786, 'samples': 7926144, 'steps': 41281, 'loss/train': 2.5706984996795654} -08/30/2021 20:36:57 - INFO - __main__ - Step 41283: {'lr': 0.000418009630682338, 'samples': 7926336, 'steps': 41282, 'loss/train': 1.1314271688461304} -08/30/2021 20:36:57 - INFO - __main__ - Step 41284: {'lr': 0.00041800570091439493, 'samples': 7926528, 'steps': 41283, 'loss/train': 0.8926066160202026} -08/30/2021 20:36:58 - INFO - __main__ - Step 41285: {'lr': 0.000418001771070751, 'samples': 7926720, 'steps': 41284, 'loss/train': 1.5769743919372559} -08/30/2021 20:36:58 - INFO - __main__ - Step 41286: {'lr': 0.0004179978411514081, 'samples': 7926912, 'steps': 41285, 'loss/train': 0.6704384088516235} -08/30/2021 20:37:00 - INFO - __main__ - Step 41287: {'lr': 0.000417993911156368, 'samples': 7927104, 'steps': 41286, 'loss/train': 1.2842239141464233} -08/30/2021 20:37:00 - INFO - __main__ - Step 41288: {'lr': 0.00041798998108563234, 'samples': 7927296, 'steps': 41287, 'loss/train': 1.8976343870162964} -08/30/2021 20:37:01 - INFO - __main__ - Step 41289: {'lr': 0.00041798605093920307, 'samples': 7927488, 'steps': 41288, 'loss/train': 1.4811615943908691} -08/30/2021 20:37:01 - INFO - __main__ - Step 41290: {'lr': 0.00041798212071708185, 'samples': 7927680, 'steps': 41289, 'loss/train': 1.5192782878875732} -08/30/2021 20:37:02 - INFO - __main__ - Step 41291: {'lr': 0.0004179781904192704, 'samples': 7927872, 'steps': 41290, 'loss/train': 1.0847587585449219} -08/30/2021 20:37:02 - INFO - __main__ - Step 41292: {'lr': 0.00041797426004577066, 'samples': 7928064, 'steps': 41291, 'loss/train': 1.0678871870040894} -08/30/2021 20:37:05 - INFO - __main__ - Step 41293: {'lr': 0.00041797032959658433, 'samples': 7928256, 'steps': 41292, 'loss/train': 0.04964858293533325} -08/30/2021 20:37:05 - INFO - __main__ - Step 41294: {'lr': 0.0004179663990717131, 'samples': 7928448, 'steps': 41293, 'loss/train': 0.8260741233825684} -08/30/2021 20:37:05 - INFO - __main__ - Step 41295: {'lr': 0.0004179624684711588, 'samples': 7928640, 'steps': 41294, 'loss/train': 1.6288862228393555} -08/30/2021 20:37:06 - INFO - __main__ - Step 41296: {'lr': 0.0004179585377949232, 'samples': 7928832, 'steps': 41295, 'loss/train': 1.1667031049728394} -08/30/2021 20:37:06 - INFO - __main__ - Step 41297: {'lr': 0.0004179546070430082, 'samples': 7929024, 'steps': 41296, 'loss/train': 1.6510547399520874} -08/30/2021 20:37:07 - INFO - __main__ - Step 41298: {'lr': 0.0004179506762154153, 'samples': 7929216, 'steps': 41297, 'loss/train': 1.3736963272094727} -08/30/2021 20:37:07 - INFO - __main__ - Step 41299: {'lr': 0.0004179467453121465, 'samples': 7929408, 'steps': 41298, 'loss/train': 0.03156067430973053} -08/30/2021 20:37:08 - INFO - __main__ - Step 41300: {'lr': 0.0004179428143332035, 'samples': 7929600, 'steps': 41299, 'loss/train': 0.03029993362724781} -08/30/2021 20:37:09 - INFO - __main__ - Step 41301: {'lr': 0.000417938883278588, 'samples': 7929792, 'steps': 41300, 'loss/train': 1.6002839803695679} -08/30/2021 20:37:09 - INFO - __main__ - Step 41302: {'lr': 0.0004179349521483018, 'samples': 7929984, 'steps': 41301, 'loss/train': 0.8408775329589844} -08/30/2021 20:37:10 - INFO - __main__ - Step 41303: {'lr': 0.00041793102094234673, 'samples': 7930176, 'steps': 41302, 'loss/train': 0.9855254888534546} -08/30/2021 20:37:10 - INFO - __main__ - Step 41304: {'lr': 0.00041792708966072455, 'samples': 7930368, 'steps': 41303, 'loss/train': 0.8408874273300171} -08/30/2021 20:37:11 - INFO - __main__ - Step 41305: {'lr': 0.0004179231583034371, 'samples': 7930560, 'steps': 41304, 'loss/train': 1.7330666780471802} -08/30/2021 20:37:12 - INFO - __main__ - Step 41306: {'lr': 0.0004179192268704859, 'samples': 7930752, 'steps': 41305, 'loss/train': 1.4362725019454956} -08/30/2021 20:37:12 - INFO - __main__ - Step 41307: {'lr': 0.000417915295361873, 'samples': 7930944, 'steps': 41306, 'loss/train': 1.5189247131347656} -08/30/2021 20:37:13 - INFO - __main__ - Step 41308: {'lr': 0.0004179113637776, 'samples': 7931136, 'steps': 41307, 'loss/train': 1.153175711631775} -08/30/2021 20:37:13 - INFO - __main__ - Step 41309: {'lr': 0.0004179074321176688, 'samples': 7931328, 'steps': 41308, 'loss/train': 5.87996768951416} -08/30/2021 20:37:14 - INFO - __main__ - Step 41310: {'lr': 0.000417903500382081, 'samples': 7931520, 'steps': 41309, 'loss/train': 1.574993371963501} -08/30/2021 20:37:15 - INFO - __main__ - Step 41311: {'lr': 0.00041789956857083853, 'samples': 7931712, 'steps': 41310, 'loss/train': 1.482379674911499} -08/30/2021 20:37:15 - INFO - __main__ - Step 41312: {'lr': 0.00041789563668394314, 'samples': 7931904, 'steps': 41311, 'loss/train': 1.3061654567718506} -08/30/2021 20:37:15 - INFO - __main__ - Step 41313: {'lr': 0.0004178917047213965, 'samples': 7932096, 'steps': 41312, 'loss/train': 1.6246038675308228} -08/30/2021 20:37:16 - INFO - __main__ - Step 41314: {'lr': 0.00041788777268320055, 'samples': 7932288, 'steps': 41313, 'loss/train': 1.4020289182662964} -08/30/2021 20:37:18 - INFO - __main__ - Step 41315: {'lr': 0.00041788384056935693, 'samples': 7932480, 'steps': 41314, 'loss/train': 1.9095011949539185} -08/30/2021 20:37:18 - INFO - __main__ - Step 41316: {'lr': 0.0004178799083798673, 'samples': 7932672, 'steps': 41315, 'loss/train': 0.05646982043981552} -08/30/2021 20:37:19 - INFO - __main__ - Step 41317: {'lr': 0.00041787597611473375, 'samples': 7932864, 'steps': 41316, 'loss/train': 0.280333012342453} -08/30/2021 20:37:19 - INFO - __main__ - Step 41318: {'lr': 0.00041787204377395783, 'samples': 7933056, 'steps': 41317, 'loss/train': 1.6196471452713013} -08/30/2021 20:37:19 - INFO - __main__ - Step 41319: {'lr': 0.0004178681113575413, 'samples': 7933248, 'steps': 41318, 'loss/train': 2.8572938442230225} -08/30/2021 20:37:20 - INFO - __main__ - Step 41320: {'lr': 0.00041786417886548606, 'samples': 7933440, 'steps': 41319, 'loss/train': 1.4754540920257568} -08/30/2021 20:37:21 - INFO - __main__ - Step 41321: {'lr': 0.0004178602462977937, 'samples': 7933632, 'steps': 41320, 'loss/train': 1.090175986289978} -08/30/2021 20:37:22 - INFO - __main__ - Step 41322: {'lr': 0.0004178563136544662, 'samples': 7933824, 'steps': 41321, 'loss/train': 0.8622119426727295} -08/30/2021 20:37:22 - INFO - __main__ - Step 41323: {'lr': 0.0004178523809355053, 'samples': 7934016, 'steps': 41322, 'loss/train': 1.6504896879196167} -08/30/2021 20:37:22 - INFO - __main__ - Step 41324: {'lr': 0.00041784844814091263, 'samples': 7934208, 'steps': 41323, 'loss/train': 1.3027901649475098} -08/30/2021 20:37:23 - INFO - __main__ - Step 41325: {'lr': 0.00041784451527069, 'samples': 7934400, 'steps': 41324, 'loss/train': 1.4094593524932861} -08/30/2021 20:37:24 - INFO - __main__ - Step 41326: {'lr': 0.0004178405823248392, 'samples': 7934592, 'steps': 41325, 'loss/train': 1.3172539472579956} -08/30/2021 20:37:25 - INFO - __main__ - Step 41327: {'lr': 0.0004178366493033621, 'samples': 7934784, 'steps': 41326, 'loss/train': 1.769757628440857} -08/30/2021 20:37:25 - INFO - __main__ - Step 41328: {'lr': 0.0004178327162062604, 'samples': 7934976, 'steps': 41327, 'loss/train': 1.6797744035720825} -08/30/2021 20:37:25 - INFO - __main__ - Step 41329: {'lr': 0.00041782878303353577, 'samples': 7935168, 'steps': 41328, 'loss/train': 1.444676399230957} -08/30/2021 20:37:26 - INFO - __main__ - Step 41330: {'lr': 0.0004178248497851902, 'samples': 7935360, 'steps': 41329, 'loss/train': 1.2998301982879639} -08/30/2021 20:37:27 - INFO - __main__ - Step 41331: {'lr': 0.00041782091646122533, 'samples': 7935552, 'steps': 41330, 'loss/train': 1.433681845664978} -08/30/2021 20:37:28 - INFO - __main__ - Step 41332: {'lr': 0.00041781698306164283, 'samples': 7935744, 'steps': 41331, 'loss/train': 1.5670560598373413} -08/30/2021 20:37:28 - INFO - __main__ - Step 41333: {'lr': 0.0004178130495864447, 'samples': 7935936, 'steps': 41332, 'loss/train': 0.9618202447891235} -08/30/2021 20:37:28 - INFO - __main__ - Step 41334: {'lr': 0.00041780911603563254, 'samples': 7936128, 'steps': 41333, 'loss/train': 2.1129024028778076} -08/30/2021 20:37:29 - INFO - __main__ - Step 41335: {'lr': 0.00041780518240920817, 'samples': 7936320, 'steps': 41334, 'loss/train': 1.4177297353744507} -08/30/2021 20:37:30 - INFO - __main__ - Step 41336: {'lr': 0.0004178012487071734, 'samples': 7936512, 'steps': 41335, 'loss/train': 1.4227393865585327} -08/30/2021 20:37:31 - INFO - __main__ - Step 41337: {'lr': 0.00041779731492953, 'samples': 7936704, 'steps': 41336, 'loss/train': 1.8759641647338867} -08/30/2021 20:37:31 - INFO - __main__ - Step 41338: {'lr': 0.0004177933810762797, 'samples': 7936896, 'steps': 41337, 'loss/train': 0.45274025201797485} -08/30/2021 20:37:31 - INFO - __main__ - Step 41339: {'lr': 0.00041778944714742435, 'samples': 7937088, 'steps': 41338, 'loss/train': 1.0199908018112183} -08/30/2021 20:37:32 - INFO - __main__ - Step 41340: {'lr': 0.00041778551314296556, 'samples': 7937280, 'steps': 41339, 'loss/train': 0.9563559293746948} -08/30/2021 20:37:33 - INFO - __main__ - Step 41341: {'lr': 0.00041778157906290525, 'samples': 7937472, 'steps': 41340, 'loss/train': 1.699133276939392} -08/30/2021 20:37:34 - INFO - __main__ - Step 41342: {'lr': 0.00041777764490724515, 'samples': 7937664, 'steps': 41341, 'loss/train': 1.13656747341156} -08/30/2021 20:37:34 - INFO - __main__ - Step 41343: {'lr': 0.00041777371067598705, 'samples': 7937856, 'steps': 41342, 'loss/train': 0.8937574028968811} -08/30/2021 20:37:34 - INFO - __main__ - Step 41344: {'lr': 0.00041776977636913274, 'samples': 7938048, 'steps': 41343, 'loss/train': 1.0681222677230835} -08/30/2021 20:37:35 - INFO - __main__ - Step 41345: {'lr': 0.0004177658419866839, 'samples': 7938240, 'steps': 41344, 'loss/train': 0.837557315826416} -08/30/2021 20:37:35 - INFO - __main__ - Step 41346: {'lr': 0.0004177619075286424, 'samples': 7938432, 'steps': 41345, 'loss/train': 1.1064404249191284} -08/30/2021 20:37:37 - INFO - __main__ - Step 41347: {'lr': 0.00041775797299500997, 'samples': 7938624, 'steps': 41346, 'loss/train': 1.5079741477966309} -08/30/2021 20:37:38 - INFO - __main__ - Step 41348: {'lr': 0.0004177540383857883, 'samples': 7938816, 'steps': 41347, 'loss/train': 2.0026466846466064} -08/30/2021 20:37:38 - INFO - __main__ - Step 41349: {'lr': 0.0004177501037009793, 'samples': 7939008, 'steps': 41348, 'loss/train': 1.864587426185608} -08/30/2021 20:37:38 - INFO - __main__ - Step 41350: {'lr': 0.0004177461689405847, 'samples': 7939200, 'steps': 41349, 'loss/train': 1.3859156370162964} -08/30/2021 20:37:39 - INFO - __main__ - Step 41351: {'lr': 0.00041774223410460633, 'samples': 7939392, 'steps': 41350, 'loss/train': 1.5511083602905273} -08/30/2021 20:37:40 - INFO - __main__ - Step 41352: {'lr': 0.00041773829919304584, 'samples': 7939584, 'steps': 41351, 'loss/train': 1.1542161703109741} -08/30/2021 20:37:41 - INFO - __main__ - Step 41353: {'lr': 0.000417734364205905, 'samples': 7939776, 'steps': 41352, 'loss/train': 1.1124930381774902} -08/30/2021 20:37:41 - INFO - __main__ - Step 41354: {'lr': 0.0004177304291431857, 'samples': 7939968, 'steps': 41353, 'loss/train': 2.221064329147339} -08/30/2021 20:37:41 - INFO - __main__ - Step 41355: {'lr': 0.00041772649400488967, 'samples': 7940160, 'steps': 41354, 'loss/train': 1.5445185899734497} -08/30/2021 20:37:42 - INFO - __main__ - Step 41356: {'lr': 0.0004177225587910186, 'samples': 7940352, 'steps': 41355, 'loss/train': 1.1371402740478516} -08/30/2021 20:37:43 - INFO - __main__ - Step 41357: {'lr': 0.0004177186235015744, 'samples': 7940544, 'steps': 41356, 'loss/train': 1.7798751592636108} -08/30/2021 20:37:44 - INFO - __main__ - Step 41358: {'lr': 0.0004177146881365588, 'samples': 7940736, 'steps': 41357, 'loss/train': 1.2525073289871216} -08/30/2021 20:37:44 - INFO - __main__ - Step 41359: {'lr': 0.00041771075269597354, 'samples': 7940928, 'steps': 41358, 'loss/train': 1.3471342325210571} -08/30/2021 20:37:44 - INFO - __main__ - Step 41360: {'lr': 0.0004177068171798204, 'samples': 7941120, 'steps': 41359, 'loss/train': 1.2018510103225708} -08/30/2021 20:37:45 - INFO - __main__ - Step 41361: {'lr': 0.0004177028815881011, 'samples': 7941312, 'steps': 41360, 'loss/train': 1.8874595165252686} -08/30/2021 20:37:46 - INFO - __main__ - Step 41362: {'lr': 0.00041769894592081746, 'samples': 7941504, 'steps': 41361, 'loss/train': 1.9354338645935059} -08/30/2021 20:37:47 - INFO - __main__ - Step 41363: {'lr': 0.0004176950101779713, 'samples': 7941696, 'steps': 41362, 'loss/train': 0.7589229345321655} -08/30/2021 20:37:47 - INFO - __main__ - Step 41364: {'lr': 0.00041769107435956444, 'samples': 7941888, 'steps': 41363, 'loss/train': 1.5308563709259033} -08/30/2021 20:37:48 - INFO - __main__ - Step 41365: {'lr': 0.00041768713846559844, 'samples': 7942080, 'steps': 41364, 'loss/train': 1.4399404525756836} -08/30/2021 20:37:48 - INFO - __main__ - Step 41366: {'lr': 0.00041768320249607527, 'samples': 7942272, 'steps': 41365, 'loss/train': 1.1068576574325562} -08/30/2021 20:37:49 - INFO - __main__ - Step 41367: {'lr': 0.00041767926645099664, 'samples': 7942464, 'steps': 41366, 'loss/train': 1.0698051452636719} -08/30/2021 20:37:50 - INFO - __main__ - Step 41368: {'lr': 0.00041767533033036425, 'samples': 7942656, 'steps': 41367, 'loss/train': 2.2422380447387695} -08/30/2021 20:37:50 - INFO - __main__ - Step 41369: {'lr': 0.00041767139413418, 'samples': 7942848, 'steps': 41368, 'loss/train': 1.1421459913253784} -08/30/2021 20:37:51 - INFO - __main__ - Step 41370: {'lr': 0.00041766745786244564, 'samples': 7943040, 'steps': 41369, 'loss/train': 1.7020671367645264} -08/30/2021 20:37:51 - INFO - __main__ - Step 41371: {'lr': 0.00041766352151516284, 'samples': 7943232, 'steps': 41370, 'loss/train': 2.0855867862701416} -08/30/2021 20:37:52 - INFO - __main__ - Step 41372: {'lr': 0.0004176595850923335, 'samples': 7943424, 'steps': 41371, 'loss/train': 0.4040973484516144} -08/30/2021 20:37:53 - INFO - __main__ - Step 41373: {'lr': 0.0004176556485939593, 'samples': 7943616, 'steps': 41372, 'loss/train': 0.9285533428192139} -08/30/2021 20:37:53 - INFO - __main__ - Step 41374: {'lr': 0.00041765171202004205, 'samples': 7943808, 'steps': 41373, 'loss/train': 1.5626639127731323} -08/30/2021 20:37:54 - INFO - __main__ - Step 41375: {'lr': 0.00041764777537058354, 'samples': 7944000, 'steps': 41374, 'loss/train': 1.3051823377609253} -08/30/2021 20:37:54 - INFO - __main__ - Step 41376: {'lr': 0.0004176438386455855, 'samples': 7944192, 'steps': 41375, 'loss/train': 1.5558784008026123} -08/30/2021 20:37:55 - INFO - __main__ - Step 41377: {'lr': 0.00041763990184504984, 'samples': 7944384, 'steps': 41376, 'loss/train': 1.1090941429138184} -08/30/2021 20:37:56 - INFO - __main__ - Step 41378: {'lr': 0.00041763596496897817, 'samples': 7944576, 'steps': 41377, 'loss/train': 1.9707355499267578} -08/30/2021 20:37:56 - INFO - __main__ - Step 41379: {'lr': 0.00041763202801737225, 'samples': 7944768, 'steps': 41378, 'loss/train': 1.4138187170028687} -08/30/2021 20:37:56 - INFO - __main__ - Step 41380: {'lr': 0.00041762809099023403, 'samples': 7944960, 'steps': 41379, 'loss/train': 1.791852355003357} -08/30/2021 20:37:57 - INFO - __main__ - Step 41381: {'lr': 0.00041762415388756514, 'samples': 7945152, 'steps': 41380, 'loss/train': 1.7626186609268188} -08/30/2021 20:37:58 - INFO - __main__ - Step 41382: {'lr': 0.00041762021670936736, 'samples': 7945344, 'steps': 41381, 'loss/train': 1.1181529760360718} -08/30/2021 20:37:59 - INFO - __main__ - Step 41383: {'lr': 0.0004176162794556425, 'samples': 7945536, 'steps': 41382, 'loss/train': 1.6964209079742432} -08/30/2021 20:37:59 - INFO - __main__ - Step 41384: {'lr': 0.0004176123421263923, 'samples': 7945728, 'steps': 41383, 'loss/train': 1.393151044845581} -08/30/2021 20:38:00 - INFO - __main__ - Step 41385: {'lr': 0.00041760840472161866, 'samples': 7945920, 'steps': 41384, 'loss/train': 1.5543761253356934} -08/30/2021 20:38:00 - INFO - __main__ - Step 41386: {'lr': 0.0004176044672413232, 'samples': 7946112, 'steps': 41385, 'loss/train': 2.9954159259796143} -08/30/2021 20:38:00 - INFO - __main__ - Step 41387: {'lr': 0.00041760052968550776, 'samples': 7946304, 'steps': 41386, 'loss/train': 1.5306628942489624} -08/30/2021 20:38:02 - INFO - __main__ - Step 41388: {'lr': 0.0004175965920541741, 'samples': 7946496, 'steps': 41387, 'loss/train': 1.3748397827148438} -08/30/2021 20:38:02 - INFO - __main__ - Step 41389: {'lr': 0.00041759265434732404, 'samples': 7946688, 'steps': 41388, 'loss/train': 1.5823618173599243} -08/30/2021 20:38:03 - INFO - __main__ - Step 41390: {'lr': 0.00041758871656495927, 'samples': 7946880, 'steps': 41389, 'loss/train': 1.0068360567092896} -08/30/2021 20:38:03 - INFO - __main__ - Step 41391: {'lr': 0.00041758477870708165, 'samples': 7947072, 'steps': 41390, 'loss/train': 0.8377043008804321} -08/30/2021 20:38:03 - INFO - __main__ - Step 41392: {'lr': 0.0004175808407736929, 'samples': 7947264, 'steps': 41391, 'loss/train': 1.8361799716949463} -08/30/2021 20:38:05 - INFO - __main__ - Step 41393: {'lr': 0.00041757690276479474, 'samples': 7947456, 'steps': 41392, 'loss/train': 1.3056310415267944} -08/30/2021 20:38:05 - INFO - __main__ - Step 41394: {'lr': 0.0004175729646803891, 'samples': 7947648, 'steps': 41393, 'loss/train': 1.055996060371399} -08/30/2021 20:38:05 - INFO - __main__ - Step 41395: {'lr': 0.00041756902652047767, 'samples': 7947840, 'steps': 41394, 'loss/train': 1.4928996562957764} -08/30/2021 20:38:06 - INFO - __main__ - Step 41396: {'lr': 0.0004175650882850622, 'samples': 7948032, 'steps': 41395, 'loss/train': 1.640062689781189} -08/30/2021 20:38:06 - INFO - __main__ - Step 41397: {'lr': 0.0004175611499741445, 'samples': 7948224, 'steps': 41396, 'loss/train': 1.1785069704055786} -08/30/2021 20:38:08 - INFO - __main__ - Step 41398: {'lr': 0.00041755721158772633, 'samples': 7948416, 'steps': 41397, 'loss/train': 1.6382743120193481} -08/30/2021 20:38:08 - INFO - __main__ - Step 41399: {'lr': 0.00041755327312580944, 'samples': 7948608, 'steps': 41398, 'loss/train': 1.462915301322937} -08/30/2021 20:38:08 - INFO - __main__ - Step 41400: {'lr': 0.0004175493345883956, 'samples': 7948800, 'steps': 41399, 'loss/train': 1.6920114755630493} -08/30/2021 20:38:09 - INFO - __main__ - Step 41401: {'lr': 0.0004175453959754867, 'samples': 7948992, 'steps': 41400, 'loss/train': 1.072318196296692} -08/30/2021 20:38:09 - INFO - __main__ - Step 41402: {'lr': 0.00041754145728708434, 'samples': 7949184, 'steps': 41401, 'loss/train': 1.888789415359497} -08/30/2021 20:38:11 - INFO - __main__ - Step 41403: {'lr': 0.0004175375185231904, 'samples': 7949376, 'steps': 41402, 'loss/train': 1.2134674787521362} -08/30/2021 20:38:12 - INFO - __main__ - Step 41404: {'lr': 0.00041753357968380675, 'samples': 7949568, 'steps': 41403, 'loss/train': 1.6988017559051514} -08/30/2021 20:38:12 - INFO - __main__ - Step 41405: {'lr': 0.00041752964076893496, 'samples': 7949760, 'steps': 41404, 'loss/train': 2.844590902328491} -08/30/2021 20:38:13 - INFO - __main__ - Step 41406: {'lr': 0.00041752570177857695, 'samples': 7949952, 'steps': 41405, 'loss/train': 1.5071130990982056} -08/30/2021 20:38:13 - INFO - __main__ - Step 41407: {'lr': 0.0004175217627127344, 'samples': 7950144, 'steps': 41406, 'loss/train': 1.532647967338562} -08/30/2021 20:38:15 - INFO - __main__ - Step 41408: {'lr': 0.0004175178235714091, 'samples': 7950336, 'steps': 41407, 'loss/train': 1.46100914478302} -08/30/2021 20:38:15 - INFO - __main__ - Step 41409: {'lr': 0.0004175138843546029, 'samples': 7950528, 'steps': 41408, 'loss/train': 0.05259615182876587} -08/30/2021 20:38:16 - INFO - __main__ - Step 41410: {'lr': 0.00041750994506231756, 'samples': 7950720, 'steps': 41409, 'loss/train': 1.2466177940368652} -08/30/2021 20:38:16 - INFO - __main__ - Step 41411: {'lr': 0.00041750600569455474, 'samples': 7950912, 'steps': 41410, 'loss/train': 1.555919885635376} -08/30/2021 20:38:16 - INFO - __main__ - Step 41412: {'lr': 0.0004175020662513164, 'samples': 7951104, 'steps': 41411, 'loss/train': 2.918903350830078} -08/30/2021 20:38:17 - INFO - __main__ - Step 41413: {'lr': 0.0004174981267326041, 'samples': 7951296, 'steps': 41412, 'loss/train': 1.8798463344573975} -08/30/2021 20:38:18 - INFO - __main__ - Step 41414: {'lr': 0.0004174941871384198, 'samples': 7951488, 'steps': 41413, 'loss/train': 1.8909170627593994} -08/30/2021 20:38:18 - INFO - __main__ - Step 41415: {'lr': 0.00041749024746876517, 'samples': 7951680, 'steps': 41414, 'loss/train': 1.196697473526001} -08/30/2021 20:38:19 - INFO - __main__ - Step 41416: {'lr': 0.00041748630772364204, 'samples': 7951872, 'steps': 41415, 'loss/train': 1.4976251125335693} -08/30/2021 20:38:19 - INFO - __main__ - Step 41417: {'lr': 0.00041748236790305215, 'samples': 7952064, 'steps': 41416, 'loss/train': 0.9984554648399353} -08/30/2021 20:38:20 - INFO - __main__ - Step 41418: {'lr': 0.0004174784280069973, 'samples': 7952256, 'steps': 41417, 'loss/train': 1.6519157886505127} -08/30/2021 20:38:21 - INFO - __main__ - Step 41419: {'lr': 0.00041747448803547925, 'samples': 7952448, 'steps': 41418, 'loss/train': 1.4101771116256714} -08/30/2021 20:38:22 - INFO - __main__ - Step 41420: {'lr': 0.0004174705479884998, 'samples': 7952640, 'steps': 41419, 'loss/train': 1.2860792875289917} -08/30/2021 20:38:22 - INFO - __main__ - Step 41421: {'lr': 0.0004174666078660607, 'samples': 7952832, 'steps': 41420, 'loss/train': 1.4192967414855957} -08/30/2021 20:38:23 - INFO - __main__ - Step 41422: {'lr': 0.00041746266766816377, 'samples': 7953024, 'steps': 41421, 'loss/train': 1.8272082805633545} -08/30/2021 20:38:23 - INFO - __main__ - Step 41423: {'lr': 0.0004174587273948106, 'samples': 7953216, 'steps': 41422, 'loss/train': 0.573168158531189} -08/30/2021 20:38:24 - INFO - __main__ - Step 41424: {'lr': 0.0004174547870460033, 'samples': 7953408, 'steps': 41423, 'loss/train': 1.5065640211105347} -08/30/2021 20:38:25 - INFO - __main__ - Step 41425: {'lr': 0.0004174508466217434, 'samples': 7953600, 'steps': 41424, 'loss/train': 1.6666555404663086} -08/30/2021 20:38:25 - INFO - __main__ - Step 41426: {'lr': 0.00041744690612203263, 'samples': 7953792, 'steps': 41425, 'loss/train': 1.2866551876068115} -08/30/2021 20:38:26 - INFO - __main__ - Step 41427: {'lr': 0.00041744296554687294, 'samples': 7953984, 'steps': 41426, 'loss/train': 1.8438634872436523} -08/30/2021 20:38:26 - INFO - __main__ - Step 41428: {'lr': 0.00041743902489626606, 'samples': 7954176, 'steps': 41427, 'loss/train': 1.6337019205093384} -08/30/2021 20:38:27 - INFO - __main__ - Step 41429: {'lr': 0.0004174350841702137, 'samples': 7954368, 'steps': 41428, 'loss/train': 2.0448713302612305} -08/30/2021 20:38:28 - INFO - __main__ - Step 41430: {'lr': 0.0004174311433687177, 'samples': 7954560, 'steps': 41429, 'loss/train': 1.7109603881835938} -08/30/2021 20:38:28 - INFO - __main__ - Step 41431: {'lr': 0.00041742720249177975, 'samples': 7954752, 'steps': 41430, 'loss/train': 2.66896653175354} -08/30/2021 20:38:29 - INFO - __main__ - Step 41432: {'lr': 0.0004174232615394018, 'samples': 7954944, 'steps': 41431, 'loss/train': 1.5298560857772827} -08/30/2021 20:38:29 - INFO - __main__ - Step 41433: {'lr': 0.00041741932051158535, 'samples': 7955136, 'steps': 41432, 'loss/train': 0.978148877620697} -08/30/2021 20:38:29 - INFO - __main__ - Step 41434: {'lr': 0.00041741537940833247, 'samples': 7955328, 'steps': 41433, 'loss/train': 1.3200790882110596} -08/30/2021 20:38:31 - INFO - __main__ - Step 41435: {'lr': 0.00041741143822964476, 'samples': 7955520, 'steps': 41434, 'loss/train': 1.3774951696395874} -08/30/2021 20:38:31 - INFO - __main__ - Step 41436: {'lr': 0.00041740749697552406, 'samples': 7955712, 'steps': 41435, 'loss/train': 0.8942598104476929} -08/30/2021 20:38:32 - INFO - __main__ - Step 41437: {'lr': 0.0004174035556459721, 'samples': 7955904, 'steps': 41436, 'loss/train': 0.5630281567573547} -08/30/2021 20:38:32 - INFO - __main__ - Step 41438: {'lr': 0.0004173996142409907, 'samples': 7956096, 'steps': 41437, 'loss/train': 1.3800159692764282} -08/30/2021 20:38:34 - INFO - __main__ - Step 41439: {'lr': 0.0004173956727605816, 'samples': 7956288, 'steps': 41438, 'loss/train': 0.20855551958084106} -08/30/2021 20:38:34 - INFO - __main__ - Step 41440: {'lr': 0.00041739173120474663, 'samples': 7956480, 'steps': 41439, 'loss/train': 0.7213126420974731} -08/30/2021 20:38:35 - INFO - __main__ - Step 41441: {'lr': 0.00041738778957348745, 'samples': 7956672, 'steps': 41440, 'loss/train': 1.5504837036132812} -08/30/2021 20:38:35 - INFO - __main__ - Step 41442: {'lr': 0.00041738384786680596, 'samples': 7956864, 'steps': 41441, 'loss/train': 1.3565422296524048} -08/30/2021 20:38:35 - INFO - __main__ - Step 41443: {'lr': 0.0004173799060847039, 'samples': 7957056, 'steps': 41442, 'loss/train': 1.049843192100525} -08/30/2021 20:38:36 - INFO - __main__ - Step 41444: {'lr': 0.00041737596422718306, 'samples': 7957248, 'steps': 41443, 'loss/train': 2.10805606842041} -08/30/2021 20:38:37 - INFO - __main__ - Step 41445: {'lr': 0.0004173720222942452, 'samples': 7957440, 'steps': 41444, 'loss/train': 1.4697864055633545} -08/30/2021 20:38:38 - INFO - __main__ - Step 41446: {'lr': 0.000417368080285892, 'samples': 7957632, 'steps': 41445, 'loss/train': 1.1761834621429443} -08/30/2021 20:38:38 - INFO - __main__ - Step 41447: {'lr': 0.0004173641382021254, 'samples': 7957824, 'steps': 41446, 'loss/train': 1.6018630266189575} -08/30/2021 20:38:38 - INFO - __main__ - Step 41448: {'lr': 0.00041736019604294704, 'samples': 7958016, 'steps': 41447, 'loss/train': 1.4833124876022339} -08/30/2021 20:38:39 - INFO - __main__ - Step 41449: {'lr': 0.00041735625380835884, 'samples': 7958208, 'steps': 41448, 'loss/train': 1.0895339250564575} -08/30/2021 20:38:40 - INFO - __main__ - Step 41450: {'lr': 0.0004173523114983624, 'samples': 7958400, 'steps': 41449, 'loss/train': 1.660897135734558} -08/30/2021 20:38:41 - INFO - __main__ - Step 41451: {'lr': 0.0004173483691129597, 'samples': 7958592, 'steps': 41450, 'loss/train': 1.5639561414718628} -08/30/2021 20:38:41 - INFO - __main__ - Step 41452: {'lr': 0.00041734442665215235, 'samples': 7958784, 'steps': 41451, 'loss/train': 1.9907350540161133} -08/30/2021 20:38:41 - INFO - __main__ - Step 41453: {'lr': 0.00041734048411594214, 'samples': 7958976, 'steps': 41452, 'loss/train': 0.7563914656639099} -08/30/2021 20:38:42 - INFO - __main__ - Step 41454: {'lr': 0.000417336541504331, 'samples': 7959168, 'steps': 41453, 'loss/train': 1.73635995388031} -08/30/2021 20:38:43 - INFO - __main__ - Step 41455: {'lr': 0.0004173325988173205, 'samples': 7959360, 'steps': 41454, 'loss/train': 1.8685799837112427} -08/30/2021 20:38:44 - INFO - __main__ - Step 41456: {'lr': 0.00041732865605491256, 'samples': 7959552, 'steps': 41455, 'loss/train': 1.984452486038208} -08/30/2021 20:38:44 - INFO - __main__ - Step 41457: {'lr': 0.00041732471321710886, 'samples': 7959744, 'steps': 41456, 'loss/train': 1.0195425748825073} -08/30/2021 20:38:44 - INFO - __main__ - Step 41458: {'lr': 0.00041732077030391126, 'samples': 7959936, 'steps': 41457, 'loss/train': 1.4068340063095093} -08/30/2021 20:38:45 - INFO - __main__ - Step 41459: {'lr': 0.00041731682731532154, 'samples': 7960128, 'steps': 41458, 'loss/train': 1.5764505863189697} -08/30/2021 20:38:47 - INFO - __main__ - Step 41460: {'lr': 0.0004173128842513414, 'samples': 7960320, 'steps': 41459, 'loss/train': 1.0523980855941772} -08/30/2021 20:38:47 - INFO - __main__ - Step 41461: {'lr': 0.00041730894111197266, 'samples': 7960512, 'steps': 41460, 'loss/train': 0.8384407758712769} -08/30/2021 20:38:48 - INFO - __main__ - Step 41462: {'lr': 0.0004173049978972171, 'samples': 7960704, 'steps': 41461, 'loss/train': 1.2816945314407349} -08/30/2021 20:38:48 - INFO - __main__ - Step 41463: {'lr': 0.0004173010546070765, 'samples': 7960896, 'steps': 41462, 'loss/train': 1.4940721988677979} -08/30/2021 20:38:48 - INFO - __main__ - Step 41464: {'lr': 0.00041729711124155255, 'samples': 7961088, 'steps': 41463, 'loss/train': 1.7958987951278687} -08/30/2021 20:38:50 - INFO - __main__ - Step 41465: {'lr': 0.0004172931678006472, 'samples': 7961280, 'steps': 41464, 'loss/train': 0.41954341530799866} -08/30/2021 20:38:51 - INFO - __main__ - Step 41466: {'lr': 0.00041728922428436213, 'samples': 7961472, 'steps': 41465, 'loss/train': 1.403683066368103} -08/30/2021 20:38:51 - INFO - __main__ - Step 41467: {'lr': 0.000417285280692699, 'samples': 7961664, 'steps': 41466, 'loss/train': 1.4509979486465454} -08/30/2021 20:38:51 - INFO - __main__ - Step 41468: {'lr': 0.00041728133702565985, 'samples': 7961856, 'steps': 41467, 'loss/train': 0.25000718235969543} -08/30/2021 20:38:52 - INFO - __main__ - Step 41469: {'lr': 0.0004172773932832462, 'samples': 7962048, 'steps': 41468, 'loss/train': 0.24955615401268005} -08/30/2021 20:38:53 - INFO - __main__ - Step 41470: {'lr': 0.00041727344946546, 'samples': 7962240, 'steps': 41469, 'loss/train': 2.0024654865264893} -08/30/2021 20:38:54 - INFO - __main__ - Step 41471: {'lr': 0.00041726950557230294, 'samples': 7962432, 'steps': 41470, 'loss/train': 1.3711596727371216} -08/30/2021 20:38:54 - INFO - __main__ - Step 41472: {'lr': 0.0004172655616037768, 'samples': 7962624, 'steps': 41471, 'loss/train': 1.7318528890609741} -08/30/2021 20:38:54 - INFO - __main__ - Step 41473: {'lr': 0.0004172616175598835, 'samples': 7962816, 'steps': 41472, 'loss/train': 1.5632617473602295} -08/30/2021 20:38:55 - INFO - __main__ - Step 41474: {'lr': 0.00041725767344062453, 'samples': 7963008, 'steps': 41473, 'loss/train': 1.4895762205123901} -08/30/2021 20:38:55 - INFO - __main__ - Step 41475: {'lr': 0.00041725372924600193, 'samples': 7963200, 'steps': 41474, 'loss/train': 1.7173179388046265} -08/30/2021 20:38:57 - INFO - __main__ - Step 41476: {'lr': 0.00041724978497601736, 'samples': 7963392, 'steps': 41475, 'loss/train': 0.9980760812759399} -08/30/2021 20:38:57 - INFO - __main__ - Step 41477: {'lr': 0.0004172458406306726, 'samples': 7963584, 'steps': 41476, 'loss/train': 0.7931108474731445} -08/30/2021 20:38:58 - INFO - __main__ - Step 41478: {'lr': 0.00041724189620996946, 'samples': 7963776, 'steps': 41477, 'loss/train': 0.9811127781867981} -08/30/2021 20:38:58 - INFO - __main__ - Step 41479: {'lr': 0.0004172379517139097, 'samples': 7963968, 'steps': 41478, 'loss/train': 1.246964454650879} -08/30/2021 20:38:58 - INFO - __main__ - Step 41480: {'lr': 0.0004172340071424951, 'samples': 7964160, 'steps': 41479, 'loss/train': 0.7575798034667969} -08/30/2021 20:39:00 - INFO - __main__ - Step 41481: {'lr': 0.00041723006249572744, 'samples': 7964352, 'steps': 41480, 'loss/train': 1.4947830438613892} -08/30/2021 20:39:00 - INFO - __main__ - Step 41482: {'lr': 0.00041722611777360844, 'samples': 7964544, 'steps': 41481, 'loss/train': 1.1833040714263916} -08/30/2021 20:39:01 - INFO - __main__ - Step 41483: {'lr': 0.00041722217297614, 'samples': 7964736, 'steps': 41482, 'loss/train': 1.942763090133667} -08/30/2021 20:39:01 - INFO - __main__ - Step 41484: {'lr': 0.00041721822810332384, 'samples': 7964928, 'steps': 41483, 'loss/train': 1.4728940725326538} -08/30/2021 20:39:01 - INFO - __main__ - Step 41485: {'lr': 0.00041721428315516176, 'samples': 7965120, 'steps': 41484, 'loss/train': 1.0895189046859741} -08/30/2021 20:39:03 - INFO - __main__ - Step 41486: {'lr': 0.00041721033813165543, 'samples': 7965312, 'steps': 41485, 'loss/train': 1.047298550605774} -08/30/2021 20:39:03 - INFO - __main__ - Step 41487: {'lr': 0.0004172063930328067, 'samples': 7965504, 'steps': 41486, 'loss/train': 1.745688557624817} -08/30/2021 20:39:04 - INFO - __main__ - Step 41488: {'lr': 0.00041720244785861736, 'samples': 7965696, 'steps': 41487, 'loss/train': 1.6669461727142334} -08/30/2021 20:39:04 - INFO - __main__ - Step 41489: {'lr': 0.0004171985026090892, 'samples': 7965888, 'steps': 41488, 'loss/train': 1.7797329425811768} -08/30/2021 20:39:04 - INFO - __main__ - Step 41490: {'lr': 0.00041719455728422394, 'samples': 7966080, 'steps': 41489, 'loss/train': 1.5193333625793457} -08/30/2021 20:39:06 - INFO - __main__ - Step 41491: {'lr': 0.0004171906118840234, 'samples': 7966272, 'steps': 41490, 'loss/train': 1.7020156383514404} -08/30/2021 20:39:06 - INFO - __main__ - Step 41492: {'lr': 0.00041718666640848937, 'samples': 7966464, 'steps': 41491, 'loss/train': 1.3126717805862427} -08/30/2021 20:39:07 - INFO - __main__ - Step 41493: {'lr': 0.0004171827208576236, 'samples': 7966656, 'steps': 41492, 'loss/train': 1.7679609060287476} -08/30/2021 20:39:07 - INFO - __main__ - Step 41494: {'lr': 0.00041717877523142786, 'samples': 7966848, 'steps': 41493, 'loss/train': 1.6426056623458862} -08/30/2021 20:39:07 - INFO - __main__ - Step 41495: {'lr': 0.00041717482952990394, 'samples': 7967040, 'steps': 41494, 'loss/train': 1.0831743478775024} -08/30/2021 20:39:09 - INFO - __main__ - Step 41496: {'lr': 0.00041717088375305367, 'samples': 7967232, 'steps': 41495, 'loss/train': 1.4067193269729614} -08/30/2021 20:39:09 - INFO - __main__ - Step 41497: {'lr': 0.0004171669379008787, 'samples': 7967424, 'steps': 41496, 'loss/train': 1.2224026918411255} -08/30/2021 20:39:10 - INFO - __main__ - Step 41498: {'lr': 0.00041716299197338093, 'samples': 7967616, 'steps': 41497, 'loss/train': 1.1732620000839233} -08/30/2021 20:39:10 - INFO - __main__ - Step 41499: {'lr': 0.0004171590459705622, 'samples': 7967808, 'steps': 41498, 'loss/train': 1.3189703226089478} -08/30/2021 20:39:10 - INFO - __main__ - Step 41500: {'lr': 0.0004171550998924241, 'samples': 7968000, 'steps': 41499, 'loss/train': 1.5910859107971191} -08/30/2021 20:39:12 - INFO - __main__ - Step 41501: {'lr': 0.0004171511537389684, 'samples': 7968192, 'steps': 41500, 'loss/train': 1.173943042755127} -08/30/2021 20:39:12 - INFO - __main__ - Step 41502: {'lr': 0.0004171472075101971, 'samples': 7968384, 'steps': 41501, 'loss/train': 1.6349396705627441} -08/30/2021 20:39:13 - INFO - __main__ - Step 41503: {'lr': 0.0004171432612061117, 'samples': 7968576, 'steps': 41502, 'loss/train': 1.531803846359253} -08/30/2021 20:39:13 - INFO - __main__ - Step 41504: {'lr': 0.00041713931482671425, 'samples': 7968768, 'steps': 41503, 'loss/train': 1.3499886989593506} -08/30/2021 20:39:13 - INFO - __main__ - Step 41505: {'lr': 0.0004171353683720064, 'samples': 7968960, 'steps': 41504, 'loss/train': 1.4708598852157593} -08/30/2021 20:39:15 - INFO - __main__ - Step 41506: {'lr': 0.00041713142184198994, 'samples': 7969152, 'steps': 41505, 'loss/train': 1.8893855810165405} -08/30/2021 20:39:15 - INFO - __main__ - Step 41507: {'lr': 0.0004171274752366665, 'samples': 7969344, 'steps': 41506, 'loss/train': 1.178467869758606} -08/30/2021 20:39:15 - INFO - __main__ - Step 41508: {'lr': 0.00041712352855603817, 'samples': 7969536, 'steps': 41507, 'loss/train': 1.5718910694122314} -08/30/2021 20:39:16 - INFO - __main__ - Step 41509: {'lr': 0.00041711958180010644, 'samples': 7969728, 'steps': 41508, 'loss/train': 0.7867884039878845} -08/30/2021 20:39:16 - INFO - __main__ - Step 41510: {'lr': 0.0004171156349688733, 'samples': 7969920, 'steps': 41509, 'loss/train': 1.8031187057495117} -08/30/2021 20:39:17 - INFO - __main__ - Step 41511: {'lr': 0.0004171116880623404, 'samples': 7970112, 'steps': 41510, 'loss/train': 1.1286834478378296} -08/30/2021 20:39:19 - INFO - __main__ - Step 41512: {'lr': 0.0004171077410805095, 'samples': 7970304, 'steps': 41511, 'loss/train': 1.209172010421753} -08/30/2021 20:39:19 - INFO - __main__ - Step 41513: {'lr': 0.0004171037940233825, 'samples': 7970496, 'steps': 41512, 'loss/train': 1.487059473991394} -08/30/2021 20:39:19 - INFO - __main__ - Step 41514: {'lr': 0.0004170998468909611, 'samples': 7970688, 'steps': 41513, 'loss/train': 0.9373190999031067} -08/30/2021 20:39:20 - INFO - __main__ - Step 41515: {'lr': 0.00041709589968324704, 'samples': 7970880, 'steps': 41514, 'loss/train': 1.4967365264892578} -08/30/2021 20:39:20 - INFO - __main__ - Step 41516: {'lr': 0.00041709195240024224, 'samples': 7971072, 'steps': 41515, 'loss/train': 1.346509337425232} -08/30/2021 20:39:21 - INFO - __main__ - Step 41517: {'lr': 0.0004170880050419483, 'samples': 7971264, 'steps': 41516, 'loss/train': 1.2530436515808105} -08/30/2021 20:39:22 - INFO - __main__ - Step 41518: {'lr': 0.0004170840576083671, 'samples': 7971456, 'steps': 41517, 'loss/train': 1.0286527872085571} -08/30/2021 20:39:22 - INFO - __main__ - Step 41519: {'lr': 0.00041708011009950044, 'samples': 7971648, 'steps': 41518, 'loss/train': 1.2466856241226196} -08/30/2021 20:39:23 - INFO - __main__ - Step 41520: {'lr': 0.00041707616251535, 'samples': 7971840, 'steps': 41519, 'loss/train': 1.613173007965088} -08/30/2021 20:39:23 - INFO - __main__ - Step 41521: {'lr': 0.0004170722148559176, 'samples': 7972032, 'steps': 41520, 'loss/train': 1.8256449699401855} -08/30/2021 20:39:24 - INFO - __main__ - Step 41522: {'lr': 0.0004170682671212051, 'samples': 7972224, 'steps': 41521, 'loss/train': 1.3022528886795044} -08/30/2021 20:39:25 - INFO - __main__ - Step 41523: {'lr': 0.00041706431931121416, 'samples': 7972416, 'steps': 41522, 'loss/train': 1.4363267421722412} -08/30/2021 20:39:25 - INFO - __main__ - Step 41524: {'lr': 0.00041706037142594666, 'samples': 7972608, 'steps': 41523, 'loss/train': 1.076782464981079} -08/30/2021 20:39:26 - INFO - __main__ - Step 41525: {'lr': 0.00041705642346540436, 'samples': 7972800, 'steps': 41524, 'loss/train': 1.3851639032363892} -08/30/2021 20:39:26 - INFO - __main__ - Step 41526: {'lr': 0.00041705247542958904, 'samples': 7972992, 'steps': 41525, 'loss/train': 1.574877381324768} -08/30/2021 20:39:27 - INFO - __main__ - Step 41527: {'lr': 0.00041704852731850234, 'samples': 7973184, 'steps': 41526, 'loss/train': 1.2817974090576172} -08/30/2021 20:39:28 - INFO - __main__ - Step 41528: {'lr': 0.0004170445791321462, 'samples': 7973376, 'steps': 41527, 'loss/train': 1.2958797216415405} -08/30/2021 20:39:28 - INFO - __main__ - Step 41529: {'lr': 0.00041704063087052236, 'samples': 7973568, 'steps': 41528, 'loss/train': 0.4314829111099243} -08/30/2021 20:39:29 - INFO - __main__ - Step 41530: {'lr': 0.0004170366825336326, 'samples': 7973760, 'steps': 41529, 'loss/train': 1.3234946727752686} -08/30/2021 20:39:29 - INFO - __main__ - Step 41531: {'lr': 0.0004170327341214787, 'samples': 7973952, 'steps': 41530, 'loss/train': 1.867661952972412} -08/30/2021 20:39:31 - INFO - __main__ - Step 41532: {'lr': 0.00041702878563406237, 'samples': 7974144, 'steps': 41531, 'loss/train': 1.7998889684677124} -08/30/2021 20:39:31 - INFO - __main__ - Step 41533: {'lr': 0.0004170248370713855, 'samples': 7974336, 'steps': 41532, 'loss/train': 1.7397903203964233} -08/30/2021 20:39:31 - INFO - __main__ - Step 41534: {'lr': 0.0004170208884334498, 'samples': 7974528, 'steps': 41533, 'loss/train': 0.8247806429862976} -08/30/2021 20:39:32 - INFO - __main__ - Step 41535: {'lr': 0.000417016939720257, 'samples': 7974720, 'steps': 41534, 'loss/train': 0.8748294711112976} -08/30/2021 20:39:32 - INFO - __main__ - Step 41536: {'lr': 0.000417012990931809, 'samples': 7974912, 'steps': 41535, 'loss/train': 0.7379003763198853} -08/30/2021 20:39:34 - INFO - __main__ - Step 41537: {'lr': 0.00041700904206810755, 'samples': 7975104, 'steps': 41536, 'loss/train': 0.9927288293838501} -08/30/2021 20:39:34 - INFO - __main__ - Step 41538: {'lr': 0.00041700509312915437, 'samples': 7975296, 'steps': 41537, 'loss/train': 1.592069149017334} -08/30/2021 20:39:35 - INFO - __main__ - Step 41539: {'lr': 0.0004170011441149513, 'samples': 7975488, 'steps': 41538, 'loss/train': 2.8865084648132324} -08/30/2021 20:39:35 - INFO - __main__ - Step 41540: {'lr': 0.0004169971950255001, 'samples': 7975680, 'steps': 41539, 'loss/train': 0.8969731330871582} -08/30/2021 20:39:35 - INFO - __main__ - Step 41541: {'lr': 0.0004169932458608025, 'samples': 7975872, 'steps': 41540, 'loss/train': 1.250950813293457} -08/30/2021 20:39:36 - INFO - __main__ - Step 41542: {'lr': 0.00041698929662086035, 'samples': 7976064, 'steps': 41541, 'loss/train': 0.42570292949676514} -08/30/2021 20:39:37 - INFO - __main__ - Step 41543: {'lr': 0.0004169853473056754, 'samples': 7976256, 'steps': 41542, 'loss/train': 1.0075010061264038} -08/30/2021 20:39:38 - INFO - __main__ - Step 41544: {'lr': 0.0004169813979152494, 'samples': 7976448, 'steps': 41543, 'loss/train': 1.811414122581482} -08/30/2021 20:39:38 - INFO - __main__ - Step 41545: {'lr': 0.0004169774484495841, 'samples': 7976640, 'steps': 41544, 'loss/train': 1.2107313871383667} -08/30/2021 20:39:38 - INFO - __main__ - Step 41546: {'lr': 0.00041697349890868146, 'samples': 7976832, 'steps': 41545, 'loss/train': 1.656603217124939} -08/30/2021 20:39:39 - INFO - __main__ - Step 41547: {'lr': 0.0004169695492925431, 'samples': 7977024, 'steps': 41546, 'loss/train': 1.1806819438934326} -08/30/2021 20:39:40 - INFO - __main__ - Step 41548: {'lr': 0.0004169655996011708, 'samples': 7977216, 'steps': 41547, 'loss/train': 1.7755823135375977} -08/30/2021 20:39:41 - INFO - __main__ - Step 41549: {'lr': 0.0004169616498345664, 'samples': 7977408, 'steps': 41548, 'loss/train': 1.4425559043884277} -08/30/2021 20:39:41 - INFO - __main__ - Step 41550: {'lr': 0.0004169576999927317, 'samples': 7977600, 'steps': 41549, 'loss/train': 1.7261983156204224} -08/30/2021 20:39:41 - INFO - __main__ - Step 41551: {'lr': 0.00041695375007566837, 'samples': 7977792, 'steps': 41550, 'loss/train': 1.1468747854232788} -08/30/2021 20:39:42 - INFO - __main__ - Step 41552: {'lr': 0.00041694980008337825, 'samples': 7977984, 'steps': 41551, 'loss/train': 1.8117878437042236} -08/30/2021 20:39:43 - INFO - __main__ - Step 41553: {'lr': 0.0004169458500158632, 'samples': 7978176, 'steps': 41552, 'loss/train': 1.265033483505249} -08/30/2021 20:39:43 - INFO - __main__ - Step 41554: {'lr': 0.0004169418998731249, 'samples': 7978368, 'steps': 41553, 'loss/train': 1.387193202972412} -08/30/2021 20:39:44 - INFO - __main__ - Step 41555: {'lr': 0.00041693794965516514, 'samples': 7978560, 'steps': 41554, 'loss/train': 1.7047737836837769} -08/30/2021 20:39:44 - INFO - __main__ - Step 41556: {'lr': 0.0004169339993619857, 'samples': 7978752, 'steps': 41555, 'loss/train': 2.482072353363037} -08/30/2021 20:39:44 - INFO - __main__ - Step 41557: {'lr': 0.0004169300489935884, 'samples': 7978944, 'steps': 41556, 'loss/train': 1.5112351179122925} -08/30/2021 20:39:46 - INFO - __main__ - Step 41558: {'lr': 0.000416926098549975, 'samples': 7979136, 'steps': 41557, 'loss/train': 1.1393442153930664} -08/30/2021 20:39:47 - INFO - __main__ - Step 41559: {'lr': 0.00041692214803114725, 'samples': 7979328, 'steps': 41558, 'loss/train': 1.5220495462417603} -08/30/2021 20:39:47 - INFO - __main__ - Step 41560: {'lr': 0.00041691819743710704, 'samples': 7979520, 'steps': 41559, 'loss/train': 0.31711891293525696} -08/30/2021 20:39:48 - INFO - __main__ - Step 41561: {'lr': 0.00041691424676785593, 'samples': 7979712, 'steps': 41560, 'loss/train': 1.0074025392532349} -08/30/2021 20:39:48 - INFO - __main__ - Step 41562: {'lr': 0.00041691029602339595, 'samples': 7979904, 'steps': 41561, 'loss/train': 1.6283786296844482} -08/30/2021 20:39:48 - INFO - __main__ - Step 41563: {'lr': 0.00041690634520372865, 'samples': 7980096, 'steps': 41562, 'loss/train': 0.6212571263313293} -08/30/2021 20:39:50 - INFO - __main__ - Step 41564: {'lr': 0.000416902394308856, 'samples': 7980288, 'steps': 41563, 'loss/train': 1.5276856422424316} -08/30/2021 20:39:51 - INFO - __main__ - Step 41565: {'lr': 0.00041689844333877966, 'samples': 7980480, 'steps': 41564, 'loss/train': 1.7597904205322266} -08/30/2021 20:39:51 - INFO - __main__ - Step 41566: {'lr': 0.00041689449229350155, 'samples': 7980672, 'steps': 41565, 'loss/train': 1.3865047693252563} -08/30/2021 20:39:51 - INFO - __main__ - Step 41567: {'lr': 0.00041689054117302333, 'samples': 7980864, 'steps': 41566, 'loss/train': 1.9710938930511475} -08/30/2021 20:39:52 - INFO - __main__ - Step 41568: {'lr': 0.00041688658997734675, 'samples': 7981056, 'steps': 41567, 'loss/train': 0.9598851203918457} -08/30/2021 20:39:53 - INFO - __main__ - Step 41569: {'lr': 0.0004168826387064737, 'samples': 7981248, 'steps': 41568, 'loss/train': 1.4870154857635498} -08/30/2021 20:39:54 - INFO - __main__ - Step 41570: {'lr': 0.00041687868736040593, 'samples': 7981440, 'steps': 41569, 'loss/train': 1.1243648529052734} -08/30/2021 20:39:54 - INFO - __main__ - Step 41571: {'lr': 0.0004168747359391451, 'samples': 7981632, 'steps': 41570, 'loss/train': 1.6850124597549438} -08/30/2021 20:39:54 - INFO - __main__ - Step 41572: {'lr': 0.00041687078444269316, 'samples': 7981824, 'steps': 41571, 'loss/train': 1.2938319444656372} -08/30/2021 20:39:55 - INFO - __main__ - Step 41573: {'lr': 0.0004168668328710518, 'samples': 7982016, 'steps': 41572, 'loss/train': 1.5878853797912598} -08/30/2021 20:39:56 - INFO - __main__ - Step 41574: {'lr': 0.0004168628812242228, 'samples': 7982208, 'steps': 41573, 'loss/train': 1.6730941534042358} -08/30/2021 20:39:57 - INFO - __main__ - Step 41575: {'lr': 0.00041685892950220804, 'samples': 7982400, 'steps': 41574, 'loss/train': 1.5698238611221313} -08/30/2021 20:39:57 - INFO - __main__ - Step 41576: {'lr': 0.0004168549777050091, 'samples': 7982592, 'steps': 41575, 'loss/train': 1.30485200881958} -08/30/2021 20:39:57 - INFO - __main__ - Step 41577: {'lr': 0.000416851025832628, 'samples': 7982784, 'steps': 41576, 'loss/train': 1.11117422580719} -08/30/2021 20:39:58 - INFO - __main__ - Step 41578: {'lr': 0.0004168470738850664, 'samples': 7982976, 'steps': 41577, 'loss/train': 1.492432951927185} -08/30/2021 20:39:59 - INFO - __main__ - Step 41579: {'lr': 0.00041684312186232597, 'samples': 7983168, 'steps': 41578, 'loss/train': 1.218453049659729} -08/30/2021 20:40:00 - INFO - __main__ - Step 41580: {'lr': 0.0004168391697644087, 'samples': 7983360, 'steps': 41579, 'loss/train': 1.2426108121871948} -08/30/2021 20:40:00 - INFO - __main__ - Step 41581: {'lr': 0.0004168352175913163, 'samples': 7983552, 'steps': 41580, 'loss/train': 1.7683639526367188} -08/30/2021 20:40:00 - INFO - __main__ - Step 41582: {'lr': 0.00041683126534305037, 'samples': 7983744, 'steps': 41581, 'loss/train': 0.6085885763168335} -08/30/2021 20:40:01 - INFO - __main__ - Step 41583: {'lr': 0.000416827313019613, 'samples': 7983936, 'steps': 41582, 'loss/train': 1.1550097465515137} -08/30/2021 20:40:02 - INFO - __main__ - Step 41584: {'lr': 0.0004168233606210058, 'samples': 7984128, 'steps': 41583, 'loss/train': 0.8691121339797974} -08/30/2021 20:40:03 - INFO - __main__ - Step 41585: {'lr': 0.0004168194081472305, 'samples': 7984320, 'steps': 41584, 'loss/train': 1.0411816835403442} -08/30/2021 20:40:03 - INFO - __main__ - Step 41586: {'lr': 0.000416815455598289, 'samples': 7984512, 'steps': 41585, 'loss/train': 0.1261669099330902} -08/30/2021 20:40:03 - INFO - __main__ - Step 41587: {'lr': 0.000416811502974183, 'samples': 7984704, 'steps': 41586, 'loss/train': 1.4329789876937866} -08/30/2021 20:40:04 - INFO - __main__ - Step 41588: {'lr': 0.00041680755027491433, 'samples': 7984896, 'steps': 41587, 'loss/train': 1.6943320035934448} -08/30/2021 20:40:05 - INFO - __main__ - Step 41589: {'lr': 0.0004168035975004847, 'samples': 7985088, 'steps': 41588, 'loss/train': 1.0669463872909546} -08/30/2021 20:40:06 - INFO - __main__ - Step 41590: {'lr': 0.00041679964465089596, 'samples': 7985280, 'steps': 41589, 'loss/train': 1.1656787395477295} -08/30/2021 20:40:06 - INFO - __main__ - Step 41591: {'lr': 0.00041679569172614996, 'samples': 7985472, 'steps': 41590, 'loss/train': 2.1059494018554688} -08/30/2021 20:40:06 - INFO - __main__ - Step 41592: {'lr': 0.0004167917387262483, 'samples': 7985664, 'steps': 41591, 'loss/train': 1.3925353288650513} -08/30/2021 20:40:07 - INFO - __main__ - Step 41593: {'lr': 0.0004167877856511929, 'samples': 7985856, 'steps': 41592, 'loss/train': 1.4096202850341797} -08/30/2021 20:40:07 - INFO - __main__ - Step 41594: {'lr': 0.0004167838325009855, 'samples': 7986048, 'steps': 41593, 'loss/train': 1.6820869445800781} -08/30/2021 20:40:09 - INFO - __main__ - Step 41595: {'lr': 0.0004167798792756279, 'samples': 7986240, 'steps': 41594, 'loss/train': 1.8147940635681152} -08/30/2021 20:40:09 - INFO - __main__ - Step 41596: {'lr': 0.0004167759259751218, 'samples': 7986432, 'steps': 41595, 'loss/train': 1.5824813842773438} -08/30/2021 20:40:09 - INFO - __main__ - Step 41597: {'lr': 0.0004167719725994691, 'samples': 7986624, 'steps': 41596, 'loss/train': 1.7292206287384033} -08/30/2021 20:40:10 - INFO - __main__ - Step 41598: {'lr': 0.00041676801914867145, 'samples': 7986816, 'steps': 41597, 'loss/train': 0.9773558378219604} -08/30/2021 20:40:10 - INFO - __main__ - Step 41599: {'lr': 0.00041676406562273074, 'samples': 7987008, 'steps': 41598, 'loss/train': 1.4441684484481812} -08/30/2021 20:40:12 - INFO - __main__ - Step 41600: {'lr': 0.00041676011202164875, 'samples': 7987200, 'steps': 41599, 'loss/train': 1.2454993724822998} -08/30/2021 20:40:13 - INFO - __main__ - Step 41601: {'lr': 0.00041675615834542716, 'samples': 7987392, 'steps': 41600, 'loss/train': 1.5815929174423218} -08/30/2021 20:40:13 - INFO - __main__ - Step 41602: {'lr': 0.0004167522045940678, 'samples': 7987584, 'steps': 41601, 'loss/train': 0.09359685331583023} -08/30/2021 20:40:13 - INFO - __main__ - Step 41603: {'lr': 0.0004167482507675726, 'samples': 7987776, 'steps': 41602, 'loss/train': 1.3966649770736694} -08/30/2021 20:40:14 - INFO - __main__ - Step 41604: {'lr': 0.0004167442968659431, 'samples': 7987968, 'steps': 41603, 'loss/train': 1.4776785373687744} -08/30/2021 20:40:16 - INFO - __main__ - Step 41605: {'lr': 0.0004167403428891812, 'samples': 7988160, 'steps': 41604, 'loss/train': 1.1176069974899292} -08/30/2021 20:40:16 - INFO - __main__ - Step 41606: {'lr': 0.00041673638883728877, 'samples': 7988352, 'steps': 41605, 'loss/train': 1.7049412727355957} -08/30/2021 20:40:16 - INFO - __main__ - Step 41607: {'lr': 0.00041673243471026746, 'samples': 7988544, 'steps': 41606, 'loss/train': 1.7950657606124878} -08/30/2021 20:40:17 - INFO - __main__ - Step 41608: {'lr': 0.000416728480508119, 'samples': 7988736, 'steps': 41607, 'loss/train': 0.930979311466217} -08/30/2021 20:40:17 - INFO - __main__ - Step 41609: {'lr': 0.00041672452623084535, 'samples': 7988928, 'steps': 41608, 'loss/train': 0.1624361276626587} -08/30/2021 20:40:19 - INFO - __main__ - Step 41610: {'lr': 0.0004167205718784481, 'samples': 7989120, 'steps': 41609, 'loss/train': 0.1405334174633026} -08/30/2021 20:40:19 - INFO - __main__ - Step 41611: {'lr': 0.0004167166174509293, 'samples': 7989312, 'steps': 41610, 'loss/train': 1.0899964570999146} -08/30/2021 20:40:19 - INFO - __main__ - Step 41612: {'lr': 0.00041671266294829036, 'samples': 7989504, 'steps': 41611, 'loss/train': 1.2400552034378052} -08/30/2021 20:40:20 - INFO - __main__ - Step 41613: {'lr': 0.0004167087083705334, 'samples': 7989696, 'steps': 41612, 'loss/train': 1.4398250579833984} -08/30/2021 20:40:20 - INFO - __main__ - Step 41614: {'lr': 0.00041670475371766, 'samples': 7989888, 'steps': 41613, 'loss/train': 2.004798412322998} -08/30/2021 20:40:22 - INFO - __main__ - Step 41615: {'lr': 0.0004167007989896721, 'samples': 7990080, 'steps': 41614, 'loss/train': 1.3180453777313232} -08/30/2021 20:40:22 - INFO - __main__ - Step 41616: {'lr': 0.0004166968441865714, 'samples': 7990272, 'steps': 41615, 'loss/train': 1.1415334939956665} -08/30/2021 20:40:22 - INFO - __main__ - Step 41617: {'lr': 0.00041669288930835957, 'samples': 7990464, 'steps': 41616, 'loss/train': 1.180234432220459} -08/30/2021 20:40:23 - INFO - __main__ - Step 41618: {'lr': 0.0004166889343550385, 'samples': 7990656, 'steps': 41617, 'loss/train': 1.3564943075180054} -08/30/2021 20:40:23 - INFO - __main__ - Step 41619: {'lr': 0.00041668497932661005, 'samples': 7990848, 'steps': 41618, 'loss/train': 2.0460641384124756} -08/30/2021 20:40:26 - INFO - __main__ - Step 41620: {'lr': 0.00041668102422307593, 'samples': 7991040, 'steps': 41619, 'loss/train': 2.012375593185425} -08/30/2021 20:40:26 - INFO - __main__ - Step 41621: {'lr': 0.0004166770690444378, 'samples': 7991232, 'steps': 41620, 'loss/train': 0.1633165031671524} -08/30/2021 20:40:27 - INFO - __main__ - Step 41622: {'lr': 0.0004166731137906976, 'samples': 7991424, 'steps': 41621, 'loss/train': 0.1540095955133438} -08/30/2021 20:40:27 - INFO - __main__ - Step 41623: {'lr': 0.0004166691584618572, 'samples': 7991616, 'steps': 41622, 'loss/train': 1.4212417602539062} -08/30/2021 20:40:27 - INFO - __main__ - Step 41624: {'lr': 0.00041666520305791806, 'samples': 7991808, 'steps': 41623, 'loss/train': 1.1137620210647583} -08/30/2021 20:40:29 - INFO - __main__ - Step 41625: {'lr': 0.00041666124757888223, 'samples': 7992000, 'steps': 41624, 'loss/train': 1.381408929824829} -08/30/2021 20:40:29 - INFO - __main__ - Step 41626: {'lr': 0.0004166572920247514, 'samples': 7992192, 'steps': 41625, 'loss/train': 2.322394847869873} -08/30/2021 20:40:29 - INFO - __main__ - Step 41627: {'lr': 0.0004166533363955274, 'samples': 7992384, 'steps': 41626, 'loss/train': 1.4913469552993774} -08/30/2021 20:40:30 - INFO - __main__ - Step 41628: {'lr': 0.00041664938069121195, 'samples': 7992576, 'steps': 41627, 'loss/train': 1.10299551486969} -08/30/2021 20:40:30 - INFO - __main__ - Step 41629: {'lr': 0.00041664542491180685, 'samples': 7992768, 'steps': 41628, 'loss/train': 1.6439335346221924} -08/30/2021 20:40:32 - INFO - __main__ - Step 41630: {'lr': 0.0004166414690573139, 'samples': 7992960, 'steps': 41629, 'loss/train': 1.7799092531204224} -08/30/2021 20:40:32 - INFO - __main__ - Step 41631: {'lr': 0.0004166375131277349, 'samples': 7993152, 'steps': 41630, 'loss/train': 1.5723235607147217} -08/30/2021 20:40:33 - INFO - __main__ - Step 41632: {'lr': 0.0004166335571230716, 'samples': 7993344, 'steps': 41631, 'loss/train': 1.0552995204925537} -08/30/2021 20:40:33 - INFO - __main__ - Step 41633: {'lr': 0.0004166296010433258, 'samples': 7993536, 'steps': 41632, 'loss/train': 0.09982667863368988} -08/30/2021 20:40:33 - INFO - __main__ - Step 41634: {'lr': 0.00041662564488849927, 'samples': 7993728, 'steps': 41633, 'loss/train': 1.9106051921844482} -08/30/2021 20:40:35 - INFO - __main__ - Step 41635: {'lr': 0.00041662168865859374, 'samples': 7993920, 'steps': 41634, 'loss/train': 0.09316297620534897} -08/30/2021 20:40:35 - INFO - __main__ - Step 41636: {'lr': 0.0004166177323536111, 'samples': 7994112, 'steps': 41635, 'loss/train': 1.5177817344665527} -08/30/2021 20:40:36 - INFO - __main__ - Step 41637: {'lr': 0.000416613775973553, 'samples': 7994304, 'steps': 41636, 'loss/train': 1.1875720024108887} -08/30/2021 20:40:36 - INFO - __main__ - Step 41638: {'lr': 0.0004166098195184214, 'samples': 7994496, 'steps': 41637, 'loss/train': 0.15914101898670197} -08/30/2021 20:40:36 - INFO - __main__ - Step 41639: {'lr': 0.000416605862988218, 'samples': 7994688, 'steps': 41638, 'loss/train': 1.3329083919525146} -08/30/2021 20:40:37 - INFO - __main__ - Step 41640: {'lr': 0.00041660190638294456, 'samples': 7994880, 'steps': 41639, 'loss/train': 1.1964194774627686} -08/30/2021 20:40:38 - INFO - __main__ - Step 41641: {'lr': 0.0004165979497026028, 'samples': 7995072, 'steps': 41640, 'loss/train': 1.3991683721542358} -08/30/2021 20:40:39 - INFO - __main__ - Step 41642: {'lr': 0.00041659399294719456, 'samples': 7995264, 'steps': 41641, 'loss/train': 0.5802916884422302} -08/30/2021 20:40:39 - INFO - __main__ - Step 41643: {'lr': 0.00041659003611672175, 'samples': 7995456, 'steps': 41642, 'loss/train': 1.4516220092773438} -08/30/2021 20:40:39 - INFO - __main__ - Step 41644: {'lr': 0.000416586079211186, 'samples': 7995648, 'steps': 41643, 'loss/train': 0.95184326171875} -08/30/2021 20:40:40 - INFO - __main__ - Step 41645: {'lr': 0.0004165821222305891, 'samples': 7995840, 'steps': 41644, 'loss/train': 2.0189318656921387} -08/30/2021 20:40:42 - INFO - __main__ - Step 41646: {'lr': 0.00041657816517493284, 'samples': 7996032, 'steps': 41645, 'loss/train': 1.3277875185012817} -08/30/2021 20:40:42 - INFO - __main__ - Step 41647: {'lr': 0.00041657420804421907, 'samples': 7996224, 'steps': 41646, 'loss/train': 0.09014960378408432} -08/30/2021 20:40:42 - INFO - __main__ - Step 41648: {'lr': 0.00041657025083844957, 'samples': 7996416, 'steps': 41647, 'loss/train': 1.9317916631698608} -08/30/2021 20:40:43 - INFO - __main__ - Step 41649: {'lr': 0.00041656629355762607, 'samples': 7996608, 'steps': 41648, 'loss/train': 3.170945882797241} -08/30/2021 20:40:43 - INFO - __main__ - Step 41650: {'lr': 0.00041656233620175035, 'samples': 7996800, 'steps': 41649, 'loss/train': 1.0516948699951172} -08/30/2021 20:40:45 - INFO - __main__ - Step 41651: {'lr': 0.0004165583787708242, 'samples': 7996992, 'steps': 41650, 'loss/train': 1.4989819526672363} -08/30/2021 20:40:45 - INFO - __main__ - Step 41652: {'lr': 0.0004165544212648494, 'samples': 7997184, 'steps': 41651, 'loss/train': 1.1397823095321655} -08/30/2021 20:40:45 - INFO - __main__ - Step 41653: {'lr': 0.0004165504636838278, 'samples': 7997376, 'steps': 41652, 'loss/train': 1.192221760749817} -08/30/2021 20:40:46 - INFO - __main__ - Step 41654: {'lr': 0.0004165465060277611, 'samples': 7997568, 'steps': 41653, 'loss/train': 1.7243061065673828} -08/30/2021 20:40:46 - INFO - __main__ - Step 41655: {'lr': 0.0004165425482966512, 'samples': 7997760, 'steps': 41654, 'loss/train': 1.3988286256790161} -08/30/2021 20:40:48 - INFO - __main__ - Step 41656: {'lr': 0.00041653859049049964, 'samples': 7997952, 'steps': 41655, 'loss/train': 1.3119416236877441} -08/30/2021 20:40:48 - INFO - __main__ - Step 41657: {'lr': 0.00041653463260930845, 'samples': 7998144, 'steps': 41656, 'loss/train': 0.28657767176628113} -08/30/2021 20:40:48 - INFO - __main__ - Step 41658: {'lr': 0.00041653067465307925, 'samples': 7998336, 'steps': 41657, 'loss/train': 1.3334693908691406} -08/30/2021 20:40:49 - INFO - __main__ - Step 41659: {'lr': 0.00041652671662181394, 'samples': 7998528, 'steps': 41658, 'loss/train': 2.8703110218048096} -08/30/2021 20:40:49 - INFO - __main__ - Step 41660: {'lr': 0.00041652275851551435, 'samples': 7998720, 'steps': 41659, 'loss/train': 1.5845590829849243} -08/30/2021 20:40:51 - INFO - __main__ - Step 41661: {'lr': 0.0004165188003341821, 'samples': 7998912, 'steps': 41660, 'loss/train': 1.2762160301208496} -08/30/2021 20:40:51 - INFO - __main__ - Step 41662: {'lr': 0.0004165148420778191, 'samples': 7999104, 'steps': 41661, 'loss/train': 1.0728442668914795} -08/30/2021 20:40:52 - INFO - __main__ - Step 41663: {'lr': 0.000416510883746427, 'samples': 7999296, 'steps': 41662, 'loss/train': 1.3767396211624146} -08/30/2021 20:40:52 - INFO - __main__ - Step 41664: {'lr': 0.00041650692534000766, 'samples': 7999488, 'steps': 41663, 'loss/train': 1.7291936874389648} -08/30/2021 20:40:53 - INFO - __main__ - Step 41665: {'lr': 0.0004165029668585629, 'samples': 7999680, 'steps': 41664, 'loss/train': 1.774588942527771} -08/30/2021 20:40:53 - INFO - __main__ - Step 41666: {'lr': 0.00041649900830209455, 'samples': 7999872, 'steps': 41665, 'loss/train': 1.6639882326126099} -08/30/2021 20:40:54 - INFO - __main__ - Step 41667: {'lr': 0.00041649504967060423, 'samples': 8000064, 'steps': 41666, 'loss/train': 0.029390107840299606} -08/30/2021 20:40:55 - INFO - __main__ - Step 41668: {'lr': 0.0004164910909640938, 'samples': 8000256, 'steps': 41667, 'loss/train': 1.9860399961471558} -08/30/2021 20:40:55 - INFO - __main__ - Step 41669: {'lr': 0.0004164871321825651, 'samples': 8000448, 'steps': 41668, 'loss/train': 1.43567955493927} -08/30/2021 20:40:56 - INFO - __main__ - Step 41670: {'lr': 0.0004164831733260198, 'samples': 8000640, 'steps': 41669, 'loss/train': 1.5842734575271606} -08/30/2021 20:40:56 - INFO - __main__ - Step 41671: {'lr': 0.0004164792143944598, 'samples': 8000832, 'steps': 41670, 'loss/train': 1.0877556800842285} -08/30/2021 20:40:58 - INFO - __main__ - Step 41672: {'lr': 0.0004164752553878868, 'samples': 8001024, 'steps': 41671, 'loss/train': 1.483295202255249} -08/30/2021 20:40:59 - INFO - __main__ - Step 41673: {'lr': 0.00041647129630630265, 'samples': 8001216, 'steps': 41672, 'loss/train': 1.4576988220214844} -08/30/2021 20:40:59 - INFO - __main__ - Step 41674: {'lr': 0.0004164673371497092, 'samples': 8001408, 'steps': 41673, 'loss/train': 1.1592954397201538} -08/30/2021 20:40:59 - INFO - __main__ - Step 41675: {'lr': 0.000416463377918108, 'samples': 8001600, 'steps': 41674, 'loss/train': 1.2738759517669678} -08/30/2021 20:41:00 - INFO - __main__ - Step 41676: {'lr': 0.00041645941861150103, 'samples': 8001792, 'steps': 41675, 'loss/train': 1.7697786092758179} -08/30/2021 20:41:01 - INFO - __main__ - Step 41677: {'lr': 0.00041645545922989, 'samples': 8001984, 'steps': 41676, 'loss/train': 1.461212158203125} -08/30/2021 20:41:02 - INFO - __main__ - Step 41678: {'lr': 0.00041645149977327667, 'samples': 8002176, 'steps': 41677, 'loss/train': 1.5270456075668335} -08/30/2021 20:41:02 - INFO - __main__ - Step 41679: {'lr': 0.0004164475402416629, 'samples': 8002368, 'steps': 41678, 'loss/train': 1.594008207321167} -08/30/2021 20:41:02 - INFO - __main__ - Step 41680: {'lr': 0.0004164435806350505, 'samples': 8002560, 'steps': 41679, 'loss/train': 1.2985014915466309} -08/30/2021 20:41:03 - INFO - __main__ - Step 41681: {'lr': 0.00041643962095344107, 'samples': 8002752, 'steps': 41680, 'loss/train': 1.9186331033706665} -08/30/2021 20:41:03 - INFO - __main__ - Step 41682: {'lr': 0.0004164356611968366, 'samples': 8002944, 'steps': 41681, 'loss/train': 2.1798055171966553} -08/30/2021 20:41:04 - INFO - __main__ - Step 41683: {'lr': 0.0004164317013652387, 'samples': 8003136, 'steps': 41682, 'loss/train': 1.7911888360977173} -08/30/2021 20:41:05 - INFO - __main__ - Step 41684: {'lr': 0.00041642774145864934, 'samples': 8003328, 'steps': 41683, 'loss/train': 1.2257550954818726} -08/30/2021 20:41:05 - INFO - __main__ - Step 41685: {'lr': 0.00041642378147707014, 'samples': 8003520, 'steps': 41684, 'loss/train': 1.4834332466125488} -08/30/2021 20:41:06 - INFO - __main__ - Step 41686: {'lr': 0.00041641982142050297, 'samples': 8003712, 'steps': 41685, 'loss/train': 2.2028777599334717} -08/30/2021 20:41:06 - INFO - __main__ - Step 41687: {'lr': 0.00041641586128894967, 'samples': 8003904, 'steps': 41686, 'loss/train': 1.3898755311965942} -08/30/2021 20:41:07 - INFO - __main__ - Step 41688: {'lr': 0.0004164119010824119, 'samples': 8004096, 'steps': 41687, 'loss/train': 1.174214243888855} -08/30/2021 20:41:08 - INFO - __main__ - Step 41689: {'lr': 0.00041640794080089144, 'samples': 8004288, 'steps': 41688, 'loss/train': 0.9038873314857483} -08/30/2021 20:41:08 - INFO - __main__ - Step 41690: {'lr': 0.0004164039804443902, 'samples': 8004480, 'steps': 41689, 'loss/train': 1.2460660934448242} -08/30/2021 20:41:09 - INFO - __main__ - Step 41691: {'lr': 0.0004164000200129099, 'samples': 8004672, 'steps': 41690, 'loss/train': 1.462849736213684} -08/30/2021 20:41:09 - INFO - __main__ - Step 41692: {'lr': 0.0004163960595064522, 'samples': 8004864, 'steps': 41691, 'loss/train': 0.45430922508239746} -08/30/2021 20:41:11 - INFO - __main__ - Step 41693: {'lr': 0.00041639209892501913, 'samples': 8005056, 'steps': 41692, 'loss/train': 1.3535102605819702} -08/30/2021 20:41:11 - INFO - __main__ - Step 41694: {'lr': 0.00041638813826861234, 'samples': 8005248, 'steps': 41693, 'loss/train': 0.0332728773355484} -08/30/2021 20:41:12 - INFO - __main__ - Step 41695: {'lr': 0.00041638417753723356, 'samples': 8005440, 'steps': 41694, 'loss/train': 0.026177937164902687} -08/30/2021 20:41:12 - INFO - __main__ - Step 41696: {'lr': 0.00041638021673088464, 'samples': 8005632, 'steps': 41695, 'loss/train': 0.538514256477356} -08/30/2021 20:41:12 - INFO - __main__ - Step 41697: {'lr': 0.0004163762558495674, 'samples': 8005824, 'steps': 41696, 'loss/train': 1.7629307508468628} -08/30/2021 20:41:13 - INFO - __main__ - Step 41698: {'lr': 0.0004163722948932836, 'samples': 8006016, 'steps': 41697, 'loss/train': 1.450182557106018} -08/30/2021 20:41:14 - INFO - __main__ - Step 41699: {'lr': 0.000416368333862035, 'samples': 8006208, 'steps': 41698, 'loss/train': 1.321563482284546} -08/30/2021 20:41:15 - INFO - __main__ - Step 41700: {'lr': 0.00041636437275582335, 'samples': 8006400, 'steps': 41699, 'loss/train': 0.8955653309822083} -08/30/2021 20:41:15 - INFO - __main__ - Step 41701: {'lr': 0.00041636041157465056, 'samples': 8006592, 'steps': 41700, 'loss/train': 1.5074267387390137} -08/30/2021 20:41:16 - INFO - __main__ - Step 41702: {'lr': 0.00041635645031851826, 'samples': 8006784, 'steps': 41701, 'loss/train': 0.4653592109680176} -08/30/2021 20:41:16 - INFO - __main__ - Step 41703: {'lr': 0.00041635248898742834, 'samples': 8006976, 'steps': 41702, 'loss/train': 1.423519253730774} -08/30/2021 20:41:17 - INFO - __main__ - Step 41704: {'lr': 0.00041634852758138253, 'samples': 8007168, 'steps': 41703, 'loss/train': 1.2567559480667114} -08/30/2021 20:41:18 - INFO - __main__ - Step 41705: {'lr': 0.0004163445661003827, 'samples': 8007360, 'steps': 41704, 'loss/train': 0.8124480247497559} -08/30/2021 20:41:18 - INFO - __main__ - Step 41706: {'lr': 0.0004163406045444306, 'samples': 8007552, 'steps': 41705, 'loss/train': 1.2445435523986816} -08/30/2021 20:41:18 - INFO - __main__ - Step 41707: {'lr': 0.0004163366429135279, 'samples': 8007744, 'steps': 41706, 'loss/train': 1.383264183998108} -08/30/2021 20:41:19 - INFO - __main__ - Step 41708: {'lr': 0.00041633268120767653, 'samples': 8007936, 'steps': 41707, 'loss/train': 1.9784590005874634} -08/30/2021 20:41:20 - INFO - __main__ - Step 41709: {'lr': 0.00041632871942687814, 'samples': 8008128, 'steps': 41708, 'loss/train': 1.3793046474456787} -08/30/2021 20:41:21 - INFO - __main__ - Step 41710: {'lr': 0.00041632475757113466, 'samples': 8008320, 'steps': 41709, 'loss/train': 1.2249361276626587} -08/30/2021 20:41:21 - INFO - __main__ - Step 41711: {'lr': 0.00041632079564044776, 'samples': 8008512, 'steps': 41710, 'loss/train': 1.6648656129837036} -08/30/2021 20:41:21 - INFO - __main__ - Step 41712: {'lr': 0.0004163168336348194, 'samples': 8008704, 'steps': 41711, 'loss/train': 1.4305875301361084} -08/30/2021 20:41:22 - INFO - __main__ - Step 41713: {'lr': 0.00041631287155425114, 'samples': 8008896, 'steps': 41712, 'loss/train': 1.3651845455169678} -08/30/2021 20:41:23 - INFO - __main__ - Step 41714: {'lr': 0.0004163089093987449, 'samples': 8009088, 'steps': 41713, 'loss/train': 0.8557790517807007} -08/30/2021 20:41:24 - INFO - __main__ - Step 41715: {'lr': 0.00041630494716830244, 'samples': 8009280, 'steps': 41714, 'loss/train': 1.4982314109802246} -08/30/2021 20:41:24 - INFO - __main__ - Step 41716: {'lr': 0.00041630098486292546, 'samples': 8009472, 'steps': 41715, 'loss/train': 1.1822165250778198} -08/30/2021 20:41:24 - INFO - __main__ - Step 41717: {'lr': 0.0004162970224826159, 'samples': 8009664, 'steps': 41716, 'loss/train': 0.06584852933883667} -08/30/2021 20:41:25 - INFO - __main__ - Step 41718: {'lr': 0.0004162930600273754, 'samples': 8009856, 'steps': 41717, 'loss/train': 1.3209549188613892} -08/30/2021 20:41:25 - INFO - __main__ - Step 41719: {'lr': 0.0004162890974972059, 'samples': 8010048, 'steps': 41718, 'loss/train': 1.4217456579208374} -08/30/2021 20:41:27 - INFO - __main__ - Step 41720: {'lr': 0.00041628513489210906, 'samples': 8010240, 'steps': 41719, 'loss/train': 1.3186596632003784} -08/30/2021 20:41:27 - INFO - __main__ - Step 41721: {'lr': 0.0004162811722120867, 'samples': 8010432, 'steps': 41720, 'loss/train': 0.04912729561328888} -08/30/2021 20:41:28 - INFO - __main__ - Step 41722: {'lr': 0.00041627720945714065, 'samples': 8010624, 'steps': 41721, 'loss/train': 1.4928698539733887} -08/30/2021 20:41:28 - INFO - __main__ - Step 41723: {'lr': 0.00041627324662727263, 'samples': 8010816, 'steps': 41722, 'loss/train': 1.291818618774414} -08/30/2021 20:41:28 - INFO - __main__ - Step 41724: {'lr': 0.0004162692837224844, 'samples': 8011008, 'steps': 41723, 'loss/train': 0.8185926675796509} -08/30/2021 20:41:30 - INFO - __main__ - Step 41725: {'lr': 0.00041626532074277785, 'samples': 8011200, 'steps': 41724, 'loss/train': 2.1224584579467773} -08/30/2021 20:41:31 - INFO - __main__ - Step 41726: {'lr': 0.00041626135768815467, 'samples': 8011392, 'steps': 41725, 'loss/train': 1.2835928201675415} -08/30/2021 20:41:31 - INFO - __main__ - Step 41727: {'lr': 0.0004162573945586168, 'samples': 8011584, 'steps': 41726, 'loss/train': 1.151503324508667} -08/30/2021 20:41:32 - INFO - __main__ - Step 41728: {'lr': 0.0004162534313541658, 'samples': 8011776, 'steps': 41727, 'loss/train': 1.7242884635925293} -08/30/2021 20:41:32 - INFO - __main__ - Step 41729: {'lr': 0.00041624946807480357, 'samples': 8011968, 'steps': 41728, 'loss/train': 1.2168521881103516} -08/30/2021 20:41:34 - INFO - __main__ - Step 41730: {'lr': 0.0004162455047205319, 'samples': 8012160, 'steps': 41729, 'loss/train': 1.6182444095611572} -08/30/2021 20:41:34 - INFO - __main__ - Step 41731: {'lr': 0.0004162415412913526, 'samples': 8012352, 'steps': 41730, 'loss/train': 1.455169439315796} -08/30/2021 20:41:34 - INFO - __main__ - Step 41732: {'lr': 0.00041623757778726743, 'samples': 8012544, 'steps': 41731, 'loss/train': 1.88149893283844} -08/30/2021 20:41:35 - INFO - __main__ - Step 41733: {'lr': 0.00041623361420827816, 'samples': 8012736, 'steps': 41732, 'loss/train': 1.9368934631347656} -08/30/2021 20:41:35 - INFO - __main__ - Step 41734: {'lr': 0.0004162296505543867, 'samples': 8012928, 'steps': 41733, 'loss/train': 1.6959967613220215} -08/30/2021 20:41:37 - INFO - __main__ - Step 41735: {'lr': 0.00041622568682559455, 'samples': 8013120, 'steps': 41734, 'loss/train': 1.5027997493743896} -08/30/2021 20:41:37 - INFO - __main__ - Step 41736: {'lr': 0.0004162217230219038, 'samples': 8013312, 'steps': 41735, 'loss/train': 1.6844298839569092} -08/30/2021 20:41:38 - INFO - __main__ - Step 41737: {'lr': 0.00041621775914331595, 'samples': 8013504, 'steps': 41736, 'loss/train': 1.9245612621307373} -08/30/2021 20:41:38 - INFO - __main__ - Step 41738: {'lr': 0.00041621379518983306, 'samples': 8013696, 'steps': 41737, 'loss/train': 1.6410257816314697} -08/30/2021 20:41:38 - INFO - __main__ - Step 41739: {'lr': 0.00041620983116145673, 'samples': 8013888, 'steps': 41738, 'loss/train': 1.424729585647583} -08/30/2021 20:41:39 - INFO - __main__ - Step 41740: {'lr': 0.00041620586705818887, 'samples': 8014080, 'steps': 41739, 'loss/train': 0.9353100657463074} -08/30/2021 20:41:40 - INFO - __main__ - Step 41741: {'lr': 0.00041620190288003126, 'samples': 8014272, 'steps': 41740, 'loss/train': 1.457993507385254} -08/30/2021 20:41:41 - INFO - __main__ - Step 41742: {'lr': 0.00041619793862698553, 'samples': 8014464, 'steps': 41741, 'loss/train': 1.6768105030059814} -08/30/2021 20:41:41 - INFO - __main__ - Step 41743: {'lr': 0.00041619397429905363, 'samples': 8014656, 'steps': 41742, 'loss/train': 1.489015817642212} -08/30/2021 20:41:42 - INFO - __main__ - Step 41744: {'lr': 0.0004161900098962373, 'samples': 8014848, 'steps': 41743, 'loss/train': 1.8153353929519653} -08/30/2021 20:41:42 - INFO - __main__ - Step 41745: {'lr': 0.00041618604541853826, 'samples': 8015040, 'steps': 41744, 'loss/train': 0.9990391135215759} -08/30/2021 20:41:44 - INFO - __main__ - Step 41746: {'lr': 0.00041618208086595843, 'samples': 8015232, 'steps': 41745, 'loss/train': 0.48116764426231384} -08/30/2021 20:41:44 - INFO - __main__ - Step 41747: {'lr': 0.0004161781162384994, 'samples': 8015424, 'steps': 41746, 'loss/train': 1.7746678590774536} -08/30/2021 20:41:44 - INFO - __main__ - Step 41748: {'lr': 0.00041617415153616323, 'samples': 8015616, 'steps': 41747, 'loss/train': 0.4191964268684387} -08/30/2021 20:41:45 - INFO - __main__ - Step 41749: {'lr': 0.00041617018675895145, 'samples': 8015808, 'steps': 41748, 'loss/train': 0.8925157785415649} -08/30/2021 20:41:45 - INFO - __main__ - Step 41750: {'lr': 0.00041616622190686597, 'samples': 8016000, 'steps': 41749, 'loss/train': 1.9171894788742065} -08/30/2021 20:41:47 - INFO - __main__ - Step 41751: {'lr': 0.0004161622569799086, 'samples': 8016192, 'steps': 41750, 'loss/train': 0.05079185962677002} -08/30/2021 20:41:47 - INFO - __main__ - Step 41752: {'lr': 0.00041615829197808095, 'samples': 8016384, 'steps': 41751, 'loss/train': 1.4282255172729492} -08/30/2021 20:41:48 - INFO - __main__ - Step 41753: {'lr': 0.0004161543269013851, 'samples': 8016576, 'steps': 41752, 'loss/train': 0.18148311972618103} -08/30/2021 20:41:48 - INFO - __main__ - Step 41754: {'lr': 0.0004161503617498226, 'samples': 8016768, 'steps': 41753, 'loss/train': 1.6366389989852905} -08/30/2021 20:41:49 - INFO - __main__ - Step 41755: {'lr': 0.00041614639652339533, 'samples': 8016960, 'steps': 41754, 'loss/train': 1.260956048965454} -08/30/2021 20:41:49 - INFO - __main__ - Step 41756: {'lr': 0.00041614243122210505, 'samples': 8017152, 'steps': 41755, 'loss/train': 0.8986827731132507} -08/30/2021 20:41:50 - INFO - __main__ - Step 41757: {'lr': 0.0004161384658459535, 'samples': 8017344, 'steps': 41756, 'loss/train': 1.7238725423812866} -08/30/2021 20:41:51 - INFO - __main__ - Step 41758: {'lr': 0.0004161345003949426, 'samples': 8017536, 'steps': 41757, 'loss/train': 1.31426203250885} -08/30/2021 20:41:51 - INFO - __main__ - Step 41759: {'lr': 0.00041613053486907396, 'samples': 8017728, 'steps': 41758, 'loss/train': 1.3150458335876465} -08/30/2021 20:41:52 - INFO - __main__ - Step 41760: {'lr': 0.0004161265692683496, 'samples': 8017920, 'steps': 41759, 'loss/train': 1.899686574935913} -08/30/2021 20:41:52 - INFO - __main__ - Step 41761: {'lr': 0.0004161226035927711, 'samples': 8018112, 'steps': 41760, 'loss/train': 2.4361443519592285} -08/30/2021 20:41:53 - INFO - __main__ - Step 41762: {'lr': 0.0004161186378423403, 'samples': 8018304, 'steps': 41761, 'loss/train': 0.9371394515037537} -08/30/2021 20:41:54 - INFO - __main__ - Step 41763: {'lr': 0.000416114672017059, 'samples': 8018496, 'steps': 41762, 'loss/train': 1.2019520998001099} -08/30/2021 20:41:54 - INFO - __main__ - Step 41764: {'lr': 0.000416110706116929, 'samples': 8018688, 'steps': 41763, 'loss/train': 1.0509260892868042} -08/30/2021 20:41:55 - INFO - __main__ - Step 41765: {'lr': 0.0004161067401419521, 'samples': 8018880, 'steps': 41764, 'loss/train': 1.5440552234649658} -08/30/2021 20:41:55 - INFO - __main__ - Step 41766: {'lr': 0.00041610277409213003, 'samples': 8019072, 'steps': 41765, 'loss/train': 1.3422781229019165} -08/30/2021 20:41:57 - INFO - __main__ - Step 41767: {'lr': 0.00041609880796746463, 'samples': 8019264, 'steps': 41766, 'loss/train': 1.0526846647262573} -08/30/2021 20:41:57 - INFO - __main__ - Step 41768: {'lr': 0.00041609484176795774, 'samples': 8019456, 'steps': 41767, 'loss/train': 1.498138666152954} -08/30/2021 20:41:57 - INFO - __main__ - Step 41769: {'lr': 0.000416090875493611, 'samples': 8019648, 'steps': 41768, 'loss/train': 0.9550386071205139} -08/30/2021 20:41:58 - INFO - __main__ - Step 41770: {'lr': 0.0004160869091444263, 'samples': 8019840, 'steps': 41769, 'loss/train': 1.6613816022872925} -08/30/2021 20:41:58 - INFO - __main__ - Step 41771: {'lr': 0.0004160829427204054, 'samples': 8020032, 'steps': 41770, 'loss/train': 0.5467845797538757} -08/30/2021 20:42:00 - INFO - __main__ - Step 41772: {'lr': 0.00041607897622155006, 'samples': 8020224, 'steps': 41771, 'loss/train': 1.3568012714385986} -08/30/2021 20:42:00 - INFO - __main__ - Step 41773: {'lr': 0.00041607500964786217, 'samples': 8020416, 'steps': 41772, 'loss/train': 1.6734267473220825} -08/30/2021 20:42:00 - INFO - __main__ - Step 41774: {'lr': 0.0004160710429993434, 'samples': 8020608, 'steps': 41773, 'loss/train': 1.9361891746520996} -08/30/2021 20:42:01 - INFO - __main__ - Step 41775: {'lr': 0.00041606707627599556, 'samples': 8020800, 'steps': 41774, 'loss/train': 1.5149098634719849} -08/30/2021 20:42:01 - INFO - __main__ - Step 41776: {'lr': 0.00041606310947782046, 'samples': 8020992, 'steps': 41775, 'loss/train': 1.3088252544403076} -08/30/2021 20:42:03 - INFO - __main__ - Step 41777: {'lr': 0.0004160591426048199, 'samples': 8021184, 'steps': 41776, 'loss/train': 1.2729098796844482} -08/30/2021 20:42:03 - INFO - __main__ - Step 41778: {'lr': 0.00041605517565699565, 'samples': 8021376, 'steps': 41777, 'loss/train': 1.208472728729248} -08/30/2021 20:42:03 - INFO - __main__ - Step 41779: {'lr': 0.00041605120863434945, 'samples': 8021568, 'steps': 41778, 'loss/train': 1.831836223602295} -08/30/2021 20:42:04 - INFO - __main__ - Step 41780: {'lr': 0.0004160472415368832, 'samples': 8021760, 'steps': 41779, 'loss/train': 1.271667718887329} -08/30/2021 20:42:04 - INFO - __main__ - Step 41781: {'lr': 0.00041604327436459864, 'samples': 8021952, 'steps': 41780, 'loss/train': 1.7045323848724365} -08/30/2021 20:42:04 - INFO - __main__ - Step 41782: {'lr': 0.0004160393071174975, 'samples': 8022144, 'steps': 41781, 'loss/train': 0.5790306329727173} -08/30/2021 20:42:07 - INFO - __main__ - Step 41783: {'lr': 0.00041603533979558163, 'samples': 8022336, 'steps': 41782, 'loss/train': 0.6085450649261475} -08/30/2021 20:42:07 - INFO - __main__ - Step 41784: {'lr': 0.0004160313723988528, 'samples': 8022528, 'steps': 41783, 'loss/train': 0.17379771173000336} -08/30/2021 20:42:07 - INFO - __main__ - Step 41785: {'lr': 0.00041602740492731284, 'samples': 8022720, 'steps': 41784, 'loss/train': 1.8490116596221924} -08/30/2021 20:42:08 - INFO - __main__ - Step 41786: {'lr': 0.0004160234373809634, 'samples': 8022912, 'steps': 41785, 'loss/train': 1.3827310800552368} -08/30/2021 20:42:08 - INFO - __main__ - Step 41787: {'lr': 0.0004160194697598064, 'samples': 8023104, 'steps': 41786, 'loss/train': 1.4580172300338745} -08/30/2021 20:42:10 - INFO - __main__ - Step 41788: {'lr': 0.0004160155020638436, 'samples': 8023296, 'steps': 41787, 'loss/train': 1.7783116102218628} -08/30/2021 20:42:10 - INFO - __main__ - Step 41789: {'lr': 0.0004160115342930768, 'samples': 8023488, 'steps': 41788, 'loss/train': 2.2475783824920654} -08/30/2021 20:42:10 - INFO - __main__ - Step 41790: {'lr': 0.0004160075664475077, 'samples': 8023680, 'steps': 41789, 'loss/train': 1.2616629600524902} -08/30/2021 20:42:11 - INFO - __main__ - Step 41791: {'lr': 0.0004160035985271382, 'samples': 8023872, 'steps': 41790, 'loss/train': 0.49890244007110596} -08/30/2021 20:42:11 - INFO - __main__ - Step 41792: {'lr': 0.00041599963053196997, 'samples': 8024064, 'steps': 41791, 'loss/train': 2.033851385116577} -08/30/2021 20:42:13 - INFO - __main__ - Step 41793: {'lr': 0.0004159956624620049, 'samples': 8024256, 'steps': 41792, 'loss/train': 1.469059944152832} -08/30/2021 20:42:13 - INFO - __main__ - Step 41794: {'lr': 0.0004159916943172448, 'samples': 8024448, 'steps': 41793, 'loss/train': 1.3045949935913086} -08/30/2021 20:42:14 - INFO - __main__ - Step 41795: {'lr': 0.0004159877260976914, 'samples': 8024640, 'steps': 41794, 'loss/train': 1.591121792793274} -08/30/2021 20:42:14 - INFO - __main__ - Step 41796: {'lr': 0.00041598375780334653, 'samples': 8024832, 'steps': 41795, 'loss/train': 0.847492516040802} -08/30/2021 20:42:14 - INFO - __main__ - Step 41797: {'lr': 0.0004159797894342118, 'samples': 8025024, 'steps': 41796, 'loss/train': 1.1704052686691284} -08/30/2021 20:42:16 - INFO - __main__ - Step 41798: {'lr': 0.0004159758209902892, 'samples': 8025216, 'steps': 41797, 'loss/train': 1.4010660648345947} -08/30/2021 20:42:16 - INFO - __main__ - Step 41799: {'lr': 0.00041597185247158053, 'samples': 8025408, 'steps': 41798, 'loss/train': 0.780902624130249} -08/30/2021 20:42:17 - INFO - __main__ - Step 41800: {'lr': 0.0004159678838780874, 'samples': 8025600, 'steps': 41799, 'loss/train': 1.338391900062561} -08/30/2021 20:42:17 - INFO - __main__ - Step 41801: {'lr': 0.0004159639152098118, 'samples': 8025792, 'steps': 41800, 'loss/train': 1.3567825555801392} -08/30/2021 20:42:17 - INFO - __main__ - Step 41802: {'lr': 0.00041595994646675537, 'samples': 8025984, 'steps': 41801, 'loss/train': 1.3682771921157837} -08/30/2021 20:42:18 - INFO - __main__ - Step 41803: {'lr': 0.0004159559776489199, 'samples': 8026176, 'steps': 41802, 'loss/train': 1.5757153034210205} -08/30/2021 20:42:19 - INFO - __main__ - Step 41804: {'lr': 0.00041595200875630734, 'samples': 8026368, 'steps': 41803, 'loss/train': 0.9679489135742188} -08/30/2021 20:42:19 - INFO - __main__ - Step 41805: {'lr': 0.00041594803978891925, 'samples': 8026560, 'steps': 41804, 'loss/train': 1.078711986541748} -08/30/2021 20:42:20 - INFO - __main__ - Step 41806: {'lr': 0.00041594407074675753, 'samples': 8026752, 'steps': 41805, 'loss/train': 1.5219484567642212} -08/30/2021 20:42:20 - INFO - __main__ - Step 41807: {'lr': 0.0004159401016298241, 'samples': 8026944, 'steps': 41806, 'loss/train': 2.496682643890381} -08/30/2021 20:42:21 - INFO - __main__ - Step 41808: {'lr': 0.0004159361324381206, 'samples': 8027136, 'steps': 41807, 'loss/train': 1.4242775440216064} -08/30/2021 20:42:22 - INFO - __main__ - Step 41809: {'lr': 0.0004159321631716487, 'samples': 8027328, 'steps': 41808, 'loss/train': 1.583635926246643} -08/30/2021 20:42:23 - INFO - __main__ - Step 41810: {'lr': 0.00041592819383041047, 'samples': 8027520, 'steps': 41809, 'loss/train': 1.483121633529663} -08/30/2021 20:42:23 - INFO - __main__ - Step 41811: {'lr': 0.0004159242244144075, 'samples': 8027712, 'steps': 41810, 'loss/train': 1.496715784072876} -08/30/2021 20:42:24 - INFO - __main__ - Step 41812: {'lr': 0.0004159202549236416, 'samples': 8027904, 'steps': 41811, 'loss/train': 1.4398528337478638} -08/30/2021 20:42:24 - INFO - __main__ - Step 41813: {'lr': 0.00041591628535811464, 'samples': 8028096, 'steps': 41812, 'loss/train': 0.08508310467004776} -08/30/2021 20:42:24 - INFO - __main__ - Step 41814: {'lr': 0.00041591231571782834, 'samples': 8028288, 'steps': 41813, 'loss/train': 0.26660722494125366} -08/30/2021 20:42:26 - INFO - __main__ - Step 41815: {'lr': 0.0004159083460027845, 'samples': 8028480, 'steps': 41814, 'loss/train': 1.042811632156372} -08/30/2021 20:42:26 - INFO - __main__ - Step 41816: {'lr': 0.000415904376212985, 'samples': 8028672, 'steps': 41815, 'loss/train': 1.7438234090805054} -08/30/2021 20:42:27 - INFO - __main__ - Step 41817: {'lr': 0.00041590040634843144, 'samples': 8028864, 'steps': 41816, 'loss/train': 1.9059609174728394} -08/30/2021 20:42:27 - INFO - __main__ - Step 41818: {'lr': 0.00041589643640912576, 'samples': 8029056, 'steps': 41817, 'loss/train': 1.4541925191879272} -08/30/2021 20:42:27 - INFO - __main__ - Step 41819: {'lr': 0.0004158924663950697, 'samples': 8029248, 'steps': 41818, 'loss/train': 1.4391422271728516} -08/30/2021 20:42:29 - INFO - __main__ - Step 41820: {'lr': 0.00041588849630626513, 'samples': 8029440, 'steps': 41819, 'loss/train': 1.200029969215393} -08/30/2021 20:42:29 - INFO - __main__ - Step 41821: {'lr': 0.00041588452614271364, 'samples': 8029632, 'steps': 41820, 'loss/train': 1.5291684865951538} -08/30/2021 20:42:30 - INFO - __main__ - Step 41822: {'lr': 0.00041588055590441726, 'samples': 8029824, 'steps': 41821, 'loss/train': 1.3797036409378052} -08/30/2021 20:42:30 - INFO - __main__ - Step 41823: {'lr': 0.0004158765855913776, 'samples': 8030016, 'steps': 41822, 'loss/train': 1.2176798582077026} -08/30/2021 20:42:31 - INFO - __main__ - Step 41824: {'lr': 0.0004158726152035965, 'samples': 8030208, 'steps': 41823, 'loss/train': 1.4863344430923462} -08/30/2021 20:42:33 - INFO - __main__ - Step 41825: {'lr': 0.00041586864474107575, 'samples': 8030400, 'steps': 41824, 'loss/train': 1.5318057537078857} -08/30/2021 20:42:34 - INFO - __main__ - Step 41826: {'lr': 0.0004158646742038172, 'samples': 8030592, 'steps': 41825, 'loss/train': 1.7026723623275757} -08/30/2021 20:42:34 - INFO - __main__ - Step 41827: {'lr': 0.00041586070359182255, 'samples': 8030784, 'steps': 41826, 'loss/train': 1.4229241609573364} -08/30/2021 20:42:35 - INFO - __main__ - Step 41828: {'lr': 0.00041585673290509364, 'samples': 8030976, 'steps': 41827, 'loss/train': 1.519781231880188} -08/30/2021 20:42:35 - INFO - __main__ - Step 41829: {'lr': 0.0004158527621436322, 'samples': 8031168, 'steps': 41828, 'loss/train': 1.8084534406661987} -08/30/2021 20:42:35 - INFO - __main__ - Step 41830: {'lr': 0.0004158487913074401, 'samples': 8031360, 'steps': 41829, 'loss/train': 1.7924851179122925} -08/30/2021 20:42:36 - INFO - __main__ - Step 41831: {'lr': 0.0004158448203965192, 'samples': 8031552, 'steps': 41830, 'loss/train': 1.825628399848938} -08/30/2021 20:42:36 - INFO - __main__ - Step 41832: {'lr': 0.000415840849410871, 'samples': 8031744, 'steps': 41831, 'loss/train': 0.1913384348154068} -08/30/2021 20:42:37 - INFO - __main__ - Step 41833: {'lr': 0.0004158368783504975, 'samples': 8031936, 'steps': 41832, 'loss/train': 1.4772800207138062} -08/30/2021 20:42:38 - INFO - __main__ - Step 41834: {'lr': 0.00041583290721540055, 'samples': 8032128, 'steps': 41833, 'loss/train': 1.0174660682678223} -08/30/2021 20:42:38 - INFO - __main__ - Step 41835: {'lr': 0.0004158289360055819, 'samples': 8032320, 'steps': 41834, 'loss/train': 1.4912314414978027} -08/30/2021 20:42:38 - INFO - __main__ - Step 41836: {'lr': 0.00041582496472104314, 'samples': 8032512, 'steps': 41835, 'loss/train': 1.8404120206832886} -08/30/2021 20:42:39 - INFO - __main__ - Step 41837: {'lr': 0.0004158209933617863, 'samples': 8032704, 'steps': 41836, 'loss/train': 1.5737131834030151} -08/30/2021 20:42:40 - INFO - __main__ - Step 41838: {'lr': 0.00041581702192781305, 'samples': 8032896, 'steps': 41837, 'loss/train': 1.67239511013031} -08/30/2021 20:42:41 - INFO - __main__ - Step 41839: {'lr': 0.0004158130504191252, 'samples': 8033088, 'steps': 41838, 'loss/train': 1.185289740562439} -08/30/2021 20:42:41 - INFO - __main__ - Step 41840: {'lr': 0.0004158090788357246, 'samples': 8033280, 'steps': 41839, 'loss/train': 1.847983717918396} -08/30/2021 20:42:42 - INFO - __main__ - Step 41841: {'lr': 0.0004158051071776129, 'samples': 8033472, 'steps': 41840, 'loss/train': 1.5942496061325073} -08/30/2021 20:42:42 - INFO - __main__ - Step 41842: {'lr': 0.00041580113544479203, 'samples': 8033664, 'steps': 41841, 'loss/train': 1.6874637603759766} -08/30/2021 20:42:44 - INFO - __main__ - Step 41843: {'lr': 0.00041579716363726376, 'samples': 8033856, 'steps': 41842, 'loss/train': 1.8654677867889404} -08/30/2021 20:42:44 - INFO - __main__ - Step 41844: {'lr': 0.00041579319175502985, 'samples': 8034048, 'steps': 41843, 'loss/train': 1.5211448669433594} -08/30/2021 20:42:45 - INFO - __main__ - Step 41845: {'lr': 0.000415789219798092, 'samples': 8034240, 'steps': 41844, 'loss/train': 1.0404632091522217} -08/30/2021 20:42:45 - INFO - __main__ - Step 41846: {'lr': 0.00041578524776645216, 'samples': 8034432, 'steps': 41845, 'loss/train': 1.1511561870574951} -08/30/2021 20:42:46 - INFO - __main__ - Step 41847: {'lr': 0.00041578127566011203, 'samples': 8034624, 'steps': 41846, 'loss/train': 1.2978366613388062} -08/30/2021 20:42:47 - INFO - __main__ - Step 41848: {'lr': 0.0004157773034790734, 'samples': 8034816, 'steps': 41847, 'loss/train': 0.9080016016960144} -08/30/2021 20:42:48 - INFO - __main__ - Step 41849: {'lr': 0.00041577333122333807, 'samples': 8035008, 'steps': 41848, 'loss/train': 1.3785098791122437} -08/30/2021 20:42:48 - INFO - __main__ - Step 41850: {'lr': 0.00041576935889290777, 'samples': 8035200, 'steps': 41849, 'loss/train': 1.5190757513046265} -08/30/2021 20:42:48 - INFO - __main__ - Step 41851: {'lr': 0.0004157653864877845, 'samples': 8035392, 'steps': 41850, 'loss/train': 0.7366766929626465} -08/30/2021 20:42:49 - INFO - __main__ - Step 41852: {'lr': 0.00041576141400796984, 'samples': 8035584, 'steps': 41851, 'loss/train': 0.07756426185369492} -08/30/2021 20:42:49 - INFO - __main__ - Step 41853: {'lr': 0.00041575744145346563, 'samples': 8035776, 'steps': 41852, 'loss/train': 0.9598649144172668} -08/30/2021 20:42:51 - INFO - __main__ - Step 41854: {'lr': 0.00041575346882427366, 'samples': 8035968, 'steps': 41853, 'loss/train': 1.652033805847168} -08/30/2021 20:42:51 - INFO - __main__ - Step 41855: {'lr': 0.00041574949612039583, 'samples': 8036160, 'steps': 41854, 'loss/train': 1.572953224182129} -08/30/2021 20:42:51 - INFO - __main__ - Step 41856: {'lr': 0.0004157455233418337, 'samples': 8036352, 'steps': 41855, 'loss/train': 1.3858767747879028} -08/30/2021 20:42:52 - INFO - __main__ - Step 41857: {'lr': 0.0004157415504885893, 'samples': 8036544, 'steps': 41856, 'loss/train': 1.0582249164581299} -08/30/2021 20:42:52 - INFO - __main__ - Step 41858: {'lr': 0.00041573757756066423, 'samples': 8036736, 'steps': 41857, 'loss/train': 0.40921273827552795} -08/30/2021 20:42:54 - INFO - __main__ - Step 41859: {'lr': 0.0004157336045580604, 'samples': 8036928, 'steps': 41858, 'loss/train': 1.0436087846755981} -08/30/2021 20:42:54 - INFO - __main__ - Step 41860: {'lr': 0.0004157296314807796, 'samples': 8037120, 'steps': 41859, 'loss/train': 1.573651671409607} -08/30/2021 20:42:54 - INFO - __main__ - Step 41861: {'lr': 0.0004157256583288235, 'samples': 8037312, 'steps': 41860, 'loss/train': 1.570266842842102} -08/30/2021 20:42:55 - INFO - __main__ - Step 41862: {'lr': 0.0004157216851021941, 'samples': 8037504, 'steps': 41861, 'loss/train': 1.5497149229049683} -08/30/2021 20:42:55 - INFO - __main__ - Step 41863: {'lr': 0.00041571771180089304, 'samples': 8037696, 'steps': 41862, 'loss/train': 1.0708867311477661} -08/30/2021 20:42:57 - INFO - __main__ - Step 41864: {'lr': 0.0004157137384249221, 'samples': 8037888, 'steps': 41863, 'loss/train': 1.174491286277771} -08/30/2021 20:42:57 - INFO - __main__ - Step 41865: {'lr': 0.00041570976497428303, 'samples': 8038080, 'steps': 41864, 'loss/train': 1.3570365905761719} -08/30/2021 20:42:58 - INFO - __main__ - Step 41866: {'lr': 0.0004157057914489778, 'samples': 8038272, 'steps': 41865, 'loss/train': 1.6820279359817505} -08/30/2021 20:42:58 - INFO - __main__ - Step 41867: {'lr': 0.00041570181784900806, 'samples': 8038464, 'steps': 41866, 'loss/train': 1.382882833480835} -08/30/2021 20:42:58 - INFO - __main__ - Step 41868: {'lr': 0.0004156978441743756, 'samples': 8038656, 'steps': 41867, 'loss/train': 2.1571285724639893} -08/30/2021 20:42:59 - INFO - __main__ - Step 41869: {'lr': 0.00041569387042508235, 'samples': 8038848, 'steps': 41868, 'loss/train': 1.3227064609527588} -08/30/2021 20:43:00 - INFO - __main__ - Step 41870: {'lr': 0.0004156898966011299, 'samples': 8039040, 'steps': 41869, 'loss/train': 1.7419781684875488} -08/30/2021 20:43:01 - INFO - __main__ - Step 41871: {'lr': 0.0004156859227025202, 'samples': 8039232, 'steps': 41870, 'loss/train': 1.4750696420669556} -08/30/2021 20:43:01 - INFO - __main__ - Step 41872: {'lr': 0.0004156819487292549, 'samples': 8039424, 'steps': 41871, 'loss/train': 1.37647545337677} -08/30/2021 20:43:02 - INFO - __main__ - Step 41873: {'lr': 0.00041567797468133595, 'samples': 8039616, 'steps': 41872, 'loss/train': 1.659361481666565} -08/30/2021 20:43:02 - INFO - __main__ - Step 41874: {'lr': 0.00041567400055876505, 'samples': 8039808, 'steps': 41873, 'loss/train': 1.371205449104309} -08/30/2021 20:43:04 - INFO - __main__ - Step 41875: {'lr': 0.00041567002636154406, 'samples': 8040000, 'steps': 41874, 'loss/train': 0.840124249458313} -08/30/2021 20:43:04 - INFO - __main__ - Step 41876: {'lr': 0.0004156660520896746, 'samples': 8040192, 'steps': 41875, 'loss/train': 1.6229898929595947} -08/30/2021 20:43:05 - INFO - __main__ - Step 41877: {'lr': 0.00041566207774315866, 'samples': 8040384, 'steps': 41876, 'loss/train': 1.4709619283676147} -08/30/2021 20:43:05 - INFO - __main__ - Step 41878: {'lr': 0.0004156581033219979, 'samples': 8040576, 'steps': 41877, 'loss/train': 0.6833112835884094} -08/30/2021 20:43:06 - INFO - __main__ - Step 41879: {'lr': 0.0004156541288261941, 'samples': 8040768, 'steps': 41878, 'loss/train': 1.489064335823059} -08/30/2021 20:43:06 - INFO - __main__ - Step 41880: {'lr': 0.00041565015425574917, 'samples': 8040960, 'steps': 41879, 'loss/train': 0.029329517856240273} -08/30/2021 20:43:07 - INFO - __main__ - Step 41881: {'lr': 0.00041564617961066487, 'samples': 8041152, 'steps': 41880, 'loss/train': 1.3005467653274536} -08/30/2021 20:43:08 - INFO - __main__ - Step 41882: {'lr': 0.00041564220489094295, 'samples': 8041344, 'steps': 41881, 'loss/train': 1.610386610031128} -08/30/2021 20:43:08 - INFO - __main__ - Step 41883: {'lr': 0.00041563823009658514, 'samples': 8041536, 'steps': 41882, 'loss/train': 0.897910475730896} -08/30/2021 20:43:09 - INFO - __main__ - Step 41884: {'lr': 0.00041563425522759336, 'samples': 8041728, 'steps': 41883, 'loss/train': 1.4776582717895508} -08/30/2021 20:43:09 - INFO - __main__ - Step 41885: {'lr': 0.0004156302802839693, 'samples': 8041920, 'steps': 41884, 'loss/train': 1.9614852666854858} -08/30/2021 20:43:10 - INFO - __main__ - Step 41886: {'lr': 0.0004156263052657148, 'samples': 8042112, 'steps': 41885, 'loss/train': 1.7023252248764038} -08/30/2021 20:43:11 - INFO - __main__ - Step 41887: {'lr': 0.0004156223301728316, 'samples': 8042304, 'steps': 41886, 'loss/train': 1.903437852859497} -08/30/2021 20:43:11 - INFO - __main__ - Step 41888: {'lr': 0.0004156183550053216, 'samples': 8042496, 'steps': 41887, 'loss/train': 1.803829312324524} -08/30/2021 20:43:11 - INFO - __main__ - Step 41889: {'lr': 0.0004156143797631866, 'samples': 8042688, 'steps': 41888, 'loss/train': 1.4281631708145142} -08/30/2021 20:43:12 - INFO - __main__ - Step 41890: {'lr': 0.0004156104044464282, 'samples': 8042880, 'steps': 41889, 'loss/train': 0.9988219141960144} -08/30/2021 20:43:14 - INFO - __main__ - Step 41891: {'lr': 0.00041560642905504833, 'samples': 8043072, 'steps': 41890, 'loss/train': 0.5660489797592163} -08/30/2021 20:43:14 - INFO - __main__ - Step 41892: {'lr': 0.0004156024535890487, 'samples': 8043264, 'steps': 41891, 'loss/train': 1.4819796085357666} -08/30/2021 20:43:15 - INFO - __main__ - Step 41893: {'lr': 0.00041559847804843123, 'samples': 8043456, 'steps': 41892, 'loss/train': 1.305707335472107} -08/30/2021 20:43:15 - INFO - __main__ - Step 41894: {'lr': 0.0004155945024331976, 'samples': 8043648, 'steps': 41893, 'loss/train': 1.7447402477264404} -08/30/2021 20:43:15 - INFO - __main__ - Step 41895: {'lr': 0.00041559052674334975, 'samples': 8043840, 'steps': 41894, 'loss/train': 1.294675350189209} -08/30/2021 20:43:16 - INFO - __main__ - Step 41896: {'lr': 0.0004155865509788893, 'samples': 8044032, 'steps': 41895, 'loss/train': 1.0206354856491089} -08/30/2021 20:43:18 - INFO - __main__ - Step 41897: {'lr': 0.00041558257513981805, 'samples': 8044224, 'steps': 41896, 'loss/train': 0.14419202506542206} -08/30/2021 20:43:18 - INFO - __main__ - Step 41898: {'lr': 0.00041557859922613795, 'samples': 8044416, 'steps': 41897, 'loss/train': 1.6448591947555542} -08/30/2021 20:43:19 - INFO - __main__ - Step 41899: {'lr': 0.00041557462323785053, 'samples': 8044608, 'steps': 41898, 'loss/train': 1.1527259349822998} -08/30/2021 20:43:19 - INFO - __main__ - Step 41900: {'lr': 0.00041557064717495786, 'samples': 8044800, 'steps': 41899, 'loss/train': 1.0871294736862183} -08/30/2021 20:43:19 - INFO - __main__ - Step 41901: {'lr': 0.00041556667103746157, 'samples': 8044992, 'steps': 41900, 'loss/train': 0.06764210015535355} -08/30/2021 20:43:21 - INFO - __main__ - Step 41902: {'lr': 0.00041556269482536355, 'samples': 8045184, 'steps': 41901, 'loss/train': 2.183725118637085} -08/30/2021 20:43:22 - INFO - __main__ - Step 41903: {'lr': 0.00041555871853866553, 'samples': 8045376, 'steps': 41902, 'loss/train': 1.1897425651550293} -08/30/2021 20:43:22 - INFO - __main__ - Step 41904: {'lr': 0.00041555474217736926, 'samples': 8045568, 'steps': 41903, 'loss/train': 0.4623366892337799} -08/30/2021 20:43:22 - INFO - __main__ - Step 41905: {'lr': 0.0004155507657414766, 'samples': 8045760, 'steps': 41904, 'loss/train': 1.517594337463379} -08/30/2021 20:43:23 - INFO - __main__ - Step 41906: {'lr': 0.0004155467892309893, 'samples': 8045952, 'steps': 41905, 'loss/train': 1.351616621017456} -08/30/2021 20:43:24 - INFO - __main__ - Step 41907: {'lr': 0.0004155428126459092, 'samples': 8046144, 'steps': 41906, 'loss/train': 1.2100814580917358} -08/30/2021 20:43:24 - INFO - __main__ - Step 41908: {'lr': 0.00041553883598623804, 'samples': 8046336, 'steps': 41907, 'loss/train': 1.0407642126083374} -08/30/2021 20:43:25 - INFO - __main__ - Step 41909: {'lr': 0.00041553485925197763, 'samples': 8046528, 'steps': 41908, 'loss/train': 1.5186941623687744} -08/30/2021 20:43:25 - INFO - __main__ - Step 41910: {'lr': 0.00041553088244312975, 'samples': 8046720, 'steps': 41909, 'loss/train': 1.2687880992889404} -08/30/2021 20:43:25 - INFO - __main__ - Step 41911: {'lr': 0.0004155269055596963, 'samples': 8046912, 'steps': 41910, 'loss/train': 1.5419580936431885} -08/30/2021 20:43:27 - INFO - __main__ - Step 41912: {'lr': 0.0004155229286016789, 'samples': 8047104, 'steps': 41911, 'loss/train': 0.28386372327804565} -08/30/2021 20:43:27 - INFO - __main__ - Step 41913: {'lr': 0.0004155189515690794, 'samples': 8047296, 'steps': 41912, 'loss/train': 1.9679127931594849} -08/30/2021 20:43:28 - INFO - __main__ - Step 41914: {'lr': 0.0004155149744618997, 'samples': 8047488, 'steps': 41913, 'loss/train': 0.8942242860794067} -08/30/2021 20:43:28 - INFO - __main__ - Step 41915: {'lr': 0.0004155109972801414, 'samples': 8047680, 'steps': 41914, 'loss/train': 1.5286887884140015} -08/30/2021 20:43:28 - INFO - __main__ - Step 41916: {'lr': 0.0004155070200238065, 'samples': 8047872, 'steps': 41915, 'loss/train': 1.4754290580749512} -08/30/2021 20:43:29 - INFO - __main__ - Step 41917: {'lr': 0.00041550304269289664, 'samples': 8048064, 'steps': 41916, 'loss/train': 1.644362449645996} -08/30/2021 20:43:30 - INFO - __main__ - Step 41918: {'lr': 0.00041549906528741366, 'samples': 8048256, 'steps': 41917, 'loss/train': 5.717835903167725} -08/30/2021 20:43:31 - INFO - __main__ - Step 41919: {'lr': 0.0004154950878073594, 'samples': 8048448, 'steps': 41918, 'loss/train': 1.3945873975753784} -08/30/2021 20:43:31 - INFO - __main__ - Step 41920: {'lr': 0.0004154911102527356, 'samples': 8048640, 'steps': 41919, 'loss/train': 1.3416826725006104} -08/30/2021 20:43:31 - INFO - __main__ - Step 41921: {'lr': 0.00041548713262354396, 'samples': 8048832, 'steps': 41920, 'loss/train': 1.6950429677963257} -08/30/2021 20:43:32 - INFO - __main__ - Step 41922: {'lr': 0.0004154831549197865, 'samples': 8049024, 'steps': 41921, 'loss/train': 1.313057541847229} -08/30/2021 20:43:33 - INFO - __main__ - Step 41923: {'lr': 0.0004154791771414648, 'samples': 8049216, 'steps': 41922, 'loss/train': 1.4533997774124146} -08/30/2021 20:43:34 - INFO - __main__ - Step 41924: {'lr': 0.0004154751992885808, 'samples': 8049408, 'steps': 41923, 'loss/train': 1.559550404548645} -08/30/2021 20:43:34 - INFO - __main__ - Step 41925: {'lr': 0.0004154712213611362, 'samples': 8049600, 'steps': 41924, 'loss/train': 1.6962049007415771} -08/30/2021 20:43:35 - INFO - __main__ - Step 41926: {'lr': 0.0004154672433591328, 'samples': 8049792, 'steps': 41925, 'loss/train': 1.6122878789901733} -08/30/2021 20:43:35 - INFO - __main__ - Step 41927: {'lr': 0.0004154632652825724, 'samples': 8049984, 'steps': 41926, 'loss/train': 2.295560836791992} -08/30/2021 20:43:36 - INFO - __main__ - Step 41928: {'lr': 0.00041545928713145687, 'samples': 8050176, 'steps': 41927, 'loss/train': 1.4711755514144897} -08/30/2021 20:43:37 - INFO - __main__ - Step 41929: {'lr': 0.00041545530890578784, 'samples': 8050368, 'steps': 41928, 'loss/train': 1.9420548677444458} -08/30/2021 20:43:37 - INFO - __main__ - Step 41930: {'lr': 0.00041545133060556734, 'samples': 8050560, 'steps': 41929, 'loss/train': 0.9520986676216125} -08/30/2021 20:43:38 - INFO - __main__ - Step 41931: {'lr': 0.00041544735223079693, 'samples': 8050752, 'steps': 41930, 'loss/train': 1.1703599691390991} -08/30/2021 20:43:38 - INFO - __main__ - Step 41932: {'lr': 0.0004154433737814786, 'samples': 8050944, 'steps': 41931, 'loss/train': 1.2997748851776123} -08/30/2021 20:43:39 - INFO - __main__ - Step 41933: {'lr': 0.0004154393952576139, 'samples': 8051136, 'steps': 41932, 'loss/train': 1.6423181295394897} -08/30/2021 20:43:40 - INFO - __main__ - Step 41934: {'lr': 0.00041543541665920483, 'samples': 8051328, 'steps': 41933, 'loss/train': 1.6377413272857666} -08/30/2021 20:43:40 - INFO - __main__ - Step 41935: {'lr': 0.000415431437986253, 'samples': 8051520, 'steps': 41934, 'loss/train': 1.0988579988479614} -08/30/2021 20:43:41 - INFO - __main__ - Step 41936: {'lr': 0.00041542745923876047, 'samples': 8051712, 'steps': 41935, 'loss/train': 0.6673511266708374} -08/30/2021 20:43:41 - INFO - __main__ - Step 41937: {'lr': 0.00041542348041672886, 'samples': 8051904, 'steps': 41936, 'loss/train': 1.1943817138671875} -08/30/2021 20:43:42 - INFO - __main__ - Step 41938: {'lr': 0.00041541950152015997, 'samples': 8052096, 'steps': 41937, 'loss/train': 1.6588021516799927} -08/30/2021 20:43:43 - INFO - __main__ - Step 41939: {'lr': 0.0004154155225490555, 'samples': 8052288, 'steps': 41938, 'loss/train': 0.11105537414550781} -08/30/2021 20:43:43 - INFO - __main__ - Step 41940: {'lr': 0.0004154115435034175, 'samples': 8052480, 'steps': 41939, 'loss/train': 1.7889378070831299} -08/30/2021 20:43:44 - INFO - __main__ - Step 41941: {'lr': 0.00041540756438324746, 'samples': 8052672, 'steps': 41940, 'loss/train': 1.812666893005371} -08/30/2021 20:43:44 - INFO - __main__ - Step 41942: {'lr': 0.0004154035851885474, 'samples': 8052864, 'steps': 41941, 'loss/train': 1.3219572305679321} -08/30/2021 20:43:45 - INFO - __main__ - Step 41943: {'lr': 0.0004153996059193191, 'samples': 8053056, 'steps': 41942, 'loss/train': 1.5544521808624268} -08/30/2021 20:43:46 - INFO - __main__ - Step 41944: {'lr': 0.0004153956265755642, 'samples': 8053248, 'steps': 41943, 'loss/train': 1.6918978691101074} -08/30/2021 20:43:46 - INFO - __main__ - Step 41945: {'lr': 0.0004153916471572846, 'samples': 8053440, 'steps': 41944, 'loss/train': 1.6003272533416748} -08/30/2021 20:43:47 - INFO - __main__ - Step 41946: {'lr': 0.0004153876676644821, 'samples': 8053632, 'steps': 41945, 'loss/train': 1.4478598833084106} -08/30/2021 20:43:47 - INFO - __main__ - Step 41947: {'lr': 0.0004153836880971585, 'samples': 8053824, 'steps': 41946, 'loss/train': 1.5218452215194702} -08/30/2021 20:43:47 - INFO - __main__ - Step 41948: {'lr': 0.00041537970845531547, 'samples': 8054016, 'steps': 41947, 'loss/train': 1.337354302406311} -08/30/2021 20:43:49 - INFO - __main__ - Step 41949: {'lr': 0.00041537572873895503, 'samples': 8054208, 'steps': 41948, 'loss/train': 1.4841079711914062} -08/30/2021 20:43:50 - INFO - __main__ - Step 41950: {'lr': 0.00041537174894807873, 'samples': 8054400, 'steps': 41949, 'loss/train': 1.608992338180542} -08/30/2021 20:43:50 - INFO - __main__ - Step 41951: {'lr': 0.00041536776908268847, 'samples': 8054592, 'steps': 41950, 'loss/train': 1.4331024885177612} -08/30/2021 20:43:51 - INFO - __main__ - Step 41952: {'lr': 0.00041536378914278603, 'samples': 8054784, 'steps': 41951, 'loss/train': 0.1175106018781662} -08/30/2021 20:43:51 - INFO - __main__ - Step 41953: {'lr': 0.00041535980912837326, 'samples': 8054976, 'steps': 41952, 'loss/train': 1.721665859222412} -08/30/2021 20:43:53 - INFO - __main__ - Step 41954: {'lr': 0.00041535582903945195, 'samples': 8055168, 'steps': 41953, 'loss/train': 0.03491394221782684} -08/30/2021 20:43:53 - INFO - __main__ - Step 41955: {'lr': 0.00041535184887602384, 'samples': 8055360, 'steps': 41954, 'loss/train': 0.6006178855895996} -08/30/2021 20:43:53 - INFO - __main__ - Step 41956: {'lr': 0.0004153478686380907, 'samples': 8055552, 'steps': 41955, 'loss/train': 2.0354340076446533} -08/30/2021 20:43:54 - INFO - __main__ - Step 41957: {'lr': 0.0004153438883256544, 'samples': 8055744, 'steps': 41956, 'loss/train': 1.9349210262298584} -08/30/2021 20:43:54 - INFO - __main__ - Step 41958: {'lr': 0.0004153399079387167, 'samples': 8055936, 'steps': 41957, 'loss/train': 1.0108331441879272} -08/30/2021 20:43:55 - INFO - __main__ - Step 41959: {'lr': 0.00041533592747727935, 'samples': 8056128, 'steps': 41958, 'loss/train': 1.2150534391403198} -08/30/2021 20:43:56 - INFO - __main__ - Step 41960: {'lr': 0.00041533194694134414, 'samples': 8056320, 'steps': 41959, 'loss/train': 1.5075238943099976} -08/30/2021 20:43:56 - INFO - __main__ - Step 41961: {'lr': 0.00041532796633091297, 'samples': 8056512, 'steps': 41960, 'loss/train': 1.1125930547714233} -08/30/2021 20:43:57 - INFO - __main__ - Step 41962: {'lr': 0.00041532398564598757, 'samples': 8056704, 'steps': 41961, 'loss/train': 1.5493428707122803} -08/30/2021 20:43:57 - INFO - __main__ - Step 41963: {'lr': 0.0004153200048865697, 'samples': 8056896, 'steps': 41962, 'loss/train': 1.2770804166793823} -08/30/2021 20:43:58 - INFO - __main__ - Step 41964: {'lr': 0.0004153160240526612, 'samples': 8057088, 'steps': 41963, 'loss/train': 1.2553688287734985} -08/30/2021 20:43:59 - INFO - __main__ - Step 41965: {'lr': 0.0004153120431442639, 'samples': 8057280, 'steps': 41964, 'loss/train': 1.5876924991607666} -08/30/2021 20:43:59 - INFO - __main__ - Step 41966: {'lr': 0.00041530806216137953, 'samples': 8057472, 'steps': 41965, 'loss/train': 1.6402713060379028} -08/30/2021 20:44:00 - INFO - __main__ - Step 41967: {'lr': 0.00041530408110400987, 'samples': 8057664, 'steps': 41966, 'loss/train': 1.7930269241333008} -08/30/2021 20:44:00 - INFO - __main__ - Step 41968: {'lr': 0.00041530009997215665, 'samples': 8057856, 'steps': 41967, 'loss/train': 1.823445200920105} -08/30/2021 20:44:02 - INFO - __main__ - Step 41969: {'lr': 0.00041529611876582194, 'samples': 8058048, 'steps': 41968, 'loss/train': 1.8255748748779297} -08/30/2021 20:44:02 - INFO - __main__ - Step 41970: {'lr': 0.00041529213748500726, 'samples': 8058240, 'steps': 41969, 'loss/train': 0.5113900303840637} -08/30/2021 20:44:02 - INFO - __main__ - Step 41971: {'lr': 0.0004152881561297145, 'samples': 8058432, 'steps': 41970, 'loss/train': 1.0384371280670166} -08/30/2021 20:44:03 - INFO - __main__ - Step 41972: {'lr': 0.0004152841746999454, 'samples': 8058624, 'steps': 41971, 'loss/train': 0.9688120484352112} -08/30/2021 20:44:03 - INFO - __main__ - Step 41973: {'lr': 0.00041528019319570186, 'samples': 8058816, 'steps': 41972, 'loss/train': 0.4540366530418396} -08/30/2021 20:44:03 - INFO - __main__ - Step 41974: {'lr': 0.0004152762116169856, 'samples': 8059008, 'steps': 41973, 'loss/train': 0.8219721913337708} -08/30/2021 20:44:05 - INFO - __main__ - Step 41975: {'lr': 0.00041527222996379844, 'samples': 8059200, 'steps': 41974, 'loss/train': 1.9123342037200928} -08/30/2021 20:44:05 - INFO - __main__ - Step 41976: {'lr': 0.0004152682482361422, 'samples': 8059392, 'steps': 41975, 'loss/train': 1.3277689218521118} -08/30/2021 20:44:06 - INFO - __main__ - Step 41977: {'lr': 0.0004152642664340185, 'samples': 8059584, 'steps': 41976, 'loss/train': 1.7774512767791748} -08/30/2021 20:44:06 - INFO - __main__ - Step 41978: {'lr': 0.00041526028455742936, 'samples': 8059776, 'steps': 41977, 'loss/train': 1.6565258502960205} -08/30/2021 20:44:06 - INFO - __main__ - Step 41979: {'lr': 0.0004152563026063765, 'samples': 8059968, 'steps': 41978, 'loss/train': 1.4913169145584106} -08/30/2021 20:44:08 - INFO - __main__ - Step 41980: {'lr': 0.00041525232058086173, 'samples': 8060160, 'steps': 41979, 'loss/train': 1.4618779420852661} -08/30/2021 20:44:08 - INFO - __main__ - Step 41981: {'lr': 0.0004152483384808867, 'samples': 8060352, 'steps': 41980, 'loss/train': 1.6179994344711304} -08/30/2021 20:44:08 - INFO - __main__ - Step 41982: {'lr': 0.0004152443563064534, 'samples': 8060544, 'steps': 41981, 'loss/train': 1.0159025192260742} -08/30/2021 20:44:09 - INFO - __main__ - Step 41983: {'lr': 0.00041524037405756356, 'samples': 8060736, 'steps': 41982, 'loss/train': 1.7705333232879639} -08/30/2021 20:44:09 - INFO - __main__ - Step 41984: {'lr': 0.0004152363917342189, 'samples': 8060928, 'steps': 41983, 'loss/train': 1.202101469039917} -08/30/2021 20:44:11 - INFO - __main__ - Step 41985: {'lr': 0.00041523240933642134, 'samples': 8061120, 'steps': 41984, 'loss/train': 1.7345613241195679} -08/30/2021 20:44:11 - INFO - __main__ - Step 41986: {'lr': 0.00041522842686417255, 'samples': 8061312, 'steps': 41985, 'loss/train': 1.6383717060089111} -08/30/2021 20:44:11 - INFO - __main__ - Step 41987: {'lr': 0.0004152244443174744, 'samples': 8061504, 'steps': 41986, 'loss/train': 0.06885938346385956} -08/30/2021 20:44:12 - INFO - __main__ - Step 41988: {'lr': 0.00041522046169632863, 'samples': 8061696, 'steps': 41987, 'loss/train': 1.3218573331832886} -08/30/2021 20:44:12 - INFO - __main__ - Step 41989: {'lr': 0.0004152164790007371, 'samples': 8061888, 'steps': 41988, 'loss/train': 1.261513352394104} -08/30/2021 20:44:14 - INFO - __main__ - Step 41990: {'lr': 0.00041521249623070164, 'samples': 8062080, 'steps': 41989, 'loss/train': 1.639464020729065} -08/30/2021 20:44:14 - INFO - __main__ - Step 41991: {'lr': 0.0004152085133862239, 'samples': 8062272, 'steps': 41990, 'loss/train': 1.3137935400009155} -08/30/2021 20:44:14 - INFO - __main__ - Step 41992: {'lr': 0.0004152045304673058, 'samples': 8062464, 'steps': 41991, 'loss/train': 1.3072303533554077} -08/30/2021 20:44:15 - INFO - __main__ - Step 41993: {'lr': 0.000415200547473949, 'samples': 8062656, 'steps': 41992, 'loss/train': 1.5884655714035034} -08/30/2021 20:44:15 - INFO - __main__ - Step 41994: {'lr': 0.00041519656440615544, 'samples': 8062848, 'steps': 41993, 'loss/train': 1.2554905414581299} -08/30/2021 20:44:17 - INFO - __main__ - Step 41995: {'lr': 0.00041519258126392685, 'samples': 8063040, 'steps': 41994, 'loss/train': 1.6075098514556885} -08/30/2021 20:44:17 - INFO - __main__ - Step 41996: {'lr': 0.00041518859804726507, 'samples': 8063232, 'steps': 41995, 'loss/train': 1.328611135482788} -08/30/2021 20:44:17 - INFO - __main__ - Step 41997: {'lr': 0.00041518461475617183, 'samples': 8063424, 'steps': 41996, 'loss/train': 1.576134204864502} -08/30/2021 20:44:18 - INFO - __main__ - Step 41998: {'lr': 0.00041518063139064893, 'samples': 8063616, 'steps': 41997, 'loss/train': 1.6799370050430298} -08/30/2021 20:44:18 - INFO - __main__ - Step 41999: {'lr': 0.0004151766479506982, 'samples': 8063808, 'steps': 41998, 'loss/train': 2.7042174339294434} -08/30/2021 20:44:20 - INFO - __main__ - Step 42000: {'lr': 0.0004151726644363214, 'samples': 8064000, 'steps': 41999, 'loss/train': 1.5599470138549805} -08/30/2021 20:44:21 - INFO - __main__ - Step 42001: {'lr': 0.00041516868084752034, 'samples': 8064192, 'steps': 42000, 'loss/train': 1.5925219058990479} -08/30/2021 20:44:21 - INFO - __main__ - Step 42002: {'lr': 0.0004151646971842968, 'samples': 8064384, 'steps': 42001, 'loss/train': 1.3629719018936157} -08/30/2021 20:44:21 - INFO - __main__ - Step 42003: {'lr': 0.00041516071344665275, 'samples': 8064576, 'steps': 42002, 'loss/train': 1.7206238508224487} -08/30/2021 20:44:22 - INFO - __main__ - Step 42004: {'lr': 0.00041515672963458975, 'samples': 8064768, 'steps': 42003, 'loss/train': 1.1813071966171265} -08/30/2021 20:44:22 - INFO - __main__ - Step 42005: {'lr': 0.00041515274574810965, 'samples': 8064960, 'steps': 42004, 'loss/train': 1.6746045351028442} -08/30/2021 20:44:24 - INFO - __main__ - Step 42006: {'lr': 0.00041514876178721426, 'samples': 8065152, 'steps': 42005, 'loss/train': 2.2018063068389893} -08/30/2021 20:44:25 - INFO - __main__ - Step 42007: {'lr': 0.0004151447777519054, 'samples': 8065344, 'steps': 42006, 'loss/train': 1.6507172584533691} -08/30/2021 20:44:25 - INFO - __main__ - Step 42008: {'lr': 0.00041514079364218483, 'samples': 8065536, 'steps': 42007, 'loss/train': 1.3309930562973022} -08/30/2021 20:44:25 - INFO - __main__ - Step 42009: {'lr': 0.0004151368094580544, 'samples': 8065728, 'steps': 42008, 'loss/train': 1.4450976848602295} -08/30/2021 20:44:26 - INFO - __main__ - Step 42010: {'lr': 0.0004151328251995159, 'samples': 8065920, 'steps': 42009, 'loss/train': 1.633277177810669} -08/30/2021 20:44:26 - INFO - __main__ - Step 42011: {'lr': 0.000415128840866571, 'samples': 8066112, 'steps': 42010, 'loss/train': 1.006747841835022} -08/30/2021 20:44:27 - INFO - __main__ - Step 42012: {'lr': 0.00041512485645922164, 'samples': 8066304, 'steps': 42011, 'loss/train': 0.03204198554158211} -08/30/2021 20:44:28 - INFO - __main__ - Step 42013: {'lr': 0.0004151208719774696, 'samples': 8066496, 'steps': 42012, 'loss/train': 0.5145212411880493} -08/30/2021 20:44:28 - INFO - __main__ - Step 42014: {'lr': 0.0004151168874213166, 'samples': 8066688, 'steps': 42013, 'loss/train': 0.7954835891723633} -08/30/2021 20:44:29 - INFO - __main__ - Step 42015: {'lr': 0.00041511290279076454, 'samples': 8066880, 'steps': 42014, 'loss/train': 1.919533371925354} -08/30/2021 20:44:29 - INFO - __main__ - Step 42016: {'lr': 0.0004151089180858151, 'samples': 8067072, 'steps': 42015, 'loss/train': 1.7257556915283203} -08/30/2021 20:44:31 - INFO - __main__ - Step 42017: {'lr': 0.00041510493330647015, 'samples': 8067264, 'steps': 42016, 'loss/train': 0.636605441570282} -08/30/2021 20:44:31 - INFO - __main__ - Step 42018: {'lr': 0.00041510094845273145, 'samples': 8067456, 'steps': 42017, 'loss/train': 0.7040926814079285} -08/30/2021 20:44:32 - INFO - __main__ - Step 42019: {'lr': 0.0004150969635246008, 'samples': 8067648, 'steps': 42018, 'loss/train': 1.7151103019714355} -08/30/2021 20:44:32 - INFO - __main__ - Step 42020: {'lr': 0.00041509297852208003, 'samples': 8067840, 'steps': 42019, 'loss/train': 1.4303449392318726} -08/30/2021 20:44:32 - INFO - __main__ - Step 42021: {'lr': 0.00041508899344517094, 'samples': 8068032, 'steps': 42020, 'loss/train': 1.4094502925872803} -08/30/2021 20:44:34 - INFO - __main__ - Step 42022: {'lr': 0.0004150850082938752, 'samples': 8068224, 'steps': 42021, 'loss/train': 1.4454941749572754} -08/30/2021 20:44:34 - INFO - __main__ - Step 42023: {'lr': 0.00041508102306819485, 'samples': 8068416, 'steps': 42022, 'loss/train': 1.2959115505218506} -08/30/2021 20:44:35 - INFO - __main__ - Step 42024: {'lr': 0.0004150770377681314, 'samples': 8068608, 'steps': 42023, 'loss/train': 1.805885672569275} -08/30/2021 20:44:35 - INFO - __main__ - Step 42025: {'lr': 0.00041507305239368684, 'samples': 8068800, 'steps': 42024, 'loss/train': 1.2741270065307617} -08/30/2021 20:44:35 - INFO - __main__ - Step 42026: {'lr': 0.0004150690669448629, 'samples': 8068992, 'steps': 42025, 'loss/train': 0.33695948123931885} -08/30/2021 20:44:37 - INFO - __main__ - Step 42027: {'lr': 0.0004150650814216614, 'samples': 8069184, 'steps': 42026, 'loss/train': 1.5946998596191406} -08/30/2021 20:44:37 - INFO - __main__ - Step 42028: {'lr': 0.0004150610958240841, 'samples': 8069376, 'steps': 42027, 'loss/train': 2.5631399154663086} -08/30/2021 20:44:38 - INFO - __main__ - Step 42029: {'lr': 0.00041505711015213284, 'samples': 8069568, 'steps': 42028, 'loss/train': 1.6531378030776978} -08/30/2021 20:44:38 - INFO - __main__ - Step 42030: {'lr': 0.0004150531244058094, 'samples': 8069760, 'steps': 42029, 'loss/train': 1.429823637008667} -08/30/2021 20:44:38 - INFO - __main__ - Step 42031: {'lr': 0.00041504913858511557, 'samples': 8069952, 'steps': 42030, 'loss/train': 0.6526381373405457} -08/30/2021 20:44:40 - INFO - __main__ - Step 42032: {'lr': 0.0004150451526900531, 'samples': 8070144, 'steps': 42031, 'loss/train': 1.5835820436477661} -08/30/2021 20:44:40 - INFO - __main__ - Step 42033: {'lr': 0.00041504116672062385, 'samples': 8070336, 'steps': 42032, 'loss/train': 1.0987393856048584} -08/30/2021 20:44:41 - INFO - __main__ - Step 42034: {'lr': 0.0004150371806768296, 'samples': 8070528, 'steps': 42033, 'loss/train': 1.2248111963272095} -08/30/2021 20:44:41 - INFO - __main__ - Step 42035: {'lr': 0.00041503319455867216, 'samples': 8070720, 'steps': 42034, 'loss/train': 1.1465586423873901} -08/30/2021 20:44:41 - INFO - __main__ - Step 42036: {'lr': 0.0004150292083661533, 'samples': 8070912, 'steps': 42035, 'loss/train': 1.0095746517181396} -08/30/2021 20:44:42 - INFO - __main__ - Step 42037: {'lr': 0.00041502522209927486, 'samples': 8071104, 'steps': 42036, 'loss/train': 1.3447126150131226} -08/30/2021 20:44:43 - INFO - __main__ - Step 42038: {'lr': 0.00041502123575803854, 'samples': 8071296, 'steps': 42037, 'loss/train': 2.114588499069214} -08/30/2021 20:44:44 - INFO - __main__ - Step 42039: {'lr': 0.0004150172493424462, 'samples': 8071488, 'steps': 42038, 'loss/train': 1.4473960399627686} -08/30/2021 20:44:44 - INFO - __main__ - Step 42040: {'lr': 0.00041501326285249963, 'samples': 8071680, 'steps': 42039, 'loss/train': 1.7579057216644287} -08/30/2021 20:44:44 - INFO - __main__ - Step 42041: {'lr': 0.0004150092762882007, 'samples': 8071872, 'steps': 42040, 'loss/train': 1.3453913927078247} -08/30/2021 20:44:45 - INFO - __main__ - Step 42042: {'lr': 0.00041500528964955106, 'samples': 8072064, 'steps': 42041, 'loss/train': 1.215481162071228} -08/30/2021 20:44:46 - INFO - __main__ - Step 42043: {'lr': 0.0004150013029365527, 'samples': 8072256, 'steps': 42042, 'loss/train': 1.2389215230941772} -08/30/2021 20:44:47 - INFO - __main__ - Step 42044: {'lr': 0.0004149973161492072, 'samples': 8072448, 'steps': 42043, 'loss/train': 1.378302812576294} -08/30/2021 20:44:47 - INFO - __main__ - Step 42045: {'lr': 0.0004149933292875164, 'samples': 8072640, 'steps': 42044, 'loss/train': 1.7734328508377075} -08/30/2021 20:44:47 - INFO - __main__ - Step 42046: {'lr': 0.0004149893423514822, 'samples': 8072832, 'steps': 42045, 'loss/train': 1.802382230758667} -08/30/2021 20:44:48 - INFO - __main__ - Step 42047: {'lr': 0.0004149853553411064, 'samples': 8073024, 'steps': 42046, 'loss/train': 1.4193822145462036} -08/30/2021 20:44:49 - INFO - __main__ - Step 42048: {'lr': 0.00041498136825639074, 'samples': 8073216, 'steps': 42047, 'loss/train': 1.117325782775879} -08/30/2021 20:44:50 - INFO - __main__ - Step 42049: {'lr': 0.000414977381097337, 'samples': 8073408, 'steps': 42048, 'loss/train': 1.589279055595398} -08/30/2021 20:44:50 - INFO - __main__ - Step 42050: {'lr': 0.000414973393863947, 'samples': 8073600, 'steps': 42049, 'loss/train': 1.5615315437316895} -08/30/2021 20:44:50 - INFO - __main__ - Step 42051: {'lr': 0.0004149694065562225, 'samples': 8073792, 'steps': 42050, 'loss/train': 0.7782192826271057} -08/30/2021 20:44:51 - INFO - __main__ - Step 42052: {'lr': 0.0004149654191741654, 'samples': 8073984, 'steps': 42051, 'loss/train': 1.3162301778793335} -08/30/2021 20:44:52 - INFO - __main__ - Step 42053: {'lr': 0.0004149614317177774, 'samples': 8074176, 'steps': 42052, 'loss/train': 1.6516133546829224} -08/30/2021 20:44:53 - INFO - __main__ - Step 42054: {'lr': 0.00041495744418706027, 'samples': 8074368, 'steps': 42053, 'loss/train': 1.6669666767120361} -08/30/2021 20:44:53 - INFO - __main__ - Step 42055: {'lr': 0.00041495345658201587, 'samples': 8074560, 'steps': 42054, 'loss/train': 1.176653265953064} -08/30/2021 20:44:53 - INFO - __main__ - Step 42056: {'lr': 0.00041494946890264606, 'samples': 8074752, 'steps': 42055, 'loss/train': 0.6083608865737915} -08/30/2021 20:44:54 - INFO - __main__ - Step 42057: {'lr': 0.00041494548114895255, 'samples': 8074944, 'steps': 42056, 'loss/train': 1.3563673496246338} -08/30/2021 20:44:56 - INFO - __main__ - Step 42058: {'lr': 0.0004149414933209371, 'samples': 8075136, 'steps': 42057, 'loss/train': 1.8304144144058228} -08/30/2021 20:44:56 - INFO - __main__ - Step 42059: {'lr': 0.00041493750541860165, 'samples': 8075328, 'steps': 42058, 'loss/train': 1.4650368690490723} -08/30/2021 20:44:56 - INFO - __main__ - Step 42060: {'lr': 0.0004149335174419478, 'samples': 8075520, 'steps': 42059, 'loss/train': 1.3190314769744873} -08/30/2021 20:44:57 - INFO - __main__ - Step 42061: {'lr': 0.0004149295293909775, 'samples': 8075712, 'steps': 42060, 'loss/train': 1.6788418292999268} -08/30/2021 20:44:57 - INFO - __main__ - Step 42062: {'lr': 0.0004149255412656925, 'samples': 8075904, 'steps': 42061, 'loss/train': 1.3540338277816772} -08/30/2021 20:44:59 - INFO - __main__ - Step 42063: {'lr': 0.00041492155306609456, 'samples': 8076096, 'steps': 42062, 'loss/train': 0.8162250518798828} -08/30/2021 20:45:00 - INFO - __main__ - Step 42064: {'lr': 0.00041491756479218557, 'samples': 8076288, 'steps': 42063, 'loss/train': 1.209893822669983} -08/30/2021 20:45:00 - INFO - __main__ - Step 42065: {'lr': 0.0004149135764439672, 'samples': 8076480, 'steps': 42064, 'loss/train': 1.308935284614563} -08/30/2021 20:45:00 - INFO - __main__ - Step 42066: {'lr': 0.0004149095880214414, 'samples': 8076672, 'steps': 42065, 'loss/train': 1.46317458152771} -08/30/2021 20:45:01 - INFO - __main__ - Step 42067: {'lr': 0.00041490559952460983, 'samples': 8076864, 'steps': 42066, 'loss/train': 1.1638134717941284} -08/30/2021 20:45:01 - INFO - __main__ - Step 42068: {'lr': 0.00041490161095347435, 'samples': 8077056, 'steps': 42067, 'loss/train': 0.02409498579800129} -08/30/2021 20:45:02 - INFO - __main__ - Step 42069: {'lr': 0.00041489762230803676, 'samples': 8077248, 'steps': 42068, 'loss/train': 1.397840976715088} -08/30/2021 20:45:03 - INFO - __main__ - Step 42070: {'lr': 0.00041489363358829885, 'samples': 8077440, 'steps': 42069, 'loss/train': 1.2321537733078003} -08/30/2021 20:45:03 - INFO - __main__ - Step 42071: {'lr': 0.0004148896447942624, 'samples': 8077632, 'steps': 42070, 'loss/train': 1.6488279104232788} -08/30/2021 20:45:04 - INFO - __main__ - Step 42072: {'lr': 0.00041488565592592917, 'samples': 8077824, 'steps': 42071, 'loss/train': 1.214510202407837} -08/30/2021 20:45:04 - INFO - __main__ - Step 42073: {'lr': 0.0004148816669833011, 'samples': 8078016, 'steps': 42072, 'loss/train': 1.2845994234085083} -08/30/2021 20:45:05 - INFO - __main__ - Step 42074: {'lr': 0.0004148776779663799, 'samples': 8078208, 'steps': 42073, 'loss/train': 1.5515477657318115} -08/30/2021 20:45:06 - INFO - __main__ - Step 42075: {'lr': 0.00041487368887516726, 'samples': 8078400, 'steps': 42074, 'loss/train': 1.2906405925750732} -08/30/2021 20:45:06 - INFO - __main__ - Step 42076: {'lr': 0.00041486969970966516, 'samples': 8078592, 'steps': 42075, 'loss/train': 0.5965171456336975} -08/30/2021 20:45:07 - INFO - __main__ - Step 42077: {'lr': 0.0004148657104698753, 'samples': 8078784, 'steps': 42076, 'loss/train': 1.554368495941162} -08/30/2021 20:45:07 - INFO - __main__ - Step 42078: {'lr': 0.00041486172115579945, 'samples': 8078976, 'steps': 42077, 'loss/train': 1.259277105331421} -08/30/2021 20:45:09 - INFO - __main__ - Step 42079: {'lr': 0.00041485773176743953, 'samples': 8079168, 'steps': 42078, 'loss/train': 1.202600359916687} -08/30/2021 20:45:09 - INFO - __main__ - Step 42080: {'lr': 0.00041485374230479724, 'samples': 8079360, 'steps': 42079, 'loss/train': 1.328616738319397} -08/30/2021 20:45:09 - INFO - __main__ - Step 42081: {'lr': 0.00041484975276787436, 'samples': 8079552, 'steps': 42080, 'loss/train': 0.7397907972335815} -08/30/2021 20:45:10 - INFO - __main__ - Step 42082: {'lr': 0.00041484576315667273, 'samples': 8079744, 'steps': 42081, 'loss/train': 0.28067469596862793} -08/30/2021 20:45:10 - INFO - __main__ - Step 42083: {'lr': 0.0004148417734711941, 'samples': 8079936, 'steps': 42082, 'loss/train': 1.526578664779663} -08/30/2021 20:45:12 - INFO - __main__ - Step 42084: {'lr': 0.00041483778371144046, 'samples': 8080128, 'steps': 42083, 'loss/train': 1.2580015659332275} -08/30/2021 20:45:12 - INFO - __main__ - Step 42085: {'lr': 0.0004148337938774134, 'samples': 8080320, 'steps': 42084, 'loss/train': 1.0709748268127441} -08/30/2021 20:45:13 - INFO - __main__ - Step 42086: {'lr': 0.00041482980396911467, 'samples': 8080512, 'steps': 42085, 'loss/train': 1.2933945655822754} -08/30/2021 20:45:13 - INFO - __main__ - Step 42087: {'lr': 0.0004148258139865463, 'samples': 8080704, 'steps': 42086, 'loss/train': 0.09568388015031815} -08/30/2021 20:45:13 - INFO - __main__ - Step 42088: {'lr': 0.00041482182392970984, 'samples': 8080896, 'steps': 42087, 'loss/train': 1.2936928272247314} -08/30/2021 20:45:15 - INFO - __main__ - Step 42089: {'lr': 0.00041481783379860725, 'samples': 8081088, 'steps': 42088, 'loss/train': 1.108892798423767} -08/30/2021 20:45:15 - INFO - __main__ - Step 42090: {'lr': 0.0004148138435932404, 'samples': 8081280, 'steps': 42089, 'loss/train': 0.617364227771759} -08/30/2021 20:45:16 - INFO - __main__ - Step 42091: {'lr': 0.0004148098533136109, 'samples': 8081472, 'steps': 42090, 'loss/train': 0.0499710887670517} -08/30/2021 20:45:16 - INFO - __main__ - Step 42092: {'lr': 0.0004148058629597206, 'samples': 8081664, 'steps': 42091, 'loss/train': 1.4710822105407715} -08/30/2021 20:45:16 - INFO - __main__ - Step 42093: {'lr': 0.0004148018725315713, 'samples': 8081856, 'steps': 42092, 'loss/train': 1.3668607473373413} -08/30/2021 20:45:18 - INFO - __main__ - Step 42094: {'lr': 0.00041479788202916483, 'samples': 8082048, 'steps': 42093, 'loss/train': 1.7293243408203125} -08/30/2021 20:45:18 - INFO - __main__ - Step 42095: {'lr': 0.000414793891452503, 'samples': 8082240, 'steps': 42094, 'loss/train': 1.3674372434616089} -08/30/2021 20:45:19 - INFO - __main__ - Step 42096: {'lr': 0.0004147899008015876, 'samples': 8082432, 'steps': 42095, 'loss/train': 1.4402815103530884} -08/30/2021 20:45:19 - INFO - __main__ - Step 42097: {'lr': 0.0004147859100764204, 'samples': 8082624, 'steps': 42096, 'loss/train': 1.3156471252441406} -08/30/2021 20:45:19 - INFO - __main__ - Step 42098: {'lr': 0.0004147819192770033, 'samples': 8082816, 'steps': 42097, 'loss/train': 1.2385623455047607} -08/30/2021 20:45:20 - INFO - __main__ - Step 42099: {'lr': 0.00041477792840333784, 'samples': 8083008, 'steps': 42098, 'loss/train': 1.3595072031021118} -08/30/2021 20:45:21 - INFO - __main__ - Step 42100: {'lr': 0.00041477393745542607, 'samples': 8083200, 'steps': 42099, 'loss/train': 1.516279697418213} -08/30/2021 20:45:21 - INFO - __main__ - Step 42101: {'lr': 0.0004147699464332697, 'samples': 8083392, 'steps': 42100, 'loss/train': 0.9354690909385681} -08/30/2021 20:45:22 - INFO - __main__ - Step 42102: {'lr': 0.0004147659553368706, 'samples': 8083584, 'steps': 42101, 'loss/train': 1.1088016033172607} -08/30/2021 20:45:22 - INFO - __main__ - Step 42103: {'lr': 0.00041476196416623034, 'samples': 8083776, 'steps': 42102, 'loss/train': 1.4322679042816162} -08/30/2021 20:45:23 - INFO - __main__ - Step 42104: {'lr': 0.0004147579729213511, 'samples': 8083968, 'steps': 42103, 'loss/train': 1.6741018295288086} -08/30/2021 20:45:24 - INFO - __main__ - Step 42105: {'lr': 0.0004147539816022343, 'samples': 8084160, 'steps': 42104, 'loss/train': 1.603182315826416} -08/30/2021 20:45:24 - INFO - __main__ - Step 42106: {'lr': 0.0004147499902088819, 'samples': 8084352, 'steps': 42105, 'loss/train': 0.5111899971961975} -08/30/2021 20:45:25 - INFO - __main__ - Step 42107: {'lr': 0.0004147459987412958, 'samples': 8084544, 'steps': 42106, 'loss/train': 1.6472759246826172} -08/30/2021 20:45:25 - INFO - __main__ - Step 42108: {'lr': 0.0004147420071994776, 'samples': 8084736, 'steps': 42107, 'loss/train': 1.324957251548767} -08/30/2021 20:45:25 - INFO - __main__ - Step 42109: {'lr': 0.0004147380155834293, 'samples': 8084928, 'steps': 42108, 'loss/train': 1.5634123086929321} -08/30/2021 20:45:28 - INFO - __main__ - Step 42110: {'lr': 0.0004147340238931525, 'samples': 8085120, 'steps': 42109, 'loss/train': 1.2766777276992798} -08/30/2021 20:45:28 - INFO - __main__ - Step 42111: {'lr': 0.0004147300321286491, 'samples': 8085312, 'steps': 42110, 'loss/train': 1.0279078483581543} -08/30/2021 20:45:29 - INFO - __main__ - Step 42112: {'lr': 0.0004147260402899209, 'samples': 8085504, 'steps': 42111, 'loss/train': 1.8470271825790405} -08/30/2021 20:45:29 - INFO - __main__ - Step 42113: {'lr': 0.0004147220483769697, 'samples': 8085696, 'steps': 42112, 'loss/train': 1.6055042743682861} -08/30/2021 20:45:29 - INFO - __main__ - Step 42114: {'lr': 0.0004147180563897972, 'samples': 8085888, 'steps': 42113, 'loss/train': 0.9499245882034302} -08/30/2021 20:45:31 - INFO - __main__ - Step 42115: {'lr': 0.0004147140643284054, 'samples': 8086080, 'steps': 42114, 'loss/train': 1.522879719734192} -08/30/2021 20:45:31 - INFO - __main__ - Step 42116: {'lr': 0.00041471007219279595, 'samples': 8086272, 'steps': 42115, 'loss/train': 1.5455400943756104} -08/30/2021 20:45:32 - INFO - __main__ - Step 42117: {'lr': 0.0004147060799829707, 'samples': 8086464, 'steps': 42116, 'loss/train': 1.317301869392395} -08/30/2021 20:45:32 - INFO - __main__ - Step 42118: {'lr': 0.00041470208769893137, 'samples': 8086656, 'steps': 42117, 'loss/train': 0.8650458455085754} -08/30/2021 20:45:32 - INFO - __main__ - Step 42119: {'lr': 0.0004146980953406799, 'samples': 8086848, 'steps': 42118, 'loss/train': 1.4716070890426636} -08/30/2021 20:45:34 - INFO - __main__ - Step 42120: {'lr': 0.000414694102908218, 'samples': 8087040, 'steps': 42119, 'loss/train': 1.7921462059020996} -08/30/2021 20:45:34 - INFO - __main__ - Step 42121: {'lr': 0.0004146901104015474, 'samples': 8087232, 'steps': 42120, 'loss/train': 1.6152158975601196} -08/30/2021 20:45:34 - INFO - __main__ - Step 42122: {'lr': 0.00041468611782067, 'samples': 8087424, 'steps': 42121, 'loss/train': 1.0863064527511597} -08/30/2021 20:45:35 - INFO - __main__ - Step 42123: {'lr': 0.0004146821251655877, 'samples': 8087616, 'steps': 42122, 'loss/train': 1.3849724531173706} -08/30/2021 20:45:35 - INFO - __main__ - Step 42124: {'lr': 0.000414678132436302, 'samples': 8087808, 'steps': 42123, 'loss/train': 1.5474445819854736} -08/30/2021 20:45:37 - INFO - __main__ - Step 42125: {'lr': 0.000414674139632815, 'samples': 8088000, 'steps': 42124, 'loss/train': 1.581607699394226} -08/30/2021 20:45:37 - INFO - __main__ - Step 42126: {'lr': 0.0004146701467551283, 'samples': 8088192, 'steps': 42125, 'loss/train': 1.3367286920547485} -08/30/2021 20:45:38 - INFO - __main__ - Step 42127: {'lr': 0.0004146661538032438, 'samples': 8088384, 'steps': 42126, 'loss/train': 1.5993620157241821} -08/30/2021 20:45:38 - INFO - __main__ - Step 42128: {'lr': 0.0004146621607771633, 'samples': 8088576, 'steps': 42127, 'loss/train': 1.5183007717132568} -08/30/2021 20:45:38 - INFO - __main__ - Step 42129: {'lr': 0.00041465816767688853, 'samples': 8088768, 'steps': 42128, 'loss/train': 0.9067882299423218} -08/30/2021 20:45:39 - INFO - __main__ - Step 42130: {'lr': 0.0004146541745024214, 'samples': 8088960, 'steps': 42129, 'loss/train': 1.7860867977142334} -08/30/2021 20:45:40 - INFO - __main__ - Step 42131: {'lr': 0.00041465018125376354, 'samples': 8089152, 'steps': 42130, 'loss/train': 1.2774993181228638} -08/30/2021 20:45:40 - INFO - __main__ - Step 42132: {'lr': 0.0004146461879309169, 'samples': 8089344, 'steps': 42131, 'loss/train': 1.5761557817459106} -08/30/2021 20:45:41 - INFO - __main__ - Step 42133: {'lr': 0.0004146421945338832, 'samples': 8089536, 'steps': 42132, 'loss/train': 0.6396993398666382} -08/30/2021 20:45:41 - INFO - __main__ - Step 42134: {'lr': 0.0004146382010626643, 'samples': 8089728, 'steps': 42133, 'loss/train': 1.1455062627792358} -08/30/2021 20:45:42 - INFO - __main__ - Step 42135: {'lr': 0.000414634207517262, 'samples': 8089920, 'steps': 42134, 'loss/train': 1.4439822435379028} -08/30/2021 20:45:43 - INFO - __main__ - Step 42136: {'lr': 0.000414630213897678, 'samples': 8090112, 'steps': 42135, 'loss/train': 1.022885799407959} -08/30/2021 20:45:44 - INFO - __main__ - Step 42137: {'lr': 0.00041462622020391416, 'samples': 8090304, 'steps': 42136, 'loss/train': 1.18490469455719} -08/30/2021 20:45:44 - INFO - __main__ - Step 42138: {'lr': 0.00041462222643597236, 'samples': 8090496, 'steps': 42137, 'loss/train': 1.3145403861999512} -08/30/2021 20:45:44 - INFO - __main__ - Step 42139: {'lr': 0.00041461823259385423, 'samples': 8090688, 'steps': 42138, 'loss/train': 1.1623032093048096} -08/30/2021 20:45:45 - INFO - __main__ - Step 42140: {'lr': 0.00041461423867756176, 'samples': 8090880, 'steps': 42139, 'loss/train': 0.8623557090759277} -08/30/2021 20:45:46 - INFO - __main__ - Step 42141: {'lr': 0.00041461024468709664, 'samples': 8091072, 'steps': 42140, 'loss/train': 1.5169148445129395} -08/30/2021 20:45:47 - INFO - __main__ - Step 42142: {'lr': 0.0004146062506224606, 'samples': 8091264, 'steps': 42141, 'loss/train': 1.6592957973480225} -08/30/2021 20:45:47 - INFO - __main__ - Step 42143: {'lr': 0.0004146022564836556, 'samples': 8091456, 'steps': 42142, 'loss/train': 1.1839269399642944} -08/30/2021 20:45:47 - INFO - __main__ - Step 42144: {'lr': 0.0004145982622706833, 'samples': 8091648, 'steps': 42143, 'loss/train': 1.323874831199646} -08/30/2021 20:45:48 - INFO - __main__ - Step 42145: {'lr': 0.00041459426798354563, 'samples': 8091840, 'steps': 42144, 'loss/train': 1.4421354532241821} -08/30/2021 20:45:49 - INFO - __main__ - Step 42146: {'lr': 0.00041459027362224433, 'samples': 8092032, 'steps': 42145, 'loss/train': 1.411238670349121} -08/30/2021 20:45:50 - INFO - __main__ - Step 42147: {'lr': 0.00041458627918678116, 'samples': 8092224, 'steps': 42146, 'loss/train': 0.050818443298339844} -08/30/2021 20:45:50 - INFO - __main__ - Step 42148: {'lr': 0.00041458228467715786, 'samples': 8092416, 'steps': 42147, 'loss/train': 0.9675813913345337} -08/30/2021 20:45:50 - INFO - __main__ - Step 42149: {'lr': 0.00041457829009337643, 'samples': 8092608, 'steps': 42148, 'loss/train': 1.189178466796875} -08/30/2021 20:45:51 - INFO - __main__ - Step 42150: {'lr': 0.00041457429543543856, 'samples': 8092800, 'steps': 42149, 'loss/train': 1.7160683870315552} -08/30/2021 20:45:52 - INFO - __main__ - Step 42151: {'lr': 0.0004145703007033461, 'samples': 8092992, 'steps': 42150, 'loss/train': 1.4187594652175903} -08/30/2021 20:45:53 - INFO - __main__ - Step 42152: {'lr': 0.00041456630589710073, 'samples': 8093184, 'steps': 42151, 'loss/train': 1.5434417724609375} -08/30/2021 20:45:53 - INFO - __main__ - Step 42153: {'lr': 0.0004145623110167043, 'samples': 8093376, 'steps': 42152, 'loss/train': 0.7602411508560181} -08/30/2021 20:45:53 - INFO - __main__ - Step 42154: {'lr': 0.00041455831606215863, 'samples': 8093568, 'steps': 42153, 'loss/train': 1.4812666177749634} -08/30/2021 20:45:54 - INFO - __main__ - Step 42155: {'lr': 0.0004145543210334656, 'samples': 8093760, 'steps': 42154, 'loss/train': 1.4547737836837769} -08/30/2021 20:45:54 - INFO - __main__ - Step 42156: {'lr': 0.00041455032593062685, 'samples': 8093952, 'steps': 42155, 'loss/train': 2.3969500064849854} -08/30/2021 20:45:56 - INFO - __main__ - Step 42157: {'lr': 0.00041454633075364427, 'samples': 8094144, 'steps': 42156, 'loss/train': 0.7574585676193237} -08/30/2021 20:45:56 - INFO - __main__ - Step 42158: {'lr': 0.00041454233550251976, 'samples': 8094336, 'steps': 42157, 'loss/train': 1.8785595893859863} -08/30/2021 20:45:56 - INFO - __main__ - Step 42159: {'lr': 0.0004145383401772549, 'samples': 8094528, 'steps': 42158, 'loss/train': 1.3645179271697998} -08/30/2021 20:45:57 - INFO - __main__ - Step 42160: {'lr': 0.00041453434477785165, 'samples': 8094720, 'steps': 42159, 'loss/train': 1.180868148803711} -08/30/2021 20:45:57 - INFO - __main__ - Step 42161: {'lr': 0.0004145303493043118, 'samples': 8094912, 'steps': 42160, 'loss/train': 0.8418003916740417} -08/30/2021 20:45:59 - INFO - __main__ - Step 42162: {'lr': 0.000414526353756637, 'samples': 8095104, 'steps': 42161, 'loss/train': 2.004115581512451} -08/30/2021 20:45:59 - INFO - __main__ - Step 42163: {'lr': 0.0004145223581348292, 'samples': 8095296, 'steps': 42162, 'loss/train': 1.0504868030548096} -08/30/2021 20:45:59 - INFO - __main__ - Step 42164: {'lr': 0.00041451836243889027, 'samples': 8095488, 'steps': 42163, 'loss/train': 1.025084137916565} -08/30/2021 20:46:00 - INFO - __main__ - Step 42165: {'lr': 0.0004145143666688218, 'samples': 8095680, 'steps': 42164, 'loss/train': 0.9310389161109924} -08/30/2021 20:46:00 - INFO - __main__ - Step 42166: {'lr': 0.0004145103708246257, 'samples': 8095872, 'steps': 42165, 'loss/train': 1.0532963275909424} -08/30/2021 20:46:02 - INFO - __main__ - Step 42167: {'lr': 0.0004145063749063038, 'samples': 8096064, 'steps': 42166, 'loss/train': 1.9102671146392822} -08/30/2021 20:46:02 - INFO - __main__ - Step 42168: {'lr': 0.00041450237891385783, 'samples': 8096256, 'steps': 42167, 'loss/train': 1.6247804164886475} -08/30/2021 20:46:03 - INFO - __main__ - Step 42169: {'lr': 0.00041449838284728964, 'samples': 8096448, 'steps': 42168, 'loss/train': 1.7039918899536133} -08/30/2021 20:46:03 - INFO - __main__ - Step 42170: {'lr': 0.000414494386706601, 'samples': 8096640, 'steps': 42169, 'loss/train': 1.6172739267349243} -08/30/2021 20:46:03 - INFO - __main__ - Step 42171: {'lr': 0.00041449039049179385, 'samples': 8096832, 'steps': 42170, 'loss/train': 1.4287976026535034} -08/30/2021 20:46:05 - INFO - __main__ - Step 42172: {'lr': 0.0004144863942028697, 'samples': 8097024, 'steps': 42171, 'loss/train': 1.3822600841522217} -08/30/2021 20:46:06 - INFO - __main__ - Step 42173: {'lr': 0.0004144823978398306, 'samples': 8097216, 'steps': 42172, 'loss/train': 1.5369291305541992} -08/30/2021 20:46:06 - INFO - __main__ - Step 42174: {'lr': 0.0004144784014026782, 'samples': 8097408, 'steps': 42173, 'loss/train': 1.4141660928726196} -08/30/2021 20:46:06 - INFO - __main__ - Step 42175: {'lr': 0.0004144744048914145, 'samples': 8097600, 'steps': 42174, 'loss/train': 1.4566032886505127} -08/30/2021 20:46:07 - INFO - __main__ - Step 42176: {'lr': 0.0004144704083060411, 'samples': 8097792, 'steps': 42175, 'loss/train': 1.6292386054992676} -08/30/2021 20:46:08 - INFO - __main__ - Step 42177: {'lr': 0.00041446641164655983, 'samples': 8097984, 'steps': 42176, 'loss/train': 1.6132475137710571} -08/30/2021 20:46:08 - INFO - __main__ - Step 42178: {'lr': 0.0004144624149129727, 'samples': 8098176, 'steps': 42177, 'loss/train': 1.4272546768188477} -08/30/2021 20:46:09 - INFO - __main__ - Step 42179: {'lr': 0.00041445841810528117, 'samples': 8098368, 'steps': 42178, 'loss/train': 1.5255573987960815} -08/30/2021 20:46:09 - INFO - __main__ - Step 42180: {'lr': 0.00041445442122348727, 'samples': 8098560, 'steps': 42179, 'loss/train': 1.7269580364227295} -08/30/2021 20:46:10 - INFO - __main__ - Step 42181: {'lr': 0.0004144504242675927, 'samples': 8098752, 'steps': 42180, 'loss/train': 1.402187705039978} -08/30/2021 20:46:11 - INFO - __main__ - Step 42182: {'lr': 0.0004144464272375994, 'samples': 8098944, 'steps': 42181, 'loss/train': 1.038556694984436} -08/30/2021 20:46:12 - INFO - __main__ - Step 42183: {'lr': 0.000414442430133509, 'samples': 8099136, 'steps': 42182, 'loss/train': 1.7038600444793701} -08/30/2021 20:46:12 - INFO - __main__ - Step 42184: {'lr': 0.00041443843295532333, 'samples': 8099328, 'steps': 42183, 'loss/train': 1.1766091585159302} -08/30/2021 20:46:12 - INFO - __main__ - Step 42185: {'lr': 0.0004144344357030444, 'samples': 8099520, 'steps': 42184, 'loss/train': 0.7377972602844238} -08/30/2021 20:46:13 - INFO - __main__ - Step 42186: {'lr': 0.0004144304383766737, 'samples': 8099712, 'steps': 42185, 'loss/train': 1.0757642984390259} -08/30/2021 20:46:13 - INFO - __main__ - Step 42187: {'lr': 0.0004144264409762133, 'samples': 8099904, 'steps': 42186, 'loss/train': 1.3502475023269653} -08/30/2021 20:46:14 - INFO - __main__ - Step 42188: {'lr': 0.0004144224435016648, 'samples': 8100096, 'steps': 42187, 'loss/train': 2.035529613494873} -08/30/2021 20:46:15 - INFO - __main__ - Step 42189: {'lr': 0.00041441844595303015, 'samples': 8100288, 'steps': 42188, 'loss/train': 1.5047987699508667} -08/30/2021 20:46:15 - INFO - __main__ - Step 42190: {'lr': 0.0004144144483303111, 'samples': 8100480, 'steps': 42189, 'loss/train': 1.7014646530151367} -08/30/2021 20:46:16 - INFO - __main__ - Step 42191: {'lr': 0.00041441045063350933, 'samples': 8100672, 'steps': 42190, 'loss/train': 1.41290283203125} -08/30/2021 20:46:16 - INFO - __main__ - Step 42192: {'lr': 0.00041440645286262677, 'samples': 8100864, 'steps': 42191, 'loss/train': 1.4311779737472534} -08/30/2021 20:46:17 - INFO - __main__ - Step 42193: {'lr': 0.0004144024550176653, 'samples': 8101056, 'steps': 42192, 'loss/train': 0.7025465965270996} -08/30/2021 20:46:18 - INFO - __main__ - Step 42194: {'lr': 0.0004143984570986265, 'samples': 8101248, 'steps': 42193, 'loss/train': 1.4432069063186646} -08/30/2021 20:46:18 - INFO - __main__ - Step 42195: {'lr': 0.00041439445910551235, 'samples': 8101440, 'steps': 42194, 'loss/train': 1.0412001609802246} -08/30/2021 20:46:19 - INFO - __main__ - Step 42196: {'lr': 0.00041439046103832454, 'samples': 8101632, 'steps': 42195, 'loss/train': 1.7480463981628418} -08/30/2021 20:46:19 - INFO - __main__ - Step 42197: {'lr': 0.000414386462897065, 'samples': 8101824, 'steps': 42196, 'loss/train': 1.311126947402954} -08/30/2021 20:46:20 - INFO - __main__ - Step 42198: {'lr': 0.00041438246468173545, 'samples': 8102016, 'steps': 42197, 'loss/train': 1.207491159439087} -08/30/2021 20:46:21 - INFO - __main__ - Step 42199: {'lr': 0.0004143784663923377, 'samples': 8102208, 'steps': 42198, 'loss/train': 1.446942925453186} -08/30/2021 20:46:21 - INFO - __main__ - Step 42200: {'lr': 0.00041437446802887354, 'samples': 8102400, 'steps': 42199, 'loss/train': 1.9346952438354492} -08/30/2021 20:46:21 - INFO - __main__ - Step 42201: {'lr': 0.0004143704695913447, 'samples': 8102592, 'steps': 42200, 'loss/train': 0.8921756744384766} -08/30/2021 20:46:22 - INFO - __main__ - Step 42202: {'lr': 0.0004143664710797531, 'samples': 8102784, 'steps': 42201, 'loss/train': 1.4309717416763306} -08/30/2021 20:46:23 - INFO - __main__ - Step 42203: {'lr': 0.0004143624724941006, 'samples': 8102976, 'steps': 42202, 'loss/train': 1.6684378385543823} -08/30/2021 20:46:24 - INFO - __main__ - Step 42204: {'lr': 0.00041435847383438886, 'samples': 8103168, 'steps': 42203, 'loss/train': 0.9194706678390503} -08/30/2021 20:46:24 - INFO - __main__ - Step 42205: {'lr': 0.0004143544751006197, 'samples': 8103360, 'steps': 42204, 'loss/train': 1.3952915668487549} -08/30/2021 20:46:25 - INFO - __main__ - Step 42206: {'lr': 0.000414350476292795, 'samples': 8103552, 'steps': 42205, 'loss/train': 0.5288825631141663} -08/30/2021 20:46:25 - INFO - __main__ - Step 42207: {'lr': 0.0004143464774109164, 'samples': 8103744, 'steps': 42206, 'loss/train': 1.461159110069275} -08/30/2021 20:46:26 - INFO - __main__ - Step 42208: {'lr': 0.0004143424784549859, 'samples': 8103936, 'steps': 42207, 'loss/train': 1.186647891998291} -08/30/2021 20:46:27 - INFO - __main__ - Step 42209: {'lr': 0.00041433847942500516, 'samples': 8104128, 'steps': 42208, 'loss/train': 1.447962999343872} -08/30/2021 20:46:27 - INFO - __main__ - Step 42210: {'lr': 0.0004143344803209761, 'samples': 8104320, 'steps': 42209, 'loss/train': 1.9218649864196777} -08/30/2021 20:46:27 - INFO - __main__ - Step 42211: {'lr': 0.0004143304811429005, 'samples': 8104512, 'steps': 42210, 'loss/train': 1.1474194526672363} -08/30/2021 20:46:28 - INFO - __main__ - Step 42212: {'lr': 0.00041432648189078006, 'samples': 8104704, 'steps': 42211, 'loss/train': 1.5400233268737793} -08/30/2021 20:46:28 - INFO - __main__ - Step 42213: {'lr': 0.0004143224825646166, 'samples': 8104896, 'steps': 42212, 'loss/train': 1.8447178602218628} -08/30/2021 20:46:30 - INFO - __main__ - Step 42214: {'lr': 0.000414318483164412, 'samples': 8105088, 'steps': 42213, 'loss/train': 1.5515023469924927} -08/30/2021 20:46:30 - INFO - __main__ - Step 42215: {'lr': 0.000414314483690168, 'samples': 8105280, 'steps': 42214, 'loss/train': 1.1254675388336182} -08/30/2021 20:46:30 - INFO - __main__ - Step 42216: {'lr': 0.00041431048414188645, 'samples': 8105472, 'steps': 42215, 'loss/train': 1.2145752906799316} -08/30/2021 20:46:31 - INFO - __main__ - Step 42217: {'lr': 0.00041430648451956913, 'samples': 8105664, 'steps': 42216, 'loss/train': 0.9684998393058777} -08/30/2021 20:46:31 - INFO - __main__ - Step 42218: {'lr': 0.00041430248482321794, 'samples': 8105856, 'steps': 42217, 'loss/train': 1.4339289665222168} -08/30/2021 20:46:33 - INFO - __main__ - Step 42219: {'lr': 0.00041429848505283444, 'samples': 8106048, 'steps': 42218, 'loss/train': 1.1669222116470337} -08/30/2021 20:46:34 - INFO - __main__ - Step 42220: {'lr': 0.00041429448520842064, 'samples': 8106240, 'steps': 42219, 'loss/train': 1.4249677658081055} -08/30/2021 20:46:34 - INFO - __main__ - Step 42221: {'lr': 0.0004142904852899783, 'samples': 8106432, 'steps': 42220, 'loss/train': 1.1597368717193604} -08/30/2021 20:46:34 - INFO - __main__ - Step 42222: {'lr': 0.0004142864852975092, 'samples': 8106624, 'steps': 42221, 'loss/train': 2.188777446746826} -08/30/2021 20:46:35 - INFO - __main__ - Step 42223: {'lr': 0.00041428248523101507, 'samples': 8106816, 'steps': 42222, 'loss/train': 0.25819453597068787} -08/30/2021 20:46:36 - INFO - __main__ - Step 42224: {'lr': 0.0004142784850904978, 'samples': 8107008, 'steps': 42223, 'loss/train': 1.8180350065231323} -08/30/2021 20:46:37 - INFO - __main__ - Step 42225: {'lr': 0.00041427448487595933, 'samples': 8107200, 'steps': 42224, 'loss/train': 1.1398649215698242} -08/30/2021 20:46:37 - INFO - __main__ - Step 42226: {'lr': 0.0004142704845874012, 'samples': 8107392, 'steps': 42225, 'loss/train': 1.6380653381347656} -08/30/2021 20:46:37 - INFO - __main__ - Step 42227: {'lr': 0.00041426648422482527, 'samples': 8107584, 'steps': 42226, 'loss/train': 1.6042135953903198} -08/30/2021 20:46:38 - INFO - __main__ - Step 42228: {'lr': 0.0004142624837882335, 'samples': 8107776, 'steps': 42227, 'loss/train': 1.3946853876113892} -08/30/2021 20:46:39 - INFO - __main__ - Step 42229: {'lr': 0.0004142584832776275, 'samples': 8107968, 'steps': 42228, 'loss/train': 1.629384160041809} -08/30/2021 20:46:40 - INFO - __main__ - Step 42230: {'lr': 0.00041425448269300923, 'samples': 8108160, 'steps': 42229, 'loss/train': 0.3680429458618164} -08/30/2021 20:46:40 - INFO - __main__ - Step 42231: {'lr': 0.00041425048203438036, 'samples': 8108352, 'steps': 42230, 'loss/train': 1.462911605834961} -08/30/2021 20:46:41 - INFO - __main__ - Step 42232: {'lr': 0.0004142464813017429, 'samples': 8108544, 'steps': 42231, 'loss/train': 0.07783259451389313} -08/30/2021 20:46:41 - INFO - __main__ - Step 42233: {'lr': 0.0004142424804950984, 'samples': 8108736, 'steps': 42232, 'loss/train': 0.4490537941455841} -08/30/2021 20:46:42 - INFO - __main__ - Step 42234: {'lr': 0.00041423847961444873, 'samples': 8108928, 'steps': 42233, 'loss/train': 1.3863348960876465} -08/30/2021 20:46:43 - INFO - __main__ - Step 42235: {'lr': 0.0004142344786597958, 'samples': 8109120, 'steps': 42234, 'loss/train': 1.1885013580322266} -08/30/2021 20:46:43 - INFO - __main__ - Step 42236: {'lr': 0.0004142304776311413, 'samples': 8109312, 'steps': 42235, 'loss/train': 1.1874572038650513} -08/30/2021 20:46:44 - INFO - __main__ - Step 42237: {'lr': 0.0004142264765284871, 'samples': 8109504, 'steps': 42236, 'loss/train': 1.1852940320968628} -08/30/2021 20:46:44 - INFO - __main__ - Step 42238: {'lr': 0.0004142224753518351, 'samples': 8109696, 'steps': 42237, 'loss/train': 0.8874362707138062} -08/30/2021 20:46:45 - INFO - __main__ - Step 42239: {'lr': 0.00041421847410118685, 'samples': 8109888, 'steps': 42238, 'loss/train': 1.4015588760375977} -08/30/2021 20:46:46 - INFO - __main__ - Step 42240: {'lr': 0.00041421447277654436, 'samples': 8110080, 'steps': 42239, 'loss/train': 1.5901575088500977} -08/30/2021 20:46:46 - INFO - __main__ - Step 42241: {'lr': 0.0004142104713779093, 'samples': 8110272, 'steps': 42240, 'loss/train': 1.4169880151748657} -08/30/2021 20:46:47 - INFO - __main__ - Step 42242: {'lr': 0.00041420646990528355, 'samples': 8110464, 'steps': 42241, 'loss/train': 1.8420770168304443} -08/30/2021 20:46:47 - INFO - __main__ - Step 42243: {'lr': 0.0004142024683586689, 'samples': 8110656, 'steps': 42242, 'loss/train': 1.6727858781814575} -08/30/2021 20:46:49 - INFO - __main__ - Step 42244: {'lr': 0.00041419846673806715, 'samples': 8110848, 'steps': 42243, 'loss/train': 1.2827200889587402} -08/30/2021 20:46:49 - INFO - __main__ - Step 42245: {'lr': 0.0004141944650434801, 'samples': 8111040, 'steps': 42244, 'loss/train': 1.2395683526992798} -08/30/2021 20:46:49 - INFO - __main__ - Step 42246: {'lr': 0.00041419046327490964, 'samples': 8111232, 'steps': 42245, 'loss/train': 1.6822307109832764} -08/30/2021 20:46:50 - INFO - __main__ - Step 42247: {'lr': 0.00041418646143235737, 'samples': 8111424, 'steps': 42246, 'loss/train': 1.0382400751113892} -08/30/2021 20:46:50 - INFO - __main__ - Step 42248: {'lr': 0.0004141824595158253, 'samples': 8111616, 'steps': 42247, 'loss/train': 1.8770506381988525} -08/30/2021 20:46:50 - INFO - __main__ - Step 42249: {'lr': 0.0004141784575253151, 'samples': 8111808, 'steps': 42248, 'loss/train': 1.2458492517471313} -08/30/2021 20:46:52 - INFO - __main__ - Step 42250: {'lr': 0.0004141744554608287, 'samples': 8112000, 'steps': 42249, 'loss/train': 1.2245113849639893} -08/30/2021 20:46:52 - INFO - __main__ - Step 42251: {'lr': 0.00041417045332236776, 'samples': 8112192, 'steps': 42250, 'loss/train': 1.21090567111969} -08/30/2021 20:46:53 - INFO - __main__ - Step 42252: {'lr': 0.0004141664511099341, 'samples': 8112384, 'steps': 42251, 'loss/train': 1.0141521692276} -08/30/2021 20:46:53 - INFO - __main__ - Step 42253: {'lr': 0.00041416244882352965, 'samples': 8112576, 'steps': 42252, 'loss/train': 1.0303927659988403} -08/30/2021 20:46:53 - INFO - __main__ - Step 42254: {'lr': 0.00041415844646315613, 'samples': 8112768, 'steps': 42253, 'loss/train': 1.3580528497695923} -08/30/2021 20:46:55 - INFO - __main__ - Step 42255: {'lr': 0.0004141544440288153, 'samples': 8112960, 'steps': 42254, 'loss/train': 1.4445478916168213} -08/30/2021 20:46:55 - INFO - __main__ - Step 42256: {'lr': 0.0004141504415205091, 'samples': 8113152, 'steps': 42255, 'loss/train': 0.8169226050376892} -08/30/2021 20:46:56 - INFO - __main__ - Step 42257: {'lr': 0.0004141464389382391, 'samples': 8113344, 'steps': 42256, 'loss/train': 1.4042410850524902} -08/30/2021 20:46:56 - INFO - __main__ - Step 42258: {'lr': 0.0004141424362820073, 'samples': 8113536, 'steps': 42257, 'loss/train': 1.4125057458877563} -08/30/2021 20:46:56 - INFO - __main__ - Step 42259: {'lr': 0.0004141384335518155, 'samples': 8113728, 'steps': 42258, 'loss/train': 1.494933843612671} -08/30/2021 20:46:58 - INFO - __main__ - Step 42260: {'lr': 0.00041413443074766543, 'samples': 8113920, 'steps': 42259, 'loss/train': 1.651997685432434} -08/30/2021 20:46:59 - INFO - __main__ - Step 42261: {'lr': 0.000414130427869559, 'samples': 8114112, 'steps': 42260, 'loss/train': 1.7769715785980225} -08/30/2021 20:46:59 - INFO - __main__ - Step 42262: {'lr': 0.0004141264249174978, 'samples': 8114304, 'steps': 42261, 'loss/train': 1.8201574087142944} -08/30/2021 20:46:59 - INFO - __main__ - Step 42263: {'lr': 0.00041412242189148383, 'samples': 8114496, 'steps': 42262, 'loss/train': 0.06089145690202713} -08/30/2021 20:47:00 - INFO - __main__ - Step 42264: {'lr': 0.00041411841879151877, 'samples': 8114688, 'steps': 42263, 'loss/train': 1.713726282119751} -08/30/2021 20:47:01 - INFO - __main__ - Step 42265: {'lr': 0.00041411441561760455, 'samples': 8114880, 'steps': 42264, 'loss/train': 0.847568929195404} -08/30/2021 20:47:02 - INFO - __main__ - Step 42266: {'lr': 0.0004141104123697429, 'samples': 8115072, 'steps': 42265, 'loss/train': 1.4999792575836182} -08/30/2021 20:47:02 - INFO - __main__ - Step 42267: {'lr': 0.00041410640904793563, 'samples': 8115264, 'steps': 42266, 'loss/train': 1.7000240087509155} -08/30/2021 20:47:02 - INFO - __main__ - Step 42268: {'lr': 0.0004141024056521845, 'samples': 8115456, 'steps': 42267, 'loss/train': 1.2713193893432617} -08/30/2021 20:47:03 - INFO - __main__ - Step 42269: {'lr': 0.0004140984021824914, 'samples': 8115648, 'steps': 42268, 'loss/train': 1.7952033281326294} -08/30/2021 20:47:04 - INFO - __main__ - Step 42270: {'lr': 0.0004140943986388581, 'samples': 8115840, 'steps': 42269, 'loss/train': 0.06707034260034561} -08/30/2021 20:47:05 - INFO - __main__ - Step 42271: {'lr': 0.00041409039502128634, 'samples': 8116032, 'steps': 42270, 'loss/train': 1.0375711917877197} -08/30/2021 20:47:05 - INFO - __main__ - Step 42272: {'lr': 0.000414086391329778, 'samples': 8116224, 'steps': 42271, 'loss/train': 1.1584436893463135} -08/30/2021 20:47:05 - INFO - __main__ - Step 42273: {'lr': 0.0004140823875643349, 'samples': 8116416, 'steps': 42272, 'loss/train': 0.8180829882621765} -08/30/2021 20:47:06 - INFO - __main__ - Step 42274: {'lr': 0.00041407838372495883, 'samples': 8116608, 'steps': 42273, 'loss/train': 1.377746343612671} -08/30/2021 20:47:06 - INFO - __main__ - Step 42275: {'lr': 0.00041407437981165154, 'samples': 8116800, 'steps': 42274, 'loss/train': 1.178992509841919} -08/30/2021 20:47:08 - INFO - __main__ - Step 42276: {'lr': 0.0004140703758244148, 'samples': 8116992, 'steps': 42275, 'loss/train': 1.6284089088439941} -08/30/2021 20:47:09 - INFO - __main__ - Step 42277: {'lr': 0.00041406637176325054, 'samples': 8117184, 'steps': 42276, 'loss/train': 1.1715081930160522} -08/30/2021 20:47:09 - INFO - __main__ - Step 42278: {'lr': 0.00041406236762816053, 'samples': 8117376, 'steps': 42277, 'loss/train': 1.3192260265350342} -08/30/2021 20:47:10 - INFO - __main__ - Step 42279: {'lr': 0.0004140583634191465, 'samples': 8117568, 'steps': 42278, 'loss/train': 1.326980471611023} -08/30/2021 20:47:10 - INFO - __main__ - Step 42280: {'lr': 0.00041405435913621037, 'samples': 8117760, 'steps': 42279, 'loss/train': 1.7745006084442139} -08/30/2021 20:47:11 - INFO - __main__ - Step 42281: {'lr': 0.0004140503547793538, 'samples': 8117952, 'steps': 42280, 'loss/train': 0.8168326616287231} -08/30/2021 20:47:12 - INFO - __main__ - Step 42282: {'lr': 0.00041404635034857876, 'samples': 8118144, 'steps': 42281, 'loss/train': 1.3293964862823486} -08/30/2021 20:47:12 - INFO - __main__ - Step 42283: {'lr': 0.00041404234584388683, 'samples': 8118336, 'steps': 42282, 'loss/train': 1.3677918910980225} -08/30/2021 20:47:13 - INFO - __main__ - Step 42284: {'lr': 0.00041403834126528007, 'samples': 8118528, 'steps': 42283, 'loss/train': 1.8644312620162964} -08/30/2021 20:47:13 - INFO - __main__ - Step 42285: {'lr': 0.00041403433661276015, 'samples': 8118720, 'steps': 42284, 'loss/train': 0.9539211988449097} -08/30/2021 20:47:14 - INFO - __main__ - Step 42286: {'lr': 0.0004140303318863288, 'samples': 8118912, 'steps': 42285, 'loss/train': 1.2375967502593994} -08/30/2021 20:47:15 - INFO - __main__ - Step 42287: {'lr': 0.00041402632708598797, 'samples': 8119104, 'steps': 42286, 'loss/train': 1.9723584651947021} -08/30/2021 20:47:15 - INFO - __main__ - Step 42288: {'lr': 0.0004140223222117394, 'samples': 8119296, 'steps': 42287, 'loss/train': 1.137107253074646} -08/30/2021 20:47:16 - INFO - __main__ - Step 42289: {'lr': 0.00041401831726358497, 'samples': 8119488, 'steps': 42288, 'loss/train': 0.07174333184957504} -08/30/2021 20:47:16 - INFO - __main__ - Step 42290: {'lr': 0.0004140143122415263, 'samples': 8119680, 'steps': 42289, 'loss/train': 1.2087912559509277} -08/30/2021 20:47:18 - INFO - __main__ - Step 42291: {'lr': 0.0004140103071455654, 'samples': 8119872, 'steps': 42290, 'loss/train': 1.216581106185913} -08/30/2021 20:47:18 - INFO - __main__ - Step 42292: {'lr': 0.000414006301975704, 'samples': 8120064, 'steps': 42291, 'loss/train': 1.4962636232376099} -08/30/2021 20:47:18 - INFO - __main__ - Step 42293: {'lr': 0.0004140022967319439, 'samples': 8120256, 'steps': 42292, 'loss/train': 1.4432076215744019} -08/30/2021 20:47:19 - INFO - __main__ - Step 42294: {'lr': 0.0004139982914142868, 'samples': 8120448, 'steps': 42293, 'loss/train': 1.4617767333984375} -08/30/2021 20:47:19 - INFO - __main__ - Step 42295: {'lr': 0.0004139942860227346, 'samples': 8120640, 'steps': 42294, 'loss/train': 0.6603941321372986} -08/30/2021 20:47:21 - INFO - __main__ - Step 42296: {'lr': 0.00041399028055728914, 'samples': 8120832, 'steps': 42295, 'loss/train': 1.6991488933563232} -08/30/2021 20:47:21 - INFO - __main__ - Step 42297: {'lr': 0.0004139862750179523, 'samples': 8121024, 'steps': 42296, 'loss/train': 1.3488762378692627} -08/30/2021 20:47:21 - INFO - __main__ - Step 42298: {'lr': 0.0004139822694047256, 'samples': 8121216, 'steps': 42297, 'loss/train': 1.7634027004241943} -08/30/2021 20:47:22 - INFO - __main__ - Step 42299: {'lr': 0.0004139782637176112, 'samples': 8121408, 'steps': 42298, 'loss/train': 1.4938671588897705} -08/30/2021 20:47:22 - INFO - __main__ - Step 42300: {'lr': 0.0004139742579566106, 'samples': 8121600, 'steps': 42299, 'loss/train': 1.2177492380142212} -08/30/2021 20:47:22 - INFO - __main__ - Step 42301: {'lr': 0.00041397025212172573, 'samples': 8121792, 'steps': 42300, 'loss/train': 1.2403696775436401} -08/30/2021 20:47:24 - INFO - __main__ - Step 42302: {'lr': 0.00041396624621295843, 'samples': 8121984, 'steps': 42301, 'loss/train': 0.5987139940261841} -08/30/2021 20:47:24 - INFO - __main__ - Step 42303: {'lr': 0.00041396224023031045, 'samples': 8122176, 'steps': 42302, 'loss/train': 1.612777829170227} -08/30/2021 20:47:25 - INFO - __main__ - Step 42304: {'lr': 0.0004139582341737836, 'samples': 8122368, 'steps': 42303, 'loss/train': 0.9146180152893066} -08/30/2021 20:47:25 - INFO - __main__ - Step 42305: {'lr': 0.0004139542280433797, 'samples': 8122560, 'steps': 42304, 'loss/train': 0.8867013454437256} -08/30/2021 20:47:25 - INFO - __main__ - Step 42306: {'lr': 0.00041395022183910064, 'samples': 8122752, 'steps': 42305, 'loss/train': 1.7288566827774048} -08/30/2021 20:47:27 - INFO - __main__ - Step 42307: {'lr': 0.00041394621556094805, 'samples': 8122944, 'steps': 42306, 'loss/train': 1.3016126155853271} -08/30/2021 20:47:27 - INFO - __main__ - Step 42308: {'lr': 0.0004139422092089239, 'samples': 8123136, 'steps': 42307, 'loss/train': 1.4550639390945435} -08/30/2021 20:47:28 - INFO - __main__ - Step 42309: {'lr': 0.0004139382027830298, 'samples': 8123328, 'steps': 42308, 'loss/train': 1.4436196088790894} -08/30/2021 20:47:28 - INFO - __main__ - Step 42310: {'lr': 0.00041393419628326777, 'samples': 8123520, 'steps': 42309, 'loss/train': 1.1155717372894287} -08/30/2021 20:47:28 - INFO - __main__ - Step 42311: {'lr': 0.00041393018970963945, 'samples': 8123712, 'steps': 42310, 'loss/train': 0.27183741331100464} -08/30/2021 20:47:30 - INFO - __main__ - Step 42312: {'lr': 0.00041392618306214683, 'samples': 8123904, 'steps': 42311, 'loss/train': 0.4071536958217621} -08/30/2021 20:47:30 - INFO - __main__ - Step 42313: {'lr': 0.0004139221763407915, 'samples': 8124096, 'steps': 42312, 'loss/train': 1.318495512008667} -08/30/2021 20:47:31 - INFO - __main__ - Step 42314: {'lr': 0.00041391816954557543, 'samples': 8124288, 'steps': 42313, 'loss/train': 1.7925927639007568} -08/30/2021 20:47:31 - INFO - __main__ - Step 42315: {'lr': 0.00041391416267650034, 'samples': 8124480, 'steps': 42314, 'loss/train': 1.2577730417251587} -08/30/2021 20:47:31 - INFO - __main__ - Step 42316: {'lr': 0.00041391015573356805, 'samples': 8124672, 'steps': 42315, 'loss/train': 1.387742280960083} -08/30/2021 20:47:33 - INFO - __main__ - Step 42317: {'lr': 0.0004139061487167804, 'samples': 8124864, 'steps': 42316, 'loss/train': 1.376395583152771} -08/30/2021 20:47:33 - INFO - __main__ - Step 42318: {'lr': 0.00041390214162613916, 'samples': 8125056, 'steps': 42317, 'loss/train': 0.8154731392860413} -08/30/2021 20:47:34 - INFO - __main__ - Step 42319: {'lr': 0.00041389813446164614, 'samples': 8125248, 'steps': 42318, 'loss/train': 0.37088194489479065} -08/30/2021 20:47:34 - INFO - __main__ - Step 42320: {'lr': 0.0004138941272233031, 'samples': 8125440, 'steps': 42319, 'loss/train': 1.0520355701446533} -08/30/2021 20:47:34 - INFO - __main__ - Step 42321: {'lr': 0.0004138901199111119, 'samples': 8125632, 'steps': 42320, 'loss/train': 1.4669736623764038} -08/30/2021 20:47:36 - INFO - __main__ - Step 42322: {'lr': 0.00041388611252507446, 'samples': 8125824, 'steps': 42321, 'loss/train': 1.990148663520813} -08/30/2021 20:47:37 - INFO - __main__ - Step 42323: {'lr': 0.0004138821050651923, 'samples': 8126016, 'steps': 42322, 'loss/train': 1.2143610715866089} -08/30/2021 20:47:37 - INFO - __main__ - Step 42324: {'lr': 0.00041387809753146756, 'samples': 8126208, 'steps': 42323, 'loss/train': 1.393174648284912} -08/30/2021 20:47:38 - INFO - __main__ - Step 42325: {'lr': 0.00041387408992390177, 'samples': 8126400, 'steps': 42324, 'loss/train': 1.2353628873825073} -08/30/2021 20:47:38 - INFO - __main__ - Step 42326: {'lr': 0.0004138700822424968, 'samples': 8126592, 'steps': 42325, 'loss/train': 1.2122210264205933} -08/30/2021 20:47:38 - INFO - __main__ - Step 42327: {'lr': 0.0004138660744872547, 'samples': 8126784, 'steps': 42326, 'loss/train': 1.7359952926635742} -08/30/2021 20:47:40 - INFO - __main__ - Step 42328: {'lr': 0.00041386206665817684, 'samples': 8126976, 'steps': 42327, 'loss/train': 0.7341434955596924} -08/30/2021 20:47:41 - INFO - __main__ - Step 42329: {'lr': 0.0004138580587552654, 'samples': 8127168, 'steps': 42328, 'loss/train': 1.654409646987915} -08/30/2021 20:47:41 - INFO - __main__ - Step 42330: {'lr': 0.000413854050778522, 'samples': 8127360, 'steps': 42329, 'loss/train': 1.464223861694336} -08/30/2021 20:47:42 - INFO - __main__ - Step 42331: {'lr': 0.00041385004272794846, 'samples': 8127552, 'steps': 42330, 'loss/train': 0.576591968536377} -08/30/2021 20:47:42 - INFO - __main__ - Step 42332: {'lr': 0.0004138460346035467, 'samples': 8127744, 'steps': 42331, 'loss/train': 1.5685197114944458} -08/30/2021 20:47:43 - INFO - __main__ - Step 42333: {'lr': 0.0004138420264053184, 'samples': 8127936, 'steps': 42332, 'loss/train': 1.5571768283843994} -08/30/2021 20:47:44 - INFO - __main__ - Step 42334: {'lr': 0.00041383801813326543, 'samples': 8128128, 'steps': 42333, 'loss/train': 1.3254379034042358} -08/30/2021 20:47:44 - INFO - __main__ - Step 42335: {'lr': 0.00041383400978738956, 'samples': 8128320, 'steps': 42334, 'loss/train': 1.1243456602096558} -08/30/2021 20:47:45 - INFO - __main__ - Step 42336: {'lr': 0.0004138300013676926, 'samples': 8128512, 'steps': 42335, 'loss/train': 1.4749187231063843} -08/30/2021 20:47:45 - INFO - __main__ - Step 42337: {'lr': 0.0004138259928741764, 'samples': 8128704, 'steps': 42336, 'loss/train': 1.1158260107040405} -08/30/2021 20:47:45 - INFO - __main__ - Step 42338: {'lr': 0.0004138219843068427, 'samples': 8128896, 'steps': 42337, 'loss/train': 1.6016513109207153} -08/30/2021 20:47:47 - INFO - __main__ - Step 42339: {'lr': 0.00041381797566569345, 'samples': 8129088, 'steps': 42338, 'loss/train': 1.2200013399124146} -08/30/2021 20:47:47 - INFO - __main__ - Step 42340: {'lr': 0.0004138139669507303, 'samples': 8129280, 'steps': 42339, 'loss/train': 1.9808986186981201} -08/30/2021 20:47:48 - INFO - __main__ - Step 42341: {'lr': 0.000413809958161955, 'samples': 8129472, 'steps': 42340, 'loss/train': 0.7874013781547546} -08/30/2021 20:47:48 - INFO - __main__ - Step 42342: {'lr': 0.0004138059492993695, 'samples': 8129664, 'steps': 42341, 'loss/train': 1.4540199041366577} -08/30/2021 20:47:49 - INFO - __main__ - Step 42343: {'lr': 0.0004138019403629756, 'samples': 8129856, 'steps': 42342, 'loss/train': 0.6971977949142456} -08/30/2021 20:47:50 - INFO - __main__ - Step 42344: {'lr': 0.0004137979313527751, 'samples': 8130048, 'steps': 42343, 'loss/train': 0.027746109291911125} -08/30/2021 20:47:50 - INFO - __main__ - Step 42345: {'lr': 0.00041379392226876974, 'samples': 8130240, 'steps': 42344, 'loss/train': 1.6688930988311768} -08/30/2021 20:47:51 - INFO - __main__ - Step 42346: {'lr': 0.0004137899131109614, 'samples': 8130432, 'steps': 42345, 'loss/train': 0.9629099369049072} -08/30/2021 20:47:51 - INFO - __main__ - Step 42347: {'lr': 0.0004137859038793518, 'samples': 8130624, 'steps': 42346, 'loss/train': 0.9345664381980896} -08/30/2021 20:47:51 - INFO - __main__ - Step 42348: {'lr': 0.0004137818945739428, 'samples': 8130816, 'steps': 42347, 'loss/train': 1.118801474571228} -08/30/2021 20:47:52 - INFO - __main__ - Step 42349: {'lr': 0.00041377788519473624, 'samples': 8131008, 'steps': 42348, 'loss/train': 1.4099096059799194} -08/30/2021 20:47:53 - INFO - __main__ - Step 42350: {'lr': 0.0004137738757417339, 'samples': 8131200, 'steps': 42349, 'loss/train': 1.2825098037719727} -08/30/2021 20:47:54 - INFO - __main__ - Step 42351: {'lr': 0.0004137698662149375, 'samples': 8131392, 'steps': 42350, 'loss/train': 1.5043368339538574} -08/30/2021 20:47:54 - INFO - __main__ - Step 42352: {'lr': 0.00041376585661434903, 'samples': 8131584, 'steps': 42351, 'loss/train': 1.049721121788025} -08/30/2021 20:47:54 - INFO - __main__ - Step 42353: {'lr': 0.0004137618469399702, 'samples': 8131776, 'steps': 42352, 'loss/train': 1.226038932800293} -08/30/2021 20:47:55 - INFO - __main__ - Step 42354: {'lr': 0.0004137578371918027, 'samples': 8131968, 'steps': 42353, 'loss/train': 1.4198780059814453} -08/30/2021 20:47:56 - INFO - __main__ - Step 42355: {'lr': 0.00041375382736984857, 'samples': 8132160, 'steps': 42354, 'loss/train': 0.3786611258983612} -08/30/2021 20:47:57 - INFO - __main__ - Step 42356: {'lr': 0.0004137498174741094, 'samples': 8132352, 'steps': 42355, 'loss/train': 1.0501378774642944} -08/30/2021 20:47:57 - INFO - __main__ - Step 42357: {'lr': 0.0004137458075045871, 'samples': 8132544, 'steps': 42356, 'loss/train': 1.5100451707839966} -08/30/2021 20:47:58 - INFO - __main__ - Step 42358: {'lr': 0.0004137417974612835, 'samples': 8132736, 'steps': 42357, 'loss/train': 0.7366935610771179} -08/30/2021 20:47:58 - INFO - __main__ - Step 42359: {'lr': 0.0004137377873442004, 'samples': 8132928, 'steps': 42358, 'loss/train': 1.0398112535476685} -08/30/2021 20:47:59 - INFO - __main__ - Step 42360: {'lr': 0.00041373377715333946, 'samples': 8133120, 'steps': 42359, 'loss/train': 0.3249274492263794} -08/30/2021 20:48:00 - INFO - __main__ - Step 42361: {'lr': 0.00041372976688870266, 'samples': 8133312, 'steps': 42360, 'loss/train': 1.0224472284317017} -08/30/2021 20:48:00 - INFO - __main__ - Step 42362: {'lr': 0.0004137257565502918, 'samples': 8133504, 'steps': 42361, 'loss/train': 1.5017039775848389} -08/30/2021 20:48:00 - INFO - __main__ - Step 42363: {'lr': 0.00041372174613810863, 'samples': 8133696, 'steps': 42362, 'loss/train': 0.9485722184181213} -08/30/2021 20:48:01 - INFO - __main__ - Step 42364: {'lr': 0.00041371773565215494, 'samples': 8133888, 'steps': 42363, 'loss/train': 1.691267728805542} -08/30/2021 20:48:02 - INFO - __main__ - Step 42365: {'lr': 0.00041371372509243256, 'samples': 8134080, 'steps': 42364, 'loss/train': 1.8485782146453857} -08/30/2021 20:48:03 - INFO - __main__ - Step 42366: {'lr': 0.00041370971445894335, 'samples': 8134272, 'steps': 42365, 'loss/train': 1.4423432350158691} -08/30/2021 20:48:03 - INFO - __main__ - Step 42367: {'lr': 0.00041370570375168903, 'samples': 8134464, 'steps': 42366, 'loss/train': 1.0338165760040283} -08/30/2021 20:48:04 - INFO - __main__ - Step 42368: {'lr': 0.00041370169297067145, 'samples': 8134656, 'steps': 42367, 'loss/train': 1.3190189599990845} -08/30/2021 20:48:04 - INFO - __main__ - Step 42369: {'lr': 0.00041369768211589245, 'samples': 8134848, 'steps': 42368, 'loss/train': 1.589645504951477} -08/30/2021 20:48:06 - INFO - __main__ - Step 42370: {'lr': 0.0004136936711873537, 'samples': 8135040, 'steps': 42369, 'loss/train': 1.5672895908355713} -08/30/2021 20:48:06 - INFO - __main__ - Step 42371: {'lr': 0.0004136896601850572, 'samples': 8135232, 'steps': 42370, 'loss/train': 1.205672264099121} -08/30/2021 20:48:07 - INFO - __main__ - Step 42372: {'lr': 0.0004136856491090046, 'samples': 8135424, 'steps': 42371, 'loss/train': 0.03171316534280777} -08/30/2021 20:48:07 - INFO - __main__ - Step 42373: {'lr': 0.0004136816379591979, 'samples': 8135616, 'steps': 42372, 'loss/train': 1.3279576301574707} -08/30/2021 20:48:07 - INFO - __main__ - Step 42374: {'lr': 0.0004136776267356387, 'samples': 8135808, 'steps': 42373, 'loss/train': 1.119813084602356} -08/30/2021 20:48:08 - INFO - __main__ - Step 42375: {'lr': 0.0004136736154383288, 'samples': 8136000, 'steps': 42374, 'loss/train': 0.40838176012039185} -08/30/2021 20:48:08 - INFO - __main__ - Step 42376: {'lr': 0.00041366960406727024, 'samples': 8136192, 'steps': 42375, 'loss/train': 1.4585062265396118} -08/30/2021 20:48:09 - INFO - __main__ - Step 42377: {'lr': 0.00041366559262246463, 'samples': 8136384, 'steps': 42376, 'loss/train': 1.2161041498184204} -08/30/2021 20:48:10 - INFO - __main__ - Step 42378: {'lr': 0.00041366158110391375, 'samples': 8136576, 'steps': 42377, 'loss/train': 1.6128627061843872} -08/30/2021 20:48:10 - INFO - __main__ - Step 42379: {'lr': 0.0004136575695116196, 'samples': 8136768, 'steps': 42378, 'loss/train': 0.9576939940452576} -08/30/2021 20:48:11 - INFO - __main__ - Step 42380: {'lr': 0.0004136535578455838, 'samples': 8136960, 'steps': 42379, 'loss/train': 1.3552660942077637} -08/30/2021 20:48:11 - INFO - __main__ - Step 42381: {'lr': 0.0004136495461058083, 'samples': 8137152, 'steps': 42380, 'loss/train': 1.3495925664901733} -08/30/2021 20:48:13 - INFO - __main__ - Step 42382: {'lr': 0.0004136455342922948, 'samples': 8137344, 'steps': 42381, 'loss/train': 1.1265242099761963} -08/30/2021 20:48:14 - INFO - __main__ - Step 42383: {'lr': 0.0004136415224050451, 'samples': 8137536, 'steps': 42382, 'loss/train': 1.225480318069458} -08/30/2021 20:48:14 - INFO - __main__ - Step 42384: {'lr': 0.0004136375104440611, 'samples': 8137728, 'steps': 42383, 'loss/train': 1.4332607984542847} -08/30/2021 20:48:14 - INFO - __main__ - Step 42385: {'lr': 0.0004136334984093446, 'samples': 8137920, 'steps': 42384, 'loss/train': 1.367175579071045} -08/30/2021 20:48:15 - INFO - __main__ - Step 42386: {'lr': 0.0004136294863008974, 'samples': 8138112, 'steps': 42385, 'loss/train': 1.166471242904663} -08/30/2021 20:48:16 - INFO - __main__ - Step 42387: {'lr': 0.00041362547411872116, 'samples': 8138304, 'steps': 42386, 'loss/train': 1.5373362302780151} -08/30/2021 20:48:17 - INFO - __main__ - Step 42388: {'lr': 0.00041362146186281777, 'samples': 8138496, 'steps': 42387, 'loss/train': 1.256736397743225} -08/30/2021 20:48:17 - INFO - __main__ - Step 42389: {'lr': 0.00041361744953318923, 'samples': 8138688, 'steps': 42388, 'loss/train': 1.2164804935455322} -08/30/2021 20:48:17 - INFO - __main__ - Step 42390: {'lr': 0.0004136134371298371, 'samples': 8138880, 'steps': 42389, 'loss/train': 1.3490917682647705} -08/30/2021 20:48:18 - INFO - __main__ - Step 42391: {'lr': 0.0004136094246527633, 'samples': 8139072, 'steps': 42390, 'loss/train': 1.1110398769378662} -08/30/2021 20:48:19 - INFO - __main__ - Step 42392: {'lr': 0.0004136054121019697, 'samples': 8139264, 'steps': 42391, 'loss/train': 1.7152825593948364} -08/30/2021 20:48:20 - INFO - __main__ - Step 42393: {'lr': 0.0004136013994774579, 'samples': 8139456, 'steps': 42392, 'loss/train': 1.9314446449279785} -08/30/2021 20:48:20 - INFO - __main__ - Step 42394: {'lr': 0.00041359738677922993, 'samples': 8139648, 'steps': 42393, 'loss/train': 0.9482883810997009} -08/30/2021 20:48:20 - INFO - __main__ - Step 42395: {'lr': 0.00041359337400728746, 'samples': 8139840, 'steps': 42394, 'loss/train': 1.4887709617614746} -08/30/2021 20:48:21 - INFO - __main__ - Step 42396: {'lr': 0.00041358936116163224, 'samples': 8140032, 'steps': 42395, 'loss/train': 1.4302090406417847} -08/30/2021 20:48:21 - INFO - __main__ - Step 42397: {'lr': 0.00041358534824226635, 'samples': 8140224, 'steps': 42396, 'loss/train': 0.04405956715345383} -08/30/2021 20:48:22 - INFO - __main__ - Step 42398: {'lr': 0.0004135813352491913, 'samples': 8140416, 'steps': 42397, 'loss/train': 1.9415369033813477} -08/30/2021 20:48:23 - INFO - __main__ - Step 42399: {'lr': 0.00041357732218240905, 'samples': 8140608, 'steps': 42398, 'loss/train': 1.2596665620803833} -08/30/2021 20:48:23 - INFO - __main__ - Step 42400: {'lr': 0.0004135733090419215, 'samples': 8140800, 'steps': 42399, 'loss/train': 1.1599003076553345} -08/30/2021 20:48:24 - INFO - __main__ - Step 42401: {'lr': 0.00041356929582773023, 'samples': 8140992, 'steps': 42400, 'loss/train': 2.08315110206604} -08/30/2021 20:48:24 - INFO - __main__ - Step 42402: {'lr': 0.00041356528253983714, 'samples': 8141184, 'steps': 42401, 'loss/train': 1.1858502626419067} -08/30/2021 20:48:26 - INFO - __main__ - Step 42403: {'lr': 0.0004135612691782441, 'samples': 8141376, 'steps': 42402, 'loss/train': 1.6564069986343384} -08/30/2021 20:48:26 - INFO - __main__ - Step 42404: {'lr': 0.0004135572557429529, 'samples': 8141568, 'steps': 42403, 'loss/train': 1.3619468212127686} -08/30/2021 20:48:26 - INFO - __main__ - Step 42405: {'lr': 0.0004135532422339653, 'samples': 8141760, 'steps': 42404, 'loss/train': 1.3367135524749756} -08/30/2021 20:48:27 - INFO - __main__ - Step 42406: {'lr': 0.00041354922865128316, 'samples': 8141952, 'steps': 42405, 'loss/train': 1.5595271587371826} -08/30/2021 20:48:27 - INFO - __main__ - Step 42407: {'lr': 0.00041354521499490813, 'samples': 8142144, 'steps': 42406, 'loss/train': 1.2361431121826172} -08/30/2021 20:48:28 - INFO - __main__ - Step 42408: {'lr': 0.00041354120126484227, 'samples': 8142336, 'steps': 42407, 'loss/train': 1.781445026397705} -08/30/2021 20:48:29 - INFO - __main__ - Step 42409: {'lr': 0.00041353718746108724, 'samples': 8142528, 'steps': 42408, 'loss/train': 1.3715013265609741} -08/30/2021 20:48:29 - INFO - __main__ - Step 42410: {'lr': 0.00041353317358364496, 'samples': 8142720, 'steps': 42409, 'loss/train': 1.4446797370910645} -08/30/2021 20:48:30 - INFO - __main__ - Step 42411: {'lr': 0.00041352915963251705, 'samples': 8142912, 'steps': 42410, 'loss/train': 1.5277940034866333} -08/30/2021 20:48:30 - INFO - __main__ - Step 42412: {'lr': 0.00041352514560770545, 'samples': 8143104, 'steps': 42411, 'loss/train': 0.3148159086704254} -08/30/2021 20:48:31 - INFO - __main__ - Step 42413: {'lr': 0.000413521131509212, 'samples': 8143296, 'steps': 42412, 'loss/train': 1.5040147304534912} -08/30/2021 20:48:32 - INFO - __main__ - Step 42414: {'lr': 0.0004135171173370383, 'samples': 8143488, 'steps': 42413, 'loss/train': 1.3710672855377197} -08/30/2021 20:48:32 - INFO - __main__ - Step 42415: {'lr': 0.00041351310309118653, 'samples': 8143680, 'steps': 42414, 'loss/train': 1.2292615175247192} -08/30/2021 20:48:33 - INFO - __main__ - Step 42416: {'lr': 0.00041350908877165805, 'samples': 8143872, 'steps': 42415, 'loss/train': 1.3799588680267334} -08/30/2021 20:48:33 - INFO - __main__ - Step 42417: {'lr': 0.00041350507437845505, 'samples': 8144064, 'steps': 42416, 'loss/train': 0.8461814522743225} -08/30/2021 20:48:34 - INFO - __main__ - Step 42418: {'lr': 0.00041350105991157915, 'samples': 8144256, 'steps': 42417, 'loss/train': 1.0097887516021729} -08/30/2021 20:48:35 - INFO - __main__ - Step 42419: {'lr': 0.00041349704537103216, 'samples': 8144448, 'steps': 42418, 'loss/train': 1.3813625574111938} -08/30/2021 20:48:35 - INFO - __main__ - Step 42420: {'lr': 0.000413493030756816, 'samples': 8144640, 'steps': 42419, 'loss/train': 1.6276328563690186} -08/30/2021 20:48:35 - INFO - __main__ - Step 42421: {'lr': 0.0004134890160689323, 'samples': 8144832, 'steps': 42420, 'loss/train': 1.6141060590744019} -08/30/2021 20:48:36 - INFO - __main__ - Step 42422: {'lr': 0.000413485001307383, 'samples': 8145024, 'steps': 42421, 'loss/train': 1.1245355606079102} -08/30/2021 20:48:37 - INFO - __main__ - Step 42423: {'lr': 0.00041348098647216993, 'samples': 8145216, 'steps': 42422, 'loss/train': 1.54545259475708} -08/30/2021 20:48:38 - INFO - __main__ - Step 42424: {'lr': 0.00041347697156329485, 'samples': 8145408, 'steps': 42423, 'loss/train': 1.2535576820373535} -08/30/2021 20:48:38 - INFO - __main__ - Step 42425: {'lr': 0.00041347295658075955, 'samples': 8145600, 'steps': 42424, 'loss/train': 1.6858940124511719} -08/30/2021 20:48:38 - INFO - __main__ - Step 42426: {'lr': 0.00041346894152456584, 'samples': 8145792, 'steps': 42425, 'loss/train': 1.5264227390289307} -08/30/2021 20:48:39 - INFO - __main__ - Step 42427: {'lr': 0.00041346492639471555, 'samples': 8145984, 'steps': 42426, 'loss/train': 1.5428723096847534} -08/30/2021 20:48:40 - INFO - __main__ - Step 42428: {'lr': 0.0004134609111912105, 'samples': 8146176, 'steps': 42427, 'loss/train': 1.4447158575057983} -08/30/2021 20:48:41 - INFO - __main__ - Step 42429: {'lr': 0.00041345689591405256, 'samples': 8146368, 'steps': 42428, 'loss/train': 0.8225834965705872} -08/30/2021 20:48:41 - INFO - __main__ - Step 42430: {'lr': 0.0004134528805632434, 'samples': 8146560, 'steps': 42429, 'loss/train': 1.8460559844970703} -08/30/2021 20:48:41 - INFO - __main__ - Step 42431: {'lr': 0.00041344886513878485, 'samples': 8146752, 'steps': 42430, 'loss/train': 1.1114012002944946} -08/30/2021 20:48:42 - INFO - __main__ - Step 42432: {'lr': 0.00041344484964067873, 'samples': 8146944, 'steps': 42431, 'loss/train': 1.7520263195037842} -08/30/2021 20:48:44 - INFO - __main__ - Step 42433: {'lr': 0.00041344083406892704, 'samples': 8147136, 'steps': 42432, 'loss/train': 1.3878406286239624} -08/30/2021 20:48:44 - INFO - __main__ - Step 42434: {'lr': 0.0004134368184235313, 'samples': 8147328, 'steps': 42433, 'loss/train': 1.199316382408142} -08/30/2021 20:48:45 - INFO - __main__ - Step 42435: {'lr': 0.0004134328027044935, 'samples': 8147520, 'steps': 42434, 'loss/train': 1.25644052028656} -08/30/2021 20:48:45 - INFO - __main__ - Step 42436: {'lr': 0.0004134287869118154, 'samples': 8147712, 'steps': 42435, 'loss/train': 3.500422239303589} -08/30/2021 20:48:45 - INFO - __main__ - Step 42437: {'lr': 0.0004134247710454988, 'samples': 8147904, 'steps': 42436, 'loss/train': 0.9930896162986755} -08/30/2021 20:48:47 - INFO - __main__ - Step 42438: {'lr': 0.00041342075510554554, 'samples': 8148096, 'steps': 42437, 'loss/train': 1.6353338956832886} -08/30/2021 20:48:47 - INFO - __main__ - Step 42439: {'lr': 0.0004134167390919574, 'samples': 8148288, 'steps': 42438, 'loss/train': 1.2115516662597656} -08/30/2021 20:48:48 - INFO - __main__ - Step 42440: {'lr': 0.0004134127230047362, 'samples': 8148480, 'steps': 42439, 'loss/train': 1.7827893495559692} -08/30/2021 20:48:48 - INFO - __main__ - Step 42441: {'lr': 0.00041340870684388375, 'samples': 8148672, 'steps': 42440, 'loss/train': 1.2603460550308228} -08/30/2021 20:48:48 - INFO - __main__ - Step 42442: {'lr': 0.00041340469060940183, 'samples': 8148864, 'steps': 42441, 'loss/train': 1.1322824954986572} -08/30/2021 20:48:50 - INFO - __main__ - Step 42443: {'lr': 0.0004134006743012923, 'samples': 8149056, 'steps': 42442, 'loss/train': 1.6862225532531738} -08/30/2021 20:48:50 - INFO - __main__ - Step 42444: {'lr': 0.00041339665791955695, 'samples': 8149248, 'steps': 42443, 'loss/train': 1.663807988166809} -08/30/2021 20:48:51 - INFO - __main__ - Step 42445: {'lr': 0.00041339264146419757, 'samples': 8149440, 'steps': 42444, 'loss/train': 1.8957269191741943} -08/30/2021 20:48:51 - INFO - __main__ - Step 42446: {'lr': 0.000413388624935216, 'samples': 8149632, 'steps': 42445, 'loss/train': 1.2831565141677856} -08/30/2021 20:48:51 - INFO - __main__ - Step 42447: {'lr': 0.00041338460833261403, 'samples': 8149824, 'steps': 42446, 'loss/train': 1.7989166975021362} -08/30/2021 20:48:52 - INFO - __main__ - Step 42448: {'lr': 0.0004133805916563935, 'samples': 8150016, 'steps': 42447, 'loss/train': 1.447562336921692} -08/30/2021 20:48:53 - INFO - __main__ - Step 42449: {'lr': 0.00041337657490655625, 'samples': 8150208, 'steps': 42448, 'loss/train': 1.2173305749893188} -08/30/2021 20:48:54 - INFO - __main__ - Step 42450: {'lr': 0.00041337255808310394, 'samples': 8150400, 'steps': 42449, 'loss/train': 1.344080924987793} -08/30/2021 20:48:54 - INFO - __main__ - Step 42451: {'lr': 0.0004133685411860385, 'samples': 8150592, 'steps': 42450, 'loss/train': 1.2352086305618286} -08/30/2021 20:48:54 - INFO - __main__ - Step 42452: {'lr': 0.0004133645242153617, 'samples': 8150784, 'steps': 42451, 'loss/train': 1.5105088949203491} -08/30/2021 20:48:55 - INFO - __main__ - Step 42453: {'lr': 0.0004133605071710754, 'samples': 8150976, 'steps': 42452, 'loss/train': 1.3102952241897583} -08/30/2021 20:48:56 - INFO - __main__ - Step 42454: {'lr': 0.00041335649005318133, 'samples': 8151168, 'steps': 42453, 'loss/train': 1.5437383651733398} -08/30/2021 20:48:56 - INFO - __main__ - Step 42455: {'lr': 0.0004133524728616814, 'samples': 8151360, 'steps': 42454, 'loss/train': 1.6159123182296753} -08/30/2021 20:48:57 - INFO - __main__ - Step 42456: {'lr': 0.00041334845559657735, 'samples': 8151552, 'steps': 42455, 'loss/train': 1.3256717920303345} -08/30/2021 20:48:57 - INFO - __main__ - Step 42457: {'lr': 0.00041334443825787097, 'samples': 8151744, 'steps': 42456, 'loss/train': 1.9957058429718018} -08/30/2021 20:48:57 - INFO - __main__ - Step 42458: {'lr': 0.0004133404208455642, 'samples': 8151936, 'steps': 42457, 'loss/train': 1.4002066850662231} -08/30/2021 20:48:59 - INFO - __main__ - Step 42459: {'lr': 0.00041333640335965865, 'samples': 8152128, 'steps': 42458, 'loss/train': 1.3307198286056519} -08/30/2021 20:49:00 - INFO - __main__ - Step 42460: {'lr': 0.0004133323858001563, 'samples': 8152320, 'steps': 42459, 'loss/train': 1.5307797193527222} -08/30/2021 20:49:00 - INFO - __main__ - Step 42461: {'lr': 0.0004133283681670589, 'samples': 8152512, 'steps': 42460, 'loss/train': 1.557697057723999} -08/30/2021 20:49:00 - INFO - __main__ - Step 42462: {'lr': 0.0004133243504603682, 'samples': 8152704, 'steps': 42461, 'loss/train': 1.1681164503097534} -08/30/2021 20:49:01 - INFO - __main__ - Step 42463: {'lr': 0.0004133203326800861, 'samples': 8152896, 'steps': 42462, 'loss/train': 1.160837173461914} -08/30/2021 20:49:02 - INFO - __main__ - Step 42464: {'lr': 0.0004133163148262144, 'samples': 8153088, 'steps': 42463, 'loss/train': 1.4581665992736816} -08/30/2021 20:49:03 - INFO - __main__ - Step 42465: {'lr': 0.00041331229689875487, 'samples': 8153280, 'steps': 42464, 'loss/train': 1.4419481754302979} -08/30/2021 20:49:03 - INFO - __main__ - Step 42466: {'lr': 0.0004133082788977093, 'samples': 8153472, 'steps': 42465, 'loss/train': 1.2427361011505127} -08/30/2021 20:49:04 - INFO - __main__ - Step 42467: {'lr': 0.00041330426082307963, 'samples': 8153664, 'steps': 42466, 'loss/train': 1.6228910684585571} -08/30/2021 20:49:04 - INFO - __main__ - Step 42468: {'lr': 0.0004133002426748675, 'samples': 8153856, 'steps': 42467, 'loss/train': 1.0492117404937744} -08/30/2021 20:49:05 - INFO - __main__ - Step 42469: {'lr': 0.0004132962244530749, 'samples': 8154048, 'steps': 42468, 'loss/train': 1.7547143697738647} -08/30/2021 20:49:06 - INFO - __main__ - Step 42470: {'lr': 0.0004132922061577035, 'samples': 8154240, 'steps': 42469, 'loss/train': 2.085209846496582} -08/30/2021 20:49:06 - INFO - __main__ - Step 42471: {'lr': 0.0004132881877887551, 'samples': 8154432, 'steps': 42470, 'loss/train': 1.7114394903182983} -08/30/2021 20:49:06 - INFO - __main__ - Step 42472: {'lr': 0.0004132841693462315, 'samples': 8154624, 'steps': 42471, 'loss/train': 1.3582477569580078} -08/30/2021 20:49:07 - INFO - __main__ - Step 42473: {'lr': 0.0004132801508301347, 'samples': 8154816, 'steps': 42472, 'loss/train': 1.6064342260360718} -08/30/2021 20:49:08 - INFO - __main__ - Step 42474: {'lr': 0.0004132761322404663, 'samples': 8155008, 'steps': 42473, 'loss/train': 1.0829704999923706} -08/30/2021 20:49:09 - INFO - __main__ - Step 42475: {'lr': 0.00041327211357722825, 'samples': 8155200, 'steps': 42474, 'loss/train': 1.2835875749588013} -08/30/2021 20:49:09 - INFO - __main__ - Step 42476: {'lr': 0.00041326809484042235, 'samples': 8155392, 'steps': 42475, 'loss/train': 0.7128322124481201} -08/30/2021 20:49:10 - INFO - __main__ - Step 42477: {'lr': 0.0004132640760300503, 'samples': 8155584, 'steps': 42476, 'loss/train': 1.240614652633667} -08/30/2021 20:49:10 - INFO - __main__ - Step 42478: {'lr': 0.000413260057146114, 'samples': 8155776, 'steps': 42477, 'loss/train': 1.553532600402832} -08/30/2021 20:49:11 - INFO - __main__ - Step 42479: {'lr': 0.00041325603818861517, 'samples': 8155968, 'steps': 42478, 'loss/train': 1.4823521375656128} -08/30/2021 20:49:12 - INFO - __main__ - Step 42480: {'lr': 0.0004132520191575558, 'samples': 8156160, 'steps': 42479, 'loss/train': 0.9626538753509521} -08/30/2021 20:49:12 - INFO - __main__ - Step 42481: {'lr': 0.0004132480000529375, 'samples': 8156352, 'steps': 42480, 'loss/train': 1.4451993703842163} -08/30/2021 20:49:12 - INFO - __main__ - Step 42482: {'lr': 0.0004132439808747622, 'samples': 8156544, 'steps': 42481, 'loss/train': 1.4184468984603882} -08/30/2021 20:49:13 - INFO - __main__ - Step 42483: {'lr': 0.00041323996162303167, 'samples': 8156736, 'steps': 42482, 'loss/train': 1.3234270811080933} -08/30/2021 20:49:14 - INFO - __main__ - Step 42484: {'lr': 0.0004132359422977477, 'samples': 8156928, 'steps': 42483, 'loss/train': 1.406661868095398} -08/30/2021 20:49:15 - INFO - __main__ - Step 42485: {'lr': 0.0004132319228989122, 'samples': 8157120, 'steps': 42484, 'loss/train': 1.8578543663024902} -08/30/2021 20:49:15 - INFO - __main__ - Step 42486: {'lr': 0.00041322790342652695, 'samples': 8157312, 'steps': 42485, 'loss/train': 1.0198510885238647} -08/30/2021 20:49:16 - INFO - __main__ - Step 42487: {'lr': 0.00041322388388059366, 'samples': 8157504, 'steps': 42486, 'loss/train': 1.4509892463684082} -08/30/2021 20:49:16 - INFO - __main__ - Step 42488: {'lr': 0.0004132198642611142, 'samples': 8157696, 'steps': 42487, 'loss/train': 1.0758757591247559} -08/30/2021 20:49:16 - INFO - __main__ - Step 42489: {'lr': 0.0004132158445680904, 'samples': 8157888, 'steps': 42488, 'loss/train': 0.9270089268684387} -08/30/2021 20:49:18 - INFO - __main__ - Step 42490: {'lr': 0.0004132118248015241, 'samples': 8158080, 'steps': 42489, 'loss/train': 1.3946577310562134} -08/30/2021 20:49:19 - INFO - __main__ - Step 42491: {'lr': 0.000413207804961417, 'samples': 8158272, 'steps': 42490, 'loss/train': 1.0323116779327393} -08/30/2021 20:49:19 - INFO - __main__ - Step 42492: {'lr': 0.000413203785047771, 'samples': 8158464, 'steps': 42491, 'loss/train': 0.9179449677467346} -08/30/2021 20:49:20 - INFO - __main__ - Step 42493: {'lr': 0.00041319976506058785, 'samples': 8158656, 'steps': 42492, 'loss/train': 1.4155821800231934} -08/30/2021 20:49:20 - INFO - __main__ - Step 42494: {'lr': 0.00041319574499986957, 'samples': 8158848, 'steps': 42493, 'loss/train': 1.4145019054412842} -08/30/2021 20:49:21 - INFO - __main__ - Step 42495: {'lr': 0.0004131917248656177, 'samples': 8159040, 'steps': 42494, 'loss/train': 1.4065266847610474} -08/30/2021 20:49:22 - INFO - __main__ - Step 42496: {'lr': 0.0004131877046578341, 'samples': 8159232, 'steps': 42495, 'loss/train': 1.091234564781189} -08/30/2021 20:49:22 - INFO - __main__ - Step 42497: {'lr': 0.0004131836843765207, 'samples': 8159424, 'steps': 42496, 'loss/train': 1.2532246112823486} -08/30/2021 20:49:23 - INFO - __main__ - Step 42498: {'lr': 0.00041317966402167923, 'samples': 8159616, 'steps': 42497, 'loss/train': 1.2371271848678589} -08/30/2021 20:49:23 - INFO - __main__ - Step 42499: {'lr': 0.0004131756435933115, 'samples': 8159808, 'steps': 42498, 'loss/train': 1.3292351961135864} -08/30/2021 20:49:24 - INFO - __main__ - Step 42500: {'lr': 0.00041317162309141944, 'samples': 8160000, 'steps': 42499, 'loss/train': 1.3966660499572754} -08/30/2021 20:49:25 - INFO - __main__ - Step 42501: {'lr': 0.00041316760251600474, 'samples': 8160192, 'steps': 42500, 'loss/train': 1.6189367771148682} -08/30/2021 20:49:25 - INFO - __main__ - Step 42502: {'lr': 0.00041316358186706915, 'samples': 8160384, 'steps': 42501, 'loss/train': 1.6204622983932495} -08/30/2021 20:49:26 - INFO - __main__ - Step 42503: {'lr': 0.0004131595611446146, 'samples': 8160576, 'steps': 42502, 'loss/train': 1.3200327157974243} -08/30/2021 20:49:26 - INFO - __main__ - Step 42504: {'lr': 0.0004131555403486429, 'samples': 8160768, 'steps': 42503, 'loss/train': 0.7993461489677429} -08/30/2021 20:49:28 - INFO - __main__ - Step 42505: {'lr': 0.00041315151947915577, 'samples': 8160960, 'steps': 42504, 'loss/train': 1.470508098602295} -08/30/2021 20:49:28 - INFO - __main__ - Step 42506: {'lr': 0.0004131474985361551, 'samples': 8161152, 'steps': 42505, 'loss/train': 1.4613349437713623} -08/30/2021 20:49:28 - INFO - __main__ - Step 42507: {'lr': 0.0004131434775196428, 'samples': 8161344, 'steps': 42506, 'loss/train': 1.308729887008667} -08/30/2021 20:49:29 - INFO - __main__ - Step 42508: {'lr': 0.0004131394564296205, 'samples': 8161536, 'steps': 42507, 'loss/train': 0.7662352323532104} -08/30/2021 20:49:29 - INFO - __main__ - Step 42509: {'lr': 0.00041313543526609, 'samples': 8161728, 'steps': 42508, 'loss/train': 1.3929641246795654} -08/30/2021 20:49:31 - INFO - __main__ - Step 42510: {'lr': 0.00041313141402905324, 'samples': 8161920, 'steps': 42509, 'loss/train': 1.1557228565216064} -08/30/2021 20:49:32 - INFO - __main__ - Step 42511: {'lr': 0.00041312739271851196, 'samples': 8162112, 'steps': 42510, 'loss/train': 0.04168722778558731} -08/30/2021 20:49:32 - INFO - __main__ - Step 42512: {'lr': 0.0004131233713344681, 'samples': 8162304, 'steps': 42511, 'loss/train': 1.5663254261016846} -08/30/2021 20:49:32 - INFO - __main__ - Step 42513: {'lr': 0.0004131193498769232, 'samples': 8162496, 'steps': 42512, 'loss/train': 1.2366207838058472} -08/30/2021 20:49:33 - INFO - __main__ - Step 42514: {'lr': 0.0004131153283458794, 'samples': 8162688, 'steps': 42513, 'loss/train': 1.5431313514709473} -08/30/2021 20:49:33 - INFO - __main__ - Step 42515: {'lr': 0.00041311130674133824, 'samples': 8162880, 'steps': 42514, 'loss/train': 1.900691270828247} -08/30/2021 20:49:35 - INFO - __main__ - Step 42516: {'lr': 0.0004131072850633017, 'samples': 8163072, 'steps': 42515, 'loss/train': 3.089237928390503} -08/30/2021 20:49:35 - INFO - __main__ - Step 42517: {'lr': 0.0004131032633117715, 'samples': 8163264, 'steps': 42516, 'loss/train': 1.9592214822769165} -08/30/2021 20:49:35 - INFO - __main__ - Step 42518: {'lr': 0.0004130992414867495, 'samples': 8163456, 'steps': 42517, 'loss/train': 1.484342336654663} -08/30/2021 20:49:36 - INFO - __main__ - Step 42519: {'lr': 0.0004130952195882375, 'samples': 8163648, 'steps': 42518, 'loss/train': 0.9774752855300903} -08/30/2021 20:49:36 - INFO - __main__ - Step 42520: {'lr': 0.0004130911976162373, 'samples': 8163840, 'steps': 42519, 'loss/train': 2.4007885456085205} -08/30/2021 20:49:36 - INFO - __main__ - Step 42521: {'lr': 0.0004130871755707508, 'samples': 8164032, 'steps': 42520, 'loss/train': 2.6587793827056885} -08/30/2021 20:49:38 - INFO - __main__ - Step 42522: {'lr': 0.0004130831534517796, 'samples': 8164224, 'steps': 42521, 'loss/train': 1.5851733684539795} -08/30/2021 20:49:38 - INFO - __main__ - Step 42523: {'lr': 0.00041307913125932574, 'samples': 8164416, 'steps': 42522, 'loss/train': 1.733384609222412} -08/30/2021 20:49:39 - INFO - __main__ - Step 42524: {'lr': 0.00041307510899339097, 'samples': 8164608, 'steps': 42523, 'loss/train': 1.9815850257873535} -08/30/2021 20:49:39 - INFO - __main__ - Step 42525: {'lr': 0.00041307108665397695, 'samples': 8164800, 'steps': 42524, 'loss/train': 1.700609803199768} -08/30/2021 20:49:39 - INFO - __main__ - Step 42526: {'lr': 0.00041306706424108563, 'samples': 8164992, 'steps': 42525, 'loss/train': 1.851414680480957} -08/30/2021 20:49:41 - INFO - __main__ - Step 42527: {'lr': 0.0004130630417547189, 'samples': 8165184, 'steps': 42526, 'loss/train': 0.22715997695922852} -08/30/2021 20:49:41 - INFO - __main__ - Step 42528: {'lr': 0.00041305901919487845, 'samples': 8165376, 'steps': 42527, 'loss/train': 1.1178879737854004} -08/30/2021 20:49:42 - INFO - __main__ - Step 42529: {'lr': 0.0004130549965615661, 'samples': 8165568, 'steps': 42528, 'loss/train': 1.2869858741760254} -08/30/2021 20:49:42 - INFO - __main__ - Step 42530: {'lr': 0.00041305097385478375, 'samples': 8165760, 'steps': 42529, 'loss/train': 1.551637053489685} -08/30/2021 20:49:42 - INFO - __main__ - Step 42531: {'lr': 0.00041304695107453307, 'samples': 8165952, 'steps': 42530, 'loss/train': 1.540576457977295} -08/30/2021 20:49:44 - INFO - __main__ - Step 42532: {'lr': 0.000413042928220816, 'samples': 8166144, 'steps': 42531, 'loss/train': 1.5075185298919678} -08/30/2021 20:49:44 - INFO - __main__ - Step 42533: {'lr': 0.0004130389052936342, 'samples': 8166336, 'steps': 42532, 'loss/train': 1.7715404033660889} -08/30/2021 20:49:45 - INFO - __main__ - Step 42534: {'lr': 0.0004130348822929897, 'samples': 8166528, 'steps': 42533, 'loss/train': 1.2812774181365967} -08/30/2021 20:49:45 - INFO - __main__ - Step 42535: {'lr': 0.0004130308592188842, 'samples': 8166720, 'steps': 42534, 'loss/train': 1.3679696321487427} -08/30/2021 20:49:45 - INFO - __main__ - Step 42536: {'lr': 0.0004130268360713194, 'samples': 8166912, 'steps': 42535, 'loss/train': 1.3101842403411865} -08/30/2021 20:49:47 - INFO - __main__ - Step 42537: {'lr': 0.0004130228128502973, 'samples': 8167104, 'steps': 42536, 'loss/train': 0.7195220589637756} -08/30/2021 20:49:48 - INFO - __main__ - Step 42538: {'lr': 0.0004130187895558196, 'samples': 8167296, 'steps': 42537, 'loss/train': 1.4899779558181763} -08/30/2021 20:49:48 - INFO - __main__ - Step 42539: {'lr': 0.00041301476618788827, 'samples': 8167488, 'steps': 42538, 'loss/train': 1.2303898334503174} -08/30/2021 20:49:48 - INFO - __main__ - Step 42540: {'lr': 0.0004130107427465049, 'samples': 8167680, 'steps': 42539, 'loss/train': 2.069544792175293} -08/30/2021 20:49:49 - INFO - __main__ - Step 42541: {'lr': 0.00041300671923167145, 'samples': 8167872, 'steps': 42540, 'loss/train': 1.3896760940551758} -08/30/2021 20:49:49 - INFO - __main__ - Step 42542: {'lr': 0.00041300269564338956, 'samples': 8168064, 'steps': 42541, 'loss/train': 1.662202000617981} -08/30/2021 20:49:51 - INFO - __main__ - Step 42543: {'lr': 0.0004129986719816613, 'samples': 8168256, 'steps': 42542, 'loss/train': 1.1935375928878784} -08/30/2021 20:49:52 - INFO - __main__ - Step 42544: {'lr': 0.0004129946482464883, 'samples': 8168448, 'steps': 42543, 'loss/train': 1.8810354471206665} -08/30/2021 20:49:52 - INFO - __main__ - Step 42545: {'lr': 0.0004129906244378724, 'samples': 8168640, 'steps': 42544, 'loss/train': 1.8081306219100952} -08/30/2021 20:49:52 - INFO - __main__ - Step 42546: {'lr': 0.0004129866005558155, 'samples': 8168832, 'steps': 42545, 'loss/train': 1.1107478141784668} -08/30/2021 20:49:53 - INFO - __main__ - Step 42547: {'lr': 0.00041298257660031935, 'samples': 8169024, 'steps': 42546, 'loss/train': 1.7478294372558594} -08/30/2021 20:49:54 - INFO - __main__ - Step 42548: {'lr': 0.00041297855257138577, 'samples': 8169216, 'steps': 42547, 'loss/train': 1.5327491760253906} -08/30/2021 20:49:55 - INFO - __main__ - Step 42549: {'lr': 0.0004129745284690165, 'samples': 8169408, 'steps': 42548, 'loss/train': 1.8275268077850342} -08/30/2021 20:49:55 - INFO - __main__ - Step 42550: {'lr': 0.0004129705042932135, 'samples': 8169600, 'steps': 42549, 'loss/train': 1.6237115859985352} -08/30/2021 20:49:56 - INFO - __main__ - Step 42551: {'lr': 0.0004129664800439785, 'samples': 8169792, 'steps': 42550, 'loss/train': 1.6580188274383545} -08/30/2021 20:49:56 - INFO - __main__ - Step 42552: {'lr': 0.0004129624557213133, 'samples': 8169984, 'steps': 42551, 'loss/train': 0.9206991791725159} -08/30/2021 20:49:57 - INFO - __main__ - Step 42553: {'lr': 0.00041295843132521973, 'samples': 8170176, 'steps': 42552, 'loss/train': 1.4790221452713013} -08/30/2021 20:49:58 - INFO - __main__ - Step 42554: {'lr': 0.0004129544068556996, 'samples': 8170368, 'steps': 42553, 'loss/train': 1.334619402885437} -08/30/2021 20:49:58 - INFO - __main__ - Step 42555: {'lr': 0.00041295038231275473, 'samples': 8170560, 'steps': 42554, 'loss/train': 1.3303892612457275} -08/30/2021 20:49:59 - INFO - __main__ - Step 42556: {'lr': 0.0004129463576963869, 'samples': 8170752, 'steps': 42555, 'loss/train': 1.7905478477478027} -08/30/2021 20:49:59 - INFO - __main__ - Step 42557: {'lr': 0.000412942333006598, 'samples': 8170944, 'steps': 42556, 'loss/train': 1.8300361633300781} -08/30/2021 20:50:00 - INFO - __main__ - Step 42558: {'lr': 0.0004129383082433898, 'samples': 8171136, 'steps': 42557, 'loss/train': 1.423487663269043} -08/30/2021 20:50:01 - INFO - __main__ - Step 42559: {'lr': 0.0004129342834067641, 'samples': 8171328, 'steps': 42558, 'loss/train': 0.595382809638977} -08/30/2021 20:50:01 - INFO - __main__ - Step 42560: {'lr': 0.0004129302584967227, 'samples': 8171520, 'steps': 42559, 'loss/train': 0.5447129011154175} -08/30/2021 20:50:02 - INFO - __main__ - Step 42561: {'lr': 0.0004129262335132675, 'samples': 8171712, 'steps': 42560, 'loss/train': 1.147903561592102} -08/30/2021 20:50:02 - INFO - __main__ - Step 42562: {'lr': 0.00041292220845640023, 'samples': 8171904, 'steps': 42561, 'loss/train': 1.5784170627593994} -08/30/2021 20:50:03 - INFO - __main__ - Step 42563: {'lr': 0.00041291818332612275, 'samples': 8172096, 'steps': 42562, 'loss/train': 1.3214142322540283} -08/30/2021 20:50:04 - INFO - __main__ - Step 42564: {'lr': 0.00041291415812243676, 'samples': 8172288, 'steps': 42563, 'loss/train': 1.2969063520431519} -08/30/2021 20:50:04 - INFO - __main__ - Step 42565: {'lr': 0.0004129101328453442, 'samples': 8172480, 'steps': 42564, 'loss/train': 1.8963228464126587} -08/30/2021 20:50:05 - INFO - __main__ - Step 42566: {'lr': 0.0004129061074948469, 'samples': 8172672, 'steps': 42565, 'loss/train': 0.8637040853500366} -08/30/2021 20:50:05 - INFO - __main__ - Step 42567: {'lr': 0.0004129020820709466, 'samples': 8172864, 'steps': 42566, 'loss/train': 1.4360512495040894} -08/30/2021 20:50:05 - INFO - __main__ - Step 42568: {'lr': 0.00041289805657364516, 'samples': 8173056, 'steps': 42567, 'loss/train': 1.4814757108688354} -08/30/2021 20:50:07 - INFO - __main__ - Step 42569: {'lr': 0.0004128940310029443, 'samples': 8173248, 'steps': 42568, 'loss/train': 1.460622787475586} -08/30/2021 20:50:07 - INFO - __main__ - Step 42570: {'lr': 0.0004128900053588459, 'samples': 8173440, 'steps': 42569, 'loss/train': 1.2954845428466797} -08/30/2021 20:50:08 - INFO - __main__ - Step 42571: {'lr': 0.00041288597964135186, 'samples': 8173632, 'steps': 42570, 'loss/train': 1.1991653442382812} -08/30/2021 20:50:08 - INFO - __main__ - Step 42572: {'lr': 0.0004128819538504639, 'samples': 8173824, 'steps': 42571, 'loss/train': 1.2448238134384155} -08/30/2021 20:50:08 - INFO - __main__ - Step 42573: {'lr': 0.00041287792798618374, 'samples': 8174016, 'steps': 42572, 'loss/train': 1.7913423776626587} -08/30/2021 20:50:10 - INFO - __main__ - Step 42574: {'lr': 0.00041287390204851343, 'samples': 8174208, 'steps': 42573, 'loss/train': 1.2062824964523315} -08/30/2021 20:50:10 - INFO - __main__ - Step 42575: {'lr': 0.0004128698760374546, 'samples': 8174400, 'steps': 42574, 'loss/train': 1.3583638668060303} -08/30/2021 20:50:11 - INFO - __main__ - Step 42576: {'lr': 0.0004128658499530091, 'samples': 8174592, 'steps': 42575, 'loss/train': 1.3554943799972534} -08/30/2021 20:50:11 - INFO - __main__ - Step 42577: {'lr': 0.00041286182379517876, 'samples': 8174784, 'steps': 42576, 'loss/train': 1.3241122961044312} -08/30/2021 20:50:11 - INFO - __main__ - Step 42578: {'lr': 0.00041285779756396543, 'samples': 8174976, 'steps': 42577, 'loss/train': 1.5234028100967407} -08/30/2021 20:50:13 - INFO - __main__ - Step 42579: {'lr': 0.00041285377125937085, 'samples': 8175168, 'steps': 42578, 'loss/train': 1.1367021799087524} -08/30/2021 20:50:13 - INFO - __main__ - Step 42580: {'lr': 0.0004128497448813969, 'samples': 8175360, 'steps': 42579, 'loss/train': 1.0235539674758911} -08/30/2021 20:50:13 - INFO - __main__ - Step 42581: {'lr': 0.0004128457184300454, 'samples': 8175552, 'steps': 42580, 'loss/train': 1.264026403427124} -08/30/2021 20:50:14 - INFO - __main__ - Step 42582: {'lr': 0.0004128416919053181, 'samples': 8175744, 'steps': 42581, 'loss/train': 1.6446257829666138} -08/30/2021 20:50:14 - INFO - __main__ - Step 42583: {'lr': 0.0004128376653072168, 'samples': 8175936, 'steps': 42582, 'loss/train': 2.0228919982910156} -08/30/2021 20:50:16 - INFO - __main__ - Step 42584: {'lr': 0.0004128336386357434, 'samples': 8176128, 'steps': 42583, 'loss/train': 0.9513541460037231} -08/30/2021 20:50:16 - INFO - __main__ - Step 42585: {'lr': 0.0004128296118908997, 'samples': 8176320, 'steps': 42584, 'loss/train': 0.9187955856323242} -08/30/2021 20:50:16 - INFO - __main__ - Step 42586: {'lr': 0.0004128255850726874, 'samples': 8176512, 'steps': 42585, 'loss/train': 1.342198133468628} -08/30/2021 20:50:17 - INFO - __main__ - Step 42587: {'lr': 0.0004128215581811085, 'samples': 8176704, 'steps': 42586, 'loss/train': 1.0489925146102905} -08/30/2021 20:50:17 - INFO - __main__ - Step 42588: {'lr': 0.0004128175312161647, 'samples': 8176896, 'steps': 42587, 'loss/train': 1.5324856042861938} -08/30/2021 20:50:19 - INFO - __main__ - Step 42589: {'lr': 0.00041281350417785777, 'samples': 8177088, 'steps': 42588, 'loss/train': 1.1539678573608398} -08/30/2021 20:50:19 - INFO - __main__ - Step 42590: {'lr': 0.00041280947706618965, 'samples': 8177280, 'steps': 42589, 'loss/train': 1.7433608770370483} -08/30/2021 20:50:19 - INFO - __main__ - Step 42591: {'lr': 0.0004128054498811621, 'samples': 8177472, 'steps': 42590, 'loss/train': 1.2905824184417725} -08/30/2021 20:50:20 - INFO - __main__ - Step 42592: {'lr': 0.0004128014226227769, 'samples': 8177664, 'steps': 42591, 'loss/train': 0.9582744836807251} -08/30/2021 20:50:20 - INFO - __main__ - Step 42593: {'lr': 0.00041279739529103586, 'samples': 8177856, 'steps': 42592, 'loss/train': 0.974994957447052} -08/30/2021 20:50:22 - INFO - __main__ - Step 42594: {'lr': 0.0004127933678859409, 'samples': 8178048, 'steps': 42593, 'loss/train': 1.4279515743255615} -08/30/2021 20:50:22 - INFO - __main__ - Step 42595: {'lr': 0.00041278934040749375, 'samples': 8178240, 'steps': 42594, 'loss/train': 1.3299150466918945} -08/30/2021 20:50:22 - INFO - __main__ - Step 42596: {'lr': 0.0004127853128556962, 'samples': 8178432, 'steps': 42595, 'loss/train': 0.41914287209510803} -08/30/2021 20:50:23 - INFO - __main__ - Step 42597: {'lr': 0.00041278128523055015, 'samples': 8178624, 'steps': 42596, 'loss/train': 1.0886958837509155} -08/30/2021 20:50:23 - INFO - __main__ - Step 42598: {'lr': 0.0004127772575320573, 'samples': 8178816, 'steps': 42597, 'loss/train': 1.7218480110168457} -08/30/2021 20:50:25 - INFO - __main__ - Step 42599: {'lr': 0.0004127732297602196, 'samples': 8179008, 'steps': 42598, 'loss/train': 1.7389047145843506} -08/30/2021 20:50:25 - INFO - __main__ - Step 42600: {'lr': 0.0004127692019150387, 'samples': 8179200, 'steps': 42599, 'loss/train': 1.8176203966140747} -08/30/2021 20:50:26 - INFO - __main__ - Step 42601: {'lr': 0.00041276517399651657, 'samples': 8179392, 'steps': 42600, 'loss/train': 1.3899518251419067} -08/30/2021 20:50:26 - INFO - __main__ - Step 42602: {'lr': 0.00041276114600465497, 'samples': 8179584, 'steps': 42601, 'loss/train': 1.1477563381195068} -08/30/2021 20:50:26 - INFO - __main__ - Step 42603: {'lr': 0.0004127571179394557, 'samples': 8179776, 'steps': 42602, 'loss/train': 1.45731782913208} -08/30/2021 20:50:27 - INFO - __main__ - Step 42604: {'lr': 0.0004127530898009205, 'samples': 8179968, 'steps': 42603, 'loss/train': 1.2893725633621216} -08/30/2021 20:50:28 - INFO - __main__ - Step 42605: {'lr': 0.00041274906158905137, 'samples': 8180160, 'steps': 42604, 'loss/train': 0.9913890361785889} -08/30/2021 20:50:29 - INFO - __main__ - Step 42606: {'lr': 0.00041274503330384997, 'samples': 8180352, 'steps': 42605, 'loss/train': 0.5048430562019348} -08/30/2021 20:50:29 - INFO - __main__ - Step 42607: {'lr': 0.0004127410049453182, 'samples': 8180544, 'steps': 42606, 'loss/train': 1.211820363998413} -08/30/2021 20:50:30 - INFO - __main__ - Step 42608: {'lr': 0.00041273697651345785, 'samples': 8180736, 'steps': 42607, 'loss/train': 1.0460318326950073} -08/30/2021 20:50:30 - INFO - __main__ - Step 42609: {'lr': 0.00041273294800827075, 'samples': 8180928, 'steps': 42608, 'loss/train': 1.3623193502426147} -08/30/2021 20:50:31 - INFO - __main__ - Step 42610: {'lr': 0.00041272891942975863, 'samples': 8181120, 'steps': 42609, 'loss/train': 1.2552400827407837} -08/30/2021 20:50:32 - INFO - __main__ - Step 42611: {'lr': 0.00041272489077792343, 'samples': 8181312, 'steps': 42610, 'loss/train': 1.045832633972168} -08/30/2021 20:50:32 - INFO - __main__ - Step 42612: {'lr': 0.0004127208620527669, 'samples': 8181504, 'steps': 42611, 'loss/train': 0.9717525839805603} -08/30/2021 20:50:33 - INFO - __main__ - Step 42613: {'lr': 0.00041271683325429075, 'samples': 8181696, 'steps': 42612, 'loss/train': 0.8153554797172546} -08/30/2021 20:50:33 - INFO - __main__ - Step 42614: {'lr': 0.00041271280438249705, 'samples': 8181888, 'steps': 42613, 'loss/train': 1.4658877849578857} -08/30/2021 20:50:35 - INFO - __main__ - Step 42615: {'lr': 0.00041270877543738744, 'samples': 8182080, 'steps': 42614, 'loss/train': 1.6607701778411865} -08/30/2021 20:50:35 - INFO - __main__ - Step 42616: {'lr': 0.0004127047464189637, 'samples': 8182272, 'steps': 42615, 'loss/train': 1.2117866277694702} -08/30/2021 20:50:35 - INFO - __main__ - Step 42617: {'lr': 0.0004127007173272278, 'samples': 8182464, 'steps': 42616, 'loss/train': 1.2703490257263184} -08/30/2021 20:50:36 - INFO - __main__ - Step 42618: {'lr': 0.0004126966881621814, 'samples': 8182656, 'steps': 42617, 'loss/train': 1.5068018436431885} -08/30/2021 20:50:36 - INFO - __main__ - Step 42619: {'lr': 0.0004126926589238264, 'samples': 8182848, 'steps': 42618, 'loss/train': 1.1753032207489014} -08/30/2021 20:50:38 - INFO - __main__ - Step 42620: {'lr': 0.00041268862961216457, 'samples': 8183040, 'steps': 42619, 'loss/train': 1.5578181743621826} -08/30/2021 20:50:38 - INFO - __main__ - Step 42621: {'lr': 0.00041268460022719783, 'samples': 8183232, 'steps': 42620, 'loss/train': 1.3847417831420898} -08/30/2021 20:50:38 - INFO - __main__ - Step 42622: {'lr': 0.0004126805707689279, 'samples': 8183424, 'steps': 42621, 'loss/train': 1.6318258047103882} -08/30/2021 20:50:39 - INFO - __main__ - Step 42623: {'lr': 0.0004126765412373566, 'samples': 8183616, 'steps': 42622, 'loss/train': 1.423075795173645} -08/30/2021 20:50:39 - INFO - __main__ - Step 42624: {'lr': 0.0004126725116324858, 'samples': 8183808, 'steps': 42623, 'loss/train': 2.2788617610931396} -08/30/2021 20:50:40 - INFO - __main__ - Step 42625: {'lr': 0.00041266848195431715, 'samples': 8184000, 'steps': 42624, 'loss/train': 2.6883630752563477} -08/30/2021 20:50:41 - INFO - __main__ - Step 42626: {'lr': 0.00041266445220285267, 'samples': 8184192, 'steps': 42625, 'loss/train': 1.554368019104004} -08/30/2021 20:50:41 - INFO - __main__ - Step 42627: {'lr': 0.0004126604223780941, 'samples': 8184384, 'steps': 42626, 'loss/train': 1.5231170654296875} -08/30/2021 20:50:42 - INFO - __main__ - Step 42628: {'lr': 0.00041265639248004327, 'samples': 8184576, 'steps': 42627, 'loss/train': 1.1753484010696411} -08/30/2021 20:50:42 - INFO - __main__ - Step 42629: {'lr': 0.000412652362508702, 'samples': 8184768, 'steps': 42628, 'loss/train': 1.1532585620880127} -08/30/2021 20:50:42 - INFO - __main__ - Step 42630: {'lr': 0.000412648332464072, 'samples': 8184960, 'steps': 42629, 'loss/train': 1.1923291683197021} -08/30/2021 20:50:44 - INFO - __main__ - Step 42631: {'lr': 0.00041264430234615526, 'samples': 8185152, 'steps': 42630, 'loss/train': 1.5295366048812866} -08/30/2021 20:50:44 - INFO - __main__ - Step 42632: {'lr': 0.0004126402721549535, 'samples': 8185344, 'steps': 42631, 'loss/train': 1.3435066938400269} -08/30/2021 20:50:45 - INFO - __main__ - Step 42633: {'lr': 0.00041263624189046846, 'samples': 8185536, 'steps': 42632, 'loss/train': 1.9694530963897705} -08/30/2021 20:50:45 - INFO - __main__ - Step 42634: {'lr': 0.0004126322115527021, 'samples': 8185728, 'steps': 42633, 'loss/train': 1.7155439853668213} -08/30/2021 20:50:45 - INFO - __main__ - Step 42635: {'lr': 0.00041262818114165615, 'samples': 8185920, 'steps': 42634, 'loss/train': 0.8143765330314636} -08/30/2021 20:50:47 - INFO - __main__ - Step 42636: {'lr': 0.0004126241506573325, 'samples': 8186112, 'steps': 42635, 'loss/train': 1.4423202276229858} -08/30/2021 20:50:47 - INFO - __main__ - Step 42637: {'lr': 0.00041262012009973283, 'samples': 8186304, 'steps': 42636, 'loss/train': 1.0636776685714722} -08/30/2021 20:50:48 - INFO - __main__ - Step 42638: {'lr': 0.0004126160894688591, 'samples': 8186496, 'steps': 42637, 'loss/train': 1.1029741764068604} -08/30/2021 20:50:48 - INFO - __main__ - Step 42639: {'lr': 0.00041261205876471307, 'samples': 8186688, 'steps': 42638, 'loss/train': 1.4843602180480957} -08/30/2021 20:50:48 - INFO - __main__ - Step 42640: {'lr': 0.0004126080279872966, 'samples': 8186880, 'steps': 42639, 'loss/train': 1.6286613941192627} -08/30/2021 20:50:50 - INFO - __main__ - Step 42641: {'lr': 0.0004126039971366114, 'samples': 8187072, 'steps': 42640, 'loss/train': 1.3744587898254395} -08/30/2021 20:50:51 - INFO - __main__ - Step 42642: {'lr': 0.0004125999662126594, 'samples': 8187264, 'steps': 42641, 'loss/train': 1.0720371007919312} -08/30/2021 20:50:51 - INFO - __main__ - Step 42643: {'lr': 0.00041259593521544223, 'samples': 8187456, 'steps': 42642, 'loss/train': 1.090353012084961} -08/30/2021 20:50:52 - INFO - __main__ - Step 42644: {'lr': 0.00041259190414496194, 'samples': 8187648, 'steps': 42643, 'loss/train': 1.4614031314849854} -08/30/2021 20:50:52 - INFO - __main__ - Step 42645: {'lr': 0.00041258787300122026, 'samples': 8187840, 'steps': 42644, 'loss/train': 1.0903599262237549} -08/30/2021 20:50:52 - INFO - __main__ - Step 42646: {'lr': 0.000412583841784219, 'samples': 8188032, 'steps': 42645, 'loss/train': 0.9116281867027283} -08/30/2021 20:50:54 - INFO - __main__ - Step 42647: {'lr': 0.00041257981049395997, 'samples': 8188224, 'steps': 42646, 'loss/train': 0.9863569736480713} -08/30/2021 20:50:54 - INFO - __main__ - Step 42648: {'lr': 0.000412575779130445, 'samples': 8188416, 'steps': 42647, 'loss/train': 0.9859895706176758} -08/30/2021 20:50:55 - INFO - __main__ - Step 42649: {'lr': 0.0004125717476936758, 'samples': 8188608, 'steps': 42648, 'loss/train': 1.2508624792099} -08/30/2021 20:50:55 - INFO - __main__ - Step 42650: {'lr': 0.0004125677161836543, 'samples': 8188800, 'steps': 42649, 'loss/train': 1.386723518371582} -08/30/2021 20:50:55 - INFO - __main__ - Step 42651: {'lr': 0.00041256368460038237, 'samples': 8188992, 'steps': 42650, 'loss/train': 1.272167444229126} -08/30/2021 20:50:57 - INFO - __main__ - Step 42652: {'lr': 0.00041255965294386174, 'samples': 8189184, 'steps': 42651, 'loss/train': 1.139366626739502} -08/30/2021 20:50:57 - INFO - __main__ - Step 42653: {'lr': 0.00041255562121409416, 'samples': 8189376, 'steps': 42652, 'loss/train': 1.252394676208496} -08/30/2021 20:50:58 - INFO - __main__ - Step 42654: {'lr': 0.0004125515894110816, 'samples': 8189568, 'steps': 42653, 'loss/train': 1.7041313648223877} -08/30/2021 20:50:58 - INFO - __main__ - Step 42655: {'lr': 0.00041254755753482574, 'samples': 8189760, 'steps': 42654, 'loss/train': 0.987637996673584} -08/30/2021 20:50:58 - INFO - __main__ - Step 42656: {'lr': 0.00041254352558532854, 'samples': 8189952, 'steps': 42655, 'loss/train': 1.3389077186584473} -08/30/2021 20:51:00 - INFO - __main__ - Step 42657: {'lr': 0.0004125394935625917, 'samples': 8190144, 'steps': 42656, 'loss/train': 1.2290616035461426} -08/30/2021 20:51:00 - INFO - __main__ - Step 42658: {'lr': 0.00041253546146661704, 'samples': 8190336, 'steps': 42657, 'loss/train': 1.597948670387268} -08/30/2021 20:51:01 - INFO - __main__ - Step 42659: {'lr': 0.00041253142929740643, 'samples': 8190528, 'steps': 42658, 'loss/train': 0.8809319138526917} -08/30/2021 20:51:01 - INFO - __main__ - Step 42660: {'lr': 0.00041252739705496165, 'samples': 8190720, 'steps': 42659, 'loss/train': 1.0182900428771973} -08/30/2021 20:51:01 - INFO - __main__ - Step 42661: {'lr': 0.00041252336473928455, 'samples': 8190912, 'steps': 42660, 'loss/train': 1.8301284313201904} -08/30/2021 20:51:03 - INFO - __main__ - Step 42662: {'lr': 0.00041251933235037695, 'samples': 8191104, 'steps': 42661, 'loss/train': 1.517749309539795} -08/30/2021 20:51:03 - INFO - __main__ - Step 42663: {'lr': 0.00041251529988824067, 'samples': 8191296, 'steps': 42662, 'loss/train': 0.9042937159538269} -08/30/2021 20:51:04 - INFO - __main__ - Step 42664: {'lr': 0.0004125112673528775, 'samples': 8191488, 'steps': 42663, 'loss/train': 1.3166545629501343} -08/30/2021 20:51:04 - INFO - __main__ - Step 42665: {'lr': 0.0004125072347442892, 'samples': 8191680, 'steps': 42664, 'loss/train': 1.620734453201294} -08/30/2021 20:51:04 - INFO - __main__ - Step 42666: {'lr': 0.0004125032020624776, 'samples': 8191872, 'steps': 42665, 'loss/train': 1.7824167013168335} -08/30/2021 20:51:06 - INFO - __main__ - Step 42667: {'lr': 0.0004124991693074447, 'samples': 8192064, 'steps': 42666, 'loss/train': 1.478500247001648} -08/30/2021 20:51:06 - INFO - __main__ - Step 42668: {'lr': 0.00041249513647919207, 'samples': 8192256, 'steps': 42667, 'loss/train': 1.3233987092971802} -08/30/2021 20:51:07 - INFO - __main__ - Step 42669: {'lr': 0.00041249110357772167, 'samples': 8192448, 'steps': 42668, 'loss/train': 1.3106153011322021} -08/30/2021 20:51:07 - INFO - __main__ - Step 42670: {'lr': 0.00041248707060303536, 'samples': 8192640, 'steps': 42669, 'loss/train': 1.2161531448364258} -08/30/2021 20:51:07 - INFO - __main__ - Step 42671: {'lr': 0.00041248303755513484, 'samples': 8192832, 'steps': 42670, 'loss/train': 1.5994771718978882} -08/30/2021 20:51:10 - INFO - __main__ - Step 42672: {'lr': 0.00041247900443402194, 'samples': 8193024, 'steps': 42671, 'loss/train': 1.877849817276001} -08/30/2021 20:51:10 - INFO - __main__ - Step 42673: {'lr': 0.00041247497123969844, 'samples': 8193216, 'steps': 42672, 'loss/train': 1.4366408586502075} -08/30/2021 20:51:10 - INFO - __main__ - Step 42674: {'lr': 0.00041247093797216637, 'samples': 8193408, 'steps': 42673, 'loss/train': 2.9169890880584717} -08/30/2021 20:51:11 - INFO - __main__ - Step 42675: {'lr': 0.00041246690463142733, 'samples': 8193600, 'steps': 42674, 'loss/train': 0.12583310902118683} -08/30/2021 20:51:11 - INFO - __main__ - Step 42676: {'lr': 0.0004124628712174833, 'samples': 8193792, 'steps': 42675, 'loss/train': 0.24078887701034546} -08/30/2021 20:51:12 - INFO - __main__ - Step 42677: {'lr': 0.0004124588377303359, 'samples': 8193984, 'steps': 42676, 'loss/train': 1.1301815509796143} -08/30/2021 20:51:13 - INFO - __main__ - Step 42678: {'lr': 0.00041245480416998704, 'samples': 8194176, 'steps': 42677, 'loss/train': 1.311215877532959} -08/30/2021 20:51:13 - INFO - __main__ - Step 42679: {'lr': 0.00041245077053643866, 'samples': 8194368, 'steps': 42678, 'loss/train': 1.1596556901931763} -08/30/2021 20:51:14 - INFO - __main__ - Step 42680: {'lr': 0.0004124467368296924, 'samples': 8194560, 'steps': 42679, 'loss/train': 0.9840144515037537} -08/30/2021 20:51:14 - INFO - __main__ - Step 42681: {'lr': 0.00041244270304975004, 'samples': 8194752, 'steps': 42680, 'loss/train': 1.235546588897705} -08/30/2021 20:51:14 - INFO - __main__ - Step 42682: {'lr': 0.0004124386691966137, 'samples': 8194944, 'steps': 42681, 'loss/train': 1.643437385559082} -08/30/2021 20:51:16 - INFO - __main__ - Step 42683: {'lr': 0.00041243463527028493, 'samples': 8195136, 'steps': 42682, 'loss/train': 1.6930502653121948} -08/30/2021 20:51:16 - INFO - __main__ - Step 42684: {'lr': 0.0004124306012707656, 'samples': 8195328, 'steps': 42683, 'loss/train': 1.128927230834961} -08/30/2021 20:51:17 - INFO - __main__ - Step 42685: {'lr': 0.00041242656719805754, 'samples': 8195520, 'steps': 42684, 'loss/train': 1.5005710124969482} -08/30/2021 20:51:17 - INFO - __main__ - Step 42686: {'lr': 0.0004124225330521626, 'samples': 8195712, 'steps': 42685, 'loss/train': 1.2922616004943848} -08/30/2021 20:51:17 - INFO - __main__ - Step 42687: {'lr': 0.0004124184988330826, 'samples': 8195904, 'steps': 42686, 'loss/train': 1.1025948524475098} -08/30/2021 20:51:19 - INFO - __main__ - Step 42688: {'lr': 0.0004124144645408192, 'samples': 8196096, 'steps': 42687, 'loss/train': 2.2752678394317627} -08/30/2021 20:51:19 - INFO - __main__ - Step 42689: {'lr': 0.0004124104301753745, 'samples': 8196288, 'steps': 42688, 'loss/train': 1.0980074405670166} -08/30/2021 20:51:20 - INFO - __main__ - Step 42690: {'lr': 0.0004124063957367501, 'samples': 8196480, 'steps': 42689, 'loss/train': 0.9873174428939819} -08/30/2021 20:51:20 - INFO - __main__ - Step 42691: {'lr': 0.0004124023612249479, 'samples': 8196672, 'steps': 42690, 'loss/train': 0.8801842927932739} -08/30/2021 20:51:20 - INFO - __main__ - Step 42692: {'lr': 0.0004123983266399697, 'samples': 8196864, 'steps': 42691, 'loss/train': 1.5642693042755127} -08/30/2021 20:51:22 - INFO - __main__ - Step 42693: {'lr': 0.0004123942919818173, 'samples': 8197056, 'steps': 42692, 'loss/train': 1.1973350048065186} -08/30/2021 20:51:22 - INFO - __main__ - Step 42694: {'lr': 0.00041239025725049256, 'samples': 8197248, 'steps': 42693, 'loss/train': 1.8853051662445068} -08/30/2021 20:51:23 - INFO - __main__ - Step 42695: {'lr': 0.0004123862224459973, 'samples': 8197440, 'steps': 42694, 'loss/train': 1.9385746717453003} -08/30/2021 20:51:23 - INFO - __main__ - Step 42696: {'lr': 0.0004123821875683333, 'samples': 8197632, 'steps': 42695, 'loss/train': 1.6885868310928345} -08/30/2021 20:51:23 - INFO - __main__ - Step 42697: {'lr': 0.0004123781526175023, 'samples': 8197824, 'steps': 42696, 'loss/train': 1.3855059146881104} -08/30/2021 20:51:26 - INFO - __main__ - Step 42698: {'lr': 0.0004123741175935063, 'samples': 8198016, 'steps': 42697, 'loss/train': 1.3950804471969604} -08/30/2021 20:51:26 - INFO - __main__ - Step 42699: {'lr': 0.000412370082496347, 'samples': 8198208, 'steps': 42698, 'loss/train': 1.429821491241455} -08/30/2021 20:51:27 - INFO - __main__ - Step 42700: {'lr': 0.0004123660473260263, 'samples': 8198400, 'steps': 42699, 'loss/train': 1.7408299446105957} -08/30/2021 20:51:27 - INFO - __main__ - Step 42701: {'lr': 0.0004123620120825459, 'samples': 8198592, 'steps': 42700, 'loss/train': 1.7905468940734863} -08/30/2021 20:51:27 - INFO - __main__ - Step 42702: {'lr': 0.00041235797676590776, 'samples': 8198784, 'steps': 42701, 'loss/train': 1.6065155267715454} -08/30/2021 20:51:28 - INFO - __main__ - Step 42703: {'lr': 0.0004123539413761136, 'samples': 8198976, 'steps': 42702, 'loss/train': 1.134494423866272} -08/30/2021 20:51:29 - INFO - __main__ - Step 42704: {'lr': 0.0004123499059131652, 'samples': 8199168, 'steps': 42703, 'loss/train': 0.7257978320121765} -08/30/2021 20:51:30 - INFO - __main__ - Step 42705: {'lr': 0.00041234587037706447, 'samples': 8199360, 'steps': 42704, 'loss/train': 0.3595121502876282} -08/30/2021 20:51:30 - INFO - __main__ - Step 42706: {'lr': 0.0004123418347678132, 'samples': 8199552, 'steps': 42705, 'loss/train': 0.3763863742351532} -08/30/2021 20:51:31 - INFO - __main__ - Step 42707: {'lr': 0.00041233779908541316, 'samples': 8199744, 'steps': 42706, 'loss/train': 1.2722951173782349} -08/30/2021 20:51:31 - INFO - __main__ - Step 42708: {'lr': 0.0004123337633298662, 'samples': 8199936, 'steps': 42707, 'loss/train': 1.1446754932403564} -08/30/2021 20:51:33 - INFO - __main__ - Step 42709: {'lr': 0.0004123297275011743, 'samples': 8200128, 'steps': 42708, 'loss/train': 1.24917733669281} -08/30/2021 20:51:33 - INFO - __main__ - Step 42710: {'lr': 0.00041232569159933895, 'samples': 8200320, 'steps': 42709, 'loss/train': 0.7024908065795898} -08/30/2021 20:51:34 - INFO - __main__ - Step 42711: {'lr': 0.00041232165562436225, 'samples': 8200512, 'steps': 42710, 'loss/train': 0.7034547924995422} -08/30/2021 20:51:34 - INFO - __main__ - Step 42712: {'lr': 0.00041231761957624593, 'samples': 8200704, 'steps': 42711, 'loss/train': 1.034439206123352} -08/30/2021 20:51:34 - INFO - __main__ - Step 42713: {'lr': 0.0004123135834549917, 'samples': 8200896, 'steps': 42712, 'loss/train': 0.9282547831535339} -08/30/2021 20:51:35 - INFO - __main__ - Step 42714: {'lr': 0.00041230954726060155, 'samples': 8201088, 'steps': 42713, 'loss/train': 1.7811814546585083} -08/30/2021 20:51:36 - INFO - __main__ - Step 42715: {'lr': 0.00041230551099307724, 'samples': 8201280, 'steps': 42714, 'loss/train': 0.07779279351234436} -08/30/2021 20:51:37 - INFO - __main__ - Step 42716: {'lr': 0.0004123014746524205, 'samples': 8201472, 'steps': 42715, 'loss/train': 0.580621063709259} -08/30/2021 20:51:37 - INFO - __main__ - Step 42717: {'lr': 0.0004122974382386333, 'samples': 8201664, 'steps': 42716, 'loss/train': 0.7306473255157471} -08/30/2021 20:51:38 - INFO - __main__ - Step 42718: {'lr': 0.00041229340175171733, 'samples': 8201856, 'steps': 42717, 'loss/train': 1.378116488456726} -08/30/2021 20:51:38 - INFO - __main__ - Step 42719: {'lr': 0.00041228936519167446, 'samples': 8202048, 'steps': 42718, 'loss/train': 1.2331045866012573} -08/30/2021 20:51:39 - INFO - __main__ - Step 42720: {'lr': 0.00041228532855850655, 'samples': 8202240, 'steps': 42719, 'loss/train': 1.4135370254516602} -08/30/2021 20:51:40 - INFO - __main__ - Step 42721: {'lr': 0.0004122812918522153, 'samples': 8202432, 'steps': 42720, 'loss/train': 1.4351112842559814} -08/30/2021 20:51:40 - INFO - __main__ - Step 42722: {'lr': 0.0004122772550728027, 'samples': 8202624, 'steps': 42721, 'loss/train': 0.8106284737586975} -08/30/2021 20:51:40 - INFO - __main__ - Step 42723: {'lr': 0.0004122732182202703, 'samples': 8202816, 'steps': 42722, 'loss/train': 1.8287279605865479} -08/30/2021 20:51:41 - INFO - __main__ - Step 42724: {'lr': 0.0004122691812946202, 'samples': 8203008, 'steps': 42723, 'loss/train': 0.2856653332710266} -08/30/2021 20:51:42 - INFO - __main__ - Step 42725: {'lr': 0.00041226514429585417, 'samples': 8203200, 'steps': 42724, 'loss/train': 1.4880412817001343} -08/30/2021 20:51:43 - INFO - __main__ - Step 42726: {'lr': 0.0004122611072239739, 'samples': 8203392, 'steps': 42725, 'loss/train': 0.20633737742900848} -08/30/2021 20:51:43 - INFO - __main__ - Step 42727: {'lr': 0.00041225707007898127, 'samples': 8203584, 'steps': 42726, 'loss/train': 0.8177879452705383} -08/30/2021 20:51:43 - INFO - __main__ - Step 42728: {'lr': 0.0004122530328608781, 'samples': 8203776, 'steps': 42727, 'loss/train': 1.210819959640503} -08/30/2021 20:51:44 - INFO - __main__ - Step 42729: {'lr': 0.00041224899556966635, 'samples': 8203968, 'steps': 42728, 'loss/train': 1.593616008758545} -08/30/2021 20:51:45 - INFO - __main__ - Step 42730: {'lr': 0.00041224495820534757, 'samples': 8204160, 'steps': 42729, 'loss/train': 1.6073495149612427} -08/30/2021 20:51:46 - INFO - __main__ - Step 42731: {'lr': 0.00041224092076792374, 'samples': 8204352, 'steps': 42730, 'loss/train': 1.475361943244934} -08/30/2021 20:51:46 - INFO - __main__ - Step 42732: {'lr': 0.0004122368832573967, 'samples': 8204544, 'steps': 42731, 'loss/train': 1.1168408393859863} -08/30/2021 20:51:46 - INFO - __main__ - Step 42733: {'lr': 0.00041223284567376816, 'samples': 8204736, 'steps': 42732, 'loss/train': 1.1464427709579468} -08/30/2021 20:51:47 - INFO - __main__ - Step 42734: {'lr': 0.00041222880801704005, 'samples': 8204928, 'steps': 42733, 'loss/train': 1.3804570436477661} -08/30/2021 20:51:48 - INFO - __main__ - Step 42735: {'lr': 0.0004122247702872141, 'samples': 8205120, 'steps': 42734, 'loss/train': 1.5680476427078247} -08/30/2021 20:51:49 - INFO - __main__ - Step 42736: {'lr': 0.0004122207324842923, 'samples': 8205312, 'steps': 42735, 'loss/train': 1.2770121097564697} -08/30/2021 20:51:49 - INFO - __main__ - Step 42737: {'lr': 0.00041221669460827614, 'samples': 8205504, 'steps': 42736, 'loss/train': 1.2181936502456665} -08/30/2021 20:51:50 - INFO - __main__ - Step 42738: {'lr': 0.00041221265665916776, 'samples': 8205696, 'steps': 42737, 'loss/train': 1.5945320129394531} -08/30/2021 20:51:50 - INFO - __main__ - Step 42739: {'lr': 0.00041220861863696886, 'samples': 8205888, 'steps': 42738, 'loss/train': 2.015470266342163} -08/30/2021 20:51:51 - INFO - __main__ - Step 42740: {'lr': 0.0004122045805416812, 'samples': 8206080, 'steps': 42739, 'loss/train': 0.0998903140425682} -08/30/2021 20:51:52 - INFO - __main__ - Step 42741: {'lr': 0.00041220054237330674, 'samples': 8206272, 'steps': 42740, 'loss/train': 1.2674150466918945} -08/30/2021 20:51:52 - INFO - __main__ - Step 42742: {'lr': 0.00041219650413184714, 'samples': 8206464, 'steps': 42741, 'loss/train': 1.152045726776123} -08/30/2021 20:51:52 - INFO - __main__ - Step 42743: {'lr': 0.00041219246581730435, 'samples': 8206656, 'steps': 42742, 'loss/train': 1.2147914171218872} -08/30/2021 20:51:53 - INFO - __main__ - Step 42744: {'lr': 0.0004121884274296801, 'samples': 8206848, 'steps': 42743, 'loss/train': 1.6697134971618652} -08/30/2021 20:51:53 - INFO - __main__ - Step 42745: {'lr': 0.00041218438896897623, 'samples': 8207040, 'steps': 42744, 'loss/train': 1.5761781930923462} -08/30/2021 20:51:55 - INFO - __main__ - Step 42746: {'lr': 0.00041218035043519464, 'samples': 8207232, 'steps': 42745, 'loss/train': 0.6791060566902161} -08/30/2021 20:51:55 - INFO - __main__ - Step 42747: {'lr': 0.00041217631182833707, 'samples': 8207424, 'steps': 42746, 'loss/train': 1.3686248064041138} -08/30/2021 20:51:55 - INFO - __main__ - Step 42748: {'lr': 0.00041217227314840535, 'samples': 8207616, 'steps': 42747, 'loss/train': 1.5877742767333984} -08/30/2021 20:51:56 - INFO - __main__ - Step 42749: {'lr': 0.00041216823439540134, 'samples': 8207808, 'steps': 42748, 'loss/train': 1.3075661659240723} -08/30/2021 20:51:56 - INFO - __main__ - Step 42750: {'lr': 0.0004121641955693268, 'samples': 8208000, 'steps': 42749, 'loss/train': 1.519882082939148} -08/30/2021 20:51:58 - INFO - __main__ - Step 42751: {'lr': 0.00041216015667018357, 'samples': 8208192, 'steps': 42750, 'loss/train': 1.529238224029541} -08/30/2021 20:51:59 - INFO - __main__ - Step 42752: {'lr': 0.00041215611769797344, 'samples': 8208384, 'steps': 42751, 'loss/train': 1.2978233098983765} -08/30/2021 20:51:59 - INFO - __main__ - Step 42753: {'lr': 0.00041215207865269833, 'samples': 8208576, 'steps': 42752, 'loss/train': 1.2263840436935425} -08/30/2021 20:51:59 - INFO - __main__ - Step 42754: {'lr': 0.00041214803953435993, 'samples': 8208768, 'steps': 42753, 'loss/train': 1.5428600311279297} -08/30/2021 20:52:00 - INFO - __main__ - Step 42755: {'lr': 0.0004121440003429602, 'samples': 8208960, 'steps': 42754, 'loss/train': 1.6345829963684082} -08/30/2021 20:52:01 - INFO - __main__ - Step 42756: {'lr': 0.0004121399610785008, 'samples': 8209152, 'steps': 42755, 'loss/train': 0.3770456910133362} -08/30/2021 20:52:02 - INFO - __main__ - Step 42757: {'lr': 0.00041213592174098367, 'samples': 8209344, 'steps': 42756, 'loss/train': 1.4098496437072754} -08/30/2021 20:52:02 - INFO - __main__ - Step 42758: {'lr': 0.00041213188233041065, 'samples': 8209536, 'steps': 42757, 'loss/train': 1.814401388168335} -08/30/2021 20:52:02 - INFO - __main__ - Step 42759: {'lr': 0.00041212784284678345, 'samples': 8209728, 'steps': 42758, 'loss/train': 1.141072154045105} -08/30/2021 20:52:03 - INFO - __main__ - Step 42760: {'lr': 0.0004121238032901039, 'samples': 8209920, 'steps': 42759, 'loss/train': 1.5040597915649414} -08/30/2021 20:52:04 - INFO - __main__ - Step 42761: {'lr': 0.00041211976366037394, 'samples': 8210112, 'steps': 42760, 'loss/train': 1.5597246885299683} -08/30/2021 20:52:05 - INFO - __main__ - Step 42762: {'lr': 0.0004121157239575953, 'samples': 8210304, 'steps': 42761, 'loss/train': 1.2797777652740479} -08/30/2021 20:52:05 - INFO - __main__ - Step 42763: {'lr': 0.0004121116841817699, 'samples': 8210496, 'steps': 42762, 'loss/train': 2.1422858238220215} -08/30/2021 20:52:06 - INFO - __main__ - Step 42764: {'lr': 0.00041210764433289936, 'samples': 8210688, 'steps': 42763, 'loss/train': 1.0626745223999023} -08/30/2021 20:52:06 - INFO - __main__ - Step 42765: {'lr': 0.0004121036044109856, 'samples': 8210880, 'steps': 42764, 'loss/train': 0.0444820336997509} -08/30/2021 20:52:06 - INFO - __main__ - Step 42766: {'lr': 0.00041209956441603054, 'samples': 8211072, 'steps': 42765, 'loss/train': 0.05257513001561165} -08/30/2021 20:52:08 - INFO - __main__ - Step 42767: {'lr': 0.0004120955243480359, 'samples': 8211264, 'steps': 42766, 'loss/train': 1.326391577720642} -08/30/2021 20:52:08 - INFO - __main__ - Step 42768: {'lr': 0.0004120914842070035, 'samples': 8211456, 'steps': 42767, 'loss/train': 1.9479166269302368} -08/30/2021 20:52:09 - INFO - __main__ - Step 42769: {'lr': 0.0004120874439929352, 'samples': 8211648, 'steps': 42768, 'loss/train': 1.226039171218872} -08/30/2021 20:52:09 - INFO - __main__ - Step 42770: {'lr': 0.00041208340370583275, 'samples': 8211840, 'steps': 42769, 'loss/train': 1.243990182876587} -08/30/2021 20:52:10 - INFO - __main__ - Step 42771: {'lr': 0.0004120793633456981, 'samples': 8212032, 'steps': 42770, 'loss/train': 1.5370738506317139} -08/30/2021 20:52:11 - INFO - __main__ - Step 42772: {'lr': 0.0004120753229125329, 'samples': 8212224, 'steps': 42771, 'loss/train': 0.3223148584365845} -08/30/2021 20:52:11 - INFO - __main__ - Step 42773: {'lr': 0.00041207128240633906, 'samples': 8212416, 'steps': 42772, 'loss/train': 0.8358148336410522} -08/30/2021 20:52:12 - INFO - __main__ - Step 42774: {'lr': 0.0004120672418271184, 'samples': 8212608, 'steps': 42773, 'loss/train': 1.6780993938446045} -08/30/2021 20:52:12 - INFO - __main__ - Step 42775: {'lr': 0.0004120632011748728, 'samples': 8212800, 'steps': 42774, 'loss/train': 1.3218542337417603} -08/30/2021 20:52:12 - INFO - __main__ - Step 42776: {'lr': 0.00041205916044960406, 'samples': 8212992, 'steps': 42775, 'loss/train': 1.6444679498672485} -08/30/2021 20:52:14 - INFO - __main__ - Step 42777: {'lr': 0.0004120551196513139, 'samples': 8213184, 'steps': 42776, 'loss/train': 1.0199215412139893} -08/30/2021 20:52:15 - INFO - __main__ - Step 42778: {'lr': 0.0004120510787800042, 'samples': 8213376, 'steps': 42777, 'loss/train': 1.2396245002746582} -08/30/2021 20:52:15 - INFO - __main__ - Step 42779: {'lr': 0.0004120470378356768, 'samples': 8213568, 'steps': 42778, 'loss/train': 1.6554065942764282} -08/30/2021 20:52:16 - INFO - __main__ - Step 42780: {'lr': 0.00041204299681833344, 'samples': 8213760, 'steps': 42779, 'loss/train': 1.4116393327713013} -08/30/2021 20:52:16 - INFO - __main__ - Step 42781: {'lr': 0.00041203895572797613, 'samples': 8213952, 'steps': 42780, 'loss/train': 0.26155638694763184} -08/30/2021 20:52:16 - INFO - __main__ - Step 42782: {'lr': 0.00041203491456460653, 'samples': 8214144, 'steps': 42781, 'loss/train': 1.3729006052017212} -08/30/2021 20:52:18 - INFO - __main__ - Step 42783: {'lr': 0.00041203087332822644, 'samples': 8214336, 'steps': 42782, 'loss/train': 1.929867148399353} -08/30/2021 20:52:18 - INFO - __main__ - Step 42784: {'lr': 0.0004120268320188378, 'samples': 8214528, 'steps': 42783, 'loss/train': 1.0946468114852905} -08/30/2021 20:52:18 - INFO - __main__ - Step 42785: {'lr': 0.00041202279063644234, 'samples': 8214720, 'steps': 42784, 'loss/train': 1.5491408109664917} -08/30/2021 20:52:19 - INFO - __main__ - Step 42786: {'lr': 0.00041201874918104185, 'samples': 8214912, 'steps': 42785, 'loss/train': 1.2300634384155273} -08/30/2021 20:52:19 - INFO - __main__ - Step 42787: {'lr': 0.0004120147076526383, 'samples': 8215104, 'steps': 42786, 'loss/train': 1.3511295318603516} -08/30/2021 20:52:21 - INFO - __main__ - Step 42788: {'lr': 0.0004120106660512334, 'samples': 8215296, 'steps': 42787, 'loss/train': 1.5419447422027588} -08/30/2021 20:52:21 - INFO - __main__ - Step 42789: {'lr': 0.000412006624376829, 'samples': 8215488, 'steps': 42788, 'loss/train': 1.2196044921875} -08/30/2021 20:52:21 - INFO - __main__ - Step 42790: {'lr': 0.0004120025826294269, 'samples': 8215680, 'steps': 42789, 'loss/train': 1.9221341609954834} -08/30/2021 20:52:22 - INFO - __main__ - Step 42791: {'lr': 0.00041199854080902897, 'samples': 8215872, 'steps': 42790, 'loss/train': 1.1416150331497192} -08/30/2021 20:52:22 - INFO - __main__ - Step 42792: {'lr': 0.00041199449891563694, 'samples': 8216064, 'steps': 42791, 'loss/train': 1.2159194946289062} -08/30/2021 20:52:24 - INFO - __main__ - Step 42793: {'lr': 0.00041199045694925273, 'samples': 8216256, 'steps': 42792, 'loss/train': 1.6979012489318848} -08/30/2021 20:52:24 - INFO - __main__ - Step 42794: {'lr': 0.0004119864149098781, 'samples': 8216448, 'steps': 42793, 'loss/train': 1.5664771795272827} -08/30/2021 20:52:24 - INFO - __main__ - Step 42795: {'lr': 0.0004119823727975149, 'samples': 8216640, 'steps': 42794, 'loss/train': 1.4682016372680664} -08/30/2021 20:52:25 - INFO - __main__ - Step 42796: {'lr': 0.00041197833061216494, 'samples': 8216832, 'steps': 42795, 'loss/train': 1.8733136653900146} -08/30/2021 20:52:25 - INFO - __main__ - Step 42797: {'lr': 0.00041197428835383, 'samples': 8217024, 'steps': 42796, 'loss/train': 1.9760923385620117} -08/30/2021 20:52:27 - INFO - __main__ - Step 42798: {'lr': 0.00041197024602251204, 'samples': 8217216, 'steps': 42797, 'loss/train': 0.9231312870979309} -08/30/2021 20:52:27 - INFO - __main__ - Step 42799: {'lr': 0.0004119662036182127, 'samples': 8217408, 'steps': 42798, 'loss/train': 1.344942569732666} -08/30/2021 20:52:28 - INFO - __main__ - Step 42800: {'lr': 0.00041196216114093397, 'samples': 8217600, 'steps': 42799, 'loss/train': 0.9927522540092468} -08/30/2021 20:52:28 - INFO - __main__ - Step 42801: {'lr': 0.00041195811859067756, 'samples': 8217792, 'steps': 42800, 'loss/train': 1.3030191659927368} -08/30/2021 20:52:28 - INFO - __main__ - Step 42802: {'lr': 0.0004119540759674453, 'samples': 8217984, 'steps': 42801, 'loss/train': 1.5118681192398071} -08/30/2021 20:52:30 - INFO - __main__ - Step 42803: {'lr': 0.000411950033271239, 'samples': 8218176, 'steps': 42802, 'loss/train': 0.9536420106887817} -08/30/2021 20:52:31 - INFO - __main__ - Step 42804: {'lr': 0.0004119459905020606, 'samples': 8218368, 'steps': 42803, 'loss/train': 1.7397682666778564} -08/30/2021 20:52:31 - INFO - __main__ - Step 42805: {'lr': 0.0004119419476599118, 'samples': 8218560, 'steps': 42804, 'loss/train': 1.6398180723190308} -08/30/2021 20:52:31 - INFO - __main__ - Step 42806: {'lr': 0.0004119379047447944, 'samples': 8218752, 'steps': 42805, 'loss/train': 0.8062236309051514} -08/30/2021 20:52:32 - INFO - __main__ - Step 42807: {'lr': 0.00041193386175671033, 'samples': 8218944, 'steps': 42806, 'loss/train': 0.8588298559188843} -08/30/2021 20:52:32 - INFO - __main__ - Step 42808: {'lr': 0.0004119298186956613, 'samples': 8219136, 'steps': 42807, 'loss/train': 2.1786930561065674} -08/30/2021 20:52:34 - INFO - __main__ - Step 42809: {'lr': 0.00041192577556164924, 'samples': 8219328, 'steps': 42808, 'loss/train': 0.7691994309425354} -08/30/2021 20:52:35 - INFO - __main__ - Step 42810: {'lr': 0.000411921732354676, 'samples': 8219520, 'steps': 42809, 'loss/train': 0.030235696583986282} -08/30/2021 20:52:35 - INFO - __main__ - Step 42811: {'lr': 0.00041191768907474326, 'samples': 8219712, 'steps': 42810, 'loss/train': 0.026263045147061348} -08/30/2021 20:52:35 - INFO - __main__ - Step 42812: {'lr': 0.00041191364572185286, 'samples': 8219904, 'steps': 42811, 'loss/train': 1.3629406690597534} -08/30/2021 20:52:36 - INFO - __main__ - Step 42813: {'lr': 0.0004119096022960067, 'samples': 8220096, 'steps': 42812, 'loss/train': 0.1095290333032608} -08/30/2021 20:52:36 - INFO - __main__ - Step 42814: {'lr': 0.0004119055587972066, 'samples': 8220288, 'steps': 42813, 'loss/train': 1.9197845458984375} -08/30/2021 20:52:37 - INFO - __main__ - Step 42815: {'lr': 0.0004119015152254543, 'samples': 8220480, 'steps': 42814, 'loss/train': 1.541056513786316} -08/30/2021 20:52:38 - INFO - __main__ - Step 42816: {'lr': 0.00041189747158075176, 'samples': 8220672, 'steps': 42815, 'loss/train': 1.2116667032241821} -08/30/2021 20:52:38 - INFO - __main__ - Step 42817: {'lr': 0.00041189342786310067, 'samples': 8220864, 'steps': 42816, 'loss/train': 0.5459004044532776} -08/30/2021 20:52:39 - INFO - __main__ - Step 42818: {'lr': 0.0004118893840725029, 'samples': 8221056, 'steps': 42817, 'loss/train': 1.2930238246917725} -08/30/2021 20:52:39 - INFO - __main__ - Step 42819: {'lr': 0.0004118853402089603, 'samples': 8221248, 'steps': 42818, 'loss/train': 1.6231409311294556} -08/30/2021 20:52:41 - INFO - __main__ - Step 42820: {'lr': 0.0004118812962724746, 'samples': 8221440, 'steps': 42819, 'loss/train': 1.44464111328125} -08/30/2021 20:52:42 - INFO - __main__ - Step 42821: {'lr': 0.00041187725226304775, 'samples': 8221632, 'steps': 42820, 'loss/train': 1.3955358266830444} -08/30/2021 20:52:42 - INFO - __main__ - Step 42822: {'lr': 0.0004118732081806814, 'samples': 8221824, 'steps': 42821, 'loss/train': 0.9620579481124878} -08/30/2021 20:52:43 - INFO - __main__ - Step 42823: {'lr': 0.0004118691640253777, 'samples': 8222016, 'steps': 42822, 'loss/train': 1.7535643577575684} -08/30/2021 20:52:43 - INFO - __main__ - Step 42824: {'lr': 0.00041186511979713806, 'samples': 8222208, 'steps': 42823, 'loss/train': 1.4558895826339722} -08/30/2021 20:52:43 - INFO - __main__ - Step 42825: {'lr': 0.00041186107549596453, 'samples': 8222400, 'steps': 42824, 'loss/train': 0.46301376819610596} -08/30/2021 20:52:45 - INFO - __main__ - Step 42826: {'lr': 0.0004118570311218589, 'samples': 8222592, 'steps': 42825, 'loss/train': 0.4012913405895233} -08/30/2021 20:52:46 - INFO - __main__ - Step 42827: {'lr': 0.00041185298667482294, 'samples': 8222784, 'steps': 42826, 'loss/train': 1.157563328742981} -08/30/2021 20:52:46 - INFO - __main__ - Step 42828: {'lr': 0.0004118489421548586, 'samples': 8222976, 'steps': 42827, 'loss/train': 1.3738535642623901} -08/30/2021 20:52:46 - INFO - __main__ - Step 42829: {'lr': 0.00041184489756196764, 'samples': 8223168, 'steps': 42828, 'loss/train': 1.152182698249817} -08/30/2021 20:52:47 - INFO - __main__ - Step 42830: {'lr': 0.0004118408528961519, 'samples': 8223360, 'steps': 42829, 'loss/train': 1.5130033493041992} -08/30/2021 20:52:47 - INFO - __main__ - Step 42831: {'lr': 0.00041183680815741307, 'samples': 8223552, 'steps': 42830, 'loss/train': 1.4232146739959717} -08/30/2021 20:52:49 - INFO - __main__ - Step 42832: {'lr': 0.0004118327633457531, 'samples': 8223744, 'steps': 42831, 'loss/train': 0.8346356749534607} -08/30/2021 20:52:49 - INFO - __main__ - Step 42833: {'lr': 0.00041182871846117373, 'samples': 8223936, 'steps': 42832, 'loss/train': 1.4951962232589722} -08/30/2021 20:52:49 - INFO - __main__ - Step 42834: {'lr': 0.0004118246735036769, 'samples': 8224128, 'steps': 42833, 'loss/train': 1.8352375030517578} -08/30/2021 20:52:50 - INFO - __main__ - Step 42835: {'lr': 0.0004118206284732644, 'samples': 8224320, 'steps': 42834, 'loss/train': 1.4015146493911743} -08/30/2021 20:52:50 - INFO - __main__ - Step 42836: {'lr': 0.000411816583369938, 'samples': 8224512, 'steps': 42835, 'loss/train': 1.4538276195526123} -08/30/2021 20:52:52 - INFO - __main__ - Step 42837: {'lr': 0.0004118125381936996, 'samples': 8224704, 'steps': 42836, 'loss/train': 1.6377867460250854} -08/30/2021 20:52:52 - INFO - __main__ - Step 42838: {'lr': 0.0004118084929445508, 'samples': 8224896, 'steps': 42837, 'loss/train': 1.1447142362594604} -08/30/2021 20:52:53 - INFO - __main__ - Step 42839: {'lr': 0.0004118044476224937, 'samples': 8225088, 'steps': 42838, 'loss/train': 1.6882789134979248} -08/30/2021 20:52:53 - INFO - __main__ - Step 42840: {'lr': 0.00041180040222753, 'samples': 8225280, 'steps': 42839, 'loss/train': 1.0161800384521484} -08/30/2021 20:52:53 - INFO - __main__ - Step 42841: {'lr': 0.00041179635675966155, 'samples': 8225472, 'steps': 42840, 'loss/train': 1.38160240650177} -08/30/2021 20:52:55 - INFO - __main__ - Step 42842: {'lr': 0.00041179231121889014, 'samples': 8225664, 'steps': 42841, 'loss/train': 1.4770721197128296} -08/30/2021 20:52:55 - INFO - __main__ - Step 42843: {'lr': 0.0004117882656052176, 'samples': 8225856, 'steps': 42842, 'loss/train': 1.7939602136611938} -08/30/2021 20:52:56 - INFO - __main__ - Step 42844: {'lr': 0.0004117842199186458, 'samples': 8226048, 'steps': 42843, 'loss/train': 1.4858546257019043} -08/30/2021 20:52:56 - INFO - __main__ - Step 42845: {'lr': 0.00041178017415917655, 'samples': 8226240, 'steps': 42844, 'loss/train': 1.8660188913345337} -08/30/2021 20:52:56 - INFO - __main__ - Step 42846: {'lr': 0.00041177612832681156, 'samples': 8226432, 'steps': 42845, 'loss/train': 1.0155410766601562} -08/30/2021 20:52:58 - INFO - __main__ - Step 42847: {'lr': 0.00041177208242155285, 'samples': 8226624, 'steps': 42846, 'loss/train': 1.1603670120239258} -08/30/2021 20:52:59 - INFO - __main__ - Step 42848: {'lr': 0.000411768036443402, 'samples': 8226816, 'steps': 42847, 'loss/train': 1.6450775861740112} -08/30/2021 20:52:59 - INFO - __main__ - Step 42849: {'lr': 0.0004117639903923611, 'samples': 8227008, 'steps': 42848, 'loss/train': 0.08885498344898224} -08/30/2021 20:52:59 - INFO - __main__ - Step 42850: {'lr': 0.00041175994426843177, 'samples': 8227200, 'steps': 42849, 'loss/train': 1.087542176246643} -08/30/2021 20:53:00 - INFO - __main__ - Step 42851: {'lr': 0.00041175589807161597, 'samples': 8227392, 'steps': 42850, 'loss/train': 0.3503994047641754} -08/30/2021 20:53:01 - INFO - __main__ - Step 42852: {'lr': 0.0004117518518019154, 'samples': 8227584, 'steps': 42851, 'loss/train': 1.0052155256271362} -08/30/2021 20:53:01 - INFO - __main__ - Step 42853: {'lr': 0.00041174780545933195, 'samples': 8227776, 'steps': 42852, 'loss/train': 1.4477592706680298} -08/30/2021 20:53:02 - INFO - __main__ - Step 42854: {'lr': 0.0004117437590438674, 'samples': 8227968, 'steps': 42853, 'loss/train': 1.4567382335662842} -08/30/2021 20:53:02 - INFO - __main__ - Step 42855: {'lr': 0.0004117397125555237, 'samples': 8228160, 'steps': 42854, 'loss/train': 0.15344618260860443} -08/30/2021 20:53:03 - INFO - __main__ - Step 42856: {'lr': 0.00041173566599430245, 'samples': 8228352, 'steps': 42855, 'loss/train': 1.1155697107315063} -08/30/2021 20:53:04 - INFO - __main__ - Step 42857: {'lr': 0.00041173161936020573, 'samples': 8228544, 'steps': 42856, 'loss/train': 1.1189734935760498} -08/30/2021 20:53:04 - INFO - __main__ - Step 42858: {'lr': 0.0004117275726532352, 'samples': 8228736, 'steps': 42857, 'loss/train': 1.1313668489456177} -08/30/2021 20:53:05 - INFO - __main__ - Step 42859: {'lr': 0.0004117235258733927, 'samples': 8228928, 'steps': 42858, 'loss/train': 1.4892619848251343} -08/30/2021 20:53:05 - INFO - __main__ - Step 42860: {'lr': 0.00041171947902068006, 'samples': 8229120, 'steps': 42859, 'loss/train': 1.7968533039093018} -08/30/2021 20:53:05 - INFO - __main__ - Step 42861: {'lr': 0.00041171543209509923, 'samples': 8229312, 'steps': 42860, 'loss/train': 1.0041232109069824} -08/30/2021 20:53:06 - INFO - __main__ - Step 42862: {'lr': 0.0004117113850966517, 'samples': 8229504, 'steps': 42861, 'loss/train': 0.9973611235618591} -08/30/2021 20:53:08 - INFO - __main__ - Step 42863: {'lr': 0.00041170733802533974, 'samples': 8229696, 'steps': 42862, 'loss/train': 0.8780614137649536} -08/30/2021 20:53:08 - INFO - __main__ - Step 42864: {'lr': 0.0004117032908811649, 'samples': 8229888, 'steps': 42863, 'loss/train': 1.8098726272583008} -08/30/2021 20:53:09 - INFO - __main__ - Step 42865: {'lr': 0.000411699243664129, 'samples': 8230080, 'steps': 42864, 'loss/train': 1.443603754043579} -08/30/2021 20:53:09 - INFO - __main__ - Step 42866: {'lr': 0.00041169519637423394, 'samples': 8230272, 'steps': 42865, 'loss/train': 1.1232253313064575} -08/30/2021 20:53:09 - INFO - __main__ - Step 42867: {'lr': 0.0004116911490114815, 'samples': 8230464, 'steps': 42866, 'loss/train': 1.7242082357406616} -08/30/2021 20:53:11 - INFO - __main__ - Step 42868: {'lr': 0.0004116871015758735, 'samples': 8230656, 'steps': 42867, 'loss/train': 1.5670757293701172} -08/30/2021 20:53:11 - INFO - __main__ - Step 42869: {'lr': 0.0004116830540674118, 'samples': 8230848, 'steps': 42868, 'loss/train': 1.870622158050537} -08/30/2021 20:53:12 - INFO - __main__ - Step 42870: {'lr': 0.00041167900648609825, 'samples': 8231040, 'steps': 42869, 'loss/train': 1.8268203735351562} -08/30/2021 20:53:12 - INFO - __main__ - Step 42871: {'lr': 0.00041167495883193464, 'samples': 8231232, 'steps': 42870, 'loss/train': 1.4920810461044312} -08/30/2021 20:53:12 - INFO - __main__ - Step 42872: {'lr': 0.00041167091110492273, 'samples': 8231424, 'steps': 42871, 'loss/train': 1.83479642868042} -08/30/2021 20:53:14 - INFO - __main__ - Step 42873: {'lr': 0.0004116668633050644, 'samples': 8231616, 'steps': 42872, 'loss/train': 1.071567416191101} -08/30/2021 20:53:15 - INFO - __main__ - Step 42874: {'lr': 0.0004116628154323616, 'samples': 8231808, 'steps': 42873, 'loss/train': 0.1352720558643341} -08/30/2021 20:53:15 - INFO - __main__ - Step 42875: {'lr': 0.0004116587674868159, 'samples': 8232000, 'steps': 42874, 'loss/train': 1.1919699907302856} -08/30/2021 20:53:16 - INFO - __main__ - Step 42876: {'lr': 0.00041165471946842924, 'samples': 8232192, 'steps': 42875, 'loss/train': 1.3944077491760254} -08/30/2021 20:53:16 - INFO - __main__ - Step 42877: {'lr': 0.00041165067137720356, 'samples': 8232384, 'steps': 42876, 'loss/train': 1.2207744121551514} -08/30/2021 20:53:18 - INFO - __main__ - Step 42878: {'lr': 0.00041164662321314054, 'samples': 8232576, 'steps': 42877, 'loss/train': 1.6044350862503052} -08/30/2021 20:53:18 - INFO - __main__ - Step 42879: {'lr': 0.000411642574976242, 'samples': 8232768, 'steps': 42878, 'loss/train': 0.9108901619911194} -08/30/2021 20:53:18 - INFO - __main__ - Step 42880: {'lr': 0.0004116385266665099, 'samples': 8232960, 'steps': 42879, 'loss/train': 1.097786784172058} -08/30/2021 20:53:19 - INFO - __main__ - Step 42881: {'lr': 0.0004116344782839459, 'samples': 8233152, 'steps': 42880, 'loss/train': 1.279736042022705} -08/30/2021 20:53:19 - INFO - __main__ - Step 42882: {'lr': 0.00041163042982855194, 'samples': 8233344, 'steps': 42881, 'loss/train': 0.9716207981109619} -08/30/2021 20:53:21 - INFO - __main__ - Step 42883: {'lr': 0.00041162638130032975, 'samples': 8233536, 'steps': 42882, 'loss/train': 0.08397163450717926} -08/30/2021 20:53:21 - INFO - __main__ - Step 42884: {'lr': 0.00041162233269928126, 'samples': 8233728, 'steps': 42883, 'loss/train': 1.1683320999145508} -08/30/2021 20:53:21 - INFO - __main__ - Step 42885: {'lr': 0.0004116182840254082, 'samples': 8233920, 'steps': 42884, 'loss/train': 1.6379175186157227} -08/30/2021 20:53:22 - INFO - __main__ - Step 42886: {'lr': 0.0004116142352787125, 'samples': 8234112, 'steps': 42885, 'loss/train': 1.2654114961624146} -08/30/2021 20:53:22 - INFO - __main__ - Step 42887: {'lr': 0.00041161018645919593, 'samples': 8234304, 'steps': 42886, 'loss/train': 1.6422559022903442} -08/30/2021 20:53:24 - INFO - __main__ - Step 42888: {'lr': 0.00041160613756686015, 'samples': 8234496, 'steps': 42887, 'loss/train': 1.6191211938858032} -08/30/2021 20:53:24 - INFO - __main__ - Step 42889: {'lr': 0.00041160208860170725, 'samples': 8234688, 'steps': 42888, 'loss/train': 1.5554444789886475} -08/30/2021 20:53:25 - INFO - __main__ - Step 42890: {'lr': 0.000411598039563739, 'samples': 8234880, 'steps': 42889, 'loss/train': 1.5288052558898926} -08/30/2021 20:53:25 - INFO - __main__ - Step 42891: {'lr': 0.0004115939904529571, 'samples': 8235072, 'steps': 42890, 'loss/train': 1.9154614210128784} -08/30/2021 20:53:25 - INFO - __main__ - Step 42892: {'lr': 0.00041158994126936347, 'samples': 8235264, 'steps': 42891, 'loss/train': 5.809218883514404} -08/30/2021 20:53:26 - INFO - __main__ - Step 42893: {'lr': 0.0004115858920129598, 'samples': 8235456, 'steps': 42892, 'loss/train': 0.41727232933044434} -08/30/2021 20:53:27 - INFO - __main__ - Step 42894: {'lr': 0.0004115818426837481, 'samples': 8235648, 'steps': 42893, 'loss/train': 1.4420056343078613} -08/30/2021 20:53:27 - INFO - __main__ - Step 42895: {'lr': 0.0004115777932817301, 'samples': 8235840, 'steps': 42894, 'loss/train': 1.2058171033859253} -08/30/2021 20:53:28 - INFO - __main__ - Step 42896: {'lr': 0.00041157374380690765, 'samples': 8236032, 'steps': 42895, 'loss/train': 1.7355314493179321} -08/30/2021 20:53:28 - INFO - __main__ - Step 42897: {'lr': 0.0004115696942592826, 'samples': 8236224, 'steps': 42896, 'loss/train': 1.4481213092803955} -08/30/2021 20:53:29 - INFO - __main__ - Step 42898: {'lr': 0.0004115656446388567, 'samples': 8236416, 'steps': 42897, 'loss/train': 1.7035605907440186} -08/30/2021 20:53:30 - INFO - __main__ - Step 42899: {'lr': 0.00041156159494563183, 'samples': 8236608, 'steps': 42898, 'loss/train': 1.4951162338256836} -08/30/2021 20:53:31 - INFO - __main__ - Step 42900: {'lr': 0.00041155754517960974, 'samples': 8236800, 'steps': 42899, 'loss/train': 1.2954660654067993} -08/30/2021 20:53:31 - INFO - __main__ - Step 42901: {'lr': 0.00041155349534079236, 'samples': 8236992, 'steps': 42900, 'loss/train': 1.0552476644515991} -08/30/2021 20:53:31 - INFO - __main__ - Step 42902: {'lr': 0.0004115494454291815, 'samples': 8237184, 'steps': 42901, 'loss/train': 0.16165167093276978} -08/30/2021 20:53:32 - INFO - __main__ - Step 42903: {'lr': 0.0004115453954447789, 'samples': 8237376, 'steps': 42902, 'loss/train': 1.3315397500991821} -08/30/2021 20:53:33 - INFO - __main__ - Step 42904: {'lr': 0.0004115413453875865, 'samples': 8237568, 'steps': 42903, 'loss/train': 1.1729339361190796} -08/30/2021 20:53:34 - INFO - __main__ - Step 42905: {'lr': 0.000411537295257606, 'samples': 8237760, 'steps': 42904, 'loss/train': 1.0337938070297241} -08/30/2021 20:53:34 - INFO - __main__ - Step 42906: {'lr': 0.00041153324505483933, 'samples': 8237952, 'steps': 42905, 'loss/train': 0.1835448443889618} -08/30/2021 20:53:35 - INFO - __main__ - Step 42907: {'lr': 0.0004115291947792882, 'samples': 8238144, 'steps': 42906, 'loss/train': 1.2645149230957031} -08/30/2021 20:53:35 - INFO - __main__ - Step 42908: {'lr': 0.00041152514443095454, 'samples': 8238336, 'steps': 42907, 'loss/train': 1.3040850162506104} -08/30/2021 20:53:36 - INFO - __main__ - Step 42909: {'lr': 0.00041152109400984015, 'samples': 8238528, 'steps': 42908, 'loss/train': 1.9677035808563232} -08/30/2021 20:53:37 - INFO - __main__ - Step 42910: {'lr': 0.0004115170435159469, 'samples': 8238720, 'steps': 42909, 'loss/train': 1.6824175119400024} -08/30/2021 20:53:37 - INFO - __main__ - Step 42911: {'lr': 0.00041151299294927657, 'samples': 8238912, 'steps': 42910, 'loss/train': 1.0541698932647705} -08/30/2021 20:53:38 - INFO - __main__ - Step 42912: {'lr': 0.0004115089423098309, 'samples': 8239104, 'steps': 42911, 'loss/train': 1.4474738836288452} -08/30/2021 20:53:38 - INFO - __main__ - Step 42913: {'lr': 0.00041150489159761186, 'samples': 8239296, 'steps': 42912, 'loss/train': 1.3622851371765137} -08/30/2021 20:53:40 - INFO - __main__ - Step 42914: {'lr': 0.00041150084081262105, 'samples': 8239488, 'steps': 42913, 'loss/train': 1.0948444604873657} -08/30/2021 20:53:40 - INFO - __main__ - Step 42915: {'lr': 0.0004114967899548606, 'samples': 8239680, 'steps': 42914, 'loss/train': 0.9798698425292969} -08/30/2021 20:53:40 - INFO - __main__ - Step 42916: {'lr': 0.0004114927390243322, 'samples': 8239872, 'steps': 42915, 'loss/train': 0.13289666175842285} -08/30/2021 20:53:41 - INFO - __main__ - Step 42917: {'lr': 0.00041148868802103766, 'samples': 8240064, 'steps': 42916, 'loss/train': 1.7086477279663086} -08/30/2021 20:53:41 - INFO - __main__ - Step 42918: {'lr': 0.00041148463694497874, 'samples': 8240256, 'steps': 42917, 'loss/train': 0.8621677160263062} -08/30/2021 20:53:43 - INFO - __main__ - Step 42919: {'lr': 0.00041148058579615733, 'samples': 8240448, 'steps': 42918, 'loss/train': 0.07445593178272247} -08/30/2021 20:53:44 - INFO - __main__ - Step 42920: {'lr': 0.00041147653457457534, 'samples': 8240640, 'steps': 42919, 'loss/train': 1.5192316770553589} -08/30/2021 20:53:44 - INFO - __main__ - Step 42921: {'lr': 0.0004114724832802345, 'samples': 8240832, 'steps': 42920, 'loss/train': 1.2820676565170288} -08/30/2021 20:53:44 - INFO - __main__ - Step 42922: {'lr': 0.0004114684319131366, 'samples': 8241024, 'steps': 42921, 'loss/train': 1.4727269411087036} -08/30/2021 20:53:45 - INFO - __main__ - Step 42923: {'lr': 0.00041146438047328347, 'samples': 8241216, 'steps': 42922, 'loss/train': 2.0088417530059814} -08/30/2021 20:53:46 - INFO - __main__ - Step 42924: {'lr': 0.0004114603289606771, 'samples': 8241408, 'steps': 42923, 'loss/train': 1.1138535737991333} -08/30/2021 20:53:47 - INFO - __main__ - Step 42925: {'lr': 0.00041145627737531915, 'samples': 8241600, 'steps': 42924, 'loss/train': 0.8508906960487366} -08/30/2021 20:53:47 - INFO - __main__ - Step 42926: {'lr': 0.0004114522257172115, 'samples': 8241792, 'steps': 42925, 'loss/train': 1.475974202156067} -08/30/2021 20:53:47 - INFO - __main__ - Step 42927: {'lr': 0.000411448173986356, 'samples': 8241984, 'steps': 42926, 'loss/train': 1.4380686283111572} -08/30/2021 20:53:48 - INFO - __main__ - Step 42928: {'lr': 0.0004114441221827544, 'samples': 8242176, 'steps': 42927, 'loss/train': 1.2631417512893677} -08/30/2021 20:53:48 - INFO - __main__ - Step 42929: {'lr': 0.0004114400703064085, 'samples': 8242368, 'steps': 42928, 'loss/train': 1.3651388883590698} -08/30/2021 20:53:49 - INFO - __main__ - Step 42930: {'lr': 0.0004114360183573203, 'samples': 8242560, 'steps': 42929, 'loss/train': 1.5953912734985352} -08/30/2021 20:53:50 - INFO - __main__ - Step 42931: {'lr': 0.0004114319663354915, 'samples': 8242752, 'steps': 42930, 'loss/train': 0.5755936503410339} -08/30/2021 20:53:50 - INFO - __main__ - Step 42932: {'lr': 0.000411427914240924, 'samples': 8242944, 'steps': 42931, 'loss/train': 1.3591316938400269} -08/30/2021 20:53:51 - INFO - __main__ - Step 42933: {'lr': 0.0004114238620736195, 'samples': 8243136, 'steps': 42932, 'loss/train': 1.2380326986312866} -08/30/2021 20:53:51 - INFO - __main__ - Step 42934: {'lr': 0.00041141980983357986, 'samples': 8243328, 'steps': 42933, 'loss/train': 1.1282389163970947} -08/30/2021 20:53:53 - INFO - __main__ - Step 42935: {'lr': 0.000411415757520807, 'samples': 8243520, 'steps': 42934, 'loss/train': 1.7134774923324585} -08/30/2021 20:53:53 - INFO - __main__ - Step 42936: {'lr': 0.00041141170513530267, 'samples': 8243712, 'steps': 42935, 'loss/train': 1.3076099157333374} -08/30/2021 20:53:53 - INFO - __main__ - Step 42937: {'lr': 0.0004114076526770688, 'samples': 8243904, 'steps': 42936, 'loss/train': 1.791196346282959} -08/30/2021 20:53:54 - INFO - __main__ - Step 42938: {'lr': 0.000411403600146107, 'samples': 8244096, 'steps': 42937, 'loss/train': 1.2904411554336548} -08/30/2021 20:53:54 - INFO - __main__ - Step 42939: {'lr': 0.0004113995475424193, 'samples': 8244288, 'steps': 42938, 'loss/train': 1.544174075126648} -08/30/2021 20:53:55 - INFO - __main__ - Step 42940: {'lr': 0.0004113954948660075, 'samples': 8244480, 'steps': 42939, 'loss/train': 1.528918981552124} -08/30/2021 20:53:56 - INFO - __main__ - Step 42941: {'lr': 0.00041139144211687327, 'samples': 8244672, 'steps': 42940, 'loss/train': 1.118261456489563} -08/30/2021 20:53:56 - INFO - __main__ - Step 42942: {'lr': 0.0004113873892950186, 'samples': 8244864, 'steps': 42941, 'loss/train': 1.538267970085144} -08/30/2021 20:53:57 - INFO - __main__ - Step 42943: {'lr': 0.00041138333640044523, 'samples': 8245056, 'steps': 42942, 'loss/train': 1.3038625717163086} -08/30/2021 20:53:57 - INFO - __main__ - Step 42944: {'lr': 0.0004113792834331551, 'samples': 8245248, 'steps': 42943, 'loss/train': 0.9847640991210938} -08/30/2021 20:53:58 - INFO - __main__ - Step 42945: {'lr': 0.00041137523039314994, 'samples': 8245440, 'steps': 42944, 'loss/train': 1.8071902990341187} -08/30/2021 20:53:59 - INFO - __main__ - Step 42946: {'lr': 0.0004113711772804315, 'samples': 8245632, 'steps': 42945, 'loss/train': 1.2316664457321167} -08/30/2021 20:53:59 - INFO - __main__ - Step 42947: {'lr': 0.0004113671240950018, 'samples': 8245824, 'steps': 42946, 'loss/train': 0.8486292958259583} -08/30/2021 20:54:00 - INFO - __main__ - Step 42948: {'lr': 0.0004113630708368625, 'samples': 8246016, 'steps': 42947, 'loss/train': 1.2827318906784058} -08/30/2021 20:54:00 - INFO - __main__ - Step 42949: {'lr': 0.0004113590175060155, 'samples': 8246208, 'steps': 42948, 'loss/train': 1.527235746383667} -08/30/2021 20:54:02 - INFO - __main__ - Step 42950: {'lr': 0.00041135496410246264, 'samples': 8246400, 'steps': 42949, 'loss/train': 1.4695416688919067} -08/30/2021 20:54:02 - INFO - __main__ - Step 42951: {'lr': 0.0004113509106262058, 'samples': 8246592, 'steps': 42950, 'loss/train': 1.556428074836731} -08/30/2021 20:54:02 - INFO - __main__ - Step 42952: {'lr': 0.00041134685707724656, 'samples': 8246784, 'steps': 42951, 'loss/train': 1.46836256980896} -08/30/2021 20:54:03 - INFO - __main__ - Step 42953: {'lr': 0.000411342803455587, 'samples': 8246976, 'steps': 42952, 'loss/train': 0.7759209871292114} -08/30/2021 20:54:03 - INFO - __main__ - Step 42954: {'lr': 0.0004113387497612289, 'samples': 8247168, 'steps': 42953, 'loss/train': 1.290662407875061} -08/30/2021 20:54:05 - INFO - __main__ - Step 42955: {'lr': 0.00041133469599417393, 'samples': 8247360, 'steps': 42954, 'loss/train': 1.3949353694915771} -08/30/2021 20:54:05 - INFO - __main__ - Step 42956: {'lr': 0.00041133064215442415, 'samples': 8247552, 'steps': 42955, 'loss/train': 1.7359212636947632} -08/30/2021 20:54:06 - INFO - __main__ - Step 42957: {'lr': 0.0004113265882419812, 'samples': 8247744, 'steps': 42956, 'loss/train': 0.11023519188165665} -08/30/2021 20:54:06 - INFO - __main__ - Step 42958: {'lr': 0.0004113225342568471, 'samples': 8247936, 'steps': 42957, 'loss/train': 1.3494611978530884} -08/30/2021 20:54:06 - INFO - __main__ - Step 42959: {'lr': 0.00041131848019902343, 'samples': 8248128, 'steps': 42958, 'loss/train': 0.9846700429916382} -08/30/2021 20:54:08 - INFO - __main__ - Step 42960: {'lr': 0.0004113144260685122, 'samples': 8248320, 'steps': 42959, 'loss/train': 0.4094661474227905} -08/30/2021 20:54:08 - INFO - __main__ - Step 42961: {'lr': 0.00041131037186531514, 'samples': 8248512, 'steps': 42960, 'loss/train': 1.7571051120758057} -08/30/2021 20:54:09 - INFO - __main__ - Step 42962: {'lr': 0.00041130631758943414, 'samples': 8248704, 'steps': 42961, 'loss/train': 1.472283959388733} -08/30/2021 20:54:09 - INFO - __main__ - Step 42963: {'lr': 0.00041130226324087094, 'samples': 8248896, 'steps': 42962, 'loss/train': 0.9628196954727173} -08/30/2021 20:54:09 - INFO - __main__ - Step 42964: {'lr': 0.00041129820881962754, 'samples': 8249088, 'steps': 42963, 'loss/train': 1.908008337020874} -08/30/2021 20:54:10 - INFO - __main__ - Step 42965: {'lr': 0.0004112941543257056, 'samples': 8249280, 'steps': 42964, 'loss/train': 1.7026253938674927} -08/30/2021 20:54:12 - INFO - __main__ - Step 42966: {'lr': 0.00041129009975910704, 'samples': 8249472, 'steps': 42965, 'loss/train': 1.1823099851608276} -08/30/2021 20:54:12 - INFO - __main__ - Step 42967: {'lr': 0.00041128604511983356, 'samples': 8249664, 'steps': 42966, 'loss/train': 0.098127081990242} -08/30/2021 20:54:13 - INFO - __main__ - Step 42968: {'lr': 0.00041128199040788715, 'samples': 8249856, 'steps': 42967, 'loss/train': 1.0449495315551758} -08/30/2021 20:54:13 - INFO - __main__ - Step 42969: {'lr': 0.00041127793562326955, 'samples': 8250048, 'steps': 42968, 'loss/train': 1.4471373558044434} -08/30/2021 20:54:13 - INFO - __main__ - Step 42970: {'lr': 0.0004112738807659826, 'samples': 8250240, 'steps': 42969, 'loss/train': 1.9988512992858887} -08/30/2021 20:54:15 - INFO - __main__ - Step 42971: {'lr': 0.00041126982583602817, 'samples': 8250432, 'steps': 42970, 'loss/train': 1.7404166460037231} -08/30/2021 20:54:16 - INFO - __main__ - Step 42972: {'lr': 0.00041126577083340797, 'samples': 8250624, 'steps': 42971, 'loss/train': 1.699367642402649} -08/30/2021 20:54:16 - INFO - __main__ - Step 42973: {'lr': 0.000411261715758124, 'samples': 8250816, 'steps': 42972, 'loss/train': 1.3783475160598755} -08/30/2021 20:54:17 - INFO - __main__ - Step 42974: {'lr': 0.0004112576606101779, 'samples': 8251008, 'steps': 42973, 'loss/train': 0.2923354208469391} -08/30/2021 20:54:17 - INFO - __main__ - Step 42975: {'lr': 0.0004112536053895716, 'samples': 8251200, 'steps': 42974, 'loss/train': 1.114609956741333} -08/30/2021 20:54:19 - INFO - __main__ - Step 42976: {'lr': 0.0004112495500963069, 'samples': 8251392, 'steps': 42975, 'loss/train': 1.5944143533706665} -08/30/2021 20:54:19 - INFO - __main__ - Step 42977: {'lr': 0.00041124549473038564, 'samples': 8251584, 'steps': 42976, 'loss/train': 1.1461849212646484} -08/30/2021 20:54:20 - INFO - __main__ - Step 42978: {'lr': 0.0004112414392918097, 'samples': 8251776, 'steps': 42977, 'loss/train': 1.4242169857025146} -08/30/2021 20:54:20 - INFO - __main__ - Step 42979: {'lr': 0.00041123738378058083, 'samples': 8251968, 'steps': 42978, 'loss/train': 1.6473948955535889} -08/30/2021 20:54:20 - INFO - __main__ - Step 42980: {'lr': 0.0004112333281967009, 'samples': 8252160, 'steps': 42979, 'loss/train': 1.504165530204773} -08/30/2021 20:54:22 - INFO - __main__ - Step 42981: {'lr': 0.00041122927254017173, 'samples': 8252352, 'steps': 42980, 'loss/train': 0.08477223664522171} -08/30/2021 20:54:23 - INFO - __main__ - Step 42982: {'lr': 0.0004112252168109951, 'samples': 8252544, 'steps': 42981, 'loss/train': 1.4745913743972778} -08/30/2021 20:54:23 - INFO - __main__ - Step 42983: {'lr': 0.0004112211610091728, 'samples': 8252736, 'steps': 42982, 'loss/train': 0.8877905607223511} -08/30/2021 20:54:23 - INFO - __main__ - Step 42984: {'lr': 0.0004112171051347069, 'samples': 8252928, 'steps': 42983, 'loss/train': 1.5028365850448608} -08/30/2021 20:54:24 - INFO - __main__ - Step 42985: {'lr': 0.00041121304918759893, 'samples': 8253120, 'steps': 42984, 'loss/train': 1.6529144048690796} -08/30/2021 20:54:24 - INFO - __main__ - Step 42986: {'lr': 0.00041120899316785095, 'samples': 8253312, 'steps': 42985, 'loss/train': 1.1791515350341797} -08/30/2021 20:54:25 - INFO - __main__ - Step 42987: {'lr': 0.00041120493707546456, 'samples': 8253504, 'steps': 42986, 'loss/train': 1.733790636062622} -08/30/2021 20:54:26 - INFO - __main__ - Step 42988: {'lr': 0.00041120088091044183, 'samples': 8253696, 'steps': 42987, 'loss/train': 1.5295441150665283} -08/30/2021 20:54:26 - INFO - __main__ - Step 42989: {'lr': 0.0004111968246727844, 'samples': 8253888, 'steps': 42988, 'loss/train': 1.394679069519043} -08/30/2021 20:54:27 - INFO - __main__ - Step 42990: {'lr': 0.0004111927683624942, 'samples': 8254080, 'steps': 42989, 'loss/train': 1.6150819063186646} -08/30/2021 20:54:27 - INFO - __main__ - Step 42991: {'lr': 0.00041118871197957306, 'samples': 8254272, 'steps': 42990, 'loss/train': 1.1454073190689087} -08/30/2021 20:54:28 - INFO - __main__ - Step 42992: {'lr': 0.00041118465552402274, 'samples': 8254464, 'steps': 42991, 'loss/train': 1.2107809782028198} -08/30/2021 20:54:29 - INFO - __main__ - Step 42993: {'lr': 0.00041118059899584503, 'samples': 8254656, 'steps': 42992, 'loss/train': 1.2875572443008423} -08/30/2021 20:54:29 - INFO - __main__ - Step 42994: {'lr': 0.00041117654239504193, 'samples': 8254848, 'steps': 42993, 'loss/train': 0.7668571472167969} -08/30/2021 20:54:30 - INFO - __main__ - Step 42995: {'lr': 0.0004111724857216151, 'samples': 8255040, 'steps': 42994, 'loss/train': 1.070777177810669} -08/30/2021 20:54:30 - INFO - __main__ - Step 42996: {'lr': 0.0004111684289755665, 'samples': 8255232, 'steps': 42995, 'loss/train': 1.1700886487960815} -08/30/2021 20:54:32 - INFO - __main__ - Step 42997: {'lr': 0.00041116437215689785, 'samples': 8255424, 'steps': 42996, 'loss/train': 1.3913509845733643} -08/30/2021 20:54:32 - INFO - __main__ - Step 42998: {'lr': 0.000411160315265611, 'samples': 8255616, 'steps': 42997, 'loss/train': 1.449651837348938} -08/30/2021 20:54:32 - INFO - __main__ - Step 42999: {'lr': 0.0004111562583017079, 'samples': 8255808, 'steps': 42998, 'loss/train': 1.2014268636703491} -08/30/2021 20:54:33 - INFO - __main__ - Step 43000: {'lr': 0.00041115220126519014, 'samples': 8256000, 'steps': 42999, 'loss/train': 1.4964714050292969} -08/30/2021 20:54:33 - INFO - __main__ - Step 43001: {'lr': 0.00041114814415605977, 'samples': 8256192, 'steps': 43000, 'loss/train': 0.9783806204795837} -08/30/2021 20:54:34 - INFO - __main__ - Step 43002: {'lr': 0.0004111440869743185, 'samples': 8256384, 'steps': 43001, 'loss/train': 1.5132663249969482} -08/30/2021 20:54:35 - INFO - __main__ - Step 43003: {'lr': 0.00041114002971996824, 'samples': 8256576, 'steps': 43002, 'loss/train': 1.4489054679870605} -08/30/2021 20:54:35 - INFO - __main__ - Step 43004: {'lr': 0.0004111359723930107, 'samples': 8256768, 'steps': 43003, 'loss/train': 1.620793104171753} -08/30/2021 20:54:36 - INFO - __main__ - Step 43005: {'lr': 0.00041113191499344784, 'samples': 8256960, 'steps': 43004, 'loss/train': 1.5167750120162964} -08/30/2021 20:54:36 - INFO - __main__ - Step 43006: {'lr': 0.0004111278575212814, 'samples': 8257152, 'steps': 43005, 'loss/train': 0.6572314500808716} -08/30/2021 20:54:37 - INFO - __main__ - Step 43007: {'lr': 0.0004111237999765132, 'samples': 8257344, 'steps': 43006, 'loss/train': 1.3900483846664429} -08/30/2021 20:54:38 - INFO - __main__ - Step 43008: {'lr': 0.0004111197423591452, 'samples': 8257536, 'steps': 43007, 'loss/train': 1.0233813524246216} -08/30/2021 20:54:38 - INFO - __main__ - Step 43009: {'lr': 0.000411115684669179, 'samples': 8257728, 'steps': 43008, 'loss/train': 1.621573567390442} -08/30/2021 20:54:39 - INFO - __main__ - Step 43010: {'lr': 0.00041111162690661665, 'samples': 8257920, 'steps': 43009, 'loss/train': 1.2237497568130493} -08/30/2021 20:54:39 - INFO - __main__ - Step 43011: {'lr': 0.00041110756907145984, 'samples': 8258112, 'steps': 43010, 'loss/train': 1.7718816995620728} -08/30/2021 20:54:40 - INFO - __main__ - Step 43012: {'lr': 0.0004111035111637105, 'samples': 8258304, 'steps': 43011, 'loss/train': 1.0399419069290161} -08/30/2021 20:54:41 - INFO - __main__ - Step 43013: {'lr': 0.00041109945318337034, 'samples': 8258496, 'steps': 43012, 'loss/train': 1.405644178390503} -08/30/2021 20:54:41 - INFO - __main__ - Step 43014: {'lr': 0.00041109539513044127, 'samples': 8258688, 'steps': 43013, 'loss/train': 1.6959083080291748} -08/30/2021 20:54:42 - INFO - __main__ - Step 43015: {'lr': 0.0004110913370049251, 'samples': 8258880, 'steps': 43014, 'loss/train': 1.3006491661071777} -08/30/2021 20:54:42 - INFO - __main__ - Step 43016: {'lr': 0.00041108727880682363, 'samples': 8259072, 'steps': 43015, 'loss/train': 1.342881679534912} -08/30/2021 20:54:43 - INFO - __main__ - Step 43017: {'lr': 0.0004110832205361388, 'samples': 8259264, 'steps': 43016, 'loss/train': 0.15349045395851135} -08/30/2021 20:54:44 - INFO - __main__ - Step 43018: {'lr': 0.0004110791621928723, 'samples': 8259456, 'steps': 43017, 'loss/train': 1.2687389850616455} -08/30/2021 20:54:44 - INFO - __main__ - Step 43019: {'lr': 0.00041107510377702604, 'samples': 8259648, 'steps': 43018, 'loss/train': 1.9783213138580322} -08/30/2021 20:54:45 - INFO - __main__ - Step 43020: {'lr': 0.00041107104528860186, 'samples': 8259840, 'steps': 43019, 'loss/train': 1.0433523654937744} -08/30/2021 20:54:45 - INFO - __main__ - Step 43021: {'lr': 0.00041106698672760145, 'samples': 8260032, 'steps': 43020, 'loss/train': 1.1559176445007324} -08/30/2021 20:54:45 - INFO - __main__ - Step 43022: {'lr': 0.0004110629280940268, 'samples': 8260224, 'steps': 43021, 'loss/train': 1.5960071086883545} -08/30/2021 20:54:47 - INFO - __main__ - Step 43023: {'lr': 0.0004110588693878796, 'samples': 8260416, 'steps': 43022, 'loss/train': 0.8455272316932678} -08/30/2021 20:54:48 - INFO - __main__ - Step 43024: {'lr': 0.0004110548106091619, 'samples': 8260608, 'steps': 43023, 'loss/train': 1.1341500282287598} -08/30/2021 20:54:48 - INFO - __main__ - Step 43025: {'lr': 0.00041105075175787534, 'samples': 8260800, 'steps': 43024, 'loss/train': 1.5918952226638794} -08/30/2021 20:54:49 - INFO - __main__ - Step 43026: {'lr': 0.00041104669283402174, 'samples': 8260992, 'steps': 43025, 'loss/train': 1.2125768661499023} -08/30/2021 20:54:49 - INFO - __main__ - Step 43027: {'lr': 0.00041104263383760304, 'samples': 8261184, 'steps': 43026, 'loss/train': 0.5623721480369568} -08/30/2021 20:54:50 - INFO - __main__ - Step 43028: {'lr': 0.000411038574768621, 'samples': 8261376, 'steps': 43027, 'loss/train': 1.2327876091003418} -08/30/2021 20:54:51 - INFO - __main__ - Step 43029: {'lr': 0.00041103451562707745, 'samples': 8261568, 'steps': 43028, 'loss/train': 1.1186000108718872} -08/30/2021 20:54:51 - INFO - __main__ - Step 43030: {'lr': 0.0004110304564129742, 'samples': 8261760, 'steps': 43029, 'loss/train': 1.7397935390472412} -08/30/2021 20:54:51 - INFO - __main__ - Step 43031: {'lr': 0.00041102639712631316, 'samples': 8261952, 'steps': 43030, 'loss/train': 1.7311002016067505} -08/30/2021 20:54:52 - INFO - __main__ - Step 43032: {'lr': 0.0004110223377670962, 'samples': 8262144, 'steps': 43031, 'loss/train': 1.5193501710891724} -08/30/2021 20:54:54 - INFO - __main__ - Step 43033: {'lr': 0.0004110182783353249, 'samples': 8262336, 'steps': 43032, 'loss/train': 1.6572611331939697} -08/30/2021 20:54:54 - INFO - __main__ - Step 43034: {'lr': 0.0004110142188310013, 'samples': 8262528, 'steps': 43033, 'loss/train': 1.1107121706008911} -08/30/2021 20:54:55 - INFO - __main__ - Step 43035: {'lr': 0.0004110101592541272, 'samples': 8262720, 'steps': 43034, 'loss/train': 1.4978253841400146} -08/30/2021 20:54:55 - INFO - __main__ - Step 43036: {'lr': 0.0004110060996047044, 'samples': 8262912, 'steps': 43035, 'loss/train': 1.8207767009735107} -08/30/2021 20:54:55 - INFO - __main__ - Step 43037: {'lr': 0.00041100203988273475, 'samples': 8263104, 'steps': 43036, 'loss/train': 1.5406898260116577} -08/30/2021 20:54:56 - INFO - __main__ - Step 43038: {'lr': 0.0004109979800882201, 'samples': 8263296, 'steps': 43037, 'loss/train': 0.8528545498847961} -08/30/2021 20:54:57 - INFO - __main__ - Step 43039: {'lr': 0.00041099392022116214, 'samples': 8263488, 'steps': 43038, 'loss/train': 1.31240975856781} -08/30/2021 20:54:58 - INFO - __main__ - Step 43040: {'lr': 0.0004109898602815629, 'samples': 8263680, 'steps': 43039, 'loss/train': 1.2402949333190918} -08/30/2021 20:54:58 - INFO - __main__ - Step 43041: {'lr': 0.000410985800269424, 'samples': 8263872, 'steps': 43040, 'loss/train': 1.3851898908615112} -08/30/2021 20:54:58 - INFO - __main__ - Step 43042: {'lr': 0.00041098174018474747, 'samples': 8264064, 'steps': 43041, 'loss/train': 1.4205424785614014} -08/30/2021 20:54:59 - INFO - __main__ - Step 43043: {'lr': 0.000410977680027535, 'samples': 8264256, 'steps': 43042, 'loss/train': 1.4728164672851562} -08/30/2021 20:55:00 - INFO - __main__ - Step 43044: {'lr': 0.00041097361979778853, 'samples': 8264448, 'steps': 43043, 'loss/train': 1.7134778499603271} -08/30/2021 20:55:01 - INFO - __main__ - Step 43045: {'lr': 0.00041096955949550983, 'samples': 8264640, 'steps': 43044, 'loss/train': 2.695533037185669} -08/30/2021 20:55:01 - INFO - __main__ - Step 43046: {'lr': 0.00041096549912070067, 'samples': 8264832, 'steps': 43045, 'loss/train': 1.2888792753219604} -08/30/2021 20:55:02 - INFO - __main__ - Step 43047: {'lr': 0.000410961438673363, 'samples': 8265024, 'steps': 43046, 'loss/train': 1.505315899848938} -08/30/2021 20:55:02 - INFO - __main__ - Step 43048: {'lr': 0.0004109573781534985, 'samples': 8265216, 'steps': 43047, 'loss/train': 2.0587618350982666} -08/30/2021 20:55:04 - INFO - __main__ - Step 43049: {'lr': 0.0004109533175611092, 'samples': 8265408, 'steps': 43048, 'loss/train': 1.5550066232681274} -08/30/2021 20:55:04 - INFO - __main__ - Step 43050: {'lr': 0.0004109492568961968, 'samples': 8265600, 'steps': 43049, 'loss/train': 1.3739714622497559} -08/30/2021 20:55:04 - INFO - __main__ - Step 43051: {'lr': 0.00041094519615876313, 'samples': 8265792, 'steps': 43050, 'loss/train': 1.5388081073760986} -08/30/2021 20:55:05 - INFO - __main__ - Step 43052: {'lr': 0.0004109411353488101, 'samples': 8265984, 'steps': 43051, 'loss/train': 1.6552338600158691} -08/30/2021 20:55:05 - INFO - __main__ - Step 43053: {'lr': 0.00041093707446633934, 'samples': 8266176, 'steps': 43052, 'loss/train': 1.3406568765640259} -08/30/2021 20:55:07 - INFO - __main__ - Step 43054: {'lr': 0.00041093301351135294, 'samples': 8266368, 'steps': 43053, 'loss/train': 0.39391854405403137} -08/30/2021 20:55:07 - INFO - __main__ - Step 43055: {'lr': 0.00041092895248385255, 'samples': 8266560, 'steps': 43054, 'loss/train': 1.4422074556350708} -08/30/2021 20:55:08 - INFO - __main__ - Step 43056: {'lr': 0.00041092489138384, 'samples': 8266752, 'steps': 43055, 'loss/train': 0.11934449523687363} -08/30/2021 20:55:08 - INFO - __main__ - Step 43057: {'lr': 0.0004109208302113173, 'samples': 8266944, 'steps': 43056, 'loss/train': 1.5346908569335938} -08/30/2021 20:55:08 - INFO - __main__ - Step 43058: {'lr': 0.00041091676896628604, 'samples': 8267136, 'steps': 43057, 'loss/train': 0.6464435458183289} -08/30/2021 20:55:10 - INFO - __main__ - Step 43059: {'lr': 0.00041091270764874823, 'samples': 8267328, 'steps': 43058, 'loss/train': 1.2979649305343628} -08/30/2021 20:55:11 - INFO - __main__ - Step 43060: {'lr': 0.0004109086462587056, 'samples': 8267520, 'steps': 43059, 'loss/train': 1.1548914909362793} -08/30/2021 20:55:11 - INFO - __main__ - Step 43061: {'lr': 0.0004109045847961601, 'samples': 8267712, 'steps': 43060, 'loss/train': 0.536292552947998} -08/30/2021 20:55:11 - INFO - __main__ - Step 43062: {'lr': 0.0004109005232611134, 'samples': 8267904, 'steps': 43061, 'loss/train': 0.4752870202064514} -08/30/2021 20:55:12 - INFO - __main__ - Step 43063: {'lr': 0.00041089646165356743, 'samples': 8268096, 'steps': 43062, 'loss/train': 0.8744156956672668} -08/30/2021 20:55:12 - INFO - __main__ - Step 43064: {'lr': 0.000410892399973524, 'samples': 8268288, 'steps': 43063, 'loss/train': 1.301539659500122} -08/30/2021 20:55:14 - INFO - __main__ - Step 43065: {'lr': 0.00041088833822098495, 'samples': 8268480, 'steps': 43064, 'loss/train': 1.0908784866333008} -08/30/2021 20:55:14 - INFO - __main__ - Step 43066: {'lr': 0.00041088427639595206, 'samples': 8268672, 'steps': 43065, 'loss/train': 1.5283879041671753} -08/30/2021 20:55:14 - INFO - __main__ - Step 43067: {'lr': 0.0004108802144984273, 'samples': 8268864, 'steps': 43066, 'loss/train': 1.5658838748931885} -08/30/2021 20:55:15 - INFO - __main__ - Step 43068: {'lr': 0.0004108761525284123, 'samples': 8269056, 'steps': 43067, 'loss/train': 1.3104747533798218} -08/30/2021 20:55:15 - INFO - __main__ - Step 43069: {'lr': 0.000410872090485909, 'samples': 8269248, 'steps': 43068, 'loss/train': 1.3385337591171265} -08/30/2021 20:55:17 - INFO - __main__ - Step 43070: {'lr': 0.00041086802837091916, 'samples': 8269440, 'steps': 43069, 'loss/train': 1.539482831954956} -08/30/2021 20:55:17 - INFO - __main__ - Step 43071: {'lr': 0.00041086396618344475, 'samples': 8269632, 'steps': 43070, 'loss/train': 1.0114749670028687} -08/30/2021 20:55:18 - INFO - __main__ - Step 43072: {'lr': 0.0004108599039234875, 'samples': 8269824, 'steps': 43071, 'loss/train': 1.4196584224700928} -08/30/2021 20:55:18 - INFO - __main__ - Step 43073: {'lr': 0.00041085584159104925, 'samples': 8270016, 'steps': 43072, 'loss/train': 0.05706416070461273} -08/30/2021 20:55:18 - INFO - __main__ - Step 43074: {'lr': 0.00041085177918613185, 'samples': 8270208, 'steps': 43073, 'loss/train': 2.471883773803711} -08/30/2021 20:55:20 - INFO - __main__ - Step 43075: {'lr': 0.0004108477167087371, 'samples': 8270400, 'steps': 43074, 'loss/train': 0.9876798391342163} -08/30/2021 20:55:21 - INFO - __main__ - Step 43076: {'lr': 0.0004108436541588669, 'samples': 8270592, 'steps': 43075, 'loss/train': 1.0809775590896606} -08/30/2021 20:55:21 - INFO - __main__ - Step 43077: {'lr': 0.000410839591536523, 'samples': 8270784, 'steps': 43076, 'loss/train': 1.496696949005127} -08/30/2021 20:55:21 - INFO - __main__ - Step 43078: {'lr': 0.00041083552884170726, 'samples': 8270976, 'steps': 43077, 'loss/train': 1.478933572769165} -08/30/2021 20:55:22 - INFO - __main__ - Step 43079: {'lr': 0.0004108314660744216, 'samples': 8271168, 'steps': 43078, 'loss/train': 1.5491466522216797} -08/30/2021 20:55:22 - INFO - __main__ - Step 43080: {'lr': 0.0004108274032346676, 'samples': 8271360, 'steps': 43079, 'loss/train': 1.7027873992919922} -08/30/2021 20:55:25 - INFO - __main__ - Step 43081: {'lr': 0.0004108233403224474, 'samples': 8271552, 'steps': 43080, 'loss/train': 1.9535102844238281} -08/30/2021 20:55:26 - INFO - __main__ - Step 43082: {'lr': 0.0004108192773377626, 'samples': 8271744, 'steps': 43081, 'loss/train': 0.9428542852401733} -08/30/2021 20:55:26 - INFO - __main__ - Step 43083: {'lr': 0.0004108152142806151, 'samples': 8271936, 'steps': 43082, 'loss/train': 1.867835521697998} -08/30/2021 20:55:27 - INFO - __main__ - Step 43084: {'lr': 0.00041081115115100677, 'samples': 8272128, 'steps': 43083, 'loss/train': 2.852897882461548} -08/30/2021 20:55:27 - INFO - __main__ - Step 43085: {'lr': 0.0004108070879489395, 'samples': 8272320, 'steps': 43084, 'loss/train': 3.130497694015503} -08/30/2021 20:55:27 - INFO - __main__ - Step 43086: {'lr': 0.0004108030246744149, 'samples': 8272512, 'steps': 43085, 'loss/train': 2.817951202392578} -08/30/2021 20:55:28 - INFO - __main__ - Step 43087: {'lr': 0.00041079896132743506, 'samples': 8272704, 'steps': 43086, 'loss/train': 3.796910524368286} -08/30/2021 20:55:28 - INFO - __main__ - Step 43088: {'lr': 0.0004107948979080016, 'samples': 8272896, 'steps': 43087, 'loss/train': 2.6971192359924316} -08/30/2021 20:55:29 - INFO - __main__ - Step 43089: {'lr': 0.00041079083441611646, 'samples': 8273088, 'steps': 43088, 'loss/train': 1.759987711906433} -08/30/2021 20:55:30 - INFO - __main__ - Step 43090: {'lr': 0.0004107867708517815, 'samples': 8273280, 'steps': 43089, 'loss/train': 2.4432783126831055} -08/30/2021 20:55:30 - INFO - __main__ - Step 43091: {'lr': 0.0004107827072149984, 'samples': 8273472, 'steps': 43090, 'loss/train': 2.1201558113098145} -08/30/2021 20:55:31 - INFO - __main__ - Step 43092: {'lr': 0.0004107786435057692, 'samples': 8273664, 'steps': 43091, 'loss/train': 1.9819567203521729} -08/30/2021 20:55:31 - INFO - __main__ - Step 43093: {'lr': 0.0004107745797240956, 'samples': 8273856, 'steps': 43092, 'loss/train': 1.7590715885162354} -08/30/2021 20:55:32 - INFO - __main__ - Step 43094: {'lr': 0.0004107705158699794, 'samples': 8274048, 'steps': 43093, 'loss/train': 2.135681629180908} -08/30/2021 20:55:33 - INFO - __main__ - Step 43095: {'lr': 0.00041076645194342254, 'samples': 8274240, 'steps': 43094, 'loss/train': 1.6176354885101318} -08/30/2021 20:55:33 - INFO - __main__ - Step 43096: {'lr': 0.00041076238794442675, 'samples': 8274432, 'steps': 43095, 'loss/train': 2.0285708904266357} -08/30/2021 20:55:34 - INFO - __main__ - Step 43097: {'lr': 0.00041075832387299396, 'samples': 8274624, 'steps': 43096, 'loss/train': 2.0638937950134277} -08/30/2021 20:55:34 - INFO - __main__ - Step 43098: {'lr': 0.00041075425972912595, 'samples': 8274816, 'steps': 43097, 'loss/train': 1.5374903678894043} -08/30/2021 20:55:35 - INFO - __main__ - Step 43099: {'lr': 0.00041075019551282455, 'samples': 8275008, 'steps': 43098, 'loss/train': 1.8236980438232422} -08/30/2021 20:55:36 - INFO - __main__ - Step 43100: {'lr': 0.00041074613122409157, 'samples': 8275200, 'steps': 43099, 'loss/train': 2.400517225265503} -08/30/2021 20:55:36 - INFO - __main__ - Step 43101: {'lr': 0.0004107420668629289, 'samples': 8275392, 'steps': 43100, 'loss/train': 1.7645496129989624} -08/30/2021 20:55:36 - INFO - __main__ - Step 43102: {'lr': 0.00041073800242933826, 'samples': 8275584, 'steps': 43101, 'loss/train': 2.390949010848999} -08/30/2021 20:55:37 - INFO - __main__ - Step 43103: {'lr': 0.00041073393792332157, 'samples': 8275776, 'steps': 43102, 'loss/train': 1.0891464948654175} -08/30/2021 20:55:38 - INFO - __main__ - Step 43104: {'lr': 0.0004107298733448807, 'samples': 8275968, 'steps': 43103, 'loss/train': 2.014225959777832} -08/30/2021 20:55:39 - INFO - __main__ - Step 43105: {'lr': 0.0004107258086940174, 'samples': 8276160, 'steps': 43104, 'loss/train': 1.7214444875717163} -08/30/2021 20:55:39 - INFO - __main__ - Step 43106: {'lr': 0.0004107217439707336, 'samples': 8276352, 'steps': 43105, 'loss/train': 1.5326868295669556} -08/30/2021 20:55:39 - INFO - __main__ - Step 43107: {'lr': 0.000410717679175031, 'samples': 8276544, 'steps': 43106, 'loss/train': 1.7199546098709106} -08/30/2021 20:55:40 - INFO - __main__ - Step 43108: {'lr': 0.00041071361430691143, 'samples': 8276736, 'steps': 43107, 'loss/train': 1.5477620363235474} -08/30/2021 20:55:41 - INFO - __main__ - Step 43109: {'lr': 0.00041070954936637687, 'samples': 8276928, 'steps': 43108, 'loss/train': 1.5906322002410889} -08/30/2021 20:55:42 - INFO - __main__ - Step 43110: {'lr': 0.00041070548435342903, 'samples': 8277120, 'steps': 43109, 'loss/train': 1.9322139024734497} -08/30/2021 20:55:42 - INFO - __main__ - Step 43111: {'lr': 0.00041070141926806983, 'samples': 8277312, 'steps': 43110, 'loss/train': 0.8504245281219482} -08/30/2021 20:55:43 - INFO - __main__ - Step 43112: {'lr': 0.00041069735411030105, 'samples': 8277504, 'steps': 43111, 'loss/train': 1.200981616973877} -08/30/2021 20:55:43 - INFO - __main__ - Step 43113: {'lr': 0.00041069328888012447, 'samples': 8277696, 'steps': 43112, 'loss/train': 1.0931965112686157} -08/30/2021 20:55:44 - INFO - __main__ - Step 43114: {'lr': 0.000410689223577542, 'samples': 8277888, 'steps': 43113, 'loss/train': 1.9876457452774048} -08/30/2021 20:55:45 - INFO - __main__ - Step 43115: {'lr': 0.00041068515820255543, 'samples': 8278080, 'steps': 43114, 'loss/train': 1.8466354608535767} -08/30/2021 20:55:45 - INFO - __main__ - Step 43116: {'lr': 0.00041068109275516665, 'samples': 8278272, 'steps': 43115, 'loss/train': 1.5738556385040283} -08/30/2021 20:55:46 - INFO - __main__ - Step 43117: {'lr': 0.0004106770272353774, 'samples': 8278464, 'steps': 43116, 'loss/train': 1.864491581916809} -08/30/2021 20:55:46 - INFO - __main__ - Step 43118: {'lr': 0.00041067296164318956, 'samples': 8278656, 'steps': 43117, 'loss/train': 1.5471930503845215} -08/30/2021 20:55:47 - INFO - __main__ - Step 43119: {'lr': 0.000410668895978605, 'samples': 8278848, 'steps': 43118, 'loss/train': 1.773576021194458} -08/30/2021 20:55:48 - INFO - __main__ - Step 43120: {'lr': 0.0004106648302416255, 'samples': 8279040, 'steps': 43119, 'loss/train': 1.5012117624282837} -08/30/2021 20:55:48 - INFO - __main__ - Step 43121: {'lr': 0.0004106607644322529, 'samples': 8279232, 'steps': 43120, 'loss/train': 1.490515947341919} -08/30/2021 20:55:49 - INFO - __main__ - Step 43122: {'lr': 0.00041065669855048896, 'samples': 8279424, 'steps': 43121, 'loss/train': 1.4472399950027466} -08/30/2021 20:55:49 - INFO - __main__ - Step 43123: {'lr': 0.0004106526325963357, 'samples': 8279616, 'steps': 43122, 'loss/train': 1.9854379892349243} -08/30/2021 20:55:50 - INFO - __main__ - Step 43124: {'lr': 0.0004106485665697948, 'samples': 8279808, 'steps': 43123, 'loss/train': 2.118741989135742} -08/30/2021 20:55:51 - INFO - __main__ - Step 43125: {'lr': 0.00041064450047086814, 'samples': 8280000, 'steps': 43124, 'loss/train': 1.5702439546585083} -08/30/2021 20:55:51 - INFO - __main__ - Step 43126: {'lr': 0.00041064043429955756, 'samples': 8280192, 'steps': 43125, 'loss/train': 1.6925501823425293} -08/30/2021 20:55:52 - INFO - __main__ - Step 43127: {'lr': 0.0004106363680558649, 'samples': 8280384, 'steps': 43126, 'loss/train': 0.9814291000366211} -08/30/2021 20:55:52 - INFO - __main__ - Step 43128: {'lr': 0.0004106323017397919, 'samples': 8280576, 'steps': 43127, 'loss/train': 1.7775154113769531} -08/30/2021 20:55:53 - INFO - __main__ - Step 43129: {'lr': 0.00041062823535134053, 'samples': 8280768, 'steps': 43128, 'loss/train': 1.8378931283950806} -08/30/2021 20:55:54 - INFO - __main__ - Step 43130: {'lr': 0.0004106241688905126, 'samples': 8280960, 'steps': 43129, 'loss/train': 1.81867516040802} -08/30/2021 20:55:54 - INFO - __main__ - Step 43131: {'lr': 0.00041062010235730974, 'samples': 8281152, 'steps': 43130, 'loss/train': 1.5315477848052979} -08/30/2021 20:55:55 - INFO - __main__ - Step 43132: {'lr': 0.0004106160357517341, 'samples': 8281344, 'steps': 43131, 'loss/train': 1.633876919746399} -08/30/2021 20:55:55 - INFO - __main__ - Step 43133: {'lr': 0.00041061196907378727, 'samples': 8281536, 'steps': 43132, 'loss/train': 1.5402170419692993} -08/30/2021 20:55:57 - INFO - __main__ - Step 43134: {'lr': 0.00041060790232347116, 'samples': 8281728, 'steps': 43133, 'loss/train': 1.6886050701141357} -08/30/2021 20:55:57 - INFO - __main__ - Step 43135: {'lr': 0.00041060383550078764, 'samples': 8281920, 'steps': 43134, 'loss/train': 1.912307620048523} -08/30/2021 20:55:58 - INFO - __main__ - Step 43136: {'lr': 0.00041059976860573845, 'samples': 8282112, 'steps': 43135, 'loss/train': 2.060131072998047} -08/30/2021 20:55:58 - INFO - __main__ - Step 43137: {'lr': 0.00041059570163832555, 'samples': 8282304, 'steps': 43136, 'loss/train': 1.4196592569351196} -08/30/2021 20:55:58 - INFO - __main__ - Step 43138: {'lr': 0.00041059163459855066, 'samples': 8282496, 'steps': 43137, 'loss/train': 1.8933769464492798} -08/30/2021 20:56:00 - INFO - __main__ - Step 43139: {'lr': 0.00041058756748641573, 'samples': 8282688, 'steps': 43138, 'loss/train': 1.4502156972885132} -08/30/2021 20:56:00 - INFO - __main__ - Step 43140: {'lr': 0.0004105835003019225, 'samples': 8282880, 'steps': 43139, 'loss/train': 1.7310553789138794} -08/30/2021 20:56:01 - INFO - __main__ - Step 43141: {'lr': 0.00041057943304507273, 'samples': 8283072, 'steps': 43140, 'loss/train': 2.4128997325897217} -08/30/2021 20:56:01 - INFO - __main__ - Step 43142: {'lr': 0.0004105753657158684, 'samples': 8283264, 'steps': 43141, 'loss/train': 1.6390939950942993} -08/30/2021 20:56:02 - INFO - __main__ - Step 43143: {'lr': 0.00041057129831431133, 'samples': 8283456, 'steps': 43142, 'loss/train': 1.4584561586380005} -08/30/2021 20:56:02 - INFO - __main__ - Step 43144: {'lr': 0.00041056723084040324, 'samples': 8283648, 'steps': 43143, 'loss/train': 2.5227386951446533} -08/30/2021 20:56:04 - INFO - __main__ - Step 43145: {'lr': 0.00041056316329414613, 'samples': 8283840, 'steps': 43144, 'loss/train': 1.335874319076538} -08/30/2021 20:56:04 - INFO - __main__ - Step 43146: {'lr': 0.00041055909567554166, 'samples': 8284032, 'steps': 43145, 'loss/train': 1.2328912019729614} -08/30/2021 20:56:04 - INFO - __main__ - Step 43147: {'lr': 0.00041055502798459175, 'samples': 8284224, 'steps': 43146, 'loss/train': 0.1554865539073944} -08/30/2021 20:56:05 - INFO - __main__ - Step 43148: {'lr': 0.00041055096022129823, 'samples': 8284416, 'steps': 43147, 'loss/train': 1.098775863647461} -08/30/2021 20:56:05 - INFO - __main__ - Step 43149: {'lr': 0.0004105468923856629, 'samples': 8284608, 'steps': 43148, 'loss/train': 1.5607126951217651} -08/30/2021 20:56:07 - INFO - __main__ - Step 43150: {'lr': 0.00041054282447768763, 'samples': 8284800, 'steps': 43149, 'loss/train': 0.9097418785095215} -08/30/2021 20:56:07 - INFO - __main__ - Step 43151: {'lr': 0.00041053875649737424, 'samples': 8284992, 'steps': 43150, 'loss/train': 1.4875164031982422} -08/30/2021 20:56:08 - INFO - __main__ - Step 43152: {'lr': 0.0004105346884447246, 'samples': 8285184, 'steps': 43151, 'loss/train': 1.6775925159454346} -08/30/2021 20:56:08 - INFO - __main__ - Step 43153: {'lr': 0.00041053062031974055, 'samples': 8285376, 'steps': 43152, 'loss/train': 2.6256110668182373} -08/30/2021 20:56:08 - INFO - __main__ - Step 43154: {'lr': 0.00041052655212242377, 'samples': 8285568, 'steps': 43153, 'loss/train': 1.8446276187896729} -08/30/2021 20:56:10 - INFO - __main__ - Step 43155: {'lr': 0.00041052248385277623, 'samples': 8285760, 'steps': 43154, 'loss/train': 1.4902443885803223} -08/30/2021 20:56:10 - INFO - __main__ - Step 43156: {'lr': 0.0004105184155107998, 'samples': 8285952, 'steps': 43155, 'loss/train': 1.7433875799179077} -08/30/2021 20:56:11 - INFO - __main__ - Step 43157: {'lr': 0.00041051434709649614, 'samples': 8286144, 'steps': 43156, 'loss/train': 1.2297192811965942} -08/30/2021 20:56:11 - INFO - __main__ - Step 43158: {'lr': 0.0004105102786098672, 'samples': 8286336, 'steps': 43157, 'loss/train': 1.7540655136108398} -08/30/2021 20:56:11 - INFO - __main__ - Step 43159: {'lr': 0.0004105062100509149, 'samples': 8286528, 'steps': 43158, 'loss/train': 2.0551722049713135} -08/30/2021 20:56:13 - INFO - __main__ - Step 43160: {'lr': 0.000410502141419641, 'samples': 8286720, 'steps': 43159, 'loss/train': 0.9355669021606445} -08/30/2021 20:56:14 - INFO - __main__ - Step 43161: {'lr': 0.00041049807271604724, 'samples': 8286912, 'steps': 43160, 'loss/train': 0.8614419102668762} -08/30/2021 20:56:14 - INFO - __main__ - Step 43162: {'lr': 0.00041049400394013545, 'samples': 8287104, 'steps': 43161, 'loss/train': 1.5363117456436157} -08/30/2021 20:56:14 - INFO - __main__ - Step 43163: {'lr': 0.0004104899350919077, 'samples': 8287296, 'steps': 43162, 'loss/train': 1.1739214658737183} -08/30/2021 20:56:15 - INFO - __main__ - Step 43164: {'lr': 0.0004104858661713655, 'samples': 8287488, 'steps': 43163, 'loss/train': 1.264413833618164} -08/30/2021 20:56:15 - INFO - __main__ - Step 43165: {'lr': 0.00041048179717851095, 'samples': 8287680, 'steps': 43164, 'loss/train': 1.8646942377090454} -08/30/2021 20:56:17 - INFO - __main__ - Step 43166: {'lr': 0.00041047772811334584, 'samples': 8287872, 'steps': 43165, 'loss/train': 1.9736560583114624} -08/30/2021 20:56:17 - INFO - __main__ - Step 43167: {'lr': 0.0004104736589758719, 'samples': 8288064, 'steps': 43166, 'loss/train': 2.0940358638763428} -08/30/2021 20:56:17 - INFO - __main__ - Step 43168: {'lr': 0.0004104695897660909, 'samples': 8288256, 'steps': 43167, 'loss/train': 1.7892898321151733} -08/30/2021 20:56:18 - INFO - __main__ - Step 43169: {'lr': 0.0004104655204840048, 'samples': 8288448, 'steps': 43168, 'loss/train': 1.464721441268921} -08/30/2021 20:56:18 - INFO - __main__ - Step 43170: {'lr': 0.0004104614511296155, 'samples': 8288640, 'steps': 43169, 'loss/train': 1.292941927909851} -08/30/2021 20:56:20 - INFO - __main__ - Step 43171: {'lr': 0.00041045738170292467, 'samples': 8288832, 'steps': 43170, 'loss/train': 1.2955961227416992} -08/30/2021 20:56:20 - INFO - __main__ - Step 43172: {'lr': 0.0004104533122039342, 'samples': 8289024, 'steps': 43171, 'loss/train': 1.3241108655929565} -08/30/2021 20:56:20 - INFO - __main__ - Step 43173: {'lr': 0.00041044924263264603, 'samples': 8289216, 'steps': 43172, 'loss/train': 1.7729849815368652} -08/30/2021 20:56:21 - INFO - __main__ - Step 43174: {'lr': 0.00041044517298906194, 'samples': 8289408, 'steps': 43173, 'loss/train': 1.3600283861160278} -08/30/2021 20:56:21 - INFO - __main__ - Step 43175: {'lr': 0.0004104411032731836, 'samples': 8289600, 'steps': 43174, 'loss/train': 1.2630465030670166} -08/30/2021 20:56:23 - INFO - __main__ - Step 43176: {'lr': 0.00041043703348501304, 'samples': 8289792, 'steps': 43175, 'loss/train': 1.2705659866333008} -08/30/2021 20:56:23 - INFO - __main__ - Step 43177: {'lr': 0.0004104329636245521, 'samples': 8289984, 'steps': 43176, 'loss/train': 1.558911681175232} -08/30/2021 20:56:23 - INFO - __main__ - Step 43178: {'lr': 0.0004104288936918024, 'samples': 8290176, 'steps': 43177, 'loss/train': 1.6005598306655884} -08/30/2021 20:56:24 - INFO - __main__ - Step 43179: {'lr': 0.00041042482368676604, 'samples': 8290368, 'steps': 43178, 'loss/train': 1.395361065864563} -08/30/2021 20:56:24 - INFO - __main__ - Step 43180: {'lr': 0.00041042075360944464, 'samples': 8290560, 'steps': 43179, 'loss/train': 1.6645832061767578} -08/30/2021 20:56:26 - INFO - __main__ - Step 43181: {'lr': 0.0004104166834598402, 'samples': 8290752, 'steps': 43180, 'loss/train': 1.572617769241333} -08/30/2021 20:56:26 - INFO - __main__ - Step 43182: {'lr': 0.00041041261323795437, 'samples': 8290944, 'steps': 43181, 'loss/train': 1.6113719940185547} -08/30/2021 20:56:26 - INFO - __main__ - Step 43183: {'lr': 0.0004104085429437892, 'samples': 8291136, 'steps': 43182, 'loss/train': 1.317272424697876} -08/30/2021 20:56:27 - INFO - __main__ - Step 43184: {'lr': 0.00041040447257734635, 'samples': 8291328, 'steps': 43183, 'loss/train': 1.3970937728881836} -08/30/2021 20:56:27 - INFO - __main__ - Step 43185: {'lr': 0.00041040040213862774, 'samples': 8291520, 'steps': 43184, 'loss/train': 1.9437177181243896} -08/30/2021 20:56:27 - INFO - __main__ - Step 43186: {'lr': 0.00041039633162763523, 'samples': 8291712, 'steps': 43185, 'loss/train': 1.3823318481445312} -08/30/2021 20:56:29 - INFO - __main__ - Step 43187: {'lr': 0.00041039226104437056, 'samples': 8291904, 'steps': 43186, 'loss/train': 1.1192784309387207} -08/30/2021 20:56:30 - INFO - __main__ - Step 43188: {'lr': 0.0004103881903888356, 'samples': 8292096, 'steps': 43187, 'loss/train': 1.5928676128387451} -08/30/2021 20:56:30 - INFO - __main__ - Step 43189: {'lr': 0.0004103841196610322, 'samples': 8292288, 'steps': 43188, 'loss/train': 2.524419069290161} -08/30/2021 20:56:31 - INFO - __main__ - Step 43190: {'lr': 0.0004103800488609622, 'samples': 8292480, 'steps': 43189, 'loss/train': 1.5301052331924438} -08/30/2021 20:56:32 - INFO - __main__ - Step 43191: {'lr': 0.0004103759779886274, 'samples': 8292672, 'steps': 43190, 'loss/train': 0.9256829023361206} -08/30/2021 20:56:33 - INFO - __main__ - Step 43192: {'lr': 0.0004103719070440297, 'samples': 8292864, 'steps': 43191, 'loss/train': 0.2546115517616272} -08/30/2021 20:56:33 - INFO - __main__ - Step 43193: {'lr': 0.00041036783602717086, 'samples': 8293056, 'steps': 43192, 'loss/train': 1.9964308738708496} -08/30/2021 20:56:33 - INFO - __main__ - Step 43194: {'lr': 0.00041036376493805286, 'samples': 8293248, 'steps': 43193, 'loss/train': 1.8302520513534546} -08/30/2021 20:56:34 - INFO - __main__ - Step 43195: {'lr': 0.0004103596937766773, 'samples': 8293440, 'steps': 43194, 'loss/train': 1.5031763315200806} -08/30/2021 20:56:34 - INFO - __main__ - Step 43196: {'lr': 0.00041035562254304614, 'samples': 8293632, 'steps': 43195, 'loss/train': 1.8386255502700806} -08/30/2021 20:56:36 - INFO - __main__ - Step 43197: {'lr': 0.00041035155123716127, 'samples': 8293824, 'steps': 43196, 'loss/train': 1.88656485080719} -08/30/2021 20:56:36 - INFO - __main__ - Step 43198: {'lr': 0.00041034747985902446, 'samples': 8294016, 'steps': 43197, 'loss/train': 1.1430670022964478} -08/30/2021 20:56:37 - INFO - __main__ - Step 43199: {'lr': 0.0004103434084086375, 'samples': 8294208, 'steps': 43198, 'loss/train': 0.44922199845314026} -08/30/2021 20:56:37 - INFO - __main__ - Step 43200: {'lr': 0.0004103393368860023, 'samples': 8294400, 'steps': 43199, 'loss/train': 1.2825961112976074} -08/30/2021 20:56:37 - INFO - __main__ - Step 43201: {'lr': 0.0004103352652911206, 'samples': 8294592, 'steps': 43200, 'loss/train': 0.7601348161697388} -08/30/2021 20:56:39 - INFO - __main__ - Step 43202: {'lr': 0.0004103311936239944, 'samples': 8294784, 'steps': 43201, 'loss/train': 1.7089953422546387} -08/30/2021 20:56:39 - INFO - __main__ - Step 43203: {'lr': 0.0004103271218846254, 'samples': 8294976, 'steps': 43202, 'loss/train': 2.0975441932678223} -08/30/2021 20:56:40 - INFO - __main__ - Step 43204: {'lr': 0.00041032305007301554, 'samples': 8295168, 'steps': 43203, 'loss/train': 1.337768793106079} -08/30/2021 20:56:40 - INFO - __main__ - Step 43205: {'lr': 0.00041031897818916645, 'samples': 8295360, 'steps': 43204, 'loss/train': 1.448705792427063} -08/30/2021 20:56:40 - INFO - __main__ - Step 43206: {'lr': 0.0004103149062330802, 'samples': 8295552, 'steps': 43205, 'loss/train': 0.9176228046417236} -08/30/2021 20:56:42 - INFO - __main__ - Step 43207: {'lr': 0.00041031083420475854, 'samples': 8295744, 'steps': 43206, 'loss/train': 1.174670934677124} -08/30/2021 20:56:42 - INFO - __main__ - Step 43208: {'lr': 0.00041030676210420324, 'samples': 8295936, 'steps': 43207, 'loss/train': 0.7236738801002502} -08/30/2021 20:56:43 - INFO - __main__ - Step 43209: {'lr': 0.0004103026899314162, 'samples': 8296128, 'steps': 43208, 'loss/train': 1.2783769369125366} -08/30/2021 20:56:43 - INFO - __main__ - Step 43210: {'lr': 0.00041029861768639934, 'samples': 8296320, 'steps': 43209, 'loss/train': 1.0573124885559082} -08/30/2021 20:56:43 - INFO - __main__ - Step 43211: {'lr': 0.0004102945453691542, 'samples': 8296512, 'steps': 43210, 'loss/train': 1.7038862705230713} -08/30/2021 20:56:45 - INFO - __main__ - Step 43212: {'lr': 0.00041029047297968293, 'samples': 8296704, 'steps': 43211, 'loss/train': 1.4660732746124268} -08/30/2021 20:56:45 - INFO - __main__ - Step 43213: {'lr': 0.00041028640051798726, 'samples': 8296896, 'steps': 43212, 'loss/train': 1.6577725410461426} -08/30/2021 20:56:46 - INFO - __main__ - Step 43214: {'lr': 0.000410282327984069, 'samples': 8297088, 'steps': 43213, 'loss/train': 1.0727344751358032} -08/30/2021 20:56:46 - INFO - __main__ - Step 43215: {'lr': 0.00041027825537792993, 'samples': 8297280, 'steps': 43214, 'loss/train': 1.4634149074554443} -08/30/2021 20:56:46 - INFO - __main__ - Step 43216: {'lr': 0.0004102741826995721, 'samples': 8297472, 'steps': 43215, 'loss/train': 1.6086004972457886} -08/30/2021 20:56:48 - INFO - __main__ - Step 43217: {'lr': 0.000410270109948997, 'samples': 8297664, 'steps': 43216, 'loss/train': 1.3327802419662476} -08/30/2021 20:56:48 - INFO - __main__ - Step 43218: {'lr': 0.0004102660371262068, 'samples': 8297856, 'steps': 43217, 'loss/train': 1.402684211730957} -08/30/2021 20:56:49 - INFO - __main__ - Step 43219: {'lr': 0.0004102619642312031, 'samples': 8298048, 'steps': 43218, 'loss/train': 0.6042243242263794} -08/30/2021 20:56:49 - INFO - __main__ - Step 43220: {'lr': 0.00041025789126398793, 'samples': 8298240, 'steps': 43219, 'loss/train': 1.2345627546310425} -08/30/2021 20:56:49 - INFO - __main__ - Step 43221: {'lr': 0.000410253818224563, 'samples': 8298432, 'steps': 43220, 'loss/train': 1.1704076528549194} -08/30/2021 20:56:51 - INFO - __main__ - Step 43222: {'lr': 0.0004102497451129302, 'samples': 8298624, 'steps': 43221, 'loss/train': 1.4527727365493774} -08/30/2021 20:56:52 - INFO - __main__ - Step 43223: {'lr': 0.00041024567192909125, 'samples': 8298816, 'steps': 43222, 'loss/train': 1.1646500825881958} -08/30/2021 20:56:52 - INFO - __main__ - Step 43224: {'lr': 0.0004102415986730481, 'samples': 8299008, 'steps': 43223, 'loss/train': 1.9749263525009155} -08/30/2021 20:56:52 - INFO - __main__ - Step 43225: {'lr': 0.0004102375253448026, 'samples': 8299200, 'steps': 43224, 'loss/train': 2.0163774490356445} -08/30/2021 20:56:53 - INFO - __main__ - Step 43226: {'lr': 0.0004102334519443565, 'samples': 8299392, 'steps': 43225, 'loss/train': 2.1163246631622314} -08/30/2021 20:56:55 - INFO - __main__ - Step 43227: {'lr': 0.0004102293784717117, 'samples': 8299584, 'steps': 43226, 'loss/train': 2.4043784141540527} -08/30/2021 20:56:55 - INFO - __main__ - Step 43228: {'lr': 0.00041022530492687006, 'samples': 8299776, 'steps': 43227, 'loss/train': 1.658603310585022} -08/30/2021 20:56:56 - INFO - __main__ - Step 43229: {'lr': 0.0004102212313098333, 'samples': 8299968, 'steps': 43228, 'loss/train': 1.077207326889038} -08/30/2021 20:56:56 - INFO - __main__ - Step 43230: {'lr': 0.00041021715762060336, 'samples': 8300160, 'steps': 43229, 'loss/train': 1.538438320159912} -08/30/2021 20:56:56 - INFO - __main__ - Step 43231: {'lr': 0.000410213083859182, 'samples': 8300352, 'steps': 43230, 'loss/train': 1.754391074180603} -08/30/2021 20:56:57 - INFO - __main__ - Step 43232: {'lr': 0.0004102090100255711, 'samples': 8300544, 'steps': 43231, 'loss/train': 0.8378159999847412} -08/30/2021 20:56:57 - INFO - __main__ - Step 43233: {'lr': 0.00041020493611977263, 'samples': 8300736, 'steps': 43232, 'loss/train': 0.06667105853557587} -08/30/2021 20:56:59 - INFO - __main__ - Step 43234: {'lr': 0.0004102008621417881, 'samples': 8300928, 'steps': 43233, 'loss/train': 0.054393839091062546} -08/30/2021 20:57:00 - INFO - __main__ - Step 43235: {'lr': 0.0004101967880916196, 'samples': 8301120, 'steps': 43234, 'loss/train': 1.5266391038894653} -08/30/2021 20:57:00 - INFO - __main__ - Step 43236: {'lr': 0.00041019271396926894, 'samples': 8301312, 'steps': 43235, 'loss/train': 0.8984933495521545} -08/30/2021 20:57:00 - INFO - __main__ - Step 43237: {'lr': 0.0004101886397747379, 'samples': 8301504, 'steps': 43236, 'loss/train': 1.8313606977462769} -08/30/2021 20:57:01 - INFO - __main__ - Step 43238: {'lr': 0.0004101845655080283, 'samples': 8301696, 'steps': 43237, 'loss/train': 1.2376304864883423} -08/30/2021 20:57:02 - INFO - __main__ - Step 43239: {'lr': 0.00041018049116914204, 'samples': 8301888, 'steps': 43238, 'loss/train': 1.576903223991394} -08/30/2021 20:57:03 - INFO - __main__ - Step 43240: {'lr': 0.00041017641675808095, 'samples': 8302080, 'steps': 43239, 'loss/train': 1.4447237253189087} -08/30/2021 20:57:03 - INFO - __main__ - Step 43241: {'lr': 0.00041017234227484675, 'samples': 8302272, 'steps': 43240, 'loss/train': 1.3892391920089722} -08/30/2021 20:57:03 - INFO - __main__ - Step 43242: {'lr': 0.0004101682677194414, 'samples': 8302464, 'steps': 43241, 'loss/train': 1.3279780149459839} -08/30/2021 20:57:04 - INFO - __main__ - Step 43243: {'lr': 0.0004101641930918667, 'samples': 8302656, 'steps': 43242, 'loss/train': 1.5703035593032837} -08/30/2021 20:57:04 - INFO - __main__ - Step 43244: {'lr': 0.00041016011839212446, 'samples': 8302848, 'steps': 43243, 'loss/train': 0.08699626475572586} -08/30/2021 20:57:06 - INFO - __main__ - Step 43245: {'lr': 0.0004101560436202166, 'samples': 8303040, 'steps': 43244, 'loss/train': 1.2573353052139282} -08/30/2021 20:57:07 - INFO - __main__ - Step 43246: {'lr': 0.0004101519687761449, 'samples': 8303232, 'steps': 43245, 'loss/train': 1.365147352218628} -08/30/2021 20:57:07 - INFO - __main__ - Step 43247: {'lr': 0.00041014789385991114, 'samples': 8303424, 'steps': 43246, 'loss/train': 0.09524846076965332} -08/30/2021 20:57:07 - INFO - __main__ - Step 43248: {'lr': 0.00041014381887151727, 'samples': 8303616, 'steps': 43247, 'loss/train': 1.0626354217529297} -08/30/2021 20:57:08 - INFO - __main__ - Step 43249: {'lr': 0.00041013974381096503, 'samples': 8303808, 'steps': 43248, 'loss/train': 0.7480886578559875} -08/30/2021 20:57:09 - INFO - __main__ - Step 43250: {'lr': 0.00041013566867825627, 'samples': 8304000, 'steps': 43249, 'loss/train': 1.284941554069519} -08/30/2021 20:57:09 - INFO - __main__ - Step 43251: {'lr': 0.00041013159347339293, 'samples': 8304192, 'steps': 43250, 'loss/train': 2.1499013900756836} -08/30/2021 20:57:10 - INFO - __main__ - Step 43252: {'lr': 0.0004101275181963767, 'samples': 8304384, 'steps': 43251, 'loss/train': 1.934585690498352} -08/30/2021 20:57:10 - INFO - __main__ - Step 43253: {'lr': 0.0004101234428472095, 'samples': 8304576, 'steps': 43252, 'loss/train': 1.6276915073394775} -08/30/2021 20:57:10 - INFO - __main__ - Step 43254: {'lr': 0.0004101193674258931, 'samples': 8304768, 'steps': 43253, 'loss/train': 1.7796305418014526} -08/30/2021 20:57:12 - INFO - __main__ - Step 43255: {'lr': 0.00041011529193242947, 'samples': 8304960, 'steps': 43254, 'loss/train': 0.6792890429496765} -08/30/2021 20:57:12 - INFO - __main__ - Step 43256: {'lr': 0.00041011121636682024, 'samples': 8305152, 'steps': 43255, 'loss/train': 1.7855327129364014} -08/30/2021 20:57:13 - INFO - __main__ - Step 43257: {'lr': 0.0004101071407290675, 'samples': 8305344, 'steps': 43256, 'loss/train': 1.4853849411010742} -08/30/2021 20:57:13 - INFO - __main__ - Step 43258: {'lr': 0.00041010306501917287, 'samples': 8305536, 'steps': 43257, 'loss/train': 1.3908770084381104} -08/30/2021 20:57:14 - INFO - __main__ - Step 43259: {'lr': 0.0004100989892371383, 'samples': 8305728, 'steps': 43258, 'loss/train': 1.152788758277893} -08/30/2021 20:57:15 - INFO - __main__ - Step 43260: {'lr': 0.00041009491338296557, 'samples': 8305920, 'steps': 43259, 'loss/train': 1.1953675746917725} -08/30/2021 20:57:16 - INFO - __main__ - Step 43261: {'lr': 0.00041009083745665654, 'samples': 8306112, 'steps': 43260, 'loss/train': 1.8269766569137573} -08/30/2021 20:57:16 - INFO - __main__ - Step 43262: {'lr': 0.0004100867614582131, 'samples': 8306304, 'steps': 43261, 'loss/train': 1.5924428701400757} -08/30/2021 20:57:16 - INFO - __main__ - Step 43263: {'lr': 0.00041008268538763703, 'samples': 8306496, 'steps': 43262, 'loss/train': 1.9329931735992432} -08/30/2021 20:57:17 - INFO - __main__ - Step 43264: {'lr': 0.00041007860924493014, 'samples': 8306688, 'steps': 43263, 'loss/train': 1.3639891147613525} -08/30/2021 20:57:18 - INFO - __main__ - Step 43265: {'lr': 0.0004100745330300943, 'samples': 8306880, 'steps': 43264, 'loss/train': 1.416107416152954} -08/30/2021 20:57:19 - INFO - __main__ - Step 43266: {'lr': 0.0004100704567431314, 'samples': 8307072, 'steps': 43265, 'loss/train': 1.5389951467514038} -08/30/2021 20:57:19 - INFO - __main__ - Step 43267: {'lr': 0.0004100663803840431, 'samples': 8307264, 'steps': 43266, 'loss/train': 1.7031641006469727} -08/30/2021 20:57:19 - INFO - __main__ - Step 43268: {'lr': 0.0004100623039528315, 'samples': 8307456, 'steps': 43267, 'loss/train': 2.2104427814483643} -08/30/2021 20:57:20 - INFO - __main__ - Step 43269: {'lr': 0.0004100582274494982, 'samples': 8307648, 'steps': 43268, 'loss/train': 1.275783896446228} -08/30/2021 20:57:21 - INFO - __main__ - Step 43270: {'lr': 0.00041005415087404516, 'samples': 8307840, 'steps': 43269, 'loss/train': 1.8312181234359741} -08/30/2021 20:57:22 - INFO - __main__ - Step 43271: {'lr': 0.0004100500742264742, 'samples': 8308032, 'steps': 43270, 'loss/train': 1.5607789754867554} -08/30/2021 20:57:22 - INFO - __main__ - Step 43272: {'lr': 0.0004100459975067871, 'samples': 8308224, 'steps': 43271, 'loss/train': 1.6923092603683472} -08/30/2021 20:57:22 - INFO - __main__ - Step 43273: {'lr': 0.0004100419207149858, 'samples': 8308416, 'steps': 43272, 'loss/train': 1.5120006799697876} -08/30/2021 20:57:23 - INFO - __main__ - Step 43274: {'lr': 0.0004100378438510721, 'samples': 8308608, 'steps': 43273, 'loss/train': 1.1149519681930542} -08/30/2021 20:57:24 - INFO - __main__ - Step 43275: {'lr': 0.00041003376691504777, 'samples': 8308800, 'steps': 43274, 'loss/train': 1.576702356338501} -08/30/2021 20:57:25 - INFO - __main__ - Step 43276: {'lr': 0.0004100296899069147, 'samples': 8308992, 'steps': 43275, 'loss/train': 0.930472195148468} -08/30/2021 20:57:25 - INFO - __main__ - Step 43277: {'lr': 0.0004100256128266747, 'samples': 8309184, 'steps': 43276, 'loss/train': 1.6813923120498657} -08/30/2021 20:57:25 - INFO - __main__ - Step 43278: {'lr': 0.00041002153567432965, 'samples': 8309376, 'steps': 43277, 'loss/train': 0.9155459403991699} -08/30/2021 20:57:26 - INFO - __main__ - Step 43279: {'lr': 0.00041001745844988134, 'samples': 8309568, 'steps': 43278, 'loss/train': 1.7488728761672974} -08/30/2021 20:57:26 - INFO - __main__ - Step 43280: {'lr': 0.00041001338115333175, 'samples': 8309760, 'steps': 43279, 'loss/train': 0.9087408781051636} -08/30/2021 20:57:28 - INFO - __main__ - Step 43281: {'lr': 0.0004100093037846825, 'samples': 8309952, 'steps': 43280, 'loss/train': 1.424195647239685} -08/30/2021 20:57:28 - INFO - __main__ - Step 43282: {'lr': 0.0004100052263439355, 'samples': 8310144, 'steps': 43281, 'loss/train': 1.234944462776184} -08/30/2021 20:57:28 - INFO - __main__ - Step 43283: {'lr': 0.00041000114883109264, 'samples': 8310336, 'steps': 43282, 'loss/train': 1.565063238143921} -08/30/2021 20:57:29 - INFO - __main__ - Step 43284: {'lr': 0.00040999707124615573, 'samples': 8310528, 'steps': 43283, 'loss/train': 1.1456494331359863} -08/30/2021 20:57:29 - INFO - __main__ - Step 43285: {'lr': 0.00040999299358912664, 'samples': 8310720, 'steps': 43284, 'loss/train': 1.3309671878814697} -08/30/2021 20:57:31 - INFO - __main__ - Step 43286: {'lr': 0.00040998891586000716, 'samples': 8310912, 'steps': 43285, 'loss/train': 0.8662579655647278} -08/30/2021 20:57:31 - INFO - __main__ - Step 43287: {'lr': 0.0004099848380587992, 'samples': 8311104, 'steps': 43286, 'loss/train': 1.4355156421661377} -08/30/2021 20:57:31 - INFO - __main__ - Step 43288: {'lr': 0.00040998076018550444, 'samples': 8311296, 'steps': 43287, 'loss/train': 1.2939621210098267} -08/30/2021 20:57:32 - INFO - __main__ - Step 43289: {'lr': 0.00040997668224012485, 'samples': 8311488, 'steps': 43288, 'loss/train': 1.2802733182907104} -08/30/2021 20:57:32 - INFO - __main__ - Step 43290: {'lr': 0.00040997260422266223, 'samples': 8311680, 'steps': 43289, 'loss/train': 1.5579886436462402} -08/30/2021 20:57:33 - INFO - __main__ - Step 43291: {'lr': 0.00040996852613311844, 'samples': 8311872, 'steps': 43290, 'loss/train': 1.4921661615371704} -08/30/2021 20:57:34 - INFO - __main__ - Step 43292: {'lr': 0.00040996444797149526, 'samples': 8312064, 'steps': 43291, 'loss/train': 1.5541744232177734} -08/30/2021 20:57:34 - INFO - __main__ - Step 43293: {'lr': 0.0004099603697377946, 'samples': 8312256, 'steps': 43292, 'loss/train': 1.6156797409057617} -08/30/2021 20:57:35 - INFO - __main__ - Step 43294: {'lr': 0.0004099562914320183, 'samples': 8312448, 'steps': 43293, 'loss/train': 1.19282865524292} -08/30/2021 20:57:35 - INFO - __main__ - Step 43295: {'lr': 0.0004099522130541681, 'samples': 8312640, 'steps': 43294, 'loss/train': 1.2898142337799072} -08/30/2021 20:57:37 - INFO - __main__ - Step 43296: {'lr': 0.000409948134604246, 'samples': 8312832, 'steps': 43295, 'loss/train': 2.0650501251220703} -08/30/2021 20:57:37 - INFO - __main__ - Step 43297: {'lr': 0.0004099440560822536, 'samples': 8313024, 'steps': 43296, 'loss/train': 1.9747849702835083} -08/30/2021 20:57:38 - INFO - __main__ - Step 43298: {'lr': 0.000409939977488193, 'samples': 8313216, 'steps': 43297, 'loss/train': 1.3749817609786987} -08/30/2021 20:57:38 - INFO - __main__ - Step 43299: {'lr': 0.0004099358988220658, 'samples': 8313408, 'steps': 43298, 'loss/train': 1.4827638864517212} -08/30/2021 20:57:39 - INFO - __main__ - Step 43300: {'lr': 0.00040993182008387406, 'samples': 8313600, 'steps': 43299, 'loss/train': 1.8128889799118042} -08/30/2021 20:57:40 - INFO - __main__ - Step 43301: {'lr': 0.0004099277412736195, 'samples': 8313792, 'steps': 43300, 'loss/train': 1.1603326797485352} -08/30/2021 20:57:41 - INFO - __main__ - Step 43302: {'lr': 0.0004099236623913039, 'samples': 8313984, 'steps': 43301, 'loss/train': 1.1888824701309204} -08/30/2021 20:57:41 - INFO - __main__ - Step 43303: {'lr': 0.0004099195834369292, 'samples': 8314176, 'steps': 43302, 'loss/train': 0.5895113348960876} -08/30/2021 20:57:42 - INFO - __main__ - Step 43304: {'lr': 0.0004099155044104972, 'samples': 8314368, 'steps': 43303, 'loss/train': 1.690457820892334} -08/30/2021 20:57:42 - INFO - __main__ - Step 43305: {'lr': 0.00040991142531200973, 'samples': 8314560, 'steps': 43304, 'loss/train': 1.3655470609664917} -08/30/2021 20:57:42 - INFO - __main__ - Step 43306: {'lr': 0.0004099073461414686, 'samples': 8314752, 'steps': 43305, 'loss/train': 0.5894904732704163} -08/30/2021 20:57:44 - INFO - __main__ - Step 43307: {'lr': 0.0004099032668988758, 'samples': 8314944, 'steps': 43306, 'loss/train': 1.3736538887023926} -08/30/2021 20:57:45 - INFO - __main__ - Step 43308: {'lr': 0.00040989918758423306, 'samples': 8315136, 'steps': 43307, 'loss/train': 1.5043609142303467} -08/30/2021 20:57:45 - INFO - __main__ - Step 43309: {'lr': 0.0004098951081975421, 'samples': 8315328, 'steps': 43308, 'loss/train': 1.9528248310089111} -08/30/2021 20:57:45 - INFO - __main__ - Step 43310: {'lr': 0.0004098910287388049, 'samples': 8315520, 'steps': 43309, 'loss/train': 1.2753669023513794} -08/30/2021 20:57:46 - INFO - __main__ - Step 43311: {'lr': 0.00040988694920802326, 'samples': 8315712, 'steps': 43310, 'loss/train': 5.918020725250244} -08/30/2021 20:57:46 - INFO - __main__ - Step 43312: {'lr': 0.0004098828696051991, 'samples': 8315904, 'steps': 43311, 'loss/train': 5.878353118896484} -08/30/2021 20:57:47 - INFO - __main__ - Step 43313: {'lr': 0.00040987878993033417, 'samples': 8316096, 'steps': 43312, 'loss/train': 1.402848720550537} -08/30/2021 20:57:48 - INFO - __main__ - Step 43314: {'lr': 0.0004098747101834303, 'samples': 8316288, 'steps': 43313, 'loss/train': 0.8779363036155701} -08/30/2021 20:57:48 - INFO - __main__ - Step 43315: {'lr': 0.00040987063036448934, 'samples': 8316480, 'steps': 43314, 'loss/train': 1.0568691492080688} -08/30/2021 20:57:49 - INFO - __main__ - Step 43316: {'lr': 0.0004098665504735132, 'samples': 8316672, 'steps': 43315, 'loss/train': 1.6869804859161377} -08/30/2021 20:57:49 - INFO - __main__ - Step 43317: {'lr': 0.0004098624705105036, 'samples': 8316864, 'steps': 43316, 'loss/train': 0.6246923208236694} -08/30/2021 20:57:49 - INFO - __main__ - Step 43318: {'lr': 0.00040985839047546243, 'samples': 8317056, 'steps': 43317, 'loss/train': 1.9683358669281006} -08/30/2021 20:57:52 - INFO - __main__ - Step 43319: {'lr': 0.00040985431036839155, 'samples': 8317248, 'steps': 43318, 'loss/train': 1.346144437789917} -08/30/2021 20:57:52 - INFO - __main__ - Step 43320: {'lr': 0.00040985023018929277, 'samples': 8317440, 'steps': 43319, 'loss/train': 0.14741285145282745} -08/30/2021 20:57:52 - INFO - __main__ - Step 43321: {'lr': 0.000409846149938168, 'samples': 8317632, 'steps': 43320, 'loss/train': 1.372376799583435} -08/30/2021 20:57:53 - INFO - __main__ - Step 43322: {'lr': 0.000409842069615019, 'samples': 8317824, 'steps': 43321, 'loss/train': 1.4731149673461914} -08/30/2021 20:57:53 - INFO - __main__ - Step 43323: {'lr': 0.0004098379892198476, 'samples': 8318016, 'steps': 43322, 'loss/train': 0.18085931241512299} -08/30/2021 20:57:54 - INFO - __main__ - Step 43324: {'lr': 0.0004098339087526557, 'samples': 8318208, 'steps': 43323, 'loss/train': 0.05744965746998787} -08/30/2021 20:57:54 - INFO - __main__ - Step 43325: {'lr': 0.00040982982821344505, 'samples': 8318400, 'steps': 43324, 'loss/train': 0.554118275642395} -08/30/2021 20:57:56 - INFO - __main__ - Step 43326: {'lr': 0.0004098257476022176, 'samples': 8318592, 'steps': 43325, 'loss/train': 0.48451897501945496} -08/30/2021 20:57:56 - INFO - __main__ - Step 43327: {'lr': 0.00040982166691897517, 'samples': 8318784, 'steps': 43326, 'loss/train': 1.301076054573059} -08/30/2021 20:57:56 - INFO - __main__ - Step 43328: {'lr': 0.00040981758616371943, 'samples': 8318976, 'steps': 43327, 'loss/train': 1.4311808347702026} -08/30/2021 20:57:57 - INFO - __main__ - Step 43329: {'lr': 0.00040981350533645245, 'samples': 8319168, 'steps': 43328, 'loss/train': 1.9092429876327515} -08/30/2021 20:57:57 - INFO - __main__ - Step 43330: {'lr': 0.00040980942443717596, 'samples': 8319360, 'steps': 43329, 'loss/train': 1.692765712738037} -08/30/2021 20:57:58 - INFO - __main__ - Step 43331: {'lr': 0.0004098053434658918, 'samples': 8319552, 'steps': 43330, 'loss/train': 1.0924246311187744} -08/30/2021 20:57:59 - INFO - __main__ - Step 43332: {'lr': 0.0004098012624226018, 'samples': 8319744, 'steps': 43331, 'loss/train': 1.207492470741272} -08/30/2021 20:57:59 - INFO - __main__ - Step 43333: {'lr': 0.00040979718130730786, 'samples': 8319936, 'steps': 43332, 'loss/train': 1.9438953399658203} -08/30/2021 20:58:00 - INFO - __main__ - Step 43334: {'lr': 0.0004097931001200118, 'samples': 8320128, 'steps': 43333, 'loss/train': 1.279848337173462} -08/30/2021 20:58:00 - INFO - __main__ - Step 43335: {'lr': 0.00040978901886071543, 'samples': 8320320, 'steps': 43334, 'loss/train': 0.936413049697876} -08/30/2021 20:58:00 - INFO - __main__ - Step 43336: {'lr': 0.0004097849375294205, 'samples': 8320512, 'steps': 43335, 'loss/train': 1.6210170984268188} -08/30/2021 20:58:02 - INFO - __main__ - Step 43337: {'lr': 0.000409780856126129, 'samples': 8320704, 'steps': 43336, 'loss/train': 1.6832184791564941} -08/30/2021 20:58:03 - INFO - __main__ - Step 43338: {'lr': 0.00040977677465084275, 'samples': 8320896, 'steps': 43337, 'loss/train': 1.524421215057373} -08/30/2021 20:58:03 - INFO - __main__ - Step 43339: {'lr': 0.00040977269310356345, 'samples': 8321088, 'steps': 43338, 'loss/train': 1.1104391813278198} -08/30/2021 20:58:03 - INFO - __main__ - Step 43340: {'lr': 0.00040976861148429313, 'samples': 8321280, 'steps': 43339, 'loss/train': 2.2770543098449707} -08/30/2021 20:58:04 - INFO - __main__ - Step 43341: {'lr': 0.0004097645297930335, 'samples': 8321472, 'steps': 43340, 'loss/train': 0.0981130376458168} -08/30/2021 20:58:05 - INFO - __main__ - Step 43342: {'lr': 0.00040976044802978645, 'samples': 8321664, 'steps': 43341, 'loss/train': 1.6146026849746704} -08/30/2021 20:58:06 - INFO - __main__ - Step 43343: {'lr': 0.0004097563661945538, 'samples': 8321856, 'steps': 43342, 'loss/train': 1.3437130451202393} -08/30/2021 20:58:06 - INFO - __main__ - Step 43344: {'lr': 0.0004097522842873374, 'samples': 8322048, 'steps': 43343, 'loss/train': 1.407339334487915} -08/30/2021 20:58:06 - INFO - __main__ - Step 43345: {'lr': 0.0004097482023081391, 'samples': 8322240, 'steps': 43344, 'loss/train': 1.2994706630706787} -08/30/2021 20:58:07 - INFO - __main__ - Step 43346: {'lr': 0.00040974412025696067, 'samples': 8322432, 'steps': 43345, 'loss/train': 1.680964708328247} -08/30/2021 20:58:08 - INFO - __main__ - Step 43347: {'lr': 0.0004097400381338041, 'samples': 8322624, 'steps': 43346, 'loss/train': 1.319219708442688} -08/30/2021 20:58:09 - INFO - __main__ - Step 43348: {'lr': 0.0004097359559386711, 'samples': 8322816, 'steps': 43347, 'loss/train': 1.5931075811386108} -08/30/2021 20:58:09 - INFO - __main__ - Step 43349: {'lr': 0.0004097318736715635, 'samples': 8323008, 'steps': 43348, 'loss/train': 1.4774757623672485} -08/30/2021 20:58:09 - INFO - __main__ - Step 43350: {'lr': 0.0004097277913324832, 'samples': 8323200, 'steps': 43349, 'loss/train': 1.358873963356018} -08/30/2021 20:58:10 - INFO - __main__ - Step 43351: {'lr': 0.000409723708921432, 'samples': 8323392, 'steps': 43350, 'loss/train': 1.7013866901397705} -08/30/2021 20:58:10 - INFO - __main__ - Step 43352: {'lr': 0.0004097196264384118, 'samples': 8323584, 'steps': 43351, 'loss/train': 1.1859010457992554} -08/30/2021 20:58:12 - INFO - __main__ - Step 43353: {'lr': 0.00040971554388342436, 'samples': 8323776, 'steps': 43352, 'loss/train': 1.1149338483810425} -08/30/2021 20:58:13 - INFO - __main__ - Step 43354: {'lr': 0.00040971146125647165, 'samples': 8323968, 'steps': 43353, 'loss/train': 1.788057804107666} -08/30/2021 20:58:13 - INFO - __main__ - Step 43355: {'lr': 0.00040970737855755535, 'samples': 8324160, 'steps': 43354, 'loss/train': 1.388297200202942} -08/30/2021 20:58:14 - INFO - __main__ - Step 43356: {'lr': 0.00040970329578667735, 'samples': 8324352, 'steps': 43355, 'loss/train': 0.2147456854581833} -08/30/2021 20:58:14 - INFO - __main__ - Step 43357: {'lr': 0.00040969921294383956, 'samples': 8324544, 'steps': 43356, 'loss/train': 1.1008005142211914} -08/30/2021 20:58:16 - INFO - __main__ - Step 43358: {'lr': 0.00040969513002904375, 'samples': 8324736, 'steps': 43357, 'loss/train': 1.5434210300445557} -08/30/2021 20:58:16 - INFO - __main__ - Step 43359: {'lr': 0.0004096910470422918, 'samples': 8324928, 'steps': 43358, 'loss/train': 1.9454022645950317} -08/30/2021 20:58:16 - INFO - __main__ - Step 43360: {'lr': 0.0004096869639835855, 'samples': 8325120, 'steps': 43359, 'loss/train': 1.454698085784912} -08/30/2021 20:58:17 - INFO - __main__ - Step 43361: {'lr': 0.0004096828808529267, 'samples': 8325312, 'steps': 43360, 'loss/train': 0.07345447689294815} -08/30/2021 20:58:17 - INFO - __main__ - Step 43362: {'lr': 0.0004096787976503173, 'samples': 8325504, 'steps': 43361, 'loss/train': 0.7993736863136292} -08/30/2021 20:58:18 - INFO - __main__ - Step 43363: {'lr': 0.0004096747143757591, 'samples': 8325696, 'steps': 43362, 'loss/train': 1.400583028793335} -08/30/2021 20:58:19 - INFO - __main__ - Step 43364: {'lr': 0.0004096706310292539, 'samples': 8325888, 'steps': 43363, 'loss/train': 1.705430030822754} -08/30/2021 20:58:19 - INFO - __main__ - Step 43365: {'lr': 0.0004096665476108036, 'samples': 8326080, 'steps': 43364, 'loss/train': 1.1131094694137573} -08/30/2021 20:58:20 - INFO - __main__ - Step 43366: {'lr': 0.00040966246412040995, 'samples': 8326272, 'steps': 43365, 'loss/train': 1.2293146848678589} -08/30/2021 20:58:20 - INFO - __main__ - Step 43367: {'lr': 0.00040965838055807493, 'samples': 8326464, 'steps': 43366, 'loss/train': 1.9997642040252686} -08/30/2021 20:58:20 - INFO - __main__ - Step 43368: {'lr': 0.00040965429692380034, 'samples': 8326656, 'steps': 43367, 'loss/train': 1.0075520277023315} -08/30/2021 20:58:22 - INFO - __main__ - Step 43369: {'lr': 0.00040965021321758796, 'samples': 8326848, 'steps': 43368, 'loss/train': 1.459784984588623} -08/30/2021 20:58:22 - INFO - __main__ - Step 43370: {'lr': 0.00040964612943943964, 'samples': 8327040, 'steps': 43369, 'loss/train': 1.4586421251296997} -08/30/2021 20:58:23 - INFO - __main__ - Step 43371: {'lr': 0.00040964204558935726, 'samples': 8327232, 'steps': 43370, 'loss/train': 1.2619712352752686} -08/30/2021 20:58:23 - INFO - __main__ - Step 43372: {'lr': 0.00040963796166734257, 'samples': 8327424, 'steps': 43371, 'loss/train': 0.8410171866416931} -08/30/2021 20:58:23 - INFO - __main__ - Step 43373: {'lr': 0.00040963387767339757, 'samples': 8327616, 'steps': 43372, 'loss/train': 1.6045360565185547} -08/30/2021 20:58:25 - INFO - __main__ - Step 43374: {'lr': 0.00040962979360752394, 'samples': 8327808, 'steps': 43373, 'loss/train': 1.0213145017623901} -08/30/2021 20:58:25 - INFO - __main__ - Step 43375: {'lr': 0.0004096257094697236, 'samples': 8328000, 'steps': 43374, 'loss/train': 0.8814600706100464} -08/30/2021 20:58:26 - INFO - __main__ - Step 43376: {'lr': 0.00040962162525999833, 'samples': 8328192, 'steps': 43375, 'loss/train': 1.1390459537506104} -08/30/2021 20:58:26 - INFO - __main__ - Step 43377: {'lr': 0.00040961754097835015, 'samples': 8328384, 'steps': 43376, 'loss/train': 0.8413316011428833} -08/30/2021 20:58:26 - INFO - __main__ - Step 43378: {'lr': 0.00040961345662478065, 'samples': 8328576, 'steps': 43377, 'loss/train': 1.6547396183013916} -08/30/2021 20:58:28 - INFO - __main__ - Step 43379: {'lr': 0.00040960937219929186, 'samples': 8328768, 'steps': 43378, 'loss/train': 1.0291426181793213} -08/30/2021 20:58:29 - INFO - __main__ - Step 43380: {'lr': 0.00040960528770188554, 'samples': 8328960, 'steps': 43379, 'loss/train': 1.0927127599716187} -08/30/2021 20:58:29 - INFO - __main__ - Step 43381: {'lr': 0.00040960120313256356, 'samples': 8329152, 'steps': 43380, 'loss/train': 1.1517938375473022} -08/30/2021 20:58:30 - INFO - __main__ - Step 43382: {'lr': 0.0004095971184913277, 'samples': 8329344, 'steps': 43381, 'loss/train': 1.6215919256210327} -08/30/2021 20:58:30 - INFO - __main__ - Step 43383: {'lr': 0.0004095930337781798, 'samples': 8329536, 'steps': 43382, 'loss/train': 1.6278475522994995} -08/30/2021 20:58:30 - INFO - __main__ - Step 43384: {'lr': 0.00040958894899312183, 'samples': 8329728, 'steps': 43383, 'loss/train': 1.1109435558319092} -08/30/2021 20:58:32 - INFO - __main__ - Step 43385: {'lr': 0.0004095848641361555, 'samples': 8329920, 'steps': 43384, 'loss/train': 1.0669652223587036} -08/30/2021 20:58:32 - INFO - __main__ - Step 43386: {'lr': 0.0004095807792072827, 'samples': 8330112, 'steps': 43385, 'loss/train': 1.3824292421340942} -08/30/2021 20:58:32 - INFO - __main__ - Step 43387: {'lr': 0.00040957669420650525, 'samples': 8330304, 'steps': 43386, 'loss/train': 1.7778005599975586} -08/30/2021 20:58:33 - INFO - __main__ - Step 43388: {'lr': 0.000409572609133825, 'samples': 8330496, 'steps': 43387, 'loss/train': 1.4954004287719727} -08/30/2021 20:58:33 - INFO - __main__ - Step 43389: {'lr': 0.00040956852398924383, 'samples': 8330688, 'steps': 43388, 'loss/train': 1.5687731504440308} -08/30/2021 20:58:35 - INFO - __main__ - Step 43390: {'lr': 0.0004095644387727635, 'samples': 8330880, 'steps': 43389, 'loss/train': 2.525780439376831} -08/30/2021 20:58:35 - INFO - __main__ - Step 43391: {'lr': 0.0004095603534843859, 'samples': 8331072, 'steps': 43390, 'loss/train': 1.3043450117111206} -08/30/2021 20:58:35 - INFO - __main__ - Step 43392: {'lr': 0.00040955626812411297, 'samples': 8331264, 'steps': 43391, 'loss/train': 1.4299070835113525} -08/30/2021 20:58:36 - INFO - __main__ - Step 43393: {'lr': 0.0004095521826919463, 'samples': 8331456, 'steps': 43392, 'loss/train': 1.1157358884811401} -08/30/2021 20:58:36 - INFO - __main__ - Step 43394: {'lr': 0.0004095480971878879, 'samples': 8331648, 'steps': 43393, 'loss/train': 1.221972942352295} -08/30/2021 20:58:38 - INFO - __main__ - Step 43395: {'lr': 0.0004095440116119397, 'samples': 8331840, 'steps': 43394, 'loss/train': 1.6612670421600342} -08/30/2021 20:58:38 - INFO - __main__ - Step 43396: {'lr': 0.00040953992596410335, 'samples': 8332032, 'steps': 43395, 'loss/train': 1.297799825668335} -08/30/2021 20:58:38 - INFO - __main__ - Step 43397: {'lr': 0.0004095358402443808, 'samples': 8332224, 'steps': 43396, 'loss/train': 1.5782296657562256} -08/30/2021 20:58:39 - INFO - __main__ - Step 43398: {'lr': 0.0004095317544527738, 'samples': 8332416, 'steps': 43397, 'loss/train': 1.165611743927002} -08/30/2021 20:58:39 - INFO - __main__ - Step 43399: {'lr': 0.00040952766858928433, 'samples': 8332608, 'steps': 43398, 'loss/train': 0.9418405294418335} -08/30/2021 20:58:41 - INFO - __main__ - Step 43400: {'lr': 0.0004095235826539141, 'samples': 8332800, 'steps': 43399, 'loss/train': 1.2756699323654175} -08/30/2021 20:58:41 - INFO - __main__ - Step 43401: {'lr': 0.00040951949664666504, 'samples': 8332992, 'steps': 43400, 'loss/train': 0.5364533066749573} -08/30/2021 20:58:41 - INFO - __main__ - Step 43402: {'lr': 0.00040951541056753895, 'samples': 8333184, 'steps': 43401, 'loss/train': 2.167762279510498} -08/30/2021 20:58:42 - INFO - __main__ - Step 43403: {'lr': 0.00040951132441653773, 'samples': 8333376, 'steps': 43402, 'loss/train': 1.5748502016067505} -08/30/2021 20:58:42 - INFO - __main__ - Step 43404: {'lr': 0.00040950723819366307, 'samples': 8333568, 'steps': 43403, 'loss/train': 0.9157592058181763} -08/30/2021 20:58:44 - INFO - __main__ - Step 43405: {'lr': 0.000409503151898917, 'samples': 8333760, 'steps': 43404, 'loss/train': 0.4294249415397644} -08/30/2021 20:58:44 - INFO - __main__ - Step 43406: {'lr': 0.0004094990655323012, 'samples': 8333952, 'steps': 43405, 'loss/train': 1.1591331958770752} -08/30/2021 20:58:44 - INFO - __main__ - Step 43407: {'lr': 0.00040949497909381757, 'samples': 8334144, 'steps': 43406, 'loss/train': 0.509672224521637} -08/30/2021 20:58:45 - INFO - __main__ - Step 43408: {'lr': 0.000409490892583468, 'samples': 8334336, 'steps': 43407, 'loss/train': 1.084208607673645} -08/30/2021 20:58:45 - INFO - __main__ - Step 43409: {'lr': 0.0004094868060012543, 'samples': 8334528, 'steps': 43408, 'loss/train': 0.672725260257721} -08/30/2021 20:58:47 - INFO - __main__ - Step 43410: {'lr': 0.0004094827193471783, 'samples': 8334720, 'steps': 43409, 'loss/train': 1.4566689729690552} -08/30/2021 20:58:48 - INFO - __main__ - Step 43411: {'lr': 0.00040947863262124186, 'samples': 8334912, 'steps': 43410, 'loss/train': 1.4267734289169312} -08/30/2021 20:58:48 - INFO - __main__ - Step 43412: {'lr': 0.0004094745458234468, 'samples': 8335104, 'steps': 43411, 'loss/train': 1.5116239786148071} -08/30/2021 20:58:49 - INFO - __main__ - Step 43413: {'lr': 0.00040947045895379494, 'samples': 8335296, 'steps': 43412, 'loss/train': 1.513641595840454} -08/30/2021 20:58:49 - INFO - __main__ - Step 43414: {'lr': 0.00040946637201228815, 'samples': 8335488, 'steps': 43413, 'loss/train': 0.3500490188598633} -08/30/2021 20:58:49 - INFO - __main__ - Step 43415: {'lr': 0.00040946228499892835, 'samples': 8335680, 'steps': 43414, 'loss/train': 1.5490992069244385} -08/30/2021 20:58:51 - INFO - __main__ - Step 43416: {'lr': 0.0004094581979137172, 'samples': 8335872, 'steps': 43415, 'loss/train': 1.1055530309677124} -08/30/2021 20:58:51 - INFO - __main__ - Step 43417: {'lr': 0.00040945411075665674, 'samples': 8336064, 'steps': 43416, 'loss/train': 1.5763269662857056} -08/30/2021 20:58:52 - INFO - __main__ - Step 43418: {'lr': 0.0004094500235277486, 'samples': 8336256, 'steps': 43417, 'loss/train': 1.535204291343689} -08/30/2021 20:58:52 - INFO - __main__ - Step 43419: {'lr': 0.0004094459362269949, 'samples': 8336448, 'steps': 43418, 'loss/train': 1.4099704027175903} -08/30/2021 20:58:52 - INFO - __main__ - Step 43420: {'lr': 0.0004094418488543972, 'samples': 8336640, 'steps': 43419, 'loss/train': 1.3240219354629517} -08/30/2021 20:58:54 - INFO - __main__ - Step 43421: {'lr': 0.00040943776140995756, 'samples': 8336832, 'steps': 43420, 'loss/train': 1.636500597000122} -08/30/2021 20:58:54 - INFO - __main__ - Step 43422: {'lr': 0.0004094336738936777, 'samples': 8337024, 'steps': 43421, 'loss/train': 1.5919028520584106} -08/30/2021 20:58:55 - INFO - __main__ - Step 43423: {'lr': 0.0004094295863055594, 'samples': 8337216, 'steps': 43422, 'loss/train': 1.3845083713531494} -08/30/2021 20:58:55 - INFO - __main__ - Step 43424: {'lr': 0.0004094254986456046, 'samples': 8337408, 'steps': 43423, 'loss/train': 1.5208150148391724} -08/30/2021 20:58:55 - INFO - __main__ - Step 43425: {'lr': 0.0004094214109138152, 'samples': 8337600, 'steps': 43424, 'loss/train': 1.5718562602996826} -08/30/2021 20:58:57 - INFO - __main__ - Step 43426: {'lr': 0.000409417323110193, 'samples': 8337792, 'steps': 43425, 'loss/train': 1.39116370677948} -08/30/2021 20:58:57 - INFO - __main__ - Step 43427: {'lr': 0.00040941323523473975, 'samples': 8337984, 'steps': 43426, 'loss/train': 0.9971347451210022} -08/30/2021 20:58:58 - INFO - __main__ - Step 43428: {'lr': 0.00040940914728745736, 'samples': 8338176, 'steps': 43427, 'loss/train': 1.3643150329589844} -08/30/2021 20:58:58 - INFO - __main__ - Step 43429: {'lr': 0.0004094050592683477, 'samples': 8338368, 'steps': 43428, 'loss/train': 2.310330390930176} -08/30/2021 20:58:58 - INFO - __main__ - Step 43430: {'lr': 0.00040940097117741255, 'samples': 8338560, 'steps': 43429, 'loss/train': 1.6164817810058594} -08/30/2021 20:58:59 - INFO - __main__ - Step 43431: {'lr': 0.00040939688301465377, 'samples': 8338752, 'steps': 43430, 'loss/train': 1.855127215385437} -08/30/2021 20:59:00 - INFO - __main__ - Step 43432: {'lr': 0.0004093927947800732, 'samples': 8338944, 'steps': 43431, 'loss/train': 2.8005080223083496} -08/30/2021 20:59:01 - INFO - __main__ - Step 43433: {'lr': 0.00040938870647367275, 'samples': 8339136, 'steps': 43432, 'loss/train': 0.2542159855365753} -08/30/2021 20:59:01 - INFO - __main__ - Step 43434: {'lr': 0.0004093846180954542, 'samples': 8339328, 'steps': 43433, 'loss/train': 1.6060121059417725} -08/30/2021 20:59:02 - INFO - __main__ - Step 43435: {'lr': 0.00040938052964541936, 'samples': 8339520, 'steps': 43434, 'loss/train': 1.561721682548523} -08/30/2021 20:59:02 - INFO - __main__ - Step 43436: {'lr': 0.0004093764411235702, 'samples': 8339712, 'steps': 43435, 'loss/train': 1.6833140850067139} -08/30/2021 20:59:04 - INFO - __main__ - Step 43437: {'lr': 0.00040937235252990834, 'samples': 8339904, 'steps': 43436, 'loss/train': 1.2376240491867065} -08/30/2021 20:59:04 - INFO - __main__ - Step 43438: {'lr': 0.00040936826386443585, 'samples': 8340096, 'steps': 43437, 'loss/train': 1.8350682258605957} -08/30/2021 20:59:04 - INFO - __main__ - Step 43439: {'lr': 0.00040936417512715454, 'samples': 8340288, 'steps': 43438, 'loss/train': 1.7881381511688232} -08/30/2021 20:59:05 - INFO - __main__ - Step 43440: {'lr': 0.00040936008631806603, 'samples': 8340480, 'steps': 43439, 'loss/train': 1.2008146047592163} -08/30/2021 20:59:05 - INFO - __main__ - Step 43441: {'lr': 0.00040935599743717243, 'samples': 8340672, 'steps': 43440, 'loss/train': 1.6067630052566528} -08/30/2021 20:59:07 - INFO - __main__ - Step 43442: {'lr': 0.00040935190848447544, 'samples': 8340864, 'steps': 43441, 'loss/train': 1.3503886461257935} -08/30/2021 20:59:07 - INFO - __main__ - Step 43443: {'lr': 0.000409347819459977, 'samples': 8341056, 'steps': 43442, 'loss/train': 1.217471718788147} -08/30/2021 20:59:08 - INFO - __main__ - Step 43444: {'lr': 0.0004093437303636788, 'samples': 8341248, 'steps': 43443, 'loss/train': 2.0348846912384033} -08/30/2021 20:59:08 - INFO - __main__ - Step 43445: {'lr': 0.0004093396411955829, 'samples': 8341440, 'steps': 43444, 'loss/train': 0.8413245677947998} -08/30/2021 20:59:08 - INFO - __main__ - Step 43446: {'lr': 0.0004093355519556908, 'samples': 8341632, 'steps': 43445, 'loss/train': 1.2147419452667236} -08/30/2021 20:59:10 - INFO - __main__ - Step 43447: {'lr': 0.0004093314626440048, 'samples': 8341824, 'steps': 43446, 'loss/train': 1.4269837141036987} -08/30/2021 20:59:10 - INFO - __main__ - Step 43448: {'lr': 0.0004093273732605264, 'samples': 8342016, 'steps': 43447, 'loss/train': 1.7882280349731445} -08/30/2021 20:59:11 - INFO - __main__ - Step 43449: {'lr': 0.0004093232838052575, 'samples': 8342208, 'steps': 43448, 'loss/train': 1.3685007095336914} -08/30/2021 20:59:11 - INFO - __main__ - Step 43450: {'lr': 0.0004093191942782001, 'samples': 8342400, 'steps': 43449, 'loss/train': 1.5755748748779297} -08/30/2021 20:59:11 - INFO - __main__ - Step 43451: {'lr': 0.0004093151046793558, 'samples': 8342592, 'steps': 43450, 'loss/train': 1.5783625841140747} -08/30/2021 20:59:13 - INFO - __main__ - Step 43452: {'lr': 0.00040931101500872656, 'samples': 8342784, 'steps': 43451, 'loss/train': 1.5340065956115723} -08/30/2021 20:59:13 - INFO - __main__ - Step 43453: {'lr': 0.00040930692526631443, 'samples': 8342976, 'steps': 43452, 'loss/train': 1.3310062885284424} -08/30/2021 20:59:14 - INFO - __main__ - Step 43454: {'lr': 0.0004093028354521209, 'samples': 8343168, 'steps': 43453, 'loss/train': 1.7738624811172485} -08/30/2021 20:59:14 - INFO - __main__ - Step 43455: {'lr': 0.000409298745566148, 'samples': 8343360, 'steps': 43454, 'loss/train': 1.6138641834259033} -08/30/2021 20:59:14 - INFO - __main__ - Step 43456: {'lr': 0.00040929465560839753, 'samples': 8343552, 'steps': 43455, 'loss/train': 1.0026392936706543} -08/30/2021 20:59:15 - INFO - __main__ - Step 43457: {'lr': 0.00040929056557887137, 'samples': 8343744, 'steps': 43456, 'loss/train': 1.594305396080017} -08/30/2021 20:59:17 - INFO - __main__ - Step 43458: {'lr': 0.0004092864754775713, 'samples': 8343936, 'steps': 43457, 'loss/train': 1.7979779243469238} -08/30/2021 20:59:17 - INFO - __main__ - Step 43459: {'lr': 0.00040928238530449926, 'samples': 8344128, 'steps': 43458, 'loss/train': 1.6893632411956787} -08/30/2021 20:59:17 - INFO - __main__ - Step 43460: {'lr': 0.00040927829505965694, 'samples': 8344320, 'steps': 43459, 'loss/train': 1.198866844177246} -08/30/2021 20:59:18 - INFO - __main__ - Step 43461: {'lr': 0.00040927420474304646, 'samples': 8344512, 'steps': 43460, 'loss/train': 1.4430618286132812} -08/30/2021 20:59:18 - INFO - __main__ - Step 43462: {'lr': 0.00040927011435466933, 'samples': 8344704, 'steps': 43461, 'loss/train': 2.045926332473755} -08/30/2021 20:59:20 - INFO - __main__ - Step 43463: {'lr': 0.0004092660238945276, 'samples': 8344896, 'steps': 43462, 'loss/train': 0.4425169825553894} -08/30/2021 20:59:21 - INFO - __main__ - Step 43464: {'lr': 0.00040926193336262304, 'samples': 8345088, 'steps': 43463, 'loss/train': 1.5673891305923462} -08/30/2021 20:59:21 - INFO - __main__ - Step 43465: {'lr': 0.0004092578427589575, 'samples': 8345280, 'steps': 43464, 'loss/train': 1.622633695602417} -08/30/2021 20:59:21 - INFO - __main__ - Step 43466: {'lr': 0.0004092537520835328, 'samples': 8345472, 'steps': 43465, 'loss/train': 0.8515864610671997} -08/30/2021 20:59:22 - INFO - __main__ - Step 43467: {'lr': 0.0004092496613363509, 'samples': 8345664, 'steps': 43466, 'loss/train': 1.6168700456619263} -08/30/2021 20:59:22 - INFO - __main__ - Step 43468: {'lr': 0.0004092455705174135, 'samples': 8345856, 'steps': 43467, 'loss/train': 1.315977692604065} -08/30/2021 20:59:23 - INFO - __main__ - Step 43469: {'lr': 0.00040924147962672253, 'samples': 8346048, 'steps': 43468, 'loss/train': 1.5509092807769775} -08/30/2021 20:59:24 - INFO - __main__ - Step 43470: {'lr': 0.00040923738866427986, 'samples': 8346240, 'steps': 43469, 'loss/train': 1.4158509969711304} -08/30/2021 20:59:24 - INFO - __main__ - Step 43471: {'lr': 0.00040923329763008714, 'samples': 8346432, 'steps': 43470, 'loss/train': 1.3277255296707153} -08/30/2021 20:59:24 - INFO - __main__ - Step 43472: {'lr': 0.0004092292065241464, 'samples': 8346624, 'steps': 43471, 'loss/train': 1.3438161611557007} -08/30/2021 20:59:25 - INFO - __main__ - Step 43473: {'lr': 0.00040922511534645953, 'samples': 8346816, 'steps': 43472, 'loss/train': 1.7162595987319946} -08/30/2021 20:59:27 - INFO - __main__ - Step 43474: {'lr': 0.0004092210240970282, 'samples': 8347008, 'steps': 43473, 'loss/train': 0.415038138628006} -08/30/2021 20:59:27 - INFO - __main__ - Step 43475: {'lr': 0.0004092169327758544, 'samples': 8347200, 'steps': 43474, 'loss/train': 2.0186753273010254} -08/30/2021 20:59:27 - INFO - __main__ - Step 43476: {'lr': 0.0004092128413829398, 'samples': 8347392, 'steps': 43475, 'loss/train': 1.492740273475647} -08/30/2021 20:59:28 - INFO - __main__ - Step 43477: {'lr': 0.0004092087499182864, 'samples': 8347584, 'steps': 43476, 'loss/train': 1.8593817949295044} -08/30/2021 20:59:28 - INFO - __main__ - Step 43478: {'lr': 0.000409204658381896, 'samples': 8347776, 'steps': 43477, 'loss/train': 1.3084630966186523} -08/30/2021 20:59:29 - INFO - __main__ - Step 43479: {'lr': 0.00040920056677377047, 'samples': 8347968, 'steps': 43478, 'loss/train': 1.449884295463562} -08/30/2021 20:59:30 - INFO - __main__ - Step 43480: {'lr': 0.00040919647509391155, 'samples': 8348160, 'steps': 43479, 'loss/train': 1.1660586595535278} -08/30/2021 20:59:30 - INFO - __main__ - Step 43481: {'lr': 0.0004091923833423212, 'samples': 8348352, 'steps': 43480, 'loss/train': 1.6018120050430298} -08/30/2021 20:59:31 - INFO - __main__ - Step 43482: {'lr': 0.00040918829151900127, 'samples': 8348544, 'steps': 43481, 'loss/train': 1.1463183164596558} -08/30/2021 20:59:31 - INFO - __main__ - Step 43483: {'lr': 0.0004091841996239535, 'samples': 8348736, 'steps': 43482, 'loss/train': 1.4388169050216675} -08/30/2021 20:59:33 - INFO - __main__ - Step 43484: {'lr': 0.00040918010765717976, 'samples': 8348928, 'steps': 43483, 'loss/train': 2.377580165863037} -08/30/2021 20:59:33 - INFO - __main__ - Step 43485: {'lr': 0.00040917601561868194, 'samples': 8349120, 'steps': 43484, 'loss/train': 1.4399527311325073} -08/30/2021 20:59:33 - INFO - __main__ - Step 43486: {'lr': 0.00040917192350846187, 'samples': 8349312, 'steps': 43485, 'loss/train': 1.2692066431045532} -08/30/2021 20:59:34 - INFO - __main__ - Step 43487: {'lr': 0.00040916783132652134, 'samples': 8349504, 'steps': 43486, 'loss/train': 1.2149641513824463} -08/30/2021 20:59:34 - INFO - __main__ - Step 43488: {'lr': 0.0004091637390728623, 'samples': 8349696, 'steps': 43487, 'loss/train': 1.3833638429641724} -08/30/2021 20:59:36 - INFO - __main__ - Step 43489: {'lr': 0.00040915964674748665, 'samples': 8349888, 'steps': 43488, 'loss/train': 1.2569570541381836} -08/30/2021 20:59:36 - INFO - __main__ - Step 43490: {'lr': 0.0004091555543503959, 'samples': 8350080, 'steps': 43489, 'loss/train': 1.5424100160598755} -08/30/2021 20:59:36 - INFO - __main__ - Step 43491: {'lr': 0.00040915146188159223, 'samples': 8350272, 'steps': 43490, 'loss/train': 1.5001763105392456} -08/30/2021 20:59:37 - INFO - __main__ - Step 43492: {'lr': 0.0004091473693410773, 'samples': 8350464, 'steps': 43491, 'loss/train': 1.5339666604995728} -08/30/2021 20:59:37 - INFO - __main__ - Step 43493: {'lr': 0.0004091432767288531, 'samples': 8350656, 'steps': 43492, 'loss/train': 1.5622690916061401} -08/30/2021 20:59:38 - INFO - __main__ - Step 43494: {'lr': 0.0004091391840449213, 'samples': 8350848, 'steps': 43493, 'loss/train': 0.9105747938156128} -08/30/2021 20:59:39 - INFO - __main__ - Step 43495: {'lr': 0.00040913509128928394, 'samples': 8351040, 'steps': 43494, 'loss/train': 0.9648832082748413} -08/30/2021 20:59:39 - INFO - __main__ - Step 43496: {'lr': 0.00040913099846194274, 'samples': 8351232, 'steps': 43495, 'loss/train': 0.9120098352432251} -08/30/2021 20:59:40 - INFO - __main__ - Step 43497: {'lr': 0.00040912690556289957, 'samples': 8351424, 'steps': 43496, 'loss/train': 0.5447750091552734} -08/30/2021 20:59:40 - INFO - __main__ - Step 43498: {'lr': 0.0004091228125921562, 'samples': 8351616, 'steps': 43497, 'loss/train': 1.810316801071167} -08/30/2021 20:59:40 - INFO - __main__ - Step 43499: {'lr': 0.0004091187195497146, 'samples': 8351808, 'steps': 43498, 'loss/train': 1.1804993152618408} -08/30/2021 20:59:42 - INFO - __main__ - Step 43500: {'lr': 0.00040911462643557656, 'samples': 8352000, 'steps': 43499, 'loss/train': 1.554088830947876} -08/30/2021 20:59:42 - INFO - __main__ - Step 43501: {'lr': 0.0004091105332497439, 'samples': 8352192, 'steps': 43500, 'loss/train': 1.2700055837631226} -08/30/2021 20:59:43 - INFO - __main__ - Step 43502: {'lr': 0.0004091064399922185, 'samples': 8352384, 'steps': 43501, 'loss/train': 1.230256199836731} -08/30/2021 20:59:43 - INFO - __main__ - Step 43503: {'lr': 0.0004091023466630023, 'samples': 8352576, 'steps': 43502, 'loss/train': 1.2320678234100342} -08/30/2021 20:59:43 - INFO - __main__ - Step 43504: {'lr': 0.00040909825326209694, 'samples': 8352768, 'steps': 43503, 'loss/train': 1.304828405380249} -08/30/2021 20:59:45 - INFO - __main__ - Step 43505: {'lr': 0.0004090941597895043, 'samples': 8352960, 'steps': 43504, 'loss/train': 1.513417363166809} -08/30/2021 20:59:45 - INFO - __main__ - Step 43506: {'lr': 0.0004090900662452264, 'samples': 8353152, 'steps': 43505, 'loss/train': 0.8245118856430054} -08/30/2021 20:59:46 - INFO - __main__ - Step 43507: {'lr': 0.00040908597262926484, 'samples': 8353344, 'steps': 43506, 'loss/train': 0.46327120065689087} -08/30/2021 20:59:46 - INFO - __main__ - Step 43508: {'lr': 0.0004090818789416217, 'samples': 8353536, 'steps': 43507, 'loss/train': 1.8288776874542236} -08/30/2021 20:59:46 - INFO - __main__ - Step 43509: {'lr': 0.0004090777851822988, 'samples': 8353728, 'steps': 43508, 'loss/train': 1.6535285711288452} -08/30/2021 20:59:48 - INFO - __main__ - Step 43510: {'lr': 0.0004090736913512977, 'samples': 8353920, 'steps': 43509, 'loss/train': 1.4248156547546387} -08/30/2021 20:59:48 - INFO - __main__ - Step 43511: {'lr': 0.0004090695974486206, 'samples': 8354112, 'steps': 43510, 'loss/train': 1.4615013599395752} -08/30/2021 20:59:49 - INFO - __main__ - Step 43512: {'lr': 0.00040906550347426907, 'samples': 8354304, 'steps': 43511, 'loss/train': 2.2905707359313965} -08/30/2021 20:59:49 - INFO - __main__ - Step 43513: {'lr': 0.0004090614094282452, 'samples': 8354496, 'steps': 43512, 'loss/train': 1.2138750553131104} -08/30/2021 20:59:49 - INFO - __main__ - Step 43514: {'lr': 0.00040905731531055067, 'samples': 8354688, 'steps': 43513, 'loss/train': 1.4084804058074951} -08/30/2021 20:59:51 - INFO - __main__ - Step 43515: {'lr': 0.0004090532211211874, 'samples': 8354880, 'steps': 43514, 'loss/train': 1.2168047428131104} -08/30/2021 20:59:51 - INFO - __main__ - Step 43516: {'lr': 0.0004090491268601572, 'samples': 8355072, 'steps': 43515, 'loss/train': 1.6737269163131714} -08/30/2021 20:59:52 - INFO - __main__ - Step 43517: {'lr': 0.0004090450325274618, 'samples': 8355264, 'steps': 43516, 'loss/train': 0.9451260566711426} -08/30/2021 20:59:52 - INFO - __main__ - Step 43518: {'lr': 0.0004090409381231033, 'samples': 8355456, 'steps': 43517, 'loss/train': 1.3149120807647705} -08/30/2021 20:59:52 - INFO - __main__ - Step 43519: {'lr': 0.0004090368436470833, 'samples': 8355648, 'steps': 43518, 'loss/train': 1.4054244756698608} -08/30/2021 20:59:54 - INFO - __main__ - Step 43520: {'lr': 0.0004090327490994038, 'samples': 8355840, 'steps': 43519, 'loss/train': 1.840895414352417} -08/30/2021 20:59:55 - INFO - __main__ - Step 43521: {'lr': 0.00040902865448006663, 'samples': 8356032, 'steps': 43520, 'loss/train': 0.7905577421188354} -08/30/2021 20:59:56 - INFO - __main__ - Step 43522: {'lr': 0.0004090245597890736, 'samples': 8356224, 'steps': 43521, 'loss/train': 1.9034472703933716} -08/30/2021 20:59:56 - INFO - __main__ - Step 43523: {'lr': 0.00040902046502642656, 'samples': 8356416, 'steps': 43522, 'loss/train': 1.4901223182678223} -08/30/2021 20:59:56 - INFO - __main__ - Step 43524: {'lr': 0.0004090163701921273, 'samples': 8356608, 'steps': 43523, 'loss/train': 2.0895180702209473} -08/30/2021 20:59:58 - INFO - __main__ - Step 43525: {'lr': 0.0004090122752861777, 'samples': 8356800, 'steps': 43524, 'loss/train': 1.4673142433166504} -08/30/2021 20:59:58 - INFO - __main__ - Step 43526: {'lr': 0.0004090081803085797, 'samples': 8356992, 'steps': 43525, 'loss/train': 1.6373339891433716} -08/30/2021 20:59:59 - INFO - __main__ - Step 43527: {'lr': 0.00040900408525933505, 'samples': 8357184, 'steps': 43526, 'loss/train': 0.7308704853057861} -08/30/2021 20:59:59 - INFO - __main__ - Step 43528: {'lr': 0.0004089999901384456, 'samples': 8357376, 'steps': 43527, 'loss/train': 1.4978106021881104} -08/30/2021 20:59:59 - INFO - __main__ - Step 43529: {'lr': 0.00040899589494591316, 'samples': 8357568, 'steps': 43528, 'loss/train': 1.6159049272537231} -08/30/2021 21:00:00 - INFO - __main__ - Step 43530: {'lr': 0.0004089917996817397, 'samples': 8357760, 'steps': 43529, 'loss/train': 1.2600092887878418} -08/30/2021 21:00:01 - INFO - __main__ - Step 43531: {'lr': 0.00040898770434592694, 'samples': 8357952, 'steps': 43530, 'loss/train': 1.5700477361679077} -08/30/2021 21:00:02 - INFO - __main__ - Step 43532: {'lr': 0.0004089836089384768, 'samples': 8358144, 'steps': 43531, 'loss/train': 1.2421658039093018} -08/30/2021 21:00:02 - INFO - __main__ - Step 43533: {'lr': 0.0004089795134593911, 'samples': 8358336, 'steps': 43532, 'loss/train': 1.5936055183410645} -08/30/2021 21:00:02 - INFO - __main__ - Step 43534: {'lr': 0.00040897541790867165, 'samples': 8358528, 'steps': 43533, 'loss/train': 0.3454930782318115} -08/30/2021 21:00:03 - INFO - __main__ - Step 43535: {'lr': 0.00040897132228632035, 'samples': 8358720, 'steps': 43534, 'loss/train': 1.991028904914856} -08/30/2021 21:00:03 - INFO - __main__ - Step 43536: {'lr': 0.000408967226592339, 'samples': 8358912, 'steps': 43535, 'loss/train': 1.256789207458496} -08/30/2021 21:00:05 - INFO - __main__ - Step 43537: {'lr': 0.00040896313082672953, 'samples': 8359104, 'steps': 43536, 'loss/train': 1.0655033588409424} -08/30/2021 21:00:05 - INFO - __main__ - Step 43538: {'lr': 0.0004089590349894937, 'samples': 8359296, 'steps': 43537, 'loss/train': 1.5189064741134644} -08/30/2021 21:00:05 - INFO - __main__ - Step 43539: {'lr': 0.0004089549390806334, 'samples': 8359488, 'steps': 43538, 'loss/train': 1.5763905048370361} -08/30/2021 21:00:06 - INFO - __main__ - Step 43540: {'lr': 0.0004089508431001504, 'samples': 8359680, 'steps': 43539, 'loss/train': 0.6611826419830322} -08/30/2021 21:00:06 - INFO - __main__ - Step 43541: {'lr': 0.00040894674704804667, 'samples': 8359872, 'steps': 43540, 'loss/train': 1.797633171081543} -08/30/2021 21:00:07 - INFO - __main__ - Step 43542: {'lr': 0.00040894265092432397, 'samples': 8360064, 'steps': 43541, 'loss/train': 1.352376937866211} -08/30/2021 21:00:08 - INFO - __main__ - Step 43543: {'lr': 0.0004089385547289841, 'samples': 8360256, 'steps': 43542, 'loss/train': 1.684341311454773} -08/30/2021 21:00:08 - INFO - __main__ - Step 43544: {'lr': 0.00040893445846202904, 'samples': 8360448, 'steps': 43543, 'loss/train': 1.78757905960083} -08/30/2021 21:00:09 - INFO - __main__ - Step 43545: {'lr': 0.00040893036212346056, 'samples': 8360640, 'steps': 43544, 'loss/train': 1.09691321849823} -08/30/2021 21:00:09 - INFO - __main__ - Step 43546: {'lr': 0.00040892626571328053, 'samples': 8360832, 'steps': 43545, 'loss/train': 1.354297399520874} -08/30/2021 21:00:11 - INFO - __main__ - Step 43547: {'lr': 0.00040892216923149073, 'samples': 8361024, 'steps': 43546, 'loss/train': 1.2973880767822266} -08/30/2021 21:00:11 - INFO - __main__ - Step 43548: {'lr': 0.000408918072678093, 'samples': 8361216, 'steps': 43547, 'loss/train': 1.8560454845428467} -08/30/2021 21:00:12 - INFO - __main__ - Step 43549: {'lr': 0.0004089139760530893, 'samples': 8361408, 'steps': 43548, 'loss/train': 1.3205373287200928} -08/30/2021 21:00:12 - INFO - __main__ - Step 43550: {'lr': 0.0004089098793564815, 'samples': 8361600, 'steps': 43549, 'loss/train': 1.5110255479812622} -08/30/2021 21:00:12 - INFO - __main__ - Step 43551: {'lr': 0.00040890578258827125, 'samples': 8361792, 'steps': 43550, 'loss/train': 0.12010274082422256} -08/30/2021 21:00:14 - INFO - __main__ - Step 43552: {'lr': 0.00040890168574846055, 'samples': 8361984, 'steps': 43551, 'loss/train': 2.036977767944336} -08/30/2021 21:00:14 - INFO - __main__ - Step 43553: {'lr': 0.0004088975888370512, 'samples': 8362176, 'steps': 43552, 'loss/train': 1.012085199356079} -08/30/2021 21:00:15 - INFO - __main__ - Step 43554: {'lr': 0.00040889349185404503, 'samples': 8362368, 'steps': 43553, 'loss/train': 1.2202578783035278} -08/30/2021 21:00:15 - INFO - __main__ - Step 43555: {'lr': 0.00040888939479944385, 'samples': 8362560, 'steps': 43554, 'loss/train': 1.8396084308624268} -08/30/2021 21:00:15 - INFO - __main__ - Step 43556: {'lr': 0.00040888529767324966, 'samples': 8362752, 'steps': 43555, 'loss/train': 1.653887152671814} -08/30/2021 21:00:17 - INFO - __main__ - Step 43557: {'lr': 0.0004088812004754642, 'samples': 8362944, 'steps': 43556, 'loss/train': 1.1581887006759644} -08/30/2021 21:00:18 - INFO - __main__ - Step 43558: {'lr': 0.00040887710320608927, 'samples': 8363136, 'steps': 43557, 'loss/train': 1.6807453632354736} -08/30/2021 21:00:18 - INFO - __main__ - Step 43559: {'lr': 0.00040887300586512677, 'samples': 8363328, 'steps': 43558, 'loss/train': 0.6707919836044312} -08/30/2021 21:00:18 - INFO - __main__ - Step 43560: {'lr': 0.0004088689084525786, 'samples': 8363520, 'steps': 43559, 'loss/train': 1.6107722520828247} -08/30/2021 21:00:19 - INFO - __main__ - Step 43561: {'lr': 0.0004088648109684465, 'samples': 8363712, 'steps': 43560, 'loss/train': 1.2834357023239136} -08/30/2021 21:00:20 - INFO - __main__ - Step 43562: {'lr': 0.00040886071341273236, 'samples': 8363904, 'steps': 43561, 'loss/train': 1.5500766038894653} -08/30/2021 21:00:21 - INFO - __main__ - Step 43563: {'lr': 0.0004088566157854381, 'samples': 8364096, 'steps': 43562, 'loss/train': 1.4507262706756592} -08/30/2021 21:00:21 - INFO - __main__ - Step 43564: {'lr': 0.0004088525180865654, 'samples': 8364288, 'steps': 43563, 'loss/train': 1.3127750158309937} -08/30/2021 21:00:21 - INFO - __main__ - Step 43565: {'lr': 0.0004088484203161163, 'samples': 8364480, 'steps': 43564, 'loss/train': 1.2134068012237549} -08/30/2021 21:00:22 - INFO - __main__ - Step 43566: {'lr': 0.0004088443224740925, 'samples': 8364672, 'steps': 43565, 'loss/train': 1.307991623878479} -08/30/2021 21:00:23 - INFO - __main__ - Step 43567: {'lr': 0.00040884022456049595, 'samples': 8364864, 'steps': 43566, 'loss/train': 1.4102755784988403} -08/30/2021 21:00:24 - INFO - __main__ - Step 43568: {'lr': 0.00040883612657532844, 'samples': 8365056, 'steps': 43567, 'loss/train': 1.437592625617981} -08/30/2021 21:00:24 - INFO - __main__ - Step 43569: {'lr': 0.0004088320285185918, 'samples': 8365248, 'steps': 43568, 'loss/train': 2.1850321292877197} -08/30/2021 21:00:24 - INFO - __main__ - Step 43570: {'lr': 0.0004088279303902879, 'samples': 8365440, 'steps': 43569, 'loss/train': 1.4614529609680176} -08/30/2021 21:00:25 - INFO - __main__ - Step 43571: {'lr': 0.0004088238321904185, 'samples': 8365632, 'steps': 43570, 'loss/train': 1.2102651596069336} -08/30/2021 21:00:27 - INFO - __main__ - Step 43572: {'lr': 0.00040881973391898563, 'samples': 8365824, 'steps': 43571, 'loss/train': 1.9799891710281372} -08/30/2021 21:00:27 - INFO - __main__ - Step 43573: {'lr': 0.00040881563557599107, 'samples': 8366016, 'steps': 43572, 'loss/train': 1.2908083200454712} -08/30/2021 21:00:28 - INFO - __main__ - Step 43574: {'lr': 0.00040881153716143656, 'samples': 8366208, 'steps': 43573, 'loss/train': 1.3629207611083984} -08/30/2021 21:00:28 - INFO - __main__ - Step 43575: {'lr': 0.000408807438675324, 'samples': 8366400, 'steps': 43574, 'loss/train': 1.2900439500808716} -08/30/2021 21:00:28 - INFO - __main__ - Step 43576: {'lr': 0.0004088033401176554, 'samples': 8366592, 'steps': 43575, 'loss/train': 1.2305748462677002} -08/30/2021 21:00:30 - INFO - __main__ - Step 43577: {'lr': 0.00040879924148843233, 'samples': 8366784, 'steps': 43576, 'loss/train': 1.3015834093093872} -08/30/2021 21:00:30 - INFO - __main__ - Step 43578: {'lr': 0.00040879514278765685, 'samples': 8366976, 'steps': 43577, 'loss/train': 1.572119116783142} -08/30/2021 21:00:31 - INFO - __main__ - Step 43579: {'lr': 0.00040879104401533064, 'samples': 8367168, 'steps': 43578, 'loss/train': 1.538743495941162} -08/30/2021 21:00:31 - INFO - __main__ - Step 43580: {'lr': 0.0004087869451714557, 'samples': 8367360, 'steps': 43579, 'loss/train': 0.8841307163238525} -08/30/2021 21:00:31 - INFO - __main__ - Step 43581: {'lr': 0.0004087828462560338, 'samples': 8367552, 'steps': 43580, 'loss/train': 1.8244174718856812} -08/30/2021 21:00:32 - INFO - __main__ - Step 43582: {'lr': 0.0004087787472690668, 'samples': 8367744, 'steps': 43581, 'loss/train': 0.39079025387763977} -08/30/2021 21:00:33 - INFO - __main__ - Step 43583: {'lr': 0.00040877464821055656, 'samples': 8367936, 'steps': 43582, 'loss/train': 1.4974087476730347} -08/30/2021 21:00:33 - INFO - __main__ - Step 43584: {'lr': 0.00040877054908050495, 'samples': 8368128, 'steps': 43583, 'loss/train': 1.0725429058074951} -08/30/2021 21:00:34 - INFO - __main__ - Step 43585: {'lr': 0.0004087664498789137, 'samples': 8368320, 'steps': 43584, 'loss/train': 1.1277167797088623} -08/30/2021 21:00:34 - INFO - __main__ - Step 43586: {'lr': 0.00040876235060578476, 'samples': 8368512, 'steps': 43585, 'loss/train': 0.8686061501502991} -08/30/2021 21:00:34 - INFO - __main__ - Step 43587: {'lr': 0.00040875825126112, 'samples': 8368704, 'steps': 43586, 'loss/train': 1.2955750226974487} -08/30/2021 21:00:36 - INFO - __main__ - Step 43588: {'lr': 0.00040875415184492113, 'samples': 8368896, 'steps': 43587, 'loss/train': 1.6488643884658813} -08/30/2021 21:00:36 - INFO - __main__ - Step 43589: {'lr': 0.0004087500523571902, 'samples': 8369088, 'steps': 43588, 'loss/train': 1.1287872791290283} -08/30/2021 21:00:37 - INFO - __main__ - Step 43590: {'lr': 0.00040874595279792884, 'samples': 8369280, 'steps': 43589, 'loss/train': 0.82212895154953} -08/30/2021 21:00:37 - INFO - __main__ - Step 43591: {'lr': 0.00040874185316713905, 'samples': 8369472, 'steps': 43590, 'loss/train': 1.332965612411499} -08/30/2021 21:00:37 - INFO - __main__ - Step 43592: {'lr': 0.00040873775346482265, 'samples': 8369664, 'steps': 43591, 'loss/train': 1.5776841640472412} -08/30/2021 21:00:39 - INFO - __main__ - Step 43593: {'lr': 0.0004087336536909815, 'samples': 8369856, 'steps': 43592, 'loss/train': 1.265476107597351} -08/30/2021 21:00:39 - INFO - __main__ - Step 43594: {'lr': 0.00040872955384561735, 'samples': 8370048, 'steps': 43593, 'loss/train': 1.8268992900848389} -08/30/2021 21:00:40 - INFO - __main__ - Step 43595: {'lr': 0.00040872545392873214, 'samples': 8370240, 'steps': 43594, 'loss/train': 1.119771122932434} -08/30/2021 21:00:40 - INFO - __main__ - Step 43596: {'lr': 0.00040872135394032764, 'samples': 8370432, 'steps': 43595, 'loss/train': 1.3884943723678589} -08/30/2021 21:00:40 - INFO - __main__ - Step 43597: {'lr': 0.0004087172538804058, 'samples': 8370624, 'steps': 43596, 'loss/train': 1.2326133251190186} -08/30/2021 21:00:42 - INFO - __main__ - Step 43598: {'lr': 0.0004087131537489685, 'samples': 8370816, 'steps': 43597, 'loss/train': 0.9040321111679077} -08/30/2021 21:00:42 - INFO - __main__ - Step 43599: {'lr': 0.00040870905354601733, 'samples': 8371008, 'steps': 43598, 'loss/train': 1.3405879735946655} -08/30/2021 21:00:43 - INFO - __main__ - Step 43600: {'lr': 0.0004087049532715544, 'samples': 8371200, 'steps': 43599, 'loss/train': 1.5261836051940918} -08/30/2021 21:00:43 - INFO - __main__ - Step 43601: {'lr': 0.00040870085292558147, 'samples': 8371392, 'steps': 43600, 'loss/train': 1.6984177827835083} -08/30/2021 21:00:43 - INFO - __main__ - Step 43602: {'lr': 0.0004086967525081003, 'samples': 8371584, 'steps': 43601, 'loss/train': 0.9577161073684692} -08/30/2021 21:00:45 - INFO - __main__ - Step 43603: {'lr': 0.00040869265201911285, 'samples': 8371776, 'steps': 43602, 'loss/train': 1.515116810798645} -08/30/2021 21:00:46 - INFO - __main__ - Step 43604: {'lr': 0.00040868855145862105, 'samples': 8371968, 'steps': 43603, 'loss/train': 1.2844641208648682} -08/30/2021 21:00:46 - INFO - __main__ - Step 43605: {'lr': 0.00040868445082662655, 'samples': 8372160, 'steps': 43604, 'loss/train': 1.6302162408828735} -08/30/2021 21:00:46 - INFO - __main__ - Step 43606: {'lr': 0.0004086803501231313, 'samples': 8372352, 'steps': 43605, 'loss/train': 1.1906564235687256} -08/30/2021 21:00:47 - INFO - __main__ - Step 43607: {'lr': 0.00040867624934813715, 'samples': 8372544, 'steps': 43606, 'loss/train': 1.7421822547912598} -08/30/2021 21:00:48 - INFO - __main__ - Step 43608: {'lr': 0.00040867214850164594, 'samples': 8372736, 'steps': 43607, 'loss/train': 0.7915459871292114} -08/30/2021 21:00:48 - INFO - __main__ - Step 43609: {'lr': 0.0004086680475836594, 'samples': 8372928, 'steps': 43608, 'loss/train': 1.2626932859420776} -08/30/2021 21:00:49 - INFO - __main__ - Step 43610: {'lr': 0.0004086639465941796, 'samples': 8373120, 'steps': 43609, 'loss/train': 1.2351818084716797} -08/30/2021 21:00:49 - INFO - __main__ - Step 43611: {'lr': 0.00040865984553320825, 'samples': 8373312, 'steps': 43610, 'loss/train': 2.0004420280456543} -08/30/2021 21:00:49 - INFO - __main__ - Step 43612: {'lr': 0.0004086557444007472, 'samples': 8373504, 'steps': 43611, 'loss/train': 1.4509479999542236} -08/30/2021 21:00:51 - INFO - __main__ - Step 43613: {'lr': 0.0004086516431967984, 'samples': 8373696, 'steps': 43612, 'loss/train': 1.6439779996871948} -08/30/2021 21:00:51 - INFO - __main__ - Step 43614: {'lr': 0.0004086475419213635, 'samples': 8373888, 'steps': 43613, 'loss/train': 1.9279168844223022} -08/30/2021 21:00:52 - INFO - __main__ - Step 43615: {'lr': 0.0004086434405744445, 'samples': 8374080, 'steps': 43614, 'loss/train': 1.1898761987686157} -08/30/2021 21:00:52 - INFO - __main__ - Step 43616: {'lr': 0.00040863933915604323, 'samples': 8374272, 'steps': 43615, 'loss/train': 1.2589688301086426} -08/30/2021 21:00:52 - INFO - __main__ - Step 43617: {'lr': 0.00040863523766616157, 'samples': 8374464, 'steps': 43616, 'loss/train': 1.367022156715393} -08/30/2021 21:00:54 - INFO - __main__ - Step 43618: {'lr': 0.0004086311361048012, 'samples': 8374656, 'steps': 43617, 'loss/train': 1.3885738849639893} -08/30/2021 21:00:54 - INFO - __main__ - Step 43619: {'lr': 0.0004086270344719642, 'samples': 8374848, 'steps': 43618, 'loss/train': 1.4041556119918823} -08/30/2021 21:00:55 - INFO - __main__ - Step 43620: {'lr': 0.00040862293276765227, 'samples': 8375040, 'steps': 43619, 'loss/train': 1.7073453664779663} -08/30/2021 21:00:55 - INFO - __main__ - Step 43621: {'lr': 0.00040861883099186725, 'samples': 8375232, 'steps': 43620, 'loss/train': 1.5339233875274658} -08/30/2021 21:00:55 - INFO - __main__ - Step 43622: {'lr': 0.0004086147291446111, 'samples': 8375424, 'steps': 43621, 'loss/train': 1.1537561416625977} -08/30/2021 21:00:56 - INFO - __main__ - Step 43623: {'lr': 0.0004086106272258856, 'samples': 8375616, 'steps': 43622, 'loss/train': 3.4219653606414795} -08/30/2021 21:00:58 - INFO - __main__ - Step 43624: {'lr': 0.0004086065252356925, 'samples': 8375808, 'steps': 43623, 'loss/train': 1.460680365562439} -08/30/2021 21:00:58 - INFO - __main__ - Step 43625: {'lr': 0.00040860242317403383, 'samples': 8376000, 'steps': 43624, 'loss/train': 1.245326280593872} -08/30/2021 21:00:59 - INFO - __main__ - Step 43626: {'lr': 0.0004085983210409114, 'samples': 8376192, 'steps': 43625, 'loss/train': 1.675591230392456} -08/30/2021 21:00:59 - INFO - __main__ - Step 43627: {'lr': 0.00040859421883632696, 'samples': 8376384, 'steps': 43626, 'loss/train': 1.3258898258209229} -08/30/2021 21:00:59 - INFO - __main__ - Step 43628: {'lr': 0.0004085901165602824, 'samples': 8376576, 'steps': 43627, 'loss/train': 1.4475562572479248} -08/30/2021 21:01:01 - INFO - __main__ - Step 43629: {'lr': 0.00040858601421277956, 'samples': 8376768, 'steps': 43628, 'loss/train': 4.370294094085693} -08/30/2021 21:01:02 - INFO - __main__ - Step 43630: {'lr': 0.00040858191179382044, 'samples': 8376960, 'steps': 43629, 'loss/train': 0.07411886751651764} -08/30/2021 21:01:02 - INFO - __main__ - Step 43631: {'lr': 0.0004085778093034066, 'samples': 8377152, 'steps': 43630, 'loss/train': 1.795538067817688} -08/30/2021 21:01:02 - INFO - __main__ - Step 43632: {'lr': 0.0004085737067415401, 'samples': 8377344, 'steps': 43631, 'loss/train': 1.4656035900115967} -08/30/2021 21:01:03 - INFO - __main__ - Step 43633: {'lr': 0.00040856960410822277, 'samples': 8377536, 'steps': 43632, 'loss/train': 0.781088650226593} -08/30/2021 21:01:04 - INFO - __main__ - Step 43634: {'lr': 0.0004085655014034564, 'samples': 8377728, 'steps': 43633, 'loss/train': 1.227291464805603} -08/30/2021 21:01:05 - INFO - __main__ - Step 43635: {'lr': 0.0004085613986272428, 'samples': 8377920, 'steps': 43634, 'loss/train': 1.5319759845733643} -08/30/2021 21:01:05 - INFO - __main__ - Step 43636: {'lr': 0.0004085572957795839, 'samples': 8378112, 'steps': 43635, 'loss/train': 1.3055925369262695} -08/30/2021 21:01:05 - INFO - __main__ - Step 43637: {'lr': 0.00040855319286048163, 'samples': 8378304, 'steps': 43636, 'loss/train': 1.7575457096099854} -08/30/2021 21:01:06 - INFO - __main__ - Step 43638: {'lr': 0.0004085490898699377, 'samples': 8378496, 'steps': 43637, 'loss/train': 1.7916195392608643} -08/30/2021 21:01:06 - INFO - __main__ - Step 43639: {'lr': 0.0004085449868079539, 'samples': 8378688, 'steps': 43638, 'loss/train': 1.268640398979187} -08/30/2021 21:01:07 - INFO - __main__ - Step 43640: {'lr': 0.00040854088367453225, 'samples': 8378880, 'steps': 43639, 'loss/train': 1.395135521888733} -08/30/2021 21:01:08 - INFO - __main__ - Step 43641: {'lr': 0.00040853678046967454, 'samples': 8379072, 'steps': 43640, 'loss/train': 1.7019858360290527} -08/30/2021 21:01:08 - INFO - __main__ - Step 43642: {'lr': 0.00040853267719338256, 'samples': 8379264, 'steps': 43641, 'loss/train': 1.9262727499008179} -08/30/2021 21:01:09 - INFO - __main__ - Step 43643: {'lr': 0.00040852857384565824, 'samples': 8379456, 'steps': 43642, 'loss/train': 1.7774850130081177} -08/30/2021 21:01:09 - INFO - __main__ - Step 43644: {'lr': 0.00040852447042650337, 'samples': 8379648, 'steps': 43643, 'loss/train': 1.3540111780166626} -08/30/2021 21:01:10 - INFO - __main__ - Step 43645: {'lr': 0.0004085203669359198, 'samples': 8379840, 'steps': 43644, 'loss/train': 1.5102699995040894} -08/30/2021 21:01:11 - INFO - __main__ - Step 43646: {'lr': 0.0004085162633739095, 'samples': 8380032, 'steps': 43645, 'loss/train': 1.3230069875717163} -08/30/2021 21:01:11 - INFO - __main__ - Step 43647: {'lr': 0.0004085121597404741, 'samples': 8380224, 'steps': 43646, 'loss/train': 1.4717904329299927} -08/30/2021 21:01:12 - INFO - __main__ - Step 43648: {'lr': 0.0004085080560356156, 'samples': 8380416, 'steps': 43647, 'loss/train': 1.499605417251587} -08/30/2021 21:01:12 - INFO - __main__ - Step 43649: {'lr': 0.0004085039522593358, 'samples': 8380608, 'steps': 43648, 'loss/train': 1.5564775466918945} -08/30/2021 21:01:13 - INFO - __main__ - Step 43650: {'lr': 0.0004084998484116366, 'samples': 8380800, 'steps': 43649, 'loss/train': 1.0594967603683472} -08/30/2021 21:01:14 - INFO - __main__ - Step 43651: {'lr': 0.0004084957444925198, 'samples': 8380992, 'steps': 43650, 'loss/train': 1.7161197662353516} -08/30/2021 21:01:14 - INFO - __main__ - Step 43652: {'lr': 0.0004084916405019873, 'samples': 8381184, 'steps': 43651, 'loss/train': 1.237003207206726} -08/30/2021 21:01:15 - INFO - __main__ - Step 43653: {'lr': 0.0004084875364400409, 'samples': 8381376, 'steps': 43652, 'loss/train': 1.4637783765792847} -08/30/2021 21:01:15 - INFO - __main__ - Step 43654: {'lr': 0.0004084834323066824, 'samples': 8381568, 'steps': 43653, 'loss/train': 1.5486664772033691} -08/30/2021 21:01:17 - INFO - __main__ - Step 43655: {'lr': 0.00040847932810191375, 'samples': 8381760, 'steps': 43654, 'loss/train': 0.529299795627594} -08/30/2021 21:01:17 - INFO - __main__ - Step 43656: {'lr': 0.00040847522382573675, 'samples': 8381952, 'steps': 43655, 'loss/train': 1.722328543663025} -08/30/2021 21:01:17 - INFO - __main__ - Step 43657: {'lr': 0.0004084711194781533, 'samples': 8382144, 'steps': 43656, 'loss/train': 1.4397668838500977} -08/30/2021 21:01:18 - INFO - __main__ - Step 43658: {'lr': 0.00040846701505916516, 'samples': 8382336, 'steps': 43657, 'loss/train': 1.9381386041641235} -08/30/2021 21:01:18 - INFO - __main__ - Step 43659: {'lr': 0.00040846291056877425, 'samples': 8382528, 'steps': 43658, 'loss/train': 2.053208112716675} -08/30/2021 21:01:19 - INFO - __main__ - Step 43660: {'lr': 0.0004084588060069824, 'samples': 8382720, 'steps': 43659, 'loss/train': 1.2218683958053589} -08/30/2021 21:01:20 - INFO - __main__ - Step 43661: {'lr': 0.0004084547013737915, 'samples': 8382912, 'steps': 43660, 'loss/train': 1.1074050664901733} -08/30/2021 21:01:20 - INFO - __main__ - Step 43662: {'lr': 0.00040845059666920323, 'samples': 8383104, 'steps': 43661, 'loss/train': 0.9613440632820129} -08/30/2021 21:01:21 - INFO - __main__ - Step 43663: {'lr': 0.0004084464918932197, 'samples': 8383296, 'steps': 43662, 'loss/train': 1.67049241065979} -08/30/2021 21:01:21 - INFO - __main__ - Step 43664: {'lr': 0.0004084423870458426, 'samples': 8383488, 'steps': 43663, 'loss/train': 1.410565972328186} -08/30/2021 21:01:23 - INFO - __main__ - Step 43665: {'lr': 0.00040843828212707366, 'samples': 8383680, 'steps': 43664, 'loss/train': 1.6554551124572754} -08/30/2021 21:01:23 - INFO - __main__ - Step 43666: {'lr': 0.00040843417713691505, 'samples': 8383872, 'steps': 43665, 'loss/train': 1.251230239868164} -08/30/2021 21:01:23 - INFO - __main__ - Step 43667: {'lr': 0.0004084300720753684, 'samples': 8384064, 'steps': 43666, 'loss/train': 1.2498807907104492} -08/30/2021 21:01:24 - INFO - __main__ - Step 43668: {'lr': 0.0004084259669424356, 'samples': 8384256, 'steps': 43667, 'loss/train': 1.5934815406799316} -08/30/2021 21:01:24 - INFO - __main__ - Step 43669: {'lr': 0.0004084218617381185, 'samples': 8384448, 'steps': 43668, 'loss/train': 1.8616904020309448} -08/30/2021 21:01:26 - INFO - __main__ - Step 43670: {'lr': 0.00040841775646241897, 'samples': 8384640, 'steps': 43669, 'loss/train': 0.9714229702949524} -08/30/2021 21:01:26 - INFO - __main__ - Step 43671: {'lr': 0.0004084136511153388, 'samples': 8384832, 'steps': 43670, 'loss/train': 1.8559218645095825} -08/30/2021 21:01:26 - INFO - __main__ - Step 43672: {'lr': 0.0004084095456968799, 'samples': 8385024, 'steps': 43671, 'loss/train': 1.5746978521347046} -08/30/2021 21:01:27 - INFO - __main__ - Step 43673: {'lr': 0.0004084054402070441, 'samples': 8385216, 'steps': 43672, 'loss/train': 2.47072434425354} -08/30/2021 21:01:27 - INFO - __main__ - Step 43674: {'lr': 0.0004084013346458333, 'samples': 8385408, 'steps': 43673, 'loss/train': 1.443535327911377} -08/30/2021 21:01:28 - INFO - __main__ - Step 43675: {'lr': 0.00040839722901324924, 'samples': 8385600, 'steps': 43674, 'loss/train': 1.4247541427612305} -08/30/2021 21:01:29 - INFO - __main__ - Step 43676: {'lr': 0.00040839312330929377, 'samples': 8385792, 'steps': 43675, 'loss/train': 1.2561787366867065} -08/30/2021 21:01:29 - INFO - __main__ - Step 43677: {'lr': 0.00040838901753396896, 'samples': 8385984, 'steps': 43676, 'loss/train': 0.9809263944625854} -08/30/2021 21:01:30 - INFO - __main__ - Step 43678: {'lr': 0.0004083849116872764, 'samples': 8386176, 'steps': 43677, 'loss/train': 1.2022013664245605} -08/30/2021 21:01:30 - INFO - __main__ - Step 43679: {'lr': 0.0004083808057692181, 'samples': 8386368, 'steps': 43678, 'loss/train': 0.6751843690872192} -08/30/2021 21:01:30 - INFO - __main__ - Step 43680: {'lr': 0.00040837669977979586, 'samples': 8386560, 'steps': 43679, 'loss/train': 1.5646017789840698} -08/30/2021 21:01:33 - INFO - __main__ - Step 43681: {'lr': 0.00040837259371901145, 'samples': 8386752, 'steps': 43680, 'loss/train': 2.472356081008911} -08/30/2021 21:01:33 - INFO - __main__ - Step 43682: {'lr': 0.00040836848758686687, 'samples': 8386944, 'steps': 43681, 'loss/train': 1.1849440336227417} -08/30/2021 21:01:33 - INFO - __main__ - Step 43683: {'lr': 0.00040836438138336384, 'samples': 8387136, 'steps': 43682, 'loss/train': 1.327950119972229} -08/30/2021 21:01:34 - INFO - __main__ - Step 43684: {'lr': 0.00040836027510850426, 'samples': 8387328, 'steps': 43683, 'loss/train': 1.4204602241516113} -08/30/2021 21:01:34 - INFO - __main__ - Step 43685: {'lr': 0.00040835616876229, 'samples': 8387520, 'steps': 43684, 'loss/train': 1.4153857231140137} -08/30/2021 21:01:36 - INFO - __main__ - Step 43686: {'lr': 0.00040835206234472287, 'samples': 8387712, 'steps': 43685, 'loss/train': 1.4426779747009277} -08/30/2021 21:01:36 - INFO - __main__ - Step 43687: {'lr': 0.0004083479558558048, 'samples': 8387904, 'steps': 43686, 'loss/train': 1.643937587738037} -08/30/2021 21:01:36 - INFO - __main__ - Step 43688: {'lr': 0.0004083438492955376, 'samples': 8388096, 'steps': 43687, 'loss/train': 1.5799084901809692} -08/30/2021 21:01:37 - INFO - __main__ - Step 43689: {'lr': 0.00040833974266392306, 'samples': 8388288, 'steps': 43688, 'loss/train': 1.8566995859146118} -08/30/2021 21:01:37 - INFO - __main__ - Step 43690: {'lr': 0.00040833563596096305, 'samples': 8388480, 'steps': 43689, 'loss/train': 1.5041723251342773} -08/30/2021 21:01:39 - INFO - __main__ - Step 43691: {'lr': 0.0004083315291866595, 'samples': 8388672, 'steps': 43690, 'loss/train': 0.6873224377632141} -08/30/2021 21:01:39 - INFO - __main__ - Step 43692: {'lr': 0.00040832742234101415, 'samples': 8388864, 'steps': 43691, 'loss/train': 1.5964791774749756} -08/30/2021 21:01:40 - INFO - __main__ - Step 43693: {'lr': 0.00040832331542402895, 'samples': 8389056, 'steps': 43692, 'loss/train': 1.6457117795944214} -08/30/2021 21:01:40 - INFO - __main__ - Step 43694: {'lr': 0.0004083192084357057, 'samples': 8389248, 'steps': 43693, 'loss/train': 1.4226797819137573} -08/30/2021 21:01:40 - INFO - __main__ - Step 43695: {'lr': 0.0004083151013760462, 'samples': 8389440, 'steps': 43694, 'loss/train': 1.2428357601165771} -08/30/2021 21:01:42 - INFO - __main__ - Step 43696: {'lr': 0.0004083109942450524, 'samples': 8389632, 'steps': 43695, 'loss/train': 0.08396401256322861} -08/30/2021 21:01:42 - INFO - __main__ - Step 43697: {'lr': 0.00040830688704272615, 'samples': 8389824, 'steps': 43696, 'loss/train': 1.7063456773757935} -08/30/2021 21:01:43 - INFO - __main__ - Step 43698: {'lr': 0.0004083027797690693, 'samples': 8390016, 'steps': 43697, 'loss/train': 1.39260995388031} -08/30/2021 21:01:43 - INFO - __main__ - Step 43699: {'lr': 0.0004082986724240835, 'samples': 8390208, 'steps': 43698, 'loss/train': 1.6733640432357788} -08/30/2021 21:01:43 - INFO - __main__ - Step 43700: {'lr': 0.00040829456500777084, 'samples': 8390400, 'steps': 43699, 'loss/train': 1.4554531574249268} -08/30/2021 21:01:44 - INFO - __main__ - Step 43701: {'lr': 0.00040829045752013317, 'samples': 8390592, 'steps': 43700, 'loss/train': 1.7216246128082275} -08/30/2021 21:01:45 - INFO - __main__ - Step 43702: {'lr': 0.00040828634996117213, 'samples': 8390784, 'steps': 43701, 'loss/train': 0.9410873055458069} -08/30/2021 21:01:46 - INFO - __main__ - Step 43703: {'lr': 0.0004082822423308897, 'samples': 8390976, 'steps': 43702, 'loss/train': 1.5017255544662476} -08/30/2021 21:01:46 - INFO - __main__ - Step 43704: {'lr': 0.00040827813462928784, 'samples': 8391168, 'steps': 43703, 'loss/train': 1.172599196434021} -08/30/2021 21:01:46 - INFO - __main__ - Step 43705: {'lr': 0.0004082740268563683, 'samples': 8391360, 'steps': 43704, 'loss/train': 1.2726798057556152} -08/30/2021 21:01:47 - INFO - __main__ - Step 43706: {'lr': 0.0004082699190121329, 'samples': 8391552, 'steps': 43705, 'loss/train': 1.0417487621307373} -08/30/2021 21:01:48 - INFO - __main__ - Step 43707: {'lr': 0.00040826581109658345, 'samples': 8391744, 'steps': 43706, 'loss/train': 1.6766895055770874} -08/30/2021 21:01:49 - INFO - __main__ - Step 43708: {'lr': 0.00040826170310972196, 'samples': 8391936, 'steps': 43707, 'loss/train': 1.2837923765182495} -08/30/2021 21:01:49 - INFO - __main__ - Step 43709: {'lr': 0.0004082575950515501, 'samples': 8392128, 'steps': 43708, 'loss/train': 1.6939594745635986} -08/30/2021 21:01:49 - INFO - __main__ - Step 43710: {'lr': 0.00040825348692206985, 'samples': 8392320, 'steps': 43709, 'loss/train': 0.06294246762990952} -08/30/2021 21:01:50 - INFO - __main__ - Step 43711: {'lr': 0.0004082493787212831, 'samples': 8392512, 'steps': 43710, 'loss/train': 1.4290003776550293} -08/30/2021 21:01:51 - INFO - __main__ - Step 43712: {'lr': 0.00040824527044919153, 'samples': 8392704, 'steps': 43711, 'loss/train': 1.5055707693099976} -08/30/2021 21:01:52 - INFO - __main__ - Step 43713: {'lr': 0.0004082411621057971, 'samples': 8392896, 'steps': 43712, 'loss/train': 0.5905166864395142} -08/30/2021 21:01:52 - INFO - __main__ - Step 43714: {'lr': 0.00040823705369110163, 'samples': 8393088, 'steps': 43713, 'loss/train': 1.1393905878067017} -08/30/2021 21:01:52 - INFO - __main__ - Step 43715: {'lr': 0.000408232945205107, 'samples': 8393280, 'steps': 43714, 'loss/train': 0.6976398825645447} -08/30/2021 21:01:53 - INFO - __main__ - Step 43716: {'lr': 0.00040822883664781506, 'samples': 8393472, 'steps': 43715, 'loss/train': 1.6211543083190918} -08/30/2021 21:01:54 - INFO - __main__ - Step 43717: {'lr': 0.0004082247280192276, 'samples': 8393664, 'steps': 43716, 'loss/train': 1.4505462646484375} -08/30/2021 21:01:55 - INFO - __main__ - Step 43718: {'lr': 0.00040822061931934656, 'samples': 8393856, 'steps': 43717, 'loss/train': 1.775937795639038} -08/30/2021 21:01:55 - INFO - __main__ - Step 43719: {'lr': 0.00040821651054817376, 'samples': 8394048, 'steps': 43718, 'loss/train': 0.8606746196746826} -08/30/2021 21:01:55 - INFO - __main__ - Step 43720: {'lr': 0.000408212401705711, 'samples': 8394240, 'steps': 43719, 'loss/train': 0.05085897445678711} -08/30/2021 21:01:56 - INFO - __main__ - Step 43721: {'lr': 0.0004082082927919602, 'samples': 8394432, 'steps': 43720, 'loss/train': 0.7344890236854553} -08/30/2021 21:01:57 - INFO - __main__ - Step 43722: {'lr': 0.0004082041838069232, 'samples': 8394624, 'steps': 43721, 'loss/train': 0.7271328568458557} -08/30/2021 21:01:58 - INFO - __main__ - Step 43723: {'lr': 0.0004082000747506018, 'samples': 8394816, 'steps': 43722, 'loss/train': 1.4934117794036865} -08/30/2021 21:01:58 - INFO - __main__ - Step 43724: {'lr': 0.00040819596562299793, 'samples': 8395008, 'steps': 43723, 'loss/train': 1.8259570598602295} -08/30/2021 21:01:59 - INFO - __main__ - Step 43725: {'lr': 0.0004081918564241134, 'samples': 8395200, 'steps': 43724, 'loss/train': 1.497853398323059} -08/30/2021 21:01:59 - INFO - __main__ - Step 43726: {'lr': 0.00040818774715395, 'samples': 8395392, 'steps': 43725, 'loss/train': 1.4134975671768188} -08/30/2021 21:02:01 - INFO - __main__ - Step 43727: {'lr': 0.0004081836378125097, 'samples': 8395584, 'steps': 43726, 'loss/train': 0.7622026801109314} -08/30/2021 21:02:01 - INFO - __main__ - Step 43728: {'lr': 0.00040817952839979424, 'samples': 8395776, 'steps': 43727, 'loss/train': 1.0191752910614014} -08/30/2021 21:02:02 - INFO - __main__ - Step 43729: {'lr': 0.00040817541891580557, 'samples': 8395968, 'steps': 43728, 'loss/train': 1.3521406650543213} -08/30/2021 21:02:02 - INFO - __main__ - Step 43730: {'lr': 0.00040817130936054546, 'samples': 8396160, 'steps': 43729, 'loss/train': 1.674381971359253} -08/30/2021 21:02:02 - INFO - __main__ - Step 43731: {'lr': 0.00040816719973401586, 'samples': 8396352, 'steps': 43730, 'loss/train': 1.7359634637832642} -08/30/2021 21:02:03 - INFO - __main__ - Step 43732: {'lr': 0.0004081630900362185, 'samples': 8396544, 'steps': 43731, 'loss/train': 1.6136072874069214} -08/30/2021 21:02:03 - INFO - __main__ - Step 43733: {'lr': 0.0004081589802671553, 'samples': 8396736, 'steps': 43732, 'loss/train': 1.2608113288879395} -08/30/2021 21:02:05 - INFO - __main__ - Step 43734: {'lr': 0.00040815487042682814, 'samples': 8396928, 'steps': 43733, 'loss/train': 1.5819666385650635} -08/30/2021 21:02:06 - INFO - __main__ - Step 43735: {'lr': 0.0004081507605152388, 'samples': 8397120, 'steps': 43734, 'loss/train': 0.5912426710128784} -08/30/2021 21:02:06 - INFO - __main__ - Step 43736: {'lr': 0.0004081466505323892, 'samples': 8397312, 'steps': 43735, 'loss/train': 1.3046391010284424} -08/30/2021 21:02:06 - INFO - __main__ - Step 43737: {'lr': 0.0004081425404782811, 'samples': 8397504, 'steps': 43736, 'loss/train': 1.4426459074020386} -08/30/2021 21:02:07 - INFO - __main__ - Step 43738: {'lr': 0.00040813843035291655, 'samples': 8397696, 'steps': 43737, 'loss/train': 1.0813347101211548} -08/30/2021 21:02:08 - INFO - __main__ - Step 43739: {'lr': 0.00040813432015629714, 'samples': 8397888, 'steps': 43738, 'loss/train': 2.5605125427246094} -08/30/2021 21:02:09 - INFO - __main__ - Step 43740: {'lr': 0.0004081302098884249, 'samples': 8398080, 'steps': 43739, 'loss/train': 0.8698285818099976} -08/30/2021 21:02:09 - INFO - __main__ - Step 43741: {'lr': 0.0004081260995493015, 'samples': 8398272, 'steps': 43740, 'loss/train': 1.6621204614639282} -08/30/2021 21:02:09 - INFO - __main__ - Step 43742: {'lr': 0.0004081219891389291, 'samples': 8398464, 'steps': 43741, 'loss/train': 1.5140966176986694} -08/30/2021 21:02:10 - INFO - __main__ - Step 43743: {'lr': 0.0004081178786573092, 'samples': 8398656, 'steps': 43742, 'loss/train': 1.632564663887024} -08/30/2021 21:02:11 - INFO - __main__ - Step 43744: {'lr': 0.000408113768104444, 'samples': 8398848, 'steps': 43743, 'loss/train': 1.4046502113342285} -08/30/2021 21:02:12 - INFO - __main__ - Step 43745: {'lr': 0.0004081096574803351, 'samples': 8399040, 'steps': 43744, 'loss/train': 1.2226265668869019} -08/30/2021 21:02:12 - INFO - __main__ - Step 43746: {'lr': 0.00040810554678498434, 'samples': 8399232, 'steps': 43745, 'loss/train': 1.4193094968795776} -08/30/2021 21:02:12 - INFO - __main__ - Step 43747: {'lr': 0.00040810143601839377, 'samples': 8399424, 'steps': 43746, 'loss/train': 1.0071032047271729} -08/30/2021 21:02:13 - INFO - __main__ - Step 43748: {'lr': 0.0004080973251805651, 'samples': 8399616, 'steps': 43747, 'loss/train': 1.4941350221633911} -08/30/2021 21:02:13 - INFO - __main__ - Step 43749: {'lr': 0.0004080932142715002, 'samples': 8399808, 'steps': 43748, 'loss/train': 1.2283105850219727} -08/30/2021 21:02:15 - INFO - __main__ - Step 43750: {'lr': 0.000408089103291201, 'samples': 8400000, 'steps': 43749, 'loss/train': 0.14603550732135773} -08/30/2021 21:02:15 - INFO - __main__ - Step 43751: {'lr': 0.0004080849922396692, 'samples': 8400192, 'steps': 43750, 'loss/train': 1.366817593574524} -08/30/2021 21:02:16 - INFO - __main__ - Step 43752: {'lr': 0.00040808088111690677, 'samples': 8400384, 'steps': 43751, 'loss/train': 0.3306434750556946} -08/30/2021 21:02:16 - INFO - __main__ - Step 43753: {'lr': 0.00040807676992291557, 'samples': 8400576, 'steps': 43752, 'loss/train': 1.340009331703186} -08/30/2021 21:02:16 - INFO - __main__ - Step 43754: {'lr': 0.0004080726586576974, 'samples': 8400768, 'steps': 43753, 'loss/train': 1.3768584728240967} -08/30/2021 21:02:18 - INFO - __main__ - Step 43755: {'lr': 0.0004080685473212541, 'samples': 8400960, 'steps': 43754, 'loss/train': 1.0741140842437744} -08/30/2021 21:02:18 - INFO - __main__ - Step 43756: {'lr': 0.0004080644359135876, 'samples': 8401152, 'steps': 43755, 'loss/train': 0.8876070976257324} -08/30/2021 21:02:19 - INFO - __main__ - Step 43757: {'lr': 0.00040806032443469967, 'samples': 8401344, 'steps': 43756, 'loss/train': 2.336810827255249} -08/30/2021 21:02:19 - INFO - __main__ - Step 43758: {'lr': 0.0004080562128845923, 'samples': 8401536, 'steps': 43757, 'loss/train': 0.38245025277137756} -08/30/2021 21:02:19 - INFO - __main__ - Step 43759: {'lr': 0.0004080521012632671, 'samples': 8401728, 'steps': 43758, 'loss/train': 1.6534713506698608} -08/30/2021 21:02:21 - INFO - __main__ - Step 43760: {'lr': 0.00040804798957072607, 'samples': 8401920, 'steps': 43759, 'loss/train': 1.2356674671173096} -08/30/2021 21:02:21 - INFO - __main__ - Step 43761: {'lr': 0.0004080438778069711, 'samples': 8402112, 'steps': 43760, 'loss/train': 1.4373027086257935} -08/30/2021 21:02:22 - INFO - __main__ - Step 43762: {'lr': 0.000408039765972004, 'samples': 8402304, 'steps': 43761, 'loss/train': 1.1325913667678833} -08/30/2021 21:02:22 - INFO - __main__ - Step 43763: {'lr': 0.0004080356540658266, 'samples': 8402496, 'steps': 43762, 'loss/train': 1.7916455268859863} -08/30/2021 21:02:22 - INFO - __main__ - Step 43764: {'lr': 0.00040803154208844086, 'samples': 8402688, 'steps': 43763, 'loss/train': 0.8445713520050049} -08/30/2021 21:02:24 - INFO - __main__ - Step 43765: {'lr': 0.00040802743003984845, 'samples': 8402880, 'steps': 43764, 'loss/train': 1.5798017978668213} -08/30/2021 21:02:24 - INFO - __main__ - Step 43766: {'lr': 0.0004080233179200513, 'samples': 8403072, 'steps': 43765, 'loss/train': 1.2093489170074463} -08/30/2021 21:02:25 - INFO - __main__ - Step 43767: {'lr': 0.00040801920572905133, 'samples': 8403264, 'steps': 43766, 'loss/train': 1.7842795848846436} -08/30/2021 21:02:25 - INFO - __main__ - Step 43768: {'lr': 0.0004080150934668503, 'samples': 8403456, 'steps': 43767, 'loss/train': 0.964861273765564} -08/30/2021 21:02:25 - INFO - __main__ - Step 43769: {'lr': 0.00040801098113345014, 'samples': 8403648, 'steps': 43768, 'loss/train': 1.5773066282272339} -08/30/2021 21:02:26 - INFO - __main__ - Step 43770: {'lr': 0.00040800686872885267, 'samples': 8403840, 'steps': 43769, 'loss/train': 1.9818191528320312} -08/30/2021 21:02:27 - INFO - __main__ - Step 43771: {'lr': 0.0004080027562530598, 'samples': 8404032, 'steps': 43770, 'loss/train': 1.4162108898162842} -08/30/2021 21:02:28 - INFO - __main__ - Step 43772: {'lr': 0.0004079986437060733, 'samples': 8404224, 'steps': 43771, 'loss/train': 1.3940703868865967} -08/30/2021 21:02:28 - INFO - __main__ - Step 43773: {'lr': 0.00040799453108789497, 'samples': 8404416, 'steps': 43772, 'loss/train': 1.5082343816757202} -08/30/2021 21:02:28 - INFO - __main__ - Step 43774: {'lr': 0.0004079904183985268, 'samples': 8404608, 'steps': 43773, 'loss/train': 1.5286884307861328} -08/30/2021 21:02:29 - INFO - __main__ - Step 43775: {'lr': 0.00040798630563797055, 'samples': 8404800, 'steps': 43774, 'loss/train': 1.7596948146820068} -08/30/2021 21:02:30 - INFO - __main__ - Step 43776: {'lr': 0.00040798219280622816, 'samples': 8404992, 'steps': 43775, 'loss/train': 1.007391095161438} -08/30/2021 21:02:31 - INFO - __main__ - Step 43777: {'lr': 0.0004079780799033014, 'samples': 8405184, 'steps': 43776, 'loss/train': 1.338560938835144} -08/30/2021 21:02:31 - INFO - __main__ - Step 43778: {'lr': 0.0004079739669291922, 'samples': 8405376, 'steps': 43777, 'loss/train': 1.2960642576217651} -08/30/2021 21:02:32 - INFO - __main__ - Step 43779: {'lr': 0.0004079698538839023, 'samples': 8405568, 'steps': 43778, 'loss/train': 0.4765457212924957} -08/30/2021 21:02:32 - INFO - __main__ - Step 43780: {'lr': 0.00040796574076743366, 'samples': 8405760, 'steps': 43779, 'loss/train': 1.7926512956619263} -08/30/2021 21:02:33 - INFO - __main__ - Step 43781: {'lr': 0.00040796162757978803, 'samples': 8405952, 'steps': 43780, 'loss/train': 1.431853175163269} -08/30/2021 21:02:34 - INFO - __main__ - Step 43782: {'lr': 0.00040795751432096746, 'samples': 8406144, 'steps': 43781, 'loss/train': 1.6874363422393799} -08/30/2021 21:02:34 - INFO - __main__ - Step 43783: {'lr': 0.00040795340099097357, 'samples': 8406336, 'steps': 43782, 'loss/train': 1.5607199668884277} -08/30/2021 21:02:35 - INFO - __main__ - Step 43784: {'lr': 0.00040794928758980837, 'samples': 8406528, 'steps': 43783, 'loss/train': 1.580759048461914} -08/30/2021 21:02:35 - INFO - __main__ - Step 43785: {'lr': 0.0004079451741174737, 'samples': 8406720, 'steps': 43784, 'loss/train': 1.0252681970596313} -08/30/2021 21:02:37 - INFO - __main__ - Step 43786: {'lr': 0.00040794106057397123, 'samples': 8406912, 'steps': 43785, 'loss/train': 1.7935954332351685} -08/30/2021 21:02:37 - INFO - __main__ - Step 43787: {'lr': 0.00040793694695930304, 'samples': 8407104, 'steps': 43786, 'loss/train': 1.7533847093582153} -08/30/2021 21:02:38 - INFO - __main__ - Step 43788: {'lr': 0.00040793283327347085, 'samples': 8407296, 'steps': 43787, 'loss/train': 1.3374837636947632} -08/30/2021 21:02:38 - INFO - __main__ - Step 43789: {'lr': 0.00040792871951647657, 'samples': 8407488, 'steps': 43788, 'loss/train': 1.531365990638733} -08/30/2021 21:02:38 - INFO - __main__ - Step 43790: {'lr': 0.00040792460568832214, 'samples': 8407680, 'steps': 43789, 'loss/train': 1.2555129528045654} -08/30/2021 21:02:40 - INFO - __main__ - Step 43791: {'lr': 0.00040792049178900924, 'samples': 8407872, 'steps': 43790, 'loss/train': 0.8884113430976868} -08/30/2021 21:02:40 - INFO - __main__ - Step 43792: {'lr': 0.00040791637781853983, 'samples': 8408064, 'steps': 43791, 'loss/train': 0.9146926999092102} -08/30/2021 21:02:41 - INFO - __main__ - Step 43793: {'lr': 0.0004079122637769157, 'samples': 8408256, 'steps': 43792, 'loss/train': 1.1160128116607666} -08/30/2021 21:02:41 - INFO - __main__ - Step 43794: {'lr': 0.0004079081496641388, 'samples': 8408448, 'steps': 43793, 'loss/train': 1.344011664390564} -08/30/2021 21:02:41 - INFO - __main__ - Step 43795: {'lr': 0.0004079040354802109, 'samples': 8408640, 'steps': 43794, 'loss/train': 1.2532360553741455} -08/30/2021 21:02:43 - INFO - __main__ - Step 43796: {'lr': 0.00040789992122513386, 'samples': 8408832, 'steps': 43795, 'loss/train': 1.2086224555969238} -08/30/2021 21:02:44 - INFO - __main__ - Step 43797: {'lr': 0.00040789580689890953, 'samples': 8409024, 'steps': 43796, 'loss/train': 1.8269503116607666} -08/30/2021 21:02:44 - INFO - __main__ - Step 43798: {'lr': 0.00040789169250153985, 'samples': 8409216, 'steps': 43797, 'loss/train': 1.4898165464401245} -08/30/2021 21:02:44 - INFO - __main__ - Step 43799: {'lr': 0.00040788757803302656, 'samples': 8409408, 'steps': 43798, 'loss/train': 1.146410584449768} -08/30/2021 21:02:45 - INFO - __main__ - Step 43800: {'lr': 0.00040788346349337156, 'samples': 8409600, 'steps': 43799, 'loss/train': 1.0319801568984985} -08/30/2021 21:02:46 - INFO - __main__ - Step 43801: {'lr': 0.00040787934888257673, 'samples': 8409792, 'steps': 43800, 'loss/train': 0.7334209680557251} -08/30/2021 21:02:47 - INFO - __main__ - Step 43802: {'lr': 0.00040787523420064394, 'samples': 8409984, 'steps': 43801, 'loss/train': 1.9177191257476807} -08/30/2021 21:02:47 - INFO - __main__ - Step 43803: {'lr': 0.00040787111944757496, 'samples': 8410176, 'steps': 43802, 'loss/train': 1.2845685482025146} -08/30/2021 21:02:47 - INFO - __main__ - Step 43804: {'lr': 0.0004078670046233717, 'samples': 8410368, 'steps': 43803, 'loss/train': 1.444190502166748} -08/30/2021 21:02:48 - INFO - __main__ - Step 43805: {'lr': 0.000407862889728036, 'samples': 8410560, 'steps': 43804, 'loss/train': 1.090221881866455} -08/30/2021 21:02:49 - INFO - __main__ - Step 43806: {'lr': 0.0004078587747615697, 'samples': 8410752, 'steps': 43805, 'loss/train': 1.213196873664856} -08/30/2021 21:02:50 - INFO - __main__ - Step 43807: {'lr': 0.00040785465972397475, 'samples': 8410944, 'steps': 43806, 'loss/train': 1.4244780540466309} -08/30/2021 21:02:50 - INFO - __main__ - Step 43808: {'lr': 0.0004078505446152528, 'samples': 8411136, 'steps': 43807, 'loss/train': 1.005820631980896} -08/30/2021 21:02:51 - INFO - __main__ - Step 43809: {'lr': 0.0004078464294354059, 'samples': 8411328, 'steps': 43808, 'loss/train': 0.8411766886711121} -08/30/2021 21:02:51 - INFO - __main__ - Step 43810: {'lr': 0.00040784231418443585, 'samples': 8411520, 'steps': 43809, 'loss/train': 1.2766271829605103} -08/30/2021 21:02:51 - INFO - __main__ - Step 43811: {'lr': 0.00040783819886234445, 'samples': 8411712, 'steps': 43810, 'loss/train': 0.6391169428825378} -08/30/2021 21:02:53 - INFO - __main__ - Step 43812: {'lr': 0.00040783408346913366, 'samples': 8411904, 'steps': 43811, 'loss/train': 0.5448909401893616} -08/30/2021 21:02:53 - INFO - __main__ - Step 43813: {'lr': 0.00040782996800480523, 'samples': 8412096, 'steps': 43812, 'loss/train': 0.4895644783973694} -08/30/2021 21:02:53 - INFO - __main__ - Step 43814: {'lr': 0.000407825852469361, 'samples': 8412288, 'steps': 43813, 'loss/train': 1.6099004745483398} -08/30/2021 21:02:54 - INFO - __main__ - Step 43815: {'lr': 0.00040782173686280287, 'samples': 8412480, 'steps': 43814, 'loss/train': 1.7540996074676514} -08/30/2021 21:02:54 - INFO - __main__ - Step 43816: {'lr': 0.0004078176211851328, 'samples': 8412672, 'steps': 43815, 'loss/train': 1.876587152481079} -08/30/2021 21:02:56 - INFO - __main__ - Step 43817: {'lr': 0.0004078135054363524, 'samples': 8412864, 'steps': 43816, 'loss/train': 1.8550409078598022} -08/30/2021 21:02:56 - INFO - __main__ - Step 43818: {'lr': 0.00040780938961646385, 'samples': 8413056, 'steps': 43817, 'loss/train': 1.0840035676956177} -08/30/2021 21:02:56 - INFO - __main__ - Step 43819: {'lr': 0.00040780527372546874, 'samples': 8413248, 'steps': 43818, 'loss/train': 1.4322997331619263} -08/30/2021 21:02:57 - INFO - __main__ - Step 43820: {'lr': 0.000407801157763369, 'samples': 8413440, 'steps': 43819, 'loss/train': 1.511563777923584} -08/30/2021 21:02:57 - INFO - __main__ - Step 43821: {'lr': 0.0004077970417301665, 'samples': 8413632, 'steps': 43820, 'loss/train': 1.0809530019760132} -08/30/2021 21:02:59 - INFO - __main__ - Step 43822: {'lr': 0.00040779292562586304, 'samples': 8413824, 'steps': 43821, 'loss/train': 1.597350001335144} -08/30/2021 21:02:59 - INFO - __main__ - Step 43823: {'lr': 0.0004077888094504606, 'samples': 8414016, 'steps': 43822, 'loss/train': 0.8721112608909607} -08/30/2021 21:02:59 - INFO - __main__ - Step 43824: {'lr': 0.0004077846932039609, 'samples': 8414208, 'steps': 43823, 'loss/train': 0.8232129812240601} -08/30/2021 21:03:00 - INFO - __main__ - Step 43825: {'lr': 0.00040778057688636594, 'samples': 8414400, 'steps': 43824, 'loss/train': 1.5072728395462036} -08/30/2021 21:03:00 - INFO - __main__ - Step 43826: {'lr': 0.00040777646049767736, 'samples': 8414592, 'steps': 43825, 'loss/train': 1.5393011569976807} -08/30/2021 21:03:02 - INFO - __main__ - Step 43827: {'lr': 0.0004077723440378972, 'samples': 8414784, 'steps': 43826, 'loss/train': 1.9465694427490234} -08/30/2021 21:03:02 - INFO - __main__ - Step 43828: {'lr': 0.0004077682275070273, 'samples': 8414976, 'steps': 43827, 'loss/train': 1.6047816276550293} -08/30/2021 21:03:02 - INFO - __main__ - Step 43829: {'lr': 0.00040776411090506944, 'samples': 8415168, 'steps': 43828, 'loss/train': 2.350435256958008} -08/30/2021 21:03:03 - INFO - __main__ - Step 43830: {'lr': 0.0004077599942320255, 'samples': 8415360, 'steps': 43829, 'loss/train': 0.9171452522277832} -08/30/2021 21:03:03 - INFO - __main__ - Step 43831: {'lr': 0.00040775587748789733, 'samples': 8415552, 'steps': 43830, 'loss/train': 1.3286149501800537} -08/30/2021 21:03:05 - INFO - __main__ - Step 43832: {'lr': 0.0004077517606726868, 'samples': 8415744, 'steps': 43831, 'loss/train': 0.9289796352386475} -08/30/2021 21:03:05 - INFO - __main__ - Step 43833: {'lr': 0.0004077476437863958, 'samples': 8415936, 'steps': 43832, 'loss/train': 0.6664148569107056} -08/30/2021 21:03:06 - INFO - __main__ - Step 43834: {'lr': 0.0004077435268290261, 'samples': 8416128, 'steps': 43833, 'loss/train': 1.2577805519104004} -08/30/2021 21:03:06 - INFO - __main__ - Step 43835: {'lr': 0.0004077394098005796, 'samples': 8416320, 'steps': 43834, 'loss/train': 1.7036726474761963} -08/30/2021 21:03:06 - INFO - __main__ - Step 43836: {'lr': 0.00040773529270105816, 'samples': 8416512, 'steps': 43835, 'loss/train': 1.7892454862594604} -08/30/2021 21:03:07 - INFO - __main__ - Step 43837: {'lr': 0.0004077311755304637, 'samples': 8416704, 'steps': 43836, 'loss/train': 1.1891313791275024} -08/30/2021 21:03:08 - INFO - __main__ - Step 43838: {'lr': 0.000407727058288798, 'samples': 8416896, 'steps': 43837, 'loss/train': 1.8460379838943481} -08/30/2021 21:03:08 - INFO - __main__ - Step 43839: {'lr': 0.00040772294097606276, 'samples': 8417088, 'steps': 43838, 'loss/train': 0.9670521020889282} -08/30/2021 21:03:09 - INFO - __main__ - Step 43840: {'lr': 0.0004077188235922601, 'samples': 8417280, 'steps': 43839, 'loss/train': 0.8974589705467224} -08/30/2021 21:03:09 - INFO - __main__ - Step 43841: {'lr': 0.0004077147061373918, 'samples': 8417472, 'steps': 43840, 'loss/train': 1.8419151306152344} -08/30/2021 21:03:10 - INFO - __main__ - Step 43842: {'lr': 0.00040771058861145963, 'samples': 8417664, 'steps': 43841, 'loss/train': 1.1319509744644165} -08/30/2021 21:03:11 - INFO - __main__ - Step 43843: {'lr': 0.0004077064710144656, 'samples': 8417856, 'steps': 43842, 'loss/train': 1.4944205284118652} -08/30/2021 21:03:12 - INFO - __main__ - Step 43844: {'lr': 0.0004077023533464114, 'samples': 8418048, 'steps': 43843, 'loss/train': 1.3543598651885986} -08/30/2021 21:03:12 - INFO - __main__ - Step 43845: {'lr': 0.000407698235607299, 'samples': 8418240, 'steps': 43844, 'loss/train': 1.1973967552185059} -08/30/2021 21:03:13 - INFO - __main__ - Step 43846: {'lr': 0.0004076941177971301, 'samples': 8418432, 'steps': 43845, 'loss/train': 1.476593255996704} -08/30/2021 21:03:13 - INFO - __main__ - Step 43847: {'lr': 0.0004076899999159067, 'samples': 8418624, 'steps': 43846, 'loss/train': 1.3293201923370361} -08/30/2021 21:03:14 - INFO - __main__ - Step 43848: {'lr': 0.0004076858819636307, 'samples': 8418816, 'steps': 43847, 'loss/train': 1.1217072010040283} -08/30/2021 21:03:15 - INFO - __main__ - Step 43849: {'lr': 0.0004076817639403038, 'samples': 8419008, 'steps': 43848, 'loss/train': 1.5927393436431885} -08/30/2021 21:03:15 - INFO - __main__ - Step 43850: {'lr': 0.0004076776458459279, 'samples': 8419200, 'steps': 43849, 'loss/train': 1.2272676229476929} -08/30/2021 21:03:15 - INFO - __main__ - Step 43851: {'lr': 0.00040767352768050503, 'samples': 8419392, 'steps': 43850, 'loss/train': 1.0939770936965942} -08/30/2021 21:03:16 - INFO - __main__ - Step 43852: {'lr': 0.0004076694094440368, 'samples': 8419584, 'steps': 43851, 'loss/train': 1.546807050704956} -08/30/2021 21:03:17 - INFO - __main__ - Step 43853: {'lr': 0.0004076652911365252, 'samples': 8419776, 'steps': 43852, 'loss/train': 1.1474628448486328} -08/30/2021 21:03:18 - INFO - __main__ - Step 43854: {'lr': 0.00040766117275797196, 'samples': 8419968, 'steps': 43853, 'loss/train': 1.6309174299240112} -08/30/2021 21:03:18 - INFO - __main__ - Step 43855: {'lr': 0.0004076570543083792, 'samples': 8420160, 'steps': 43854, 'loss/train': 1.2588063478469849} -08/30/2021 21:03:18 - INFO - __main__ - Step 43856: {'lr': 0.0004076529357877485, 'samples': 8420352, 'steps': 43855, 'loss/train': 1.4545656442642212} -08/30/2021 21:03:19 - INFO - __main__ - Step 43857: {'lr': 0.00040764881719608184, 'samples': 8420544, 'steps': 43856, 'loss/train': 2.186136245727539} -08/30/2021 21:03:20 - INFO - __main__ - Step 43858: {'lr': 0.000407644698533381, 'samples': 8420736, 'steps': 43857, 'loss/train': 1.274720311164856} -08/30/2021 21:03:21 - INFO - __main__ - Step 43859: {'lr': 0.00040764057979964793, 'samples': 8420928, 'steps': 43858, 'loss/train': 1.7305853366851807} -08/30/2021 21:03:21 - INFO - __main__ - Step 43860: {'lr': 0.0004076364609948844, 'samples': 8421120, 'steps': 43859, 'loss/train': 1.5938680171966553} -08/30/2021 21:03:21 - INFO - __main__ - Step 43861: {'lr': 0.0004076323421190924, 'samples': 8421312, 'steps': 43860, 'loss/train': 1.387589931488037} -08/30/2021 21:03:22 - INFO - __main__ - Step 43862: {'lr': 0.0004076282231722737, 'samples': 8421504, 'steps': 43861, 'loss/train': 1.0618559122085571} -08/30/2021 21:03:24 - INFO - __main__ - Step 43863: {'lr': 0.0004076241041544301, 'samples': 8421696, 'steps': 43862, 'loss/train': 1.2857544422149658} -08/30/2021 21:03:24 - INFO - __main__ - Step 43864: {'lr': 0.00040761998506556353, 'samples': 8421888, 'steps': 43863, 'loss/train': 1.4223642349243164} -08/30/2021 21:03:24 - INFO - __main__ - Step 43865: {'lr': 0.0004076158659056758, 'samples': 8422080, 'steps': 43864, 'loss/train': 1.2648245096206665} -08/30/2021 21:03:25 - INFO - __main__ - Step 43866: {'lr': 0.00040761174667476883, 'samples': 8422272, 'steps': 43865, 'loss/train': 0.03963041305541992} -08/30/2021 21:03:25 - INFO - __main__ - Step 43867: {'lr': 0.0004076076273728444, 'samples': 8422464, 'steps': 43866, 'loss/train': 1.169355869293213} -08/30/2021 21:03:26 - INFO - __main__ - Step 43868: {'lr': 0.0004076035079999045, 'samples': 8422656, 'steps': 43867, 'loss/train': 0.9768556952476501} -08/30/2021 21:03:27 - INFO - __main__ - Step 43869: {'lr': 0.0004075993885559508, 'samples': 8422848, 'steps': 43868, 'loss/train': 0.4165455102920532} -08/30/2021 21:03:27 - INFO - __main__ - Step 43870: {'lr': 0.0004075952690409852, 'samples': 8423040, 'steps': 43869, 'loss/train': 1.5621095895767212} -08/30/2021 21:03:28 - INFO - __main__ - Step 43871: {'lr': 0.00040759114945500974, 'samples': 8423232, 'steps': 43870, 'loss/train': 1.6777276992797852} -08/30/2021 21:03:28 - INFO - __main__ - Step 43872: {'lr': 0.0004075870297980261, 'samples': 8423424, 'steps': 43871, 'loss/train': 0.8194810152053833} -08/30/2021 21:03:29 - INFO - __main__ - Step 43873: {'lr': 0.0004075829100700361, 'samples': 8423616, 'steps': 43872, 'loss/train': 0.7439547777175903} -08/30/2021 21:03:30 - INFO - __main__ - Step 43874: {'lr': 0.0004075787902710417, 'samples': 8423808, 'steps': 43873, 'loss/train': 1.4584407806396484} -08/30/2021 21:03:31 - INFO - __main__ - Step 43875: {'lr': 0.0004075746704010448, 'samples': 8424000, 'steps': 43874, 'loss/train': 1.446795105934143} -08/30/2021 21:03:31 - INFO - __main__ - Step 43876: {'lr': 0.0004075705504600471, 'samples': 8424192, 'steps': 43875, 'loss/train': 1.3926080465316772} -08/30/2021 21:03:31 - INFO - __main__ - Step 43877: {'lr': 0.00040756643044805057, 'samples': 8424384, 'steps': 43876, 'loss/train': 1.0353636741638184} -08/30/2021 21:03:32 - INFO - __main__ - Step 43878: {'lr': 0.0004075623103650571, 'samples': 8424576, 'steps': 43877, 'loss/train': 1.4024126529693604} -08/30/2021 21:03:32 - INFO - __main__ - Step 43879: {'lr': 0.00040755819021106844, 'samples': 8424768, 'steps': 43878, 'loss/train': 1.1849769353866577} -08/30/2021 21:03:33 - INFO - __main__ - Step 43880: {'lr': 0.00040755406998608645, 'samples': 8424960, 'steps': 43879, 'loss/train': 1.5743694305419922} -08/30/2021 21:03:34 - INFO - __main__ - Step 43881: {'lr': 0.00040754994969011306, 'samples': 8425152, 'steps': 43880, 'loss/train': 1.6137919425964355} -08/30/2021 21:03:34 - INFO - __main__ - Step 43882: {'lr': 0.00040754582932315007, 'samples': 8425344, 'steps': 43881, 'loss/train': 1.4733422994613647} -08/30/2021 21:03:35 - INFO - __main__ - Step 43883: {'lr': 0.0004075417088851994, 'samples': 8425536, 'steps': 43882, 'loss/train': 1.5610766410827637} -08/30/2021 21:03:35 - INFO - __main__ - Step 43884: {'lr': 0.0004075375883762629, 'samples': 8425728, 'steps': 43883, 'loss/train': 1.7823412418365479} -08/30/2021 21:03:37 - INFO - __main__ - Step 43885: {'lr': 0.0004075334677963423, 'samples': 8425920, 'steps': 43884, 'loss/train': 1.299405574798584} -08/30/2021 21:03:37 - INFO - __main__ - Step 43886: {'lr': 0.0004075293471454396, 'samples': 8426112, 'steps': 43885, 'loss/train': 1.5364983081817627} -08/30/2021 21:03:38 - INFO - __main__ - Step 43887: {'lr': 0.0004075252264235566, 'samples': 8426304, 'steps': 43886, 'loss/train': 1.0168243646621704} -08/30/2021 21:03:38 - INFO - __main__ - Step 43888: {'lr': 0.0004075211056306951, 'samples': 8426496, 'steps': 43887, 'loss/train': 1.063670039176941} -08/30/2021 21:03:38 - INFO - __main__ - Step 43889: {'lr': 0.00040751698476685716, 'samples': 8426688, 'steps': 43888, 'loss/train': 0.824373185634613} -08/30/2021 21:03:40 - INFO - __main__ - Step 43890: {'lr': 0.00040751286383204437, 'samples': 8426880, 'steps': 43889, 'loss/train': 1.1412771940231323} -08/30/2021 21:03:40 - INFO - __main__ - Step 43891: {'lr': 0.0004075087428262588, 'samples': 8427072, 'steps': 43890, 'loss/train': 0.9771620035171509} -08/30/2021 21:03:41 - INFO - __main__ - Step 43892: {'lr': 0.0004075046217495022, 'samples': 8427264, 'steps': 43891, 'loss/train': 0.9868575930595398} -08/30/2021 21:03:41 - INFO - __main__ - Step 43893: {'lr': 0.00040750050060177643, 'samples': 8427456, 'steps': 43892, 'loss/train': 0.15345190465450287} -08/30/2021 21:03:42 - INFO - __main__ - Step 43894: {'lr': 0.00040749637938308336, 'samples': 8427648, 'steps': 43893, 'loss/train': 1.109050989151001} -08/30/2021 21:03:42 - INFO - __main__ - Step 43895: {'lr': 0.00040749225809342485, 'samples': 8427840, 'steps': 43894, 'loss/train': 1.54781174659729} -08/30/2021 21:03:44 - INFO - __main__ - Step 43896: {'lr': 0.00040748813673280277, 'samples': 8428032, 'steps': 43895, 'loss/train': 1.2555979490280151} -08/30/2021 21:03:44 - INFO - __main__ - Step 43897: {'lr': 0.0004074840153012189, 'samples': 8428224, 'steps': 43896, 'loss/train': 1.1280982494354248} -08/30/2021 21:03:45 - INFO - __main__ - Step 43898: {'lr': 0.0004074798937986753, 'samples': 8428416, 'steps': 43897, 'loss/train': 1.4909759759902954} -08/30/2021 21:03:45 - INFO - __main__ - Step 43899: {'lr': 0.00040747577222517364, 'samples': 8428608, 'steps': 43898, 'loss/train': 1.1590861082077026} -08/30/2021 21:03:46 - INFO - __main__ - Step 43900: {'lr': 0.0004074716505807158, 'samples': 8428800, 'steps': 43899, 'loss/train': 1.1700905561447144} -08/30/2021 21:03:47 - INFO - __main__ - Step 43901: {'lr': 0.0004074675288653037, 'samples': 8428992, 'steps': 43900, 'loss/train': 1.1349079608917236} -08/30/2021 21:03:48 - INFO - __main__ - Step 43902: {'lr': 0.0004074634070789391, 'samples': 8429184, 'steps': 43901, 'loss/train': 1.6077814102172852} -08/30/2021 21:03:48 - INFO - __main__ - Step 43903: {'lr': 0.0004074592852216239, 'samples': 8429376, 'steps': 43902, 'loss/train': 1.3170939683914185} -08/30/2021 21:03:48 - INFO - __main__ - Step 43904: {'lr': 0.0004074551632933601, 'samples': 8429568, 'steps': 43903, 'loss/train': 0.9808275103569031} -08/30/2021 21:03:49 - INFO - __main__ - Step 43905: {'lr': 0.00040745104129414933, 'samples': 8429760, 'steps': 43904, 'loss/train': 0.9745615124702454} -08/30/2021 21:03:50 - INFO - __main__ - Step 43906: {'lr': 0.0004074469192239936, 'samples': 8429952, 'steps': 43905, 'loss/train': 2.1799445152282715} -08/30/2021 21:03:51 - INFO - __main__ - Step 43907: {'lr': 0.0004074427970828947, 'samples': 8430144, 'steps': 43906, 'loss/train': 1.1147089004516602} -08/30/2021 21:03:51 - INFO - __main__ - Step 43908: {'lr': 0.00040743867487085444, 'samples': 8430336, 'steps': 43907, 'loss/train': 1.3706434965133667} -08/30/2021 21:03:52 - INFO - __main__ - Step 43909: {'lr': 0.0004074345525878748, 'samples': 8430528, 'steps': 43908, 'loss/train': 2.2214980125427246} -08/30/2021 21:03:52 - INFO - __main__ - Step 43910: {'lr': 0.0004074304302339576, 'samples': 8430720, 'steps': 43909, 'loss/train': 0.03032659739255905} -08/30/2021 21:03:52 - INFO - __main__ - Step 43911: {'lr': 0.0004074263078091046, 'samples': 8430912, 'steps': 43910, 'loss/train': 0.25154292583465576} -08/30/2021 21:03:54 - INFO - __main__ - Step 43912: {'lr': 0.00040742218531331786, 'samples': 8431104, 'steps': 43911, 'loss/train': 1.2891852855682373} -08/30/2021 21:03:54 - INFO - __main__ - Step 43913: {'lr': 0.0004074180627465991, 'samples': 8431296, 'steps': 43912, 'loss/train': 1.1473833322525024} -08/30/2021 21:03:55 - INFO - __main__ - Step 43914: {'lr': 0.00040741394010895013, 'samples': 8431488, 'steps': 43913, 'loss/train': 0.8665730357170105} -08/30/2021 21:03:55 - INFO - __main__ - Step 43915: {'lr': 0.0004074098174003729, 'samples': 8431680, 'steps': 43914, 'loss/train': 0.4884485900402069} -08/30/2021 21:03:56 - INFO - __main__ - Step 43916: {'lr': 0.0004074056946208692, 'samples': 8431872, 'steps': 43915, 'loss/train': 1.7602063417434692} -08/30/2021 21:03:57 - INFO - __main__ - Step 43917: {'lr': 0.0004074015717704409, 'samples': 8432064, 'steps': 43916, 'loss/train': 1.4096194505691528} -08/30/2021 21:03:57 - INFO - __main__ - Step 43918: {'lr': 0.00040739744884908994, 'samples': 8432256, 'steps': 43917, 'loss/train': 1.1563514471054077} -08/30/2021 21:03:58 - INFO - __main__ - Step 43919: {'lr': 0.00040739332585681807, 'samples': 8432448, 'steps': 43918, 'loss/train': 1.4544111490249634} -08/30/2021 21:03:58 - INFO - __main__ - Step 43920: {'lr': 0.00040738920279362724, 'samples': 8432640, 'steps': 43919, 'loss/train': 1.5442497730255127} -08/30/2021 21:03:58 - INFO - __main__ - Step 43921: {'lr': 0.00040738507965951923, 'samples': 8432832, 'steps': 43920, 'loss/train': 1.340509295463562} -08/30/2021 21:03:59 - INFO - __main__ - Step 43922: {'lr': 0.0004073809564544959, 'samples': 8433024, 'steps': 43921, 'loss/train': 1.0293766260147095} -08/30/2021 21:04:00 - INFO - __main__ - Step 43923: {'lr': 0.0004073768331785592, 'samples': 8433216, 'steps': 43922, 'loss/train': 1.2574676275253296} -08/30/2021 21:04:01 - INFO - __main__ - Step 43924: {'lr': 0.0004073727098317109, 'samples': 8433408, 'steps': 43923, 'loss/train': 0.984167218208313} -08/30/2021 21:04:01 - INFO - __main__ - Step 43925: {'lr': 0.0004073685864139529, 'samples': 8433600, 'steps': 43924, 'loss/train': 1.1035782098770142} -08/30/2021 21:04:02 - INFO - __main__ - Step 43926: {'lr': 0.00040736446292528704, 'samples': 8433792, 'steps': 43925, 'loss/train': 0.4938061237335205} -08/30/2021 21:04:02 - INFO - __main__ - Step 43927: {'lr': 0.0004073603393657152, 'samples': 8433984, 'steps': 43926, 'loss/train': 1.6660019159317017} -08/30/2021 21:04:03 - INFO - __main__ - Step 43928: {'lr': 0.0004073562157352392, 'samples': 8434176, 'steps': 43927, 'loss/train': 1.6551334857940674} -08/30/2021 21:04:04 - INFO - __main__ - Step 43929: {'lr': 0.00040735209203386093, 'samples': 8434368, 'steps': 43928, 'loss/train': 0.8628782629966736} -08/30/2021 21:04:04 - INFO - __main__ - Step 43930: {'lr': 0.00040734796826158226, 'samples': 8434560, 'steps': 43929, 'loss/train': 1.896470546722412} -08/30/2021 21:04:05 - INFO - __main__ - Step 43931: {'lr': 0.000407343844418405, 'samples': 8434752, 'steps': 43930, 'loss/train': 1.371834397315979} -08/30/2021 21:04:05 - INFO - __main__ - Step 43932: {'lr': 0.000407339720504331, 'samples': 8434944, 'steps': 43931, 'loss/train': 1.731903076171875} -08/30/2021 21:04:06 - INFO - __main__ - Step 43933: {'lr': 0.00040733559651936216, 'samples': 8435136, 'steps': 43932, 'loss/train': 1.1435072422027588} -08/30/2021 21:04:07 - INFO - __main__ - Step 43934: {'lr': 0.0004073314724635003, 'samples': 8435328, 'steps': 43933, 'loss/train': 1.2890568971633911} -08/30/2021 21:04:07 - INFO - __main__ - Step 43935: {'lr': 0.0004073273483367474, 'samples': 8435520, 'steps': 43934, 'loss/train': 1.3700639009475708} -08/30/2021 21:04:08 - INFO - __main__ - Step 43936: {'lr': 0.0004073232241391052, 'samples': 8435712, 'steps': 43935, 'loss/train': 0.9591358304023743} -08/30/2021 21:04:08 - INFO - __main__ - Step 43937: {'lr': 0.00040731909987057547, 'samples': 8435904, 'steps': 43936, 'loss/train': 1.744177222251892} -08/30/2021 21:04:09 - INFO - __main__ - Step 43938: {'lr': 0.0004073149755311603, 'samples': 8436096, 'steps': 43937, 'loss/train': 0.9035826921463013} -08/30/2021 21:04:10 - INFO - __main__ - Step 43939: {'lr': 0.0004073108511208614, 'samples': 8436288, 'steps': 43938, 'loss/train': 0.13453228771686554} -08/30/2021 21:04:10 - INFO - __main__ - Step 43940: {'lr': 0.0004073067266396807, 'samples': 8436480, 'steps': 43939, 'loss/train': 1.2400567531585693} -08/30/2021 21:04:11 - INFO - __main__ - Step 43941: {'lr': 0.00040730260208761995, 'samples': 8436672, 'steps': 43940, 'loss/train': 1.8284215927124023} -08/30/2021 21:04:11 - INFO - __main__ - Step 43942: {'lr': 0.0004072984774646811, 'samples': 8436864, 'steps': 43941, 'loss/train': 1.6001628637313843} -08/30/2021 21:04:11 - INFO - __main__ - Step 43943: {'lr': 0.0004072943527708659, 'samples': 8437056, 'steps': 43942, 'loss/train': 1.002147912979126} -08/30/2021 21:04:13 - INFO - __main__ - Step 43944: {'lr': 0.00040729022800617637, 'samples': 8437248, 'steps': 43943, 'loss/train': 1.5290356874465942} -08/30/2021 21:04:14 - INFO - __main__ - Step 43945: {'lr': 0.00040728610317061433, 'samples': 8437440, 'steps': 43944, 'loss/train': 1.4458039999008179} -08/30/2021 21:04:14 - INFO - __main__ - Step 43946: {'lr': 0.0004072819782641816, 'samples': 8437632, 'steps': 43945, 'loss/train': 0.09694980084896088} -08/30/2021 21:04:14 - INFO - __main__ - Step 43947: {'lr': 0.00040727785328687995, 'samples': 8437824, 'steps': 43946, 'loss/train': 1.6269800662994385} -08/30/2021 21:04:15 - INFO - __main__ - Step 43948: {'lr': 0.00040727372823871135, 'samples': 8438016, 'steps': 43947, 'loss/train': 1.74516761302948} -08/30/2021 21:04:17 - INFO - __main__ - Step 43949: {'lr': 0.00040726960311967766, 'samples': 8438208, 'steps': 43948, 'loss/train': 1.564193844795227} -08/30/2021 21:04:17 - INFO - __main__ - Step 43950: {'lr': 0.0004072654779297807, 'samples': 8438400, 'steps': 43949, 'loss/train': 1.4121545553207397} -08/30/2021 21:04:18 - INFO - __main__ - Step 43951: {'lr': 0.0004072613526690223, 'samples': 8438592, 'steps': 43950, 'loss/train': 1.3532283306121826} -08/30/2021 21:04:18 - INFO - __main__ - Step 43952: {'lr': 0.00040725722733740444, 'samples': 8438784, 'steps': 43951, 'loss/train': 0.6691199541091919} -08/30/2021 21:04:18 - INFO - __main__ - Step 43953: {'lr': 0.0004072531019349289, 'samples': 8438976, 'steps': 43952, 'loss/train': 0.08725161850452423} -08/30/2021 21:04:20 - INFO - __main__ - Step 43954: {'lr': 0.00040724897646159753, 'samples': 8439168, 'steps': 43953, 'loss/train': 1.4267401695251465} -08/30/2021 21:04:21 - INFO - __main__ - Step 43955: {'lr': 0.0004072448509174121, 'samples': 8439360, 'steps': 43954, 'loss/train': 1.5169744491577148} -08/30/2021 21:04:21 - INFO - __main__ - Step 43956: {'lr': 0.00040724072530237465, 'samples': 8439552, 'steps': 43955, 'loss/train': 1.4594926834106445} -08/30/2021 21:04:21 - INFO - __main__ - Step 43957: {'lr': 0.00040723659961648694, 'samples': 8439744, 'steps': 43956, 'loss/train': 2.367868185043335} -08/30/2021 21:04:22 - INFO - __main__ - Step 43958: {'lr': 0.0004072324738597509, 'samples': 8439936, 'steps': 43957, 'loss/train': 1.8564107418060303} -08/30/2021 21:04:22 - INFO - __main__ - Step 43959: {'lr': 0.00040722834803216834, 'samples': 8440128, 'steps': 43958, 'loss/train': 1.297493577003479} -08/30/2021 21:04:24 - INFO - __main__ - Step 43960: {'lr': 0.000407224222133741, 'samples': 8440320, 'steps': 43959, 'loss/train': 1.605318546295166} -08/30/2021 21:04:24 - INFO - __main__ - Step 43961: {'lr': 0.00040722009616447094, 'samples': 8440512, 'steps': 43960, 'loss/train': 0.9258254766464233} -08/30/2021 21:04:24 - INFO - __main__ - Step 43962: {'lr': 0.0004072159701243599, 'samples': 8440704, 'steps': 43961, 'loss/train': 1.8031784296035767} -08/30/2021 21:04:25 - INFO - __main__ - Step 43963: {'lr': 0.00040721184401340977, 'samples': 8440896, 'steps': 43962, 'loss/train': 1.1122639179229736} -08/30/2021 21:04:25 - INFO - __main__ - Step 43964: {'lr': 0.00040720771783162236, 'samples': 8441088, 'steps': 43963, 'loss/train': 2.069490671157837} -08/30/2021 21:04:27 - INFO - __main__ - Step 43965: {'lr': 0.0004072035915789997, 'samples': 8441280, 'steps': 43964, 'loss/train': 1.6985869407653809} -08/30/2021 21:04:27 - INFO - __main__ - Step 43966: {'lr': 0.0004071994652555434, 'samples': 8441472, 'steps': 43965, 'loss/train': 1.697348952293396} -08/30/2021 21:04:27 - INFO - __main__ - Step 43967: {'lr': 0.0004071953388612555, 'samples': 8441664, 'steps': 43966, 'loss/train': 1.953321933746338} -08/30/2021 21:04:28 - INFO - __main__ - Step 43968: {'lr': 0.0004071912123961379, 'samples': 8441856, 'steps': 43967, 'loss/train': 1.9049609899520874} -08/30/2021 21:04:28 - INFO - __main__ - Step 43969: {'lr': 0.00040718708586019226, 'samples': 8442048, 'steps': 43968, 'loss/train': 2.4460678100585938} -08/30/2021 21:04:30 - INFO - __main__ - Step 43970: {'lr': 0.00040718295925342053, 'samples': 8442240, 'steps': 43969, 'loss/train': 1.5364702939987183} -08/30/2021 21:04:30 - INFO - __main__ - Step 43971: {'lr': 0.0004071788325758246, 'samples': 8442432, 'steps': 43970, 'loss/train': 1.694097876548767} -08/30/2021 21:04:31 - INFO - __main__ - Step 43972: {'lr': 0.00040717470582740634, 'samples': 8442624, 'steps': 43971, 'loss/train': 1.186929702758789} -08/30/2021 21:04:31 - INFO - __main__ - Step 43973: {'lr': 0.0004071705790081676, 'samples': 8442816, 'steps': 43972, 'loss/train': 1.6415050029754639} -08/30/2021 21:04:31 - INFO - __main__ - Step 43974: {'lr': 0.0004071664521181102, 'samples': 8443008, 'steps': 43973, 'loss/train': 1.6543328762054443} -08/30/2021 21:04:32 - INFO - __main__ - Step 43975: {'lr': 0.00040716232515723596, 'samples': 8443200, 'steps': 43974, 'loss/train': 0.9742529988288879} -08/30/2021 21:04:33 - INFO - __main__ - Step 43976: {'lr': 0.00040715819812554686, 'samples': 8443392, 'steps': 43975, 'loss/train': 1.328025460243225} -08/30/2021 21:04:34 - INFO - __main__ - Step 43977: {'lr': 0.0004071540710230447, 'samples': 8443584, 'steps': 43976, 'loss/train': 1.250742793083191} -08/30/2021 21:04:34 - INFO - __main__ - Step 43978: {'lr': 0.0004071499438497314, 'samples': 8443776, 'steps': 43977, 'loss/train': 1.7461166381835938} -08/30/2021 21:04:34 - INFO - __main__ - Step 43979: {'lr': 0.0004071458166056087, 'samples': 8443968, 'steps': 43978, 'loss/train': 1.1584110260009766} -08/30/2021 21:04:35 - INFO - __main__ - Step 43980: {'lr': 0.00040714168929067854, 'samples': 8444160, 'steps': 43979, 'loss/train': 1.5158499479293823} -08/30/2021 21:04:36 - INFO - __main__ - Step 43981: {'lr': 0.0004071375619049427, 'samples': 8444352, 'steps': 43980, 'loss/train': 0.52995365858078} -08/30/2021 21:04:36 - INFO - __main__ - Step 43982: {'lr': 0.0004071334344484031, 'samples': 8444544, 'steps': 43981, 'loss/train': 1.6067311763763428} -08/30/2021 21:04:37 - INFO - __main__ - Step 43983: {'lr': 0.00040712930692106164, 'samples': 8444736, 'steps': 43982, 'loss/train': 1.567029595375061} -08/30/2021 21:04:37 - INFO - __main__ - Step 43984: {'lr': 0.00040712517932292016, 'samples': 8444928, 'steps': 43983, 'loss/train': 1.1418006420135498} -08/30/2021 21:04:37 - INFO - __main__ - Step 43985: {'lr': 0.00040712105165398044, 'samples': 8445120, 'steps': 43984, 'loss/train': 1.5418975353240967} -08/30/2021 21:04:40 - INFO - __main__ - Step 43986: {'lr': 0.0004071169239142445, 'samples': 8445312, 'steps': 43985, 'loss/train': 0.8572920560836792} -08/30/2021 21:04:40 - INFO - __main__ - Step 43987: {'lr': 0.000407112796103714, 'samples': 8445504, 'steps': 43986, 'loss/train': 1.5083720684051514} -08/30/2021 21:04:41 - INFO - __main__ - Step 43988: {'lr': 0.0004071086682223909, 'samples': 8445696, 'steps': 43987, 'loss/train': 1.4546016454696655} -08/30/2021 21:04:41 - INFO - __main__ - Step 43989: {'lr': 0.0004071045402702771, 'samples': 8445888, 'steps': 43988, 'loss/train': 1.4353991746902466} -08/30/2021 21:04:41 - INFO - __main__ - Step 43990: {'lr': 0.0004071004122473744, 'samples': 8446080, 'steps': 43989, 'loss/train': 4.287884712219238} -08/30/2021 21:04:42 - INFO - __main__ - Step 43991: {'lr': 0.0004070962841536847, 'samples': 8446272, 'steps': 43990, 'loss/train': 3.6109960079193115} -08/30/2021 21:04:42 - INFO - __main__ - Step 43992: {'lr': 0.0004070921559892098, 'samples': 8446464, 'steps': 43991, 'loss/train': 1.8031673431396484} -08/30/2021 21:04:44 - INFO - __main__ - Step 43993: {'lr': 0.00040708802775395165, 'samples': 8446656, 'steps': 43992, 'loss/train': 1.3961414098739624} -08/30/2021 21:04:44 - INFO - __main__ - Step 43994: {'lr': 0.000407083899447912, 'samples': 8446848, 'steps': 43993, 'loss/train': 1.6908056735992432} -08/30/2021 21:04:45 - INFO - __main__ - Step 43995: {'lr': 0.00040707977107109285, 'samples': 8447040, 'steps': 43994, 'loss/train': 1.4549931287765503} -08/30/2021 21:04:45 - INFO - __main__ - Step 43996: {'lr': 0.00040707564262349594, 'samples': 8447232, 'steps': 43995, 'loss/train': 1.7547231912612915} -08/30/2021 21:04:46 - INFO - __main__ - Step 43997: {'lr': 0.0004070715141051231, 'samples': 8447424, 'steps': 43996, 'loss/train': 1.4241794347763062} -08/30/2021 21:04:46 - INFO - __main__ - Step 43998: {'lr': 0.00040706738551597634, 'samples': 8447616, 'steps': 43997, 'loss/train': 1.6100412607192993} -08/30/2021 21:04:48 - INFO - __main__ - Step 43999: {'lr': 0.0004070632568560574, 'samples': 8447808, 'steps': 43998, 'loss/train': 1.0230473279953003} -08/30/2021 21:04:48 - INFO - __main__ - Step 44000: {'lr': 0.0004070591281253682, 'samples': 8448000, 'steps': 43999, 'loss/train': 1.6883628368377686} -08/30/2021 21:04:49 - INFO - __main__ - Step 44001: {'lr': 0.0004070549993239106, 'samples': 8448192, 'steps': 44000, 'loss/train': 1.7681210041046143} -08/30/2021 21:04:49 - INFO - __main__ - Step 44002: {'lr': 0.0004070508704516864, 'samples': 8448384, 'steps': 44001, 'loss/train': 1.634460687637329} -08/30/2021 21:04:49 - INFO - __main__ - Step 44003: {'lr': 0.00040704674150869753, 'samples': 8448576, 'steps': 44002, 'loss/train': 0.09653045237064362} -08/30/2021 21:04:51 - INFO - __main__ - Step 44004: {'lr': 0.0004070426124949458, 'samples': 8448768, 'steps': 44003, 'loss/train': 1.0189266204833984} -08/30/2021 21:04:52 - INFO - __main__ - Step 44005: {'lr': 0.00040703848341043313, 'samples': 8448960, 'steps': 44004, 'loss/train': 1.2246114015579224} -08/30/2021 21:04:52 - INFO - __main__ - Step 44006: {'lr': 0.00040703435425516136, 'samples': 8449152, 'steps': 44005, 'loss/train': 1.3576551675796509} -08/30/2021 21:04:53 - INFO - __main__ - Step 44007: {'lr': 0.0004070302250291322, 'samples': 8449344, 'steps': 44006, 'loss/train': 1.2517186403274536} -08/30/2021 21:04:53 - INFO - __main__ - Step 44008: {'lr': 0.0004070260957323478, 'samples': 8449536, 'steps': 44007, 'loss/train': 0.9721700549125671} -08/30/2021 21:04:54 - INFO - __main__ - Step 44009: {'lr': 0.0004070219663648098, 'samples': 8449728, 'steps': 44008, 'loss/train': 0.29462742805480957} -08/30/2021 21:04:55 - INFO - __main__ - Step 44010: {'lr': 0.0004070178369265201, 'samples': 8449920, 'steps': 44009, 'loss/train': 1.1606645584106445} -08/30/2021 21:04:55 - INFO - __main__ - Step 44011: {'lr': 0.00040701370741748057, 'samples': 8450112, 'steps': 44010, 'loss/train': 1.4054937362670898} -08/30/2021 21:04:56 - INFO - __main__ - Step 44012: {'lr': 0.0004070095778376932, 'samples': 8450304, 'steps': 44011, 'loss/train': 1.9526406526565552} -08/30/2021 21:04:56 - INFO - __main__ - Step 44013: {'lr': 0.0004070054481871597, 'samples': 8450496, 'steps': 44012, 'loss/train': 1.422410011291504} -08/30/2021 21:04:56 - INFO - __main__ - Step 44014: {'lr': 0.00040700131846588185, 'samples': 8450688, 'steps': 44013, 'loss/train': 0.7295418977737427} -08/30/2021 21:04:58 - INFO - __main__ - Step 44015: {'lr': 0.0004069971886738617, 'samples': 8450880, 'steps': 44014, 'loss/train': 0.7755770683288574} -08/30/2021 21:04:58 - INFO - __main__ - Step 44016: {'lr': 0.00040699305881110103, 'samples': 8451072, 'steps': 44015, 'loss/train': 0.23817451298236847} -08/30/2021 21:04:59 - INFO - __main__ - Step 44017: {'lr': 0.00040698892887760174, 'samples': 8451264, 'steps': 44016, 'loss/train': 1.6032133102416992} -08/30/2021 21:04:59 - INFO - __main__ - Step 44018: {'lr': 0.00040698479887336567, 'samples': 8451456, 'steps': 44017, 'loss/train': 0.8851715922355652} -08/30/2021 21:04:59 - INFO - __main__ - Step 44019: {'lr': 0.00040698066879839463, 'samples': 8451648, 'steps': 44018, 'loss/train': 1.801906943321228} -08/30/2021 21:05:01 - INFO - __main__ - Step 44020: {'lr': 0.00040697653865269057, 'samples': 8451840, 'steps': 44019, 'loss/train': 1.512095332145691} -08/30/2021 21:05:01 - INFO - __main__ - Step 44021: {'lr': 0.00040697240843625527, 'samples': 8452032, 'steps': 44020, 'loss/train': 1.5614702701568604} -08/30/2021 21:05:02 - INFO - __main__ - Step 44022: {'lr': 0.00040696827814909063, 'samples': 8452224, 'steps': 44021, 'loss/train': 1.474902629852295} -08/30/2021 21:05:02 - INFO - __main__ - Step 44023: {'lr': 0.0004069641477911985, 'samples': 8452416, 'steps': 44022, 'loss/train': 1.4494317770004272} -08/30/2021 21:05:02 - INFO - __main__ - Step 44024: {'lr': 0.00040696001736258077, 'samples': 8452608, 'steps': 44023, 'loss/train': 1.4783082008361816} -08/30/2021 21:05:03 - INFO - __main__ - Step 44025: {'lr': 0.0004069558868632393, 'samples': 8452800, 'steps': 44024, 'loss/train': 1.7977288961410522} -08/30/2021 21:05:04 - INFO - __main__ - Step 44026: {'lr': 0.0004069517562931759, 'samples': 8452992, 'steps': 44025, 'loss/train': 0.8883320093154907} -08/30/2021 21:05:05 - INFO - __main__ - Step 44027: {'lr': 0.0004069476256523924, 'samples': 8453184, 'steps': 44026, 'loss/train': 1.756035327911377} -08/30/2021 21:05:05 - INFO - __main__ - Step 44028: {'lr': 0.0004069434949408908, 'samples': 8453376, 'steps': 44027, 'loss/train': 1.7327704429626465} -08/30/2021 21:05:05 - INFO - __main__ - Step 44029: {'lr': 0.0004069393641586728, 'samples': 8453568, 'steps': 44028, 'loss/train': 1.2854416370391846} -08/30/2021 21:05:06 - INFO - __main__ - Step 44030: {'lr': 0.00040693523330574043, 'samples': 8453760, 'steps': 44029, 'loss/train': 1.326966404914856} -08/30/2021 21:05:07 - INFO - __main__ - Step 44031: {'lr': 0.0004069311023820954, 'samples': 8453952, 'steps': 44030, 'loss/train': 0.4490516483783722} -08/30/2021 21:05:08 - INFO - __main__ - Step 44032: {'lr': 0.0004069269713877397, 'samples': 8454144, 'steps': 44031, 'loss/train': 1.516026258468628} -08/30/2021 21:05:08 - INFO - __main__ - Step 44033: {'lr': 0.00040692284032267515, 'samples': 8454336, 'steps': 44032, 'loss/train': 1.405348539352417} -08/30/2021 21:05:08 - INFO - __main__ - Step 44034: {'lr': 0.0004069187091869035, 'samples': 8454528, 'steps': 44033, 'loss/train': 1.6795917749404907} -08/30/2021 21:05:09 - INFO - __main__ - Step 44035: {'lr': 0.00040691457798042673, 'samples': 8454720, 'steps': 44034, 'loss/train': 1.501344084739685} -08/30/2021 21:05:10 - INFO - __main__ - Step 44036: {'lr': 0.00040691044670324673, 'samples': 8454912, 'steps': 44035, 'loss/train': 1.3635294437408447} -08/30/2021 21:05:11 - INFO - __main__ - Step 44037: {'lr': 0.00040690631535536526, 'samples': 8455104, 'steps': 44036, 'loss/train': 1.8514584302902222} -08/30/2021 21:05:11 - INFO - __main__ - Step 44038: {'lr': 0.00040690218393678426, 'samples': 8455296, 'steps': 44037, 'loss/train': 1.7052663564682007} -08/30/2021 21:05:11 - INFO - __main__ - Step 44039: {'lr': 0.0004068980524475054, 'samples': 8455488, 'steps': 44038, 'loss/train': 0.9369568824768066} -08/30/2021 21:05:12 - INFO - __main__ - Step 44040: {'lr': 0.00040689392088753097, 'samples': 8455680, 'steps': 44039, 'loss/train': 1.6158311367034912} -08/30/2021 21:05:13 - INFO - __main__ - Step 44041: {'lr': 0.00040688978925686235, 'samples': 8455872, 'steps': 44040, 'loss/train': 1.236326813697815} -08/30/2021 21:05:14 - INFO - __main__ - Step 44042: {'lr': 0.00040688565755550164, 'samples': 8456064, 'steps': 44041, 'loss/train': 1.429333209991455} -08/30/2021 21:05:14 - INFO - __main__ - Step 44043: {'lr': 0.00040688152578345074, 'samples': 8456256, 'steps': 44042, 'loss/train': 1.495693325996399} -08/30/2021 21:05:14 - INFO - __main__ - Step 44044: {'lr': 0.0004068773939407114, 'samples': 8456448, 'steps': 44043, 'loss/train': 2.3508682250976562} -08/30/2021 21:05:15 - INFO - __main__ - Step 44045: {'lr': 0.0004068732620272856, 'samples': 8456640, 'steps': 44044, 'loss/train': 1.1969764232635498} -08/30/2021 21:05:16 - INFO - __main__ - Step 44046: {'lr': 0.000406869130043175, 'samples': 8456832, 'steps': 44045, 'loss/train': 1.5663310289382935} -08/30/2021 21:05:17 - INFO - __main__ - Step 44047: {'lr': 0.0004068649979883817, 'samples': 8457024, 'steps': 44046, 'loss/train': 1.184269905090332} -08/30/2021 21:05:17 - INFO - __main__ - Step 44048: {'lr': 0.0004068608658629074, 'samples': 8457216, 'steps': 44047, 'loss/train': 1.5107033252716064} -08/30/2021 21:05:17 - INFO - __main__ - Step 44049: {'lr': 0.000406856733666754, 'samples': 8457408, 'steps': 44048, 'loss/train': 1.5339034795761108} -08/30/2021 21:05:18 - INFO - __main__ - Step 44050: {'lr': 0.00040685260139992343, 'samples': 8457600, 'steps': 44049, 'loss/train': 3.922504425048828} -08/30/2021 21:05:18 - INFO - __main__ - Step 44051: {'lr': 0.00040684846906241745, 'samples': 8457792, 'steps': 44050, 'loss/train': 1.319611668586731} -08/30/2021 21:05:20 - INFO - __main__ - Step 44052: {'lr': 0.000406844336654238, 'samples': 8457984, 'steps': 44051, 'loss/train': 1.6890438795089722} -08/30/2021 21:05:20 - INFO - __main__ - Step 44053: {'lr': 0.00040684020417538694, 'samples': 8458176, 'steps': 44052, 'loss/train': 1.6068098545074463} -08/30/2021 21:05:20 - INFO - __main__ - Step 44054: {'lr': 0.00040683607162586604, 'samples': 8458368, 'steps': 44053, 'loss/train': 1.1027469635009766} -08/30/2021 21:05:21 - INFO - __main__ - Step 44055: {'lr': 0.00040683193900567727, 'samples': 8458560, 'steps': 44054, 'loss/train': 1.6322596073150635} -08/30/2021 21:05:21 - INFO - __main__ - Step 44056: {'lr': 0.00040682780631482243, 'samples': 8458752, 'steps': 44055, 'loss/train': 1.3942008018493652} -08/30/2021 21:05:23 - INFO - __main__ - Step 44057: {'lr': 0.0004068236735533034, 'samples': 8458944, 'steps': 44056, 'loss/train': 1.5049303770065308} -08/30/2021 21:05:23 - INFO - __main__ - Step 44058: {'lr': 0.00040681954072112206, 'samples': 8459136, 'steps': 44057, 'loss/train': 1.6280584335327148} -08/30/2021 21:05:24 - INFO - __main__ - Step 44059: {'lr': 0.0004068154078182802, 'samples': 8459328, 'steps': 44058, 'loss/train': 1.3362181186676025} -08/30/2021 21:05:24 - INFO - __main__ - Step 44060: {'lr': 0.00040681127484477983, 'samples': 8459520, 'steps': 44059, 'loss/train': 1.1541709899902344} -08/30/2021 21:05:24 - INFO - __main__ - Step 44061: {'lr': 0.0004068071418006226, 'samples': 8459712, 'steps': 44060, 'loss/train': 0.5931140780448914} -08/30/2021 21:05:25 - INFO - __main__ - Step 44062: {'lr': 0.0004068030086858106, 'samples': 8459904, 'steps': 44061, 'loss/train': 0.5837137699127197} -08/30/2021 21:05:27 - INFO - __main__ - Step 44063: {'lr': 0.00040679887550034555, 'samples': 8460096, 'steps': 44062, 'loss/train': 1.3376882076263428} -08/30/2021 21:05:27 - INFO - __main__ - Step 44064: {'lr': 0.0004067947422442293, 'samples': 8460288, 'steps': 44063, 'loss/train': 0.8842340707778931} -08/30/2021 21:05:28 - INFO - __main__ - Step 44065: {'lr': 0.00040679060891746384, 'samples': 8460480, 'steps': 44064, 'loss/train': 1.1304583549499512} -08/30/2021 21:05:28 - INFO - __main__ - Step 44066: {'lr': 0.00040678647552005087, 'samples': 8460672, 'steps': 44065, 'loss/train': 1.2364016771316528} -08/30/2021 21:05:28 - INFO - __main__ - Step 44067: {'lr': 0.00040678234205199237, 'samples': 8460864, 'steps': 44066, 'loss/train': 1.329094409942627} -08/30/2021 21:05:30 - INFO - __main__ - Step 44068: {'lr': 0.0004067782085132902, 'samples': 8461056, 'steps': 44067, 'loss/train': 1.4064669609069824} -08/30/2021 21:05:30 - INFO - __main__ - Step 44069: {'lr': 0.00040677407490394616, 'samples': 8461248, 'steps': 44068, 'loss/train': 1.4992949962615967} -08/30/2021 21:05:31 - INFO - __main__ - Step 44070: {'lr': 0.0004067699412239622, 'samples': 8461440, 'steps': 44069, 'loss/train': 1.8124302625656128} -08/30/2021 21:05:31 - INFO - __main__ - Step 44071: {'lr': 0.00040676580747334, 'samples': 8461632, 'steps': 44070, 'loss/train': 1.4818695783615112} -08/30/2021 21:05:31 - INFO - __main__ - Step 44072: {'lr': 0.0004067616736520816, 'samples': 8461824, 'steps': 44071, 'loss/train': 1.3591928482055664} -08/30/2021 21:05:33 - INFO - __main__ - Step 44073: {'lr': 0.0004067575397601888, 'samples': 8462016, 'steps': 44072, 'loss/train': 1.4126721620559692} -08/30/2021 21:05:33 - INFO - __main__ - Step 44074: {'lr': 0.0004067534057976635, 'samples': 8462208, 'steps': 44073, 'loss/train': 1.7215222120285034} -08/30/2021 21:05:34 - INFO - __main__ - Step 44075: {'lr': 0.0004067492717645075, 'samples': 8462400, 'steps': 44074, 'loss/train': 1.1917779445648193} -08/30/2021 21:05:34 - INFO - __main__ - Step 44076: {'lr': 0.00040674513766072274, 'samples': 8462592, 'steps': 44075, 'loss/train': 1.491504192352295} -08/30/2021 21:05:34 - INFO - __main__ - Step 44077: {'lr': 0.000406741003486311, 'samples': 8462784, 'steps': 44076, 'loss/train': 1.7367831468582153} -08/30/2021 21:05:36 - INFO - __main__ - Step 44078: {'lr': 0.00040673686924127416, 'samples': 8462976, 'steps': 44077, 'loss/train': 1.3610408306121826} -08/30/2021 21:05:36 - INFO - __main__ - Step 44079: {'lr': 0.0004067327349256142, 'samples': 8463168, 'steps': 44078, 'loss/train': 1.1683216094970703} -08/30/2021 21:05:37 - INFO - __main__ - Step 44080: {'lr': 0.00040672860053933286, 'samples': 8463360, 'steps': 44079, 'loss/train': 1.4513936042785645} -08/30/2021 21:05:37 - INFO - __main__ - Step 44081: {'lr': 0.00040672446608243194, 'samples': 8463552, 'steps': 44080, 'loss/train': 1.4032937288284302} -08/30/2021 21:05:37 - INFO - __main__ - Step 44082: {'lr': 0.0004067203315549135, 'samples': 8463744, 'steps': 44081, 'loss/train': 1.293398141860962} -08/30/2021 21:05:39 - INFO - __main__ - Step 44083: {'lr': 0.00040671619695677923, 'samples': 8463936, 'steps': 44082, 'loss/train': 0.9986708760261536} -08/30/2021 21:05:39 - INFO - __main__ - Step 44084: {'lr': 0.00040671206228803117, 'samples': 8464128, 'steps': 44083, 'loss/train': 1.7144861221313477} -08/30/2021 21:05:40 - INFO - __main__ - Step 44085: {'lr': 0.0004067079275486709, 'samples': 8464320, 'steps': 44084, 'loss/train': 1.4291151762008667} -08/30/2021 21:05:40 - INFO - __main__ - Step 44086: {'lr': 0.00040670379273870054, 'samples': 8464512, 'steps': 44085, 'loss/train': 1.1487314701080322} -08/30/2021 21:05:40 - INFO - __main__ - Step 44087: {'lr': 0.00040669965785812193, 'samples': 8464704, 'steps': 44086, 'loss/train': 1.2978435754776} -08/30/2021 21:05:42 - INFO - __main__ - Step 44088: {'lr': 0.00040669552290693677, 'samples': 8464896, 'steps': 44087, 'loss/train': 1.4583364725112915} -08/30/2021 21:05:42 - INFO - __main__ - Step 44089: {'lr': 0.0004066913878851471, 'samples': 8465088, 'steps': 44088, 'loss/train': 1.3761975765228271} -08/30/2021 21:05:43 - INFO - __main__ - Step 44090: {'lr': 0.00040668725279275464, 'samples': 8465280, 'steps': 44089, 'loss/train': 1.0192394256591797} -08/30/2021 21:05:43 - INFO - __main__ - Step 44091: {'lr': 0.0004066831176297614, 'samples': 8465472, 'steps': 44090, 'loss/train': 2.068331241607666} -08/30/2021 21:05:43 - INFO - __main__ - Step 44092: {'lr': 0.0004066789823961691, 'samples': 8465664, 'steps': 44091, 'loss/train': 1.458799958229065} -08/30/2021 21:05:44 - INFO - __main__ - Step 44093: {'lr': 0.00040667484709197967, 'samples': 8465856, 'steps': 44092, 'loss/train': 1.0155807733535767} -08/30/2021 21:05:45 - INFO - __main__ - Step 44094: {'lr': 0.00040667071171719503, 'samples': 8466048, 'steps': 44093, 'loss/train': 1.2309426069259644} -08/30/2021 21:05:46 - INFO - __main__ - Step 44095: {'lr': 0.00040666657627181697, 'samples': 8466240, 'steps': 44094, 'loss/train': 1.088587760925293} -08/30/2021 21:05:46 - INFO - __main__ - Step 44096: {'lr': 0.00040666244075584736, 'samples': 8466432, 'steps': 44095, 'loss/train': 1.5288745164871216} -08/30/2021 21:05:46 - INFO - __main__ - Step 44097: {'lr': 0.000406658305169288, 'samples': 8466624, 'steps': 44096, 'loss/train': 1.044421911239624} -08/30/2021 21:05:47 - INFO - __main__ - Step 44098: {'lr': 0.000406654169512141, 'samples': 8466816, 'steps': 44097, 'loss/train': 1.3983596563339233} -08/30/2021 21:05:48 - INFO - __main__ - Step 44099: {'lr': 0.0004066500337844078, 'samples': 8467008, 'steps': 44098, 'loss/train': 1.4583714008331299} -08/30/2021 21:05:49 - INFO - __main__ - Step 44100: {'lr': 0.0004066458979860907, 'samples': 8467200, 'steps': 44099, 'loss/train': 1.4323664903640747} -08/30/2021 21:05:49 - INFO - __main__ - Step 44101: {'lr': 0.00040664176211719136, 'samples': 8467392, 'steps': 44100, 'loss/train': 0.8173502683639526} -08/30/2021 21:05:50 - INFO - __main__ - Step 44102: {'lr': 0.00040663762617771163, 'samples': 8467584, 'steps': 44101, 'loss/train': 0.12298928946256638} -08/30/2021 21:05:50 - INFO - __main__ - Step 44103: {'lr': 0.00040663349016765337, 'samples': 8467776, 'steps': 44102, 'loss/train': 1.1373111009597778} -08/30/2021 21:05:52 - INFO - __main__ - Step 44104: {'lr': 0.00040662935408701853, 'samples': 8467968, 'steps': 44103, 'loss/train': 1.406807780265808} -08/30/2021 21:05:52 - INFO - __main__ - Step 44105: {'lr': 0.00040662521793580886, 'samples': 8468160, 'steps': 44104, 'loss/train': 1.4186218976974487} -08/30/2021 21:05:53 - INFO - __main__ - Step 44106: {'lr': 0.0004066210817140263, 'samples': 8468352, 'steps': 44105, 'loss/train': 1.270269513130188} -08/30/2021 21:05:53 - INFO - __main__ - Step 44107: {'lr': 0.0004066169454216727, 'samples': 8468544, 'steps': 44106, 'loss/train': 0.07096153497695923} -08/30/2021 21:05:53 - INFO - __main__ - Step 44108: {'lr': 0.00040661280905875, 'samples': 8468736, 'steps': 44107, 'loss/train': 1.267858624458313} -08/30/2021 21:05:54 - INFO - __main__ - Step 44109: {'lr': 0.0004066086726252599, 'samples': 8468928, 'steps': 44108, 'loss/train': 1.168114423751831} -08/30/2021 21:05:55 - INFO - __main__ - Step 44110: {'lr': 0.0004066045361212043, 'samples': 8469120, 'steps': 44109, 'loss/train': 1.3575265407562256} -08/30/2021 21:05:56 - INFO - __main__ - Step 44111: {'lr': 0.00040660039954658523, 'samples': 8469312, 'steps': 44110, 'loss/train': 1.1176503896713257} -08/30/2021 21:05:56 - INFO - __main__ - Step 44112: {'lr': 0.0004065962629014044, 'samples': 8469504, 'steps': 44111, 'loss/train': 1.4290441274642944} -08/30/2021 21:05:56 - INFO - __main__ - Step 44113: {'lr': 0.00040659212618566364, 'samples': 8469696, 'steps': 44112, 'loss/train': 0.9308264851570129} -08/30/2021 21:05:57 - INFO - __main__ - Step 44114: {'lr': 0.000406587989399365, 'samples': 8469888, 'steps': 44113, 'loss/train': 1.6912705898284912} -08/30/2021 21:05:57 - INFO - __main__ - Step 44115: {'lr': 0.0004065838525425102, 'samples': 8470080, 'steps': 44114, 'loss/train': 1.562868595123291} -08/30/2021 21:05:59 - INFO - __main__ - Step 44116: {'lr': 0.00040657971561510104, 'samples': 8470272, 'steps': 44115, 'loss/train': 1.3296985626220703} -08/30/2021 21:05:59 - INFO - __main__ - Step 44117: {'lr': 0.00040657557861713956, 'samples': 8470464, 'steps': 44116, 'loss/train': 0.8412728905677795} -08/30/2021 21:06:00 - INFO - __main__ - Step 44118: {'lr': 0.00040657144154862746, 'samples': 8470656, 'steps': 44117, 'loss/train': 1.5692476034164429} -08/30/2021 21:06:00 - INFO - __main__ - Step 44119: {'lr': 0.00040656730440956677, 'samples': 8470848, 'steps': 44118, 'loss/train': 1.500753402709961} -08/30/2021 21:06:00 - INFO - __main__ - Step 44120: {'lr': 0.0004065631671999592, 'samples': 8471040, 'steps': 44119, 'loss/train': 1.0208393335342407} -08/30/2021 21:06:02 - INFO - __main__ - Step 44121: {'lr': 0.0004065590299198068, 'samples': 8471232, 'steps': 44120, 'loss/train': 0.2500440776348114} -08/30/2021 21:06:02 - INFO - __main__ - Step 44122: {'lr': 0.00040655489256911123, 'samples': 8471424, 'steps': 44121, 'loss/train': 1.3094968795776367} -08/30/2021 21:06:03 - INFO - __main__ - Step 44123: {'lr': 0.00040655075514787445, 'samples': 8471616, 'steps': 44122, 'loss/train': 1.3478151559829712} -08/30/2021 21:06:03 - INFO - __main__ - Step 44124: {'lr': 0.0004065466176560983, 'samples': 8471808, 'steps': 44123, 'loss/train': 1.3414958715438843} -08/30/2021 21:06:03 - INFO - __main__ - Step 44125: {'lr': 0.0004065424800937847, 'samples': 8472000, 'steps': 44124, 'loss/train': 1.5347563028335571} -08/30/2021 21:06:05 - INFO - __main__ - Step 44126: {'lr': 0.0004065383424609354, 'samples': 8472192, 'steps': 44125, 'loss/train': 0.9165471196174622} -08/30/2021 21:06:05 - INFO - __main__ - Step 44127: {'lr': 0.00040653420475755245, 'samples': 8472384, 'steps': 44126, 'loss/train': 1.5624030828475952} -08/30/2021 21:06:06 - INFO - __main__ - Step 44128: {'lr': 0.0004065300669836375, 'samples': 8472576, 'steps': 44127, 'loss/train': 1.4960596561431885} -08/30/2021 21:06:06 - INFO - __main__ - Step 44129: {'lr': 0.0004065259291391926, 'samples': 8472768, 'steps': 44128, 'loss/train': 1.1617436408996582} -08/30/2021 21:06:06 - INFO - __main__ - Step 44130: {'lr': 0.0004065217912242195, 'samples': 8472960, 'steps': 44129, 'loss/train': 1.5795999765396118} -08/30/2021 21:06:08 - INFO - __main__ - Step 44131: {'lr': 0.00040651765323872, 'samples': 8473152, 'steps': 44130, 'loss/train': 1.4055019617080688} -08/30/2021 21:06:08 - INFO - __main__ - Step 44132: {'lr': 0.0004065135151826962, 'samples': 8473344, 'steps': 44131, 'loss/train': 1.4845198392868042} -08/30/2021 21:06:09 - INFO - __main__ - Step 44133: {'lr': 0.00040650937705614975, 'samples': 8473536, 'steps': 44132, 'loss/train': 1.2122938632965088} -08/30/2021 21:06:09 - INFO - __main__ - Step 44134: {'lr': 0.0004065052388590826, 'samples': 8473728, 'steps': 44133, 'loss/train': 1.4062912464141846} -08/30/2021 21:06:09 - INFO - __main__ - Step 44135: {'lr': 0.00040650110059149664, 'samples': 8473920, 'steps': 44134, 'loss/train': 1.6718124151229858} -08/30/2021 21:06:11 - INFO - __main__ - Step 44136: {'lr': 0.0004064969622533937, 'samples': 8474112, 'steps': 44135, 'loss/train': 1.1252530813217163} -08/30/2021 21:06:11 - INFO - __main__ - Step 44137: {'lr': 0.0004064928238447756, 'samples': 8474304, 'steps': 44136, 'loss/train': 0.7014845013618469} -08/30/2021 21:06:12 - INFO - __main__ - Step 44138: {'lr': 0.00040648868536564427, 'samples': 8474496, 'steps': 44137, 'loss/train': 1.4529163837432861} -08/30/2021 21:06:12 - INFO - __main__ - Step 44139: {'lr': 0.00040648454681600153, 'samples': 8474688, 'steps': 44138, 'loss/train': 1.6480276584625244} -08/30/2021 21:06:12 - INFO - __main__ - Step 44140: {'lr': 0.0004064804081958493, 'samples': 8474880, 'steps': 44139, 'loss/train': 1.2589802742004395} -08/30/2021 21:06:14 - INFO - __main__ - Step 44141: {'lr': 0.00040647626950518945, 'samples': 8475072, 'steps': 44140, 'loss/train': 1.8385587930679321} -08/30/2021 21:06:14 - INFO - __main__ - Step 44142: {'lr': 0.00040647213074402374, 'samples': 8475264, 'steps': 44141, 'loss/train': 1.5320193767547607} -08/30/2021 21:06:15 - INFO - __main__ - Step 44143: {'lr': 0.0004064679919123541, 'samples': 8475456, 'steps': 44142, 'loss/train': 1.4705506563186646} -08/30/2021 21:06:15 - INFO - __main__ - Step 44144: {'lr': 0.00040646385301018243, 'samples': 8475648, 'steps': 44143, 'loss/train': 1.7159574031829834} -08/30/2021 21:06:15 - INFO - __main__ - Step 44145: {'lr': 0.0004064597140375105, 'samples': 8475840, 'steps': 44144, 'loss/train': 1.5686514377593994} -08/30/2021 21:06:17 - INFO - __main__ - Step 44146: {'lr': 0.00040645557499434035, 'samples': 8476032, 'steps': 44145, 'loss/train': 1.5966949462890625} -08/30/2021 21:06:17 - INFO - __main__ - Step 44147: {'lr': 0.0004064514358806737, 'samples': 8476224, 'steps': 44146, 'loss/train': 1.3904095888137817} -08/30/2021 21:06:18 - INFO - __main__ - Step 44148: {'lr': 0.00040644729669651235, 'samples': 8476416, 'steps': 44147, 'loss/train': 1.3803188800811768} -08/30/2021 21:06:18 - INFO - __main__ - Step 44149: {'lr': 0.0004064431574418583, 'samples': 8476608, 'steps': 44148, 'loss/train': 1.4059433937072754} -08/30/2021 21:06:18 - INFO - __main__ - Step 44150: {'lr': 0.00040643901811671345, 'samples': 8476800, 'steps': 44149, 'loss/train': 1.6222126483917236} -08/30/2021 21:06:20 - INFO - __main__ - Step 44151: {'lr': 0.0004064348787210795, 'samples': 8476992, 'steps': 44150, 'loss/train': 1.2151063680648804} -08/30/2021 21:06:20 - INFO - __main__ - Step 44152: {'lr': 0.0004064307392549585, 'samples': 8477184, 'steps': 44151, 'loss/train': 1.2867988348007202} -08/30/2021 21:06:20 - INFO - __main__ - Step 44153: {'lr': 0.00040642659971835217, 'samples': 8477376, 'steps': 44152, 'loss/train': 0.3661315441131592} -08/30/2021 21:06:21 - INFO - __main__ - Step 44154: {'lr': 0.0004064224601112625, 'samples': 8477568, 'steps': 44153, 'loss/train': 1.40620756149292} -08/30/2021 21:06:21 - INFO - __main__ - Step 44155: {'lr': 0.0004064183204336912, 'samples': 8477760, 'steps': 44154, 'loss/train': 1.3225756883621216} -08/30/2021 21:06:23 - INFO - __main__ - Step 44156: {'lr': 0.00040641418068564024, 'samples': 8477952, 'steps': 44155, 'loss/train': 0.6734851598739624} -08/30/2021 21:06:23 - INFO - __main__ - Step 44157: {'lr': 0.0004064100408671114, 'samples': 8478144, 'steps': 44156, 'loss/train': 1.5098363161087036} -08/30/2021 21:06:23 - INFO - __main__ - Step 44158: {'lr': 0.0004064059009781067, 'samples': 8478336, 'steps': 44157, 'loss/train': 1.511729121208191} -08/30/2021 21:06:24 - INFO - __main__ - Step 44159: {'lr': 0.0004064017610186279, 'samples': 8478528, 'steps': 44158, 'loss/train': 1.451151967048645} -08/30/2021 21:06:24 - INFO - __main__ - Step 44160: {'lr': 0.00040639762098867684, 'samples': 8478720, 'steps': 44159, 'loss/train': 0.9728785753250122} -08/30/2021 21:06:26 - INFO - __main__ - Step 44161: {'lr': 0.0004063934808882555, 'samples': 8478912, 'steps': 44160, 'loss/train': 1.5216493606567383} -08/30/2021 21:06:26 - INFO - __main__ - Step 44162: {'lr': 0.0004063893407173656, 'samples': 8479104, 'steps': 44161, 'loss/train': 1.3516279458999634} -08/30/2021 21:06:27 - INFO - __main__ - Step 44163: {'lr': 0.00040638520047600916, 'samples': 8479296, 'steps': 44162, 'loss/train': 1.7257524728775024} -08/30/2021 21:06:27 - INFO - __main__ - Step 44164: {'lr': 0.00040638106016418785, 'samples': 8479488, 'steps': 44163, 'loss/train': 1.6789913177490234} -08/30/2021 21:06:27 - INFO - __main__ - Step 44165: {'lr': 0.0004063769197819037, 'samples': 8479680, 'steps': 44164, 'loss/train': 1.4162310361862183} -08/30/2021 21:06:28 - INFO - __main__ - Step 44166: {'lr': 0.0004063727793291585, 'samples': 8479872, 'steps': 44165, 'loss/train': 1.1711804866790771} -08/30/2021 21:06:29 - INFO - __main__ - Step 44167: {'lr': 0.00040636863880595415, 'samples': 8480064, 'steps': 44166, 'loss/train': 1.2680935859680176} -08/30/2021 21:06:30 - INFO - __main__ - Step 44168: {'lr': 0.0004063644982122926, 'samples': 8480256, 'steps': 44167, 'loss/train': 1.6841156482696533} -08/30/2021 21:06:30 - INFO - __main__ - Step 44169: {'lr': 0.00040636035754817545, 'samples': 8480448, 'steps': 44168, 'loss/train': 1.058955430984497} -08/30/2021 21:06:30 - INFO - __main__ - Step 44170: {'lr': 0.00040635621681360485, 'samples': 8480640, 'steps': 44169, 'loss/train': 1.4076007604599} -08/30/2021 21:06:31 - INFO - __main__ - Step 44171: {'lr': 0.00040635207600858247, 'samples': 8480832, 'steps': 44170, 'loss/train': 0.6762776374816895} -08/30/2021 21:06:33 - INFO - __main__ - Step 44172: {'lr': 0.00040634793513311037, 'samples': 8481024, 'steps': 44171, 'loss/train': 0.8838333487510681} -08/30/2021 21:06:33 - INFO - __main__ - Step 44173: {'lr': 0.0004063437941871903, 'samples': 8481216, 'steps': 44172, 'loss/train': 1.3215932846069336} -08/30/2021 21:06:33 - INFO - __main__ - Step 44174: {'lr': 0.000406339653170824, 'samples': 8481408, 'steps': 44173, 'loss/train': 1.5783798694610596} -08/30/2021 21:06:34 - INFO - __main__ - Step 44175: {'lr': 0.00040633551208401356, 'samples': 8481600, 'steps': 44174, 'loss/train': 1.1169246435165405} -08/30/2021 21:06:34 - INFO - __main__ - Step 44176: {'lr': 0.0004063313709267607, 'samples': 8481792, 'steps': 44175, 'loss/train': 1.2964143753051758} -08/30/2021 21:06:36 - INFO - __main__ - Step 44177: {'lr': 0.0004063272296990674, 'samples': 8481984, 'steps': 44176, 'loss/train': 1.526625394821167} -08/30/2021 21:06:36 - INFO - __main__ - Step 44178: {'lr': 0.00040632308840093533, 'samples': 8482176, 'steps': 44177, 'loss/train': 0.9614483714103699} -08/30/2021 21:06:36 - INFO - __main__ - Step 44179: {'lr': 0.0004063189470323666, 'samples': 8482368, 'steps': 44178, 'loss/train': 0.8579971790313721} -08/30/2021 21:06:37 - INFO - __main__ - Step 44180: {'lr': 0.000406314805593363, 'samples': 8482560, 'steps': 44179, 'loss/train': 1.4750815629959106} -08/30/2021 21:06:37 - INFO - __main__ - Step 44181: {'lr': 0.00040631066408392636, 'samples': 8482752, 'steps': 44180, 'loss/train': 0.8314672112464905} -08/30/2021 21:06:39 - INFO - __main__ - Step 44182: {'lr': 0.0004063065225040584, 'samples': 8482944, 'steps': 44181, 'loss/train': 1.0320812463760376} -08/30/2021 21:06:39 - INFO - __main__ - Step 44183: {'lr': 0.0004063023808537613, 'samples': 8483136, 'steps': 44182, 'loss/train': 1.485159993171692} -08/30/2021 21:06:40 - INFO - __main__ - Step 44184: {'lr': 0.00040629823913303665, 'samples': 8483328, 'steps': 44183, 'loss/train': 1.607389211654663} -08/30/2021 21:06:40 - INFO - __main__ - Step 44185: {'lr': 0.0004062940973418865, 'samples': 8483520, 'steps': 44184, 'loss/train': 2.7643890380859375} -08/30/2021 21:06:40 - INFO - __main__ - Step 44186: {'lr': 0.00040628995548031254, 'samples': 8483712, 'steps': 44185, 'loss/train': 1.3176820278167725} -08/30/2021 21:06:41 - INFO - __main__ - Step 44187: {'lr': 0.00040628581354831687, 'samples': 8483904, 'steps': 44186, 'loss/train': 1.4538748264312744} -08/30/2021 21:06:42 - INFO - __main__ - Step 44188: {'lr': 0.0004062816715459011, 'samples': 8484096, 'steps': 44187, 'loss/train': 1.4020036458969116} -08/30/2021 21:06:43 - INFO - __main__ - Step 44189: {'lr': 0.0004062775294730673, 'samples': 8484288, 'steps': 44188, 'loss/train': 1.2786281108856201} -08/30/2021 21:06:43 - INFO - __main__ - Step 44190: {'lr': 0.0004062733873298172, 'samples': 8484480, 'steps': 44189, 'loss/train': 1.6497596502304077} -08/30/2021 21:06:43 - INFO - __main__ - Step 44191: {'lr': 0.0004062692451161528, 'samples': 8484672, 'steps': 44190, 'loss/train': 1.0401939153671265} -08/30/2021 21:06:44 - INFO - __main__ - Step 44192: {'lr': 0.00040626510283207586, 'samples': 8484864, 'steps': 44191, 'loss/train': 1.780696988105774} -08/30/2021 21:06:45 - INFO - __main__ - Step 44193: {'lr': 0.00040626096047758823, 'samples': 8485056, 'steps': 44192, 'loss/train': 1.407740592956543} -08/30/2021 21:06:46 - INFO - __main__ - Step 44194: {'lr': 0.0004062568180526919, 'samples': 8485248, 'steps': 44193, 'loss/train': 0.06727295368909836} -08/30/2021 21:06:46 - INFO - __main__ - Step 44195: {'lr': 0.0004062526755573886, 'samples': 8485440, 'steps': 44194, 'loss/train': 1.4399356842041016} -08/30/2021 21:06:47 - INFO - __main__ - Step 44196: {'lr': 0.00040624853299168025, 'samples': 8485632, 'steps': 44195, 'loss/train': 1.7573808431625366} -08/30/2021 21:06:47 - INFO - __main__ - Step 44197: {'lr': 0.0004062443903555687, 'samples': 8485824, 'steps': 44196, 'loss/train': 1.3407443761825562} -08/30/2021 21:06:49 - INFO - __main__ - Step 44198: {'lr': 0.0004062402476490559, 'samples': 8486016, 'steps': 44197, 'loss/train': 1.9403477907180786} -08/30/2021 21:06:49 - INFO - __main__ - Step 44199: {'lr': 0.00040623610487214366, 'samples': 8486208, 'steps': 44198, 'loss/train': 0.8868473172187805} -08/30/2021 21:06:49 - INFO - __main__ - Step 44200: {'lr': 0.0004062319620248338, 'samples': 8486400, 'steps': 44199, 'loss/train': 1.279229760169983} -08/30/2021 21:06:50 - INFO - __main__ - Step 44201: {'lr': 0.00040622781910712826, 'samples': 8486592, 'steps': 44200, 'loss/train': 1.4272246360778809} -08/30/2021 21:06:50 - INFO - __main__ - Step 44202: {'lr': 0.00040622367611902886, 'samples': 8486784, 'steps': 44201, 'loss/train': 1.5270839929580688} -08/30/2021 21:06:51 - INFO - __main__ - Step 44203: {'lr': 0.0004062195330605375, 'samples': 8486976, 'steps': 44202, 'loss/train': 1.258521318435669} -08/30/2021 21:06:52 - INFO - __main__ - Step 44204: {'lr': 0.000406215389931656, 'samples': 8487168, 'steps': 44203, 'loss/train': 1.3526769876480103} -08/30/2021 21:06:52 - INFO - __main__ - Step 44205: {'lr': 0.0004062112467323863, 'samples': 8487360, 'steps': 44204, 'loss/train': 1.6489837169647217} -08/30/2021 21:06:53 - INFO - __main__ - Step 44206: {'lr': 0.00040620710346273015, 'samples': 8487552, 'steps': 44205, 'loss/train': 1.5647201538085938} -08/30/2021 21:06:53 - INFO - __main__ - Step 44207: {'lr': 0.00040620296012268956, 'samples': 8487744, 'steps': 44206, 'loss/train': 1.396378993988037} -08/30/2021 21:06:54 - INFO - __main__ - Step 44208: {'lr': 0.0004061988167122663, 'samples': 8487936, 'steps': 44207, 'loss/train': 1.0479145050048828} -08/30/2021 21:06:55 - INFO - __main__ - Step 44209: {'lr': 0.00040619467323146224, 'samples': 8488128, 'steps': 44208, 'loss/train': 1.0903661251068115} -08/30/2021 21:06:55 - INFO - __main__ - Step 44210: {'lr': 0.0004061905296802793, 'samples': 8488320, 'steps': 44209, 'loss/train': 1.6131728887557983} -08/30/2021 21:06:55 - INFO - __main__ - Step 44211: {'lr': 0.00040618638605871934, 'samples': 8488512, 'steps': 44210, 'loss/train': 1.4721304178237915} -08/30/2021 21:06:56 - INFO - __main__ - Step 44212: {'lr': 0.00040618224236678413, 'samples': 8488704, 'steps': 44211, 'loss/train': 1.6304879188537598} -08/30/2021 21:06:57 - INFO - __main__ - Step 44213: {'lr': 0.00040617809860447564, 'samples': 8488896, 'steps': 44212, 'loss/train': 0.9545351266860962} -08/30/2021 21:06:58 - INFO - __main__ - Step 44214: {'lr': 0.00040617395477179577, 'samples': 8489088, 'steps': 44213, 'loss/train': 1.9828261137008667} -08/30/2021 21:06:58 - INFO - __main__ - Step 44215: {'lr': 0.0004061698108687463, 'samples': 8489280, 'steps': 44214, 'loss/train': 1.167463779449463} -08/30/2021 21:06:59 - INFO - __main__ - Step 44216: {'lr': 0.00040616566689532905, 'samples': 8489472, 'steps': 44215, 'loss/train': 1.4615789651870728} -08/30/2021 21:06:59 - INFO - __main__ - Step 44217: {'lr': 0.00040616152285154607, 'samples': 8489664, 'steps': 44216, 'loss/train': 0.8346847295761108} -08/30/2021 21:07:00 - INFO - __main__ - Step 44218: {'lr': 0.000406157378737399, 'samples': 8489856, 'steps': 44217, 'loss/train': 0.7510921359062195} -08/30/2021 21:07:01 - INFO - __main__ - Step 44219: {'lr': 0.0004061532345528899, 'samples': 8490048, 'steps': 44218, 'loss/train': 1.3765695095062256} -08/30/2021 21:07:01 - INFO - __main__ - Step 44220: {'lr': 0.00040614909029802054, 'samples': 8490240, 'steps': 44219, 'loss/train': 0.6475852727890015} -08/30/2021 21:07:02 - INFO - __main__ - Step 44221: {'lr': 0.0004061449459727928, 'samples': 8490432, 'steps': 44220, 'loss/train': 1.4275166988372803} -08/30/2021 21:07:02 - INFO - __main__ - Step 44222: {'lr': 0.0004061408015772086, 'samples': 8490624, 'steps': 44221, 'loss/train': 1.222055196762085} -08/30/2021 21:07:02 - INFO - __main__ - Step 44223: {'lr': 0.0004061366571112698, 'samples': 8490816, 'steps': 44222, 'loss/train': 1.6360888481140137} -08/30/2021 21:07:04 - INFO - __main__ - Step 44224: {'lr': 0.0004061325125749781, 'samples': 8491008, 'steps': 44223, 'loss/train': 1.2136449813842773} -08/30/2021 21:07:05 - INFO - __main__ - Step 44225: {'lr': 0.00040612836796833556, 'samples': 8491200, 'steps': 44224, 'loss/train': 1.289175033569336} -08/30/2021 21:07:05 - INFO - __main__ - Step 44226: {'lr': 0.000406124223291344, 'samples': 8491392, 'steps': 44225, 'loss/train': 1.1006243228912354} -08/30/2021 21:07:06 - INFO - __main__ - Step 44227: {'lr': 0.0004061200785440052, 'samples': 8491584, 'steps': 44226, 'loss/train': 1.8398195505142212} -08/30/2021 21:07:06 - INFO - __main__ - Step 44228: {'lr': 0.0004061159337263213, 'samples': 8491776, 'steps': 44227, 'loss/train': 1.19362211227417} -08/30/2021 21:07:07 - INFO - __main__ - Step 44229: {'lr': 0.0004061117888382938, 'samples': 8491968, 'steps': 44228, 'loss/train': 1.4343485832214355} -08/30/2021 21:07:08 - INFO - __main__ - Step 44230: {'lr': 0.00040610764387992475, 'samples': 8492160, 'steps': 44229, 'loss/train': 1.6166287660598755} -08/30/2021 21:07:08 - INFO - __main__ - Step 44231: {'lr': 0.0004061034988512161, 'samples': 8492352, 'steps': 44230, 'loss/train': 1.3016630411148071} -08/30/2021 21:07:09 - INFO - __main__ - Step 44232: {'lr': 0.0004060993537521695, 'samples': 8492544, 'steps': 44231, 'loss/train': 1.1095161437988281} -08/30/2021 21:07:09 - INFO - __main__ - Step 44233: {'lr': 0.00040609520858278704, 'samples': 8492736, 'steps': 44232, 'loss/train': 1.3086873292922974} -08/30/2021 21:07:10 - INFO - __main__ - Step 44234: {'lr': 0.0004060910633430704, 'samples': 8492928, 'steps': 44233, 'loss/train': 1.9117945432662964} -08/30/2021 21:07:11 - INFO - __main__ - Step 44235: {'lr': 0.0004060869180330216, 'samples': 8493120, 'steps': 44234, 'loss/train': 1.2222625017166138} -08/30/2021 21:07:11 - INFO - __main__ - Step 44236: {'lr': 0.00040608277265264243, 'samples': 8493312, 'steps': 44235, 'loss/train': 1.3907073736190796} -08/30/2021 21:07:12 - INFO - __main__ - Step 44237: {'lr': 0.0004060786272019348, 'samples': 8493504, 'steps': 44236, 'loss/train': 1.9474618434906006} -08/30/2021 21:07:12 - INFO - __main__ - Step 44238: {'lr': 0.00040607448168090044, 'samples': 8493696, 'steps': 44237, 'loss/train': 1.4182382822036743} -08/30/2021 21:07:14 - INFO - __main__ - Step 44239: {'lr': 0.00040607033608954136, 'samples': 8493888, 'steps': 44238, 'loss/train': 0.38596755266189575} -08/30/2021 21:07:14 - INFO - __main__ - Step 44240: {'lr': 0.0004060661904278595, 'samples': 8494080, 'steps': 44239, 'loss/train': 1.5403029918670654} -08/30/2021 21:07:14 - INFO - __main__ - Step 44241: {'lr': 0.0004060620446958565, 'samples': 8494272, 'steps': 44240, 'loss/train': 1.410273790359497} -08/30/2021 21:07:15 - INFO - __main__ - Step 44242: {'lr': 0.00040605789889353445, 'samples': 8494464, 'steps': 44241, 'loss/train': 1.7102348804473877} -08/30/2021 21:07:15 - INFO - __main__ - Step 44243: {'lr': 0.00040605375302089507, 'samples': 8494656, 'steps': 44242, 'loss/train': 1.4443905353546143} -08/30/2021 21:07:16 - INFO - __main__ - Step 44244: {'lr': 0.00040604960707794023, 'samples': 8494848, 'steps': 44243, 'loss/train': 1.3313616514205933} -08/30/2021 21:07:17 - INFO - __main__ - Step 44245: {'lr': 0.00040604546106467196, 'samples': 8495040, 'steps': 44244, 'loss/train': 1.096571445465088} -08/30/2021 21:07:17 - INFO - __main__ - Step 44246: {'lr': 0.00040604131498109193, 'samples': 8495232, 'steps': 44245, 'loss/train': 1.005394458770752} -08/30/2021 21:07:18 - INFO - __main__ - Step 44247: {'lr': 0.0004060371688272021, 'samples': 8495424, 'steps': 44246, 'loss/train': 1.7249945402145386} -08/30/2021 21:07:18 - INFO - __main__ - Step 44248: {'lr': 0.00040603302260300435, 'samples': 8495616, 'steps': 44247, 'loss/train': 1.425903081893921} -08/30/2021 21:07:18 - INFO - __main__ - Step 44249: {'lr': 0.00040602887630850055, 'samples': 8495808, 'steps': 44248, 'loss/train': 1.4206792116165161} -08/30/2021 21:07:20 - INFO - __main__ - Step 44250: {'lr': 0.0004060247299436925, 'samples': 8496000, 'steps': 44249, 'loss/train': 1.3775831460952759} -08/30/2021 21:07:20 - INFO - __main__ - Step 44251: {'lr': 0.0004060205835085821, 'samples': 8496192, 'steps': 44250, 'loss/train': 1.731313705444336} -08/30/2021 21:07:21 - INFO - __main__ - Step 44252: {'lr': 0.00040601643700317126, 'samples': 8496384, 'steps': 44251, 'loss/train': 1.2964200973510742} -08/30/2021 21:07:21 - INFO - __main__ - Step 44253: {'lr': 0.0004060122904274618, 'samples': 8496576, 'steps': 44252, 'loss/train': 1.4697345495224} -08/30/2021 21:07:21 - INFO - __main__ - Step 44254: {'lr': 0.0004060081437814557, 'samples': 8496768, 'steps': 44253, 'loss/train': 1.290294885635376} -08/30/2021 21:07:23 - INFO - __main__ - Step 44255: {'lr': 0.00040600399706515466, 'samples': 8496960, 'steps': 44254, 'loss/train': 1.2453558444976807} -08/30/2021 21:07:23 - INFO - __main__ - Step 44256: {'lr': 0.0004059998502785606, 'samples': 8497152, 'steps': 44255, 'loss/train': 0.8972698450088501} -08/30/2021 21:07:24 - INFO - __main__ - Step 44257: {'lr': 0.0004059957034216755, 'samples': 8497344, 'steps': 44256, 'loss/train': 1.6260112524032593} -08/30/2021 21:07:24 - INFO - __main__ - Step 44258: {'lr': 0.00040599155649450106, 'samples': 8497536, 'steps': 44257, 'loss/train': 1.6431219577789307} -08/30/2021 21:07:24 - INFO - __main__ - Step 44259: {'lr': 0.00040598740949703927, 'samples': 8497728, 'steps': 44258, 'loss/train': 1.289858341217041} -08/30/2021 21:07:26 - INFO - __main__ - Step 44260: {'lr': 0.00040598326242929195, 'samples': 8497920, 'steps': 44259, 'loss/train': 1.2255562543869019} -08/30/2021 21:07:26 - INFO - __main__ - Step 44261: {'lr': 0.00040597911529126096, 'samples': 8498112, 'steps': 44260, 'loss/train': 1.1856263875961304} -08/30/2021 21:07:27 - INFO - __main__ - Step 44262: {'lr': 0.00040597496808294825, 'samples': 8498304, 'steps': 44261, 'loss/train': 1.9981262683868408} -08/30/2021 21:07:27 - INFO - __main__ - Step 44263: {'lr': 0.0004059708208043556, 'samples': 8498496, 'steps': 44262, 'loss/train': 1.3707419633865356} -08/30/2021 21:07:27 - INFO - __main__ - Step 44264: {'lr': 0.00040596667345548486, 'samples': 8498688, 'steps': 44263, 'loss/train': 0.8817673921585083} -08/30/2021 21:07:29 - INFO - __main__ - Step 44265: {'lr': 0.00040596252603633797, 'samples': 8498880, 'steps': 44264, 'loss/train': 0.9865076541900635} -08/30/2021 21:07:30 - INFO - __main__ - Step 44266: {'lr': 0.0004059583785469168, 'samples': 8499072, 'steps': 44265, 'loss/train': 1.5346657037734985} -08/30/2021 21:07:30 - INFO - __main__ - Step 44267: {'lr': 0.00040595423098722315, 'samples': 8499264, 'steps': 44266, 'loss/train': 0.6381934881210327} -08/30/2021 21:07:30 - INFO - __main__ - Step 44268: {'lr': 0.000405950083357259, 'samples': 8499456, 'steps': 44267, 'loss/train': 0.1051681861281395} -08/30/2021 21:07:31 - INFO - __main__ - Step 44269: {'lr': 0.0004059459356570261, 'samples': 8499648, 'steps': 44268, 'loss/train': 1.7870903015136719} -08/30/2021 21:07:32 - INFO - __main__ - Step 44270: {'lr': 0.00040594178788652636, 'samples': 8499840, 'steps': 44269, 'loss/train': 1.3645126819610596} -08/30/2021 21:07:33 - INFO - __main__ - Step 44271: {'lr': 0.00040593764004576166, 'samples': 8500032, 'steps': 44270, 'loss/train': 0.8432281613349915} -08/30/2021 21:07:33 - INFO - __main__ - Step 44272: {'lr': 0.0004059334921347339, 'samples': 8500224, 'steps': 44271, 'loss/train': 1.7896136045455933} -08/30/2021 21:07:33 - INFO - __main__ - Step 44273: {'lr': 0.00040592934415344486, 'samples': 8500416, 'steps': 44272, 'loss/train': 1.0209556818008423} -08/30/2021 21:07:34 - INFO - __main__ - Step 44274: {'lr': 0.0004059251961018965, 'samples': 8500608, 'steps': 44273, 'loss/train': 1.3701362609863281} -08/30/2021 21:07:35 - INFO - __main__ - Step 44275: {'lr': 0.00040592104798009066, 'samples': 8500800, 'steps': 44274, 'loss/train': 0.9669306874275208} -08/30/2021 21:07:36 - INFO - __main__ - Step 44276: {'lr': 0.00040591689978802917, 'samples': 8500992, 'steps': 44275, 'loss/train': 1.9835619926452637} -08/30/2021 21:07:36 - INFO - __main__ - Step 44277: {'lr': 0.0004059127515257139, 'samples': 8501184, 'steps': 44276, 'loss/train': 1.2374932765960693} -08/30/2021 21:07:36 - INFO - __main__ - Step 44278: {'lr': 0.0004059086031931468, 'samples': 8501376, 'steps': 44277, 'loss/train': 1.4289745092391968} -08/30/2021 21:07:37 - INFO - __main__ - Step 44279: {'lr': 0.00040590445479032965, 'samples': 8501568, 'steps': 44278, 'loss/train': 0.5289366841316223} -08/30/2021 21:07:39 - INFO - __main__ - Step 44280: {'lr': 0.0004059003063172644, 'samples': 8501760, 'steps': 44279, 'loss/train': 2.079277753829956} -08/30/2021 21:07:39 - INFO - __main__ - Step 44281: {'lr': 0.0004058961577739529, 'samples': 8501952, 'steps': 44280, 'loss/train': 1.273216724395752} -08/30/2021 21:07:40 - INFO - __main__ - Step 44282: {'lr': 0.00040589200916039703, 'samples': 8502144, 'steps': 44281, 'loss/train': 1.8912079334259033} -08/30/2021 21:07:40 - INFO - __main__ - Step 44283: {'lr': 0.0004058878604765985, 'samples': 8502336, 'steps': 44282, 'loss/train': 1.608237862586975} -08/30/2021 21:07:40 - INFO - __main__ - Step 44284: {'lr': 0.00040588371172255936, 'samples': 8502528, 'steps': 44283, 'loss/train': 1.7200936079025269} -08/30/2021 21:07:42 - INFO - __main__ - Step 44285: {'lr': 0.0004058795628982814, 'samples': 8502720, 'steps': 44284, 'loss/train': 1.2227617502212524} -08/30/2021 21:07:42 - INFO - __main__ - Step 44286: {'lr': 0.0004058754140037666, 'samples': 8502912, 'steps': 44285, 'loss/train': 1.2834556102752686} -08/30/2021 21:07:43 - INFO - __main__ - Step 44287: {'lr': 0.00040587126503901664, 'samples': 8503104, 'steps': 44286, 'loss/train': 1.5086218118667603} -08/30/2021 21:07:43 - INFO - __main__ - Step 44288: {'lr': 0.0004058671160040336, 'samples': 8503296, 'steps': 44287, 'loss/train': 1.3518232107162476} -08/30/2021 21:07:43 - INFO - __main__ - Step 44289: {'lr': 0.0004058629668988192, 'samples': 8503488, 'steps': 44288, 'loss/train': 1.1476361751556396} -08/30/2021 21:07:45 - INFO - __main__ - Step 44290: {'lr': 0.0004058588177233753, 'samples': 8503680, 'steps': 44289, 'loss/train': 1.532558560371399} -08/30/2021 21:07:45 - INFO - __main__ - Step 44291: {'lr': 0.0004058546684777039, 'samples': 8503872, 'steps': 44290, 'loss/train': 0.211063951253891} -08/30/2021 21:07:46 - INFO - __main__ - Step 44292: {'lr': 0.0004058505191618067, 'samples': 8504064, 'steps': 44291, 'loss/train': 1.150338053703308} -08/30/2021 21:07:46 - INFO - __main__ - Step 44293: {'lr': 0.00040584636977568573, 'samples': 8504256, 'steps': 44292, 'loss/train': 0.8358545303344727} -08/30/2021 21:07:46 - INFO - __main__ - Step 44294: {'lr': 0.0004058422203193428, 'samples': 8504448, 'steps': 44293, 'loss/train': 0.9335961937904358} -08/30/2021 21:07:48 - INFO - __main__ - Step 44295: {'lr': 0.0004058380707927798, 'samples': 8504640, 'steps': 44294, 'loss/train': 1.069401741027832} -08/30/2021 21:07:48 - INFO - __main__ - Step 44296: {'lr': 0.00040583392119599847, 'samples': 8504832, 'steps': 44295, 'loss/train': 1.6561537981033325} -08/30/2021 21:07:49 - INFO - __main__ - Step 44297: {'lr': 0.0004058297715290008, 'samples': 8505024, 'steps': 44296, 'loss/train': 1.3577299118041992} -08/30/2021 21:07:49 - INFO - __main__ - Step 44298: {'lr': 0.00040582562179178864, 'samples': 8505216, 'steps': 44297, 'loss/train': 1.6764581203460693} -08/30/2021 21:07:49 - INFO - __main__ - Step 44299: {'lr': 0.0004058214719843639, 'samples': 8505408, 'steps': 44298, 'loss/train': 1.693547010421753} -08/30/2021 21:07:51 - INFO - __main__ - Step 44300: {'lr': 0.0004058173221067284, 'samples': 8505600, 'steps': 44299, 'loss/train': 1.5342638492584229} -08/30/2021 21:07:52 - INFO - __main__ - Step 44301: {'lr': 0.00040581317215888403, 'samples': 8505792, 'steps': 44300, 'loss/train': 1.0842876434326172} -08/30/2021 21:07:52 - INFO - __main__ - Step 44302: {'lr': 0.0004058090221408326, 'samples': 8505984, 'steps': 44301, 'loss/train': 0.6397159695625305} -08/30/2021 21:07:52 - INFO - __main__ - Step 44303: {'lr': 0.0004058048720525761, 'samples': 8506176, 'steps': 44302, 'loss/train': 0.8952687382698059} -08/30/2021 21:07:53 - INFO - __main__ - Step 44304: {'lr': 0.00040580072189411626, 'samples': 8506368, 'steps': 44303, 'loss/train': 1.2569971084594727} -08/30/2021 21:07:53 - INFO - __main__ - Step 44305: {'lr': 0.00040579657166545503, 'samples': 8506560, 'steps': 44304, 'loss/train': 1.7909328937530518} -08/30/2021 21:07:55 - INFO - __main__ - Step 44306: {'lr': 0.0004057924213665943, 'samples': 8506752, 'steps': 44305, 'loss/train': 0.21140064299106598} -08/30/2021 21:07:55 - INFO - __main__ - Step 44307: {'lr': 0.0004057882709975359, 'samples': 8506944, 'steps': 44306, 'loss/train': 1.1904557943344116} -08/30/2021 21:07:55 - INFO - __main__ - Step 44308: {'lr': 0.0004057841205582817, 'samples': 8507136, 'steps': 44307, 'loss/train': 1.4542088508605957} -08/30/2021 21:07:56 - INFO - __main__ - Step 44309: {'lr': 0.0004057799700488336, 'samples': 8507328, 'steps': 44308, 'loss/train': 1.513412594795227} -08/30/2021 21:07:56 - INFO - __main__ - Step 44310: {'lr': 0.0004057758194691934, 'samples': 8507520, 'steps': 44309, 'loss/train': 1.5556021928787231} -08/30/2021 21:07:57 - INFO - __main__ - Step 44311: {'lr': 0.00040577166881936304, 'samples': 8507712, 'steps': 44310, 'loss/train': 1.3197760581970215} -08/30/2021 21:07:58 - INFO - __main__ - Step 44312: {'lr': 0.0004057675180993444, 'samples': 8507904, 'steps': 44311, 'loss/train': 0.688572347164154} -08/30/2021 21:07:58 - INFO - __main__ - Step 44313: {'lr': 0.00040576336730913933, 'samples': 8508096, 'steps': 44312, 'loss/train': 0.686278760433197} -08/30/2021 21:07:59 - INFO - __main__ - Step 44314: {'lr': 0.00040575921644874966, 'samples': 8508288, 'steps': 44313, 'loss/train': 1.106673240661621} -08/30/2021 21:07:59 - INFO - __main__ - Step 44315: {'lr': 0.00040575506551817725, 'samples': 8508480, 'steps': 44314, 'loss/train': 1.3167310953140259} -08/30/2021 21:08:00 - INFO - __main__ - Step 44316: {'lr': 0.00040575091451742405, 'samples': 8508672, 'steps': 44315, 'loss/train': 1.2857811450958252} -08/30/2021 21:08:01 - INFO - __main__ - Step 44317: {'lr': 0.0004057467634464919, 'samples': 8508864, 'steps': 44316, 'loss/train': 1.5763572454452515} -08/30/2021 21:08:01 - INFO - __main__ - Step 44318: {'lr': 0.00040574261230538267, 'samples': 8509056, 'steps': 44317, 'loss/train': 1.7079591751098633} -08/30/2021 21:08:02 - INFO - __main__ - Step 44319: {'lr': 0.0004057384610940982, 'samples': 8509248, 'steps': 44318, 'loss/train': 1.7545469999313354} -08/30/2021 21:08:02 - INFO - __main__ - Step 44320: {'lr': 0.0004057343098126404, 'samples': 8509440, 'steps': 44319, 'loss/train': 1.6263655424118042} -08/30/2021 21:08:04 - INFO - __main__ - Step 44321: {'lr': 0.0004057301584610111, 'samples': 8509632, 'steps': 44320, 'loss/train': 2.9451348781585693} -08/30/2021 21:08:04 - INFO - __main__ - Step 44322: {'lr': 0.00040572600703921223, 'samples': 8509824, 'steps': 44321, 'loss/train': 1.6663204431533813} -08/30/2021 21:08:04 - INFO - __main__ - Step 44323: {'lr': 0.0004057218555472456, 'samples': 8510016, 'steps': 44322, 'loss/train': 1.0474318265914917} -08/30/2021 21:08:05 - INFO - __main__ - Step 44324: {'lr': 0.0004057177039851131, 'samples': 8510208, 'steps': 44323, 'loss/train': 0.9182167053222656} -08/30/2021 21:08:05 - INFO - __main__ - Step 44325: {'lr': 0.00040571355235281657, 'samples': 8510400, 'steps': 44324, 'loss/train': 1.3504478931427002} -08/30/2021 21:08:06 - INFO - __main__ - Step 44326: {'lr': 0.00040570940065035797, 'samples': 8510592, 'steps': 44325, 'loss/train': 0.0857388824224472} -08/30/2021 21:08:07 - INFO - __main__ - Step 44327: {'lr': 0.0004057052488777392, 'samples': 8510784, 'steps': 44326, 'loss/train': 1.8662266731262207} -08/30/2021 21:08:08 - INFO - __main__ - Step 44328: {'lr': 0.0004057010970349619, 'samples': 8510976, 'steps': 44327, 'loss/train': 1.5167348384857178} -08/30/2021 21:08:08 - INFO - __main__ - Step 44329: {'lr': 0.00040569694512202815, 'samples': 8511168, 'steps': 44328, 'loss/train': 0.7417482137680054} -08/30/2021 21:08:08 - INFO - __main__ - Step 44330: {'lr': 0.00040569279313893976, 'samples': 8511360, 'steps': 44329, 'loss/train': 1.1411490440368652} -08/30/2021 21:08:09 - INFO - __main__ - Step 44331: {'lr': 0.0004056886410856986, 'samples': 8511552, 'steps': 44330, 'loss/train': 1.4563403129577637} -08/30/2021 21:08:11 - INFO - __main__ - Step 44332: {'lr': 0.0004056844889623065, 'samples': 8511744, 'steps': 44331, 'loss/train': 0.6688815355300903} -08/30/2021 21:08:11 - INFO - __main__ - Step 44333: {'lr': 0.0004056803367687654, 'samples': 8511936, 'steps': 44332, 'loss/train': 2.130687952041626} -08/30/2021 21:08:11 - INFO - __main__ - Step 44334: {'lr': 0.0004056761845050772, 'samples': 8512128, 'steps': 44333, 'loss/train': 0.916379988193512} -08/30/2021 21:08:12 - INFO - __main__ - Step 44335: {'lr': 0.0004056720321712436, 'samples': 8512320, 'steps': 44334, 'loss/train': 2.310025930404663} -08/30/2021 21:08:12 - INFO - __main__ - Step 44336: {'lr': 0.00040566787976726665, 'samples': 8512512, 'steps': 44335, 'loss/train': 1.4363394975662231} -08/30/2021 21:08:14 - INFO - __main__ - Step 44337: {'lr': 0.00040566372729314813, 'samples': 8512704, 'steps': 44336, 'loss/train': 1.2332144975662231} -08/30/2021 21:08:14 - INFO - __main__ - Step 44338: {'lr': 0.00040565957474889, 'samples': 8512896, 'steps': 44337, 'loss/train': 1.513017177581787} -08/30/2021 21:08:14 - INFO - __main__ - Step 44339: {'lr': 0.000405655422134494, 'samples': 8513088, 'steps': 44338, 'loss/train': 1.5066421031951904} -08/30/2021 21:08:15 - INFO - __main__ - Step 44340: {'lr': 0.0004056512694499621, 'samples': 8513280, 'steps': 44339, 'loss/train': 1.3086494207382202} -08/30/2021 21:08:15 - INFO - __main__ - Step 44341: {'lr': 0.0004056471166952961, 'samples': 8513472, 'steps': 44340, 'loss/train': 1.198072910308838} -08/30/2021 21:08:17 - INFO - __main__ - Step 44342: {'lr': 0.0004056429638704979, 'samples': 8513664, 'steps': 44341, 'loss/train': 1.437775731086731} -08/30/2021 21:08:17 - INFO - __main__ - Step 44343: {'lr': 0.0004056388109755695, 'samples': 8513856, 'steps': 44342, 'loss/train': 0.780569851398468} -08/30/2021 21:08:18 - INFO - __main__ - Step 44344: {'lr': 0.0004056346580105126, 'samples': 8514048, 'steps': 44343, 'loss/train': 1.385893702507019} -08/30/2021 21:08:18 - INFO - __main__ - Step 44345: {'lr': 0.00040563050497532905, 'samples': 8514240, 'steps': 44344, 'loss/train': 1.0065590143203735} -08/30/2021 21:08:18 - INFO - __main__ - Step 44346: {'lr': 0.00040562635187002083, 'samples': 8514432, 'steps': 44345, 'loss/train': 1.6725244522094727} -08/30/2021 21:08:20 - INFO - __main__ - Step 44347: {'lr': 0.0004056221986945898, 'samples': 8514624, 'steps': 44346, 'loss/train': 1.7639890909194946} -08/30/2021 21:08:20 - INFO - __main__ - Step 44348: {'lr': 0.0004056180454490378, 'samples': 8514816, 'steps': 44347, 'loss/train': 1.2765198945999146} -08/30/2021 21:08:20 - INFO - __main__ - Step 44349: {'lr': 0.00040561389213336673, 'samples': 8515008, 'steps': 44348, 'loss/train': 1.6406426429748535} -08/30/2021 21:08:21 - INFO - __main__ - Step 44350: {'lr': 0.00040560973874757844, 'samples': 8515200, 'steps': 44349, 'loss/train': 1.497821569442749} -08/30/2021 21:08:21 - INFO - __main__ - Step 44351: {'lr': 0.0004056055852916748, 'samples': 8515392, 'steps': 44350, 'loss/train': 1.352238655090332} -08/30/2021 21:08:22 - INFO - __main__ - Step 44352: {'lr': 0.0004056014317656577, 'samples': 8515584, 'steps': 44351, 'loss/train': 0.9462263584136963} -08/30/2021 21:08:23 - INFO - __main__ - Step 44353: {'lr': 0.00040559727816952897, 'samples': 8515776, 'steps': 44352, 'loss/train': 0.90390944480896} -08/30/2021 21:08:23 - INFO - __main__ - Step 44354: {'lr': 0.0004055931245032904, 'samples': 8515968, 'steps': 44353, 'loss/train': 1.8002678155899048} -08/30/2021 21:08:24 - INFO - __main__ - Step 44355: {'lr': 0.0004055889707669441, 'samples': 8516160, 'steps': 44354, 'loss/train': 1.4575846195220947} -08/30/2021 21:08:24 - INFO - __main__ - Step 44356: {'lr': 0.0004055848169604919, 'samples': 8516352, 'steps': 44355, 'loss/train': 1.347817063331604} -08/30/2021 21:08:24 - INFO - __main__ - Step 44357: {'lr': 0.00040558066308393536, 'samples': 8516544, 'steps': 44356, 'loss/train': 1.2407376766204834} -08/30/2021 21:08:26 - INFO - __main__ - Step 44358: {'lr': 0.0004055765091372767, 'samples': 8516736, 'steps': 44357, 'loss/train': 1.603507161140442} -08/30/2021 21:08:26 - INFO - __main__ - Step 44359: {'lr': 0.0004055723551205177, 'samples': 8516928, 'steps': 44358, 'loss/train': 1.2168844938278198} -08/30/2021 21:08:27 - INFO - __main__ - Step 44360: {'lr': 0.0004055682010336601, 'samples': 8517120, 'steps': 44359, 'loss/train': 1.5627723932266235} -08/30/2021 21:08:27 - INFO - __main__ - Step 44361: {'lr': 0.0004055640468767059, 'samples': 8517312, 'steps': 44360, 'loss/train': 1.615235447883606} -08/30/2021 21:08:28 - INFO - __main__ - Step 44362: {'lr': 0.000405559892649657, 'samples': 8517504, 'steps': 44361, 'loss/train': 1.522583246231079} -08/30/2021 21:08:29 - INFO - __main__ - Step 44363: {'lr': 0.00040555573835251513, 'samples': 8517696, 'steps': 44362, 'loss/train': 1.4683529138565063} -08/30/2021 21:08:30 - INFO - __main__ - Step 44364: {'lr': 0.00040555158398528237, 'samples': 8517888, 'steps': 44363, 'loss/train': 1.1983929872512817} -08/30/2021 21:08:30 - INFO - __main__ - Step 44365: {'lr': 0.0004055474295479603, 'samples': 8518080, 'steps': 44364, 'loss/train': 1.5823521614074707} -08/30/2021 21:08:30 - INFO - __main__ - Step 44366: {'lr': 0.00040554327504055106, 'samples': 8518272, 'steps': 44365, 'loss/train': 1.7043169736862183} -08/30/2021 21:08:31 - INFO - __main__ - Step 44367: {'lr': 0.0004055391204630564, 'samples': 8518464, 'steps': 44366, 'loss/train': 1.4671788215637207} -08/30/2021 21:08:32 - INFO - __main__ - Step 44368: {'lr': 0.0004055349658154782, 'samples': 8518656, 'steps': 44367, 'loss/train': 0.8614078164100647} -08/30/2021 21:08:33 - INFO - __main__ - Step 44369: {'lr': 0.00040553081109781844, 'samples': 8518848, 'steps': 44368, 'loss/train': 1.3381456136703491} -08/30/2021 21:08:33 - INFO - __main__ - Step 44370: {'lr': 0.0004055266563100788, 'samples': 8519040, 'steps': 44369, 'loss/train': 1.3427907228469849} -08/30/2021 21:08:33 - INFO - __main__ - Step 44371: {'lr': 0.00040552250145226124, 'samples': 8519232, 'steps': 44370, 'loss/train': 1.5324828624725342} -08/30/2021 21:08:34 - INFO - __main__ - Step 44372: {'lr': 0.0004055183465243676, 'samples': 8519424, 'steps': 44371, 'loss/train': 1.672202706336975} -08/30/2021 21:08:35 - INFO - __main__ - Step 44373: {'lr': 0.0004055141915263999, 'samples': 8519616, 'steps': 44372, 'loss/train': 1.2652825117111206} -08/30/2021 21:08:36 - INFO - __main__ - Step 44374: {'lr': 0.0004055100364583598, 'samples': 8519808, 'steps': 44373, 'loss/train': 1.2054704427719116} -08/30/2021 21:08:36 - INFO - __main__ - Step 44375: {'lr': 0.0004055058813202493, 'samples': 8520000, 'steps': 44374, 'loss/train': 1.5328508615493774} -08/30/2021 21:08:36 - INFO - __main__ - Step 44376: {'lr': 0.0004055017261120704, 'samples': 8520192, 'steps': 44375, 'loss/train': 1.181402325630188} -08/30/2021 21:08:37 - INFO - __main__ - Step 44377: {'lr': 0.00040549757083382465, 'samples': 8520384, 'steps': 44376, 'loss/train': 0.12349032610654831} -08/30/2021 21:08:38 - INFO - __main__ - Step 44378: {'lr': 0.00040549341548551415, 'samples': 8520576, 'steps': 44377, 'loss/train': 1.0654141902923584} -08/30/2021 21:08:39 - INFO - __main__ - Step 44379: {'lr': 0.0004054892600671407, 'samples': 8520768, 'steps': 44378, 'loss/train': 1.143369197845459} -08/30/2021 21:08:39 - INFO - __main__ - Step 44380: {'lr': 0.00040548510457870623, 'samples': 8520960, 'steps': 44379, 'loss/train': 0.18210400640964508} -08/30/2021 21:08:40 - INFO - __main__ - Step 44381: {'lr': 0.00040548094902021257, 'samples': 8521152, 'steps': 44380, 'loss/train': 0.9839759469032288} -08/30/2021 21:08:40 - INFO - __main__ - Step 44382: {'lr': 0.00040547679339166155, 'samples': 8521344, 'steps': 44381, 'loss/train': 1.4647890329360962} -08/30/2021 21:08:42 - INFO - __main__ - Step 44383: {'lr': 0.0004054726376930551, 'samples': 8521536, 'steps': 44382, 'loss/train': 1.3601447343826294} -08/30/2021 21:08:42 - INFO - __main__ - Step 44384: {'lr': 0.0004054684819243951, 'samples': 8521728, 'steps': 44383, 'loss/train': 1.464267611503601} -08/30/2021 21:08:42 - INFO - __main__ - Step 44385: {'lr': 0.0004054643260856834, 'samples': 8521920, 'steps': 44384, 'loss/train': 1.268541693687439} -08/30/2021 21:08:43 - INFO - __main__ - Step 44386: {'lr': 0.00040546017017692183, 'samples': 8522112, 'steps': 44385, 'loss/train': 0.5542771220207214} -08/30/2021 21:08:43 - INFO - __main__ - Step 44387: {'lr': 0.00040545601419811236, 'samples': 8522304, 'steps': 44386, 'loss/train': 0.6981580853462219} -08/30/2021 21:08:43 - INFO - __main__ - Step 44388: {'lr': 0.00040545185814925676, 'samples': 8522496, 'steps': 44387, 'loss/train': 0.9781181812286377} -08/30/2021 21:08:46 - INFO - __main__ - Step 44389: {'lr': 0.00040544770203035705, 'samples': 8522688, 'steps': 44388, 'loss/train': 1.3792634010314941} -08/30/2021 21:08:46 - INFO - __main__ - Step 44390: {'lr': 0.0004054435458414149, 'samples': 8522880, 'steps': 44389, 'loss/train': 1.5857902765274048} -08/30/2021 21:08:46 - INFO - __main__ - Step 44391: {'lr': 0.0004054393895824323, 'samples': 8523072, 'steps': 44390, 'loss/train': 1.8444561958312988} -08/30/2021 21:08:47 - INFO - __main__ - Step 44392: {'lr': 0.00040543523325341116, 'samples': 8523264, 'steps': 44391, 'loss/train': 1.0472975969314575} -08/30/2021 21:08:47 - INFO - __main__ - Step 44393: {'lr': 0.0004054310768543532, 'samples': 8523456, 'steps': 44392, 'loss/train': 0.889835000038147} -08/30/2021 21:08:49 - INFO - __main__ - Step 44394: {'lr': 0.00040542692038526054, 'samples': 8523648, 'steps': 44393, 'loss/train': 1.0555006265640259} -08/30/2021 21:08:49 - INFO - __main__ - Step 44395: {'lr': 0.0004054227638461348, 'samples': 8523840, 'steps': 44394, 'loss/train': 1.0273945331573486} -08/30/2021 21:08:49 - INFO - __main__ - Step 44396: {'lr': 0.000405418607236978, 'samples': 8524032, 'steps': 44395, 'loss/train': 1.463208794593811} -08/30/2021 21:08:50 - INFO - __main__ - Step 44397: {'lr': 0.00040541445055779197, 'samples': 8524224, 'steps': 44396, 'loss/train': 1.6251517534255981} -08/30/2021 21:08:50 - INFO - __main__ - Step 44398: {'lr': 0.0004054102938085786, 'samples': 8524416, 'steps': 44397, 'loss/train': 1.1361525058746338} -08/30/2021 21:08:52 - INFO - __main__ - Step 44399: {'lr': 0.0004054061369893397, 'samples': 8524608, 'steps': 44398, 'loss/train': 1.5430678129196167} -08/30/2021 21:08:52 - INFO - __main__ - Step 44400: {'lr': 0.0004054019801000772, 'samples': 8524800, 'steps': 44399, 'loss/train': 1.450382947921753} -08/30/2021 21:08:52 - INFO - __main__ - Step 44401: {'lr': 0.00040539782314079304, 'samples': 8524992, 'steps': 44400, 'loss/train': 1.108041763305664} -08/30/2021 21:08:53 - INFO - __main__ - Step 44402: {'lr': 0.000405393666111489, 'samples': 8525184, 'steps': 44401, 'loss/train': 1.10700523853302} -08/30/2021 21:08:53 - INFO - __main__ - Step 44403: {'lr': 0.0004053895090121669, 'samples': 8525376, 'steps': 44402, 'loss/train': 1.555692434310913} -08/30/2021 21:08:55 - INFO - __main__ - Step 44404: {'lr': 0.00040538535184282877, 'samples': 8525568, 'steps': 44403, 'loss/train': 1.4380104541778564} -08/30/2021 21:08:55 - INFO - __main__ - Step 44405: {'lr': 0.00040538119460347636, 'samples': 8525760, 'steps': 44404, 'loss/train': 0.3123876452445984} -08/30/2021 21:08:56 - INFO - __main__ - Step 44406: {'lr': 0.0004053770372941116, 'samples': 8525952, 'steps': 44405, 'loss/train': 1.4943342208862305} -08/30/2021 21:08:56 - INFO - __main__ - Step 44407: {'lr': 0.00040537287991473627, 'samples': 8526144, 'steps': 44406, 'loss/train': 1.6229242086410522} -08/30/2021 21:08:56 - INFO - __main__ - Step 44408: {'lr': 0.0004053687224653524, 'samples': 8526336, 'steps': 44407, 'loss/train': 1.8058867454528809} -08/30/2021 21:08:57 - INFO - __main__ - Step 44409: {'lr': 0.0004053645649459617, 'samples': 8526528, 'steps': 44408, 'loss/train': 1.1329448223114014} -08/30/2021 21:08:58 - INFO - __main__ - Step 44410: {'lr': 0.0004053604073565662, 'samples': 8526720, 'steps': 44409, 'loss/train': 1.3405773639678955} -08/30/2021 21:08:59 - INFO - __main__ - Step 44411: {'lr': 0.0004053562496971677, 'samples': 8526912, 'steps': 44410, 'loss/train': 1.1856756210327148} -08/30/2021 21:08:59 - INFO - __main__ - Step 44412: {'lr': 0.00040535209196776803, 'samples': 8527104, 'steps': 44411, 'loss/train': 0.09055878221988678} -08/30/2021 21:08:59 - INFO - __main__ - Step 44413: {'lr': 0.00040534793416836915, 'samples': 8527296, 'steps': 44412, 'loss/train': 0.9902360439300537} -08/30/2021 21:09:00 - INFO - __main__ - Step 44414: {'lr': 0.00040534377629897276, 'samples': 8527488, 'steps': 44413, 'loss/train': 0.7650054097175598} -08/30/2021 21:09:01 - INFO - __main__ - Step 44415: {'lr': 0.000405339618359581, 'samples': 8527680, 'steps': 44414, 'loss/train': 0.4365941882133484} -08/30/2021 21:09:02 - INFO - __main__ - Step 44416: {'lr': 0.0004053354603501956, 'samples': 8527872, 'steps': 44415, 'loss/train': 1.9157416820526123} -08/30/2021 21:09:02 - INFO - __main__ - Step 44417: {'lr': 0.0004053313022708184, 'samples': 8528064, 'steps': 44416, 'loss/train': 1.7101826667785645} -08/30/2021 21:09:02 - INFO - __main__ - Step 44418: {'lr': 0.00040532714412145135, 'samples': 8528256, 'steps': 44417, 'loss/train': 1.0287338495254517} -08/30/2021 21:09:03 - INFO - __main__ - Step 44419: {'lr': 0.0004053229859020962, 'samples': 8528448, 'steps': 44418, 'loss/train': 1.6128599643707275} -08/30/2021 21:09:05 - INFO - __main__ - Step 44420: {'lr': 0.00040531882761275496, 'samples': 8528640, 'steps': 44419, 'loss/train': 1.497105360031128} -08/30/2021 21:09:05 - INFO - __main__ - Step 44421: {'lr': 0.00040531466925342947, 'samples': 8528832, 'steps': 44420, 'loss/train': 0.8967697024345398} -08/30/2021 21:09:05 - INFO - __main__ - Step 44422: {'lr': 0.0004053105108241216, 'samples': 8529024, 'steps': 44421, 'loss/train': 1.6246263980865479} -08/30/2021 21:09:06 - INFO - __main__ - Step 44423: {'lr': 0.0004053063523248331, 'samples': 8529216, 'steps': 44422, 'loss/train': 1.360418438911438} -08/30/2021 21:09:06 - INFO - __main__ - Step 44424: {'lr': 0.0004053021937555661, 'samples': 8529408, 'steps': 44423, 'loss/train': 1.585578203201294} -08/30/2021 21:09:07 - INFO - __main__ - Step 44425: {'lr': 0.00040529803511632224, 'samples': 8529600, 'steps': 44424, 'loss/train': 1.7599161863327026} -08/30/2021 21:09:08 - INFO - __main__ - Step 44426: {'lr': 0.0004052938764071035, 'samples': 8529792, 'steps': 44425, 'loss/train': 1.6455732583999634} -08/30/2021 21:09:08 - INFO - __main__ - Step 44427: {'lr': 0.00040528971762791177, 'samples': 8529984, 'steps': 44426, 'loss/train': 1.3100522756576538} -08/30/2021 21:09:08 - INFO - __main__ - Step 44428: {'lr': 0.0004052855587787488, 'samples': 8530176, 'steps': 44427, 'loss/train': 1.5594284534454346} -08/30/2021 21:09:09 - INFO - __main__ - Step 44429: {'lr': 0.0004052813998596167, 'samples': 8530368, 'steps': 44428, 'loss/train': 1.7124489545822144} -08/30/2021 21:09:10 - INFO - __main__ - Step 44430: {'lr': 0.0004052772408705171, 'samples': 8530560, 'steps': 44429, 'loss/train': 1.6920275688171387} -08/30/2021 21:09:11 - INFO - __main__ - Step 44431: {'lr': 0.000405273081811452, 'samples': 8530752, 'steps': 44430, 'loss/train': 1.4410616159439087} -08/30/2021 21:09:11 - INFO - __main__ - Step 44432: {'lr': 0.0004052689226824232, 'samples': 8530944, 'steps': 44431, 'loss/train': 1.5302947759628296} -08/30/2021 21:09:12 - INFO - __main__ - Step 44433: {'lr': 0.0004052647634834327, 'samples': 8531136, 'steps': 44432, 'loss/train': 1.1068027019500732} -08/30/2021 21:09:12 - INFO - __main__ - Step 44434: {'lr': 0.00040526060421448216, 'samples': 8531328, 'steps': 44433, 'loss/train': 1.0758174657821655} -08/30/2021 21:09:14 - INFO - __main__ - Step 44435: {'lr': 0.00040525644487557366, 'samples': 8531520, 'steps': 44434, 'loss/train': 2.474747896194458} -08/30/2021 21:09:14 - INFO - __main__ - Step 44436: {'lr': 0.000405252285466709, 'samples': 8531712, 'steps': 44435, 'loss/train': 1.5391771793365479} -08/30/2021 21:09:15 - INFO - __main__ - Step 44437: {'lr': 0.0004052481259878901, 'samples': 8531904, 'steps': 44436, 'loss/train': 1.489598274230957} -08/30/2021 21:09:15 - INFO - __main__ - Step 44438: {'lr': 0.00040524396643911874, 'samples': 8532096, 'steps': 44437, 'loss/train': 1.71968674659729} -08/30/2021 21:09:15 - INFO - __main__ - Step 44439: {'lr': 0.00040523980682039684, 'samples': 8532288, 'steps': 44438, 'loss/train': 0.9684491157531738} -08/30/2021 21:09:16 - INFO - __main__ - Step 44440: {'lr': 0.00040523564713172634, 'samples': 8532480, 'steps': 44439, 'loss/train': 0.7825356721878052} -08/30/2021 21:09:18 - INFO - __main__ - Step 44441: {'lr': 0.000405231487373109, 'samples': 8532672, 'steps': 44440, 'loss/train': 1.4384033679962158} -08/30/2021 21:09:18 - INFO - __main__ - Step 44442: {'lr': 0.00040522732754454674, 'samples': 8532864, 'steps': 44441, 'loss/train': 1.5658432245254517} -08/30/2021 21:09:19 - INFO - __main__ - Step 44443: {'lr': 0.0004052231676460415, 'samples': 8533056, 'steps': 44442, 'loss/train': 0.04636095464229584} -08/30/2021 21:09:19 - INFO - __main__ - Step 44444: {'lr': 0.000405219007677595, 'samples': 8533248, 'steps': 44443, 'loss/train': 1.0714856386184692} -08/30/2021 21:09:19 - INFO - __main__ - Step 44445: {'lr': 0.0004052148476392093, 'samples': 8533440, 'steps': 44444, 'loss/train': 1.0937790870666504} -08/30/2021 21:09:21 - INFO - __main__ - Step 44446: {'lr': 0.00040521068753088615, 'samples': 8533632, 'steps': 44445, 'loss/train': 1.9813108444213867} -08/30/2021 21:09:21 - INFO - __main__ - Step 44447: {'lr': 0.0004052065273526274, 'samples': 8533824, 'steps': 44446, 'loss/train': 1.0501751899719238} -08/30/2021 21:09:22 - INFO - __main__ - Step 44448: {'lr': 0.0004052023671044351, 'samples': 8534016, 'steps': 44447, 'loss/train': 1.4251588582992554} -08/30/2021 21:09:22 - INFO - __main__ - Step 44449: {'lr': 0.0004051982067863109, 'samples': 8534208, 'steps': 44448, 'loss/train': 1.5152170658111572} -08/30/2021 21:09:22 - INFO - __main__ - Step 44450: {'lr': 0.0004051940463982569, 'samples': 8534400, 'steps': 44449, 'loss/train': 2.029966115951538} -08/30/2021 21:09:24 - INFO - __main__ - Step 44451: {'lr': 0.0004051898859402748, 'samples': 8534592, 'steps': 44450, 'loss/train': 0.6633539199829102} -08/30/2021 21:09:24 - INFO - __main__ - Step 44452: {'lr': 0.00040518572541236653, 'samples': 8534784, 'steps': 44451, 'loss/train': 1.9171779155731201} -08/30/2021 21:09:25 - INFO - __main__ - Step 44453: {'lr': 0.00040518156481453397, 'samples': 8534976, 'steps': 44452, 'loss/train': 1.0319797992706299} -08/30/2021 21:09:25 - INFO - __main__ - Step 44454: {'lr': 0.0004051774041467789, 'samples': 8535168, 'steps': 44453, 'loss/train': 0.956123948097229} -08/30/2021 21:09:25 - INFO - __main__ - Step 44455: {'lr': 0.00040517324340910347, 'samples': 8535360, 'steps': 44454, 'loss/train': 1.4808039665222168} -08/30/2021 21:09:27 - INFO - __main__ - Step 44456: {'lr': 0.0004051690826015092, 'samples': 8535552, 'steps': 44455, 'loss/train': 1.4301506280899048} -08/30/2021 21:09:27 - INFO - __main__ - Step 44457: {'lr': 0.0004051649217239982, 'samples': 8535744, 'steps': 44456, 'loss/train': 1.0478050708770752} -08/30/2021 21:09:27 - INFO - __main__ - Step 44458: {'lr': 0.00040516076077657233, 'samples': 8535936, 'steps': 44457, 'loss/train': 1.3084079027175903} -08/30/2021 21:09:28 - INFO - __main__ - Step 44459: {'lr': 0.0004051565997592334, 'samples': 8536128, 'steps': 44458, 'loss/train': 1.7300537824630737} -08/30/2021 21:09:28 - INFO - __main__ - Step 44460: {'lr': 0.0004051524386719832, 'samples': 8536320, 'steps': 44459, 'loss/train': 1.4327802658081055} -08/30/2021 21:09:30 - INFO - __main__ - Step 44461: {'lr': 0.0004051482775148238, 'samples': 8536512, 'steps': 44460, 'loss/train': 1.2706925868988037} -08/30/2021 21:09:30 - INFO - __main__ - Step 44462: {'lr': 0.00040514411628775695, 'samples': 8536704, 'steps': 44461, 'loss/train': 1.3717412948608398} -08/30/2021 21:09:30 - INFO - __main__ - Step 44463: {'lr': 0.0004051399549907846, 'samples': 8536896, 'steps': 44462, 'loss/train': 0.8411885499954224} -08/30/2021 21:09:31 - INFO - __main__ - Step 44464: {'lr': 0.0004051357936239085, 'samples': 8537088, 'steps': 44463, 'loss/train': 1.7029852867126465} -08/30/2021 21:09:31 - INFO - __main__ - Step 44465: {'lr': 0.0004051316321871307, 'samples': 8537280, 'steps': 44464, 'loss/train': 1.7586841583251953} -08/30/2021 21:09:33 - INFO - __main__ - Step 44466: {'lr': 0.0004051274706804529, 'samples': 8537472, 'steps': 44465, 'loss/train': 1.1580958366394043} -08/30/2021 21:09:33 - INFO - __main__ - Step 44467: {'lr': 0.00040512330910387706, 'samples': 8537664, 'steps': 44466, 'loss/train': 1.5329684019088745} -08/30/2021 21:09:33 - INFO - __main__ - Step 44468: {'lr': 0.0004051191474574051, 'samples': 8537856, 'steps': 44467, 'loss/train': 0.5874102115631104} -08/30/2021 21:09:34 - INFO - __main__ - Step 44469: {'lr': 0.0004051149857410388, 'samples': 8538048, 'steps': 44468, 'loss/train': 1.3083397150039673} -08/30/2021 21:09:34 - INFO - __main__ - Step 44470: {'lr': 0.00040511082395478014, 'samples': 8538240, 'steps': 44469, 'loss/train': 0.9663345813751221} -08/30/2021 21:09:36 - INFO - __main__ - Step 44471: {'lr': 0.0004051066620986309, 'samples': 8538432, 'steps': 44470, 'loss/train': 1.491760492324829} -08/30/2021 21:09:36 - INFO - __main__ - Step 44472: {'lr': 0.00040510250017259297, 'samples': 8538624, 'steps': 44471, 'loss/train': 1.2722337245941162} -08/30/2021 21:09:36 - INFO - __main__ - Step 44473: {'lr': 0.0004050983381766683, 'samples': 8538816, 'steps': 44472, 'loss/train': 1.2302114963531494} -08/30/2021 21:09:37 - INFO - __main__ - Step 44474: {'lr': 0.00040509417611085864, 'samples': 8539008, 'steps': 44473, 'loss/train': 1.02627694606781} -08/30/2021 21:09:37 - INFO - __main__ - Step 44475: {'lr': 0.000405090013975166, 'samples': 8539200, 'steps': 44474, 'loss/train': 1.4069682359695435} -08/30/2021 21:09:39 - INFO - __main__ - Step 44476: {'lr': 0.0004050858517695921, 'samples': 8539392, 'steps': 44475, 'loss/train': 0.056732427328825} -08/30/2021 21:09:39 - INFO - __main__ - Step 44477: {'lr': 0.00040508168949413904, 'samples': 8539584, 'steps': 44476, 'loss/train': 0.49713489413261414} -08/30/2021 21:09:40 - INFO - __main__ - Step 44478: {'lr': 0.00040507752714880854, 'samples': 8539776, 'steps': 44477, 'loss/train': 1.7905160188674927} -08/30/2021 21:09:40 - INFO - __main__ - Step 44479: {'lr': 0.0004050733647336024, 'samples': 8539968, 'steps': 44478, 'loss/train': 0.039963483810424805} -08/30/2021 21:09:40 - INFO - __main__ - Step 44480: {'lr': 0.00040506920224852265, 'samples': 8540160, 'steps': 44479, 'loss/train': 1.5167438983917236} -08/30/2021 21:09:42 - INFO - __main__ - Step 44481: {'lr': 0.0004050650396935711, 'samples': 8540352, 'steps': 44480, 'loss/train': 0.9848048686981201} -08/30/2021 21:09:42 - INFO - __main__ - Step 44482: {'lr': 0.00040506087706874966, 'samples': 8540544, 'steps': 44481, 'loss/train': 1.1850807666778564} -08/30/2021 21:09:43 - INFO - __main__ - Step 44483: {'lr': 0.00040505671437406017, 'samples': 8540736, 'steps': 44482, 'loss/train': 1.566209316253662} -08/30/2021 21:09:43 - INFO - __main__ - Step 44484: {'lr': 0.00040505255160950453, 'samples': 8540928, 'steps': 44483, 'loss/train': 1.4203972816467285} -08/30/2021 21:09:43 - INFO - __main__ - Step 44485: {'lr': 0.00040504838877508464, 'samples': 8541120, 'steps': 44484, 'loss/train': 1.0548129081726074} -08/30/2021 21:09:44 - INFO - __main__ - Step 44486: {'lr': 0.0004050442258708022, 'samples': 8541312, 'steps': 44485, 'loss/train': 1.396460771560669} -08/30/2021 21:09:45 - INFO - __main__ - Step 44487: {'lr': 0.0004050400628966594, 'samples': 8541504, 'steps': 44486, 'loss/train': 1.2104344367980957} -08/30/2021 21:09:46 - INFO - __main__ - Step 44488: {'lr': 0.0004050358998526578, 'samples': 8541696, 'steps': 44487, 'loss/train': 1.3652832508087158} -08/30/2021 21:09:46 - INFO - __main__ - Step 44489: {'lr': 0.00040503173673879945, 'samples': 8541888, 'steps': 44488, 'loss/train': 0.5879058837890625} -08/30/2021 21:09:46 - INFO - __main__ - Step 44490: {'lr': 0.00040502757355508626, 'samples': 8542080, 'steps': 44489, 'loss/train': 1.201690435409546} -08/30/2021 21:09:47 - INFO - __main__ - Step 44491: {'lr': 0.00040502341030152, 'samples': 8542272, 'steps': 44490, 'loss/train': 1.2262431383132935} -08/30/2021 21:09:49 - INFO - __main__ - Step 44492: {'lr': 0.0004050192469781025, 'samples': 8542464, 'steps': 44491, 'loss/train': 1.5194636583328247} -08/30/2021 21:09:49 - INFO - __main__ - Step 44493: {'lr': 0.00040501508358483583, 'samples': 8542656, 'steps': 44492, 'loss/train': 1.5061290264129639} -08/30/2021 21:09:50 - INFO - __main__ - Step 44494: {'lr': 0.00040501092012172173, 'samples': 8542848, 'steps': 44493, 'loss/train': 1.147111177444458} -08/30/2021 21:09:50 - INFO - __main__ - Step 44495: {'lr': 0.0004050067565887621, 'samples': 8543040, 'steps': 44494, 'loss/train': 1.7778196334838867} -08/30/2021 21:09:50 - INFO - __main__ - Step 44496: {'lr': 0.00040500259298595874, 'samples': 8543232, 'steps': 44495, 'loss/train': 0.8166763186454773} -08/30/2021 21:09:52 - INFO - __main__ - Step 44497: {'lr': 0.00040499842931331374, 'samples': 8543424, 'steps': 44496, 'loss/train': 2.023059844970703} -08/30/2021 21:09:52 - INFO - __main__ - Step 44498: {'lr': 0.0004049942655708287, 'samples': 8543616, 'steps': 44497, 'loss/train': 1.2264952659606934} -08/30/2021 21:09:53 - INFO - __main__ - Step 44499: {'lr': 0.0004049901017585058, 'samples': 8543808, 'steps': 44498, 'loss/train': 1.063349723815918} -08/30/2021 21:09:53 - INFO - __main__ - Step 44500: {'lr': 0.00040498593787634664, 'samples': 8544000, 'steps': 44499, 'loss/train': 1.9578582048416138} -08/30/2021 21:09:53 - INFO - __main__ - Step 44501: {'lr': 0.0004049817739243532, 'samples': 8544192, 'steps': 44500, 'loss/train': 1.4517039060592651} -08/30/2021 21:09:55 - INFO - __main__ - Step 44502: {'lr': 0.0004049776099025274, 'samples': 8544384, 'steps': 44501, 'loss/train': 1.0581343173980713} -08/30/2021 21:09:55 - INFO - __main__ - Step 44503: {'lr': 0.000404973445810871, 'samples': 8544576, 'steps': 44502, 'loss/train': 1.193643569946289} -08/30/2021 21:09:56 - INFO - __main__ - Step 44504: {'lr': 0.00040496928164938614, 'samples': 8544768, 'steps': 44503, 'loss/train': 1.5667099952697754} -08/30/2021 21:09:56 - INFO - __main__ - Step 44505: {'lr': 0.0004049651174180744, 'samples': 8544960, 'steps': 44504, 'loss/train': 1.494455337524414} -08/30/2021 21:09:56 - INFO - __main__ - Step 44506: {'lr': 0.00040496095311693775, 'samples': 8545152, 'steps': 44505, 'loss/train': 1.3121304512023926} -08/30/2021 21:09:57 - INFO - __main__ - Step 44507: {'lr': 0.0004049567887459781, 'samples': 8545344, 'steps': 44506, 'loss/train': 1.0474810600280762} -08/30/2021 21:09:58 - INFO - __main__ - Step 44508: {'lr': 0.0004049526243051973, 'samples': 8545536, 'steps': 44507, 'loss/train': 0.04861311987042427} -08/30/2021 21:09:59 - INFO - __main__ - Step 44509: {'lr': 0.0004049484597945973, 'samples': 8545728, 'steps': 44508, 'loss/train': 2.0066797733306885} -08/30/2021 21:09:59 - INFO - __main__ - Step 44510: {'lr': 0.00040494429521417983, 'samples': 8545920, 'steps': 44509, 'loss/train': 0.8908435106277466} -08/30/2021 21:10:00 - INFO - __main__ - Step 44511: {'lr': 0.0004049401305639469, 'samples': 8546112, 'steps': 44510, 'loss/train': 1.5709240436553955} -08/30/2021 21:10:00 - INFO - __main__ - Step 44512: {'lr': 0.00040493596584390034, 'samples': 8546304, 'steps': 44511, 'loss/train': 1.5960265398025513} -08/30/2021 21:10:02 - INFO - __main__ - Step 44513: {'lr': 0.00040493180105404203, 'samples': 8546496, 'steps': 44512, 'loss/train': 1.4478884935379028} -08/30/2021 21:10:02 - INFO - __main__ - Step 44514: {'lr': 0.0004049276361943738, 'samples': 8546688, 'steps': 44513, 'loss/train': 0.0514056570827961} -08/30/2021 21:10:02 - INFO - __main__ - Step 44515: {'lr': 0.0004049234712648976, 'samples': 8546880, 'steps': 44514, 'loss/train': 1.0247831344604492} -08/30/2021 21:10:03 - INFO - __main__ - Step 44516: {'lr': 0.00040491930626561525, 'samples': 8547072, 'steps': 44515, 'loss/train': 1.5291014909744263} -08/30/2021 21:10:03 - INFO - __main__ - Step 44517: {'lr': 0.00040491514119652875, 'samples': 8547264, 'steps': 44516, 'loss/train': 1.1822515726089478} -08/30/2021 21:10:03 - INFO - __main__ - Step 44518: {'lr': 0.00040491097605763974, 'samples': 8547456, 'steps': 44517, 'loss/train': 1.1921422481536865} -08/30/2021 21:10:05 - INFO - __main__ - Step 44519: {'lr': 0.00040490681084895034, 'samples': 8547648, 'steps': 44518, 'loss/train': 1.7431014776229858} -08/30/2021 21:10:05 - INFO - __main__ - Step 44520: {'lr': 0.00040490264557046217, 'samples': 8547840, 'steps': 44519, 'loss/train': 0.5104594826698303} -08/30/2021 21:10:06 - INFO - __main__ - Step 44521: {'lr': 0.0004048984802221774, 'samples': 8548032, 'steps': 44520, 'loss/train': 1.6499903202056885} -08/30/2021 21:10:06 - INFO - __main__ - Step 44522: {'lr': 0.0004048943148040977, 'samples': 8548224, 'steps': 44521, 'loss/train': 1.3680845499038696} -08/30/2021 21:10:06 - INFO - __main__ - Step 44523: {'lr': 0.0004048901493162251, 'samples': 8548416, 'steps': 44522, 'loss/train': 1.0962400436401367} -08/30/2021 21:10:08 - INFO - __main__ - Step 44524: {'lr': 0.00040488598375856133, 'samples': 8548608, 'steps': 44523, 'loss/train': 0.7335981130599976} -08/30/2021 21:10:08 - INFO - __main__ - Step 44525: {'lr': 0.0004048818181311083, 'samples': 8548800, 'steps': 44524, 'loss/train': 1.4960570335388184} -08/30/2021 21:10:09 - INFO - __main__ - Step 44526: {'lr': 0.000404877652433868, 'samples': 8548992, 'steps': 44525, 'loss/train': 0.5900524258613586} -08/30/2021 21:10:09 - INFO - __main__ - Step 44527: {'lr': 0.0004048734866668421, 'samples': 8549184, 'steps': 44526, 'loss/train': 1.2702893018722534} -08/30/2021 21:10:10 - INFO - __main__ - Step 44528: {'lr': 0.0004048693208300327, 'samples': 8549376, 'steps': 44527, 'loss/train': 1.304343581199646} -08/30/2021 21:10:11 - INFO - __main__ - Step 44529: {'lr': 0.00040486515492344145, 'samples': 8549568, 'steps': 44528, 'loss/train': 1.3608784675598145} -08/30/2021 21:10:11 - INFO - __main__ - Step 44530: {'lr': 0.00040486098894707044, 'samples': 8549760, 'steps': 44529, 'loss/train': 0.8541049361228943} -08/30/2021 21:10:12 - INFO - __main__ - Step 44531: {'lr': 0.00040485682290092144, 'samples': 8549952, 'steps': 44530, 'loss/train': 1.5711885690689087} -08/30/2021 21:10:12 - INFO - __main__ - Step 44532: {'lr': 0.0004048526567849964, 'samples': 8550144, 'steps': 44531, 'loss/train': 1.330690622329712} -08/30/2021 21:10:13 - INFO - __main__ - Step 44533: {'lr': 0.00040484849059929705, 'samples': 8550336, 'steps': 44532, 'loss/train': 1.4260104894638062} -08/30/2021 21:10:14 - INFO - __main__ - Step 44534: {'lr': 0.00040484432434382547, 'samples': 8550528, 'steps': 44533, 'loss/train': 1.393811583518982} -08/30/2021 21:10:14 - INFO - __main__ - Step 44535: {'lr': 0.0004048401580185833, 'samples': 8550720, 'steps': 44534, 'loss/train': 1.7350919246673584} -08/30/2021 21:10:15 - INFO - __main__ - Step 44536: {'lr': 0.00040483599162357257, 'samples': 8550912, 'steps': 44535, 'loss/train': 1.83530855178833} -08/30/2021 21:10:15 - INFO - __main__ - Step 44537: {'lr': 0.0004048318251587952, 'samples': 8551104, 'steps': 44536, 'loss/train': 1.079136610031128} -08/30/2021 21:10:16 - INFO - __main__ - Step 44538: {'lr': 0.000404827658624253, 'samples': 8551296, 'steps': 44537, 'loss/train': 1.5141124725341797} -08/30/2021 21:10:17 - INFO - __main__ - Step 44539: {'lr': 0.00040482349201994785, 'samples': 8551488, 'steps': 44538, 'loss/train': 1.415168046951294} -08/30/2021 21:10:17 - INFO - __main__ - Step 44540: {'lr': 0.00040481932534588153, 'samples': 8551680, 'steps': 44539, 'loss/train': 0.9200124740600586} -08/30/2021 21:10:18 - INFO - __main__ - Step 44541: {'lr': 0.00040481515860205607, 'samples': 8551872, 'steps': 44540, 'loss/train': 1.6551047563552856} -08/30/2021 21:10:18 - INFO - __main__ - Step 44542: {'lr': 0.00040481099178847326, 'samples': 8552064, 'steps': 44541, 'loss/train': 1.1200001239776611} -08/30/2021 21:10:18 - INFO - __main__ - Step 44543: {'lr': 0.000404806824905135, 'samples': 8552256, 'steps': 44542, 'loss/train': 1.4508363008499146} -08/30/2021 21:10:19 - INFO - __main__ - Step 44544: {'lr': 0.0004048026579520433, 'samples': 8552448, 'steps': 44543, 'loss/train': 1.4934316873550415} -08/30/2021 21:10:21 - INFO - __main__ - Step 44545: {'lr': 0.00040479849092919974, 'samples': 8552640, 'steps': 44544, 'loss/train': 1.4598311185836792} -08/30/2021 21:10:21 - INFO - __main__ - Step 44546: {'lr': 0.00040479432383660644, 'samples': 8552832, 'steps': 44545, 'loss/train': 1.3036412000656128} -08/30/2021 21:10:22 - INFO - __main__ - Step 44547: {'lr': 0.00040479015667426523, 'samples': 8553024, 'steps': 44546, 'loss/train': 0.9568488597869873} -08/30/2021 21:10:22 - INFO - __main__ - Step 44548: {'lr': 0.00040478598944217794, 'samples': 8553216, 'steps': 44547, 'loss/train': 1.3391884565353394} -08/30/2021 21:10:22 - INFO - __main__ - Step 44549: {'lr': 0.0004047818221403464, 'samples': 8553408, 'steps': 44548, 'loss/train': 1.869517207145691} -08/30/2021 21:10:24 - INFO - __main__ - Step 44550: {'lr': 0.0004047776547687727, 'samples': 8553600, 'steps': 44549, 'loss/train': 2.083289384841919} -08/30/2021 21:10:25 - INFO - __main__ - Step 44551: {'lr': 0.00040477348732745853, 'samples': 8553792, 'steps': 44550, 'loss/train': 1.6396681070327759} -08/30/2021 21:10:25 - INFO - __main__ - Step 44552: {'lr': 0.0004047693198164058, 'samples': 8553984, 'steps': 44551, 'loss/train': 0.03724002093076706} -08/30/2021 21:10:25 - INFO - __main__ - Step 44553: {'lr': 0.0004047651522356164, 'samples': 8554176, 'steps': 44552, 'loss/train': 1.58552086353302} -08/30/2021 21:10:26 - INFO - __main__ - Step 44554: {'lr': 0.0004047609845850922, 'samples': 8554368, 'steps': 44553, 'loss/train': 3.346970319747925} -08/30/2021 21:10:27 - INFO - __main__ - Step 44555: {'lr': 0.0004047568168648351, 'samples': 8554560, 'steps': 44554, 'loss/train': 1.0322961807250977} -08/30/2021 21:10:28 - INFO - __main__ - Step 44556: {'lr': 0.00040475264907484696, 'samples': 8554752, 'steps': 44555, 'loss/train': 1.4441256523132324} -08/30/2021 21:10:28 - INFO - __main__ - Step 44557: {'lr': 0.0004047484812151296, 'samples': 8554944, 'steps': 44556, 'loss/train': 0.47064775228500366} -08/30/2021 21:10:28 - INFO - __main__ - Step 44558: {'lr': 0.00040474431328568506, 'samples': 8555136, 'steps': 44557, 'loss/train': 1.3238126039505005} -08/30/2021 21:10:29 - INFO - __main__ - Step 44559: {'lr': 0.00040474014528651514, 'samples': 8555328, 'steps': 44558, 'loss/train': 1.3393900394439697} -08/30/2021 21:10:31 - INFO - __main__ - Step 44560: {'lr': 0.00040473597721762164, 'samples': 8555520, 'steps': 44559, 'loss/train': 1.0714969635009766} -08/30/2021 21:10:31 - INFO - __main__ - Step 44561: {'lr': 0.00040473180907900645, 'samples': 8555712, 'steps': 44560, 'loss/train': 1.986654281616211} -08/30/2021 21:10:31 - INFO - __main__ - Step 44562: {'lr': 0.0004047276408706716, 'samples': 8555904, 'steps': 44561, 'loss/train': 1.0027275085449219} -08/30/2021 21:10:32 - INFO - __main__ - Step 44563: {'lr': 0.00040472347259261875, 'samples': 8556096, 'steps': 44562, 'loss/train': 1.2030565738677979} -08/30/2021 21:10:32 - INFO - __main__ - Step 44564: {'lr': 0.00040471930424485, 'samples': 8556288, 'steps': 44563, 'loss/train': 0.9676149487495422} -08/30/2021 21:10:34 - INFO - __main__ - Step 44565: {'lr': 0.0004047151358273671, 'samples': 8556480, 'steps': 44564, 'loss/train': 0.5190265774726868} -08/30/2021 21:10:34 - INFO - __main__ - Step 44566: {'lr': 0.00040471096734017185, 'samples': 8556672, 'steps': 44565, 'loss/train': 1.3869503736495972} -08/30/2021 21:10:34 - INFO - __main__ - Step 44567: {'lr': 0.0004047067987832663, 'samples': 8556864, 'steps': 44566, 'loss/train': 1.4650006294250488} -08/30/2021 21:10:35 - INFO - __main__ - Step 44568: {'lr': 0.00040470263015665234, 'samples': 8557056, 'steps': 44567, 'loss/train': 1.9376749992370605} -08/30/2021 21:10:35 - INFO - __main__ - Step 44569: {'lr': 0.00040469846146033164, 'samples': 8557248, 'steps': 44568, 'loss/train': 1.3339883089065552} -08/30/2021 21:10:36 - INFO - __main__ - Step 44570: {'lr': 0.00040469429269430617, 'samples': 8557440, 'steps': 44569, 'loss/train': 1.1745285987854004} -08/30/2021 21:10:37 - INFO - __main__ - Step 44571: {'lr': 0.00040469012385857794, 'samples': 8557632, 'steps': 44570, 'loss/train': 1.4878660440444946} -08/30/2021 21:10:37 - INFO - __main__ - Step 44572: {'lr': 0.0004046859549531487, 'samples': 8557824, 'steps': 44571, 'loss/train': 1.124781847000122} -08/30/2021 21:10:38 - INFO - __main__ - Step 44573: {'lr': 0.0004046817859780203, 'samples': 8558016, 'steps': 44572, 'loss/train': 1.2476392984390259} -08/30/2021 21:10:38 - INFO - __main__ - Step 44574: {'lr': 0.00040467761693319473, 'samples': 8558208, 'steps': 44573, 'loss/train': 1.9991528987884521} -08/30/2021 21:10:39 - INFO - __main__ - Step 44575: {'lr': 0.0004046734478186738, 'samples': 8558400, 'steps': 44574, 'loss/train': 1.5686951875686646} -08/30/2021 21:10:40 - INFO - __main__ - Step 44576: {'lr': 0.0004046692786344594, 'samples': 8558592, 'steps': 44575, 'loss/train': 0.7465823292732239} -08/30/2021 21:10:40 - INFO - __main__ - Step 44577: {'lr': 0.0004046651093805534, 'samples': 8558784, 'steps': 44576, 'loss/train': 1.6808507442474365} -08/30/2021 21:10:41 - INFO - __main__ - Step 44578: {'lr': 0.0004046609400569577, 'samples': 8558976, 'steps': 44577, 'loss/train': 1.4354959726333618} -08/30/2021 21:10:41 - INFO - __main__ - Step 44579: {'lr': 0.00040465677066367424, 'samples': 8559168, 'steps': 44578, 'loss/train': 2.2899327278137207} -08/30/2021 21:10:41 - INFO - __main__ - Step 44580: {'lr': 0.0004046526012007047, 'samples': 8559360, 'steps': 44579, 'loss/train': 1.1801016330718994} -08/30/2021 21:10:43 - INFO - __main__ - Step 44581: {'lr': 0.0004046484316680511, 'samples': 8559552, 'steps': 44580, 'loss/train': 1.6281802654266357} -08/30/2021 21:10:43 - INFO - __main__ - Step 44582: {'lr': 0.0004046442620657154, 'samples': 8559744, 'steps': 44581, 'loss/train': 1.3720782995224} -08/30/2021 21:10:44 - INFO - __main__ - Step 44583: {'lr': 0.00040464009239369925, 'samples': 8559936, 'steps': 44582, 'loss/train': 1.4667978286743164} -08/30/2021 21:10:44 - INFO - __main__ - Step 44584: {'lr': 0.0004046359226520048, 'samples': 8560128, 'steps': 44583, 'loss/train': 1.2026638984680176} -08/30/2021 21:10:44 - INFO - __main__ - Step 44585: {'lr': 0.0004046317528406337, 'samples': 8560320, 'steps': 44584, 'loss/train': 2.0747039318084717} -08/30/2021 21:10:46 - INFO - __main__ - Step 44586: {'lr': 0.0004046275829595879, 'samples': 8560512, 'steps': 44585, 'loss/train': 1.427085280418396} -08/30/2021 21:10:46 - INFO - __main__ - Step 44587: {'lr': 0.0004046234130088694, 'samples': 8560704, 'steps': 44586, 'loss/train': 1.8774505853652954} -08/30/2021 21:10:47 - INFO - __main__ - Step 44588: {'lr': 0.00040461924298847987, 'samples': 8560896, 'steps': 44587, 'loss/train': 1.5450016260147095} -08/30/2021 21:10:47 - INFO - __main__ - Step 44589: {'lr': 0.0004046150728984214, 'samples': 8561088, 'steps': 44588, 'loss/train': 1.47158682346344} -08/30/2021 21:10:47 - INFO - __main__ - Step 44590: {'lr': 0.00040461090273869566, 'samples': 8561280, 'steps': 44589, 'loss/train': 1.338092565536499} -08/30/2021 21:10:49 - INFO - __main__ - Step 44591: {'lr': 0.0004046067325093047, 'samples': 8561472, 'steps': 44590, 'loss/train': 1.5805087089538574} -08/30/2021 21:10:49 - INFO - __main__ - Step 44592: {'lr': 0.00040460256221025025, 'samples': 8561664, 'steps': 44591, 'loss/train': 1.2867668867111206} -08/30/2021 21:10:50 - INFO - __main__ - Step 44593: {'lr': 0.00040459839184153436, 'samples': 8561856, 'steps': 44592, 'loss/train': 0.5937618017196655} -08/30/2021 21:10:50 - INFO - __main__ - Step 44594: {'lr': 0.00040459422140315876, 'samples': 8562048, 'steps': 44593, 'loss/train': 1.3605940341949463} -08/30/2021 21:10:50 - INFO - __main__ - Step 44595: {'lr': 0.00040459005089512544, 'samples': 8562240, 'steps': 44594, 'loss/train': 1.4812759160995483} -08/30/2021 21:10:52 - INFO - __main__ - Step 44596: {'lr': 0.0004045858803174362, 'samples': 8562432, 'steps': 44595, 'loss/train': 0.9486871361732483} -08/30/2021 21:10:52 - INFO - __main__ - Step 44597: {'lr': 0.0004045817096700929, 'samples': 8562624, 'steps': 44596, 'loss/train': 1.0470929145812988} -08/30/2021 21:10:53 - INFO - __main__ - Step 44598: {'lr': 0.0004045775389530976, 'samples': 8562816, 'steps': 44597, 'loss/train': 1.4578419923782349} -08/30/2021 21:10:53 - INFO - __main__ - Step 44599: {'lr': 0.00040457336816645195, 'samples': 8563008, 'steps': 44598, 'loss/train': 1.2007524967193604} -08/30/2021 21:10:53 - INFO - __main__ - Step 44600: {'lr': 0.000404569197310158, 'samples': 8563200, 'steps': 44599, 'loss/train': 0.5367192625999451} -08/30/2021 21:10:54 - INFO - __main__ - Step 44601: {'lr': 0.0004045650263842174, 'samples': 8563392, 'steps': 44600, 'loss/train': 1.443903923034668} -08/30/2021 21:10:56 - INFO - __main__ - Step 44602: {'lr': 0.0004045608553886323, 'samples': 8563584, 'steps': 44601, 'loss/train': 1.5638363361358643} -08/30/2021 21:10:56 - INFO - __main__ - Step 44603: {'lr': 0.0004045566843234044, 'samples': 8563776, 'steps': 44602, 'loss/train': 1.3564800024032593} -08/30/2021 21:10:57 - INFO - __main__ - Step 44604: {'lr': 0.0004045525131885357, 'samples': 8563968, 'steps': 44603, 'loss/train': 1.8736985921859741} -08/30/2021 21:10:57 - INFO - __main__ - Step 44605: {'lr': 0.0004045483419840281, 'samples': 8564160, 'steps': 44604, 'loss/train': 1.6619324684143066} -08/30/2021 21:10:57 - INFO - __main__ - Step 44606: {'lr': 0.00040454417070988325, 'samples': 8564352, 'steps': 44605, 'loss/train': 1.4417486190795898} -08/30/2021 21:10:59 - INFO - __main__ - Step 44607: {'lr': 0.0004045399993661033, 'samples': 8564544, 'steps': 44606, 'loss/train': 1.2746599912643433} -08/30/2021 21:11:00 - INFO - __main__ - Step 44608: {'lr': 0.00040453582795268994, 'samples': 8564736, 'steps': 44607, 'loss/train': 1.128827452659607} -08/30/2021 21:11:00 - INFO - __main__ - Step 44609: {'lr': 0.00040453165646964505, 'samples': 8564928, 'steps': 44608, 'loss/train': 1.4094294309616089} -08/30/2021 21:11:00 - INFO - __main__ - Step 44610: {'lr': 0.00040452748491697074, 'samples': 8565120, 'steps': 44609, 'loss/train': 1.2495408058166504} -08/30/2021 21:11:01 - INFO - __main__ - Step 44611: {'lr': 0.00040452331329466864, 'samples': 8565312, 'steps': 44610, 'loss/train': 1.2370538711547852} -08/30/2021 21:11:02 - INFO - __main__ - Step 44612: {'lr': 0.0004045191416027407, 'samples': 8565504, 'steps': 44611, 'loss/train': 1.7766664028167725} -08/30/2021 21:11:03 - INFO - __main__ - Step 44613: {'lr': 0.0004045149698411889, 'samples': 8565696, 'steps': 44612, 'loss/train': 1.398087501525879} -08/30/2021 21:11:03 - INFO - __main__ - Step 44614: {'lr': 0.000404510798010015, 'samples': 8565888, 'steps': 44613, 'loss/train': 1.3768959045410156} -08/30/2021 21:11:03 - INFO - __main__ - Step 44615: {'lr': 0.0004045066261092209, 'samples': 8566080, 'steps': 44614, 'loss/train': 1.4024088382720947} -08/30/2021 21:11:04 - INFO - __main__ - Step 44616: {'lr': 0.0004045024541388085, 'samples': 8566272, 'steps': 44615, 'loss/train': 1.6499426364898682} -08/30/2021 21:11:06 - INFO - __main__ - Step 44617: {'lr': 0.0004044982820987797, 'samples': 8566464, 'steps': 44616, 'loss/train': 1.173856258392334} -08/30/2021 21:11:06 - INFO - __main__ - Step 44618: {'lr': 0.0004044941099891364, 'samples': 8566656, 'steps': 44617, 'loss/train': 1.4359219074249268} -08/30/2021 21:11:06 - INFO - __main__ - Step 44619: {'lr': 0.0004044899378098803, 'samples': 8566848, 'steps': 44618, 'loss/train': 0.23497290909290314} -08/30/2021 21:11:07 - INFO - __main__ - Step 44620: {'lr': 0.00040448576556101356, 'samples': 8567040, 'steps': 44619, 'loss/train': 0.146611288189888} -08/30/2021 21:11:07 - INFO - __main__ - Step 44621: {'lr': 0.0004044815932425379, 'samples': 8567232, 'steps': 44620, 'loss/train': 1.557465672492981} -08/30/2021 21:11:08 - INFO - __main__ - Step 44622: {'lr': 0.0004044774208544551, 'samples': 8567424, 'steps': 44621, 'loss/train': 1.8804394006729126} -08/30/2021 21:11:09 - INFO - __main__ - Step 44623: {'lr': 0.00040447324839676727, 'samples': 8567616, 'steps': 44622, 'loss/train': 0.31287211179733276} -08/30/2021 21:11:09 - INFO - __main__ - Step 44624: {'lr': 0.00040446907586947614, 'samples': 8567808, 'steps': 44623, 'loss/train': 1.286818265914917} -08/30/2021 21:11:10 - INFO - __main__ - Step 44625: {'lr': 0.0004044649032725836, 'samples': 8568000, 'steps': 44624, 'loss/train': 1.5650722980499268} -08/30/2021 21:11:10 - INFO - __main__ - Step 44626: {'lr': 0.00040446073060609156, 'samples': 8568192, 'steps': 44625, 'loss/train': 1.2029505968093872} -08/30/2021 21:11:10 - INFO - __main__ - Step 44627: {'lr': 0.00040445655787000196, 'samples': 8568384, 'steps': 44626, 'loss/train': 1.951327919960022} -08/30/2021 21:11:12 - INFO - __main__ - Step 44628: {'lr': 0.0004044523850643166, 'samples': 8568576, 'steps': 44627, 'loss/train': 1.024367332458496} -08/30/2021 21:11:13 - INFO - __main__ - Step 44629: {'lr': 0.0004044482121890374, 'samples': 8568768, 'steps': 44628, 'loss/train': 1.6101847887039185} -08/30/2021 21:11:13 - INFO - __main__ - Step 44630: {'lr': 0.00040444403924416614, 'samples': 8568960, 'steps': 44629, 'loss/train': 0.09740839898586273} -08/30/2021 21:11:13 - INFO - __main__ - Step 44631: {'lr': 0.00040443986622970486, 'samples': 8569152, 'steps': 44630, 'loss/train': 1.6449363231658936} -08/30/2021 21:11:14 - INFO - __main__ - Step 44632: {'lr': 0.0004044356931456553, 'samples': 8569344, 'steps': 44631, 'loss/train': 1.6267058849334717} -08/30/2021 21:11:15 - INFO - __main__ - Step 44633: {'lr': 0.00040443151999201946, 'samples': 8569536, 'steps': 44632, 'loss/train': 1.104532241821289} -08/30/2021 21:11:16 - INFO - __main__ - Step 44634: {'lr': 0.00040442734676879907, 'samples': 8569728, 'steps': 44633, 'loss/train': 1.3367877006530762} -08/30/2021 21:11:16 - INFO - __main__ - Step 44635: {'lr': 0.0004044231734759961, 'samples': 8569920, 'steps': 44634, 'loss/train': 1.462814211845398} -08/30/2021 21:11:16 - INFO - __main__ - Step 44636: {'lr': 0.00040441900011361256, 'samples': 8570112, 'steps': 44635, 'loss/train': 1.0984530448913574} -08/30/2021 21:11:17 - INFO - __main__ - Step 44637: {'lr': 0.0004044148266816501, 'samples': 8570304, 'steps': 44636, 'loss/train': 1.2905670404434204} -08/30/2021 21:11:18 - INFO - __main__ - Step 44638: {'lr': 0.0004044106531801107, 'samples': 8570496, 'steps': 44637, 'loss/train': 0.05202246829867363} -08/30/2021 21:11:19 - INFO - __main__ - Step 44639: {'lr': 0.0004044064796089963, 'samples': 8570688, 'steps': 44638, 'loss/train': 1.5542014837265015} -08/30/2021 21:11:19 - INFO - __main__ - Step 44640: {'lr': 0.0004044023059683087, 'samples': 8570880, 'steps': 44639, 'loss/train': 2.373070001602173} -08/30/2021 21:11:20 - INFO - __main__ - Step 44641: {'lr': 0.00040439813225804977, 'samples': 8571072, 'steps': 44640, 'loss/train': 1.9628074169158936} -08/30/2021 21:11:20 - INFO - __main__ - Step 44642: {'lr': 0.00040439395847822145, 'samples': 8571264, 'steps': 44641, 'loss/train': 1.1866061687469482} -08/30/2021 21:11:20 - INFO - __main__ - Step 44643: {'lr': 0.00040438978462882557, 'samples': 8571456, 'steps': 44642, 'loss/train': 1.1060564517974854} -08/30/2021 21:11:22 - INFO - __main__ - Step 44644: {'lr': 0.0004043856107098641, 'samples': 8571648, 'steps': 44643, 'loss/train': 1.6540125608444214} -08/30/2021 21:11:22 - INFO - __main__ - Step 44645: {'lr': 0.0004043814367213388, 'samples': 8571840, 'steps': 44644, 'loss/train': 1.6237667798995972} -08/30/2021 21:11:23 - INFO - __main__ - Step 44646: {'lr': 0.00040437726266325164, 'samples': 8572032, 'steps': 44645, 'loss/train': 1.1387388706207275} -08/30/2021 21:11:23 - INFO - __main__ - Step 44647: {'lr': 0.00040437308853560444, 'samples': 8572224, 'steps': 44646, 'loss/train': 1.3084309101104736} -08/30/2021 21:11:23 - INFO - __main__ - Step 44648: {'lr': 0.0004043689143383991, 'samples': 8572416, 'steps': 44647, 'loss/train': 1.6508070230484009} -08/30/2021 21:11:25 - INFO - __main__ - Step 44649: {'lr': 0.00040436474007163754, 'samples': 8572608, 'steps': 44648, 'loss/train': 1.7929701805114746} -08/30/2021 21:11:25 - INFO - __main__ - Step 44650: {'lr': 0.0004043605657353216, 'samples': 8572800, 'steps': 44649, 'loss/train': 1.3815667629241943} -08/30/2021 21:11:25 - INFO - __main__ - Step 44651: {'lr': 0.00040435639132945314, 'samples': 8572992, 'steps': 44650, 'loss/train': 1.6113414764404297} -08/30/2021 21:11:26 - INFO - __main__ - Step 44652: {'lr': 0.0004043522168540341, 'samples': 8573184, 'steps': 44651, 'loss/train': 1.4216866493225098} -08/30/2021 21:11:26 - INFO - __main__ - Step 44653: {'lr': 0.0004043480423090664, 'samples': 8573376, 'steps': 44652, 'loss/train': 1.890062689781189} -08/30/2021 21:11:29 - INFO - __main__ - Step 44654: {'lr': 0.0004043438676945518, 'samples': 8573568, 'steps': 44653, 'loss/train': 1.3811109066009521} -08/30/2021 21:11:29 - INFO - __main__ - Step 44655: {'lr': 0.0004043396930104922, 'samples': 8573760, 'steps': 44654, 'loss/train': 0.7382684946060181} -08/30/2021 21:11:30 - INFO - __main__ - Step 44656: {'lr': 0.0004043355182568895, 'samples': 8573952, 'steps': 44655, 'loss/train': 1.6606881618499756} -08/30/2021 21:11:30 - INFO - __main__ - Step 44657: {'lr': 0.00040433134343374565, 'samples': 8574144, 'steps': 44656, 'loss/train': 1.5059059858322144} -08/30/2021 21:11:30 - INFO - __main__ - Step 44658: {'lr': 0.0004043271685410625, 'samples': 8574336, 'steps': 44657, 'loss/train': 1.1747535467147827} -08/30/2021 21:11:31 - INFO - __main__ - Step 44659: {'lr': 0.00040432299357884185, 'samples': 8574528, 'steps': 44658, 'loss/train': 0.9353310465812683} -08/30/2021 21:11:33 - INFO - __main__ - Step 44660: {'lr': 0.0004043188185470856, 'samples': 8574720, 'steps': 44659, 'loss/train': 0.7692214250564575} -08/30/2021 21:11:33 - INFO - __main__ - Step 44661: {'lr': 0.00040431464344579585, 'samples': 8574912, 'steps': 44660, 'loss/train': 1.4351422786712646} -08/30/2021 21:11:33 - INFO - __main__ - Step 44662: {'lr': 0.00040431046827497415, 'samples': 8575104, 'steps': 44661, 'loss/train': 0.36177942156791687} -08/30/2021 21:11:34 - INFO - __main__ - Step 44663: {'lr': 0.00040430629303462256, 'samples': 8575296, 'steps': 44662, 'loss/train': 1.2546839714050293} -08/30/2021 21:11:34 - INFO - __main__ - Step 44664: {'lr': 0.000404302117724743, 'samples': 8575488, 'steps': 44663, 'loss/train': 0.21498185396194458} -08/30/2021 21:11:36 - INFO - __main__ - Step 44665: {'lr': 0.00040429794234533726, 'samples': 8575680, 'steps': 44664, 'loss/train': 0.13312803208827972} -08/30/2021 21:11:36 - INFO - __main__ - Step 44666: {'lr': 0.0004042937668964072, 'samples': 8575872, 'steps': 44665, 'loss/train': 1.3231137990951538} -08/30/2021 21:11:36 - INFO - __main__ - Step 44667: {'lr': 0.00040428959137795475, 'samples': 8576064, 'steps': 44666, 'loss/train': 1.6441969871520996} -08/30/2021 21:11:37 - INFO - __main__ - Step 44668: {'lr': 0.0004042854157899818, 'samples': 8576256, 'steps': 44667, 'loss/train': 1.4304097890853882} -08/30/2021 21:11:37 - INFO - __main__ - Step 44669: {'lr': 0.0004042812401324902, 'samples': 8576448, 'steps': 44668, 'loss/train': 1.2681901454925537} -08/30/2021 21:11:39 - INFO - __main__ - Step 44670: {'lr': 0.0004042770644054819, 'samples': 8576640, 'steps': 44669, 'loss/train': 1.4806114435195923} -08/30/2021 21:11:39 - INFO - __main__ - Step 44671: {'lr': 0.0004042728886089587, 'samples': 8576832, 'steps': 44670, 'loss/train': 1.3516522645950317} -08/30/2021 21:11:39 - INFO - __main__ - Step 44672: {'lr': 0.00040426871274292257, 'samples': 8577024, 'steps': 44671, 'loss/train': 1.53693425655365} -08/30/2021 21:11:40 - INFO - __main__ - Step 44673: {'lr': 0.00040426453680737534, 'samples': 8577216, 'steps': 44672, 'loss/train': 1.702268123626709} -08/30/2021 21:11:40 - INFO - __main__ - Step 44674: {'lr': 0.0004042603608023189, 'samples': 8577408, 'steps': 44673, 'loss/train': 0.33006757497787476} -08/30/2021 21:11:42 - INFO - __main__ - Step 44675: {'lr': 0.00040425618472775504, 'samples': 8577600, 'steps': 44674, 'loss/train': 0.7661734223365784} -08/30/2021 21:11:42 - INFO - __main__ - Step 44676: {'lr': 0.0004042520085836857, 'samples': 8577792, 'steps': 44675, 'loss/train': 0.9462581276893616} -08/30/2021 21:11:43 - INFO - __main__ - Step 44677: {'lr': 0.0004042478323701129, 'samples': 8577984, 'steps': 44676, 'loss/train': 1.4574273824691772} -08/30/2021 21:11:43 - INFO - __main__ - Step 44678: {'lr': 0.00040424365608703836, 'samples': 8578176, 'steps': 44677, 'loss/train': 0.20433904230594635} -08/30/2021 21:11:43 - INFO - __main__ - Step 44679: {'lr': 0.00040423947973446404, 'samples': 8578368, 'steps': 44678, 'loss/train': 1.3947556018829346} -08/30/2021 21:11:45 - INFO - __main__ - Step 44680: {'lr': 0.00040423530331239177, 'samples': 8578560, 'steps': 44679, 'loss/train': 1.6145468950271606} -08/30/2021 21:11:45 - INFO - __main__ - Step 44681: {'lr': 0.0004042311268208234, 'samples': 8578752, 'steps': 44680, 'loss/train': 1.1512095928192139} -08/30/2021 21:11:46 - INFO - __main__ - Step 44682: {'lr': 0.00040422695025976084, 'samples': 8578944, 'steps': 44681, 'loss/train': 1.4892487525939941} -08/30/2021 21:11:46 - INFO - __main__ - Step 44683: {'lr': 0.00040422277362920614, 'samples': 8579136, 'steps': 44682, 'loss/train': 0.6761452555656433} -08/30/2021 21:11:46 - INFO - __main__ - Step 44684: {'lr': 0.0004042185969291609, 'samples': 8579328, 'steps': 44683, 'loss/train': 1.565118432044983} -08/30/2021 21:11:47 - INFO - __main__ - Step 44685: {'lr': 0.00040421442015962727, 'samples': 8579520, 'steps': 44684, 'loss/train': 1.8606051206588745} -08/30/2021 21:11:48 - INFO - __main__ - Step 44686: {'lr': 0.0004042102433206069, 'samples': 8579712, 'steps': 44685, 'loss/train': 1.0377438068389893} -08/30/2021 21:11:48 - INFO - __main__ - Step 44687: {'lr': 0.0004042060664121018, 'samples': 8579904, 'steps': 44686, 'loss/train': 2.0329248905181885} -08/30/2021 21:11:49 - INFO - __main__ - Step 44688: {'lr': 0.00040420188943411385, 'samples': 8580096, 'steps': 44687, 'loss/train': 1.2740154266357422} -08/30/2021 21:11:49 - INFO - __main__ - Step 44689: {'lr': 0.0004041977123866448, 'samples': 8580288, 'steps': 44688, 'loss/train': 1.4535404443740845} -08/30/2021 21:11:50 - INFO - __main__ - Step 44690: {'lr': 0.0004041935352696968, 'samples': 8580480, 'steps': 44689, 'loss/train': 1.383649230003357} -08/30/2021 21:11:51 - INFO - __main__ - Step 44691: {'lr': 0.00040418935808327153, 'samples': 8580672, 'steps': 44690, 'loss/train': 1.1525440216064453} -08/30/2021 21:11:52 - INFO - __main__ - Step 44692: {'lr': 0.00040418518082737087, 'samples': 8580864, 'steps': 44691, 'loss/train': 1.4060755968093872} -08/30/2021 21:11:52 - INFO - __main__ - Step 44693: {'lr': 0.0004041810035019967, 'samples': 8581056, 'steps': 44692, 'loss/train': 1.3666003942489624} -08/30/2021 21:11:53 - INFO - __main__ - Step 44694: {'lr': 0.00040417682610715107, 'samples': 8581248, 'steps': 44693, 'loss/train': 1.4005112648010254} -08/30/2021 21:11:53 - INFO - __main__ - Step 44695: {'lr': 0.00040417264864283563, 'samples': 8581440, 'steps': 44694, 'loss/train': 1.1218857765197754} -08/30/2021 21:11:53 - INFO - __main__ - Step 44696: {'lr': 0.00040416847110905243, 'samples': 8581632, 'steps': 44695, 'loss/train': 2.3378443717956543} -08/30/2021 21:11:55 - INFO - __main__ - Step 44697: {'lr': 0.0004041642935058033, 'samples': 8581824, 'steps': 44696, 'loss/train': 4.12662935256958} -08/30/2021 21:11:55 - INFO - __main__ - Step 44698: {'lr': 0.0004041601158330901, 'samples': 8582016, 'steps': 44697, 'loss/train': 1.7522892951965332} -08/30/2021 21:11:56 - INFO - __main__ - Step 44699: {'lr': 0.0004041559380909148, 'samples': 8582208, 'steps': 44698, 'loss/train': 2.321178913116455} -08/30/2021 21:11:56 - INFO - __main__ - Step 44700: {'lr': 0.00040415176027927915, 'samples': 8582400, 'steps': 44699, 'loss/train': 1.611406922340393} -08/30/2021 21:11:56 - INFO - __main__ - Step 44701: {'lr': 0.00040414758239818506, 'samples': 8582592, 'steps': 44700, 'loss/train': 1.4158567190170288} -08/30/2021 21:11:58 - INFO - __main__ - Step 44702: {'lr': 0.00040414340444763455, 'samples': 8582784, 'steps': 44701, 'loss/train': 1.0129512548446655} -08/30/2021 21:11:58 - INFO - __main__ - Step 44703: {'lr': 0.0004041392264276292, 'samples': 8582976, 'steps': 44702, 'loss/train': 0.12805743515491486} -08/30/2021 21:11:59 - INFO - __main__ - Step 44704: {'lr': 0.00040413504833817127, 'samples': 8583168, 'steps': 44703, 'loss/train': 1.6544349193572998} -08/30/2021 21:11:59 - INFO - __main__ - Step 44705: {'lr': 0.0004041308701792625, 'samples': 8583360, 'steps': 44704, 'loss/train': 1.9136465787887573} -08/30/2021 21:11:59 - INFO - __main__ - Step 44706: {'lr': 0.00040412669195090466, 'samples': 8583552, 'steps': 44705, 'loss/train': 1.2178682088851929} -08/30/2021 21:12:01 - INFO - __main__ - Step 44707: {'lr': 0.0004041225136530997, 'samples': 8583744, 'steps': 44706, 'loss/train': 0.1818217635154724} -08/30/2021 21:12:02 - INFO - __main__ - Step 44708: {'lr': 0.0004041183352858495, 'samples': 8583936, 'steps': 44707, 'loss/train': 1.3122010231018066} -08/30/2021 21:12:02 - INFO - __main__ - Step 44709: {'lr': 0.00040411415684915596, 'samples': 8584128, 'steps': 44708, 'loss/train': 0.7890591621398926} -08/30/2021 21:12:03 - INFO - __main__ - Step 44710: {'lr': 0.000404109978343021, 'samples': 8584320, 'steps': 44709, 'loss/train': 1.327783226966858} -08/30/2021 21:12:03 - INFO - __main__ - Step 44711: {'lr': 0.0004041057997674464, 'samples': 8584512, 'steps': 44710, 'loss/train': 2.0814294815063477} -08/30/2021 21:12:04 - INFO - __main__ - Step 44712: {'lr': 0.0004041016211224342, 'samples': 8584704, 'steps': 44711, 'loss/train': 2.0686967372894287} -08/30/2021 21:12:05 - INFO - __main__ - Step 44713: {'lr': 0.0004040974424079862, 'samples': 8584896, 'steps': 44712, 'loss/train': 1.5370765924453735} -08/30/2021 21:12:05 - INFO - __main__ - Step 44714: {'lr': 0.00040409326362410416, 'samples': 8585088, 'steps': 44713, 'loss/train': 0.9850499033927917} -08/30/2021 21:12:06 - INFO - __main__ - Step 44715: {'lr': 0.0004040890847707901, 'samples': 8585280, 'steps': 44714, 'loss/train': 1.515038251876831} -08/30/2021 21:12:06 - INFO - __main__ - Step 44716: {'lr': 0.0004040849058480459, 'samples': 8585472, 'steps': 44715, 'loss/train': 1.6759437322616577} -08/30/2021 21:12:08 - INFO - __main__ - Step 44717: {'lr': 0.0004040807268558734, 'samples': 8585664, 'steps': 44716, 'loss/train': 0.9891268610954285} -08/30/2021 21:12:08 - INFO - __main__ - Step 44718: {'lr': 0.0004040765477942745, 'samples': 8585856, 'steps': 44717, 'loss/train': 1.1774619817733765} -08/30/2021 21:12:08 - INFO - __main__ - Step 44719: {'lr': 0.0004040723686632512, 'samples': 8586048, 'steps': 44718, 'loss/train': 0.14400401711463928} -08/30/2021 21:12:09 - INFO - __main__ - Step 44720: {'lr': 0.00040406818946280514, 'samples': 8586240, 'steps': 44719, 'loss/train': 1.463714599609375} -08/30/2021 21:12:09 - INFO - __main__ - Step 44721: {'lr': 0.0004040640101929384, 'samples': 8586432, 'steps': 44720, 'loss/train': 1.3119109869003296} -08/30/2021 21:12:10 - INFO - __main__ - Step 44722: {'lr': 0.0004040598308536527, 'samples': 8586624, 'steps': 44721, 'loss/train': 2.74611496925354} -08/30/2021 21:12:11 - INFO - __main__ - Step 44723: {'lr': 0.0004040556514449501, 'samples': 8586816, 'steps': 44722, 'loss/train': 0.10382609814405441} -08/30/2021 21:12:11 - INFO - __main__ - Step 44724: {'lr': 0.0004040514719668324, 'samples': 8587008, 'steps': 44723, 'loss/train': 1.820826768875122} -08/30/2021 21:12:12 - INFO - __main__ - Step 44725: {'lr': 0.00040404729241930144, 'samples': 8587200, 'steps': 44724, 'loss/train': 1.4273552894592285} -08/30/2021 21:12:12 - INFO - __main__ - Step 44726: {'lr': 0.0004040431128023592, 'samples': 8587392, 'steps': 44725, 'loss/train': 1.0794281959533691} -08/30/2021 21:12:12 - INFO - __main__ - Step 44727: {'lr': 0.0004040389331160075, 'samples': 8587584, 'steps': 44726, 'loss/train': 0.5066059231758118} -08/30/2021 21:12:14 - INFO - __main__ - Step 44728: {'lr': 0.00040403475336024816, 'samples': 8587776, 'steps': 44727, 'loss/train': 1.3578089475631714} -08/30/2021 21:12:14 - INFO - __main__ - Step 44729: {'lr': 0.0004040305735350832, 'samples': 8587968, 'steps': 44728, 'loss/train': 1.3866970539093018} -08/30/2021 21:12:15 - INFO - __main__ - Step 44730: {'lr': 0.00040402639364051443, 'samples': 8588160, 'steps': 44729, 'loss/train': 1.7742223739624023} -08/30/2021 21:12:15 - INFO - __main__ - Step 44731: {'lr': 0.0004040222136765437, 'samples': 8588352, 'steps': 44730, 'loss/train': 1.0697300434112549} -08/30/2021 21:12:15 - INFO - __main__ - Step 44732: {'lr': 0.000404018033643173, 'samples': 8588544, 'steps': 44731, 'loss/train': 1.42644464969635} -08/30/2021 21:12:17 - INFO - __main__ - Step 44733: {'lr': 0.00040401385354040415, 'samples': 8588736, 'steps': 44732, 'loss/train': 1.4834192991256714} -08/30/2021 21:12:18 - INFO - __main__ - Step 44734: {'lr': 0.00040400967336823903, 'samples': 8588928, 'steps': 44733, 'loss/train': 0.5549272298812866} -08/30/2021 21:12:18 - INFO - __main__ - Step 44735: {'lr': 0.0004040054931266795, 'samples': 8589120, 'steps': 44734, 'loss/train': 1.0352789163589478} -08/30/2021 21:12:19 - INFO - __main__ - Step 44736: {'lr': 0.0004040013128157275, 'samples': 8589312, 'steps': 44735, 'loss/train': 1.5035122632980347} -08/30/2021 21:12:19 - INFO - __main__ - Step 44737: {'lr': 0.00040399713243538483, 'samples': 8589504, 'steps': 44736, 'loss/train': 1.7758814096450806} -08/30/2021 21:12:19 - INFO - __main__ - Step 44738: {'lr': 0.00040399295198565344, 'samples': 8589696, 'steps': 44737, 'loss/train': 1.4000332355499268} -08/30/2021 21:12:21 - INFO - __main__ - Step 44739: {'lr': 0.0004039887714665352, 'samples': 8589888, 'steps': 44738, 'loss/train': 1.2474510669708252} -08/30/2021 21:12:21 - INFO - __main__ - Step 44740: {'lr': 0.0004039845908780321, 'samples': 8590080, 'steps': 44739, 'loss/train': 0.25095704197883606} -08/30/2021 21:12:22 - INFO - __main__ - Step 44741: {'lr': 0.00040398041022014585, 'samples': 8590272, 'steps': 44740, 'loss/train': 0.3515515625476837} -08/30/2021 21:12:22 - INFO - __main__ - Step 44742: {'lr': 0.0004039762294928784, 'samples': 8590464, 'steps': 44741, 'loss/train': 1.3373171091079712} -08/30/2021 21:12:23 - INFO - __main__ - Step 44743: {'lr': 0.0004039720486962316, 'samples': 8590656, 'steps': 44742, 'loss/train': 1.7016260623931885} -08/30/2021 21:12:23 - INFO - __main__ - Step 44744: {'lr': 0.00040396786783020747, 'samples': 8590848, 'steps': 44743, 'loss/train': 1.3754642009735107} -08/30/2021 21:12:24 - INFO - __main__ - Step 44745: {'lr': 0.00040396368689480766, 'samples': 8591040, 'steps': 44744, 'loss/train': 1.0809239149093628} -08/30/2021 21:12:25 - INFO - __main__ - Step 44746: {'lr': 0.00040395950589003425, 'samples': 8591232, 'steps': 44745, 'loss/train': 1.9665225744247437} -08/30/2021 21:12:25 - INFO - __main__ - Step 44747: {'lr': 0.00040395532481588914, 'samples': 8591424, 'steps': 44746, 'loss/train': 1.4787989854812622} -08/30/2021 21:12:25 - INFO - __main__ - Step 44748: {'lr': 0.00040395114367237407, 'samples': 8591616, 'steps': 44747, 'loss/train': 1.827306866645813} -08/30/2021 21:12:26 - INFO - __main__ - Step 44749: {'lr': 0.00040394696245949093, 'samples': 8591808, 'steps': 44748, 'loss/train': 1.3914703130722046} -08/30/2021 21:12:27 - INFO - __main__ - Step 44750: {'lr': 0.0004039427811772417, 'samples': 8592000, 'steps': 44749, 'loss/train': 1.7765800952911377} -08/30/2021 21:12:28 - INFO - __main__ - Step 44751: {'lr': 0.0004039385998256283, 'samples': 8592192, 'steps': 44750, 'loss/train': 1.7809475660324097} -08/30/2021 21:12:28 - INFO - __main__ - Step 44752: {'lr': 0.0004039344184046525, 'samples': 8592384, 'steps': 44751, 'loss/train': 1.1189547777175903} -08/30/2021 21:12:28 - INFO - __main__ - Step 44753: {'lr': 0.00040393023691431617, 'samples': 8592576, 'steps': 44752, 'loss/train': 1.2198259830474854} -08/30/2021 21:12:29 - INFO - __main__ - Step 44754: {'lr': 0.00040392605535462137, 'samples': 8592768, 'steps': 44753, 'loss/train': 1.5017012357711792} -08/30/2021 21:12:29 - INFO - __main__ - Step 44755: {'lr': 0.00040392187372556977, 'samples': 8592960, 'steps': 44754, 'loss/train': 1.3450887203216553} -08/30/2021 21:12:31 - INFO - __main__ - Step 44756: {'lr': 0.00040391769202716333, 'samples': 8593152, 'steps': 44755, 'loss/train': 1.689627766609192} -08/30/2021 21:12:31 - INFO - __main__ - Step 44757: {'lr': 0.00040391351025940406, 'samples': 8593344, 'steps': 44756, 'loss/train': 2.285498857498169} -08/30/2021 21:12:31 - INFO - __main__ - Step 44758: {'lr': 0.00040390932842229363, 'samples': 8593536, 'steps': 44757, 'loss/train': 1.3162336349487305} -08/30/2021 21:12:32 - INFO - __main__ - Step 44759: {'lr': 0.0004039051465158341, 'samples': 8593728, 'steps': 44758, 'loss/train': 1.2031238079071045} -08/30/2021 21:12:32 - INFO - __main__ - Step 44760: {'lr': 0.0004039009645400272, 'samples': 8593920, 'steps': 44759, 'loss/train': 2.238046407699585} -08/30/2021 21:12:34 - INFO - __main__ - Step 44761: {'lr': 0.00040389678249487504, 'samples': 8594112, 'steps': 44760, 'loss/train': 1.9598907232284546} -08/30/2021 21:12:34 - INFO - __main__ - Step 44762: {'lr': 0.00040389260038037924, 'samples': 8594304, 'steps': 44761, 'loss/train': 1.3632460832595825} -08/30/2021 21:12:34 - INFO - __main__ - Step 44763: {'lr': 0.0004038884181965419, 'samples': 8594496, 'steps': 44762, 'loss/train': 1.8618515729904175} -08/30/2021 21:12:35 - INFO - __main__ - Step 44764: {'lr': 0.0004038842359433647, 'samples': 8594688, 'steps': 44763, 'loss/train': 1.0962245464324951} -08/30/2021 21:12:35 - INFO - __main__ - Step 44765: {'lr': 0.0004038800536208497, 'samples': 8594880, 'steps': 44764, 'loss/train': 1.3337403535842896} -08/30/2021 21:12:37 - INFO - __main__ - Step 44766: {'lr': 0.00040387587122899877, 'samples': 8595072, 'steps': 44765, 'loss/train': 1.6342111825942993} -08/30/2021 21:12:38 - INFO - __main__ - Step 44767: {'lr': 0.0004038716887678137, 'samples': 8595264, 'steps': 44766, 'loss/train': 1.220460295677185} -08/30/2021 21:12:38 - INFO - __main__ - Step 44768: {'lr': 0.0004038675062372964, 'samples': 8595456, 'steps': 44767, 'loss/train': 0.762306809425354} -08/30/2021 21:12:38 - INFO - __main__ - Step 44769: {'lr': 0.00040386332363744884, 'samples': 8595648, 'steps': 44768, 'loss/train': 1.6427874565124512} -08/30/2021 21:12:39 - INFO - __main__ - Step 44770: {'lr': 0.0004038591409682728, 'samples': 8595840, 'steps': 44769, 'loss/train': 1.0624582767486572} -08/30/2021 21:12:40 - INFO - __main__ - Step 44771: {'lr': 0.00040385495822977015, 'samples': 8596032, 'steps': 44770, 'loss/train': 1.3694335222244263} -08/30/2021 21:12:41 - INFO - __main__ - Step 44772: {'lr': 0.00040385077542194294, 'samples': 8596224, 'steps': 44771, 'loss/train': 0.9849164485931396} -08/30/2021 21:12:41 - INFO - __main__ - Step 44773: {'lr': 0.0004038465925447929, 'samples': 8596416, 'steps': 44772, 'loss/train': 1.452582836151123} -08/30/2021 21:12:42 - INFO - __main__ - Step 44774: {'lr': 0.00040384240959832196, 'samples': 8596608, 'steps': 44773, 'loss/train': 1.5353108644485474} -08/30/2021 21:12:42 - INFO - __main__ - Step 44775: {'lr': 0.000403838226582532, 'samples': 8596800, 'steps': 44774, 'loss/train': 1.2722387313842773} -08/30/2021 21:12:43 - INFO - __main__ - Step 44776: {'lr': 0.00040383404349742484, 'samples': 8596992, 'steps': 44775, 'loss/train': 0.08614099025726318} -08/30/2021 21:12:44 - INFO - __main__ - Step 44777: {'lr': 0.0004038298603430025, 'samples': 8597184, 'steps': 44776, 'loss/train': 1.6187736988067627} -08/30/2021 21:12:44 - INFO - __main__ - Step 44778: {'lr': 0.0004038256771192668, 'samples': 8597376, 'steps': 44777, 'loss/train': 1.1794672012329102} -08/30/2021 21:12:44 - INFO - __main__ - Step 44779: {'lr': 0.00040382149382621967, 'samples': 8597568, 'steps': 44778, 'loss/train': 1.0087658166885376} -08/30/2021 21:12:45 - INFO - __main__ - Step 44780: {'lr': 0.00040381731046386295, 'samples': 8597760, 'steps': 44779, 'loss/train': 1.5379784107208252} -08/30/2021 21:12:46 - INFO - __main__ - Step 44781: {'lr': 0.0004038131270321984, 'samples': 8597952, 'steps': 44780, 'loss/train': 1.3625178337097168} -08/30/2021 21:12:47 - INFO - __main__ - Step 44782: {'lr': 0.0004038089435312281, 'samples': 8598144, 'steps': 44781, 'loss/train': 1.5956666469573975} -08/30/2021 21:12:47 - INFO - __main__ - Step 44783: {'lr': 0.0004038047599609539, 'samples': 8598336, 'steps': 44782, 'loss/train': 0.7987320423126221} -08/30/2021 21:12:48 - INFO - __main__ - Step 44784: {'lr': 0.00040380057632137756, 'samples': 8598528, 'steps': 44783, 'loss/train': 1.4341366291046143} -08/30/2021 21:12:48 - INFO - __main__ - Step 44785: {'lr': 0.0004037963926125011, 'samples': 8598720, 'steps': 44784, 'loss/train': 0.057333629578351974} -08/30/2021 21:12:49 - INFO - __main__ - Step 44786: {'lr': 0.00040379220883432644, 'samples': 8598912, 'steps': 44785, 'loss/train': 1.1526473760604858} -08/30/2021 21:12:50 - INFO - __main__ - Step 44787: {'lr': 0.0004037880249868553, 'samples': 8599104, 'steps': 44786, 'loss/train': 1.2982807159423828} -08/30/2021 21:12:50 - INFO - __main__ - Step 44788: {'lr': 0.00040378384107008967, 'samples': 8599296, 'steps': 44787, 'loss/train': 1.4623582363128662} -08/30/2021 21:12:51 - INFO - __main__ - Step 44789: {'lr': 0.00040377965708403133, 'samples': 8599488, 'steps': 44788, 'loss/train': 1.7044297456741333} -08/30/2021 21:12:51 - INFO - __main__ - Step 44790: {'lr': 0.00040377547302868235, 'samples': 8599680, 'steps': 44789, 'loss/train': 1.9895410537719727} -08/30/2021 21:12:51 - INFO - __main__ - Step 44791: {'lr': 0.00040377128890404444, 'samples': 8599872, 'steps': 44790, 'loss/train': 1.7813513278961182} -08/30/2021 21:12:53 - INFO - __main__ - Step 44792: {'lr': 0.00040376710471011967, 'samples': 8600064, 'steps': 44791, 'loss/train': 1.7507117986679077} -08/30/2021 21:12:53 - INFO - __main__ - Step 44793: {'lr': 0.0004037629204469098, 'samples': 8600256, 'steps': 44792, 'loss/train': 1.2732532024383545} -08/30/2021 21:12:54 - INFO - __main__ - Step 44794: {'lr': 0.0004037587361144166, 'samples': 8600448, 'steps': 44793, 'loss/train': 1.7000207901000977} -08/30/2021 21:12:54 - INFO - __main__ - Step 44795: {'lr': 0.0004037545517126422, 'samples': 8600640, 'steps': 44794, 'loss/train': 0.5240303874015808} -08/30/2021 21:12:54 - INFO - __main__ - Step 44796: {'lr': 0.0004037503672415883, 'samples': 8600832, 'steps': 44795, 'loss/train': 1.7082513570785522} -08/30/2021 21:12:56 - INFO - __main__ - Step 44797: {'lr': 0.000403746182701257, 'samples': 8601024, 'steps': 44796, 'loss/train': 1.4022642374038696} -08/30/2021 21:12:56 - INFO - __main__ - Step 44798: {'lr': 0.0004037419980916499, 'samples': 8601216, 'steps': 44797, 'loss/train': 1.2172809839248657} -08/30/2021 21:12:57 - INFO - __main__ - Step 44799: {'lr': 0.00040373781341276904, 'samples': 8601408, 'steps': 44798, 'loss/train': 1.5933799743652344} -08/30/2021 21:12:57 - INFO - __main__ - Step 44800: {'lr': 0.00040373362866461633, 'samples': 8601600, 'steps': 44799, 'loss/train': 1.5234166383743286} -08/30/2021 21:12:57 - INFO - __main__ - Step 44801: {'lr': 0.0004037294438471936, 'samples': 8601792, 'steps': 44800, 'loss/train': 1.8410542011260986} -08/30/2021 21:12:59 - INFO - __main__ - Step 44802: {'lr': 0.00040372525896050285, 'samples': 8601984, 'steps': 44801, 'loss/train': 1.719411849975586} -08/30/2021 21:12:59 - INFO - __main__ - Step 44803: {'lr': 0.0004037210740045457, 'samples': 8602176, 'steps': 44802, 'loss/train': 0.5989000797271729} -08/30/2021 21:13:00 - INFO - __main__ - Step 44804: {'lr': 0.0004037168889793243, 'samples': 8602368, 'steps': 44803, 'loss/train': 1.1456217765808105} -08/30/2021 21:13:00 - INFO - __main__ - Step 44805: {'lr': 0.0004037127038848404, 'samples': 8602560, 'steps': 44804, 'loss/train': 1.4343721866607666} -08/30/2021 21:13:00 - INFO - __main__ - Step 44806: {'lr': 0.00040370851872109604, 'samples': 8602752, 'steps': 44805, 'loss/train': 0.966774046421051} -08/30/2021 21:13:02 - INFO - __main__ - Step 44807: {'lr': 0.0004037043334880929, 'samples': 8602944, 'steps': 44806, 'loss/train': 1.4352450370788574} -08/30/2021 21:13:02 - INFO - __main__ - Step 44808: {'lr': 0.000403700148185833, 'samples': 8603136, 'steps': 44807, 'loss/train': 1.2813022136688232} -08/30/2021 21:13:03 - INFO - __main__ - Step 44809: {'lr': 0.00040369596281431816, 'samples': 8603328, 'steps': 44808, 'loss/train': 0.12124764919281006} -08/30/2021 21:13:03 - INFO - __main__ - Step 44810: {'lr': 0.0004036917773735502, 'samples': 8603520, 'steps': 44809, 'loss/train': 1.1848020553588867} -08/30/2021 21:13:04 - INFO - __main__ - Step 44811: {'lr': 0.00040368759186353123, 'samples': 8603712, 'steps': 44810, 'loss/train': 0.3524267375469208} -08/30/2021 21:13:05 - INFO - __main__ - Step 44812: {'lr': 0.0004036834062842629, 'samples': 8603904, 'steps': 44811, 'loss/train': 1.1271228790283203} -08/30/2021 21:13:05 - INFO - __main__ - Step 44813: {'lr': 0.00040367922063574735, 'samples': 8604096, 'steps': 44812, 'loss/train': 1.3416420221328735} -08/30/2021 21:13:06 - INFO - __main__ - Step 44814: {'lr': 0.0004036750349179862, 'samples': 8604288, 'steps': 44813, 'loss/train': 1.1397815942764282} -08/30/2021 21:13:06 - INFO - __main__ - Step 44815: {'lr': 0.00040367084913098153, 'samples': 8604480, 'steps': 44814, 'loss/train': 0.9503486752510071} -08/30/2021 21:13:06 - INFO - __main__ - Step 44816: {'lr': 0.000403666663274735, 'samples': 8604672, 'steps': 44815, 'loss/train': 1.4151442050933838} -08/30/2021 21:13:08 - INFO - __main__ - Step 44817: {'lr': 0.0004036624773492488, 'samples': 8604864, 'steps': 44816, 'loss/train': 1.4580477476119995} -08/30/2021 21:13:09 - INFO - __main__ - Step 44818: {'lr': 0.0004036582913545246, 'samples': 8605056, 'steps': 44817, 'loss/train': 1.3998230695724487} -08/30/2021 21:13:09 - INFO - __main__ - Step 44819: {'lr': 0.0004036541052905643, 'samples': 8605248, 'steps': 44818, 'loss/train': 1.0086911916732788} -08/30/2021 21:13:10 - INFO - __main__ - Step 44820: {'lr': 0.0004036499191573699, 'samples': 8605440, 'steps': 44819, 'loss/train': 1.54413640499115} -08/30/2021 21:13:10 - INFO - __main__ - Step 44821: {'lr': 0.00040364573295494316, 'samples': 8605632, 'steps': 44820, 'loss/train': 1.0503805875778198} -08/30/2021 21:13:10 - INFO - __main__ - Step 44822: {'lr': 0.00040364154668328604, 'samples': 8605824, 'steps': 44821, 'loss/train': 1.2390207052230835} -08/30/2021 21:13:13 - INFO - __main__ - Step 44823: {'lr': 0.0004036373603424004, 'samples': 8606016, 'steps': 44822, 'loss/train': 1.408416748046875} -08/30/2021 21:13:14 - INFO - __main__ - Step 44824: {'lr': 0.00040363317393228814, 'samples': 8606208, 'steps': 44823, 'loss/train': 1.9918785095214844} -08/30/2021 21:13:14 - INFO - __main__ - Step 44825: {'lr': 0.00040362898745295117, 'samples': 8606400, 'steps': 44824, 'loss/train': 1.9970000982284546} -08/30/2021 21:13:14 - INFO - __main__ - Step 44826: {'lr': 0.00040362480090439136, 'samples': 8606592, 'steps': 44825, 'loss/train': 1.832792043685913} -08/30/2021 21:13:15 - INFO - __main__ - Step 44827: {'lr': 0.00040362061428661055, 'samples': 8606784, 'steps': 44826, 'loss/train': 1.7892916202545166} -08/30/2021 21:13:15 - INFO - __main__ - Step 44828: {'lr': 0.0004036164275996107, 'samples': 8606976, 'steps': 44827, 'loss/train': 1.4752496480941772} -08/30/2021 21:13:15 - INFO - __main__ - Step 44829: {'lr': 0.00040361224084339365, 'samples': 8607168, 'steps': 44828, 'loss/train': 1.9663931131362915} -08/30/2021 21:13:17 - INFO - __main__ - Step 44830: {'lr': 0.00040360805401796124, 'samples': 8607360, 'steps': 44829, 'loss/train': 1.1984492540359497} -08/30/2021 21:13:17 - INFO - __main__ - Step 44831: {'lr': 0.0004036038671233154, 'samples': 8607552, 'steps': 44830, 'loss/train': 1.2167338132858276} -08/30/2021 21:13:18 - INFO - __main__ - Step 44832: {'lr': 0.00040359968015945814, 'samples': 8607744, 'steps': 44831, 'loss/train': 2.0896899700164795} -08/30/2021 21:13:18 - INFO - __main__ - Step 44833: {'lr': 0.0004035954931263912, 'samples': 8607936, 'steps': 44832, 'loss/train': 1.2225323915481567} -08/30/2021 21:13:19 - INFO - __main__ - Step 44834: {'lr': 0.00040359130602411644, 'samples': 8608128, 'steps': 44833, 'loss/train': 1.1123920679092407} -08/30/2021 21:13:20 - INFO - __main__ - Step 44835: {'lr': 0.0004035871188526358, 'samples': 8608320, 'steps': 44834, 'loss/train': 1.6819673776626587} -08/30/2021 21:13:20 - INFO - __main__ - Step 44836: {'lr': 0.00040358293161195125, 'samples': 8608512, 'steps': 44835, 'loss/train': 1.055145025253296} -08/30/2021 21:13:21 - INFO - __main__ - Step 44837: {'lr': 0.0004035787443020645, 'samples': 8608704, 'steps': 44836, 'loss/train': 1.4019320011138916} -08/30/2021 21:13:21 - INFO - __main__ - Step 44838: {'lr': 0.00040357455692297765, 'samples': 8608896, 'steps': 44837, 'loss/train': 0.7773519158363342} -08/30/2021 21:13:22 - INFO - __main__ - Step 44839: {'lr': 0.0004035703694746924, 'samples': 8609088, 'steps': 44838, 'loss/train': 1.1051130294799805} -08/30/2021 21:13:22 - INFO - __main__ - Step 44840: {'lr': 0.0004035661819572108, 'samples': 8609280, 'steps': 44839, 'loss/train': 1.2858930826187134} -08/30/2021 21:13:23 - INFO - __main__ - Step 44841: {'lr': 0.0004035619943705345, 'samples': 8609472, 'steps': 44840, 'loss/train': 1.8081300258636475} -08/30/2021 21:13:24 - INFO - __main__ - Step 44842: {'lr': 0.0004035578067146657, 'samples': 8609664, 'steps': 44841, 'loss/train': 1.3008902072906494} -08/30/2021 21:13:24 - INFO - __main__ - Step 44843: {'lr': 0.000403553618989606, 'samples': 8609856, 'steps': 44842, 'loss/train': 1.1326730251312256} -08/30/2021 21:13:25 - INFO - __main__ - Step 44844: {'lr': 0.0004035494311953575, 'samples': 8610048, 'steps': 44843, 'loss/train': 1.447136640548706} -08/30/2021 21:13:25 - INFO - __main__ - Step 44845: {'lr': 0.0004035452433319219, 'samples': 8610240, 'steps': 44844, 'loss/train': 0.6824878454208374} -08/30/2021 21:13:26 - INFO - __main__ - Step 44846: {'lr': 0.0004035410553993012, 'samples': 8610432, 'steps': 44845, 'loss/train': 1.9774402379989624} -08/30/2021 21:13:27 - INFO - __main__ - Step 44847: {'lr': 0.00040353686739749733, 'samples': 8610624, 'steps': 44846, 'loss/train': 1.1656694412231445} -08/30/2021 21:13:27 - INFO - __main__ - Step 44848: {'lr': 0.0004035326793265121, 'samples': 8610816, 'steps': 44847, 'loss/train': 1.234243392944336} -08/30/2021 21:13:28 - INFO - __main__ - Step 44849: {'lr': 0.0004035284911863474, 'samples': 8611008, 'steps': 44848, 'loss/train': 1.1792242527008057} -08/30/2021 21:13:28 - INFO - __main__ - Step 44850: {'lr': 0.00040352430297700513, 'samples': 8611200, 'steps': 44849, 'loss/train': 0.7943199872970581} -08/30/2021 21:13:29 - INFO - __main__ - Step 44851: {'lr': 0.00040352011469848713, 'samples': 8611392, 'steps': 44850, 'loss/train': 1.5195316076278687} -08/30/2021 21:13:30 - INFO - __main__ - Step 44852: {'lr': 0.00040351592635079535, 'samples': 8611584, 'steps': 44851, 'loss/train': 1.5766055583953857} -08/30/2021 21:13:30 - INFO - __main__ - Step 44853: {'lr': 0.0004035117379339318, 'samples': 8611776, 'steps': 44852, 'loss/train': 1.315437912940979} -08/30/2021 21:13:31 - INFO - __main__ - Step 44854: {'lr': 0.00040350754944789815, 'samples': 8611968, 'steps': 44853, 'loss/train': 1.4011709690093994} -08/30/2021 21:13:31 - INFO - __main__ - Step 44855: {'lr': 0.0004035033608926963, 'samples': 8612160, 'steps': 44854, 'loss/train': 1.288525938987732} -08/30/2021 21:13:32 - INFO - __main__ - Step 44856: {'lr': 0.0004034991722683282, 'samples': 8612352, 'steps': 44855, 'loss/train': 1.4414703845977783} -08/30/2021 21:13:33 - INFO - __main__ - Step 44857: {'lr': 0.0004034949835747958, 'samples': 8612544, 'steps': 44856, 'loss/train': 1.63954758644104} -08/30/2021 21:13:33 - INFO - __main__ - Step 44858: {'lr': 0.00040349079481210096, 'samples': 8612736, 'steps': 44857, 'loss/train': 1.5960896015167236} -08/30/2021 21:13:34 - INFO - __main__ - Step 44859: {'lr': 0.00040348660598024547, 'samples': 8612928, 'steps': 44858, 'loss/train': 2.125499963760376} -08/30/2021 21:13:34 - INFO - __main__ - Step 44860: {'lr': 0.0004034824170792313, 'samples': 8613120, 'steps': 44859, 'loss/train': 1.7612104415893555} -08/30/2021 21:13:34 - INFO - __main__ - Step 44861: {'lr': 0.0004034782281090603, 'samples': 8613312, 'steps': 44860, 'loss/train': 1.3749823570251465} -08/30/2021 21:13:36 - INFO - __main__ - Step 44862: {'lr': 0.00040347403906973445, 'samples': 8613504, 'steps': 44861, 'loss/train': 1.1683363914489746} -08/30/2021 21:13:37 - INFO - __main__ - Step 44863: {'lr': 0.0004034698499612555, 'samples': 8613696, 'steps': 44862, 'loss/train': 0.06823708862066269} -08/30/2021 21:13:37 - INFO - __main__ - Step 44864: {'lr': 0.00040346566078362545, 'samples': 8613888, 'steps': 44863, 'loss/train': 0.049810729920864105} -08/30/2021 21:13:37 - INFO - __main__ - Step 44865: {'lr': 0.0004034614715368461, 'samples': 8614080, 'steps': 44864, 'loss/train': 1.4070563316345215} -08/30/2021 21:13:38 - INFO - __main__ - Step 44866: {'lr': 0.0004034572822209194, 'samples': 8614272, 'steps': 44865, 'loss/train': 1.8077664375305176} -08/30/2021 21:13:38 - INFO - __main__ - Step 44867: {'lr': 0.00040345309283584726, 'samples': 8614464, 'steps': 44866, 'loss/train': 1.9318798780441284} -08/30/2021 21:13:39 - INFO - __main__ - Step 44868: {'lr': 0.0004034489033816314, 'samples': 8614656, 'steps': 44867, 'loss/train': 0.6336967945098877} -08/30/2021 21:13:40 - INFO - __main__ - Step 44869: {'lr': 0.00040344471385827396, 'samples': 8614848, 'steps': 44868, 'loss/train': 1.1346098184585571} -08/30/2021 21:13:40 - INFO - __main__ - Step 44870: {'lr': 0.00040344052426577665, 'samples': 8615040, 'steps': 44869, 'loss/train': 0.7720788717269897} -08/30/2021 21:13:41 - INFO - __main__ - Step 44871: {'lr': 0.0004034363346041414, 'samples': 8615232, 'steps': 44870, 'loss/train': 1.6827176809310913} -08/30/2021 21:13:41 - INFO - __main__ - Step 44872: {'lr': 0.0004034321448733701, 'samples': 8615424, 'steps': 44871, 'loss/train': 1.4226248264312744} -08/30/2021 21:13:43 - INFO - __main__ - Step 44873: {'lr': 0.00040342795507346464, 'samples': 8615616, 'steps': 44872, 'loss/train': 1.684158205986023} -08/30/2021 21:13:43 - INFO - __main__ - Step 44874: {'lr': 0.000403423765204427, 'samples': 8615808, 'steps': 44873, 'loss/train': 1.4739277362823486} -08/30/2021 21:13:44 - INFO - __main__ - Step 44875: {'lr': 0.0004034195752662589, 'samples': 8616000, 'steps': 44874, 'loss/train': 0.8114175796508789} -08/30/2021 21:13:44 - INFO - __main__ - Step 44876: {'lr': 0.00040341538525896233, 'samples': 8616192, 'steps': 44875, 'loss/train': 1.1240508556365967} -08/30/2021 21:13:44 - INFO - __main__ - Step 44877: {'lr': 0.0004034111951825391, 'samples': 8616384, 'steps': 44876, 'loss/train': 0.12597016990184784} -08/30/2021 21:13:46 - INFO - __main__ - Step 44878: {'lr': 0.00040340700503699116, 'samples': 8616576, 'steps': 44877, 'loss/train': 1.5539361238479614} -08/30/2021 21:13:47 - INFO - __main__ - Step 44879: {'lr': 0.0004034028148223204, 'samples': 8616768, 'steps': 44878, 'loss/train': 1.5281035900115967} -08/30/2021 21:13:47 - INFO - __main__ - Step 44880: {'lr': 0.0004033986245385288, 'samples': 8616960, 'steps': 44879, 'loss/train': 0.9278026223182678} -08/30/2021 21:13:47 - INFO - __main__ - Step 44881: {'lr': 0.0004033944341856181, 'samples': 8617152, 'steps': 44880, 'loss/train': 1.3097578287124634} -08/30/2021 21:13:48 - INFO - __main__ - Step 44882: {'lr': 0.00040339024376359015, 'samples': 8617344, 'steps': 44881, 'loss/train': 1.283706784248352} -08/30/2021 21:13:49 - INFO - __main__ - Step 44883: {'lr': 0.000403386053272447, 'samples': 8617536, 'steps': 44882, 'loss/train': 1.464145302772522} -08/30/2021 21:13:50 - INFO - __main__ - Step 44884: {'lr': 0.0004033818627121904, 'samples': 8617728, 'steps': 44883, 'loss/train': 0.14013558626174927} -08/30/2021 21:13:50 - INFO - __main__ - Step 44885: {'lr': 0.00040337767208282235, 'samples': 8617920, 'steps': 44884, 'loss/train': 1.519673466682434} -08/30/2021 21:13:51 - INFO - __main__ - Step 44886: {'lr': 0.00040337348138434466, 'samples': 8618112, 'steps': 44885, 'loss/train': 2.190647840499878} -08/30/2021 21:13:51 - INFO - __main__ - Step 44887: {'lr': 0.00040336929061675933, 'samples': 8618304, 'steps': 44886, 'loss/train': 2.1774699687957764} -08/30/2021 21:13:51 - INFO - __main__ - Step 44888: {'lr': 0.0004033650997800681, 'samples': 8618496, 'steps': 44887, 'loss/train': 1.4825836420059204} -08/30/2021 21:13:53 - INFO - __main__ - Step 44889: {'lr': 0.00040336090887427284, 'samples': 8618688, 'steps': 44888, 'loss/train': 1.1236737966537476} -08/30/2021 21:13:53 - INFO - __main__ - Step 44890: {'lr': 0.00040335671789937564, 'samples': 8618880, 'steps': 44889, 'loss/train': 1.5144944190979004} -08/30/2021 21:13:54 - INFO - __main__ - Step 44891: {'lr': 0.00040335252685537817, 'samples': 8619072, 'steps': 44890, 'loss/train': 1.1874704360961914} -08/30/2021 21:13:54 - INFO - __main__ - Step 44892: {'lr': 0.0004033483357422825, 'samples': 8619264, 'steps': 44891, 'loss/train': 1.4392975568771362} -08/30/2021 21:13:54 - INFO - __main__ - Step 44893: {'lr': 0.0004033441445600904, 'samples': 8619456, 'steps': 44892, 'loss/train': 1.5645421743392944} -08/30/2021 21:13:56 - INFO - __main__ - Step 44894: {'lr': 0.0004033399533088038, 'samples': 8619648, 'steps': 44893, 'loss/train': 1.152329683303833} -08/30/2021 21:13:57 - INFO - __main__ - Step 44895: {'lr': 0.00040333576198842456, 'samples': 8619840, 'steps': 44894, 'loss/train': 1.283441424369812} -08/30/2021 21:13:57 - INFO - __main__ - Step 44896: {'lr': 0.00040333157059895463, 'samples': 8620032, 'steps': 44895, 'loss/train': 1.3250155448913574} -08/30/2021 21:13:58 - INFO - __main__ - Step 44897: {'lr': 0.0004033273791403959, 'samples': 8620224, 'steps': 44896, 'loss/train': 1.0440212488174438} -08/30/2021 21:13:58 - INFO - __main__ - Step 44898: {'lr': 0.0004033231876127501, 'samples': 8620416, 'steps': 44897, 'loss/train': 0.9838039875030518} -08/30/2021 21:14:00 - INFO - __main__ - Step 44899: {'lr': 0.00040331899601601934, 'samples': 8620608, 'steps': 44898, 'loss/train': 1.089269757270813} -08/30/2021 21:14:00 - INFO - __main__ - Step 44900: {'lr': 0.0004033148043502054, 'samples': 8620800, 'steps': 44899, 'loss/train': 1.3817768096923828} -08/30/2021 21:14:01 - INFO - __main__ - Step 44901: {'lr': 0.00040331061261531014, 'samples': 8620992, 'steps': 44900, 'loss/train': 1.220621109008789} -08/30/2021 21:14:01 - INFO - __main__ - Step 44902: {'lr': 0.0004033064208113355, 'samples': 8621184, 'steps': 44901, 'loss/train': 1.7035713195800781} -08/30/2021 21:14:01 - INFO - __main__ - Step 44903: {'lr': 0.00040330222893828334, 'samples': 8621376, 'steps': 44902, 'loss/train': 0.05508426949381828} -08/30/2021 21:14:02 - INFO - __main__ - Step 44904: {'lr': 0.0004032980369961555, 'samples': 8621568, 'steps': 44903, 'loss/train': 0.047360729426145554} -08/30/2021 21:14:03 - INFO - __main__ - Step 44905: {'lr': 0.000403293844984954, 'samples': 8621760, 'steps': 44904, 'loss/train': 0.61209636926651} -08/30/2021 21:14:04 - INFO - __main__ - Step 44906: {'lr': 0.00040328965290468066, 'samples': 8621952, 'steps': 44905, 'loss/train': 1.838263988494873} -08/30/2021 21:14:04 - INFO - __main__ - Step 44907: {'lr': 0.00040328546075533745, 'samples': 8622144, 'steps': 44906, 'loss/train': 1.6684576272964478} -08/30/2021 21:14:04 - INFO - __main__ - Step 44908: {'lr': 0.00040328126853692606, 'samples': 8622336, 'steps': 44907, 'loss/train': 1.5004563331604004} -08/30/2021 21:14:05 - INFO - __main__ - Step 44909: {'lr': 0.00040327707624944855, 'samples': 8622528, 'steps': 44908, 'loss/train': 2.075423240661621} -08/30/2021 21:14:06 - INFO - __main__ - Step 44910: {'lr': 0.0004032728838929067, 'samples': 8622720, 'steps': 44909, 'loss/train': 1.376769781112671} -08/30/2021 21:14:07 - INFO - __main__ - Step 44911: {'lr': 0.0004032686914673025, 'samples': 8622912, 'steps': 44910, 'loss/train': 1.015067458152771} -08/30/2021 21:14:07 - INFO - __main__ - Step 44912: {'lr': 0.00040326449897263775, 'samples': 8623104, 'steps': 44911, 'loss/train': 1.6484332084655762} -08/30/2021 21:14:07 - INFO - __main__ - Step 44913: {'lr': 0.0004032603064089144, 'samples': 8623296, 'steps': 44912, 'loss/train': 2.6110422611236572} -08/30/2021 21:14:08 - INFO - __main__ - Step 44914: {'lr': 0.00040325611377613435, 'samples': 8623488, 'steps': 44913, 'loss/train': 1.0199846029281616} -08/30/2021 21:14:09 - INFO - __main__ - Step 44915: {'lr': 0.00040325192107429944, 'samples': 8623680, 'steps': 44914, 'loss/train': 1.5279827117919922} -08/30/2021 21:14:10 - INFO - __main__ - Step 44916: {'lr': 0.00040324772830341163, 'samples': 8623872, 'steps': 44915, 'loss/train': 1.4078264236450195} -08/30/2021 21:14:10 - INFO - __main__ - Step 44917: {'lr': 0.0004032435354634726, 'samples': 8624064, 'steps': 44916, 'loss/train': 1.3844274282455444} -08/30/2021 21:14:11 - INFO - __main__ - Step 44918: {'lr': 0.00040323934255448457, 'samples': 8624256, 'steps': 44917, 'loss/train': 1.578859567642212} -08/30/2021 21:14:11 - INFO - __main__ - Step 44919: {'lr': 0.00040323514957644915, 'samples': 8624448, 'steps': 44918, 'loss/train': 1.1246085166931152} -08/30/2021 21:14:11 - INFO - __main__ - Step 44920: {'lr': 0.00040323095652936843, 'samples': 8624640, 'steps': 44919, 'loss/train': 2.017256498336792} -08/30/2021 21:14:13 - INFO - __main__ - Step 44921: {'lr': 0.00040322676341324415, 'samples': 8624832, 'steps': 44920, 'loss/train': 1.0597833395004272} -08/30/2021 21:14:14 - INFO - __main__ - Step 44922: {'lr': 0.0004032225702280783, 'samples': 8625024, 'steps': 44921, 'loss/train': 1.168633222579956} -08/30/2021 21:14:14 - INFO - __main__ - Step 44923: {'lr': 0.00040321837697387264, 'samples': 8625216, 'steps': 44922, 'loss/train': 1.4514899253845215} -08/30/2021 21:14:14 - INFO - __main__ - Step 44924: {'lr': 0.00040321418365062915, 'samples': 8625408, 'steps': 44923, 'loss/train': 1.0002316236495972} -08/30/2021 21:14:15 - INFO - __main__ - Step 44925: {'lr': 0.00040320999025834973, 'samples': 8625600, 'steps': 44924, 'loss/train': 1.454721450805664} -08/30/2021 21:14:16 - INFO - __main__ - Step 44926: {'lr': 0.0004032057967970363, 'samples': 8625792, 'steps': 44925, 'loss/train': 0.06795018911361694} -08/30/2021 21:14:17 - INFO - __main__ - Step 44927: {'lr': 0.0004032016032666907, 'samples': 8625984, 'steps': 44926, 'loss/train': 1.5177743434906006} -08/30/2021 21:14:17 - INFO - __main__ - Step 44928: {'lr': 0.00040319740966731477, 'samples': 8626176, 'steps': 44927, 'loss/train': 1.4378429651260376} -08/30/2021 21:14:17 - INFO - __main__ - Step 44929: {'lr': 0.0004031932159989105, 'samples': 8626368, 'steps': 44928, 'loss/train': 1.5881174802780151} -08/30/2021 21:14:18 - INFO - __main__ - Step 44930: {'lr': 0.0004031890222614797, 'samples': 8626560, 'steps': 44929, 'loss/train': 1.4071862697601318} -08/30/2021 21:14:18 - INFO - __main__ - Step 44931: {'lr': 0.0004031848284550243, 'samples': 8626752, 'steps': 44930, 'loss/train': 1.6574229001998901} -08/30/2021 21:14:20 - INFO - __main__ - Step 44932: {'lr': 0.0004031806345795462, 'samples': 8626944, 'steps': 44931, 'loss/train': 1.4888023138046265} -08/30/2021 21:14:21 - INFO - __main__ - Step 44933: {'lr': 0.0004031764406350472, 'samples': 8627136, 'steps': 44932, 'loss/train': 1.3646762371063232} -08/30/2021 21:14:21 - INFO - __main__ - Step 44934: {'lr': 0.0004031722466215293, 'samples': 8627328, 'steps': 44933, 'loss/train': 0.13535496592521667} -08/30/2021 21:14:22 - INFO - __main__ - Step 44935: {'lr': 0.00040316805253899434, 'samples': 8627520, 'steps': 44934, 'loss/train': 1.5405174493789673} -08/30/2021 21:14:22 - INFO - __main__ - Step 44936: {'lr': 0.0004031638583874443, 'samples': 8627712, 'steps': 44935, 'loss/train': 1.0725810527801514} -08/30/2021 21:14:24 - INFO - __main__ - Step 44937: {'lr': 0.0004031596641668809, 'samples': 8627904, 'steps': 44936, 'loss/train': 1.475506067276001} -08/30/2021 21:14:24 - INFO - __main__ - Step 44938: {'lr': 0.0004031554698773061, 'samples': 8628096, 'steps': 44937, 'loss/train': 0.7295766472816467} -08/30/2021 21:14:25 - INFO - __main__ - Step 44939: {'lr': 0.0004031512755187219, 'samples': 8628288, 'steps': 44938, 'loss/train': 1.4751077890396118} -08/30/2021 21:14:25 - INFO - __main__ - Step 44940: {'lr': 0.00040314708109113003, 'samples': 8628480, 'steps': 44939, 'loss/train': 1.4967466592788696} -08/30/2021 21:14:26 - INFO - __main__ - Step 44941: {'lr': 0.0004031428865945325, 'samples': 8628672, 'steps': 44940, 'loss/train': 1.3530702590942383} -08/30/2021 21:14:26 - INFO - __main__ - Step 44942: {'lr': 0.0004031386920289311, 'samples': 8628864, 'steps': 44941, 'loss/train': 1.267376184463501} -08/30/2021 21:14:28 - INFO - __main__ - Step 44943: {'lr': 0.0004031344973943278, 'samples': 8629056, 'steps': 44942, 'loss/train': 0.04985160380601883} -08/30/2021 21:14:28 - INFO - __main__ - Step 44944: {'lr': 0.00040313030269072445, 'samples': 8629248, 'steps': 44943, 'loss/train': 3.206683397293091} -08/30/2021 21:14:29 - INFO - __main__ - Step 44945: {'lr': 0.00040312610791812286, 'samples': 8629440, 'steps': 44944, 'loss/train': 3.8430142402648926} -08/30/2021 21:14:29 - INFO - __main__ - Step 44946: {'lr': 0.00040312191307652513, 'samples': 8629632, 'steps': 44945, 'loss/train': 1.984574794769287} -08/30/2021 21:14:29 - INFO - __main__ - Step 44947: {'lr': 0.000403117718165933, 'samples': 8629824, 'steps': 44946, 'loss/train': 1.3935471773147583} -08/30/2021 21:14:30 - INFO - __main__ - Step 44948: {'lr': 0.00040311352318634844, 'samples': 8630016, 'steps': 44947, 'loss/train': 1.3401875495910645} -08/30/2021 21:14:30 - INFO - __main__ - Step 44949: {'lr': 0.00040310932813777316, 'samples': 8630208, 'steps': 44948, 'loss/train': 3.4064152240753174} -08/30/2021 21:14:31 - INFO - __main__ - Step 44950: {'lr': 0.0004031051330202092, 'samples': 8630400, 'steps': 44949, 'loss/train': 2.279451608657837} -08/30/2021 21:14:32 - INFO - __main__ - Step 44951: {'lr': 0.00040310093783365854, 'samples': 8630592, 'steps': 44950, 'loss/train': 1.5151925086975098} -08/30/2021 21:14:32 - INFO - __main__ - Step 44952: {'lr': 0.0004030967425781229, 'samples': 8630784, 'steps': 44951, 'loss/train': 1.4714986085891724} -08/30/2021 21:14:32 - INFO - __main__ - Step 44953: {'lr': 0.0004030925472536042, 'samples': 8630976, 'steps': 44952, 'loss/train': 1.6764044761657715} -08/30/2021 21:14:33 - INFO - __main__ - Step 44954: {'lr': 0.0004030883518601044, 'samples': 8631168, 'steps': 44953, 'loss/train': 1.183774471282959} -08/30/2021 21:14:34 - INFO - __main__ - Step 44955: {'lr': 0.0004030841563976254, 'samples': 8631360, 'steps': 44954, 'loss/train': 1.4662946462631226} -08/30/2021 21:14:35 - INFO - __main__ - Step 44956: {'lr': 0.00040307996086616895, 'samples': 8631552, 'steps': 44955, 'loss/train': 1.4177237749099731} -08/30/2021 21:14:35 - INFO - __main__ - Step 44957: {'lr': 0.00040307576526573704, 'samples': 8631744, 'steps': 44956, 'loss/train': 1.635191559791565} -08/30/2021 21:14:35 - INFO - __main__ - Step 44958: {'lr': 0.00040307156959633154, 'samples': 8631936, 'steps': 44957, 'loss/train': 1.4528034925460815} -08/30/2021 21:14:36 - INFO - __main__ - Step 44959: {'lr': 0.00040306737385795437, 'samples': 8632128, 'steps': 44958, 'loss/train': 1.2309240102767944} -08/30/2021 21:14:37 - INFO - __main__ - Step 44960: {'lr': 0.00040306317805060746, 'samples': 8632320, 'steps': 44959, 'loss/train': 1.8696389198303223} -08/30/2021 21:14:38 - INFO - __main__ - Step 44961: {'lr': 0.0004030589821742926, 'samples': 8632512, 'steps': 44960, 'loss/train': 1.4075578451156616} -08/30/2021 21:14:38 - INFO - __main__ - Step 44962: {'lr': 0.00040305478622901177, 'samples': 8632704, 'steps': 44961, 'loss/train': 2.2401885986328125} -08/30/2021 21:14:38 - INFO - __main__ - Step 44963: {'lr': 0.0004030505902147668, 'samples': 8632896, 'steps': 44962, 'loss/train': 1.155764102935791} -08/30/2021 21:14:39 - INFO - __main__ - Step 44964: {'lr': 0.00040304639413155953, 'samples': 8633088, 'steps': 44963, 'loss/train': 1.3837316036224365} -08/30/2021 21:14:40 - INFO - __main__ - Step 44965: {'lr': 0.0004030421979793919, 'samples': 8633280, 'steps': 44964, 'loss/train': 1.4347622394561768} -08/30/2021 21:14:41 - INFO - __main__ - Step 44966: {'lr': 0.0004030380017582659, 'samples': 8633472, 'steps': 44965, 'loss/train': 0.919955849647522} -08/30/2021 21:14:41 - INFO - __main__ - Step 44967: {'lr': 0.0004030338054681833, 'samples': 8633664, 'steps': 44966, 'loss/train': 1.210355520248413} -08/30/2021 21:14:41 - INFO - __main__ - Step 44968: {'lr': 0.0004030296091091461, 'samples': 8633856, 'steps': 44967, 'loss/train': 0.8844677209854126} -08/30/2021 21:14:42 - INFO - __main__ - Step 44969: {'lr': 0.000403025412681156, 'samples': 8634048, 'steps': 44968, 'loss/train': 1.4895728826522827} -08/30/2021 21:14:43 - INFO - __main__ - Step 44970: {'lr': 0.00040302121618421505, 'samples': 8634240, 'steps': 44969, 'loss/train': 1.4343740940093994} -08/30/2021 21:14:44 - INFO - __main__ - Step 44971: {'lr': 0.0004030170196183252, 'samples': 8634432, 'steps': 44970, 'loss/train': 1.7820158004760742} -08/30/2021 21:14:44 - INFO - __main__ - Step 44972: {'lr': 0.00040301282298348806, 'samples': 8634624, 'steps': 44971, 'loss/train': 1.2913589477539062} -08/30/2021 21:14:45 - INFO - __main__ - Step 44973: {'lr': 0.0004030086262797058, 'samples': 8634816, 'steps': 44972, 'loss/train': 1.0297352075576782} -08/30/2021 21:14:45 - INFO - __main__ - Step 44974: {'lr': 0.0004030044295069803, 'samples': 8635008, 'steps': 44973, 'loss/train': 1.4256709814071655} -08/30/2021 21:14:46 - INFO - __main__ - Step 44975: {'lr': 0.00040300023266531327, 'samples': 8635200, 'steps': 44974, 'loss/train': 1.3890684843063354} -08/30/2021 21:14:47 - INFO - __main__ - Step 44976: {'lr': 0.0004029960357547067, 'samples': 8635392, 'steps': 44975, 'loss/train': 1.1985225677490234} -08/30/2021 21:14:47 - INFO - __main__ - Step 44977: {'lr': 0.0004029918387751625, 'samples': 8635584, 'steps': 44976, 'loss/train': 1.3467111587524414} -08/30/2021 21:14:48 - INFO - __main__ - Step 44978: {'lr': 0.00040298764172668253, 'samples': 8635776, 'steps': 44977, 'loss/train': 1.2234351634979248} -08/30/2021 21:14:48 - INFO - __main__ - Step 44979: {'lr': 0.00040298344460926866, 'samples': 8635968, 'steps': 44978, 'loss/train': 1.788515329360962} -08/30/2021 21:14:48 - INFO - __main__ - Step 44980: {'lr': 0.0004029792474229228, 'samples': 8636160, 'steps': 44979, 'loss/train': 1.798466682434082} -08/30/2021 21:14:50 - INFO - __main__ - Step 44981: {'lr': 0.00040297505016764697, 'samples': 8636352, 'steps': 44980, 'loss/train': 1.6477324962615967} -08/30/2021 21:14:50 - INFO - __main__ - Step 44982: {'lr': 0.00040297085284344284, 'samples': 8636544, 'steps': 44981, 'loss/train': 1.4184931516647339} -08/30/2021 21:14:50 - INFO - __main__ - Step 44983: {'lr': 0.0004029666554503124, 'samples': 8636736, 'steps': 44982, 'loss/train': 1.7507404088974} -08/30/2021 21:14:51 - INFO - __main__ - Step 44984: {'lr': 0.0004029624579882576, 'samples': 8636928, 'steps': 44983, 'loss/train': 0.8345987200737} -08/30/2021 21:14:51 - INFO - __main__ - Step 44985: {'lr': 0.00040295826045728023, 'samples': 8637120, 'steps': 44984, 'loss/train': 1.2658404111862183} -08/30/2021 21:14:53 - INFO - __main__ - Step 44986: {'lr': 0.00040295406285738224, 'samples': 8637312, 'steps': 44985, 'loss/train': 1.327380657196045} -08/30/2021 21:14:53 - INFO - __main__ - Step 44987: {'lr': 0.00040294986518856553, 'samples': 8637504, 'steps': 44986, 'loss/train': 0.9981260299682617} -08/30/2021 21:14:53 - INFO - __main__ - Step 44988: {'lr': 0.00040294566745083195, 'samples': 8637696, 'steps': 44987, 'loss/train': 1.7384164333343506} -08/30/2021 21:14:54 - INFO - __main__ - Step 44989: {'lr': 0.00040294146964418344, 'samples': 8637888, 'steps': 44988, 'loss/train': 1.4508442878723145} -08/30/2021 21:14:54 - INFO - __main__ - Step 44990: {'lr': 0.00040293727176862184, 'samples': 8638080, 'steps': 44989, 'loss/train': 0.9214214086532593} -08/30/2021 21:14:56 - INFO - __main__ - Step 44991: {'lr': 0.000402933073824149, 'samples': 8638272, 'steps': 44990, 'loss/train': 1.816994309425354} -08/30/2021 21:14:57 - INFO - __main__ - Step 44992: {'lr': 0.000402928875810767, 'samples': 8638464, 'steps': 44991, 'loss/train': 0.9074856638908386} -08/30/2021 21:14:57 - INFO - __main__ - Step 44993: {'lr': 0.00040292467772847754, 'samples': 8638656, 'steps': 44992, 'loss/train': 0.8389215469360352} -08/30/2021 21:14:58 - INFO - __main__ - Step 44994: {'lr': 0.00040292047957728264, 'samples': 8638848, 'steps': 44993, 'loss/train': 1.8396106958389282} -08/30/2021 21:14:58 - INFO - __main__ - Step 44995: {'lr': 0.00040291628135718404, 'samples': 8639040, 'steps': 44994, 'loss/train': 1.2606348991394043} -08/30/2021 21:14:59 - INFO - __main__ - Step 44996: {'lr': 0.0004029120830681838, 'samples': 8639232, 'steps': 44995, 'loss/train': 1.3793385028839111} -08/30/2021 21:15:00 - INFO - __main__ - Step 44997: {'lr': 0.0004029078847102837, 'samples': 8639424, 'steps': 44996, 'loss/train': 1.0976223945617676} -08/30/2021 21:15:00 - INFO - __main__ - Step 44998: {'lr': 0.00040290368628348564, 'samples': 8639616, 'steps': 44997, 'loss/train': 0.9544579386711121} -08/30/2021 21:15:01 - INFO - __main__ - Step 44999: {'lr': 0.00040289948778779157, 'samples': 8639808, 'steps': 44998, 'loss/train': 1.2889509201049805} -08/30/2021 21:15:01 - INFO - __main__ - Step 45000: {'lr': 0.00040289528922320334, 'samples': 8640000, 'steps': 44999, 'loss/train': 1.3871757984161377} -08/30/2021 21:15:01 - INFO - __main__ - Evaluating model checkpoint -08/30/2021 21:23:39 - INFO - __main__ - Step 45000: {'loss/eval': 1.285548210144043, 'perplexity': 3.616650104522705} -08/30/2021 21:23:39 - INFO - __main__ - Saving model checkpoint -08/30/2021 21:24:31 - INFO - __main__ - Step 45001: {'lr': 0.00040289109058972285, 'samples': 8640192, 'steps': 45000, 'loss/train': 1.4529192447662354} -08/30/2021 21:24:33 - INFO - __main__ - Step 45002: {'lr': 0.000402886891887352, 'samples': 8640384, 'steps': 45001, 'loss/train': 1.7427260875701904} -08/30/2021 21:24:33 - INFO - __main__ - Step 45003: {'lr': 0.0004028826931160927, 'samples': 8640576, 'steps': 45002, 'loss/train': 0.9633615612983704} -08/30/2021 21:24:34 - INFO - __main__ - Step 45004: {'lr': 0.0004028784942759468, 'samples': 8640768, 'steps': 45003, 'loss/train': 1.0695204734802246} -08/30/2021 21:24:34 - INFO - __main__ - Step 45005: {'lr': 0.0004028742953669162, 'samples': 8640960, 'steps': 45004, 'loss/train': 1.0802251100540161} -08/30/2021 21:24:34 - INFO - __main__ - Step 45006: {'lr': 0.0004028700963890028, 'samples': 8641152, 'steps': 45005, 'loss/train': 1.7785050868988037} -08/30/2021 21:24:36 - INFO - __main__ - Step 45007: {'lr': 0.0004028658973422085, 'samples': 8641344, 'steps': 45006, 'loss/train': 1.711496114730835} -08/30/2021 21:24:36 - INFO - __main__ - Step 45008: {'lr': 0.0004028616982265352, 'samples': 8641536, 'steps': 45007, 'loss/train': 1.7617367506027222} -08/30/2021 21:24:37 - INFO - __main__ - Step 45009: {'lr': 0.0004028574990419848, 'samples': 8641728, 'steps': 45008, 'loss/train': 1.7040481567382812} -08/30/2021 21:24:37 - INFO - __main__ - Step 45010: {'lr': 0.0004028532997885591, 'samples': 8641920, 'steps': 45009, 'loss/train': 1.4897103309631348} -08/30/2021 21:24:37 - INFO - __main__ - Step 45011: {'lr': 0.0004028491004662601, 'samples': 8642112, 'steps': 45010, 'loss/train': 1.4451160430908203} -08/30/2021 21:24:38 - INFO - __main__ - Step 45012: {'lr': 0.0004028449010750896, 'samples': 8642304, 'steps': 45011, 'loss/train': 1.6340372562408447} -08/30/2021 21:24:39 - INFO - __main__ - Step 45013: {'lr': 0.0004028407016150496, 'samples': 8642496, 'steps': 45012, 'loss/train': 2.0591118335723877} -08/30/2021 21:24:40 - INFO - __main__ - Step 45014: {'lr': 0.000402836502086142, 'samples': 8642688, 'steps': 45013, 'loss/train': 2.6037046909332275} -08/30/2021 21:24:40 - INFO - __main__ - Step 45015: {'lr': 0.00040283230248836855, 'samples': 8642880, 'steps': 45014, 'loss/train': 1.441423773765564} -08/30/2021 21:24:40 - INFO - __main__ - Step 45016: {'lr': 0.0004028281028217312, 'samples': 8643072, 'steps': 45015, 'loss/train': 1.0699127912521362} -08/30/2021 21:24:41 - INFO - __main__ - Step 45017: {'lr': 0.00040282390308623195, 'samples': 8643264, 'steps': 45016, 'loss/train': 1.4675841331481934} -08/30/2021 21:24:42 - INFO - __main__ - Step 45018: {'lr': 0.0004028197032818726, 'samples': 8643456, 'steps': 45017, 'loss/train': 1.482582926750183} -08/30/2021 21:24:43 - INFO - __main__ - Step 45019: {'lr': 0.00040281550340865493, 'samples': 8643648, 'steps': 45018, 'loss/train': 0.7939011454582214} -08/30/2021 21:24:43 - INFO - __main__ - Step 45020: {'lr': 0.000402811303466581, 'samples': 8643840, 'steps': 45019, 'loss/train': 1.3104171752929688} -08/30/2021 21:24:43 - INFO - __main__ - Step 45021: {'lr': 0.00040280710345565277, 'samples': 8644032, 'steps': 45020, 'loss/train': 1.2066048383712769} -08/30/2021 21:24:44 - INFO - __main__ - Step 45022: {'lr': 0.0004028029033758719, 'samples': 8644224, 'steps': 45021, 'loss/train': 0.5076983571052551} -08/30/2021 21:24:45 - INFO - __main__ - Step 45023: {'lr': 0.00040279870322724044, 'samples': 8644416, 'steps': 45022, 'loss/train': 1.5589089393615723} -08/30/2021 21:24:46 - INFO - __main__ - Step 45024: {'lr': 0.00040279450300976025, 'samples': 8644608, 'steps': 45023, 'loss/train': 1.701154112815857} -08/30/2021 21:24:46 - INFO - __main__ - Step 45025: {'lr': 0.0004027903027234332, 'samples': 8644800, 'steps': 45024, 'loss/train': 1.7186825275421143} -08/30/2021 21:24:46 - INFO - __main__ - Step 45026: {'lr': 0.0004027861023682612, 'samples': 8644992, 'steps': 45025, 'loss/train': 1.7952632904052734} -08/30/2021 21:24:47 - INFO - __main__ - Step 45027: {'lr': 0.00040278190194424613, 'samples': 8645184, 'steps': 45026, 'loss/train': 1.8114113807678223} -08/30/2021 21:24:48 - INFO - __main__ - Step 45028: {'lr': 0.0004027777014513899, 'samples': 8645376, 'steps': 45027, 'loss/train': 1.1434229612350464} -08/30/2021 21:24:49 - INFO - __main__ - Step 45029: {'lr': 0.0004027735008896944, 'samples': 8645568, 'steps': 45028, 'loss/train': 1.470395565032959} -08/30/2021 21:24:49 - INFO - __main__ - Step 45030: {'lr': 0.0004027693002591615, 'samples': 8645760, 'steps': 45029, 'loss/train': 1.7409037351608276} -08/30/2021 21:24:49 - INFO - __main__ - Step 45031: {'lr': 0.0004027650995597931, 'samples': 8645952, 'steps': 45030, 'loss/train': 1.4654394388198853} -08/30/2021 21:24:50 - INFO - __main__ - Step 45032: {'lr': 0.0004027608987915912, 'samples': 8646144, 'steps': 45031, 'loss/train': 1.1138930320739746} -08/30/2021 21:24:51 - INFO - __main__ - Step 45033: {'lr': 0.0004027566979545574, 'samples': 8646336, 'steps': 45032, 'loss/train': 1.749453067779541} -08/30/2021 21:24:52 - INFO - __main__ - Step 45034: {'lr': 0.000402752497048694, 'samples': 8646528, 'steps': 45033, 'loss/train': 1.281395673751831} -08/30/2021 21:24:52 - INFO - __main__ - Step 45035: {'lr': 0.0004027482960740026, 'samples': 8646720, 'steps': 45034, 'loss/train': 1.667781114578247} -08/30/2021 21:24:52 - INFO - __main__ - Step 45036: {'lr': 0.00040274409503048513, 'samples': 8646912, 'steps': 45035, 'loss/train': 1.2671470642089844} -08/30/2021 21:24:53 - INFO - __main__ - Step 45037: {'lr': 0.0004027398939181436, 'samples': 8647104, 'steps': 45036, 'loss/train': 2.7126309871673584} -08/30/2021 21:24:53 - INFO - __main__ - Step 45038: {'lr': 0.00040273569273697974, 'samples': 8647296, 'steps': 45037, 'loss/train': 1.6907230615615845} -08/30/2021 21:24:55 - INFO - __main__ - Step 45039: {'lr': 0.0004027314914869956, 'samples': 8647488, 'steps': 45038, 'loss/train': 1.9945603609085083} -08/30/2021 21:24:56 - INFO - __main__ - Step 45040: {'lr': 0.000402727290168193, 'samples': 8647680, 'steps': 45039, 'loss/train': 1.7411452531814575} -08/30/2021 21:24:56 - INFO - __main__ - Step 45041: {'lr': 0.00040272308878057383, 'samples': 8647872, 'steps': 45040, 'loss/train': 1.96919584274292} -08/30/2021 21:24:56 - INFO - __main__ - Step 45042: {'lr': 0.0004027188873241401, 'samples': 8648064, 'steps': 45041, 'loss/train': 1.712279200553894} -08/30/2021 21:24:57 - INFO - __main__ - Step 45043: {'lr': 0.00040271468579889346, 'samples': 8648256, 'steps': 45042, 'loss/train': 1.2977653741836548} -08/30/2021 21:24:57 - INFO - __main__ - Step 45044: {'lr': 0.0004027104842048359, 'samples': 8648448, 'steps': 45043, 'loss/train': 0.8696951866149902} -08/30/2021 21:24:59 - INFO - __main__ - Step 45045: {'lr': 0.0004027062825419695, 'samples': 8648640, 'steps': 45044, 'loss/train': 1.4597512483596802} -08/30/2021 21:25:00 - INFO - __main__ - Step 45046: {'lr': 0.0004027020808102959, 'samples': 8648832, 'steps': 45045, 'loss/train': 1.647222638130188} -08/30/2021 21:25:00 - INFO - __main__ - Step 45047: {'lr': 0.0004026978790098171, 'samples': 8649024, 'steps': 45046, 'loss/train': 2.0563488006591797} -08/30/2021 21:25:00 - INFO - __main__ - Step 45048: {'lr': 0.0004026936771405351, 'samples': 8649216, 'steps': 45047, 'loss/train': 1.577674388885498} -08/30/2021 21:25:01 - INFO - __main__ - Step 45049: {'lr': 0.0004026894752024516, 'samples': 8649408, 'steps': 45048, 'loss/train': 1.3633127212524414} -08/30/2021 21:25:02 - INFO - __main__ - Step 45050: {'lr': 0.00040268527319556856, 'samples': 8649600, 'steps': 45049, 'loss/train': 1.5550334453582764} -08/30/2021 21:25:03 - INFO - __main__ - Step 45051: {'lr': 0.0004026810711198879, 'samples': 8649792, 'steps': 45050, 'loss/train': 1.421905279159546} -08/30/2021 21:25:03 - INFO - __main__ - Step 45052: {'lr': 0.00040267686897541157, 'samples': 8649984, 'steps': 45051, 'loss/train': 1.6891404390335083} -08/30/2021 21:25:03 - INFO - __main__ - Step 45053: {'lr': 0.0004026726667621413, 'samples': 8650176, 'steps': 45052, 'loss/train': 1.5040290355682373} -08/30/2021 21:25:04 - INFO - __main__ - Step 45054: {'lr': 0.00040266846448007914, 'samples': 8650368, 'steps': 45053, 'loss/train': 1.712159514427185} -08/30/2021 21:25:05 - INFO - __main__ - Step 45055: {'lr': 0.00040266426212922697, 'samples': 8650560, 'steps': 45054, 'loss/train': 0.8725683689117432} -08/30/2021 21:25:06 - INFO - __main__ - Step 45056: {'lr': 0.00040266005970958656, 'samples': 8650752, 'steps': 45055, 'loss/train': 1.3331995010375977} -08/30/2021 21:25:06 - INFO - __main__ - Step 45057: {'lr': 0.0004026558572211599, 'samples': 8650944, 'steps': 45056, 'loss/train': 1.406862735748291} -08/30/2021 21:25:07 - INFO - __main__ - Step 45058: {'lr': 0.00040265165466394894, 'samples': 8651136, 'steps': 45057, 'loss/train': 1.4554100036621094} -08/30/2021 21:25:07 - INFO - __main__ - Step 45059: {'lr': 0.00040264745203795536, 'samples': 8651328, 'steps': 45058, 'loss/train': 1.6819303035736084} -08/30/2021 21:25:10 - INFO - __main__ - Step 45060: {'lr': 0.0004026432493431813, 'samples': 8651520, 'steps': 45059, 'loss/train': 0.13371874392032623} -08/30/2021 21:25:10 - INFO - __main__ - Step 45061: {'lr': 0.0004026390465796286, 'samples': 8651712, 'steps': 45060, 'loss/train': 1.288615107536316} -08/30/2021 21:25:11 - INFO - __main__ - Step 45062: {'lr': 0.000402634843747299, 'samples': 8651904, 'steps': 45061, 'loss/train': 2.206705331802368} -08/30/2021 21:25:11 - INFO - __main__ - Step 45063: {'lr': 0.0004026306408461945, 'samples': 8652096, 'steps': 45062, 'loss/train': 3.178462505340576} -08/30/2021 21:25:11 - INFO - __main__ - Step 45064: {'lr': 0.000402626437876317, 'samples': 8652288, 'steps': 45063, 'loss/train': 1.5514113903045654} -08/30/2021 21:25:12 - INFO - __main__ - Step 45065: {'lr': 0.00040262223483766835, 'samples': 8652480, 'steps': 45064, 'loss/train': 1.488478183746338} -08/30/2021 21:25:13 - INFO - __main__ - Step 45066: {'lr': 0.0004026180317302506, 'samples': 8652672, 'steps': 45065, 'loss/train': 2.1092100143432617} -08/30/2021 21:25:14 - INFO - __main__ - Step 45067: {'lr': 0.0004026138285540654, 'samples': 8652864, 'steps': 45066, 'loss/train': 2.2072505950927734} -08/30/2021 21:25:14 - INFO - __main__ - Step 45068: {'lr': 0.0004026096253091148, 'samples': 8653056, 'steps': 45067, 'loss/train': 1.8169845342636108} -08/30/2021 21:25:14 - INFO - __main__ - Step 45069: {'lr': 0.00040260542199540064, 'samples': 8653248, 'steps': 45068, 'loss/train': 1.8276143074035645} -08/30/2021 21:25:15 - INFO - __main__ - Step 45070: {'lr': 0.00040260121861292484, 'samples': 8653440, 'steps': 45069, 'loss/train': 2.101228952407837} -08/30/2021 21:25:15 - INFO - __main__ - Step 45071: {'lr': 0.0004025970151616893, 'samples': 8653632, 'steps': 45070, 'loss/train': 4.186982154846191} -08/30/2021 21:25:16 - INFO - __main__ - Step 45072: {'lr': 0.0004025928116416959, 'samples': 8653824, 'steps': 45071, 'loss/train': 1.756313443183899} -08/30/2021 21:25:17 - INFO - __main__ - Step 45073: {'lr': 0.0004025886080529465, 'samples': 8654016, 'steps': 45072, 'loss/train': 1.7998212575912476} -08/30/2021 21:25:17 - INFO - __main__ - Step 45074: {'lr': 0.00040258440439544307, 'samples': 8654208, 'steps': 45073, 'loss/train': 1.5091502666473389} -08/30/2021 21:25:18 - INFO - __main__ - Step 45075: {'lr': 0.0004025802006691874, 'samples': 8654400, 'steps': 45074, 'loss/train': 1.4549766778945923} -08/30/2021 21:25:18 - INFO - __main__ - Step 45076: {'lr': 0.0004025759968741816, 'samples': 8654592, 'steps': 45075, 'loss/train': 1.9283344745635986} -08/30/2021 21:25:19 - INFO - __main__ - Step 45077: {'lr': 0.00040257179301042724, 'samples': 8654784, 'steps': 45076, 'loss/train': 1.647515058517456} -08/30/2021 21:25:20 - INFO - __main__ - Step 45078: {'lr': 0.00040256758907792646, 'samples': 8654976, 'steps': 45077, 'loss/train': 2.8315911293029785} -08/30/2021 21:25:20 - INFO - __main__ - Step 45079: {'lr': 0.0004025633850766811, 'samples': 8655168, 'steps': 45078, 'loss/train': 1.2989681959152222} -08/30/2021 21:25:21 - INFO - __main__ - Step 45080: {'lr': 0.00040255918100669296, 'samples': 8655360, 'steps': 45079, 'loss/train': 1.736068606376648} -08/30/2021 21:25:21 - INFO - __main__ - Step 45081: {'lr': 0.000402554976867964, 'samples': 8655552, 'steps': 45080, 'loss/train': 1.838010311126709} -08/30/2021 21:25:23 - INFO - __main__ - Step 45082: {'lr': 0.00040255077266049624, 'samples': 8655744, 'steps': 45081, 'loss/train': 1.5102806091308594} -08/30/2021 21:25:23 - INFO - __main__ - Step 45083: {'lr': 0.0004025465683842914, 'samples': 8655936, 'steps': 45082, 'loss/train': 1.8476357460021973} -08/30/2021 21:25:23 - INFO - __main__ - Step 45084: {'lr': 0.0004025423640393514, 'samples': 8656128, 'steps': 45083, 'loss/train': 1.7623934745788574} -08/30/2021 21:25:24 - INFO - __main__ - Step 45085: {'lr': 0.0004025381596256782, 'samples': 8656320, 'steps': 45084, 'loss/train': 1.4438000917434692} -08/30/2021 21:25:24 - INFO - __main__ - Step 45086: {'lr': 0.0004025339551432736, 'samples': 8656512, 'steps': 45085, 'loss/train': 1.7174092531204224} -08/30/2021 21:25:26 - INFO - __main__ - Step 45087: {'lr': 0.0004025297505921396, 'samples': 8656704, 'steps': 45086, 'loss/train': 1.3684344291687012} -08/30/2021 21:25:26 - INFO - __main__ - Step 45088: {'lr': 0.00040252554597227795, 'samples': 8656896, 'steps': 45087, 'loss/train': 2.029940366744995} -08/30/2021 21:25:26 - INFO - __main__ - Step 45089: {'lr': 0.00040252134128369085, 'samples': 8657088, 'steps': 45088, 'loss/train': 1.645632266998291} -08/30/2021 21:25:27 - INFO - __main__ - Step 45090: {'lr': 0.00040251713652637985, 'samples': 8657280, 'steps': 45089, 'loss/train': 2.0566251277923584} -08/30/2021 21:25:27 - INFO - __main__ - Step 45091: {'lr': 0.00040251293170034697, 'samples': 8657472, 'steps': 45090, 'loss/train': 1.2192778587341309} -08/30/2021 21:25:29 - INFO - __main__ - Step 45092: {'lr': 0.00040250872680559416, 'samples': 8657664, 'steps': 45091, 'loss/train': 1.8568124771118164} -08/30/2021 21:25:29 - INFO - __main__ - Step 45093: {'lr': 0.00040250452184212326, 'samples': 8657856, 'steps': 45092, 'loss/train': 1.3581924438476562} -08/30/2021 21:25:29 - INFO - __main__ - Step 45094: {'lr': 0.00040250031680993617, 'samples': 8658048, 'steps': 45093, 'loss/train': 1.4816144704818726} -08/30/2021 21:25:30 - INFO - __main__ - Step 45095: {'lr': 0.0004024961117090348, 'samples': 8658240, 'steps': 45094, 'loss/train': 2.1238787174224854} -08/30/2021 21:25:30 - INFO - __main__ - Step 45096: {'lr': 0.00040249190653942105, 'samples': 8658432, 'steps': 45095, 'loss/train': 1.2603925466537476} -08/30/2021 21:25:30 - INFO - __main__ - Step 45097: {'lr': 0.00040248770130109677, 'samples': 8658624, 'steps': 45096, 'loss/train': 1.5867254734039307} -08/30/2021 21:25:32 - INFO - __main__ - Step 45098: {'lr': 0.0004024834959940639, 'samples': 8658816, 'steps': 45097, 'loss/train': 1.7172764539718628} -08/30/2021 21:25:33 - INFO - __main__ - Step 45099: {'lr': 0.0004024792906183243, 'samples': 8659008, 'steps': 45098, 'loss/train': 1.516958236694336} -08/30/2021 21:25:33 - INFO - __main__ - Step 45100: {'lr': 0.0004024750851738799, 'samples': 8659200, 'steps': 45099, 'loss/train': 1.6982613801956177} -08/30/2021 21:25:33 - INFO - __main__ - Step 45101: {'lr': 0.00040247087966073253, 'samples': 8659392, 'steps': 45100, 'loss/train': 1.380101203918457} -08/30/2021 21:25:34 - INFO - __main__ - Step 45102: {'lr': 0.00040246667407888427, 'samples': 8659584, 'steps': 45101, 'loss/train': 1.3081490993499756} -08/30/2021 21:25:35 - INFO - __main__ - Step 45103: {'lr': 0.0004024624684283368, 'samples': 8659776, 'steps': 45102, 'loss/train': 1.572332739830017} -08/30/2021 21:25:36 - INFO - __main__ - Step 45104: {'lr': 0.000402458262709092, 'samples': 8659968, 'steps': 45103, 'loss/train': 1.3511675596237183} -08/30/2021 21:25:36 - INFO - __main__ - Step 45105: {'lr': 0.00040245405692115193, 'samples': 8660160, 'steps': 45104, 'loss/train': 1.4388599395751953} -08/30/2021 21:25:36 - INFO - __main__ - Step 45106: {'lr': 0.0004024498510645185, 'samples': 8660352, 'steps': 45105, 'loss/train': 1.2101796865463257} -08/30/2021 21:25:37 - INFO - __main__ - Step 45107: {'lr': 0.0004024456451391934, 'samples': 8660544, 'steps': 45106, 'loss/train': 1.2687268257141113} -08/30/2021 21:25:38 - INFO - __main__ - Step 45108: {'lr': 0.0004024414391451787, 'samples': 8660736, 'steps': 45107, 'loss/train': 1.5186289548873901} -08/30/2021 21:25:39 - INFO - __main__ - Step 45109: {'lr': 0.00040243723308247624, 'samples': 8660928, 'steps': 45108, 'loss/train': 1.085286259651184} -08/30/2021 21:25:39 - INFO - __main__ - Step 45110: {'lr': 0.0004024330269510879, 'samples': 8661120, 'steps': 45109, 'loss/train': 1.389014720916748} -08/30/2021 21:25:39 - INFO - __main__ - Step 45111: {'lr': 0.00040242882075101563, 'samples': 8661312, 'steps': 45110, 'loss/train': 1.1004711389541626} -08/30/2021 21:25:40 - INFO - __main__ - Step 45112: {'lr': 0.0004024246144822612, 'samples': 8661504, 'steps': 45111, 'loss/train': 0.9022179245948792} -08/30/2021 21:25:41 - INFO - __main__ - Step 45113: {'lr': 0.00040242040814482665, 'samples': 8661696, 'steps': 45112, 'loss/train': 1.7989670038223267} -08/30/2021 21:25:42 - INFO - __main__ - Step 45114: {'lr': 0.00040241620173871385, 'samples': 8661888, 'steps': 45113, 'loss/train': 1.1808686256408691} -08/30/2021 21:25:42 - INFO - __main__ - Step 45115: {'lr': 0.0004024119952639246, 'samples': 8662080, 'steps': 45114, 'loss/train': 1.1829791069030762} -08/30/2021 21:25:42 - INFO - __main__ - Step 45116: {'lr': 0.00040240778872046093, 'samples': 8662272, 'steps': 45115, 'loss/train': 2.0790300369262695} -08/30/2021 21:25:43 - INFO - __main__ - Step 45117: {'lr': 0.00040240358210832456, 'samples': 8662464, 'steps': 45116, 'loss/train': 1.0125223398208618} -08/30/2021 21:25:44 - INFO - __main__ - Step 45118: {'lr': 0.00040239937542751753, 'samples': 8662656, 'steps': 45117, 'loss/train': 1.2831854820251465} -08/30/2021 21:25:45 - INFO - __main__ - Step 45119: {'lr': 0.0004023951686780417, 'samples': 8662848, 'steps': 45118, 'loss/train': 1.3456792831420898} -08/30/2021 21:25:45 - INFO - __main__ - Step 45120: {'lr': 0.000402390961859899, 'samples': 8663040, 'steps': 45119, 'loss/train': 1.8141673803329468} -08/30/2021 21:25:45 - INFO - __main__ - Step 45121: {'lr': 0.00040238675497309117, 'samples': 8663232, 'steps': 45120, 'loss/train': 1.1669790744781494} -08/30/2021 21:25:46 - INFO - __main__ - Step 45122: {'lr': 0.0004023825480176204, 'samples': 8663424, 'steps': 45121, 'loss/train': 1.5144553184509277} -08/30/2021 21:25:47 - INFO - __main__ - Step 45123: {'lr': 0.0004023783409934882, 'samples': 8663616, 'steps': 45122, 'loss/train': 0.5693473815917969} -08/30/2021 21:25:48 - INFO - __main__ - Step 45124: {'lr': 0.00040237413390069684, 'samples': 8663808, 'steps': 45123, 'loss/train': 1.1970113515853882} -08/30/2021 21:25:48 - INFO - __main__ - Step 45125: {'lr': 0.000402369926739248, 'samples': 8664000, 'steps': 45124, 'loss/train': 1.4020979404449463} -08/30/2021 21:25:49 - INFO - __main__ - Step 45126: {'lr': 0.0004023657195091436, 'samples': 8664192, 'steps': 45125, 'loss/train': 1.6678982973098755} -08/30/2021 21:25:49 - INFO - __main__ - Step 45127: {'lr': 0.00040236151221038555, 'samples': 8664384, 'steps': 45126, 'loss/train': 0.18871457874774933} -08/30/2021 21:25:50 - INFO - __main__ - Step 45128: {'lr': 0.00040235730484297573, 'samples': 8664576, 'steps': 45127, 'loss/train': 1.0326552391052246} -08/30/2021 21:25:51 - INFO - __main__ - Step 45129: {'lr': 0.00040235309740691607, 'samples': 8664768, 'steps': 45128, 'loss/train': 1.3598569631576538} -08/30/2021 21:25:51 - INFO - __main__ - Step 45130: {'lr': 0.0004023488899022085, 'samples': 8664960, 'steps': 45129, 'loss/train': 1.6308218240737915} -08/30/2021 21:25:51 - INFO - __main__ - Step 45131: {'lr': 0.00040234468232885483, 'samples': 8665152, 'steps': 45130, 'loss/train': 1.5824154615402222} -08/30/2021 21:25:52 - INFO - __main__ - Step 45132: {'lr': 0.00040234047468685704, 'samples': 8665344, 'steps': 45131, 'loss/train': 1.6160740852355957} -08/30/2021 21:25:53 - INFO - __main__ - Step 45133: {'lr': 0.00040233626697621695, 'samples': 8665536, 'steps': 45132, 'loss/train': 1.3872069120407104} -08/30/2021 21:25:54 - INFO - __main__ - Step 45134: {'lr': 0.0004023320591969365, 'samples': 8665728, 'steps': 45133, 'loss/train': 1.5919708013534546} -08/30/2021 21:25:54 - INFO - __main__ - Step 45135: {'lr': 0.00040232785134901755, 'samples': 8665920, 'steps': 45134, 'loss/train': 0.6691237688064575} -08/30/2021 21:25:54 - INFO - __main__ - Step 45136: {'lr': 0.0004023236434324621, 'samples': 8666112, 'steps': 45135, 'loss/train': 1.3559731245040894} -08/30/2021 21:25:55 - INFO - __main__ - Step 45137: {'lr': 0.0004023194354472719, 'samples': 8666304, 'steps': 45136, 'loss/train': 1.3152339458465576} -08/30/2021 21:25:56 - INFO - __main__ - Step 45138: {'lr': 0.0004023152273934489, 'samples': 8666496, 'steps': 45137, 'loss/train': 1.6463127136230469} -08/30/2021 21:25:57 - INFO - __main__ - Step 45139: {'lr': 0.000402311019270995, 'samples': 8666688, 'steps': 45138, 'loss/train': 0.6973602175712585} -08/30/2021 21:25:57 - INFO - __main__ - Step 45140: {'lr': 0.00040230681107991217, 'samples': 8666880, 'steps': 45139, 'loss/train': 1.6793612241744995} -08/30/2021 21:25:58 - INFO - __main__ - Step 45141: {'lr': 0.0004023026028202021, 'samples': 8667072, 'steps': 45140, 'loss/train': 1.6262484788894653} -08/30/2021 21:25:58 - INFO - __main__ - Step 45142: {'lr': 0.000402298394491867, 'samples': 8667264, 'steps': 45141, 'loss/train': 1.3933535814285278} -08/30/2021 21:25:58 - INFO - __main__ - Step 45143: {'lr': 0.0004022941860949085, 'samples': 8667456, 'steps': 45142, 'loss/train': 1.4439202547073364} -08/30/2021 21:26:00 - INFO - __main__ - Step 45144: {'lr': 0.0004022899776293287, 'samples': 8667648, 'steps': 45143, 'loss/train': 0.09861698001623154} -08/30/2021 21:26:01 - INFO - __main__ - Step 45145: {'lr': 0.00040228576909512927, 'samples': 8667840, 'steps': 45144, 'loss/train': 1.7973074913024902} -08/30/2021 21:26:01 - INFO - __main__ - Step 45146: {'lr': 0.0004022815604923122, 'samples': 8668032, 'steps': 45145, 'loss/train': 3.4507994651794434} -08/30/2021 21:26:01 - INFO - __main__ - Step 45147: {'lr': 0.00040227735182087954, 'samples': 8668224, 'steps': 45146, 'loss/train': 0.0915398970246315} -08/30/2021 21:26:02 - INFO - __main__ - Step 45148: {'lr': 0.00040227314308083296, 'samples': 8668416, 'steps': 45147, 'loss/train': 1.4490028619766235} -08/30/2021 21:26:02 - INFO - __main__ - Step 45149: {'lr': 0.0004022689342721745, 'samples': 8668608, 'steps': 45148, 'loss/train': 1.3307652473449707} -08/30/2021 21:26:04 - INFO - __main__ - Step 45150: {'lr': 0.000402264725394906, 'samples': 8668800, 'steps': 45149, 'loss/train': 1.6872589588165283} -08/30/2021 21:26:04 - INFO - __main__ - Step 45151: {'lr': 0.00040226051644902925, 'samples': 8668992, 'steps': 45150, 'loss/train': 1.2641016244888306} -08/30/2021 21:26:04 - INFO - __main__ - Step 45152: {'lr': 0.0004022563074345464, 'samples': 8669184, 'steps': 45151, 'loss/train': 1.261623501777649} -08/30/2021 21:26:05 - INFO - __main__ - Step 45153: {'lr': 0.00040225209835145916, 'samples': 8669376, 'steps': 45152, 'loss/train': 1.574806809425354} -08/30/2021 21:26:05 - INFO - __main__ - Step 45154: {'lr': 0.0004022478891997695, 'samples': 8669568, 'steps': 45153, 'loss/train': 1.6885905265808105} -08/30/2021 21:26:07 - INFO - __main__ - Step 45155: {'lr': 0.0004022436799794792, 'samples': 8669760, 'steps': 45154, 'loss/train': 0.9964928030967712} -08/30/2021 21:26:08 - INFO - __main__ - Step 45156: {'lr': 0.0004022394706905904, 'samples': 8669952, 'steps': 45155, 'loss/train': 1.844875693321228} -08/30/2021 21:26:08 - INFO - __main__ - Step 45157: {'lr': 0.0004022352613331047, 'samples': 8670144, 'steps': 45156, 'loss/train': 1.6679919958114624} -08/30/2021 21:26:08 - INFO - __main__ - Step 45158: {'lr': 0.0004022310519070242, 'samples': 8670336, 'steps': 45157, 'loss/train': 1.661723256111145} -08/30/2021 21:26:09 - INFO - __main__ - Step 45159: {'lr': 0.00040222684241235075, 'samples': 8670528, 'steps': 45158, 'loss/train': 1.6632270812988281} -08/30/2021 21:26:10 - INFO - __main__ - Step 45160: {'lr': 0.00040222263284908616, 'samples': 8670720, 'steps': 45159, 'loss/train': 1.235009789466858} -08/30/2021 21:26:11 - INFO - __main__ - Step 45161: {'lr': 0.00040221842321723245, 'samples': 8670912, 'steps': 45160, 'loss/train': 0.6463727355003357} -08/30/2021 21:26:11 - INFO - __main__ - Step 45162: {'lr': 0.0004022142135167915, 'samples': 8671104, 'steps': 45161, 'loss/train': 1.435362458229065} -08/30/2021 21:26:12 - INFO - __main__ - Step 45163: {'lr': 0.0004022100037477652, 'samples': 8671296, 'steps': 45162, 'loss/train': 1.6625282764434814} -08/30/2021 21:26:12 - INFO - __main__ - Step 45164: {'lr': 0.0004022057939101553, 'samples': 8671488, 'steps': 45163, 'loss/train': 1.5202744007110596} -08/30/2021 21:26:12 - INFO - __main__ - Step 45165: {'lr': 0.0004022015840039639, 'samples': 8671680, 'steps': 45164, 'loss/train': 1.7744377851486206} -08/30/2021 21:26:14 - INFO - __main__ - Step 45166: {'lr': 0.00040219737402919284, 'samples': 8671872, 'steps': 45165, 'loss/train': 1.7089102268218994} -08/30/2021 21:26:14 - INFO - __main__ - Step 45167: {'lr': 0.0004021931639858439, 'samples': 8672064, 'steps': 45166, 'loss/train': 1.8279352188110352} -08/30/2021 21:26:15 - INFO - __main__ - Step 45168: {'lr': 0.00040218895387391913, 'samples': 8672256, 'steps': 45167, 'loss/train': 1.2124706506729126} -08/30/2021 21:26:15 - INFO - __main__ - Step 45169: {'lr': 0.0004021847436934204, 'samples': 8672448, 'steps': 45168, 'loss/train': 1.634500503540039} -08/30/2021 21:26:15 - INFO - __main__ - Step 45170: {'lr': 0.0004021805334443496, 'samples': 8672640, 'steps': 45169, 'loss/train': 2.0135257244110107} -08/30/2021 21:26:17 - INFO - __main__ - Step 45171: {'lr': 0.00040217632312670846, 'samples': 8672832, 'steps': 45170, 'loss/train': 1.0767260789871216} -08/30/2021 21:26:17 - INFO - __main__ - Step 45172: {'lr': 0.0004021721127404991, 'samples': 8673024, 'steps': 45171, 'loss/train': 1.7100480794906616} -08/30/2021 21:26:18 - INFO - __main__ - Step 45173: {'lr': 0.0004021679022857233, 'samples': 8673216, 'steps': 45172, 'loss/train': 0.8735764622688293} -08/30/2021 21:26:18 - INFO - __main__ - Step 45174: {'lr': 0.000402163691762383, 'samples': 8673408, 'steps': 45173, 'loss/train': 0.9695132374763489} -08/30/2021 21:26:18 - INFO - __main__ - Step 45175: {'lr': 0.00040215948117048006, 'samples': 8673600, 'steps': 45174, 'loss/train': 1.5175728797912598} -08/30/2021 21:26:20 - INFO - __main__ - Step 45176: {'lr': 0.00040215527051001653, 'samples': 8673792, 'steps': 45175, 'loss/train': 2.1440935134887695} -08/30/2021 21:26:20 - INFO - __main__ - Step 45177: {'lr': 0.00040215105978099407, 'samples': 8673984, 'steps': 45176, 'loss/train': 0.6213804483413696} -08/30/2021 21:26:21 - INFO - __main__ - Step 45178: {'lr': 0.00040214684898341475, 'samples': 8674176, 'steps': 45177, 'loss/train': 1.0209404230117798} -08/30/2021 21:26:21 - INFO - __main__ - Step 45179: {'lr': 0.00040214263811728034, 'samples': 8674368, 'steps': 45178, 'loss/train': 1.6317853927612305} -08/30/2021 21:26:21 - INFO - __main__ - Step 45180: {'lr': 0.00040213842718259287, 'samples': 8674560, 'steps': 45179, 'loss/train': 1.3017443418502808} -08/30/2021 21:26:23 - INFO - __main__ - Step 45181: {'lr': 0.00040213421617935416, 'samples': 8674752, 'steps': 45180, 'loss/train': 1.840362787246704} -08/30/2021 21:26:23 - INFO - __main__ - Step 45182: {'lr': 0.000402130005107566, 'samples': 8674944, 'steps': 45181, 'loss/train': 0.6452128291130066} -08/30/2021 21:26:24 - INFO - __main__ - Step 45183: {'lr': 0.0004021257939672306, 'samples': 8675136, 'steps': 45182, 'loss/train': 1.3573397397994995} -08/30/2021 21:26:24 - INFO - __main__ - Step 45184: {'lr': 0.0004021215827583496, 'samples': 8675328, 'steps': 45183, 'loss/train': 1.5065065622329712} -08/30/2021 21:26:24 - INFO - __main__ - Step 45185: {'lr': 0.0004021173714809249, 'samples': 8675520, 'steps': 45184, 'loss/train': 2.3413240909576416} -08/30/2021 21:26:26 - INFO - __main__ - Step 45186: {'lr': 0.0004021131601349585, 'samples': 8675712, 'steps': 45185, 'loss/train': 0.1006455197930336} -08/30/2021 21:26:27 - INFO - __main__ - Step 45187: {'lr': 0.0004021089487204522, 'samples': 8675904, 'steps': 45186, 'loss/train': 1.4627920389175415} -08/30/2021 21:26:27 - INFO - __main__ - Step 45188: {'lr': 0.00040210473723740803, 'samples': 8676096, 'steps': 45187, 'loss/train': 0.1854332983493805} -08/30/2021 21:26:28 - INFO - __main__ - Step 45189: {'lr': 0.0004021005256858279, 'samples': 8676288, 'steps': 45188, 'loss/train': 2.417635679244995} -08/30/2021 21:26:28 - INFO - __main__ - Step 45190: {'lr': 0.00040209631406571344, 'samples': 8676480, 'steps': 45189, 'loss/train': 1.8251458406448364} -08/30/2021 21:26:29 - INFO - __main__ - Step 45191: {'lr': 0.00040209210237706684, 'samples': 8676672, 'steps': 45190, 'loss/train': 1.7103395462036133} -08/30/2021 21:26:30 - INFO - __main__ - Step 45192: {'lr': 0.0004020878906198898, 'samples': 8676864, 'steps': 45191, 'loss/train': 1.358802080154419} -08/30/2021 21:26:30 - INFO - __main__ - Step 45193: {'lr': 0.0004020836787941844, 'samples': 8677056, 'steps': 45192, 'loss/train': 1.6523271799087524} -08/30/2021 21:26:31 - INFO - __main__ - Step 45194: {'lr': 0.0004020794668999524, 'samples': 8677248, 'steps': 45193, 'loss/train': 1.580916404724121} -08/30/2021 21:26:31 - INFO - __main__ - Step 45195: {'lr': 0.0004020752549371957, 'samples': 8677440, 'steps': 45194, 'loss/train': 2.040734052658081} -08/30/2021 21:26:33 - INFO - __main__ - Step 45196: {'lr': 0.00040207104290591633, 'samples': 8677632, 'steps': 45195, 'loss/train': 1.3342704772949219} -08/30/2021 21:26:33 - INFO - __main__ - Step 45197: {'lr': 0.000402066830806116, 'samples': 8677824, 'steps': 45196, 'loss/train': 1.5754648447036743} -08/30/2021 21:26:33 - INFO - __main__ - Step 45198: {'lr': 0.0004020626186377967, 'samples': 8678016, 'steps': 45197, 'loss/train': 1.622589349746704} -08/30/2021 21:26:34 - INFO - __main__ - Step 45199: {'lr': 0.00040205840640096036, 'samples': 8678208, 'steps': 45198, 'loss/train': 1.131399393081665} -08/30/2021 21:26:34 - INFO - __main__ - Step 45200: {'lr': 0.0004020541940956089, 'samples': 8678400, 'steps': 45199, 'loss/train': 1.2490323781967163} -08/30/2021 21:26:36 - INFO - __main__ - Step 45201: {'lr': 0.0004020499817217441, 'samples': 8678592, 'steps': 45200, 'loss/train': 2.06465220451355} -08/30/2021 21:26:36 - INFO - __main__ - Step 45202: {'lr': 0.000402045769279368, 'samples': 8678784, 'steps': 45201, 'loss/train': 1.343319296836853} -08/30/2021 21:26:37 - INFO - __main__ - Step 45203: {'lr': 0.0004020415567684823, 'samples': 8678976, 'steps': 45202, 'loss/train': 1.325750470161438} -08/30/2021 21:26:37 - INFO - __main__ - Step 45204: {'lr': 0.0004020373441890891, 'samples': 8679168, 'steps': 45203, 'loss/train': 1.1039748191833496} -08/30/2021 21:26:37 - INFO - __main__ - Step 45205: {'lr': 0.00040203313154119026, 'samples': 8679360, 'steps': 45204, 'loss/train': 0.6253945827484131} -08/30/2021 21:26:38 - INFO - __main__ - Step 45206: {'lr': 0.00040202891882478754, 'samples': 8679552, 'steps': 45205, 'loss/train': 1.3993908166885376} -08/30/2021 21:26:40 - INFO - __main__ - Step 45207: {'lr': 0.000402024706039883, 'samples': 8679744, 'steps': 45206, 'loss/train': 0.05071474611759186} -08/30/2021 21:26:40 - INFO - __main__ - Step 45208: {'lr': 0.0004020204931864785, 'samples': 8679936, 'steps': 45207, 'loss/train': 0.66348797082901} -08/30/2021 21:26:41 - INFO - __main__ - Step 45209: {'lr': 0.0004020162802645758, 'samples': 8680128, 'steps': 45208, 'loss/train': 1.10163152217865} -08/30/2021 21:26:41 - INFO - __main__ - Step 45210: {'lr': 0.000402012067274177, 'samples': 8680320, 'steps': 45209, 'loss/train': 1.6773884296417236} -08/30/2021 21:26:41 - INFO - __main__ - Step 45211: {'lr': 0.0004020078542152839, 'samples': 8680512, 'steps': 45210, 'loss/train': 1.4000777006149292} -08/30/2021 21:26:43 - INFO - __main__ - Step 45212: {'lr': 0.0004020036410878984, 'samples': 8680704, 'steps': 45211, 'loss/train': 1.1540910005569458} -08/30/2021 21:26:43 - INFO - __main__ - Step 45213: {'lr': 0.0004019994278920224, 'samples': 8680896, 'steps': 45212, 'loss/train': 1.5811522006988525} -08/30/2021 21:26:44 - INFO - __main__ - Step 45214: {'lr': 0.00040199521462765776, 'samples': 8681088, 'steps': 45213, 'loss/train': 1.3787648677825928} -08/30/2021 21:26:44 - INFO - __main__ - Step 45215: {'lr': 0.0004019910012948065, 'samples': 8681280, 'steps': 45214, 'loss/train': 0.09304669499397278} -08/30/2021 21:26:44 - INFO - __main__ - Step 45216: {'lr': 0.0004019867878934704, 'samples': 8681472, 'steps': 45215, 'loss/train': 1.4651738405227661} -08/30/2021 21:26:46 - INFO - __main__ - Step 45217: {'lr': 0.0004019825744236514, 'samples': 8681664, 'steps': 45216, 'loss/train': 0.48439496755599976} -08/30/2021 21:26:46 - INFO - __main__ - Step 45218: {'lr': 0.0004019783608853513, 'samples': 8681856, 'steps': 45217, 'loss/train': 1.2058886289596558} -08/30/2021 21:26:47 - INFO - __main__ - Step 45219: {'lr': 0.0004019741472785723, 'samples': 8682048, 'steps': 45218, 'loss/train': 1.054483413696289} -08/30/2021 21:26:47 - INFO - __main__ - Step 45220: {'lr': 0.0004019699336033159, 'samples': 8682240, 'steps': 45219, 'loss/train': 2.2588601112365723} -08/30/2021 21:26:47 - INFO - __main__ - Step 45221: {'lr': 0.0004019657198595843, 'samples': 8682432, 'steps': 45220, 'loss/train': 1.4068375825881958} -08/30/2021 21:26:49 - INFO - __main__ - Step 45222: {'lr': 0.00040196150604737924, 'samples': 8682624, 'steps': 45221, 'loss/train': 1.260451316833496} -08/30/2021 21:26:49 - INFO - __main__ - Step 45223: {'lr': 0.0004019572921667027, 'samples': 8682816, 'steps': 45222, 'loss/train': 1.1345397233963013} -08/30/2021 21:26:50 - INFO - __main__ - Step 45224: {'lr': 0.0004019530782175566, 'samples': 8683008, 'steps': 45223, 'loss/train': 0.8595730066299438} -08/30/2021 21:26:50 - INFO - __main__ - Step 45225: {'lr': 0.00040194886419994274, 'samples': 8683200, 'steps': 45224, 'loss/train': 1.3685495853424072} -08/30/2021 21:26:50 - INFO - __main__ - Step 45226: {'lr': 0.0004019446501138631, 'samples': 8683392, 'steps': 45225, 'loss/train': 1.742268443107605} -08/30/2021 21:26:52 - INFO - __main__ - Step 45227: {'lr': 0.0004019404359593195, 'samples': 8683584, 'steps': 45226, 'loss/train': 1.4271306991577148} -08/30/2021 21:26:52 - INFO - __main__ - Step 45228: {'lr': 0.0004019362217363138, 'samples': 8683776, 'steps': 45227, 'loss/train': 1.571885347366333} -08/30/2021 21:26:53 - INFO - __main__ - Step 45229: {'lr': 0.00040193200744484815, 'samples': 8683968, 'steps': 45228, 'loss/train': 0.9927380084991455} -08/30/2021 21:26:53 - INFO - __main__ - Step 45230: {'lr': 0.00040192779308492423, 'samples': 8684160, 'steps': 45229, 'loss/train': 1.130592942237854} -08/30/2021 21:26:53 - INFO - __main__ - Step 45231: {'lr': 0.00040192357865654395, 'samples': 8684352, 'steps': 45230, 'loss/train': 0.5775272846221924} -08/30/2021 21:26:55 - INFO - __main__ - Step 45232: {'lr': 0.00040191936415970926, 'samples': 8684544, 'steps': 45231, 'loss/train': 1.9309287071228027} -08/30/2021 21:26:56 - INFO - __main__ - Step 45233: {'lr': 0.00040191514959442206, 'samples': 8684736, 'steps': 45232, 'loss/train': 0.07123694568872452} -08/30/2021 21:26:56 - INFO - __main__ - Step 45234: {'lr': 0.0004019109349606842, 'samples': 8684928, 'steps': 45233, 'loss/train': 1.4687259197235107} -08/30/2021 21:26:56 - INFO - __main__ - Step 45235: {'lr': 0.0004019067202584977, 'samples': 8685120, 'steps': 45234, 'loss/train': 0.5876619815826416} -08/30/2021 21:26:57 - INFO - __main__ - Step 45236: {'lr': 0.0004019025054878643, 'samples': 8685312, 'steps': 45235, 'loss/train': 0.8078687787055969} -08/30/2021 21:26:58 - INFO - __main__ - Step 45237: {'lr': 0.00040189829064878605, 'samples': 8685504, 'steps': 45236, 'loss/train': 1.732340693473816} -08/30/2021 21:26:59 - INFO - __main__ - Step 45238: {'lr': 0.0004018940757412647, 'samples': 8685696, 'steps': 45237, 'loss/train': 1.624877691268921} -08/30/2021 21:26:59 - INFO - __main__ - Step 45239: {'lr': 0.0004018898607653022, 'samples': 8685888, 'steps': 45238, 'loss/train': 1.5087510347366333} -08/30/2021 21:26:59 - INFO - __main__ - Step 45240: {'lr': 0.00040188564572090057, 'samples': 8686080, 'steps': 45239, 'loss/train': 1.4165570735931396} -08/30/2021 21:27:00 - INFO - __main__ - Step 45241: {'lr': 0.00040188143060806156, 'samples': 8686272, 'steps': 45240, 'loss/train': 1.0970169305801392} -08/30/2021 21:27:00 - INFO - __main__ - Step 45242: {'lr': 0.0004018772154267871, 'samples': 8686464, 'steps': 45241, 'loss/train': 1.244028925895691} -08/30/2021 21:27:02 - INFO - __main__ - Step 45243: {'lr': 0.0004018730001770792, 'samples': 8686656, 'steps': 45242, 'loss/train': 0.06590409576892853} -08/30/2021 21:27:02 - INFO - __main__ - Step 45244: {'lr': 0.00040186878485893955, 'samples': 8686848, 'steps': 45243, 'loss/train': 1.2824143171310425} -08/30/2021 21:27:02 - INFO - __main__ - Step 45245: {'lr': 0.0004018645694723703, 'samples': 8687040, 'steps': 45244, 'loss/train': 1.242163896560669} -08/30/2021 21:27:03 - INFO - __main__ - Step 45246: {'lr': 0.00040186035401737307, 'samples': 8687232, 'steps': 45245, 'loss/train': 1.4473241567611694} -08/30/2021 21:27:03 - INFO - __main__ - Step 45247: {'lr': 0.00040185613849395, 'samples': 8687424, 'steps': 45246, 'loss/train': 2.455127716064453} -08/30/2021 21:27:05 - INFO - __main__ - Step 45248: {'lr': 0.0004018519229021029, 'samples': 8687616, 'steps': 45247, 'loss/train': 1.652255892753601} -08/30/2021 21:27:05 - INFO - __main__ - Step 45249: {'lr': 0.0004018477072418336, 'samples': 8687808, 'steps': 45248, 'loss/train': 1.7025799751281738} -08/30/2021 21:27:05 - INFO - __main__ - Step 45250: {'lr': 0.00040184349151314413, 'samples': 8688000, 'steps': 45249, 'loss/train': 1.5914254188537598} -08/30/2021 21:27:06 - INFO - __main__ - Step 45251: {'lr': 0.0004018392757160363, 'samples': 8688192, 'steps': 45250, 'loss/train': 1.1948776245117188} -08/30/2021 21:27:06 - INFO - __main__ - Step 45252: {'lr': 0.00040183505985051204, 'samples': 8688384, 'steps': 45251, 'loss/train': 1.5230097770690918} -08/30/2021 21:27:08 - INFO - __main__ - Step 45253: {'lr': 0.0004018308439165733, 'samples': 8688576, 'steps': 45252, 'loss/train': 1.324571132659912} -08/30/2021 21:27:08 - INFO - __main__ - Step 45254: {'lr': 0.00040182662791422185, 'samples': 8688768, 'steps': 45253, 'loss/train': 0.5762340426445007} -08/30/2021 21:27:09 - INFO - __main__ - Step 45255: {'lr': 0.0004018224118434597, 'samples': 8688960, 'steps': 45254, 'loss/train': 1.4324442148208618} -08/30/2021 21:27:09 - INFO - __main__ - Step 45256: {'lr': 0.0004018181957042887, 'samples': 8689152, 'steps': 45255, 'loss/train': 1.5107744932174683} -08/30/2021 21:27:09 - INFO - __main__ - Step 45257: {'lr': 0.00040181397949671073, 'samples': 8689344, 'steps': 45256, 'loss/train': 0.6136773824691772} -08/30/2021 21:27:11 - INFO - __main__ - Step 45258: {'lr': 0.00040180976322072776, 'samples': 8689536, 'steps': 45257, 'loss/train': 1.2147080898284912} -08/30/2021 21:27:11 - INFO - __main__ - Step 45259: {'lr': 0.0004018055468763416, 'samples': 8689728, 'steps': 45258, 'loss/train': 1.5769293308258057} -08/30/2021 21:27:12 - INFO - __main__ - Step 45260: {'lr': 0.0004018013304635543, 'samples': 8689920, 'steps': 45259, 'loss/train': 1.0438284873962402} -08/30/2021 21:27:12 - INFO - __main__ - Step 45261: {'lr': 0.0004017971139823676, 'samples': 8690112, 'steps': 45260, 'loss/train': 1.6896641254425049} -08/30/2021 21:27:12 - INFO - __main__ - Step 45262: {'lr': 0.0004017928974327835, 'samples': 8690304, 'steps': 45261, 'loss/train': 1.7051851749420166} -08/30/2021 21:27:14 - INFO - __main__ - Step 45263: {'lr': 0.00040178868081480393, 'samples': 8690496, 'steps': 45262, 'loss/train': 1.5047693252563477} -08/30/2021 21:27:15 - INFO - __main__ - Step 45264: {'lr': 0.00040178446412843054, 'samples': 8690688, 'steps': 45263, 'loss/train': 1.429306983947754} -08/30/2021 21:27:15 - INFO - __main__ - Step 45265: {'lr': 0.0004017802473736655, 'samples': 8690880, 'steps': 45264, 'loss/train': 1.924657940864563} -08/30/2021 21:27:15 - INFO - __main__ - Step 45266: {'lr': 0.00040177603055051065, 'samples': 8691072, 'steps': 45265, 'loss/train': 1.6970393657684326} -08/30/2021 21:27:16 - INFO - __main__ - Step 45267: {'lr': 0.0004017718136589679, 'samples': 8691264, 'steps': 45266, 'loss/train': 1.4279415607452393} -08/30/2021 21:27:17 - INFO - __main__ - Step 45268: {'lr': 0.000401767596699039, 'samples': 8691456, 'steps': 45267, 'loss/train': 1.8002479076385498} -08/30/2021 21:27:18 - INFO - __main__ - Step 45269: {'lr': 0.00040176337967072603, 'samples': 8691648, 'steps': 45268, 'loss/train': 1.7292377948760986} -08/30/2021 21:27:18 - INFO - __main__ - Step 45270: {'lr': 0.0004017591625740308, 'samples': 8691840, 'steps': 45269, 'loss/train': 1.7646021842956543} -08/30/2021 21:27:19 - INFO - __main__ - Step 45271: {'lr': 0.0004017549454089553, 'samples': 8692032, 'steps': 45270, 'loss/train': 1.4502753019332886} -08/30/2021 21:27:19 - INFO - __main__ - Step 45272: {'lr': 0.00040175072817550127, 'samples': 8692224, 'steps': 45271, 'loss/train': 1.2278869152069092} -08/30/2021 21:27:19 - INFO - __main__ - Step 45273: {'lr': 0.00040174651087367076, 'samples': 8692416, 'steps': 45272, 'loss/train': 1.3958121538162231} -08/30/2021 21:27:21 - INFO - __main__ - Step 45274: {'lr': 0.0004017422935034656, 'samples': 8692608, 'steps': 45273, 'loss/train': 0.32039281725883484} -08/30/2021 21:27:21 - INFO - __main__ - Step 45275: {'lr': 0.00040173807606488763, 'samples': 8692800, 'steps': 45274, 'loss/train': 1.6026588678359985} -08/30/2021 21:27:22 - INFO - __main__ - Step 45276: {'lr': 0.0004017338585579389, 'samples': 8692992, 'steps': 45275, 'loss/train': 1.8548914194107056} -08/30/2021 21:27:22 - INFO - __main__ - Step 45277: {'lr': 0.0004017296409826213, 'samples': 8693184, 'steps': 45276, 'loss/train': 1.3057940006256104} -08/30/2021 21:27:22 - INFO - __main__ - Step 45278: {'lr': 0.00040172542333893657, 'samples': 8693376, 'steps': 45277, 'loss/train': 1.186486005783081} -08/30/2021 21:27:24 - INFO - __main__ - Step 45279: {'lr': 0.00040172120562688673, 'samples': 8693568, 'steps': 45278, 'loss/train': 1.3602626323699951} -08/30/2021 21:27:24 - INFO - __main__ - Step 45280: {'lr': 0.00040171698784647366, 'samples': 8693760, 'steps': 45279, 'loss/train': 1.3070400953292847} -08/30/2021 21:27:25 - INFO - __main__ - Step 45281: {'lr': 0.00040171276999769926, 'samples': 8693952, 'steps': 45280, 'loss/train': 1.3612293004989624} -08/30/2021 21:27:25 - INFO - __main__ - Step 45282: {'lr': 0.00040170855208056537, 'samples': 8694144, 'steps': 45281, 'loss/train': 0.5573500394821167} -08/30/2021 21:27:25 - INFO - __main__ - Step 45283: {'lr': 0.000401704334095074, 'samples': 8694336, 'steps': 45282, 'loss/train': 2.2114064693450928} -08/30/2021 21:27:27 - INFO - __main__ - Step 45284: {'lr': 0.00040170011604122704, 'samples': 8694528, 'steps': 45283, 'loss/train': 1.6097602844238281} -08/30/2021 21:27:27 - INFO - __main__ - Step 45285: {'lr': 0.0004016958979190263, 'samples': 8694720, 'steps': 45284, 'loss/train': 1.6535147428512573} -08/30/2021 21:27:28 - INFO - __main__ - Step 45286: {'lr': 0.0004016916797284738, 'samples': 8694912, 'steps': 45285, 'loss/train': 1.5273797512054443} -08/30/2021 21:27:28 - INFO - __main__ - Step 45287: {'lr': 0.00040168746146957123, 'samples': 8695104, 'steps': 45286, 'loss/train': 1.1005959510803223} -08/30/2021 21:27:28 - INFO - __main__ - Step 45288: {'lr': 0.0004016832431423207, 'samples': 8695296, 'steps': 45287, 'loss/train': 1.3159942626953125} -08/30/2021 21:27:30 - INFO - __main__ - Step 45289: {'lr': 0.00040167902474672404, 'samples': 8695488, 'steps': 45288, 'loss/train': 1.511220932006836} -08/30/2021 21:27:30 - INFO - __main__ - Step 45290: {'lr': 0.0004016748062827832, 'samples': 8695680, 'steps': 45289, 'loss/train': 1.4889229536056519} -08/30/2021 21:27:31 - INFO - __main__ - Step 45291: {'lr': 0.00040167058775049993, 'samples': 8695872, 'steps': 45290, 'loss/train': 0.9322032928466797} -08/30/2021 21:27:31 - INFO - __main__ - Step 45292: {'lr': 0.0004016663691498763, 'samples': 8696064, 'steps': 45291, 'loss/train': 2.1582694053649902} -08/30/2021 21:27:31 - INFO - __main__ - Step 45293: {'lr': 0.00040166215048091414, 'samples': 8696256, 'steps': 45292, 'loss/train': 1.3934918642044067} -08/30/2021 21:27:33 - INFO - __main__ - Step 45294: {'lr': 0.0004016579317436153, 'samples': 8696448, 'steps': 45293, 'loss/train': 1.3077359199523926} -08/30/2021 21:27:33 - INFO - __main__ - Step 45295: {'lr': 0.0004016537129379818, 'samples': 8696640, 'steps': 45294, 'loss/train': 0.5296040773391724} -08/30/2021 21:27:34 - INFO - __main__ - Step 45296: {'lr': 0.0004016494940640155, 'samples': 8696832, 'steps': 45295, 'loss/train': 1.626242756843567} -08/30/2021 21:27:34 - INFO - __main__ - Step 45297: {'lr': 0.0004016452751217183, 'samples': 8697024, 'steps': 45296, 'loss/train': 1.5968647003173828} -08/30/2021 21:27:34 - INFO - __main__ - Step 45298: {'lr': 0.00040164105611109195, 'samples': 8697216, 'steps': 45297, 'loss/train': 1.4990514516830444} -08/30/2021 21:27:36 - INFO - __main__ - Step 45299: {'lr': 0.0004016368370321386, 'samples': 8697408, 'steps': 45298, 'loss/train': 1.072702407836914} -08/30/2021 21:27:37 - INFO - __main__ - Step 45300: {'lr': 0.00040163261788485994, 'samples': 8697600, 'steps': 45299, 'loss/train': 0.779970645904541} -08/30/2021 21:27:37 - INFO - __main__ - Step 45301: {'lr': 0.00040162839866925804, 'samples': 8697792, 'steps': 45300, 'loss/train': 2.057222843170166} -08/30/2021 21:27:37 - INFO - __main__ - Step 45302: {'lr': 0.0004016241793853347, 'samples': 8697984, 'steps': 45301, 'loss/train': 1.5212918519973755} -08/30/2021 21:27:38 - INFO - __main__ - Step 45303: {'lr': 0.00040161996003309174, 'samples': 8698176, 'steps': 45302, 'loss/train': 0.07882996648550034} -08/30/2021 21:27:39 - INFO - __main__ - Step 45304: {'lr': 0.00040161574061253134, 'samples': 8698368, 'steps': 45303, 'loss/train': 1.3946245908737183} -08/30/2021 21:27:39 - INFO - __main__ - Step 45305: {'lr': 0.0004016115211236552, 'samples': 8698560, 'steps': 45304, 'loss/train': 1.4245455265045166} -08/30/2021 21:27:40 - INFO - __main__ - Step 45306: {'lr': 0.0004016073015664651, 'samples': 8698752, 'steps': 45305, 'loss/train': 1.5707294940948486} -08/30/2021 21:27:40 - INFO - __main__ - Step 45307: {'lr': 0.0004016030819409632, 'samples': 8698944, 'steps': 45306, 'loss/train': 1.669108510017395} -08/30/2021 21:27:41 - INFO - __main__ - Step 45308: {'lr': 0.00040159886224715126, 'samples': 8699136, 'steps': 45307, 'loss/train': 1.294464349746704} -08/30/2021 21:27:41 - INFO - __main__ - Step 45309: {'lr': 0.0004015946424850312, 'samples': 8699328, 'steps': 45308, 'loss/train': 1.6534972190856934} -08/30/2021 21:27:42 - INFO - __main__ - Step 45310: {'lr': 0.000401590422654605, 'samples': 8699520, 'steps': 45309, 'loss/train': 1.4779269695281982} -08/30/2021 21:27:43 - INFO - __main__ - Step 45311: {'lr': 0.00040158620275587443, 'samples': 8699712, 'steps': 45310, 'loss/train': 0.8517269492149353} -08/30/2021 21:27:43 - INFO - __main__ - Step 45312: {'lr': 0.0004015819827888415, 'samples': 8699904, 'steps': 45311, 'loss/train': 0.2647896707057953} -08/30/2021 21:27:44 - INFO - __main__ - Step 45313: {'lr': 0.00040157776275350805, 'samples': 8700096, 'steps': 45312, 'loss/train': 1.3386090993881226} -08/30/2021 21:27:44 - INFO - __main__ - Step 45314: {'lr': 0.000401573542649876, 'samples': 8700288, 'steps': 45313, 'loss/train': 1.1151525974273682} -08/30/2021 21:27:46 - INFO - __main__ - Step 45315: {'lr': 0.0004015693224779472, 'samples': 8700480, 'steps': 45314, 'loss/train': 1.425656795501709} -08/30/2021 21:27:47 - INFO - __main__ - Step 45316: {'lr': 0.0004015651022377237, 'samples': 8700672, 'steps': 45315, 'loss/train': 1.3129818439483643} -08/30/2021 21:27:47 - INFO - __main__ - Step 45317: {'lr': 0.00040156088192920726, 'samples': 8700864, 'steps': 45316, 'loss/train': 1.5592702627182007} -08/30/2021 21:27:47 - INFO - __main__ - Step 45318: {'lr': 0.0004015566615523998, 'samples': 8701056, 'steps': 45317, 'loss/train': 0.5816635489463806} -08/30/2021 21:27:48 - INFO - __main__ - Step 45319: {'lr': 0.00040155244110730325, 'samples': 8701248, 'steps': 45318, 'loss/train': 1.3422900438308716} -08/30/2021 21:27:49 - INFO - __main__ - Step 45320: {'lr': 0.00040154822059391954, 'samples': 8701440, 'steps': 45319, 'loss/train': 0.23084278404712677} -08/30/2021 21:27:50 - INFO - __main__ - Step 45321: {'lr': 0.00040154400001225055, 'samples': 8701632, 'steps': 45320, 'loss/train': 1.3002429008483887} -08/30/2021 21:27:50 - INFO - __main__ - Step 45322: {'lr': 0.00040153977936229813, 'samples': 8701824, 'steps': 45321, 'loss/train': 1.5011858940124512} -08/30/2021 21:27:50 - INFO - __main__ - Step 45323: {'lr': 0.00040153555864406423, 'samples': 8702016, 'steps': 45322, 'loss/train': 1.5152275562286377} -08/30/2021 21:27:51 - INFO - __main__ - Step 45324: {'lr': 0.0004015313378575508, 'samples': 8702208, 'steps': 45323, 'loss/train': 0.7593422532081604} -08/30/2021 21:27:52 - INFO - __main__ - Step 45325: {'lr': 0.00040152711700275963, 'samples': 8702400, 'steps': 45324, 'loss/train': 1.472410798072815} -08/30/2021 21:27:52 - INFO - __main__ - Step 45326: {'lr': 0.0004015228960796927, 'samples': 8702592, 'steps': 45325, 'loss/train': 1.106531023979187} -08/30/2021 21:27:53 - INFO - __main__ - Step 45327: {'lr': 0.0004015186750883518, 'samples': 8702784, 'steps': 45326, 'loss/train': 1.4397965669631958} -08/30/2021 21:27:53 - INFO - __main__ - Step 45328: {'lr': 0.0004015144540287391, 'samples': 8702976, 'steps': 45327, 'loss/train': 1.7939039468765259} -08/30/2021 21:27:54 - INFO - __main__ - Step 45329: {'lr': 0.0004015102329008562, 'samples': 8703168, 'steps': 45328, 'loss/train': 1.007328987121582} -08/30/2021 21:27:55 - INFO - __main__ - Step 45330: {'lr': 0.0004015060117047051, 'samples': 8703360, 'steps': 45329, 'loss/train': 1.4897968769073486} -08/30/2021 21:27:56 - INFO - __main__ - Step 45331: {'lr': 0.0004015017904402879, 'samples': 8703552, 'steps': 45330, 'loss/train': 1.1192376613616943} -08/30/2021 21:27:56 - INFO - __main__ - Step 45332: {'lr': 0.00040149756910760616, 'samples': 8703744, 'steps': 45331, 'loss/train': 1.6463425159454346} -08/30/2021 21:27:56 - INFO - __main__ - Step 45333: {'lr': 0.000401493347706662, 'samples': 8703936, 'steps': 45332, 'loss/train': 1.337498426437378} -08/30/2021 21:27:57 - INFO - __main__ - Step 45334: {'lr': 0.00040148912623745733, 'samples': 8704128, 'steps': 45333, 'loss/train': 1.8205915689468384} -08/30/2021 21:27:57 - INFO - __main__ - Step 45335: {'lr': 0.0004014849046999939, 'samples': 8704320, 'steps': 45334, 'loss/train': 1.6223994493484497} -08/30/2021 21:27:58 - INFO - __main__ - Step 45336: {'lr': 0.00040148068309427376, 'samples': 8704512, 'steps': 45335, 'loss/train': 0.8280646204948425} -08/30/2021 21:27:59 - INFO - __main__ - Step 45337: {'lr': 0.00040147646142029884, 'samples': 8704704, 'steps': 45336, 'loss/train': 1.5944470167160034} -08/30/2021 21:27:59 - INFO - __main__ - Step 45338: {'lr': 0.0004014722396780709, 'samples': 8704896, 'steps': 45337, 'loss/train': 0.5360270738601685} -08/30/2021 21:28:00 - INFO - __main__ - Step 45339: {'lr': 0.00040146801786759183, 'samples': 8705088, 'steps': 45338, 'loss/train': 1.356668472290039} -08/30/2021 21:28:00 - INFO - __main__ - Step 45340: {'lr': 0.00040146379598886376, 'samples': 8705280, 'steps': 45339, 'loss/train': 1.6232160329818726} -08/30/2021 21:28:02 - INFO - __main__ - Step 45341: {'lr': 0.00040145957404188825, 'samples': 8705472, 'steps': 45340, 'loss/train': 0.8288556933403015} -08/30/2021 21:28:02 - INFO - __main__ - Step 45342: {'lr': 0.00040145535202666747, 'samples': 8705664, 'steps': 45341, 'loss/train': 1.5144007205963135} -08/30/2021 21:28:02 - INFO - __main__ - Step 45343: {'lr': 0.0004014511299432033, 'samples': 8705856, 'steps': 45342, 'loss/train': 1.071869969367981} -08/30/2021 21:28:03 - INFO - __main__ - Step 45344: {'lr': 0.0004014469077914976, 'samples': 8706048, 'steps': 45343, 'loss/train': 0.9121518731117249} -08/30/2021 21:28:03 - INFO - __main__ - Step 45345: {'lr': 0.0004014426855715523, 'samples': 8706240, 'steps': 45344, 'loss/train': 1.3119964599609375} -08/30/2021 21:28:04 - INFO - __main__ - Step 45346: {'lr': 0.00040143846328336913, 'samples': 8706432, 'steps': 45345, 'loss/train': 1.8048839569091797} -08/30/2021 21:28:05 - INFO - __main__ - Step 45347: {'lr': 0.00040143424092695015, 'samples': 8706624, 'steps': 45346, 'loss/train': 1.022029161453247} -08/30/2021 21:28:05 - INFO - __main__ - Step 45348: {'lr': 0.00040143001850229733, 'samples': 8706816, 'steps': 45347, 'loss/train': 1.3824069499969482} -08/30/2021 21:28:06 - INFO - __main__ - Step 45349: {'lr': 0.00040142579600941237, 'samples': 8707008, 'steps': 45348, 'loss/train': 2.026054859161377} -08/30/2021 21:28:06 - INFO - __main__ - Step 45350: {'lr': 0.0004014215734482973, 'samples': 8707200, 'steps': 45349, 'loss/train': 1.4047070741653442} -08/30/2021 21:28:08 - INFO - __main__ - Step 45351: {'lr': 0.00040141735081895407, 'samples': 8707392, 'steps': 45350, 'loss/train': 1.727834939956665} -08/30/2021 21:28:08 - INFO - __main__ - Step 45352: {'lr': 0.00040141312812138453, 'samples': 8707584, 'steps': 45351, 'loss/train': 1.3803212642669678} -08/30/2021 21:28:08 - INFO - __main__ - Step 45353: {'lr': 0.0004014089053555905, 'samples': 8707776, 'steps': 45352, 'loss/train': 2.1634228229522705} -08/30/2021 21:28:09 - INFO - __main__ - Step 45354: {'lr': 0.000401404682521574, 'samples': 8707968, 'steps': 45353, 'loss/train': 0.2770467698574066} -08/30/2021 21:28:09 - INFO - __main__ - Step 45355: {'lr': 0.0004014004596193368, 'samples': 8708160, 'steps': 45354, 'loss/train': 1.6003938913345337} -08/30/2021 21:28:11 - INFO - __main__ - Step 45356: {'lr': 0.000401396236648881, 'samples': 8708352, 'steps': 45355, 'loss/train': 1.273625373840332} -08/30/2021 21:28:11 - INFO - __main__ - Step 45357: {'lr': 0.00040139201361020827, 'samples': 8708544, 'steps': 45356, 'loss/train': 5.488168716430664} -08/30/2021 21:28:11 - INFO - __main__ - Step 45358: {'lr': 0.0004013877905033208, 'samples': 8708736, 'steps': 45357, 'loss/train': 1.6528087854385376} -08/30/2021 21:28:12 - INFO - __main__ - Step 45359: {'lr': 0.0004013835673282202, 'samples': 8708928, 'steps': 45358, 'loss/train': 1.9127607345581055} -08/30/2021 21:28:12 - INFO - __main__ - Step 45360: {'lr': 0.00040137934408490856, 'samples': 8709120, 'steps': 45359, 'loss/train': 1.0785194635391235} -08/30/2021 21:28:14 - INFO - __main__ - Step 45361: {'lr': 0.0004013751207733877, 'samples': 8709312, 'steps': 45360, 'loss/train': 0.5043270587921143} -08/30/2021 21:28:14 - INFO - __main__ - Step 45362: {'lr': 0.0004013708973936595, 'samples': 8709504, 'steps': 45361, 'loss/train': 1.7443922758102417} -08/30/2021 21:28:15 - INFO - __main__ - Step 45363: {'lr': 0.000401366673945726, 'samples': 8709696, 'steps': 45362, 'loss/train': 0.9119384288787842} -08/30/2021 21:28:15 - INFO - __main__ - Step 45364: {'lr': 0.00040136245042958897, 'samples': 8709888, 'steps': 45363, 'loss/train': 1.0617207288742065} -08/30/2021 21:28:15 - INFO - __main__ - Step 45365: {'lr': 0.00040135822684525036, 'samples': 8710080, 'steps': 45364, 'loss/train': 1.573112964630127} -08/30/2021 21:28:16 - INFO - __main__ - Step 45366: {'lr': 0.0004013540031927121, 'samples': 8710272, 'steps': 45365, 'loss/train': 1.224539875984192} -08/30/2021 21:28:18 - INFO - __main__ - Step 45367: {'lr': 0.000401349779471976, 'samples': 8710464, 'steps': 45366, 'loss/train': 1.812270998954773} -08/30/2021 21:28:18 - INFO - __main__ - Step 45368: {'lr': 0.000401345555683044, 'samples': 8710656, 'steps': 45367, 'loss/train': 1.7808396816253662} -08/30/2021 21:28:19 - INFO - __main__ - Step 45369: {'lr': 0.00040134133182591813, 'samples': 8710848, 'steps': 45368, 'loss/train': 1.260252833366394} -08/30/2021 21:28:19 - INFO - __main__ - Step 45370: {'lr': 0.0004013371079006001, 'samples': 8711040, 'steps': 45369, 'loss/train': 1.496720314025879} -08/30/2021 21:28:19 - INFO - __main__ - Step 45371: {'lr': 0.000401332883907092, 'samples': 8711232, 'steps': 45370, 'loss/train': 1.5574270486831665} -08/30/2021 21:28:21 - INFO - __main__ - Step 45372: {'lr': 0.00040132865984539556, 'samples': 8711424, 'steps': 45371, 'loss/train': 0.4318111836910248} -08/30/2021 21:28:21 - INFO - __main__ - Step 45373: {'lr': 0.0004013244357155128, 'samples': 8711616, 'steps': 45372, 'loss/train': 2.623877763748169} -08/30/2021 21:28:22 - INFO - __main__ - Step 45374: {'lr': 0.0004013202115174456, 'samples': 8711808, 'steps': 45373, 'loss/train': 0.1138872429728508} -08/30/2021 21:28:22 - INFO - __main__ - Step 45375: {'lr': 0.0004013159872511958, 'samples': 8712000, 'steps': 45374, 'loss/train': 1.6977163553237915} -08/30/2021 21:28:22 - INFO - __main__ - Step 45376: {'lr': 0.0004013117629167653, 'samples': 8712192, 'steps': 45375, 'loss/train': 1.474536657333374} -08/30/2021 21:28:24 - INFO - __main__ - Step 45377: {'lr': 0.0004013075385141561, 'samples': 8712384, 'steps': 45376, 'loss/train': 0.8163807392120361} -08/30/2021 21:28:24 - INFO - __main__ - Step 45378: {'lr': 0.0004013033140433702, 'samples': 8712576, 'steps': 45377, 'loss/train': 1.6421191692352295} -08/30/2021 21:28:25 - INFO - __main__ - Step 45379: {'lr': 0.0004012990895044092, 'samples': 8712768, 'steps': 45378, 'loss/train': 1.4193545579910278} -08/30/2021 21:28:25 - INFO - __main__ - Step 45380: {'lr': 0.0004012948648972752, 'samples': 8712960, 'steps': 45379, 'loss/train': 1.4047447443008423} -08/30/2021 21:28:25 - INFO - __main__ - Step 45381: {'lr': 0.00040129064022197006, 'samples': 8713152, 'steps': 45380, 'loss/train': 1.6190682649612427} -08/30/2021 21:28:27 - INFO - __main__ - Step 45382: {'lr': 0.0004012864154784957, 'samples': 8713344, 'steps': 45381, 'loss/train': 1.1732662916183472} -08/30/2021 21:28:28 - INFO - __main__ - Step 45383: {'lr': 0.00040128219066685403, 'samples': 8713536, 'steps': 45382, 'loss/train': 1.0996413230895996} -08/30/2021 21:28:28 - INFO - __main__ - Step 45384: {'lr': 0.00040127796578704703, 'samples': 8713728, 'steps': 45383, 'loss/train': 1.3954378366470337} -08/30/2021 21:28:29 - INFO - __main__ - Step 45385: {'lr': 0.00040127374083907634, 'samples': 8713920, 'steps': 45384, 'loss/train': 1.5807826519012451} -08/30/2021 21:28:29 - INFO - __main__ - Step 45386: {'lr': 0.00040126951582294414, 'samples': 8714112, 'steps': 45385, 'loss/train': 1.41490638256073} -08/30/2021 21:28:30 - INFO - __main__ - Step 45387: {'lr': 0.00040126529073865216, 'samples': 8714304, 'steps': 45386, 'loss/train': 0.07542635500431061} -08/30/2021 21:28:31 - INFO - __main__ - Step 45388: {'lr': 0.00040126106558620246, 'samples': 8714496, 'steps': 45387, 'loss/train': 1.5419925451278687} -08/30/2021 21:28:31 - INFO - __main__ - Step 45389: {'lr': 0.0004012568403655967, 'samples': 8714688, 'steps': 45388, 'loss/train': 1.31706702709198} -08/30/2021 21:28:32 - INFO - __main__ - Step 45390: {'lr': 0.00040125261507683706, 'samples': 8714880, 'steps': 45389, 'loss/train': 0.8293589353561401} -08/30/2021 21:28:32 - INFO - __main__ - Step 45391: {'lr': 0.0004012483897199254, 'samples': 8715072, 'steps': 45390, 'loss/train': 1.2823151350021362} -08/30/2021 21:28:32 - INFO - __main__ - Step 45392: {'lr': 0.0004012441642948635, 'samples': 8715264, 'steps': 45391, 'loss/train': 1.317599892616272} -08/30/2021 21:28:34 - INFO - __main__ - Step 45393: {'lr': 0.0004012399388016533, 'samples': 8715456, 'steps': 45392, 'loss/train': 1.1026018857955933} -08/30/2021 21:28:35 - INFO - __main__ - Step 45394: {'lr': 0.00040123571324029663, 'samples': 8715648, 'steps': 45393, 'loss/train': 1.3523563146591187} -08/30/2021 21:28:35 - INFO - __main__ - Step 45395: {'lr': 0.0004012314876107956, 'samples': 8715840, 'steps': 45394, 'loss/train': 1.7424101829528809} -08/30/2021 21:28:35 - INFO - __main__ - Step 45396: {'lr': 0.00040122726191315196, 'samples': 8716032, 'steps': 45395, 'loss/train': 1.8487505912780762} -08/30/2021 21:28:36 - INFO - __main__ - Step 45397: {'lr': 0.00040122303614736763, 'samples': 8716224, 'steps': 45396, 'loss/train': 0.09886649996042252} -08/30/2021 21:28:37 - INFO - __main__ - Step 45398: {'lr': 0.00040121881031344455, 'samples': 8716416, 'steps': 45397, 'loss/train': 1.9953153133392334} -08/30/2021 21:28:38 - INFO - __main__ - Step 45399: {'lr': 0.00040121458441138457, 'samples': 8716608, 'steps': 45398, 'loss/train': 1.039934754371643} -08/30/2021 21:28:38 - INFO - __main__ - Step 45400: {'lr': 0.0004012103584411897, 'samples': 8716800, 'steps': 45399, 'loss/train': 1.3867274522781372} -08/30/2021 21:28:38 - INFO - __main__ - Step 45401: {'lr': 0.0004012061324028617, 'samples': 8716992, 'steps': 45400, 'loss/train': 1.5387483835220337} -08/30/2021 21:28:39 - INFO - __main__ - Step 45402: {'lr': 0.0004012019062964026, 'samples': 8717184, 'steps': 45401, 'loss/train': 1.2923636436462402} -08/30/2021 21:28:40 - INFO - __main__ - Step 45403: {'lr': 0.00040119768012181423, 'samples': 8717376, 'steps': 45402, 'loss/train': 1.4038010835647583} -08/30/2021 21:28:40 - INFO - __main__ - Step 45404: {'lr': 0.0004011934538790986, 'samples': 8717568, 'steps': 45403, 'loss/train': 1.52717924118042} -08/30/2021 21:28:41 - INFO - __main__ - Step 45405: {'lr': 0.00040118922756825735, 'samples': 8717760, 'steps': 45404, 'loss/train': 1.5960084199905396} -08/30/2021 21:28:41 - INFO - __main__ - Step 45406: {'lr': 0.00040118500118929267, 'samples': 8717952, 'steps': 45405, 'loss/train': 1.4100596904754639} -08/30/2021 21:28:41 - INFO - __main__ - Step 45407: {'lr': 0.00040118077474220643, 'samples': 8718144, 'steps': 45406, 'loss/train': 0.9633892774581909} -08/30/2021 21:28:43 - INFO - __main__ - Step 45408: {'lr': 0.00040117654822700047, 'samples': 8718336, 'steps': 45407, 'loss/train': 0.9670495986938477} -08/30/2021 21:28:44 - INFO - __main__ - Step 45409: {'lr': 0.0004011723216436766, 'samples': 8718528, 'steps': 45408, 'loss/train': 1.2607340812683105} -08/30/2021 21:28:44 - INFO - __main__ - Step 45410: {'lr': 0.0004011680949922368, 'samples': 8718720, 'steps': 45409, 'loss/train': 2.0846927165985107} -08/30/2021 21:28:45 - INFO - __main__ - Step 45411: {'lr': 0.00040116386827268304, 'samples': 8718912, 'steps': 45410, 'loss/train': 1.393372654914856} -08/30/2021 21:28:45 - INFO - __main__ - Step 45412: {'lr': 0.0004011596414850172, 'samples': 8719104, 'steps': 45411, 'loss/train': 1.2103919982910156} -08/30/2021 21:28:45 - INFO - __main__ - Step 45413: {'lr': 0.0004011554146292411, 'samples': 8719296, 'steps': 45412, 'loss/train': 1.2174266576766968} -08/30/2021 21:28:47 - INFO - __main__ - Step 45414: {'lr': 0.0004011511877053567, 'samples': 8719488, 'steps': 45413, 'loss/train': 0.08311525732278824} -08/30/2021 21:28:47 - INFO - __main__ - Step 45415: {'lr': 0.0004011469607133659, 'samples': 8719680, 'steps': 45414, 'loss/train': 1.235756278038025} -08/30/2021 21:28:48 - INFO - __main__ - Step 45416: {'lr': 0.0004011427336532707, 'samples': 8719872, 'steps': 45415, 'loss/train': 0.9479379057884216} -08/30/2021 21:28:48 - INFO - __main__ - Step 45417: {'lr': 0.00040113850652507286, 'samples': 8720064, 'steps': 45416, 'loss/train': 1.297389030456543} -08/30/2021 21:28:48 - INFO - __main__ - Step 45418: {'lr': 0.00040113427932877434, 'samples': 8720256, 'steps': 45417, 'loss/train': 2.1371407508850098} -08/30/2021 21:28:50 - INFO - __main__ - Step 45419: {'lr': 0.00040113005206437704, 'samples': 8720448, 'steps': 45418, 'loss/train': 1.5319702625274658} -08/30/2021 21:28:51 - INFO - __main__ - Step 45420: {'lr': 0.00040112582473188284, 'samples': 8720640, 'steps': 45419, 'loss/train': 1.5424004793167114} -08/30/2021 21:28:51 - INFO - __main__ - Step 45421: {'lr': 0.00040112159733129375, 'samples': 8720832, 'steps': 45420, 'loss/train': 1.8127344846725464} -08/30/2021 21:28:51 - INFO - __main__ - Step 45422: {'lr': 0.00040111736986261155, 'samples': 8721024, 'steps': 45421, 'loss/train': 1.8065634965896606} -08/30/2021 21:28:52 - INFO - __main__ - Step 45423: {'lr': 0.00040111314232583816, 'samples': 8721216, 'steps': 45422, 'loss/train': 1.6546831130981445} -08/30/2021 21:28:53 - INFO - __main__ - Step 45424: {'lr': 0.0004011089147209756, 'samples': 8721408, 'steps': 45423, 'loss/train': 1.1582897901535034} -08/30/2021 21:28:54 - INFO - __main__ - Step 45425: {'lr': 0.00040110468704802573, 'samples': 8721600, 'steps': 45424, 'loss/train': 1.1235169172286987} -08/30/2021 21:28:54 - INFO - __main__ - Step 45426: {'lr': 0.00040110045930699033, 'samples': 8721792, 'steps': 45425, 'loss/train': 1.5955837965011597} -08/30/2021 21:28:55 - INFO - __main__ - Step 45427: {'lr': 0.00040109623149787137, 'samples': 8721984, 'steps': 45426, 'loss/train': 0.06536370515823364} -08/30/2021 21:28:55 - INFO - __main__ - Step 45428: {'lr': 0.0004010920036206709, 'samples': 8722176, 'steps': 45427, 'loss/train': 1.6359869241714478} -08/30/2021 21:28:55 - INFO - __main__ - Step 45429: {'lr': 0.00040108777567539057, 'samples': 8722368, 'steps': 45428, 'loss/train': 2.8949060440063477} -08/30/2021 21:28:57 - INFO - __main__ - Step 45430: {'lr': 0.00040108354766203247, 'samples': 8722560, 'steps': 45429, 'loss/train': 1.245950698852539} -08/30/2021 21:28:57 - INFO - __main__ - Step 45431: {'lr': 0.0004010793195805985, 'samples': 8722752, 'steps': 45430, 'loss/train': 0.9855471849441528} -08/30/2021 21:28:58 - INFO - __main__ - Step 45432: {'lr': 0.0004010750914310905, 'samples': 8722944, 'steps': 45431, 'loss/train': 1.2119560241699219} -08/30/2021 21:28:58 - INFO - __main__ - Step 45433: {'lr': 0.0004010708632135104, 'samples': 8723136, 'steps': 45432, 'loss/train': 1.519665002822876} -08/30/2021 21:28:58 - INFO - __main__ - Step 45434: {'lr': 0.00040106663492786007, 'samples': 8723328, 'steps': 45433, 'loss/train': 1.0891577005386353} -08/30/2021 21:29:00 - INFO - __main__ - Step 45435: {'lr': 0.00040106240657414137, 'samples': 8723520, 'steps': 45434, 'loss/train': 1.9796557426452637} -08/30/2021 21:29:00 - INFO - __main__ - Step 45436: {'lr': 0.0004010581781523564, 'samples': 8723712, 'steps': 45435, 'loss/train': 1.5103728771209717} -08/30/2021 21:29:01 - INFO - __main__ - Step 45437: {'lr': 0.0004010539496625069, 'samples': 8723904, 'steps': 45436, 'loss/train': 1.4284931421279907} -08/30/2021 21:29:01 - INFO - __main__ - Step 45438: {'lr': 0.00040104972110459493, 'samples': 8724096, 'steps': 45437, 'loss/train': 1.1571506261825562} -08/30/2021 21:29:01 - INFO - __main__ - Step 45439: {'lr': 0.00040104549247862217, 'samples': 8724288, 'steps': 45438, 'loss/train': 0.8309714794158936} -08/30/2021 21:29:03 - INFO - __main__ - Step 45440: {'lr': 0.0004010412637845906, 'samples': 8724480, 'steps': 45439, 'loss/train': 1.3919790983200073} -08/30/2021 21:29:03 - INFO - __main__ - Step 45441: {'lr': 0.00040103703502250223, 'samples': 8724672, 'steps': 45440, 'loss/train': 1.5892564058303833} -08/30/2021 21:29:04 - INFO - __main__ - Step 45442: {'lr': 0.0004010328061923589, 'samples': 8724864, 'steps': 45441, 'loss/train': 1.2075039148330688} -08/30/2021 21:29:04 - INFO - __main__ - Step 45443: {'lr': 0.00040102857729416256, 'samples': 8725056, 'steps': 45442, 'loss/train': 0.7748900055885315} -08/30/2021 21:29:04 - INFO - __main__ - Step 45444: {'lr': 0.000401024348327915, 'samples': 8725248, 'steps': 45443, 'loss/train': 0.8441669940948486} -08/30/2021 21:29:06 - INFO - __main__ - Step 45445: {'lr': 0.00040102011929361826, 'samples': 8725440, 'steps': 45444, 'loss/train': 1.2751429080963135} -08/30/2021 21:29:06 - INFO - __main__ - Step 45446: {'lr': 0.00040101589019127416, 'samples': 8725632, 'steps': 45445, 'loss/train': 1.0400675535202026} -08/30/2021 21:29:07 - INFO - __main__ - Step 45447: {'lr': 0.0004010116610208846, 'samples': 8725824, 'steps': 45446, 'loss/train': 1.0018789768218994} -08/30/2021 21:29:07 - INFO - __main__ - Step 45448: {'lr': 0.0004010074317824516, 'samples': 8726016, 'steps': 45447, 'loss/train': 1.3485724925994873} -08/30/2021 21:29:07 - INFO - __main__ - Step 45449: {'lr': 0.0004010032024759769, 'samples': 8726208, 'steps': 45448, 'loss/train': 1.177703619003296} -08/30/2021 21:29:08 - INFO - __main__ - Step 45450: {'lr': 0.0004009989731014625, 'samples': 8726400, 'steps': 45449, 'loss/train': 1.7052592039108276} -08/30/2021 21:29:09 - INFO - __main__ - Step 45451: {'lr': 0.00040099474365891033, 'samples': 8726592, 'steps': 45450, 'loss/train': 1.4146960973739624} -08/30/2021 21:29:10 - INFO - __main__ - Step 45452: {'lr': 0.0004009905141483222, 'samples': 8726784, 'steps': 45451, 'loss/train': 0.34710901975631714} -08/30/2021 21:29:10 - INFO - __main__ - Step 45453: {'lr': 0.0004009862845697001, 'samples': 8726976, 'steps': 45452, 'loss/train': 1.0887223482131958} -08/30/2021 21:29:10 - INFO - __main__ - Step 45454: {'lr': 0.00040098205492304596, 'samples': 8727168, 'steps': 45453, 'loss/train': 1.1947344541549683} -08/30/2021 21:29:11 - INFO - __main__ - Step 45455: {'lr': 0.00040097782520836156, 'samples': 8727360, 'steps': 45454, 'loss/train': 1.1545122861862183} -08/30/2021 21:29:12 - INFO - __main__ - Step 45456: {'lr': 0.00040097359542564894, 'samples': 8727552, 'steps': 45455, 'loss/train': 2.0078704357147217} -08/30/2021 21:29:13 - INFO - __main__ - Step 45457: {'lr': 0.0004009693655749099, 'samples': 8727744, 'steps': 45456, 'loss/train': 0.11971364915370941} -08/30/2021 21:29:13 - INFO - __main__ - Step 45458: {'lr': 0.00040096513565614645, 'samples': 8727936, 'steps': 45457, 'loss/train': 1.2176803350448608} -08/30/2021 21:29:13 - INFO - __main__ - Step 45459: {'lr': 0.00040096090566936037, 'samples': 8728128, 'steps': 45458, 'loss/train': 0.8424366116523743} -08/30/2021 21:29:14 - INFO - __main__ - Step 45460: {'lr': 0.00040095667561455367, 'samples': 8728320, 'steps': 45459, 'loss/train': 2.1787607669830322} -08/30/2021 21:29:15 - INFO - __main__ - Step 45461: {'lr': 0.00040095244549172824, 'samples': 8728512, 'steps': 45460, 'loss/train': 1.6568368673324585} -08/30/2021 21:29:16 - INFO - __main__ - Step 45462: {'lr': 0.00040094821530088594, 'samples': 8728704, 'steps': 45461, 'loss/train': 1.0476864576339722} -08/30/2021 21:29:16 - INFO - __main__ - Step 45463: {'lr': 0.0004009439850420287, 'samples': 8728896, 'steps': 45462, 'loss/train': 1.9075450897216797} -08/30/2021 21:29:16 - INFO - __main__ - Step 45464: {'lr': 0.00040093975471515843, 'samples': 8729088, 'steps': 45463, 'loss/train': 1.4943007230758667} -08/30/2021 21:29:17 - INFO - __main__ - Step 45465: {'lr': 0.00040093552432027713, 'samples': 8729280, 'steps': 45464, 'loss/train': 1.2659046649932861} -08/30/2021 21:29:18 - INFO - __main__ - Step 45466: {'lr': 0.0004009312938573865, 'samples': 8729472, 'steps': 45465, 'loss/train': 1.3164613246917725} -08/30/2021 21:29:19 - INFO - __main__ - Step 45467: {'lr': 0.00040092706332648856, 'samples': 8729664, 'steps': 45466, 'loss/train': 1.007828950881958} -08/30/2021 21:29:19 - INFO - __main__ - Step 45468: {'lr': 0.00040092283272758525, 'samples': 8729856, 'steps': 45467, 'loss/train': 1.7720130681991577} -08/30/2021 21:29:20 - INFO - __main__ - Step 45469: {'lr': 0.00040091860206067844, 'samples': 8730048, 'steps': 45468, 'loss/train': 1.6414732933044434} -08/30/2021 21:29:20 - INFO - __main__ - Step 45470: {'lr': 0.00040091437132577004, 'samples': 8730240, 'steps': 45469, 'loss/train': 2.295259475708008} -08/30/2021 21:29:22 - INFO - __main__ - Step 45471: {'lr': 0.0004009101405228619, 'samples': 8730432, 'steps': 45470, 'loss/train': 1.6183714866638184} -08/30/2021 21:29:22 - INFO - __main__ - Step 45472: {'lr': 0.00040090590965195604, 'samples': 8730624, 'steps': 45471, 'loss/train': 1.215678095817566} -08/30/2021 21:29:22 - INFO - __main__ - Step 45473: {'lr': 0.0004009016787130543, 'samples': 8730816, 'steps': 45472, 'loss/train': 1.4575421810150146} -08/30/2021 21:29:23 - INFO - __main__ - Step 45474: {'lr': 0.0004008974477061586, 'samples': 8731008, 'steps': 45473, 'loss/train': 1.6828049421310425} -08/30/2021 21:29:23 - INFO - __main__ - Step 45475: {'lr': 0.0004008932166312708, 'samples': 8731200, 'steps': 45474, 'loss/train': 0.7714130878448486} -08/30/2021 21:29:25 - INFO - __main__ - Step 45476: {'lr': 0.0004008889854883929, 'samples': 8731392, 'steps': 45475, 'loss/train': 1.5005035400390625} -08/30/2021 21:29:26 - INFO - __main__ - Step 45477: {'lr': 0.0004008847542775267, 'samples': 8731584, 'steps': 45476, 'loss/train': 1.3288564682006836} -08/30/2021 21:29:26 - INFO - __main__ - Step 45478: {'lr': 0.00040088052299867415, 'samples': 8731776, 'steps': 45477, 'loss/train': 0.6208505034446716} -08/30/2021 21:29:26 - INFO - __main__ - Step 45479: {'lr': 0.0004008762916518372, 'samples': 8731968, 'steps': 45478, 'loss/train': 1.729872226715088} -08/30/2021 21:29:27 - INFO - __main__ - Step 45480: {'lr': 0.0004008720602370177, 'samples': 8732160, 'steps': 45479, 'loss/train': 0.5428986549377441} -08/30/2021 21:29:27 - INFO - __main__ - Step 45481: {'lr': 0.00040086782875421755, 'samples': 8732352, 'steps': 45480, 'loss/train': 1.205990195274353} -08/30/2021 21:29:29 - INFO - __main__ - Step 45482: {'lr': 0.0004008635972034388, 'samples': 8732544, 'steps': 45481, 'loss/train': 0.07471577823162079} -08/30/2021 21:29:29 - INFO - __main__ - Step 45483: {'lr': 0.0004008593655846831, 'samples': 8732736, 'steps': 45482, 'loss/train': 0.6490263938903809} -08/30/2021 21:29:30 - INFO - __main__ - Step 45484: {'lr': 0.0004008551338979526, 'samples': 8732928, 'steps': 45483, 'loss/train': 1.3342127799987793} -08/30/2021 21:29:30 - INFO - __main__ - Step 45485: {'lr': 0.00040085090214324906, 'samples': 8733120, 'steps': 45484, 'loss/train': 1.4586942195892334} -08/30/2021 21:29:30 - INFO - __main__ - Step 45486: {'lr': 0.00040084667032057444, 'samples': 8733312, 'steps': 45485, 'loss/train': 1.4325790405273438} -08/30/2021 21:29:32 - INFO - __main__ - Step 45487: {'lr': 0.00040084243842993065, 'samples': 8733504, 'steps': 45486, 'loss/train': 1.696501612663269} -08/30/2021 21:29:32 - INFO - __main__ - Step 45488: {'lr': 0.0004008382064713195, 'samples': 8733696, 'steps': 45487, 'loss/train': 1.1347908973693848} -08/30/2021 21:29:33 - INFO - __main__ - Step 45489: {'lr': 0.0004008339744447431, 'samples': 8733888, 'steps': 45488, 'loss/train': 0.8334765434265137} -08/30/2021 21:29:33 - INFO - __main__ - Step 45490: {'lr': 0.0004008297423502032, 'samples': 8734080, 'steps': 45489, 'loss/train': 1.8002088069915771} -08/30/2021 21:29:33 - INFO - __main__ - Step 45491: {'lr': 0.0004008255101877017, 'samples': 8734272, 'steps': 45490, 'loss/train': 1.6147581338882446} -08/30/2021 21:29:35 - INFO - __main__ - Step 45492: {'lr': 0.00040082127795724066, 'samples': 8734464, 'steps': 45491, 'loss/train': 1.075305461883545} -08/30/2021 21:29:35 - INFO - __main__ - Step 45493: {'lr': 0.00040081704565882176, 'samples': 8734656, 'steps': 45492, 'loss/train': 1.6420460939407349} -08/30/2021 21:29:36 - INFO - __main__ - Step 45494: {'lr': 0.00040081281329244707, 'samples': 8734848, 'steps': 45493, 'loss/train': 1.2672457695007324} -08/30/2021 21:29:36 - INFO - __main__ - Step 45495: {'lr': 0.00040080858085811844, 'samples': 8735040, 'steps': 45494, 'loss/train': 1.67847740650177} -08/30/2021 21:29:36 - INFO - __main__ - Step 45496: {'lr': 0.00040080434835583777, 'samples': 8735232, 'steps': 45495, 'loss/train': 1.8523110151290894} -08/30/2021 21:29:38 - INFO - __main__ - Step 45497: {'lr': 0.00040080011578560705, 'samples': 8735424, 'steps': 45496, 'loss/train': 1.3734145164489746} -08/30/2021 21:29:38 - INFO - __main__ - Step 45498: {'lr': 0.0004007958831474281, 'samples': 8735616, 'steps': 45497, 'loss/train': 1.0486962795257568} -08/30/2021 21:29:39 - INFO - __main__ - Step 45499: {'lr': 0.0004007916504413029, 'samples': 8735808, 'steps': 45498, 'loss/train': 1.5811030864715576} -08/30/2021 21:29:39 - INFO - __main__ - Step 45500: {'lr': 0.00040078741766723326, 'samples': 8736000, 'steps': 45499, 'loss/train': 0.6940418481826782} -08/30/2021 21:29:40 - INFO - __main__ - Step 45501: {'lr': 0.00040078318482522114, 'samples': 8736192, 'steps': 45500, 'loss/train': 1.7465928792953491} -08/30/2021 21:29:40 - INFO - __main__ - Step 45502: {'lr': 0.0004007789519152684, 'samples': 8736384, 'steps': 45501, 'loss/train': 1.59458589553833} -08/30/2021 21:29:41 - INFO - __main__ - Step 45503: {'lr': 0.00040077471893737703, 'samples': 8736576, 'steps': 45502, 'loss/train': 1.2154748439788818} -08/30/2021 21:29:42 - INFO - __main__ - Step 45504: {'lr': 0.0004007704858915489, 'samples': 8736768, 'steps': 45503, 'loss/train': 1.0664267539978027} -08/30/2021 21:29:42 - INFO - __main__ - Step 45505: {'lr': 0.00040076625277778594, 'samples': 8736960, 'steps': 45504, 'loss/train': 1.6744377613067627} -08/30/2021 21:29:43 - INFO - __main__ - Step 45506: {'lr': 0.00040076201959609003, 'samples': 8737152, 'steps': 45505, 'loss/train': 1.6000587940216064} -08/30/2021 21:29:43 - INFO - __main__ - Step 45507: {'lr': 0.00040075778634646305, 'samples': 8737344, 'steps': 45506, 'loss/train': 1.4726711511611938} -08/30/2021 21:29:44 - INFO - __main__ - Step 45508: {'lr': 0.0004007535530289069, 'samples': 8737536, 'steps': 45507, 'loss/train': 1.6910285949707031} -08/30/2021 21:29:45 - INFO - __main__ - Step 45509: {'lr': 0.0004007493196434236, 'samples': 8737728, 'steps': 45508, 'loss/train': 1.3586182594299316} -08/30/2021 21:29:45 - INFO - __main__ - Step 45510: {'lr': 0.0004007450861900149, 'samples': 8737920, 'steps': 45509, 'loss/train': 1.1043330430984497} -08/30/2021 21:29:46 - INFO - __main__ - Step 45511: {'lr': 0.00040074085266868285, 'samples': 8738112, 'steps': 45510, 'loss/train': 1.0693639516830444} -08/30/2021 21:29:46 - INFO - __main__ - Step 45512: {'lr': 0.0004007366190794294, 'samples': 8738304, 'steps': 45511, 'loss/train': 1.3530992269515991} -08/30/2021 21:29:47 - INFO - __main__ - Step 45513: {'lr': 0.00040073238542225623, 'samples': 8738496, 'steps': 45512, 'loss/train': 1.760133981704712} -08/30/2021 21:29:48 - INFO - __main__ - Step 45514: {'lr': 0.00040072815169716534, 'samples': 8738688, 'steps': 45513, 'loss/train': 1.5427560806274414} -08/30/2021 21:29:48 - INFO - __main__ - Step 45515: {'lr': 0.00040072391790415873, 'samples': 8738880, 'steps': 45514, 'loss/train': 1.7055184841156006} -08/30/2021 21:29:49 - INFO - __main__ - Step 45516: {'lr': 0.00040071968404323824, 'samples': 8739072, 'steps': 45515, 'loss/train': 1.5958950519561768} -08/30/2021 21:29:49 - INFO - __main__ - Step 45517: {'lr': 0.0004007154501144058, 'samples': 8739264, 'steps': 45516, 'loss/train': 1.3519912958145142} -08/30/2021 21:29:49 - INFO - __main__ - Step 45518: {'lr': 0.00040071121611766325, 'samples': 8739456, 'steps': 45517, 'loss/train': 1.5267068147659302} -08/30/2021 21:29:51 - INFO - __main__ - Step 45519: {'lr': 0.00040070698205301266, 'samples': 8739648, 'steps': 45518, 'loss/train': 1.2159485816955566} -08/30/2021 21:29:52 - INFO - __main__ - Step 45520: {'lr': 0.0004007027479204557, 'samples': 8739840, 'steps': 45519, 'loss/train': 1.5194048881530762} -08/30/2021 21:29:52 - INFO - __main__ - Step 45521: {'lr': 0.0004006985137199945, 'samples': 8740032, 'steps': 45520, 'loss/train': 1.0500580072402954} -08/30/2021 21:29:52 - INFO - __main__ - Step 45522: {'lr': 0.00040069427945163083, 'samples': 8740224, 'steps': 45521, 'loss/train': 1.6080890893936157} -08/30/2021 21:29:53 - INFO - __main__ - Step 45523: {'lr': 0.00040069004511536667, 'samples': 8740416, 'steps': 45522, 'loss/train': 0.7664833664894104} -08/30/2021 21:29:54 - INFO - __main__ - Step 45524: {'lr': 0.00040068581071120386, 'samples': 8740608, 'steps': 45523, 'loss/train': 1.7894295454025269} -08/30/2021 21:29:55 - INFO - __main__ - Step 45525: {'lr': 0.00040068157623914435, 'samples': 8740800, 'steps': 45524, 'loss/train': 1.0367735624313354} -08/30/2021 21:29:55 - INFO - __main__ - Step 45526: {'lr': 0.0004006773416991901, 'samples': 8740992, 'steps': 45525, 'loss/train': 0.7200155854225159} -08/30/2021 21:29:55 - INFO - __main__ - Step 45527: {'lr': 0.00040067310709134295, 'samples': 8741184, 'steps': 45526, 'loss/train': 1.2963911294937134} -08/30/2021 21:29:56 - INFO - __main__ - Step 45528: {'lr': 0.0004006688724156048, 'samples': 8741376, 'steps': 45527, 'loss/train': 1.4715675115585327} -08/30/2021 21:29:56 - INFO - __main__ - Step 45529: {'lr': 0.00040066463767197757, 'samples': 8741568, 'steps': 45528, 'loss/train': 5.922485828399658} -08/30/2021 21:29:57 - INFO - __main__ - Step 45530: {'lr': 0.00040066040286046325, 'samples': 8741760, 'steps': 45529, 'loss/train': 1.1490989923477173} -08/30/2021 21:29:58 - INFO - __main__ - Step 45531: {'lr': 0.0004006561679810636, 'samples': 8741952, 'steps': 45530, 'loss/train': 1.5902715921401978} -08/30/2021 21:29:58 - INFO - __main__ - Step 45532: {'lr': 0.0004006519330337807, 'samples': 8742144, 'steps': 45531, 'loss/train': 1.101464867591858} -08/30/2021 21:29:59 - INFO - __main__ - Step 45533: {'lr': 0.0004006476980186163, 'samples': 8742336, 'steps': 45532, 'loss/train': 1.519769310951233} -08/30/2021 21:29:59 - INFO - __main__ - Step 45534: {'lr': 0.0004006434629355723, 'samples': 8742528, 'steps': 45533, 'loss/train': 1.768357753753662} -08/30/2021 21:30:01 - INFO - __main__ - Step 45535: {'lr': 0.0004006392277846508, 'samples': 8742720, 'steps': 45534, 'loss/train': 1.5503679513931274} -08/30/2021 21:30:01 - INFO - __main__ - Step 45536: {'lr': 0.00040063499256585354, 'samples': 8742912, 'steps': 45535, 'loss/train': 1.3042975664138794} -08/30/2021 21:30:02 - INFO - __main__ - Step 45537: {'lr': 0.00040063075727918247, 'samples': 8743104, 'steps': 45536, 'loss/train': 1.399466872215271} -08/30/2021 21:30:02 - INFO - __main__ - Step 45538: {'lr': 0.0004006265219246395, 'samples': 8743296, 'steps': 45537, 'loss/train': 1.2500193119049072} -08/30/2021 21:30:02 - INFO - __main__ - Step 45539: {'lr': 0.00040062228650222657, 'samples': 8743488, 'steps': 45538, 'loss/train': 1.764947533607483} -08/30/2021 21:30:04 - INFO - __main__ - Step 45540: {'lr': 0.00040061805101194553, 'samples': 8743680, 'steps': 45539, 'loss/train': 1.8575208187103271} -08/30/2021 21:30:04 - INFO - __main__ - Step 45541: {'lr': 0.00040061381545379837, 'samples': 8743872, 'steps': 45540, 'loss/train': 1.5655728578567505} -08/30/2021 21:30:04 - INFO - __main__ - Step 45542: {'lr': 0.00040060957982778687, 'samples': 8744064, 'steps': 45541, 'loss/train': 1.728339672088623} -08/30/2021 21:30:05 - INFO - __main__ - Step 45543: {'lr': 0.0004006053441339131, 'samples': 8744256, 'steps': 45542, 'loss/train': 1.527356505393982} -08/30/2021 21:30:05 - INFO - __main__ - Step 45544: {'lr': 0.00040060110837217885, 'samples': 8744448, 'steps': 45543, 'loss/train': 1.4790219068527222} -08/30/2021 21:30:07 - INFO - __main__ - Step 45545: {'lr': 0.000400596872542586, 'samples': 8744640, 'steps': 45544, 'loss/train': 0.9987359642982483} -08/30/2021 21:30:07 - INFO - __main__ - Step 45546: {'lr': 0.0004005926366451367, 'samples': 8744832, 'steps': 45545, 'loss/train': 1.2463665008544922} -08/30/2021 21:30:07 - INFO - __main__ - Step 45547: {'lr': 0.0004005884006798325, 'samples': 8745024, 'steps': 45546, 'loss/train': 0.9123632907867432} -08/30/2021 21:30:08 - INFO - __main__ - Step 45548: {'lr': 0.0004005841646466756, 'samples': 8745216, 'steps': 45547, 'loss/train': 1.4175655841827393} -08/30/2021 21:30:08 - INFO - __main__ - Step 45549: {'lr': 0.00040057992854566774, 'samples': 8745408, 'steps': 45548, 'loss/train': 1.6521754264831543} -08/30/2021 21:30:10 - INFO - __main__ - Step 45550: {'lr': 0.0004005756923768109, 'samples': 8745600, 'steps': 45549, 'loss/train': 1.5313432216644287} -08/30/2021 21:30:10 - INFO - __main__ - Step 45551: {'lr': 0.0004005714561401069, 'samples': 8745792, 'steps': 45550, 'loss/train': 0.9201018810272217} -08/30/2021 21:30:10 - INFO - __main__ - Step 45552: {'lr': 0.0004005672198355579, 'samples': 8745984, 'steps': 45551, 'loss/train': 1.7975521087646484} -08/30/2021 21:30:11 - INFO - __main__ - Step 45553: {'lr': 0.00040056298346316554, 'samples': 8746176, 'steps': 45552, 'loss/train': 1.6051639318466187} -08/30/2021 21:30:11 - INFO - __main__ - Step 45554: {'lr': 0.0004005587470229318, 'samples': 8746368, 'steps': 45553, 'loss/train': 1.3946226835250854} -08/30/2021 21:30:13 - INFO - __main__ - Step 45555: {'lr': 0.00040055451051485865, 'samples': 8746560, 'steps': 45554, 'loss/train': 0.8503422737121582} -08/30/2021 21:30:13 - INFO - __main__ - Step 45556: {'lr': 0.0004005502739389479, 'samples': 8746752, 'steps': 45555, 'loss/train': 1.3847535848617554} -08/30/2021 21:30:14 - INFO - __main__ - Step 45557: {'lr': 0.00040054603729520154, 'samples': 8746944, 'steps': 45556, 'loss/train': 1.164264440536499} -08/30/2021 21:30:14 - INFO - __main__ - Step 45558: {'lr': 0.00040054180058362156, 'samples': 8747136, 'steps': 45557, 'loss/train': 1.205686330795288} -08/30/2021 21:30:14 - INFO - __main__ - Step 45559: {'lr': 0.0004005375638042097, 'samples': 8747328, 'steps': 45558, 'loss/train': 1.2713847160339355} -08/30/2021 21:30:15 - INFO - __main__ - Step 45560: {'lr': 0.0004005333269569679, 'samples': 8747520, 'steps': 45559, 'loss/train': 0.03529397398233414} -08/30/2021 21:30:16 - INFO - __main__ - Step 45561: {'lr': 0.0004005290900418982, 'samples': 8747712, 'steps': 45560, 'loss/train': 1.3542087078094482} -08/30/2021 21:30:17 - INFO - __main__ - Step 45562: {'lr': 0.0004005248530590023, 'samples': 8747904, 'steps': 45561, 'loss/train': 0.6402948498725891} -08/30/2021 21:30:17 - INFO - __main__ - Step 45563: {'lr': 0.0004005206160082823, 'samples': 8748096, 'steps': 45562, 'loss/train': 1.2478729486465454} -08/30/2021 21:30:17 - INFO - __main__ - Step 45564: {'lr': 0.00040051637888973996, 'samples': 8748288, 'steps': 45563, 'loss/train': 1.1593557596206665} -08/30/2021 21:30:18 - INFO - __main__ - Step 45565: {'lr': 0.0004005121417033773, 'samples': 8748480, 'steps': 45564, 'loss/train': 2.1077229976654053} -08/30/2021 21:30:19 - INFO - __main__ - Step 45566: {'lr': 0.0004005079044491963, 'samples': 8748672, 'steps': 45565, 'loss/train': 1.3774333000183105} -08/30/2021 21:30:20 - INFO - __main__ - Step 45567: {'lr': 0.0004005036671271986, 'samples': 8748864, 'steps': 45566, 'loss/train': 1.4116657972335815} -08/30/2021 21:30:20 - INFO - __main__ - Step 45568: {'lr': 0.00040049942973738626, 'samples': 8749056, 'steps': 45567, 'loss/train': 1.5779608488082886} -08/30/2021 21:30:21 - INFO - __main__ - Step 45569: {'lr': 0.00040049519227976135, 'samples': 8749248, 'steps': 45568, 'loss/train': 1.1621469259262085} -08/30/2021 21:30:21 - INFO - __main__ - Step 45570: {'lr': 0.0004004909547543255, 'samples': 8749440, 'steps': 45569, 'loss/train': 0.09808221459388733} -08/30/2021 21:30:23 - INFO - __main__ - Step 45571: {'lr': 0.0004004867171610808, 'samples': 8749632, 'steps': 45570, 'loss/train': 1.1585769653320312} -08/30/2021 21:30:24 - INFO - __main__ - Step 45572: {'lr': 0.00040048247950002917, 'samples': 8749824, 'steps': 45571, 'loss/train': 1.1929718255996704} -08/30/2021 21:30:24 - INFO - __main__ - Step 45573: {'lr': 0.0004004782417711724, 'samples': 8750016, 'steps': 45572, 'loss/train': 1.6099721193313599} -08/30/2021 21:30:24 - INFO - __main__ - Step 45574: {'lr': 0.0004004740039745124, 'samples': 8750208, 'steps': 45573, 'loss/train': 1.5693515539169312} -08/30/2021 21:30:25 - INFO - __main__ - Step 45575: {'lr': 0.0004004697661100512, 'samples': 8750400, 'steps': 45574, 'loss/train': 1.6056859493255615} -08/30/2021 21:30:25 - INFO - __main__ - Step 45576: {'lr': 0.0004004655281777906, 'samples': 8750592, 'steps': 45575, 'loss/train': 1.7467777729034424} -08/30/2021 21:30:27 - INFO - __main__ - Step 45577: {'lr': 0.0004004612901777326, 'samples': 8750784, 'steps': 45576, 'loss/train': 1.7978405952453613} -08/30/2021 21:30:27 - INFO - __main__ - Step 45578: {'lr': 0.000400457052109879, 'samples': 8750976, 'steps': 45577, 'loss/train': 1.581963300704956} -08/30/2021 21:30:28 - INFO - __main__ - Step 45579: {'lr': 0.0004004528139742319, 'samples': 8751168, 'steps': 45578, 'loss/train': 1.3904138803482056} -08/30/2021 21:30:28 - INFO - __main__ - Step 45580: {'lr': 0.00040044857577079294, 'samples': 8751360, 'steps': 45579, 'loss/train': 1.352089285850525} -08/30/2021 21:30:28 - INFO - __main__ - Step 45581: {'lr': 0.00040044433749956434, 'samples': 8751552, 'steps': 45580, 'loss/train': 1.4210666418075562} -08/30/2021 21:30:29 - INFO - __main__ - Step 45582: {'lr': 0.0004004400991605477, 'samples': 8751744, 'steps': 45581, 'loss/train': 1.3799400329589844} -08/30/2021 21:30:30 - INFO - __main__ - Step 45583: {'lr': 0.0004004358607537451, 'samples': 8751936, 'steps': 45582, 'loss/train': 1.426185965538025} -08/30/2021 21:30:31 - INFO - __main__ - Step 45584: {'lr': 0.0004004316222791584, 'samples': 8752128, 'steps': 45583, 'loss/train': 0.9114278554916382} -08/30/2021 21:30:31 - INFO - __main__ - Step 45585: {'lr': 0.00040042738373678954, 'samples': 8752320, 'steps': 45584, 'loss/train': 1.2945493459701538} -08/30/2021 21:30:31 - INFO - __main__ - Step 45586: {'lr': 0.0004004231451266406, 'samples': 8752512, 'steps': 45585, 'loss/train': 1.7090985774993896} -08/30/2021 21:30:32 - INFO - __main__ - Step 45587: {'lr': 0.0004004189064487131, 'samples': 8752704, 'steps': 45586, 'loss/train': 1.0333878993988037} -08/30/2021 21:30:33 - INFO - __main__ - Step 45588: {'lr': 0.00040041466770300923, 'samples': 8752896, 'steps': 45587, 'loss/train': 1.3956458568572998} -08/30/2021 21:30:34 - INFO - __main__ - Step 45589: {'lr': 0.00040041042888953085, 'samples': 8753088, 'steps': 45588, 'loss/train': 1.5097129344940186} -08/30/2021 21:30:34 - INFO - __main__ - Step 45590: {'lr': 0.0004004061900082798, 'samples': 8753280, 'steps': 45589, 'loss/train': 1.5660483837127686} -08/30/2021 21:30:35 - INFO - __main__ - Step 45591: {'lr': 0.00040040195105925803, 'samples': 8753472, 'steps': 45590, 'loss/train': 1.2408846616744995} -08/30/2021 21:30:35 - INFO - __main__ - Step 45592: {'lr': 0.00040039771204246756, 'samples': 8753664, 'steps': 45591, 'loss/train': 1.593881607055664} -08/30/2021 21:30:36 - INFO - __main__ - Step 45593: {'lr': 0.0004003934729579101, 'samples': 8753856, 'steps': 45592, 'loss/train': 0.12923464179039001} -08/30/2021 21:30:37 - INFO - __main__ - Step 45594: {'lr': 0.0004003892338055877, 'samples': 8754048, 'steps': 45593, 'loss/train': 0.11357492953538895} -08/30/2021 21:30:37 - INFO - __main__ - Step 45595: {'lr': 0.0004003849945855023, 'samples': 8754240, 'steps': 45594, 'loss/train': 1.4381378889083862} -08/30/2021 21:30:38 - INFO - __main__ - Step 45596: {'lr': 0.0004003807552976556, 'samples': 8754432, 'steps': 45595, 'loss/train': 1.894063949584961} -08/30/2021 21:30:38 - INFO - __main__ - Step 45597: {'lr': 0.00040037651594204975, 'samples': 8754624, 'steps': 45596, 'loss/train': 1.1790415048599243} -08/30/2021 21:30:40 - INFO - __main__ - Step 45598: {'lr': 0.00040037227651868655, 'samples': 8754816, 'steps': 45597, 'loss/train': 1.7249220609664917} -08/30/2021 21:30:40 - INFO - __main__ - Step 45599: {'lr': 0.000400368037027568, 'samples': 8755008, 'steps': 45598, 'loss/train': 1.5415078401565552} -08/30/2021 21:30:40 - INFO - __main__ - Step 45600: {'lr': 0.0004003637974686958, 'samples': 8755200, 'steps': 45599, 'loss/train': 1.1206258535385132} -08/30/2021 21:30:41 - INFO - __main__ - Step 45601: {'lr': 0.000400359557842072, 'samples': 8755392, 'steps': 45600, 'loss/train': 1.5202081203460693} -08/30/2021 21:30:41 - INFO - __main__ - Step 45602: {'lr': 0.00040035531814769853, 'samples': 8755584, 'steps': 45601, 'loss/train': 1.4554232358932495} -08/30/2021 21:30:43 - INFO - __main__ - Step 45603: {'lr': 0.0004003510783855774, 'samples': 8755776, 'steps': 45602, 'loss/train': 1.5050292015075684} -08/30/2021 21:30:43 - INFO - __main__ - Step 45604: {'lr': 0.00040034683855571027, 'samples': 8755968, 'steps': 45603, 'loss/train': 1.5374759435653687} -08/30/2021 21:30:44 - INFO - __main__ - Step 45605: {'lr': 0.00040034259865809915, 'samples': 8756160, 'steps': 45604, 'loss/train': 1.7383564710617065} -08/30/2021 21:30:44 - INFO - __main__ - Step 45606: {'lr': 0.00040033835869274605, 'samples': 8756352, 'steps': 45605, 'loss/train': 1.903132438659668} -08/30/2021 21:30:44 - INFO - __main__ - Step 45607: {'lr': 0.00040033411865965276, 'samples': 8756544, 'steps': 45606, 'loss/train': 1.8588534593582153} -08/30/2021 21:30:46 - INFO - __main__ - Step 45608: {'lr': 0.0004003298785588212, 'samples': 8756736, 'steps': 45607, 'loss/train': 0.06825053691864014} -08/30/2021 21:30:47 - INFO - __main__ - Step 45609: {'lr': 0.00040032563839025335, 'samples': 8756928, 'steps': 45608, 'loss/train': 1.7190632820129395} -08/30/2021 21:30:47 - INFO - __main__ - Step 45610: {'lr': 0.00040032139815395114, 'samples': 8757120, 'steps': 45609, 'loss/train': 1.9274654388427734} -08/30/2021 21:30:47 - INFO - __main__ - Step 45611: {'lr': 0.00040031715784991643, 'samples': 8757312, 'steps': 45610, 'loss/train': 0.8872581720352173} -08/30/2021 21:30:48 - INFO - __main__ - Step 45612: {'lr': 0.000400312917478151, 'samples': 8757504, 'steps': 45611, 'loss/train': 1.425658106803894} -08/30/2021 21:30:48 - INFO - __main__ - Step 45613: {'lr': 0.000400308677038657, 'samples': 8757696, 'steps': 45612, 'loss/train': 0.7507902383804321} -08/30/2021 21:30:49 - INFO - __main__ - Step 45614: {'lr': 0.0004003044365314362, 'samples': 8757888, 'steps': 45613, 'loss/train': 1.42909836769104} -08/30/2021 21:30:50 - INFO - __main__ - Step 45615: {'lr': 0.0004003001959564906, 'samples': 8758080, 'steps': 45614, 'loss/train': 1.3172701597213745} -08/30/2021 21:30:50 - INFO - __main__ - Step 45616: {'lr': 0.000400295955313822, 'samples': 8758272, 'steps': 45615, 'loss/train': 1.369828224182129} -08/30/2021 21:30:51 - INFO - __main__ - Step 45617: {'lr': 0.0004002917146034323, 'samples': 8758464, 'steps': 45616, 'loss/train': 1.1888891458511353} -08/30/2021 21:30:51 - INFO - __main__ - Step 45618: {'lr': 0.0004002874738253235, 'samples': 8758656, 'steps': 45617, 'loss/train': 1.2672510147094727} -08/30/2021 21:30:53 - INFO - __main__ - Step 45619: {'lr': 0.00040028323297949754, 'samples': 8758848, 'steps': 45618, 'loss/train': 1.2632243633270264} -08/30/2021 21:30:53 - INFO - __main__ - Step 45620: {'lr': 0.0004002789920659563, 'samples': 8759040, 'steps': 45619, 'loss/train': 1.6408114433288574} -08/30/2021 21:30:54 - INFO - __main__ - Step 45621: {'lr': 0.0004002747510847016, 'samples': 8759232, 'steps': 45620, 'loss/train': 1.0925028324127197} -08/30/2021 21:30:54 - INFO - __main__ - Step 45622: {'lr': 0.0004002705100357354, 'samples': 8759424, 'steps': 45621, 'loss/train': 1.4130882024765015} -08/30/2021 21:30:54 - INFO - __main__ - Step 45623: {'lr': 0.00040026626891905963, 'samples': 8759616, 'steps': 45622, 'loss/train': 0.97480708360672} -08/30/2021 21:30:55 - INFO - __main__ - Step 45624: {'lr': 0.00040026202773467623, 'samples': 8759808, 'steps': 45623, 'loss/train': 1.5982215404510498} -08/30/2021 21:30:57 - INFO - __main__ - Step 45625: {'lr': 0.00040025778648258706, 'samples': 8760000, 'steps': 45624, 'loss/train': 0.045749176293611526} -08/30/2021 21:30:57 - INFO - __main__ - Step 45626: {'lr': 0.00040025354516279413, 'samples': 8760192, 'steps': 45625, 'loss/train': 1.8206430673599243} -08/30/2021 21:30:57 - INFO - __main__ - Step 45627: {'lr': 0.0004002493037752992, 'samples': 8760384, 'steps': 45626, 'loss/train': 1.7614457607269287} -08/30/2021 21:30:58 - INFO - __main__ - Step 45628: {'lr': 0.0004002450623201043, 'samples': 8760576, 'steps': 45627, 'loss/train': 1.2492746114730835} -08/30/2021 21:30:58 - INFO - __main__ - Step 45629: {'lr': 0.0004002408207972111, 'samples': 8760768, 'steps': 45628, 'loss/train': 1.8820266723632812} -08/30/2021 21:31:00 - INFO - __main__ - Step 45630: {'lr': 0.00040023657920662195, 'samples': 8760960, 'steps': 45629, 'loss/train': 1.9036760330200195} -08/30/2021 21:31:00 - INFO - __main__ - Step 45631: {'lr': 0.0004002323375483384, 'samples': 8761152, 'steps': 45630, 'loss/train': 1.6004084348678589} -08/30/2021 21:31:01 - INFO - __main__ - Step 45632: {'lr': 0.00040022809582236245, 'samples': 8761344, 'steps': 45631, 'loss/train': 0.8890056014060974} -08/30/2021 21:31:01 - INFO - __main__ - Step 45633: {'lr': 0.0004002238540286961, 'samples': 8761536, 'steps': 45632, 'loss/train': 1.4282796382904053} -08/30/2021 21:31:01 - INFO - __main__ - Step 45634: {'lr': 0.00040021961216734123, 'samples': 8761728, 'steps': 45633, 'loss/train': 1.3680033683776855} -08/30/2021 21:31:02 - INFO - __main__ - Step 45635: {'lr': 0.0004002153702382997, 'samples': 8761920, 'steps': 45634, 'loss/train': 1.284507155418396} -08/30/2021 21:31:03 - INFO - __main__ - Step 45636: {'lr': 0.0004002111282415734, 'samples': 8762112, 'steps': 45635, 'loss/train': 0.9587433338165283} -08/30/2021 21:31:04 - INFO - __main__ - Step 45637: {'lr': 0.00040020688617716427, 'samples': 8762304, 'steps': 45636, 'loss/train': 1.4804365634918213} -08/30/2021 21:31:04 - INFO - __main__ - Step 45638: {'lr': 0.0004002026440450742, 'samples': 8762496, 'steps': 45637, 'loss/train': 0.9273775815963745} -08/30/2021 21:31:04 - INFO - __main__ - Step 45639: {'lr': 0.0004001984018453052, 'samples': 8762688, 'steps': 45638, 'loss/train': 1.2588932514190674} -08/30/2021 21:31:05 - INFO - __main__ - Step 45640: {'lr': 0.0004001941595778592, 'samples': 8762880, 'steps': 45639, 'loss/train': 0.9720456004142761} -08/30/2021 21:31:06 - INFO - __main__ - Step 45641: {'lr': 0.0004001899172427379, 'samples': 8763072, 'steps': 45640, 'loss/train': 1.5970231294631958} -08/30/2021 21:31:07 - INFO - __main__ - Step 45642: {'lr': 0.00040018567483994337, 'samples': 8763264, 'steps': 45641, 'loss/train': 1.4056333303451538} -08/30/2021 21:31:07 - INFO - __main__ - Step 45643: {'lr': 0.00040018143236947756, 'samples': 8763456, 'steps': 45642, 'loss/train': 1.3044254779815674} -08/30/2021 21:31:07 - INFO - __main__ - Step 45644: {'lr': 0.0004001771898313422, 'samples': 8763648, 'steps': 45643, 'loss/train': 1.5113991498947144} -08/30/2021 21:31:08 - INFO - __main__ - Step 45645: {'lr': 0.00040017294722553945, 'samples': 8763840, 'steps': 45644, 'loss/train': 0.6521874666213989} -08/30/2021 21:31:08 - INFO - __main__ - Step 45646: {'lr': 0.000400168704552071, 'samples': 8764032, 'steps': 45645, 'loss/train': 0.3046039938926697} -08/30/2021 21:31:10 - INFO - __main__ - Step 45647: {'lr': 0.0004001644618109389, 'samples': 8764224, 'steps': 45646, 'loss/train': 0.9743245244026184} -08/30/2021 21:31:10 - INFO - __main__ - Step 45648: {'lr': 0.00040016021900214497, 'samples': 8764416, 'steps': 45647, 'loss/train': 1.7741951942443848} -08/30/2021 21:31:10 - INFO - __main__ - Step 45649: {'lr': 0.00040015597612569115, 'samples': 8764608, 'steps': 45648, 'loss/train': 1.0282500982284546} -08/30/2021 21:31:11 - INFO - __main__ - Step 45650: {'lr': 0.00040015173318157937, 'samples': 8764800, 'steps': 45649, 'loss/train': 1.1559091806411743} -08/30/2021 21:31:11 - INFO - __main__ - Step 45651: {'lr': 0.00040014749016981154, 'samples': 8764992, 'steps': 45650, 'loss/train': 1.6319549083709717} -08/30/2021 21:31:13 - INFO - __main__ - Step 45652: {'lr': 0.00040014324709038965, 'samples': 8765184, 'steps': 45651, 'loss/train': 1.382581353187561} -08/30/2021 21:31:13 - INFO - __main__ - Step 45653: {'lr': 0.00040013900394331544, 'samples': 8765376, 'steps': 45652, 'loss/train': 1.2670832872390747} -08/30/2021 21:31:14 - INFO - __main__ - Step 45654: {'lr': 0.0004001347607285909, 'samples': 8765568, 'steps': 45653, 'loss/train': 1.1949220895767212} -08/30/2021 21:31:14 - INFO - __main__ - Step 45655: {'lr': 0.000400130517446218, 'samples': 8765760, 'steps': 45654, 'loss/train': 0.4517842233181} -08/30/2021 21:31:14 - INFO - __main__ - Step 45656: {'lr': 0.00040012627409619853, 'samples': 8765952, 'steps': 45655, 'loss/train': 1.4933371543884277} -08/30/2021 21:31:16 - INFO - __main__ - Step 45657: {'lr': 0.00040012203067853457, 'samples': 8766144, 'steps': 45656, 'loss/train': 1.934327483177185} -08/30/2021 21:31:16 - INFO - __main__ - Step 45658: {'lr': 0.0004001177871932279, 'samples': 8766336, 'steps': 45657, 'loss/train': 1.5139893293380737} -08/30/2021 21:31:16 - INFO - __main__ - Step 45659: {'lr': 0.00040011354364028053, 'samples': 8766528, 'steps': 45658, 'loss/train': 1.7372409105300903} -08/30/2021 21:31:17 - INFO - __main__ - Step 45660: {'lr': 0.00040010930001969426, 'samples': 8766720, 'steps': 45659, 'loss/train': 1.2435288429260254} -08/30/2021 21:31:17 - INFO - __main__ - Step 45661: {'lr': 0.00040010505633147106, 'samples': 8766912, 'steps': 45660, 'loss/train': 1.042527198791504} -08/30/2021 21:31:19 - INFO - __main__ - Step 45662: {'lr': 0.00040010081257561283, 'samples': 8767104, 'steps': 45661, 'loss/train': 1.4332000017166138} -08/30/2021 21:31:20 - INFO - __main__ - Step 45663: {'lr': 0.0004000965687521215, 'samples': 8767296, 'steps': 45662, 'loss/train': 1.4125158786773682} -08/30/2021 21:31:20 - INFO - __main__ - Step 45664: {'lr': 0.0004000923248609989, 'samples': 8767488, 'steps': 45663, 'loss/train': 0.5679012537002563} -08/30/2021 21:31:20 - INFO - __main__ - Step 45665: {'lr': 0.00040008808090224714, 'samples': 8767680, 'steps': 45664, 'loss/train': 1.638641119003296} -08/30/2021 21:31:21 - INFO - __main__ - Step 45666: {'lr': 0.0004000838368758679, 'samples': 8767872, 'steps': 45665, 'loss/train': 0.9655702114105225} -08/30/2021 21:31:21 - INFO - __main__ - Step 45667: {'lr': 0.00040007959278186327, 'samples': 8768064, 'steps': 45666, 'loss/train': 0.028480539098381996} -08/30/2021 21:31:23 - INFO - __main__ - Step 45668: {'lr': 0.0004000753486202351, 'samples': 8768256, 'steps': 45667, 'loss/train': 1.4113613367080688} -08/30/2021 21:31:23 - INFO - __main__ - Step 45669: {'lr': 0.0004000711043909853, 'samples': 8768448, 'steps': 45668, 'loss/train': 1.301478624343872} -08/30/2021 21:31:23 - INFO - __main__ - Step 45670: {'lr': 0.0004000668600941157, 'samples': 8768640, 'steps': 45669, 'loss/train': 1.0411229133605957} -08/30/2021 21:31:24 - INFO - __main__ - Step 45671: {'lr': 0.00040006261572962833, 'samples': 8768832, 'steps': 45670, 'loss/train': 1.7721610069274902} -08/30/2021 21:31:24 - INFO - __main__ - Step 45672: {'lr': 0.00040005837129752496, 'samples': 8769024, 'steps': 45671, 'loss/train': 1.4920334815979004} -08/30/2021 21:31:24 - INFO - __main__ - Step 45673: {'lr': 0.00040005412679780777, 'samples': 8769216, 'steps': 45672, 'loss/train': 1.280248761177063} -08/30/2021 21:31:26 - INFO - __main__ - Step 45674: {'lr': 0.00040004988223047843, 'samples': 8769408, 'steps': 45673, 'loss/train': 1.319585919380188} -08/30/2021 21:31:26 - INFO - __main__ - Step 45675: {'lr': 0.0004000456375955389, 'samples': 8769600, 'steps': 45674, 'loss/train': 0.6134784817695618} -08/30/2021 21:31:27 - INFO - __main__ - Step 45676: {'lr': 0.00040004139289299127, 'samples': 8769792, 'steps': 45675, 'loss/train': 1.514657974243164} -08/30/2021 21:31:27 - INFO - __main__ - Step 45677: {'lr': 0.0004000371481228371, 'samples': 8769984, 'steps': 45676, 'loss/train': 1.6194335222244263} -08/30/2021 21:31:28 - INFO - __main__ - Step 45678: {'lr': 0.00040003290328507855, 'samples': 8770176, 'steps': 45677, 'loss/train': 1.5988292694091797} -08/30/2021 21:31:28 - INFO - __main__ - Step 45679: {'lr': 0.0004000286583797176, 'samples': 8770368, 'steps': 45678, 'loss/train': 1.1662352085113525} -08/30/2021 21:31:29 - INFO - __main__ - Step 45680: {'lr': 0.000400024413406756, 'samples': 8770560, 'steps': 45679, 'loss/train': 5.883415222167969} -08/30/2021 21:31:30 - INFO - __main__ - Step 45681: {'lr': 0.0004000201683661957, 'samples': 8770752, 'steps': 45680, 'loss/train': 0.9710056781768799} -08/30/2021 21:31:30 - INFO - __main__ - Step 45682: {'lr': 0.0004000159232580386, 'samples': 8770944, 'steps': 45681, 'loss/train': 1.4683516025543213} -08/30/2021 21:31:31 - INFO - __main__ - Step 45683: {'lr': 0.0004000116780822867, 'samples': 8771136, 'steps': 45682, 'loss/train': 1.7683079242706299} -08/30/2021 21:31:31 - INFO - __main__ - Step 45684: {'lr': 0.0004000074328389418, 'samples': 8771328, 'steps': 45683, 'loss/train': 1.3312487602233887} -08/30/2021 21:31:33 - INFO - __main__ - Step 45685: {'lr': 0.0004000031875280059, 'samples': 8771520, 'steps': 45684, 'loss/train': 1.3476998805999756} -08/30/2021 21:31:34 - INFO - __main__ - Step 45686: {'lr': 0.00039999894214948087, 'samples': 8771712, 'steps': 45685, 'loss/train': 1.0608386993408203} -08/30/2021 21:31:34 - INFO - __main__ - Step 45687: {'lr': 0.00039999469670336864, 'samples': 8771904, 'steps': 45686, 'loss/train': 1.2171738147735596} -08/30/2021 21:31:34 - INFO - __main__ - Step 45688: {'lr': 0.0003999904511896711, 'samples': 8772096, 'steps': 45687, 'loss/train': 1.53910231590271} -08/30/2021 21:31:35 - INFO - __main__ - Step 45689: {'lr': 0.00039998620560839014, 'samples': 8772288, 'steps': 45688, 'loss/train': 1.030777096748352} -08/30/2021 21:31:36 - INFO - __main__ - Step 45690: {'lr': 0.0003999819599595278, 'samples': 8772480, 'steps': 45689, 'loss/train': 0.5401210784912109} -08/30/2021 21:31:37 - INFO - __main__ - Step 45691: {'lr': 0.00039997771424308583, 'samples': 8772672, 'steps': 45690, 'loss/train': 0.47847780585289} -08/30/2021 21:31:37 - INFO - __main__ - Step 45692: {'lr': 0.0003999734684590662, 'samples': 8772864, 'steps': 45691, 'loss/train': 1.5724024772644043} -08/30/2021 21:31:37 - INFO - __main__ - Step 45693: {'lr': 0.0003999692226074709, 'samples': 8773056, 'steps': 45692, 'loss/train': 1.4545607566833496} -08/30/2021 21:31:38 - INFO - __main__ - Step 45694: {'lr': 0.0003999649766883018, 'samples': 8773248, 'steps': 45693, 'loss/train': 1.3308472633361816} -08/30/2021 21:31:39 - INFO - __main__ - Step 45695: {'lr': 0.0003999607307015607, 'samples': 8773440, 'steps': 45694, 'loss/train': 1.6001659631729126} -08/30/2021 21:31:40 - INFO - __main__ - Step 45696: {'lr': 0.00039995648464724966, 'samples': 8773632, 'steps': 45695, 'loss/train': 1.3919919729232788} -08/30/2021 21:31:40 - INFO - __main__ - Step 45697: {'lr': 0.00039995223852537054, 'samples': 8773824, 'steps': 45696, 'loss/train': 1.4473979473114014} -08/30/2021 21:31:40 - INFO - __main__ - Step 45698: {'lr': 0.0003999479923359253, 'samples': 8774016, 'steps': 45697, 'loss/train': 1.136098027229309} -08/30/2021 21:31:41 - INFO - __main__ - Step 45699: {'lr': 0.0003999437460789157, 'samples': 8774208, 'steps': 45698, 'loss/train': 1.8405425548553467} -08/30/2021 21:31:43 - INFO - __main__ - Step 45700: {'lr': 0.0003999394997543439, 'samples': 8774400, 'steps': 45699, 'loss/train': 1.5210239887237549} -08/30/2021 21:31:43 - INFO - __main__ - Step 45701: {'lr': 0.0003999352533622116, 'samples': 8774592, 'steps': 45700, 'loss/train': 0.22797487676143646} -08/30/2021 21:31:43 - INFO - __main__ - Step 45702: {'lr': 0.00039993100690252084, 'samples': 8774784, 'steps': 45701, 'loss/train': 1.781153917312622} -08/30/2021 21:31:44 - INFO - __main__ - Step 45703: {'lr': 0.00039992676037527337, 'samples': 8774976, 'steps': 45702, 'loss/train': 1.6705224514007568} -08/30/2021 21:31:44 - INFO - __main__ - Step 45704: {'lr': 0.0003999225137804713, 'samples': 8775168, 'steps': 45703, 'loss/train': 1.9252976179122925} -08/30/2021 21:31:45 - INFO - __main__ - Step 45705: {'lr': 0.0003999182671181164, 'samples': 8775360, 'steps': 45704, 'loss/train': 1.451731562614441} -08/30/2021 21:31:46 - INFO - __main__ - Step 45706: {'lr': 0.00039991402038821067, 'samples': 8775552, 'steps': 45705, 'loss/train': 0.5823312401771545} -08/30/2021 21:31:46 - INFO - __main__ - Step 45707: {'lr': 0.00039990977359075607, 'samples': 8775744, 'steps': 45706, 'loss/train': 1.7803608179092407} -08/30/2021 21:31:47 - INFO - __main__ - Step 45708: {'lr': 0.00039990552672575436, 'samples': 8775936, 'steps': 45707, 'loss/train': 1.5841566324234009} -08/30/2021 21:31:47 - INFO - __main__ - Step 45709: {'lr': 0.00039990127979320757, 'samples': 8776128, 'steps': 45708, 'loss/train': 1.2163341045379639} -08/30/2021 21:31:49 - INFO - __main__ - Step 45710: {'lr': 0.00039989703279311753, 'samples': 8776320, 'steps': 45709, 'loss/train': 1.7694246768951416} -08/30/2021 21:31:49 - INFO - __main__ - Step 45711: {'lr': 0.00039989278572548625, 'samples': 8776512, 'steps': 45710, 'loss/train': 1.7745155096054077} -08/30/2021 21:31:49 - INFO - __main__ - Step 45712: {'lr': 0.00039988853859031557, 'samples': 8776704, 'steps': 45711, 'loss/train': 1.1858346462249756} -08/30/2021 21:31:50 - INFO - __main__ - Step 45713: {'lr': 0.0003998842913876074, 'samples': 8776896, 'steps': 45712, 'loss/train': 1.0947071313858032} -08/30/2021 21:31:50 - INFO - __main__ - Step 45714: {'lr': 0.0003998800441173637, 'samples': 8777088, 'steps': 45713, 'loss/train': 1.3598521947860718} -08/30/2021 21:31:50 - INFO - __main__ - Step 45715: {'lr': 0.00039987579677958643, 'samples': 8777280, 'steps': 45714, 'loss/train': 1.56691575050354} -08/30/2021 21:31:52 - INFO - __main__ - Step 45716: {'lr': 0.0003998715493742774, 'samples': 8777472, 'steps': 45715, 'loss/train': 1.5442273616790771} -08/30/2021 21:31:52 - INFO - __main__ - Step 45717: {'lr': 0.0003998673019014385, 'samples': 8777664, 'steps': 45716, 'loss/train': 2.142970085144043} -08/30/2021 21:31:53 - INFO - __main__ - Step 45718: {'lr': 0.0003998630543610717, 'samples': 8777856, 'steps': 45717, 'loss/train': 1.1037765741348267} -08/30/2021 21:31:53 - INFO - __main__ - Step 45719: {'lr': 0.00039985880675317897, 'samples': 8778048, 'steps': 45718, 'loss/train': 1.637785792350769} -08/30/2021 21:31:54 - INFO - __main__ - Step 45720: {'lr': 0.0003998545590777622, 'samples': 8778240, 'steps': 45719, 'loss/train': 1.7826141119003296} -08/30/2021 21:31:55 - INFO - __main__ - Step 45721: {'lr': 0.0003998503113348233, 'samples': 8778432, 'steps': 45720, 'loss/train': 1.620204210281372} -08/30/2021 21:31:55 - INFO - __main__ - Step 45722: {'lr': 0.0003998460635243641, 'samples': 8778624, 'steps': 45721, 'loss/train': 1.5672633647918701} -08/30/2021 21:31:56 - INFO - __main__ - Step 45723: {'lr': 0.00039984181564638654, 'samples': 8778816, 'steps': 45722, 'loss/train': 1.310011625289917} -08/30/2021 21:31:56 - INFO - __main__ - Step 45724: {'lr': 0.00039983756770089264, 'samples': 8779008, 'steps': 45723, 'loss/train': 1.7102843523025513} -08/30/2021 21:31:56 - INFO - __main__ - Step 45725: {'lr': 0.0003998333196878843, 'samples': 8779200, 'steps': 45724, 'loss/train': 1.3844170570373535} -08/30/2021 21:31:58 - INFO - __main__ - Step 45726: {'lr': 0.00039982907160736325, 'samples': 8779392, 'steps': 45725, 'loss/train': 1.552479863166809} -08/30/2021 21:31:59 - INFO - __main__ - Step 45727: {'lr': 0.00039982482345933155, 'samples': 8779584, 'steps': 45726, 'loss/train': 1.3059972524642944} -08/30/2021 21:31:59 - INFO - __main__ - Step 45728: {'lr': 0.00039982057524379124, 'samples': 8779776, 'steps': 45727, 'loss/train': 1.1507110595703125} -08/30/2021 21:31:59 - INFO - __main__ - Step 45729: {'lr': 0.00039981632696074396, 'samples': 8779968, 'steps': 45728, 'loss/train': 1.6962097883224487} -08/30/2021 21:32:00 - INFO - __main__ - Step 45730: {'lr': 0.00039981207861019175, 'samples': 8780160, 'steps': 45729, 'loss/train': 1.4264379739761353} -08/30/2021 21:32:01 - INFO - __main__ - Step 45731: {'lr': 0.0003998078301921365, 'samples': 8780352, 'steps': 45730, 'loss/train': 1.6870983839035034} -08/30/2021 21:32:02 - INFO - __main__ - Step 45732: {'lr': 0.00039980358170658026, 'samples': 8780544, 'steps': 45731, 'loss/train': 0.5918977856636047} -08/30/2021 21:32:02 - INFO - __main__ - Step 45733: {'lr': 0.0003997993331535248, 'samples': 8780736, 'steps': 45732, 'loss/train': 1.3852952718734741} -08/30/2021 21:32:03 - INFO - __main__ - Step 45734: {'lr': 0.0003997950845329721, 'samples': 8780928, 'steps': 45733, 'loss/train': 0.7267405390739441} -08/30/2021 21:32:03 - INFO - __main__ - Step 45735: {'lr': 0.000399790835844924, 'samples': 8781120, 'steps': 45734, 'loss/train': 1.3988796472549438} -08/30/2021 21:32:03 - INFO - __main__ - Step 45736: {'lr': 0.00039978658708938244, 'samples': 8781312, 'steps': 45735, 'loss/train': 0.04054870456457138} -08/30/2021 21:32:05 - INFO - __main__ - Step 45737: {'lr': 0.00039978233826634934, 'samples': 8781504, 'steps': 45736, 'loss/train': 0.04201611131429672} -08/30/2021 21:32:06 - INFO - __main__ - Step 45738: {'lr': 0.0003997780893758267, 'samples': 8781696, 'steps': 45737, 'loss/train': 1.4057588577270508} -08/30/2021 21:32:06 - INFO - __main__ - Step 45739: {'lr': 0.0003997738404178164, 'samples': 8781888, 'steps': 45738, 'loss/train': 1.3034766912460327} -08/30/2021 21:32:07 - INFO - __main__ - Step 45740: {'lr': 0.00039976959139232017, 'samples': 8782080, 'steps': 45739, 'loss/train': 1.550410270690918} -08/30/2021 21:32:07 - INFO - __main__ - Step 45741: {'lr': 0.0003997653422993402, 'samples': 8782272, 'steps': 45740, 'loss/train': 1.3442806005477905} -08/30/2021 21:32:09 - INFO - __main__ - Step 45742: {'lr': 0.0003997610931388782, 'samples': 8782464, 'steps': 45741, 'loss/train': 2.68050217628479} -08/30/2021 21:32:09 - INFO - __main__ - Step 45743: {'lr': 0.0003997568439109363, 'samples': 8782656, 'steps': 45742, 'loss/train': 1.544089913368225} -08/30/2021 21:32:09 - INFO - __main__ - Step 45744: {'lr': 0.00039975259461551613, 'samples': 8782848, 'steps': 45743, 'loss/train': 1.8000953197479248} -08/30/2021 21:32:10 - INFO - __main__ - Step 45745: {'lr': 0.0003997483452526198, 'samples': 8783040, 'steps': 45744, 'loss/train': 1.804950475692749} -08/30/2021 21:32:10 - INFO - __main__ - Step 45746: {'lr': 0.0003997440958222491, 'samples': 8783232, 'steps': 45745, 'loss/train': 1.5842504501342773} -08/30/2021 21:32:12 - INFO - __main__ - Step 45747: {'lr': 0.0003997398463244062, 'samples': 8783424, 'steps': 45746, 'loss/train': 2.106240749359131} -08/30/2021 21:32:12 - INFO - __main__ - Step 45748: {'lr': 0.00039973559675909274, 'samples': 8783616, 'steps': 45747, 'loss/train': 1.1705864667892456} -08/30/2021 21:32:12 - INFO - __main__ - Step 45749: {'lr': 0.00039973134712631067, 'samples': 8783808, 'steps': 45748, 'loss/train': 1.3314101696014404} -08/30/2021 21:32:13 - INFO - __main__ - Step 45750: {'lr': 0.00039972709742606207, 'samples': 8784000, 'steps': 45749, 'loss/train': 1.6287176609039307} -08/30/2021 21:32:13 - INFO - __main__ - Step 45751: {'lr': 0.00039972284765834866, 'samples': 8784192, 'steps': 45750, 'loss/train': 2.1587624549865723} -08/30/2021 21:32:15 - INFO - __main__ - Step 45752: {'lr': 0.00039971859782317245, 'samples': 8784384, 'steps': 45751, 'loss/train': 1.4193994998931885} -08/30/2021 21:32:15 - INFO - __main__ - Step 45753: {'lr': 0.0003997143479205354, 'samples': 8784576, 'steps': 45752, 'loss/train': 1.2462074756622314} -08/30/2021 21:32:16 - INFO - __main__ - Step 45754: {'lr': 0.0003997100979504394, 'samples': 8784768, 'steps': 45753, 'loss/train': 0.04681426286697388} -08/30/2021 21:32:16 - INFO - __main__ - Step 45755: {'lr': 0.00039970584791288626, 'samples': 8784960, 'steps': 45754, 'loss/train': 1.263257622718811} -08/30/2021 21:32:16 - INFO - __main__ - Step 45756: {'lr': 0.000399701597807878, 'samples': 8785152, 'steps': 45755, 'loss/train': 1.7074925899505615} -08/30/2021 21:32:18 - INFO - __main__ - Step 45757: {'lr': 0.00039969734763541657, 'samples': 8785344, 'steps': 45756, 'loss/train': 1.359625220298767} -08/30/2021 21:32:18 - INFO - __main__ - Step 45758: {'lr': 0.00039969309739550373, 'samples': 8785536, 'steps': 45757, 'loss/train': 1.2389707565307617} -08/30/2021 21:32:19 - INFO - __main__ - Step 45759: {'lr': 0.0003996888470881416, 'samples': 8785728, 'steps': 45758, 'loss/train': 1.407562255859375} -08/30/2021 21:32:19 - INFO - __main__ - Step 45760: {'lr': 0.0003996845967133319, 'samples': 8785920, 'steps': 45759, 'loss/train': 1.3659547567367554} -08/30/2021 21:32:19 - INFO - __main__ - Step 45761: {'lr': 0.0003996803462710766, 'samples': 8786112, 'steps': 45760, 'loss/train': 1.514388918876648} -08/30/2021 21:32:21 - INFO - __main__ - Step 45762: {'lr': 0.00039967609576137774, 'samples': 8786304, 'steps': 45761, 'loss/train': 1.777955174446106} -08/30/2021 21:32:22 - INFO - __main__ - Step 45763: {'lr': 0.0003996718451842371, 'samples': 8786496, 'steps': 45762, 'loss/train': 1.290058970451355} -08/30/2021 21:32:22 - INFO - __main__ - Step 45764: {'lr': 0.00039966759453965664, 'samples': 8786688, 'steps': 45763, 'loss/train': 1.766306757926941} -08/30/2021 21:32:22 - INFO - __main__ - Step 45765: {'lr': 0.00039966334382763826, 'samples': 8786880, 'steps': 45764, 'loss/train': 1.765210747718811} -08/30/2021 21:32:23 - INFO - __main__ - Step 45766: {'lr': 0.00039965909304818387, 'samples': 8787072, 'steps': 45765, 'loss/train': 1.630203366279602} -08/30/2021 21:32:25 - INFO - __main__ - Step 45767: {'lr': 0.00039965484220129546, 'samples': 8787264, 'steps': 45766, 'loss/train': 1.7340587377548218} -08/30/2021 21:32:25 - INFO - __main__ - Step 45768: {'lr': 0.0003996505912869749, 'samples': 8787456, 'steps': 45767, 'loss/train': 1.8549233675003052} -08/30/2021 21:32:25 - INFO - __main__ - Step 45769: {'lr': 0.000399646340305224, 'samples': 8787648, 'steps': 45768, 'loss/train': 0.6560509204864502} -08/30/2021 21:32:26 - INFO - __main__ - Step 45770: {'lr': 0.00039964208925604485, 'samples': 8787840, 'steps': 45769, 'loss/train': 0.8023548126220703} -08/30/2021 21:32:26 - INFO - __main__ - Step 45771: {'lr': 0.0003996378381394392, 'samples': 8788032, 'steps': 45770, 'loss/train': 1.5847631692886353} -08/30/2021 21:32:27 - INFO - __main__ - Step 45772: {'lr': 0.00039963358695540907, 'samples': 8788224, 'steps': 45771, 'loss/train': 1.3048385381698608} -08/30/2021 21:32:28 - INFO - __main__ - Step 45773: {'lr': 0.0003996293357039564, 'samples': 8788416, 'steps': 45772, 'loss/train': 1.6023977994918823} -08/30/2021 21:32:29 - INFO - __main__ - Step 45774: {'lr': 0.0003996250843850831, 'samples': 8788608, 'steps': 45773, 'loss/train': 1.0310152769088745} -08/30/2021 21:32:29 - INFO - __main__ - Step 45775: {'lr': 0.000399620832998791, 'samples': 8788800, 'steps': 45774, 'loss/train': 1.878286361694336} -08/30/2021 21:32:30 - INFO - __main__ - Step 45776: {'lr': 0.000399616581545082, 'samples': 8788992, 'steps': 45775, 'loss/train': 1.5252773761749268} -08/30/2021 21:32:30 - INFO - __main__ - Step 45777: {'lr': 0.0003996123300239581, 'samples': 8789184, 'steps': 45776, 'loss/train': 1.6312905550003052} -08/30/2021 21:32:30 - INFO - __main__ - Step 45778: {'lr': 0.0003996080784354212, 'samples': 8789376, 'steps': 45777, 'loss/train': 1.090775728225708} -08/30/2021 21:32:32 - INFO - __main__ - Step 45779: {'lr': 0.0003996038267794733, 'samples': 8789568, 'steps': 45778, 'loss/train': 0.096169114112854} -08/30/2021 21:32:32 - INFO - __main__ - Step 45780: {'lr': 0.0003995995750561161, 'samples': 8789760, 'steps': 45779, 'loss/train': 1.1614532470703125} -08/30/2021 21:32:33 - INFO - __main__ - Step 45781: {'lr': 0.00039959532326535175, 'samples': 8789952, 'steps': 45780, 'loss/train': 1.170967936515808} -08/30/2021 21:32:33 - INFO - __main__ - Step 45782: {'lr': 0.000399591071407182, 'samples': 8790144, 'steps': 45781, 'loss/train': 1.3381215333938599} -08/30/2021 21:32:33 - INFO - __main__ - Step 45783: {'lr': 0.0003995868194816088, 'samples': 8790336, 'steps': 45782, 'loss/train': 1.15363609790802} -08/30/2021 21:32:35 - INFO - __main__ - Step 45784: {'lr': 0.0003995825674886341, 'samples': 8790528, 'steps': 45783, 'loss/train': 1.415030598640442} -08/30/2021 21:32:35 - INFO - __main__ - Step 45785: {'lr': 0.00039957831542825983, 'samples': 8790720, 'steps': 45784, 'loss/train': 1.0968674421310425} -08/30/2021 21:32:36 - INFO - __main__ - Step 45786: {'lr': 0.0003995740633004878, 'samples': 8790912, 'steps': 45785, 'loss/train': 1.6236929893493652} -08/30/2021 21:32:36 - INFO - __main__ - Step 45787: {'lr': 0.00039956981110532007, 'samples': 8791104, 'steps': 45786, 'loss/train': 1.8155336380004883} -08/30/2021 21:32:36 - INFO - __main__ - Step 45788: {'lr': 0.0003995655588427586, 'samples': 8791296, 'steps': 45787, 'loss/train': 1.5406101942062378} -08/30/2021 21:32:38 - INFO - __main__ - Step 45789: {'lr': 0.00039956130651280504, 'samples': 8791488, 'steps': 45788, 'loss/train': 1.2359778881072998} -08/30/2021 21:32:38 - INFO - __main__ - Step 45790: {'lr': 0.0003995570541154615, 'samples': 8791680, 'steps': 45789, 'loss/train': 1.6529431343078613} -08/30/2021 21:32:39 - INFO - __main__ - Step 45791: {'lr': 0.0003995528016507298, 'samples': 8791872, 'steps': 45790, 'loss/train': 0.9503229260444641} -08/30/2021 21:32:39 - INFO - __main__ - Step 45792: {'lr': 0.000399548549118612, 'samples': 8792064, 'steps': 45791, 'loss/train': 0.8938019275665283} -08/30/2021 21:32:39 - INFO - __main__ - Step 45793: {'lr': 0.00039954429651910993, 'samples': 8792256, 'steps': 45792, 'loss/train': 1.4242010116577148} -08/30/2021 21:32:42 - INFO - __main__ - Step 45794: {'lr': 0.00039954004385222555, 'samples': 8792448, 'steps': 45793, 'loss/train': 1.5062648057937622} -08/30/2021 21:32:42 - INFO - __main__ - Step 45795: {'lr': 0.00039953579111796065, 'samples': 8792640, 'steps': 45794, 'loss/train': 1.07527494430542} -08/30/2021 21:32:42 - INFO - __main__ - Step 45796: {'lr': 0.00039953153831631726, 'samples': 8792832, 'steps': 45795, 'loss/train': 2.9385814666748047} -08/30/2021 21:32:43 - INFO - __main__ - Step 45797: {'lr': 0.0003995272854472972, 'samples': 8793024, 'steps': 45796, 'loss/train': 1.1036850214004517} -08/30/2021 21:32:43 - INFO - __main__ - Step 45798: {'lr': 0.00039952303251090254, 'samples': 8793216, 'steps': 45797, 'loss/train': 1.6317808628082275} -08/30/2021 21:32:44 - INFO - __main__ - Step 45799: {'lr': 0.00039951877950713513, 'samples': 8793408, 'steps': 45798, 'loss/train': 1.0030560493469238} -08/30/2021 21:32:45 - INFO - __main__ - Step 45800: {'lr': 0.0003995145264359968, 'samples': 8793600, 'steps': 45799, 'loss/train': 1.8060802221298218} -08/30/2021 21:32:45 - INFO - __main__ - Step 45801: {'lr': 0.00039951027329748957, 'samples': 8793792, 'steps': 45800, 'loss/train': 1.2176737785339355} -08/30/2021 21:32:46 - INFO - __main__ - Step 45802: {'lr': 0.0003995060200916153, 'samples': 8793984, 'steps': 45801, 'loss/train': 1.5483342409133911} -08/30/2021 21:32:46 - INFO - __main__ - Step 45803: {'lr': 0.0003995017668183759, 'samples': 8794176, 'steps': 45802, 'loss/train': 1.2297035455703735} -08/30/2021 21:32:47 - INFO - __main__ - Step 45804: {'lr': 0.0003994975134777733, 'samples': 8794368, 'steps': 45803, 'loss/train': 1.6194614171981812} -08/30/2021 21:32:48 - INFO - __main__ - Step 45805: {'lr': 0.00039949326006980944, 'samples': 8794560, 'steps': 45804, 'loss/train': 0.9340513348579407} -08/30/2021 21:32:49 - INFO - __main__ - Step 45806: {'lr': 0.0003994890065944863, 'samples': 8794752, 'steps': 45805, 'loss/train': 0.7877193689346313} -08/30/2021 21:32:49 - INFO - __main__ - Step 45807: {'lr': 0.00039948475305180567, 'samples': 8794944, 'steps': 45806, 'loss/train': 1.4938911199569702} -08/30/2021 21:32:50 - INFO - __main__ - Step 45808: {'lr': 0.0003994804994417695, 'samples': 8795136, 'steps': 45807, 'loss/train': 0.08275206387042999} -08/30/2021 21:32:50 - INFO - __main__ - Step 45809: {'lr': 0.0003994762457643797, 'samples': 8795328, 'steps': 45808, 'loss/train': 1.5253511667251587} -08/30/2021 21:32:52 - INFO - __main__ - Step 45810: {'lr': 0.0003994719920196383, 'samples': 8795520, 'steps': 45809, 'loss/train': 0.14636556804180145} -08/30/2021 21:32:52 - INFO - __main__ - Step 45811: {'lr': 0.00039946773820754704, 'samples': 8795712, 'steps': 45810, 'loss/train': 1.3765766620635986} -08/30/2021 21:32:52 - INFO - __main__ - Step 45812: {'lr': 0.00039946348432810797, 'samples': 8795904, 'steps': 45811, 'loss/train': 1.2858155965805054} -08/30/2021 21:32:53 - INFO - __main__ - Step 45813: {'lr': 0.0003994592303813229, 'samples': 8796096, 'steps': 45812, 'loss/train': 1.4192514419555664} -08/30/2021 21:32:53 - INFO - __main__ - Step 45814: {'lr': 0.00039945497636719384, 'samples': 8796288, 'steps': 45813, 'loss/train': 1.5997782945632935} -08/30/2021 21:32:53 - INFO - __main__ - Step 45815: {'lr': 0.00039945072228572275, 'samples': 8796480, 'steps': 45814, 'loss/train': 0.4692443311214447} -08/30/2021 21:32:55 - INFO - __main__ - Step 45816: {'lr': 0.0003994464681369114, 'samples': 8796672, 'steps': 45815, 'loss/train': 1.213433027267456} -08/30/2021 21:32:55 - INFO - __main__ - Step 45817: {'lr': 0.0003994422139207618, 'samples': 8796864, 'steps': 45816, 'loss/train': 1.4724456071853638} -08/30/2021 21:32:56 - INFO - __main__ - Step 45818: {'lr': 0.00039943795963727583, 'samples': 8797056, 'steps': 45817, 'loss/train': 0.6934868097305298} -08/30/2021 21:32:56 - INFO - __main__ - Step 45819: {'lr': 0.0003994337052864554, 'samples': 8797248, 'steps': 45818, 'loss/train': 0.8116896152496338} -08/30/2021 21:32:56 - INFO - __main__ - Step 45820: {'lr': 0.00039942945086830246, 'samples': 8797440, 'steps': 45819, 'loss/train': 1.499266505241394} -08/30/2021 21:32:58 - INFO - __main__ - Step 45821: {'lr': 0.00039942519638281893, 'samples': 8797632, 'steps': 45820, 'loss/train': 1.9684098958969116} -08/30/2021 21:32:58 - INFO - __main__ - Step 45822: {'lr': 0.0003994209418300068, 'samples': 8797824, 'steps': 45821, 'loss/train': 1.5065957307815552} -08/30/2021 21:32:59 - INFO - __main__ - Step 45823: {'lr': 0.0003994166872098677, 'samples': 8798016, 'steps': 45822, 'loss/train': 1.4278074502944946} -08/30/2021 21:32:59 - INFO - __main__ - Step 45824: {'lr': 0.0003994124325224039, 'samples': 8798208, 'steps': 45823, 'loss/train': 1.2310861349105835} -08/30/2021 21:32:59 - INFO - __main__ - Step 45825: {'lr': 0.00039940817776761706, 'samples': 8798400, 'steps': 45824, 'loss/train': 1.5549328327178955} -08/30/2021 21:33:01 - INFO - __main__ - Step 45826: {'lr': 0.0003994039229455093, 'samples': 8798592, 'steps': 45825, 'loss/train': 1.5929532051086426} -08/30/2021 21:33:02 - INFO - __main__ - Step 45827: {'lr': 0.00039939966805608234, 'samples': 8798784, 'steps': 45826, 'loss/train': 1.0453182458877563} -08/30/2021 21:33:02 - INFO - __main__ - Step 45828: {'lr': 0.0003993954130993383, 'samples': 8798976, 'steps': 45827, 'loss/train': 1.3045328855514526} -08/30/2021 21:33:02 - INFO - __main__ - Step 45829: {'lr': 0.0003993911580752789, 'samples': 8799168, 'steps': 45828, 'loss/train': 2.1668474674224854} -08/30/2021 21:33:03 - INFO - __main__ - Step 45830: {'lr': 0.00039938690298390624, 'samples': 8799360, 'steps': 45829, 'loss/train': 1.710523247718811} -08/30/2021 21:33:04 - INFO - __main__ - Step 45831: {'lr': 0.00039938264782522206, 'samples': 8799552, 'steps': 45830, 'loss/train': 1.1563140153884888} -08/30/2021 21:33:05 - INFO - __main__ - Step 45832: {'lr': 0.0003993783925992284, 'samples': 8799744, 'steps': 45831, 'loss/train': 1.2424277067184448} -08/30/2021 21:33:05 - INFO - __main__ - Step 45833: {'lr': 0.00039937413730592713, 'samples': 8799936, 'steps': 45832, 'loss/train': 2.8488364219665527} -08/30/2021 21:33:05 - INFO - __main__ - Step 45834: {'lr': 0.0003993698819453202, 'samples': 8800128, 'steps': 45833, 'loss/train': 1.3206452131271362} -08/30/2021 21:33:06 - INFO - __main__ - Step 45835: {'lr': 0.00039936562651740956, 'samples': 8800320, 'steps': 45834, 'loss/train': 1.7306476831436157} -08/30/2021 21:33:07 - INFO - __main__ - Step 45836: {'lr': 0.00039936137102219695, 'samples': 8800512, 'steps': 45835, 'loss/train': 1.238366961479187} -08/30/2021 21:33:07 - INFO - __main__ - Step 45837: {'lr': 0.0003993571154596845, 'samples': 8800704, 'steps': 45836, 'loss/train': 1.3619805574417114} -08/30/2021 21:33:08 - INFO - __main__ - Step 45838: {'lr': 0.00039935285982987403, 'samples': 8800896, 'steps': 45837, 'loss/train': 1.4047608375549316} -08/30/2021 21:33:08 - INFO - __main__ - Step 45839: {'lr': 0.0003993486041327674, 'samples': 8801088, 'steps': 45838, 'loss/train': 1.5239295959472656} -08/30/2021 21:33:08 - INFO - __main__ - Step 45840: {'lr': 0.00039934434836836664, 'samples': 8801280, 'steps': 45839, 'loss/train': 1.3367984294891357} -08/30/2021 21:33:10 - INFO - __main__ - Step 45841: {'lr': 0.00039934009253667356, 'samples': 8801472, 'steps': 45840, 'loss/train': 1.990939974784851} -08/30/2021 21:33:11 - INFO - __main__ - Step 45842: {'lr': 0.0003993358366376903, 'samples': 8801664, 'steps': 45841, 'loss/train': 1.1347744464874268} -08/30/2021 21:33:11 - INFO - __main__ - Step 45843: {'lr': 0.0003993315806714185, 'samples': 8801856, 'steps': 45842, 'loss/train': 0.45819583535194397} -08/30/2021 21:33:11 - INFO - __main__ - Step 45844: {'lr': 0.0003993273246378602, 'samples': 8802048, 'steps': 45843, 'loss/train': 1.4478795528411865} -08/30/2021 21:33:12 - INFO - __main__ - Step 45845: {'lr': 0.00039932306853701735, 'samples': 8802240, 'steps': 45844, 'loss/train': 1.007699728012085} -08/30/2021 21:33:14 - INFO - __main__ - Step 45846: {'lr': 0.0003993188123688918, 'samples': 8802432, 'steps': 45845, 'loss/train': 1.6348592042922974} -08/30/2021 21:33:14 - INFO - __main__ - Step 45847: {'lr': 0.00039931455613348546, 'samples': 8802624, 'steps': 45846, 'loss/train': 1.3800431489944458} -08/30/2021 21:33:14 - INFO - __main__ - Step 45848: {'lr': 0.0003993102998308004, 'samples': 8802816, 'steps': 45847, 'loss/train': 1.3395081758499146} -08/30/2021 21:33:15 - INFO - __main__ - Step 45849: {'lr': 0.0003993060434608383, 'samples': 8803008, 'steps': 45848, 'loss/train': 1.1784669160842896} -08/30/2021 21:33:15 - INFO - __main__ - Step 45850: {'lr': 0.0003993017870236012, 'samples': 8803200, 'steps': 45849, 'loss/train': 1.4567183256149292} -08/30/2021 21:33:17 - INFO - __main__ - Step 45851: {'lr': 0.0003992975305190911, 'samples': 8803392, 'steps': 45850, 'loss/train': 1.535145878791809} -08/30/2021 21:33:17 - INFO - __main__ - Step 45852: {'lr': 0.0003992932739473098, 'samples': 8803584, 'steps': 45851, 'loss/train': 1.2231274843215942} -08/30/2021 21:33:18 - INFO - __main__ - Step 45853: {'lr': 0.0003992890173082593, 'samples': 8803776, 'steps': 45852, 'loss/train': 1.3898508548736572} -08/30/2021 21:33:18 - INFO - __main__ - Step 45854: {'lr': 0.00039928476060194137, 'samples': 8803968, 'steps': 45853, 'loss/train': 1.2472736835479736} -08/30/2021 21:33:18 - INFO - __main__ - Step 45855: {'lr': 0.0003992805038283581, 'samples': 8804160, 'steps': 45854, 'loss/train': 1.6525698900222778} -08/30/2021 21:33:19 - INFO - __main__ - Step 45856: {'lr': 0.0003992762469875113, 'samples': 8804352, 'steps': 45855, 'loss/train': 1.320794701576233} -08/30/2021 21:33:21 - INFO - __main__ - Step 45857: {'lr': 0.00039927199007940294, 'samples': 8804544, 'steps': 45856, 'loss/train': 1.7343603372573853} -08/30/2021 21:33:21 - INFO - __main__ - Step 45858: {'lr': 0.00039926773310403497, 'samples': 8804736, 'steps': 45857, 'loss/train': 1.3271514177322388} -08/30/2021 21:33:21 - INFO - __main__ - Step 45859: {'lr': 0.0003992634760614092, 'samples': 8804928, 'steps': 45858, 'loss/train': 1.2711429595947266} -08/30/2021 21:33:22 - INFO - __main__ - Step 45860: {'lr': 0.00039925921895152765, 'samples': 8805120, 'steps': 45859, 'loss/train': 1.6370981931686401} -08/30/2021 21:33:22 - INFO - __main__ - Step 45861: {'lr': 0.00039925496177439226, 'samples': 8805312, 'steps': 45860, 'loss/train': 1.435247778892517} -08/30/2021 21:33:23 - INFO - __main__ - Step 45862: {'lr': 0.0003992507045300048, 'samples': 8805504, 'steps': 45861, 'loss/train': 1.2945324182510376} -08/30/2021 21:33:24 - INFO - __main__ - Step 45863: {'lr': 0.00039924644721836734, 'samples': 8805696, 'steps': 45862, 'loss/train': 0.9160441756248474} -08/30/2021 21:33:24 - INFO - __main__ - Step 45864: {'lr': 0.0003992421898394817, 'samples': 8805888, 'steps': 45863, 'loss/train': 2.2872025966644287} -08/30/2021 21:33:25 - INFO - __main__ - Step 45865: {'lr': 0.00039923793239334974, 'samples': 8806080, 'steps': 45864, 'loss/train': 1.0798128843307495} -08/30/2021 21:33:25 - INFO - __main__ - Step 45866: {'lr': 0.0003992336748799736, 'samples': 8806272, 'steps': 45865, 'loss/train': 1.1462929248809814} -08/30/2021 21:33:26 - INFO - __main__ - Step 45867: {'lr': 0.00039922941729935503, 'samples': 8806464, 'steps': 45866, 'loss/train': 0.9772617220878601} -08/30/2021 21:33:27 - INFO - __main__ - Step 45868: {'lr': 0.000399225159651496, 'samples': 8806656, 'steps': 45867, 'loss/train': 1.1342010498046875} -08/30/2021 21:33:27 - INFO - __main__ - Step 45869: {'lr': 0.0003992209019363984, 'samples': 8806848, 'steps': 45868, 'loss/train': 1.7325915098190308} -08/30/2021 21:33:28 - INFO - __main__ - Step 45870: {'lr': 0.0003992166441540641, 'samples': 8807040, 'steps': 45869, 'loss/train': 1.0027644634246826} -08/30/2021 21:33:28 - INFO - __main__ - Step 45871: {'lr': 0.00039921238630449515, 'samples': 8807232, 'steps': 45870, 'loss/train': 1.4486463069915771} -08/30/2021 21:33:28 - INFO - __main__ - Step 45872: {'lr': 0.0003992081283876934, 'samples': 8807424, 'steps': 45871, 'loss/train': 1.6098607778549194} -08/30/2021 21:33:30 - INFO - __main__ - Step 45873: {'lr': 0.00039920387040366076, 'samples': 8807616, 'steps': 45872, 'loss/train': 0.7041446566581726} -08/30/2021 21:33:31 - INFO - __main__ - Step 45874: {'lr': 0.00039919961235239913, 'samples': 8807808, 'steps': 45873, 'loss/train': 1.3921667337417603} -08/30/2021 21:33:31 - INFO - __main__ - Step 45875: {'lr': 0.0003991953542339105, 'samples': 8808000, 'steps': 45874, 'loss/train': 0.9629362225532532} -08/30/2021 21:33:31 - INFO - __main__ - Step 45876: {'lr': 0.00039919109604819676, 'samples': 8808192, 'steps': 45875, 'loss/train': 1.245280385017395} -08/30/2021 21:33:32 - INFO - __main__ - Step 45877: {'lr': 0.00039918683779525976, 'samples': 8808384, 'steps': 45876, 'loss/train': 1.3967478275299072} -08/30/2021 21:33:33 - INFO - __main__ - Step 45878: {'lr': 0.0003991825794751015, 'samples': 8808576, 'steps': 45877, 'loss/train': 1.1662044525146484} -08/30/2021 21:33:34 - INFO - __main__ - Step 45879: {'lr': 0.0003991783210877239, 'samples': 8808768, 'steps': 45878, 'loss/train': 1.7753769159317017} -08/30/2021 21:33:34 - INFO - __main__ - Step 45880: {'lr': 0.00039917406263312885, 'samples': 8808960, 'steps': 45879, 'loss/train': 1.012062668800354} -08/30/2021 21:33:34 - INFO - __main__ - Step 45881: {'lr': 0.0003991698041113182, 'samples': 8809152, 'steps': 45880, 'loss/train': 1.456717848777771} -08/30/2021 21:33:35 - INFO - __main__ - Step 45882: {'lr': 0.000399165545522294, 'samples': 8809344, 'steps': 45881, 'loss/train': 1.4315998554229736} -08/30/2021 21:33:36 - INFO - __main__ - Step 45883: {'lr': 0.0003991612868660581, 'samples': 8809536, 'steps': 45882, 'loss/train': 1.0726063251495361} -08/30/2021 21:33:37 - INFO - __main__ - Step 45884: {'lr': 0.0003991570281426124, 'samples': 8809728, 'steps': 45883, 'loss/train': 1.6751062870025635} -08/30/2021 21:33:37 - INFO - __main__ - Step 45885: {'lr': 0.0003991527693519589, 'samples': 8809920, 'steps': 45884, 'loss/train': 1.5585232973098755} -08/30/2021 21:33:37 - INFO - __main__ - Step 45886: {'lr': 0.0003991485104940994, 'samples': 8810112, 'steps': 45885, 'loss/train': 1.547220230102539} -08/30/2021 21:33:38 - INFO - __main__ - Step 45887: {'lr': 0.0003991442515690359, 'samples': 8810304, 'steps': 45886, 'loss/train': 1.4062625169754028} -08/30/2021 21:33:40 - INFO - __main__ - Step 45888: {'lr': 0.00039913999257677025, 'samples': 8810496, 'steps': 45887, 'loss/train': 1.7330727577209473} -08/30/2021 21:33:40 - INFO - __main__ - Step 45889: {'lr': 0.0003991357335173045, 'samples': 8810688, 'steps': 45888, 'loss/train': 1.272483468055725} -08/30/2021 21:33:40 - INFO - __main__ - Step 45890: {'lr': 0.0003991314743906405, 'samples': 8810880, 'steps': 45889, 'loss/train': 1.3651748895645142} -08/30/2021 21:33:41 - INFO - __main__ - Step 45891: {'lr': 0.0003991272151967801, 'samples': 8811072, 'steps': 45890, 'loss/train': 0.0798591822385788} -08/30/2021 21:33:41 - INFO - __main__ - Step 45892: {'lr': 0.0003991229559357253, 'samples': 8811264, 'steps': 45891, 'loss/train': 0.03657440096139908} -08/30/2021 21:33:43 - INFO - __main__ - Step 45893: {'lr': 0.00039911869660747804, 'samples': 8811456, 'steps': 45892, 'loss/train': 1.5833854675292969} -08/30/2021 21:33:43 - INFO - __main__ - Step 45894: {'lr': 0.0003991144372120401, 'samples': 8811648, 'steps': 45893, 'loss/train': 1.4732928276062012} -08/30/2021 21:33:43 - INFO - __main__ - Step 45895: {'lr': 0.0003991101777494136, 'samples': 8811840, 'steps': 45894, 'loss/train': 1.619711995124817} -08/30/2021 21:33:44 - INFO - __main__ - Step 45896: {'lr': 0.0003991059182196003, 'samples': 8812032, 'steps': 45895, 'loss/train': 2.6794183254241943} -08/30/2021 21:33:44 - INFO - __main__ - Step 45897: {'lr': 0.00039910165862260216, 'samples': 8812224, 'steps': 45896, 'loss/train': 0.8295580744743347} -08/30/2021 21:33:47 - INFO - __main__ - Step 45898: {'lr': 0.0003990973989584211, 'samples': 8812416, 'steps': 45897, 'loss/train': 1.5137559175491333} -08/30/2021 21:33:47 - INFO - __main__ - Step 45899: {'lr': 0.00039909313922705913, 'samples': 8812608, 'steps': 45898, 'loss/train': 0.6221747398376465} -08/30/2021 21:33:47 - INFO - __main__ - Step 45900: {'lr': 0.000399088879428518, 'samples': 8812800, 'steps': 45899, 'loss/train': 1.3043019771575928} -08/30/2021 21:33:48 - INFO - __main__ - Step 45901: {'lr': 0.0003990846195627998, 'samples': 8812992, 'steps': 45900, 'loss/train': 1.4080753326416016} -08/30/2021 21:33:48 - INFO - __main__ - Step 45902: {'lr': 0.0003990803596299064, 'samples': 8813184, 'steps': 45901, 'loss/train': 1.4008264541625977} -08/30/2021 21:33:48 - INFO - __main__ - Step 45903: {'lr': 0.0003990760996298396, 'samples': 8813376, 'steps': 45902, 'loss/train': 1.3440762758255005} -08/30/2021 21:33:50 - INFO - __main__ - Step 45904: {'lr': 0.0003990718395626014, 'samples': 8813568, 'steps': 45903, 'loss/train': 0.16512420773506165} -08/30/2021 21:33:50 - INFO - __main__ - Step 45905: {'lr': 0.0003990675794281938, 'samples': 8813760, 'steps': 45904, 'loss/train': 1.7513208389282227} -08/30/2021 21:33:51 - INFO - __main__ - Step 45906: {'lr': 0.00039906331922661857, 'samples': 8813952, 'steps': 45905, 'loss/train': 1.7248902320861816} -08/30/2021 21:33:51 - INFO - __main__ - Step 45907: {'lr': 0.00039905905895787775, 'samples': 8814144, 'steps': 45906, 'loss/train': 1.5553399324417114} -08/30/2021 21:33:52 - INFO - __main__ - Step 45908: {'lr': 0.00039905479862197327, 'samples': 8814336, 'steps': 45907, 'loss/train': 0.7354121208190918} -08/30/2021 21:33:53 - INFO - __main__ - Step 45909: {'lr': 0.00039905053821890697, 'samples': 8814528, 'steps': 45908, 'loss/train': 1.3031671047210693} -08/30/2021 21:33:53 - INFO - __main__ - Step 45910: {'lr': 0.0003990462777486808, 'samples': 8814720, 'steps': 45909, 'loss/train': 1.3022174835205078} -08/30/2021 21:33:54 - INFO - __main__ - Step 45911: {'lr': 0.00039904201721129663, 'samples': 8814912, 'steps': 45910, 'loss/train': 1.3297829627990723} -08/30/2021 21:33:54 - INFO - __main__ - Step 45912: {'lr': 0.00039903775660675645, 'samples': 8815104, 'steps': 45911, 'loss/train': 2.0103020668029785} -08/30/2021 21:33:55 - INFO - __main__ - Step 45913: {'lr': 0.00039903349593506214, 'samples': 8815296, 'steps': 45912, 'loss/train': 1.5464253425598145} -08/30/2021 21:33:56 - INFO - __main__ - Step 45914: {'lr': 0.0003990292351962157, 'samples': 8815488, 'steps': 45913, 'loss/train': 0.8021082878112793} -08/30/2021 21:33:56 - INFO - __main__ - Step 45915: {'lr': 0.00039902497439021895, 'samples': 8815680, 'steps': 45914, 'loss/train': 1.675797462463379} -08/30/2021 21:33:57 - INFO - __main__ - Step 45916: {'lr': 0.0003990207135170738, 'samples': 8815872, 'steps': 45915, 'loss/train': 0.9508106112480164} -08/30/2021 21:33:57 - INFO - __main__ - Step 45917: {'lr': 0.00039901645257678234, 'samples': 8816064, 'steps': 45916, 'loss/train': 0.556931734085083} -08/30/2021 21:33:57 - INFO - __main__ - Step 45918: {'lr': 0.0003990121915693462, 'samples': 8816256, 'steps': 45917, 'loss/train': 1.3384051322937012} -08/30/2021 21:33:58 - INFO - __main__ - Step 45919: {'lr': 0.0003990079304947676, 'samples': 8816448, 'steps': 45918, 'loss/train': 0.9686638712882996} -08/30/2021 21:33:59 - INFO - __main__ - Step 45920: {'lr': 0.00039900366935304824, 'samples': 8816640, 'steps': 45919, 'loss/train': 1.8176053762435913} -08/30/2021 21:34:00 - INFO - __main__ - Step 45921: {'lr': 0.0003989994081441902, 'samples': 8816832, 'steps': 45920, 'loss/train': 1.976651906967163} -08/30/2021 21:34:00 - INFO - __main__ - Step 45922: {'lr': 0.00039899514686819526, 'samples': 8817024, 'steps': 45921, 'loss/train': 0.12316101789474487} -08/30/2021 21:34:01 - INFO - __main__ - Step 45923: {'lr': 0.00039899088552506544, 'samples': 8817216, 'steps': 45922, 'loss/train': 0.9177865982055664} -08/30/2021 21:34:01 - INFO - __main__ - Step 45924: {'lr': 0.00039898662411480264, 'samples': 8817408, 'steps': 45923, 'loss/train': 1.1662096977233887} -08/30/2021 21:34:02 - INFO - __main__ - Step 45925: {'lr': 0.00039898236263740875, 'samples': 8817600, 'steps': 45924, 'loss/train': 1.1464731693267822} -08/30/2021 21:34:03 - INFO - __main__ - Step 45926: {'lr': 0.00039897810109288566, 'samples': 8817792, 'steps': 45925, 'loss/train': 1.1101843118667603} -08/30/2021 21:34:03 - INFO - __main__ - Step 45927: {'lr': 0.0003989738394812354, 'samples': 8817984, 'steps': 45926, 'loss/train': 1.1896226406097412} -08/30/2021 21:34:04 - INFO - __main__ - Step 45928: {'lr': 0.0003989695778024598, 'samples': 8818176, 'steps': 45927, 'loss/train': 1.5410248041152954} -08/30/2021 21:34:04 - INFO - __main__ - Step 45929: {'lr': 0.00039896531605656085, 'samples': 8818368, 'steps': 45928, 'loss/train': 1.9736499786376953} -08/30/2021 21:34:06 - INFO - __main__ - Step 45930: {'lr': 0.00039896105424354035, 'samples': 8818560, 'steps': 45929, 'loss/train': 1.1277334690093994} -08/30/2021 21:34:06 - INFO - __main__ - Step 45931: {'lr': 0.0003989567923634003, 'samples': 8818752, 'steps': 45930, 'loss/train': 1.309943675994873} -08/30/2021 21:34:06 - INFO - __main__ - Step 45932: {'lr': 0.00039895253041614265, 'samples': 8818944, 'steps': 45931, 'loss/train': 1.166379451751709} -08/30/2021 21:34:07 - INFO - __main__ - Step 45933: {'lr': 0.00039894826840176933, 'samples': 8819136, 'steps': 45932, 'loss/train': 1.2008832693099976} -08/30/2021 21:34:07 - INFO - __main__ - Step 45934: {'lr': 0.00039894400632028217, 'samples': 8819328, 'steps': 45933, 'loss/train': 1.6712656021118164} -08/30/2021 21:34:08 - INFO - __main__ - Step 45935: {'lr': 0.00039893974417168316, 'samples': 8819520, 'steps': 45934, 'loss/train': 1.550011396408081} -08/30/2021 21:34:09 - INFO - __main__ - Step 45936: {'lr': 0.00039893548195597415, 'samples': 8819712, 'steps': 45935, 'loss/train': 1.5504117012023926} -08/30/2021 21:34:09 - INFO - __main__ - Step 45937: {'lr': 0.0003989312196731572, 'samples': 8819904, 'steps': 45936, 'loss/train': 0.873008131980896} -08/30/2021 21:34:10 - INFO - __main__ - Step 45938: {'lr': 0.0003989269573232341, 'samples': 8820096, 'steps': 45937, 'loss/train': 1.8701066970825195} -08/30/2021 21:34:10 - INFO - __main__ - Step 45939: {'lr': 0.0003989226949062068, 'samples': 8820288, 'steps': 45938, 'loss/train': 1.6357719898223877} -08/30/2021 21:34:10 - INFO - __main__ - Step 45940: {'lr': 0.00039891843242207726, 'samples': 8820480, 'steps': 45939, 'loss/train': 1.146041750907898} -08/30/2021 21:34:12 - INFO - __main__ - Step 45941: {'lr': 0.00039891416987084726, 'samples': 8820672, 'steps': 45940, 'loss/train': 0.5608364939689636} -08/30/2021 21:34:12 - INFO - __main__ - Step 45942: {'lr': 0.00039890990725251896, 'samples': 8820864, 'steps': 45941, 'loss/train': 1.4235665798187256} -08/30/2021 21:34:13 - INFO - __main__ - Step 45943: {'lr': 0.0003989056445670941, 'samples': 8821056, 'steps': 45942, 'loss/train': 1.67377769947052} -08/30/2021 21:34:13 - INFO - __main__ - Step 45944: {'lr': 0.0003989013818145747, 'samples': 8821248, 'steps': 45943, 'loss/train': 1.1196436882019043} -08/30/2021 21:34:14 - INFO - __main__ - Step 45945: {'lr': 0.0003988971189949626, 'samples': 8821440, 'steps': 45944, 'loss/train': 0.8334695100784302} -08/30/2021 21:34:14 - INFO - __main__ - Step 45946: {'lr': 0.0003988928561082598, 'samples': 8821632, 'steps': 45945, 'loss/train': 1.5286099910736084} -08/30/2021 21:34:16 - INFO - __main__ - Step 45947: {'lr': 0.0003988885931544681, 'samples': 8821824, 'steps': 45946, 'loss/train': 1.1778885126113892} -08/30/2021 21:34:16 - INFO - __main__ - Step 45948: {'lr': 0.0003988843301335895, 'samples': 8822016, 'steps': 45947, 'loss/train': 1.183476209640503} -08/30/2021 21:34:17 - INFO - __main__ - Step 45949: {'lr': 0.00039888006704562594, 'samples': 8822208, 'steps': 45948, 'loss/train': 1.108405590057373} -08/30/2021 21:34:17 - INFO - __main__ - Step 45950: {'lr': 0.0003988758038905794, 'samples': 8822400, 'steps': 45949, 'loss/train': 1.4362045526504517} -08/30/2021 21:34:17 - INFO - __main__ - Step 45951: {'lr': 0.00039887154066845166, 'samples': 8822592, 'steps': 45950, 'loss/train': 0.6259725689888} -08/30/2021 21:34:18 - INFO - __main__ - Step 45952: {'lr': 0.00039886727737924464, 'samples': 8822784, 'steps': 45951, 'loss/train': 0.9381634593009949} -08/30/2021 21:34:19 - INFO - __main__ - Step 45953: {'lr': 0.00039886301402296037, 'samples': 8822976, 'steps': 45952, 'loss/train': 1.2229812145233154} -08/30/2021 21:34:20 - INFO - __main__ - Step 45954: {'lr': 0.00039885875059960074, 'samples': 8823168, 'steps': 45953, 'loss/train': 1.5409786701202393} -08/30/2021 21:34:20 - INFO - __main__ - Step 45955: {'lr': 0.0003988544871091676, 'samples': 8823360, 'steps': 45954, 'loss/train': 1.3310774564743042} -08/30/2021 21:34:20 - INFO - __main__ - Step 45956: {'lr': 0.000398850223551663, 'samples': 8823552, 'steps': 45955, 'loss/train': 1.934818983078003} -08/30/2021 21:34:21 - INFO - __main__ - Step 45957: {'lr': 0.00039884595992708877, 'samples': 8823744, 'steps': 45956, 'loss/train': 1.6563388109207153} -08/30/2021 21:34:23 - INFO - __main__ - Step 45958: {'lr': 0.00039884169623544683, 'samples': 8823936, 'steps': 45957, 'loss/train': 0.6444125771522522} -08/30/2021 21:34:23 - INFO - __main__ - Step 45959: {'lr': 0.0003988374324767391, 'samples': 8824128, 'steps': 45958, 'loss/train': 1.2904642820358276} -08/30/2021 21:34:24 - INFO - __main__ - Step 45960: {'lr': 0.0003988331686509675, 'samples': 8824320, 'steps': 45959, 'loss/train': 0.8290671706199646} -08/30/2021 21:34:24 - INFO - __main__ - Step 45961: {'lr': 0.000398828904758134, 'samples': 8824512, 'steps': 45960, 'loss/train': 0.5800647735595703} -08/30/2021 21:34:24 - INFO - __main__ - Step 45962: {'lr': 0.0003988246407982405, 'samples': 8824704, 'steps': 45961, 'loss/train': 1.6646595001220703} -08/30/2021 21:34:26 - INFO - __main__ - Step 45963: {'lr': 0.00039882037677128895, 'samples': 8824896, 'steps': 45962, 'loss/train': 0.8743748664855957} -08/30/2021 21:34:26 - INFO - __main__ - Step 45964: {'lr': 0.0003988161126772812, 'samples': 8825088, 'steps': 45963, 'loss/train': 1.4011805057525635} -08/30/2021 21:34:27 - INFO - __main__ - Step 45965: {'lr': 0.0003988118485162192, 'samples': 8825280, 'steps': 45964, 'loss/train': 1.5982658863067627} -08/30/2021 21:34:27 - INFO - __main__ - Step 45966: {'lr': 0.00039880758428810487, 'samples': 8825472, 'steps': 45965, 'loss/train': 1.5529544353485107} -08/30/2021 21:34:27 - INFO - __main__ - Step 45967: {'lr': 0.00039880331999294017, 'samples': 8825664, 'steps': 45966, 'loss/train': 1.2997111082077026} -08/30/2021 21:34:29 - INFO - __main__ - Step 45968: {'lr': 0.00039879905563072694, 'samples': 8825856, 'steps': 45967, 'loss/train': 0.6538985371589661} -08/30/2021 21:34:29 - INFO - __main__ - Step 45969: {'lr': 0.00039879479120146725, 'samples': 8826048, 'steps': 45968, 'loss/train': 0.47482556104660034} -08/30/2021 21:34:30 - INFO - __main__ - Step 45970: {'lr': 0.0003987905267051628, 'samples': 8826240, 'steps': 45969, 'loss/train': 1.6342581510543823} -08/30/2021 21:34:30 - INFO - __main__ - Step 45971: {'lr': 0.0003987862621418157, 'samples': 8826432, 'steps': 45970, 'loss/train': 1.4716788530349731} -08/30/2021 21:34:30 - INFO - __main__ - Step 45972: {'lr': 0.0003987819975114278, 'samples': 8826624, 'steps': 45971, 'loss/train': 1.6564103364944458} -08/30/2021 21:34:32 - INFO - __main__ - Step 45973: {'lr': 0.000398777732814001, 'samples': 8826816, 'steps': 45972, 'loss/train': 1.319682240486145} -08/30/2021 21:34:32 - INFO - __main__ - Step 45974: {'lr': 0.0003987734680495373, 'samples': 8827008, 'steps': 45973, 'loss/train': 1.4295915365219116} -08/30/2021 21:34:33 - INFO - __main__ - Step 45975: {'lr': 0.0003987692032180385, 'samples': 8827200, 'steps': 45974, 'loss/train': 1.4333821535110474} -08/30/2021 21:34:33 - INFO - __main__ - Step 45976: {'lr': 0.00039876493831950664, 'samples': 8827392, 'steps': 45975, 'loss/train': 2.162172555923462} -08/30/2021 21:34:33 - INFO - __main__ - Step 45977: {'lr': 0.00039876067335394363, 'samples': 8827584, 'steps': 45976, 'loss/train': 1.4194296598434448} -08/30/2021 21:34:35 - INFO - __main__ - Step 45978: {'lr': 0.0003987564083213513, 'samples': 8827776, 'steps': 45977, 'loss/train': 1.04628324508667} -08/30/2021 21:34:35 - INFO - __main__ - Step 45979: {'lr': 0.00039875214322173167, 'samples': 8827968, 'steps': 45978, 'loss/train': 1.8911947011947632} -08/30/2021 21:34:36 - INFO - __main__ - Step 45980: {'lr': 0.00039874787805508656, 'samples': 8828160, 'steps': 45979, 'loss/train': 1.6589652299880981} -08/30/2021 21:34:36 - INFO - __main__ - Step 45981: {'lr': 0.000398743612821418, 'samples': 8828352, 'steps': 45980, 'loss/train': 1.4017174243927002} -08/30/2021 21:34:36 - INFO - __main__ - Step 45982: {'lr': 0.0003987393475207278, 'samples': 8828544, 'steps': 45981, 'loss/train': 2.876781940460205} -08/30/2021 21:34:37 - INFO - __main__ - Step 45983: {'lr': 0.000398735082153018, 'samples': 8828736, 'steps': 45982, 'loss/train': 1.3135699033737183} -08/30/2021 21:34:38 - INFO - __main__ - Step 45984: {'lr': 0.00039873081671829046, 'samples': 8828928, 'steps': 45983, 'loss/train': 1.3262829780578613} -08/30/2021 21:34:39 - INFO - __main__ - Step 45985: {'lr': 0.0003987265512165471, 'samples': 8829120, 'steps': 45984, 'loss/train': 1.9111242294311523} -08/30/2021 21:34:39 - INFO - __main__ - Step 45986: {'lr': 0.0003987222856477899, 'samples': 8829312, 'steps': 45985, 'loss/train': 1.7914196252822876} -08/30/2021 21:34:39 - INFO - __main__ - Step 45987: {'lr': 0.0003987180200120207, 'samples': 8829504, 'steps': 45986, 'loss/train': 0.8986952304840088} -08/30/2021 21:34:40 - INFO - __main__ - Step 45988: {'lr': 0.0003987137543092414, 'samples': 8829696, 'steps': 45987, 'loss/train': 0.6883071064949036} -08/30/2021 21:34:41 - INFO - __main__ - Step 45989: {'lr': 0.0003987094885394541, 'samples': 8829888, 'steps': 45988, 'loss/train': 1.5992047786712646} -08/30/2021 21:34:41 - INFO - __main__ - Step 45990: {'lr': 0.0003987052227026605, 'samples': 8830080, 'steps': 45989, 'loss/train': 1.3425664901733398} -08/30/2021 21:34:42 - INFO - __main__ - Step 45991: {'lr': 0.0003987009567988626, 'samples': 8830272, 'steps': 45990, 'loss/train': 0.8926039934158325} -08/30/2021 21:34:42 - INFO - __main__ - Step 45992: {'lr': 0.00039869669082806243, 'samples': 8830464, 'steps': 45991, 'loss/train': 1.725190281867981} -08/30/2021 21:34:43 - INFO - __main__ - Step 45993: {'lr': 0.0003986924247902618, 'samples': 8830656, 'steps': 45992, 'loss/train': 0.8363355994224548} -08/30/2021 21:34:44 - INFO - __main__ - Step 45994: {'lr': 0.00039868815868546257, 'samples': 8830848, 'steps': 45993, 'loss/train': 1.0703015327453613} -08/30/2021 21:34:44 - INFO - __main__ - Step 45995: {'lr': 0.00039868389251366686, 'samples': 8831040, 'steps': 45994, 'loss/train': 1.4130018949508667} -08/30/2021 21:34:45 - INFO - __main__ - Step 45996: {'lr': 0.00039867962627487645, 'samples': 8831232, 'steps': 45995, 'loss/train': 1.5226773023605347} -08/30/2021 21:34:45 - INFO - __main__ - Step 45997: {'lr': 0.0003986753599690933, 'samples': 8831424, 'steps': 45996, 'loss/train': 1.3419251441955566} -08/30/2021 21:34:45 - INFO - __main__ - Step 45998: {'lr': 0.00039867109359631935, 'samples': 8831616, 'steps': 45997, 'loss/train': 1.1787835359573364} -08/30/2021 21:34:47 - INFO - __main__ - Step 45999: {'lr': 0.00039866682715655646, 'samples': 8831808, 'steps': 45998, 'loss/train': 1.144551157951355} -08/30/2021 21:34:47 - INFO - __main__ - Step 46000: {'lr': 0.00039866256064980657, 'samples': 8832000, 'steps': 45999, 'loss/train': 1.1735973358154297} -08/30/2021 21:34:48 - INFO - __main__ - Step 46001: {'lr': 0.0003986582940760717, 'samples': 8832192, 'steps': 46000, 'loss/train': 1.7374322414398193} -08/30/2021 21:34:48 - INFO - __main__ - Step 46002: {'lr': 0.0003986540274353536, 'samples': 8832384, 'steps': 46001, 'loss/train': 1.0739721059799194} -08/30/2021 21:34:48 - INFO - __main__ - Step 46003: {'lr': 0.00039864976072765437, 'samples': 8832576, 'steps': 46002, 'loss/train': 1.173020362854004} -08/30/2021 21:34:50 - INFO - __main__ - Step 46004: {'lr': 0.0003986454939529758, 'samples': 8832768, 'steps': 46003, 'loss/train': 1.0811725854873657} -08/30/2021 21:34:50 - INFO - __main__ - Step 46005: {'lr': 0.0003986412271113199, 'samples': 8832960, 'steps': 46004, 'loss/train': 0.9034219980239868} -08/30/2021 21:34:51 - INFO - __main__ - Step 46006: {'lr': 0.0003986369602026886, 'samples': 8833152, 'steps': 46005, 'loss/train': 1.269287347793579} -08/30/2021 21:34:51 - INFO - __main__ - Step 46007: {'lr': 0.0003986326932270836, 'samples': 8833344, 'steps': 46006, 'loss/train': 1.2735518217086792} -08/30/2021 21:34:51 - INFO - __main__ - Step 46008: {'lr': 0.00039862842618450717, 'samples': 8833536, 'steps': 46007, 'loss/train': 1.4346592426300049} -08/30/2021 21:34:54 - INFO - __main__ - Step 46009: {'lr': 0.00039862415907496103, 'samples': 8833728, 'steps': 46008, 'loss/train': 1.2043991088867188} -08/30/2021 21:34:54 - INFO - __main__ - Step 46010: {'lr': 0.00039861989189844715, 'samples': 8833920, 'steps': 46009, 'loss/train': 1.2698410749435425} -08/30/2021 21:34:55 - INFO - __main__ - Step 46011: {'lr': 0.00039861562465496735, 'samples': 8834112, 'steps': 46010, 'loss/train': 0.44780731201171875} -08/30/2021 21:34:55 - INFO - __main__ - Step 46012: {'lr': 0.00039861135734452376, 'samples': 8834304, 'steps': 46011, 'loss/train': 0.15395143628120422} -08/30/2021 21:34:55 - INFO - __main__ - Step 46013: {'lr': 0.00039860708996711816, 'samples': 8834496, 'steps': 46012, 'loss/train': 1.599525809288025} -08/30/2021 21:34:57 - INFO - __main__ - Step 46014: {'lr': 0.00039860282252275245, 'samples': 8834688, 'steps': 46013, 'loss/train': 2.1880736351013184} -08/30/2021 21:34:57 - INFO - __main__ - Step 46015: {'lr': 0.0003985985550114286, 'samples': 8834880, 'steps': 46014, 'loss/train': 1.771926999092102} -08/30/2021 21:34:57 - INFO - __main__ - Step 46016: {'lr': 0.00039859428743314857, 'samples': 8835072, 'steps': 46015, 'loss/train': 1.3153576850891113} -08/30/2021 21:34:58 - INFO - __main__ - Step 46017: {'lr': 0.0003985900197879142, 'samples': 8835264, 'steps': 46016, 'loss/train': 0.9063101410865784} -08/30/2021 21:34:58 - INFO - __main__ - Step 46018: {'lr': 0.00039858575207572756, 'samples': 8835456, 'steps': 46017, 'loss/train': 0.9806237816810608} -08/30/2021 21:35:00 - INFO - __main__ - Step 46019: {'lr': 0.00039858148429659036, 'samples': 8835648, 'steps': 46018, 'loss/train': 1.1178653240203857} -08/30/2021 21:35:00 - INFO - __main__ - Step 46020: {'lr': 0.0003985772164505047, 'samples': 8835840, 'steps': 46019, 'loss/train': 1.2177878618240356} -08/30/2021 21:35:00 - INFO - __main__ - Step 46021: {'lr': 0.0003985729485374724, 'samples': 8836032, 'steps': 46020, 'loss/train': 1.352109432220459} -08/30/2021 21:35:01 - INFO - __main__ - Step 46022: {'lr': 0.0003985686805574954, 'samples': 8836224, 'steps': 46021, 'loss/train': 1.0561004877090454} -08/30/2021 21:35:01 - INFO - __main__ - Step 46023: {'lr': 0.00039856441251057573, 'samples': 8836416, 'steps': 46022, 'loss/train': 1.6003743410110474} -08/30/2021 21:35:02 - INFO - __main__ - Step 46024: {'lr': 0.0003985601443967152, 'samples': 8836608, 'steps': 46023, 'loss/train': 1.4200018644332886} -08/30/2021 21:35:03 - INFO - __main__ - Step 46025: {'lr': 0.0003985558762159157, 'samples': 8836800, 'steps': 46024, 'loss/train': 1.4329794645309448} -08/30/2021 21:35:03 - INFO - __main__ - Step 46026: {'lr': 0.0003985516079681793, 'samples': 8836992, 'steps': 46025, 'loss/train': 1.9898192882537842} -08/30/2021 21:35:04 - INFO - __main__ - Step 46027: {'lr': 0.0003985473396535078, 'samples': 8837184, 'steps': 46026, 'loss/train': 2.1930010318756104} -08/30/2021 21:35:04 - INFO - __main__ - Step 46028: {'lr': 0.00039854307127190316, 'samples': 8837376, 'steps': 46027, 'loss/train': 1.0728346109390259} -08/30/2021 21:35:04 - INFO - __main__ - Step 46029: {'lr': 0.0003985388028233673, 'samples': 8837568, 'steps': 46028, 'loss/train': 1.0078150033950806} -08/30/2021 21:35:06 - INFO - __main__ - Step 46030: {'lr': 0.0003985345343079022, 'samples': 8837760, 'steps': 46029, 'loss/train': 1.5804888010025024} -08/30/2021 21:35:06 - INFO - __main__ - Step 46031: {'lr': 0.00039853026572550965, 'samples': 8837952, 'steps': 46030, 'loss/train': 1.2204777002334595} -08/30/2021 21:35:07 - INFO - __main__ - Step 46032: {'lr': 0.0003985259970761917, 'samples': 8838144, 'steps': 46031, 'loss/train': 1.3898285627365112} -08/30/2021 21:35:07 - INFO - __main__ - Step 46033: {'lr': 0.0003985217283599502, 'samples': 8838336, 'steps': 46032, 'loss/train': 1.1773681640625} -08/30/2021 21:35:08 - INFO - __main__ - Step 46034: {'lr': 0.0003985174595767871, 'samples': 8838528, 'steps': 46033, 'loss/train': 1.0620403289794922} -08/30/2021 21:35:09 - INFO - __main__ - Step 46035: {'lr': 0.0003985131907267043, 'samples': 8838720, 'steps': 46034, 'loss/train': 1.7556136846542358} -08/30/2021 21:35:10 - INFO - __main__ - Step 46036: {'lr': 0.00039850892180970387, 'samples': 8838912, 'steps': 46035, 'loss/train': 1.4639158248901367} -08/30/2021 21:35:10 - INFO - __main__ - Step 46037: {'lr': 0.0003985046528257875, 'samples': 8839104, 'steps': 46036, 'loss/train': 1.5760293006896973} -08/30/2021 21:35:10 - INFO - __main__ - Step 46038: {'lr': 0.00039850038377495727, 'samples': 8839296, 'steps': 46037, 'loss/train': 1.2258882522583008} -08/30/2021 21:35:11 - INFO - __main__ - Step 46039: {'lr': 0.000398496114657215, 'samples': 8839488, 'steps': 46038, 'loss/train': 0.9945687651634216} -08/30/2021 21:35:11 - INFO - __main__ - Step 46040: {'lr': 0.0003984918454725628, 'samples': 8839680, 'steps': 46039, 'loss/train': 1.3057918548583984} -08/30/2021 21:35:12 - INFO - __main__ - Step 46041: {'lr': 0.0003984875762210023, 'samples': 8839872, 'steps': 46040, 'loss/train': 1.7759654521942139} -08/30/2021 21:35:13 - INFO - __main__ - Step 46042: {'lr': 0.0003984833069025357, 'samples': 8840064, 'steps': 46041, 'loss/train': 1.5332950353622437} -08/30/2021 21:35:13 - INFO - __main__ - Step 46043: {'lr': 0.00039847903751716486, 'samples': 8840256, 'steps': 46042, 'loss/train': 1.4358203411102295} -08/30/2021 21:35:14 - INFO - __main__ - Step 46044: {'lr': 0.00039847476806489153, 'samples': 8840448, 'steps': 46043, 'loss/train': 1.3734197616577148} -08/30/2021 21:35:14 - INFO - __main__ - Step 46045: {'lr': 0.00039847049854571784, 'samples': 8840640, 'steps': 46044, 'loss/train': 1.4672223329544067} -08/30/2021 21:35:16 - INFO - __main__ - Step 46046: {'lr': 0.00039846622895964556, 'samples': 8840832, 'steps': 46045, 'loss/train': 1.105386734008789} -08/30/2021 21:35:16 - INFO - __main__ - Step 46047: {'lr': 0.0003984619593066767, 'samples': 8841024, 'steps': 46046, 'loss/train': 1.7899452447891235} -08/30/2021 21:35:17 - INFO - __main__ - Step 46048: {'lr': 0.0003984576895868132, 'samples': 8841216, 'steps': 46047, 'loss/train': 1.5395907163619995} -08/30/2021 21:35:17 - INFO - __main__ - Step 46049: {'lr': 0.000398453419800057, 'samples': 8841408, 'steps': 46048, 'loss/train': 0.8314034938812256} -08/30/2021 21:35:18 - INFO - __main__ - Step 46050: {'lr': 0.00039844914994640994, 'samples': 8841600, 'steps': 46049, 'loss/train': 0.3109332025051117} -08/30/2021 21:35:18 - INFO - __main__ - Step 46051: {'lr': 0.00039844488002587397, 'samples': 8841792, 'steps': 46050, 'loss/train': 1.7853615283966064} -08/30/2021 21:35:19 - INFO - __main__ - Step 46052: {'lr': 0.00039844061003845114, 'samples': 8841984, 'steps': 46051, 'loss/train': 0.5214645862579346} -08/30/2021 21:35:20 - INFO - __main__ - Step 46053: {'lr': 0.00039843633998414306, 'samples': 8842176, 'steps': 46052, 'loss/train': 1.3784608840942383} -08/30/2021 21:35:20 - INFO - __main__ - Step 46054: {'lr': 0.000398432069862952, 'samples': 8842368, 'steps': 46053, 'loss/train': 1.4672095775604248} -08/30/2021 21:35:21 - INFO - __main__ - Step 46055: {'lr': 0.00039842779967487967, 'samples': 8842560, 'steps': 46054, 'loss/train': 1.5179264545440674} -08/30/2021 21:35:21 - INFO - __main__ - Step 46056: {'lr': 0.0003984235294199281, 'samples': 8842752, 'steps': 46055, 'loss/train': 1.3943374156951904} -08/30/2021 21:35:23 - INFO - __main__ - Step 46057: {'lr': 0.0003984192590980992, 'samples': 8842944, 'steps': 46056, 'loss/train': 1.4477373361587524} -08/30/2021 21:35:24 - INFO - __main__ - Step 46058: {'lr': 0.00039841498870939483, 'samples': 8843136, 'steps': 46057, 'loss/train': 2.065382719039917} -08/30/2021 21:35:24 - INFO - __main__ - Step 46059: {'lr': 0.000398410718253817, 'samples': 8843328, 'steps': 46058, 'loss/train': 1.6766257286071777} -08/30/2021 21:35:24 - INFO - __main__ - Step 46060: {'lr': 0.00039840644773136757, 'samples': 8843520, 'steps': 46059, 'loss/train': 1.5089621543884277} -08/30/2021 21:35:25 - INFO - __main__ - Step 46061: {'lr': 0.0003984021771420484, 'samples': 8843712, 'steps': 46060, 'loss/train': 1.3594402074813843} -08/30/2021 21:35:25 - INFO - __main__ - Step 46062: {'lr': 0.0003983979064858616, 'samples': 8843904, 'steps': 46061, 'loss/train': 1.247732400894165} -08/30/2021 21:35:25 - INFO - __main__ - Step 46063: {'lr': 0.000398393635762809, 'samples': 8844096, 'steps': 46062, 'loss/train': 0.05368264392018318} -08/30/2021 21:35:27 - INFO - __main__ - Step 46064: {'lr': 0.0003983893649728925, 'samples': 8844288, 'steps': 46063, 'loss/train': 0.7466768026351929} -08/30/2021 21:35:28 - INFO - __main__ - Step 46065: {'lr': 0.000398385094116114, 'samples': 8844480, 'steps': 46064, 'loss/train': 1.3943030834197998} -08/30/2021 21:35:28 - INFO - __main__ - Step 46066: {'lr': 0.0003983808231924755, 'samples': 8844672, 'steps': 46065, 'loss/train': 1.189836859703064} -08/30/2021 21:35:29 - INFO - __main__ - Step 46067: {'lr': 0.0003983765522019789, 'samples': 8844864, 'steps': 46066, 'loss/train': 0.10465364158153534} -08/30/2021 21:35:29 - INFO - __main__ - Step 46068: {'lr': 0.0003983722811446261, 'samples': 8845056, 'steps': 46067, 'loss/train': 1.2041999101638794} -08/30/2021 21:35:30 - INFO - __main__ - Step 46069: {'lr': 0.00039836801002041903, 'samples': 8845248, 'steps': 46068, 'loss/train': 1.5342386960983276} -08/30/2021 21:35:31 - INFO - __main__ - Step 46070: {'lr': 0.00039836373882935967, 'samples': 8845440, 'steps': 46069, 'loss/train': 0.9626764059066772} -08/30/2021 21:35:31 - INFO - __main__ - Step 46071: {'lr': 0.0003983594675714498, 'samples': 8845632, 'steps': 46070, 'loss/train': 1.5838414430618286} -08/30/2021 21:35:32 - INFO - __main__ - Step 46072: {'lr': 0.0003983551962466915, 'samples': 8845824, 'steps': 46071, 'loss/train': 0.5252110362052917} -08/30/2021 21:35:32 - INFO - __main__ - Step 46073: {'lr': 0.0003983509248550867, 'samples': 8846016, 'steps': 46072, 'loss/train': 1.6192330121994019} -08/30/2021 21:35:33 - INFO - __main__ - Step 46074: {'lr': 0.00039834665339663725, 'samples': 8846208, 'steps': 46073, 'loss/train': 1.453455924987793} -08/30/2021 21:35:34 - INFO - __main__ - Step 46075: {'lr': 0.00039834238187134497, 'samples': 8846400, 'steps': 46074, 'loss/train': 1.0606783628463745} -08/30/2021 21:35:34 - INFO - __main__ - Step 46076: {'lr': 0.00039833811027921196, 'samples': 8846592, 'steps': 46075, 'loss/train': 1.0795825719833374} -08/30/2021 21:35:35 - INFO - __main__ - Step 46077: {'lr': 0.00039833383862024016, 'samples': 8846784, 'steps': 46076, 'loss/train': 1.3732281923294067} -08/30/2021 21:35:35 - INFO - __main__ - Step 46078: {'lr': 0.00039832956689443135, 'samples': 8846976, 'steps': 46077, 'loss/train': 1.1644858121871948} -08/30/2021 21:35:36 - INFO - __main__ - Step 46079: {'lr': 0.00039832529510178756, 'samples': 8847168, 'steps': 46078, 'loss/train': 1.5265620946884155} -08/30/2021 21:35:37 - INFO - __main__ - Step 46080: {'lr': 0.0003983210232423107, 'samples': 8847360, 'steps': 46079, 'loss/train': 1.5379303693771362} -08/30/2021 21:35:37 - INFO - __main__ - Step 46081: {'lr': 0.00039831675131600253, 'samples': 8847552, 'steps': 46080, 'loss/train': 1.4588737487792969} -08/30/2021 21:35:38 - INFO - __main__ - Step 46082: {'lr': 0.0003983124793228653, 'samples': 8847744, 'steps': 46081, 'loss/train': 1.8334448337554932} -08/30/2021 21:35:38 - INFO - __main__ - Step 46083: {'lr': 0.00039830820726290063, 'samples': 8847936, 'steps': 46082, 'loss/train': 1.2814098596572876} -08/30/2021 21:35:40 - INFO - __main__ - Step 46084: {'lr': 0.0003983039351361106, 'samples': 8848128, 'steps': 46083, 'loss/train': 1.3197534084320068} -08/30/2021 21:35:40 - INFO - __main__ - Step 46085: {'lr': 0.0003982996629424972, 'samples': 8848320, 'steps': 46084, 'loss/train': 2.0131566524505615} -08/30/2021 21:35:40 - INFO - __main__ - Step 46086: {'lr': 0.0003982953906820622, 'samples': 8848512, 'steps': 46085, 'loss/train': 1.2611488103866577} -08/30/2021 21:35:41 - INFO - __main__ - Step 46087: {'lr': 0.0003982911183548075, 'samples': 8848704, 'steps': 46086, 'loss/train': 1.3952438831329346} -08/30/2021 21:35:41 - INFO - __main__ - Step 46088: {'lr': 0.0003982868459607352, 'samples': 8848896, 'steps': 46087, 'loss/train': 1.7468812465667725} -08/30/2021 21:35:43 - INFO - __main__ - Step 46089: {'lr': 0.0003982825734998471, 'samples': 8849088, 'steps': 46088, 'loss/train': 1.384050965309143} -08/30/2021 21:35:43 - INFO - __main__ - Step 46090: {'lr': 0.0003982783009721452, 'samples': 8849280, 'steps': 46089, 'loss/train': 1.6091235876083374} -08/30/2021 21:35:44 - INFO - __main__ - Step 46091: {'lr': 0.00039827402837763136, 'samples': 8849472, 'steps': 46090, 'loss/train': 1.1778900623321533} -08/30/2021 21:35:44 - INFO - __main__ - Step 46092: {'lr': 0.00039826975571630754, 'samples': 8849664, 'steps': 46091, 'loss/train': 0.9310660362243652} -08/30/2021 21:35:44 - INFO - __main__ - Step 46093: {'lr': 0.0003982654829881757, 'samples': 8849856, 'steps': 46092, 'loss/train': 1.8160934448242188} -08/30/2021 21:35:45 - INFO - __main__ - Step 46094: {'lr': 0.0003982612101932376, 'samples': 8850048, 'steps': 46093, 'loss/train': 1.1759487390518188} -08/30/2021 21:35:45 - INFO - __main__ - Step 46095: {'lr': 0.0003982569373314954, 'samples': 8850240, 'steps': 46094, 'loss/train': 0.03603367879986763} -08/30/2021 21:35:47 - INFO - __main__ - Step 46096: {'lr': 0.0003982526644029508, 'samples': 8850432, 'steps': 46095, 'loss/train': 1.5609126091003418} -08/30/2021 21:35:47 - INFO - __main__ - Step 46097: {'lr': 0.000398248391407606, 'samples': 8850624, 'steps': 46096, 'loss/train': 1.5165722370147705} -08/30/2021 21:35:47 - INFO - __main__ - Step 46098: {'lr': 0.0003982441183454627, 'samples': 8850816, 'steps': 46097, 'loss/train': 1.7708914279937744} -08/30/2021 21:35:48 - INFO - __main__ - Step 46099: {'lr': 0.0003982398452165228, 'samples': 8851008, 'steps': 46098, 'loss/train': 1.1890300512313843} -08/30/2021 21:35:48 - INFO - __main__ - Step 46100: {'lr': 0.0003982355720207884, 'samples': 8851200, 'steps': 46099, 'loss/train': 1.7634931802749634} -08/30/2021 21:35:50 - INFO - __main__ - Step 46101: {'lr': 0.00039823129875826127, 'samples': 8851392, 'steps': 46100, 'loss/train': 1.0142585039138794} -08/30/2021 21:35:50 - INFO - __main__ - Step 46102: {'lr': 0.0003982270254289435, 'samples': 8851584, 'steps': 46101, 'loss/train': 2.123687267303467} -08/30/2021 21:35:51 - INFO - __main__ - Step 46103: {'lr': 0.0003982227520328368, 'samples': 8851776, 'steps': 46102, 'loss/train': 1.2674418687820435} -08/30/2021 21:35:51 - INFO - __main__ - Step 46104: {'lr': 0.0003982184785699433, 'samples': 8851968, 'steps': 46103, 'loss/train': 1.8261513710021973} -08/30/2021 21:35:51 - INFO - __main__ - Step 46105: {'lr': 0.00039821420504026486, 'samples': 8852160, 'steps': 46104, 'loss/train': 1.1738165616989136} -08/30/2021 21:35:53 - INFO - __main__ - Step 46106: {'lr': 0.00039820993144380333, 'samples': 8852352, 'steps': 46105, 'loss/train': 1.0078974962234497} -08/30/2021 21:35:53 - INFO - __main__ - Step 46107: {'lr': 0.0003982056577805607, 'samples': 8852544, 'steps': 46106, 'loss/train': 0.9887067675590515} -08/30/2021 21:35:54 - INFO - __main__ - Step 46108: {'lr': 0.00039820138405053887, 'samples': 8852736, 'steps': 46107, 'loss/train': 1.2157014608383179} -08/30/2021 21:35:54 - INFO - __main__ - Step 46109: {'lr': 0.0003981971102537398, 'samples': 8852928, 'steps': 46108, 'loss/train': 1.0998417139053345} -08/30/2021 21:35:54 - INFO - __main__ - Step 46110: {'lr': 0.00039819283639016547, 'samples': 8853120, 'steps': 46109, 'loss/train': 1.6847704648971558} -08/30/2021 21:35:56 - INFO - __main__ - Step 46111: {'lr': 0.00039818856245981766, 'samples': 8853312, 'steps': 46110, 'loss/train': 1.3850125074386597} -08/30/2021 21:35:56 - INFO - __main__ - Step 46112: {'lr': 0.0003981842884626984, 'samples': 8853504, 'steps': 46111, 'loss/train': 0.20583832263946533} -08/30/2021 21:35:57 - INFO - __main__ - Step 46113: {'lr': 0.0003981800143988095, 'samples': 8853696, 'steps': 46112, 'loss/train': 1.6219192743301392} -08/30/2021 21:35:57 - INFO - __main__ - Step 46114: {'lr': 0.00039817574026815305, 'samples': 8853888, 'steps': 46113, 'loss/train': 1.994206190109253} -08/30/2021 21:35:57 - INFO - __main__ - Step 46115: {'lr': 0.0003981714660707309, 'samples': 8854080, 'steps': 46114, 'loss/train': 1.6100820302963257} -08/30/2021 21:35:59 - INFO - __main__ - Step 46116: {'lr': 0.00039816719180654493, 'samples': 8854272, 'steps': 46115, 'loss/train': 1.5760902166366577} -08/30/2021 21:36:00 - INFO - __main__ - Step 46117: {'lr': 0.0003981629174755972, 'samples': 8854464, 'steps': 46116, 'loss/train': 1.4815994501113892} -08/30/2021 21:36:00 - INFO - __main__ - Step 46118: {'lr': 0.0003981586430778895, 'samples': 8854656, 'steps': 46117, 'loss/train': 1.3517539501190186} -08/30/2021 21:36:00 - INFO - __main__ - Step 46119: {'lr': 0.0003981543686134238, 'samples': 8854848, 'steps': 46118, 'loss/train': 1.9788190126419067} -08/30/2021 21:36:01 - INFO - __main__ - Step 46120: {'lr': 0.000398150094082202, 'samples': 8855040, 'steps': 46119, 'loss/train': 0.6015864610671997} -08/30/2021 21:36:01 - INFO - __main__ - Step 46121: {'lr': 0.000398145819484226, 'samples': 8855232, 'steps': 46120, 'loss/train': 1.427643895149231} -08/30/2021 21:36:03 - INFO - __main__ - Step 46122: {'lr': 0.00039814154481949786, 'samples': 8855424, 'steps': 46121, 'loss/train': 0.10691922158002853} -08/30/2021 21:36:04 - INFO - __main__ - Step 46123: {'lr': 0.00039813727008801945, 'samples': 8855616, 'steps': 46122, 'loss/train': 0.900311291217804} -08/30/2021 21:36:04 - INFO - __main__ - Step 46124: {'lr': 0.00039813299528979263, 'samples': 8855808, 'steps': 46123, 'loss/train': 1.440889596939087} -08/30/2021 21:36:04 - INFO - __main__ - Step 46125: {'lr': 0.0003981287204248194, 'samples': 8856000, 'steps': 46124, 'loss/train': 1.5318527221679688} -08/30/2021 21:36:05 - INFO - __main__ - Step 46126: {'lr': 0.0003981244454931017, 'samples': 8856192, 'steps': 46125, 'loss/train': 1.2276725769042969} -08/30/2021 21:36:06 - INFO - __main__ - Step 46127: {'lr': 0.00039812017049464126, 'samples': 8856384, 'steps': 46126, 'loss/train': 1.801188349723816} -08/30/2021 21:36:07 - INFO - __main__ - Step 46128: {'lr': 0.0003981158954294403, 'samples': 8856576, 'steps': 46127, 'loss/train': 1.2678282260894775} -08/30/2021 21:36:07 - INFO - __main__ - Step 46129: {'lr': 0.00039811162029750047, 'samples': 8856768, 'steps': 46128, 'loss/train': 1.3311612606048584} -08/30/2021 21:36:07 - INFO - __main__ - Step 46130: {'lr': 0.00039810734509882395, 'samples': 8856960, 'steps': 46129, 'loss/train': 1.0655478239059448} -08/30/2021 21:36:08 - INFO - __main__ - Step 46131: {'lr': 0.0003981030698334125, 'samples': 8857152, 'steps': 46130, 'loss/train': 1.7195959091186523} -08/30/2021 21:36:09 - INFO - __main__ - Step 46132: {'lr': 0.00039809879450126805, 'samples': 8857344, 'steps': 46131, 'loss/train': 1.5221997499465942} -08/30/2021 21:36:10 - INFO - __main__ - Step 46133: {'lr': 0.00039809451910239257, 'samples': 8857536, 'steps': 46132, 'loss/train': 1.752462387084961} -08/30/2021 21:36:10 - INFO - __main__ - Step 46134: {'lr': 0.000398090243636788, 'samples': 8857728, 'steps': 46133, 'loss/train': 1.5113725662231445} -08/30/2021 21:36:10 - INFO - __main__ - Step 46135: {'lr': 0.00039808596810445636, 'samples': 8857920, 'steps': 46134, 'loss/train': 1.106951117515564} -08/30/2021 21:36:11 - INFO - __main__ - Step 46136: {'lr': 0.0003980816925053994, 'samples': 8858112, 'steps': 46135, 'loss/train': 1.3570268154144287} -08/30/2021 21:36:13 - INFO - __main__ - Step 46137: {'lr': 0.0003980774168396191, 'samples': 8858304, 'steps': 46136, 'loss/train': 0.6676763892173767} -08/30/2021 21:36:13 - INFO - __main__ - Step 46138: {'lr': 0.00039807314110711735, 'samples': 8858496, 'steps': 46137, 'loss/train': 1.039880633354187} -08/30/2021 21:36:14 - INFO - __main__ - Step 46139: {'lr': 0.0003980688653078962, 'samples': 8858688, 'steps': 46138, 'loss/train': 0.527498185634613} -08/30/2021 21:36:14 - INFO - __main__ - Step 46140: {'lr': 0.00039806458944195743, 'samples': 8858880, 'steps': 46139, 'loss/train': 1.460119605064392} -08/30/2021 21:36:14 - INFO - __main__ - Step 46141: {'lr': 0.00039806031350930315, 'samples': 8859072, 'steps': 46140, 'loss/train': 1.4636150598526} -08/30/2021 21:36:15 - INFO - __main__ - Step 46142: {'lr': 0.00039805603750993514, 'samples': 8859264, 'steps': 46141, 'loss/train': 0.8240839242935181} -08/30/2021 21:36:17 - INFO - __main__ - Step 46143: {'lr': 0.0003980517614438553, 'samples': 8859456, 'steps': 46142, 'loss/train': 0.1934243142604828} -08/30/2021 21:36:17 - INFO - __main__ - Step 46144: {'lr': 0.00039804748531106565, 'samples': 8859648, 'steps': 46143, 'loss/train': 0.29726606607437134} -08/30/2021 21:36:17 - INFO - __main__ - Step 46145: {'lr': 0.0003980432091115681, 'samples': 8859840, 'steps': 46144, 'loss/train': 1.9492334127426147} -08/30/2021 21:36:18 - INFO - __main__ - Step 46146: {'lr': 0.0003980389328453646, 'samples': 8860032, 'steps': 46145, 'loss/train': 1.390972375869751} -08/30/2021 21:36:18 - INFO - __main__ - Step 46147: {'lr': 0.00039803465651245694, 'samples': 8860224, 'steps': 46146, 'loss/train': 1.752730131149292} -08/30/2021 21:36:20 - INFO - __main__ - Step 46148: {'lr': 0.00039803038011284724, 'samples': 8860416, 'steps': 46147, 'loss/train': 1.2309606075286865} -08/30/2021 21:36:20 - INFO - __main__ - Step 46149: {'lr': 0.00039802610364653737, 'samples': 8860608, 'steps': 46148, 'loss/train': 1.667372703552246} -08/30/2021 21:36:20 - INFO - __main__ - Step 46150: {'lr': 0.00039802182711352906, 'samples': 8860800, 'steps': 46149, 'loss/train': 1.5557856559753418} -08/30/2021 21:36:21 - INFO - __main__ - Step 46151: {'lr': 0.0003980175505138246, 'samples': 8860992, 'steps': 46150, 'loss/train': 1.385726809501648} -08/30/2021 21:36:21 - INFO - __main__ - Step 46152: {'lr': 0.0003980132738474256, 'samples': 8861184, 'steps': 46151, 'loss/train': 1.421400547027588} -08/30/2021 21:36:23 - INFO - __main__ - Step 46153: {'lr': 0.0003980089971143341, 'samples': 8861376, 'steps': 46152, 'loss/train': 1.3695296049118042} -08/30/2021 21:36:24 - INFO - __main__ - Step 46154: {'lr': 0.000398004720314552, 'samples': 8861568, 'steps': 46153, 'loss/train': 1.2512880563735962} -08/30/2021 21:36:24 - INFO - __main__ - Step 46155: {'lr': 0.00039800044344808134, 'samples': 8861760, 'steps': 46154, 'loss/train': 1.1035337448120117} -08/30/2021 21:36:24 - INFO - __main__ - Step 46156: {'lr': 0.00039799616651492394, 'samples': 8861952, 'steps': 46155, 'loss/train': 1.1669267416000366} -08/30/2021 21:36:25 - INFO - __main__ - Step 46157: {'lr': 0.00039799188951508176, 'samples': 8862144, 'steps': 46156, 'loss/train': 1.2630959749221802} -08/30/2021 21:36:25 - INFO - __main__ - Step 46158: {'lr': 0.0003979876124485567, 'samples': 8862336, 'steps': 46157, 'loss/train': 0.9439281821250916} -08/30/2021 21:36:25 - INFO - __main__ - Step 46159: {'lr': 0.0003979833353153507, 'samples': 8862528, 'steps': 46158, 'loss/train': 1.7229725122451782} -08/30/2021 21:36:27 - INFO - __main__ - Step 46160: {'lr': 0.00039797905811546564, 'samples': 8862720, 'steps': 46159, 'loss/train': 1.7560029029846191} -08/30/2021 21:36:27 - INFO - __main__ - Step 46161: {'lr': 0.0003979747808489036, 'samples': 8862912, 'steps': 46160, 'loss/train': 1.4252433776855469} -08/30/2021 21:36:28 - INFO - __main__ - Step 46162: {'lr': 0.0003979705035156663, 'samples': 8863104, 'steps': 46161, 'loss/train': 1.0816069841384888} -08/30/2021 21:36:28 - INFO - __main__ - Step 46163: {'lr': 0.0003979662261157558, 'samples': 8863296, 'steps': 46162, 'loss/train': 1.4421778917312622} -08/30/2021 21:36:28 - INFO - __main__ - Step 46164: {'lr': 0.00039796194864917414, 'samples': 8863488, 'steps': 46163, 'loss/train': 1.2068511247634888} -08/30/2021 21:36:30 - INFO - __main__ - Step 46165: {'lr': 0.00039795767111592303, 'samples': 8863680, 'steps': 46164, 'loss/train': 1.4976835250854492} -08/30/2021 21:36:30 - INFO - __main__ - Step 46166: {'lr': 0.00039795339351600444, 'samples': 8863872, 'steps': 46165, 'loss/train': 1.525852918624878} -08/30/2021 21:36:31 - INFO - __main__ - Step 46167: {'lr': 0.0003979491158494203, 'samples': 8864064, 'steps': 46166, 'loss/train': 0.6323105096817017} -08/30/2021 21:36:31 - INFO - __main__ - Step 46168: {'lr': 0.00039794483811617267, 'samples': 8864256, 'steps': 46167, 'loss/train': 1.0992785692214966} -08/30/2021 21:36:31 - INFO - __main__ - Step 46169: {'lr': 0.0003979405603162633, 'samples': 8864448, 'steps': 46168, 'loss/train': 0.6095963716506958} -08/30/2021 21:36:33 - INFO - __main__ - Step 46170: {'lr': 0.0003979362824496942, 'samples': 8864640, 'steps': 46169, 'loss/train': 1.1593022346496582} -08/30/2021 21:36:34 - INFO - __main__ - Step 46171: {'lr': 0.00039793200451646737, 'samples': 8864832, 'steps': 46170, 'loss/train': 2.0511343479156494} -08/30/2021 21:36:34 - INFO - __main__ - Step 46172: {'lr': 0.0003979277265165846, 'samples': 8865024, 'steps': 46171, 'loss/train': 0.8530001640319824} -08/30/2021 21:36:34 - INFO - __main__ - Step 46173: {'lr': 0.00039792344845004793, 'samples': 8865216, 'steps': 46172, 'loss/train': 0.21832449734210968} -08/30/2021 21:36:35 - INFO - __main__ - Step 46174: {'lr': 0.00039791917031685914, 'samples': 8865408, 'steps': 46173, 'loss/train': 1.4622730016708374} -08/30/2021 21:36:35 - INFO - __main__ - Step 46175: {'lr': 0.0003979148921170203, 'samples': 8865600, 'steps': 46174, 'loss/train': 1.5187691450119019} -08/30/2021 21:36:37 - INFO - __main__ - Step 46176: {'lr': 0.0003979106138505333, 'samples': 8865792, 'steps': 46175, 'loss/train': 0.1938311755657196} -08/30/2021 21:36:38 - INFO - __main__ - Step 46177: {'lr': 0.00039790633551740006, 'samples': 8865984, 'steps': 46176, 'loss/train': 1.7372809648513794} -08/30/2021 21:36:38 - INFO - __main__ - Step 46178: {'lr': 0.0003979020571176226, 'samples': 8866176, 'steps': 46177, 'loss/train': 1.3579798936843872} -08/30/2021 21:36:38 - INFO - __main__ - Step 46179: {'lr': 0.00039789777865120257, 'samples': 8866368, 'steps': 46178, 'loss/train': 1.2651915550231934} -08/30/2021 21:36:39 - INFO - __main__ - Step 46180: {'lr': 0.0003978935001181422, 'samples': 8866560, 'steps': 46179, 'loss/train': 0.8050438761711121} -08/30/2021 21:36:40 - INFO - __main__ - Step 46181: {'lr': 0.0003978892215184433, 'samples': 8866752, 'steps': 46180, 'loss/train': 1.3935328722000122} -08/30/2021 21:36:41 - INFO - __main__ - Step 46182: {'lr': 0.00039788494285210774, 'samples': 8866944, 'steps': 46181, 'loss/train': 1.5677921772003174} -08/30/2021 21:36:41 - INFO - __main__ - Step 46183: {'lr': 0.0003978806641191376, 'samples': 8867136, 'steps': 46182, 'loss/train': 1.093623399734497} -08/30/2021 21:36:41 - INFO - __main__ - Step 46184: {'lr': 0.0003978763853195346, 'samples': 8867328, 'steps': 46183, 'loss/train': 1.6276055574417114} -08/30/2021 21:36:42 - INFO - __main__ - Step 46185: {'lr': 0.0003978721064533009, 'samples': 8867520, 'steps': 46184, 'loss/train': 0.7652538418769836} -08/30/2021 21:36:43 - INFO - __main__ - Step 46186: {'lr': 0.0003978678275204383, 'samples': 8867712, 'steps': 46185, 'loss/train': 1.3193808794021606} -08/30/2021 21:36:44 - INFO - __main__ - Step 46187: {'lr': 0.00039786354852094864, 'samples': 8867904, 'steps': 46186, 'loss/train': 1.2814688682556152} -08/30/2021 21:36:44 - INFO - __main__ - Step 46188: {'lr': 0.00039785926945483396, 'samples': 8868096, 'steps': 46187, 'loss/train': 1.363050103187561} -08/30/2021 21:36:44 - INFO - __main__ - Step 46189: {'lr': 0.00039785499032209625, 'samples': 8868288, 'steps': 46188, 'loss/train': 1.6129274368286133} -08/30/2021 21:36:45 - INFO - __main__ - Step 46190: {'lr': 0.0003978507111227373, 'samples': 8868480, 'steps': 46189, 'loss/train': 1.592990756034851} -08/30/2021 21:36:46 - INFO - __main__ - Step 46191: {'lr': 0.00039784643185675916, 'samples': 8868672, 'steps': 46190, 'loss/train': 1.0570385456085205} -08/30/2021 21:36:47 - INFO - __main__ - Step 46192: {'lr': 0.0003978421525241637, 'samples': 8868864, 'steps': 46191, 'loss/train': 1.2486673593521118} -08/30/2021 21:36:47 - INFO - __main__ - Step 46193: {'lr': 0.00039783787312495277, 'samples': 8869056, 'steps': 46192, 'loss/train': 1.3574209213256836} -08/30/2021 21:36:47 - INFO - __main__ - Step 46194: {'lr': 0.0003978335936591284, 'samples': 8869248, 'steps': 46193, 'loss/train': 1.377662181854248} -08/30/2021 21:36:48 - INFO - __main__ - Step 46195: {'lr': 0.00039782931412669253, 'samples': 8869440, 'steps': 46194, 'loss/train': 1.480639934539795} -08/30/2021 21:36:49 - INFO - __main__ - Step 46196: {'lr': 0.000397825034527647, 'samples': 8869632, 'steps': 46195, 'loss/train': 1.0930739641189575} -08/30/2021 21:36:50 - INFO - __main__ - Step 46197: {'lr': 0.0003978207548619939, 'samples': 8869824, 'steps': 46196, 'loss/train': 1.1441224813461304} -08/30/2021 21:36:50 - INFO - __main__ - Step 46198: {'lr': 0.000397816475129735, 'samples': 8870016, 'steps': 46197, 'loss/train': 1.2958287000656128} -08/30/2021 21:36:50 - INFO - __main__ - Step 46199: {'lr': 0.0003978121953308722, 'samples': 8870208, 'steps': 46198, 'loss/train': 0.08704115450382233} -08/30/2021 21:36:51 - INFO - __main__ - Step 46200: {'lr': 0.0003978079154654075, 'samples': 8870400, 'steps': 46199, 'loss/train': 1.887276530265808} -08/30/2021 21:36:52 - INFO - __main__ - Step 46201: {'lr': 0.000397803635533343, 'samples': 8870592, 'steps': 46200, 'loss/train': 1.4722938537597656} -08/30/2021 21:36:53 - INFO - __main__ - Step 46202: {'lr': 0.00039779935553468026, 'samples': 8870784, 'steps': 46201, 'loss/train': 0.962514340877533} -08/30/2021 21:36:53 - INFO - __main__ - Step 46203: {'lr': 0.0003977950754694215, 'samples': 8870976, 'steps': 46202, 'loss/train': 1.211369276046753} -08/30/2021 21:36:53 - INFO - __main__ - Step 46204: {'lr': 0.00039779079533756856, 'samples': 8871168, 'steps': 46203, 'loss/train': 0.9213801026344299} -08/30/2021 21:36:54 - INFO - __main__ - Step 46205: {'lr': 0.00039778651513912343, 'samples': 8871360, 'steps': 46204, 'loss/train': 1.4540120363235474} -08/30/2021 21:36:55 - INFO - __main__ - Step 46206: {'lr': 0.00039778223487408796, 'samples': 8871552, 'steps': 46205, 'loss/train': 1.5263670682907104} -08/30/2021 21:36:56 - INFO - __main__ - Step 46207: {'lr': 0.000397777954542464, 'samples': 8871744, 'steps': 46206, 'loss/train': 1.5929806232452393} -08/30/2021 21:36:56 - INFO - __main__ - Step 46208: {'lr': 0.0003977736741442537, 'samples': 8871936, 'steps': 46207, 'loss/train': 0.9667959809303284} -08/30/2021 21:36:57 - INFO - __main__ - Step 46209: {'lr': 0.00039776939367945874, 'samples': 8872128, 'steps': 46208, 'loss/train': 0.7413719296455383} -08/30/2021 21:36:57 - INFO - __main__ - Step 46210: {'lr': 0.00039776511314808125, 'samples': 8872320, 'steps': 46209, 'loss/train': 1.5515624284744263} -08/30/2021 21:36:59 - INFO - __main__ - Step 46211: {'lr': 0.00039776083255012307, 'samples': 8872512, 'steps': 46210, 'loss/train': 1.241766095161438} -08/30/2021 21:36:59 - INFO - __main__ - Step 46212: {'lr': 0.0003977565518855861, 'samples': 8872704, 'steps': 46211, 'loss/train': 1.7987287044525146} -08/30/2021 21:36:59 - INFO - __main__ - Step 46213: {'lr': 0.0003977522711544723, 'samples': 8872896, 'steps': 46212, 'loss/train': 1.8362617492675781} -08/30/2021 21:37:00 - INFO - __main__ - Step 46214: {'lr': 0.00039774799035678367, 'samples': 8873088, 'steps': 46213, 'loss/train': 1.6681052446365356} -08/30/2021 21:37:00 - INFO - __main__ - Step 46215: {'lr': 0.000397743709492522, 'samples': 8873280, 'steps': 46214, 'loss/train': 1.1651482582092285} -08/30/2021 21:37:00 - INFO - __main__ - Step 46216: {'lr': 0.0003977394285616893, 'samples': 8873472, 'steps': 46215, 'loss/train': 1.7766283750534058} -08/30/2021 21:37:02 - INFO - __main__ - Step 46217: {'lr': 0.0003977351475642876, 'samples': 8873664, 'steps': 46216, 'loss/train': 1.6095948219299316} -08/30/2021 21:37:02 - INFO - __main__ - Step 46218: {'lr': 0.00039773086650031866, 'samples': 8873856, 'steps': 46217, 'loss/train': 1.8161734342575073} -08/30/2021 21:37:03 - INFO - __main__ - Step 46219: {'lr': 0.00039772658536978443, 'samples': 8874048, 'steps': 46218, 'loss/train': 2.2312960624694824} -08/30/2021 21:37:03 - INFO - __main__ - Step 46220: {'lr': 0.00039772230417268697, 'samples': 8874240, 'steps': 46219, 'loss/train': 1.3596910238265991} -08/30/2021 21:37:03 - INFO - __main__ - Step 46221: {'lr': 0.00039771802290902806, 'samples': 8874432, 'steps': 46220, 'loss/train': 1.7038460969924927} -08/30/2021 21:37:05 - INFO - __main__ - Step 46222: {'lr': 0.0003977137415788097, 'samples': 8874624, 'steps': 46221, 'loss/train': 1.1598373651504517} -08/30/2021 21:37:06 - INFO - __main__ - Step 46223: {'lr': 0.00039770946018203375, 'samples': 8874816, 'steps': 46222, 'loss/train': 1.12007737159729} -08/30/2021 21:37:06 - INFO - __main__ - Step 46224: {'lr': 0.00039770517871870226, 'samples': 8875008, 'steps': 46223, 'loss/train': 1.3621773719787598} -08/30/2021 21:37:06 - INFO - __main__ - Step 46225: {'lr': 0.00039770089718881707, 'samples': 8875200, 'steps': 46224, 'loss/train': 1.7137166261672974} -08/30/2021 21:37:07 - INFO - __main__ - Step 46226: {'lr': 0.00039769661559238014, 'samples': 8875392, 'steps': 46225, 'loss/train': 2.332510232925415} -08/30/2021 21:37:09 - INFO - __main__ - Step 46227: {'lr': 0.0003976923339293934, 'samples': 8875584, 'steps': 46226, 'loss/train': 1.9135557413101196} -08/30/2021 21:37:09 - INFO - __main__ - Step 46228: {'lr': 0.0003976880521998588, 'samples': 8875776, 'steps': 46227, 'loss/train': 1.3628970384597778} -08/30/2021 21:37:10 - INFO - __main__ - Step 46229: {'lr': 0.00039768377040377823, 'samples': 8875968, 'steps': 46228, 'loss/train': 1.220140814781189} -08/30/2021 21:37:10 - INFO - __main__ - Step 46230: {'lr': 0.00039767948854115356, 'samples': 8876160, 'steps': 46229, 'loss/train': 1.4693472385406494} -08/30/2021 21:37:10 - INFO - __main__ - Step 46231: {'lr': 0.0003976752066119869, 'samples': 8876352, 'steps': 46230, 'loss/train': 0.8738886713981628} -08/30/2021 21:37:12 - INFO - __main__ - Step 46232: {'lr': 0.00039767092461628, 'samples': 8876544, 'steps': 46231, 'loss/train': 1.5112401247024536} -08/30/2021 21:37:12 - INFO - __main__ - Step 46233: {'lr': 0.0003976666425540349, 'samples': 8876736, 'steps': 46232, 'loss/train': 1.237876296043396} -08/30/2021 21:37:13 - INFO - __main__ - Step 46234: {'lr': 0.00039766236042525346, 'samples': 8876928, 'steps': 46233, 'loss/train': 1.1422197818756104} -08/30/2021 21:37:13 - INFO - __main__ - Step 46235: {'lr': 0.0003976580782299376, 'samples': 8877120, 'steps': 46234, 'loss/train': 0.8942980170249939} -08/30/2021 21:37:13 - INFO - __main__ - Step 46236: {'lr': 0.0003976537959680894, 'samples': 8877312, 'steps': 46235, 'loss/train': 0.6486141085624695} -08/30/2021 21:37:14 - INFO - __main__ - Step 46237: {'lr': 0.0003976495136397106, 'samples': 8877504, 'steps': 46236, 'loss/train': 1.5675405263900757} -08/30/2021 21:37:15 - INFO - __main__ - Step 46238: {'lr': 0.0003976452312448032, 'samples': 8877696, 'steps': 46237, 'loss/train': 0.45567041635513306} -08/30/2021 21:37:16 - INFO - __main__ - Step 46239: {'lr': 0.0003976409487833692, 'samples': 8877888, 'steps': 46238, 'loss/train': 0.8916254043579102} -08/30/2021 21:37:16 - INFO - __main__ - Step 46240: {'lr': 0.0003976366662554104, 'samples': 8878080, 'steps': 46239, 'loss/train': 1.6405450105667114} -08/30/2021 21:37:16 - INFO - __main__ - Step 46241: {'lr': 0.0003976323836609288, 'samples': 8878272, 'steps': 46240, 'loss/train': 1.2557779550552368} -08/30/2021 21:37:17 - INFO - __main__ - Step 46242: {'lr': 0.00039762810099992644, 'samples': 8878464, 'steps': 46241, 'loss/train': 1.4504786729812622} -08/30/2021 21:37:18 - INFO - __main__ - Step 46243: {'lr': 0.00039762381827240496, 'samples': 8878656, 'steps': 46242, 'loss/train': 0.8763937950134277} -08/30/2021 21:37:19 - INFO - __main__ - Step 46244: {'lr': 0.00039761953547836655, 'samples': 8878848, 'steps': 46243, 'loss/train': 1.3108327388763428} -08/30/2021 21:37:19 - INFO - __main__ - Step 46245: {'lr': 0.00039761525261781304, 'samples': 8879040, 'steps': 46244, 'loss/train': 1.341046929359436} -08/30/2021 21:37:19 - INFO - __main__ - Step 46246: {'lr': 0.00039761096969074644, 'samples': 8879232, 'steps': 46245, 'loss/train': 2.0777194499969482} -08/30/2021 21:37:20 - INFO - __main__ - Step 46247: {'lr': 0.0003976066866971686, 'samples': 8879424, 'steps': 46246, 'loss/train': 2.3430278301239014} -08/30/2021 21:37:22 - INFO - __main__ - Step 46248: {'lr': 0.0003976024036370814, 'samples': 8879616, 'steps': 46247, 'loss/train': 1.6097919940948486} -08/30/2021 21:37:22 - INFO - __main__ - Step 46249: {'lr': 0.0003975981205104868, 'samples': 8879808, 'steps': 46248, 'loss/train': 1.5714012384414673} -08/30/2021 21:37:23 - INFO - __main__ - Step 46250: {'lr': 0.0003975938373173868, 'samples': 8880000, 'steps': 46249, 'loss/train': 1.0613620281219482} -08/30/2021 21:37:23 - INFO - __main__ - Step 46251: {'lr': 0.00039758955405778344, 'samples': 8880192, 'steps': 46250, 'loss/train': 1.2717669010162354} -08/30/2021 21:37:23 - INFO - __main__ - Step 46252: {'lr': 0.0003975852707316784, 'samples': 8880384, 'steps': 46251, 'loss/train': 0.6949333548545837} -08/30/2021 21:37:25 - INFO - __main__ - Step 46253: {'lr': 0.00039758098733907364, 'samples': 8880576, 'steps': 46252, 'loss/train': 1.4614229202270508} -08/30/2021 21:37:26 - INFO - __main__ - Step 46254: {'lr': 0.00039757670387997125, 'samples': 8880768, 'steps': 46253, 'loss/train': 1.3671222925186157} -08/30/2021 21:37:26 - INFO - __main__ - Step 46255: {'lr': 0.000397572420354373, 'samples': 8880960, 'steps': 46254, 'loss/train': 1.1175525188446045} -08/30/2021 21:37:26 - INFO - __main__ - Step 46256: {'lr': 0.00039756813676228097, 'samples': 8881152, 'steps': 46255, 'loss/train': 0.03302577883005142} -08/30/2021 21:37:27 - INFO - __main__ - Step 46257: {'lr': 0.00039756385310369703, 'samples': 8881344, 'steps': 46256, 'loss/train': 1.6000744104385376} -08/30/2021 21:37:27 - INFO - __main__ - Step 46258: {'lr': 0.00039755956937862305, 'samples': 8881536, 'steps': 46257, 'loss/train': 1.1022528409957886} -08/30/2021 21:37:28 - INFO - __main__ - Step 46259: {'lr': 0.000397555285587061, 'samples': 8881728, 'steps': 46258, 'loss/train': 1.7841720581054688} -08/30/2021 21:37:29 - INFO - __main__ - Step 46260: {'lr': 0.0003975510017290128, 'samples': 8881920, 'steps': 46259, 'loss/train': 1.7257399559020996} -08/30/2021 21:37:29 - INFO - __main__ - Step 46261: {'lr': 0.00039754671780448044, 'samples': 8882112, 'steps': 46260, 'loss/train': 1.54389488697052} -08/30/2021 21:37:30 - INFO - __main__ - Step 46262: {'lr': 0.00039754243381346575, 'samples': 8882304, 'steps': 46261, 'loss/train': 1.3437176942825317} -08/30/2021 21:37:30 - INFO - __main__ - Step 46263: {'lr': 0.0003975381497559708, 'samples': 8882496, 'steps': 46262, 'loss/train': 1.2379319667816162} -08/30/2021 21:37:32 - INFO - __main__ - Step 46264: {'lr': 0.00039753386563199733, 'samples': 8882688, 'steps': 46263, 'loss/train': 1.2745450735092163} -08/30/2021 21:37:32 - INFO - __main__ - Step 46265: {'lr': 0.0003975295814415475, 'samples': 8882880, 'steps': 46264, 'loss/train': 1.6064344644546509} -08/30/2021 21:37:32 - INFO - __main__ - Step 46266: {'lr': 0.000397525297184623, 'samples': 8883072, 'steps': 46265, 'loss/train': 1.5587611198425293} -08/30/2021 21:37:33 - INFO - __main__ - Step 46267: {'lr': 0.000397521012861226, 'samples': 8883264, 'steps': 46266, 'loss/train': 1.1561015844345093} -08/30/2021 21:37:33 - INFO - __main__ - Step 46268: {'lr': 0.0003975167284713582, 'samples': 8883456, 'steps': 46267, 'loss/train': 0.9928433299064636} -08/30/2021 21:37:33 - INFO - __main__ - Step 46269: {'lr': 0.0003975124440150217, 'samples': 8883648, 'steps': 46268, 'loss/train': 1.107236385345459} -08/30/2021 21:37:35 - INFO - __main__ - Step 46270: {'lr': 0.0003975081594922183, 'samples': 8883840, 'steps': 46269, 'loss/train': 1.228446364402771} -08/30/2021 21:37:35 - INFO - __main__ - Step 46271: {'lr': 0.00039750387490295006, 'samples': 8884032, 'steps': 46270, 'loss/train': 1.3913148641586304} -08/30/2021 21:37:36 - INFO - __main__ - Step 46272: {'lr': 0.00039749959024721883, 'samples': 8884224, 'steps': 46271, 'loss/train': 1.6982171535491943} -08/30/2021 21:37:36 - INFO - __main__ - Step 46273: {'lr': 0.00039749530552502654, 'samples': 8884416, 'steps': 46272, 'loss/train': 1.3710078001022339} -08/30/2021 21:37:36 - INFO - __main__ - Step 46274: {'lr': 0.0003974910207363752, 'samples': 8884608, 'steps': 46273, 'loss/train': 1.2208378314971924} -08/30/2021 21:37:38 - INFO - __main__ - Step 46275: {'lr': 0.00039748673588126674, 'samples': 8884800, 'steps': 46274, 'loss/train': 1.2052921056747437} -08/30/2021 21:37:39 - INFO - __main__ - Step 46276: {'lr': 0.00039748245095970285, 'samples': 8884992, 'steps': 46275, 'loss/train': 1.2287741899490356} -08/30/2021 21:37:39 - INFO - __main__ - Step 46277: {'lr': 0.0003974781659716857, 'samples': 8885184, 'steps': 46276, 'loss/train': 1.2335220575332642} -08/30/2021 21:37:39 - INFO - __main__ - Step 46278: {'lr': 0.00039747388091721723, 'samples': 8885376, 'steps': 46277, 'loss/train': 1.5257847309112549} -08/30/2021 21:37:40 - INFO - __main__ - Step 46279: {'lr': 0.00039746959579629924, 'samples': 8885568, 'steps': 46278, 'loss/train': 1.1049121618270874} -08/30/2021 21:37:40 - INFO - __main__ - Step 46280: {'lr': 0.00039746531060893387, 'samples': 8885760, 'steps': 46279, 'loss/train': 1.31150484085083} -08/30/2021 21:37:41 - INFO - __main__ - Step 46281: {'lr': 0.00039746102535512273, 'samples': 8885952, 'steps': 46280, 'loss/train': 0.13650427758693695} -08/30/2021 21:37:42 - INFO - __main__ - Step 46282: {'lr': 0.000397456740034868, 'samples': 8886144, 'steps': 46281, 'loss/train': 0.8148044943809509} -08/30/2021 21:37:42 - INFO - __main__ - Step 46283: {'lr': 0.00039745245464817156, 'samples': 8886336, 'steps': 46282, 'loss/train': 1.9434828758239746} -08/30/2021 21:37:43 - INFO - __main__ - Step 46284: {'lr': 0.0003974481691950352, 'samples': 8886528, 'steps': 46283, 'loss/train': 1.0992425680160522} -08/30/2021 21:37:43 - INFO - __main__ - Step 46285: {'lr': 0.00039744388367546113, 'samples': 8886720, 'steps': 46284, 'loss/train': 1.3984664678573608} -08/30/2021 21:37:45 - INFO - __main__ - Step 46286: {'lr': 0.0003974395980894511, 'samples': 8886912, 'steps': 46285, 'loss/train': 1.708347201347351} -08/30/2021 21:37:46 - INFO - __main__ - Step 46287: {'lr': 0.000397435312437007, 'samples': 8887104, 'steps': 46286, 'loss/train': 1.7272266149520874} -08/30/2021 21:37:46 - INFO - __main__ - Step 46288: {'lr': 0.0003974310267181308, 'samples': 8887296, 'steps': 46287, 'loss/train': 1.528700351715088} -08/30/2021 21:37:47 - INFO - __main__ - Step 46289: {'lr': 0.00039742674093282447, 'samples': 8887488, 'steps': 46288, 'loss/train': 1.1809642314910889} -08/30/2021 21:37:47 - INFO - __main__ - Step 46290: {'lr': 0.00039742245508109, 'samples': 8887680, 'steps': 46289, 'loss/train': 1.0454107522964478} -08/30/2021 21:37:47 - INFO - __main__ - Step 46291: {'lr': 0.0003974181691629292, 'samples': 8887872, 'steps': 46290, 'loss/train': 0.8907452821731567} -08/30/2021 21:37:49 - INFO - __main__ - Step 46292: {'lr': 0.00039741388317834404, 'samples': 8888064, 'steps': 46291, 'loss/train': 1.265981674194336} -08/30/2021 21:37:49 - INFO - __main__ - Step 46293: {'lr': 0.0003974095971273365, 'samples': 8888256, 'steps': 46292, 'loss/train': 1.664109230041504} -08/30/2021 21:37:50 - INFO - __main__ - Step 46294: {'lr': 0.0003974053110099084, 'samples': 8888448, 'steps': 46293, 'loss/train': 0.955172061920166} -08/30/2021 21:37:50 - INFO - __main__ - Step 46295: {'lr': 0.00039740102482606175, 'samples': 8888640, 'steps': 46294, 'loss/train': 0.922761857509613} -08/30/2021 21:37:50 - INFO - __main__ - Step 46296: {'lr': 0.0003973967385757985, 'samples': 8888832, 'steps': 46295, 'loss/train': 1.448323369026184} -08/30/2021 21:37:52 - INFO - __main__ - Step 46297: {'lr': 0.00039739245225912055, 'samples': 8889024, 'steps': 46296, 'loss/train': 0.8080700039863586} -08/30/2021 21:37:52 - INFO - __main__ - Step 46298: {'lr': 0.0003973881658760298, 'samples': 8889216, 'steps': 46297, 'loss/train': 5.871662139892578} -08/30/2021 21:37:53 - INFO - __main__ - Step 46299: {'lr': 0.0003973838794265283, 'samples': 8889408, 'steps': 46298, 'loss/train': 1.580929160118103} -08/30/2021 21:37:53 - INFO - __main__ - Step 46300: {'lr': 0.00039737959291061785, 'samples': 8889600, 'steps': 46299, 'loss/train': 1.277411699295044} -08/30/2021 21:37:53 - INFO - __main__ - Step 46301: {'lr': 0.00039737530632830045, 'samples': 8889792, 'steps': 46300, 'loss/train': 0.9611787796020508} -08/30/2021 21:37:55 - INFO - __main__ - Step 46302: {'lr': 0.000397371019679578, 'samples': 8889984, 'steps': 46301, 'loss/train': 1.0047014951705933} -08/30/2021 21:37:55 - INFO - __main__ - Step 46303: {'lr': 0.00039736673296445233, 'samples': 8890176, 'steps': 46302, 'loss/train': 0.8591474890708923} -08/30/2021 21:37:56 - INFO - __main__ - Step 46304: {'lr': 0.00039736244618292563, 'samples': 8890368, 'steps': 46303, 'loss/train': 1.2880016565322876} -08/30/2021 21:37:56 - INFO - __main__ - Step 46305: {'lr': 0.0003973581593349997, 'samples': 8890560, 'steps': 46304, 'loss/train': 1.2761203050613403} -08/30/2021 21:37:56 - INFO - __main__ - Step 46306: {'lr': 0.00039735387242067637, 'samples': 8890752, 'steps': 46305, 'loss/train': 1.420340895652771} -08/30/2021 21:37:58 - INFO - __main__ - Step 46307: {'lr': 0.0003973495854399577, 'samples': 8890944, 'steps': 46306, 'loss/train': 1.4159529209136963} -08/30/2021 21:37:58 - INFO - __main__ - Step 46308: {'lr': 0.0003973452983928456, 'samples': 8891136, 'steps': 46307, 'loss/train': 1.291045069694519} -08/30/2021 21:37:59 - INFO - __main__ - Step 46309: {'lr': 0.00039734101127934194, 'samples': 8891328, 'steps': 46308, 'loss/train': 1.4797084331512451} -08/30/2021 21:37:59 - INFO - __main__ - Step 46310: {'lr': 0.0003973367240994487, 'samples': 8891520, 'steps': 46309, 'loss/train': 1.1744816303253174} -08/30/2021 21:38:00 - INFO - __main__ - Step 46311: {'lr': 0.00039733243685316776, 'samples': 8891712, 'steps': 46310, 'loss/train': 1.0302352905273438} -08/30/2021 21:38:00 - INFO - __main__ - Step 46312: {'lr': 0.00039732814954050125, 'samples': 8891904, 'steps': 46311, 'loss/train': 1.0603570938110352} -08/30/2021 21:38:01 - INFO - __main__ - Step 46313: {'lr': 0.0003973238621614508, 'samples': 8892096, 'steps': 46312, 'loss/train': 1.2772960662841797} -08/30/2021 21:38:02 - INFO - __main__ - Step 46314: {'lr': 0.0003973195747160185, 'samples': 8892288, 'steps': 46313, 'loss/train': 1.4406161308288574} -08/30/2021 21:38:02 - INFO - __main__ - Step 46315: {'lr': 0.00039731528720420635, 'samples': 8892480, 'steps': 46314, 'loss/train': 1.1468085050582886} -08/30/2021 21:38:03 - INFO - __main__ - Step 46316: {'lr': 0.00039731099962601613, 'samples': 8892672, 'steps': 46315, 'loss/train': 1.6534302234649658} -08/30/2021 21:38:03 - INFO - __main__ - Step 46317: {'lr': 0.0003973067119814499, 'samples': 8892864, 'steps': 46316, 'loss/train': 1.471175193786621} -08/30/2021 21:38:05 - INFO - __main__ - Step 46318: {'lr': 0.00039730242427050955, 'samples': 8893056, 'steps': 46317, 'loss/train': 1.638662338256836} -08/30/2021 21:38:05 - INFO - __main__ - Step 46319: {'lr': 0.00039729813649319704, 'samples': 8893248, 'steps': 46318, 'loss/train': 1.3218716382980347} -08/30/2021 21:38:05 - INFO - __main__ - Step 46320: {'lr': 0.0003972938486495141, 'samples': 8893440, 'steps': 46319, 'loss/train': 1.574557900428772} -08/30/2021 21:38:06 - INFO - __main__ - Step 46321: {'lr': 0.000397289560739463, 'samples': 8893632, 'steps': 46320, 'loss/train': 1.5087918043136597} -08/30/2021 21:38:06 - INFO - __main__ - Step 46322: {'lr': 0.0003972852727630454, 'samples': 8893824, 'steps': 46321, 'loss/train': 0.4920039474964142} -08/30/2021 21:38:08 - INFO - __main__ - Step 46323: {'lr': 0.0003972809847202633, 'samples': 8894016, 'steps': 46322, 'loss/train': 1.6612825393676758} -08/30/2021 21:38:08 - INFO - __main__ - Step 46324: {'lr': 0.0003972766966111187, 'samples': 8894208, 'steps': 46323, 'loss/train': 1.1593036651611328} -08/30/2021 21:38:09 - INFO - __main__ - Step 46325: {'lr': 0.0003972724084356135, 'samples': 8894400, 'steps': 46324, 'loss/train': 0.040521807968616486} -08/30/2021 21:38:09 - INFO - __main__ - Step 46326: {'lr': 0.0003972681201937497, 'samples': 8894592, 'steps': 46325, 'loss/train': 1.5153847932815552} -08/30/2021 21:38:09 - INFO - __main__ - Step 46327: {'lr': 0.00039726383188552907, 'samples': 8894784, 'steps': 46326, 'loss/train': 1.453345775604248} -08/30/2021 21:38:11 - INFO - __main__ - Step 46328: {'lr': 0.0003972595435109536, 'samples': 8894976, 'steps': 46327, 'loss/train': 1.4819231033325195} -08/30/2021 21:38:11 - INFO - __main__ - Step 46329: {'lr': 0.0003972552550700253, 'samples': 8895168, 'steps': 46328, 'loss/train': 1.424748182296753} -08/30/2021 21:38:12 - INFO - __main__ - Step 46330: {'lr': 0.00039725096656274605, 'samples': 8895360, 'steps': 46329, 'loss/train': 1.365673542022705} -08/30/2021 21:38:12 - INFO - __main__ - Step 46331: {'lr': 0.0003972466779891178, 'samples': 8895552, 'steps': 46330, 'loss/train': 1.0477070808410645} -08/30/2021 21:38:12 - INFO - __main__ - Step 46332: {'lr': 0.00039724238934914246, 'samples': 8895744, 'steps': 46331, 'loss/train': 0.24520935118198395} -08/30/2021 21:38:14 - INFO - __main__ - Step 46333: {'lr': 0.00039723810064282194, 'samples': 8895936, 'steps': 46332, 'loss/train': 1.0881191492080688} -08/30/2021 21:38:14 - INFO - __main__ - Step 46334: {'lr': 0.00039723381187015827, 'samples': 8896128, 'steps': 46333, 'loss/train': 0.9277474284172058} -08/30/2021 21:38:14 - INFO - __main__ - Step 46335: {'lr': 0.00039722952303115325, 'samples': 8896320, 'steps': 46334, 'loss/train': 0.9513620734214783} -08/30/2021 21:38:15 - INFO - __main__ - Step 46336: {'lr': 0.00039722523412580893, 'samples': 8896512, 'steps': 46335, 'loss/train': 1.427181363105774} -08/30/2021 21:38:15 - INFO - __main__ - Step 46337: {'lr': 0.00039722094515412716, 'samples': 8896704, 'steps': 46336, 'loss/train': 1.63276207447052} -08/30/2021 21:38:17 - INFO - __main__ - Step 46338: {'lr': 0.0003972166561161099, 'samples': 8896896, 'steps': 46337, 'loss/train': 1.3761049509048462} -08/30/2021 21:38:18 - INFO - __main__ - Step 46339: {'lr': 0.0003972123670117591, 'samples': 8897088, 'steps': 46338, 'loss/train': 0.9049459099769592} -08/30/2021 21:38:18 - INFO - __main__ - Step 46340: {'lr': 0.0003972080778410767, 'samples': 8897280, 'steps': 46339, 'loss/train': 1.4141075611114502} -08/30/2021 21:38:18 - INFO - __main__ - Step 46341: {'lr': 0.0003972037886040646, 'samples': 8897472, 'steps': 46340, 'loss/train': 1.6987277269363403} -08/30/2021 21:38:19 - INFO - __main__ - Step 46342: {'lr': 0.0003971994993007247, 'samples': 8897664, 'steps': 46341, 'loss/train': 1.3541159629821777} -08/30/2021 21:38:20 - INFO - __main__ - Step 46343: {'lr': 0.000397195209931059, 'samples': 8897856, 'steps': 46342, 'loss/train': 1.1848081350326538} -08/30/2021 21:38:21 - INFO - __main__ - Step 46344: {'lr': 0.00039719092049506945, 'samples': 8898048, 'steps': 46343, 'loss/train': 1.038587212562561} -08/30/2021 21:38:21 - INFO - __main__ - Step 46345: {'lr': 0.0003971866309927579, 'samples': 8898240, 'steps': 46344, 'loss/train': 1.5718634128570557} -08/30/2021 21:38:21 - INFO - __main__ - Step 46346: {'lr': 0.0003971823414241263, 'samples': 8898432, 'steps': 46345, 'loss/train': 1.2847014665603638} -08/30/2021 21:38:22 - INFO - __main__ - Step 46347: {'lr': 0.00039717805178917666, 'samples': 8898624, 'steps': 46346, 'loss/train': 1.255956768989563} -08/30/2021 21:38:23 - INFO - __main__ - Step 46348: {'lr': 0.0003971737620879109, 'samples': 8898816, 'steps': 46347, 'loss/train': 2.589430809020996} -08/30/2021 21:38:24 - INFO - __main__ - Step 46349: {'lr': 0.00039716947232033086, 'samples': 8899008, 'steps': 46348, 'loss/train': 1.7308956384658813} -08/30/2021 21:38:24 - INFO - __main__ - Step 46350: {'lr': 0.0003971651824864385, 'samples': 8899200, 'steps': 46349, 'loss/train': 2.113405466079712} -08/30/2021 21:38:24 - INFO - __main__ - Step 46351: {'lr': 0.0003971608925862358, 'samples': 8899392, 'steps': 46350, 'loss/train': 1.2174782752990723} -08/30/2021 21:38:25 - INFO - __main__ - Step 46352: {'lr': 0.0003971566026197247, 'samples': 8899584, 'steps': 46351, 'loss/train': 1.4920482635498047} -08/30/2021 21:38:25 - INFO - __main__ - Step 46353: {'lr': 0.0003971523125869071, 'samples': 8899776, 'steps': 46352, 'loss/train': 1.7018327713012695} -08/30/2021 21:38:26 - INFO - __main__ - Step 46354: {'lr': 0.0003971480224877849, 'samples': 8899968, 'steps': 46353, 'loss/train': 1.3080763816833496} -08/30/2021 21:38:27 - INFO - __main__ - Step 46355: {'lr': 0.0003971437323223601, 'samples': 8900160, 'steps': 46354, 'loss/train': 1.4450814723968506} -08/30/2021 21:38:27 - INFO - __main__ - Step 46356: {'lr': 0.0003971394420906346, 'samples': 8900352, 'steps': 46355, 'loss/train': 0.7579420208930969} -08/30/2021 21:38:28 - INFO - __main__ - Step 46357: {'lr': 0.0003971351517926103, 'samples': 8900544, 'steps': 46356, 'loss/train': 1.5609254837036133} -08/30/2021 21:38:28 - INFO - __main__ - Step 46358: {'lr': 0.00039713086142828926, 'samples': 8900736, 'steps': 46357, 'loss/train': 1.2565550804138184} -08/30/2021 21:38:30 - INFO - __main__ - Step 46359: {'lr': 0.0003971265709976732, 'samples': 8900928, 'steps': 46358, 'loss/train': 1.2098388671875} -08/30/2021 21:38:30 - INFO - __main__ - Step 46360: {'lr': 0.0003971222805007643, 'samples': 8901120, 'steps': 46359, 'loss/train': 0.48269620537757874} -08/30/2021 21:38:30 - INFO - __main__ - Step 46361: {'lr': 0.0003971179899375643, 'samples': 8901312, 'steps': 46360, 'loss/train': 1.6152585744857788} -08/30/2021 21:38:31 - INFO - __main__ - Step 46362: {'lr': 0.0003971136993080753, 'samples': 8901504, 'steps': 46361, 'loss/train': 1.2865593433380127} -08/30/2021 21:38:31 - INFO - __main__ - Step 46363: {'lr': 0.000397109408612299, 'samples': 8901696, 'steps': 46362, 'loss/train': 1.8012503385543823} -08/30/2021 21:38:33 - INFO - __main__ - Step 46364: {'lr': 0.0003971051178502375, 'samples': 8901888, 'steps': 46363, 'loss/train': 1.3171979188919067} -08/30/2021 21:38:33 - INFO - __main__ - Step 46365: {'lr': 0.00039710082702189276, 'samples': 8902080, 'steps': 46364, 'loss/train': 1.145189642906189} -08/30/2021 21:38:34 - INFO - __main__ - Step 46366: {'lr': 0.0003970965361272667, 'samples': 8902272, 'steps': 46365, 'loss/train': 1.235060453414917} -08/30/2021 21:38:34 - INFO - __main__ - Step 46367: {'lr': 0.0003970922451663611, 'samples': 8902464, 'steps': 46366, 'loss/train': 1.468003511428833} -08/30/2021 21:38:34 - INFO - __main__ - Step 46368: {'lr': 0.0003970879541391781, 'samples': 8902656, 'steps': 46367, 'loss/train': 0.9957088232040405} -08/30/2021 21:38:35 - INFO - __main__ - Step 46369: {'lr': 0.0003970836630457194, 'samples': 8902848, 'steps': 46368, 'loss/train': 1.3989332914352417} -08/30/2021 21:38:36 - INFO - __main__ - Step 46370: {'lr': 0.00039707937188598717, 'samples': 8903040, 'steps': 46369, 'loss/train': 1.7219014167785645} -08/30/2021 21:38:37 - INFO - __main__ - Step 46371: {'lr': 0.00039707508065998324, 'samples': 8903232, 'steps': 46370, 'loss/train': 0.7707935571670532} -08/30/2021 21:38:37 - INFO - __main__ - Step 46372: {'lr': 0.0003970707893677095, 'samples': 8903424, 'steps': 46371, 'loss/train': 1.5996007919311523} -08/30/2021 21:38:37 - INFO - __main__ - Step 46373: {'lr': 0.00039706649800916804, 'samples': 8903616, 'steps': 46372, 'loss/train': 1.0786998271942139} -08/30/2021 21:38:38 - INFO - __main__ - Step 46374: {'lr': 0.0003970622065843607, 'samples': 8903808, 'steps': 46373, 'loss/train': 1.22597336769104} -08/30/2021 21:38:40 - INFO - __main__ - Step 46375: {'lr': 0.00039705791509328926, 'samples': 8904000, 'steps': 46374, 'loss/train': 1.8490779399871826} -08/30/2021 21:38:40 - INFO - __main__ - Step 46376: {'lr': 0.0003970536235359558, 'samples': 8904192, 'steps': 46375, 'loss/train': 0.08509698510169983} -08/30/2021 21:38:41 - INFO - __main__ - Step 46377: {'lr': 0.00039704933191236225, 'samples': 8904384, 'steps': 46376, 'loss/train': 1.120384693145752} -08/30/2021 21:38:41 - INFO - __main__ - Step 46378: {'lr': 0.00039704504022251066, 'samples': 8904576, 'steps': 46377, 'loss/train': 1.7474642992019653} -08/30/2021 21:38:41 - INFO - __main__ - Step 46379: {'lr': 0.00039704074846640277, 'samples': 8904768, 'steps': 46378, 'loss/train': 0.44692519307136536} -08/30/2021 21:38:43 - INFO - __main__ - Step 46380: {'lr': 0.0003970364566440406, 'samples': 8904960, 'steps': 46379, 'loss/train': 1.6594629287719727} -08/30/2021 21:38:43 - INFO - __main__ - Step 46381: {'lr': 0.000397032164755426, 'samples': 8905152, 'steps': 46380, 'loss/train': 1.3192886114120483} -08/30/2021 21:38:44 - INFO - __main__ - Step 46382: {'lr': 0.0003970278728005611, 'samples': 8905344, 'steps': 46381, 'loss/train': 1.883972406387329} -08/30/2021 21:38:44 - INFO - __main__ - Step 46383: {'lr': 0.0003970235807794476, 'samples': 8905536, 'steps': 46382, 'loss/train': 1.01622474193573} -08/30/2021 21:38:44 - INFO - __main__ - Step 46384: {'lr': 0.00039701928869208757, 'samples': 8905728, 'steps': 46383, 'loss/train': 1.8688762187957764} -08/30/2021 21:38:46 - INFO - __main__ - Step 46385: {'lr': 0.0003970149965384829, 'samples': 8905920, 'steps': 46384, 'loss/train': 1.564450740814209} -08/30/2021 21:38:46 - INFO - __main__ - Step 46386: {'lr': 0.00039701070431863564, 'samples': 8906112, 'steps': 46385, 'loss/train': 0.7310260534286499} -08/30/2021 21:38:47 - INFO - __main__ - Step 46387: {'lr': 0.00039700641203254755, 'samples': 8906304, 'steps': 46386, 'loss/train': 1.1244299411773682} -08/30/2021 21:38:47 - INFO - __main__ - Step 46388: {'lr': 0.0003970021196802206, 'samples': 8906496, 'steps': 46387, 'loss/train': 0.5553213357925415} -08/30/2021 21:38:47 - INFO - __main__ - Step 46389: {'lr': 0.0003969978272616569, 'samples': 8906688, 'steps': 46388, 'loss/train': 1.1225703954696655} -08/30/2021 21:38:49 - INFO - __main__ - Step 46390: {'lr': 0.0003969935347768581, 'samples': 8906880, 'steps': 46389, 'loss/train': 1.4424350261688232} -08/30/2021 21:38:50 - INFO - __main__ - Step 46391: {'lr': 0.00039698924222582636, 'samples': 8907072, 'steps': 46390, 'loss/train': 1.399309515953064} -08/30/2021 21:38:50 - INFO - __main__ - Step 46392: {'lr': 0.00039698494960856346, 'samples': 8907264, 'steps': 46391, 'loss/train': 1.6217565536499023} -08/30/2021 21:38:50 - INFO - __main__ - Step 46393: {'lr': 0.0003969806569250716, 'samples': 8907456, 'steps': 46392, 'loss/train': 1.702538251876831} -08/30/2021 21:38:51 - INFO - __main__ - Step 46394: {'lr': 0.0003969763641753523, 'samples': 8907648, 'steps': 46393, 'loss/train': 1.9131591320037842} -08/30/2021 21:38:51 - INFO - __main__ - Step 46395: {'lr': 0.00039697207135940785, 'samples': 8907840, 'steps': 46394, 'loss/train': 1.413002848625183} -08/30/2021 21:38:53 - INFO - __main__ - Step 46396: {'lr': 0.00039696777847724, 'samples': 8908032, 'steps': 46395, 'loss/train': 1.2963913679122925} -08/30/2021 21:38:54 - INFO - __main__ - Step 46397: {'lr': 0.00039696348552885075, 'samples': 8908224, 'steps': 46396, 'loss/train': 1.4687113761901855} -08/30/2021 21:38:54 - INFO - __main__ - Step 46398: {'lr': 0.000396959192514242, 'samples': 8908416, 'steps': 46397, 'loss/train': 0.5586197972297668} -08/30/2021 21:38:54 - INFO - __main__ - Step 46399: {'lr': 0.0003969548994334158, 'samples': 8908608, 'steps': 46398, 'loss/train': 1.152075171470642} -08/30/2021 21:38:55 - INFO - __main__ - Step 46400: {'lr': 0.0003969506062863739, 'samples': 8908800, 'steps': 46399, 'loss/train': 1.3723593950271606} -08/30/2021 21:38:56 - INFO - __main__ - Step 46401: {'lr': 0.0003969463130731183, 'samples': 8908992, 'steps': 46400, 'loss/train': 1.1905274391174316} -08/30/2021 21:38:57 - INFO - __main__ - Step 46402: {'lr': 0.00039694201979365094, 'samples': 8909184, 'steps': 46401, 'loss/train': 1.1204434633255005} -08/30/2021 21:38:57 - INFO - __main__ - Step 46403: {'lr': 0.00039693772644797386, 'samples': 8909376, 'steps': 46402, 'loss/train': 1.4405134916305542} -08/30/2021 21:38:57 - INFO - __main__ - Step 46404: {'lr': 0.0003969334330360889, 'samples': 8909568, 'steps': 46403, 'loss/train': 0.5971283316612244} -08/30/2021 21:38:58 - INFO - __main__ - Step 46405: {'lr': 0.000396929139557998, 'samples': 8909760, 'steps': 46404, 'loss/train': 1.2352240085601807} -08/30/2021 21:38:59 - INFO - __main__ - Step 46406: {'lr': 0.00039692484601370305, 'samples': 8909952, 'steps': 46405, 'loss/train': 0.257072776556015} -08/30/2021 21:39:00 - INFO - __main__ - Step 46407: {'lr': 0.0003969205524032061, 'samples': 8910144, 'steps': 46406, 'loss/train': 1.5808016061782837} -08/30/2021 21:39:00 - INFO - __main__ - Step 46408: {'lr': 0.00039691625872650895, 'samples': 8910336, 'steps': 46407, 'loss/train': 0.11251096427440643} -08/30/2021 21:39:01 - INFO - __main__ - Step 46409: {'lr': 0.00039691196498361364, 'samples': 8910528, 'steps': 46408, 'loss/train': 1.4163175821304321} -08/30/2021 21:39:01 - INFO - __main__ - Step 46410: {'lr': 0.0003969076711745221, 'samples': 8910720, 'steps': 46409, 'loss/train': 1.0320390462875366} -08/30/2021 21:39:02 - INFO - __main__ - Step 46411: {'lr': 0.00039690337729923617, 'samples': 8910912, 'steps': 46410, 'loss/train': 1.420272707939148} -08/30/2021 21:39:03 - INFO - __main__ - Step 46412: {'lr': 0.0003968990833577578, 'samples': 8911104, 'steps': 46411, 'loss/train': 1.061478853225708} -08/30/2021 21:39:03 - INFO - __main__ - Step 46413: {'lr': 0.00039689478935008905, 'samples': 8911296, 'steps': 46412, 'loss/train': 1.1672465801239014} -08/30/2021 21:39:04 - INFO - __main__ - Step 46414: {'lr': 0.00039689049527623176, 'samples': 8911488, 'steps': 46413, 'loss/train': 1.199647068977356} -08/30/2021 21:39:04 - INFO - __main__ - Step 46415: {'lr': 0.0003968862011361879, 'samples': 8911680, 'steps': 46414, 'loss/train': 4.687029838562012} -08/30/2021 21:39:04 - INFO - __main__ - Step 46416: {'lr': 0.0003968819069299593, 'samples': 8911872, 'steps': 46415, 'loss/train': 1.5679432153701782} -08/30/2021 21:39:06 - INFO - __main__ - Step 46417: {'lr': 0.0003968776126575481, 'samples': 8912064, 'steps': 46416, 'loss/train': 1.315466284751892} -08/30/2021 21:39:06 - INFO - __main__ - Step 46418: {'lr': 0.000396873318318956, 'samples': 8912256, 'steps': 46417, 'loss/train': 1.759112000465393} -08/30/2021 21:39:07 - INFO - __main__ - Step 46419: {'lr': 0.00039686902391418514, 'samples': 8912448, 'steps': 46418, 'loss/train': 1.6858388185501099} -08/30/2021 21:39:07 - INFO - __main__ - Step 46420: {'lr': 0.00039686472944323734, 'samples': 8912640, 'steps': 46419, 'loss/train': 1.2738598585128784} -08/30/2021 21:39:07 - INFO - __main__ - Step 46421: {'lr': 0.0003968604349061145, 'samples': 8912832, 'steps': 46420, 'loss/train': 1.1749749183654785} -08/30/2021 21:39:09 - INFO - __main__ - Step 46422: {'lr': 0.0003968561403028187, 'samples': 8913024, 'steps': 46421, 'loss/train': 0.9057864546775818} -08/30/2021 21:39:09 - INFO - __main__ - Step 46423: {'lr': 0.00039685184563335174, 'samples': 8913216, 'steps': 46422, 'loss/train': 0.8991967439651489} -08/30/2021 21:39:10 - INFO - __main__ - Step 46424: {'lr': 0.00039684755089771555, 'samples': 8913408, 'steps': 46423, 'loss/train': 1.1481351852416992} -08/30/2021 21:39:10 - INFO - __main__ - Step 46425: {'lr': 0.0003968432560959122, 'samples': 8913600, 'steps': 46424, 'loss/train': 1.4056631326675415} -08/30/2021 21:39:10 - INFO - __main__ - Step 46426: {'lr': 0.00039683896122794354, 'samples': 8913792, 'steps': 46425, 'loss/train': 0.5119500160217285} -08/30/2021 21:39:12 - INFO - __main__ - Step 46427: {'lr': 0.0003968346662938115, 'samples': 8913984, 'steps': 46426, 'loss/train': 1.2142152786254883} -08/30/2021 21:39:12 - INFO - __main__ - Step 46428: {'lr': 0.00039683037129351805, 'samples': 8914176, 'steps': 46427, 'loss/train': 1.055873155593872} -08/30/2021 21:39:13 - INFO - __main__ - Step 46429: {'lr': 0.000396826076227065, 'samples': 8914368, 'steps': 46428, 'loss/train': 2.5989089012145996} -08/30/2021 21:39:13 - INFO - __main__ - Step 46430: {'lr': 0.00039682178109445447, 'samples': 8914560, 'steps': 46429, 'loss/train': 1.3609981536865234} -08/30/2021 21:39:14 - INFO - __main__ - Step 46431: {'lr': 0.0003968174858956883, 'samples': 8914752, 'steps': 46430, 'loss/train': 1.3880488872528076} -08/30/2021 21:39:14 - INFO - __main__ - Step 46432: {'lr': 0.0003968131906307684, 'samples': 8914944, 'steps': 46431, 'loss/train': 2.0379881858825684} -08/30/2021 21:39:15 - INFO - __main__ - Step 46433: {'lr': 0.00039680889529969686, 'samples': 8915136, 'steps': 46432, 'loss/train': 1.4394398927688599} -08/30/2021 21:39:16 - INFO - __main__ - Step 46434: {'lr': 0.0003968045999024754, 'samples': 8915328, 'steps': 46433, 'loss/train': 1.478371500968933} -08/30/2021 21:39:16 - INFO - __main__ - Step 46435: {'lr': 0.0003968003044391061, 'samples': 8915520, 'steps': 46434, 'loss/train': 1.430979609489441} -08/30/2021 21:39:17 - INFO - __main__ - Step 46436: {'lr': 0.00039679600890959077, 'samples': 8915712, 'steps': 46435, 'loss/train': 1.47868013381958} -08/30/2021 21:39:17 - INFO - __main__ - Step 46437: {'lr': 0.0003967917133139315, 'samples': 8915904, 'steps': 46436, 'loss/train': 0.9623647928237915} -08/30/2021 21:39:18 - INFO - __main__ - Step 46438: {'lr': 0.00039678741765213006, 'samples': 8916096, 'steps': 46437, 'loss/train': 1.2012237310409546} -08/30/2021 21:39:19 - INFO - __main__ - Step 46439: {'lr': 0.0003967831219241885, 'samples': 8916288, 'steps': 46438, 'loss/train': 1.716123342514038} -08/30/2021 21:39:19 - INFO - __main__ - Step 46440: {'lr': 0.00039677882613010885, 'samples': 8916480, 'steps': 46439, 'loss/train': 1.2938593626022339} -08/30/2021 21:39:20 - INFO - __main__ - Step 46441: {'lr': 0.0003967745302698928, 'samples': 8916672, 'steps': 46440, 'loss/train': 1.6129469871520996} -08/30/2021 21:39:20 - INFO - __main__ - Step 46442: {'lr': 0.0003967702343435424, 'samples': 8916864, 'steps': 46441, 'loss/train': 1.0996365547180176} -08/30/2021 21:39:21 - INFO - __main__ - Step 46443: {'lr': 0.00039676593835105966, 'samples': 8917056, 'steps': 46442, 'loss/train': 1.3036185503005981} -08/30/2021 21:39:22 - INFO - __main__ - Step 46444: {'lr': 0.0003967616422924465, 'samples': 8917248, 'steps': 46443, 'loss/train': 0.3570886254310608} -08/30/2021 21:39:22 - INFO - __main__ - Step 46445: {'lr': 0.0003967573461677047, 'samples': 8917440, 'steps': 46444, 'loss/train': 1.205920934677124} -08/30/2021 21:39:23 - INFO - __main__ - Step 46446: {'lr': 0.0003967530499768364, 'samples': 8917632, 'steps': 46445, 'loss/train': 1.3876349925994873} -08/30/2021 21:39:23 - INFO - __main__ - Step 46447: {'lr': 0.00039674875371984336, 'samples': 8917824, 'steps': 46446, 'loss/train': 1.094080924987793} -08/30/2021 21:39:25 - INFO - __main__ - Step 46448: {'lr': 0.0003967444573967277, 'samples': 8918016, 'steps': 46447, 'loss/train': 1.777151107788086} -08/30/2021 21:39:26 - INFO - __main__ - Step 46449: {'lr': 0.0003967401610074911, 'samples': 8918208, 'steps': 46448, 'loss/train': 1.5550758838653564} -08/30/2021 21:39:26 - INFO - __main__ - Step 46450: {'lr': 0.0003967358645521357, 'samples': 8918400, 'steps': 46449, 'loss/train': 1.61412513256073} -08/30/2021 21:39:26 - INFO - __main__ - Step 46451: {'lr': 0.00039673156803066346, 'samples': 8918592, 'steps': 46450, 'loss/train': 1.265376329421997} -08/30/2021 21:39:27 - INFO - __main__ - Step 46452: {'lr': 0.00039672727144307617, 'samples': 8918784, 'steps': 46451, 'loss/train': 1.3651338815689087} -08/30/2021 21:39:29 - INFO - __main__ - Step 46453: {'lr': 0.0003967229747893759, 'samples': 8918976, 'steps': 46452, 'loss/train': 1.778683066368103} -08/30/2021 21:39:29 - INFO - __main__ - Step 46454: {'lr': 0.0003967186780695645, 'samples': 8919168, 'steps': 46453, 'loss/train': 0.8877943754196167} -08/30/2021 21:39:29 - INFO - __main__ - Step 46455: {'lr': 0.0003967143812836439, 'samples': 8919360, 'steps': 46454, 'loss/train': 1.4448751211166382} -08/30/2021 21:39:30 - INFO - __main__ - Step 46456: {'lr': 0.00039671008443161604, 'samples': 8919552, 'steps': 46455, 'loss/train': 1.5197033882141113} -08/30/2021 21:39:30 - INFO - __main__ - Step 46457: {'lr': 0.00039670578751348283, 'samples': 8919744, 'steps': 46456, 'loss/train': 1.4699782133102417} -08/30/2021 21:39:31 - INFO - __main__ - Step 46458: {'lr': 0.0003967014905292464, 'samples': 8919936, 'steps': 46457, 'loss/train': 1.248752474784851} -08/30/2021 21:39:32 - INFO - __main__ - Step 46459: {'lr': 0.0003966971934789084, 'samples': 8920128, 'steps': 46458, 'loss/train': 1.0813713073730469} -08/30/2021 21:39:33 - INFO - __main__ - Step 46460: {'lr': 0.0003966928963624711, 'samples': 8920320, 'steps': 46459, 'loss/train': 0.6591024994850159} -08/30/2021 21:39:33 - INFO - __main__ - Step 46461: {'lr': 0.0003966885991799361, 'samples': 8920512, 'steps': 46460, 'loss/train': 0.09682805836200714} -08/30/2021 21:39:34 - INFO - __main__ - Step 46462: {'lr': 0.0003966843019313055, 'samples': 8920704, 'steps': 46461, 'loss/train': 1.508422613143921} -08/30/2021 21:39:34 - INFO - __main__ - Step 46463: {'lr': 0.00039668000461658126, 'samples': 8920896, 'steps': 46462, 'loss/train': 1.7693690061569214} -08/30/2021 21:39:34 - INFO - __main__ - Step 46464: {'lr': 0.00039667570723576516, 'samples': 8921088, 'steps': 46463, 'loss/train': 1.7197455167770386} -08/30/2021 21:39:36 - INFO - __main__ - Step 46465: {'lr': 0.0003966714097888594, 'samples': 8921280, 'steps': 46464, 'loss/train': 1.1874061822891235} -08/30/2021 21:39:37 - INFO - __main__ - Step 46466: {'lr': 0.0003966671122758657, 'samples': 8921472, 'steps': 46465, 'loss/train': 1.247516393661499} -08/30/2021 21:39:37 - INFO - __main__ - Step 46467: {'lr': 0.00039666281469678604, 'samples': 8921664, 'steps': 46466, 'loss/train': 0.1041969582438469} -08/30/2021 21:39:37 - INFO - __main__ - Step 46468: {'lr': 0.0003966585170516224, 'samples': 8921856, 'steps': 46467, 'loss/train': 1.6621135473251343} -08/30/2021 21:39:38 - INFO - __main__ - Step 46469: {'lr': 0.0003966542193403767, 'samples': 8922048, 'steps': 46468, 'loss/train': 1.3643832206726074} -08/30/2021 21:39:39 - INFO - __main__ - Step 46470: {'lr': 0.00039664992156305086, 'samples': 8922240, 'steps': 46469, 'loss/train': 1.1635733842849731} -08/30/2021 21:39:40 - INFO - __main__ - Step 46471: {'lr': 0.00039664562371964683, 'samples': 8922432, 'steps': 46470, 'loss/train': 1.905537486076355} -08/30/2021 21:39:40 - INFO - __main__ - Step 46472: {'lr': 0.00039664132581016654, 'samples': 8922624, 'steps': 46471, 'loss/train': 1.318577766418457} -08/30/2021 21:39:40 - INFO - __main__ - Step 46473: {'lr': 0.000396637027834612, 'samples': 8922816, 'steps': 46472, 'loss/train': 1.265029788017273} -08/30/2021 21:39:41 - INFO - __main__ - Step 46474: {'lr': 0.000396632729792985, 'samples': 8923008, 'steps': 46473, 'loss/train': 1.259962558746338} -08/30/2021 21:39:42 - INFO - __main__ - Step 46475: {'lr': 0.00039662843168528756, 'samples': 8923200, 'steps': 46474, 'loss/train': 0.720410168170929} -08/30/2021 21:39:43 - INFO - __main__ - Step 46476: {'lr': 0.0003966241335115216, 'samples': 8923392, 'steps': 46475, 'loss/train': 0.5920434594154358} -08/30/2021 21:39:43 - INFO - __main__ - Step 46477: {'lr': 0.0003966198352716891, 'samples': 8923584, 'steps': 46476, 'loss/train': 1.7952494621276855} -08/30/2021 21:39:43 - INFO - __main__ - Step 46478: {'lr': 0.000396615536965792, 'samples': 8923776, 'steps': 46477, 'loss/train': 1.2083547115325928} -08/30/2021 21:39:44 - INFO - __main__ - Step 46479: {'lr': 0.00039661123859383214, 'samples': 8923968, 'steps': 46478, 'loss/train': 1.3400609493255615} -08/30/2021 21:39:45 - INFO - __main__ - Step 46480: {'lr': 0.0003966069401558116, 'samples': 8924160, 'steps': 46479, 'loss/train': 1.2760469913482666} -08/30/2021 21:39:46 - INFO - __main__ - Step 46481: {'lr': 0.0003966026416517321, 'samples': 8924352, 'steps': 46480, 'loss/train': 1.30097496509552} -08/30/2021 21:39:46 - INFO - __main__ - Step 46482: {'lr': 0.0003965983430815958, 'samples': 8924544, 'steps': 46481, 'loss/train': 0.6618870496749878} -08/30/2021 21:39:46 - INFO - __main__ - Step 46483: {'lr': 0.00039659404444540456, 'samples': 8924736, 'steps': 46482, 'loss/train': 0.9682953953742981} -08/30/2021 21:39:47 - INFO - __main__ - Step 46484: {'lr': 0.0003965897457431602, 'samples': 8924928, 'steps': 46483, 'loss/train': 1.440982460975647} -08/30/2021 21:39:48 - INFO - __main__ - Step 46485: {'lr': 0.00039658544697486486, 'samples': 8925120, 'steps': 46484, 'loss/train': 0.9061474800109863} -08/30/2021 21:39:49 - INFO - __main__ - Step 46486: {'lr': 0.0003965811481405204, 'samples': 8925312, 'steps': 46485, 'loss/train': 1.4429975748062134} -08/30/2021 21:39:49 - INFO - __main__ - Step 46487: {'lr': 0.00039657684924012873, 'samples': 8925504, 'steps': 46486, 'loss/train': 1.25197434425354} -08/30/2021 21:39:49 - INFO - __main__ - Step 46488: {'lr': 0.0003965725502736917, 'samples': 8925696, 'steps': 46487, 'loss/train': 2.442518472671509} -08/30/2021 21:39:50 - INFO - __main__ - Step 46489: {'lr': 0.0003965682512412114, 'samples': 8925888, 'steps': 46488, 'loss/train': 1.2521421909332275} -08/30/2021 21:39:52 - INFO - __main__ - Step 46490: {'lr': 0.0003965639521426897, 'samples': 8926080, 'steps': 46489, 'loss/train': 1.011144995689392} -08/30/2021 21:39:52 - INFO - __main__ - Step 46491: {'lr': 0.0003965596529781286, 'samples': 8926272, 'steps': 46490, 'loss/train': 1.5611035823822021} -08/30/2021 21:39:52 - INFO - __main__ - Step 46492: {'lr': 0.0003965553537475299, 'samples': 8926464, 'steps': 46491, 'loss/train': 0.7885032892227173} -08/30/2021 21:39:53 - INFO - __main__ - Step 46493: {'lr': 0.0003965510544508957, 'samples': 8926656, 'steps': 46492, 'loss/train': 2.105489492416382} -08/30/2021 21:39:53 - INFO - __main__ - Step 46494: {'lr': 0.0003965467550882278, 'samples': 8926848, 'steps': 46493, 'loss/train': 0.4497945308685303} -08/30/2021 21:39:53 - INFO - __main__ - Step 46495: {'lr': 0.0003965424556595282, 'samples': 8927040, 'steps': 46494, 'loss/train': 0.15612703561782837} -08/30/2021 21:39:55 - INFO - __main__ - Step 46496: {'lr': 0.0003965381561647988, 'samples': 8927232, 'steps': 46495, 'loss/train': 0.16381971538066864} -08/30/2021 21:39:56 - INFO - __main__ - Step 46497: {'lr': 0.0003965338566040416, 'samples': 8927424, 'steps': 46496, 'loss/train': 2.6674323081970215} -08/30/2021 21:39:56 - INFO - __main__ - Step 46498: {'lr': 0.0003965295569772585, 'samples': 8927616, 'steps': 46497, 'loss/train': 1.3930017948150635} -08/30/2021 21:39:56 - INFO - __main__ - Step 46499: {'lr': 0.00039652525728445145, 'samples': 8927808, 'steps': 46498, 'loss/train': 1.14142906665802} -08/30/2021 21:39:57 - INFO - __main__ - Step 46500: {'lr': 0.00039652095752562246, 'samples': 8928000, 'steps': 46499, 'loss/train': 1.0763142108917236} -08/30/2021 21:39:57 - INFO - __main__ - Step 46501: {'lr': 0.00039651665770077326, 'samples': 8928192, 'steps': 46500, 'loss/train': 1.2496905326843262} -08/30/2021 21:39:59 - INFO - __main__ - Step 46502: {'lr': 0.00039651235780990596, 'samples': 8928384, 'steps': 46501, 'loss/train': 1.7091392278671265} -08/30/2021 21:40:00 - INFO - __main__ - Step 46503: {'lr': 0.00039650805785302245, 'samples': 8928576, 'steps': 46502, 'loss/train': 1.410305142402649} -08/30/2021 21:40:00 - INFO - __main__ - Step 46504: {'lr': 0.0003965037578301247, 'samples': 8928768, 'steps': 46503, 'loss/train': 2.1920878887176514} -08/30/2021 21:40:01 - INFO - __main__ - Step 46505: {'lr': 0.00039649945774121453, 'samples': 8928960, 'steps': 46504, 'loss/train': 0.07647178322076797} -08/30/2021 21:40:01 - INFO - __main__ - Step 46506: {'lr': 0.0003964951575862941, 'samples': 8929152, 'steps': 46505, 'loss/train': 2.2515416145324707} -08/30/2021 21:40:03 - INFO - __main__ - Step 46507: {'lr': 0.00039649085736536517, 'samples': 8929344, 'steps': 46506, 'loss/train': 1.6036421060562134} -08/30/2021 21:40:03 - INFO - __main__ - Step 46508: {'lr': 0.0003964865570784296, 'samples': 8929536, 'steps': 46507, 'loss/train': 1.660893201828003} -08/30/2021 21:40:03 - INFO - __main__ - Step 46509: {'lr': 0.00039648225672548953, 'samples': 8929728, 'steps': 46508, 'loss/train': 1.238147497177124} -08/30/2021 21:40:04 - INFO - __main__ - Step 46510: {'lr': 0.00039647795630654687, 'samples': 8929920, 'steps': 46509, 'loss/train': 0.27527180314064026} -08/30/2021 21:40:04 - INFO - __main__ - Step 46511: {'lr': 0.00039647365582160345, 'samples': 8930112, 'steps': 46510, 'loss/train': 1.1017048358917236} -08/30/2021 21:40:06 - INFO - __main__ - Step 46512: {'lr': 0.00039646935527066124, 'samples': 8930304, 'steps': 46511, 'loss/train': 1.0389946699142456} -08/30/2021 21:40:06 - INFO - __main__ - Step 46513: {'lr': 0.00039646505465372223, 'samples': 8930496, 'steps': 46512, 'loss/train': 1.0745177268981934} -08/30/2021 21:40:06 - INFO - __main__ - Step 46514: {'lr': 0.0003964607539707884, 'samples': 8930688, 'steps': 46513, 'loss/train': 1.3683040142059326} -08/30/2021 21:40:07 - INFO - __main__ - Step 46515: {'lr': 0.0003964564532218615, 'samples': 8930880, 'steps': 46514, 'loss/train': 1.363304853439331} -08/30/2021 21:40:07 - INFO - __main__ - Step 46516: {'lr': 0.0003964521524069436, 'samples': 8931072, 'steps': 46515, 'loss/train': 1.4092862606048584} -08/30/2021 21:40:09 - INFO - __main__ - Step 46517: {'lr': 0.00039644785152603666, 'samples': 8931264, 'steps': 46516, 'loss/train': 2.0359411239624023} -08/30/2021 21:40:09 - INFO - __main__ - Step 46518: {'lr': 0.0003964435505791425, 'samples': 8931456, 'steps': 46517, 'loss/train': 1.0100133419036865} -08/30/2021 21:40:09 - INFO - __main__ - Step 46519: {'lr': 0.0003964392495662632, 'samples': 8931648, 'steps': 46518, 'loss/train': 2.2036702632904053} -08/30/2021 21:40:10 - INFO - __main__ - Step 46520: {'lr': 0.0003964349484874007, 'samples': 8931840, 'steps': 46519, 'loss/train': 1.5280835628509521} -08/30/2021 21:40:10 - INFO - __main__ - Step 46521: {'lr': 0.00039643064734255675, 'samples': 8932032, 'steps': 46520, 'loss/train': 1.4089839458465576} -08/30/2021 21:40:12 - INFO - __main__ - Step 46522: {'lr': 0.0003964263461317334, 'samples': 8932224, 'steps': 46521, 'loss/train': 1.513013243675232} -08/30/2021 21:40:12 - INFO - __main__ - Step 46523: {'lr': 0.0003964220448549327, 'samples': 8932416, 'steps': 46522, 'loss/train': 1.6826832294464111} -08/30/2021 21:40:12 - INFO - __main__ - Step 46524: {'lr': 0.0003964177435121565, 'samples': 8932608, 'steps': 46523, 'loss/train': 1.1576457023620605} -08/30/2021 21:40:13 - INFO - __main__ - Step 46525: {'lr': 0.00039641344210340665, 'samples': 8932800, 'steps': 46524, 'loss/train': 1.2321707010269165} -08/30/2021 21:40:13 - INFO - __main__ - Step 46526: {'lr': 0.00039640914062868515, 'samples': 8932992, 'steps': 46525, 'loss/train': 1.8718773126602173} -08/30/2021 21:40:15 - INFO - __main__ - Step 46527: {'lr': 0.000396404839087994, 'samples': 8933184, 'steps': 46526, 'loss/train': 1.7893112897872925} -08/30/2021 21:40:16 - INFO - __main__ - Step 46528: {'lr': 0.0003964005374813351, 'samples': 8933376, 'steps': 46527, 'loss/train': 1.5159106254577637} -08/30/2021 21:40:16 - INFO - __main__ - Step 46529: {'lr': 0.0003963962358087103, 'samples': 8933568, 'steps': 46528, 'loss/train': 1.5724738836288452} -08/30/2021 21:40:16 - INFO - __main__ - Step 46530: {'lr': 0.00039639193407012166, 'samples': 8933760, 'steps': 46529, 'loss/train': 1.3901058435440063} -08/30/2021 21:40:17 - INFO - __main__ - Step 46531: {'lr': 0.00039638763226557106, 'samples': 8933952, 'steps': 46530, 'loss/train': 0.6951644420623779} -08/30/2021 21:40:17 - INFO - __main__ - Step 46532: {'lr': 0.0003963833303950605, 'samples': 8934144, 'steps': 46531, 'loss/train': 1.2721052169799805} -08/30/2021 21:40:18 - INFO - __main__ - Step 46533: {'lr': 0.00039637902845859185, 'samples': 8934336, 'steps': 46532, 'loss/train': 0.113104909658432} -08/30/2021 21:40:19 - INFO - __main__ - Step 46534: {'lr': 0.00039637472645616704, 'samples': 8934528, 'steps': 46533, 'loss/train': 1.9434700012207031} -08/30/2021 21:40:19 - INFO - __main__ - Step 46535: {'lr': 0.00039637042438778804, 'samples': 8934720, 'steps': 46534, 'loss/train': 1.445247769355774} -08/30/2021 21:40:20 - INFO - __main__ - Step 46536: {'lr': 0.0003963661222534568, 'samples': 8934912, 'steps': 46535, 'loss/train': 1.4683629274368286} -08/30/2021 21:40:20 - INFO - __main__ - Step 46537: {'lr': 0.00039636182005317524, 'samples': 8935104, 'steps': 46536, 'loss/train': 0.9552136063575745} -08/30/2021 21:40:22 - INFO - __main__ - Step 46538: {'lr': 0.0003963575177869453, 'samples': 8935296, 'steps': 46537, 'loss/train': 1.3797650337219238} -08/30/2021 21:40:22 - INFO - __main__ - Step 46539: {'lr': 0.00039635321545476894, 'samples': 8935488, 'steps': 46538, 'loss/train': 1.5685139894485474} -08/30/2021 21:40:23 - INFO - __main__ - Step 46540: {'lr': 0.00039634891305664806, 'samples': 8935680, 'steps': 46539, 'loss/train': 0.4467147886753082} -08/30/2021 21:40:23 - INFO - __main__ - Step 46541: {'lr': 0.00039634461059258466, 'samples': 8935872, 'steps': 46540, 'loss/train': 1.5122681856155396} -08/30/2021 21:40:23 - INFO - __main__ - Step 46542: {'lr': 0.0003963403080625806, 'samples': 8936064, 'steps': 46541, 'loss/train': 1.4097596406936646} -08/30/2021 21:40:24 - INFO - __main__ - Step 46543: {'lr': 0.00039633600546663784, 'samples': 8936256, 'steps': 46542, 'loss/train': 0.620442807674408} -08/30/2021 21:40:25 - INFO - __main__ - Step 46544: {'lr': 0.00039633170280475833, 'samples': 8936448, 'steps': 46543, 'loss/train': 0.02913687936961651} -08/30/2021 21:40:26 - INFO - __main__ - Step 46545: {'lr': 0.000396327400076944, 'samples': 8936640, 'steps': 46544, 'loss/train': 1.2260843515396118} -08/30/2021 21:40:26 - INFO - __main__ - Step 46546: {'lr': 0.0003963230972831968, 'samples': 8936832, 'steps': 46545, 'loss/train': 1.0982706546783447} -08/30/2021 21:40:26 - INFO - __main__ - Step 46547: {'lr': 0.0003963187944235188, 'samples': 8937024, 'steps': 46546, 'loss/train': 1.8399192094802856} -08/30/2021 21:40:27 - INFO - __main__ - Step 46548: {'lr': 0.00039631449149791164, 'samples': 8937216, 'steps': 46547, 'loss/train': 1.7213678359985352} -08/30/2021 21:40:27 - INFO - __main__ - Step 46549: {'lr': 0.0003963101885063776, 'samples': 8937408, 'steps': 46548, 'loss/train': 0.965840220451355} -08/30/2021 21:40:29 - INFO - __main__ - Step 46550: {'lr': 0.00039630588544891835, 'samples': 8937600, 'steps': 46549, 'loss/train': 1.4790263175964355} -08/30/2021 21:40:29 - INFO - __main__ - Step 46551: {'lr': 0.0003963015823255359, 'samples': 8937792, 'steps': 46550, 'loss/train': 1.2357102632522583} -08/30/2021 21:40:30 - INFO - __main__ - Step 46552: {'lr': 0.00039629727913623213, 'samples': 8937984, 'steps': 46551, 'loss/train': 0.5301083922386169} -08/30/2021 21:40:30 - INFO - __main__ - Step 46553: {'lr': 0.0003962929758810092, 'samples': 8938176, 'steps': 46552, 'loss/train': 1.064673900604248} -08/30/2021 21:40:30 - INFO - __main__ - Step 46554: {'lr': 0.00039628867255986887, 'samples': 8938368, 'steps': 46553, 'loss/train': 1.47206449508667} -08/30/2021 21:40:32 - INFO - __main__ - Step 46555: {'lr': 0.0003962843691728132, 'samples': 8938560, 'steps': 46554, 'loss/train': 1.1223132610321045} -08/30/2021 21:40:32 - INFO - __main__ - Step 46556: {'lr': 0.000396280065719844, 'samples': 8938752, 'steps': 46555, 'loss/train': 1.6951189041137695} -08/30/2021 21:40:33 - INFO - __main__ - Step 46557: {'lr': 0.0003962757622009632, 'samples': 8938944, 'steps': 46556, 'loss/train': 1.1746906042099} -08/30/2021 21:40:33 - INFO - __main__ - Step 46558: {'lr': 0.0003962714586161729, 'samples': 8939136, 'steps': 46557, 'loss/train': 1.461194634437561} -08/30/2021 21:40:33 - INFO - __main__ - Step 46559: {'lr': 0.0003962671549654748, 'samples': 8939328, 'steps': 46558, 'loss/train': 1.3189209699630737} -08/30/2021 21:40:35 - INFO - __main__ - Step 46560: {'lr': 0.00039626285124887107, 'samples': 8939520, 'steps': 46559, 'loss/train': 1.350839376449585} -08/30/2021 21:40:36 - INFO - __main__ - Step 46561: {'lr': 0.00039625854746636356, 'samples': 8939712, 'steps': 46560, 'loss/train': 1.627736210823059} -08/30/2021 21:40:36 - INFO - __main__ - Step 46562: {'lr': 0.0003962542436179542, 'samples': 8939904, 'steps': 46561, 'loss/train': 1.5022746324539185} -08/30/2021 21:40:37 - INFO - __main__ - Step 46563: {'lr': 0.0003962499397036449, 'samples': 8940096, 'steps': 46562, 'loss/train': 1.1978126764297485} -08/30/2021 21:40:37 - INFO - __main__ - Step 46564: {'lr': 0.0003962456357234377, 'samples': 8940288, 'steps': 46563, 'loss/train': 1.5251049995422363} -08/30/2021 21:40:38 - INFO - __main__ - Step 46565: {'lr': 0.0003962413316773344, 'samples': 8940480, 'steps': 46564, 'loss/train': 0.9784834980964661} -08/30/2021 21:40:39 - INFO - __main__ - Step 46566: {'lr': 0.000396237027565337, 'samples': 8940672, 'steps': 46565, 'loss/train': 1.513731837272644} -08/30/2021 21:40:39 - INFO - __main__ - Step 46567: {'lr': 0.00039623272338744754, 'samples': 8940864, 'steps': 46566, 'loss/train': 1.0512104034423828} -08/30/2021 21:40:40 - INFO - __main__ - Step 46568: {'lr': 0.00039622841914366784, 'samples': 8941056, 'steps': 46567, 'loss/train': 1.1498605012893677} -08/30/2021 21:40:40 - INFO - __main__ - Step 46569: {'lr': 0.0003962241148339999, 'samples': 8941248, 'steps': 46568, 'loss/train': 1.5554029941558838} -08/30/2021 21:40:41 - INFO - __main__ - Step 46570: {'lr': 0.0003962198104584456, 'samples': 8941440, 'steps': 46569, 'loss/train': 1.2344026565551758} -08/30/2021 21:40:42 - INFO - __main__ - Step 46571: {'lr': 0.00039621550601700683, 'samples': 8941632, 'steps': 46570, 'loss/train': 1.5185738801956177} -08/30/2021 21:40:42 - INFO - __main__ - Step 46572: {'lr': 0.0003962112015096857, 'samples': 8941824, 'steps': 46571, 'loss/train': 0.6050847768783569} -08/30/2021 21:40:43 - INFO - __main__ - Step 46573: {'lr': 0.00039620689693648404, 'samples': 8942016, 'steps': 46572, 'loss/train': 1.4969356060028076} -08/30/2021 21:40:43 - INFO - __main__ - Step 46574: {'lr': 0.0003962025922974038, 'samples': 8942208, 'steps': 46573, 'loss/train': 1.7167227268218994} -08/30/2021 21:40:45 - INFO - __main__ - Step 46575: {'lr': 0.00039619828759244693, 'samples': 8942400, 'steps': 46574, 'loss/train': 1.585473895072937} -08/30/2021 21:40:45 - INFO - __main__ - Step 46576: {'lr': 0.00039619398282161536, 'samples': 8942592, 'steps': 46575, 'loss/train': 0.7961347103118896} -08/30/2021 21:40:45 - INFO - __main__ - Step 46577: {'lr': 0.000396189677984911, 'samples': 8942784, 'steps': 46576, 'loss/train': 1.3021938800811768} -08/30/2021 21:40:46 - INFO - __main__ - Step 46578: {'lr': 0.00039618537308233593, 'samples': 8942976, 'steps': 46577, 'loss/train': 1.3764525651931763} -08/30/2021 21:40:46 - INFO - __main__ - Step 46579: {'lr': 0.00039618106811389187, 'samples': 8943168, 'steps': 46578, 'loss/train': 1.0017321109771729} -08/30/2021 21:40:46 - INFO - __main__ - Step 46580: {'lr': 0.00039617676307958095, 'samples': 8943360, 'steps': 46579, 'loss/train': 1.287327527999878} -08/30/2021 21:40:48 - INFO - __main__ - Step 46581: {'lr': 0.000396172457979405, 'samples': 8943552, 'steps': 46580, 'loss/train': 0.498635470867157} -08/30/2021 21:40:48 - INFO - __main__ - Step 46582: {'lr': 0.0003961681528133661, 'samples': 8943744, 'steps': 46581, 'loss/train': 1.1807124614715576} -08/30/2021 21:40:49 - INFO - __main__ - Step 46583: {'lr': 0.00039616384758146594, 'samples': 8943936, 'steps': 46582, 'loss/train': 1.3059812784194946} -08/30/2021 21:40:49 - INFO - __main__ - Step 46584: {'lr': 0.0003961595422837067, 'samples': 8944128, 'steps': 46583, 'loss/train': 1.5214323997497559} -08/30/2021 21:40:50 - INFO - __main__ - Step 46585: {'lr': 0.0003961552369200902, 'samples': 8944320, 'steps': 46584, 'loss/train': 2.019771099090576} -08/30/2021 21:40:51 - INFO - __main__ - Step 46586: {'lr': 0.0003961509314906184, 'samples': 8944512, 'steps': 46585, 'loss/train': 1.2820249795913696} -08/30/2021 21:40:51 - INFO - __main__ - Step 46587: {'lr': 0.00039614662599529325, 'samples': 8944704, 'steps': 46586, 'loss/train': 1.367170810699463} -08/30/2021 21:40:52 - INFO - __main__ - Step 46588: {'lr': 0.0003961423204341167, 'samples': 8944896, 'steps': 46587, 'loss/train': 1.2543559074401855} -08/30/2021 21:40:52 - INFO - __main__ - Step 46589: {'lr': 0.00039613801480709065, 'samples': 8945088, 'steps': 46588, 'loss/train': 1.3060096502304077} -08/30/2021 21:40:52 - INFO - __main__ - Step 46590: {'lr': 0.00039613370911421706, 'samples': 8945280, 'steps': 46589, 'loss/train': 0.9692651629447937} -08/30/2021 21:40:54 - INFO - __main__ - Step 46591: {'lr': 0.00039612940335549793, 'samples': 8945472, 'steps': 46590, 'loss/train': 1.582956075668335} -08/30/2021 21:40:54 - INFO - __main__ - Step 46592: {'lr': 0.0003961250975309351, 'samples': 8945664, 'steps': 46591, 'loss/train': 1.4397635459899902} -08/30/2021 21:40:55 - INFO - __main__ - Step 46593: {'lr': 0.0003961207916405305, 'samples': 8945856, 'steps': 46592, 'loss/train': 1.5003052949905396} -08/30/2021 21:40:55 - INFO - __main__ - Step 46594: {'lr': 0.00039611648568428626, 'samples': 8946048, 'steps': 46593, 'loss/train': 1.9489387273788452} -08/30/2021 21:40:55 - INFO - __main__ - Step 46595: {'lr': 0.0003961121796622041, 'samples': 8946240, 'steps': 46594, 'loss/train': 0.9217385053634644} -08/30/2021 21:40:57 - INFO - __main__ - Step 46596: {'lr': 0.000396107873574286, 'samples': 8946432, 'steps': 46595, 'loss/train': 1.646704912185669} -08/30/2021 21:40:58 - INFO - __main__ - Step 46597: {'lr': 0.00039610356742053403, 'samples': 8946624, 'steps': 46596, 'loss/train': 1.2484387159347534} -08/30/2021 21:40:58 - INFO - __main__ - Step 46598: {'lr': 0.0003960992612009501, 'samples': 8946816, 'steps': 46597, 'loss/train': 1.335153341293335} -08/30/2021 21:40:58 - INFO - __main__ - Step 46599: {'lr': 0.0003960949549155359, 'samples': 8947008, 'steps': 46598, 'loss/train': 1.810439109802246} -08/30/2021 21:40:59 - INFO - __main__ - Step 46600: {'lr': 0.0003960906485642938, 'samples': 8947200, 'steps': 46599, 'loss/train': 1.3295032978057861} -08/30/2021 21:41:00 - INFO - __main__ - Step 46601: {'lr': 0.0003960863421472254, 'samples': 8947392, 'steps': 46600, 'loss/train': 1.6985481977462769} -08/30/2021 21:41:01 - INFO - __main__ - Step 46602: {'lr': 0.00039608203566433273, 'samples': 8947584, 'steps': 46601, 'loss/train': 0.1064622700214386} -08/30/2021 21:41:01 - INFO - __main__ - Step 46603: {'lr': 0.00039607772911561776, 'samples': 8947776, 'steps': 46602, 'loss/train': 1.2042964696884155} -08/30/2021 21:41:01 - INFO - __main__ - Step 46604: {'lr': 0.00039607342250108234, 'samples': 8947968, 'steps': 46603, 'loss/train': 4.798513412475586} -08/30/2021 21:41:02 - INFO - __main__ - Step 46605: {'lr': 0.0003960691158207287, 'samples': 8948160, 'steps': 46604, 'loss/train': 1.0515400171279907} -08/30/2021 21:41:03 - INFO - __main__ - Step 46606: {'lr': 0.0003960648090745584, 'samples': 8948352, 'steps': 46605, 'loss/train': 1.8739527463912964} -08/30/2021 21:41:04 - INFO - __main__ - Step 46607: {'lr': 0.00039606050226257354, 'samples': 8948544, 'steps': 46606, 'loss/train': 1.622254729270935} -08/30/2021 21:41:04 - INFO - __main__ - Step 46608: {'lr': 0.00039605619538477617, 'samples': 8948736, 'steps': 46607, 'loss/train': 1.3610005378723145} -08/30/2021 21:41:04 - INFO - __main__ - Step 46609: {'lr': 0.00039605188844116815, 'samples': 8948928, 'steps': 46608, 'loss/train': 1.7554134130477905} -08/30/2021 21:41:05 - INFO - __main__ - Step 46610: {'lr': 0.0003960475814317512, 'samples': 8949120, 'steps': 46609, 'loss/train': 1.739786148071289} -08/30/2021 21:41:07 - INFO - __main__ - Step 46611: {'lr': 0.0003960432743565277, 'samples': 8949312, 'steps': 46610, 'loss/train': 1.4992097616195679} -08/30/2021 21:41:07 - INFO - __main__ - Step 46612: {'lr': 0.00039603896721549924, 'samples': 8949504, 'steps': 46611, 'loss/train': 1.392314076423645} -08/30/2021 21:41:08 - INFO - __main__ - Step 46613: {'lr': 0.0003960346600086679, 'samples': 8949696, 'steps': 46612, 'loss/train': 0.6547484993934631} -08/30/2021 21:41:08 - INFO - __main__ - Step 46614: {'lr': 0.0003960303527360356, 'samples': 8949888, 'steps': 46613, 'loss/train': 0.21509812772274017} -08/30/2021 21:41:09 - INFO - __main__ - Step 46615: {'lr': 0.00039602604539760425, 'samples': 8950080, 'steps': 46614, 'loss/train': 1.5131797790527344} -08/30/2021 21:41:09 - INFO - __main__ - Step 46616: {'lr': 0.0003960217379933758, 'samples': 8950272, 'steps': 46615, 'loss/train': 0.821017324924469} -08/30/2021 21:41:10 - INFO - __main__ - Step 46617: {'lr': 0.00039601743052335224, 'samples': 8950464, 'steps': 46616, 'loss/train': 1.099391222000122} -08/30/2021 21:41:11 - INFO - __main__ - Step 46618: {'lr': 0.00039601312298753554, 'samples': 8950656, 'steps': 46617, 'loss/train': 1.1759282350540161} -08/30/2021 21:41:11 - INFO - __main__ - Step 46619: {'lr': 0.0003960088153859275, 'samples': 8950848, 'steps': 46618, 'loss/train': 1.1875337362289429} -08/30/2021 21:41:12 - INFO - __main__ - Step 46620: {'lr': 0.0003960045077185301, 'samples': 8951040, 'steps': 46619, 'loss/train': 1.3251686096191406} -08/30/2021 21:41:12 - INFO - __main__ - Step 46621: {'lr': 0.0003960001999853454, 'samples': 8951232, 'steps': 46620, 'loss/train': 1.4342947006225586} -08/30/2021 21:41:13 - INFO - __main__ - Step 46622: {'lr': 0.00039599589218637535, 'samples': 8951424, 'steps': 46621, 'loss/train': 2.8867359161376953} -08/30/2021 21:41:14 - INFO - __main__ - Step 46623: {'lr': 0.00039599158432162163, 'samples': 8951616, 'steps': 46622, 'loss/train': 1.3775701522827148} -08/30/2021 21:41:14 - INFO - __main__ - Step 46624: {'lr': 0.00039598727639108644, 'samples': 8951808, 'steps': 46623, 'loss/train': 1.4124351739883423} -08/30/2021 21:41:15 - INFO - __main__ - Step 46625: {'lr': 0.00039598296839477167, 'samples': 8952000, 'steps': 46624, 'loss/train': 1.266311526298523} -08/30/2021 21:41:15 - INFO - __main__ - Step 46626: {'lr': 0.00039597866033267917, 'samples': 8952192, 'steps': 46625, 'loss/train': 1.1594483852386475} -08/30/2021 21:41:16 - INFO - __main__ - Step 46627: {'lr': 0.00039597435220481094, 'samples': 8952384, 'steps': 46626, 'loss/train': 0.37517017126083374} -08/30/2021 21:41:17 - INFO - __main__ - Step 46628: {'lr': 0.0003959700440111689, 'samples': 8952576, 'steps': 46627, 'loss/train': 0.752773106098175} -08/30/2021 21:41:17 - INFO - __main__ - Step 46629: {'lr': 0.00039596573575175506, 'samples': 8952768, 'steps': 46628, 'loss/train': 1.2355459928512573} -08/30/2021 21:41:18 - INFO - __main__ - Step 46630: {'lr': 0.00039596142742657125, 'samples': 8952960, 'steps': 46629, 'loss/train': 0.8349224925041199} -08/30/2021 21:41:18 - INFO - __main__ - Step 46631: {'lr': 0.00039595711903561947, 'samples': 8953152, 'steps': 46630, 'loss/train': 1.322335958480835} -08/30/2021 21:41:18 - INFO - __main__ - Step 46632: {'lr': 0.0003959528105789018, 'samples': 8953344, 'steps': 46631, 'loss/train': 1.4486145973205566} -08/30/2021 21:41:20 - INFO - __main__ - Step 46633: {'lr': 0.00039594850205641985, 'samples': 8953536, 'steps': 46632, 'loss/train': 2.146667242050171} -08/30/2021 21:41:20 - INFO - __main__ - Step 46634: {'lr': 0.0003959441934681759, 'samples': 8953728, 'steps': 46633, 'loss/train': 0.9349782466888428} -08/30/2021 21:41:20 - INFO - __main__ - Step 46635: {'lr': 0.00039593988481417174, 'samples': 8953920, 'steps': 46634, 'loss/train': 1.77628493309021} -08/30/2021 21:41:21 - INFO - __main__ - Step 46636: {'lr': 0.0003959355760944093, 'samples': 8954112, 'steps': 46635, 'loss/train': 1.5776880979537964} -08/30/2021 21:41:21 - INFO - __main__ - Step 46637: {'lr': 0.0003959312673088905, 'samples': 8954304, 'steps': 46636, 'loss/train': 1.3206682205200195} -08/30/2021 21:41:23 - INFO - __main__ - Step 46638: {'lr': 0.0003959269584576173, 'samples': 8954496, 'steps': 46637, 'loss/train': 1.2387782335281372} -08/30/2021 21:41:23 - INFO - __main__ - Step 46639: {'lr': 0.00039592264954059177, 'samples': 8954688, 'steps': 46638, 'loss/train': 1.8264864683151245} -08/30/2021 21:41:24 - INFO - __main__ - Step 46640: {'lr': 0.00039591834055781566, 'samples': 8954880, 'steps': 46639, 'loss/train': 0.7616661787033081} -08/30/2021 21:41:24 - INFO - __main__ - Step 46641: {'lr': 0.0003959140315092911, 'samples': 8955072, 'steps': 46640, 'loss/train': 1.5174589157104492} -08/30/2021 21:41:25 - INFO - __main__ - Step 46642: {'lr': 0.00039590972239501984, 'samples': 8955264, 'steps': 46641, 'loss/train': 1.505954384803772} -08/30/2021 21:41:26 - INFO - __main__ - Step 46643: {'lr': 0.0003959054132150039, 'samples': 8955456, 'steps': 46642, 'loss/train': 1.04756498336792} -08/30/2021 21:41:26 - INFO - __main__ - Step 46644: {'lr': 0.00039590110396924526, 'samples': 8955648, 'steps': 46643, 'loss/train': 1.6038703918457031} -08/30/2021 21:41:27 - INFO - __main__ - Step 46645: {'lr': 0.0003958967946577459, 'samples': 8955840, 'steps': 46644, 'loss/train': 1.108014702796936} -08/30/2021 21:41:27 - INFO - __main__ - Step 46646: {'lr': 0.0003958924852805076, 'samples': 8956032, 'steps': 46645, 'loss/train': 1.7820674180984497} -08/30/2021 21:41:28 - INFO - __main__ - Step 46647: {'lr': 0.00039588817583753236, 'samples': 8956224, 'steps': 46646, 'loss/train': 1.1025137901306152} -08/30/2021 21:41:28 - INFO - __main__ - Step 46648: {'lr': 0.0003958838663288223, 'samples': 8956416, 'steps': 46647, 'loss/train': 1.5573009252548218} -08/30/2021 21:41:29 - INFO - __main__ - Step 46649: {'lr': 0.00039587955675437917, 'samples': 8956608, 'steps': 46648, 'loss/train': 1.522752285003662} -08/30/2021 21:41:30 - INFO - __main__ - Step 46650: {'lr': 0.00039587524711420487, 'samples': 8956800, 'steps': 46649, 'loss/train': 1.0329043865203857} -08/30/2021 21:41:30 - INFO - __main__ - Step 46651: {'lr': 0.00039587093740830147, 'samples': 8956992, 'steps': 46650, 'loss/train': 1.0183699131011963} -08/30/2021 21:41:30 - INFO - __main__ - Step 46652: {'lr': 0.0003958666276366709, 'samples': 8957184, 'steps': 46651, 'loss/train': 1.0930331945419312} -08/30/2021 21:41:31 - INFO - __main__ - Step 46653: {'lr': 0.00039586231779931516, 'samples': 8957376, 'steps': 46652, 'loss/train': 1.5064520835876465} -08/30/2021 21:41:32 - INFO - __main__ - Step 46654: {'lr': 0.000395858007896236, 'samples': 8957568, 'steps': 46653, 'loss/train': 1.2531154155731201} -08/30/2021 21:41:33 - INFO - __main__ - Step 46655: {'lr': 0.0003958536979274355, 'samples': 8957760, 'steps': 46654, 'loss/train': 1.304987907409668} -08/30/2021 21:41:33 - INFO - __main__ - Step 46656: {'lr': 0.00039584938789291563, 'samples': 8957952, 'steps': 46655, 'loss/train': 1.5240198373794556} -08/30/2021 21:41:33 - INFO - __main__ - Step 46657: {'lr': 0.0003958450777926782, 'samples': 8958144, 'steps': 46656, 'loss/train': 1.392342209815979} -08/30/2021 21:41:34 - INFO - __main__ - Step 46658: {'lr': 0.00039584076762672526, 'samples': 8958336, 'steps': 46657, 'loss/train': 1.3740333318710327} -08/30/2021 21:41:35 - INFO - __main__ - Step 46659: {'lr': 0.0003958364573950587, 'samples': 8958528, 'steps': 46658, 'loss/train': 1.1832071542739868} -08/30/2021 21:41:36 - INFO - __main__ - Step 46660: {'lr': 0.00039583214709768054, 'samples': 8958720, 'steps': 46659, 'loss/train': 0.8641722202301025} -08/30/2021 21:41:36 - INFO - __main__ - Step 46661: {'lr': 0.0003958278367345926, 'samples': 8958912, 'steps': 46660, 'loss/train': 1.4959338903427124} -08/30/2021 21:41:37 - INFO - __main__ - Step 46662: {'lr': 0.00039582352630579697, 'samples': 8959104, 'steps': 46661, 'loss/train': 0.5050196647644043} -08/30/2021 21:41:37 - INFO - __main__ - Step 46663: {'lr': 0.00039581921581129543, 'samples': 8959296, 'steps': 46662, 'loss/train': 1.296554446220398} -08/30/2021 21:41:39 - INFO - __main__ - Step 46664: {'lr': 0.00039581490525109005, 'samples': 8959488, 'steps': 46663, 'loss/train': 1.3569530248641968} -08/30/2021 21:41:39 - INFO - __main__ - Step 46665: {'lr': 0.00039581059462518266, 'samples': 8959680, 'steps': 46664, 'loss/train': 1.441269874572754} -08/30/2021 21:41:40 - INFO - __main__ - Step 46666: {'lr': 0.00039580628393357534, 'samples': 8959872, 'steps': 46665, 'loss/train': 2.0926387310028076} -08/30/2021 21:41:40 - INFO - __main__ - Step 46667: {'lr': 0.0003958019731762699, 'samples': 8960064, 'steps': 46666, 'loss/train': 1.323270559310913} -08/30/2021 21:41:41 - INFO - __main__ - Step 46668: {'lr': 0.0003957976623532684, 'samples': 8960256, 'steps': 46667, 'loss/train': 1.51996910572052} -08/30/2021 21:41:42 - INFO - __main__ - Step 46669: {'lr': 0.0003957933514645727, 'samples': 8960448, 'steps': 46668, 'loss/train': 0.8904617428779602} -08/30/2021 21:41:43 - INFO - __main__ - Step 46670: {'lr': 0.00039578904051018474, 'samples': 8960640, 'steps': 46669, 'loss/train': 1.41978120803833} -08/30/2021 21:41:43 - INFO - __main__ - Step 46671: {'lr': 0.00039578472949010644, 'samples': 8960832, 'steps': 46670, 'loss/train': 1.8270494937896729} -08/30/2021 21:41:44 - INFO - __main__ - Step 46672: {'lr': 0.00039578041840433986, 'samples': 8961024, 'steps': 46671, 'loss/train': 1.687943696975708} -08/30/2021 21:41:44 - INFO - __main__ - Step 46673: {'lr': 0.00039577610725288694, 'samples': 8961216, 'steps': 46672, 'loss/train': 1.4522080421447754} -08/30/2021 21:41:44 - INFO - __main__ - Step 46674: {'lr': 0.0003957717960357494, 'samples': 8961408, 'steps': 46673, 'loss/train': 0.05596524477005005} -08/30/2021 21:41:46 - INFO - __main__ - Step 46675: {'lr': 0.0003957674847529295, 'samples': 8961600, 'steps': 46674, 'loss/train': 1.565984845161438} -08/30/2021 21:41:46 - INFO - __main__ - Step 46676: {'lr': 0.00039576317340442893, 'samples': 8961792, 'steps': 46675, 'loss/train': 0.8277280926704407} -08/30/2021 21:41:47 - INFO - __main__ - Step 46677: {'lr': 0.00039575886199024976, 'samples': 8961984, 'steps': 46676, 'loss/train': 1.6112449169158936} -08/30/2021 21:41:47 - INFO - __main__ - Step 46678: {'lr': 0.0003957545505103939, 'samples': 8962176, 'steps': 46677, 'loss/train': 1.4441978931427002} -08/30/2021 21:41:47 - INFO - __main__ - Step 46679: {'lr': 0.0003957502389648632, 'samples': 8962368, 'steps': 46678, 'loss/train': 0.9319394826889038} -08/30/2021 21:41:49 - INFO - __main__ - Step 46680: {'lr': 0.00039574592735365976, 'samples': 8962560, 'steps': 46679, 'loss/train': 1.4110281467437744} -08/30/2021 21:41:49 - INFO - __main__ - Step 46681: {'lr': 0.00039574161567678545, 'samples': 8962752, 'steps': 46680, 'loss/train': 1.7208095788955688} -08/30/2021 21:41:50 - INFO - __main__ - Step 46682: {'lr': 0.00039573730393424226, 'samples': 8962944, 'steps': 46681, 'loss/train': 1.565172791481018} -08/30/2021 21:41:50 - INFO - __main__ - Step 46683: {'lr': 0.000395732992126032, 'samples': 8963136, 'steps': 46682, 'loss/train': 0.8123407959938049} -08/30/2021 21:41:50 - INFO - __main__ - Step 46684: {'lr': 0.00039572868025215677, 'samples': 8963328, 'steps': 46683, 'loss/train': 1.3226916790008545} -08/30/2021 21:41:52 - INFO - __main__ - Step 46685: {'lr': 0.0003957243683126184, 'samples': 8963520, 'steps': 46684, 'loss/train': 1.796629786491394} -08/30/2021 21:41:52 - INFO - __main__ - Step 46686: {'lr': 0.00039572005630741886, 'samples': 8963712, 'steps': 46685, 'loss/train': 1.2148160934448242} -08/30/2021 21:41:52 - INFO - __main__ - Step 46687: {'lr': 0.00039571574423656017, 'samples': 8963904, 'steps': 46686, 'loss/train': 1.4637819528579712} -08/30/2021 21:41:53 - INFO - __main__ - Step 46688: {'lr': 0.0003957114321000442, 'samples': 8964096, 'steps': 46687, 'loss/train': 1.4490044116973877} -08/30/2021 21:41:53 - INFO - __main__ - Step 46689: {'lr': 0.0003957071198978729, 'samples': 8964288, 'steps': 46688, 'loss/train': 1.9750012159347534} -08/30/2021 21:41:55 - INFO - __main__ - Step 46690: {'lr': 0.00039570280763004823, 'samples': 8964480, 'steps': 46689, 'loss/train': 0.6598650813102722} -08/30/2021 21:41:55 - INFO - __main__ - Step 46691: {'lr': 0.0003956984952965721, 'samples': 8964672, 'steps': 46690, 'loss/train': 0.6906108856201172} -08/30/2021 21:41:56 - INFO - __main__ - Step 46692: {'lr': 0.0003956941828974465, 'samples': 8964864, 'steps': 46691, 'loss/train': 1.3910542726516724} -08/30/2021 21:41:56 - INFO - __main__ - Step 46693: {'lr': 0.0003956898704326733, 'samples': 8965056, 'steps': 46692, 'loss/train': 1.6841434240341187} -08/30/2021 21:41:56 - INFO - __main__ - Step 46694: {'lr': 0.00039568555790225456, 'samples': 8965248, 'steps': 46693, 'loss/train': 0.796154260635376} -08/30/2021 21:41:58 - INFO - __main__ - Step 46695: {'lr': 0.00039568124530619213, 'samples': 8965440, 'steps': 46694, 'loss/train': 1.714715838432312} -08/30/2021 21:41:58 - INFO - __main__ - Step 46696: {'lr': 0.00039567693264448803, 'samples': 8965632, 'steps': 46695, 'loss/train': 1.0624397993087769} -08/30/2021 21:41:59 - INFO - __main__ - Step 46697: {'lr': 0.00039567261991714406, 'samples': 8965824, 'steps': 46696, 'loss/train': 1.678095817565918} -08/30/2021 21:41:59 - INFO - __main__ - Step 46698: {'lr': 0.00039566830712416226, 'samples': 8966016, 'steps': 46697, 'loss/train': 1.608786940574646} -08/30/2021 21:41:59 - INFO - __main__ - Step 46699: {'lr': 0.0003956639942655446, 'samples': 8966208, 'steps': 46698, 'loss/train': 1.038271188735962} -08/30/2021 21:42:01 - INFO - __main__ - Step 46700: {'lr': 0.000395659681341293, 'samples': 8966400, 'steps': 46699, 'loss/train': 1.3168480396270752} -08/30/2021 21:42:01 - INFO - __main__ - Step 46701: {'lr': 0.00039565536835140934, 'samples': 8966592, 'steps': 46700, 'loss/train': 1.6376005411148071} -08/30/2021 21:42:01 - INFO - __main__ - Step 46702: {'lr': 0.00039565105529589575, 'samples': 8966784, 'steps': 46701, 'loss/train': 0.26876187324523926} -08/30/2021 21:42:02 - INFO - __main__ - Step 46703: {'lr': 0.00039564674217475393, 'samples': 8966976, 'steps': 46702, 'loss/train': 2.0138771533966064} -08/30/2021 21:42:02 - INFO - __main__ - Step 46704: {'lr': 0.00039564242898798595, 'samples': 8967168, 'steps': 46703, 'loss/train': 1.4675276279449463} -08/30/2021 21:42:03 - INFO - __main__ - Step 46705: {'lr': 0.00039563811573559377, 'samples': 8967360, 'steps': 46704, 'loss/train': 1.349774718284607} -08/30/2021 21:42:04 - INFO - __main__ - Step 46706: {'lr': 0.00039563380241757927, 'samples': 8967552, 'steps': 46705, 'loss/train': 2.0031542778015137} -08/30/2021 21:42:05 - INFO - __main__ - Step 46707: {'lr': 0.00039562948903394446, 'samples': 8967744, 'steps': 46706, 'loss/train': 1.5094764232635498} -08/30/2021 21:42:05 - INFO - __main__ - Step 46708: {'lr': 0.00039562517558469124, 'samples': 8967936, 'steps': 46707, 'loss/train': 1.3479992151260376} -08/30/2021 21:42:05 - INFO - __main__ - Step 46709: {'lr': 0.00039562086206982157, 'samples': 8968128, 'steps': 46708, 'loss/train': 1.9954441785812378} -08/30/2021 21:42:06 - INFO - __main__ - Step 46710: {'lr': 0.0003956165484893374, 'samples': 8968320, 'steps': 46709, 'loss/train': 1.4335076808929443} -08/30/2021 21:42:07 - INFO - __main__ - Step 46711: {'lr': 0.0003956122348432406, 'samples': 8968512, 'steps': 46710, 'loss/train': 1.5069633722305298} -08/30/2021 21:42:08 - INFO - __main__ - Step 46712: {'lr': 0.0003956079211315332, 'samples': 8968704, 'steps': 46711, 'loss/train': 1.1742591857910156} -08/30/2021 21:42:08 - INFO - __main__ - Step 46713: {'lr': 0.00039560360735421706, 'samples': 8968896, 'steps': 46712, 'loss/train': 1.3166167736053467} -08/30/2021 21:42:08 - INFO - __main__ - Step 46714: {'lr': 0.0003955992935112943, 'samples': 8969088, 'steps': 46713, 'loss/train': 2.564699649810791} -08/30/2021 21:42:09 - INFO - __main__ - Step 46715: {'lr': 0.00039559497960276667, 'samples': 8969280, 'steps': 46714, 'loss/train': 0.9008917212486267} -08/30/2021 21:42:10 - INFO - __main__ - Step 46716: {'lr': 0.0003955906656286362, 'samples': 8969472, 'steps': 46715, 'loss/train': 1.0075536966323853} -08/30/2021 21:42:11 - INFO - __main__ - Step 46717: {'lr': 0.00039558635158890487, 'samples': 8969664, 'steps': 46716, 'loss/train': 1.7885315418243408} -08/30/2021 21:42:11 - INFO - __main__ - Step 46718: {'lr': 0.0003955820374835745, 'samples': 8969856, 'steps': 46717, 'loss/train': 1.791002869606018} -08/30/2021 21:42:11 - INFO - __main__ - Step 46719: {'lr': 0.0003955777233126472, 'samples': 8970048, 'steps': 46718, 'loss/train': 1.9397109746932983} -08/30/2021 21:42:12 - INFO - __main__ - Step 46720: {'lr': 0.00039557340907612473, 'samples': 8970240, 'steps': 46719, 'loss/train': 1.7698420286178589} -08/30/2021 21:42:14 - INFO - __main__ - Step 46721: {'lr': 0.00039556909477400914, 'samples': 8970432, 'steps': 46720, 'loss/train': 1.16049063205719} -08/30/2021 21:42:14 - INFO - __main__ - Step 46722: {'lr': 0.00039556478040630246, 'samples': 8970624, 'steps': 46721, 'loss/train': 0.9853895902633667} -08/30/2021 21:42:14 - INFO - __main__ - Step 46723: {'lr': 0.0003955604659730064, 'samples': 8970816, 'steps': 46722, 'loss/train': 1.8158965110778809} -08/30/2021 21:42:15 - INFO - __main__ - Step 46724: {'lr': 0.00039555615147412315, 'samples': 8971008, 'steps': 46723, 'loss/train': 1.3533720970153809} -08/30/2021 21:42:15 - INFO - __main__ - Step 46725: {'lr': 0.00039555183690965454, 'samples': 8971200, 'steps': 46724, 'loss/train': 0.7115915417671204} -08/30/2021 21:42:16 - INFO - __main__ - Step 46726: {'lr': 0.00039554752227960243, 'samples': 8971392, 'steps': 46725, 'loss/train': 1.4556275606155396} -08/30/2021 21:42:17 - INFO - __main__ - Step 46727: {'lr': 0.0003955432075839689, 'samples': 8971584, 'steps': 46726, 'loss/train': 1.592814326286316} -08/30/2021 21:42:18 - INFO - __main__ - Step 46728: {'lr': 0.00039553889282275585, 'samples': 8971776, 'steps': 46727, 'loss/train': 1.2864998579025269} -08/30/2021 21:42:18 - INFO - __main__ - Step 46729: {'lr': 0.0003955345779959653, 'samples': 8971968, 'steps': 46728, 'loss/train': 1.4471197128295898} -08/30/2021 21:42:18 - INFO - __main__ - Step 46730: {'lr': 0.00039553026310359897, 'samples': 8972160, 'steps': 46729, 'loss/train': 1.2276301383972168} -08/30/2021 21:42:19 - INFO - __main__ - Step 46731: {'lr': 0.000395525948145659, 'samples': 8972352, 'steps': 46730, 'loss/train': 1.077656865119934} -08/30/2021 21:42:21 - INFO - __main__ - Step 46732: {'lr': 0.0003955216331221473, 'samples': 8972544, 'steps': 46731, 'loss/train': 1.38236665725708} -08/30/2021 21:42:21 - INFO - __main__ - Step 46733: {'lr': 0.00039551731803306577, 'samples': 8972736, 'steps': 46732, 'loss/train': 1.2690858840942383} -08/30/2021 21:42:21 - INFO - __main__ - Step 46734: {'lr': 0.0003955130028784165, 'samples': 8972928, 'steps': 46733, 'loss/train': 1.246100902557373} -08/30/2021 21:42:22 - INFO - __main__ - Step 46735: {'lr': 0.0003955086876582012, 'samples': 8973120, 'steps': 46734, 'loss/train': 1.5914968252182007} -08/30/2021 21:42:22 - INFO - __main__ - Step 46736: {'lr': 0.000395504372372422, 'samples': 8973312, 'steps': 46735, 'loss/train': 1.3203520774841309} -08/30/2021 21:42:23 - INFO - __main__ - Step 46737: {'lr': 0.0003955000570210807, 'samples': 8973504, 'steps': 46736, 'loss/train': 1.2192316055297852} -08/30/2021 21:42:24 - INFO - __main__ - Step 46738: {'lr': 0.0003954957416041793, 'samples': 8973696, 'steps': 46737, 'loss/train': 1.6705372333526611} -08/30/2021 21:42:24 - INFO - __main__ - Step 46739: {'lr': 0.0003954914261217198, 'samples': 8973888, 'steps': 46738, 'loss/train': 1.587420105934143} -08/30/2021 21:42:25 - INFO - __main__ - Step 46740: {'lr': 0.0003954871105737042, 'samples': 8974080, 'steps': 46739, 'loss/train': 1.7164605855941772} -08/30/2021 21:42:25 - INFO - __main__ - Step 46741: {'lr': 0.00039548279496013424, 'samples': 8974272, 'steps': 46740, 'loss/train': 1.354990005493164} -08/30/2021 21:42:26 - INFO - __main__ - Step 46742: {'lr': 0.000395478479281012, 'samples': 8974464, 'steps': 46741, 'loss/train': 0.49001172184944153} -08/30/2021 21:42:27 - INFO - __main__ - Step 46743: {'lr': 0.00039547416353633946, 'samples': 8974656, 'steps': 46742, 'loss/train': 1.719616174697876} -08/30/2021 21:42:27 - INFO - __main__ - Step 46744: {'lr': 0.00039546984772611843, 'samples': 8974848, 'steps': 46743, 'loss/train': 1.4128555059432983} -08/30/2021 21:42:28 - INFO - __main__ - Step 46745: {'lr': 0.00039546553185035093, 'samples': 8975040, 'steps': 46744, 'loss/train': 1.2041451930999756} -08/30/2021 21:42:28 - INFO - __main__ - Step 46746: {'lr': 0.00039546121590903897, 'samples': 8975232, 'steps': 46745, 'loss/train': 0.9949818849563599} -08/30/2021 21:42:29 - INFO - __main__ - Step 46747: {'lr': 0.0003954568999021844, 'samples': 8975424, 'steps': 46746, 'loss/train': 0.9891777634620667} -08/30/2021 21:42:30 - INFO - __main__ - Step 46748: {'lr': 0.0003954525838297892, 'samples': 8975616, 'steps': 46747, 'loss/train': 0.6386354565620422} -08/30/2021 21:42:30 - INFO - __main__ - Step 46749: {'lr': 0.0003954482676918553, 'samples': 8975808, 'steps': 46748, 'loss/train': 1.3243474960327148} -08/30/2021 21:42:31 - INFO - __main__ - Step 46750: {'lr': 0.00039544395148838465, 'samples': 8976000, 'steps': 46749, 'loss/train': 1.4077264070510864} -08/30/2021 21:42:31 - INFO - __main__ - Step 46751: {'lr': 0.0003954396352193792, 'samples': 8976192, 'steps': 46750, 'loss/train': 1.731931209564209} -08/30/2021 21:42:32 - INFO - __main__ - Step 46752: {'lr': 0.000395435318884841, 'samples': 8976384, 'steps': 46751, 'loss/train': 0.9415560364723206} -08/30/2021 21:42:33 - INFO - __main__ - Step 46753: {'lr': 0.0003954310024847717, 'samples': 8976576, 'steps': 46752, 'loss/train': 0.8254061341285706} -08/30/2021 21:42:33 - INFO - __main__ - Step 46754: {'lr': 0.00039542668601917353, 'samples': 8976768, 'steps': 46753, 'loss/train': 1.4402449131011963} -08/30/2021 21:42:34 - INFO - __main__ - Step 46755: {'lr': 0.0003954223694880483, 'samples': 8976960, 'steps': 46754, 'loss/train': 1.4386957883834839} -08/30/2021 21:42:34 - INFO - __main__ - Step 46756: {'lr': 0.0003954180528913981, 'samples': 8977152, 'steps': 46755, 'loss/train': 1.414384365081787} -08/30/2021 21:42:34 - INFO - __main__ - Step 46757: {'lr': 0.0003954137362292247, 'samples': 8977344, 'steps': 46756, 'loss/train': 1.3734735250473022} -08/30/2021 21:42:36 - INFO - __main__ - Step 46758: {'lr': 0.0003954094195015301, 'samples': 8977536, 'steps': 46757, 'loss/train': 1.3338264226913452} -08/30/2021 21:42:36 - INFO - __main__ - Step 46759: {'lr': 0.0003954051027083163, 'samples': 8977728, 'steps': 46758, 'loss/train': 1.257049322128296} -08/30/2021 21:42:37 - INFO - __main__ - Step 46760: {'lr': 0.0003954007858495852, 'samples': 8977920, 'steps': 46759, 'loss/train': 1.6133140325546265} -08/30/2021 21:42:37 - INFO - __main__ - Step 46761: {'lr': 0.00039539646892533867, 'samples': 8978112, 'steps': 46760, 'loss/train': 0.7925180792808533} -08/30/2021 21:42:37 - INFO - __main__ - Step 46762: {'lr': 0.00039539215193557886, 'samples': 8978304, 'steps': 46761, 'loss/train': 1.6431457996368408} -08/30/2021 21:42:39 - INFO - __main__ - Step 46763: {'lr': 0.0003953878348803075, 'samples': 8978496, 'steps': 46762, 'loss/train': 1.5009441375732422} -08/30/2021 21:42:40 - INFO - __main__ - Step 46764: {'lr': 0.0003953835177595266, 'samples': 8978688, 'steps': 46763, 'loss/train': 1.6703245639801025} -08/30/2021 21:42:40 - INFO - __main__ - Step 46765: {'lr': 0.0003953792005732382, 'samples': 8978880, 'steps': 46764, 'loss/train': 1.4324314594268799} -08/30/2021 21:42:40 - INFO - __main__ - Step 46766: {'lr': 0.0003953748833214442, 'samples': 8979072, 'steps': 46765, 'loss/train': 2.132652759552002} -08/30/2021 21:42:41 - INFO - __main__ - Step 46767: {'lr': 0.00039537056600414647, 'samples': 8979264, 'steps': 46766, 'loss/train': 1.484071969985962} -08/30/2021 21:42:43 - INFO - __main__ - Step 46768: {'lr': 0.00039536624862134695, 'samples': 8979456, 'steps': 46767, 'loss/train': 0.051184408366680145} -08/30/2021 21:42:43 - INFO - __main__ - Step 46769: {'lr': 0.00039536193117304774, 'samples': 8979648, 'steps': 46768, 'loss/train': 0.13648787140846252} -08/30/2021 21:42:43 - INFO - __main__ - Step 46770: {'lr': 0.0003953576136592507, 'samples': 8979840, 'steps': 46769, 'loss/train': 1.4143809080123901} -08/30/2021 21:42:44 - INFO - __main__ - Step 46771: {'lr': 0.0003953532960799577, 'samples': 8980032, 'steps': 46770, 'loss/train': 0.10448271036148071} -08/30/2021 21:42:44 - INFO - __main__ - Step 46772: {'lr': 0.0003953489784351707, 'samples': 8980224, 'steps': 46771, 'loss/train': 1.5549207925796509} -08/30/2021 21:42:46 - INFO - __main__ - Step 46773: {'lr': 0.0003953446607248918, 'samples': 8980416, 'steps': 46772, 'loss/train': 0.9098787903785706} -08/30/2021 21:42:47 - INFO - __main__ - Step 46774: {'lr': 0.00039534034294912276, 'samples': 8980608, 'steps': 46773, 'loss/train': 1.4835467338562012} -08/30/2021 21:42:47 - INFO - __main__ - Step 46775: {'lr': 0.0003953360251078656, 'samples': 8980800, 'steps': 46774, 'loss/train': 1.5607223510742188} -08/30/2021 21:42:47 - INFO - __main__ - Step 46776: {'lr': 0.0003953317072011224, 'samples': 8980992, 'steps': 46775, 'loss/train': 1.2999229431152344} -08/30/2021 21:42:48 - INFO - __main__ - Step 46777: {'lr': 0.0003953273892288949, 'samples': 8981184, 'steps': 46776, 'loss/train': 0.8891803026199341} -08/30/2021 21:42:48 - INFO - __main__ - Step 46778: {'lr': 0.00039532307119118505, 'samples': 8981376, 'steps': 46777, 'loss/train': 1.2651509046554565} -08/30/2021 21:42:50 - INFO - __main__ - Step 46779: {'lr': 0.00039531875308799493, 'samples': 8981568, 'steps': 46778, 'loss/train': 1.9276164770126343} -08/30/2021 21:42:50 - INFO - __main__ - Step 46780: {'lr': 0.0003953144349193264, 'samples': 8981760, 'steps': 46779, 'loss/train': 1.5773847103118896} -08/30/2021 21:42:50 - INFO - __main__ - Step 46781: {'lr': 0.0003953101166851814, 'samples': 8981952, 'steps': 46780, 'loss/train': 1.127846360206604} -08/30/2021 21:42:51 - INFO - __main__ - Step 46782: {'lr': 0.0003953057983855619, 'samples': 8982144, 'steps': 46781, 'loss/train': 0.2567024230957031} -08/30/2021 21:42:51 - INFO - __main__ - Step 46783: {'lr': 0.00039530148002046996, 'samples': 8982336, 'steps': 46782, 'loss/train': 0.8835437297821045} -08/30/2021 21:42:53 - INFO - __main__ - Step 46784: {'lr': 0.0003952971615899074, 'samples': 8982528, 'steps': 46783, 'loss/train': 1.8005626201629639} -08/30/2021 21:42:53 - INFO - __main__ - Step 46785: {'lr': 0.00039529284309387607, 'samples': 8982720, 'steps': 46784, 'loss/train': 0.7701586484909058} -08/30/2021 21:42:53 - INFO - __main__ - Step 46786: {'lr': 0.0003952885245323781, 'samples': 8982912, 'steps': 46785, 'loss/train': 1.129795789718628} -08/30/2021 21:42:54 - INFO - __main__ - Step 46787: {'lr': 0.00039528420590541536, 'samples': 8983104, 'steps': 46786, 'loss/train': 1.7253730297088623} -08/30/2021 21:42:54 - INFO - __main__ - Step 46788: {'lr': 0.0003952798872129897, 'samples': 8983296, 'steps': 46787, 'loss/train': 1.5704959630966187} -08/30/2021 21:42:56 - INFO - __main__ - Step 46789: {'lr': 0.00039527556845510336, 'samples': 8983488, 'steps': 46788, 'loss/train': 0.7137991786003113} -08/30/2021 21:42:56 - INFO - __main__ - Step 46790: {'lr': 0.00039527124963175796, 'samples': 8983680, 'steps': 46789, 'loss/train': 1.4640997648239136} -08/30/2021 21:42:56 - INFO - __main__ - Step 46791: {'lr': 0.0003952669307429556, 'samples': 8983872, 'steps': 46790, 'loss/train': 1.5724915266036987} -08/30/2021 21:42:57 - INFO - __main__ - Step 46792: {'lr': 0.00039526261178869816, 'samples': 8984064, 'steps': 46791, 'loss/train': 1.6930660009384155} -08/30/2021 21:42:57 - INFO - __main__ - Step 46793: {'lr': 0.0003952582927689877, 'samples': 8984256, 'steps': 46792, 'loss/train': 1.3517203330993652} -08/30/2021 21:42:59 - INFO - __main__ - Step 46794: {'lr': 0.00039525397368382604, 'samples': 8984448, 'steps': 46793, 'loss/train': 1.7242711782455444} -08/30/2021 21:42:59 - INFO - __main__ - Step 46795: {'lr': 0.0003952496545332152, 'samples': 8984640, 'steps': 46794, 'loss/train': 1.0633474588394165} -08/30/2021 21:42:59 - INFO - __main__ - Step 46796: {'lr': 0.00039524533531715714, 'samples': 8984832, 'steps': 46795, 'loss/train': 0.38748928904533386} -08/30/2021 21:43:00 - INFO - __main__ - Step 46797: {'lr': 0.00039524101603565377, 'samples': 8985024, 'steps': 46796, 'loss/train': 1.515345811843872} -08/30/2021 21:43:00 - INFO - __main__ - Step 46798: {'lr': 0.000395236696688707, 'samples': 8985216, 'steps': 46797, 'loss/train': 1.1993645429611206} -08/30/2021 21:43:02 - INFO - __main__ - Step 46799: {'lr': 0.0003952323772763188, 'samples': 8985408, 'steps': 46798, 'loss/train': 1.1981366872787476} -08/30/2021 21:43:02 - INFO - __main__ - Step 46800: {'lr': 0.00039522805779849116, 'samples': 8985600, 'steps': 46799, 'loss/train': 1.5931971073150635} -08/30/2021 21:43:02 - INFO - __main__ - Step 46801: {'lr': 0.000395223738255226, 'samples': 8985792, 'steps': 46800, 'loss/train': 1.298779010772705} -08/30/2021 21:43:03 - INFO - __main__ - Step 46802: {'lr': 0.00039521941864652525, 'samples': 8985984, 'steps': 46801, 'loss/train': 1.1574164628982544} -08/30/2021 21:43:03 - INFO - __main__ - Step 46803: {'lr': 0.0003952150989723909, 'samples': 8986176, 'steps': 46802, 'loss/train': 0.6707392334938049} -08/30/2021 21:43:04 - INFO - __main__ - Step 46804: {'lr': 0.00039521077923282486, 'samples': 8986368, 'steps': 46803, 'loss/train': 1.3017579317092896} -08/30/2021 21:43:05 - INFO - __main__ - Step 46805: {'lr': 0.00039520645942782906, 'samples': 8986560, 'steps': 46804, 'loss/train': 1.4511346817016602} -08/30/2021 21:43:05 - INFO - __main__ - Step 46806: {'lr': 0.00039520213955740555, 'samples': 8986752, 'steps': 46805, 'loss/train': 1.5111244916915894} -08/30/2021 21:43:06 - INFO - __main__ - Step 46807: {'lr': 0.0003951978196215561, 'samples': 8986944, 'steps': 46806, 'loss/train': 0.9505908489227295} -08/30/2021 21:43:06 - INFO - __main__ - Step 46808: {'lr': 0.00039519349962028276, 'samples': 8987136, 'steps': 46807, 'loss/train': 1.3132978677749634} -08/30/2021 21:43:06 - INFO - __main__ - Step 46809: {'lr': 0.0003951891795535875, 'samples': 8987328, 'steps': 46808, 'loss/train': 0.7465982437133789} -08/30/2021 21:43:08 - INFO - __main__ - Step 46810: {'lr': 0.00039518485942147233, 'samples': 8987520, 'steps': 46809, 'loss/train': 1.4024896621704102} -08/30/2021 21:43:09 - INFO - __main__ - Step 46811: {'lr': 0.0003951805392239389, 'samples': 8987712, 'steps': 46810, 'loss/train': 1.0648093223571777} -08/30/2021 21:43:09 - INFO - __main__ - Step 46812: {'lr': 0.00039517621896098954, 'samples': 8987904, 'steps': 46811, 'loss/train': 0.9817931056022644} -08/30/2021 21:43:09 - INFO - __main__ - Step 46813: {'lr': 0.00039517189863262593, 'samples': 8988096, 'steps': 46812, 'loss/train': 1.2508925199508667} -08/30/2021 21:43:10 - INFO - __main__ - Step 46814: {'lr': 0.00039516757823885006, 'samples': 8988288, 'steps': 46813, 'loss/train': 1.2731566429138184} -08/30/2021 21:43:11 - INFO - __main__ - Step 46815: {'lr': 0.000395163257779664, 'samples': 8988480, 'steps': 46814, 'loss/train': 0.9015750288963318} -08/30/2021 21:43:12 - INFO - __main__ - Step 46816: {'lr': 0.00039515893725506956, 'samples': 8988672, 'steps': 46815, 'loss/train': 1.5776115655899048} -08/30/2021 21:43:12 - INFO - __main__ - Step 46817: {'lr': 0.0003951546166650688, 'samples': 8988864, 'steps': 46816, 'loss/train': 1.4892765283584595} -08/30/2021 21:43:12 - INFO - __main__ - Step 46818: {'lr': 0.0003951502960096636, 'samples': 8989056, 'steps': 46817, 'loss/train': 1.0947678089141846} -08/30/2021 21:43:13 - INFO - __main__ - Step 46819: {'lr': 0.00039514597528885587, 'samples': 8989248, 'steps': 46818, 'loss/train': 1.752001166343689} -08/30/2021 21:43:13 - INFO - __main__ - Step 46820: {'lr': 0.0003951416545026476, 'samples': 8989440, 'steps': 46819, 'loss/train': 1.6288435459136963} -08/30/2021 21:43:15 - INFO - __main__ - Step 46821: {'lr': 0.0003951373336510408, 'samples': 8989632, 'steps': 46820, 'loss/train': 0.8195870518684387} -08/30/2021 21:43:15 - INFO - __main__ - Step 46822: {'lr': 0.00039513301273403733, 'samples': 8989824, 'steps': 46821, 'loss/train': 1.6529247760772705} -08/30/2021 21:43:15 - INFO - __main__ - Step 46823: {'lr': 0.0003951286917516392, 'samples': 8990016, 'steps': 46822, 'loss/train': 0.9636734127998352} -08/30/2021 21:43:16 - INFO - __main__ - Step 46824: {'lr': 0.00039512437070384827, 'samples': 8990208, 'steps': 46823, 'loss/train': 1.0846912860870361} -08/30/2021 21:43:16 - INFO - __main__ - Step 46825: {'lr': 0.00039512004959066653, 'samples': 8990400, 'steps': 46824, 'loss/train': 2.174528121948242} -08/30/2021 21:43:18 - INFO - __main__ - Step 46826: {'lr': 0.00039511572841209597, 'samples': 8990592, 'steps': 46825, 'loss/train': 1.1301943063735962} -08/30/2021 21:43:18 - INFO - __main__ - Step 46827: {'lr': 0.00039511140716813847, 'samples': 8990784, 'steps': 46826, 'loss/train': 1.4306621551513672} -08/30/2021 21:43:19 - INFO - __main__ - Step 46828: {'lr': 0.00039510708585879605, 'samples': 8990976, 'steps': 46827, 'loss/train': 1.274446725845337} -08/30/2021 21:43:19 - INFO - __main__ - Step 46829: {'lr': 0.00039510276448407054, 'samples': 8991168, 'steps': 46828, 'loss/train': 1.6111103296279907} -08/30/2021 21:43:19 - INFO - __main__ - Step 46830: {'lr': 0.00039509844304396407, 'samples': 8991360, 'steps': 46829, 'loss/train': 0.9941524863243103} -08/30/2021 21:43:21 - INFO - __main__ - Step 46831: {'lr': 0.00039509412153847847, 'samples': 8991552, 'steps': 46830, 'loss/train': 1.8219833374023438} -08/30/2021 21:43:22 - INFO - __main__ - Step 46832: {'lr': 0.00039508979996761564, 'samples': 8991744, 'steps': 46831, 'loss/train': 0.06311263889074326} -08/30/2021 21:43:22 - INFO - __main__ - Step 46833: {'lr': 0.00039508547833137753, 'samples': 8991936, 'steps': 46832, 'loss/train': 1.9140911102294922} -08/30/2021 21:43:22 - INFO - __main__ - Step 46834: {'lr': 0.0003950811566297662, 'samples': 8992128, 'steps': 46833, 'loss/train': 0.9637599587440491} -08/30/2021 21:43:23 - INFO - __main__ - Step 46835: {'lr': 0.00039507683486278357, 'samples': 8992320, 'steps': 46834, 'loss/train': 0.997583270072937} -08/30/2021 21:43:25 - INFO - __main__ - Step 46836: {'lr': 0.00039507251303043156, 'samples': 8992512, 'steps': 46835, 'loss/train': 1.4343088865280151} -08/30/2021 21:43:25 - INFO - __main__ - Step 46837: {'lr': 0.0003950681911327121, 'samples': 8992704, 'steps': 46836, 'loss/train': 0.8677394390106201} -08/30/2021 21:43:26 - INFO - __main__ - Step 46838: {'lr': 0.00039506386916962714, 'samples': 8992896, 'steps': 46837, 'loss/train': 1.7345106601715088} -08/30/2021 21:43:26 - INFO - __main__ - Step 46839: {'lr': 0.0003950595471411786, 'samples': 8993088, 'steps': 46838, 'loss/train': 0.7948237061500549} -08/30/2021 21:43:26 - INFO - __main__ - Step 46840: {'lr': 0.00039505522504736855, 'samples': 8993280, 'steps': 46839, 'loss/train': 1.6832594871520996} -08/30/2021 21:43:27 - INFO - __main__ - Step 46841: {'lr': 0.00039505090288819876, 'samples': 8993472, 'steps': 46840, 'loss/train': 1.6884573698043823} -08/30/2021 21:43:27 - INFO - __main__ - Step 46842: {'lr': 0.00039504658066367136, 'samples': 8993664, 'steps': 46841, 'loss/train': 1.4265028238296509} -08/30/2021 21:43:29 - INFO - __main__ - Step 46843: {'lr': 0.0003950422583737882, 'samples': 8993856, 'steps': 46842, 'loss/train': 1.5434978008270264} -08/30/2021 21:43:29 - INFO - __main__ - Step 46844: {'lr': 0.0003950379360185512, 'samples': 8994048, 'steps': 46843, 'loss/train': 0.9535610675811768} -08/30/2021 21:43:29 - INFO - __main__ - Step 46845: {'lr': 0.00039503361359796235, 'samples': 8994240, 'steps': 46844, 'loss/train': 0.6791813969612122} -08/30/2021 21:43:30 - INFO - __main__ - Step 46846: {'lr': 0.00039502929111202357, 'samples': 8994432, 'steps': 46845, 'loss/train': 1.835464358329773} -08/30/2021 21:43:30 - INFO - __main__ - Step 46847: {'lr': 0.0003950249685607369, 'samples': 8994624, 'steps': 46846, 'loss/train': 1.4448151588439941} -08/30/2021 21:43:32 - INFO - __main__ - Step 46848: {'lr': 0.00039502064594410414, 'samples': 8994816, 'steps': 46847, 'loss/train': 1.239708423614502} -08/30/2021 21:43:32 - INFO - __main__ - Step 46849: {'lr': 0.00039501632326212734, 'samples': 8995008, 'steps': 46848, 'loss/train': 1.8383761644363403} -08/30/2021 21:43:33 - INFO - __main__ - Step 46850: {'lr': 0.00039501200051480844, 'samples': 8995200, 'steps': 46849, 'loss/train': 1.7683511972427368} -08/30/2021 21:43:33 - INFO - __main__ - Step 46851: {'lr': 0.0003950076777021494, 'samples': 8995392, 'steps': 46850, 'loss/train': 1.6279022693634033} -08/30/2021 21:43:33 - INFO - __main__ - Step 46852: {'lr': 0.00039500335482415205, 'samples': 8995584, 'steps': 46851, 'loss/train': 1.3126909732818604} -08/30/2021 21:43:35 - INFO - __main__ - Step 46853: {'lr': 0.00039499903188081856, 'samples': 8995776, 'steps': 46852, 'loss/train': 1.5261602401733398} -08/30/2021 21:43:35 - INFO - __main__ - Step 46854: {'lr': 0.0003949947088721506, 'samples': 8995968, 'steps': 46853, 'loss/train': 1.5286965370178223} -08/30/2021 21:43:36 - INFO - __main__ - Step 46855: {'lr': 0.0003949903857981503, 'samples': 8996160, 'steps': 46854, 'loss/train': 1.4346762895584106} -08/30/2021 21:43:36 - INFO - __main__ - Step 46856: {'lr': 0.0003949860626588196, 'samples': 8996352, 'steps': 46855, 'loss/train': 1.3137578964233398} -08/30/2021 21:43:36 - INFO - __main__ - Step 46857: {'lr': 0.0003949817394541604, 'samples': 8996544, 'steps': 46856, 'loss/train': 1.7748647928237915} -08/30/2021 21:43:37 - INFO - __main__ - Step 46858: {'lr': 0.0003949774161841747, 'samples': 8996736, 'steps': 46857, 'loss/train': 1.0847824811935425} -08/30/2021 21:43:38 - INFO - __main__ - Step 46859: {'lr': 0.0003949730928488644, 'samples': 8996928, 'steps': 46858, 'loss/train': 1.1866612434387207} -08/30/2021 21:43:39 - INFO - __main__ - Step 46860: {'lr': 0.0003949687694482314, 'samples': 8997120, 'steps': 46859, 'loss/train': 0.5565835237503052} -08/30/2021 21:43:39 - INFO - __main__ - Step 46861: {'lr': 0.0003949644459822778, 'samples': 8997312, 'steps': 46860, 'loss/train': 1.680198073387146} -08/30/2021 21:43:40 - INFO - __main__ - Step 46862: {'lr': 0.00039496012245100536, 'samples': 8997504, 'steps': 46861, 'loss/train': 1.6474800109863281} -08/30/2021 21:43:40 - INFO - __main__ - Step 46863: {'lr': 0.0003949557988544162, 'samples': 8997696, 'steps': 46862, 'loss/train': 1.7829217910766602} -08/30/2021 21:43:40 - INFO - __main__ - Step 46864: {'lr': 0.0003949514751925122, 'samples': 8997888, 'steps': 46863, 'loss/train': 0.6775663495063782} -08/30/2021 21:43:42 - INFO - __main__ - Step 46865: {'lr': 0.00039494715146529526, 'samples': 8998080, 'steps': 46864, 'loss/train': 0.6734489798545837} -08/30/2021 21:43:42 - INFO - __main__ - Step 46866: {'lr': 0.00039494282767276736, 'samples': 8998272, 'steps': 46865, 'loss/train': 1.3911417722702026} -08/30/2021 21:43:42 - INFO - __main__ - Step 46867: {'lr': 0.0003949385038149305, 'samples': 8998464, 'steps': 46866, 'loss/train': 1.6095683574676514} -08/30/2021 21:43:43 - INFO - __main__ - Step 46868: {'lr': 0.0003949341798917866, 'samples': 8998656, 'steps': 46867, 'loss/train': 1.4861193895339966} -08/30/2021 21:43:43 - INFO - __main__ - Step 46869: {'lr': 0.00039492985590333754, 'samples': 8998848, 'steps': 46868, 'loss/train': 1.6450875997543335} -08/30/2021 21:43:45 - INFO - __main__ - Step 46870: {'lr': 0.00039492553184958533, 'samples': 8999040, 'steps': 46869, 'loss/train': 1.5479779243469238} -08/30/2021 21:43:45 - INFO - __main__ - Step 46871: {'lr': 0.00039492120773053195, 'samples': 8999232, 'steps': 46870, 'loss/train': 0.8354942202568054} -08/30/2021 21:43:46 - INFO - __main__ - Step 46872: {'lr': 0.0003949168835461793, 'samples': 8999424, 'steps': 46871, 'loss/train': 1.2415190935134888} -08/30/2021 21:43:46 - INFO - __main__ - Step 46873: {'lr': 0.0003949125592965293, 'samples': 8999616, 'steps': 46872, 'loss/train': 1.026503086090088} -08/30/2021 21:43:46 - INFO - __main__ - Step 46874: {'lr': 0.000394908234981584, 'samples': 8999808, 'steps': 46873, 'loss/train': 1.2157422304153442} -08/30/2021 21:43:48 - INFO - __main__ - Step 46875: {'lr': 0.00039490391060134525, 'samples': 9000000, 'steps': 46874, 'loss/train': 0.33740949630737305} -08/30/2021 21:43:48 - INFO - __main__ - Step 46876: {'lr': 0.000394899586155815, 'samples': 9000192, 'steps': 46875, 'loss/train': 1.6828782558441162} -08/30/2021 21:43:49 - INFO - __main__ - Step 46877: {'lr': 0.00039489526164499536, 'samples': 9000384, 'steps': 46876, 'loss/train': 1.5990478992462158} -08/30/2021 21:43:49 - INFO - __main__ - Step 46878: {'lr': 0.000394890937068888, 'samples': 9000576, 'steps': 46877, 'loss/train': 1.383968472480774} -08/30/2021 21:43:49 - INFO - __main__ - Step 46879: {'lr': 0.00039488661242749506, 'samples': 9000768, 'steps': 46878, 'loss/train': 0.0676184818148613} -08/30/2021 21:43:51 - INFO - __main__ - Step 46880: {'lr': 0.00039488228772081846, 'samples': 9000960, 'steps': 46879, 'loss/train': 1.2641034126281738} -08/30/2021 21:43:51 - INFO - __main__ - Step 46881: {'lr': 0.00039487796294886016, 'samples': 9001152, 'steps': 46880, 'loss/train': 1.5757015943527222} -08/30/2021 21:43:52 - INFO - __main__ - Step 46882: {'lr': 0.0003948736381116221, 'samples': 9001344, 'steps': 46881, 'loss/train': 0.9407084584236145} -08/30/2021 21:43:52 - INFO - __main__ - Step 46883: {'lr': 0.0003948693132091061, 'samples': 9001536, 'steps': 46882, 'loss/train': 1.3212473392486572} -08/30/2021 21:43:52 - INFO - __main__ - Step 46884: {'lr': 0.00039486498824131434, 'samples': 9001728, 'steps': 46883, 'loss/train': 0.8301441669464111} -08/30/2021 21:43:53 - INFO - __main__ - Step 46885: {'lr': 0.00039486066320824865, 'samples': 9001920, 'steps': 46884, 'loss/train': 1.3472568988800049} -08/30/2021 21:43:55 - INFO - __main__ - Step 46886: {'lr': 0.00039485633810991096, 'samples': 9002112, 'steps': 46885, 'loss/train': 1.4078797101974487} -08/30/2021 21:43:55 - INFO - __main__ - Step 46887: {'lr': 0.0003948520129463032, 'samples': 9002304, 'steps': 46886, 'loss/train': 1.7623382806777954} -08/30/2021 21:43:55 - INFO - __main__ - Step 46888: {'lr': 0.0003948476877174274, 'samples': 9002496, 'steps': 46887, 'loss/train': 1.0218671560287476} -08/30/2021 21:43:56 - INFO - __main__ - Step 46889: {'lr': 0.0003948433624232854, 'samples': 9002688, 'steps': 46888, 'loss/train': 0.778704047203064} -08/30/2021 21:43:56 - INFO - __main__ - Step 46890: {'lr': 0.0003948390370638794, 'samples': 9002880, 'steps': 46889, 'loss/train': 0.9362194538116455} -08/30/2021 21:43:58 - INFO - __main__ - Step 46891: {'lr': 0.000394834711639211, 'samples': 9003072, 'steps': 46890, 'loss/train': 1.4387551546096802} -08/30/2021 21:43:59 - INFO - __main__ - Step 46892: {'lr': 0.00039483038614928235, 'samples': 9003264, 'steps': 46891, 'loss/train': 2.5729401111602783} -08/30/2021 21:43:59 - INFO - __main__ - Step 46893: {'lr': 0.0003948260605940953, 'samples': 9003456, 'steps': 46892, 'loss/train': 2.4900550842285156} -08/30/2021 21:44:00 - INFO - __main__ - Step 46894: {'lr': 0.00039482173497365193, 'samples': 9003648, 'steps': 46893, 'loss/train': 0.16495098173618317} -08/30/2021 21:44:00 - INFO - __main__ - Step 46895: {'lr': 0.0003948174092879541, 'samples': 9003840, 'steps': 46894, 'loss/train': 1.792518973350525} -08/30/2021 21:44:00 - INFO - __main__ - Step 46896: {'lr': 0.0003948130835370038, 'samples': 9004032, 'steps': 46895, 'loss/train': 1.7676103115081787} -08/30/2021 21:44:02 - INFO - __main__ - Step 46897: {'lr': 0.000394808757720803, 'samples': 9004224, 'steps': 46896, 'loss/train': 1.2244478464126587} -08/30/2021 21:44:02 - INFO - __main__ - Step 46898: {'lr': 0.00039480443183935357, 'samples': 9004416, 'steps': 46897, 'loss/train': 1.4690419435501099} -08/30/2021 21:44:02 - INFO - __main__ - Step 46899: {'lr': 0.0003948001058926575, 'samples': 9004608, 'steps': 46898, 'loss/train': 1.1695542335510254} -08/30/2021 21:44:03 - INFO - __main__ - Step 46900: {'lr': 0.0003947957798807167, 'samples': 9004800, 'steps': 46899, 'loss/train': 1.4416167736053467} -08/30/2021 21:44:03 - INFO - __main__ - Step 46901: {'lr': 0.00039479145380353313, 'samples': 9004992, 'steps': 46900, 'loss/train': 1.119141936302185} -08/30/2021 21:44:05 - INFO - __main__ - Step 46902: {'lr': 0.0003947871276611088, 'samples': 9005184, 'steps': 46901, 'loss/train': 1.3132799863815308} -08/30/2021 21:44:05 - INFO - __main__ - Step 46903: {'lr': 0.0003947828014534457, 'samples': 9005376, 'steps': 46902, 'loss/train': 0.9954779744148254} -08/30/2021 21:44:06 - INFO - __main__ - Step 46904: {'lr': 0.00039477847518054566, 'samples': 9005568, 'steps': 46903, 'loss/train': 1.407454252243042} -08/30/2021 21:44:06 - INFO - __main__ - Step 46905: {'lr': 0.00039477414884241064, 'samples': 9005760, 'steps': 46904, 'loss/train': 1.0129156112670898} -08/30/2021 21:44:06 - INFO - __main__ - Step 46906: {'lr': 0.0003947698224390426, 'samples': 9005952, 'steps': 46905, 'loss/train': 1.088590383529663} -08/30/2021 21:44:08 - INFO - __main__ - Step 46907: {'lr': 0.0003947654959704435, 'samples': 9006144, 'steps': 46906, 'loss/train': 1.8336222171783447} -08/30/2021 21:44:08 - INFO - __main__ - Step 46908: {'lr': 0.00039476116943661544, 'samples': 9006336, 'steps': 46907, 'loss/train': 1.141404390335083} -08/30/2021 21:44:09 - INFO - __main__ - Step 46909: {'lr': 0.00039475684283756007, 'samples': 9006528, 'steps': 46908, 'loss/train': 0.9881564378738403} -08/30/2021 21:44:09 - INFO - __main__ - Step 46910: {'lr': 0.0003947525161732797, 'samples': 9006720, 'steps': 46909, 'loss/train': 1.0977205038070679} -08/30/2021 21:44:09 - INFO - __main__ - Step 46911: {'lr': 0.0003947481894437759, 'samples': 9006912, 'steps': 46910, 'loss/train': 1.8670387268066406} -08/30/2021 21:44:11 - INFO - __main__ - Step 46912: {'lr': 0.0003947438626490508, 'samples': 9007104, 'steps': 46911, 'loss/train': 1.5186539888381958} -08/30/2021 21:44:11 - INFO - __main__ - Step 46913: {'lr': 0.0003947395357891064, 'samples': 9007296, 'steps': 46912, 'loss/train': 1.1929248571395874} -08/30/2021 21:44:12 - INFO - __main__ - Step 46914: {'lr': 0.00039473520886394465, 'samples': 9007488, 'steps': 46913, 'loss/train': 1.3482972383499146} -08/30/2021 21:44:12 - INFO - __main__ - Step 46915: {'lr': 0.00039473088187356737, 'samples': 9007680, 'steps': 46914, 'loss/train': 3.0119411945343018} -08/30/2021 21:44:12 - INFO - __main__ - Step 46916: {'lr': 0.0003947265548179766, 'samples': 9007872, 'steps': 46915, 'loss/train': 1.7715628147125244} -08/30/2021 21:44:13 - INFO - __main__ - Step 46917: {'lr': 0.00039472222769717434, 'samples': 9008064, 'steps': 46916, 'loss/train': 1.0797874927520752} -08/30/2021 21:44:14 - INFO - __main__ - Step 46918: {'lr': 0.00039471790051116243, 'samples': 9008256, 'steps': 46917, 'loss/train': 1.1832444667816162} -08/30/2021 21:44:15 - INFO - __main__ - Step 46919: {'lr': 0.0003947135732599428, 'samples': 9008448, 'steps': 46918, 'loss/train': 1.14852774143219} -08/30/2021 21:44:15 - INFO - __main__ - Step 46920: {'lr': 0.0003947092459435176, 'samples': 9008640, 'steps': 46919, 'loss/train': 1.499640703201294} -08/30/2021 21:44:16 - INFO - __main__ - Step 46921: {'lr': 0.0003947049185618886, 'samples': 9008832, 'steps': 46920, 'loss/train': 1.3729298114776611} -08/30/2021 21:44:16 - INFO - __main__ - Step 46922: {'lr': 0.0003947005911150577, 'samples': 9009024, 'steps': 46921, 'loss/train': 0.9926202297210693} -08/30/2021 21:44:16 - INFO - __main__ - Step 46923: {'lr': 0.0003946962636030271, 'samples': 9009216, 'steps': 46922, 'loss/train': 1.3934400081634521} -08/30/2021 21:44:18 - INFO - __main__ - Step 46924: {'lr': 0.00039469193602579856, 'samples': 9009408, 'steps': 46923, 'loss/train': 1.8092750310897827} -08/30/2021 21:44:18 - INFO - __main__ - Step 46925: {'lr': 0.000394687608383374, 'samples': 9009600, 'steps': 46924, 'loss/train': 0.7849079966545105} -08/30/2021 21:44:19 - INFO - __main__ - Step 46926: {'lr': 0.0003946832806757554, 'samples': 9009792, 'steps': 46925, 'loss/train': 2.220301866531372} -08/30/2021 21:44:19 - INFO - __main__ - Step 46927: {'lr': 0.00039467895290294484, 'samples': 9009984, 'steps': 46926, 'loss/train': 1.5471405982971191} -08/30/2021 21:44:19 - INFO - __main__ - Step 46928: {'lr': 0.00039467462506494416, 'samples': 9010176, 'steps': 46927, 'loss/train': 1.6559935808181763} -08/30/2021 21:44:21 - INFO - __main__ - Step 46929: {'lr': 0.0003946702971617553, 'samples': 9010368, 'steps': 46928, 'loss/train': 1.1120922565460205} -08/30/2021 21:44:21 - INFO - __main__ - Step 46930: {'lr': 0.00039466596919338027, 'samples': 9010560, 'steps': 46929, 'loss/train': 1.6416133642196655} -08/30/2021 21:44:22 - INFO - __main__ - Step 46931: {'lr': 0.000394661641159821, 'samples': 9010752, 'steps': 46930, 'loss/train': 1.5514638423919678} -08/30/2021 21:44:22 - INFO - __main__ - Step 46932: {'lr': 0.00039465731306107937, 'samples': 9010944, 'steps': 46931, 'loss/train': 1.6745285987854004} -08/30/2021 21:44:22 - INFO - __main__ - Step 46933: {'lr': 0.0003946529848971574, 'samples': 9011136, 'steps': 46932, 'loss/train': 1.6818374395370483} -08/30/2021 21:44:24 - INFO - __main__ - Step 46934: {'lr': 0.00039464865666805706, 'samples': 9011328, 'steps': 46933, 'loss/train': 1.267052412033081} -08/30/2021 21:44:25 - INFO - __main__ - Step 46935: {'lr': 0.00039464432837378025, 'samples': 9011520, 'steps': 46934, 'loss/train': 1.4714409112930298} -08/30/2021 21:44:25 - INFO - __main__ - Step 46936: {'lr': 0.0003946400000143289, 'samples': 9011712, 'steps': 46935, 'loss/train': 1.5869170427322388} -08/30/2021 21:44:25 - INFO - __main__ - Step 46937: {'lr': 0.000394635671589705, 'samples': 9011904, 'steps': 46936, 'loss/train': 1.4760212898254395} -08/30/2021 21:44:26 - INFO - __main__ - Step 46938: {'lr': 0.0003946313430999106, 'samples': 9012096, 'steps': 46937, 'loss/train': 1.5378096103668213} -08/30/2021 21:44:28 - INFO - __main__ - Step 46939: {'lr': 0.0003946270145449475, 'samples': 9012288, 'steps': 46938, 'loss/train': 1.1220684051513672} -08/30/2021 21:44:28 - INFO - __main__ - Step 46940: {'lr': 0.00039462268592481767, 'samples': 9012480, 'steps': 46939, 'loss/train': 1.6197477579116821} -08/30/2021 21:44:28 - INFO - __main__ - Step 46941: {'lr': 0.00039461835723952313, 'samples': 9012672, 'steps': 46940, 'loss/train': 1.4468624591827393} -08/30/2021 21:44:29 - INFO - __main__ - Step 46942: {'lr': 0.0003946140284890657, 'samples': 9012864, 'steps': 46941, 'loss/train': 2.260392189025879} -08/30/2021 21:44:29 - INFO - __main__ - Step 46943: {'lr': 0.0003946096996734475, 'samples': 9013056, 'steps': 46942, 'loss/train': 1.5174592733383179} -08/30/2021 21:44:31 - INFO - __main__ - Step 46944: {'lr': 0.00039460537079267035, 'samples': 9013248, 'steps': 46943, 'loss/train': 1.016710638999939} -08/30/2021 21:44:32 - INFO - __main__ - Step 46945: {'lr': 0.00039460104184673627, 'samples': 9013440, 'steps': 46944, 'loss/train': 0.7979376912117004} -08/30/2021 21:44:32 - INFO - __main__ - Step 46946: {'lr': 0.00039459671283564727, 'samples': 9013632, 'steps': 46945, 'loss/train': 1.6598806381225586} -08/30/2021 21:44:32 - INFO - __main__ - Step 46947: {'lr': 0.0003945923837594051, 'samples': 9013824, 'steps': 46946, 'loss/train': 0.9393380284309387} -08/30/2021 21:44:33 - INFO - __main__ - Step 46948: {'lr': 0.0003945880546180119, 'samples': 9014016, 'steps': 46947, 'loss/train': 1.2374600172042847} -08/30/2021 21:44:33 - INFO - __main__ - Step 46949: {'lr': 0.00039458372541146955, 'samples': 9014208, 'steps': 46948, 'loss/train': 1.5660732984542847} -08/30/2021 21:44:35 - INFO - __main__ - Step 46950: {'lr': 0.00039457939613978, 'samples': 9014400, 'steps': 46949, 'loss/train': 1.7887295484542847} -08/30/2021 21:44:35 - INFO - __main__ - Step 46951: {'lr': 0.0003945750668029452, 'samples': 9014592, 'steps': 46950, 'loss/train': 1.6144603490829468} -08/30/2021 21:44:35 - INFO - __main__ - Step 46952: {'lr': 0.0003945707374009671, 'samples': 9014784, 'steps': 46951, 'loss/train': 1.471245527267456} -08/30/2021 21:44:36 - INFO - __main__ - Step 46953: {'lr': 0.0003945664079338477, 'samples': 9014976, 'steps': 46952, 'loss/train': 2.249976873397827} -08/30/2021 21:44:36 - INFO - __main__ - Step 46954: {'lr': 0.0003945620784015888, 'samples': 9015168, 'steps': 46953, 'loss/train': 1.4158796072006226} -08/30/2021 21:44:38 - INFO - __main__ - Step 46955: {'lr': 0.00039455774880419256, 'samples': 9015360, 'steps': 46954, 'loss/train': 1.712270736694336} -08/30/2021 21:44:38 - INFO - __main__ - Step 46956: {'lr': 0.00039455341914166074, 'samples': 9015552, 'steps': 46955, 'loss/train': 1.4940677881240845} -08/30/2021 21:44:38 - INFO - __main__ - Step 46957: {'lr': 0.0003945490894139955, 'samples': 9015744, 'steps': 46956, 'loss/train': 1.315157413482666} -08/30/2021 21:44:39 - INFO - __main__ - Step 46958: {'lr': 0.0003945447596211986, 'samples': 9015936, 'steps': 46957, 'loss/train': 1.2470693588256836} -08/30/2021 21:44:39 - INFO - __main__ - Step 46959: {'lr': 0.0003945404297632721, 'samples': 9016128, 'steps': 46958, 'loss/train': 1.544315218925476} -08/30/2021 21:44:41 - INFO - __main__ - Step 46960: {'lr': 0.00039453609984021787, 'samples': 9016320, 'steps': 46959, 'loss/train': 1.6414031982421875} -08/30/2021 21:44:41 - INFO - __main__ - Step 46961: {'lr': 0.00039453176985203785, 'samples': 9016512, 'steps': 46960, 'loss/train': 1.4637598991394043} -08/30/2021 21:44:41 - INFO - __main__ - Step 46962: {'lr': 0.0003945274397987342, 'samples': 9016704, 'steps': 46961, 'loss/train': 1.4995415210723877} -08/30/2021 21:44:42 - INFO - __main__ - Step 46963: {'lr': 0.0003945231096803086, 'samples': 9016896, 'steps': 46962, 'loss/train': 0.4901764988899231} -08/30/2021 21:44:42 - INFO - __main__ - Step 46964: {'lr': 0.0003945187794967632, 'samples': 9017088, 'steps': 46963, 'loss/train': 1.1779558658599854} -08/30/2021 21:44:43 - INFO - __main__ - Step 46965: {'lr': 0.00039451444924809976, 'samples': 9017280, 'steps': 46964, 'loss/train': 1.3195405006408691} -08/30/2021 21:44:44 - INFO - __main__ - Step 46966: {'lr': 0.0003945101189343204, 'samples': 9017472, 'steps': 46965, 'loss/train': 0.8720847964286804} -08/30/2021 21:44:44 - INFO - __main__ - Step 46967: {'lr': 0.000394505788555427, 'samples': 9017664, 'steps': 46966, 'loss/train': 1.677130103111267} -08/30/2021 21:44:45 - INFO - __main__ - Step 46968: {'lr': 0.0003945014581114215, 'samples': 9017856, 'steps': 46967, 'loss/train': 1.6841708421707153} -08/30/2021 21:44:45 - INFO - __main__ - Step 46969: {'lr': 0.00039449712760230584, 'samples': 9018048, 'steps': 46968, 'loss/train': 1.2529847621917725} -08/30/2021 21:44:47 - INFO - __main__ - Step 46970: {'lr': 0.0003944927970280821, 'samples': 9018240, 'steps': 46969, 'loss/train': 1.7225449085235596} -08/30/2021 21:44:47 - INFO - __main__ - Step 46971: {'lr': 0.00039448846638875213, 'samples': 9018432, 'steps': 46970, 'loss/train': 1.5357646942138672} -08/30/2021 21:44:47 - INFO - __main__ - Step 46972: {'lr': 0.00039448413568431785, 'samples': 9018624, 'steps': 46971, 'loss/train': 1.1177994012832642} -08/30/2021 21:44:48 - INFO - __main__ - Step 46973: {'lr': 0.0003944798049147812, 'samples': 9018816, 'steps': 46972, 'loss/train': 1.3170790672302246} -08/30/2021 21:44:48 - INFO - __main__ - Step 46974: {'lr': 0.00039447547408014426, 'samples': 9019008, 'steps': 46973, 'loss/train': 1.2802783250808716} -08/30/2021 21:44:48 - INFO - __main__ - Step 46975: {'lr': 0.00039447114318040885, 'samples': 9019200, 'steps': 46974, 'loss/train': 1.9557400941848755} -08/30/2021 21:44:50 - INFO - __main__ - Step 46976: {'lr': 0.000394466812215577, 'samples': 9019392, 'steps': 46975, 'loss/train': 2.048022985458374} -08/30/2021 21:44:50 - INFO - __main__ - Step 46977: {'lr': 0.0003944624811856506, 'samples': 9019584, 'steps': 46976, 'loss/train': 1.5928115844726562} -08/30/2021 21:44:51 - INFO - __main__ - Step 46978: {'lr': 0.0003944581500906317, 'samples': 9019776, 'steps': 46977, 'loss/train': 1.9153282642364502} -08/30/2021 21:44:51 - INFO - __main__ - Step 46979: {'lr': 0.00039445381893052215, 'samples': 9019968, 'steps': 46978, 'loss/train': 3.6052839756011963} -08/30/2021 21:44:51 - INFO - __main__ - Step 46980: {'lr': 0.0003944494877053239, 'samples': 9020160, 'steps': 46979, 'loss/train': 1.5440027713775635} -08/30/2021 21:44:53 - INFO - __main__ - Step 46981: {'lr': 0.00039444515641503896, 'samples': 9020352, 'steps': 46980, 'loss/train': 1.8482164144515991} -08/30/2021 21:44:53 - INFO - __main__ - Step 46982: {'lr': 0.00039444082505966926, 'samples': 9020544, 'steps': 46981, 'loss/train': 1.3363295793533325} -08/30/2021 21:44:54 - INFO - __main__ - Step 46983: {'lr': 0.0003944364936392168, 'samples': 9020736, 'steps': 46982, 'loss/train': 1.784623384475708} -08/30/2021 21:44:54 - INFO - __main__ - Step 46984: {'lr': 0.0003944321621536835, 'samples': 9020928, 'steps': 46983, 'loss/train': 1.76750910282135} -08/30/2021 21:44:54 - INFO - __main__ - Step 46985: {'lr': 0.00039442783060307117, 'samples': 9021120, 'steps': 46984, 'loss/train': 1.5290135145187378} -08/30/2021 21:44:55 - INFO - __main__ - Step 46986: {'lr': 0.00039442349898738204, 'samples': 9021312, 'steps': 46985, 'loss/train': 1.8976329565048218} -08/30/2021 21:44:56 - INFO - __main__ - Step 46987: {'lr': 0.0003944191673066178, 'samples': 9021504, 'steps': 46986, 'loss/train': 1.7026069164276123} -08/30/2021 21:44:57 - INFO - __main__ - Step 46988: {'lr': 0.00039441483556078055, 'samples': 9021696, 'steps': 46987, 'loss/train': 1.8321424722671509} -08/30/2021 21:44:57 - INFO - __main__ - Step 46989: {'lr': 0.0003944105037498722, 'samples': 9021888, 'steps': 46988, 'loss/train': 0.8016990423202515} -08/30/2021 21:44:57 - INFO - __main__ - Step 46990: {'lr': 0.0003944061718738947, 'samples': 9022080, 'steps': 46989, 'loss/train': 1.5196932554244995} -08/30/2021 21:44:58 - INFO - __main__ - Step 46991: {'lr': 0.00039440183993285006, 'samples': 9022272, 'steps': 46990, 'loss/train': 1.5645670890808105} -08/30/2021 21:44:59 - INFO - __main__ - Step 46992: {'lr': 0.0003943975079267401, 'samples': 9022464, 'steps': 46991, 'loss/train': 1.1234192848205566} -08/30/2021 21:45:00 - INFO - __main__ - Step 46993: {'lr': 0.0003943931758555669, 'samples': 9022656, 'steps': 46992, 'loss/train': 0.9302326440811157} -08/30/2021 21:45:00 - INFO - __main__ - Step 46994: {'lr': 0.0003943888437193324, 'samples': 9022848, 'steps': 46993, 'loss/train': 1.0642530918121338} -08/30/2021 21:45:01 - INFO - __main__ - Step 46995: {'lr': 0.00039438451151803844, 'samples': 9023040, 'steps': 46994, 'loss/train': 1.7438215017318726} -08/30/2021 21:45:01 - INFO - __main__ - Step 46996: {'lr': 0.000394380179251687, 'samples': 9023232, 'steps': 46995, 'loss/train': 2.1431987285614014} -08/30/2021 21:45:03 - INFO - __main__ - Step 46997: {'lr': 0.0003943758469202802, 'samples': 9023424, 'steps': 46996, 'loss/train': 1.2174314260482788} -08/30/2021 21:45:03 - INFO - __main__ - Step 46998: {'lr': 0.0003943715145238198, 'samples': 9023616, 'steps': 46997, 'loss/train': 1.0514683723449707} -08/30/2021 21:45:04 - INFO - __main__ - Step 46999: {'lr': 0.00039436718206230795, 'samples': 9023808, 'steps': 46998, 'loss/train': 1.1923924684524536} -08/30/2021 21:45:04 - INFO - __main__ - Step 47000: {'lr': 0.0003943628495357463, 'samples': 9024000, 'steps': 46999, 'loss/train': 0.7480464577674866} -08/30/2021 21:45:04 - INFO - __main__ - Step 47001: {'lr': 0.00039435851694413705, 'samples': 9024192, 'steps': 47000, 'loss/train': 1.3538702726364136} -08/30/2021 21:45:06 - INFO - __main__ - Step 47002: {'lr': 0.00039435418428748206, 'samples': 9024384, 'steps': 47001, 'loss/train': 1.1366056203842163} -08/30/2021 21:45:06 - INFO - __main__ - Step 47003: {'lr': 0.00039434985156578333, 'samples': 9024576, 'steps': 47002, 'loss/train': 1.3417569398880005} -08/30/2021 21:45:07 - INFO - __main__ - Step 47004: {'lr': 0.0003943455187790428, 'samples': 9024768, 'steps': 47003, 'loss/train': 1.371974229812622} -08/30/2021 21:45:07 - INFO - __main__ - Step 47005: {'lr': 0.0003943411859272624, 'samples': 9024960, 'steps': 47004, 'loss/train': 1.052565574645996} -08/30/2021 21:45:07 - INFO - __main__ - Step 47006: {'lr': 0.0003943368530104441, 'samples': 9025152, 'steps': 47005, 'loss/train': 1.609918475151062} -08/30/2021 21:45:09 - INFO - __main__ - Step 47007: {'lr': 0.00039433252002858975, 'samples': 9025344, 'steps': 47006, 'loss/train': 1.7140456438064575} -08/30/2021 21:45:09 - INFO - __main__ - Step 47008: {'lr': 0.0003943281869817015, 'samples': 9025536, 'steps': 47007, 'loss/train': 1.5079469680786133} -08/30/2021 21:45:10 - INFO - __main__ - Step 47009: {'lr': 0.0003943238538697811, 'samples': 9025728, 'steps': 47008, 'loss/train': 1.6488761901855469} -08/30/2021 21:45:10 - INFO - __main__ - Step 47010: {'lr': 0.00039431952069283067, 'samples': 9025920, 'steps': 47009, 'loss/train': 1.4270639419555664} -08/30/2021 21:45:10 - INFO - __main__ - Step 47011: {'lr': 0.00039431518745085205, 'samples': 9026112, 'steps': 47010, 'loss/train': 1.5178182125091553} -08/30/2021 21:45:11 - INFO - __main__ - Step 47012: {'lr': 0.00039431085414384727, 'samples': 9026304, 'steps': 47011, 'loss/train': 0.6716890335083008} -08/30/2021 21:45:13 - INFO - __main__ - Step 47013: {'lr': 0.0003943065207718182, 'samples': 9026496, 'steps': 47012, 'loss/train': 1.6696041822433472} -08/30/2021 21:45:13 - INFO - __main__ - Step 47014: {'lr': 0.0003943021873347669, 'samples': 9026688, 'steps': 47013, 'loss/train': 1.5473829507827759} -08/30/2021 21:45:13 - INFO - __main__ - Step 47015: {'lr': 0.00039429785383269524, 'samples': 9026880, 'steps': 47014, 'loss/train': 2.9138872623443604} -08/30/2021 21:45:14 - INFO - __main__ - Step 47016: {'lr': 0.00039429352026560516, 'samples': 9027072, 'steps': 47015, 'loss/train': 1.1713416576385498} -08/30/2021 21:45:14 - INFO - __main__ - Step 47017: {'lr': 0.0003942891866334987, 'samples': 9027264, 'steps': 47016, 'loss/train': 1.0460469722747803} -08/30/2021 21:45:16 - INFO - __main__ - Step 47018: {'lr': 0.00039428485293637773, 'samples': 9027456, 'steps': 47017, 'loss/train': 1.8020797967910767} -08/30/2021 21:45:16 - INFO - __main__ - Step 47019: {'lr': 0.00039428051917424423, 'samples': 9027648, 'steps': 47018, 'loss/train': 1.086907982826233} -08/30/2021 21:45:17 - INFO - __main__ - Step 47020: {'lr': 0.0003942761853471002, 'samples': 9027840, 'steps': 47019, 'loss/train': 1.6968697309494019} -08/30/2021 21:45:17 - INFO - __main__ - Step 47021: {'lr': 0.0003942718514549475, 'samples': 9028032, 'steps': 47020, 'loss/train': 1.5713204145431519} -08/30/2021 21:45:17 - INFO - __main__ - Step 47022: {'lr': 0.0003942675174977881, 'samples': 9028224, 'steps': 47021, 'loss/train': 1.4160035848617554} -08/30/2021 21:45:19 - INFO - __main__ - Step 47023: {'lr': 0.000394263183475624, 'samples': 9028416, 'steps': 47022, 'loss/train': 0.7884634733200073} -08/30/2021 21:45:20 - INFO - __main__ - Step 47024: {'lr': 0.0003942588493884571, 'samples': 9028608, 'steps': 47023, 'loss/train': 1.5771461725234985} -08/30/2021 21:45:20 - INFO - __main__ - Step 47025: {'lr': 0.00039425451523628953, 'samples': 9028800, 'steps': 47024, 'loss/train': 1.2272441387176514} -08/30/2021 21:45:20 - INFO - __main__ - Step 47026: {'lr': 0.00039425018101912305, 'samples': 9028992, 'steps': 47025, 'loss/train': 1.5435431003570557} -08/30/2021 21:45:21 - INFO - __main__ - Step 47027: {'lr': 0.00039424584673695956, 'samples': 9029184, 'steps': 47026, 'loss/train': 1.3484901189804077} -08/30/2021 21:45:21 - INFO - __main__ - Step 47028: {'lr': 0.0003942415123898012, 'samples': 9029376, 'steps': 47027, 'loss/train': 0.33479100465774536} -08/30/2021 21:45:23 - INFO - __main__ - Step 47029: {'lr': 0.0003942371779776498, 'samples': 9029568, 'steps': 47028, 'loss/train': 1.252678632736206} -08/30/2021 21:45:23 - INFO - __main__ - Step 47030: {'lr': 0.00039423284350050735, 'samples': 9029760, 'steps': 47029, 'loss/train': 1.354400873184204} -08/30/2021 21:45:24 - INFO - __main__ - Step 47031: {'lr': 0.0003942285089583759, 'samples': 9029952, 'steps': 47030, 'loss/train': 1.5203813314437866} -08/30/2021 21:45:24 - INFO - __main__ - Step 47032: {'lr': 0.0003942241743512572, 'samples': 9030144, 'steps': 47031, 'loss/train': 1.0415359735488892} -08/30/2021 21:45:24 - INFO - __main__ - Step 47033: {'lr': 0.00039421983967915337, 'samples': 9030336, 'steps': 47032, 'loss/train': 1.2102928161621094} -08/30/2021 21:45:26 - INFO - __main__ - Step 47034: {'lr': 0.00039421550494206625, 'samples': 9030528, 'steps': 47033, 'loss/train': 0.6218977570533752} -08/30/2021 21:45:26 - INFO - __main__ - Step 47035: {'lr': 0.0003942111701399979, 'samples': 9030720, 'steps': 47034, 'loss/train': 1.8368933200836182} -08/30/2021 21:45:27 - INFO - __main__ - Step 47036: {'lr': 0.0003942068352729502, 'samples': 9030912, 'steps': 47035, 'loss/train': 1.4152131080627441} -08/30/2021 21:45:27 - INFO - __main__ - Step 47037: {'lr': 0.0003942025003409252, 'samples': 9031104, 'steps': 47036, 'loss/train': 1.9444457292556763} -08/30/2021 21:45:28 - INFO - __main__ - Step 47038: {'lr': 0.0003941981653439247, 'samples': 9031296, 'steps': 47037, 'loss/train': 1.0517847537994385} -08/30/2021 21:45:29 - INFO - __main__ - Step 47039: {'lr': 0.00039419383028195076, 'samples': 9031488, 'steps': 47038, 'loss/train': 1.2911107540130615} -08/30/2021 21:45:30 - INFO - __main__ - Step 47040: {'lr': 0.00039418949515500524, 'samples': 9031680, 'steps': 47039, 'loss/train': 1.6040315628051758} -08/30/2021 21:45:30 - INFO - __main__ - Step 47041: {'lr': 0.0003941851599630902, 'samples': 9031872, 'steps': 47040, 'loss/train': 1.6276823282241821} -08/30/2021 21:45:30 - INFO - __main__ - Step 47042: {'lr': 0.00039418082470620756, 'samples': 9032064, 'steps': 47041, 'loss/train': 0.8975918889045715} -08/30/2021 21:45:31 - INFO - __main__ - Step 47043: {'lr': 0.0003941764893843593, 'samples': 9032256, 'steps': 47042, 'loss/train': 1.4319145679473877} -08/30/2021 21:45:32 - INFO - __main__ - Step 47044: {'lr': 0.0003941721539975473, 'samples': 9032448, 'steps': 47043, 'loss/train': 1.940021276473999} -08/30/2021 21:45:33 - INFO - __main__ - Step 47045: {'lr': 0.0003941678185457736, 'samples': 9032640, 'steps': 47044, 'loss/train': 1.6918425559997559} -08/30/2021 21:45:33 - INFO - __main__ - Step 47046: {'lr': 0.00039416348302904005, 'samples': 9032832, 'steps': 47045, 'loss/train': 1.6045674085617065} -08/30/2021 21:45:34 - INFO - __main__ - Step 47047: {'lr': 0.0003941591474473487, 'samples': 9033024, 'steps': 47046, 'loss/train': 1.2545980215072632} -08/30/2021 21:45:34 - INFO - __main__ - Step 47048: {'lr': 0.0003941548118007014, 'samples': 9033216, 'steps': 47047, 'loss/train': 0.8215344548225403} -08/30/2021 21:45:36 - INFO - __main__ - Step 47049: {'lr': 0.00039415047608910023, 'samples': 9033408, 'steps': 47048, 'loss/train': 0.1027296856045723} -08/30/2021 21:45:36 - INFO - __main__ - Step 47050: {'lr': 0.000394146140312547, 'samples': 9033600, 'steps': 47049, 'loss/train': 0.8259753584861755} -08/30/2021 21:45:37 - INFO - __main__ - Step 47051: {'lr': 0.0003941418044710438, 'samples': 9033792, 'steps': 47050, 'loss/train': 1.8476759195327759} -08/30/2021 21:45:37 - INFO - __main__ - Step 47052: {'lr': 0.00039413746856459253, 'samples': 9033984, 'steps': 47051, 'loss/train': 1.7540653944015503} -08/30/2021 21:45:37 - INFO - __main__ - Step 47053: {'lr': 0.0003941331325931952, 'samples': 9034176, 'steps': 47052, 'loss/train': 1.3884731531143188} -08/30/2021 21:45:38 - INFO - __main__ - Step 47054: {'lr': 0.0003941287965568536, 'samples': 9034368, 'steps': 47053, 'loss/train': 0.5963377952575684} -08/30/2021 21:45:39 - INFO - __main__ - Step 47055: {'lr': 0.0003941244604555698, 'samples': 9034560, 'steps': 47054, 'loss/train': 1.5608035326004028} -08/30/2021 21:45:39 - INFO - __main__ - Step 47056: {'lr': 0.0003941201242893457, 'samples': 9034752, 'steps': 47055, 'loss/train': 0.8580886721611023} -08/30/2021 21:45:40 - INFO - __main__ - Step 47057: {'lr': 0.00039411578805818344, 'samples': 9034944, 'steps': 47056, 'loss/train': 1.5278757810592651} -08/30/2021 21:45:40 - INFO - __main__ - Step 47058: {'lr': 0.00039411145176208477, 'samples': 9035136, 'steps': 47057, 'loss/train': 1.5152755975723267} -08/30/2021 21:45:41 - INFO - __main__ - Step 47059: {'lr': 0.0003941071154010517, 'samples': 9035328, 'steps': 47058, 'loss/train': 1.2857751846313477} -08/30/2021 21:45:42 - INFO - __main__ - Step 47060: {'lr': 0.00039410277897508617, 'samples': 9035520, 'steps': 47059, 'loss/train': 1.3531262874603271} -08/30/2021 21:45:43 - INFO - __main__ - Step 47061: {'lr': 0.00039409844248419014, 'samples': 9035712, 'steps': 47060, 'loss/train': 1.585766315460205} -08/30/2021 21:45:43 - INFO - __main__ - Step 47062: {'lr': 0.0003940941059283656, 'samples': 9035904, 'steps': 47061, 'loss/train': 1.4567688703536987} -08/30/2021 21:45:43 - INFO - __main__ - Step 47063: {'lr': 0.00039408976930761444, 'samples': 9036096, 'steps': 47062, 'loss/train': 1.182168960571289} -08/30/2021 21:45:44 - INFO - __main__ - Step 47064: {'lr': 0.00039408543262193867, 'samples': 9036288, 'steps': 47063, 'loss/train': 1.4591920375823975} -08/30/2021 21:45:45 - INFO - __main__ - Step 47065: {'lr': 0.00039408109587134034, 'samples': 9036480, 'steps': 47064, 'loss/train': 1.959205985069275} -08/30/2021 21:45:46 - INFO - __main__ - Step 47066: {'lr': 0.00039407675905582117, 'samples': 9036672, 'steps': 47065, 'loss/train': 1.7146639823913574} -08/30/2021 21:45:46 - INFO - __main__ - Step 47067: {'lr': 0.00039407242217538317, 'samples': 9036864, 'steps': 47066, 'loss/train': 1.0863569974899292} -08/30/2021 21:45:46 - INFO - __main__ - Step 47068: {'lr': 0.0003940680852300285, 'samples': 9037056, 'steps': 47067, 'loss/train': 1.4741212129592896} -08/30/2021 21:45:47 - INFO - __main__ - Step 47069: {'lr': 0.00039406374821975893, 'samples': 9037248, 'steps': 47068, 'loss/train': 1.7408515214920044} -08/30/2021 21:45:48 - INFO - __main__ - Step 47070: {'lr': 0.00039405941114457644, 'samples': 9037440, 'steps': 47069, 'loss/train': 1.5101934671401978} -08/30/2021 21:45:49 - INFO - __main__ - Step 47071: {'lr': 0.000394055074004483, 'samples': 9037632, 'steps': 47070, 'loss/train': 1.4572372436523438} -08/30/2021 21:45:49 - INFO - __main__ - Step 47072: {'lr': 0.0003940507367994806, 'samples': 9037824, 'steps': 47071, 'loss/train': 1.3657548427581787} -08/30/2021 21:45:50 - INFO - __main__ - Step 47073: {'lr': 0.00039404639952957116, 'samples': 9038016, 'steps': 47072, 'loss/train': 0.06788039952516556} -08/30/2021 21:45:50 - INFO - __main__ - Step 47074: {'lr': 0.00039404206219475655, 'samples': 9038208, 'steps': 47073, 'loss/train': 0.8680133819580078} -08/30/2021 21:45:50 - INFO - __main__ - Step 47075: {'lr': 0.00039403772479503895, 'samples': 9038400, 'steps': 47074, 'loss/train': 1.4910752773284912} -08/30/2021 21:45:52 - INFO - __main__ - Step 47076: {'lr': 0.0003940333873304201, 'samples': 9038592, 'steps': 47075, 'loss/train': 4.312713623046875} -08/30/2021 21:45:52 - INFO - __main__ - Step 47077: {'lr': 0.000394029049800902, 'samples': 9038784, 'steps': 47076, 'loss/train': 1.2238141298294067} -08/30/2021 21:45:53 - INFO - __main__ - Step 47078: {'lr': 0.00039402471220648675, 'samples': 9038976, 'steps': 47077, 'loss/train': 1.933716893196106} -08/30/2021 21:45:53 - INFO - __main__ - Step 47079: {'lr': 0.000394020374547176, 'samples': 9039168, 'steps': 47078, 'loss/train': 1.262068748474121} -08/30/2021 21:45:53 - INFO - __main__ - Step 47080: {'lr': 0.00039401603682297204, 'samples': 9039360, 'steps': 47079, 'loss/train': 1.51416015625} -08/30/2021 21:45:55 - INFO - __main__ - Step 47081: {'lr': 0.0003940116990338766, 'samples': 9039552, 'steps': 47080, 'loss/train': 2.1935997009277344} -08/30/2021 21:45:56 - INFO - __main__ - Step 47082: {'lr': 0.00039400736117989175, 'samples': 9039744, 'steps': 47081, 'loss/train': 1.6061735153198242} -08/30/2021 21:45:56 - INFO - __main__ - Step 47083: {'lr': 0.0003940030232610194, 'samples': 9039936, 'steps': 47082, 'loss/train': 1.4907827377319336} -08/30/2021 21:45:57 - INFO - __main__ - Step 47084: {'lr': 0.0003939986852772615, 'samples': 9040128, 'steps': 47083, 'loss/train': 1.3143213987350464} -08/30/2021 21:45:57 - INFO - __main__ - Step 47085: {'lr': 0.00039399434722862004, 'samples': 9040320, 'steps': 47084, 'loss/train': 1.3996050357818604} -08/30/2021 21:45:59 - INFO - __main__ - Step 47086: {'lr': 0.00039399000911509685, 'samples': 9040512, 'steps': 47085, 'loss/train': 1.675197958946228} -08/30/2021 21:45:59 - INFO - __main__ - Step 47087: {'lr': 0.00039398567093669413, 'samples': 9040704, 'steps': 47086, 'loss/train': 1.6289172172546387} -08/30/2021 21:46:00 - INFO - __main__ - Step 47088: {'lr': 0.00039398133269341357, 'samples': 9040896, 'steps': 47087, 'loss/train': 0.8133636116981506} -08/30/2021 21:46:00 - INFO - __main__ - Step 47089: {'lr': 0.0003939769943852573, 'samples': 9041088, 'steps': 47088, 'loss/train': 0.26620832085609436} -08/30/2021 21:46:00 - INFO - __main__ - Step 47090: {'lr': 0.0003939726560122272, 'samples': 9041280, 'steps': 47089, 'loss/train': 1.7133350372314453} -08/30/2021 21:46:01 - INFO - __main__ - Step 47091: {'lr': 0.00039396831757432526, 'samples': 9041472, 'steps': 47090, 'loss/train': 2.0110116004943848} -08/30/2021 21:46:02 - INFO - __main__ - Step 47092: {'lr': 0.0003939639790715535, 'samples': 9041664, 'steps': 47091, 'loss/train': 1.6223446130752563} -08/30/2021 21:46:03 - INFO - __main__ - Step 47093: {'lr': 0.0003939596405039136, 'samples': 9041856, 'steps': 47092, 'loss/train': 1.348044514656067} -08/30/2021 21:46:03 - INFO - __main__ - Step 47094: {'lr': 0.00039395530187140784, 'samples': 9042048, 'steps': 47093, 'loss/train': 1.1098629236221313} -08/30/2021 21:46:03 - INFO - __main__ - Step 47095: {'lr': 0.000393950963174038, 'samples': 9042240, 'steps': 47094, 'loss/train': 0.1541656106710434} -08/30/2021 21:46:05 - INFO - __main__ - Step 47096: {'lr': 0.00039394662441180606, 'samples': 9042432, 'steps': 47095, 'loss/train': 1.5069993734359741} -08/30/2021 21:46:05 - INFO - __main__ - Step 47097: {'lr': 0.000393942285584714, 'samples': 9042624, 'steps': 47096, 'loss/train': 1.5107636451721191} -08/30/2021 21:46:06 - INFO - __main__ - Step 47098: {'lr': 0.00039393794669276386, 'samples': 9042816, 'steps': 47097, 'loss/train': 1.9983701705932617} -08/30/2021 21:46:06 - INFO - __main__ - Step 47099: {'lr': 0.00039393360773595744, 'samples': 9043008, 'steps': 47098, 'loss/train': 0.9121749401092529} -08/30/2021 21:46:06 - INFO - __main__ - Step 47100: {'lr': 0.0003939292687142967, 'samples': 9043200, 'steps': 47099, 'loss/train': 1.341982126235962} -08/30/2021 21:46:08 - INFO - __main__ - Step 47101: {'lr': 0.0003939249296277837, 'samples': 9043392, 'steps': 47100, 'loss/train': 1.7498527765274048} -08/30/2021 21:46:08 - INFO - __main__ - Step 47102: {'lr': 0.0003939205904764204, 'samples': 9043584, 'steps': 47101, 'loss/train': 0.6947213411331177} -08/30/2021 21:46:09 - INFO - __main__ - Step 47103: {'lr': 0.00039391625126020856, 'samples': 9043776, 'steps': 47102, 'loss/train': 1.2254722118377686} -08/30/2021 21:46:09 - INFO - __main__ - Step 47104: {'lr': 0.0003939119119791504, 'samples': 9043968, 'steps': 47103, 'loss/train': 1.9305309057235718} -08/30/2021 21:46:09 - INFO - __main__ - Step 47105: {'lr': 0.0003939075726332477, 'samples': 9044160, 'steps': 47104, 'loss/train': 1.6418644189834595} -08/30/2021 21:46:10 - INFO - __main__ - Step 47106: {'lr': 0.00039390323322250253, 'samples': 9044352, 'steps': 47105, 'loss/train': 0.999724805355072} -08/30/2021 21:46:11 - INFO - __main__ - Step 47107: {'lr': 0.0003938988937469168, 'samples': 9044544, 'steps': 47106, 'loss/train': 1.5427132844924927} -08/30/2021 21:46:12 - INFO - __main__ - Step 47108: {'lr': 0.0003938945542064923, 'samples': 9044736, 'steps': 47107, 'loss/train': 1.400425672531128} -08/30/2021 21:46:12 - INFO - __main__ - Step 47109: {'lr': 0.00039389021460123125, 'samples': 9044928, 'steps': 47108, 'loss/train': 1.135919213294983} -08/30/2021 21:46:12 - INFO - __main__ - Step 47110: {'lr': 0.0003938858749311355, 'samples': 9045120, 'steps': 47109, 'loss/train': 1.2661519050598145} -08/30/2021 21:46:13 - INFO - __main__ - Step 47111: {'lr': 0.00039388153519620696, 'samples': 9045312, 'steps': 47110, 'loss/train': 0.6855300664901733} -08/30/2021 21:46:14 - INFO - __main__ - Step 47112: {'lr': 0.0003938771953964476, 'samples': 9045504, 'steps': 47111, 'loss/train': 1.3073887825012207} -08/30/2021 21:46:15 - INFO - __main__ - Step 47113: {'lr': 0.0003938728555318594, 'samples': 9045696, 'steps': 47112, 'loss/train': 1.8746938705444336} -08/30/2021 21:46:15 - INFO - __main__ - Step 47114: {'lr': 0.00039386851560244433, 'samples': 9045888, 'steps': 47113, 'loss/train': 1.8838722705841064} -08/30/2021 21:46:15 - INFO - __main__ - Step 47115: {'lr': 0.0003938641756082043, 'samples': 9046080, 'steps': 47114, 'loss/train': 1.3469740152359009} -08/30/2021 21:46:16 - INFO - __main__ - Step 47116: {'lr': 0.00039385983554914136, 'samples': 9046272, 'steps': 47115, 'loss/train': 1.5194928646087646} -08/30/2021 21:46:17 - INFO - __main__ - Step 47117: {'lr': 0.0003938554954252573, 'samples': 9046464, 'steps': 47116, 'loss/train': 1.3795456886291504} -08/30/2021 21:46:18 - INFO - __main__ - Step 47118: {'lr': 0.00039385115523655426, 'samples': 9046656, 'steps': 47117, 'loss/train': 2.304798126220703} -08/30/2021 21:46:18 - INFO - __main__ - Step 47119: {'lr': 0.00039384681498303407, 'samples': 9046848, 'steps': 47118, 'loss/train': 5.85479211807251} -08/30/2021 21:46:19 - INFO - __main__ - Step 47120: {'lr': 0.0003938424746646988, 'samples': 9047040, 'steps': 47119, 'loss/train': 0.5144325494766235} -08/30/2021 21:46:19 - INFO - __main__ - Step 47121: {'lr': 0.00039383813428155027, 'samples': 9047232, 'steps': 47120, 'loss/train': 1.1317442655563354} -08/30/2021 21:46:19 - INFO - __main__ - Step 47122: {'lr': 0.0003938337938335904, 'samples': 9047424, 'steps': 47121, 'loss/train': 2.2960336208343506} -08/30/2021 21:46:21 - INFO - __main__ - Step 47123: {'lr': 0.00039382945332082136, 'samples': 9047616, 'steps': 47122, 'loss/train': 1.7264989614486694} -08/30/2021 21:46:21 - INFO - __main__ - Step 47124: {'lr': 0.00039382511274324496, 'samples': 9047808, 'steps': 47123, 'loss/train': 1.1836076974868774} -08/30/2021 21:46:22 - INFO - __main__ - Step 47125: {'lr': 0.0003938207721008632, 'samples': 9048000, 'steps': 47124, 'loss/train': 0.16168496012687683} -08/30/2021 21:46:22 - INFO - __main__ - Step 47126: {'lr': 0.00039381643139367806, 'samples': 9048192, 'steps': 47125, 'loss/train': 2.9365546703338623} -08/30/2021 21:46:22 - INFO - __main__ - Step 47127: {'lr': 0.00039381209062169136, 'samples': 9048384, 'steps': 47126, 'loss/train': 1.4645624160766602} -08/30/2021 21:46:23 - INFO - __main__ - Step 47128: {'lr': 0.0003938077497849052, 'samples': 9048576, 'steps': 47127, 'loss/train': 1.6827888488769531} -08/30/2021 21:46:25 - INFO - __main__ - Step 47129: {'lr': 0.00039380340888332143, 'samples': 9048768, 'steps': 47128, 'loss/train': 2.3274762630462646} -08/30/2021 21:46:25 - INFO - __main__ - Step 47130: {'lr': 0.0003937990679169421, 'samples': 9048960, 'steps': 47129, 'loss/train': 1.2184545993804932} -08/30/2021 21:46:26 - INFO - __main__ - Step 47131: {'lr': 0.0003937947268857692, 'samples': 9049152, 'steps': 47130, 'loss/train': 0.9901658296585083} -08/30/2021 21:46:26 - INFO - __main__ - Step 47132: {'lr': 0.00039379038578980454, 'samples': 9049344, 'steps': 47131, 'loss/train': 0.043276507407426834} -08/30/2021 21:46:26 - INFO - __main__ - Step 47133: {'lr': 0.0003937860446290502, 'samples': 9049536, 'steps': 47132, 'loss/train': 1.4290553331375122} -08/30/2021 21:46:27 - INFO - __main__ - Step 47134: {'lr': 0.0003937817034035081, 'samples': 9049728, 'steps': 47133, 'loss/train': 1.8684417009353638} -08/30/2021 21:46:27 - INFO - __main__ - Step 47135: {'lr': 0.00039377736211318004, 'samples': 9049920, 'steps': 47134, 'loss/train': 0.2874923348426819} -08/30/2021 21:46:29 - INFO - __main__ - Step 47136: {'lr': 0.0003937730207580682, 'samples': 9050112, 'steps': 47135, 'loss/train': 0.13769075274467468} -08/30/2021 21:46:30 - INFO - __main__ - Step 47137: {'lr': 0.0003937686793381745, 'samples': 9050304, 'steps': 47136, 'loss/train': 1.4981313943862915} -08/30/2021 21:46:30 - INFO - __main__ - Step 47138: {'lr': 0.0003937643378535009, 'samples': 9050496, 'steps': 47137, 'loss/train': 1.5889283418655396} -08/30/2021 21:46:30 - INFO - __main__ - Step 47139: {'lr': 0.0003937599963040491, 'samples': 9050688, 'steps': 47138, 'loss/train': 1.4682588577270508} -08/30/2021 21:46:31 - INFO - __main__ - Step 47140: {'lr': 0.0003937556546898214, 'samples': 9050880, 'steps': 47139, 'loss/train': 0.18973694741725922} -08/30/2021 21:46:31 - INFO - __main__ - Step 47141: {'lr': 0.0003937513130108197, 'samples': 9051072, 'steps': 47140, 'loss/train': 0.3625023365020752} -08/30/2021 21:46:33 - INFO - __main__ - Step 47142: {'lr': 0.00039374697126704573, 'samples': 9051264, 'steps': 47141, 'loss/train': 1.8720823526382446} -08/30/2021 21:46:33 - INFO - __main__ - Step 47143: {'lr': 0.0003937426294585017, 'samples': 9051456, 'steps': 47142, 'loss/train': 1.1312073469161987} -08/30/2021 21:46:34 - INFO - __main__ - Step 47144: {'lr': 0.00039373828758518936, 'samples': 9051648, 'steps': 47143, 'loss/train': 1.7806357145309448} -08/30/2021 21:46:34 - INFO - __main__ - Step 47145: {'lr': 0.00039373394564711086, 'samples': 9051840, 'steps': 47144, 'loss/train': 1.7965664863586426} -08/30/2021 21:46:34 - INFO - __main__ - Step 47146: {'lr': 0.00039372960364426803, 'samples': 9052032, 'steps': 47145, 'loss/train': 1.4933303594589233} -08/30/2021 21:46:36 - INFO - __main__ - Step 47147: {'lr': 0.0003937252615766628, 'samples': 9052224, 'steps': 47146, 'loss/train': 0.8132494688034058} -08/30/2021 21:46:36 - INFO - __main__ - Step 47148: {'lr': 0.0003937209194442973, 'samples': 9052416, 'steps': 47147, 'loss/train': 1.3352147340774536} -08/30/2021 21:46:37 - INFO - __main__ - Step 47149: {'lr': 0.00039371657724717325, 'samples': 9052608, 'steps': 47148, 'loss/train': 1.5505788326263428} -08/30/2021 21:46:37 - INFO - __main__ - Step 47150: {'lr': 0.0003937122349852928, 'samples': 9052800, 'steps': 47149, 'loss/train': 1.6834405660629272} -08/30/2021 21:46:38 - INFO - __main__ - Step 47151: {'lr': 0.0003937078926586578, 'samples': 9052992, 'steps': 47150, 'loss/train': 1.6427558660507202} -08/30/2021 21:46:39 - INFO - __main__ - Step 47152: {'lr': 0.0003937035502672703, 'samples': 9053184, 'steps': 47151, 'loss/train': 0.958710253238678} -08/30/2021 21:46:39 - INFO - __main__ - Step 47153: {'lr': 0.0003936992078111321, 'samples': 9053376, 'steps': 47152, 'loss/train': 1.375846266746521} -08/30/2021 21:46:40 - INFO - __main__ - Step 47154: {'lr': 0.0003936948652902453, 'samples': 9053568, 'steps': 47153, 'loss/train': 1.597145676612854} -08/30/2021 21:46:40 - INFO - __main__ - Step 47155: {'lr': 0.0003936905227046119, 'samples': 9053760, 'steps': 47154, 'loss/train': 1.5597662925720215} -08/30/2021 21:46:40 - INFO - __main__ - Step 47156: {'lr': 0.00039368618005423365, 'samples': 9053952, 'steps': 47155, 'loss/train': 1.5827739238739014} -08/30/2021 21:46:42 - INFO - __main__ - Step 47157: {'lr': 0.00039368183733911265, 'samples': 9054144, 'steps': 47156, 'loss/train': 1.0623199939727783} -08/30/2021 21:46:43 - INFO - __main__ - Step 47158: {'lr': 0.00039367749455925086, 'samples': 9054336, 'steps': 47157, 'loss/train': 1.1863417625427246} -08/30/2021 21:46:43 - INFO - __main__ - Step 47159: {'lr': 0.0003936731517146502, 'samples': 9054528, 'steps': 47158, 'loss/train': 0.9572000503540039} -08/30/2021 21:46:44 - INFO - __main__ - Step 47160: {'lr': 0.0003936688088053126, 'samples': 9054720, 'steps': 47159, 'loss/train': 0.9539853930473328} -08/30/2021 21:46:44 - INFO - __main__ - Step 47161: {'lr': 0.0003936644658312401, 'samples': 9054912, 'steps': 47160, 'loss/train': 1.5425822734832764} -08/30/2021 21:46:44 - INFO - __main__ - Step 47162: {'lr': 0.0003936601227924346, 'samples': 9055104, 'steps': 47161, 'loss/train': 0.059844743460416794} -08/30/2021 21:46:46 - INFO - __main__ - Step 47163: {'lr': 0.00039365577968889805, 'samples': 9055296, 'steps': 47162, 'loss/train': 1.5637813806533813} -08/30/2021 21:46:46 - INFO - __main__ - Step 47164: {'lr': 0.0003936514365206324, 'samples': 9055488, 'steps': 47163, 'loss/train': 1.7346241474151611} -08/30/2021 21:46:46 - INFO - __main__ - Step 47165: {'lr': 0.00039364709328763966, 'samples': 9055680, 'steps': 47164, 'loss/train': 1.0631160736083984} -08/30/2021 21:46:47 - INFO - __main__ - Step 47166: {'lr': 0.00039364274998992177, 'samples': 9055872, 'steps': 47165, 'loss/train': 1.503037452697754} -08/30/2021 21:46:47 - INFO - __main__ - Step 47167: {'lr': 0.00039363840662748063, 'samples': 9056064, 'steps': 47166, 'loss/train': 1.1738473176956177} -08/30/2021 21:46:49 - INFO - __main__ - Step 47168: {'lr': 0.0003936340632003183, 'samples': 9056256, 'steps': 47167, 'loss/train': 1.3312121629714966} -08/30/2021 21:46:49 - INFO - __main__ - Step 47169: {'lr': 0.0003936297197084366, 'samples': 9056448, 'steps': 47168, 'loss/train': 2.259002685546875} -08/30/2021 21:46:50 - INFO - __main__ - Step 47170: {'lr': 0.00039362537615183764, 'samples': 9056640, 'steps': 47169, 'loss/train': 1.2216168642044067} -08/30/2021 21:46:50 - INFO - __main__ - Step 47171: {'lr': 0.0003936210325305233, 'samples': 9056832, 'steps': 47170, 'loss/train': 0.9417734742164612} -08/30/2021 21:46:50 - INFO - __main__ - Step 47172: {'lr': 0.0003936166888444954, 'samples': 9057024, 'steps': 47171, 'loss/train': 1.0368679761886597} -08/30/2021 21:46:52 - INFO - __main__ - Step 47173: {'lr': 0.0003936123450937562, 'samples': 9057216, 'steps': 47172, 'loss/train': 1.2912726402282715} -08/30/2021 21:46:52 - INFO - __main__ - Step 47174: {'lr': 0.0003936080012783075, 'samples': 9057408, 'steps': 47173, 'loss/train': 1.5052670240402222} -08/30/2021 21:46:53 - INFO - __main__ - Step 47175: {'lr': 0.0003936036573981512, 'samples': 9057600, 'steps': 47174, 'loss/train': 1.4165047407150269} -08/30/2021 21:46:53 - INFO - __main__ - Step 47176: {'lr': 0.00039359931345328927, 'samples': 9057792, 'steps': 47175, 'loss/train': 0.636588990688324} -08/30/2021 21:46:53 - INFO - __main__ - Step 47177: {'lr': 0.0003935949694437237, 'samples': 9057984, 'steps': 47176, 'loss/train': 1.0945026874542236} -08/30/2021 21:46:55 - INFO - __main__ - Step 47178: {'lr': 0.00039359062536945645, 'samples': 9058176, 'steps': 47177, 'loss/train': 1.099445104598999} -08/30/2021 21:46:55 - INFO - __main__ - Step 47179: {'lr': 0.00039358628123048955, 'samples': 9058368, 'steps': 47178, 'loss/train': 1.7694694995880127} -08/30/2021 21:46:56 - INFO - __main__ - Step 47180: {'lr': 0.0003935819370268249, 'samples': 9058560, 'steps': 47179, 'loss/train': 1.023068904876709} -08/30/2021 21:46:56 - INFO - __main__ - Step 47181: {'lr': 0.00039357759275846437, 'samples': 9058752, 'steps': 47180, 'loss/train': 1.374024510383606} -08/30/2021 21:46:56 - INFO - __main__ - Step 47182: {'lr': 0.00039357324842541, 'samples': 9058944, 'steps': 47181, 'loss/train': 1.5039547681808472} -08/30/2021 21:46:58 - INFO - __main__ - Step 47183: {'lr': 0.0003935689040276638, 'samples': 9059136, 'steps': 47182, 'loss/train': 1.2474969625473022} -08/30/2021 21:46:58 - INFO - __main__ - Step 47184: {'lr': 0.0003935645595652276, 'samples': 9059328, 'steps': 47183, 'loss/train': 1.548696756362915} -08/30/2021 21:46:59 - INFO - __main__ - Step 47185: {'lr': 0.0003935602150381034, 'samples': 9059520, 'steps': 47184, 'loss/train': 0.9608526825904846} -08/30/2021 21:46:59 - INFO - __main__ - Step 47186: {'lr': 0.00039355587044629325, 'samples': 9059712, 'steps': 47185, 'loss/train': 1.438480019569397} -08/30/2021 21:46:59 - INFO - __main__ - Step 47187: {'lr': 0.00039355152578979903, 'samples': 9059904, 'steps': 47186, 'loss/train': 1.0906423330307007} -08/30/2021 21:47:00 - INFO - __main__ - Step 47188: {'lr': 0.0003935471810686228, 'samples': 9060096, 'steps': 47187, 'loss/train': 1.8375911712646484} -08/30/2021 21:47:01 - INFO - __main__ - Step 47189: {'lr': 0.0003935428362827662, 'samples': 9060288, 'steps': 47188, 'loss/train': 1.8356000185012817} -08/30/2021 21:47:02 - INFO - __main__ - Step 47190: {'lr': 0.0003935384914322316, 'samples': 9060480, 'steps': 47189, 'loss/train': 1.4232927560806274} -08/30/2021 21:47:02 - INFO - __main__ - Step 47191: {'lr': 0.0003935341465170207, 'samples': 9060672, 'steps': 47190, 'loss/train': 1.9569494724273682} -08/30/2021 21:47:02 - INFO - __main__ - Step 47192: {'lr': 0.0003935298015371355, 'samples': 9060864, 'steps': 47191, 'loss/train': 1.5322213172912598} -08/30/2021 21:47:03 - INFO - __main__ - Step 47193: {'lr': 0.0003935254564925781, 'samples': 9061056, 'steps': 47192, 'loss/train': 0.9357300996780396} -08/30/2021 21:47:05 - INFO - __main__ - Step 47194: {'lr': 0.0003935211113833502, 'samples': 9061248, 'steps': 47193, 'loss/train': 1.6644103527069092} -08/30/2021 21:47:05 - INFO - __main__ - Step 47195: {'lr': 0.00039351676620945396, 'samples': 9061440, 'steps': 47194, 'loss/train': 1.3437191247940063} -08/30/2021 21:47:06 - INFO - __main__ - Step 47196: {'lr': 0.00039351242097089133, 'samples': 9061632, 'steps': 47195, 'loss/train': 1.4233492612838745} -08/30/2021 21:47:06 - INFO - __main__ - Step 47197: {'lr': 0.0003935080756676641, 'samples': 9061824, 'steps': 47196, 'loss/train': 1.3775190114974976} -08/30/2021 21:47:06 - INFO - __main__ - Step 47198: {'lr': 0.0003935037302997745, 'samples': 9062016, 'steps': 47197, 'loss/train': 1.7171847820281982} -08/30/2021 21:47:08 - INFO - __main__ - Step 47199: {'lr': 0.00039349938486722425, 'samples': 9062208, 'steps': 47198, 'loss/train': 1.541567087173462} -08/30/2021 21:47:08 - INFO - __main__ - Step 47200: {'lr': 0.0003934950393700154, 'samples': 9062400, 'steps': 47199, 'loss/train': 1.4359557628631592} -08/30/2021 21:47:09 - INFO - __main__ - Step 47201: {'lr': 0.0003934906938081499, 'samples': 9062592, 'steps': 47200, 'loss/train': 1.3227238655090332} -08/30/2021 21:47:09 - INFO - __main__ - Step 47202: {'lr': 0.0003934863481816297, 'samples': 9062784, 'steps': 47201, 'loss/train': 2.2633533477783203} -08/30/2021 21:47:09 - INFO - __main__ - Step 47203: {'lr': 0.00039348200249045675, 'samples': 9062976, 'steps': 47202, 'loss/train': 2.111750841140747} -08/30/2021 21:47:11 - INFO - __main__ - Step 47204: {'lr': 0.000393477656734633, 'samples': 9063168, 'steps': 47203, 'loss/train': 1.31951904296875} -08/30/2021 21:47:11 - INFO - __main__ - Step 47205: {'lr': 0.0003934733109141605, 'samples': 9063360, 'steps': 47204, 'loss/train': 1.2697341442108154} -08/30/2021 21:47:12 - INFO - __main__ - Step 47206: {'lr': 0.00039346896502904117, 'samples': 9063552, 'steps': 47205, 'loss/train': 1.754895567893982} -08/30/2021 21:47:12 - INFO - __main__ - Step 47207: {'lr': 0.0003934646190792769, 'samples': 9063744, 'steps': 47206, 'loss/train': 1.533581018447876} -08/30/2021 21:47:12 - INFO - __main__ - Step 47208: {'lr': 0.00039346027306486964, 'samples': 9063936, 'steps': 47207, 'loss/train': 1.1768206357955933} -08/30/2021 21:47:14 - INFO - __main__ - Step 47209: {'lr': 0.00039345592698582146, 'samples': 9064128, 'steps': 47208, 'loss/train': 1.5395684242248535} -08/30/2021 21:47:14 - INFO - __main__ - Step 47210: {'lr': 0.00039345158084213417, 'samples': 9064320, 'steps': 47209, 'loss/train': 1.130729079246521} -08/30/2021 21:47:14 - INFO - __main__ - Step 47211: {'lr': 0.0003934472346338099, 'samples': 9064512, 'steps': 47210, 'loss/train': 1.8665534257888794} -08/30/2021 21:47:15 - INFO - __main__ - Step 47212: {'lr': 0.00039344288836085046, 'samples': 9064704, 'steps': 47211, 'loss/train': 0.8307130932807922} -08/30/2021 21:47:15 - INFO - __main__ - Step 47213: {'lr': 0.0003934385420232579, 'samples': 9064896, 'steps': 47212, 'loss/train': 1.6355105638504028} -08/30/2021 21:47:17 - INFO - __main__ - Step 47214: {'lr': 0.0003934341956210341, 'samples': 9065088, 'steps': 47213, 'loss/train': 1.9811102151870728} -08/30/2021 21:47:17 - INFO - __main__ - Step 47215: {'lr': 0.0003934298491541811, 'samples': 9065280, 'steps': 47214, 'loss/train': 0.6664502620697021} -08/30/2021 21:47:17 - INFO - __main__ - Step 47216: {'lr': 0.0003934255026227008, 'samples': 9065472, 'steps': 47215, 'loss/train': 1.1501413583755493} -08/30/2021 21:47:18 - INFO - __main__ - Step 47217: {'lr': 0.0003934211560265952, 'samples': 9065664, 'steps': 47216, 'loss/train': 1.3039368391036987} -08/30/2021 21:47:18 - INFO - __main__ - Step 47218: {'lr': 0.0003934168093658663, 'samples': 9065856, 'steps': 47217, 'loss/train': 1.2305551767349243} -08/30/2021 21:47:19 - INFO - __main__ - Step 47219: {'lr': 0.0003934124626405159, 'samples': 9066048, 'steps': 47218, 'loss/train': 1.9310535192489624} -08/30/2021 21:47:20 - INFO - __main__ - Step 47220: {'lr': 0.00039340811585054615, 'samples': 9066240, 'steps': 47219, 'loss/train': 1.0418373346328735} -08/30/2021 21:47:21 - INFO - __main__ - Step 47221: {'lr': 0.0003934037689959589, 'samples': 9066432, 'steps': 47220, 'loss/train': 0.6557124853134155} -08/30/2021 21:47:21 - INFO - __main__ - Step 47222: {'lr': 0.00039339942207675604, 'samples': 9066624, 'steps': 47221, 'loss/train': 0.11926555633544922} -08/30/2021 21:47:21 - INFO - __main__ - Step 47223: {'lr': 0.0003933950750929397, 'samples': 9066816, 'steps': 47222, 'loss/train': 1.38284432888031} -08/30/2021 21:47:22 - INFO - __main__ - Step 47224: {'lr': 0.0003933907280445117, 'samples': 9067008, 'steps': 47223, 'loss/train': 1.1271244287490845} -08/30/2021 21:47:23 - INFO - __main__ - Step 47225: {'lr': 0.00039338638093147404, 'samples': 9067200, 'steps': 47224, 'loss/train': 1.3011709451675415} -08/30/2021 21:47:24 - INFO - __main__ - Step 47226: {'lr': 0.00039338203375382873, 'samples': 9067392, 'steps': 47225, 'loss/train': 1.519370675086975} -08/30/2021 21:47:24 - INFO - __main__ - Step 47227: {'lr': 0.00039337768651157766, 'samples': 9067584, 'steps': 47226, 'loss/train': 1.7933515310287476} -08/30/2021 21:47:24 - INFO - __main__ - Step 47228: {'lr': 0.0003933733392047228, 'samples': 9067776, 'steps': 47227, 'loss/train': 0.613797664642334} -08/30/2021 21:47:25 - INFO - __main__ - Step 47229: {'lr': 0.0003933689918332662, 'samples': 9067968, 'steps': 47228, 'loss/train': 1.5601712465286255} -08/30/2021 21:47:26 - INFO - __main__ - Step 47230: {'lr': 0.0003933646443972097, 'samples': 9068160, 'steps': 47229, 'loss/train': 1.699337124824524} -08/30/2021 21:47:27 - INFO - __main__ - Step 47231: {'lr': 0.0003933602968965553, 'samples': 9068352, 'steps': 47230, 'loss/train': 1.508933424949646} -08/30/2021 21:47:27 - INFO - __main__ - Step 47232: {'lr': 0.00039335594933130494, 'samples': 9068544, 'steps': 47231, 'loss/train': 1.45913565158844} -08/30/2021 21:47:28 - INFO - __main__ - Step 47233: {'lr': 0.0003933516017014607, 'samples': 9068736, 'steps': 47232, 'loss/train': 1.5323749780654907} -08/30/2021 21:47:28 - INFO - __main__ - Step 47234: {'lr': 0.0003933472540070243, 'samples': 9068928, 'steps': 47233, 'loss/train': 1.5066059827804565} -08/30/2021 21:47:29 - INFO - __main__ - Step 47235: {'lr': 0.00039334290624799795, 'samples': 9069120, 'steps': 47234, 'loss/train': 0.7128892540931702} -08/30/2021 21:47:30 - INFO - __main__ - Step 47236: {'lr': 0.0003933385584243834, 'samples': 9069312, 'steps': 47235, 'loss/train': 1.6853135824203491} -08/30/2021 21:47:30 - INFO - __main__ - Step 47237: {'lr': 0.0003933342105361828, 'samples': 9069504, 'steps': 47236, 'loss/train': 1.0111676454544067} -08/30/2021 21:47:31 - INFO - __main__ - Step 47238: {'lr': 0.000393329862583398, 'samples': 9069696, 'steps': 47237, 'loss/train': 1.313427209854126} -08/30/2021 21:47:31 - INFO - __main__ - Step 47239: {'lr': 0.00039332551456603093, 'samples': 9069888, 'steps': 47238, 'loss/train': 1.5572577714920044} -08/30/2021 21:47:31 - INFO - __main__ - Step 47240: {'lr': 0.00039332116648408365, 'samples': 9070080, 'steps': 47239, 'loss/train': 1.349772572517395} -08/30/2021 21:47:33 - INFO - __main__ - Step 47241: {'lr': 0.00039331681833755804, 'samples': 9070272, 'steps': 47240, 'loss/train': 1.349863886833191} -08/30/2021 21:47:33 - INFO - __main__ - Step 47242: {'lr': 0.00039331247012645604, 'samples': 9070464, 'steps': 47241, 'loss/train': 1.808831810951233} -08/30/2021 21:47:34 - INFO - __main__ - Step 47243: {'lr': 0.00039330812185077967, 'samples': 9070656, 'steps': 47242, 'loss/train': 1.6437147855758667} -08/30/2021 21:47:34 - INFO - __main__ - Step 47244: {'lr': 0.0003933037735105309, 'samples': 9070848, 'steps': 47243, 'loss/train': 1.2804737091064453} -08/30/2021 21:47:34 - INFO - __main__ - Step 47245: {'lr': 0.00039329942510571165, 'samples': 9071040, 'steps': 47244, 'loss/train': 1.3627424240112305} -08/30/2021 21:47:36 - INFO - __main__ - Step 47246: {'lr': 0.0003932950766363239, 'samples': 9071232, 'steps': 47245, 'loss/train': 1.1552386283874512} -08/30/2021 21:47:37 - INFO - __main__ - Step 47247: {'lr': 0.00039329072810236965, 'samples': 9071424, 'steps': 47246, 'loss/train': 1.071413278579712} -08/30/2021 21:47:37 - INFO - __main__ - Step 47248: {'lr': 0.0003932863795038507, 'samples': 9071616, 'steps': 47247, 'loss/train': 0.11882774531841278} -08/30/2021 21:47:37 - INFO - __main__ - Step 47249: {'lr': 0.0003932820308407692, 'samples': 9071808, 'steps': 47248, 'loss/train': 1.7145575284957886} -08/30/2021 21:47:38 - INFO - __main__ - Step 47250: {'lr': 0.000393277682113127, 'samples': 9072000, 'steps': 47249, 'loss/train': 1.3279597759246826} -08/30/2021 21:47:38 - INFO - __main__ - Step 47251: {'lr': 0.00039327333332092606, 'samples': 9072192, 'steps': 47250, 'loss/train': 1.0670586824417114} -08/30/2021 21:47:41 - INFO - __main__ - Step 47252: {'lr': 0.0003932689844641684, 'samples': 9072384, 'steps': 47251, 'loss/train': 1.458558440208435} -08/30/2021 21:47:41 - INFO - __main__ - Step 47253: {'lr': 0.00039326463554285597, 'samples': 9072576, 'steps': 47252, 'loss/train': 1.4830328226089478} -08/30/2021 21:47:41 - INFO - __main__ - Step 47254: {'lr': 0.00039326028655699063, 'samples': 9072768, 'steps': 47253, 'loss/train': 1.6451884508132935} -08/30/2021 21:47:42 - INFO - __main__ - Step 47255: {'lr': 0.0003932559375065745, 'samples': 9072960, 'steps': 47254, 'loss/train': 1.4628525972366333} -08/30/2021 21:47:42 - INFO - __main__ - Step 47256: {'lr': 0.00039325158839160937, 'samples': 9073152, 'steps': 47255, 'loss/train': 0.9414811730384827} -08/30/2021 21:47:42 - INFO - __main__ - Step 47257: {'lr': 0.0003932472392120974, 'samples': 9073344, 'steps': 47256, 'loss/train': 1.7280681133270264} -08/30/2021 21:47:44 - INFO - __main__ - Step 47258: {'lr': 0.00039324288996804026, 'samples': 9073536, 'steps': 47257, 'loss/train': 1.7407526969909668} -08/30/2021 21:47:44 - INFO - __main__ - Step 47259: {'lr': 0.0003932385406594402, 'samples': 9073728, 'steps': 47258, 'loss/train': 0.9837968349456787} -08/30/2021 21:47:45 - INFO - __main__ - Step 47260: {'lr': 0.0003932341912862991, 'samples': 9073920, 'steps': 47259, 'loss/train': 0.5422816872596741} -08/30/2021 21:47:45 - INFO - __main__ - Step 47261: {'lr': 0.0003932298418486188, 'samples': 9074112, 'steps': 47260, 'loss/train': 1.6922330856323242} -08/30/2021 21:47:45 - INFO - __main__ - Step 47262: {'lr': 0.00039322549234640136, 'samples': 9074304, 'steps': 47261, 'loss/train': 1.4442442655563354} -08/30/2021 21:47:46 - INFO - __main__ - Step 47263: {'lr': 0.00039322114277964875, 'samples': 9074496, 'steps': 47262, 'loss/train': 1.4364198446273804} -08/30/2021 21:47:48 - INFO - __main__ - Step 47264: {'lr': 0.0003932167931483629, 'samples': 9074688, 'steps': 47263, 'loss/train': 1.5787311792373657} -08/30/2021 21:47:49 - INFO - __main__ - Step 47265: {'lr': 0.00039321244345254583, 'samples': 9074880, 'steps': 47264, 'loss/train': 1.5624264478683472} -08/30/2021 21:47:49 - INFO - __main__ - Step 47266: {'lr': 0.0003932080936921993, 'samples': 9075072, 'steps': 47265, 'loss/train': 4.3112897872924805} -08/30/2021 21:47:49 - INFO - __main__ - Step 47267: {'lr': 0.00039320374386732555, 'samples': 9075264, 'steps': 47266, 'loss/train': 4.432944297790527} -08/30/2021 21:47:50 - INFO - __main__ - Step 47268: {'lr': 0.00039319939397792635, 'samples': 9075456, 'steps': 47267, 'loss/train': 1.9740513563156128} -08/30/2021 21:47:50 - INFO - __main__ - Step 47269: {'lr': 0.00039319504402400367, 'samples': 9075648, 'steps': 47268, 'loss/train': 1.079913854598999} -08/30/2021 21:47:52 - INFO - __main__ - Step 47270: {'lr': 0.0003931906940055596, 'samples': 9075840, 'steps': 47269, 'loss/train': 1.2581286430358887} -08/30/2021 21:47:52 - INFO - __main__ - Step 47271: {'lr': 0.00039318634392259593, 'samples': 9076032, 'steps': 47270, 'loss/train': 1.5154542922973633} -08/30/2021 21:47:52 - INFO - __main__ - Step 47272: {'lr': 0.00039318199377511476, 'samples': 9076224, 'steps': 47271, 'loss/train': 0.8166834712028503} -08/30/2021 21:47:53 - INFO - __main__ - Step 47273: {'lr': 0.00039317764356311803, 'samples': 9076416, 'steps': 47272, 'loss/train': 3.0102884769439697} -08/30/2021 21:47:53 - INFO - __main__ - Step 47274: {'lr': 0.00039317329328660754, 'samples': 9076608, 'steps': 47273, 'loss/train': 1.2756074666976929} -08/30/2021 21:47:54 - INFO - __main__ - Step 47275: {'lr': 0.0003931689429455855, 'samples': 9076800, 'steps': 47274, 'loss/train': 1.1009291410446167} -08/30/2021 21:47:55 - INFO - __main__ - Step 47276: {'lr': 0.00039316459254005364, 'samples': 9076992, 'steps': 47275, 'loss/train': 1.7836995124816895} -08/30/2021 21:47:55 - INFO - __main__ - Step 47277: {'lr': 0.00039316024207001403, 'samples': 9077184, 'steps': 47276, 'loss/train': 1.9067935943603516} -08/30/2021 21:47:56 - INFO - __main__ - Step 47278: {'lr': 0.0003931558915354687, 'samples': 9077376, 'steps': 47277, 'loss/train': 1.2166469097137451} -08/30/2021 21:47:56 - INFO - __main__ - Step 47279: {'lr': 0.00039315154093641947, 'samples': 9077568, 'steps': 47278, 'loss/train': 1.7116620540618896} -08/30/2021 21:47:57 - INFO - __main__ - Step 47280: {'lr': 0.00039314719027286837, 'samples': 9077760, 'steps': 47279, 'loss/train': 1.3903424739837646} -08/30/2021 21:47:58 - INFO - __main__ - Step 47281: {'lr': 0.00039314283954481737, 'samples': 9077952, 'steps': 47280, 'loss/train': 0.059253908693790436} -08/30/2021 21:47:58 - INFO - __main__ - Step 47282: {'lr': 0.00039313848875226844, 'samples': 9078144, 'steps': 47281, 'loss/train': 1.5881465673446655} -08/30/2021 21:47:59 - INFO - __main__ - Step 47283: {'lr': 0.0003931341378952235, 'samples': 9078336, 'steps': 47282, 'loss/train': 1.2724661827087402} -08/30/2021 21:47:59 - INFO - __main__ - Step 47284: {'lr': 0.0003931297869736845, 'samples': 9078528, 'steps': 47283, 'loss/train': 1.3937915563583374} -08/30/2021 21:48:00 - INFO - __main__ - Step 47285: {'lr': 0.0003931254359876535, 'samples': 9078720, 'steps': 47284, 'loss/train': 0.7238603234291077} -08/30/2021 21:48:01 - INFO - __main__ - Step 47286: {'lr': 0.00039312108493713227, 'samples': 9078912, 'steps': 47285, 'loss/train': 1.7359777688980103} -08/30/2021 21:48:01 - INFO - __main__ - Step 47287: {'lr': 0.00039311673382212296, 'samples': 9079104, 'steps': 47286, 'loss/train': 1.3183573484420776} -08/30/2021 21:48:02 - INFO - __main__ - Step 47288: {'lr': 0.0003931123826426275, 'samples': 9079296, 'steps': 47287, 'loss/train': 0.08673273026943207} -08/30/2021 21:48:02 - INFO - __main__ - Step 47289: {'lr': 0.00039310803139864777, 'samples': 9079488, 'steps': 47288, 'loss/train': 1.4308583736419678} -08/30/2021 21:48:03 - INFO - __main__ - Step 47290: {'lr': 0.0003931036800901857, 'samples': 9079680, 'steps': 47289, 'loss/train': 1.5248067378997803} -08/30/2021 21:48:04 - INFO - __main__ - Step 47291: {'lr': 0.0003930993287172434, 'samples': 9079872, 'steps': 47290, 'loss/train': 1.4464563131332397} -08/30/2021 21:48:04 - INFO - __main__ - Step 47292: {'lr': 0.0003930949772798227, 'samples': 9080064, 'steps': 47291, 'loss/train': 1.6020326614379883} -08/30/2021 21:48:05 - INFO - __main__ - Step 47293: {'lr': 0.00039309062577792565, 'samples': 9080256, 'steps': 47292, 'loss/train': 1.4132577180862427} -08/30/2021 21:48:05 - INFO - __main__ - Step 47294: {'lr': 0.0003930862742115542, 'samples': 9080448, 'steps': 47293, 'loss/train': 1.614087700843811} -08/30/2021 21:48:07 - INFO - __main__ - Step 47295: {'lr': 0.0003930819225807102, 'samples': 9080640, 'steps': 47294, 'loss/train': 1.2367781400680542} -08/30/2021 21:48:07 - INFO - __main__ - Step 47296: {'lr': 0.00039307757088539574, 'samples': 9080832, 'steps': 47295, 'loss/train': 2.146489381790161} -08/30/2021 21:48:07 - INFO - __main__ - Step 47297: {'lr': 0.0003930732191256128, 'samples': 9081024, 'steps': 47296, 'loss/train': 1.5928442478179932} -08/30/2021 21:48:08 - INFO - __main__ - Step 47298: {'lr': 0.00039306886730136316, 'samples': 9081216, 'steps': 47297, 'loss/train': 2.2303366661071777} -08/30/2021 21:48:08 - INFO - __main__ - Step 47299: {'lr': 0.00039306451541264896, 'samples': 9081408, 'steps': 47298, 'loss/train': 0.9554955959320068} -08/30/2021 21:48:08 - INFO - __main__ - Step 47300: {'lr': 0.0003930601634594721, 'samples': 9081600, 'steps': 47299, 'loss/train': 1.4821048974990845} -08/30/2021 21:48:10 - INFO - __main__ - Step 47301: {'lr': 0.0003930558114418345, 'samples': 9081792, 'steps': 47300, 'loss/train': 1.671755075454712} -08/30/2021 21:48:10 - INFO - __main__ - Step 47302: {'lr': 0.0003930514593597382, 'samples': 9081984, 'steps': 47301, 'loss/train': 1.0608506202697754} -08/30/2021 21:48:11 - INFO - __main__ - Step 47303: {'lr': 0.00039304710721318505, 'samples': 9082176, 'steps': 47302, 'loss/train': 1.6971443891525269} -08/30/2021 21:48:11 - INFO - __main__ - Step 47304: {'lr': 0.0003930427550021771, 'samples': 9082368, 'steps': 47303, 'loss/train': 0.21481195092201233} -08/30/2021 21:48:11 - INFO - __main__ - Step 47305: {'lr': 0.00039303840272671636, 'samples': 9082560, 'steps': 47304, 'loss/train': 1.41652250289917} -08/30/2021 21:48:13 - INFO - __main__ - Step 47306: {'lr': 0.00039303405038680465, 'samples': 9082752, 'steps': 47305, 'loss/train': 1.2006443738937378} -08/30/2021 21:48:14 - INFO - __main__ - Step 47307: {'lr': 0.00039302969798244407, 'samples': 9082944, 'steps': 47306, 'loss/train': 1.6500297784805298} -08/30/2021 21:48:14 - INFO - __main__ - Step 47308: {'lr': 0.0003930253455136365, 'samples': 9083136, 'steps': 47307, 'loss/train': 0.12864425778388977} -08/30/2021 21:48:15 - INFO - __main__ - Step 47309: {'lr': 0.0003930209929803839, 'samples': 9083328, 'steps': 47308, 'loss/train': 1.8450382947921753} -08/30/2021 21:48:15 - INFO - __main__ - Step 47310: {'lr': 0.0003930166403826883, 'samples': 9083520, 'steps': 47309, 'loss/train': 1.412922739982605} -08/30/2021 21:48:17 - INFO - __main__ - Step 47311: {'lr': 0.00039301228772055147, 'samples': 9083712, 'steps': 47310, 'loss/train': 1.0711334943771362} -08/30/2021 21:48:17 - INFO - __main__ - Step 47312: {'lr': 0.0003930079349939756, 'samples': 9083904, 'steps': 47311, 'loss/train': 0.9847979545593262} -08/30/2021 21:48:17 - INFO - __main__ - Step 47313: {'lr': 0.00039300358220296255, 'samples': 9084096, 'steps': 47312, 'loss/train': 1.3400652408599854} -08/30/2021 21:48:18 - INFO - __main__ - Step 47314: {'lr': 0.0003929992293475143, 'samples': 9084288, 'steps': 47313, 'loss/train': 1.718641996383667} -08/30/2021 21:48:18 - INFO - __main__ - Step 47315: {'lr': 0.00039299487642763286, 'samples': 9084480, 'steps': 47314, 'loss/train': 1.306476354598999} -08/30/2021 21:48:20 - INFO - __main__ - Step 47316: {'lr': 0.00039299052344332, 'samples': 9084672, 'steps': 47315, 'loss/train': 1.2910528182983398} -08/30/2021 21:48:20 - INFO - __main__ - Step 47317: {'lr': 0.00039298617039457796, 'samples': 9084864, 'steps': 47316, 'loss/train': 0.380572110414505} -08/30/2021 21:48:21 - INFO - __main__ - Step 47318: {'lr': 0.0003929818172814085, 'samples': 9085056, 'steps': 47317, 'loss/train': 1.2524960041046143} -08/30/2021 21:48:21 - INFO - __main__ - Step 47319: {'lr': 0.00039297746410381357, 'samples': 9085248, 'steps': 47318, 'loss/train': 1.192836046218872} -08/30/2021 21:48:21 - INFO - __main__ - Step 47320: {'lr': 0.00039297311086179535, 'samples': 9085440, 'steps': 47319, 'loss/train': 1.6921825408935547} -08/30/2021 21:48:22 - INFO - __main__ - Step 47321: {'lr': 0.00039296875755535557, 'samples': 9085632, 'steps': 47320, 'loss/train': 1.0637820959091187} -08/30/2021 21:48:23 - INFO - __main__ - Step 47322: {'lr': 0.0003929644041844962, 'samples': 9085824, 'steps': 47321, 'loss/train': 1.711601734161377} -08/30/2021 21:48:24 - INFO - __main__ - Step 47323: {'lr': 0.00039296005074921937, 'samples': 9086016, 'steps': 47322, 'loss/train': 0.10674764215946198} -08/30/2021 21:48:24 - INFO - __main__ - Step 47324: {'lr': 0.0003929556972495269, 'samples': 9086208, 'steps': 47323, 'loss/train': 1.6770915985107422} -08/30/2021 21:48:25 - INFO - __main__ - Step 47325: {'lr': 0.00039295134368542083, 'samples': 9086400, 'steps': 47324, 'loss/train': 0.9848683476448059} -08/30/2021 21:48:25 - INFO - __main__ - Step 47326: {'lr': 0.000392946990056903, 'samples': 9086592, 'steps': 47325, 'loss/train': 1.8454848527908325} -08/30/2021 21:48:27 - INFO - __main__ - Step 47327: {'lr': 0.00039294263636397564, 'samples': 9086784, 'steps': 47326, 'loss/train': 1.303276538848877} -08/30/2021 21:48:27 - INFO - __main__ - Step 47328: {'lr': 0.00039293828260664047, 'samples': 9086976, 'steps': 47327, 'loss/train': 0.07456887513399124} -08/30/2021 21:48:27 - INFO - __main__ - Step 47329: {'lr': 0.0003929339287848994, 'samples': 9087168, 'steps': 47328, 'loss/train': 0.6583238840103149} -08/30/2021 21:48:28 - INFO - __main__ - Step 47330: {'lr': 0.00039292957489875456, 'samples': 9087360, 'steps': 47329, 'loss/train': 1.1777760982513428} -08/30/2021 21:48:28 - INFO - __main__ - Step 47331: {'lr': 0.00039292522094820794, 'samples': 9087552, 'steps': 47330, 'loss/train': 1.2854838371276855} -08/30/2021 21:48:30 - INFO - __main__ - Step 47332: {'lr': 0.00039292086693326134, 'samples': 9087744, 'steps': 47331, 'loss/train': 1.453113079071045} -08/30/2021 21:48:30 - INFO - __main__ - Step 47333: {'lr': 0.0003929165128539168, 'samples': 9087936, 'steps': 47332, 'loss/train': 1.2781678438186646} -08/30/2021 21:48:30 - INFO - __main__ - Step 47334: {'lr': 0.0003929121587101764, 'samples': 9088128, 'steps': 47333, 'loss/train': 2.0703165531158447} -08/30/2021 21:48:31 - INFO - __main__ - Step 47335: {'lr': 0.00039290780450204187, 'samples': 9088320, 'steps': 47334, 'loss/train': 1.426224708557129} -08/30/2021 21:48:31 - INFO - __main__ - Step 47336: {'lr': 0.00039290345022951535, 'samples': 9088512, 'steps': 47335, 'loss/train': 1.387518048286438} -08/30/2021 21:48:33 - INFO - __main__ - Step 47337: {'lr': 0.0003928990958925987, 'samples': 9088704, 'steps': 47336, 'loss/train': 1.381941318511963} -08/30/2021 21:48:33 - INFO - __main__ - Step 47338: {'lr': 0.0003928947414912939, 'samples': 9088896, 'steps': 47337, 'loss/train': 1.4821908473968506} -08/30/2021 21:48:33 - INFO - __main__ - Step 47339: {'lr': 0.00039289038702560304, 'samples': 9089088, 'steps': 47338, 'loss/train': 1.3943333625793457} -08/30/2021 21:48:34 - INFO - __main__ - Step 47340: {'lr': 0.0003928860324955279, 'samples': 9089280, 'steps': 47339, 'loss/train': 1.7870291471481323} -08/30/2021 21:48:34 - INFO - __main__ - Step 47341: {'lr': 0.00039288167790107055, 'samples': 9089472, 'steps': 47340, 'loss/train': 0.9736477136611938} -08/30/2021 21:48:36 - INFO - __main__ - Step 47342: {'lr': 0.00039287732324223287, 'samples': 9089664, 'steps': 47341, 'loss/train': 1.3744133710861206} -08/30/2021 21:48:36 - INFO - __main__ - Step 47343: {'lr': 0.0003928729685190169, 'samples': 9089856, 'steps': 47342, 'loss/train': 1.6169779300689697} -08/30/2021 21:48:37 - INFO - __main__ - Step 47344: {'lr': 0.00039286861373142456, 'samples': 9090048, 'steps': 47343, 'loss/train': 1.1734250783920288} -08/30/2021 21:48:37 - INFO - __main__ - Step 47345: {'lr': 0.0003928642588794579, 'samples': 9090240, 'steps': 47344, 'loss/train': 1.5925641059875488} -08/30/2021 21:48:37 - INFO - __main__ - Step 47346: {'lr': 0.0003928599039631187, 'samples': 9090432, 'steps': 47345, 'loss/train': 1.6263929605484009} -08/30/2021 21:48:38 - INFO - __main__ - Step 47347: {'lr': 0.00039285554898240907, 'samples': 9090624, 'steps': 47346, 'loss/train': 1.6302977800369263} -08/30/2021 21:48:40 - INFO - __main__ - Step 47348: {'lr': 0.0003928511939373309, 'samples': 9090816, 'steps': 47347, 'loss/train': 1.4947547912597656} -08/30/2021 21:48:40 - INFO - __main__ - Step 47349: {'lr': 0.0003928468388278863, 'samples': 9091008, 'steps': 47348, 'loss/train': 1.2743167877197266} -08/30/2021 21:48:41 - INFO - __main__ - Step 47350: {'lr': 0.00039284248365407704, 'samples': 9091200, 'steps': 47349, 'loss/train': 1.8058005571365356} -08/30/2021 21:48:41 - INFO - __main__ - Step 47351: {'lr': 0.00039283812841590514, 'samples': 9091392, 'steps': 47350, 'loss/train': 2.523587226867676} -08/30/2021 21:48:42 - INFO - __main__ - Step 47352: {'lr': 0.0003928337731133727, 'samples': 9091584, 'steps': 47351, 'loss/train': 1.3642462491989136} -08/30/2021 21:48:43 - INFO - __main__ - Step 47353: {'lr': 0.0003928294177464814, 'samples': 9091776, 'steps': 47352, 'loss/train': 1.4685677289962769} -08/30/2021 21:48:44 - INFO - __main__ - Step 47354: {'lr': 0.0003928250623152335, 'samples': 9091968, 'steps': 47353, 'loss/train': 1.6228684186935425} -08/30/2021 21:48:44 - INFO - __main__ - Step 47355: {'lr': 0.00039282070681963076, 'samples': 9092160, 'steps': 47354, 'loss/train': 0.20396752655506134} -08/30/2021 21:48:45 - INFO - __main__ - Step 47356: {'lr': 0.00039281635125967525, 'samples': 9092352, 'steps': 47355, 'loss/train': 0.0710807666182518} -08/30/2021 21:48:45 - INFO - __main__ - Step 47357: {'lr': 0.00039281199563536887, 'samples': 9092544, 'steps': 47356, 'loss/train': 1.3086320161819458} -08/30/2021 21:48:45 - INFO - __main__ - Step 47358: {'lr': 0.00039280763994671363, 'samples': 9092736, 'steps': 47357, 'loss/train': 0.5093753337860107} -08/30/2021 21:48:47 - INFO - __main__ - Step 47359: {'lr': 0.0003928032841937115, 'samples': 9092928, 'steps': 47358, 'loss/train': 0.6711312532424927} -08/30/2021 21:48:47 - INFO - __main__ - Step 47360: {'lr': 0.0003927989283763643, 'samples': 9093120, 'steps': 47359, 'loss/train': 1.0352784395217896} -08/30/2021 21:48:48 - INFO - __main__ - Step 47361: {'lr': 0.0003927945724946742, 'samples': 9093312, 'steps': 47360, 'loss/train': 0.9162634015083313} -08/30/2021 21:48:48 - INFO - __main__ - Step 47362: {'lr': 0.00039279021654864307, 'samples': 9093504, 'steps': 47361, 'loss/train': 1.5815321207046509} -08/30/2021 21:48:48 - INFO - __main__ - Step 47363: {'lr': 0.0003927858605382728, 'samples': 9093696, 'steps': 47362, 'loss/train': 1.7978036403656006} -08/30/2021 21:48:49 - INFO - __main__ - Step 47364: {'lr': 0.0003927815044635655, 'samples': 9093888, 'steps': 47363, 'loss/train': 1.3591214418411255} -08/30/2021 21:48:50 - INFO - __main__ - Step 47365: {'lr': 0.00039277714832452304, 'samples': 9094080, 'steps': 47364, 'loss/train': 1.1065795421600342} -08/30/2021 21:48:51 - INFO - __main__ - Step 47366: {'lr': 0.0003927727921211474, 'samples': 9094272, 'steps': 47365, 'loss/train': 1.1524626016616821} -08/30/2021 21:48:51 - INFO - __main__ - Step 47367: {'lr': 0.00039276843585344046, 'samples': 9094464, 'steps': 47366, 'loss/train': 1.0965452194213867} -08/30/2021 21:48:52 - INFO - __main__ - Step 47368: {'lr': 0.0003927640795214044, 'samples': 9094656, 'steps': 47367, 'loss/train': 1.4337648153305054} -08/30/2021 21:48:52 - INFO - __main__ - Step 47369: {'lr': 0.00039275972312504103, 'samples': 9094848, 'steps': 47368, 'loss/train': 1.6651297807693481} -08/30/2021 21:48:53 - INFO - __main__ - Step 47370: {'lr': 0.0003927553666643523, 'samples': 9095040, 'steps': 47369, 'loss/train': 0.8628102540969849} -08/30/2021 21:48:54 - INFO - __main__ - Step 47371: {'lr': 0.0003927510101393401, 'samples': 9095232, 'steps': 47370, 'loss/train': 1.278727412223816} -08/30/2021 21:48:54 - INFO - __main__ - Step 47372: {'lr': 0.0003927466535500066, 'samples': 9095424, 'steps': 47371, 'loss/train': 1.3257778882980347} -08/30/2021 21:48:55 - INFO - __main__ - Step 47373: {'lr': 0.00039274229689635365, 'samples': 9095616, 'steps': 47372, 'loss/train': 0.7446551322937012} -08/30/2021 21:48:55 - INFO - __main__ - Step 47374: {'lr': 0.00039273794017838327, 'samples': 9095808, 'steps': 47373, 'loss/train': 1.4918280839920044} -08/30/2021 21:48:56 - INFO - __main__ - Step 47375: {'lr': 0.0003927335833960973, 'samples': 9096000, 'steps': 47374, 'loss/train': 1.3082075119018555} -08/30/2021 21:48:57 - INFO - __main__ - Step 47376: {'lr': 0.00039272922654949783, 'samples': 9096192, 'steps': 47375, 'loss/train': 1.3660470247268677} -08/30/2021 21:48:57 - INFO - __main__ - Step 47377: {'lr': 0.0003927248696385868, 'samples': 9096384, 'steps': 47376, 'loss/train': 1.9401534795761108} -08/30/2021 21:48:57 - INFO - __main__ - Step 47378: {'lr': 0.00039272051266336607, 'samples': 9096576, 'steps': 47377, 'loss/train': 1.5061721801757812} -08/30/2021 21:48:58 - INFO - __main__ - Step 47379: {'lr': 0.00039271615562383775, 'samples': 9096768, 'steps': 47378, 'loss/train': 1.7097561359405518} -08/30/2021 21:48:59 - INFO - __main__ - Step 47380: {'lr': 0.00039271179852000366, 'samples': 9096960, 'steps': 47379, 'loss/train': 0.7220338582992554} -08/30/2021 21:49:00 - INFO - __main__ - Step 47381: {'lr': 0.0003927074413518659, 'samples': 9097152, 'steps': 47380, 'loss/train': 0.9531300663948059} -08/30/2021 21:49:00 - INFO - __main__ - Step 47382: {'lr': 0.0003927030841194263, 'samples': 9097344, 'steps': 47381, 'loss/train': 1.2772434949874878} -08/30/2021 21:49:00 - INFO - __main__ - Step 47383: {'lr': 0.00039269872682268697, 'samples': 9097536, 'steps': 47382, 'loss/train': 1.0565341711044312} -08/30/2021 21:49:01 - INFO - __main__ - Step 47384: {'lr': 0.00039269436946164977, 'samples': 9097728, 'steps': 47383, 'loss/train': 1.0536904335021973} -08/30/2021 21:49:02 - INFO - __main__ - Step 47385: {'lr': 0.00039269001203631667, 'samples': 9097920, 'steps': 47384, 'loss/train': 1.4151859283447266} -08/30/2021 21:49:03 - INFO - __main__ - Step 47386: {'lr': 0.0003926856545466896, 'samples': 9098112, 'steps': 47385, 'loss/train': 0.9711772203445435} -08/30/2021 21:49:03 - INFO - __main__ - Step 47387: {'lr': 0.0003926812969927707, 'samples': 9098304, 'steps': 47386, 'loss/train': 1.7893248796463013} -08/30/2021 21:49:04 - INFO - __main__ - Step 47388: {'lr': 0.0003926769393745617, 'samples': 9098496, 'steps': 47387, 'loss/train': 1.298899531364441} -08/30/2021 21:49:04 - INFO - __main__ - Step 47389: {'lr': 0.0003926725816920648, 'samples': 9098688, 'steps': 47388, 'loss/train': 1.5883861780166626} -08/30/2021 21:49:06 - INFO - __main__ - Step 47390: {'lr': 0.0003926682239452817, 'samples': 9098880, 'steps': 47389, 'loss/train': 0.9644375443458557} -08/30/2021 21:49:06 - INFO - __main__ - Step 47391: {'lr': 0.00039266386613421455, 'samples': 9099072, 'steps': 47390, 'loss/train': 1.1020708084106445} -08/30/2021 21:49:07 - INFO - __main__ - Step 47392: {'lr': 0.00039265950825886523, 'samples': 9099264, 'steps': 47391, 'loss/train': 0.19431518018245697} -08/30/2021 21:49:07 - INFO - __main__ - Step 47393: {'lr': 0.00039265515031923585, 'samples': 9099456, 'steps': 47392, 'loss/train': 0.9279852509498596} -08/30/2021 21:49:07 - INFO - __main__ - Step 47394: {'lr': 0.0003926507923153282, 'samples': 9099648, 'steps': 47393, 'loss/train': 0.6067180633544922} -08/30/2021 21:49:08 - INFO - __main__ - Step 47395: {'lr': 0.0003926464342471443, 'samples': 9099840, 'steps': 47394, 'loss/train': 1.6401456594467163} -08/30/2021 21:49:09 - INFO - __main__ - Step 47396: {'lr': 0.00039264207611468607, 'samples': 9100032, 'steps': 47395, 'loss/train': 1.9120762348175049} -08/30/2021 21:49:10 - INFO - __main__ - Step 47397: {'lr': 0.00039263771791795554, 'samples': 9100224, 'steps': 47396, 'loss/train': 1.4913197755813599} -08/30/2021 21:49:10 - INFO - __main__ - Step 47398: {'lr': 0.0003926333596569547, 'samples': 9100416, 'steps': 47397, 'loss/train': 1.4576208591461182} -08/30/2021 21:49:10 - INFO - __main__ - Step 47399: {'lr': 0.00039262900133168544, 'samples': 9100608, 'steps': 47398, 'loss/train': 1.4530779123306274} -08/30/2021 21:49:11 - INFO - __main__ - Step 47400: {'lr': 0.0003926246429421497, 'samples': 9100800, 'steps': 47399, 'loss/train': 1.494839072227478} -08/30/2021 21:49:13 - INFO - __main__ - Step 47401: {'lr': 0.00039262028448834964, 'samples': 9100992, 'steps': 47400, 'loss/train': 1.1281623840332031} -08/30/2021 21:49:14 - INFO - __main__ - Step 47402: {'lr': 0.00039261592597028696, 'samples': 9101184, 'steps': 47401, 'loss/train': 1.382845163345337} -08/30/2021 21:49:14 - INFO - __main__ - Step 47403: {'lr': 0.0003926115673879638, 'samples': 9101376, 'steps': 47402, 'loss/train': 1.2787145376205444} -08/30/2021 21:49:14 - INFO - __main__ - Step 47404: {'lr': 0.000392607208741382, 'samples': 9101568, 'steps': 47403, 'loss/train': 1.7682346105575562} -08/30/2021 21:49:15 - INFO - __main__ - Step 47405: {'lr': 0.00039260285003054365, 'samples': 9101760, 'steps': 47404, 'loss/train': 1.6048250198364258} -08/30/2021 21:49:15 - INFO - __main__ - Step 47406: {'lr': 0.0003925984912554507, 'samples': 9101952, 'steps': 47405, 'loss/train': 1.9606859683990479} -08/30/2021 21:49:17 - INFO - __main__ - Step 47407: {'lr': 0.00039259413241610495, 'samples': 9102144, 'steps': 47406, 'loss/train': 1.7560627460479736} -08/30/2021 21:49:18 - INFO - __main__ - Step 47408: {'lr': 0.0003925897735125086, 'samples': 9102336, 'steps': 47407, 'loss/train': 1.170751690864563} -08/30/2021 21:49:18 - INFO - __main__ - Step 47409: {'lr': 0.00039258541454466344, 'samples': 9102528, 'steps': 47408, 'loss/train': 1.424579381942749} -08/30/2021 21:49:18 - INFO - __main__ - Step 47410: {'lr': 0.0003925810555125715, 'samples': 9102720, 'steps': 47409, 'loss/train': 0.12577219307422638} -08/30/2021 21:49:19 - INFO - __main__ - Step 47411: {'lr': 0.00039257669641623474, 'samples': 9102912, 'steps': 47410, 'loss/train': 0.04750821366906166} -08/30/2021 21:49:19 - INFO - __main__ - Step 47412: {'lr': 0.0003925723372556551, 'samples': 9103104, 'steps': 47411, 'loss/train': 0.2771010398864746} -08/30/2021 21:49:19 - INFO - __main__ - Step 47413: {'lr': 0.00039256797803083457, 'samples': 9103296, 'steps': 47412, 'loss/train': 1.927358865737915} -08/30/2021 21:49:22 - INFO - __main__ - Step 47414: {'lr': 0.00039256361874177517, 'samples': 9103488, 'steps': 47413, 'loss/train': 0.9046767354011536} -08/30/2021 21:49:22 - INFO - __main__ - Step 47415: {'lr': 0.0003925592593884787, 'samples': 9103680, 'steps': 47414, 'loss/train': 1.6944732666015625} -08/30/2021 21:49:22 - INFO - __main__ - Step 47416: {'lr': 0.0003925548999709473, 'samples': 9103872, 'steps': 47415, 'loss/train': 1.658400058746338} -08/30/2021 21:49:23 - INFO - __main__ - Step 47417: {'lr': 0.00039255054048918284, 'samples': 9104064, 'steps': 47416, 'loss/train': 1.794282078742981} -08/30/2021 21:49:23 - INFO - __main__ - Step 47418: {'lr': 0.00039254618094318726, 'samples': 9104256, 'steps': 47417, 'loss/train': 1.8073607683181763} -08/30/2021 21:49:23 - INFO - __main__ - Step 47419: {'lr': 0.0003925418213329627, 'samples': 9104448, 'steps': 47418, 'loss/train': 1.5887683629989624} -08/30/2021 21:49:24 - INFO - __main__ - Step 47420: {'lr': 0.0003925374616585109, 'samples': 9104640, 'steps': 47419, 'loss/train': 1.5960773229599} -08/30/2021 21:49:26 - INFO - __main__ - Step 47421: {'lr': 0.00039253310191983393, 'samples': 9104832, 'steps': 47420, 'loss/train': 1.1781538724899292} -08/30/2021 21:49:26 - INFO - __main__ - Step 47422: {'lr': 0.0003925287421169337, 'samples': 9105024, 'steps': 47421, 'loss/train': 0.784122109413147} -08/30/2021 21:49:27 - INFO - __main__ - Step 47423: {'lr': 0.00039252438224981237, 'samples': 9105216, 'steps': 47422, 'loss/train': 1.922245740890503} -08/30/2021 21:49:27 - INFO - __main__ - Step 47424: {'lr': 0.0003925200223184716, 'samples': 9105408, 'steps': 47423, 'loss/train': 0.8925718665122986} -08/30/2021 21:49:27 - INFO - __main__ - Step 47425: {'lr': 0.0003925156623229136, 'samples': 9105600, 'steps': 47424, 'loss/train': 1.8791476488113403} -08/30/2021 21:49:29 - INFO - __main__ - Step 47426: {'lr': 0.00039251130226314015, 'samples': 9105792, 'steps': 47425, 'loss/train': 1.4244506359100342} -08/30/2021 21:49:29 - INFO - __main__ - Step 47427: {'lr': 0.00039250694213915335, 'samples': 9105984, 'steps': 47426, 'loss/train': 1.4092888832092285} -08/30/2021 21:49:30 - INFO - __main__ - Step 47428: {'lr': 0.0003925025819509551, 'samples': 9106176, 'steps': 47427, 'loss/train': 1.921508550643921} -08/30/2021 21:49:30 - INFO - __main__ - Step 47429: {'lr': 0.00039249822169854745, 'samples': 9106368, 'steps': 47428, 'loss/train': 1.3877923488616943} -08/30/2021 21:49:31 - INFO - __main__ - Step 47430: {'lr': 0.0003924938613819322, 'samples': 9106560, 'steps': 47429, 'loss/train': 1.2928165197372437} -08/30/2021 21:49:32 - INFO - __main__ - Step 47431: {'lr': 0.0003924895010011115, 'samples': 9106752, 'steps': 47430, 'loss/train': 0.1274806261062622} -08/30/2021 21:49:33 - INFO - __main__ - Step 47432: {'lr': 0.0003924851405560872, 'samples': 9106944, 'steps': 47431, 'loss/train': 1.6685556173324585} -08/30/2021 21:49:33 - INFO - __main__ - Step 47433: {'lr': 0.00039248078004686126, 'samples': 9107136, 'steps': 47432, 'loss/train': 0.8660440444946289} -08/30/2021 21:49:34 - INFO - __main__ - Step 47434: {'lr': 0.00039247641947343575, 'samples': 9107328, 'steps': 47433, 'loss/train': 1.1961708068847656} -08/30/2021 21:49:34 - INFO - __main__ - Step 47435: {'lr': 0.0003924720588358126, 'samples': 9107520, 'steps': 47434, 'loss/train': 1.08945631980896} -08/30/2021 21:49:34 - INFO - __main__ - Step 47436: {'lr': 0.0003924676981339936, 'samples': 9107712, 'steps': 47435, 'loss/train': 1.3576847314834595} -08/30/2021 21:49:35 - INFO - __main__ - Step 47437: {'lr': 0.00039246333736798095, 'samples': 9107904, 'steps': 47436, 'loss/train': 2.1324586868286133} -08/30/2021 21:49:36 - INFO - __main__ - Step 47438: {'lr': 0.0003924589765377765, 'samples': 9108096, 'steps': 47437, 'loss/train': 1.4530651569366455} -08/30/2021 21:49:37 - INFO - __main__ - Step 47439: {'lr': 0.00039245461564338223, 'samples': 9108288, 'steps': 47438, 'loss/train': 2.4995298385620117} -08/30/2021 21:49:37 - INFO - __main__ - Step 47440: {'lr': 0.00039245025468480013, 'samples': 9108480, 'steps': 47439, 'loss/train': 1.6787322759628296} -08/30/2021 21:49:38 - INFO - __main__ - Step 47441: {'lr': 0.00039244589366203207, 'samples': 9108672, 'steps': 47440, 'loss/train': 0.7857919931411743} -08/30/2021 21:49:38 - INFO - __main__ - Step 47442: {'lr': 0.0003924415325750802, 'samples': 9108864, 'steps': 47441, 'loss/train': 0.9463993310928345} -08/30/2021 21:49:39 - INFO - __main__ - Step 47443: {'lr': 0.0003924371714239463, 'samples': 9109056, 'steps': 47442, 'loss/train': 1.5027315616607666} -08/30/2021 21:49:40 - INFO - __main__ - Step 47444: {'lr': 0.0003924328102086324, 'samples': 9109248, 'steps': 47443, 'loss/train': 1.0893957614898682} -08/30/2021 21:49:40 - INFO - __main__ - Step 47445: {'lr': 0.0003924284489291405, 'samples': 9109440, 'steps': 47444, 'loss/train': 1.009865403175354} -08/30/2021 21:49:41 - INFO - __main__ - Step 47446: {'lr': 0.00039242408758547256, 'samples': 9109632, 'steps': 47445, 'loss/train': 2.0451200008392334} -08/30/2021 21:49:41 - INFO - __main__ - Step 47447: {'lr': 0.0003924197261776304, 'samples': 9109824, 'steps': 47446, 'loss/train': 1.5461087226867676} -08/30/2021 21:49:43 - INFO - __main__ - Step 47448: {'lr': 0.0003924153647056163, 'samples': 9110016, 'steps': 47447, 'loss/train': 1.535399317741394} -08/30/2021 21:49:43 - INFO - __main__ - Step 47449: {'lr': 0.0003924110031694319, 'samples': 9110208, 'steps': 47448, 'loss/train': 1.4370900392532349} -08/30/2021 21:49:43 - INFO - __main__ - Step 47450: {'lr': 0.00039240664156907937, 'samples': 9110400, 'steps': 47449, 'loss/train': 1.9424941539764404} -08/30/2021 21:49:44 - INFO - __main__ - Step 47451: {'lr': 0.00039240227990456055, 'samples': 9110592, 'steps': 47450, 'loss/train': 1.3079520463943481} -08/30/2021 21:49:44 - INFO - __main__ - Step 47452: {'lr': 0.00039239791817587746, 'samples': 9110784, 'steps': 47451, 'loss/train': 1.511841058731079} -08/30/2021 21:49:44 - INFO - __main__ - Step 47453: {'lr': 0.0003923935563830321, 'samples': 9110976, 'steps': 47452, 'loss/train': 1.8246479034423828} -08/30/2021 21:49:46 - INFO - __main__ - Step 47454: {'lr': 0.0003923891945260264, 'samples': 9111168, 'steps': 47453, 'loss/train': 0.06469002366065979} -08/30/2021 21:49:47 - INFO - __main__ - Step 47455: {'lr': 0.00039238483260486235, 'samples': 9111360, 'steps': 47454, 'loss/train': 0.39675575494766235} -08/30/2021 21:49:47 - INFO - __main__ - Step 47456: {'lr': 0.0003923804706195418, 'samples': 9111552, 'steps': 47455, 'loss/train': 1.219374179840088} -08/30/2021 21:49:47 - INFO - __main__ - Step 47457: {'lr': 0.0003923761085700669, 'samples': 9111744, 'steps': 47456, 'loss/train': 0.9257020354270935} -08/30/2021 21:49:48 - INFO - __main__ - Step 47458: {'lr': 0.0003923717464564395, 'samples': 9111936, 'steps': 47457, 'loss/train': 1.6188582181930542} -08/30/2021 21:49:49 - INFO - __main__ - Step 47459: {'lr': 0.00039236738427866154, 'samples': 9112128, 'steps': 47458, 'loss/train': 1.765936017036438} -08/30/2021 21:49:49 - INFO - __main__ - Step 47460: {'lr': 0.000392363022036735, 'samples': 9112320, 'steps': 47459, 'loss/train': 1.5301679372787476} -08/30/2021 21:49:50 - INFO - __main__ - Step 47461: {'lr': 0.00039235865973066196, 'samples': 9112512, 'steps': 47460, 'loss/train': 1.359564185142517} -08/30/2021 21:49:50 - INFO - __main__ - Step 47462: {'lr': 0.00039235429736044435, 'samples': 9112704, 'steps': 47461, 'loss/train': 1.1371489763259888} -08/30/2021 21:49:51 - INFO - __main__ - Step 47463: {'lr': 0.00039234993492608404, 'samples': 9112896, 'steps': 47462, 'loss/train': 1.474984049797058} -08/30/2021 21:49:52 - INFO - __main__ - Step 47464: {'lr': 0.0003923455724275831, 'samples': 9113088, 'steps': 47463, 'loss/train': 0.7468206882476807} -08/30/2021 21:49:52 - INFO - __main__ - Step 47465: {'lr': 0.0003923412098649433, 'samples': 9113280, 'steps': 47464, 'loss/train': 1.3695276975631714} -08/30/2021 21:49:53 - INFO - __main__ - Step 47466: {'lr': 0.0003923368472381668, 'samples': 9113472, 'steps': 47465, 'loss/train': 1.4852293729782104} -08/30/2021 21:49:53 - INFO - __main__ - Step 47467: {'lr': 0.0003923324845472556, 'samples': 9113664, 'steps': 47466, 'loss/train': 1.7139065265655518} -08/30/2021 21:49:53 - INFO - __main__ - Step 47468: {'lr': 0.0003923281217922115, 'samples': 9113856, 'steps': 47467, 'loss/train': 2.0019984245300293} -08/30/2021 21:49:55 - INFO - __main__ - Step 47469: {'lr': 0.0003923237589730366, 'samples': 9114048, 'steps': 47468, 'loss/train': 0.5439435839653015} -08/30/2021 21:49:55 - INFO - __main__ - Step 47470: {'lr': 0.00039231939608973276, 'samples': 9114240, 'steps': 47469, 'loss/train': 0.8051151633262634} -08/30/2021 21:49:56 - INFO - __main__ - Step 47471: {'lr': 0.000392315033142302, 'samples': 9114432, 'steps': 47470, 'loss/train': 1.8148776292800903} -08/30/2021 21:49:56 - INFO - __main__ - Step 47472: {'lr': 0.0003923106701307463, 'samples': 9114624, 'steps': 47471, 'loss/train': 1.5005706548690796} -08/30/2021 21:49:56 - INFO - __main__ - Step 47473: {'lr': 0.0003923063070550676, 'samples': 9114816, 'steps': 47472, 'loss/train': 1.4210914373397827} -08/30/2021 21:49:58 - INFO - __main__ - Step 47474: {'lr': 0.00039230194391526784, 'samples': 9115008, 'steps': 47473, 'loss/train': 1.538997769355774} -08/30/2021 21:49:59 - INFO - __main__ - Step 47475: {'lr': 0.00039229758071134907, 'samples': 9115200, 'steps': 47474, 'loss/train': 1.7825133800506592} -08/30/2021 21:49:59 - INFO - __main__ - Step 47476: {'lr': 0.0003922932174433132, 'samples': 9115392, 'steps': 47475, 'loss/train': 0.8834695219993591} -08/30/2021 21:50:00 - INFO - __main__ - Step 47477: {'lr': 0.0003922888541111622, 'samples': 9115584, 'steps': 47476, 'loss/train': 1.6944807767868042} -08/30/2021 21:50:00 - INFO - __main__ - Step 47478: {'lr': 0.00039228449071489804, 'samples': 9115776, 'steps': 47477, 'loss/train': 1.2691766023635864} -08/30/2021 21:50:00 - INFO - __main__ - Step 47479: {'lr': 0.0003922801272545227, 'samples': 9115968, 'steps': 47478, 'loss/train': 1.378496766090393} -08/30/2021 21:50:02 - INFO - __main__ - Step 47480: {'lr': 0.000392275763730038, 'samples': 9116160, 'steps': 47479, 'loss/train': 1.267137050628662} -08/30/2021 21:50:02 - INFO - __main__ - Step 47481: {'lr': 0.00039227140014144615, 'samples': 9116352, 'steps': 47480, 'loss/train': 1.0980186462402344} -08/30/2021 21:50:03 - INFO - __main__ - Step 47482: {'lr': 0.00039226703648874905, 'samples': 9116544, 'steps': 47481, 'loss/train': 1.189841389656067} -08/30/2021 21:50:03 - INFO - __main__ - Step 47483: {'lr': 0.00039226267277194855, 'samples': 9116736, 'steps': 47482, 'loss/train': 1.4233750104904175} -08/30/2021 21:50:03 - INFO - __main__ - Step 47484: {'lr': 0.0003922583089910467, 'samples': 9116928, 'steps': 47483, 'loss/train': 1.0525566339492798} -08/30/2021 21:50:05 - INFO - __main__ - Step 47485: {'lr': 0.0003922539451460454, 'samples': 9117120, 'steps': 47484, 'loss/train': 1.0316088199615479} -08/30/2021 21:50:05 - INFO - __main__ - Step 47486: {'lr': 0.00039224958123694676, 'samples': 9117312, 'steps': 47485, 'loss/train': 1.5966614484786987} -08/30/2021 21:50:05 - INFO - __main__ - Step 47487: {'lr': 0.0003922452172637526, 'samples': 9117504, 'steps': 47486, 'loss/train': 1.7844959497451782} -08/30/2021 21:50:06 - INFO - __main__ - Step 47488: {'lr': 0.000392240853226465, 'samples': 9117696, 'steps': 47487, 'loss/train': 1.2453421354293823} -08/30/2021 21:50:06 - INFO - __main__ - Step 47489: {'lr': 0.0003922364891250858, 'samples': 9117888, 'steps': 47488, 'loss/train': 1.7250230312347412} -08/30/2021 21:50:08 - INFO - __main__ - Step 47490: {'lr': 0.00039223212495961704, 'samples': 9118080, 'steps': 47489, 'loss/train': 1.206486463546753} -08/30/2021 21:50:08 - INFO - __main__ - Step 47491: {'lr': 0.0003922277607300607, 'samples': 9118272, 'steps': 47490, 'loss/train': 0.9815263152122498} -08/30/2021 21:50:09 - INFO - __main__ - Step 47492: {'lr': 0.0003922233964364187, 'samples': 9118464, 'steps': 47491, 'loss/train': 1.0688601732254028} -08/30/2021 21:50:09 - INFO - __main__ - Step 47493: {'lr': 0.000392219032078693, 'samples': 9118656, 'steps': 47492, 'loss/train': 1.7482033967971802} -08/30/2021 21:50:09 - INFO - __main__ - Step 47494: {'lr': 0.0003922146676568856, 'samples': 9118848, 'steps': 47493, 'loss/train': 1.4080946445465088} -08/30/2021 21:50:11 - INFO - __main__ - Step 47495: {'lr': 0.0003922103031709986, 'samples': 9119040, 'steps': 47494, 'loss/train': 1.4170136451721191} -08/30/2021 21:50:11 - INFO - __main__ - Step 47496: {'lr': 0.0003922059386210337, 'samples': 9119232, 'steps': 47495, 'loss/train': 0.5779529809951782} -08/30/2021 21:50:11 - INFO - __main__ - Step 47497: {'lr': 0.0003922015740069931, 'samples': 9119424, 'steps': 47496, 'loss/train': 1.0202704668045044} -08/30/2021 21:50:12 - INFO - __main__ - Step 47498: {'lr': 0.0003921972093288786, 'samples': 9119616, 'steps': 47497, 'loss/train': 0.9841870069503784} -08/30/2021 21:50:12 - INFO - __main__ - Step 47499: {'lr': 0.00039219284458669217, 'samples': 9119808, 'steps': 47498, 'loss/train': 1.5301270484924316} -08/30/2021 21:50:14 - INFO - __main__ - Step 47500: {'lr': 0.00039218847978043594, 'samples': 9120000, 'steps': 47499, 'loss/train': 1.0793498754501343} -08/30/2021 21:50:14 - INFO - __main__ - Step 47501: {'lr': 0.00039218411491011176, 'samples': 9120192, 'steps': 47500, 'loss/train': 0.859450101852417} -08/30/2021 21:50:14 - INFO - __main__ - Step 47502: {'lr': 0.0003921797499757216, 'samples': 9120384, 'steps': 47501, 'loss/train': 1.2548826932907104} -08/30/2021 21:50:15 - INFO - __main__ - Step 47503: {'lr': 0.0003921753849772674, 'samples': 9120576, 'steps': 47502, 'loss/train': 0.47821664810180664} -08/30/2021 21:50:15 - INFO - __main__ - Step 47504: {'lr': 0.0003921710199147512, 'samples': 9120768, 'steps': 47503, 'loss/train': 1.3237571716308594} -08/30/2021 21:50:17 - INFO - __main__ - Step 47505: {'lr': 0.0003921666547881749, 'samples': 9120960, 'steps': 47504, 'loss/train': 0.6785144209861755} -08/30/2021 21:50:17 - INFO - __main__ - Step 47506: {'lr': 0.00039216228959754055, 'samples': 9121152, 'steps': 47505, 'loss/train': 2.1855690479278564} -08/30/2021 21:50:17 - INFO - __main__ - Step 47507: {'lr': 0.00039215792434285, 'samples': 9121344, 'steps': 47506, 'loss/train': 1.2324528694152832} -08/30/2021 21:50:18 - INFO - __main__ - Step 47508: {'lr': 0.00039215355902410534, 'samples': 9121536, 'steps': 47507, 'loss/train': 1.0141741037368774} -08/30/2021 21:50:18 - INFO - __main__ - Step 47509: {'lr': 0.0003921491936413085, 'samples': 9121728, 'steps': 47508, 'loss/train': 1.500723958015442} -08/30/2021 21:50:18 - INFO - __main__ - Step 47510: {'lr': 0.0003921448281944614, 'samples': 9121920, 'steps': 47509, 'loss/train': 1.2323713302612305} -08/30/2021 21:50:20 - INFO - __main__ - Step 47511: {'lr': 0.000392140462683566, 'samples': 9122112, 'steps': 47510, 'loss/train': 1.747552514076233} -08/30/2021 21:50:20 - INFO - __main__ - Step 47512: {'lr': 0.0003921360971086243, 'samples': 9122304, 'steps': 47511, 'loss/train': 1.82868492603302} -08/30/2021 21:50:21 - INFO - __main__ - Step 47513: {'lr': 0.0003921317314696383, 'samples': 9122496, 'steps': 47512, 'loss/train': 1.50871741771698} -08/30/2021 21:50:21 - INFO - __main__ - Step 47514: {'lr': 0.0003921273657666099, 'samples': 9122688, 'steps': 47513, 'loss/train': 1.6595972776412964} -08/30/2021 21:50:21 - INFO - __main__ - Step 47515: {'lr': 0.0003921229999995412, 'samples': 9122880, 'steps': 47514, 'loss/train': 0.7272273898124695} -08/30/2021 21:50:23 - INFO - __main__ - Step 47516: {'lr': 0.000392118634168434, 'samples': 9123072, 'steps': 47515, 'loss/train': 2.1457037925720215} -08/30/2021 21:50:23 - INFO - __main__ - Step 47517: {'lr': 0.00039211426827329035, 'samples': 9123264, 'steps': 47516, 'loss/train': 1.6039600372314453} -08/30/2021 21:50:24 - INFO - __main__ - Step 47518: {'lr': 0.0003921099023141121, 'samples': 9123456, 'steps': 47517, 'loss/train': 1.5681538581848145} -08/30/2021 21:50:24 - INFO - __main__ - Step 47519: {'lr': 0.0003921055362909015, 'samples': 9123648, 'steps': 47518, 'loss/train': 0.8581191897392273} -08/30/2021 21:50:24 - INFO - __main__ - Step 47520: {'lr': 0.0003921011702036602, 'samples': 9123840, 'steps': 47519, 'loss/train': 1.4746692180633545} -08/30/2021 21:50:26 - INFO - __main__ - Step 47521: {'lr': 0.00039209680405239035, 'samples': 9124032, 'steps': 47520, 'loss/train': 1.566706895828247} -08/30/2021 21:50:26 - INFO - __main__ - Step 47522: {'lr': 0.0003920924378370939, 'samples': 9124224, 'steps': 47521, 'loss/train': 1.1851613521575928} -08/30/2021 21:50:27 - INFO - __main__ - Step 47523: {'lr': 0.0003920880715577728, 'samples': 9124416, 'steps': 47522, 'loss/train': 1.1102629899978638} -08/30/2021 21:50:27 - INFO - __main__ - Step 47524: {'lr': 0.00039208370521442895, 'samples': 9124608, 'steps': 47523, 'loss/train': 1.5686856508255005} -08/30/2021 21:50:27 - INFO - __main__ - Step 47525: {'lr': 0.0003920793388070644, 'samples': 9124800, 'steps': 47524, 'loss/train': 0.8846790790557861} -08/30/2021 21:50:29 - INFO - __main__ - Step 47526: {'lr': 0.0003920749723356811, 'samples': 9124992, 'steps': 47525, 'loss/train': 1.4392623901367188} -08/30/2021 21:50:29 - INFO - __main__ - Step 47527: {'lr': 0.000392070605800281, 'samples': 9125184, 'steps': 47526, 'loss/train': 1.339270830154419} -08/30/2021 21:50:30 - INFO - __main__ - Step 47528: {'lr': 0.00039206623920086603, 'samples': 9125376, 'steps': 47527, 'loss/train': 1.602022647857666} -08/30/2021 21:50:30 - INFO - __main__ - Step 47529: {'lr': 0.0003920618725374383, 'samples': 9125568, 'steps': 47528, 'loss/train': 1.8743805885314941} -08/30/2021 21:50:30 - INFO - __main__ - Step 47530: {'lr': 0.00039205750580999964, 'samples': 9125760, 'steps': 47529, 'loss/train': 1.496177077293396} -08/30/2021 21:50:32 - INFO - __main__ - Step 47531: {'lr': 0.0003920531390185521, 'samples': 9125952, 'steps': 47530, 'loss/train': 1.705356240272522} -08/30/2021 21:50:33 - INFO - __main__ - Step 47532: {'lr': 0.00039204877216309755, 'samples': 9126144, 'steps': 47531, 'loss/train': 0.45835936069488525} -08/30/2021 21:50:33 - INFO - __main__ - Step 47533: {'lr': 0.00039204440524363805, 'samples': 9126336, 'steps': 47532, 'loss/train': 1.1870044469833374} -08/30/2021 21:50:34 - INFO - __main__ - Step 47534: {'lr': 0.0003920400382601755, 'samples': 9126528, 'steps': 47533, 'loss/train': 1.445563554763794} -08/30/2021 21:50:34 - INFO - __main__ - Step 47535: {'lr': 0.00039203567121271187, 'samples': 9126720, 'steps': 47534, 'loss/train': 0.9779070615768433} -08/30/2021 21:50:35 - INFO - __main__ - Step 47536: {'lr': 0.00039203130410124927, 'samples': 9126912, 'steps': 47535, 'loss/train': 1.7712767124176025} -08/30/2021 21:50:36 - INFO - __main__ - Step 47537: {'lr': 0.0003920269369257895, 'samples': 9127104, 'steps': 47536, 'loss/train': 0.8141536116600037} -08/30/2021 21:50:36 - INFO - __main__ - Step 47538: {'lr': 0.0003920225696863345, 'samples': 9127296, 'steps': 47537, 'loss/train': 1.448149561882019} -08/30/2021 21:50:37 - INFO - __main__ - Step 47539: {'lr': 0.00039201820238288644, 'samples': 9127488, 'steps': 47538, 'loss/train': 1.2583411931991577} -08/30/2021 21:50:37 - INFO - __main__ - Step 47540: {'lr': 0.00039201383501544706, 'samples': 9127680, 'steps': 47539, 'loss/train': 1.6331803798675537} -08/30/2021 21:50:39 - INFO - __main__ - Step 47541: {'lr': 0.00039200946758401856, 'samples': 9127872, 'steps': 47540, 'loss/train': 1.4651482105255127} -08/30/2021 21:50:39 - INFO - __main__ - Step 47542: {'lr': 0.00039200510008860273, 'samples': 9128064, 'steps': 47541, 'loss/train': 1.3782695531845093} -08/30/2021 21:50:39 - INFO - __main__ - Step 47543: {'lr': 0.0003920007325292016, 'samples': 9128256, 'steps': 47542, 'loss/train': 2.249802589416504} -08/30/2021 21:50:40 - INFO - __main__ - Step 47544: {'lr': 0.00039199636490581713, 'samples': 9128448, 'steps': 47543, 'loss/train': 1.2696423530578613} -08/30/2021 21:50:40 - INFO - __main__ - Step 47545: {'lr': 0.00039199199721845127, 'samples': 9128640, 'steps': 47544, 'loss/train': 0.7399950623512268} -08/30/2021 21:50:42 - INFO - __main__ - Step 47546: {'lr': 0.000391987629467106, 'samples': 9128832, 'steps': 47545, 'loss/train': 0.9999672770500183} -08/30/2021 21:50:42 - INFO - __main__ - Step 47547: {'lr': 0.00039198326165178335, 'samples': 9129024, 'steps': 47546, 'loss/train': 1.477217674255371} -08/30/2021 21:50:42 - INFO - __main__ - Step 47548: {'lr': 0.0003919788937724852, 'samples': 9129216, 'steps': 47547, 'loss/train': 1.8754897117614746} -08/30/2021 21:50:43 - INFO - __main__ - Step 47549: {'lr': 0.0003919745258292135, 'samples': 9129408, 'steps': 47548, 'loss/train': 4.169376850128174} -08/30/2021 21:50:43 - INFO - __main__ - Step 47550: {'lr': 0.00039197015782197034, 'samples': 9129600, 'steps': 47549, 'loss/train': 1.6852302551269531} -08/30/2021 21:50:43 - INFO - __main__ - Step 47551: {'lr': 0.0003919657897507576, 'samples': 9129792, 'steps': 47550, 'loss/train': 1.4910401105880737} -08/30/2021 21:50:45 - INFO - __main__ - Step 47552: {'lr': 0.0003919614216155772, 'samples': 9129984, 'steps': 47551, 'loss/train': 1.3738433122634888} -08/30/2021 21:50:45 - INFO - __main__ - Step 47553: {'lr': 0.0003919570534164313, 'samples': 9130176, 'steps': 47552, 'loss/train': 1.4206960201263428} -08/30/2021 21:50:46 - INFO - __main__ - Step 47554: {'lr': 0.0003919526851533216, 'samples': 9130368, 'steps': 47553, 'loss/train': 1.335051417350769} -08/30/2021 21:50:46 - INFO - __main__ - Step 47555: {'lr': 0.00039194831682625033, 'samples': 9130560, 'steps': 47554, 'loss/train': 1.690909504890442} -08/30/2021 21:50:46 - INFO - __main__ - Step 47556: {'lr': 0.0003919439484352193, 'samples': 9130752, 'steps': 47555, 'loss/train': 0.09721633791923523} -08/30/2021 21:50:48 - INFO - __main__ - Step 47557: {'lr': 0.00039193957998023057, 'samples': 9130944, 'steps': 47556, 'loss/train': 0.9456935524940491} -08/30/2021 21:50:48 - INFO - __main__ - Step 47558: {'lr': 0.000391935211461286, 'samples': 9131136, 'steps': 47557, 'loss/train': 0.6503803133964539} -08/30/2021 21:50:49 - INFO - __main__ - Step 47559: {'lr': 0.00039193084287838755, 'samples': 9131328, 'steps': 47558, 'loss/train': 0.7927486896514893} -08/30/2021 21:50:49 - INFO - __main__ - Step 47560: {'lr': 0.0003919264742315373, 'samples': 9131520, 'steps': 47559, 'loss/train': 1.5858039855957031} -08/30/2021 21:50:49 - INFO - __main__ - Step 47561: {'lr': 0.00039192210552073723, 'samples': 9131712, 'steps': 47560, 'loss/train': 1.0409817695617676} -08/30/2021 21:50:51 - INFO - __main__ - Step 47562: {'lr': 0.0003919177367459892, 'samples': 9131904, 'steps': 47561, 'loss/train': 1.0228266716003418} -08/30/2021 21:50:51 - INFO - __main__ - Step 47563: {'lr': 0.00039191336790729526, 'samples': 9132096, 'steps': 47562, 'loss/train': 1.468979001045227} -08/30/2021 21:50:52 - INFO - __main__ - Step 47564: {'lr': 0.00039190899900465727, 'samples': 9132288, 'steps': 47563, 'loss/train': 1.1165070533752441} -08/30/2021 21:50:52 - INFO - __main__ - Step 47565: {'lr': 0.0003919046300380773, 'samples': 9132480, 'steps': 47564, 'loss/train': 1.1435688734054565} -08/30/2021 21:50:52 - INFO - __main__ - Step 47566: {'lr': 0.00039190026100755735, 'samples': 9132672, 'steps': 47565, 'loss/train': 1.1976114511489868} -08/30/2021 21:50:54 - INFO - __main__ - Step 47567: {'lr': 0.00039189589191309927, 'samples': 9132864, 'steps': 47566, 'loss/train': 1.7406421899795532} -08/30/2021 21:50:54 - INFO - __main__ - Step 47568: {'lr': 0.00039189152275470514, 'samples': 9133056, 'steps': 47567, 'loss/train': 1.0698328018188477} -08/30/2021 21:50:55 - INFO - __main__ - Step 47569: {'lr': 0.0003918871535323769, 'samples': 9133248, 'steps': 47568, 'loss/train': 1.104062795639038} -08/30/2021 21:50:55 - INFO - __main__ - Step 47570: {'lr': 0.0003918827842461165, 'samples': 9133440, 'steps': 47569, 'loss/train': 1.4716874361038208} -08/30/2021 21:50:55 - INFO - __main__ - Step 47571: {'lr': 0.0003918784148959258, 'samples': 9133632, 'steps': 47570, 'loss/train': 1.5160268545150757} -08/30/2021 21:50:57 - INFO - __main__ - Step 47572: {'lr': 0.0003918740454818069, 'samples': 9133824, 'steps': 47571, 'loss/train': 1.2590101957321167} -08/30/2021 21:50:57 - INFO - __main__ - Step 47573: {'lr': 0.0003918696760037618, 'samples': 9134016, 'steps': 47572, 'loss/train': 1.2887803316116333} -08/30/2021 21:50:58 - INFO - __main__ - Step 47574: {'lr': 0.0003918653064617924, 'samples': 9134208, 'steps': 47573, 'loss/train': 1.6382392644882202} -08/30/2021 21:50:58 - INFO - __main__ - Step 47575: {'lr': 0.00039186093685590064, 'samples': 9134400, 'steps': 47574, 'loss/train': 0.8733863830566406} -08/30/2021 21:50:58 - INFO - __main__ - Step 47576: {'lr': 0.0003918565671860886, 'samples': 9134592, 'steps': 47575, 'loss/train': 1.272176742553711} -08/30/2021 21:51:00 - INFO - __main__ - Step 47577: {'lr': 0.00039185219745235816, 'samples': 9134784, 'steps': 47576, 'loss/train': 0.7759772539138794} -08/30/2021 21:51:00 - INFO - __main__ - Step 47578: {'lr': 0.0003918478276547113, 'samples': 9134976, 'steps': 47577, 'loss/train': 1.5864347219467163} -08/30/2021 21:51:01 - INFO - __main__ - Step 47579: {'lr': 0.00039184345779315, 'samples': 9135168, 'steps': 47578, 'loss/train': 0.9600334763526917} -08/30/2021 21:51:01 - INFO - __main__ - Step 47580: {'lr': 0.0003918390878676762, 'samples': 9135360, 'steps': 47579, 'loss/train': 1.842550277709961} -08/30/2021 21:51:01 - INFO - __main__ - Step 47581: {'lr': 0.00039183471787829194, 'samples': 9135552, 'steps': 47580, 'loss/train': 1.8136920928955078} -08/30/2021 21:51:02 - INFO - __main__ - Step 47582: {'lr': 0.0003918303478249991, 'samples': 9135744, 'steps': 47581, 'loss/train': 1.4065524339675903} -08/30/2021 21:51:04 - INFO - __main__ - Step 47583: {'lr': 0.0003918259777077997, 'samples': 9135936, 'steps': 47582, 'loss/train': 1.5654438734054565} -08/30/2021 21:51:04 - INFO - __main__ - Step 47584: {'lr': 0.00039182160752669577, 'samples': 9136128, 'steps': 47583, 'loss/train': 1.805586576461792} -08/30/2021 21:51:05 - INFO - __main__ - Step 47585: {'lr': 0.0003918172372816892, 'samples': 9136320, 'steps': 47584, 'loss/train': 1.0967366695404053} -08/30/2021 21:51:05 - INFO - __main__ - Step 47586: {'lr': 0.0003918128669727818, 'samples': 9136512, 'steps': 47585, 'loss/train': 1.576042890548706} -08/30/2021 21:51:05 - INFO - __main__ - Step 47587: {'lr': 0.00039180849659997593, 'samples': 9136704, 'steps': 47586, 'loss/train': 1.7267149686813354} -08/30/2021 21:51:07 - INFO - __main__ - Step 47588: {'lr': 0.00039180412616327323, 'samples': 9136896, 'steps': 47587, 'loss/train': 1.9029110670089722} -08/30/2021 21:51:07 - INFO - __main__ - Step 47589: {'lr': 0.00039179975566267585, 'samples': 9137088, 'steps': 47588, 'loss/train': 0.7890552878379822} -08/30/2021 21:51:08 - INFO - __main__ - Step 47590: {'lr': 0.00039179538509818556, 'samples': 9137280, 'steps': 47589, 'loss/train': 1.4764454364776611} -08/30/2021 21:51:08 - INFO - __main__ - Step 47591: {'lr': 0.0003917910144698046, 'samples': 9137472, 'steps': 47590, 'loss/train': 1.6669155359268188} -08/30/2021 21:51:08 - INFO - __main__ - Step 47592: {'lr': 0.0003917866437775347, 'samples': 9137664, 'steps': 47591, 'loss/train': 0.9721720218658447} -08/30/2021 21:51:10 - INFO - __main__ - Step 47593: {'lr': 0.000391782273021378, 'samples': 9137856, 'steps': 47592, 'loss/train': 0.14700405299663544} -08/30/2021 21:51:10 - INFO - __main__ - Step 47594: {'lr': 0.00039177790220133637, 'samples': 9138048, 'steps': 47593, 'loss/train': 2.0277597904205322} -08/30/2021 21:51:11 - INFO - __main__ - Step 47595: {'lr': 0.0003917735313174117, 'samples': 9138240, 'steps': 47594, 'loss/train': 1.2065784931182861} -08/30/2021 21:51:11 - INFO - __main__ - Step 47596: {'lr': 0.0003917691603696062, 'samples': 9138432, 'steps': 47595, 'loss/train': 1.2386913299560547} -08/30/2021 21:51:11 - INFO - __main__ - Step 47597: {'lr': 0.0003917647893579217, 'samples': 9138624, 'steps': 47596, 'loss/train': 1.1212928295135498} -08/30/2021 21:51:13 - INFO - __main__ - Step 47598: {'lr': 0.0003917604182823601, 'samples': 9138816, 'steps': 47597, 'loss/train': 2.062592029571533} -08/30/2021 21:51:13 - INFO - __main__ - Step 47599: {'lr': 0.00039175604714292346, 'samples': 9139008, 'steps': 47598, 'loss/train': 0.6993901133537292} -08/30/2021 21:51:14 - INFO - __main__ - Step 47600: {'lr': 0.00039175167593961377, 'samples': 9139200, 'steps': 47599, 'loss/train': 1.723766565322876} -08/30/2021 21:51:14 - INFO - __main__ - Step 47601: {'lr': 0.0003917473046724329, 'samples': 9139392, 'steps': 47600, 'loss/train': 1.776467204093933} -08/30/2021 21:51:14 - INFO - __main__ - Step 47602: {'lr': 0.000391742933341383, 'samples': 9139584, 'steps': 47601, 'loss/train': 1.4710078239440918} -08/30/2021 21:51:16 - INFO - __main__ - Step 47603: {'lr': 0.00039173856194646585, 'samples': 9139776, 'steps': 47602, 'loss/train': 0.7388753890991211} -08/30/2021 21:51:16 - INFO - __main__ - Step 47604: {'lr': 0.00039173419048768343, 'samples': 9139968, 'steps': 47603, 'loss/train': 1.710203766822815} -08/30/2021 21:51:17 - INFO - __main__ - Step 47605: {'lr': 0.0003917298189650378, 'samples': 9140160, 'steps': 47604, 'loss/train': 1.5066584348678589} -08/30/2021 21:51:17 - INFO - __main__ - Step 47606: {'lr': 0.00039172544737853097, 'samples': 9140352, 'steps': 47605, 'loss/train': 1.441505789756775} -08/30/2021 21:51:17 - INFO - __main__ - Step 47607: {'lr': 0.00039172107572816477, 'samples': 9140544, 'steps': 47606, 'loss/train': 1.1783387660980225} -08/30/2021 21:51:19 - INFO - __main__ - Step 47608: {'lr': 0.00039171670401394134, 'samples': 9140736, 'steps': 47607, 'loss/train': 1.3212872743606567} -08/30/2021 21:51:20 - INFO - __main__ - Step 47609: {'lr': 0.00039171233223586247, 'samples': 9140928, 'steps': 47608, 'loss/train': 0.5811963677406311} -08/30/2021 21:51:20 - INFO - __main__ - Step 47610: {'lr': 0.0003917079603939302, 'samples': 9141120, 'steps': 47609, 'loss/train': 1.2613604068756104} -08/30/2021 21:51:20 - INFO - __main__ - Step 47611: {'lr': 0.0003917035884881465, 'samples': 9141312, 'steps': 47610, 'loss/train': 0.19551026821136475} -08/30/2021 21:51:21 - INFO - __main__ - Step 47612: {'lr': 0.00039169921651851337, 'samples': 9141504, 'steps': 47611, 'loss/train': 0.7926893830299377} -08/30/2021 21:51:21 - INFO - __main__ - Step 47613: {'lr': 0.0003916948444850328, 'samples': 9141696, 'steps': 47612, 'loss/train': 1.088605523109436} -08/30/2021 21:51:23 - INFO - __main__ - Step 47614: {'lr': 0.0003916904723877067, 'samples': 9141888, 'steps': 47613, 'loss/train': 1.3022652864456177} -08/30/2021 21:51:23 - INFO - __main__ - Step 47615: {'lr': 0.000391686100226537, 'samples': 9142080, 'steps': 47614, 'loss/train': 1.158038854598999} -08/30/2021 21:51:23 - INFO - __main__ - Step 47616: {'lr': 0.00039168172800152577, 'samples': 9142272, 'steps': 47615, 'loss/train': 1.601486325263977} -08/30/2021 21:51:24 - INFO - __main__ - Step 47617: {'lr': 0.0003916773557126749, 'samples': 9142464, 'steps': 47616, 'loss/train': 1.1697089672088623} -08/30/2021 21:51:24 - INFO - __main__ - Step 47618: {'lr': 0.00039167298335998646, 'samples': 9142656, 'steps': 47617, 'loss/train': 1.6931227445602417} -08/30/2021 21:51:26 - INFO - __main__ - Step 47619: {'lr': 0.0003916686109434624, 'samples': 9142848, 'steps': 47618, 'loss/train': 1.5393420457839966} -08/30/2021 21:51:26 - INFO - __main__ - Step 47620: {'lr': 0.00039166423846310463, 'samples': 9143040, 'steps': 47619, 'loss/train': 1.480875849723816} -08/30/2021 21:51:26 - INFO - __main__ - Step 47621: {'lr': 0.00039165986591891506, 'samples': 9143232, 'steps': 47620, 'loss/train': 0.6889795064926147} -08/30/2021 21:51:27 - INFO - __main__ - Step 47622: {'lr': 0.0003916554933108958, 'samples': 9143424, 'steps': 47621, 'loss/train': 1.7952052354812622} -08/30/2021 21:51:27 - INFO - __main__ - Step 47623: {'lr': 0.00039165112063904874, 'samples': 9143616, 'steps': 47622, 'loss/train': 1.2486134767532349} -08/30/2021 21:51:29 - INFO - __main__ - Step 47624: {'lr': 0.0003916467479033759, 'samples': 9143808, 'steps': 47623, 'loss/train': 1.7592450380325317} -08/30/2021 21:51:29 - INFO - __main__ - Step 47625: {'lr': 0.00039164237510387915, 'samples': 9144000, 'steps': 47624, 'loss/train': 1.065859317779541} -08/30/2021 21:51:29 - INFO - __main__ - Step 47626: {'lr': 0.0003916380022405606, 'samples': 9144192, 'steps': 47625, 'loss/train': 1.2433457374572754} -08/30/2021 21:51:30 - INFO - __main__ - Step 47627: {'lr': 0.0003916336293134222, 'samples': 9144384, 'steps': 47626, 'loss/train': 1.419934868812561} -08/30/2021 21:51:30 - INFO - __main__ - Step 47628: {'lr': 0.0003916292563224657, 'samples': 9144576, 'steps': 47627, 'loss/train': 1.0608665943145752} -08/30/2021 21:51:32 - INFO - __main__ - Step 47629: {'lr': 0.00039162488326769334, 'samples': 9144768, 'steps': 47628, 'loss/train': 1.278180480003357} -08/30/2021 21:51:32 - INFO - __main__ - Step 47630: {'lr': 0.00039162051014910706, 'samples': 9144960, 'steps': 47629, 'loss/train': 1.1645411252975464} -08/30/2021 21:51:32 - INFO - __main__ - Step 47631: {'lr': 0.0003916161369667087, 'samples': 9145152, 'steps': 47630, 'loss/train': 1.5614615678787231} -08/30/2021 21:51:33 - INFO - __main__ - Step 47632: {'lr': 0.0003916117637205003, 'samples': 9145344, 'steps': 47631, 'loss/train': 1.0071594715118408} -08/30/2021 21:51:33 - INFO - __main__ - Step 47633: {'lr': 0.00039160739041048376, 'samples': 9145536, 'steps': 47632, 'loss/train': 1.1946840286254883} -08/30/2021 21:51:35 - INFO - __main__ - Step 47634: {'lr': 0.0003916030170366612, 'samples': 9145728, 'steps': 47633, 'loss/train': 0.9085675477981567} -08/30/2021 21:51:36 - INFO - __main__ - Step 47635: {'lr': 0.0003915986435990345, 'samples': 9145920, 'steps': 47634, 'loss/train': 1.7320348024368286} -08/30/2021 21:51:36 - INFO - __main__ - Step 47636: {'lr': 0.0003915942700976056, 'samples': 9146112, 'steps': 47635, 'loss/train': 1.090275764465332} -08/30/2021 21:51:36 - INFO - __main__ - Step 47637: {'lr': 0.0003915898965323765, 'samples': 9146304, 'steps': 47636, 'loss/train': 0.6358849406242371} -08/30/2021 21:51:37 - INFO - __main__ - Step 47638: {'lr': 0.00039158552290334927, 'samples': 9146496, 'steps': 47637, 'loss/train': 1.4608738422393799} -08/30/2021 21:51:38 - INFO - __main__ - Step 47639: {'lr': 0.00039158114921052567, 'samples': 9146688, 'steps': 47638, 'loss/train': 1.7298426628112793} -08/30/2021 21:51:39 - INFO - __main__ - Step 47640: {'lr': 0.0003915767754539078, 'samples': 9146880, 'steps': 47639, 'loss/train': 1.4851280450820923} -08/30/2021 21:51:39 - INFO - __main__ - Step 47641: {'lr': 0.0003915724016334977, 'samples': 9147072, 'steps': 47640, 'loss/train': 1.4141086339950562} -08/30/2021 21:51:39 - INFO - __main__ - Step 47642: {'lr': 0.00039156802774929723, 'samples': 9147264, 'steps': 47641, 'loss/train': 1.5010415315628052} -08/30/2021 21:51:40 - INFO - __main__ - Step 47643: {'lr': 0.00039156365380130844, 'samples': 9147456, 'steps': 47642, 'loss/train': 1.7737804651260376} -08/30/2021 21:51:42 - INFO - __main__ - Step 47644: {'lr': 0.00039155927978953316, 'samples': 9147648, 'steps': 47643, 'loss/train': 1.9736300706863403} -08/30/2021 21:51:42 - INFO - __main__ - Step 47645: {'lr': 0.00039155490571397345, 'samples': 9147840, 'steps': 47644, 'loss/train': 1.2133373022079468} -08/30/2021 21:51:43 - INFO - __main__ - Step 47646: {'lr': 0.0003915505315746313, 'samples': 9148032, 'steps': 47645, 'loss/train': 2.050436496734619} -08/30/2021 21:51:43 - INFO - __main__ - Step 47647: {'lr': 0.00039154615737150867, 'samples': 9148224, 'steps': 47646, 'loss/train': 0.4955146610736847} -08/30/2021 21:51:43 - INFO - __main__ - Step 47648: {'lr': 0.00039154178310460755, 'samples': 9148416, 'steps': 47647, 'loss/train': 2.5190417766571045} -08/30/2021 21:51:44 - INFO - __main__ - Step 47649: {'lr': 0.00039153740877392987, 'samples': 9148608, 'steps': 47648, 'loss/train': 1.6596466302871704} -08/30/2021 21:51:45 - INFO - __main__ - Step 47650: {'lr': 0.0003915330343794777, 'samples': 9148800, 'steps': 47649, 'loss/train': 1.7659639120101929} -08/30/2021 21:51:46 - INFO - __main__ - Step 47651: {'lr': 0.0003915286599212529, 'samples': 9148992, 'steps': 47650, 'loss/train': 1.4008673429489136} -08/30/2021 21:51:46 - INFO - __main__ - Step 47652: {'lr': 0.0003915242853992573, 'samples': 9149184, 'steps': 47651, 'loss/train': 1.771010398864746} -08/30/2021 21:51:46 - INFO - __main__ - Step 47653: {'lr': 0.0003915199108134932, 'samples': 9149376, 'steps': 47652, 'loss/train': 0.19851015508174896} -08/30/2021 21:51:47 - INFO - __main__ - Step 47654: {'lr': 0.00039151553616396234, 'samples': 9149568, 'steps': 47653, 'loss/train': 1.6640305519104004} -08/30/2021 21:51:49 - INFO - __main__ - Step 47655: {'lr': 0.0003915111614506668, 'samples': 9149760, 'steps': 47654, 'loss/train': 1.647017478942871} -08/30/2021 21:51:49 - INFO - __main__ - Step 47656: {'lr': 0.0003915067866736085, 'samples': 9149952, 'steps': 47655, 'loss/train': 0.43213528394699097} -08/30/2021 21:51:50 - INFO - __main__ - Step 47657: {'lr': 0.0003915024118327895, 'samples': 9150144, 'steps': 47656, 'loss/train': 1.7160296440124512} -08/30/2021 21:51:50 - INFO - __main__ - Step 47658: {'lr': 0.0003914980369282116, 'samples': 9150336, 'steps': 47657, 'loss/train': 1.2589799165725708} -08/30/2021 21:51:50 - INFO - __main__ - Step 47659: {'lr': 0.0003914936619598769, 'samples': 9150528, 'steps': 47658, 'loss/train': 1.67231285572052} -08/30/2021 21:51:51 - INFO - __main__ - Step 47660: {'lr': 0.0003914892869277873, 'samples': 9150720, 'steps': 47659, 'loss/train': 0.037424180656671524} -08/30/2021 21:51:52 - INFO - __main__ - Step 47661: {'lr': 0.0003914849118319449, 'samples': 9150912, 'steps': 47660, 'loss/train': 0.0350780114531517} -08/30/2021 21:51:52 - INFO - __main__ - Step 47662: {'lr': 0.0003914805366723515, 'samples': 9151104, 'steps': 47661, 'loss/train': 1.2098432779312134} -08/30/2021 21:51:53 - INFO - __main__ - Step 47663: {'lr': 0.0003914761614490092, 'samples': 9151296, 'steps': 47662, 'loss/train': 1.0824904441833496} -08/30/2021 21:51:53 - INFO - __main__ - Step 47664: {'lr': 0.0003914717861619199, 'samples': 9151488, 'steps': 47663, 'loss/train': 1.6083405017852783} -08/30/2021 21:51:53 - INFO - __main__ - Step 47665: {'lr': 0.00039146741081108567, 'samples': 9151680, 'steps': 47664, 'loss/train': 1.360947608947754} -08/30/2021 21:51:55 - INFO - __main__ - Step 47666: {'lr': 0.0003914630353965083, 'samples': 9151872, 'steps': 47665, 'loss/train': 1.2947280406951904} -08/30/2021 21:51:56 - INFO - __main__ - Step 47667: {'lr': 0.00039145865991818994, 'samples': 9152064, 'steps': 47666, 'loss/train': 0.07312767207622528} -08/30/2021 21:51:56 - INFO - __main__ - Step 47668: {'lr': 0.00039145428437613246, 'samples': 9152256, 'steps': 47667, 'loss/train': 1.3473976850509644} -08/30/2021 21:51:56 - INFO - __main__ - Step 47669: {'lr': 0.0003914499087703379, 'samples': 9152448, 'steps': 47668, 'loss/train': 1.1242252588272095} -08/30/2021 21:51:57 - INFO - __main__ - Step 47670: {'lr': 0.00039144553310080816, 'samples': 9152640, 'steps': 47669, 'loss/train': 1.4932323694229126} -08/30/2021 21:51:58 - INFO - __main__ - Step 47671: {'lr': 0.0003914411573675453, 'samples': 9152832, 'steps': 47670, 'loss/train': 1.550141453742981} -08/30/2021 21:51:59 - INFO - __main__ - Step 47672: {'lr': 0.0003914367815705511, 'samples': 9153024, 'steps': 47671, 'loss/train': 1.6797983646392822} -08/30/2021 21:51:59 - INFO - __main__ - Step 47673: {'lr': 0.00039143240570982776, 'samples': 9153216, 'steps': 47672, 'loss/train': 0.8465274572372437} -08/30/2021 21:51:59 - INFO - __main__ - Step 47674: {'lr': 0.00039142802978537716, 'samples': 9153408, 'steps': 47673, 'loss/train': 1.4265611171722412} -08/30/2021 21:52:00 - INFO - __main__ - Step 47675: {'lr': 0.00039142365379720123, 'samples': 9153600, 'steps': 47674, 'loss/train': 0.9644783139228821} -08/30/2021 21:52:02 - INFO - __main__ - Step 47676: {'lr': 0.0003914192777453021, 'samples': 9153792, 'steps': 47675, 'loss/train': 1.1561638116836548} -08/30/2021 21:52:02 - INFO - __main__ - Step 47677: {'lr': 0.00039141490162968154, 'samples': 9153984, 'steps': 47676, 'loss/train': 1.2505598068237305} -08/30/2021 21:52:02 - INFO - __main__ - Step 47678: {'lr': 0.0003914105254503416, 'samples': 9154176, 'steps': 47677, 'loss/train': 0.14060133695602417} -08/30/2021 21:52:03 - INFO - __main__ - Step 47679: {'lr': 0.00039140614920728424, 'samples': 9154368, 'steps': 47678, 'loss/train': 1.32106614112854} -08/30/2021 21:52:03 - INFO - __main__ - Step 47680: {'lr': 0.0003914017729005115, 'samples': 9154560, 'steps': 47679, 'loss/train': 1.5116673707962036} -08/30/2021 21:52:05 - INFO - __main__ - Step 47681: {'lr': 0.00039139739653002527, 'samples': 9154752, 'steps': 47680, 'loss/train': 1.3136156797409058} -08/30/2021 21:52:05 - INFO - __main__ - Step 47682: {'lr': 0.00039139302009582753, 'samples': 9154944, 'steps': 47681, 'loss/train': 1.2316099405288696} -08/30/2021 21:52:06 - INFO - __main__ - Step 47683: {'lr': 0.00039138864359792035, 'samples': 9155136, 'steps': 47682, 'loss/train': 1.121056079864502} -08/30/2021 21:52:06 - INFO - __main__ - Step 47684: {'lr': 0.0003913842670363056, 'samples': 9155328, 'steps': 47683, 'loss/train': 0.18311218917369843} -08/30/2021 21:52:06 - INFO - __main__ - Step 47685: {'lr': 0.0003913798904109853, 'samples': 9155520, 'steps': 47684, 'loss/train': 0.2778708338737488} -08/30/2021 21:52:07 - INFO - __main__ - Step 47686: {'lr': 0.0003913755137219614, 'samples': 9155712, 'steps': 47685, 'loss/train': 1.6655666828155518} -08/30/2021 21:52:08 - INFO - __main__ - Step 47687: {'lr': 0.00039137113696923587, 'samples': 9155904, 'steps': 47686, 'loss/train': 0.5548986792564392} -08/30/2021 21:52:09 - INFO - __main__ - Step 47688: {'lr': 0.00039136676015281063, 'samples': 9156096, 'steps': 47687, 'loss/train': 1.1955080032348633} -08/30/2021 21:52:09 - INFO - __main__ - Step 47689: {'lr': 0.00039136238327268776, 'samples': 9156288, 'steps': 47688, 'loss/train': 1.114600419998169} -08/30/2021 21:52:09 - INFO - __main__ - Step 47690: {'lr': 0.0003913580063288692, 'samples': 9156480, 'steps': 47689, 'loss/train': 1.1117278337478638} -08/30/2021 21:52:10 - INFO - __main__ - Step 47691: {'lr': 0.0003913536293213569, 'samples': 9156672, 'steps': 47690, 'loss/train': 1.5939730405807495} -08/30/2021 21:52:10 - INFO - __main__ - Step 47692: {'lr': 0.00039134925225015277, 'samples': 9156864, 'steps': 47691, 'loss/train': 1.0508226156234741} -08/30/2021 21:52:12 - INFO - __main__ - Step 47693: {'lr': 0.0003913448751152589, 'samples': 9157056, 'steps': 47692, 'loss/train': 2.471090078353882} -08/30/2021 21:52:12 - INFO - __main__ - Step 47694: {'lr': 0.0003913404979166772, 'samples': 9157248, 'steps': 47693, 'loss/train': 1.124953269958496} -08/30/2021 21:52:13 - INFO - __main__ - Step 47695: {'lr': 0.00039133612065440964, 'samples': 9157440, 'steps': 47694, 'loss/train': 1.1248496770858765} -08/30/2021 21:52:13 - INFO - __main__ - Step 47696: {'lr': 0.0003913317433284582, 'samples': 9157632, 'steps': 47695, 'loss/train': 1.6754659414291382} -08/30/2021 21:52:13 - INFO - __main__ - Step 47697: {'lr': 0.0003913273659388249, 'samples': 9157824, 'steps': 47696, 'loss/train': 1.3552273511886597} -08/30/2021 21:52:15 - INFO - __main__ - Step 47698: {'lr': 0.0003913229884855117, 'samples': 9158016, 'steps': 47697, 'loss/train': 2.4169790744781494} -08/30/2021 21:52:16 - INFO - __main__ - Step 47699: {'lr': 0.00039131861096852044, 'samples': 9158208, 'steps': 47698, 'loss/train': 1.438448429107666} -08/30/2021 21:52:16 - INFO - __main__ - Step 47700: {'lr': 0.0003913142333878533, 'samples': 9158400, 'steps': 47699, 'loss/train': 1.4683477878570557} -08/30/2021 21:52:16 - INFO - __main__ - Step 47701: {'lr': 0.0003913098557435121, 'samples': 9158592, 'steps': 47700, 'loss/train': 1.1579670906066895} -08/30/2021 21:52:17 - INFO - __main__ - Step 47702: {'lr': 0.00039130547803549877, 'samples': 9158784, 'steps': 47701, 'loss/train': 0.5222880244255066} -08/30/2021 21:52:18 - INFO - __main__ - Step 47703: {'lr': 0.00039130110026381547, 'samples': 9158976, 'steps': 47702, 'loss/train': 1.1332464218139648} -08/30/2021 21:52:18 - INFO - __main__ - Step 47704: {'lr': 0.00039129672242846407, 'samples': 9159168, 'steps': 47703, 'loss/train': 1.3162339925765991} -08/30/2021 21:52:19 - INFO - __main__ - Step 47705: {'lr': 0.0003912923445294465, 'samples': 9159360, 'steps': 47704, 'loss/train': 1.6958369016647339} -08/30/2021 21:52:19 - INFO - __main__ - Step 47706: {'lr': 0.00039128796656676487, 'samples': 9159552, 'steps': 47705, 'loss/train': 1.4678961038589478} -08/30/2021 21:52:20 - INFO - __main__ - Step 47707: {'lr': 0.000391283588540421, 'samples': 9159744, 'steps': 47706, 'loss/train': 1.2647621631622314} -08/30/2021 21:52:20 - INFO - __main__ - Step 47708: {'lr': 0.00039127921045041693, 'samples': 9159936, 'steps': 47707, 'loss/train': 1.7813242673873901} -08/30/2021 21:52:22 - INFO - __main__ - Step 47709: {'lr': 0.00039127483229675457, 'samples': 9160128, 'steps': 47708, 'loss/train': 1.9884852170944214} -08/30/2021 21:52:22 - INFO - __main__ - Step 47710: {'lr': 0.0003912704540794361, 'samples': 9160320, 'steps': 47709, 'loss/train': 1.2117905616760254} -08/30/2021 21:52:22 - INFO - __main__ - Step 47711: {'lr': 0.0003912660757984632, 'samples': 9160512, 'steps': 47710, 'loss/train': 2.0725977420806885} -08/30/2021 21:52:23 - INFO - __main__ - Step 47712: {'lr': 0.00039126169745383807, 'samples': 9160704, 'steps': 47711, 'loss/train': 1.0492584705352783} -08/30/2021 21:52:23 - INFO - __main__ - Step 47713: {'lr': 0.00039125731904556254, 'samples': 9160896, 'steps': 47712, 'loss/train': 1.644363284111023} -08/30/2021 21:52:25 - INFO - __main__ - Step 47714: {'lr': 0.0003912529405736387, 'samples': 9161088, 'steps': 47713, 'loss/train': 1.2478951215744019} -08/30/2021 21:52:25 - INFO - __main__ - Step 47715: {'lr': 0.00039124856203806834, 'samples': 9161280, 'steps': 47714, 'loss/train': 1.6116446256637573} -08/30/2021 21:52:26 - INFO - __main__ - Step 47716: {'lr': 0.0003912441834388537, 'samples': 9161472, 'steps': 47715, 'loss/train': 0.12646691501140594} -08/30/2021 21:52:26 - INFO - __main__ - Step 47717: {'lr': 0.00039123980477599664, 'samples': 9161664, 'steps': 47716, 'loss/train': 1.5476903915405273} -08/30/2021 21:52:26 - INFO - __main__ - Step 47718: {'lr': 0.00039123542604949904, 'samples': 9161856, 'steps': 47717, 'loss/train': 0.11959554255008698} -08/30/2021 21:52:28 - INFO - __main__ - Step 47719: {'lr': 0.0003912310472593629, 'samples': 9162048, 'steps': 47718, 'loss/train': 1.5829530954360962} -08/30/2021 21:52:29 - INFO - __main__ - Step 47720: {'lr': 0.0003912266684055902, 'samples': 9162240, 'steps': 47719, 'loss/train': 1.357043743133545} -08/30/2021 21:52:29 - INFO - __main__ - Step 47721: {'lr': 0.000391222289488183, 'samples': 9162432, 'steps': 47720, 'loss/train': 1.4404535293579102} -08/30/2021 21:52:29 - INFO - __main__ - Step 47722: {'lr': 0.00039121791050714317, 'samples': 9162624, 'steps': 47721, 'loss/train': 1.5500365495681763} -08/30/2021 21:52:30 - INFO - __main__ - Step 47723: {'lr': 0.0003912135314624728, 'samples': 9162816, 'steps': 47722, 'loss/train': 1.1916786432266235} -08/30/2021 21:52:30 - INFO - __main__ - Step 47724: {'lr': 0.00039120915235417377, 'samples': 9163008, 'steps': 47723, 'loss/train': 1.1242374181747437} -08/30/2021 21:52:32 - INFO - __main__ - Step 47725: {'lr': 0.0003912047731822481, 'samples': 9163200, 'steps': 47724, 'loss/train': 2.36653470993042} -08/30/2021 21:52:32 - INFO - __main__ - Step 47726: {'lr': 0.0003912003939466977, 'samples': 9163392, 'steps': 47725, 'loss/train': 1.5357462167739868} -08/30/2021 21:52:32 - INFO - __main__ - Step 47727: {'lr': 0.0003911960146475245, 'samples': 9163584, 'steps': 47726, 'loss/train': 1.4503769874572754} -08/30/2021 21:52:33 - INFO - __main__ - Step 47728: {'lr': 0.0003911916352847307, 'samples': 9163776, 'steps': 47727, 'loss/train': 1.131748080253601} -08/30/2021 21:52:33 - INFO - __main__ - Step 47729: {'lr': 0.0003911872558583181, 'samples': 9163968, 'steps': 47728, 'loss/train': 2.0050408840179443} -08/30/2021 21:52:35 - INFO - __main__ - Step 47730: {'lr': 0.00039118287636828866, 'samples': 9164160, 'steps': 47729, 'loss/train': 1.6159602403640747} -08/30/2021 21:52:35 - INFO - __main__ - Step 47731: {'lr': 0.0003911784968146444, 'samples': 9164352, 'steps': 47730, 'loss/train': 1.4069621562957764} -08/30/2021 21:52:35 - INFO - __main__ - Step 47732: {'lr': 0.00039117411719738726, 'samples': 9164544, 'steps': 47731, 'loss/train': 1.5779651403427124} -08/30/2021 21:52:36 - INFO - __main__ - Step 47733: {'lr': 0.0003911697375165193, 'samples': 9164736, 'steps': 47732, 'loss/train': 0.6587130427360535} -08/30/2021 21:52:36 - INFO - __main__ - Step 47734: {'lr': 0.00039116535777204237, 'samples': 9164928, 'steps': 47733, 'loss/train': 0.37427887320518494} -08/30/2021 21:52:36 - INFO - __main__ - Step 47735: {'lr': 0.00039116097796395856, 'samples': 9165120, 'steps': 47734, 'loss/train': 0.9871906638145447} -08/30/2021 21:52:38 - INFO - __main__ - Step 47736: {'lr': 0.00039115659809226975, 'samples': 9165312, 'steps': 47735, 'loss/train': 1.377522349357605} -08/30/2021 21:52:39 - INFO - __main__ - Step 47737: {'lr': 0.00039115221815697797, 'samples': 9165504, 'steps': 47736, 'loss/train': 0.12300369888544083} -08/30/2021 21:52:39 - INFO - __main__ - Step 47738: {'lr': 0.00039114783815808526, 'samples': 9165696, 'steps': 47737, 'loss/train': 1.6736088991165161} -08/30/2021 21:52:39 - INFO - __main__ - Step 47739: {'lr': 0.0003911434580955934, 'samples': 9165888, 'steps': 47738, 'loss/train': 0.9321932792663574} -08/30/2021 21:52:40 - INFO - __main__ - Step 47740: {'lr': 0.00039113907796950453, 'samples': 9166080, 'steps': 47739, 'loss/train': 1.7272741794586182} -08/30/2021 21:52:41 - INFO - __main__ - Step 47741: {'lr': 0.0003911346977798206, 'samples': 9166272, 'steps': 47740, 'loss/train': 0.4666619300842285} -08/30/2021 21:52:42 - INFO - __main__ - Step 47742: {'lr': 0.0003911303175265435, 'samples': 9166464, 'steps': 47741, 'loss/train': 1.4512208700180054} -08/30/2021 21:52:42 - INFO - __main__ - Step 47743: {'lr': 0.00039112593720967524, 'samples': 9166656, 'steps': 47742, 'loss/train': 1.0627355575561523} -08/30/2021 21:52:42 - INFO - __main__ - Step 47744: {'lr': 0.00039112155682921785, 'samples': 9166848, 'steps': 47743, 'loss/train': 1.1207740306854248} -08/30/2021 21:52:43 - INFO - __main__ - Step 47745: {'lr': 0.00039111717638517325, 'samples': 9167040, 'steps': 47744, 'loss/train': 0.9456784129142761} -08/30/2021 21:52:45 - INFO - __main__ - Step 47746: {'lr': 0.00039111279587754344, 'samples': 9167232, 'steps': 47745, 'loss/train': 1.540494441986084} -08/30/2021 21:52:45 - INFO - __main__ - Step 47747: {'lr': 0.0003911084153063303, 'samples': 9167424, 'steps': 47746, 'loss/train': 1.6111749410629272} -08/30/2021 21:52:46 - INFO - __main__ - Step 47748: {'lr': 0.000391104034671536, 'samples': 9167616, 'steps': 47747, 'loss/train': 1.0142439603805542} -08/30/2021 21:52:46 - INFO - __main__ - Step 47749: {'lr': 0.00039109965397316236, 'samples': 9167808, 'steps': 47748, 'loss/train': 1.4544976949691772} -08/30/2021 21:52:46 - INFO - __main__ - Step 47750: {'lr': 0.0003910952732112114, 'samples': 9168000, 'steps': 47749, 'loss/train': 1.2413040399551392} -08/30/2021 21:52:48 - INFO - __main__ - Step 47751: {'lr': 0.00039109089238568507, 'samples': 9168192, 'steps': 47750, 'loss/train': 1.8442610502243042} -08/30/2021 21:52:49 - INFO - __main__ - Step 47752: {'lr': 0.00039108651149658534, 'samples': 9168384, 'steps': 47751, 'loss/train': 1.941083312034607} -08/30/2021 21:52:49 - INFO - __main__ - Step 47753: {'lr': 0.0003910821305439143, 'samples': 9168576, 'steps': 47752, 'loss/train': 0.8489578366279602} -08/30/2021 21:52:49 - INFO - __main__ - Step 47754: {'lr': 0.00039107774952767374, 'samples': 9168768, 'steps': 47753, 'loss/train': 0.9137014746665955} -08/30/2021 21:52:50 - INFO - __main__ - Step 47755: {'lr': 0.0003910733684478657, 'samples': 9168960, 'steps': 47754, 'loss/train': 1.9159895181655884} -08/30/2021 21:52:51 - INFO - __main__ - Step 47756: {'lr': 0.00039106898730449223, 'samples': 9169152, 'steps': 47755, 'loss/train': 1.085327386856079} -08/30/2021 21:52:52 - INFO - __main__ - Step 47757: {'lr': 0.0003910646060975553, 'samples': 9169344, 'steps': 47756, 'loss/train': 1.554229974746704} -08/30/2021 21:52:52 - INFO - __main__ - Step 47758: {'lr': 0.00039106022482705675, 'samples': 9169536, 'steps': 47757, 'loss/train': 1.5550178289413452} -08/30/2021 21:52:52 - INFO - __main__ - Step 47759: {'lr': 0.0003910558434929987, 'samples': 9169728, 'steps': 47758, 'loss/train': 1.4158895015716553} -08/30/2021 21:52:53 - INFO - __main__ - Step 47760: {'lr': 0.000391051462095383, 'samples': 9169920, 'steps': 47759, 'loss/train': 1.0833162069320679} -08/30/2021 21:52:53 - INFO - __main__ - Step 47761: {'lr': 0.0003910470806342117, 'samples': 9170112, 'steps': 47760, 'loss/train': 1.4738497734069824} -08/30/2021 21:52:55 - INFO - __main__ - Step 47762: {'lr': 0.00039104269910948675, 'samples': 9170304, 'steps': 47761, 'loss/train': 1.1122866868972778} -08/30/2021 21:52:55 - INFO - __main__ - Step 47763: {'lr': 0.00039103831752121024, 'samples': 9170496, 'steps': 47762, 'loss/train': 1.7349724769592285} -08/30/2021 21:52:55 - INFO - __main__ - Step 47764: {'lr': 0.00039103393586938394, 'samples': 9170688, 'steps': 47763, 'loss/train': 1.354042410850525} -08/30/2021 21:52:56 - INFO - __main__ - Step 47765: {'lr': 0.00039102955415401, 'samples': 9170880, 'steps': 47764, 'loss/train': 2.238220691680908} -08/30/2021 21:52:56 - INFO - __main__ - Step 47766: {'lr': 0.00039102517237509025, 'samples': 9171072, 'steps': 47765, 'loss/train': 1.214213252067566} -08/30/2021 21:52:58 - INFO - __main__ - Step 47767: {'lr': 0.0003910207905326267, 'samples': 9171264, 'steps': 47766, 'loss/train': 0.09470254927873611} -08/30/2021 21:52:58 - INFO - __main__ - Step 47768: {'lr': 0.00039101640862662147, 'samples': 9171456, 'steps': 47767, 'loss/train': 0.06765691190958023} -08/30/2021 21:52:58 - INFO - __main__ - Step 47769: {'lr': 0.0003910120266570764, 'samples': 9171648, 'steps': 47768, 'loss/train': 1.2740015983581543} -08/30/2021 21:52:59 - INFO - __main__ - Step 47770: {'lr': 0.0003910076446239934, 'samples': 9171840, 'steps': 47769, 'loss/train': 1.1646220684051514} -08/30/2021 21:52:59 - INFO - __main__ - Step 47771: {'lr': 0.00039100326252737463, 'samples': 9172032, 'steps': 47770, 'loss/train': 0.7772130370140076} -08/30/2021 21:53:01 - INFO - __main__ - Step 47772: {'lr': 0.00039099888036722187, 'samples': 9172224, 'steps': 47771, 'loss/train': 1.241371989250183} -08/30/2021 21:53:01 - INFO - __main__ - Step 47773: {'lr': 0.00039099449814353725, 'samples': 9172416, 'steps': 47772, 'loss/train': 1.0401647090911865} -08/30/2021 21:53:02 - INFO - __main__ - Step 47774: {'lr': 0.00039099011585632266, 'samples': 9172608, 'steps': 47773, 'loss/train': 2.0747087001800537} -08/30/2021 21:53:02 - INFO - __main__ - Step 47775: {'lr': 0.0003909857335055801, 'samples': 9172800, 'steps': 47774, 'loss/train': 1.495471477508545} -08/30/2021 21:53:02 - INFO - __main__ - Step 47776: {'lr': 0.00039098135109131156, 'samples': 9172992, 'steps': 47775, 'loss/train': 1.5542500019073486} -08/30/2021 21:53:04 - INFO - __main__ - Step 47777: {'lr': 0.00039097696861351895, 'samples': 9173184, 'steps': 47776, 'loss/train': 1.196526288986206} -08/30/2021 21:53:04 - INFO - __main__ - Step 47778: {'lr': 0.00039097258607220445, 'samples': 9173376, 'steps': 47777, 'loss/train': 1.1890817880630493} -08/30/2021 21:53:05 - INFO - __main__ - Step 47779: {'lr': 0.00039096820346736974, 'samples': 9173568, 'steps': 47778, 'loss/train': 1.9189021587371826} -08/30/2021 21:53:05 - INFO - __main__ - Step 47780: {'lr': 0.00039096382079901695, 'samples': 9173760, 'steps': 47779, 'loss/train': 0.8137530088424683} -08/30/2021 21:53:05 - INFO - __main__ - Step 47781: {'lr': 0.000390959438067148, 'samples': 9173952, 'steps': 47780, 'loss/train': 1.1605702638626099} -08/30/2021 21:53:07 - INFO - __main__ - Step 47782: {'lr': 0.000390955055271765, 'samples': 9174144, 'steps': 47781, 'loss/train': 1.4485225677490234} -08/30/2021 21:53:07 - INFO - __main__ - Step 47783: {'lr': 0.00039095067241286973, 'samples': 9174336, 'steps': 47782, 'loss/train': 2.0699949264526367} -08/30/2021 21:53:08 - INFO - __main__ - Step 47784: {'lr': 0.00039094628949046435, 'samples': 9174528, 'steps': 47783, 'loss/train': 2.5348355770111084} -08/30/2021 21:53:08 - INFO - __main__ - Step 47785: {'lr': 0.0003909419065045507, 'samples': 9174720, 'steps': 47784, 'loss/train': 1.4091465473175049} -08/30/2021 21:53:08 - INFO - __main__ - Step 47786: {'lr': 0.0003909375234551308, 'samples': 9174912, 'steps': 47785, 'loss/train': 0.7870063781738281} -08/30/2021 21:53:09 - INFO - __main__ - Step 47787: {'lr': 0.0003909331403422066, 'samples': 9175104, 'steps': 47786, 'loss/train': 1.681264877319336} -08/30/2021 21:53:11 - INFO - __main__ - Step 47788: {'lr': 0.00039092875716578013, 'samples': 9175296, 'steps': 47787, 'loss/train': 1.670573115348816} -08/30/2021 21:53:11 - INFO - __main__ - Step 47789: {'lr': 0.00039092437392585335, 'samples': 9175488, 'steps': 47788, 'loss/train': 1.2213523387908936} -08/30/2021 21:53:11 - INFO - __main__ - Step 47790: {'lr': 0.0003909199906224282, 'samples': 9175680, 'steps': 47789, 'loss/train': 1.4888702630996704} -08/30/2021 21:53:12 - INFO - __main__ - Step 47791: {'lr': 0.00039091560725550676, 'samples': 9175872, 'steps': 47790, 'loss/train': 1.2352653741836548} -08/30/2021 21:53:12 - INFO - __main__ - Step 47792: {'lr': 0.0003909112238250908, 'samples': 9176064, 'steps': 47791, 'loss/train': 0.04455862566828728} -08/30/2021 21:53:14 - INFO - __main__ - Step 47793: {'lr': 0.0003909068403311825, 'samples': 9176256, 'steps': 47792, 'loss/train': 1.3104918003082275} -08/30/2021 21:53:14 - INFO - __main__ - Step 47794: {'lr': 0.0003909024567737837, 'samples': 9176448, 'steps': 47793, 'loss/train': 1.0472642183303833} -08/30/2021 21:53:14 - INFO - __main__ - Step 47795: {'lr': 0.0003908980731528965, 'samples': 9176640, 'steps': 47794, 'loss/train': 1.5005263090133667} -08/30/2021 21:53:15 - INFO - __main__ - Step 47796: {'lr': 0.0003908936894685227, 'samples': 9176832, 'steps': 47795, 'loss/train': 1.6320569515228271} -08/30/2021 21:53:15 - INFO - __main__ - Step 47797: {'lr': 0.0003908893057206644, 'samples': 9177024, 'steps': 47796, 'loss/train': 0.8997487425804138} -08/30/2021 21:53:17 - INFO - __main__ - Step 47798: {'lr': 0.00039088492190932365, 'samples': 9177216, 'steps': 47797, 'loss/train': 1.0634236335754395} -08/30/2021 21:53:17 - INFO - __main__ - Step 47799: {'lr': 0.00039088053803450223, 'samples': 9177408, 'steps': 47798, 'loss/train': 1.648417592048645} -08/30/2021 21:53:17 - INFO - __main__ - Step 47800: {'lr': 0.00039087615409620223, 'samples': 9177600, 'steps': 47799, 'loss/train': 0.7527249455451965} -08/30/2021 21:53:18 - INFO - __main__ - Step 47801: {'lr': 0.00039087177009442567, 'samples': 9177792, 'steps': 47800, 'loss/train': 0.8085160255432129} -08/30/2021 21:53:18 - INFO - __main__ - Step 47802: {'lr': 0.0003908673860291744, 'samples': 9177984, 'steps': 47801, 'loss/train': 1.4453188180923462} -08/30/2021 21:53:20 - INFO - __main__ - Step 47803: {'lr': 0.0003908630019004504, 'samples': 9178176, 'steps': 47802, 'loss/train': 1.3109943866729736} -08/30/2021 21:53:21 - INFO - __main__ - Step 47804: {'lr': 0.00039085861770825586, 'samples': 9178368, 'steps': 47803, 'loss/train': 1.4579682350158691} -08/30/2021 21:53:21 - INFO - __main__ - Step 47805: {'lr': 0.00039085423345259254, 'samples': 9178560, 'steps': 47804, 'loss/train': 0.5984822511672974} -08/30/2021 21:53:21 - INFO - __main__ - Step 47806: {'lr': 0.00039084984913346246, 'samples': 9178752, 'steps': 47805, 'loss/train': 1.1868911981582642} -08/30/2021 21:53:22 - INFO - __main__ - Step 47807: {'lr': 0.0003908454647508676, 'samples': 9178944, 'steps': 47806, 'loss/train': 1.2919950485229492} -08/30/2021 21:53:23 - INFO - __main__ - Step 47808: {'lr': 0.0003908410803048099, 'samples': 9179136, 'steps': 47807, 'loss/train': 1.1233738660812378} -08/30/2021 21:53:24 - INFO - __main__ - Step 47809: {'lr': 0.0003908366957952915, 'samples': 9179328, 'steps': 47808, 'loss/train': 2.2985167503356934} -08/30/2021 21:53:24 - INFO - __main__ - Step 47810: {'lr': 0.0003908323112223142, 'samples': 9179520, 'steps': 47809, 'loss/train': 1.0263887643814087} -08/30/2021 21:53:25 - INFO - __main__ - Step 47811: {'lr': 0.0003908279265858801, 'samples': 9179712, 'steps': 47810, 'loss/train': 0.3828620910644531} -08/30/2021 21:53:25 - INFO - __main__ - Step 47812: {'lr': 0.00039082354188599094, 'samples': 9179904, 'steps': 47811, 'loss/train': 1.3684004545211792} -08/30/2021 21:53:26 - INFO - __main__ - Step 47813: {'lr': 0.00039081915712264897, 'samples': 9180096, 'steps': 47812, 'loss/train': 1.2352933883666992} -08/30/2021 21:53:27 - INFO - __main__ - Step 47814: {'lr': 0.000390814772295856, 'samples': 9180288, 'steps': 47813, 'loss/train': 1.4901241064071655} -08/30/2021 21:53:27 - INFO - __main__ - Step 47815: {'lr': 0.0003908103874056142, 'samples': 9180480, 'steps': 47814, 'loss/train': 0.19271336495876312} -08/30/2021 21:53:28 - INFO - __main__ - Step 47816: {'lr': 0.0003908060024519253, 'samples': 9180672, 'steps': 47815, 'loss/train': 1.2182456254959106} -08/30/2021 21:53:28 - INFO - __main__ - Step 47817: {'lr': 0.0003908016174347915, 'samples': 9180864, 'steps': 47816, 'loss/train': 1.3654496669769287} -08/30/2021 21:53:28 - INFO - __main__ - Step 47818: {'lr': 0.00039079723235421456, 'samples': 9181056, 'steps': 47817, 'loss/train': 2.243772506713867} -08/30/2021 21:53:30 - INFO - __main__ - Step 47819: {'lr': 0.0003907928472101966, 'samples': 9181248, 'steps': 47818, 'loss/train': 1.1528795957565308} -08/30/2021 21:53:31 - INFO - __main__ - Step 47820: {'lr': 0.00039078846200273955, 'samples': 9181440, 'steps': 47819, 'loss/train': 1.8712186813354492} -08/30/2021 21:53:31 - INFO - __main__ - Step 47821: {'lr': 0.00039078407673184536, 'samples': 9181632, 'steps': 47820, 'loss/train': 1.1071661710739136} -08/30/2021 21:53:31 - INFO - __main__ - Step 47822: {'lr': 0.000390779691397516, 'samples': 9181824, 'steps': 47821, 'loss/train': 0.027321387082338333} -08/30/2021 21:53:32 - INFO - __main__ - Step 47823: {'lr': 0.0003907753059997536, 'samples': 9182016, 'steps': 47822, 'loss/train': 1.240317702293396} -08/30/2021 21:53:32 - INFO - __main__ - Step 47824: {'lr': 0.00039077092053855996, 'samples': 9182208, 'steps': 47823, 'loss/train': 1.1229140758514404} -08/30/2021 21:53:34 - INFO - __main__ - Step 47825: {'lr': 0.0003907665350139371, 'samples': 9182400, 'steps': 47824, 'loss/train': 1.1748948097229004} -08/30/2021 21:53:34 - INFO - __main__ - Step 47826: {'lr': 0.00039076214942588704, 'samples': 9182592, 'steps': 47825, 'loss/train': 1.1977704763412476} -08/30/2021 21:53:34 - INFO - __main__ - Step 47827: {'lr': 0.00039075776377441176, 'samples': 9182784, 'steps': 47826, 'loss/train': 1.5836211442947388} -08/30/2021 21:53:35 - INFO - __main__ - Step 47828: {'lr': 0.00039075337805951314, 'samples': 9182976, 'steps': 47827, 'loss/train': 1.2987773418426514} -08/30/2021 21:53:35 - INFO - __main__ - Step 47829: {'lr': 0.0003907489922811932, 'samples': 9183168, 'steps': 47828, 'loss/train': 1.127219319343567} -08/30/2021 21:53:35 - INFO - __main__ - Step 47830: {'lr': 0.000390744606439454, 'samples': 9183360, 'steps': 47829, 'loss/train': 1.4508413076400757} -08/30/2021 21:53:37 - INFO - __main__ - Step 47831: {'lr': 0.00039074022053429746, 'samples': 9183552, 'steps': 47830, 'loss/train': 1.0003811120986938} -08/30/2021 21:53:37 - INFO - __main__ - Step 47832: {'lr': 0.00039073583456572547, 'samples': 9183744, 'steps': 47831, 'loss/train': 1.0092073678970337} -08/30/2021 21:53:38 - INFO - __main__ - Step 47833: {'lr': 0.0003907314485337402, 'samples': 9183936, 'steps': 47832, 'loss/train': 0.6801624894142151} -08/30/2021 21:53:38 - INFO - __main__ - Step 47834: {'lr': 0.00039072706243834345, 'samples': 9184128, 'steps': 47833, 'loss/train': 1.3620165586471558} -08/30/2021 21:53:39 - INFO - __main__ - Step 47835: {'lr': 0.0003907226762795372, 'samples': 9184320, 'steps': 47834, 'loss/train': 1.6177831888198853} -08/30/2021 21:53:40 - INFO - __main__ - Step 47836: {'lr': 0.0003907182900573235, 'samples': 9184512, 'steps': 47835, 'loss/train': 1.9017062187194824} -08/30/2021 21:53:40 - INFO - __main__ - Step 47837: {'lr': 0.00039071390377170434, 'samples': 9184704, 'steps': 47836, 'loss/train': 2.029161214828491} -08/30/2021 21:53:41 - INFO - __main__ - Step 47838: {'lr': 0.00039070951742268173, 'samples': 9184896, 'steps': 47837, 'loss/train': 1.786980390548706} -08/30/2021 21:53:41 - INFO - __main__ - Step 47839: {'lr': 0.00039070513101025753, 'samples': 9185088, 'steps': 47838, 'loss/train': 1.1534768342971802} -08/30/2021 21:53:41 - INFO - __main__ - Step 47840: {'lr': 0.00039070074453443374, 'samples': 9185280, 'steps': 47839, 'loss/train': 2.1194944381713867} -08/30/2021 21:53:43 - INFO - __main__ - Step 47841: {'lr': 0.0003906963579952124, 'samples': 9185472, 'steps': 47840, 'loss/train': 1.5754231214523315} -08/30/2021 21:53:44 - INFO - __main__ - Step 47842: {'lr': 0.0003906919713925954, 'samples': 9185664, 'steps': 47841, 'loss/train': 0.2891518175601959} -08/30/2021 21:53:44 - INFO - __main__ - Step 47843: {'lr': 0.00039068758472658483, 'samples': 9185856, 'steps': 47842, 'loss/train': 1.1745272874832153} -08/30/2021 21:53:44 - INFO - __main__ - Step 47844: {'lr': 0.0003906831979971826, 'samples': 9186048, 'steps': 47843, 'loss/train': 1.2733420133590698} -08/30/2021 21:53:45 - INFO - __main__ - Step 47845: {'lr': 0.0003906788112043907, 'samples': 9186240, 'steps': 47844, 'loss/train': 1.5973608493804932} -08/30/2021 21:53:46 - INFO - __main__ - Step 47846: {'lr': 0.00039067442434821106, 'samples': 9186432, 'steps': 47845, 'loss/train': 1.3231230974197388} -08/30/2021 21:53:47 - INFO - __main__ - Step 47847: {'lr': 0.0003906700374286457, 'samples': 9186624, 'steps': 47846, 'loss/train': 1.4371161460876465} -08/30/2021 21:53:47 - INFO - __main__ - Step 47848: {'lr': 0.0003906656504456966, 'samples': 9186816, 'steps': 47847, 'loss/train': 1.802668809890747} -08/30/2021 21:53:47 - INFO - __main__ - Step 47849: {'lr': 0.0003906612633993657, 'samples': 9187008, 'steps': 47848, 'loss/train': 1.4726520776748657} -08/30/2021 21:53:48 - INFO - __main__ - Step 47850: {'lr': 0.00039065687628965506, 'samples': 9187200, 'steps': 47849, 'loss/train': 1.7587085962295532} -08/30/2021 21:53:49 - INFO - __main__ - Step 47851: {'lr': 0.0003906524891165666, 'samples': 9187392, 'steps': 47850, 'loss/train': 1.3055469989776611} -08/30/2021 21:53:50 - INFO - __main__ - Step 47852: {'lr': 0.00039064810188010223, 'samples': 9187584, 'steps': 47851, 'loss/train': 1.5824121236801147} -08/30/2021 21:53:50 - INFO - __main__ - Step 47853: {'lr': 0.000390643714580264, 'samples': 9187776, 'steps': 47852, 'loss/train': 1.0733797550201416} -08/30/2021 21:53:50 - INFO - __main__ - Step 47854: {'lr': 0.000390639327217054, 'samples': 9187968, 'steps': 47853, 'loss/train': 1.1565110683441162} -08/30/2021 21:53:51 - INFO - __main__ - Step 47855: {'lr': 0.000390634939790474, 'samples': 9188160, 'steps': 47854, 'loss/train': 1.4136343002319336} -08/30/2021 21:53:51 - INFO - __main__ - Step 47856: {'lr': 0.00039063055230052605, 'samples': 9188352, 'steps': 47855, 'loss/train': 1.7883784770965576} -08/30/2021 21:53:54 - INFO - __main__ - Step 47857: {'lr': 0.00039062616474721217, 'samples': 9188544, 'steps': 47856, 'loss/train': 1.0259677171707153} -08/30/2021 21:53:54 - INFO - __main__ - Step 47858: {'lr': 0.00039062177713053436, 'samples': 9188736, 'steps': 47857, 'loss/train': 0.8832210898399353} -08/30/2021 21:53:54 - INFO - __main__ - Step 47859: {'lr': 0.00039061738945049454, 'samples': 9188928, 'steps': 47858, 'loss/train': 1.596526026725769} -08/30/2021 21:53:55 - INFO - __main__ - Step 47860: {'lr': 0.0003906130017070946, 'samples': 9189120, 'steps': 47859, 'loss/train': 1.2877858877182007} -08/30/2021 21:53:55 - INFO - __main__ - Step 47861: {'lr': 0.0003906086139003366, 'samples': 9189312, 'steps': 47860, 'loss/train': 1.2230300903320312} -08/30/2021 21:53:55 - INFO - __main__ - Step 47862: {'lr': 0.00039060422603022266, 'samples': 9189504, 'steps': 47861, 'loss/train': 1.6417721509933472} -08/30/2021 21:53:57 - INFO - __main__ - Step 47863: {'lr': 0.0003905998380967546, 'samples': 9189696, 'steps': 47862, 'loss/train': 1.4069128036499023} -08/30/2021 21:53:57 - INFO - __main__ - Step 47864: {'lr': 0.00039059545009993436, 'samples': 9189888, 'steps': 47863, 'loss/train': 1.6009562015533447} -08/30/2021 21:53:58 - INFO - __main__ - Step 47865: {'lr': 0.00039059106203976403, 'samples': 9190080, 'steps': 47864, 'loss/train': 1.6115458011627197} -08/30/2021 21:53:58 - INFO - __main__ - Step 47866: {'lr': 0.00039058667391624546, 'samples': 9190272, 'steps': 47865, 'loss/train': 1.3307462930679321} -08/30/2021 21:53:58 - INFO - __main__ - Step 47867: {'lr': 0.00039058228572938074, 'samples': 9190464, 'steps': 47866, 'loss/train': 1.7715603113174438} -08/30/2021 21:54:00 - INFO - __main__ - Step 47868: {'lr': 0.00039057789747917184, 'samples': 9190656, 'steps': 47867, 'loss/train': 1.685539722442627} -08/30/2021 21:54:00 - INFO - __main__ - Step 47869: {'lr': 0.00039057350916562065, 'samples': 9190848, 'steps': 47868, 'loss/train': 1.5434104204177856} -08/30/2021 21:54:01 - INFO - __main__ - Step 47870: {'lr': 0.0003905691207887293, 'samples': 9191040, 'steps': 47869, 'loss/train': 1.1712714433670044} -08/30/2021 21:54:01 - INFO - __main__ - Step 47871: {'lr': 0.00039056473234849964, 'samples': 9191232, 'steps': 47870, 'loss/train': 0.8834353089332581} -08/30/2021 21:54:02 - INFO - __main__ - Step 47872: {'lr': 0.0003905603438449337, 'samples': 9191424, 'steps': 47871, 'loss/train': 1.0077705383300781} -08/30/2021 21:54:04 - INFO - __main__ - Step 47873: {'lr': 0.00039055595527803333, 'samples': 9191616, 'steps': 47872, 'loss/train': 0.5067219138145447} -08/30/2021 21:54:04 - INFO - __main__ - Step 47874: {'lr': 0.00039055156664780067, 'samples': 9191808, 'steps': 47873, 'loss/train': 1.157138466835022} -08/30/2021 21:54:05 - INFO - __main__ - Step 47875: {'lr': 0.00039054717795423765, 'samples': 9192000, 'steps': 47874, 'loss/train': 1.508017897605896} -08/30/2021 21:54:05 - INFO - __main__ - Step 47876: {'lr': 0.0003905427891973463, 'samples': 9192192, 'steps': 47875, 'loss/train': 0.22306524217128754} -08/30/2021 21:54:05 - INFO - __main__ - Step 47877: {'lr': 0.0003905384003771285, 'samples': 9192384, 'steps': 47876, 'loss/train': 1.6413267850875854} -08/30/2021 21:54:06 - INFO - __main__ - Step 47878: {'lr': 0.00039053401149358625, 'samples': 9192576, 'steps': 47877, 'loss/train': 1.6126058101654053} -08/30/2021 21:54:06 - INFO - __main__ - Step 47879: {'lr': 0.0003905296225467215, 'samples': 9192768, 'steps': 47878, 'loss/train': 1.5501893758773804} -08/30/2021 21:54:06 - INFO - __main__ - Step 47880: {'lr': 0.0003905252335365364, 'samples': 9192960, 'steps': 47879, 'loss/train': 1.0960619449615479} -08/30/2021 21:54:08 - INFO - __main__ - Step 47881: {'lr': 0.00039052084446303264, 'samples': 9193152, 'steps': 47880, 'loss/train': 1.2098392248153687} -08/30/2021 21:54:09 - INFO - __main__ - Step 47882: {'lr': 0.0003905164553262125, 'samples': 9193344, 'steps': 47881, 'loss/train': 1.3932965993881226} -08/30/2021 21:54:09 - INFO - __main__ - Step 47883: {'lr': 0.0003905120661260777, 'samples': 9193536, 'steps': 47882, 'loss/train': 3.418060064315796} -08/30/2021 21:54:09 - INFO - __main__ - Step 47884: {'lr': 0.00039050767686263035, 'samples': 9193728, 'steps': 47883, 'loss/train': 1.6404333114624023} -08/30/2021 21:54:10 - INFO - __main__ - Step 47885: {'lr': 0.0003905032875358725, 'samples': 9193920, 'steps': 47884, 'loss/train': 2.0146450996398926} -08/30/2021 21:54:11 - INFO - __main__ - Step 47886: {'lr': 0.00039049889814580597, 'samples': 9194112, 'steps': 47885, 'loss/train': 1.7083091735839844} -08/30/2021 21:54:12 - INFO - __main__ - Step 47887: {'lr': 0.00039049450869243276, 'samples': 9194304, 'steps': 47886, 'loss/train': 1.903693437576294} -08/30/2021 21:54:12 - INFO - __main__ - Step 47888: {'lr': 0.00039049011917575494, 'samples': 9194496, 'steps': 47887, 'loss/train': 1.0813472270965576} -08/30/2021 21:54:12 - INFO - __main__ - Step 47889: {'lr': 0.00039048572959577446, 'samples': 9194688, 'steps': 47888, 'loss/train': 0.12155977636575699} -08/30/2021 21:54:13 - INFO - __main__ - Step 47890: {'lr': 0.0003904813399524932, 'samples': 9194880, 'steps': 47889, 'loss/train': 1.5737905502319336} -08/30/2021 21:54:15 - INFO - __main__ - Step 47891: {'lr': 0.0003904769502459133, 'samples': 9195072, 'steps': 47890, 'loss/train': 1.5343148708343506} -08/30/2021 21:54:15 - INFO - __main__ - Step 47892: {'lr': 0.0003904725604760366, 'samples': 9195264, 'steps': 47891, 'loss/train': 1.2744956016540527} -08/30/2021 21:54:15 - INFO - __main__ - Step 47893: {'lr': 0.0003904681706428652, 'samples': 9195456, 'steps': 47892, 'loss/train': 1.2772544622421265} -08/30/2021 21:54:16 - INFO - __main__ - Step 47894: {'lr': 0.000390463780746401, 'samples': 9195648, 'steps': 47893, 'loss/train': 1.5194251537322998} -08/30/2021 21:54:16 - INFO - __main__ - Step 47895: {'lr': 0.00039045939078664595, 'samples': 9195840, 'steps': 47894, 'loss/train': 0.1151193231344223} -08/30/2021 21:54:17 - INFO - __main__ - Step 47896: {'lr': 0.0003904550007636021, 'samples': 9196032, 'steps': 47895, 'loss/train': 1.2806284427642822} -08/30/2021 21:54:18 - INFO - __main__ - Step 47897: {'lr': 0.00039045061067727126, 'samples': 9196224, 'steps': 47896, 'loss/train': 1.4310710430145264} -08/30/2021 21:54:19 - INFO - __main__ - Step 47898: {'lr': 0.0003904462205276557, 'samples': 9196416, 'steps': 47897, 'loss/train': 1.7274322509765625} -08/30/2021 21:54:19 - INFO - __main__ - Step 47899: {'lr': 0.0003904418303147572, 'samples': 9196608, 'steps': 47898, 'loss/train': 1.5581552982330322} -08/30/2021 21:54:19 - INFO - __main__ - Step 47900: {'lr': 0.0003904374400385777, 'samples': 9196800, 'steps': 47899, 'loss/train': 0.18381276726722717} -08/30/2021 21:54:20 - INFO - __main__ - Step 47901: {'lr': 0.0003904330496991194, 'samples': 9196992, 'steps': 47900, 'loss/train': 1.5149794816970825} -08/30/2021 21:54:21 - INFO - __main__ - Step 47902: {'lr': 0.00039042865929638404, 'samples': 9197184, 'steps': 47901, 'loss/train': 0.7306432127952576} -08/30/2021 21:54:22 - INFO - __main__ - Step 47903: {'lr': 0.00039042426883037376, 'samples': 9197376, 'steps': 47902, 'loss/train': 1.137852668762207} -08/30/2021 21:54:22 - INFO - __main__ - Step 47904: {'lr': 0.00039041987830109036, 'samples': 9197568, 'steps': 47903, 'loss/train': 0.8726712465286255} -08/30/2021 21:54:22 - INFO - __main__ - Step 47905: {'lr': 0.000390415487708536, 'samples': 9197760, 'steps': 47904, 'loss/train': 1.6011446714401245} -08/30/2021 21:54:23 - INFO - __main__ - Step 47906: {'lr': 0.0003904110970527126, 'samples': 9197952, 'steps': 47905, 'loss/train': 1.809960961341858} -08/30/2021 21:54:24 - INFO - __main__ - Step 47907: {'lr': 0.00039040670633362206, 'samples': 9198144, 'steps': 47906, 'loss/train': 1.7568812370300293} -08/30/2021 21:54:25 - INFO - __main__ - Step 47908: {'lr': 0.00039040231555126647, 'samples': 9198336, 'steps': 47907, 'loss/train': 1.692173719406128} -08/30/2021 21:54:25 - INFO - __main__ - Step 47909: {'lr': 0.0003903979247056478, 'samples': 9198528, 'steps': 47908, 'loss/train': 1.6197781562805176} -08/30/2021 21:54:25 - INFO - __main__ - Step 47910: {'lr': 0.00039039353379676796, 'samples': 9198720, 'steps': 47909, 'loss/train': 1.9702115058898926} -08/30/2021 21:54:26 - INFO - __main__ - Step 47911: {'lr': 0.0003903891428246289, 'samples': 9198912, 'steps': 47910, 'loss/train': 1.5342292785644531} -08/30/2021 21:54:29 - INFO - __main__ - Step 47912: {'lr': 0.0003903847517892328, 'samples': 9199104, 'steps': 47911, 'loss/train': 1.557690978050232} -08/30/2021 21:54:29 - INFO - __main__ - Step 47913: {'lr': 0.00039038036069058137, 'samples': 9199296, 'steps': 47912, 'loss/train': 0.6306040287017822} -08/30/2021 21:54:30 - INFO - __main__ - Step 47914: {'lr': 0.0003903759695286768, 'samples': 9199488, 'steps': 47913, 'loss/train': 0.5553920865058899} -08/30/2021 21:54:30 - INFO - __main__ - Step 47915: {'lr': 0.0003903715783035209, 'samples': 9199680, 'steps': 47914, 'loss/train': 0.7273662686347961} -08/30/2021 21:54:30 - INFO - __main__ - Step 47916: {'lr': 0.00039036718701511577, 'samples': 9199872, 'steps': 47915, 'loss/train': 0.8915906548500061} -08/30/2021 21:54:31 - INFO - __main__ - Step 47917: {'lr': 0.00039036279566346334, 'samples': 9200064, 'steps': 47916, 'loss/train': 1.5083653926849365} -08/30/2021 21:54:32 - INFO - __main__ - Step 47918: {'lr': 0.0003903584042485656, 'samples': 9200256, 'steps': 47917, 'loss/train': 1.7090014219284058} -08/30/2021 21:54:33 - INFO - __main__ - Step 47919: {'lr': 0.0003903540127704246, 'samples': 9200448, 'steps': 47918, 'loss/train': 1.157689094543457} -08/30/2021 21:54:33 - INFO - __main__ - Step 47920: {'lr': 0.0003903496212290422, 'samples': 9200640, 'steps': 47919, 'loss/train': 1.1067941188812256} -08/30/2021 21:54:33 - INFO - __main__ - Step 47921: {'lr': 0.00039034522962442045, 'samples': 9200832, 'steps': 47920, 'loss/train': 1.3353887796401978} -08/30/2021 21:54:34 - INFO - __main__ - Step 47922: {'lr': 0.0003903408379565612, 'samples': 9201024, 'steps': 47921, 'loss/train': 1.388068437576294} -08/30/2021 21:54:34 - INFO - __main__ - Step 47923: {'lr': 0.0003903364462254666, 'samples': 9201216, 'steps': 47922, 'loss/train': 1.748176097869873} -08/30/2021 21:54:35 - INFO - __main__ - Step 47924: {'lr': 0.0003903320544311386, 'samples': 9201408, 'steps': 47923, 'loss/train': 0.8511806726455688} -08/30/2021 21:54:36 - INFO - __main__ - Step 47925: {'lr': 0.0003903276625735791, 'samples': 9201600, 'steps': 47924, 'loss/train': 1.4516433477401733} -08/30/2021 21:54:36 - INFO - __main__ - Step 47926: {'lr': 0.00039032327065279015, 'samples': 9201792, 'steps': 47925, 'loss/train': 1.4957444667816162} -08/30/2021 21:54:37 - INFO - __main__ - Step 47927: {'lr': 0.0003903188786687737, 'samples': 9201984, 'steps': 47926, 'loss/train': 1.5750483274459839} -08/30/2021 21:54:37 - INFO - __main__ - Step 47928: {'lr': 0.0003903144866215317, 'samples': 9202176, 'steps': 47927, 'loss/train': 1.068113923072815} -08/30/2021 21:54:38 - INFO - __main__ - Step 47929: {'lr': 0.0003903100945110661, 'samples': 9202368, 'steps': 47928, 'loss/train': 1.5552136898040771} -08/30/2021 21:54:39 - INFO - __main__ - Step 47930: {'lr': 0.00039030570233737903, 'samples': 9202560, 'steps': 47929, 'loss/train': 0.5898703336715698} -08/30/2021 21:54:39 - INFO - __main__ - Step 47931: {'lr': 0.0003903013101004724, 'samples': 9202752, 'steps': 47930, 'loss/train': 1.919891595840454} -08/30/2021 21:54:40 - INFO - __main__ - Step 47932: {'lr': 0.00039029691780034814, 'samples': 9202944, 'steps': 47931, 'loss/train': 1.6875079870224} -08/30/2021 21:54:40 - INFO - __main__ - Step 47933: {'lr': 0.00039029252543700823, 'samples': 9203136, 'steps': 47932, 'loss/train': 0.33154863119125366} -08/30/2021 21:54:41 - INFO - __main__ - Step 47934: {'lr': 0.0003902881330104546, 'samples': 9203328, 'steps': 47933, 'loss/train': 0.7379415035247803} -08/30/2021 21:54:42 - INFO - __main__ - Step 47935: {'lr': 0.00039028374052068937, 'samples': 9203520, 'steps': 47934, 'loss/train': 1.36952543258667} -08/30/2021 21:54:42 - INFO - __main__ - Step 47936: {'lr': 0.0003902793479677145, 'samples': 9203712, 'steps': 47935, 'loss/train': 0.9311469197273254} -08/30/2021 21:54:43 - INFO - __main__ - Step 47937: {'lr': 0.00039027495535153185, 'samples': 9203904, 'steps': 47936, 'loss/train': 1.6109387874603271} -08/30/2021 21:54:43 - INFO - __main__ - Step 47938: {'lr': 0.0003902705626721435, 'samples': 9204096, 'steps': 47937, 'loss/train': 1.5544806718826294} -08/30/2021 21:54:45 - INFO - __main__ - Step 47939: {'lr': 0.00039026616992955145, 'samples': 9204288, 'steps': 47938, 'loss/train': 0.9728268980979919} -08/30/2021 21:54:45 - INFO - __main__ - Step 47940: {'lr': 0.0003902617771237575, 'samples': 9204480, 'steps': 47939, 'loss/train': 0.7438373565673828} -08/30/2021 21:54:45 - INFO - __main__ - Step 47941: {'lr': 0.0003902573842547639, 'samples': 9204672, 'steps': 47940, 'loss/train': 1.1454633474349976} -08/30/2021 21:54:46 - INFO - __main__ - Step 47942: {'lr': 0.00039025299132257243, 'samples': 9204864, 'steps': 47941, 'loss/train': 1.1059343814849854} -08/30/2021 21:54:46 - INFO - __main__ - Step 47943: {'lr': 0.00039024859832718505, 'samples': 9205056, 'steps': 47942, 'loss/train': 1.249679684638977} -08/30/2021 21:54:48 - INFO - __main__ - Step 47944: {'lr': 0.0003902442052686039, 'samples': 9205248, 'steps': 47943, 'loss/train': 0.05899669975042343} -08/30/2021 21:54:48 - INFO - __main__ - Step 47945: {'lr': 0.00039023981214683087, 'samples': 9205440, 'steps': 47944, 'loss/train': 1.2613134384155273} -08/30/2021 21:54:48 - INFO - __main__ - Step 47946: {'lr': 0.0003902354189618679, 'samples': 9205632, 'steps': 47945, 'loss/train': 0.7736929655075073} -08/30/2021 21:54:49 - INFO - __main__ - Step 47947: {'lr': 0.00039023102571371707, 'samples': 9205824, 'steps': 47946, 'loss/train': 1.809786319732666} -08/30/2021 21:54:49 - INFO - __main__ - Step 47948: {'lr': 0.0003902266324023803, 'samples': 9206016, 'steps': 47947, 'loss/train': 1.0456798076629639} -08/30/2021 21:54:49 - INFO - __main__ - Step 47949: {'lr': 0.00039022223902785954, 'samples': 9206208, 'steps': 47948, 'loss/train': 1.6305575370788574} -08/30/2021 21:54:51 - INFO - __main__ - Step 47950: {'lr': 0.0003902178455901568, 'samples': 9206400, 'steps': 47949, 'loss/train': 0.6561105847358704} -08/30/2021 21:54:51 - INFO - __main__ - Step 47951: {'lr': 0.00039021345208927404, 'samples': 9206592, 'steps': 47950, 'loss/train': 1.4292510747909546} -08/30/2021 21:54:52 - INFO - __main__ - Step 47952: {'lr': 0.0003902090585252133, 'samples': 9206784, 'steps': 47951, 'loss/train': 1.6782574653625488} -08/30/2021 21:54:52 - INFO - __main__ - Step 47953: {'lr': 0.0003902046648979766, 'samples': 9206976, 'steps': 47952, 'loss/train': 2.1473450660705566} -08/30/2021 21:54:52 - INFO - __main__ - Step 47954: {'lr': 0.00039020027120756573, 'samples': 9207168, 'steps': 47953, 'loss/train': 1.3811249732971191} -08/30/2021 21:54:54 - INFO - __main__ - Step 47955: {'lr': 0.00039019587745398276, 'samples': 9207360, 'steps': 47954, 'loss/train': 1.7682926654815674} -08/30/2021 21:54:54 - INFO - __main__ - Step 47956: {'lr': 0.0003901914836372298, 'samples': 9207552, 'steps': 47955, 'loss/train': 1.0705757141113281} -08/30/2021 21:54:55 - INFO - __main__ - Step 47957: {'lr': 0.00039018708975730864, 'samples': 9207744, 'steps': 47956, 'loss/train': 1.2473047971725464} -08/30/2021 21:54:55 - INFO - __main__ - Step 47958: {'lr': 0.0003901826958142214, 'samples': 9207936, 'steps': 47957, 'loss/train': 1.014862060546875} -08/30/2021 21:54:55 - INFO - __main__ - Step 47959: {'lr': 0.0003901783018079699, 'samples': 9208128, 'steps': 47958, 'loss/train': 1.1212726831436157} -08/30/2021 21:54:57 - INFO - __main__ - Step 47960: {'lr': 0.0003901739077385563, 'samples': 9208320, 'steps': 47959, 'loss/train': 1.769634485244751} -08/30/2021 21:54:57 - INFO - __main__ - Step 47961: {'lr': 0.0003901695136059825, 'samples': 9208512, 'steps': 47960, 'loss/train': 1.6125181913375854} -08/30/2021 21:54:58 - INFO - __main__ - Step 47962: {'lr': 0.00039016511941025045, 'samples': 9208704, 'steps': 47961, 'loss/train': 1.411395788192749} -08/30/2021 21:54:58 - INFO - __main__ - Step 47963: {'lr': 0.0003901607251513622, 'samples': 9208896, 'steps': 47962, 'loss/train': 1.1251847743988037} -08/30/2021 21:54:58 - INFO - __main__ - Step 47964: {'lr': 0.0003901563308293197, 'samples': 9209088, 'steps': 47963, 'loss/train': 0.9561633467674255} -08/30/2021 21:55:00 - INFO - __main__ - Step 47965: {'lr': 0.0003901519364441248, 'samples': 9209280, 'steps': 47964, 'loss/train': 1.2790157794952393} -08/30/2021 21:55:01 - INFO - __main__ - Step 47966: {'lr': 0.0003901475419957797, 'samples': 9209472, 'steps': 47965, 'loss/train': 1.5799431800842285} -08/30/2021 21:55:01 - INFO - __main__ - Step 47967: {'lr': 0.0003901431474842863, 'samples': 9209664, 'steps': 47966, 'loss/train': 2.313375234603882} -08/30/2021 21:55:01 - INFO - __main__ - Step 47968: {'lr': 0.0003901387529096465, 'samples': 9209856, 'steps': 47967, 'loss/train': 1.353843331336975} -08/30/2021 21:55:02 - INFO - __main__ - Step 47969: {'lr': 0.0003901343582718624, 'samples': 9210048, 'steps': 47968, 'loss/train': 1.1205179691314697} -08/30/2021 21:55:04 - INFO - __main__ - Step 47970: {'lr': 0.0003901299635709359, 'samples': 9210240, 'steps': 47969, 'loss/train': 1.6425973176956177} -08/30/2021 21:55:04 - INFO - __main__ - Step 47971: {'lr': 0.00039012556880686897, 'samples': 9210432, 'steps': 47970, 'loss/train': 2.0301880836486816} -08/30/2021 21:55:05 - INFO - __main__ - Step 47972: {'lr': 0.00039012117397966363, 'samples': 9210624, 'steps': 47971, 'loss/train': 1.0088059902191162} -08/30/2021 21:55:05 - INFO - __main__ - Step 47973: {'lr': 0.00039011677908932184, 'samples': 9210816, 'steps': 47972, 'loss/train': 0.5545100569725037} -08/30/2021 21:55:05 - INFO - __main__ - Step 47974: {'lr': 0.00039011238413584566, 'samples': 9211008, 'steps': 47973, 'loss/train': 1.1089811325073242} -08/30/2021 21:55:07 - INFO - __main__ - Step 47975: {'lr': 0.0003901079891192369, 'samples': 9211200, 'steps': 47974, 'loss/train': 1.461216926574707} -08/30/2021 21:55:07 - INFO - __main__ - Step 47976: {'lr': 0.00039010359403949776, 'samples': 9211392, 'steps': 47975, 'loss/train': 0.5487602353096008} -08/30/2021 21:55:08 - INFO - __main__ - Step 47977: {'lr': 0.00039009919889663005, 'samples': 9211584, 'steps': 47976, 'loss/train': 0.881941556930542} -08/30/2021 21:55:08 - INFO - __main__ - Step 47978: {'lr': 0.00039009480369063575, 'samples': 9211776, 'steps': 47977, 'loss/train': 1.8178044557571411} -08/30/2021 21:55:08 - INFO - __main__ - Step 47979: {'lr': 0.000390090408421517, 'samples': 9211968, 'steps': 47978, 'loss/train': 0.7355507016181946} -08/30/2021 21:55:10 - INFO - __main__ - Step 47980: {'lr': 0.0003900860130892756, 'samples': 9212160, 'steps': 47979, 'loss/train': 1.2027751207351685} -08/30/2021 21:55:10 - INFO - __main__ - Step 47981: {'lr': 0.0003900816176939136, 'samples': 9212352, 'steps': 47980, 'loss/train': 0.8195446729660034} -08/30/2021 21:55:11 - INFO - __main__ - Step 47982: {'lr': 0.000390077222235433, 'samples': 9212544, 'steps': 47981, 'loss/train': 1.8953591585159302} -08/30/2021 21:55:11 - INFO - __main__ - Step 47983: {'lr': 0.0003900728267138357, 'samples': 9212736, 'steps': 47982, 'loss/train': 1.4434648752212524} -08/30/2021 21:55:12 - INFO - __main__ - Step 47984: {'lr': 0.0003900684311291238, 'samples': 9212928, 'steps': 47983, 'loss/train': 1.8007526397705078} -08/30/2021 21:55:13 - INFO - __main__ - Step 47985: {'lr': 0.0003900640354812992, 'samples': 9213120, 'steps': 47984, 'loss/train': 1.681673526763916} -08/30/2021 21:55:13 - INFO - __main__ - Step 47986: {'lr': 0.000390059639770364, 'samples': 9213312, 'steps': 47985, 'loss/train': 1.1255621910095215} -08/30/2021 21:55:14 - INFO - __main__ - Step 47987: {'lr': 0.0003900552439963201, 'samples': 9213504, 'steps': 47986, 'loss/train': 1.6035668849945068} -08/30/2021 21:55:14 - INFO - __main__ - Step 47988: {'lr': 0.0003900508481591694, 'samples': 9213696, 'steps': 47987, 'loss/train': 1.3248248100280762} -08/30/2021 21:55:14 - INFO - __main__ - Step 47989: {'lr': 0.00039004645225891387, 'samples': 9213888, 'steps': 47988, 'loss/train': 1.7217713594436646} -08/30/2021 21:55:16 - INFO - __main__ - Step 47990: {'lr': 0.0003900420562955557, 'samples': 9214080, 'steps': 47989, 'loss/train': 1.5362060070037842} -08/30/2021 21:55:16 - INFO - __main__ - Step 47991: {'lr': 0.0003900376602690966, 'samples': 9214272, 'steps': 47990, 'loss/train': 0.669004499912262} -08/30/2021 21:55:17 - INFO - __main__ - Step 47992: {'lr': 0.0003900332641795388, 'samples': 9214464, 'steps': 47991, 'loss/train': 1.6353973150253296} -08/30/2021 21:55:17 - INFO - __main__ - Step 47993: {'lr': 0.0003900288680268842, 'samples': 9214656, 'steps': 47992, 'loss/train': 1.7858846187591553} -08/30/2021 21:55:17 - INFO - __main__ - Step 47994: {'lr': 0.00039002447181113464, 'samples': 9214848, 'steps': 47993, 'loss/train': 1.558007001876831} -08/30/2021 21:55:18 - INFO - __main__ - Step 47995: {'lr': 0.0003900200755322923, 'samples': 9215040, 'steps': 47994, 'loss/train': 1.27335786819458} -08/30/2021 21:55:19 - INFO - __main__ - Step 47996: {'lr': 0.0003900156791903591, 'samples': 9215232, 'steps': 47995, 'loss/train': 0.9494937062263489} -08/30/2021 21:55:20 - INFO - __main__ - Step 47997: {'lr': 0.0003900112827853369, 'samples': 9215424, 'steps': 47996, 'loss/train': 1.9481124877929688} -08/30/2021 21:55:20 - INFO - __main__ - Step 47998: {'lr': 0.0003900068863172278, 'samples': 9215616, 'steps': 47997, 'loss/train': 1.7428592443466187} -08/30/2021 21:55:20 - INFO - __main__ - Step 47999: {'lr': 0.0003900024897860338, 'samples': 9215808, 'steps': 47998, 'loss/train': 0.9841916561126709} -08/30/2021 21:55:21 - INFO - __main__ - Step 48000: {'lr': 0.00038999809319175684, 'samples': 9216000, 'steps': 47999, 'loss/train': 1.3682252168655396} -08/30/2021 21:55:22 - INFO - __main__ - Step 48001: {'lr': 0.0003899936965343989, 'samples': 9216192, 'steps': 48000, 'loss/train': 0.7294800281524658} -08/30/2021 21:55:23 - INFO - __main__ - Step 48002: {'lr': 0.00038998929981396194, 'samples': 9216384, 'steps': 48001, 'loss/train': 0.6029478907585144} -08/30/2021 21:55:23 - INFO - __main__ - Step 48003: {'lr': 0.0003899849030304479, 'samples': 9216576, 'steps': 48002, 'loss/train': 1.418975830078125} -08/30/2021 21:55:23 - INFO - __main__ - Step 48004: {'lr': 0.0003899805061838589, 'samples': 9216768, 'steps': 48003, 'loss/train': 1.1456586122512817} -08/30/2021 21:55:24 - INFO - __main__ - Step 48005: {'lr': 0.0003899761092741968, 'samples': 9216960, 'steps': 48004, 'loss/train': 3.1620686054229736} -08/30/2021 21:55:25 - INFO - __main__ - Step 48006: {'lr': 0.00038997171230146366, 'samples': 9217152, 'steps': 48005, 'loss/train': 1.820265293121338} -08/30/2021 21:55:26 - INFO - __main__ - Step 48007: {'lr': 0.0003899673152656614, 'samples': 9217344, 'steps': 48006, 'loss/train': 0.8522946834564209} -08/30/2021 21:55:26 - INFO - __main__ - Step 48008: {'lr': 0.0003899629181667921, 'samples': 9217536, 'steps': 48007, 'loss/train': 1.411366581916809} -08/30/2021 21:55:26 - INFO - __main__ - Step 48009: {'lr': 0.0003899585210048576, 'samples': 9217728, 'steps': 48008, 'loss/train': 1.2145556211471558} -08/30/2021 21:55:27 - INFO - __main__ - Step 48010: {'lr': 0.0003899541237798599, 'samples': 9217920, 'steps': 48009, 'loss/train': 1.6335562467575073} -08/30/2021 21:55:28 - INFO - __main__ - Step 48011: {'lr': 0.0003899497264918012, 'samples': 9218112, 'steps': 48010, 'loss/train': 1.4699443578720093} -08/30/2021 21:55:28 - INFO - __main__ - Step 48012: {'lr': 0.00038994532914068313, 'samples': 9218304, 'steps': 48011, 'loss/train': 1.651854157447815} -08/30/2021 21:55:29 - INFO - __main__ - Step 48013: {'lr': 0.00038994093172650804, 'samples': 9218496, 'steps': 48012, 'loss/train': 0.6458513736724854} -08/30/2021 21:55:29 - INFO - __main__ - Step 48014: {'lr': 0.00038993653424927754, 'samples': 9218688, 'steps': 48013, 'loss/train': 1.3805373907089233} -08/30/2021 21:55:29 - INFO - __main__ - Step 48015: {'lr': 0.00038993213670899385, 'samples': 9218880, 'steps': 48014, 'loss/train': 1.4443672895431519} -08/30/2021 21:55:31 - INFO - __main__ - Step 48016: {'lr': 0.000389927739105659, 'samples': 9219072, 'steps': 48015, 'loss/train': 1.6568262577056885} -08/30/2021 21:55:31 - INFO - __main__ - Step 48017: {'lr': 0.0003899233414392748, 'samples': 9219264, 'steps': 48016, 'loss/train': 1.719864845275879} -08/30/2021 21:55:32 - INFO - __main__ - Step 48018: {'lr': 0.0003899189437098433, 'samples': 9219456, 'steps': 48017, 'loss/train': 1.2093226909637451} -08/30/2021 21:55:32 - INFO - __main__ - Step 48019: {'lr': 0.00038991454591736643, 'samples': 9219648, 'steps': 48018, 'loss/train': 0.6396217346191406} -08/30/2021 21:55:32 - INFO - __main__ - Step 48020: {'lr': 0.00038991014806184635, 'samples': 9219840, 'steps': 48019, 'loss/train': 1.373793363571167} -08/30/2021 21:55:34 - INFO - __main__ - Step 48021: {'lr': 0.0003899057501432848, 'samples': 9220032, 'steps': 48020, 'loss/train': 1.309171438217163} -08/30/2021 21:55:35 - INFO - __main__ - Step 48022: {'lr': 0.0003899013521616839, 'samples': 9220224, 'steps': 48021, 'loss/train': 1.4871996641159058} -08/30/2021 21:55:35 - INFO - __main__ - Step 48023: {'lr': 0.0003898969541170456, 'samples': 9220416, 'steps': 48022, 'loss/train': 1.4128605127334595} -08/30/2021 21:55:36 - INFO - __main__ - Step 48024: {'lr': 0.0003898925560093719, 'samples': 9220608, 'steps': 48023, 'loss/train': 0.7613070607185364} -08/30/2021 21:55:36 - INFO - __main__ - Step 48025: {'lr': 0.00038988815783866485, 'samples': 9220800, 'steps': 48024, 'loss/train': 1.3089985847473145} -08/30/2021 21:55:37 - INFO - __main__ - Step 48026: {'lr': 0.00038988375960492626, 'samples': 9220992, 'steps': 48025, 'loss/train': 1.4384922981262207} -08/30/2021 21:55:38 - INFO - __main__ - Step 48027: {'lr': 0.0003898793613081583, 'samples': 9221184, 'steps': 48026, 'loss/train': 0.5155933499336243} -08/30/2021 21:55:38 - INFO - __main__ - Step 48028: {'lr': 0.0003898749629483628, 'samples': 9221376, 'steps': 48027, 'loss/train': 0.04614232853055} -08/30/2021 21:55:39 - INFO - __main__ - Step 48029: {'lr': 0.00038987056452554177, 'samples': 9221568, 'steps': 48028, 'loss/train': 1.3231110572814941} -08/30/2021 21:55:39 - INFO - __main__ - Step 48030: {'lr': 0.0003898661660396973, 'samples': 9221760, 'steps': 48029, 'loss/train': 1.7507843971252441} -08/30/2021 21:55:40 - INFO - __main__ - Step 48031: {'lr': 0.00038986176749083117, 'samples': 9221952, 'steps': 48030, 'loss/train': 1.6523869037628174} -08/30/2021 21:55:41 - INFO - __main__ - Step 48032: {'lr': 0.0003898573688789456, 'samples': 9222144, 'steps': 48031, 'loss/train': 0.8921321630477905} -08/30/2021 21:55:41 - INFO - __main__ - Step 48033: {'lr': 0.0003898529702040424, 'samples': 9222336, 'steps': 48032, 'loss/train': 1.3697538375854492} -08/30/2021 21:55:42 - INFO - __main__ - Step 48034: {'lr': 0.00038984857146612365, 'samples': 9222528, 'steps': 48033, 'loss/train': 1.581619381904602} -08/30/2021 21:55:42 - INFO - __main__ - Step 48035: {'lr': 0.00038984417266519126, 'samples': 9222720, 'steps': 48034, 'loss/train': 1.5477761030197144} -08/30/2021 21:55:44 - INFO - __main__ - Step 48036: {'lr': 0.00038983977380124726, 'samples': 9222912, 'steps': 48035, 'loss/train': 0.9938199520111084} -08/30/2021 21:55:44 - INFO - __main__ - Step 48037: {'lr': 0.0003898353748742936, 'samples': 9223104, 'steps': 48036, 'loss/train': 0.9710741639137268} -08/30/2021 21:55:44 - INFO - __main__ - Step 48038: {'lr': 0.00038983097588433225, 'samples': 9223296, 'steps': 48037, 'loss/train': 2.5571200847625732} -08/30/2021 21:55:45 - INFO - __main__ - Step 48039: {'lr': 0.00038982657683136524, 'samples': 9223488, 'steps': 48038, 'loss/train': 1.3827848434448242} -08/30/2021 21:55:45 - INFO - __main__ - Step 48040: {'lr': 0.00038982217771539466, 'samples': 9223680, 'steps': 48039, 'loss/train': 1.2979451417922974} -08/30/2021 21:55:46 - INFO - __main__ - Step 48041: {'lr': 0.0003898177785364222, 'samples': 9223872, 'steps': 48040, 'loss/train': 0.8472513556480408} -08/30/2021 21:55:47 - INFO - __main__ - Step 48042: {'lr': 0.00038981337929445004, 'samples': 9224064, 'steps': 48041, 'loss/train': 0.0789189413189888} -08/30/2021 21:55:48 - INFO - __main__ - Step 48043: {'lr': 0.0003898089799894802, 'samples': 9224256, 'steps': 48042, 'loss/train': 1.749300479888916} -08/30/2021 21:55:48 - INFO - __main__ - Step 48044: {'lr': 0.0003898045806215145, 'samples': 9224448, 'steps': 48043, 'loss/train': 0.13373838365077972} -08/30/2021 21:55:48 - INFO - __main__ - Step 48045: {'lr': 0.00038980018119055506, 'samples': 9224640, 'steps': 48044, 'loss/train': 2.0769262313842773} -08/30/2021 21:55:49 - INFO - __main__ - Step 48046: {'lr': 0.00038979578169660384, 'samples': 9224832, 'steps': 48045, 'loss/train': 1.142823576927185} -08/30/2021 21:55:50 - INFO - __main__ - Step 48047: {'lr': 0.0003897913821396628, 'samples': 9225024, 'steps': 48046, 'loss/train': 1.7016246318817139} -08/30/2021 21:55:51 - INFO - __main__ - Step 48048: {'lr': 0.0003897869825197339, 'samples': 9225216, 'steps': 48047, 'loss/train': 1.712834119796753} -08/30/2021 21:55:51 - INFO - __main__ - Step 48049: {'lr': 0.0003897825828368191, 'samples': 9225408, 'steps': 48048, 'loss/train': 1.0804564952850342} -08/30/2021 21:55:52 - INFO - __main__ - Step 48050: {'lr': 0.0003897781830909204, 'samples': 9225600, 'steps': 48049, 'loss/train': 1.0883190631866455} -08/30/2021 21:55:52 - INFO - __main__ - Step 48051: {'lr': 0.00038977378328203987, 'samples': 9225792, 'steps': 48050, 'loss/train': 1.942132830619812} -08/30/2021 21:55:53 - INFO - __main__ - Step 48052: {'lr': 0.0003897693834101794, 'samples': 9225984, 'steps': 48051, 'loss/train': 1.2460460662841797} -08/30/2021 21:55:54 - INFO - __main__ - Step 48053: {'lr': 0.00038976498347534106, 'samples': 9226176, 'steps': 48052, 'loss/train': 1.46304190158844} -08/30/2021 21:55:54 - INFO - __main__ - Step 48054: {'lr': 0.0003897605834775267, 'samples': 9226368, 'steps': 48053, 'loss/train': 1.3460031747817993} -08/30/2021 21:55:54 - INFO - __main__ - Step 48055: {'lr': 0.00038975618341673845, 'samples': 9226560, 'steps': 48054, 'loss/train': 1.151011347770691} -08/30/2021 21:55:55 - INFO - __main__ - Step 48056: {'lr': 0.0003897517832929782, 'samples': 9226752, 'steps': 48055, 'loss/train': 1.1946170330047607} -08/30/2021 21:55:56 - INFO - __main__ - Step 48057: {'lr': 0.00038974738310624797, 'samples': 9226944, 'steps': 48056, 'loss/train': 1.568045973777771} -08/30/2021 21:55:57 - INFO - __main__ - Step 48058: {'lr': 0.00038974298285654967, 'samples': 9227136, 'steps': 48057, 'loss/train': 1.9462419748306274} -08/30/2021 21:55:57 - INFO - __main__ - Step 48059: {'lr': 0.0003897385825438854, 'samples': 9227328, 'steps': 48058, 'loss/train': 0.6368768811225891} -08/30/2021 21:55:57 - INFO - __main__ - Step 48060: {'lr': 0.0003897341821682571, 'samples': 9227520, 'steps': 48059, 'loss/train': 1.0692126750946045} -08/30/2021 21:55:58 - INFO - __main__ - Step 48061: {'lr': 0.0003897297817296667, 'samples': 9227712, 'steps': 48060, 'loss/train': 1.8624049425125122} -08/30/2021 21:56:00 - INFO - __main__ - Step 48062: {'lr': 0.00038972538122811613, 'samples': 9227904, 'steps': 48061, 'loss/train': 1.4940840005874634} -08/30/2021 21:56:00 - INFO - __main__ - Step 48063: {'lr': 0.00038972098066360753, 'samples': 9228096, 'steps': 48062, 'loss/train': 1.4992592334747314} -08/30/2021 21:56:00 - INFO - __main__ - Step 48064: {'lr': 0.0003897165800361427, 'samples': 9228288, 'steps': 48063, 'loss/train': 0.04728345572948456} -08/30/2021 21:56:01 - INFO - __main__ - Step 48065: {'lr': 0.0003897121793457239, 'samples': 9228480, 'steps': 48064, 'loss/train': 1.349684476852417} -08/30/2021 21:56:01 - INFO - __main__ - Step 48066: {'lr': 0.0003897077785923529, 'samples': 9228672, 'steps': 48065, 'loss/train': 0.16502012312412262} -08/30/2021 21:56:02 - INFO - __main__ - Step 48067: {'lr': 0.0003897033777760318, 'samples': 9228864, 'steps': 48066, 'loss/train': 1.3611706495285034} -08/30/2021 21:56:03 - INFO - __main__ - Step 48068: {'lr': 0.0003896989768967624, 'samples': 9229056, 'steps': 48067, 'loss/train': 0.6744688153266907} -08/30/2021 21:56:04 - INFO - __main__ - Step 48069: {'lr': 0.0003896945759545468, 'samples': 9229248, 'steps': 48068, 'loss/train': 5.85368537902832} -08/30/2021 21:56:04 - INFO - __main__ - Step 48070: {'lr': 0.000389690174949387, 'samples': 9229440, 'steps': 48069, 'loss/train': 5.836464881896973} -08/30/2021 21:56:05 - INFO - __main__ - Step 48071: {'lr': 0.00038968577388128503, 'samples': 9229632, 'steps': 48070, 'loss/train': 1.3360096216201782} -08/30/2021 21:56:05 - INFO - __main__ - Step 48072: {'lr': 0.00038968137275024274, 'samples': 9229824, 'steps': 48071, 'loss/train': 1.7021456956863403} -08/30/2021 21:56:05 - INFO - __main__ - Step 48073: {'lr': 0.0003896769715562622, 'samples': 9230016, 'steps': 48072, 'loss/train': 0.9753689169883728} -08/30/2021 21:56:08 - INFO - __main__ - Step 48074: {'lr': 0.0003896725702993453, 'samples': 9230208, 'steps': 48073, 'loss/train': 1.4867280721664429} -08/30/2021 21:56:08 - INFO - __main__ - Step 48075: {'lr': 0.0003896681689794942, 'samples': 9230400, 'steps': 48074, 'loss/train': 0.6709274649620056} -08/30/2021 21:56:09 - INFO - __main__ - Step 48076: {'lr': 0.00038966376759671075, 'samples': 9230592, 'steps': 48075, 'loss/train': 1.626508116722107} -08/30/2021 21:56:09 - INFO - __main__ - Step 48077: {'lr': 0.00038965936615099694, 'samples': 9230784, 'steps': 48076, 'loss/train': 0.4990983307361603} -08/30/2021 21:56:09 - INFO - __main__ - Step 48078: {'lr': 0.0003896549646423548, 'samples': 9230976, 'steps': 48077, 'loss/train': 0.9760861396789551} -08/30/2021 21:56:10 - INFO - __main__ - Step 48079: {'lr': 0.0003896505630707863, 'samples': 9231168, 'steps': 48078, 'loss/train': 1.4228544235229492} -08/30/2021 21:56:10 - INFO - __main__ - Step 48080: {'lr': 0.00038964616143629337, 'samples': 9231360, 'steps': 48079, 'loss/train': 0.6009047627449036} -08/30/2021 21:56:11 - INFO - __main__ - Step 48081: {'lr': 0.00038964175973887807, 'samples': 9231552, 'steps': 48080, 'loss/train': 0.40620696544647217} -08/30/2021 21:56:13 - INFO - __main__ - Step 48082: {'lr': 0.0003896373579785423, 'samples': 9231744, 'steps': 48081, 'loss/train': 0.3924275040626526} -08/30/2021 21:56:13 - INFO - __main__ - Step 48083: {'lr': 0.00038963295615528803, 'samples': 9231936, 'steps': 48082, 'loss/train': 1.9669965505599976} -08/30/2021 21:56:13 - INFO - __main__ - Step 48084: {'lr': 0.00038962855426911746, 'samples': 9232128, 'steps': 48083, 'loss/train': 1.495212435722351} -08/30/2021 21:56:14 - INFO - __main__ - Step 48085: {'lr': 0.00038962415232003233, 'samples': 9232320, 'steps': 48084, 'loss/train': 1.4255551099777222} -08/30/2021 21:56:14 - INFO - __main__ - Step 48086: {'lr': 0.00038961975030803474, 'samples': 9232512, 'steps': 48085, 'loss/train': 0.03670331463217735} -08/30/2021 21:56:16 - INFO - __main__ - Step 48087: {'lr': 0.00038961534823312664, 'samples': 9232704, 'steps': 48086, 'loss/train': 1.2051409482955933} -08/30/2021 21:56:16 - INFO - __main__ - Step 48088: {'lr': 0.00038961094609531, 'samples': 9232896, 'steps': 48087, 'loss/train': 0.8676460385322571} -08/30/2021 21:56:16 - INFO - __main__ - Step 48089: {'lr': 0.00038960654389458684, 'samples': 9233088, 'steps': 48088, 'loss/train': 1.1531951427459717} -08/30/2021 21:56:17 - INFO - __main__ - Step 48090: {'lr': 0.0003896021416309591, 'samples': 9233280, 'steps': 48089, 'loss/train': 1.3840491771697998} -08/30/2021 21:56:17 - INFO - __main__ - Step 48091: {'lr': 0.0003895977393044288, 'samples': 9233472, 'steps': 48090, 'loss/train': 2.1008269786834717} -08/30/2021 21:56:19 - INFO - __main__ - Step 48092: {'lr': 0.00038959333691499794, 'samples': 9233664, 'steps': 48091, 'loss/train': 1.0274615287780762} -08/30/2021 21:56:19 - INFO - __main__ - Step 48093: {'lr': 0.00038958893446266844, 'samples': 9233856, 'steps': 48092, 'loss/train': 1.6036871671676636} -08/30/2021 21:56:19 - INFO - __main__ - Step 48094: {'lr': 0.00038958453194744237, 'samples': 9234048, 'steps': 48093, 'loss/train': 1.0566166639328003} -08/30/2021 21:56:20 - INFO - __main__ - Step 48095: {'lr': 0.0003895801293693216, 'samples': 9234240, 'steps': 48094, 'loss/train': 1.053208589553833} -08/30/2021 21:56:20 - INFO - __main__ - Step 48096: {'lr': 0.0003895757267283082, 'samples': 9234432, 'steps': 48095, 'loss/train': 2.430922508239746} -08/30/2021 21:56:22 - INFO - __main__ - Step 48097: {'lr': 0.0003895713240244042, 'samples': 9234624, 'steps': 48096, 'loss/train': 1.8209210634231567} -08/30/2021 21:56:22 - INFO - __main__ - Step 48098: {'lr': 0.0003895669212576114, 'samples': 9234816, 'steps': 48097, 'loss/train': 1.0672640800476074} -08/30/2021 21:56:23 - INFO - __main__ - Step 48099: {'lr': 0.000389562518427932, 'samples': 9235008, 'steps': 48098, 'loss/train': 0.047764554619789124} -08/30/2021 21:56:23 - INFO - __main__ - Step 48100: {'lr': 0.00038955811553536787, 'samples': 9235200, 'steps': 48099, 'loss/train': 1.649141788482666} -08/30/2021 21:56:23 - INFO - __main__ - Step 48101: {'lr': 0.00038955371257992096, 'samples': 9235392, 'steps': 48100, 'loss/train': 0.9659141898155212} -08/30/2021 21:56:24 - INFO - __main__ - Step 48102: {'lr': 0.0003895493095615933, 'samples': 9235584, 'steps': 48101, 'loss/train': 1.4187041521072388} -08/30/2021 21:56:25 - INFO - __main__ - Step 48103: {'lr': 0.00038954490648038687, 'samples': 9235776, 'steps': 48102, 'loss/train': 1.3778592348098755} -08/30/2021 21:56:26 - INFO - __main__ - Step 48104: {'lr': 0.0003895405033363037, 'samples': 9235968, 'steps': 48103, 'loss/train': 1.2677559852600098} -08/30/2021 21:56:26 - INFO - __main__ - Step 48105: {'lr': 0.0003895361001293457, 'samples': 9236160, 'steps': 48104, 'loss/train': 1.3955543041229248} -08/30/2021 21:56:27 - INFO - __main__ - Step 48106: {'lr': 0.0003895316968595149, 'samples': 9236352, 'steps': 48105, 'loss/train': 1.6083626747131348} -08/30/2021 21:56:27 - INFO - __main__ - Step 48107: {'lr': 0.0003895272935268133, 'samples': 9236544, 'steps': 48106, 'loss/train': 1.3801171779632568} -08/30/2021 21:56:28 - INFO - __main__ - Step 48108: {'lr': 0.0003895228901312428, 'samples': 9236736, 'steps': 48107, 'loss/train': 0.6153112649917603} -08/30/2021 21:56:29 - INFO - __main__ - Step 48109: {'lr': 0.0003895184866728054, 'samples': 9236928, 'steps': 48108, 'loss/train': 1.0506694316864014} -08/30/2021 21:56:29 - INFO - __main__ - Step 48110: {'lr': 0.0003895140831515033, 'samples': 9237120, 'steps': 48109, 'loss/train': 1.713735580444336} -08/30/2021 21:56:30 - INFO - __main__ - Step 48111: {'lr': 0.0003895096795673381, 'samples': 9237312, 'steps': 48110, 'loss/train': 1.699536919593811} -08/30/2021 21:56:30 - INFO - __main__ - Step 48112: {'lr': 0.0003895052759203121, 'samples': 9237504, 'steps': 48111, 'loss/train': 1.416006088256836} -08/30/2021 21:56:32 - INFO - __main__ - Step 48113: {'lr': 0.0003895008722104272, 'samples': 9237696, 'steps': 48112, 'loss/train': 0.8337977528572083} -08/30/2021 21:56:32 - INFO - __main__ - Step 48114: {'lr': 0.00038949646843768526, 'samples': 9237888, 'steps': 48113, 'loss/train': 1.8441437482833862} -08/30/2021 21:56:33 - INFO - __main__ - Step 48115: {'lr': 0.00038949206460208845, 'samples': 9238080, 'steps': 48114, 'loss/train': 1.6917622089385986} -08/30/2021 21:56:33 - INFO - __main__ - Step 48116: {'lr': 0.0003894876607036386, 'samples': 9238272, 'steps': 48115, 'loss/train': 1.933457374572754} -08/30/2021 21:56:33 - INFO - __main__ - Step 48117: {'lr': 0.0003894832567423379, 'samples': 9238464, 'steps': 48116, 'loss/train': 1.2408145666122437} -08/30/2021 21:56:34 - INFO - __main__ - Step 48118: {'lr': 0.00038947885271818807, 'samples': 9238656, 'steps': 48117, 'loss/train': 1.8722898960113525} -08/30/2021 21:56:35 - INFO - __main__ - Step 48119: {'lr': 0.0003894744486311912, 'samples': 9238848, 'steps': 48118, 'loss/train': 0.07304657250642776} -08/30/2021 21:56:36 - INFO - __main__ - Step 48120: {'lr': 0.00038947004448134937, 'samples': 9239040, 'steps': 48119, 'loss/train': 1.9490514993667603} -08/30/2021 21:56:36 - INFO - __main__ - Step 48121: {'lr': 0.0003894656402686645, 'samples': 9239232, 'steps': 48120, 'loss/train': 1.4795867204666138} -08/30/2021 21:56:36 - INFO - __main__ - Step 48122: {'lr': 0.00038946123599313846, 'samples': 9239424, 'steps': 48121, 'loss/train': 1.2509700059890747} -08/30/2021 21:56:37 - INFO - __main__ - Step 48123: {'lr': 0.0003894568316547734, 'samples': 9239616, 'steps': 48122, 'loss/train': 1.1257843971252441} -08/30/2021 21:56:38 - INFO - __main__ - Step 48124: {'lr': 0.00038945242725357127, 'samples': 9239808, 'steps': 48123, 'loss/train': 0.9880104064941406} -08/30/2021 21:56:39 - INFO - __main__ - Step 48125: {'lr': 0.000389448022789534, 'samples': 9240000, 'steps': 48124, 'loss/train': 0.9245656132698059} -08/30/2021 21:56:39 - INFO - __main__ - Step 48126: {'lr': 0.0003894436182626636, 'samples': 9240192, 'steps': 48125, 'loss/train': 0.11599001288414001} -08/30/2021 21:56:39 - INFO - __main__ - Step 48127: {'lr': 0.00038943921367296213, 'samples': 9240384, 'steps': 48126, 'loss/train': 1.3803465366363525} -08/30/2021 21:56:40 - INFO - __main__ - Step 48128: {'lr': 0.00038943480902043146, 'samples': 9240576, 'steps': 48127, 'loss/train': 1.1955361366271973} -08/30/2021 21:56:41 - INFO - __main__ - Step 48129: {'lr': 0.0003894304043050736, 'samples': 9240768, 'steps': 48128, 'loss/train': 1.4488136768341064} -08/30/2021 21:56:42 - INFO - __main__ - Step 48130: {'lr': 0.0003894259995268905, 'samples': 9240960, 'steps': 48129, 'loss/train': 0.925774335861206} -08/30/2021 21:56:42 - INFO - __main__ - Step 48131: {'lr': 0.00038942159468588423, 'samples': 9241152, 'steps': 48130, 'loss/train': 0.7424302697181702} -08/30/2021 21:56:42 - INFO - __main__ - Step 48132: {'lr': 0.00038941718978205674, 'samples': 9241344, 'steps': 48131, 'loss/train': 1.6279820203781128} -08/30/2021 21:56:43 - INFO - __main__ - Step 48133: {'lr': 0.0003894127848154101, 'samples': 9241536, 'steps': 48132, 'loss/train': 1.5197559595108032} -08/30/2021 21:56:45 - INFO - __main__ - Step 48134: {'lr': 0.0003894083797859461, 'samples': 9241728, 'steps': 48133, 'loss/train': 0.6270791888237} -08/30/2021 21:56:45 - INFO - __main__ - Step 48135: {'lr': 0.00038940397469366695, 'samples': 9241920, 'steps': 48134, 'loss/train': 1.4272571802139282} -08/30/2021 21:56:46 - INFO - __main__ - Step 48136: {'lr': 0.0003893995695385744, 'samples': 9242112, 'steps': 48135, 'loss/train': 1.1951262950897217} -08/30/2021 21:56:46 - INFO - __main__ - Step 48137: {'lr': 0.0003893951643206706, 'samples': 9242304, 'steps': 48136, 'loss/train': 1.4697294235229492} -08/30/2021 21:56:46 - INFO - __main__ - Step 48138: {'lr': 0.00038939075903995744, 'samples': 9242496, 'steps': 48137, 'loss/train': 1.3757773637771606} -08/30/2021 21:56:48 - INFO - __main__ - Step 48139: {'lr': 0.000389386353696437, 'samples': 9242688, 'steps': 48138, 'loss/train': 1.4908357858657837} -08/30/2021 21:56:48 - INFO - __main__ - Step 48140: {'lr': 0.0003893819482901113, 'samples': 9242880, 'steps': 48139, 'loss/train': 0.48751139640808105} -08/30/2021 21:56:49 - INFO - __main__ - Step 48141: {'lr': 0.0003893775428209822, 'samples': 9243072, 'steps': 48140, 'loss/train': 1.1304608583450317} -08/30/2021 21:56:49 - INFO - __main__ - Step 48142: {'lr': 0.00038937313728905164, 'samples': 9243264, 'steps': 48141, 'loss/train': 1.231481909751892} -08/30/2021 21:56:49 - INFO - __main__ - Step 48143: {'lr': 0.0003893687316943218, 'samples': 9243456, 'steps': 48142, 'loss/train': 1.433244228363037} -08/30/2021 21:56:50 - INFO - __main__ - Step 48144: {'lr': 0.0003893643260367945, 'samples': 9243648, 'steps': 48143, 'loss/train': 1.7612348794937134} -08/30/2021 21:56:51 - INFO - __main__ - Step 48145: {'lr': 0.00038935992031647183, 'samples': 9243840, 'steps': 48144, 'loss/train': 1.9286956787109375} -08/30/2021 21:56:52 - INFO - __main__ - Step 48146: {'lr': 0.00038935551453335573, 'samples': 9244032, 'steps': 48145, 'loss/train': 1.3823174238204956} -08/30/2021 21:56:52 - INFO - __main__ - Step 48147: {'lr': 0.00038935110868744817, 'samples': 9244224, 'steps': 48146, 'loss/train': 1.4182697534561157} -08/30/2021 21:56:52 - INFO - __main__ - Step 48148: {'lr': 0.0003893467027787511, 'samples': 9244416, 'steps': 48147, 'loss/train': 1.5436605215072632} -08/30/2021 21:56:53 - INFO - __main__ - Step 48149: {'lr': 0.00038934229680726663, 'samples': 9244608, 'steps': 48148, 'loss/train': 1.4788745641708374} -08/30/2021 21:56:54 - INFO - __main__ - Step 48150: {'lr': 0.0003893378907729966, 'samples': 9244800, 'steps': 48149, 'loss/train': 1.4899238348007202} -08/30/2021 21:56:55 - INFO - __main__ - Step 48151: {'lr': 0.0003893334846759431, 'samples': 9244992, 'steps': 48150, 'loss/train': 1.5928133726119995} -08/30/2021 21:56:55 - INFO - __main__ - Step 48152: {'lr': 0.0003893290785161081, 'samples': 9245184, 'steps': 48151, 'loss/train': 1.5416806936264038} -08/30/2021 21:56:55 - INFO - __main__ - Step 48153: {'lr': 0.00038932467229349353, 'samples': 9245376, 'steps': 48152, 'loss/train': 1.5753623247146606} -08/30/2021 21:56:56 - INFO - __main__ - Step 48154: {'lr': 0.0003893202660081014, 'samples': 9245568, 'steps': 48153, 'loss/train': 1.5248019695281982} -08/30/2021 21:56:57 - INFO - __main__ - Step 48155: {'lr': 0.00038931585965993384, 'samples': 9245760, 'steps': 48154, 'loss/train': 0.8895750641822815} -08/30/2021 21:56:58 - INFO - __main__ - Step 48156: {'lr': 0.0003893114532489926, 'samples': 9245952, 'steps': 48155, 'loss/train': 1.3698105812072754} -08/30/2021 21:56:58 - INFO - __main__ - Step 48157: {'lr': 0.00038930704677527975, 'samples': 9246144, 'steps': 48156, 'loss/train': 0.3844267725944519} -08/30/2021 21:56:58 - INFO - __main__ - Step 48158: {'lr': 0.00038930264023879737, 'samples': 9246336, 'steps': 48157, 'loss/train': 1.3581583499908447} -08/30/2021 21:56:59 - INFO - __main__ - Step 48159: {'lr': 0.0003892982336395473, 'samples': 9246528, 'steps': 48158, 'loss/train': 1.4068442583084106} -08/30/2021 21:57:00 - INFO - __main__ - Step 48160: {'lr': 0.00038929382697753157, 'samples': 9246720, 'steps': 48159, 'loss/train': 1.2846893072128296} -08/30/2021 21:57:01 - INFO - __main__ - Step 48161: {'lr': 0.00038928942025275227, 'samples': 9246912, 'steps': 48160, 'loss/train': 1.0771214962005615} -08/30/2021 21:57:01 - INFO - __main__ - Step 48162: {'lr': 0.00038928501346521127, 'samples': 9247104, 'steps': 48161, 'loss/train': 1.3963046073913574} -08/30/2021 21:57:01 - INFO - __main__ - Step 48163: {'lr': 0.0003892806066149106, 'samples': 9247296, 'steps': 48162, 'loss/train': 0.7078620791435242} -08/30/2021 21:57:02 - INFO - __main__ - Step 48164: {'lr': 0.00038927619970185225, 'samples': 9247488, 'steps': 48163, 'loss/train': 1.7483363151550293} -08/30/2021 21:57:03 - INFO - __main__ - Step 48165: {'lr': 0.0003892717927260382, 'samples': 9247680, 'steps': 48164, 'loss/train': 1.5239465236663818} -08/30/2021 21:57:04 - INFO - __main__ - Step 48166: {'lr': 0.00038926738568747035, 'samples': 9247872, 'steps': 48165, 'loss/train': 0.5878647565841675} -08/30/2021 21:57:04 - INFO - __main__ - Step 48167: {'lr': 0.0003892629785861509, 'samples': 9248064, 'steps': 48166, 'loss/train': 1.365415096282959} -08/30/2021 21:57:04 - INFO - __main__ - Step 48168: {'lr': 0.00038925857142208155, 'samples': 9248256, 'steps': 48167, 'loss/train': 0.9016124606132507} -08/30/2021 21:57:05 - INFO - __main__ - Step 48169: {'lr': 0.0003892541641952645, 'samples': 9248448, 'steps': 48168, 'loss/train': 1.375416874885559} -08/30/2021 21:57:06 - INFO - __main__ - Step 48170: {'lr': 0.00038924975690570173, 'samples': 9248640, 'steps': 48169, 'loss/train': 0.7157394289970398} -08/30/2021 21:57:07 - INFO - __main__ - Step 48171: {'lr': 0.0003892453495533951, 'samples': 9248832, 'steps': 48170, 'loss/train': 1.1825578212738037} -08/30/2021 21:57:07 - INFO - __main__ - Step 48172: {'lr': 0.0003892409421383467, 'samples': 9249024, 'steps': 48171, 'loss/train': 0.9246358871459961} -08/30/2021 21:57:07 - INFO - __main__ - Step 48173: {'lr': 0.0003892365346605584, 'samples': 9249216, 'steps': 48172, 'loss/train': 1.4163233041763306} -08/30/2021 21:57:08 - INFO - __main__ - Step 48174: {'lr': 0.0003892321271200324, 'samples': 9249408, 'steps': 48173, 'loss/train': 1.3543813228607178} -08/30/2021 21:57:09 - INFO - __main__ - Step 48175: {'lr': 0.0003892277195167705, 'samples': 9249600, 'steps': 48174, 'loss/train': 1.419616937637329} -08/30/2021 21:57:10 - INFO - __main__ - Step 48176: {'lr': 0.00038922331185077465, 'samples': 9249792, 'steps': 48175, 'loss/train': 1.7056647539138794} -08/30/2021 21:57:10 - INFO - __main__ - Step 48177: {'lr': 0.000389218904122047, 'samples': 9249984, 'steps': 48176, 'loss/train': 3.6409785747528076} -08/30/2021 21:57:11 - INFO - __main__ - Step 48178: {'lr': 0.00038921449633058945, 'samples': 9250176, 'steps': 48177, 'loss/train': 0.8499018549919128} -08/30/2021 21:57:11 - INFO - __main__ - Step 48179: {'lr': 0.00038921008847640407, 'samples': 9250368, 'steps': 48178, 'loss/train': 1.1665587425231934} -08/30/2021 21:57:13 - INFO - __main__ - Step 48180: {'lr': 0.0003892056805594926, 'samples': 9250560, 'steps': 48179, 'loss/train': 1.4057285785675049} -08/30/2021 21:57:13 - INFO - __main__ - Step 48181: {'lr': 0.0003892012725798574, 'samples': 9250752, 'steps': 48180, 'loss/train': 1.4164289236068726} -08/30/2021 21:57:13 - INFO - __main__ - Step 48182: {'lr': 0.00038919686453750015, 'samples': 9250944, 'steps': 48181, 'loss/train': 1.7442010641098022} -08/30/2021 21:57:14 - INFO - __main__ - Step 48183: {'lr': 0.0003891924564324229, 'samples': 9251136, 'steps': 48182, 'loss/train': 1.5402005910873413} -08/30/2021 21:57:14 - INFO - __main__ - Step 48184: {'lr': 0.0003891880482646277, 'samples': 9251328, 'steps': 48183, 'loss/train': 1.1800891160964966} -08/30/2021 21:57:16 - INFO - __main__ - Step 48185: {'lr': 0.00038918364003411656, 'samples': 9251520, 'steps': 48184, 'loss/train': 1.1317538022994995} -08/30/2021 21:57:16 - INFO - __main__ - Step 48186: {'lr': 0.0003891792317408914, 'samples': 9251712, 'steps': 48185, 'loss/train': 1.2964351177215576} -08/30/2021 21:57:16 - INFO - __main__ - Step 48187: {'lr': 0.00038917482338495424, 'samples': 9251904, 'steps': 48186, 'loss/train': 1.8063730001449585} -08/30/2021 21:57:17 - INFO - __main__ - Step 48188: {'lr': 0.000389170414966307, 'samples': 9252096, 'steps': 48187, 'loss/train': 1.4626551866531372} -08/30/2021 21:57:17 - INFO - __main__ - Step 48189: {'lr': 0.0003891660064849518, 'samples': 9252288, 'steps': 48188, 'loss/train': 1.568405032157898} -08/30/2021 21:57:19 - INFO - __main__ - Step 48190: {'lr': 0.00038916159794089044, 'samples': 9252480, 'steps': 48189, 'loss/train': 1.222964882850647} -08/30/2021 21:57:20 - INFO - __main__ - Step 48191: {'lr': 0.00038915718933412515, 'samples': 9252672, 'steps': 48190, 'loss/train': 1.3123953342437744} -08/30/2021 21:57:20 - INFO - __main__ - Step 48192: {'lr': 0.0003891527806646576, 'samples': 9252864, 'steps': 48191, 'loss/train': 1.147048830986023} -08/30/2021 21:57:20 - INFO - __main__ - Step 48193: {'lr': 0.0003891483719324901, 'samples': 9253056, 'steps': 48192, 'loss/train': 1.331035852432251} -08/30/2021 21:57:21 - INFO - __main__ - Step 48194: {'lr': 0.00038914396313762445, 'samples': 9253248, 'steps': 48193, 'loss/train': 1.5172207355499268} -08/30/2021 21:57:21 - INFO - __main__ - Step 48195: {'lr': 0.00038913955428006265, 'samples': 9253440, 'steps': 48194, 'loss/train': 1.5401694774627686} -08/30/2021 21:57:23 - INFO - __main__ - Step 48196: {'lr': 0.00038913514535980675, 'samples': 9253632, 'steps': 48195, 'loss/train': 0.1042097806930542} -08/30/2021 21:57:23 - INFO - __main__ - Step 48197: {'lr': 0.0003891307363768587, 'samples': 9253824, 'steps': 48196, 'loss/train': 1.6444669961929321} -08/30/2021 21:57:23 - INFO - __main__ - Step 48198: {'lr': 0.00038912632733122045, 'samples': 9254016, 'steps': 48197, 'loss/train': 1.709092617034912} -08/30/2021 21:57:24 - INFO - __main__ - Step 48199: {'lr': 0.000389121918222894, 'samples': 9254208, 'steps': 48198, 'loss/train': 1.2692484855651855} -08/30/2021 21:57:24 - INFO - __main__ - Step 48200: {'lr': 0.0003891175090518814, 'samples': 9254400, 'steps': 48199, 'loss/train': 1.3176255226135254} -08/30/2021 21:57:26 - INFO - __main__ - Step 48201: {'lr': 0.00038911309981818466, 'samples': 9254592, 'steps': 48200, 'loss/train': 1.8013050556182861} -08/30/2021 21:57:26 - INFO - __main__ - Step 48202: {'lr': 0.00038910869052180563, 'samples': 9254784, 'steps': 48201, 'loss/train': 1.311497449874878} -08/30/2021 21:57:26 - INFO - __main__ - Step 48203: {'lr': 0.00038910428116274644, 'samples': 9254976, 'steps': 48202, 'loss/train': 1.6864207983016968} -08/30/2021 21:57:27 - INFO - __main__ - Step 48204: {'lr': 0.0003890998717410089, 'samples': 9255168, 'steps': 48203, 'loss/train': 1.054111123085022} -08/30/2021 21:57:27 - INFO - __main__ - Step 48205: {'lr': 0.0003890954622565952, 'samples': 9255360, 'steps': 48204, 'loss/train': 1.192077398300171} -08/30/2021 21:57:29 - INFO - __main__ - Step 48206: {'lr': 0.00038909105270950716, 'samples': 9255552, 'steps': 48205, 'loss/train': 0.4235106110572815} -08/30/2021 21:57:29 - INFO - __main__ - Step 48207: {'lr': 0.0003890866430997468, 'samples': 9255744, 'steps': 48206, 'loss/train': 1.1917065382003784} -08/30/2021 21:57:30 - INFO - __main__ - Step 48208: {'lr': 0.0003890822334273163, 'samples': 9255936, 'steps': 48207, 'loss/train': 1.5207353830337524} -08/30/2021 21:57:30 - INFO - __main__ - Step 48209: {'lr': 0.0003890778236922174, 'samples': 9256128, 'steps': 48208, 'loss/train': 1.5800981521606445} -08/30/2021 21:57:30 - INFO - __main__ - Step 48210: {'lr': 0.00038907341389445217, 'samples': 9256320, 'steps': 48209, 'loss/train': 1.5544887781143188} -08/30/2021 21:57:32 - INFO - __main__ - Step 48211: {'lr': 0.0003890690040340226, 'samples': 9256512, 'steps': 48210, 'loss/train': 1.1500834226608276} -08/30/2021 21:57:32 - INFO - __main__ - Step 48212: {'lr': 0.00038906459411093075, 'samples': 9256704, 'steps': 48211, 'loss/train': 1.1569143533706665} -08/30/2021 21:57:33 - INFO - __main__ - Step 48213: {'lr': 0.0003890601841251785, 'samples': 9256896, 'steps': 48212, 'loss/train': 1.6261870861053467} -08/30/2021 21:57:33 - INFO - __main__ - Step 48214: {'lr': 0.0003890557740767678, 'samples': 9257088, 'steps': 48213, 'loss/train': 0.5921133160591125} -08/30/2021 21:57:33 - INFO - __main__ - Step 48215: {'lr': 0.00038905136396570085, 'samples': 9257280, 'steps': 48214, 'loss/train': 1.7807836532592773} -08/30/2021 21:57:35 - INFO - __main__ - Step 48216: {'lr': 0.0003890469537919794, 'samples': 9257472, 'steps': 48215, 'loss/train': 1.232125997543335} -08/30/2021 21:57:36 - INFO - __main__ - Step 48217: {'lr': 0.0003890425435556055, 'samples': 9257664, 'steps': 48216, 'loss/train': 1.121621012687683} -08/30/2021 21:57:36 - INFO - __main__ - Step 48218: {'lr': 0.0003890381332565813, 'samples': 9257856, 'steps': 48217, 'loss/train': 1.8275268077850342} -08/30/2021 21:57:36 - INFO - __main__ - Step 48219: {'lr': 0.00038903372289490865, 'samples': 9258048, 'steps': 48218, 'loss/train': 1.3870809078216553} -08/30/2021 21:57:37 - INFO - __main__ - Step 48220: {'lr': 0.0003890293124705895, 'samples': 9258240, 'steps': 48219, 'loss/train': 1.0716545581817627} -08/30/2021 21:57:37 - INFO - __main__ - Step 48221: {'lr': 0.0003890249019836259, 'samples': 9258432, 'steps': 48220, 'loss/train': 2.0319488048553467} -08/30/2021 21:57:39 - INFO - __main__ - Step 48222: {'lr': 0.0003890204914340198, 'samples': 9258624, 'steps': 48221, 'loss/train': 1.296714425086975} -08/30/2021 21:57:39 - INFO - __main__ - Step 48223: {'lr': 0.00038901608082177327, 'samples': 9258816, 'steps': 48222, 'loss/train': 0.04402359947562218} -08/30/2021 21:57:39 - INFO - __main__ - Step 48224: {'lr': 0.0003890116701468882, 'samples': 9259008, 'steps': 48223, 'loss/train': 1.3679606914520264} -08/30/2021 21:57:40 - INFO - __main__ - Step 48225: {'lr': 0.0003890072594093666, 'samples': 9259200, 'steps': 48224, 'loss/train': 0.8457120060920715} -08/30/2021 21:57:40 - INFO - __main__ - Step 48226: {'lr': 0.00038900284860921046, 'samples': 9259392, 'steps': 48225, 'loss/train': 1.311064600944519} -08/30/2021 21:57:42 - INFO - __main__ - Step 48227: {'lr': 0.00038899843774642184, 'samples': 9259584, 'steps': 48226, 'loss/train': 3.014810085296631} -08/30/2021 21:57:42 - INFO - __main__ - Step 48228: {'lr': 0.00038899402682100265, 'samples': 9259776, 'steps': 48227, 'loss/train': 1.0211178064346313} -08/30/2021 21:57:42 - INFO - __main__ - Step 48229: {'lr': 0.0003889896158329549, 'samples': 9259968, 'steps': 48228, 'loss/train': 1.471662163734436} -08/30/2021 21:57:43 - INFO - __main__ - Step 48230: {'lr': 0.00038898520478228055, 'samples': 9260160, 'steps': 48229, 'loss/train': 0.9295299053192139} -08/30/2021 21:57:43 - INFO - __main__ - Step 48231: {'lr': 0.00038898079366898164, 'samples': 9260352, 'steps': 48230, 'loss/train': 2.265153408050537} -08/30/2021 21:57:45 - INFO - __main__ - Step 48232: {'lr': 0.0003889763824930601, 'samples': 9260544, 'steps': 48231, 'loss/train': 1.3204606771469116} -08/30/2021 21:57:45 - INFO - __main__ - Step 48233: {'lr': 0.00038897197125451795, 'samples': 9260736, 'steps': 48232, 'loss/train': 1.5183383226394653} -08/30/2021 21:57:46 - INFO - __main__ - Step 48234: {'lr': 0.0003889675599533572, 'samples': 9260928, 'steps': 48233, 'loss/train': 1.4311165809631348} -08/30/2021 21:57:46 - INFO - __main__ - Step 48235: {'lr': 0.0003889631485895798, 'samples': 9261120, 'steps': 48234, 'loss/train': 1.4235327243804932} -08/30/2021 21:57:46 - INFO - __main__ - Step 48236: {'lr': 0.00038895873716318776, 'samples': 9261312, 'steps': 48235, 'loss/train': 1.9887962341308594} -08/30/2021 21:57:48 - INFO - __main__ - Step 48237: {'lr': 0.000388954325674183, 'samples': 9261504, 'steps': 48236, 'loss/train': 0.8699989914894104} -08/30/2021 21:57:48 - INFO - __main__ - Step 48238: {'lr': 0.00038894991412256766, 'samples': 9261696, 'steps': 48237, 'loss/train': 1.5515996217727661} -08/30/2021 21:57:48 - INFO - __main__ - Step 48239: {'lr': 0.00038894550250834355, 'samples': 9261888, 'steps': 48238, 'loss/train': 1.2451509237289429} -08/30/2021 21:57:49 - INFO - __main__ - Step 48240: {'lr': 0.00038894109083151274, 'samples': 9262080, 'steps': 48239, 'loss/train': 1.6446844339370728} -08/30/2021 21:57:49 - INFO - __main__ - Step 48241: {'lr': 0.0003889366790920773, 'samples': 9262272, 'steps': 48240, 'loss/train': 1.305234432220459} -08/30/2021 21:57:51 - INFO - __main__ - Step 48242: {'lr': 0.00038893226729003904, 'samples': 9262464, 'steps': 48241, 'loss/train': 2.496769905090332} -08/30/2021 21:57:52 - INFO - __main__ - Step 48243: {'lr': 0.0003889278554254001, 'samples': 9262656, 'steps': 48242, 'loss/train': 0.2142036408185959} -08/30/2021 21:57:52 - INFO - __main__ - Step 48244: {'lr': 0.00038892344349816246, 'samples': 9262848, 'steps': 48243, 'loss/train': 1.3455396890640259} -08/30/2021 21:57:52 - INFO - __main__ - Step 48245: {'lr': 0.00038891903150832795, 'samples': 9263040, 'steps': 48244, 'loss/train': 1.6460636854171753} -08/30/2021 21:57:53 - INFO - __main__ - Step 48246: {'lr': 0.00038891461945589866, 'samples': 9263232, 'steps': 48245, 'loss/train': 1.3758220672607422} -08/30/2021 21:57:53 - INFO - __main__ - Step 48247: {'lr': 0.0003889102073408767, 'samples': 9263424, 'steps': 48246, 'loss/train': 1.6581454277038574} -08/30/2021 21:57:55 - INFO - __main__ - Step 48248: {'lr': 0.0003889057951632639, 'samples': 9263616, 'steps': 48247, 'loss/train': 0.8149415850639343} -08/30/2021 21:57:55 - INFO - __main__ - Step 48249: {'lr': 0.0003889013829230623, 'samples': 9263808, 'steps': 48248, 'loss/train': 1.3481032848358154} -08/30/2021 21:57:56 - INFO - __main__ - Step 48250: {'lr': 0.00038889697062027384, 'samples': 9264000, 'steps': 48249, 'loss/train': 1.7648568153381348} -08/30/2021 21:57:56 - INFO - __main__ - Step 48251: {'lr': 0.00038889255825490053, 'samples': 9264192, 'steps': 48250, 'loss/train': 1.4959568977355957} -08/30/2021 21:57:56 - INFO - __main__ - Step 48252: {'lr': 0.0003888881458269444, 'samples': 9264384, 'steps': 48251, 'loss/train': 1.0035902261734009} -08/30/2021 21:57:58 - INFO - __main__ - Step 48253: {'lr': 0.00038888373333640746, 'samples': 9264576, 'steps': 48252, 'loss/train': 1.2284576892852783} -08/30/2021 21:57:58 - INFO - __main__ - Step 48254: {'lr': 0.00038887932078329165, 'samples': 9264768, 'steps': 48253, 'loss/train': 1.819913625717163} -08/30/2021 21:57:59 - INFO - __main__ - Step 48255: {'lr': 0.00038887490816759895, 'samples': 9264960, 'steps': 48254, 'loss/train': 1.5095142126083374} -08/30/2021 21:57:59 - INFO - __main__ - Step 48256: {'lr': 0.00038887049548933135, 'samples': 9265152, 'steps': 48255, 'loss/train': 1.1086269617080688} -08/30/2021 21:57:59 - INFO - __main__ - Step 48257: {'lr': 0.0003888660827484908, 'samples': 9265344, 'steps': 48256, 'loss/train': 1.3071212768554688} -08/30/2021 21:58:01 - INFO - __main__ - Step 48258: {'lr': 0.00038886166994507945, 'samples': 9265536, 'steps': 48257, 'loss/train': 1.7825593948364258} -08/30/2021 21:58:01 - INFO - __main__ - Step 48259: {'lr': 0.00038885725707909905, 'samples': 9265728, 'steps': 48258, 'loss/train': 1.3432456254959106} -08/30/2021 21:58:02 - INFO - __main__ - Step 48260: {'lr': 0.0003888528441505518, 'samples': 9265920, 'steps': 48259, 'loss/train': 1.4666707515716553} -08/30/2021 21:58:02 - INFO - __main__ - Step 48261: {'lr': 0.00038884843115943955, 'samples': 9266112, 'steps': 48260, 'loss/train': 1.1235095262527466} -08/30/2021 21:58:02 - INFO - __main__ - Step 48262: {'lr': 0.00038884401810576434, 'samples': 9266304, 'steps': 48261, 'loss/train': 1.0756359100341797} -08/30/2021 21:58:04 - INFO - __main__ - Step 48263: {'lr': 0.0003888396049895282, 'samples': 9266496, 'steps': 48262, 'loss/train': 1.815375566482544} -08/30/2021 21:58:04 - INFO - __main__ - Step 48264: {'lr': 0.000388835191810733, 'samples': 9266688, 'steps': 48263, 'loss/train': 1.6188507080078125} -08/30/2021 21:58:05 - INFO - __main__ - Step 48265: {'lr': 0.0003888307785693809, 'samples': 9266880, 'steps': 48264, 'loss/train': 1.4475008249282837} -08/30/2021 21:58:05 - INFO - __main__ - Step 48266: {'lr': 0.0003888263652654738, 'samples': 9267072, 'steps': 48265, 'loss/train': 1.5052590370178223} -08/30/2021 21:58:05 - INFO - __main__ - Step 48267: {'lr': 0.0003888219518990136, 'samples': 9267264, 'steps': 48266, 'loss/train': 1.113168716430664} -08/30/2021 21:58:07 - INFO - __main__ - Step 48268: {'lr': 0.0003888175384700024, 'samples': 9267456, 'steps': 48267, 'loss/train': 1.3512853384017944} -08/30/2021 21:58:07 - INFO - __main__ - Step 48269: {'lr': 0.0003888131249784421, 'samples': 9267648, 'steps': 48268, 'loss/train': 1.8217908143997192} -08/30/2021 21:58:08 - INFO - __main__ - Step 48270: {'lr': 0.00038880871142433484, 'samples': 9267840, 'steps': 48269, 'loss/train': 1.1951217651367188} -08/30/2021 21:58:08 - INFO - __main__ - Step 48271: {'lr': 0.0003888042978076825, 'samples': 9268032, 'steps': 48270, 'loss/train': 0.6636618971824646} -08/30/2021 21:58:08 - INFO - __main__ - Step 48272: {'lr': 0.00038879988412848706, 'samples': 9268224, 'steps': 48271, 'loss/train': 1.0012128353118896} -08/30/2021 21:58:10 - INFO - __main__ - Step 48273: {'lr': 0.00038879547038675054, 'samples': 9268416, 'steps': 48272, 'loss/train': 2.0873050689697266} -08/30/2021 21:58:10 - INFO - __main__ - Step 48274: {'lr': 0.0003887910565824749, 'samples': 9268608, 'steps': 48273, 'loss/train': 0.6913456916809082} -08/30/2021 21:58:11 - INFO - __main__ - Step 48275: {'lr': 0.0003887866427156622, 'samples': 9268800, 'steps': 48274, 'loss/train': 1.6065735816955566} -08/30/2021 21:58:11 - INFO - __main__ - Step 48276: {'lr': 0.00038878222878631444, 'samples': 9268992, 'steps': 48275, 'loss/train': 1.3543517589569092} -08/30/2021 21:58:11 - INFO - __main__ - Step 48277: {'lr': 0.0003887778147944334, 'samples': 9269184, 'steps': 48276, 'loss/train': 1.6978094577789307} -08/30/2021 21:58:13 - INFO - __main__ - Step 48278: {'lr': 0.0003887734007400213, 'samples': 9269376, 'steps': 48277, 'loss/train': 0.6138620972633362} -08/30/2021 21:58:13 - INFO - __main__ - Step 48279: {'lr': 0.00038876898662308, 'samples': 9269568, 'steps': 48278, 'loss/train': 1.3005942106246948} -08/30/2021 21:58:14 - INFO - __main__ - Step 48280: {'lr': 0.00038876457244361166, 'samples': 9269760, 'steps': 48279, 'loss/train': 1.3384491205215454} -08/30/2021 21:58:14 - INFO - __main__ - Step 48281: {'lr': 0.000388760158201618, 'samples': 9269952, 'steps': 48280, 'loss/train': 1.2069329023361206} -08/30/2021 21:58:14 - INFO - __main__ - Step 48282: {'lr': 0.0003887557438971012, 'samples': 9270144, 'steps': 48281, 'loss/train': 1.4133845567703247} -08/30/2021 21:58:15 - INFO - __main__ - Step 48283: {'lr': 0.0003887513295300632, 'samples': 9270336, 'steps': 48282, 'loss/train': 1.0987493991851807} -08/30/2021 21:58:16 - INFO - __main__ - Step 48284: {'lr': 0.00038874691510050604, 'samples': 9270528, 'steps': 48283, 'loss/train': 1.3501638174057007} -08/30/2021 21:58:17 - INFO - __main__ - Step 48285: {'lr': 0.00038874250060843163, 'samples': 9270720, 'steps': 48284, 'loss/train': 1.2690856456756592} -08/30/2021 21:58:17 - INFO - __main__ - Step 48286: {'lr': 0.00038873808605384197, 'samples': 9270912, 'steps': 48285, 'loss/train': 1.2772575616836548} -08/30/2021 21:58:17 - INFO - __main__ - Step 48287: {'lr': 0.0003887336714367391, 'samples': 9271104, 'steps': 48286, 'loss/train': 1.1695002317428589} -08/30/2021 21:58:18 - INFO - __main__ - Step 48288: {'lr': 0.00038872925675712493, 'samples': 9271296, 'steps': 48287, 'loss/train': 1.7818000316619873} -08/30/2021 21:58:19 - INFO - __main__ - Step 48289: {'lr': 0.0003887248420150016, 'samples': 9271488, 'steps': 48288, 'loss/train': 1.5280708074569702} -08/30/2021 21:58:20 - INFO - __main__ - Step 48290: {'lr': 0.00038872042721037087, 'samples': 9271680, 'steps': 48289, 'loss/train': 1.4469332695007324} -08/30/2021 21:58:20 - INFO - __main__ - Step 48291: {'lr': 0.00038871601234323494, 'samples': 9271872, 'steps': 48290, 'loss/train': 1.1884874105453491} -08/30/2021 21:58:20 - INFO - __main__ - Step 48292: {'lr': 0.00038871159741359567, 'samples': 9272064, 'steps': 48291, 'loss/train': 1.6146996021270752} -08/30/2021 21:58:21 - INFO - __main__ - Step 48293: {'lr': 0.0003887071824214551, 'samples': 9272256, 'steps': 48292, 'loss/train': 1.3789864778518677} -08/30/2021 21:58:23 - INFO - __main__ - Step 48294: {'lr': 0.0003887027673668152, 'samples': 9272448, 'steps': 48293, 'loss/train': 1.115086317062378} -08/30/2021 21:58:23 - INFO - __main__ - Step 48295: {'lr': 0.0003886983522496781, 'samples': 9272640, 'steps': 48294, 'loss/train': 1.1463960409164429} -08/30/2021 21:58:24 - INFO - __main__ - Step 48296: {'lr': 0.00038869393707004554, 'samples': 9272832, 'steps': 48295, 'loss/train': 1.7747620344161987} -08/30/2021 21:58:24 - INFO - __main__ - Step 48297: {'lr': 0.00038868952182791964, 'samples': 9273024, 'steps': 48296, 'loss/train': 1.1227610111236572} -08/30/2021 21:58:24 - INFO - __main__ - Step 48298: {'lr': 0.0003886851065233024, 'samples': 9273216, 'steps': 48297, 'loss/train': 1.5021138191223145} -08/30/2021 21:58:26 - INFO - __main__ - Step 48299: {'lr': 0.0003886806911561958, 'samples': 9273408, 'steps': 48298, 'loss/train': 1.6091890335083008} -08/30/2021 21:58:26 - INFO - __main__ - Step 48300: {'lr': 0.0003886762757266018, 'samples': 9273600, 'steps': 48299, 'loss/train': 1.3598541021347046} -08/30/2021 21:58:27 - INFO - __main__ - Step 48301: {'lr': 0.0003886718602345224, 'samples': 9273792, 'steps': 48300, 'loss/train': 1.5867159366607666} -08/30/2021 21:58:27 - INFO - __main__ - Step 48302: {'lr': 0.0003886674446799596, 'samples': 9273984, 'steps': 48301, 'loss/train': 1.312446117401123} -08/30/2021 21:58:27 - INFO - __main__ - Step 48303: {'lr': 0.00038866302906291546, 'samples': 9274176, 'steps': 48302, 'loss/train': 0.038343943655490875} -08/30/2021 21:58:29 - INFO - __main__ - Step 48304: {'lr': 0.0003886586133833918, 'samples': 9274368, 'steps': 48303, 'loss/train': 1.187606692314148} -08/30/2021 21:58:29 - INFO - __main__ - Step 48305: {'lr': 0.00038865419764139077, 'samples': 9274560, 'steps': 48304, 'loss/train': 0.21710127592086792} -08/30/2021 21:58:30 - INFO - __main__ - Step 48306: {'lr': 0.00038864978183691425, 'samples': 9274752, 'steps': 48305, 'loss/train': 1.1679391860961914} -08/30/2021 21:58:30 - INFO - __main__ - Step 48307: {'lr': 0.00038864536596996437, 'samples': 9274944, 'steps': 48306, 'loss/train': 1.4437044858932495} -08/30/2021 21:58:31 - INFO - __main__ - Step 48308: {'lr': 0.0003886409500405429, 'samples': 9275136, 'steps': 48307, 'loss/train': 0.963511049747467} -08/30/2021 21:58:32 - INFO - __main__ - Step 48309: {'lr': 0.00038863653404865207, 'samples': 9275328, 'steps': 48308, 'loss/train': 1.4042670726776123} -08/30/2021 21:58:32 - INFO - __main__ - Step 48310: {'lr': 0.0003886321179942937, 'samples': 9275520, 'steps': 48309, 'loss/train': 1.1079864501953125} -08/30/2021 21:58:33 - INFO - __main__ - Step 48311: {'lr': 0.0003886277018774699, 'samples': 9275712, 'steps': 48310, 'loss/train': 1.093345284461975} -08/30/2021 21:58:33 - INFO - __main__ - Step 48312: {'lr': 0.0003886232856981825, 'samples': 9275904, 'steps': 48311, 'loss/train': 1.77463698387146} -08/30/2021 21:58:34 - INFO - __main__ - Step 48313: {'lr': 0.00038861886945643363, 'samples': 9276096, 'steps': 48312, 'loss/train': 1.984765887260437} -08/30/2021 21:58:35 - INFO - __main__ - Step 48314: {'lr': 0.00038861445315222523, 'samples': 9276288, 'steps': 48313, 'loss/train': 0.5787181258201599} -08/30/2021 21:58:36 - INFO - __main__ - Step 48315: {'lr': 0.00038861003678555936, 'samples': 9276480, 'steps': 48314, 'loss/train': 0.8000352382659912} -08/30/2021 21:58:36 - INFO - __main__ - Step 48316: {'lr': 0.00038860562035643786, 'samples': 9276672, 'steps': 48315, 'loss/train': 1.992283582687378} -08/30/2021 21:58:37 - INFO - __main__ - Step 48317: {'lr': 0.00038860120386486285, 'samples': 9276864, 'steps': 48316, 'loss/train': 1.4223742485046387} -08/30/2021 21:58:37 - INFO - __main__ - Step 48318: {'lr': 0.00038859678731083627, 'samples': 9277056, 'steps': 48317, 'loss/train': 1.3210381269454956} -08/30/2021 21:58:37 - INFO - __main__ - Step 48319: {'lr': 0.0003885923706943601, 'samples': 9277248, 'steps': 48318, 'loss/train': 0.06078751012682915} -08/30/2021 21:58:39 - INFO - __main__ - Step 48320: {'lr': 0.00038858795401543634, 'samples': 9277440, 'steps': 48319, 'loss/train': 1.268423080444336} -08/30/2021 21:58:39 - INFO - __main__ - Step 48321: {'lr': 0.000388583537274067, 'samples': 9277632, 'steps': 48320, 'loss/train': 1.5062557458877563} -08/30/2021 21:58:39 - INFO - __main__ - Step 48322: {'lr': 0.0003885791204702541, 'samples': 9277824, 'steps': 48321, 'loss/train': 1.3718653917312622} -08/30/2021 21:58:40 - INFO - __main__ - Step 48323: {'lr': 0.0003885747036039995, 'samples': 9278016, 'steps': 48322, 'loss/train': 1.2255308628082275} -08/30/2021 21:58:40 - INFO - __main__ - Step 48324: {'lr': 0.0003885702866753054, 'samples': 9278208, 'steps': 48323, 'loss/train': 1.0981525182724} -08/30/2021 21:58:42 - INFO - __main__ - Step 48325: {'lr': 0.00038856586968417353, 'samples': 9278400, 'steps': 48324, 'loss/train': 1.5038059949874878} -08/30/2021 21:58:42 - INFO - __main__ - Step 48326: {'lr': 0.00038856145263060606, 'samples': 9278592, 'steps': 48325, 'loss/train': 1.1133569478988647} -08/30/2021 21:58:43 - INFO - __main__ - Step 48327: {'lr': 0.00038855703551460497, 'samples': 9278784, 'steps': 48326, 'loss/train': 1.0519733428955078} -08/30/2021 21:58:43 - INFO - __main__ - Step 48328: {'lr': 0.00038855261833617216, 'samples': 9278976, 'steps': 48327, 'loss/train': 0.07743918895721436} -08/30/2021 21:58:43 - INFO - __main__ - Step 48329: {'lr': 0.00038854820109530974, 'samples': 9279168, 'steps': 48328, 'loss/train': 0.9702709317207336} -08/30/2021 21:58:45 - INFO - __main__ - Step 48330: {'lr': 0.00038854378379201966, 'samples': 9279360, 'steps': 48329, 'loss/train': 1.2366012334823608} -08/30/2021 21:58:45 - INFO - __main__ - Step 48331: {'lr': 0.0003885393664263038, 'samples': 9279552, 'steps': 48330, 'loss/train': 1.2706016302108765} -08/30/2021 21:58:46 - INFO - __main__ - Step 48332: {'lr': 0.00038853494899816434, 'samples': 9279744, 'steps': 48331, 'loss/train': 1.6393556594848633} -08/30/2021 21:58:46 - INFO - __main__ - Step 48333: {'lr': 0.0003885305315076031, 'samples': 9279936, 'steps': 48332, 'loss/train': 1.8684183359146118} -08/30/2021 21:58:46 - INFO - __main__ - Step 48334: {'lr': 0.0003885261139546221, 'samples': 9280128, 'steps': 48333, 'loss/train': 1.480150818824768} -08/30/2021 21:58:48 - INFO - __main__ - Step 48335: {'lr': 0.00038852169633922344, 'samples': 9280320, 'steps': 48334, 'loss/train': 1.5422346591949463} -08/30/2021 21:58:48 - INFO - __main__ - Step 48336: {'lr': 0.00038851727866140906, 'samples': 9280512, 'steps': 48335, 'loss/train': 1.3034451007843018} -08/30/2021 21:58:49 - INFO - __main__ - Step 48337: {'lr': 0.00038851286092118095, 'samples': 9280704, 'steps': 48336, 'loss/train': 0.8110340237617493} -08/30/2021 21:58:49 - INFO - __main__ - Step 48338: {'lr': 0.0003885084431185411, 'samples': 9280896, 'steps': 48337, 'loss/train': 1.1553807258605957} -08/30/2021 21:58:49 - INFO - __main__ - Step 48339: {'lr': 0.0003885040252534913, 'samples': 9281088, 'steps': 48338, 'loss/train': 0.9764419794082642} -08/30/2021 21:58:50 - INFO - __main__ - Step 48340: {'lr': 0.00038849960732603386, 'samples': 9281280, 'steps': 48339, 'loss/train': 0.7394328117370605} -08/30/2021 21:58:51 - INFO - __main__ - Step 48341: {'lr': 0.00038849518933617064, 'samples': 9281472, 'steps': 48340, 'loss/train': 1.1356828212738037} -08/30/2021 21:58:52 - INFO - __main__ - Step 48342: {'lr': 0.0003884907712839036, 'samples': 9281664, 'steps': 48341, 'loss/train': 1.5415717363357544} -08/30/2021 21:58:52 - INFO - __main__ - Step 48343: {'lr': 0.00038848635316923475, 'samples': 9281856, 'steps': 48342, 'loss/train': 1.4904346466064453} -08/30/2021 21:58:52 - INFO - __main__ - Step 48344: {'lr': 0.0003884819349921661, 'samples': 9282048, 'steps': 48343, 'loss/train': 1.1626802682876587} -08/30/2021 21:58:53 - INFO - __main__ - Step 48345: {'lr': 0.0003884775167526996, 'samples': 9282240, 'steps': 48344, 'loss/train': 2.119408130645752} -08/30/2021 21:58:54 - INFO - __main__ - Step 48346: {'lr': 0.0003884730984508373, 'samples': 9282432, 'steps': 48345, 'loss/train': 1.39040207862854} -08/30/2021 21:58:55 - INFO - __main__ - Step 48347: {'lr': 0.0003884686800865812, 'samples': 9282624, 'steps': 48346, 'loss/train': 1.1078393459320068} -08/30/2021 21:58:55 - INFO - __main__ - Step 48348: {'lr': 0.0003884642616599331, 'samples': 9282816, 'steps': 48347, 'loss/train': 0.9484126567840576} -08/30/2021 21:58:55 - INFO - __main__ - Step 48349: {'lr': 0.00038845984317089526, 'samples': 9283008, 'steps': 48348, 'loss/train': 1.0910555124282837} -08/30/2021 21:58:56 - INFO - __main__ - Step 48350: {'lr': 0.00038845542461946953, 'samples': 9283200, 'steps': 48349, 'loss/train': 1.940859317779541} -08/30/2021 21:58:58 - INFO - __main__ - Step 48351: {'lr': 0.00038845100600565794, 'samples': 9283392, 'steps': 48350, 'loss/train': 1.7277929782867432} -08/30/2021 21:58:58 - INFO - __main__ - Step 48352: {'lr': 0.00038844658732946244, 'samples': 9283584, 'steps': 48351, 'loss/train': 1.2096253633499146} -08/30/2021 21:58:59 - INFO - __main__ - Step 48353: {'lr': 0.000388442168590885, 'samples': 9283776, 'steps': 48352, 'loss/train': 1.2793059349060059} -08/30/2021 21:58:59 - INFO - __main__ - Step 48354: {'lr': 0.00038843774978992773, 'samples': 9283968, 'steps': 48353, 'loss/train': 1.665263056755066} -08/30/2021 21:58:59 - INFO - __main__ - Step 48355: {'lr': 0.0003884333309265925, 'samples': 9284160, 'steps': 48354, 'loss/train': 1.4314162731170654} -08/30/2021 21:59:00 - INFO - __main__ - Step 48356: {'lr': 0.00038842891200088135, 'samples': 9284352, 'steps': 48355, 'loss/train': 1.1668885946273804} -08/30/2021 21:59:02 - INFO - __main__ - Step 48357: {'lr': 0.0003884244930127963, 'samples': 9284544, 'steps': 48356, 'loss/train': 1.2831779718399048} -08/30/2021 21:59:02 - INFO - __main__ - Step 48358: {'lr': 0.0003884200739623393, 'samples': 9284736, 'steps': 48357, 'loss/train': 1.6840825080871582} -08/30/2021 21:59:02 - INFO - __main__ - Step 48359: {'lr': 0.00038841565484951237, 'samples': 9284928, 'steps': 48358, 'loss/train': 1.087289571762085} -08/30/2021 21:59:03 - INFO - __main__ - Step 48360: {'lr': 0.0003884112356743175, 'samples': 9285120, 'steps': 48359, 'loss/train': 1.6617010831832886} -08/30/2021 21:59:03 - INFO - __main__ - Step 48361: {'lr': 0.0003884068164367566, 'samples': 9285312, 'steps': 48360, 'loss/train': 1.6421316862106323} -08/30/2021 21:59:05 - INFO - __main__ - Step 48362: {'lr': 0.00038840239713683165, 'samples': 9285504, 'steps': 48361, 'loss/train': 1.23919677734375} -08/30/2021 21:59:05 - INFO - __main__ - Step 48363: {'lr': 0.0003883979777745449, 'samples': 9285696, 'steps': 48362, 'loss/train': 0.9007788896560669} -08/30/2021 21:59:05 - INFO - __main__ - Step 48364: {'lr': 0.00038839355834989806, 'samples': 9285888, 'steps': 48363, 'loss/train': 1.819191813468933} -08/30/2021 21:59:06 - INFO - __main__ - Step 48365: {'lr': 0.0003883891388628932, 'samples': 9286080, 'steps': 48364, 'loss/train': 1.2570253610610962} -08/30/2021 21:59:06 - INFO - __main__ - Step 48366: {'lr': 0.0003883847193135323, 'samples': 9286272, 'steps': 48365, 'loss/train': 0.1363932490348816} -08/30/2021 21:59:08 - INFO - __main__ - Step 48367: {'lr': 0.0003883802997018174, 'samples': 9286464, 'steps': 48366, 'loss/train': 1.0962309837341309} -08/30/2021 21:59:08 - INFO - __main__ - Step 48368: {'lr': 0.00038837588002775054, 'samples': 9286656, 'steps': 48367, 'loss/train': 1.1666758060455322} -08/30/2021 21:59:08 - INFO - __main__ - Step 48369: {'lr': 0.0003883714602913336, 'samples': 9286848, 'steps': 48368, 'loss/train': 1.0255509614944458} -08/30/2021 21:59:09 - INFO - __main__ - Step 48370: {'lr': 0.00038836704049256864, 'samples': 9287040, 'steps': 48369, 'loss/train': 1.2940367460250854} -08/30/2021 21:59:09 - INFO - __main__ - Step 48371: {'lr': 0.0003883626206314577, 'samples': 9287232, 'steps': 48370, 'loss/train': 1.3935354948043823} -08/30/2021 21:59:09 - INFO - __main__ - Step 48372: {'lr': 0.0003883582007080025, 'samples': 9287424, 'steps': 48371, 'loss/train': 1.1138713359832764} -08/30/2021 21:59:11 - INFO - __main__ - Step 48373: {'lr': 0.0003883537807222054, 'samples': 9287616, 'steps': 48372, 'loss/train': 1.8047584295272827} -08/30/2021 21:59:11 - INFO - __main__ - Step 48374: {'lr': 0.0003883493606740681, 'samples': 9287808, 'steps': 48373, 'loss/train': 1.9533841609954834} -08/30/2021 21:59:12 - INFO - __main__ - Step 48375: {'lr': 0.0003883449405635928, 'samples': 9288000, 'steps': 48374, 'loss/train': 1.3703405857086182} -08/30/2021 21:59:12 - INFO - __main__ - Step 48376: {'lr': 0.0003883405203907814, 'samples': 9288192, 'steps': 48375, 'loss/train': 1.1228867769241333} -08/30/2021 21:59:12 - INFO - __main__ - Step 48377: {'lr': 0.0003883361001556359, 'samples': 9288384, 'steps': 48376, 'loss/train': 1.0904194116592407} -08/30/2021 21:59:14 - INFO - __main__ - Step 48378: {'lr': 0.0003883316798581582, 'samples': 9288576, 'steps': 48377, 'loss/train': 0.3879660367965698} -08/30/2021 21:59:14 - INFO - __main__ - Step 48379: {'lr': 0.0003883272594983505, 'samples': 9288768, 'steps': 48378, 'loss/train': 1.7464022636413574} -08/30/2021 21:59:15 - INFO - __main__ - Step 48380: {'lr': 0.00038832283907621457, 'samples': 9288960, 'steps': 48379, 'loss/train': 1.7930223941802979} -08/30/2021 21:59:15 - INFO - __main__ - Step 48381: {'lr': 0.00038831841859175253, 'samples': 9289152, 'steps': 48380, 'loss/train': 1.3664124011993408} -08/30/2021 21:59:16 - INFO - __main__ - Step 48382: {'lr': 0.0003883139980449664, 'samples': 9289344, 'steps': 48381, 'loss/train': 1.7374769449234009} -08/30/2021 21:59:17 - INFO - __main__ - Step 48383: {'lr': 0.00038830957743585807, 'samples': 9289536, 'steps': 48382, 'loss/train': 0.6134921312332153} -08/30/2021 21:59:17 - INFO - __main__ - Step 48384: {'lr': 0.0003883051567644296, 'samples': 9289728, 'steps': 48383, 'loss/train': 1.443073034286499} -08/30/2021 21:59:18 - INFO - __main__ - Step 48385: {'lr': 0.00038830073603068297, 'samples': 9289920, 'steps': 48384, 'loss/train': 0.6213002800941467} -08/30/2021 21:59:18 - INFO - __main__ - Step 48386: {'lr': 0.00038829631523462003, 'samples': 9290112, 'steps': 48385, 'loss/train': 1.1812790632247925} -08/30/2021 21:59:18 - INFO - __main__ - Step 48387: {'lr': 0.000388291894376243, 'samples': 9290304, 'steps': 48386, 'loss/train': 1.1856460571289062} -08/30/2021 21:59:20 - INFO - __main__ - Step 48388: {'lr': 0.0003882874734555538, 'samples': 9290496, 'steps': 48387, 'loss/train': 1.2674168348312378} -08/30/2021 21:59:20 - INFO - __main__ - Step 48389: {'lr': 0.00038828305247255447, 'samples': 9290688, 'steps': 48388, 'loss/train': 1.4452506303787231} -08/30/2021 21:59:21 - INFO - __main__ - Step 48390: {'lr': 0.00038827863142724685, 'samples': 9290880, 'steps': 48389, 'loss/train': 1.6292476654052734} -08/30/2021 21:59:21 - INFO - __main__ - Step 48391: {'lr': 0.00038827421031963294, 'samples': 9291072, 'steps': 48390, 'loss/train': 0.7993712425231934} -08/30/2021 21:59:21 - INFO - __main__ - Step 48392: {'lr': 0.0003882697891497149, 'samples': 9291264, 'steps': 48391, 'loss/train': 1.254414677619934} -08/30/2021 21:59:23 - INFO - __main__ - Step 48393: {'lr': 0.00038826536791749454, 'samples': 9291456, 'steps': 48392, 'loss/train': 1.0764840841293335} -08/30/2021 21:59:23 - INFO - __main__ - Step 48394: {'lr': 0.00038826094662297404, 'samples': 9291648, 'steps': 48393, 'loss/train': 1.522329568862915} -08/30/2021 21:59:24 - INFO - __main__ - Step 48395: {'lr': 0.0003882565252661553, 'samples': 9291840, 'steps': 48394, 'loss/train': 1.815787672996521} -08/30/2021 21:59:24 - INFO - __main__ - Step 48396: {'lr': 0.00038825210384704024, 'samples': 9292032, 'steps': 48395, 'loss/train': 1.24665367603302} -08/30/2021 21:59:25 - INFO - __main__ - Step 48397: {'lr': 0.0003882476823656309, 'samples': 9292224, 'steps': 48396, 'loss/train': 1.9732352495193481} -08/30/2021 21:59:25 - INFO - __main__ - Step 48398: {'lr': 0.00038824326082192935, 'samples': 9292416, 'steps': 48397, 'loss/train': 1.3705459833145142} -08/30/2021 21:59:26 - INFO - __main__ - Step 48399: {'lr': 0.0003882388392159375, 'samples': 9292608, 'steps': 48398, 'loss/train': 1.7985793352127075} -08/30/2021 21:59:27 - INFO - __main__ - Step 48400: {'lr': 0.0003882344175476573, 'samples': 9292800, 'steps': 48399, 'loss/train': 1.1154745817184448} -08/30/2021 21:59:27 - INFO - __main__ - Step 48401: {'lr': 0.00038822999581709087, 'samples': 9292992, 'steps': 48400, 'loss/train': 1.4069701433181763} -08/30/2021 21:59:28 - INFO - __main__ - Step 48402: {'lr': 0.0003882255740242401, 'samples': 9293184, 'steps': 48401, 'loss/train': 1.6385899782180786} -08/30/2021 21:59:28 - INFO - __main__ - Step 48403: {'lr': 0.0003882211521691071, 'samples': 9293376, 'steps': 48402, 'loss/train': 1.8790549039840698} -08/30/2021 21:59:30 - INFO - __main__ - Step 48404: {'lr': 0.0003882167302516937, 'samples': 9293568, 'steps': 48403, 'loss/train': 1.8087621927261353} -08/30/2021 21:59:30 - INFO - __main__ - Step 48405: {'lr': 0.000388212308272002, 'samples': 9293760, 'steps': 48404, 'loss/train': 0.7198596596717834} -08/30/2021 21:59:31 - INFO - __main__ - Step 48406: {'lr': 0.00038820788623003397, 'samples': 9293952, 'steps': 48405, 'loss/train': 0.9973756074905396} -08/30/2021 21:59:31 - INFO - __main__ - Step 48407: {'lr': 0.00038820346412579156, 'samples': 9294144, 'steps': 48406, 'loss/train': 1.493796467781067} -08/30/2021 21:59:31 - INFO - __main__ - Step 48408: {'lr': 0.0003881990419592768, 'samples': 9294336, 'steps': 48407, 'loss/train': 1.2681516408920288} -08/30/2021 21:59:33 - INFO - __main__ - Step 48409: {'lr': 0.00038819461973049177, 'samples': 9294528, 'steps': 48408, 'loss/train': 1.3363465070724487} -08/30/2021 21:59:33 - INFO - __main__ - Step 48410: {'lr': 0.00038819019743943834, 'samples': 9294720, 'steps': 48409, 'loss/train': 2.367302894592285} -08/30/2021 21:59:34 - INFO - __main__ - Step 48411: {'lr': 0.00038818577508611854, 'samples': 9294912, 'steps': 48410, 'loss/train': 1.161450982093811} -08/30/2021 21:59:34 - INFO - __main__ - Step 48412: {'lr': 0.00038818135267053435, 'samples': 9295104, 'steps': 48411, 'loss/train': 1.2520462274551392} -08/30/2021 21:59:34 - INFO - __main__ - Step 48413: {'lr': 0.00038817693019268775, 'samples': 9295296, 'steps': 48412, 'loss/train': 1.4962916374206543} -08/30/2021 21:59:36 - INFO - __main__ - Step 48414: {'lr': 0.0003881725076525808, 'samples': 9295488, 'steps': 48413, 'loss/train': 1.604047179222107} -08/30/2021 21:59:36 - INFO - __main__ - Step 48415: {'lr': 0.0003881680850502154, 'samples': 9295680, 'steps': 48414, 'loss/train': 1.1570351123809814} -08/30/2021 21:59:37 - INFO - __main__ - Step 48416: {'lr': 0.00038816366238559366, 'samples': 9295872, 'steps': 48415, 'loss/train': 1.3183537721633911} -08/30/2021 21:59:37 - INFO - __main__ - Step 48417: {'lr': 0.00038815923965871747, 'samples': 9296064, 'steps': 48416, 'loss/train': 1.0234194993972778} -08/30/2021 21:59:37 - INFO - __main__ - Step 48418: {'lr': 0.00038815481686958883, 'samples': 9296256, 'steps': 48417, 'loss/train': 1.5382137298583984} -08/30/2021 21:59:39 - INFO - __main__ - Step 48419: {'lr': 0.0003881503940182098, 'samples': 9296448, 'steps': 48418, 'loss/train': 0.362134724855423} -08/30/2021 21:59:39 - INFO - __main__ - Step 48420: {'lr': 0.0003881459711045823, 'samples': 9296640, 'steps': 48419, 'loss/train': 1.6999907493591309} -08/30/2021 21:59:40 - INFO - __main__ - Step 48421: {'lr': 0.0003881415481287084, 'samples': 9296832, 'steps': 48420, 'loss/train': 0.5085893273353577} -08/30/2021 21:59:40 - INFO - __main__ - Step 48422: {'lr': 0.00038813712509058995, 'samples': 9297024, 'steps': 48421, 'loss/train': 1.0744240283966064} -08/30/2021 21:59:40 - INFO - __main__ - Step 48423: {'lr': 0.0003881327019902292, 'samples': 9297216, 'steps': 48422, 'loss/train': 1.4352797269821167} -08/30/2021 21:59:42 - INFO - __main__ - Step 48424: {'lr': 0.00038812827882762793, 'samples': 9297408, 'steps': 48423, 'loss/train': 1.353934645652771} -08/30/2021 21:59:42 - INFO - __main__ - Step 48425: {'lr': 0.00038812385560278815, 'samples': 9297600, 'steps': 48424, 'loss/train': 1.5925509929656982} -08/30/2021 21:59:43 - INFO - __main__ - Step 48426: {'lr': 0.0003881194323157119, 'samples': 9297792, 'steps': 48425, 'loss/train': 1.344125747680664} -08/30/2021 21:59:43 - INFO - __main__ - Step 48427: {'lr': 0.00038811500896640116, 'samples': 9297984, 'steps': 48426, 'loss/train': 1.7305984497070312} -08/30/2021 21:59:43 - INFO - __main__ - Step 48428: {'lr': 0.0003881105855548579, 'samples': 9298176, 'steps': 48427, 'loss/train': 1.3240357637405396} -08/30/2021 21:59:45 - INFO - __main__ - Step 48429: {'lr': 0.00038810616208108416, 'samples': 9298368, 'steps': 48428, 'loss/train': 0.5368484258651733} -08/30/2021 21:59:45 - INFO - __main__ - Step 48430: {'lr': 0.00038810173854508204, 'samples': 9298560, 'steps': 48429, 'loss/train': 1.1445903778076172} -08/30/2021 21:59:46 - INFO - __main__ - Step 48431: {'lr': 0.0003880973149468533, 'samples': 9298752, 'steps': 48430, 'loss/train': 1.6752376556396484} -08/30/2021 21:59:46 - INFO - __main__ - Step 48432: {'lr': 0.00038809289128640003, 'samples': 9298944, 'steps': 48431, 'loss/train': 1.3629772663116455} -08/30/2021 21:59:46 - INFO - __main__ - Step 48433: {'lr': 0.00038808846756372426, 'samples': 9299136, 'steps': 48432, 'loss/train': 0.5924604535102844} -08/30/2021 21:59:48 - INFO - __main__ - Step 48434: {'lr': 0.0003880840437788279, 'samples': 9299328, 'steps': 48433, 'loss/train': 0.0446803979575634} -08/30/2021 21:59:48 - INFO - __main__ - Step 48435: {'lr': 0.00038807961993171306, 'samples': 9299520, 'steps': 48434, 'loss/train': 1.0644896030426025} -08/30/2021 21:59:49 - INFO - __main__ - Step 48436: {'lr': 0.00038807519602238174, 'samples': 9299712, 'steps': 48435, 'loss/train': 1.1155132055282593} -08/30/2021 21:59:49 - INFO - __main__ - Step 48437: {'lr': 0.00038807077205083577, 'samples': 9299904, 'steps': 48436, 'loss/train': 1.0517810583114624} -08/30/2021 21:59:49 - INFO - __main__ - Step 48438: {'lr': 0.0003880663480170772, 'samples': 9300096, 'steps': 48437, 'loss/train': 0.8353077173233032} -08/30/2021 21:59:51 - INFO - __main__ - Step 48439: {'lr': 0.00038806192392110817, 'samples': 9300288, 'steps': 48438, 'loss/train': 1.4676532745361328} -08/30/2021 21:59:51 - INFO - __main__ - Step 48440: {'lr': 0.0003880574997629305, 'samples': 9300480, 'steps': 48439, 'loss/train': 2.0629382133483887} -08/30/2021 21:59:52 - INFO - __main__ - Step 48441: {'lr': 0.0003880530755425462, 'samples': 9300672, 'steps': 48440, 'loss/train': 1.1311228275299072} -08/30/2021 21:59:52 - INFO - __main__ - Step 48442: {'lr': 0.0003880486512599574, 'samples': 9300864, 'steps': 48441, 'loss/train': 1.1981433629989624} -08/30/2021 21:59:52 - INFO - __main__ - Step 48443: {'lr': 0.00038804422691516606, 'samples': 9301056, 'steps': 48442, 'loss/train': 0.9683637619018555} -08/30/2021 21:59:54 - INFO - __main__ - Step 48444: {'lr': 0.0003880398025081741, 'samples': 9301248, 'steps': 48443, 'loss/train': 1.5106436014175415} -08/30/2021 21:59:54 - INFO - __main__ - Step 48445: {'lr': 0.0003880353780389834, 'samples': 9301440, 'steps': 48444, 'loss/train': 1.2463641166687012} -08/30/2021 21:59:55 - INFO - __main__ - Step 48446: {'lr': 0.0003880309535075962, 'samples': 9301632, 'steps': 48445, 'loss/train': 1.7059900760650635} -08/30/2021 21:59:55 - INFO - __main__ - Step 48447: {'lr': 0.00038802652891401434, 'samples': 9301824, 'steps': 48446, 'loss/train': 0.9859436750411987} -08/30/2021 21:59:55 - INFO - __main__ - Step 48448: {'lr': 0.0003880221042582399, 'samples': 9302016, 'steps': 48447, 'loss/train': 1.3285859823226929} -08/30/2021 21:59:56 - INFO - __main__ - Step 48449: {'lr': 0.0003880176795402748, 'samples': 9302208, 'steps': 48448, 'loss/train': 0.9440991878509521} -08/30/2021 21:59:57 - INFO - __main__ - Step 48450: {'lr': 0.00038801325476012113, 'samples': 9302400, 'steps': 48449, 'loss/train': 1.6010005474090576} -08/30/2021 21:59:58 - INFO - __main__ - Step 48451: {'lr': 0.00038800882991778073, 'samples': 9302592, 'steps': 48450, 'loss/train': 1.1128400564193726} -08/30/2021 21:59:58 - INFO - __main__ - Step 48452: {'lr': 0.00038800440501325574, 'samples': 9302784, 'steps': 48451, 'loss/train': 1.4798130989074707} -08/30/2021 21:59:58 - INFO - __main__ - Step 48453: {'lr': 0.000387999980046548, 'samples': 9302976, 'steps': 48452, 'loss/train': 1.504532814025879} -08/30/2021 21:59:59 - INFO - __main__ - Step 48454: {'lr': 0.0003879955550176597, 'samples': 9303168, 'steps': 48453, 'loss/train': 1.6498000621795654} -08/30/2021 22:00:00 - INFO - __main__ - Step 48455: {'lr': 0.00038799112992659267, 'samples': 9303360, 'steps': 48454, 'loss/train': 1.0734919309616089} -08/30/2021 22:00:01 - INFO - __main__ - Step 48456: {'lr': 0.00038798670477334894, 'samples': 9303552, 'steps': 48455, 'loss/train': 1.2962626218795776} -08/30/2021 22:00:01 - INFO - __main__ - Step 48457: {'lr': 0.00038798227955793066, 'samples': 9303744, 'steps': 48456, 'loss/train': 1.6801810264587402} -08/30/2021 22:00:01 - INFO - __main__ - Step 48458: {'lr': 0.0003879778542803396, 'samples': 9303936, 'steps': 48457, 'loss/train': 1.099550724029541} -08/30/2021 22:00:02 - INFO - __main__ - Step 48459: {'lr': 0.00038797342894057783, 'samples': 9304128, 'steps': 48458, 'loss/train': 1.2253131866455078} -08/30/2021 22:00:03 - INFO - __main__ - Step 48460: {'lr': 0.0003879690035386474, 'samples': 9304320, 'steps': 48459, 'loss/train': 2.109959363937378} -08/30/2021 22:00:04 - INFO - __main__ - Step 48461: {'lr': 0.0003879645780745503, 'samples': 9304512, 'steps': 48460, 'loss/train': 0.7420564293861389} -08/30/2021 22:00:04 - INFO - __main__ - Step 48462: {'lr': 0.0003879601525482884, 'samples': 9304704, 'steps': 48461, 'loss/train': 1.545756220817566} -08/30/2021 22:00:05 - INFO - __main__ - Step 48463: {'lr': 0.00038795572695986394, 'samples': 9304896, 'steps': 48462, 'loss/train': 0.545409619808197} -08/30/2021 22:00:05 - INFO - __main__ - Step 48464: {'lr': 0.00038795130130927857, 'samples': 9305088, 'steps': 48463, 'loss/train': 2.039393663406372} -08/30/2021 22:00:07 - INFO - __main__ - Step 48465: {'lr': 0.0003879468755965346, 'samples': 9305280, 'steps': 48464, 'loss/train': 0.049927160143852234} -08/30/2021 22:00:07 - INFO - __main__ - Step 48466: {'lr': 0.00038794244982163383, 'samples': 9305472, 'steps': 48465, 'loss/train': 1.8855663537979126} -08/30/2021 22:00:07 - INFO - __main__ - Step 48467: {'lr': 0.0003879380239845783, 'samples': 9305664, 'steps': 48466, 'loss/train': 1.4282443523406982} -08/30/2021 22:00:08 - INFO - __main__ - Step 48468: {'lr': 0.0003879335980853701, 'samples': 9305856, 'steps': 48467, 'loss/train': 1.460593581199646} -08/30/2021 22:00:08 - INFO - __main__ - Step 48469: {'lr': 0.00038792917212401114, 'samples': 9306048, 'steps': 48468, 'loss/train': 1.587393879890442} -08/30/2021 22:00:09 - INFO - __main__ - Step 48470: {'lr': 0.0003879247461005034, 'samples': 9306240, 'steps': 48469, 'loss/train': 1.1955863237380981} -08/30/2021 22:00:10 - INFO - __main__ - Step 48471: {'lr': 0.0003879203200148489, 'samples': 9306432, 'steps': 48470, 'loss/train': 0.9549295902252197} -08/30/2021 22:00:10 - INFO - __main__ - Step 48472: {'lr': 0.0003879158938670496, 'samples': 9306624, 'steps': 48471, 'loss/train': 1.173951506614685} -08/30/2021 22:00:11 - INFO - __main__ - Step 48473: {'lr': 0.0003879114676571076, 'samples': 9306816, 'steps': 48472, 'loss/train': 1.5563071966171265} -08/30/2021 22:00:11 - INFO - __main__ - Step 48474: {'lr': 0.00038790704138502475, 'samples': 9307008, 'steps': 48473, 'loss/train': 1.4330594539642334} -08/30/2021 22:00:12 - INFO - __main__ - Step 48475: {'lr': 0.0003879026150508032, 'samples': 9307200, 'steps': 48474, 'loss/train': 0.9032770395278931} -08/30/2021 22:00:13 - INFO - __main__ - Step 48476: {'lr': 0.00038789818865444473, 'samples': 9307392, 'steps': 48475, 'loss/train': 1.3034579753875732} -08/30/2021 22:00:13 - INFO - __main__ - Step 48477: {'lr': 0.0003878937621959516, 'samples': 9307584, 'steps': 48476, 'loss/train': 1.8261030912399292} -08/30/2021 22:00:14 - INFO - __main__ - Step 48478: {'lr': 0.0003878893356753256, 'samples': 9307776, 'steps': 48477, 'loss/train': 0.9689961075782776} -08/30/2021 22:00:14 - INFO - __main__ - Step 48479: {'lr': 0.0003878849090925688, 'samples': 9307968, 'steps': 48478, 'loss/train': 1.4118194580078125} -08/30/2021 22:00:15 - INFO - __main__ - Step 48480: {'lr': 0.00038788048244768316, 'samples': 9308160, 'steps': 48479, 'loss/train': 1.6663236618041992} -08/30/2021 22:00:16 - INFO - __main__ - Step 48481: {'lr': 0.00038787605574067076, 'samples': 9308352, 'steps': 48480, 'loss/train': 1.6399551630020142} -08/30/2021 22:00:16 - INFO - __main__ - Step 48482: {'lr': 0.0003878716289715335, 'samples': 9308544, 'steps': 48481, 'loss/train': 0.5260775089263916} -08/30/2021 22:00:17 - INFO - __main__ - Step 48483: {'lr': 0.0003878672021402734, 'samples': 9308736, 'steps': 48482, 'loss/train': 4.811079978942871} -08/30/2021 22:00:17 - INFO - __main__ - Step 48484: {'lr': 0.00038786277524689245, 'samples': 9308928, 'steps': 48483, 'loss/train': 1.3441731929779053} -08/30/2021 22:00:18 - INFO - __main__ - Step 48485: {'lr': 0.0003878583482913927, 'samples': 9309120, 'steps': 48484, 'loss/train': 1.588223934173584} -08/30/2021 22:00:19 - INFO - __main__ - Step 48486: {'lr': 0.00038785392127377603, 'samples': 9309312, 'steps': 48485, 'loss/train': 1.7102043628692627} -08/30/2021 22:00:19 - INFO - __main__ - Step 48487: {'lr': 0.0003878494941940447, 'samples': 9309504, 'steps': 48486, 'loss/train': 1.1020991802215576} -08/30/2021 22:00:19 - INFO - __main__ - Step 48488: {'lr': 0.0003878450670522004, 'samples': 9309696, 'steps': 48487, 'loss/train': 1.5877913236618042} -08/30/2021 22:00:20 - INFO - __main__ - Step 48489: {'lr': 0.00038784063984824516, 'samples': 9309888, 'steps': 48488, 'loss/train': 1.4161159992218018} -08/30/2021 22:00:22 - INFO - __main__ - Step 48490: {'lr': 0.00038783621258218115, 'samples': 9310080, 'steps': 48489, 'loss/train': 0.1848432719707489} -08/30/2021 22:00:22 - INFO - __main__ - Step 48491: {'lr': 0.00038783178525401025, 'samples': 9310272, 'steps': 48490, 'loss/train': 0.2881789803504944} -08/30/2021 22:00:23 - INFO - __main__ - Step 48492: {'lr': 0.00038782735786373445, 'samples': 9310464, 'steps': 48491, 'loss/train': 1.5090851783752441} -08/30/2021 22:00:23 - INFO - __main__ - Step 48493: {'lr': 0.00038782293041135583, 'samples': 9310656, 'steps': 48492, 'loss/train': 1.3842346668243408} -08/30/2021 22:00:23 - INFO - __main__ - Step 48494: {'lr': 0.0003878185028968763, 'samples': 9310848, 'steps': 48493, 'loss/train': 1.8749058246612549} -08/30/2021 22:00:24 - INFO - __main__ - Step 48495: {'lr': 0.00038781407532029785, 'samples': 9311040, 'steps': 48494, 'loss/train': 1.3964929580688477} -08/30/2021 22:00:25 - INFO - __main__ - Step 48496: {'lr': 0.0003878096476816225, 'samples': 9311232, 'steps': 48495, 'loss/train': 1.5425902605056763} -08/30/2021 22:00:26 - INFO - __main__ - Step 48497: {'lr': 0.0003878052199808523, 'samples': 9311424, 'steps': 48496, 'loss/train': 2.0943737030029297} -08/30/2021 22:00:26 - INFO - __main__ - Step 48498: {'lr': 0.0003878007922179891, 'samples': 9311616, 'steps': 48497, 'loss/train': 0.5705732107162476} -08/30/2021 22:00:26 - INFO - __main__ - Step 48499: {'lr': 0.0003877963643930351, 'samples': 9311808, 'steps': 48498, 'loss/train': 1.2632553577423096} -08/30/2021 22:00:27 - INFO - __main__ - Step 48500: {'lr': 0.00038779193650599213, 'samples': 9312000, 'steps': 48499, 'loss/train': 0.9077624678611755} -08/30/2021 22:00:28 - INFO - __main__ - Step 48501: {'lr': 0.0003877875085568622, 'samples': 9312192, 'steps': 48500, 'loss/train': 1.6068578958511353} -08/30/2021 22:00:29 - INFO - __main__ - Step 48502: {'lr': 0.0003877830805456474, 'samples': 9312384, 'steps': 48501, 'loss/train': 1.3240727186203003} -08/30/2021 22:00:29 - INFO - __main__ - Step 48503: {'lr': 0.00038777865247234967, 'samples': 9312576, 'steps': 48502, 'loss/train': 1.2507191896438599} -08/30/2021 22:00:29 - INFO - __main__ - Step 48504: {'lr': 0.00038777422433697106, 'samples': 9312768, 'steps': 48503, 'loss/train': 1.4361670017242432} -08/30/2021 22:00:30 - INFO - __main__ - Step 48505: {'lr': 0.00038776979613951347, 'samples': 9312960, 'steps': 48504, 'loss/train': 1.8598394393920898} -08/30/2021 22:00:32 - INFO - __main__ - Step 48506: {'lr': 0.00038776536787997885, 'samples': 9313152, 'steps': 48505, 'loss/train': 0.8972229957580566} -08/30/2021 22:00:32 - INFO - __main__ - Step 48507: {'lr': 0.0003877609395583693, 'samples': 9313344, 'steps': 48506, 'loss/train': 1.6361212730407715} -08/30/2021 22:00:32 - INFO - __main__ - Step 48508: {'lr': 0.0003877565111746869, 'samples': 9313536, 'steps': 48507, 'loss/train': 1.3830232620239258} -08/30/2021 22:00:33 - INFO - __main__ - Step 48509: {'lr': 0.00038775208272893346, 'samples': 9313728, 'steps': 48508, 'loss/train': 1.616654396057129} -08/30/2021 22:00:33 - INFO - __main__ - Step 48510: {'lr': 0.0003877476542211111, 'samples': 9313920, 'steps': 48509, 'loss/train': 0.15169793367385864} -08/30/2021 22:00:35 - INFO - __main__ - Step 48511: {'lr': 0.0003877432256512218, 'samples': 9314112, 'steps': 48510, 'loss/train': 0.7469132542610168} -08/30/2021 22:00:35 - INFO - __main__ - Step 48512: {'lr': 0.00038773879701926747, 'samples': 9314304, 'steps': 48511, 'loss/train': 1.6190145015716553} -08/30/2021 22:00:35 - INFO - __main__ - Step 48513: {'lr': 0.0003877343683252501, 'samples': 9314496, 'steps': 48512, 'loss/train': 1.1561778783798218} -08/30/2021 22:00:36 - INFO - __main__ - Step 48514: {'lr': 0.00038772993956917183, 'samples': 9314688, 'steps': 48513, 'loss/train': 0.7685527801513672} -08/30/2021 22:00:36 - INFO - __main__ - Step 48515: {'lr': 0.00038772551075103457, 'samples': 9314880, 'steps': 48514, 'loss/train': 1.1655855178833008} -08/30/2021 22:00:36 - INFO - __main__ - Step 48516: {'lr': 0.00038772108187084034, 'samples': 9315072, 'steps': 48515, 'loss/train': 1.05631685256958} -08/30/2021 22:00:39 - INFO - __main__ - Step 48517: {'lr': 0.00038771665292859116, 'samples': 9315264, 'steps': 48516, 'loss/train': 1.5202178955078125} -08/30/2021 22:00:39 - INFO - __main__ - Step 48518: {'lr': 0.00038771222392428885, 'samples': 9315456, 'steps': 48517, 'loss/train': 0.0706179291009903} -08/30/2021 22:00:40 - INFO - __main__ - Step 48519: {'lr': 0.0003877077948579356, 'samples': 9315648, 'steps': 48518, 'loss/train': 0.4329894781112671} -08/30/2021 22:00:40 - INFO - __main__ - Step 48520: {'lr': 0.00038770336572953334, 'samples': 9315840, 'steps': 48519, 'loss/train': 1.4072073698043823} -08/30/2021 22:00:40 - INFO - __main__ - Step 48521: {'lr': 0.00038769893653908404, 'samples': 9316032, 'steps': 48520, 'loss/train': 1.2309231758117676} -08/30/2021 22:00:41 - INFO - __main__ - Step 48522: {'lr': 0.0003876945072865898, 'samples': 9316224, 'steps': 48521, 'loss/train': 1.207040786743164} -08/30/2021 22:00:41 - INFO - __main__ - Step 48523: {'lr': 0.0003876900779720525, 'samples': 9316416, 'steps': 48522, 'loss/train': 2.160245180130005} -08/30/2021 22:00:42 - INFO - __main__ - Step 48524: {'lr': 0.0003876856485954742, 'samples': 9316608, 'steps': 48523, 'loss/train': 2.266228199005127} -08/30/2021 22:00:43 - INFO - __main__ - Step 48525: {'lr': 0.00038768121915685685, 'samples': 9316800, 'steps': 48524, 'loss/train': 1.5202691555023193} -08/30/2021 22:00:43 - INFO - __main__ - Step 48526: {'lr': 0.00038767678965620245, 'samples': 9316992, 'steps': 48525, 'loss/train': 1.0634765625} -08/30/2021 22:00:44 - INFO - __main__ - Step 48527: {'lr': 0.00038767236009351304, 'samples': 9317184, 'steps': 48526, 'loss/train': 2.2997090816497803} -08/30/2021 22:00:44 - INFO - __main__ - Step 48528: {'lr': 0.00038766793046879057, 'samples': 9317376, 'steps': 48527, 'loss/train': 1.6402528285980225} -08/30/2021 22:00:46 - INFO - __main__ - Step 48529: {'lr': 0.000387663500782037, 'samples': 9317568, 'steps': 48528, 'loss/train': 1.3543519973754883} -08/30/2021 22:00:46 - INFO - __main__ - Step 48530: {'lr': 0.00038765907103325447, 'samples': 9317760, 'steps': 48529, 'loss/train': 1.1279032230377197} -08/30/2021 22:00:46 - INFO - __main__ - Step 48531: {'lr': 0.00038765464122244485, 'samples': 9317952, 'steps': 48530, 'loss/train': 1.2232149839401245} -08/30/2021 22:00:47 - INFO - __main__ - Step 48532: {'lr': 0.0003876502113496102, 'samples': 9318144, 'steps': 48531, 'loss/train': 1.2406408786773682} -08/30/2021 22:00:47 - INFO - __main__ - Step 48533: {'lr': 0.00038764578141475245, 'samples': 9318336, 'steps': 48532, 'loss/train': 1.344740390777588} -08/30/2021 22:00:49 - INFO - __main__ - Step 48534: {'lr': 0.0003876413514178736, 'samples': 9318528, 'steps': 48533, 'loss/train': 1.5499004125595093} -08/30/2021 22:00:49 - INFO - __main__ - Step 48535: {'lr': 0.0003876369213589758, 'samples': 9318720, 'steps': 48534, 'loss/train': 0.9566710591316223} -08/30/2021 22:00:49 - INFO - __main__ - Step 48536: {'lr': 0.0003876324912380608, 'samples': 9318912, 'steps': 48535, 'loss/train': 0.08877792209386826} -08/30/2021 22:00:50 - INFO - __main__ - Step 48537: {'lr': 0.00038762806105513084, 'samples': 9319104, 'steps': 48536, 'loss/train': 1.6251089572906494} -08/30/2021 22:00:50 - INFO - __main__ - Step 48538: {'lr': 0.0003876236308101877, 'samples': 9319296, 'steps': 48537, 'loss/train': 1.4864169359207153} -08/30/2021 22:00:53 - INFO - __main__ - Step 48539: {'lr': 0.0003876192005032335, 'samples': 9319488, 'steps': 48538, 'loss/train': 3.7254464626312256} -08/30/2021 22:00:53 - INFO - __main__ - Step 48540: {'lr': 0.00038761477013427026, 'samples': 9319680, 'steps': 48539, 'loss/train': 1.8291910886764526} -08/30/2021 22:00:54 - INFO - __main__ - Step 48541: {'lr': 0.00038761033970329987, 'samples': 9319872, 'steps': 48540, 'loss/train': 1.4286510944366455} -08/30/2021 22:00:54 - INFO - __main__ - Step 48542: {'lr': 0.00038760590921032445, 'samples': 9320064, 'steps': 48541, 'loss/train': 1.8013432025909424} -08/30/2021 22:00:54 - INFO - __main__ - Step 48543: {'lr': 0.0003876014786553459, 'samples': 9320256, 'steps': 48542, 'loss/train': 1.7205475568771362} -08/30/2021 22:00:55 - INFO - __main__ - Step 48544: {'lr': 0.00038759704803836625, 'samples': 9320448, 'steps': 48543, 'loss/train': 1.7732487916946411} -08/30/2021 22:00:55 - INFO - __main__ - Step 48545: {'lr': 0.00038759261735938743, 'samples': 9320640, 'steps': 48544, 'loss/train': 1.4101994037628174} -08/30/2021 22:00:55 - INFO - __main__ - Step 48546: {'lr': 0.00038758818661841155, 'samples': 9320832, 'steps': 48545, 'loss/train': 1.1383955478668213} -08/30/2021 22:00:56 - INFO - __main__ - Step 48547: {'lr': 0.0003875837558154406, 'samples': 9321024, 'steps': 48546, 'loss/train': 1.2493377923965454} -08/30/2021 22:00:58 - INFO - __main__ - Step 48548: {'lr': 0.0003875793249504765, 'samples': 9321216, 'steps': 48547, 'loss/train': 2.0622549057006836} -08/30/2021 22:00:58 - INFO - __main__ - Step 48549: {'lr': 0.00038757489402352124, 'samples': 9321408, 'steps': 48548, 'loss/train': 1.9969414472579956} -08/30/2021 22:00:59 - INFO - __main__ - Step 48550: {'lr': 0.0003875704630345769, 'samples': 9321600, 'steps': 48549, 'loss/train': 1.2790120840072632} -08/30/2021 22:00:59 - INFO - __main__ - Step 48551: {'lr': 0.00038756603198364544, 'samples': 9321792, 'steps': 48550, 'loss/train': 1.49632728099823} -08/30/2021 22:00:59 - INFO - __main__ - Step 48552: {'lr': 0.0003875616008707288, 'samples': 9321984, 'steps': 48551, 'loss/train': 1.6404567956924438} -08/30/2021 22:01:01 - INFO - __main__ - Step 48553: {'lr': 0.00038755716969582913, 'samples': 9322176, 'steps': 48552, 'loss/train': 0.1912604123353958} -08/30/2021 22:01:02 - INFO - __main__ - Step 48554: {'lr': 0.0003875527384589482, 'samples': 9322368, 'steps': 48553, 'loss/train': 0.8276629447937012} -08/30/2021 22:01:02 - INFO - __main__ - Step 48555: {'lr': 0.00038754830716008815, 'samples': 9322560, 'steps': 48554, 'loss/train': 0.9975128769874573} -08/30/2021 22:01:02 - INFO - __main__ - Step 48556: {'lr': 0.000387543875799251, 'samples': 9322752, 'steps': 48555, 'loss/train': 1.35439932346344} -08/30/2021 22:01:03 - INFO - __main__ - Step 48557: {'lr': 0.0003875394443764387, 'samples': 9322944, 'steps': 48556, 'loss/train': 1.3460139036178589} -08/30/2021 22:01:04 - INFO - __main__ - Step 48558: {'lr': 0.00038753501289165324, 'samples': 9323136, 'steps': 48557, 'loss/train': 1.215519666671753} -08/30/2021 22:01:05 - INFO - __main__ - Step 48559: {'lr': 0.0003875305813448966, 'samples': 9323328, 'steps': 48558, 'loss/train': 0.38438525795936584} -08/30/2021 22:01:05 - INFO - __main__ - Step 48560: {'lr': 0.00038752614973617085, 'samples': 9323520, 'steps': 48559, 'loss/train': 1.8800326585769653} -08/30/2021 22:01:05 - INFO - __main__ - Step 48561: {'lr': 0.0003875217180654779, 'samples': 9323712, 'steps': 48560, 'loss/train': 1.5727200508117676} -08/30/2021 22:01:06 - INFO - __main__ - Step 48562: {'lr': 0.00038751728633281974, 'samples': 9323904, 'steps': 48561, 'loss/train': 1.336424469947815} -08/30/2021 22:01:07 - INFO - __main__ - Step 48563: {'lr': 0.00038751285453819846, 'samples': 9324096, 'steps': 48562, 'loss/train': 1.8624446392059326} -08/30/2021 22:01:07 - INFO - __main__ - Step 48564: {'lr': 0.000387508422681616, 'samples': 9324288, 'steps': 48563, 'loss/train': 1.509786605834961} -08/30/2021 22:01:08 - INFO - __main__ - Step 48565: {'lr': 0.0003875039907630744, 'samples': 9324480, 'steps': 48564, 'loss/train': 1.1738789081573486} -08/30/2021 22:01:08 - INFO - __main__ - Step 48566: {'lr': 0.0003874995587825756, 'samples': 9324672, 'steps': 48565, 'loss/train': 1.6788603067398071} -08/30/2021 22:01:08 - INFO - __main__ - Step 48567: {'lr': 0.00038749512674012167, 'samples': 9324864, 'steps': 48566, 'loss/train': 2.1085872650146484} -08/30/2021 22:01:10 - INFO - __main__ - Step 48568: {'lr': 0.0003874906946357145, 'samples': 9325056, 'steps': 48567, 'loss/train': 1.2281612157821655} -08/30/2021 22:01:10 - INFO - __main__ - Step 48569: {'lr': 0.00038748626246935613, 'samples': 9325248, 'steps': 48568, 'loss/train': 1.6194109916687012} -08/30/2021 22:01:11 - INFO - __main__ - Step 48570: {'lr': 0.0003874818302410486, 'samples': 9325440, 'steps': 48569, 'loss/train': 1.574687123298645} -08/30/2021 22:01:11 - INFO - __main__ - Step 48571: {'lr': 0.00038747739795079396, 'samples': 9325632, 'steps': 48570, 'loss/train': 1.2672604322433472} -08/30/2021 22:01:11 - INFO - __main__ - Step 48572: {'lr': 0.000387472965598594, 'samples': 9325824, 'steps': 48571, 'loss/train': 1.5044519901275635} -08/30/2021 22:01:12 - INFO - __main__ - Step 48573: {'lr': 0.0003874685331844509, 'samples': 9326016, 'steps': 48572, 'loss/train': 1.6884443759918213} -08/30/2021 22:01:13 - INFO - __main__ - Step 48574: {'lr': 0.0003874641007083666, 'samples': 9326208, 'steps': 48573, 'loss/train': 1.3984692096710205} -08/30/2021 22:01:14 - INFO - __main__ - Step 48575: {'lr': 0.00038745966817034305, 'samples': 9326400, 'steps': 48574, 'loss/train': 0.9498159885406494} -08/30/2021 22:01:14 - INFO - __main__ - Step 48576: {'lr': 0.0003874552355703823, 'samples': 9326592, 'steps': 48575, 'loss/train': 1.2195899486541748} -08/30/2021 22:01:14 - INFO - __main__ - Step 48577: {'lr': 0.00038745080290848635, 'samples': 9326784, 'steps': 48576, 'loss/train': 1.8267135620117188} -08/30/2021 22:01:15 - INFO - __main__ - Step 48578: {'lr': 0.0003874463701846573, 'samples': 9326976, 'steps': 48577, 'loss/train': 1.5567800998687744} -08/30/2021 22:01:17 - INFO - __main__ - Step 48579: {'lr': 0.0003874419373988969, 'samples': 9327168, 'steps': 48578, 'loss/train': 1.8793991804122925} -08/30/2021 22:01:17 - INFO - __main__ - Step 48580: {'lr': 0.0003874375045512073, 'samples': 9327360, 'steps': 48579, 'loss/train': 0.9314099550247192} -08/30/2021 22:01:18 - INFO - __main__ - Step 48581: {'lr': 0.0003874330716415905, 'samples': 9327552, 'steps': 48580, 'loss/train': 1.1739728450775146} -08/30/2021 22:01:18 - INFO - __main__ - Step 48582: {'lr': 0.00038742863867004853, 'samples': 9327744, 'steps': 48581, 'loss/train': 1.144687533378601} -08/30/2021 22:01:18 - INFO - __main__ - Step 48583: {'lr': 0.0003874242056365833, 'samples': 9327936, 'steps': 48582, 'loss/train': 2.282952070236206} -08/30/2021 22:01:19 - INFO - __main__ - Step 48584: {'lr': 0.0003874197725411969, 'samples': 9328128, 'steps': 48583, 'loss/train': 0.7288729548454285} -08/30/2021 22:01:20 - INFO - __main__ - Step 48585: {'lr': 0.00038741533938389117, 'samples': 9328320, 'steps': 48584, 'loss/train': 0.5451220870018005} -08/30/2021 22:01:21 - INFO - __main__ - Step 48586: {'lr': 0.00038741090616466824, 'samples': 9328512, 'steps': 48585, 'loss/train': 1.2091689109802246} -08/30/2021 22:01:21 - INFO - __main__ - Step 48587: {'lr': 0.0003874064728835301, 'samples': 9328704, 'steps': 48586, 'loss/train': 1.4198529720306396} -08/30/2021 22:01:21 - INFO - __main__ - Step 48588: {'lr': 0.0003874020395404787, 'samples': 9328896, 'steps': 48587, 'loss/train': 1.4191687107086182} -08/30/2021 22:01:22 - INFO - __main__ - Step 48589: {'lr': 0.00038739760613551606, 'samples': 9329088, 'steps': 48588, 'loss/train': 1.0444717407226562} -08/30/2021 22:01:23 - INFO - __main__ - Step 48590: {'lr': 0.0003873931726686442, 'samples': 9329280, 'steps': 48589, 'loss/train': 1.896647334098816} -08/30/2021 22:01:24 - INFO - __main__ - Step 48591: {'lr': 0.0003873887391398651, 'samples': 9329472, 'steps': 48590, 'loss/train': 1.8076246976852417} -08/30/2021 22:01:24 - INFO - __main__ - Step 48592: {'lr': 0.0003873843055491807, 'samples': 9329664, 'steps': 48591, 'loss/train': 1.717578411102295} -08/30/2021 22:01:24 - INFO - __main__ - Step 48593: {'lr': 0.00038737987189659315, 'samples': 9329856, 'steps': 48592, 'loss/train': 1.5724797248840332} -08/30/2021 22:01:25 - INFO - __main__ - Step 48594: {'lr': 0.00038737543818210423, 'samples': 9330048, 'steps': 48593, 'loss/train': 0.06825880706310272} -08/30/2021 22:01:26 - INFO - __main__ - Step 48595: {'lr': 0.00038737100440571615, 'samples': 9330240, 'steps': 48594, 'loss/train': 1.4919979572296143} -08/30/2021 22:01:27 - INFO - __main__ - Step 48596: {'lr': 0.00038736657056743075, 'samples': 9330432, 'steps': 48595, 'loss/train': 0.07968267053365707} -08/30/2021 22:01:27 - INFO - __main__ - Step 48597: {'lr': 0.0003873621366672502, 'samples': 9330624, 'steps': 48596, 'loss/train': 0.06861887127161026} -08/30/2021 22:01:28 - INFO - __main__ - Step 48598: {'lr': 0.0003873577027051763, 'samples': 9330816, 'steps': 48597, 'loss/train': 1.5271934270858765} -08/30/2021 22:01:28 - INFO - __main__ - Step 48599: {'lr': 0.0003873532686812111, 'samples': 9331008, 'steps': 48598, 'loss/train': 0.9882999658584595} -08/30/2021 22:01:30 - INFO - __main__ - Step 48600: {'lr': 0.0003873488345953567, 'samples': 9331200, 'steps': 48599, 'loss/train': 1.1225131750106812} -08/30/2021 22:01:31 - INFO - __main__ - Step 48601: {'lr': 0.00038734440044761503, 'samples': 9331392, 'steps': 48600, 'loss/train': 1.5609920024871826} -08/30/2021 22:01:31 - INFO - __main__ - Step 48602: {'lr': 0.0003873399662379881, 'samples': 9331584, 'steps': 48601, 'loss/train': 0.691584587097168} -08/30/2021 22:01:31 - INFO - __main__ - Step 48603: {'lr': 0.00038733553196647786, 'samples': 9331776, 'steps': 48602, 'loss/train': 1.5188713073730469} -08/30/2021 22:01:32 - INFO - __main__ - Step 48604: {'lr': 0.00038733109763308644, 'samples': 9331968, 'steps': 48603, 'loss/train': 0.040184203535318375} -08/30/2021 22:01:32 - INFO - __main__ - Step 48605: {'lr': 0.0003873266632378157, 'samples': 9332160, 'steps': 48604, 'loss/train': 0.03341313824057579} -08/30/2021 22:01:34 - INFO - __main__ - Step 48606: {'lr': 0.00038732222878066764, 'samples': 9332352, 'steps': 48605, 'loss/train': 0.9039045572280884} -08/30/2021 22:01:35 - INFO - __main__ - Step 48607: {'lr': 0.0003873177942616444, 'samples': 9332544, 'steps': 48606, 'loss/train': 1.539287805557251} -08/30/2021 22:01:35 - INFO - __main__ - Step 48608: {'lr': 0.0003873133596807478, 'samples': 9332736, 'steps': 48607, 'loss/train': 1.449718952178955} -08/30/2021 22:01:35 - INFO - __main__ - Step 48609: {'lr': 0.00038730892503797986, 'samples': 9332928, 'steps': 48608, 'loss/train': 1.5010136365890503} -08/30/2021 22:01:36 - INFO - __main__ - Step 48610: {'lr': 0.00038730449033334277, 'samples': 9333120, 'steps': 48609, 'loss/train': 2.045989513397217} -08/30/2021 22:01:36 - INFO - __main__ - Step 48611: {'lr': 0.00038730005556683833, 'samples': 9333312, 'steps': 48610, 'loss/train': 1.9787211418151855} -08/30/2021 22:01:38 - INFO - __main__ - Step 48612: {'lr': 0.00038729562073846856, 'samples': 9333504, 'steps': 48611, 'loss/train': 1.6157768964767456} -08/30/2021 22:01:39 - INFO - __main__ - Step 48613: {'lr': 0.00038729118584823557, 'samples': 9333696, 'steps': 48612, 'loss/train': 0.7498517036437988} -08/30/2021 22:01:39 - INFO - __main__ - Step 48614: {'lr': 0.0003872867508961413, 'samples': 9333888, 'steps': 48613, 'loss/train': 1.5510752201080322} -08/30/2021 22:01:39 - INFO - __main__ - Step 48615: {'lr': 0.00038728231588218767, 'samples': 9334080, 'steps': 48614, 'loss/train': 1.334282636642456} -08/30/2021 22:01:40 - INFO - __main__ - Step 48616: {'lr': 0.00038727788080637684, 'samples': 9334272, 'steps': 48615, 'loss/train': 5.3211541175842285} -08/30/2021 22:01:40 - INFO - __main__ - Step 48617: {'lr': 0.00038727344566871064, 'samples': 9334464, 'steps': 48616, 'loss/train': 2.221296787261963} -08/30/2021 22:01:42 - INFO - __main__ - Step 48618: {'lr': 0.00038726901046919114, 'samples': 9334656, 'steps': 48617, 'loss/train': 1.4681886434555054} -08/30/2021 22:01:42 - INFO - __main__ - Step 48619: {'lr': 0.00038726457520782046, 'samples': 9334848, 'steps': 48618, 'loss/train': 1.652093768119812} -08/30/2021 22:01:42 - INFO - __main__ - Step 48620: {'lr': 0.00038726013988460027, 'samples': 9335040, 'steps': 48619, 'loss/train': 1.3608489036560059} -08/30/2021 22:01:43 - INFO - __main__ - Step 48621: {'lr': 0.00038725570449953296, 'samples': 9335232, 'steps': 48620, 'loss/train': 0.09964090585708618} -08/30/2021 22:01:43 - INFO - __main__ - Step 48622: {'lr': 0.0003872512690526203, 'samples': 9335424, 'steps': 48621, 'loss/train': 1.790815830230713} -08/30/2021 22:01:45 - INFO - __main__ - Step 48623: {'lr': 0.0003872468335438643, 'samples': 9335616, 'steps': 48622, 'loss/train': 0.8979711532592773} -08/30/2021 22:01:45 - INFO - __main__ - Step 48624: {'lr': 0.000387242397973267, 'samples': 9335808, 'steps': 48623, 'loss/train': 2.186614751815796} -08/30/2021 22:01:46 - INFO - __main__ - Step 48625: {'lr': 0.0003872379623408304, 'samples': 9336000, 'steps': 48624, 'loss/train': 2.225583076477051} -08/30/2021 22:01:46 - INFO - __main__ - Step 48626: {'lr': 0.0003872335266465565, 'samples': 9336192, 'steps': 48625, 'loss/train': 1.8306851387023926} -08/30/2021 22:01:46 - INFO - __main__ - Step 48627: {'lr': 0.00038722909089044735, 'samples': 9336384, 'steps': 48626, 'loss/train': 1.453413486480713} -08/30/2021 22:01:48 - INFO - __main__ - Step 48628: {'lr': 0.0003872246550725048, 'samples': 9336576, 'steps': 48627, 'loss/train': 1.4319450855255127} -08/30/2021 22:01:48 - INFO - __main__ - Step 48629: {'lr': 0.000387220219192731, 'samples': 9336768, 'steps': 48628, 'loss/train': 1.2898825407028198} -08/30/2021 22:01:49 - INFO - __main__ - Step 48630: {'lr': 0.00038721578325112785, 'samples': 9336960, 'steps': 48629, 'loss/train': 1.2649275064468384} -08/30/2021 22:01:49 - INFO - __main__ - Step 48631: {'lr': 0.00038721134724769733, 'samples': 9337152, 'steps': 48630, 'loss/train': 1.6351832151412964} -08/30/2021 22:01:49 - INFO - __main__ - Step 48632: {'lr': 0.00038720691118244164, 'samples': 9337344, 'steps': 48631, 'loss/train': 1.378145694732666} -08/30/2021 22:01:50 - INFO - __main__ - Step 48633: {'lr': 0.00038720247505536257, 'samples': 9337536, 'steps': 48632, 'loss/train': 1.890519142150879} -08/30/2021 22:01:51 - INFO - __main__ - Step 48634: {'lr': 0.0003871980388664621, 'samples': 9337728, 'steps': 48633, 'loss/train': 1.4490344524383545} -08/30/2021 22:01:52 - INFO - __main__ - Step 48635: {'lr': 0.00038719360261574233, 'samples': 9337920, 'steps': 48634, 'loss/train': 2.115863561630249} -08/30/2021 22:01:52 - INFO - __main__ - Step 48636: {'lr': 0.00038718916630320533, 'samples': 9338112, 'steps': 48635, 'loss/train': 1.0540931224822998} -08/30/2021 22:01:52 - INFO - __main__ - Step 48637: {'lr': 0.0003871847299288529, 'samples': 9338304, 'steps': 48636, 'loss/train': 1.5217387676239014} -08/30/2021 22:01:53 - INFO - __main__ - Step 48638: {'lr': 0.00038718029349268723, 'samples': 9338496, 'steps': 48637, 'loss/train': 0.6063851118087769} -08/30/2021 22:01:54 - INFO - __main__ - Step 48639: {'lr': 0.00038717585699471024, 'samples': 9338688, 'steps': 48638, 'loss/train': 1.37833571434021} -08/30/2021 22:01:54 - INFO - __main__ - Step 48640: {'lr': 0.0003871714204349239, 'samples': 9338880, 'steps': 48639, 'loss/train': 1.0108524560928345} -08/30/2021 22:01:55 - INFO - __main__ - Step 48641: {'lr': 0.00038716698381333027, 'samples': 9339072, 'steps': 48640, 'loss/train': 2.2253668308258057} -08/30/2021 22:01:55 - INFO - __main__ - Step 48642: {'lr': 0.0003871625471299313, 'samples': 9339264, 'steps': 48641, 'loss/train': 1.5927236080169678} -08/30/2021 22:01:56 - INFO - __main__ - Step 48643: {'lr': 0.00038715811038472894, 'samples': 9339456, 'steps': 48642, 'loss/train': 1.748753547668457} -08/30/2021 22:01:56 - INFO - __main__ - Step 48644: {'lr': 0.0003871536735777252, 'samples': 9339648, 'steps': 48643, 'loss/train': 1.4262044429779053} -08/30/2021 22:01:58 - INFO - __main__ - Step 48645: {'lr': 0.0003871492367089223, 'samples': 9339840, 'steps': 48644, 'loss/train': 1.225915551185608} -08/30/2021 22:01:58 - INFO - __main__ - Step 48646: {'lr': 0.000387144799778322, 'samples': 9340032, 'steps': 48645, 'loss/train': 1.203242540359497} -08/30/2021 22:01:58 - INFO - __main__ - Step 48647: {'lr': 0.00038714036278592636, 'samples': 9340224, 'steps': 48646, 'loss/train': 1.8290691375732422} -08/30/2021 22:01:59 - INFO - __main__ - Step 48648: {'lr': 0.0003871359257317374, 'samples': 9340416, 'steps': 48647, 'loss/train': 0.9520112872123718} -08/30/2021 22:01:59 - INFO - __main__ - Step 48649: {'lr': 0.0003871314886157571, 'samples': 9340608, 'steps': 48648, 'loss/train': 1.862069845199585} -08/30/2021 22:02:00 - INFO - __main__ - Step 48650: {'lr': 0.0003871270514379874, 'samples': 9340800, 'steps': 48649, 'loss/train': 1.5161504745483398} -08/30/2021 22:02:01 - INFO - __main__ - Step 48651: {'lr': 0.00038712261419843056, 'samples': 9340992, 'steps': 48650, 'loss/train': 0.9336527585983276} -08/30/2021 22:02:01 - INFO - __main__ - Step 48652: {'lr': 0.00038711817689708817, 'samples': 9341184, 'steps': 48651, 'loss/train': 0.7322373390197754} -08/30/2021 22:02:02 - INFO - __main__ - Step 48653: {'lr': 0.00038711373953396257, 'samples': 9341376, 'steps': 48652, 'loss/train': 1.7435458898544312} -08/30/2021 22:02:02 - INFO - __main__ - Step 48654: {'lr': 0.0003871093021090556, 'samples': 9341568, 'steps': 48653, 'loss/train': 2.6974470615386963} -08/30/2021 22:02:03 - INFO - __main__ - Step 48655: {'lr': 0.0003871048646223693, 'samples': 9341760, 'steps': 48654, 'loss/train': 1.5399779081344604} -08/30/2021 22:02:04 - INFO - __main__ - Step 48656: {'lr': 0.00038710042707390557, 'samples': 9341952, 'steps': 48655, 'loss/train': 1.410839319229126} -08/30/2021 22:02:04 - INFO - __main__ - Step 48657: {'lr': 0.00038709598946366666, 'samples': 9342144, 'steps': 48656, 'loss/train': 3.0726022720336914} -08/30/2021 22:02:05 - INFO - __main__ - Step 48658: {'lr': 0.00038709155179165436, 'samples': 9342336, 'steps': 48657, 'loss/train': 0.8205497860908508} -08/30/2021 22:02:05 - INFO - __main__ - Step 48659: {'lr': 0.00038708711405787067, 'samples': 9342528, 'steps': 48658, 'loss/train': 1.7225418090820312} -08/30/2021 22:02:07 - INFO - __main__ - Step 48660: {'lr': 0.0003870826762623177, 'samples': 9342720, 'steps': 48659, 'loss/train': 1.789350152015686} -08/30/2021 22:02:08 - INFO - __main__ - Step 48661: {'lr': 0.00038707823840499736, 'samples': 9342912, 'steps': 48660, 'loss/train': 1.518591284751892} -08/30/2021 22:02:08 - INFO - __main__ - Step 48662: {'lr': 0.0003870738004859117, 'samples': 9343104, 'steps': 48661, 'loss/train': 1.6038150787353516} -08/30/2021 22:02:09 - INFO - __main__ - Step 48663: {'lr': 0.0003870693625050626, 'samples': 9343296, 'steps': 48662, 'loss/train': 1.012636423110962} -08/30/2021 22:02:09 - INFO - __main__ - Step 48664: {'lr': 0.00038706492446245234, 'samples': 9343488, 'steps': 48663, 'loss/train': 0.10666092485189438} -08/30/2021 22:02:11 - INFO - __main__ - Step 48665: {'lr': 0.00038706048635808266, 'samples': 9343680, 'steps': 48664, 'loss/train': 1.1385022401809692} -08/30/2021 22:02:11 - INFO - __main__ - Step 48666: {'lr': 0.0003870560481919556, 'samples': 9343872, 'steps': 48665, 'loss/train': 1.7361559867858887} -08/30/2021 22:02:11 - INFO - __main__ - Step 48667: {'lr': 0.00038705160996407325, 'samples': 9344064, 'steps': 48666, 'loss/train': 1.2121331691741943} -08/30/2021 22:02:12 - INFO - __main__ - Step 48668: {'lr': 0.00038704717167443753, 'samples': 9344256, 'steps': 48667, 'loss/train': 0.8323307633399963} -08/30/2021 22:02:12 - INFO - __main__ - Step 48669: {'lr': 0.0003870427333230505, 'samples': 9344448, 'steps': 48668, 'loss/train': 1.4936115741729736} -08/30/2021 22:02:14 - INFO - __main__ - Step 48670: {'lr': 0.00038703829490991407, 'samples': 9344640, 'steps': 48669, 'loss/train': 1.1054717302322388} -08/30/2021 22:02:15 - INFO - __main__ - Step 48671: {'lr': 0.0003870338564350303, 'samples': 9344832, 'steps': 48670, 'loss/train': 1.3486878871917725} -08/30/2021 22:02:15 - INFO - __main__ - Step 48672: {'lr': 0.0003870294178984013, 'samples': 9345024, 'steps': 48671, 'loss/train': 1.659084677696228} -08/30/2021 22:02:15 - INFO - __main__ - Step 48673: {'lr': 0.0003870249793000289, 'samples': 9345216, 'steps': 48672, 'loss/train': 0.09946160018444061} -08/30/2021 22:02:16 - INFO - __main__ - Step 48674: {'lr': 0.0003870205406399151, 'samples': 9345408, 'steps': 48673, 'loss/train': 1.4737313985824585} -08/30/2021 22:02:16 - INFO - __main__ - Step 48675: {'lr': 0.000387016101918062, 'samples': 9345600, 'steps': 48674, 'loss/train': 1.0012191534042358} -08/30/2021 22:02:17 - INFO - __main__ - Step 48676: {'lr': 0.0003870116631344716, 'samples': 9345792, 'steps': 48675, 'loss/train': 0.1555851697921753} -08/30/2021 22:02:18 - INFO - __main__ - Step 48677: {'lr': 0.0003870072242891458, 'samples': 9345984, 'steps': 48676, 'loss/train': 1.399659276008606} -08/30/2021 22:02:18 - INFO - __main__ - Step 48678: {'lr': 0.0003870027853820867, 'samples': 9346176, 'steps': 48677, 'loss/train': 2.079132556915283} -08/30/2021 22:02:19 - INFO - __main__ - Step 48679: {'lr': 0.0003869983464132962, 'samples': 9346368, 'steps': 48678, 'loss/train': 2.057727813720703} -08/30/2021 22:02:19 - INFO - __main__ - Step 48680: {'lr': 0.0003869939073827764, 'samples': 9346560, 'steps': 48679, 'loss/train': 1.645869493484497} -08/30/2021 22:02:21 - INFO - __main__ - Step 48681: {'lr': 0.00038698946829052926, 'samples': 9346752, 'steps': 48680, 'loss/train': 1.690539002418518} -08/30/2021 22:02:21 - INFO - __main__ - Step 48682: {'lr': 0.00038698502913655673, 'samples': 9346944, 'steps': 48681, 'loss/train': 1.7273426055908203} -08/30/2021 22:02:21 - INFO - __main__ - Step 48683: {'lr': 0.00038698058992086095, 'samples': 9347136, 'steps': 48682, 'loss/train': 1.6277151107788086} -08/30/2021 22:02:22 - INFO - __main__ - Step 48684: {'lr': 0.0003869761506434438, 'samples': 9347328, 'steps': 48683, 'loss/train': 1.2992688417434692} -08/30/2021 22:02:22 - INFO - __main__ - Step 48685: {'lr': 0.0003869717113043073, 'samples': 9347520, 'steps': 48684, 'loss/train': 1.895695447921753} -08/30/2021 22:02:22 - INFO - __main__ - Step 48686: {'lr': 0.00038696727190345347, 'samples': 9347712, 'steps': 48685, 'loss/train': 1.1242011785507202} -08/30/2021 22:02:24 - INFO - __main__ - Step 48687: {'lr': 0.00038696283244088426, 'samples': 9347904, 'steps': 48686, 'loss/train': 1.6465619802474976} -08/30/2021 22:02:24 - INFO - __main__ - Step 48688: {'lr': 0.0003869583929166017, 'samples': 9348096, 'steps': 48687, 'loss/train': 1.2890759706497192} -08/30/2021 22:02:25 - INFO - __main__ - Step 48689: {'lr': 0.0003869539533306079, 'samples': 9348288, 'steps': 48688, 'loss/train': 1.1586542129516602} -08/30/2021 22:02:25 - INFO - __main__ - Step 48690: {'lr': 0.00038694951368290463, 'samples': 9348480, 'steps': 48689, 'loss/train': 1.6542549133300781} -08/30/2021 22:02:25 - INFO - __main__ - Step 48691: {'lr': 0.0003869450739734941, 'samples': 9348672, 'steps': 48690, 'loss/train': 1.0293065309524536} -08/30/2021 22:02:27 - INFO - __main__ - Step 48692: {'lr': 0.00038694063420237823, 'samples': 9348864, 'steps': 48691, 'loss/train': 1.182291030883789} -08/30/2021 22:02:27 - INFO - __main__ - Step 48693: {'lr': 0.00038693619436955907, 'samples': 9349056, 'steps': 48692, 'loss/train': 1.0384904146194458} -08/30/2021 22:02:28 - INFO - __main__ - Step 48694: {'lr': 0.0003869317544750385, 'samples': 9349248, 'steps': 48693, 'loss/train': 1.405635118484497} -08/30/2021 22:02:28 - INFO - __main__ - Step 48695: {'lr': 0.0003869273145188186, 'samples': 9349440, 'steps': 48694, 'loss/train': 1.4013278484344482} -08/30/2021 22:02:28 - INFO - __main__ - Step 48696: {'lr': 0.00038692287450090143, 'samples': 9349632, 'steps': 48695, 'loss/train': 1.0663057565689087} -08/30/2021 22:02:30 - INFO - __main__ - Step 48697: {'lr': 0.0003869184344212888, 'samples': 9349824, 'steps': 48696, 'loss/train': 1.4166395664215088} -08/30/2021 22:02:31 - INFO - __main__ - Step 48698: {'lr': 0.00038691399427998296, 'samples': 9350016, 'steps': 48697, 'loss/train': 1.0973402261734009} -08/30/2021 22:02:31 - INFO - __main__ - Step 48699: {'lr': 0.0003869095540769858, 'samples': 9350208, 'steps': 48698, 'loss/train': 0.11965186893939972} -08/30/2021 22:02:31 - INFO - __main__ - Step 48700: {'lr': 0.0003869051138122992, 'samples': 9350400, 'steps': 48699, 'loss/train': 1.6753551959991455} -08/30/2021 22:02:32 - INFO - __main__ - Step 48701: {'lr': 0.0003869006734859253, 'samples': 9350592, 'steps': 48700, 'loss/train': 1.0675082206726074} -08/30/2021 22:02:33 - INFO - __main__ - Step 48702: {'lr': 0.00038689623309786617, 'samples': 9350784, 'steps': 48701, 'loss/train': 1.283065676689148} -08/30/2021 22:02:34 - INFO - __main__ - Step 48703: {'lr': 0.00038689179264812356, 'samples': 9350976, 'steps': 48702, 'loss/train': 1.254591703414917} -08/30/2021 22:02:34 - INFO - __main__ - Step 48704: {'lr': 0.00038688735213669967, 'samples': 9351168, 'steps': 48703, 'loss/train': 1.1807243824005127} -08/30/2021 22:02:34 - INFO - __main__ - Step 48705: {'lr': 0.00038688291156359654, 'samples': 9351360, 'steps': 48704, 'loss/train': 1.4753825664520264} -08/30/2021 22:02:35 - INFO - __main__ - Step 48706: {'lr': 0.000386878470928816, 'samples': 9351552, 'steps': 48705, 'loss/train': 1.469362497329712} -08/30/2021 22:02:35 - INFO - __main__ - Step 48707: {'lr': 0.0003868740302323601, 'samples': 9351744, 'steps': 48706, 'loss/train': 1.3168137073516846} -08/30/2021 22:02:36 - INFO - __main__ - Step 48708: {'lr': 0.00038686958947423096, 'samples': 9351936, 'steps': 48707, 'loss/train': 1.1679786443710327} -08/30/2021 22:02:37 - INFO - __main__ - Step 48709: {'lr': 0.00038686514865443047, 'samples': 9352128, 'steps': 48708, 'loss/train': 1.2505630254745483} -08/30/2021 22:02:37 - INFO - __main__ - Step 48710: {'lr': 0.00038686070777296057, 'samples': 9352320, 'steps': 48709, 'loss/train': 1.2325536012649536} -08/30/2021 22:02:38 - INFO - __main__ - Step 48711: {'lr': 0.00038685626682982347, 'samples': 9352512, 'steps': 48710, 'loss/train': 1.2659049034118652} -08/30/2021 22:02:38 - INFO - __main__ - Step 48712: {'lr': 0.000386851825825021, 'samples': 9352704, 'steps': 48711, 'loss/train': 1.2162539958953857} -08/30/2021 22:02:40 - INFO - __main__ - Step 48713: {'lr': 0.0003868473847585552, 'samples': 9352896, 'steps': 48712, 'loss/train': 1.3787950277328491} -08/30/2021 22:02:40 - INFO - __main__ - Step 48714: {'lr': 0.00038684294363042806, 'samples': 9353088, 'steps': 48713, 'loss/train': 1.356581687927246} -08/30/2021 22:02:41 - INFO - __main__ - Step 48715: {'lr': 0.00038683850244064164, 'samples': 9353280, 'steps': 48714, 'loss/train': 1.8732585906982422} -08/30/2021 22:02:41 - INFO - __main__ - Step 48716: {'lr': 0.0003868340611891978, 'samples': 9353472, 'steps': 48715, 'loss/train': 1.5974364280700684} -08/30/2021 22:02:41 - INFO - __main__ - Step 48717: {'lr': 0.0003868296198760988, 'samples': 9353664, 'steps': 48716, 'loss/train': 1.2716572284698486} -08/30/2021 22:02:43 - INFO - __main__ - Step 48718: {'lr': 0.00038682517850134634, 'samples': 9353856, 'steps': 48717, 'loss/train': 0.8481349945068359} -08/30/2021 22:02:44 - INFO - __main__ - Step 48719: {'lr': 0.0003868207370649427, 'samples': 9354048, 'steps': 48718, 'loss/train': 1.2210620641708374} -08/30/2021 22:02:44 - INFO - __main__ - Step 48720: {'lr': 0.0003868162955668897, 'samples': 9354240, 'steps': 48719, 'loss/train': 1.0997753143310547} -08/30/2021 22:02:44 - INFO - __main__ - Step 48721: {'lr': 0.0003868118540071894, 'samples': 9354432, 'steps': 48720, 'loss/train': 1.3661706447601318} -08/30/2021 22:02:45 - INFO - __main__ - Step 48722: {'lr': 0.0003868074123858437, 'samples': 9354624, 'steps': 48721, 'loss/train': 0.8031905293464661} -08/30/2021 22:02:46 - INFO - __main__ - Step 48723: {'lr': 0.0003868029707028548, 'samples': 9354816, 'steps': 48722, 'loss/train': 1.1705511808395386} -08/30/2021 22:02:47 - INFO - __main__ - Step 48724: {'lr': 0.00038679852895822454, 'samples': 9355008, 'steps': 48723, 'loss/train': 1.1623700857162476} -08/30/2021 22:02:47 - INFO - __main__ - Step 48725: {'lr': 0.000386794087151955, 'samples': 9355200, 'steps': 48724, 'loss/train': 1.208777904510498} -08/30/2021 22:02:47 - INFO - __main__ - Step 48726: {'lr': 0.00038678964528404816, 'samples': 9355392, 'steps': 48725, 'loss/train': 1.2652634382247925} -08/30/2021 22:02:48 - INFO - __main__ - Step 48727: {'lr': 0.000386785203354506, 'samples': 9355584, 'steps': 48726, 'loss/train': 1.4759992361068726} -08/30/2021 22:02:49 - INFO - __main__ - Step 48728: {'lr': 0.0003867807613633305, 'samples': 9355776, 'steps': 48727, 'loss/train': 0.10973817110061646} -08/30/2021 22:02:50 - INFO - __main__ - Step 48729: {'lr': 0.0003867763193105237, 'samples': 9355968, 'steps': 48728, 'loss/train': 0.14093215763568878} -08/30/2021 22:02:50 - INFO - __main__ - Step 48730: {'lr': 0.00038677187719608763, 'samples': 9356160, 'steps': 48729, 'loss/train': 0.9056994915008545} -08/30/2021 22:02:50 - INFO - __main__ - Step 48731: {'lr': 0.00038676743502002434, 'samples': 9356352, 'steps': 48730, 'loss/train': 1.218212604522705} -08/30/2021 22:02:51 - INFO - __main__ - Step 48732: {'lr': 0.0003867629927823357, 'samples': 9356544, 'steps': 48731, 'loss/train': 1.4684395790100098} -08/30/2021 22:02:52 - INFO - __main__ - Step 48733: {'lr': 0.0003867585504830237, 'samples': 9356736, 'steps': 48732, 'loss/train': 1.312386155128479} -08/30/2021 22:02:53 - INFO - __main__ - Step 48734: {'lr': 0.00038675410812209044, 'samples': 9356928, 'steps': 48733, 'loss/train': 2.101454973220825} -08/30/2021 22:02:53 - INFO - __main__ - Step 48735: {'lr': 0.0003867496656995379, 'samples': 9357120, 'steps': 48734, 'loss/train': 1.7242871522903442} -08/30/2021 22:02:54 - INFO - __main__ - Step 48736: {'lr': 0.0003867452232153681, 'samples': 9357312, 'steps': 48735, 'loss/train': 1.1259361505508423} -08/30/2021 22:02:54 - INFO - __main__ - Step 48737: {'lr': 0.00038674078066958296, 'samples': 9357504, 'steps': 48736, 'loss/train': 1.1440268754959106} -08/30/2021 22:02:54 - INFO - __main__ - Step 48738: {'lr': 0.0003867363380621846, 'samples': 9357696, 'steps': 48737, 'loss/train': 1.0000988245010376} -08/30/2021 22:02:56 - INFO - __main__ - Step 48739: {'lr': 0.0003867318953931749, 'samples': 9357888, 'steps': 48738, 'loss/train': 0.8937061429023743} -08/30/2021 22:02:57 - INFO - __main__ - Step 48740: {'lr': 0.00038672745266255594, 'samples': 9358080, 'steps': 48739, 'loss/train': 0.8546640276908875} -08/30/2021 22:02:57 - INFO - __main__ - Step 48741: {'lr': 0.0003867230098703297, 'samples': 9358272, 'steps': 48740, 'loss/train': 1.2698071002960205} -08/30/2021 22:02:57 - INFO - __main__ - Step 48742: {'lr': 0.00038671856701649813, 'samples': 9358464, 'steps': 48741, 'loss/train': 4.387177467346191} -08/30/2021 22:02:58 - INFO - __main__ - Step 48743: {'lr': 0.0003867141241010633, 'samples': 9358656, 'steps': 48742, 'loss/train': 1.956860065460205} -08/30/2021 22:02:58 - INFO - __main__ - Step 48744: {'lr': 0.00038670968112402724, 'samples': 9358848, 'steps': 48743, 'loss/train': 1.6871875524520874} -08/30/2021 22:02:59 - INFO - __main__ - Step 48745: {'lr': 0.00038670523808539194, 'samples': 9359040, 'steps': 48744, 'loss/train': 1.1926343441009521} -08/30/2021 22:03:00 - INFO - __main__ - Step 48746: {'lr': 0.0003867007949851593, 'samples': 9359232, 'steps': 48745, 'loss/train': 1.7859184741973877} -08/30/2021 22:03:00 - INFO - __main__ - Step 48747: {'lr': 0.0003866963518233314, 'samples': 9359424, 'steps': 48746, 'loss/train': 1.6357057094573975} -08/30/2021 22:03:01 - INFO - __main__ - Step 48748: {'lr': 0.00038669190859991025, 'samples': 9359616, 'steps': 48747, 'loss/train': 1.3583440780639648} -08/30/2021 22:03:01 - INFO - __main__ - Step 48749: {'lr': 0.00038668746531489787, 'samples': 9359808, 'steps': 48748, 'loss/train': 1.5124634504318237} -08/30/2021 22:03:02 - INFO - __main__ - Step 48750: {'lr': 0.0003866830219682962, 'samples': 9360000, 'steps': 48749, 'loss/train': 1.5280160903930664} -08/30/2021 22:03:03 - INFO - __main__ - Step 48751: {'lr': 0.00038667857856010727, 'samples': 9360192, 'steps': 48750, 'loss/train': 1.3867889642715454} -08/30/2021 22:03:03 - INFO - __main__ - Step 48752: {'lr': 0.00038667413509033306, 'samples': 9360384, 'steps': 48751, 'loss/train': 1.306039571762085} -08/30/2021 22:03:04 - INFO - __main__ - Step 48753: {'lr': 0.0003866696915589756, 'samples': 9360576, 'steps': 48752, 'loss/train': 2.0511984825134277} -08/30/2021 22:03:04 - INFO - __main__ - Step 48754: {'lr': 0.0003866652479660369, 'samples': 9360768, 'steps': 48753, 'loss/train': 1.418534517288208} -08/30/2021 22:03:06 - INFO - __main__ - Step 48755: {'lr': 0.00038666080431151896, 'samples': 9360960, 'steps': 48754, 'loss/train': 0.6822006106376648} -08/30/2021 22:03:06 - INFO - __main__ - Step 48756: {'lr': 0.00038665636059542367, 'samples': 9361152, 'steps': 48755, 'loss/train': 1.70613694190979} -08/30/2021 22:03:07 - INFO - __main__ - Step 48757: {'lr': 0.00038665191681775323, 'samples': 9361344, 'steps': 48756, 'loss/train': 1.1581143140792847} -08/30/2021 22:03:07 - INFO - __main__ - Step 48758: {'lr': 0.00038664747297850955, 'samples': 9361536, 'steps': 48757, 'loss/train': 1.32694673538208} -08/30/2021 22:03:07 - INFO - __main__ - Step 48759: {'lr': 0.00038664302907769456, 'samples': 9361728, 'steps': 48758, 'loss/train': 1.8530160188674927} -08/30/2021 22:03:08 - INFO - __main__ - Step 48760: {'lr': 0.00038663858511531034, 'samples': 9361920, 'steps': 48759, 'loss/train': 1.2440946102142334} -08/30/2021 22:03:09 - INFO - __main__ - Step 48761: {'lr': 0.000386634141091359, 'samples': 9362112, 'steps': 48760, 'loss/train': 1.301032304763794} -08/30/2021 22:03:10 - INFO - __main__ - Step 48762: {'lr': 0.0003866296970058423, 'samples': 9362304, 'steps': 48761, 'loss/train': 1.8586019277572632} -08/30/2021 22:03:10 - INFO - __main__ - Step 48763: {'lr': 0.0003866252528587624, 'samples': 9362496, 'steps': 48762, 'loss/train': 1.463564157485962} -08/30/2021 22:03:10 - INFO - __main__ - Step 48764: {'lr': 0.00038662080865012127, 'samples': 9362688, 'steps': 48763, 'loss/train': 1.4040064811706543} -08/30/2021 22:03:11 - INFO - __main__ - Step 48765: {'lr': 0.00038661636437992093, 'samples': 9362880, 'steps': 48764, 'loss/train': 1.363713026046753} -08/30/2021 22:03:12 - INFO - __main__ - Step 48766: {'lr': 0.0003866119200481634, 'samples': 9363072, 'steps': 48765, 'loss/train': 1.459545373916626} -08/30/2021 22:03:13 - INFO - __main__ - Step 48767: {'lr': 0.00038660747565485054, 'samples': 9363264, 'steps': 48766, 'loss/train': 1.904281735420227} -08/30/2021 22:03:13 - INFO - __main__ - Step 48768: {'lr': 0.0003866030311999845, 'samples': 9363456, 'steps': 48767, 'loss/train': 0.7655251026153564} -08/30/2021 22:03:13 - INFO - __main__ - Step 48769: {'lr': 0.0003865985866835673, 'samples': 9363648, 'steps': 48768, 'loss/train': 1.2952150106430054} -08/30/2021 22:03:14 - INFO - __main__ - Step 48770: {'lr': 0.00038659414210560087, 'samples': 9363840, 'steps': 48769, 'loss/train': 1.252069354057312} -08/30/2021 22:03:16 - INFO - __main__ - Step 48771: {'lr': 0.00038658969746608717, 'samples': 9364032, 'steps': 48770, 'loss/train': 1.5985147953033447} -08/30/2021 22:03:16 - INFO - __main__ - Step 48772: {'lr': 0.0003865852527650283, 'samples': 9364224, 'steps': 48771, 'loss/train': 1.8734334707260132} -08/30/2021 22:03:17 - INFO - __main__ - Step 48773: {'lr': 0.0003865808080024262, 'samples': 9364416, 'steps': 48772, 'loss/train': 1.3664510250091553} -08/30/2021 22:03:17 - INFO - __main__ - Step 48774: {'lr': 0.00038657636317828293, 'samples': 9364608, 'steps': 48773, 'loss/train': 1.2749916315078735} -08/30/2021 22:03:17 - INFO - __main__ - Step 48775: {'lr': 0.00038657191829260043, 'samples': 9364800, 'steps': 48774, 'loss/train': 1.3623124361038208} -08/30/2021 22:03:19 - INFO - __main__ - Step 48776: {'lr': 0.00038656747334538073, 'samples': 9364992, 'steps': 48775, 'loss/train': 1.9370123147964478} -08/30/2021 22:03:19 - INFO - __main__ - Step 48777: {'lr': 0.00038656302833662583, 'samples': 9365184, 'steps': 48776, 'loss/train': 1.8823027610778809} -08/30/2021 22:03:20 - INFO - __main__ - Step 48778: {'lr': 0.00038655858326633774, 'samples': 9365376, 'steps': 48777, 'loss/train': 1.4413312673568726} -08/30/2021 22:03:20 - INFO - __main__ - Step 48779: {'lr': 0.0003865541381345185, 'samples': 9365568, 'steps': 48778, 'loss/train': 1.325539231300354} -08/30/2021 22:03:20 - INFO - __main__ - Step 48780: {'lr': 0.00038654969294117, 'samples': 9365760, 'steps': 48779, 'loss/train': 1.5048428773880005} -08/30/2021 22:03:21 - INFO - __main__ - Step 48781: {'lr': 0.0003865452476862944, 'samples': 9365952, 'steps': 48780, 'loss/train': 1.2868441343307495} -08/30/2021 22:03:22 - INFO - __main__ - Step 48782: {'lr': 0.0003865408023698935, 'samples': 9366144, 'steps': 48781, 'loss/train': 1.2281959056854248} -08/30/2021 22:03:23 - INFO - __main__ - Step 48783: {'lr': 0.00038653635699196956, 'samples': 9366336, 'steps': 48782, 'loss/train': 1.5570204257965088} -08/30/2021 22:03:23 - INFO - __main__ - Step 48784: {'lr': 0.0003865319115525244, 'samples': 9366528, 'steps': 48783, 'loss/train': 1.641545295715332} -08/30/2021 22:03:23 - INFO - __main__ - Step 48785: {'lr': 0.00038652746605156, 'samples': 9366720, 'steps': 48784, 'loss/train': 1.150676965713501} -08/30/2021 22:03:24 - INFO - __main__ - Step 48786: {'lr': 0.0003865230204890785, 'samples': 9366912, 'steps': 48785, 'loss/train': 1.3756340742111206} -08/30/2021 22:03:25 - INFO - __main__ - Step 48787: {'lr': 0.0003865185748650818, 'samples': 9367104, 'steps': 48786, 'loss/train': 1.1080893278121948} -08/30/2021 22:03:26 - INFO - __main__ - Step 48788: {'lr': 0.00038651412917957195, 'samples': 9367296, 'steps': 48787, 'loss/train': 0.9076159000396729} -08/30/2021 22:03:26 - INFO - __main__ - Step 48789: {'lr': 0.000386509683432551, 'samples': 9367488, 'steps': 48788, 'loss/train': 1.5767009258270264} -08/30/2021 22:03:26 - INFO - __main__ - Step 48790: {'lr': 0.0003865052376240208, 'samples': 9367680, 'steps': 48789, 'loss/train': 1.0853540897369385} -08/30/2021 22:03:27 - INFO - __main__ - Step 48791: {'lr': 0.00038650079175398346, 'samples': 9367872, 'steps': 48790, 'loss/train': 1.300365924835205} -08/30/2021 22:03:28 - INFO - __main__ - Step 48792: {'lr': 0.00038649634582244095, 'samples': 9368064, 'steps': 48791, 'loss/train': 0.9238002896308899} -08/30/2021 22:03:29 - INFO - __main__ - Step 48793: {'lr': 0.0003864918998293954, 'samples': 9368256, 'steps': 48792, 'loss/train': 1.3387572765350342} -08/30/2021 22:03:29 - INFO - __main__ - Step 48794: {'lr': 0.0003864874537748486, 'samples': 9368448, 'steps': 48793, 'loss/train': 1.006764531135559} -08/30/2021 22:03:29 - INFO - __main__ - Step 48795: {'lr': 0.00038648300765880276, 'samples': 9368640, 'steps': 48794, 'loss/train': 0.6098302006721497} -08/30/2021 22:03:30 - INFO - __main__ - Step 48796: {'lr': 0.0003864785614812597, 'samples': 9368832, 'steps': 48795, 'loss/train': 0.7445828318595886} -08/30/2021 22:03:31 - INFO - __main__ - Step 48797: {'lr': 0.00038647411524222146, 'samples': 9369024, 'steps': 48796, 'loss/train': 1.2196470499038696} -08/30/2021 22:03:31 - INFO - __main__ - Step 48798: {'lr': 0.00038646966894169014, 'samples': 9369216, 'steps': 48797, 'loss/train': 0.8344257473945618} -08/30/2021 22:03:32 - INFO - __main__ - Step 48799: {'lr': 0.00038646522257966776, 'samples': 9369408, 'steps': 48798, 'loss/train': 1.6496281623840332} -08/30/2021 22:03:32 - INFO - __main__ - Step 48800: {'lr': 0.0003864607761561562, 'samples': 9369600, 'steps': 48799, 'loss/train': 1.2403191328048706} -08/30/2021 22:03:33 - INFO - __main__ - Step 48801: {'lr': 0.00038645632967115753, 'samples': 9369792, 'steps': 48800, 'loss/train': 1.62411630153656} -08/30/2021 22:03:33 - INFO - __main__ - Step 48802: {'lr': 0.0003864518831246737, 'samples': 9369984, 'steps': 48801, 'loss/train': 1.5026872158050537} -08/30/2021 22:03:34 - INFO - __main__ - Step 48803: {'lr': 0.00038644743651670684, 'samples': 9370176, 'steps': 48802, 'loss/train': 1.3241527080535889} -08/30/2021 22:03:35 - INFO - __main__ - Step 48804: {'lr': 0.00038644298984725876, 'samples': 9370368, 'steps': 48803, 'loss/train': 1.9161458015441895} -08/30/2021 22:03:35 - INFO - __main__ - Step 48805: {'lr': 0.00038643854311633166, 'samples': 9370560, 'steps': 48804, 'loss/train': 1.5951666831970215} -08/30/2021 22:03:35 - INFO - __main__ - Step 48806: {'lr': 0.0003864340963239275, 'samples': 9370752, 'steps': 48805, 'loss/train': 1.6425849199295044} -08/30/2021 22:03:36 - INFO - __main__ - Step 48807: {'lr': 0.00038642964947004815, 'samples': 9370944, 'steps': 48806, 'loss/train': 1.3888704776763916} -08/30/2021 22:03:37 - INFO - __main__ - Step 48808: {'lr': 0.0003864252025546957, 'samples': 9371136, 'steps': 48807, 'loss/train': 1.5884183645248413} -08/30/2021 22:03:38 - INFO - __main__ - Step 48809: {'lr': 0.00038642075557787225, 'samples': 9371328, 'steps': 48808, 'loss/train': 1.2967875003814697} -08/30/2021 22:03:38 - INFO - __main__ - Step 48810: {'lr': 0.0003864163085395797, 'samples': 9371520, 'steps': 48809, 'loss/train': 2.3215925693511963} -08/30/2021 22:03:39 - INFO - __main__ - Step 48811: {'lr': 0.00038641186143982, 'samples': 9371712, 'steps': 48810, 'loss/train': 1.638586163520813} -08/30/2021 22:03:39 - INFO - __main__ - Step 48812: {'lr': 0.0003864074142785952, 'samples': 9371904, 'steps': 48811, 'loss/train': 0.7048910856246948} -08/30/2021 22:03:40 - INFO - __main__ - Step 48813: {'lr': 0.0003864029670559074, 'samples': 9372096, 'steps': 48812, 'loss/train': 0.5984480381011963} -08/30/2021 22:03:41 - INFO - __main__ - Step 48814: {'lr': 0.0003863985197717585, 'samples': 9372288, 'steps': 48813, 'loss/train': 1.8973820209503174} -08/30/2021 22:03:41 - INFO - __main__ - Step 48815: {'lr': 0.0003863940724261505, 'samples': 9372480, 'steps': 48814, 'loss/train': 1.1817797422409058} -08/30/2021 22:03:41 - INFO - __main__ - Step 48816: {'lr': 0.0003863896250190855, 'samples': 9372672, 'steps': 48815, 'loss/train': 1.7076836824417114} -08/30/2021 22:03:42 - INFO - __main__ - Step 48817: {'lr': 0.00038638517755056534, 'samples': 9372864, 'steps': 48816, 'loss/train': 1.409352421760559} -08/30/2021 22:03:44 - INFO - __main__ - Step 48818: {'lr': 0.00038638073002059223, 'samples': 9373056, 'steps': 48817, 'loss/train': 1.6329432725906372} -08/30/2021 22:03:44 - INFO - __main__ - Step 48819: {'lr': 0.000386376282429168, 'samples': 9373248, 'steps': 48818, 'loss/train': 0.04905432090163231} -08/30/2021 22:03:44 - INFO - __main__ - Step 48820: {'lr': 0.0003863718347762948, 'samples': 9373440, 'steps': 48819, 'loss/train': 0.043754201382398605} -08/30/2021 22:03:45 - INFO - __main__ - Step 48821: {'lr': 0.0003863673870619744, 'samples': 9373632, 'steps': 48820, 'loss/train': 1.8629157543182373} -08/30/2021 22:03:45 - INFO - __main__ - Step 48822: {'lr': 0.00038636293928620915, 'samples': 9373824, 'steps': 48821, 'loss/train': 1.4572480916976929} -08/30/2021 22:03:45 - INFO - __main__ - Step 48823: {'lr': 0.0003863584914490007, 'samples': 9374016, 'steps': 48822, 'loss/train': 0.354684978723526} -08/30/2021 22:03:47 - INFO - __main__ - Step 48824: {'lr': 0.0003863540435503513, 'samples': 9374208, 'steps': 48823, 'loss/train': 0.7377296686172485} -08/30/2021 22:03:48 - INFO - __main__ - Step 48825: {'lr': 0.0003863495955902629, 'samples': 9374400, 'steps': 48824, 'loss/train': 1.657758116722107} -08/30/2021 22:03:48 - INFO - __main__ - Step 48826: {'lr': 0.00038634514756873746, 'samples': 9374592, 'steps': 48825, 'loss/train': 1.356229305267334} -08/30/2021 22:03:49 - INFO - __main__ - Step 48827: {'lr': 0.000386340699485777, 'samples': 9374784, 'steps': 48826, 'loss/train': 1.508836269378662} -08/30/2021 22:03:49 - INFO - __main__ - Step 48828: {'lr': 0.0003863362513413835, 'samples': 9374976, 'steps': 48827, 'loss/train': 1.3471057415008545} -08/30/2021 22:03:50 - INFO - __main__ - Step 48829: {'lr': 0.00038633180313555894, 'samples': 9375168, 'steps': 48828, 'loss/train': 1.279208779335022} -08/30/2021 22:03:51 - INFO - __main__ - Step 48830: {'lr': 0.0003863273548683054, 'samples': 9375360, 'steps': 48829, 'loss/train': 1.1051563024520874} -08/30/2021 22:03:51 - INFO - __main__ - Step 48831: {'lr': 0.0003863229065396249, 'samples': 9375552, 'steps': 48830, 'loss/train': 1.3010259866714478} -08/30/2021 22:03:52 - INFO - __main__ - Step 48832: {'lr': 0.0003863184581495194, 'samples': 9375744, 'steps': 48831, 'loss/train': 1.3051475286483765} -08/30/2021 22:03:52 - INFO - __main__ - Step 48833: {'lr': 0.0003863140096979909, 'samples': 9375936, 'steps': 48832, 'loss/train': 1.056808590888977} -08/30/2021 22:03:53 - INFO - __main__ - Step 48834: {'lr': 0.00038630956118504146, 'samples': 9376128, 'steps': 48833, 'loss/train': 0.875105082988739} -08/30/2021 22:03:54 - INFO - __main__ - Step 48835: {'lr': 0.00038630511261067294, 'samples': 9376320, 'steps': 48834, 'loss/train': 1.1130019426345825} -08/30/2021 22:03:54 - INFO - __main__ - Step 48836: {'lr': 0.0003863006639748875, 'samples': 9376512, 'steps': 48835, 'loss/train': 1.3328715562820435} -08/30/2021 22:03:55 - INFO - __main__ - Step 48837: {'lr': 0.000386296215277687, 'samples': 9376704, 'steps': 48836, 'loss/train': 1.9974236488342285} -08/30/2021 22:03:55 - INFO - __main__ - Step 48838: {'lr': 0.0003862917665190736, 'samples': 9376896, 'steps': 48837, 'loss/train': 1.3784449100494385} -08/30/2021 22:03:57 - INFO - __main__ - Step 48839: {'lr': 0.0003862873176990492, 'samples': 9377088, 'steps': 48838, 'loss/train': 1.9237213134765625} -08/30/2021 22:03:57 - INFO - __main__ - Step 48840: {'lr': 0.00038628286881761594, 'samples': 9377280, 'steps': 48839, 'loss/train': 1.4314467906951904} -08/30/2021 22:03:57 - INFO - __main__ - Step 48841: {'lr': 0.0003862784198747756, 'samples': 9377472, 'steps': 48840, 'loss/train': 0.1966492086648941} -08/30/2021 22:03:58 - INFO - __main__ - Step 48842: {'lr': 0.0003862739708705304, 'samples': 9377664, 'steps': 48841, 'loss/train': 1.95949125289917} -08/30/2021 22:03:58 - INFO - __main__ - Step 48843: {'lr': 0.0003862695218048822, 'samples': 9377856, 'steps': 48842, 'loss/train': 1.1845020055770874} -08/30/2021 22:04:00 - INFO - __main__ - Step 48844: {'lr': 0.000386265072677833, 'samples': 9378048, 'steps': 48843, 'loss/train': 1.2413744926452637} -08/30/2021 22:04:00 - INFO - __main__ - Step 48845: {'lr': 0.00038626062348938494, 'samples': 9378240, 'steps': 48844, 'loss/train': 0.3717733919620514} -08/30/2021 22:04:01 - INFO - __main__ - Step 48846: {'lr': 0.00038625617423954, 'samples': 9378432, 'steps': 48845, 'loss/train': 0.07578319311141968} -08/30/2021 22:04:01 - INFO - __main__ - Step 48847: {'lr': 0.00038625172492829995, 'samples': 9378624, 'steps': 48846, 'loss/train': 1.8362623453140259} -08/30/2021 22:04:01 - INFO - __main__ - Step 48848: {'lr': 0.00038624727555566714, 'samples': 9378816, 'steps': 48847, 'loss/train': 1.4770867824554443} -08/30/2021 22:04:02 - INFO - __main__ - Step 48849: {'lr': 0.0003862428261216433, 'samples': 9379008, 'steps': 48848, 'loss/train': 1.720317006111145} -08/30/2021 22:04:03 - INFO - __main__ - Step 48850: {'lr': 0.00038623837662623065, 'samples': 9379200, 'steps': 48849, 'loss/train': 1.3068805932998657} -08/30/2021 22:04:04 - INFO - __main__ - Step 48851: {'lr': 0.000386233927069431, 'samples': 9379392, 'steps': 48850, 'loss/train': 0.20891162753105164} -08/30/2021 22:04:04 - INFO - __main__ - Step 48852: {'lr': 0.0003862294774512465, 'samples': 9379584, 'steps': 48851, 'loss/train': 1.6089826822280884} -08/30/2021 22:04:04 - INFO - __main__ - Step 48853: {'lr': 0.00038622502777167913, 'samples': 9379776, 'steps': 48852, 'loss/train': 0.48764216899871826} -08/30/2021 22:04:05 - INFO - __main__ - Step 48854: {'lr': 0.00038622057803073075, 'samples': 9379968, 'steps': 48853, 'loss/train': 1.1983458995819092} -08/30/2021 22:04:06 - INFO - __main__ - Step 48855: {'lr': 0.0003862161282284036, 'samples': 9380160, 'steps': 48854, 'loss/train': 1.7085390090942383} -08/30/2021 22:04:07 - INFO - __main__ - Step 48856: {'lr': 0.00038621167836469945, 'samples': 9380352, 'steps': 48855, 'loss/train': 1.2399362325668335} -08/30/2021 22:04:07 - INFO - __main__ - Step 48857: {'lr': 0.0003862072284396205, 'samples': 9380544, 'steps': 48856, 'loss/train': 0.9718574285507202} -08/30/2021 22:04:07 - INFO - __main__ - Step 48858: {'lr': 0.00038620277845316867, 'samples': 9380736, 'steps': 48857, 'loss/train': 1.0807909965515137} -08/30/2021 22:04:08 - INFO - __main__ - Step 48859: {'lr': 0.00038619832840534586, 'samples': 9380928, 'steps': 48858, 'loss/train': 0.9542996287345886} -08/30/2021 22:04:09 - INFO - __main__ - Step 48860: {'lr': 0.0003861938782961544, 'samples': 9381120, 'steps': 48859, 'loss/train': 1.150165319442749} -08/30/2021 22:04:10 - INFO - __main__ - Step 48861: {'lr': 0.0003861894281255959, 'samples': 9381312, 'steps': 48860, 'loss/train': 1.0504695177078247} -08/30/2021 22:04:10 - INFO - __main__ - Step 48862: {'lr': 0.0003861849778936726, 'samples': 9381504, 'steps': 48861, 'loss/train': 3.8373653888702393} -08/30/2021 22:04:10 - INFO - __main__ - Step 48863: {'lr': 0.00038618052760038647, 'samples': 9381696, 'steps': 48862, 'loss/train': 1.8387144804000854} -08/30/2021 22:04:11 - INFO - __main__ - Step 48864: {'lr': 0.00038617607724573944, 'samples': 9381888, 'steps': 48863, 'loss/train': 0.1540784239768982} -08/30/2021 22:04:12 - INFO - __main__ - Step 48865: {'lr': 0.0003861716268297336, 'samples': 9382080, 'steps': 48864, 'loss/train': 0.9872737526893616} -08/30/2021 22:04:13 - INFO - __main__ - Step 48866: {'lr': 0.000386167176352371, 'samples': 9382272, 'steps': 48865, 'loss/train': 0.6970322132110596} -08/30/2021 22:04:13 - INFO - __main__ - Step 48867: {'lr': 0.00038616272581365354, 'samples': 9382464, 'steps': 48866, 'loss/train': 1.0987118482589722} -08/30/2021 22:04:13 - INFO - __main__ - Step 48868: {'lr': 0.00038615827521358315, 'samples': 9382656, 'steps': 48867, 'loss/train': 1.129199504852295} -08/30/2021 22:04:14 - INFO - __main__ - Step 48869: {'lr': 0.00038615382455216204, 'samples': 9382848, 'steps': 48868, 'loss/train': 1.5722532272338867} -08/30/2021 22:04:16 - INFO - __main__ - Step 48870: {'lr': 0.0003861493738293921, 'samples': 9383040, 'steps': 48869, 'loss/train': 1.3339334726333618} -08/30/2021 22:04:16 - INFO - __main__ - Step 48871: {'lr': 0.0003861449230452753, 'samples': 9383232, 'steps': 48870, 'loss/train': 1.812423586845398} -08/30/2021 22:04:16 - INFO - __main__ - Step 48872: {'lr': 0.00038614047219981374, 'samples': 9383424, 'steps': 48871, 'loss/train': 1.188661813735962} -08/30/2021 22:04:17 - INFO - __main__ - Step 48873: {'lr': 0.0003861360212930094, 'samples': 9383616, 'steps': 48872, 'loss/train': 1.4395866394042969} -08/30/2021 22:04:17 - INFO - __main__ - Step 48874: {'lr': 0.0003861315703248643, 'samples': 9383808, 'steps': 48873, 'loss/train': 1.8299689292907715} -08/30/2021 22:04:19 - INFO - __main__ - Step 48875: {'lr': 0.0003861271192953804, 'samples': 9384000, 'steps': 48874, 'loss/train': 1.4445850849151611} -08/30/2021 22:04:19 - INFO - __main__ - Step 48876: {'lr': 0.00038612266820455964, 'samples': 9384192, 'steps': 48875, 'loss/train': 1.373655915260315} -08/30/2021 22:04:19 - INFO - __main__ - Step 48877: {'lr': 0.0003861182170524041, 'samples': 9384384, 'steps': 48876, 'loss/train': 0.6758992075920105} -08/30/2021 22:04:20 - INFO - __main__ - Step 48878: {'lr': 0.0003861137658389159, 'samples': 9384576, 'steps': 48877, 'loss/train': 1.1939611434936523} -08/30/2021 22:04:20 - INFO - __main__ - Step 48879: {'lr': 0.0003861093145640969, 'samples': 9384768, 'steps': 48878, 'loss/train': 1.2324585914611816} -08/30/2021 22:04:22 - INFO - __main__ - Step 48880: {'lr': 0.00038610486322794915, 'samples': 9384960, 'steps': 48879, 'loss/train': 0.9681851267814636} -08/30/2021 22:04:23 - INFO - __main__ - Step 48881: {'lr': 0.0003861004118304746, 'samples': 9385152, 'steps': 48880, 'loss/train': 1.161491870880127} -08/30/2021 22:04:23 - INFO - __main__ - Step 48882: {'lr': 0.0003860959603716754, 'samples': 9385344, 'steps': 48881, 'loss/train': 1.2258241176605225} -08/30/2021 22:04:23 - INFO - __main__ - Step 48883: {'lr': 0.00038609150885155337, 'samples': 9385536, 'steps': 48882, 'loss/train': 0.5083160996437073} -08/30/2021 22:04:24 - INFO - __main__ - Step 48884: {'lr': 0.0003860870572701106, 'samples': 9385728, 'steps': 48883, 'loss/train': 1.3246307373046875} -08/30/2021 22:04:24 - INFO - __main__ - Step 48885: {'lr': 0.0003860826056273492, 'samples': 9385920, 'steps': 48884, 'loss/train': 1.828690767288208} -08/30/2021 22:04:26 - INFO - __main__ - Step 48886: {'lr': 0.0003860781539232709, 'samples': 9386112, 'steps': 48885, 'loss/train': 1.5244758129119873} -08/30/2021 22:04:26 - INFO - __main__ - Step 48887: {'lr': 0.0003860737021578781, 'samples': 9386304, 'steps': 48886, 'loss/train': 1.7214467525482178} -08/30/2021 22:04:26 - INFO - __main__ - Step 48888: {'lr': 0.00038606925033117246, 'samples': 9386496, 'steps': 48887, 'loss/train': 1.25721275806427} -08/30/2021 22:04:27 - INFO - __main__ - Step 48889: {'lr': 0.00038606479844315614, 'samples': 9386688, 'steps': 48888, 'loss/train': 1.7863469123840332} -08/30/2021 22:04:27 - INFO - __main__ - Step 48890: {'lr': 0.00038606034649383116, 'samples': 9386880, 'steps': 48889, 'loss/train': 1.0416723489761353} -08/30/2021 22:04:28 - INFO - __main__ - Step 48891: {'lr': 0.0003860558944831994, 'samples': 9387072, 'steps': 48890, 'loss/train': 1.6393935680389404} -08/30/2021 22:04:29 - INFO - __main__ - Step 48892: {'lr': 0.000386051442411263, 'samples': 9387264, 'steps': 48891, 'loss/train': 1.5236557722091675} -08/30/2021 22:04:29 - INFO - __main__ - Step 48893: {'lr': 0.00038604699027802394, 'samples': 9387456, 'steps': 48892, 'loss/train': 1.3921586275100708} -08/30/2021 22:04:30 - INFO - __main__ - Step 48894: {'lr': 0.0003860425380834842, 'samples': 9387648, 'steps': 48893, 'loss/train': 0.5640357136726379} -08/30/2021 22:04:30 - INFO - __main__ - Step 48895: {'lr': 0.0003860380858276458, 'samples': 9387840, 'steps': 48894, 'loss/train': 1.8777879476547241} -08/30/2021 22:04:31 - INFO - __main__ - Step 48896: {'lr': 0.0003860336335105107, 'samples': 9388032, 'steps': 48895, 'loss/train': 1.0305182933807373} -08/30/2021 22:04:32 - INFO - __main__ - Step 48897: {'lr': 0.000386029181132081, 'samples': 9388224, 'steps': 48896, 'loss/train': 1.4447362422943115} -08/30/2021 22:04:32 - INFO - __main__ - Step 48898: {'lr': 0.0003860247286923586, 'samples': 9388416, 'steps': 48897, 'loss/train': 1.4515936374664307} -08/30/2021 22:04:33 - INFO - __main__ - Step 48899: {'lr': 0.0003860202761913455, 'samples': 9388608, 'steps': 48898, 'loss/train': 1.4361896514892578} -08/30/2021 22:04:33 - INFO - __main__ - Step 48900: {'lr': 0.00038601582362904384, 'samples': 9388800, 'steps': 48899, 'loss/train': 1.861391305923462} -08/30/2021 22:04:34 - INFO - __main__ - Step 48901: {'lr': 0.0003860113710054556, 'samples': 9388992, 'steps': 48900, 'loss/train': 1.129175066947937} -08/30/2021 22:04:35 - INFO - __main__ - Step 48902: {'lr': 0.00038600691832058265, 'samples': 9389184, 'steps': 48901, 'loss/train': 1.0938245058059692} -08/30/2021 22:04:35 - INFO - __main__ - Step 48903: {'lr': 0.0003860024655744271, 'samples': 9389376, 'steps': 48902, 'loss/train': 1.6246204376220703} -08/30/2021 22:04:36 - INFO - __main__ - Step 48904: {'lr': 0.000385998012766991, 'samples': 9389568, 'steps': 48903, 'loss/train': 1.0381877422332764} -08/30/2021 22:04:36 - INFO - __main__ - Step 48905: {'lr': 0.0003859935598982762, 'samples': 9389760, 'steps': 48904, 'loss/train': 1.2635709047317505} -08/30/2021 22:04:37 - INFO - __main__ - Step 48906: {'lr': 0.0003859891069682848, 'samples': 9389952, 'steps': 48905, 'loss/train': 0.6974548697471619} -08/30/2021 22:04:38 - INFO - __main__ - Step 48907: {'lr': 0.0003859846539770189, 'samples': 9390144, 'steps': 48906, 'loss/train': 1.1524872779846191} -08/30/2021 22:04:38 - INFO - __main__ - Step 48908: {'lr': 0.0003859802009244804, 'samples': 9390336, 'steps': 48907, 'loss/train': 0.04876082018017769} -08/30/2021 22:04:39 - INFO - __main__ - Step 48909: {'lr': 0.00038597574781067123, 'samples': 9390528, 'steps': 48908, 'loss/train': 1.3122353553771973} -08/30/2021 22:04:39 - INFO - __main__ - Step 48910: {'lr': 0.0003859712946355936, 'samples': 9390720, 'steps': 48909, 'loss/train': 0.6884896159172058} -08/30/2021 22:04:40 - INFO - __main__ - Step 48911: {'lr': 0.0003859668413992493, 'samples': 9390912, 'steps': 48910, 'loss/train': 1.178629755973816} -08/30/2021 22:04:41 - INFO - __main__ - Step 48912: {'lr': 0.0003859623881016404, 'samples': 9391104, 'steps': 48911, 'loss/train': 1.3759442567825317} -08/30/2021 22:04:41 - INFO - __main__ - Step 48913: {'lr': 0.000385957934742769, 'samples': 9391296, 'steps': 48912, 'loss/train': 0.03345291689038277} -08/30/2021 22:04:42 - INFO - __main__ - Step 48914: {'lr': 0.0003859534813226372, 'samples': 9391488, 'steps': 48913, 'loss/train': 1.1845836639404297} -08/30/2021 22:04:42 - INFO - __main__ - Step 48915: {'lr': 0.00038594902784124663, 'samples': 9391680, 'steps': 48914, 'loss/train': 1.2679426670074463} -08/30/2021 22:04:44 - INFO - __main__ - Step 48916: {'lr': 0.00038594457429859966, 'samples': 9391872, 'steps': 48915, 'loss/train': 0.6124281883239746} -08/30/2021 22:04:44 - INFO - __main__ - Step 48917: {'lr': 0.00038594012069469814, 'samples': 9392064, 'steps': 48916, 'loss/train': 1.376297950744629} -08/30/2021 22:04:44 - INFO - __main__ - Step 48918: {'lr': 0.0003859356670295441, 'samples': 9392256, 'steps': 48917, 'loss/train': 1.6040748357772827} -08/30/2021 22:04:45 - INFO - __main__ - Step 48919: {'lr': 0.00038593121330313953, 'samples': 9392448, 'steps': 48918, 'loss/train': 1.0200928449630737} -08/30/2021 22:04:45 - INFO - __main__ - Step 48920: {'lr': 0.0003859267595154865, 'samples': 9392640, 'steps': 48919, 'loss/train': 1.6063692569732666} -08/30/2021 22:04:46 - INFO - __main__ - Step 48921: {'lr': 0.0003859223056665869, 'samples': 9392832, 'steps': 48920, 'loss/train': 0.5206479430198669} -08/30/2021 22:04:47 - INFO - __main__ - Step 48922: {'lr': 0.00038591785175644283, 'samples': 9393024, 'steps': 48921, 'loss/train': 0.9892064929008484} -08/30/2021 22:04:47 - INFO - __main__ - Step 48923: {'lr': 0.0003859133977850563, 'samples': 9393216, 'steps': 48922, 'loss/train': 1.2768689393997192} -08/30/2021 22:04:48 - INFO - __main__ - Step 48924: {'lr': 0.00038590894375242925, 'samples': 9393408, 'steps': 48923, 'loss/train': 1.22904372215271} -08/30/2021 22:04:48 - INFO - __main__ - Step 48925: {'lr': 0.0003859044896585637, 'samples': 9393600, 'steps': 48924, 'loss/train': 1.7870597839355469} -08/30/2021 22:04:48 - INFO - __main__ - Step 48926: {'lr': 0.00038590003550346177, 'samples': 9393792, 'steps': 48925, 'loss/train': 1.990837812423706} -08/30/2021 22:04:50 - INFO - __main__ - Step 48927: {'lr': 0.0003858955812871254, 'samples': 9393984, 'steps': 48926, 'loss/train': 0.5840023756027222} -08/30/2021 22:04:50 - INFO - __main__ - Step 48928: {'lr': 0.0003858911270095565, 'samples': 9394176, 'steps': 48927, 'loss/train': 1.9934320449829102} -08/30/2021 22:04:51 - INFO - __main__ - Step 48929: {'lr': 0.00038588667267075715, 'samples': 9394368, 'steps': 48928, 'loss/train': 0.8887355327606201} -08/30/2021 22:04:51 - INFO - __main__ - Step 48930: {'lr': 0.0003858822182707294, 'samples': 9394560, 'steps': 48929, 'loss/train': 1.5476365089416504} -08/30/2021 22:04:51 - INFO - __main__ - Step 48931: {'lr': 0.00038587776380947516, 'samples': 9394752, 'steps': 48930, 'loss/train': 0.06992319226264954} -08/30/2021 22:04:54 - INFO - __main__ - Step 48932: {'lr': 0.0003858733092869966, 'samples': 9394944, 'steps': 48931, 'loss/train': 1.5100784301757812} -08/30/2021 22:04:54 - INFO - __main__ - Step 48933: {'lr': 0.00038586885470329554, 'samples': 9395136, 'steps': 48932, 'loss/train': 1.2027466297149658} -08/30/2021 22:04:54 - INFO - __main__ - Step 48934: {'lr': 0.0003858644000583741, 'samples': 9395328, 'steps': 48933, 'loss/train': 1.4855645895004272} -08/30/2021 22:04:55 - INFO - __main__ - Step 48935: {'lr': 0.0003858599453522342, 'samples': 9395520, 'steps': 48934, 'loss/train': 1.2240182161331177} -08/30/2021 22:04:55 - INFO - __main__ - Step 48936: {'lr': 0.000385855490584878, 'samples': 9395712, 'steps': 48935, 'loss/train': 0.6295226216316223} -08/30/2021 22:04:57 - INFO - __main__ - Step 48937: {'lr': 0.0003858510357563074, 'samples': 9395904, 'steps': 48936, 'loss/train': 1.3402289152145386} -08/30/2021 22:04:57 - INFO - __main__ - Step 48938: {'lr': 0.00038584658086652433, 'samples': 9396096, 'steps': 48937, 'loss/train': 1.4372090101242065} -08/30/2021 22:04:57 - INFO - __main__ - Step 48939: {'lr': 0.00038584212591553105, 'samples': 9396288, 'steps': 48938, 'loss/train': 1.3219102621078491} -08/30/2021 22:04:58 - INFO - __main__ - Step 48940: {'lr': 0.00038583767090332924, 'samples': 9396480, 'steps': 48939, 'loss/train': 1.308092474937439} -08/30/2021 22:04:58 - INFO - __main__ - Step 48941: {'lr': 0.00038583321582992113, 'samples': 9396672, 'steps': 48940, 'loss/train': 1.9299805164337158} -08/30/2021 22:05:00 - INFO - __main__ - Step 48942: {'lr': 0.0003858287606953087, 'samples': 9396864, 'steps': 48941, 'loss/train': 1.8272383213043213} -08/30/2021 22:05:00 - INFO - __main__ - Step 48943: {'lr': 0.00038582430549949386, 'samples': 9397056, 'steps': 48942, 'loss/train': 0.9642685055732727} -08/30/2021 22:05:01 - INFO - __main__ - Step 48944: {'lr': 0.00038581985024247877, 'samples': 9397248, 'steps': 48943, 'loss/train': 1.1718032360076904} -08/30/2021 22:05:01 - INFO - __main__ - Step 48945: {'lr': 0.0003858153949242653, 'samples': 9397440, 'steps': 48944, 'loss/train': 0.06403294205665588} -08/30/2021 22:05:01 - INFO - __main__ - Step 48946: {'lr': 0.00038581093954485554, 'samples': 9397632, 'steps': 48945, 'loss/train': 1.5827386379241943} -08/30/2021 22:05:02 - INFO - __main__ - Step 48947: {'lr': 0.00038580648410425146, 'samples': 9397824, 'steps': 48946, 'loss/train': 1.8211649656295776} -08/30/2021 22:05:03 - INFO - __main__ - Step 48948: {'lr': 0.00038580202860245507, 'samples': 9398016, 'steps': 48947, 'loss/train': 1.4734798669815063} -08/30/2021 22:05:03 - INFO - __main__ - Step 48949: {'lr': 0.00038579757303946826, 'samples': 9398208, 'steps': 48948, 'loss/train': 1.2593379020690918} -08/30/2021 22:05:04 - INFO - __main__ - Step 48950: {'lr': 0.0003857931174152933, 'samples': 9398400, 'steps': 48949, 'loss/train': 1.5898241996765137} -08/30/2021 22:05:04 - INFO - __main__ - Step 48951: {'lr': 0.000385788661729932, 'samples': 9398592, 'steps': 48950, 'loss/train': 1.2492865324020386} -08/30/2021 22:05:06 - INFO - __main__ - Step 48952: {'lr': 0.0003857842059833865, 'samples': 9398784, 'steps': 48951, 'loss/train': 1.3450074195861816} -08/30/2021 22:05:06 - INFO - __main__ - Step 48953: {'lr': 0.0003857797501756587, 'samples': 9398976, 'steps': 48952, 'loss/train': 1.014382243156433} -08/30/2021 22:05:06 - INFO - __main__ - Step 48954: {'lr': 0.0003857752943067506, 'samples': 9399168, 'steps': 48953, 'loss/train': 1.793885350227356} -08/30/2021 22:05:07 - INFO - __main__ - Step 48955: {'lr': 0.0003857708383766643, 'samples': 9399360, 'steps': 48954, 'loss/train': 1.1865606307983398} -08/30/2021 22:05:07 - INFO - __main__ - Step 48956: {'lr': 0.00038576638238540167, 'samples': 9399552, 'steps': 48955, 'loss/train': 0.9951339960098267} -08/30/2021 22:05:08 - INFO - __main__ - Step 48957: {'lr': 0.00038576192633296485, 'samples': 9399744, 'steps': 48956, 'loss/train': 1.3709392547607422} -08/30/2021 22:05:09 - INFO - __main__ - Step 48958: {'lr': 0.00038575747021935583, 'samples': 9399936, 'steps': 48957, 'loss/train': 1.641698956489563} -08/30/2021 22:05:09 - INFO - __main__ - Step 48959: {'lr': 0.0003857530140445765, 'samples': 9400128, 'steps': 48958, 'loss/train': 1.6269811391830444} -08/30/2021 22:05:10 - INFO - __main__ - Step 48960: {'lr': 0.00038574855780862903, 'samples': 9400320, 'steps': 48959, 'loss/train': 1.3960156440734863} -08/30/2021 22:05:10 - INFO - __main__ - Step 48961: {'lr': 0.0003857441015115154, 'samples': 9400512, 'steps': 48960, 'loss/train': 1.5628035068511963} -08/30/2021 22:05:10 - INFO - __main__ - Step 48962: {'lr': 0.00038573964515323754, 'samples': 9400704, 'steps': 48961, 'loss/train': 1.8988583087921143} -08/30/2021 22:05:12 - INFO - __main__ - Step 48963: {'lr': 0.0003857351887337974, 'samples': 9400896, 'steps': 48962, 'loss/train': 1.569704532623291} -08/30/2021 22:05:13 - INFO - __main__ - Step 48964: {'lr': 0.00038573073225319724, 'samples': 9401088, 'steps': 48963, 'loss/train': 1.144771695137024} -08/30/2021 22:05:13 - INFO - __main__ - Step 48965: {'lr': 0.00038572627571143873, 'samples': 9401280, 'steps': 48964, 'loss/train': 1.7368896007537842} -08/30/2021 22:05:13 - INFO - __main__ - Step 48966: {'lr': 0.0003857218191085242, 'samples': 9401472, 'steps': 48965, 'loss/train': 1.4399389028549194} -08/30/2021 22:05:14 - INFO - __main__ - Step 48967: {'lr': 0.0003857173624444554, 'samples': 9401664, 'steps': 48966, 'loss/train': 0.6976837515830994} -08/30/2021 22:05:15 - INFO - __main__ - Step 48968: {'lr': 0.00038571290571923455, 'samples': 9401856, 'steps': 48967, 'loss/train': 0.8567972183227539} -08/30/2021 22:05:16 - INFO - __main__ - Step 48969: {'lr': 0.0003857084489328635, 'samples': 9402048, 'steps': 48968, 'loss/train': 1.2729710340499878} -08/30/2021 22:05:16 - INFO - __main__ - Step 48970: {'lr': 0.00038570399208534437, 'samples': 9402240, 'steps': 48969, 'loss/train': 1.094132900238037} -08/30/2021 22:05:17 - INFO - __main__ - Step 48971: {'lr': 0.000385699535176679, 'samples': 9402432, 'steps': 48970, 'loss/train': 1.727378487586975} -08/30/2021 22:05:17 - INFO - __main__ - Step 48972: {'lr': 0.00038569507820686956, 'samples': 9402624, 'steps': 48971, 'loss/train': 0.02724265865981579} -08/30/2021 22:05:17 - INFO - __main__ - Step 48973: {'lr': 0.000385690621175918, 'samples': 9402816, 'steps': 48972, 'loss/train': 1.346278429031372} -08/30/2021 22:05:19 - INFO - __main__ - Step 48974: {'lr': 0.0003856861640838265, 'samples': 9403008, 'steps': 48973, 'loss/train': 0.9433966279029846} -08/30/2021 22:05:20 - INFO - __main__ - Step 48975: {'lr': 0.00038568170693059677, 'samples': 9403200, 'steps': 48974, 'loss/train': 1.6088309288024902} -08/30/2021 22:05:20 - INFO - __main__ - Step 48976: {'lr': 0.000385677249716231, 'samples': 9403392, 'steps': 48975, 'loss/train': 1.4307420253753662} -08/30/2021 22:05:20 - INFO - __main__ - Step 48977: {'lr': 0.0003856727924407311, 'samples': 9403584, 'steps': 48976, 'loss/train': 1.0638583898544312} -08/30/2021 22:05:21 - INFO - __main__ - Step 48978: {'lr': 0.0003856683351040992, 'samples': 9403776, 'steps': 48977, 'loss/train': 0.4514577090740204} -08/30/2021 22:05:21 - INFO - __main__ - Step 48979: {'lr': 0.00038566387770633715, 'samples': 9403968, 'steps': 48978, 'loss/train': 0.28638121485710144} -08/30/2021 22:05:23 - INFO - __main__ - Step 48980: {'lr': 0.00038565942024744703, 'samples': 9404160, 'steps': 48979, 'loss/train': 1.5438251495361328} -08/30/2021 22:05:23 - INFO - __main__ - Step 48981: {'lr': 0.000385654962727431, 'samples': 9404352, 'steps': 48980, 'loss/train': 1.0712181329727173} -08/30/2021 22:05:23 - INFO - __main__ - Step 48982: {'lr': 0.00038565050514629087, 'samples': 9404544, 'steps': 48981, 'loss/train': 1.0263208150863647} -08/30/2021 22:05:24 - INFO - __main__ - Step 48983: {'lr': 0.0003856460475040288, 'samples': 9404736, 'steps': 48982, 'loss/train': 1.5323868989944458} -08/30/2021 22:05:24 - INFO - __main__ - Step 48984: {'lr': 0.00038564158980064657, 'samples': 9404928, 'steps': 48983, 'loss/train': 1.7161959409713745} -08/30/2021 22:05:26 - INFO - __main__ - Step 48985: {'lr': 0.0003856371320361464, 'samples': 9405120, 'steps': 48984, 'loss/train': 1.8002005815505981} -08/30/2021 22:05:27 - INFO - __main__ - Step 48986: {'lr': 0.00038563267421053024, 'samples': 9405312, 'steps': 48985, 'loss/train': 1.0854445695877075} -08/30/2021 22:05:27 - INFO - __main__ - Step 48987: {'lr': 0.0003856282163238001, 'samples': 9405504, 'steps': 48986, 'loss/train': 1.325804591178894} -08/30/2021 22:05:27 - INFO - __main__ - Step 48988: {'lr': 0.000385623758375958, 'samples': 9405696, 'steps': 48987, 'loss/train': 1.0465092658996582} -08/30/2021 22:05:28 - INFO - __main__ - Step 48989: {'lr': 0.0003856193003670058, 'samples': 9405888, 'steps': 48988, 'loss/train': 0.7524456977844238} -08/30/2021 22:05:29 - INFO - __main__ - Step 48990: {'lr': 0.0003856148422969458, 'samples': 9406080, 'steps': 48989, 'loss/train': 1.0065088272094727} -08/30/2021 22:05:30 - INFO - __main__ - Step 48991: {'lr': 0.0003856103841657797, 'samples': 9406272, 'steps': 48990, 'loss/train': 1.1180819272994995} -08/30/2021 22:05:30 - INFO - __main__ - Step 48992: {'lr': 0.00038560592597350975, 'samples': 9406464, 'steps': 48991, 'loss/train': 0.7776837348937988} -08/30/2021 22:05:30 - INFO - __main__ - Step 48993: {'lr': 0.0003856014677201378, 'samples': 9406656, 'steps': 48992, 'loss/train': 1.5926661491394043} -08/30/2021 22:05:31 - INFO - __main__ - Step 48994: {'lr': 0.000385597009405666, 'samples': 9406848, 'steps': 48993, 'loss/train': 1.502701997756958} -08/30/2021 22:05:32 - INFO - __main__ - Step 48995: {'lr': 0.0003855925510300962, 'samples': 9407040, 'steps': 48994, 'loss/train': 0.35187649726867676} -08/30/2021 22:05:33 - INFO - __main__ - Step 48996: {'lr': 0.0003855880925934305, 'samples': 9407232, 'steps': 48995, 'loss/train': 1.3718417882919312} -08/30/2021 22:05:33 - INFO - __main__ - Step 48997: {'lr': 0.000385583634095671, 'samples': 9407424, 'steps': 48996, 'loss/train': 1.366726279258728} -08/30/2021 22:05:34 - INFO - __main__ - Step 48998: {'lr': 0.00038557917553681944, 'samples': 9407616, 'steps': 48997, 'loss/train': 1.1551061868667603} -08/30/2021 22:05:34 - INFO - __main__ - Step 48999: {'lr': 0.00038557471691687804, 'samples': 9407808, 'steps': 48998, 'loss/train': 0.06604742258787155} -08/30/2021 22:05:34 - INFO - __main__ - Step 49000: {'lr': 0.0003855702582358489, 'samples': 9408000, 'steps': 48999, 'loss/train': 0.05074768513441086} -08/30/2021 22:05:36 - INFO - __main__ - Step 49001: {'lr': 0.00038556579949373384, 'samples': 9408192, 'steps': 49000, 'loss/train': 1.6001778841018677} -08/30/2021 22:05:36 - INFO - __main__ - Step 49002: {'lr': 0.00038556134069053484, 'samples': 9408384, 'steps': 49001, 'loss/train': 0.16883888840675354} -08/30/2021 22:05:37 - INFO - __main__ - Step 49003: {'lr': 0.00038555688182625406, 'samples': 9408576, 'steps': 49002, 'loss/train': 1.1565419435501099} -08/30/2021 22:05:37 - INFO - __main__ - Step 49004: {'lr': 0.0003855524229008934, 'samples': 9408768, 'steps': 49003, 'loss/train': 0.05974424630403519} -08/30/2021 22:05:37 - INFO - __main__ - Step 49005: {'lr': 0.0003855479639144549, 'samples': 9408960, 'steps': 49004, 'loss/train': 0.8605421781539917} -08/30/2021 22:05:39 - INFO - __main__ - Step 49006: {'lr': 0.0003855435048669406, 'samples': 9409152, 'steps': 49005, 'loss/train': 1.5286893844604492} -08/30/2021 22:05:40 - INFO - __main__ - Step 49007: {'lr': 0.0003855390457583525, 'samples': 9409344, 'steps': 49006, 'loss/train': 1.5339139699935913} -08/30/2021 22:05:40 - INFO - __main__ - Step 49008: {'lr': 0.0003855345865886926, 'samples': 9409536, 'steps': 49007, 'loss/train': 1.1174426078796387} -08/30/2021 22:05:40 - INFO - __main__ - Step 49009: {'lr': 0.0003855301273579629, 'samples': 9409728, 'steps': 49008, 'loss/train': 1.479286789894104} -08/30/2021 22:05:41 - INFO - __main__ - Step 49010: {'lr': 0.0003855256680661654, 'samples': 9409920, 'steps': 49009, 'loss/train': 1.000381350517273} -08/30/2021 22:05:42 - INFO - __main__ - Step 49011: {'lr': 0.00038552120871330217, 'samples': 9410112, 'steps': 49010, 'loss/train': 0.09208838641643524} -08/30/2021 22:05:43 - INFO - __main__ - Step 49012: {'lr': 0.0003855167492993751, 'samples': 9410304, 'steps': 49011, 'loss/train': 2.397510528564453} -08/30/2021 22:05:43 - INFO - __main__ - Step 49013: {'lr': 0.00038551228982438635, 'samples': 9410496, 'steps': 49012, 'loss/train': 1.698974847793579} -08/30/2021 22:05:43 - INFO - __main__ - Step 49014: {'lr': 0.00038550783028833786, 'samples': 9410688, 'steps': 49013, 'loss/train': 1.7288204431533813} -08/30/2021 22:05:44 - INFO - __main__ - Step 49015: {'lr': 0.00038550337069123155, 'samples': 9410880, 'steps': 49014, 'loss/train': 1.5784059762954712} -08/30/2021 22:05:45 - INFO - __main__ - Step 49016: {'lr': 0.00038549891103306953, 'samples': 9411072, 'steps': 49015, 'loss/train': 0.041614703834056854} -08/30/2021 22:05:46 - INFO - __main__ - Step 49017: {'lr': 0.00038549445131385386, 'samples': 9411264, 'steps': 49016, 'loss/train': 1.5330461263656616} -08/30/2021 22:05:46 - INFO - __main__ - Step 49018: {'lr': 0.00038548999153358645, 'samples': 9411456, 'steps': 49017, 'loss/train': 1.3942714929580688} -08/30/2021 22:05:46 - INFO - __main__ - Step 49019: {'lr': 0.0003854855316922693, 'samples': 9411648, 'steps': 49018, 'loss/train': 0.940632700920105} -08/30/2021 22:05:47 - INFO - __main__ - Step 49020: {'lr': 0.0003854810717899045, 'samples': 9411840, 'steps': 49019, 'loss/train': 1.4342384338378906} -08/30/2021 22:05:47 - INFO - __main__ - Step 49021: {'lr': 0.0003854766118264941, 'samples': 9412032, 'steps': 49020, 'loss/train': 1.3366179466247559} -08/30/2021 22:05:49 - INFO - __main__ - Step 49022: {'lr': 0.0003854721518020399, 'samples': 9412224, 'steps': 49021, 'loss/train': 1.6159183979034424} -08/30/2021 22:05:49 - INFO - __main__ - Step 49023: {'lr': 0.00038546769171654403, 'samples': 9412416, 'steps': 49022, 'loss/train': 1.5129677057266235} -08/30/2021 22:05:49 - INFO - __main__ - Step 49024: {'lr': 0.00038546323157000856, 'samples': 9412608, 'steps': 49023, 'loss/train': 0.7947247624397278} -08/30/2021 22:05:50 - INFO - __main__ - Step 49025: {'lr': 0.00038545877136243544, 'samples': 9412800, 'steps': 49024, 'loss/train': 2.404702663421631} -08/30/2021 22:05:50 - INFO - __main__ - Step 49026: {'lr': 0.00038545431109382667, 'samples': 9412992, 'steps': 49025, 'loss/train': 1.0186800956726074} -08/30/2021 22:05:52 - INFO - __main__ - Step 49027: {'lr': 0.0003854498507641843, 'samples': 9413184, 'steps': 49026, 'loss/train': 1.428654670715332} -08/30/2021 22:05:52 - INFO - __main__ - Step 49028: {'lr': 0.00038544539037351037, 'samples': 9413376, 'steps': 49027, 'loss/train': 1.2143417596817017} -08/30/2021 22:05:52 - INFO - __main__ - Step 49029: {'lr': 0.0003854409299218068, 'samples': 9413568, 'steps': 49028, 'loss/train': 1.7249650955200195} -08/30/2021 22:05:53 - INFO - __main__ - Step 49030: {'lr': 0.00038543646940907564, 'samples': 9413760, 'steps': 49029, 'loss/train': 5.788559913635254} -08/30/2021 22:05:53 - INFO - __main__ - Step 49031: {'lr': 0.0003854320088353188, 'samples': 9413952, 'steps': 49030, 'loss/train': 2.2537002563476562} -08/30/2021 22:05:55 - INFO - __main__ - Step 49032: {'lr': 0.0003854275482005385, 'samples': 9414144, 'steps': 49031, 'loss/train': 1.6331944465637207} -08/30/2021 22:05:55 - INFO - __main__ - Step 49033: {'lr': 0.0003854230875047366, 'samples': 9414336, 'steps': 49032, 'loss/train': 1.2995882034301758} -08/30/2021 22:05:56 - INFO - __main__ - Step 49034: {'lr': 0.0003854186267479151, 'samples': 9414528, 'steps': 49033, 'loss/train': 1.2372866868972778} -08/30/2021 22:05:56 - INFO - __main__ - Step 49035: {'lr': 0.00038541416593007615, 'samples': 9414720, 'steps': 49034, 'loss/train': 0.025636833161115646} -08/30/2021 22:05:56 - INFO - __main__ - Step 49036: {'lr': 0.00038540970505122164, 'samples': 9414912, 'steps': 49035, 'loss/train': 1.113980770111084} -08/30/2021 22:05:57 - INFO - __main__ - Step 49037: {'lr': 0.0003854052441113536, 'samples': 9415104, 'steps': 49036, 'loss/train': 0.12852731347084045} -08/30/2021 22:05:59 - INFO - __main__ - Step 49038: {'lr': 0.00038540078311047397, 'samples': 9415296, 'steps': 49037, 'loss/train': 1.3197351694107056} -08/30/2021 22:06:00 - INFO - __main__ - Step 49039: {'lr': 0.0003853963220485849, 'samples': 9415488, 'steps': 49038, 'loss/train': 1.1949341297149658} -08/30/2021 22:06:00 - INFO - __main__ - Step 49040: {'lr': 0.00038539186092568833, 'samples': 9415680, 'steps': 49039, 'loss/train': 2.6087334156036377} -08/30/2021 22:06:00 - INFO - __main__ - Step 49041: {'lr': 0.00038538739974178633, 'samples': 9415872, 'steps': 49040, 'loss/train': 1.5769902467727661} -08/30/2021 22:06:01 - INFO - __main__ - Step 49042: {'lr': 0.00038538293849688077, 'samples': 9416064, 'steps': 49041, 'loss/train': 1.2928646802902222} -08/30/2021 22:06:01 - INFO - __main__ - Step 49043: {'lr': 0.0003853784771909739, 'samples': 9416256, 'steps': 49042, 'loss/train': 0.06994496285915375} -08/30/2021 22:06:02 - INFO - __main__ - Step 49044: {'lr': 0.0003853740158240674, 'samples': 9416448, 'steps': 49043, 'loss/train': 1.356127142906189} -08/30/2021 22:06:03 - INFO - __main__ - Step 49045: {'lr': 0.0003853695543961635, 'samples': 9416640, 'steps': 49044, 'loss/train': 1.8946690559387207} -08/30/2021 22:06:03 - INFO - __main__ - Step 49046: {'lr': 0.00038536509290726417, 'samples': 9416832, 'steps': 49045, 'loss/train': 1.2499479055404663} -08/30/2021 22:06:04 - INFO - __main__ - Step 49047: {'lr': 0.00038536063135737145, 'samples': 9417024, 'steps': 49046, 'loss/train': 0.9454519748687744} -08/30/2021 22:06:04 - INFO - __main__ - Step 49048: {'lr': 0.0003853561697464874, 'samples': 9417216, 'steps': 49047, 'loss/train': 1.106493353843689} -08/30/2021 22:06:06 - INFO - __main__ - Step 49049: {'lr': 0.0003853517080746138, 'samples': 9417408, 'steps': 49048, 'loss/train': 1.9031293392181396} -08/30/2021 22:06:06 - INFO - __main__ - Step 49050: {'lr': 0.00038534724634175285, 'samples': 9417600, 'steps': 49049, 'loss/train': 1.9974815845489502} -08/30/2021 22:06:06 - INFO - __main__ - Step 49051: {'lr': 0.0003853427845479065, 'samples': 9417792, 'steps': 49050, 'loss/train': 1.4240002632141113} -08/30/2021 22:06:07 - INFO - __main__ - Step 49052: {'lr': 0.0003853383226930768, 'samples': 9417984, 'steps': 49051, 'loss/train': 1.643623948097229} -08/30/2021 22:06:07 - INFO - __main__ - Step 49053: {'lr': 0.00038533386077726573, 'samples': 9418176, 'steps': 49052, 'loss/train': 1.0840246677398682} -08/30/2021 22:06:09 - INFO - __main__ - Step 49054: {'lr': 0.00038532939880047535, 'samples': 9418368, 'steps': 49053, 'loss/train': 1.6964430809020996} -08/30/2021 22:06:09 - INFO - __main__ - Step 49055: {'lr': 0.00038532493676270765, 'samples': 9418560, 'steps': 49054, 'loss/train': 1.2003834247589111} -08/30/2021 22:06:10 - INFO - __main__ - Step 49056: {'lr': 0.0003853204746639646, 'samples': 9418752, 'steps': 49055, 'loss/train': 1.6735671758651733} -08/30/2021 22:06:10 - INFO - __main__ - Step 49057: {'lr': 0.0003853160125042482, 'samples': 9418944, 'steps': 49056, 'loss/train': 0.05597090348601341} -08/30/2021 22:06:10 - INFO - __main__ - Step 49058: {'lr': 0.00038531155028356047, 'samples': 9419136, 'steps': 49057, 'loss/train': 0.05793747678399086} -08/30/2021 22:06:12 - INFO - __main__ - Step 49059: {'lr': 0.0003853070880019035, 'samples': 9419328, 'steps': 49058, 'loss/train': 1.2153240442276} -08/30/2021 22:06:13 - INFO - __main__ - Step 49060: {'lr': 0.0003853026256592792, 'samples': 9419520, 'steps': 49059, 'loss/train': 1.1163966655731201} -08/30/2021 22:06:13 - INFO - __main__ - Step 49061: {'lr': 0.0003852981632556897, 'samples': 9419712, 'steps': 49060, 'loss/train': 1.5554616451263428} -08/30/2021 22:06:13 - INFO - __main__ - Step 49062: {'lr': 0.0003852937007911369, 'samples': 9419904, 'steps': 49061, 'loss/train': 1.268764853477478} -08/30/2021 22:06:14 - INFO - __main__ - Step 49063: {'lr': 0.00038528923826562287, 'samples': 9420096, 'steps': 49062, 'loss/train': 0.5437546968460083} -08/30/2021 22:06:15 - INFO - __main__ - Step 49064: {'lr': 0.00038528477567914955, 'samples': 9420288, 'steps': 49063, 'loss/train': 0.05685457959771156} -08/30/2021 22:06:16 - INFO - __main__ - Step 49065: {'lr': 0.000385280313031719, 'samples': 9420480, 'steps': 49064, 'loss/train': 1.2891452312469482} -08/30/2021 22:06:16 - INFO - __main__ - Step 49066: {'lr': 0.00038527585032333326, 'samples': 9420672, 'steps': 49065, 'loss/train': 1.0293633937835693} -08/30/2021 22:06:16 - INFO - __main__ - Step 49067: {'lr': 0.00038527138755399423, 'samples': 9420864, 'steps': 49066, 'loss/train': 1.389180064201355} -08/30/2021 22:06:17 - INFO - __main__ - Step 49068: {'lr': 0.00038526692472370407, 'samples': 9421056, 'steps': 49067, 'loss/train': 1.0328811407089233} -08/30/2021 22:06:19 - INFO - __main__ - Step 49069: {'lr': 0.0003852624618324647, 'samples': 9421248, 'steps': 49068, 'loss/train': 1.6344799995422363} -08/30/2021 22:06:19 - INFO - __main__ - Step 49070: {'lr': 0.0003852579988802782, 'samples': 9421440, 'steps': 49069, 'loss/train': 1.729058027267456} -08/30/2021 22:06:20 - INFO - __main__ - Step 49071: {'lr': 0.00038525353586714645, 'samples': 9421632, 'steps': 49070, 'loss/train': 0.9593988060951233} -08/30/2021 22:06:20 - INFO - __main__ - Step 49072: {'lr': 0.0003852490727930716, 'samples': 9421824, 'steps': 49071, 'loss/train': 1.533362865447998} -08/30/2021 22:06:20 - INFO - __main__ - Step 49073: {'lr': 0.00038524460965805557, 'samples': 9422016, 'steps': 49072, 'loss/train': 1.2628542184829712} -08/30/2021 22:06:21 - INFO - __main__ - Step 49074: {'lr': 0.00038524014646210044, 'samples': 9422208, 'steps': 49073, 'loss/train': 1.5083762407302856} -08/30/2021 22:06:22 - INFO - __main__ - Step 49075: {'lr': 0.00038523568320520817, 'samples': 9422400, 'steps': 49074, 'loss/train': 0.08774276822805405} -08/30/2021 22:06:23 - INFO - __main__ - Step 49076: {'lr': 0.0003852312198873808, 'samples': 9422592, 'steps': 49075, 'loss/train': 1.3700473308563232} -08/30/2021 22:06:23 - INFO - __main__ - Step 49077: {'lr': 0.0003852267565086203, 'samples': 9422784, 'steps': 49076, 'loss/train': 1.1281664371490479} -08/30/2021 22:06:23 - INFO - __main__ - Step 49078: {'lr': 0.0003852222930689288, 'samples': 9422976, 'steps': 49077, 'loss/train': 1.6004756689071655} -08/30/2021 22:06:24 - INFO - __main__ - Step 49079: {'lr': 0.00038521782956830807, 'samples': 9423168, 'steps': 49078, 'loss/train': 1.5095425844192505} -08/30/2021 22:06:25 - INFO - __main__ - Step 49080: {'lr': 0.00038521336600676035, 'samples': 9423360, 'steps': 49079, 'loss/train': 1.3744326829910278} -08/30/2021 22:06:26 - INFO - __main__ - Step 49081: {'lr': 0.00038520890238428763, 'samples': 9423552, 'steps': 49080, 'loss/train': 1.2326339483261108} -08/30/2021 22:06:26 - INFO - __main__ - Step 49082: {'lr': 0.00038520443870089185, 'samples': 9423744, 'steps': 49081, 'loss/train': 1.3077542781829834} -08/30/2021 22:06:26 - INFO - __main__ - Step 49083: {'lr': 0.00038519997495657497, 'samples': 9423936, 'steps': 49082, 'loss/train': 0.3408316373825073} -08/30/2021 22:06:27 - INFO - __main__ - Step 49084: {'lr': 0.0003851955111513391, 'samples': 9424128, 'steps': 49083, 'loss/train': 1.054155707359314} -08/30/2021 22:06:28 - INFO - __main__ - Step 49085: {'lr': 0.0003851910472851862, 'samples': 9424320, 'steps': 49084, 'loss/train': 2.1540746688842773} -08/30/2021 22:06:29 - INFO - __main__ - Step 49086: {'lr': 0.0003851865833581183, 'samples': 9424512, 'steps': 49085, 'loss/train': 1.5708335638046265} -08/30/2021 22:06:29 - INFO - __main__ - Step 49087: {'lr': 0.0003851821193701375, 'samples': 9424704, 'steps': 49086, 'loss/train': 0.4879619777202606} -08/30/2021 22:06:30 - INFO - __main__ - Step 49088: {'lr': 0.0003851776553212456, 'samples': 9424896, 'steps': 49087, 'loss/train': 1.294213056564331} -08/30/2021 22:06:30 - INFO - __main__ - Step 49089: {'lr': 0.0003851731912114448, 'samples': 9425088, 'steps': 49088, 'loss/train': 1.686768651008606} -08/30/2021 22:06:30 - INFO - __main__ - Step 49090: {'lr': 0.00038516872704073704, 'samples': 9425280, 'steps': 49089, 'loss/train': 0.8860755562782288} -08/30/2021 22:06:32 - INFO - __main__ - Step 49091: {'lr': 0.0003851642628091243, 'samples': 9425472, 'steps': 49090, 'loss/train': 1.1916581392288208} -08/30/2021 22:06:32 - INFO - __main__ - Step 49092: {'lr': 0.0003851597985166087, 'samples': 9425664, 'steps': 49091, 'loss/train': 2.623727560043335} -08/30/2021 22:06:33 - INFO - __main__ - Step 49093: {'lr': 0.0003851553341631921, 'samples': 9425856, 'steps': 49092, 'loss/train': 1.8974367380142212} -08/30/2021 22:06:33 - INFO - __main__ - Step 49094: {'lr': 0.0003851508697488766, 'samples': 9426048, 'steps': 49093, 'loss/train': 1.468618631362915} -08/30/2021 22:06:33 - INFO - __main__ - Step 49095: {'lr': 0.0003851464052736643, 'samples': 9426240, 'steps': 49094, 'loss/train': 1.7923316955566406} -08/30/2021 22:06:35 - INFO - __main__ - Step 49096: {'lr': 0.00038514194073755706, 'samples': 9426432, 'steps': 49095, 'loss/train': 1.4214571714401245} -08/30/2021 22:06:36 - INFO - __main__ - Step 49097: {'lr': 0.00038513747614055696, 'samples': 9426624, 'steps': 49096, 'loss/train': 1.5716248750686646} -08/30/2021 22:06:36 - INFO - __main__ - Step 49098: {'lr': 0.0003851330114826659, 'samples': 9426816, 'steps': 49097, 'loss/train': 0.25750911235809326} -08/30/2021 22:06:37 - INFO - __main__ - Step 49099: {'lr': 0.0003851285467638861, 'samples': 9427008, 'steps': 49098, 'loss/train': 0.38401684165000916} -08/30/2021 22:06:37 - INFO - __main__ - Step 49100: {'lr': 0.00038512408198421936, 'samples': 9427200, 'steps': 49099, 'loss/train': 1.4481605291366577} -08/30/2021 22:06:39 - INFO - __main__ - Step 49101: {'lr': 0.0003851196171436679, 'samples': 9427392, 'steps': 49100, 'loss/train': 1.4853707551956177} -08/30/2021 22:06:39 - INFO - __main__ - Step 49102: {'lr': 0.0003851151522422336, 'samples': 9427584, 'steps': 49101, 'loss/train': 0.8223899006843567} -08/30/2021 22:06:40 - INFO - __main__ - Step 49103: {'lr': 0.0003851106872799185, 'samples': 9427776, 'steps': 49102, 'loss/train': 1.9657347202301025} -08/30/2021 22:06:40 - INFO - __main__ - Step 49104: {'lr': 0.00038510622225672455, 'samples': 9427968, 'steps': 49103, 'loss/train': 1.4518288373947144} -08/30/2021 22:06:40 - INFO - __main__ - Step 49105: {'lr': 0.0003851017571726539, 'samples': 9428160, 'steps': 49104, 'loss/train': 1.3620963096618652} -08/30/2021 22:06:41 - INFO - __main__ - Step 49106: {'lr': 0.00038509729202770843, 'samples': 9428352, 'steps': 49105, 'loss/train': 0.09259865432977676} -08/30/2021 22:06:42 - INFO - __main__ - Step 49107: {'lr': 0.00038509282682189016, 'samples': 9428544, 'steps': 49106, 'loss/train': 1.55458664894104} -08/30/2021 22:06:43 - INFO - __main__ - Step 49108: {'lr': 0.0003850883615552012, 'samples': 9428736, 'steps': 49107, 'loss/train': 1.168648362159729} -08/30/2021 22:06:43 - INFO - __main__ - Step 49109: {'lr': 0.0003850838962276436, 'samples': 9428928, 'steps': 49108, 'loss/train': 0.04796629026532173} -08/30/2021 22:06:44 - INFO - __main__ - Step 49110: {'lr': 0.0003850794308392192, 'samples': 9429120, 'steps': 49109, 'loss/train': 1.4770183563232422} -08/30/2021 22:06:44 - INFO - __main__ - Step 49111: {'lr': 0.00038507496538993006, 'samples': 9429312, 'steps': 49110, 'loss/train': 1.256965160369873} -08/30/2021 22:06:46 - INFO - __main__ - Step 49112: {'lr': 0.00038507049987977825, 'samples': 9429504, 'steps': 49111, 'loss/train': 0.637797474861145} -08/30/2021 22:06:46 - INFO - __main__ - Step 49113: {'lr': 0.0003850660343087657, 'samples': 9429696, 'steps': 49112, 'loss/train': 0.7961546182632446} -08/30/2021 22:06:47 - INFO - __main__ - Step 49114: {'lr': 0.0003850615686768946, 'samples': 9429888, 'steps': 49113, 'loss/train': 1.6420841217041016} -08/30/2021 22:06:47 - INFO - __main__ - Step 49115: {'lr': 0.00038505710298416683, 'samples': 9430080, 'steps': 49114, 'loss/train': 1.5022225379943848} -08/30/2021 22:06:48 - INFO - __main__ - Step 49116: {'lr': 0.00038505263723058437, 'samples': 9430272, 'steps': 49115, 'loss/train': 0.7905400991439819} -08/30/2021 22:06:48 - INFO - __main__ - Step 49117: {'lr': 0.0003850481714161492, 'samples': 9430464, 'steps': 49116, 'loss/train': 0.06218510866165161} -08/30/2021 22:06:49 - INFO - __main__ - Step 49118: {'lr': 0.00038504370554086353, 'samples': 9430656, 'steps': 49117, 'loss/train': 0.02573992684483528} -08/30/2021 22:06:50 - INFO - __main__ - Step 49119: {'lr': 0.0003850392396047292, 'samples': 9430848, 'steps': 49118, 'loss/train': 1.3654017448425293} -08/30/2021 22:06:50 - INFO - __main__ - Step 49120: {'lr': 0.0003850347736077483, 'samples': 9431040, 'steps': 49119, 'loss/train': 1.1493711471557617} -08/30/2021 22:06:50 - INFO - __main__ - Step 49121: {'lr': 0.0003850303075499227, 'samples': 9431232, 'steps': 49120, 'loss/train': 0.9882366061210632} -08/30/2021 22:06:51 - INFO - __main__ - Step 49122: {'lr': 0.0003850258414312547, 'samples': 9431424, 'steps': 49121, 'loss/train': 1.4244186878204346} -08/30/2021 22:06:52 - INFO - __main__ - Step 49123: {'lr': 0.000385021375251746, 'samples': 9431616, 'steps': 49122, 'loss/train': 1.4393975734710693} -08/30/2021 22:06:53 - INFO - __main__ - Step 49124: {'lr': 0.00038501690901139883, 'samples': 9431808, 'steps': 49123, 'loss/train': 1.1934809684753418} -08/30/2021 22:06:53 - INFO - __main__ - Step 49125: {'lr': 0.0003850124427102151, 'samples': 9432000, 'steps': 49124, 'loss/train': 1.727146029472351} -08/30/2021 22:06:53 - INFO - __main__ - Step 49126: {'lr': 0.0003850079763481968, 'samples': 9432192, 'steps': 49125, 'loss/train': 1.2128039598464966} -08/30/2021 22:06:54 - INFO - __main__ - Step 49127: {'lr': 0.0003850035099253461, 'samples': 9432384, 'steps': 49126, 'loss/train': 0.6615647077560425} -08/30/2021 22:06:55 - INFO - __main__ - Step 49128: {'lr': 0.00038499904344166483, 'samples': 9432576, 'steps': 49127, 'loss/train': 1.3362478017807007} -08/30/2021 22:06:56 - INFO - __main__ - Step 49129: {'lr': 0.0003849945768971551, 'samples': 9432768, 'steps': 49128, 'loss/train': 1.3057968616485596} -08/30/2021 22:06:56 - INFO - __main__ - Step 49130: {'lr': 0.0003849901102918189, 'samples': 9432960, 'steps': 49129, 'loss/train': 0.24954719841480255} -08/30/2021 22:06:56 - INFO - __main__ - Step 49131: {'lr': 0.00038498564362565826, 'samples': 9433152, 'steps': 49130, 'loss/train': 1.4137929677963257} -08/30/2021 22:06:57 - INFO - __main__ - Step 49132: {'lr': 0.0003849811768986751, 'samples': 9433344, 'steps': 49131, 'loss/train': 1.699936032295227} -08/30/2021 22:06:58 - INFO - __main__ - Step 49133: {'lr': 0.0003849767101108715, 'samples': 9433536, 'steps': 49132, 'loss/train': 1.5967504978179932} -08/30/2021 22:06:59 - INFO - __main__ - Step 49134: {'lr': 0.0003849722432622495, 'samples': 9433728, 'steps': 49133, 'loss/train': 1.2202248573303223} -08/30/2021 22:06:59 - INFO - __main__ - Step 49135: {'lr': 0.0003849677763528111, 'samples': 9433920, 'steps': 49134, 'loss/train': 0.2459113597869873} -08/30/2021 22:06:59 - INFO - __main__ - Step 49136: {'lr': 0.0003849633093825583, 'samples': 9434112, 'steps': 49135, 'loss/train': 0.7782366275787354} -08/30/2021 22:07:00 - INFO - __main__ - Step 49137: {'lr': 0.00038495884235149316, 'samples': 9434304, 'steps': 49136, 'loss/train': 1.1433498859405518} -08/30/2021 22:07:01 - INFO - __main__ - Step 49138: {'lr': 0.0003849543752596176, 'samples': 9434496, 'steps': 49137, 'loss/train': 1.048794150352478} -08/30/2021 22:07:02 - INFO - __main__ - Step 49139: {'lr': 0.00038494990810693366, 'samples': 9434688, 'steps': 49138, 'loss/train': 0.6492387652397156} -08/30/2021 22:07:02 - INFO - __main__ - Step 49140: {'lr': 0.0003849454408934434, 'samples': 9434880, 'steps': 49139, 'loss/train': 0.8339297771453857} -08/30/2021 22:07:03 - INFO - __main__ - Step 49141: {'lr': 0.0003849409736191488, 'samples': 9435072, 'steps': 49140, 'loss/train': 0.9653542041778564} -08/30/2021 22:07:03 - INFO - __main__ - Step 49142: {'lr': 0.00038493650628405196, 'samples': 9435264, 'steps': 49141, 'loss/train': 1.070016622543335} -08/30/2021 22:07:03 - INFO - __main__ - Step 49143: {'lr': 0.0003849320388881547, 'samples': 9435456, 'steps': 49142, 'loss/train': 1.752500295639038} -08/30/2021 22:07:05 - INFO - __main__ - Step 49144: {'lr': 0.0003849275714314592, 'samples': 9435648, 'steps': 49143, 'loss/train': 1.339125394821167} -08/30/2021 22:07:05 - INFO - __main__ - Step 49145: {'lr': 0.0003849231039139674, 'samples': 9435840, 'steps': 49144, 'loss/train': 1.0353636741638184} -08/30/2021 22:07:06 - INFO - __main__ - Step 49146: {'lr': 0.00038491863633568135, 'samples': 9436032, 'steps': 49145, 'loss/train': 1.3980462551116943} -08/30/2021 22:07:06 - INFO - __main__ - Step 49147: {'lr': 0.000384914168696603, 'samples': 9436224, 'steps': 49146, 'loss/train': 1.4324872493743896} -08/30/2021 22:07:06 - INFO - __main__ - Step 49148: {'lr': 0.0003849097009967344, 'samples': 9436416, 'steps': 49147, 'loss/train': 1.2474780082702637} -08/30/2021 22:07:08 - INFO - __main__ - Step 49149: {'lr': 0.0003849052332360777, 'samples': 9436608, 'steps': 49148, 'loss/train': 1.3348233699798584} -08/30/2021 22:07:09 - INFO - __main__ - Step 49150: {'lr': 0.0003849007654146347, 'samples': 9436800, 'steps': 49149, 'loss/train': 1.6907507181167603} -08/30/2021 22:07:09 - INFO - __main__ - Step 49151: {'lr': 0.0003848962975324074, 'samples': 9436992, 'steps': 49150, 'loss/train': 1.3018909692764282} -08/30/2021 22:07:09 - INFO - __main__ - Step 49152: {'lr': 0.00038489182958939804, 'samples': 9437184, 'steps': 49151, 'loss/train': 1.5151299238204956} -08/30/2021 22:07:10 - INFO - __main__ - Step 49153: {'lr': 0.00038488736158560845, 'samples': 9437376, 'steps': 49152, 'loss/train': 1.7668776512145996} -08/30/2021 22:07:10 - INFO - __main__ - Step 49154: {'lr': 0.00038488289352104065, 'samples': 9437568, 'steps': 49153, 'loss/train': 0.10143160820007324} -08/30/2021 22:07:12 - INFO - __main__ - Step 49155: {'lr': 0.0003848784253956968, 'samples': 9437760, 'steps': 49154, 'loss/train': 1.9443635940551758} -08/30/2021 22:07:13 - INFO - __main__ - Step 49156: {'lr': 0.00038487395720957884, 'samples': 9437952, 'steps': 49155, 'loss/train': 1.2713654041290283} -08/30/2021 22:07:13 - INFO - __main__ - Step 49157: {'lr': 0.0003848694889626886, 'samples': 9438144, 'steps': 49156, 'loss/train': 1.399463176727295} -08/30/2021 22:07:13 - INFO - __main__ - Step 49158: {'lr': 0.0003848650206550284, 'samples': 9438336, 'steps': 49157, 'loss/train': 1.6623822450637817} -08/30/2021 22:07:14 - INFO - __main__ - Step 49159: {'lr': 0.0003848605522866, 'samples': 9438528, 'steps': 49158, 'loss/train': 0.09078831970691681} -08/30/2021 22:07:15 - INFO - __main__ - Step 49160: {'lr': 0.00038485608385740555, 'samples': 9438720, 'steps': 49159, 'loss/train': 1.3066836595535278} -08/30/2021 22:07:16 - INFO - __main__ - Step 49161: {'lr': 0.00038485161536744707, 'samples': 9438912, 'steps': 49160, 'loss/train': 0.9863752126693726} -08/30/2021 22:07:16 - INFO - __main__ - Step 49162: {'lr': 0.0003848471468167265, 'samples': 9439104, 'steps': 49161, 'loss/train': 1.2677817344665527} -08/30/2021 22:07:16 - INFO - __main__ - Step 49163: {'lr': 0.00038484267820524586, 'samples': 9439296, 'steps': 49162, 'loss/train': 0.6565447449684143} -08/30/2021 22:07:17 - INFO - __main__ - Step 49164: {'lr': 0.00038483820953300724, 'samples': 9439488, 'steps': 49163, 'loss/train': 1.3577884435653687} -08/30/2021 22:07:18 - INFO - __main__ - Step 49165: {'lr': 0.00038483374080001254, 'samples': 9439680, 'steps': 49164, 'loss/train': 1.3161287307739258} -08/30/2021 22:07:19 - INFO - __main__ - Step 49166: {'lr': 0.00038482927200626386, 'samples': 9439872, 'steps': 49165, 'loss/train': 1.6842350959777832} -08/30/2021 22:07:19 - INFO - __main__ - Step 49167: {'lr': 0.0003848248031517633, 'samples': 9440064, 'steps': 49166, 'loss/train': 1.3498424291610718} -08/30/2021 22:07:19 - INFO - __main__ - Step 49168: {'lr': 0.00038482033423651256, 'samples': 9440256, 'steps': 49167, 'loss/train': 0.8299590349197388} -08/30/2021 22:07:20 - INFO - __main__ - Step 49169: {'lr': 0.00038481586526051406, 'samples': 9440448, 'steps': 49168, 'loss/train': 1.4562487602233887} -08/30/2021 22:07:21 - INFO - __main__ - Step 49170: {'lr': 0.0003848113962237695, 'samples': 9440640, 'steps': 49169, 'loss/train': 1.0819567441940308} -08/30/2021 22:07:22 - INFO - __main__ - Step 49171: {'lr': 0.00038480692712628104, 'samples': 9440832, 'steps': 49170, 'loss/train': 1.4156032800674438} -08/30/2021 22:07:22 - INFO - __main__ - Step 49172: {'lr': 0.0003848024579680506, 'samples': 9441024, 'steps': 49171, 'loss/train': 1.3263633251190186} -08/30/2021 22:07:22 - INFO - __main__ - Step 49173: {'lr': 0.00038479798874908026, 'samples': 9441216, 'steps': 49172, 'loss/train': 1.9806033372879028} -08/30/2021 22:07:23 - INFO - __main__ - Step 49174: {'lr': 0.00038479351946937206, 'samples': 9441408, 'steps': 49173, 'loss/train': 1.4277247190475464} -08/30/2021 22:07:24 - INFO - __main__ - Step 49175: {'lr': 0.000384789050128928, 'samples': 9441600, 'steps': 49174, 'loss/train': 2.0319559574127197} -08/30/2021 22:07:25 - INFO - __main__ - Step 49176: {'lr': 0.0003847845807277501, 'samples': 9441792, 'steps': 49175, 'loss/train': 1.4201515913009644} -08/30/2021 22:07:25 - INFO - __main__ - Step 49177: {'lr': 0.0003847801112658403, 'samples': 9441984, 'steps': 49176, 'loss/train': 1.3669161796569824} -08/30/2021 22:07:25 - INFO - __main__ - Step 49178: {'lr': 0.0003847756417432007, 'samples': 9442176, 'steps': 49177, 'loss/train': 1.3410295248031616} -08/30/2021 22:07:26 - INFO - __main__ - Step 49179: {'lr': 0.00038477117215983316, 'samples': 9442368, 'steps': 49178, 'loss/train': 1.8866170644760132} -08/30/2021 22:07:27 - INFO - __main__ - Step 49180: {'lr': 0.0003847667025157399, 'samples': 9442560, 'steps': 49179, 'loss/train': 1.0135726928710938} -08/30/2021 22:07:28 - INFO - __main__ - Step 49181: {'lr': 0.0003847622328109228, 'samples': 9442752, 'steps': 49180, 'loss/train': 0.07564075291156769} -08/30/2021 22:07:28 - INFO - __main__ - Step 49182: {'lr': 0.000384757763045384, 'samples': 9442944, 'steps': 49181, 'loss/train': 0.30715441703796387} -08/30/2021 22:07:28 - INFO - __main__ - Step 49183: {'lr': 0.0003847532932191254, 'samples': 9443136, 'steps': 49182, 'loss/train': 2.2355058193206787} -08/30/2021 22:07:29 - INFO - __main__ - Step 49184: {'lr': 0.000384748823332149, 'samples': 9443328, 'steps': 49183, 'loss/train': 1.1814032793045044} -08/30/2021 22:07:29 - INFO - __main__ - Step 49185: {'lr': 0.0003847443533844569, 'samples': 9443520, 'steps': 49184, 'loss/train': 0.8963515162467957} -08/30/2021 22:07:31 - INFO - __main__ - Step 49186: {'lr': 0.000384739883376051, 'samples': 9443712, 'steps': 49185, 'loss/train': 1.2738615274429321} -08/30/2021 22:07:31 - INFO - __main__ - Step 49187: {'lr': 0.0003847354133069335, 'samples': 9443904, 'steps': 49186, 'loss/train': 1.3274590969085693} -08/30/2021 22:07:31 - INFO - __main__ - Step 49188: {'lr': 0.0003847309431771062, 'samples': 9444096, 'steps': 49187, 'loss/train': 1.1198103427886963} -08/30/2021 22:07:32 - INFO - __main__ - Step 49189: {'lr': 0.00038472647298657135, 'samples': 9444288, 'steps': 49188, 'loss/train': 1.8722938299179077} -08/30/2021 22:07:32 - INFO - __main__ - Step 49190: {'lr': 0.0003847220027353308, 'samples': 9444480, 'steps': 49189, 'loss/train': 1.2559112310409546} -08/30/2021 22:07:34 - INFO - __main__ - Step 49191: {'lr': 0.0003847175324233865, 'samples': 9444672, 'steps': 49190, 'loss/train': 0.05498026683926582} -08/30/2021 22:07:34 - INFO - __main__ - Step 49192: {'lr': 0.00038471306205074054, 'samples': 9444864, 'steps': 49191, 'loss/train': 0.23929549753665924} -08/30/2021 22:07:34 - INFO - __main__ - Step 49193: {'lr': 0.00038470859161739504, 'samples': 9445056, 'steps': 49192, 'loss/train': 1.2826683521270752} -08/30/2021 22:07:35 - INFO - __main__ - Step 49194: {'lr': 0.00038470412112335184, 'samples': 9445248, 'steps': 49193, 'loss/train': 1.2122269868850708} -08/30/2021 22:07:35 - INFO - __main__ - Step 49195: {'lr': 0.0003846996505686131, 'samples': 9445440, 'steps': 49194, 'loss/train': 1.8681303262710571} -08/30/2021 22:07:37 - INFO - __main__ - Step 49196: {'lr': 0.00038469517995318083, 'samples': 9445632, 'steps': 49195, 'loss/train': 1.8390130996704102} -08/30/2021 22:07:37 - INFO - __main__ - Step 49197: {'lr': 0.000384690709277057, 'samples': 9445824, 'steps': 49196, 'loss/train': 1.7137749195098877} -08/30/2021 22:07:38 - INFO - __main__ - Step 49198: {'lr': 0.0003846862385402435, 'samples': 9446016, 'steps': 49197, 'loss/train': 1.2819528579711914} -08/30/2021 22:07:38 - INFO - __main__ - Step 49199: {'lr': 0.00038468176774274253, 'samples': 9446208, 'steps': 49198, 'loss/train': 1.664359211921692} -08/30/2021 22:07:38 - INFO - __main__ - Step 49200: {'lr': 0.000384677296884556, 'samples': 9446400, 'steps': 49199, 'loss/train': 0.8389221429824829} -08/30/2021 22:07:39 - INFO - __main__ - Step 49201: {'lr': 0.000384672825965686, 'samples': 9446592, 'steps': 49200, 'loss/train': 1.6279150247573853} -08/30/2021 22:07:40 - INFO - __main__ - Step 49202: {'lr': 0.0003846683549861344, 'samples': 9446784, 'steps': 49201, 'loss/train': 0.46289634704589844} -08/30/2021 22:07:41 - INFO - __main__ - Step 49203: {'lr': 0.00038466388394590344, 'samples': 9446976, 'steps': 49202, 'loss/train': 1.8024694919586182} -08/30/2021 22:07:41 - INFO - __main__ - Step 49204: {'lr': 0.00038465941284499493, 'samples': 9447168, 'steps': 49203, 'loss/train': 1.3128901720046997} -08/30/2021 22:07:41 - INFO - __main__ - Step 49205: {'lr': 0.00038465494168341105, 'samples': 9447360, 'steps': 49204, 'loss/train': 1.273717999458313} -08/30/2021 22:07:42 - INFO - __main__ - Step 49206: {'lr': 0.00038465047046115365, 'samples': 9447552, 'steps': 49205, 'loss/train': 1.4139982461929321} -08/30/2021 22:07:44 - INFO - __main__ - Step 49207: {'lr': 0.00038464599917822483, 'samples': 9447744, 'steps': 49206, 'loss/train': 1.3037517070770264} -08/30/2021 22:07:44 - INFO - __main__ - Step 49208: {'lr': 0.00038464152783462667, 'samples': 9447936, 'steps': 49207, 'loss/train': 1.5533766746520996} -08/30/2021 22:07:44 - INFO - __main__ - Step 49209: {'lr': 0.0003846370564303611, 'samples': 9448128, 'steps': 49208, 'loss/train': 1.4777576923370361} -08/30/2021 22:07:45 - INFO - __main__ - Step 49210: {'lr': 0.00038463258496543014, 'samples': 9448320, 'steps': 49209, 'loss/train': 1.3325976133346558} -08/30/2021 22:07:45 - INFO - __main__ - Step 49211: {'lr': 0.0003846281134398358, 'samples': 9448512, 'steps': 49210, 'loss/train': 3.1529150009155273} -08/30/2021 22:07:47 - INFO - __main__ - Step 49212: {'lr': 0.0003846236418535801, 'samples': 9448704, 'steps': 49211, 'loss/train': 1.3873063325881958} -08/30/2021 22:07:47 - INFO - __main__ - Step 49213: {'lr': 0.00038461917020666506, 'samples': 9448896, 'steps': 49212, 'loss/train': 1.4782735109329224} -08/30/2021 22:07:47 - INFO - __main__ - Step 49214: {'lr': 0.0003846146984990927, 'samples': 9449088, 'steps': 49213, 'loss/train': 0.1309545338153839} -08/30/2021 22:07:48 - INFO - __main__ - Step 49215: {'lr': 0.00038461022673086506, 'samples': 9449280, 'steps': 49214, 'loss/train': 1.222947597503662} -08/30/2021 22:07:48 - INFO - __main__ - Step 49216: {'lr': 0.0003846057549019841, 'samples': 9449472, 'steps': 49215, 'loss/train': 1.864250659942627} -08/30/2021 22:07:50 - INFO - __main__ - Step 49217: {'lr': 0.0003846012830124519, 'samples': 9449664, 'steps': 49216, 'loss/train': 1.0156919956207275} -08/30/2021 22:07:50 - INFO - __main__ - Step 49218: {'lr': 0.0003845968110622704, 'samples': 9449856, 'steps': 49217, 'loss/train': 0.9880573153495789} -08/30/2021 22:07:50 - INFO - __main__ - Step 49219: {'lr': 0.0003845923390514417, 'samples': 9450048, 'steps': 49218, 'loss/train': 1.7902029752731323} -08/30/2021 22:07:51 - INFO - __main__ - Step 49220: {'lr': 0.0003845878669799677, 'samples': 9450240, 'steps': 49219, 'loss/train': 1.3832365274429321} -08/30/2021 22:07:51 - INFO - __main__ - Step 49221: {'lr': 0.00038458339484785057, 'samples': 9450432, 'steps': 49220, 'loss/train': 0.6814090609550476} -08/30/2021 22:07:53 - INFO - __main__ - Step 49222: {'lr': 0.00038457892265509214, 'samples': 9450624, 'steps': 49221, 'loss/train': 1.1078617572784424} -08/30/2021 22:07:53 - INFO - __main__ - Step 49223: {'lr': 0.00038457445040169467, 'samples': 9450816, 'steps': 49222, 'loss/train': 1.317821741104126} -08/30/2021 22:07:54 - INFO - __main__ - Step 49224: {'lr': 0.00038456997808765993, 'samples': 9451008, 'steps': 49223, 'loss/train': 1.1129207611083984} -08/30/2021 22:07:54 - INFO - __main__ - Step 49225: {'lr': 0.00038456550571299, 'samples': 9451200, 'steps': 49224, 'loss/train': 1.248144507408142} -08/30/2021 22:07:54 - INFO - __main__ - Step 49226: {'lr': 0.000384561033277687, 'samples': 9451392, 'steps': 49225, 'loss/train': 0.04282043129205704} -08/30/2021 22:07:56 - INFO - __main__ - Step 49227: {'lr': 0.00038455656078175283, 'samples': 9451584, 'steps': 49226, 'loss/train': 0.7476810812950134} -08/30/2021 22:07:56 - INFO - __main__ - Step 49228: {'lr': 0.0003845520882251895, 'samples': 9451776, 'steps': 49227, 'loss/train': 1.4731860160827637} -08/30/2021 22:07:56 - INFO - __main__ - Step 49229: {'lr': 0.00038454761560799915, 'samples': 9451968, 'steps': 49228, 'loss/train': 1.58684241771698} -08/30/2021 22:07:57 - INFO - __main__ - Step 49230: {'lr': 0.0003845431429301838, 'samples': 9452160, 'steps': 49229, 'loss/train': 0.8257639408111572} -08/30/2021 22:07:57 - INFO - __main__ - Step 49231: {'lr': 0.0003845386701917453, 'samples': 9452352, 'steps': 49230, 'loss/train': 1.198689341545105} -08/30/2021 22:07:59 - INFO - __main__ - Step 49232: {'lr': 0.0003845341973926857, 'samples': 9452544, 'steps': 49231, 'loss/train': 1.4551129341125488} -08/30/2021 22:07:59 - INFO - __main__ - Step 49233: {'lr': 0.0003845297245330071, 'samples': 9452736, 'steps': 49232, 'loss/train': 1.2291473150253296} -08/30/2021 22:08:00 - INFO - __main__ - Step 49234: {'lr': 0.0003845252516127115, 'samples': 9452928, 'steps': 49233, 'loss/train': 1.5148202180862427} -08/30/2021 22:08:00 - INFO - __main__ - Step 49235: {'lr': 0.0003845207786318009, 'samples': 9453120, 'steps': 49234, 'loss/train': 1.0508157014846802} -08/30/2021 22:08:00 - INFO - __main__ - Step 49236: {'lr': 0.0003845163055902773, 'samples': 9453312, 'steps': 49235, 'loss/train': 1.4602532386779785} -08/30/2021 22:08:01 - INFO - __main__ - Step 49237: {'lr': 0.0003845118324881428, 'samples': 9453504, 'steps': 49236, 'loss/train': 1.648748517036438} -08/30/2021 22:08:02 - INFO - __main__ - Step 49238: {'lr': 0.00038450735932539927, 'samples': 9453696, 'steps': 49237, 'loss/train': 0.32679829001426697} -08/30/2021 22:08:03 - INFO - __main__ - Step 49239: {'lr': 0.0003845028861020488, 'samples': 9453888, 'steps': 49238, 'loss/train': 1.423423409461975} -08/30/2021 22:08:03 - INFO - __main__ - Step 49240: {'lr': 0.0003844984128180934, 'samples': 9454080, 'steps': 49239, 'loss/train': 1.4369245767593384} -08/30/2021 22:08:04 - INFO - __main__ - Step 49241: {'lr': 0.00038449393947353507, 'samples': 9454272, 'steps': 49240, 'loss/train': 1.8922852277755737} -08/30/2021 22:08:04 - INFO - __main__ - Step 49242: {'lr': 0.00038448946606837585, 'samples': 9454464, 'steps': 49241, 'loss/train': 4.198641300201416} -08/30/2021 22:08:05 - INFO - __main__ - Step 49243: {'lr': 0.00038448499260261787, 'samples': 9454656, 'steps': 49242, 'loss/train': 1.6535613536834717} -08/30/2021 22:08:06 - INFO - __main__ - Step 49244: {'lr': 0.0003844805190762629, 'samples': 9454848, 'steps': 49243, 'loss/train': 1.4675184488296509} -08/30/2021 22:08:06 - INFO - __main__ - Step 49245: {'lr': 0.00038447604548931313, 'samples': 9455040, 'steps': 49244, 'loss/train': 1.0234043598175049} -08/30/2021 22:08:07 - INFO - __main__ - Step 49246: {'lr': 0.0003844715718417705, 'samples': 9455232, 'steps': 49245, 'loss/train': 1.3436241149902344} -08/30/2021 22:08:07 - INFO - __main__ - Step 49247: {'lr': 0.0003844670981336371, 'samples': 9455424, 'steps': 49246, 'loss/train': 0.6790292263031006} -08/30/2021 22:08:08 - INFO - __main__ - Step 49248: {'lr': 0.000384462624364915, 'samples': 9455616, 'steps': 49247, 'loss/train': 1.5197412967681885} -08/30/2021 22:08:09 - INFO - __main__ - Step 49249: {'lr': 0.00038445815053560596, 'samples': 9455808, 'steps': 49248, 'loss/train': 1.5542930364608765} -08/30/2021 22:08:09 - INFO - __main__ - Step 49250: {'lr': 0.00038445367664571216, 'samples': 9456000, 'steps': 49249, 'loss/train': 1.1682729721069336} -08/30/2021 22:08:10 - INFO - __main__ - Step 49251: {'lr': 0.00038444920269523563, 'samples': 9456192, 'steps': 49250, 'loss/train': 1.1977733373641968} -08/30/2021 22:08:10 - INFO - __main__ - Step 49252: {'lr': 0.0003844447286841783, 'samples': 9456384, 'steps': 49251, 'loss/train': 1.5462701320648193} -08/30/2021 22:08:11 - INFO - __main__ - Step 49253: {'lr': 0.0003844402546125424, 'samples': 9456576, 'steps': 49252, 'loss/train': 0.2373725175857544} -08/30/2021 22:08:12 - INFO - __main__ - Step 49254: {'lr': 0.00038443578048032975, 'samples': 9456768, 'steps': 49253, 'loss/train': 1.6040765047073364} -08/30/2021 22:08:12 - INFO - __main__ - Step 49255: {'lr': 0.0003844313062875423, 'samples': 9456960, 'steps': 49254, 'loss/train': 1.4305919408798218} -08/30/2021 22:08:13 - INFO - __main__ - Step 49256: {'lr': 0.00038442683203418227, 'samples': 9457152, 'steps': 49255, 'loss/train': 1.3896656036376953} -08/30/2021 22:08:13 - INFO - __main__ - Step 49257: {'lr': 0.0003844223577202516, 'samples': 9457344, 'steps': 49256, 'loss/train': 1.2048274278640747} -08/30/2021 22:08:15 - INFO - __main__ - Step 49258: {'lr': 0.00038441788334575225, 'samples': 9457536, 'steps': 49257, 'loss/train': 1.546325922012329} -08/30/2021 22:08:16 - INFO - __main__ - Step 49259: {'lr': 0.0003844134089106863, 'samples': 9457728, 'steps': 49258, 'loss/train': 1.31949782371521} -08/30/2021 22:08:16 - INFO - __main__ - Step 49260: {'lr': 0.00038440893441505573, 'samples': 9457920, 'steps': 49259, 'loss/train': 1.5841712951660156} -08/30/2021 22:08:16 - INFO - __main__ - Step 49261: {'lr': 0.0003844044598588625, 'samples': 9458112, 'steps': 49260, 'loss/train': 1.8185442686080933} -08/30/2021 22:08:17 - INFO - __main__ - Step 49262: {'lr': 0.0003843999852421088, 'samples': 9458304, 'steps': 49261, 'loss/train': 0.04322107881307602} -08/30/2021 22:08:17 - INFO - __main__ - Step 49263: {'lr': 0.0003843955105647965, 'samples': 9458496, 'steps': 49262, 'loss/train': 1.0817681550979614} -08/30/2021 22:08:18 - INFO - __main__ - Step 49264: {'lr': 0.0003843910358269277, 'samples': 9458688, 'steps': 49263, 'loss/train': 0.05380666255950928} -08/30/2021 22:08:19 - INFO - __main__ - Step 49265: {'lr': 0.0003843865610285043, 'samples': 9458880, 'steps': 49264, 'loss/train': 1.3266944885253906} -08/30/2021 22:08:19 - INFO - __main__ - Step 49266: {'lr': 0.0003843820861695284, 'samples': 9459072, 'steps': 49265, 'loss/train': 1.446295142173767} -08/30/2021 22:08:20 - INFO - __main__ - Step 49267: {'lr': 0.00038437761125000204, 'samples': 9459264, 'steps': 49266, 'loss/train': 1.4948248863220215} -08/30/2021 22:08:20 - INFO - __main__ - Step 49268: {'lr': 0.00038437313626992723, 'samples': 9459456, 'steps': 49267, 'loss/train': 1.1032837629318237} -08/30/2021 22:08:22 - INFO - __main__ - Step 49269: {'lr': 0.0003843686612293059, 'samples': 9459648, 'steps': 49268, 'loss/train': 0.5796222686767578} -08/30/2021 22:08:22 - INFO - __main__ - Step 49270: {'lr': 0.0003843641861281402, 'samples': 9459840, 'steps': 49269, 'loss/train': 1.481544852256775} -08/30/2021 22:08:22 - INFO - __main__ - Step 49271: {'lr': 0.00038435971096643196, 'samples': 9460032, 'steps': 49270, 'loss/train': 0.8321482539176941} -08/30/2021 22:08:23 - INFO - __main__ - Step 49272: {'lr': 0.00038435523574418336, 'samples': 9460224, 'steps': 49271, 'loss/train': 1.2183438539505005} -08/30/2021 22:08:23 - INFO - __main__ - Step 49273: {'lr': 0.0003843507604613964, 'samples': 9460416, 'steps': 49272, 'loss/train': 1.5134491920471191} -08/30/2021 22:08:24 - INFO - __main__ - Step 49274: {'lr': 0.00038434628511807296, 'samples': 9460608, 'steps': 49273, 'loss/train': 0.6419780254364014} -08/30/2021 22:08:25 - INFO - __main__ - Step 49275: {'lr': 0.00038434180971421523, 'samples': 9460800, 'steps': 49274, 'loss/train': 1.5866234302520752} -08/30/2021 22:08:25 - INFO - __main__ - Step 49276: {'lr': 0.0003843373342498251, 'samples': 9460992, 'steps': 49275, 'loss/train': 0.7980654835700989} -08/30/2021 22:08:26 - INFO - __main__ - Step 49277: {'lr': 0.00038433285872490475, 'samples': 9461184, 'steps': 49276, 'loss/train': 1.5908366441726685} -08/30/2021 22:08:26 - INFO - __main__ - Step 49278: {'lr': 0.000384328383139456, 'samples': 9461376, 'steps': 49277, 'loss/train': 1.6412440538406372} -08/30/2021 22:08:26 - INFO - __main__ - Step 49279: {'lr': 0.000384323907493481, 'samples': 9461568, 'steps': 49278, 'loss/train': 1.5419632196426392} -08/30/2021 22:08:28 - INFO - __main__ - Step 49280: {'lr': 0.0003843194317869817, 'samples': 9461760, 'steps': 49279, 'loss/train': 1.3067244291305542} -08/30/2021 22:08:28 - INFO - __main__ - Step 49281: {'lr': 0.0003843149560199601, 'samples': 9461952, 'steps': 49280, 'loss/train': 1.2367156744003296} -08/30/2021 22:08:29 - INFO - __main__ - Step 49282: {'lr': 0.0003843104801924183, 'samples': 9462144, 'steps': 49281, 'loss/train': 1.2822291851043701} -08/30/2021 22:08:29 - INFO - __main__ - Step 49283: {'lr': 0.00038430600430435825, 'samples': 9462336, 'steps': 49282, 'loss/train': 1.815993070602417} -08/30/2021 22:08:29 - INFO - __main__ - Step 49284: {'lr': 0.000384301528355782, 'samples': 9462528, 'steps': 49283, 'loss/train': 1.6723556518554688} -08/30/2021 22:08:31 - INFO - __main__ - Step 49285: {'lr': 0.00038429705234669157, 'samples': 9462720, 'steps': 49284, 'loss/train': 1.1135339736938477} -08/30/2021 22:08:32 - INFO - __main__ - Step 49286: {'lr': 0.00038429257627708893, 'samples': 9462912, 'steps': 49285, 'loss/train': 1.359188199043274} -08/30/2021 22:08:32 - INFO - __main__ - Step 49287: {'lr': 0.00038428810014697615, 'samples': 9463104, 'steps': 49286, 'loss/train': 1.1317414045333862} -08/30/2021 22:08:32 - INFO - __main__ - Step 49288: {'lr': 0.00038428362395635514, 'samples': 9463296, 'steps': 49287, 'loss/train': 1.7288060188293457} -08/30/2021 22:08:33 - INFO - __main__ - Step 49289: {'lr': 0.0003842791477052281, 'samples': 9463488, 'steps': 49288, 'loss/train': 0.21582379937171936} -08/30/2021 22:08:33 - INFO - __main__ - Step 49290: {'lr': 0.00038427467139359696, 'samples': 9463680, 'steps': 49289, 'loss/train': 0.48793405294418335} -08/30/2021 22:08:35 - INFO - __main__ - Step 49291: {'lr': 0.00038427019502146364, 'samples': 9463872, 'steps': 49290, 'loss/train': 1.7250391244888306} -08/30/2021 22:08:35 - INFO - __main__ - Step 49292: {'lr': 0.0003842657185888303, 'samples': 9464064, 'steps': 49291, 'loss/train': 1.3810476064682007} -08/30/2021 22:08:35 - INFO - __main__ - Step 49293: {'lr': 0.00038426124209569885, 'samples': 9464256, 'steps': 49292, 'loss/train': 1.6160986423492432} -08/30/2021 22:08:36 - INFO - __main__ - Step 49294: {'lr': 0.00038425676554207133, 'samples': 9464448, 'steps': 49293, 'loss/train': 0.27751803398132324} -08/30/2021 22:08:36 - INFO - __main__ - Step 49295: {'lr': 0.0003842522889279499, 'samples': 9464640, 'steps': 49294, 'loss/train': 1.7591522932052612} -08/30/2021 22:08:38 - INFO - __main__ - Step 49296: {'lr': 0.00038424781225333636, 'samples': 9464832, 'steps': 49295, 'loss/train': 0.8963214755058289} -08/30/2021 22:08:38 - INFO - __main__ - Step 49297: {'lr': 0.0003842433355182329, 'samples': 9465024, 'steps': 49296, 'loss/train': 3.1488471031188965} -08/30/2021 22:08:39 - INFO - __main__ - Step 49298: {'lr': 0.0003842388587226414, 'samples': 9465216, 'steps': 49297, 'loss/train': 1.3312585353851318} -08/30/2021 22:08:39 - INFO - __main__ - Step 49299: {'lr': 0.000384234381866564, 'samples': 9465408, 'steps': 49298, 'loss/train': 1.4373165369033813} -08/30/2021 22:08:39 - INFO - __main__ - Step 49300: {'lr': 0.00038422990495000267, 'samples': 9465600, 'steps': 49299, 'loss/train': 0.09126025438308716} -08/30/2021 22:08:40 - INFO - __main__ - Step 49301: {'lr': 0.00038422542797295935, 'samples': 9465792, 'steps': 49300, 'loss/train': 0.33187004923820496} -08/30/2021 22:08:40 - INFO - __main__ - Step 49302: {'lr': 0.0003842209509354362, 'samples': 9465984, 'steps': 49301, 'loss/train': 0.9662020206451416} -08/30/2021 22:08:42 - INFO - __main__ - Step 49303: {'lr': 0.00038421647383743505, 'samples': 9466176, 'steps': 49302, 'loss/train': 1.3036764860153198} -08/30/2021 22:08:42 - INFO - __main__ - Step 49304: {'lr': 0.00038421199667895814, 'samples': 9466368, 'steps': 49303, 'loss/train': 1.3093466758728027} -08/30/2021 22:08:43 - INFO - __main__ - Step 49305: {'lr': 0.0003842075194600073, 'samples': 9466560, 'steps': 49304, 'loss/train': 1.181131362915039} -08/30/2021 22:08:43 - INFO - __main__ - Step 49306: {'lr': 0.00038420304218058466, 'samples': 9466752, 'steps': 49305, 'loss/train': 1.411622166633606} -08/30/2021 22:08:43 - INFO - __main__ - Step 49307: {'lr': 0.00038419856484069216, 'samples': 9466944, 'steps': 49306, 'loss/train': 1.4452733993530273} -08/30/2021 22:08:45 - INFO - __main__ - Step 49308: {'lr': 0.0003841940874403319, 'samples': 9467136, 'steps': 49307, 'loss/train': 0.11862015724182129} -08/30/2021 22:08:45 - INFO - __main__ - Step 49309: {'lr': 0.0003841896099795058, 'samples': 9467328, 'steps': 49308, 'loss/train': 0.39663875102996826} -08/30/2021 22:08:46 - INFO - __main__ - Step 49310: {'lr': 0.00038418513245821605, 'samples': 9467520, 'steps': 49309, 'loss/train': 0.5722724795341492} -08/30/2021 22:08:46 - INFO - __main__ - Step 49311: {'lr': 0.0003841806548764645, 'samples': 9467712, 'steps': 49310, 'loss/train': 1.5263508558273315} -08/30/2021 22:08:46 - INFO - __main__ - Step 49312: {'lr': 0.0003841761772342531, 'samples': 9467904, 'steps': 49311, 'loss/train': 0.9048899412155151} -08/30/2021 22:08:48 - INFO - __main__ - Step 49313: {'lr': 0.0003841716995315841, 'samples': 9468096, 'steps': 49312, 'loss/train': 1.241011619567871} -08/30/2021 22:08:48 - INFO - __main__ - Step 49314: {'lr': 0.00038416722176845943, 'samples': 9468288, 'steps': 49313, 'loss/train': 1.4199984073638916} -08/30/2021 22:08:49 - INFO - __main__ - Step 49315: {'lr': 0.000384162743944881, 'samples': 9468480, 'steps': 49314, 'loss/train': 1.339867353439331} -08/30/2021 22:08:49 - INFO - __main__ - Step 49316: {'lr': 0.0003841582660608509, 'samples': 9468672, 'steps': 49315, 'loss/train': 1.6245360374450684} -08/30/2021 22:08:49 - INFO - __main__ - Step 49317: {'lr': 0.00038415378811637124, 'samples': 9468864, 'steps': 49316, 'loss/train': 1.7857468128204346} -08/30/2021 22:08:52 - INFO - __main__ - Step 49318: {'lr': 0.00038414931011144393, 'samples': 9469056, 'steps': 49317, 'loss/train': 1.3455666303634644} -08/30/2021 22:08:52 - INFO - __main__ - Step 49319: {'lr': 0.000384144832046071, 'samples': 9469248, 'steps': 49318, 'loss/train': 1.9347959756851196} -08/30/2021 22:08:52 - INFO - __main__ - Step 49320: {'lr': 0.0003841403539202545, 'samples': 9469440, 'steps': 49319, 'loss/train': 1.1906849145889282} -08/30/2021 22:08:53 - INFO - __main__ - Step 49321: {'lr': 0.00038413587573399635, 'samples': 9469632, 'steps': 49320, 'loss/train': 1.1730536222457886} -08/30/2021 22:08:53 - INFO - __main__ - Step 49322: {'lr': 0.0003841313974872986, 'samples': 9469824, 'steps': 49321, 'loss/train': 1.3707752227783203} -08/30/2021 22:08:54 - INFO - __main__ - Step 49323: {'lr': 0.00038412691918016345, 'samples': 9470016, 'steps': 49322, 'loss/train': 1.0285190343856812} -08/30/2021 22:08:55 - INFO - __main__ - Step 49324: {'lr': 0.00038412244081259273, 'samples': 9470208, 'steps': 49323, 'loss/train': 1.0527369976043701} -08/30/2021 22:08:55 - INFO - __main__ - Step 49325: {'lr': 0.00038411796238458853, 'samples': 9470400, 'steps': 49324, 'loss/train': 1.8493014574050903} -08/30/2021 22:08:56 - INFO - __main__ - Step 49326: {'lr': 0.00038411348389615286, 'samples': 9470592, 'steps': 49325, 'loss/train': 1.1464709043502808} -08/30/2021 22:08:56 - INFO - __main__ - Step 49327: {'lr': 0.00038410900534728765, 'samples': 9470784, 'steps': 49326, 'loss/train': 1.5225107669830322} -08/30/2021 22:08:58 - INFO - __main__ - Step 49328: {'lr': 0.000384104526737995, 'samples': 9470976, 'steps': 49327, 'loss/train': 1.741552472114563} -08/30/2021 22:08:58 - INFO - __main__ - Step 49329: {'lr': 0.0003841000480682769, 'samples': 9471168, 'steps': 49328, 'loss/train': 1.9028974771499634} -08/30/2021 22:08:58 - INFO - __main__ - Step 49330: {'lr': 0.0003840955693381355, 'samples': 9471360, 'steps': 49329, 'loss/train': 1.6996532678604126} -08/30/2021 22:08:59 - INFO - __main__ - Step 49331: {'lr': 0.0003840910905475726, 'samples': 9471552, 'steps': 49330, 'loss/train': 1.088881015777588} -08/30/2021 22:08:59 - INFO - __main__ - Step 49332: {'lr': 0.0003840866116965904, 'samples': 9471744, 'steps': 49331, 'loss/train': 1.2434372901916504} -08/30/2021 22:08:59 - INFO - __main__ - Step 49333: {'lr': 0.00038408213278519083, 'samples': 9471936, 'steps': 49332, 'loss/train': 1.1687560081481934} -08/30/2021 22:09:01 - INFO - __main__ - Step 49334: {'lr': 0.0003840776538133759, 'samples': 9472128, 'steps': 49333, 'loss/train': 0.5918006300926208} -08/30/2021 22:09:02 - INFO - __main__ - Step 49335: {'lr': 0.00038407317478114764, 'samples': 9472320, 'steps': 49334, 'loss/train': 1.5982314348220825} -08/30/2021 22:09:02 - INFO - __main__ - Step 49336: {'lr': 0.00038406869568850805, 'samples': 9472512, 'steps': 49335, 'loss/train': 1.2378559112548828} -08/30/2021 22:09:02 - INFO - __main__ - Step 49337: {'lr': 0.00038406421653545926, 'samples': 9472704, 'steps': 49336, 'loss/train': 0.5362732410430908} -08/30/2021 22:09:03 - INFO - __main__ - Step 49338: {'lr': 0.00038405973732200317, 'samples': 9472896, 'steps': 49337, 'loss/train': 1.3490744829177856} -08/30/2021 22:09:04 - INFO - __main__ - Step 49339: {'lr': 0.0003840552580481418, 'samples': 9473088, 'steps': 49338, 'loss/train': 1.5935252904891968} -08/30/2021 22:09:04 - INFO - __main__ - Step 49340: {'lr': 0.00038405077871387716, 'samples': 9473280, 'steps': 49339, 'loss/train': 1.2003512382507324} -08/30/2021 22:09:05 - INFO - __main__ - Step 49341: {'lr': 0.00038404629931921137, 'samples': 9473472, 'steps': 49340, 'loss/train': 1.1513137817382812} -08/30/2021 22:09:05 - INFO - __main__ - Step 49342: {'lr': 0.0003840418198641463, 'samples': 9473664, 'steps': 49341, 'loss/train': 1.4045181274414062} -08/30/2021 22:09:05 - INFO - __main__ - Step 49343: {'lr': 0.0003840373403486842, 'samples': 9473856, 'steps': 49342, 'loss/train': 0.7895429134368896} -08/30/2021 22:09:07 - INFO - __main__ - Step 49344: {'lr': 0.0003840328607728269, 'samples': 9474048, 'steps': 49343, 'loss/train': 1.3992438316345215} -08/30/2021 22:09:07 - INFO - __main__ - Step 49345: {'lr': 0.0003840283811365764, 'samples': 9474240, 'steps': 49344, 'loss/train': 2.078401803970337} -08/30/2021 22:09:08 - INFO - __main__ - Step 49346: {'lr': 0.00038402390143993484, 'samples': 9474432, 'steps': 49345, 'loss/train': 1.3841291666030884} -08/30/2021 22:09:08 - INFO - __main__ - Step 49347: {'lr': 0.0003840194216829042, 'samples': 9474624, 'steps': 49346, 'loss/train': 0.9066892266273499} -08/30/2021 22:09:09 - INFO - __main__ - Step 49348: {'lr': 0.00038401494186548633, 'samples': 9474816, 'steps': 49347, 'loss/train': 1.1779420375823975} -08/30/2021 22:09:10 - INFO - __main__ - Step 49349: {'lr': 0.0003840104619876835, 'samples': 9475008, 'steps': 49348, 'loss/train': 1.8947360515594482} -08/30/2021 22:09:11 - INFO - __main__ - Step 49350: {'lr': 0.0003840059820494976, 'samples': 9475200, 'steps': 49349, 'loss/train': 1.7193268537521362} -08/30/2021 22:09:11 - INFO - __main__ - Step 49351: {'lr': 0.00038400150205093075, 'samples': 9475392, 'steps': 49350, 'loss/train': 1.2958611249923706} -08/30/2021 22:09:11 - INFO - __main__ - Step 49352: {'lr': 0.00038399702199198486, 'samples': 9475584, 'steps': 49351, 'loss/train': 1.5861743688583374} -08/30/2021 22:09:12 - INFO - __main__ - Step 49353: {'lr': 0.00038399254187266186, 'samples': 9475776, 'steps': 49352, 'loss/train': 0.9506011009216309} -08/30/2021 22:09:13 - INFO - __main__ - Step 49354: {'lr': 0.000383988061692964, 'samples': 9475968, 'steps': 49353, 'loss/train': 1.5978995561599731} -08/30/2021 22:09:14 - INFO - __main__ - Step 49355: {'lr': 0.0003839835814528931, 'samples': 9476160, 'steps': 49354, 'loss/train': 1.2448289394378662} -08/30/2021 22:09:14 - INFO - __main__ - Step 49356: {'lr': 0.0003839791011524514, 'samples': 9476352, 'steps': 49355, 'loss/train': 1.210731029510498} -08/30/2021 22:09:14 - INFO - __main__ - Step 49357: {'lr': 0.0003839746207916407, 'samples': 9476544, 'steps': 49356, 'loss/train': 1.3754315376281738} -08/30/2021 22:09:15 - INFO - __main__ - Step 49358: {'lr': 0.0003839701403704631, 'samples': 9476736, 'steps': 49357, 'loss/train': 1.206537127494812} -08/30/2021 22:09:16 - INFO - __main__ - Step 49359: {'lr': 0.00038396565988892063, 'samples': 9476928, 'steps': 49358, 'loss/train': 1.6833325624465942} -08/30/2021 22:09:17 - INFO - __main__ - Step 49360: {'lr': 0.00038396117934701537, 'samples': 9477120, 'steps': 49359, 'loss/train': 1.2171975374221802} -08/30/2021 22:09:17 - INFO - __main__ - Step 49361: {'lr': 0.00038395669874474915, 'samples': 9477312, 'steps': 49360, 'loss/train': 0.09465812891721725} -08/30/2021 22:09:17 - INFO - __main__ - Step 49362: {'lr': 0.00038395221808212415, 'samples': 9477504, 'steps': 49361, 'loss/train': 1.7135801315307617} -08/30/2021 22:09:18 - INFO - __main__ - Step 49363: {'lr': 0.0003839477373591423, 'samples': 9477696, 'steps': 49362, 'loss/train': 1.6088014841079712} -08/30/2021 22:09:19 - INFO - __main__ - Step 49364: {'lr': 0.0003839432565758059, 'samples': 9477888, 'steps': 49363, 'loss/train': 1.7376768589019775} -08/30/2021 22:09:20 - INFO - __main__ - Step 49365: {'lr': 0.0003839387757321165, 'samples': 9478080, 'steps': 49364, 'loss/train': 0.3677865266799927} -08/30/2021 22:09:20 - INFO - __main__ - Step 49366: {'lr': 0.0003839342948280764, 'samples': 9478272, 'steps': 49365, 'loss/train': 1.654752254486084} -08/30/2021 22:09:21 - INFO - __main__ - Step 49367: {'lr': 0.00038392981386368763, 'samples': 9478464, 'steps': 49366, 'loss/train': 1.5803627967834473} -08/30/2021 22:09:21 - INFO - __main__ - Step 49368: {'lr': 0.0003839253328389521, 'samples': 9478656, 'steps': 49367, 'loss/train': 1.4564448595046997} -08/30/2021 22:09:21 - INFO - __main__ - Step 49369: {'lr': 0.00038392085175387186, 'samples': 9478848, 'steps': 49368, 'loss/train': 1.250160813331604} -08/30/2021 22:09:24 - INFO - __main__ - Step 49370: {'lr': 0.000383916370608449, 'samples': 9479040, 'steps': 49369, 'loss/train': 1.2121021747589111} -08/30/2021 22:09:24 - INFO - __main__ - Step 49371: {'lr': 0.0003839118894026855, 'samples': 9479232, 'steps': 49370, 'loss/train': 1.5944617986679077} -08/30/2021 22:09:24 - INFO - __main__ - Step 49372: {'lr': 0.0003839074081365833, 'samples': 9479424, 'steps': 49371, 'loss/train': 1.2362544536590576} -08/30/2021 22:09:25 - INFO - __main__ - Step 49373: {'lr': 0.0003839029268101446, 'samples': 9479616, 'steps': 49372, 'loss/train': 0.6072336435317993} -08/30/2021 22:09:25 - INFO - __main__ - Step 49374: {'lr': 0.00038389844542337123, 'samples': 9479808, 'steps': 49373, 'loss/train': 1.4622094631195068} -08/30/2021 22:09:27 - INFO - __main__ - Step 49375: {'lr': 0.0003838939639762653, 'samples': 9480000, 'steps': 49374, 'loss/train': 0.26569798588752747} -08/30/2021 22:09:27 - INFO - __main__ - Step 49376: {'lr': 0.00038388948246882883, 'samples': 9480192, 'steps': 49375, 'loss/train': 1.557763695716858} -08/30/2021 22:09:27 - INFO - __main__ - Step 49377: {'lr': 0.0003838850009010638, 'samples': 9480384, 'steps': 49376, 'loss/train': 1.0884987115859985} -08/30/2021 22:09:28 - INFO - __main__ - Step 49378: {'lr': 0.0003838805192729723, 'samples': 9480576, 'steps': 49377, 'loss/train': 0.9593924880027771} -08/30/2021 22:09:28 - INFO - __main__ - Step 49379: {'lr': 0.00038387603758455624, 'samples': 9480768, 'steps': 49378, 'loss/train': 1.7927411794662476} -08/30/2021 22:09:29 - INFO - __main__ - Step 49380: {'lr': 0.00038387155583581773, 'samples': 9480960, 'steps': 49379, 'loss/train': 1.7089567184448242} -08/30/2021 22:09:30 - INFO - __main__ - Step 49381: {'lr': 0.00038386707402675877, 'samples': 9481152, 'steps': 49380, 'loss/train': 0.8583994507789612} -08/30/2021 22:09:30 - INFO - __main__ - Step 49382: {'lr': 0.00038386259215738135, 'samples': 9481344, 'steps': 49381, 'loss/train': 1.130814552307129} -08/30/2021 22:09:31 - INFO - __main__ - Step 49383: {'lr': 0.0003838581102276876, 'samples': 9481536, 'steps': 49382, 'loss/train': 1.6091268062591553} -08/30/2021 22:09:31 - INFO - __main__ - Step 49384: {'lr': 0.00038385362823767935, 'samples': 9481728, 'steps': 49383, 'loss/train': 1.6003414392471313} -08/30/2021 22:09:33 - INFO - __main__ - Step 49385: {'lr': 0.00038384914618735873, 'samples': 9481920, 'steps': 49384, 'loss/train': 1.8464782238006592} -08/30/2021 22:09:33 - INFO - __main__ - Step 49386: {'lr': 0.0003838446640767278, 'samples': 9482112, 'steps': 49385, 'loss/train': 1.2683963775634766} -08/30/2021 22:09:34 - INFO - __main__ - Step 49387: {'lr': 0.00038384018190578843, 'samples': 9482304, 'steps': 49386, 'loss/train': 1.3003493547439575} -08/30/2021 22:09:34 - INFO - __main__ - Step 49388: {'lr': 0.0003838356996745429, 'samples': 9482496, 'steps': 49387, 'loss/train': 1.158971905708313} -08/30/2021 22:09:35 - INFO - __main__ - Step 49389: {'lr': 0.00038383121738299296, 'samples': 9482688, 'steps': 49388, 'loss/train': 1.5438778400421143} -08/30/2021 22:09:35 - INFO - __main__ - Step 49390: {'lr': 0.00038382673503114075, 'samples': 9482880, 'steps': 49389, 'loss/train': 1.5751315355300903} -08/30/2021 22:09:36 - INFO - __main__ - Step 49391: {'lr': 0.0003838222526189883, 'samples': 9483072, 'steps': 49390, 'loss/train': 0.08660253137350082} -08/30/2021 22:09:37 - INFO - __main__ - Step 49392: {'lr': 0.0003838177701465376, 'samples': 9483264, 'steps': 49391, 'loss/train': 1.6198095083236694} -08/30/2021 22:09:37 - INFO - __main__ - Step 49393: {'lr': 0.00038381328761379063, 'samples': 9483456, 'steps': 49392, 'loss/train': 1.456913948059082} -08/30/2021 22:09:37 - INFO - __main__ - Step 49394: {'lr': 0.0003838088050207496, 'samples': 9483648, 'steps': 49393, 'loss/train': 1.3473281860351562} -08/30/2021 22:09:38 - INFO - __main__ - Step 49395: {'lr': 0.00038380432236741625, 'samples': 9483840, 'steps': 49394, 'loss/train': 0.7261760234832764} -08/30/2021 22:09:39 - INFO - __main__ - Step 49396: {'lr': 0.0003837998396537927, 'samples': 9484032, 'steps': 49395, 'loss/train': 1.481816053390503} -08/30/2021 22:09:40 - INFO - __main__ - Step 49397: {'lr': 0.0003837953568798811, 'samples': 9484224, 'steps': 49396, 'loss/train': 1.5362592935562134} -08/30/2021 22:09:40 - INFO - __main__ - Step 49398: {'lr': 0.00038379087404568333, 'samples': 9484416, 'steps': 49397, 'loss/train': 1.5976382493972778} -08/30/2021 22:09:41 - INFO - __main__ - Step 49399: {'lr': 0.00038378639115120154, 'samples': 9484608, 'steps': 49398, 'loss/train': 0.9332494735717773} -08/30/2021 22:09:41 - INFO - __main__ - Step 49400: {'lr': 0.0003837819081964377, 'samples': 9484800, 'steps': 49399, 'loss/train': 1.2511084079742432} -08/30/2021 22:09:42 - INFO - __main__ - Step 49401: {'lr': 0.0003837774251813936, 'samples': 9484992, 'steps': 49400, 'loss/train': 0.3496077060699463} -08/30/2021 22:09:43 - INFO - __main__ - Step 49402: {'lr': 0.0003837729421060716, 'samples': 9485184, 'steps': 49401, 'loss/train': 1.514067530632019} -08/30/2021 22:09:43 - INFO - __main__ - Step 49403: {'lr': 0.00038376845897047354, 'samples': 9485376, 'steps': 49402, 'loss/train': 1.1421542167663574} -08/30/2021 22:09:43 - INFO - __main__ - Step 49404: {'lr': 0.00038376397577460144, 'samples': 9485568, 'steps': 49403, 'loss/train': 1.1896404027938843} -08/30/2021 22:09:44 - INFO - __main__ - Step 49405: {'lr': 0.00038375949251845745, 'samples': 9485760, 'steps': 49404, 'loss/train': 0.8072686195373535} -08/30/2021 22:09:45 - INFO - __main__ - Step 49406: {'lr': 0.0003837550092020434, 'samples': 9485952, 'steps': 49405, 'loss/train': 1.6520885229110718} -08/30/2021 22:09:46 - INFO - __main__ - Step 49407: {'lr': 0.0003837505258253615, 'samples': 9486144, 'steps': 49406, 'loss/train': 1.38993501663208} -08/30/2021 22:09:46 - INFO - __main__ - Step 49408: {'lr': 0.0003837460423884136, 'samples': 9486336, 'steps': 49407, 'loss/train': 1.1067701578140259} -08/30/2021 22:09:46 - INFO - __main__ - Step 49409: {'lr': 0.00038374155889120176, 'samples': 9486528, 'steps': 49408, 'loss/train': 0.7197641730308533} -08/30/2021 22:09:47 - INFO - __main__ - Step 49410: {'lr': 0.0003837370753337281, 'samples': 9486720, 'steps': 49409, 'loss/train': 1.0605894327163696} -08/30/2021 22:09:47 - INFO - __main__ - Step 49411: {'lr': 0.00038373259171599463, 'samples': 9486912, 'steps': 49410, 'loss/train': 1.4700936079025269} -08/30/2021 22:09:49 - INFO - __main__ - Step 49412: {'lr': 0.0003837281080380033, 'samples': 9487104, 'steps': 49411, 'loss/train': 1.697468638420105} -08/30/2021 22:09:49 - INFO - __main__ - Step 49413: {'lr': 0.00038372362429975603, 'samples': 9487296, 'steps': 49412, 'loss/train': 1.6221933364868164} -08/30/2021 22:09:50 - INFO - __main__ - Step 49414: {'lr': 0.0003837191405012551, 'samples': 9487488, 'steps': 49413, 'loss/train': 1.7777656316757202} -08/30/2021 22:09:50 - INFO - __main__ - Step 49415: {'lr': 0.00038371465664250226, 'samples': 9487680, 'steps': 49414, 'loss/train': 0.2903272807598114} -08/30/2021 22:09:50 - INFO - __main__ - Step 49416: {'lr': 0.0003837101727234997, 'samples': 9487872, 'steps': 49415, 'loss/train': 5.898153781890869} -08/30/2021 22:09:52 - INFO - __main__ - Step 49417: {'lr': 0.0003837056887442495, 'samples': 9488064, 'steps': 49416, 'loss/train': 0.8973371386528015} -08/30/2021 22:09:52 - INFO - __main__ - Step 49418: {'lr': 0.00038370120470475355, 'samples': 9488256, 'steps': 49417, 'loss/train': 1.488458275794983} -08/30/2021 22:09:53 - INFO - __main__ - Step 49419: {'lr': 0.0003836967206050138, 'samples': 9488448, 'steps': 49418, 'loss/train': 1.4495447874069214} -08/30/2021 22:09:53 - INFO - __main__ - Step 49420: {'lr': 0.0003836922364450325, 'samples': 9488640, 'steps': 49419, 'loss/train': 1.8584849834442139} -08/30/2021 22:09:53 - INFO - __main__ - Step 49421: {'lr': 0.0003836877522248114, 'samples': 9488832, 'steps': 49420, 'loss/train': 1.1529241800308228} -08/30/2021 22:09:54 - INFO - __main__ - Step 49422: {'lr': 0.0003836832679443527, 'samples': 9489024, 'steps': 49421, 'loss/train': 1.2306180000305176} -08/30/2021 22:09:56 - INFO - __main__ - Step 49423: {'lr': 0.00038367878360365845, 'samples': 9489216, 'steps': 49422, 'loss/train': 1.336978554725647} -08/30/2021 22:09:56 - INFO - __main__ - Step 49424: {'lr': 0.00038367429920273054, 'samples': 9489408, 'steps': 49423, 'loss/train': 0.7112210392951965} -08/30/2021 22:09:56 - INFO - __main__ - Step 49425: {'lr': 0.00038366981474157114, 'samples': 9489600, 'steps': 49424, 'loss/train': 1.4397872686386108} -08/30/2021 22:09:57 - INFO - __main__ - Step 49426: {'lr': 0.00038366533022018214, 'samples': 9489792, 'steps': 49425, 'loss/train': 1.533323884010315} -08/30/2021 22:09:57 - INFO - __main__ - Step 49427: {'lr': 0.0003836608456385655, 'samples': 9489984, 'steps': 49426, 'loss/train': 1.4056570529937744} -08/30/2021 22:09:59 - INFO - __main__ - Step 49428: {'lr': 0.00038365636099672347, 'samples': 9490176, 'steps': 49427, 'loss/train': 1.6726080179214478} -08/30/2021 22:09:59 - INFO - __main__ - Step 49429: {'lr': 0.0003836518762946579, 'samples': 9490368, 'steps': 49428, 'loss/train': 1.3833744525909424} -08/30/2021 22:09:59 - INFO - __main__ - Step 49430: {'lr': 0.0003836473915323709, 'samples': 9490560, 'steps': 49429, 'loss/train': 1.5137934684753418} -08/30/2021 22:10:00 - INFO - __main__ - Step 49431: {'lr': 0.0003836429067098645, 'samples': 9490752, 'steps': 49430, 'loss/train': 0.8328871130943298} -08/30/2021 22:10:00 - INFO - __main__ - Step 49432: {'lr': 0.0003836384218271405, 'samples': 9490944, 'steps': 49431, 'loss/train': 1.5596773624420166} -08/30/2021 22:10:02 - INFO - __main__ - Step 49433: {'lr': 0.00038363393688420116, 'samples': 9491136, 'steps': 49432, 'loss/train': 1.1320542097091675} -08/30/2021 22:10:02 - INFO - __main__ - Step 49434: {'lr': 0.0003836294518810485, 'samples': 9491328, 'steps': 49433, 'loss/train': 1.5863744020462036} -08/30/2021 22:10:02 - INFO - __main__ - Step 49435: {'lr': 0.00038362496681768434, 'samples': 9491520, 'steps': 49434, 'loss/train': 1.1333986520767212} -08/30/2021 22:10:03 - INFO - __main__ - Step 49436: {'lr': 0.0003836204816941109, 'samples': 9491712, 'steps': 49435, 'loss/train': 1.4573496580123901} -08/30/2021 22:10:03 - INFO - __main__ - Step 49437: {'lr': 0.0003836159965103301, 'samples': 9491904, 'steps': 49436, 'loss/train': 1.6631131172180176} -08/30/2021 22:10:05 - INFO - __main__ - Step 49438: {'lr': 0.0003836115112663441, 'samples': 9492096, 'steps': 49437, 'loss/train': 1.154723882675171} -08/30/2021 22:10:05 - INFO - __main__ - Step 49439: {'lr': 0.0003836070259621548, 'samples': 9492288, 'steps': 49438, 'loss/train': 1.4596904516220093} -08/30/2021 22:10:06 - INFO - __main__ - Step 49440: {'lr': 0.0003836025405977641, 'samples': 9492480, 'steps': 49439, 'loss/train': 1.4924565553665161} -08/30/2021 22:10:06 - INFO - __main__ - Step 49441: {'lr': 0.00038359805517317427, 'samples': 9492672, 'steps': 49440, 'loss/train': 1.5082950592041016} -08/30/2021 22:10:06 - INFO - __main__ - Step 49442: {'lr': 0.00038359356968838723, 'samples': 9492864, 'steps': 49441, 'loss/train': 1.4074862003326416} -08/30/2021 22:10:07 - INFO - __main__ - Step 49443: {'lr': 0.00038358908414340485, 'samples': 9493056, 'steps': 49442, 'loss/train': 1.6441724300384521} -08/30/2021 22:10:08 - INFO - __main__ - Step 49444: {'lr': 0.0003835845985382294, 'samples': 9493248, 'steps': 49443, 'loss/train': 1.5533626079559326} -08/30/2021 22:10:09 - INFO - __main__ - Step 49445: {'lr': 0.00038358011287286287, 'samples': 9493440, 'steps': 49444, 'loss/train': 1.7546589374542236} -08/30/2021 22:10:09 - INFO - __main__ - Step 49446: {'lr': 0.0003835756271473071, 'samples': 9493632, 'steps': 49445, 'loss/train': 1.1725339889526367} -08/30/2021 22:10:09 - INFO - __main__ - Step 49447: {'lr': 0.0003835711413615642, 'samples': 9493824, 'steps': 49446, 'loss/train': 0.717629075050354} -08/30/2021 22:10:10 - INFO - __main__ - Step 49448: {'lr': 0.0003835666555156362, 'samples': 9494016, 'steps': 49447, 'loss/train': 2.4399120807647705} -08/30/2021 22:10:11 - INFO - __main__ - Step 49449: {'lr': 0.00038356216960952515, 'samples': 9494208, 'steps': 49448, 'loss/train': 1.2204011678695679} -08/30/2021 22:10:12 - INFO - __main__ - Step 49450: {'lr': 0.0003835576836432331, 'samples': 9494400, 'steps': 49449, 'loss/train': 1.36895751953125} -08/30/2021 22:10:12 - INFO - __main__ - Step 49451: {'lr': 0.000383553197616762, 'samples': 9494592, 'steps': 49450, 'loss/train': 1.116050124168396} -08/30/2021 22:10:13 - INFO - __main__ - Step 49452: {'lr': 0.00038354871153011385, 'samples': 9494784, 'steps': 49451, 'loss/train': 1.5069406032562256} -08/30/2021 22:10:13 - INFO - __main__ - Step 49453: {'lr': 0.0003835442253832907, 'samples': 9494976, 'steps': 49452, 'loss/train': 0.8713278770446777} -08/30/2021 22:10:14 - INFO - __main__ - Step 49454: {'lr': 0.00038353973917629457, 'samples': 9495168, 'steps': 49453, 'loss/train': 0.7570756077766418} -08/30/2021 22:10:15 - INFO - __main__ - Step 49455: {'lr': 0.0003835352529091275, 'samples': 9495360, 'steps': 49454, 'loss/train': 1.2459245920181274} -08/30/2021 22:10:15 - INFO - __main__ - Step 49456: {'lr': 0.0003835307665817915, 'samples': 9495552, 'steps': 49455, 'loss/train': 0.1712222546339035} -08/30/2021 22:10:15 - INFO - __main__ - Step 49457: {'lr': 0.0003835262801942887, 'samples': 9495744, 'steps': 49456, 'loss/train': 1.789059042930603} -08/30/2021 22:10:16 - INFO - __main__ - Step 49458: {'lr': 0.000383521793746621, 'samples': 9495936, 'steps': 49457, 'loss/train': 1.8182224035263062} -08/30/2021 22:10:17 - INFO - __main__ - Step 49459: {'lr': 0.00038351730723879034, 'samples': 9496128, 'steps': 49458, 'loss/train': 1.7775760889053345} -08/30/2021 22:10:18 - INFO - __main__ - Step 49460: {'lr': 0.0003835128206707989, 'samples': 9496320, 'steps': 49459, 'loss/train': 1.4985154867172241} -08/30/2021 22:10:18 - INFO - __main__ - Step 49461: {'lr': 0.00038350833404264865, 'samples': 9496512, 'steps': 49460, 'loss/train': 1.3443094491958618} -08/30/2021 22:10:19 - INFO - __main__ - Step 49462: {'lr': 0.0003835038473543416, 'samples': 9496704, 'steps': 49461, 'loss/train': 0.8598469495773315} -08/30/2021 22:10:19 - INFO - __main__ - Step 49463: {'lr': 0.0003834993606058798, 'samples': 9496896, 'steps': 49462, 'loss/train': 0.36771276593208313} -08/30/2021 22:10:21 - INFO - __main__ - Step 49464: {'lr': 0.00038349487379726513, 'samples': 9497088, 'steps': 49463, 'loss/train': 1.5126025676727295} -08/30/2021 22:10:21 - INFO - __main__ - Step 49465: {'lr': 0.0003834903869284999, 'samples': 9497280, 'steps': 49464, 'loss/train': 1.4187909364700317} -08/30/2021 22:10:22 - INFO - __main__ - Step 49466: {'lr': 0.00038348589999958585, 'samples': 9497472, 'steps': 49465, 'loss/train': 1.547430157661438} -08/30/2021 22:10:22 - INFO - __main__ - Step 49467: {'lr': 0.00038348141301052505, 'samples': 9497664, 'steps': 49466, 'loss/train': 1.3662631511688232} -08/30/2021 22:10:22 - INFO - __main__ - Step 49468: {'lr': 0.00038347692596131977, 'samples': 9497856, 'steps': 49467, 'loss/train': 0.1770838499069214} -08/30/2021 22:10:23 - INFO - __main__ - Step 49469: {'lr': 0.0003834724388519717, 'samples': 9498048, 'steps': 49468, 'loss/train': 0.22132369875907898} -08/30/2021 22:10:24 - INFO - __main__ - Step 49470: {'lr': 0.00038346795168248306, 'samples': 9498240, 'steps': 49469, 'loss/train': 1.1906710863113403} -08/30/2021 22:10:25 - INFO - __main__ - Step 49471: {'lr': 0.00038346346445285585, 'samples': 9498432, 'steps': 49470, 'loss/train': 1.5501283407211304} -08/30/2021 22:10:25 - INFO - __main__ - Step 49472: {'lr': 0.0003834589771630921, 'samples': 9498624, 'steps': 49471, 'loss/train': 1.5011506080627441} -08/30/2021 22:10:25 - INFO - __main__ - Step 49473: {'lr': 0.0003834544898131936, 'samples': 9498816, 'steps': 49472, 'loss/train': 1.8528144359588623} -08/30/2021 22:10:26 - INFO - __main__ - Step 49474: {'lr': 0.00038345000240316276, 'samples': 9499008, 'steps': 49473, 'loss/train': 1.3612840175628662} -08/30/2021 22:10:27 - INFO - __main__ - Step 49475: {'lr': 0.00038344551493300135, 'samples': 9499200, 'steps': 49474, 'loss/train': 1.6891896724700928} -08/30/2021 22:10:27 - INFO - __main__ - Step 49476: {'lr': 0.00038344102740271144, 'samples': 9499392, 'steps': 49475, 'loss/train': 0.7574342489242554} -08/30/2021 22:10:28 - INFO - __main__ - Step 49477: {'lr': 0.00038343653981229504, 'samples': 9499584, 'steps': 49476, 'loss/train': 1.5855237245559692} -08/30/2021 22:10:28 - INFO - __main__ - Step 49478: {'lr': 0.00038343205216175426, 'samples': 9499776, 'steps': 49477, 'loss/train': 0.7812578082084656} -08/30/2021 22:10:28 - INFO - __main__ - Step 49479: {'lr': 0.000383427564451091, 'samples': 9499968, 'steps': 49478, 'loss/train': 1.486604928970337} -08/30/2021 22:10:30 - INFO - __main__ - Step 49480: {'lr': 0.00038342307668030737, 'samples': 9500160, 'steps': 49479, 'loss/train': 1.6912150382995605} -08/30/2021 22:10:31 - INFO - __main__ - Step 49481: {'lr': 0.0003834185888494053, 'samples': 9500352, 'steps': 49480, 'loss/train': 0.8896346092224121} -08/30/2021 22:10:31 - INFO - __main__ - Step 49482: {'lr': 0.00038341410095838694, 'samples': 9500544, 'steps': 49481, 'loss/train': 1.469557285308838} -08/30/2021 22:10:32 - INFO - __main__ - Step 49483: {'lr': 0.0003834096130072542, 'samples': 9500736, 'steps': 49482, 'loss/train': 0.09400922805070877} -08/30/2021 22:10:32 - INFO - __main__ - Step 49484: {'lr': 0.00038340512499600917, 'samples': 9500928, 'steps': 49483, 'loss/train': 0.7293932437896729} -08/30/2021 22:10:34 - INFO - __main__ - Step 49485: {'lr': 0.00038340063692465386, 'samples': 9501120, 'steps': 49484, 'loss/train': 0.972122311592102} -08/30/2021 22:10:34 - INFO - __main__ - Step 49486: {'lr': 0.00038339614879319027, 'samples': 9501312, 'steps': 49485, 'loss/train': 1.702094554901123} -08/30/2021 22:10:34 - INFO - __main__ - Step 49487: {'lr': 0.00038339166060162046, 'samples': 9501504, 'steps': 49486, 'loss/train': 0.8908302187919617} -08/30/2021 22:10:35 - INFO - __main__ - Step 49488: {'lr': 0.00038338717234994633, 'samples': 9501696, 'steps': 49487, 'loss/train': 1.3802777528762817} -08/30/2021 22:10:35 - INFO - __main__ - Step 49489: {'lr': 0.0003833826840381701, 'samples': 9501888, 'steps': 49488, 'loss/train': 0.2174101173877716} -08/30/2021 22:10:36 - INFO - __main__ - Step 49490: {'lr': 0.00038337819566629363, 'samples': 9502080, 'steps': 49489, 'loss/train': 0.3199485242366791} -08/30/2021 22:10:37 - INFO - __main__ - Step 49491: {'lr': 0.000383373707234319, 'samples': 9502272, 'steps': 49490, 'loss/train': 1.3139634132385254} -08/30/2021 22:10:37 - INFO - __main__ - Step 49492: {'lr': 0.0003833692187422483, 'samples': 9502464, 'steps': 49491, 'loss/train': 1.0583555698394775} -08/30/2021 22:10:38 - INFO - __main__ - Step 49493: {'lr': 0.0003833647301900835, 'samples': 9502656, 'steps': 49492, 'loss/train': 1.6221011877059937} -08/30/2021 22:10:38 - INFO - __main__ - Step 49494: {'lr': 0.00038336024157782655, 'samples': 9502848, 'steps': 49493, 'loss/train': 1.476187825202942} -08/30/2021 22:10:39 - INFO - __main__ - Step 49495: {'lr': 0.00038335575290547954, 'samples': 9503040, 'steps': 49494, 'loss/train': 1.7007817029953003} -08/30/2021 22:10:40 - INFO - __main__ - Step 49496: {'lr': 0.0003833512641730445, 'samples': 9503232, 'steps': 49495, 'loss/train': 1.1251637935638428} -08/30/2021 22:10:40 - INFO - __main__ - Step 49497: {'lr': 0.0003833467753805234, 'samples': 9503424, 'steps': 49496, 'loss/train': 1.5556890964508057} -08/30/2021 22:10:41 - INFO - __main__ - Step 49498: {'lr': 0.00038334228652791837, 'samples': 9503616, 'steps': 49497, 'loss/train': 1.5392955541610718} -08/30/2021 22:10:41 - INFO - __main__ - Step 49499: {'lr': 0.00038333779761523133, 'samples': 9503808, 'steps': 49498, 'loss/train': 1.281488299369812} -08/30/2021 22:10:42 - INFO - __main__ - Step 49500: {'lr': 0.0003833333086424643, 'samples': 9504000, 'steps': 49499, 'loss/train': 1.2796951532363892} -08/30/2021 22:10:43 - INFO - __main__ - Step 49501: {'lr': 0.00038332881960961943, 'samples': 9504192, 'steps': 49500, 'loss/train': 1.130244255065918} -08/30/2021 22:10:43 - INFO - __main__ - Step 49502: {'lr': 0.0003833243305166986, 'samples': 9504384, 'steps': 49501, 'loss/train': 1.5526087284088135} -08/30/2021 22:10:43 - INFO - __main__ - Step 49503: {'lr': 0.00038331984136370377, 'samples': 9504576, 'steps': 49502, 'loss/train': 1.8512752056121826} -08/30/2021 22:10:44 - INFO - __main__ - Step 49504: {'lr': 0.0003833153521506372, 'samples': 9504768, 'steps': 49503, 'loss/train': 1.1084262132644653} -08/30/2021 22:10:45 - INFO - __main__ - Step 49505: {'lr': 0.00038331086287750083, 'samples': 9504960, 'steps': 49504, 'loss/train': 0.960732102394104} -08/30/2021 22:10:46 - INFO - __main__ - Step 49506: {'lr': 0.0003833063735442966, 'samples': 9505152, 'steps': 49505, 'loss/train': 1.3818302154541016} -08/30/2021 22:10:46 - INFO - __main__ - Step 49507: {'lr': 0.0003833018841510265, 'samples': 9505344, 'steps': 49506, 'loss/train': 1.2723408937454224} -08/30/2021 22:10:46 - INFO - __main__ - Step 49508: {'lr': 0.00038329739469769277, 'samples': 9505536, 'steps': 49507, 'loss/train': 0.9524272084236145} -08/30/2021 22:10:47 - INFO - __main__ - Step 49509: {'lr': 0.0003832929051842972, 'samples': 9505728, 'steps': 49508, 'loss/train': 1.4414458274841309} -08/30/2021 22:10:48 - INFO - __main__ - Step 49510: {'lr': 0.0003832884156108418, 'samples': 9505920, 'steps': 49509, 'loss/train': 1.0479592084884644} -08/30/2021 22:10:49 - INFO - __main__ - Step 49511: {'lr': 0.0003832839259773289, 'samples': 9506112, 'steps': 49510, 'loss/train': 1.2010400295257568} -08/30/2021 22:10:49 - INFO - __main__ - Step 49512: {'lr': 0.00038327943628376025, 'samples': 9506304, 'steps': 49511, 'loss/train': 0.9394859671592712} -08/30/2021 22:10:49 - INFO - __main__ - Step 49513: {'lr': 0.00038327494653013787, 'samples': 9506496, 'steps': 49512, 'loss/train': 1.3414398431777954} -08/30/2021 22:10:50 - INFO - __main__ - Step 49514: {'lr': 0.00038327045671646386, 'samples': 9506688, 'steps': 49513, 'loss/train': 1.532314419746399} -08/30/2021 22:10:50 - INFO - __main__ - Step 49515: {'lr': 0.00038326596684274035, 'samples': 9506880, 'steps': 49514, 'loss/train': 1.3462707996368408} -08/30/2021 22:10:52 - INFO - __main__ - Step 49516: {'lr': 0.00038326147690896916, 'samples': 9507072, 'steps': 49515, 'loss/train': 1.6698299646377563} -08/30/2021 22:10:52 - INFO - __main__ - Step 49517: {'lr': 0.00038325698691515247, 'samples': 9507264, 'steps': 49516, 'loss/train': 1.0764703750610352} -08/30/2021 22:10:53 - INFO - __main__ - Step 49518: {'lr': 0.00038325249686129223, 'samples': 9507456, 'steps': 49517, 'loss/train': 1.1404021978378296} -08/30/2021 22:10:53 - INFO - __main__ - Step 49519: {'lr': 0.0003832480067473904, 'samples': 9507648, 'steps': 49518, 'loss/train': 1.0500565767288208} -08/30/2021 22:10:53 - INFO - __main__ - Step 49520: {'lr': 0.0003832435165734491, 'samples': 9507840, 'steps': 49519, 'loss/train': 0.098548024892807} -08/30/2021 22:10:55 - INFO - __main__ - Step 49521: {'lr': 0.0003832390263394704, 'samples': 9508032, 'steps': 49520, 'loss/train': 1.14603853225708} -08/30/2021 22:10:55 - INFO - __main__ - Step 49522: {'lr': 0.0003832345360454561, 'samples': 9508224, 'steps': 49521, 'loss/train': 1.502983570098877} -08/30/2021 22:10:56 - INFO - __main__ - Step 49523: {'lr': 0.00038323004569140853, 'samples': 9508416, 'steps': 49522, 'loss/train': 0.08808526396751404} -08/30/2021 22:10:56 - INFO - __main__ - Step 49524: {'lr': 0.0003832255552773295, 'samples': 9508608, 'steps': 49523, 'loss/train': 0.9545467495918274} -08/30/2021 22:10:56 - INFO - __main__ - Step 49525: {'lr': 0.00038322106480322105, 'samples': 9508800, 'steps': 49524, 'loss/train': 1.339537262916565} -08/30/2021 22:10:58 - INFO - __main__ - Step 49526: {'lr': 0.00038321657426908527, 'samples': 9508992, 'steps': 49525, 'loss/train': 1.5905567407608032} -08/30/2021 22:10:58 - INFO - __main__ - Step 49527: {'lr': 0.0003832120836749242, 'samples': 9509184, 'steps': 49526, 'loss/train': 3.320098638534546} -08/30/2021 22:10:59 - INFO - __main__ - Step 49528: {'lr': 0.0003832075930207398, 'samples': 9509376, 'steps': 49527, 'loss/train': 0.9618931412696838} -08/30/2021 22:10:59 - INFO - __main__ - Step 49529: {'lr': 0.0003832031023065341, 'samples': 9509568, 'steps': 49528, 'loss/train': 1.247646450996399} -08/30/2021 22:11:00 - INFO - __main__ - Step 49530: {'lr': 0.0003831986115323092, 'samples': 9509760, 'steps': 49529, 'loss/train': 0.8380870223045349} -08/30/2021 22:11:02 - INFO - __main__ - Step 49531: {'lr': 0.00038319412069806694, 'samples': 9509952, 'steps': 49530, 'loss/train': 1.433803915977478} -08/30/2021 22:11:02 - INFO - __main__ - Step 49532: {'lr': 0.00038318962980380956, 'samples': 9510144, 'steps': 49531, 'loss/train': 1.0234384536743164} -08/30/2021 22:11:02 - INFO - __main__ - Step 49533: {'lr': 0.0003831851388495389, 'samples': 9510336, 'steps': 49532, 'loss/train': 0.9962560534477234} -08/30/2021 22:11:03 - INFO - __main__ - Step 49534: {'lr': 0.0003831806478352572, 'samples': 9510528, 'steps': 49533, 'loss/train': 1.8146426677703857} -08/30/2021 22:11:03 - INFO - __main__ - Step 49535: {'lr': 0.00038317615676096623, 'samples': 9510720, 'steps': 49534, 'loss/train': 1.069488525390625} -08/30/2021 22:11:05 - INFO - __main__ - Step 49536: {'lr': 0.00038317166562666817, 'samples': 9510912, 'steps': 49535, 'loss/train': 2.022279977798462} -08/30/2021 22:11:05 - INFO - __main__ - Step 49537: {'lr': 0.00038316717443236505, 'samples': 9511104, 'steps': 49536, 'loss/train': 1.5333529710769653} -08/30/2021 22:11:06 - INFO - __main__ - Step 49538: {'lr': 0.0003831626831780588, 'samples': 9511296, 'steps': 49537, 'loss/train': 1.7128392457962036} -08/30/2021 22:11:06 - INFO - __main__ - Step 49539: {'lr': 0.0003831581918637516, 'samples': 9511488, 'steps': 49538, 'loss/train': 1.4405306577682495} -08/30/2021 22:11:06 - INFO - __main__ - Step 49540: {'lr': 0.0003831537004894453, 'samples': 9511680, 'steps': 49539, 'loss/train': 0.8412823677062988} -08/30/2021 22:11:07 - INFO - __main__ - Step 49541: {'lr': 0.000383149209055142, 'samples': 9511872, 'steps': 49540, 'loss/train': 1.2243174314498901} -08/30/2021 22:11:08 - INFO - __main__ - Step 49542: {'lr': 0.00038314471756084373, 'samples': 9512064, 'steps': 49541, 'loss/train': 1.3091679811477661} -08/30/2021 22:11:09 - INFO - __main__ - Step 49543: {'lr': 0.0003831402260065525, 'samples': 9512256, 'steps': 49542, 'loss/train': 0.5797540545463562} -08/30/2021 22:11:09 - INFO - __main__ - Step 49544: {'lr': 0.00038313573439227035, 'samples': 9512448, 'steps': 49543, 'loss/train': 1.5811721086502075} -08/30/2021 22:11:09 - INFO - __main__ - Step 49545: {'lr': 0.0003831312427179993, 'samples': 9512640, 'steps': 49544, 'loss/train': 0.9819427132606506} -08/30/2021 22:11:10 - INFO - __main__ - Step 49546: {'lr': 0.00038312675098374136, 'samples': 9512832, 'steps': 49545, 'loss/train': 0.9778226017951965} -08/30/2021 22:11:11 - INFO - __main__ - Step 49547: {'lr': 0.0003831222591894985, 'samples': 9513024, 'steps': 49546, 'loss/train': 1.5419055223464966} -08/30/2021 22:11:12 - INFO - __main__ - Step 49548: {'lr': 0.0003831177673352729, 'samples': 9513216, 'steps': 49547, 'loss/train': 0.6110632419586182} -08/30/2021 22:11:12 - INFO - __main__ - Step 49549: {'lr': 0.00038311327542106646, 'samples': 9513408, 'steps': 49548, 'loss/train': 1.0220229625701904} -08/30/2021 22:11:13 - INFO - __main__ - Step 49550: {'lr': 0.00038310878344688116, 'samples': 9513600, 'steps': 49549, 'loss/train': 1.3049097061157227} -08/30/2021 22:11:13 - INFO - __main__ - Step 49551: {'lr': 0.0003831042914127192, 'samples': 9513792, 'steps': 49550, 'loss/train': 0.6687270402908325} -08/30/2021 22:11:14 - INFO - __main__ - Step 49552: {'lr': 0.00038309979931858243, 'samples': 9513984, 'steps': 49551, 'loss/train': 1.1881481409072876} -08/30/2021 22:11:15 - INFO - __main__ - Step 49553: {'lr': 0.00038309530716447297, 'samples': 9514176, 'steps': 49552, 'loss/train': 1.430482029914856} -08/30/2021 22:11:15 - INFO - __main__ - Step 49554: {'lr': 0.00038309081495039275, 'samples': 9514368, 'steps': 49553, 'loss/train': 1.108932375907898} -08/30/2021 22:11:16 - INFO - __main__ - Step 49555: {'lr': 0.00038308632267634396, 'samples': 9514560, 'steps': 49554, 'loss/train': 1.0717090368270874} -08/30/2021 22:11:16 - INFO - __main__ - Step 49556: {'lr': 0.00038308183034232844, 'samples': 9514752, 'steps': 49555, 'loss/train': 1.1739131212234497} -08/30/2021 22:11:17 - INFO - __main__ - Step 49557: {'lr': 0.0003830773379483484, 'samples': 9514944, 'steps': 49556, 'loss/train': 1.8572793006896973} -08/30/2021 22:11:18 - INFO - __main__ - Step 49558: {'lr': 0.0003830728454944057, 'samples': 9515136, 'steps': 49557, 'loss/train': 0.8058309555053711} -08/30/2021 22:11:18 - INFO - __main__ - Step 49559: {'lr': 0.00038306835298050255, 'samples': 9515328, 'steps': 49558, 'loss/train': 1.7848989963531494} -08/30/2021 22:11:18 - INFO - __main__ - Step 49560: {'lr': 0.0003830638604066407, 'samples': 9515520, 'steps': 49559, 'loss/train': 1.4342689514160156} -08/30/2021 22:11:19 - INFO - __main__ - Step 49561: {'lr': 0.00038305936777282233, 'samples': 9515712, 'steps': 49560, 'loss/train': 1.6363073587417603} -08/30/2021 22:11:20 - INFO - __main__ - Step 49562: {'lr': 0.00038305487507904956, 'samples': 9515904, 'steps': 49561, 'loss/train': 1.8470708131790161} -08/30/2021 22:11:21 - INFO - __main__ - Step 49563: {'lr': 0.0003830503823253243, 'samples': 9516096, 'steps': 49562, 'loss/train': 1.5975967645645142} -08/30/2021 22:11:21 - INFO - __main__ - Step 49564: {'lr': 0.0003830458895116485, 'samples': 9516288, 'steps': 49563, 'loss/train': 1.101426362991333} -08/30/2021 22:11:21 - INFO - __main__ - Step 49565: {'lr': 0.0003830413966380243, 'samples': 9516480, 'steps': 49564, 'loss/train': 1.2336184978485107} -08/30/2021 22:11:22 - INFO - __main__ - Step 49566: {'lr': 0.00038303690370445384, 'samples': 9516672, 'steps': 49565, 'loss/train': 1.0507433414459229} -08/30/2021 22:11:23 - INFO - __main__ - Step 49567: {'lr': 0.00038303241071093884, 'samples': 9516864, 'steps': 49566, 'loss/train': 1.242356300354004} -08/30/2021 22:11:24 - INFO - __main__ - Step 49568: {'lr': 0.00038302791765748156, 'samples': 9517056, 'steps': 49567, 'loss/train': 1.2988349199295044} -08/30/2021 22:11:24 - INFO - __main__ - Step 49569: {'lr': 0.0003830234245440839, 'samples': 9517248, 'steps': 49568, 'loss/train': 2.0660808086395264} -08/30/2021 22:11:24 - INFO - __main__ - Step 49570: {'lr': 0.000383018931370748, 'samples': 9517440, 'steps': 49569, 'loss/train': 1.0381982326507568} -08/30/2021 22:11:25 - INFO - __main__ - Step 49571: {'lr': 0.00038301443813747583, 'samples': 9517632, 'steps': 49570, 'loss/train': 1.5061399936676025} -08/30/2021 22:11:25 - INFO - __main__ - Step 49572: {'lr': 0.00038300994484426936, 'samples': 9517824, 'steps': 49571, 'loss/train': 1.7023953199386597} -08/30/2021 22:11:27 - INFO - __main__ - Step 49573: {'lr': 0.0003830054514911307, 'samples': 9518016, 'steps': 49572, 'loss/train': 1.211342215538025} -08/30/2021 22:11:28 - INFO - __main__ - Step 49574: {'lr': 0.0003830009580780618, 'samples': 9518208, 'steps': 49573, 'loss/train': 0.4964197874069214} -08/30/2021 22:11:28 - INFO - __main__ - Step 49575: {'lr': 0.00038299646460506474, 'samples': 9518400, 'steps': 49574, 'loss/train': 1.1801362037658691} -08/30/2021 22:11:29 - INFO - __main__ - Step 49576: {'lr': 0.0003829919710721415, 'samples': 9518592, 'steps': 49575, 'loss/train': 1.0538371801376343} -08/30/2021 22:11:29 - INFO - __main__ - Step 49577: {'lr': 0.0003829874774792941, 'samples': 9518784, 'steps': 49576, 'loss/train': 1.0418047904968262} -08/30/2021 22:11:31 - INFO - __main__ - Step 49578: {'lr': 0.00038298298382652467, 'samples': 9518976, 'steps': 49577, 'loss/train': 1.5571428537368774} -08/30/2021 22:11:31 - INFO - __main__ - Step 49579: {'lr': 0.00038297849011383517, 'samples': 9519168, 'steps': 49578, 'loss/train': 0.24694758653640747} -08/30/2021 22:11:31 - INFO - __main__ - Step 49580: {'lr': 0.0003829739963412276, 'samples': 9519360, 'steps': 49579, 'loss/train': 1.2840710878372192} -08/30/2021 22:11:32 - INFO - __main__ - Step 49581: {'lr': 0.000382969502508704, 'samples': 9519552, 'steps': 49580, 'loss/train': 1.3830649852752686} -08/30/2021 22:11:32 - INFO - __main__ - Step 49582: {'lr': 0.0003829650086162663, 'samples': 9519744, 'steps': 49581, 'loss/train': 1.7510303258895874} -08/30/2021 22:11:32 - INFO - __main__ - Step 49583: {'lr': 0.0003829605146639167, 'samples': 9519936, 'steps': 49582, 'loss/train': 2.331678628921509} -08/30/2021 22:11:35 - INFO - __main__ - Step 49584: {'lr': 0.00038295602065165714, 'samples': 9520128, 'steps': 49583, 'loss/train': 1.3477237224578857} -08/30/2021 22:11:35 - INFO - __main__ - Step 49585: {'lr': 0.0003829515265794896, 'samples': 9520320, 'steps': 49584, 'loss/train': 1.3703932762145996} -08/30/2021 22:11:35 - INFO - __main__ - Step 49586: {'lr': 0.00038294703244741625, 'samples': 9520512, 'steps': 49585, 'loss/train': 0.8562800884246826} -08/30/2021 22:11:36 - INFO - __main__ - Step 49587: {'lr': 0.000382942538255439, 'samples': 9520704, 'steps': 49586, 'loss/train': 1.125615119934082} -08/30/2021 22:11:36 - INFO - __main__ - Step 49588: {'lr': 0.0003829380440035598, 'samples': 9520896, 'steps': 49587, 'loss/train': 1.6854792833328247} -08/30/2021 22:11:38 - INFO - __main__ - Step 49589: {'lr': 0.0003829335496917808, 'samples': 9521088, 'steps': 49588, 'loss/train': 1.639472484588623} -08/30/2021 22:11:38 - INFO - __main__ - Step 49590: {'lr': 0.000382929055320104, 'samples': 9521280, 'steps': 49589, 'loss/train': 1.0702298879623413} -08/30/2021 22:11:38 - INFO - __main__ - Step 49591: {'lr': 0.0003829245608885315, 'samples': 9521472, 'steps': 49590, 'loss/train': 0.6162208914756775} -08/30/2021 22:11:39 - INFO - __main__ - Step 49592: {'lr': 0.0003829200663970652, 'samples': 9521664, 'steps': 49591, 'loss/train': 1.1267777681350708} -08/30/2021 22:11:39 - INFO - __main__ - Step 49593: {'lr': 0.00038291557184570713, 'samples': 9521856, 'steps': 49592, 'loss/train': 1.9720985889434814} -08/30/2021 22:11:41 - INFO - __main__ - Step 49594: {'lr': 0.0003829110772344594, 'samples': 9522048, 'steps': 49593, 'loss/train': 0.8776063919067383} -08/30/2021 22:11:41 - INFO - __main__ - Step 49595: {'lr': 0.000382906582563324, 'samples': 9522240, 'steps': 49594, 'loss/train': 0.8313174247741699} -08/30/2021 22:11:41 - INFO - __main__ - Step 49596: {'lr': 0.00038290208783230286, 'samples': 9522432, 'steps': 49595, 'loss/train': 0.8462598323822021} -08/30/2021 22:11:42 - INFO - __main__ - Step 49597: {'lr': 0.00038289759304139815, 'samples': 9522624, 'steps': 49596, 'loss/train': 1.3606739044189453} -08/30/2021 22:11:42 - INFO - __main__ - Step 49598: {'lr': 0.0003828930981906118, 'samples': 9522816, 'steps': 49597, 'loss/train': 0.4701923727989197} -08/30/2021 22:11:44 - INFO - __main__ - Step 49599: {'lr': 0.000382888603279946, 'samples': 9523008, 'steps': 49598, 'loss/train': 1.1950565576553345} -08/30/2021 22:11:44 - INFO - __main__ - Step 49600: {'lr': 0.00038288410830940246, 'samples': 9523200, 'steps': 49599, 'loss/train': 0.8796842694282532} -08/30/2021 22:11:45 - INFO - __main__ - Step 49601: {'lr': 0.00038287961327898346, 'samples': 9523392, 'steps': 49600, 'loss/train': 1.0335707664489746} -08/30/2021 22:11:45 - INFO - __main__ - Step 49602: {'lr': 0.000382875118188691, 'samples': 9523584, 'steps': 49601, 'loss/train': 0.765018880367279} -08/30/2021 22:11:45 - INFO - __main__ - Step 49603: {'lr': 0.000382870623038527, 'samples': 9523776, 'steps': 49602, 'loss/train': 1.7459690570831299} -08/30/2021 22:11:47 - INFO - __main__ - Step 49604: {'lr': 0.0003828661278284936, 'samples': 9523968, 'steps': 49603, 'loss/train': 0.6471412181854248} -08/30/2021 22:11:47 - INFO - __main__ - Step 49605: {'lr': 0.00038286163255859276, 'samples': 9524160, 'steps': 49604, 'loss/train': 1.786392331123352} -08/30/2021 22:11:48 - INFO - __main__ - Step 49606: {'lr': 0.0003828571372288265, 'samples': 9524352, 'steps': 49605, 'loss/train': 1.6381694078445435} -08/30/2021 22:11:48 - INFO - __main__ - Step 49607: {'lr': 0.00038285264183919696, 'samples': 9524544, 'steps': 49606, 'loss/train': 2.197564125061035} -08/30/2021 22:11:48 - INFO - __main__ - Step 49608: {'lr': 0.00038284814638970594, 'samples': 9524736, 'steps': 49607, 'loss/train': 1.5324078798294067} -08/30/2021 22:11:50 - INFO - __main__ - Step 49609: {'lr': 0.00038284365088035564, 'samples': 9524928, 'steps': 49608, 'loss/train': 1.219322681427002} -08/30/2021 22:11:50 - INFO - __main__ - Step 49610: {'lr': 0.00038283915531114806, 'samples': 9525120, 'steps': 49609, 'loss/train': 1.273169755935669} -08/30/2021 22:11:51 - INFO - __main__ - Step 49611: {'lr': 0.0003828346596820852, 'samples': 9525312, 'steps': 49610, 'loss/train': 1.4314746856689453} -08/30/2021 22:11:51 - INFO - __main__ - Step 49612: {'lr': 0.00038283016399316905, 'samples': 9525504, 'steps': 49611, 'loss/train': 2.4046475887298584} -08/30/2021 22:11:51 - INFO - __main__ - Step 49613: {'lr': 0.00038282566824440176, 'samples': 9525696, 'steps': 49612, 'loss/train': 0.26548632979393005} -08/30/2021 22:11:52 - INFO - __main__ - Step 49614: {'lr': 0.0003828211724357852, 'samples': 9525888, 'steps': 49613, 'loss/train': 1.704612135887146} -08/30/2021 22:11:53 - INFO - __main__ - Step 49615: {'lr': 0.00038281667656732144, 'samples': 9526080, 'steps': 49614, 'loss/train': 0.39868637919425964} -08/30/2021 22:11:54 - INFO - __main__ - Step 49616: {'lr': 0.0003828121806390126, 'samples': 9526272, 'steps': 49615, 'loss/train': 1.5058345794677734} -08/30/2021 22:11:54 - INFO - __main__ - Step 49617: {'lr': 0.0003828076846508606, 'samples': 9526464, 'steps': 49616, 'loss/train': 1.2298740148544312} -08/30/2021 22:11:55 - INFO - __main__ - Step 49618: {'lr': 0.00038280318860286756, 'samples': 9526656, 'steps': 49617, 'loss/train': 1.2124298810958862} -08/30/2021 22:11:55 - INFO - __main__ - Step 49619: {'lr': 0.0003827986924950354, 'samples': 9526848, 'steps': 49618, 'loss/train': 1.8423925638198853} -08/30/2021 22:11:57 - INFO - __main__ - Step 49620: {'lr': 0.0003827941963273663, 'samples': 9527040, 'steps': 49619, 'loss/train': 0.8608068227767944} -08/30/2021 22:11:57 - INFO - __main__ - Step 49621: {'lr': 0.00038278970009986206, 'samples': 9527232, 'steps': 49620, 'loss/train': 1.0913867950439453} -08/30/2021 22:11:57 - INFO - __main__ - Step 49622: {'lr': 0.0003827852038125249, 'samples': 9527424, 'steps': 49621, 'loss/train': 1.6545668840408325} -08/30/2021 22:11:58 - INFO - __main__ - Step 49623: {'lr': 0.00038278070746535674, 'samples': 9527616, 'steps': 49622, 'loss/train': 1.1301075220108032} -08/30/2021 22:11:58 - INFO - __main__ - Step 49624: {'lr': 0.0003827762110583597, 'samples': 9527808, 'steps': 49623, 'loss/train': 0.03578347712755203} -08/30/2021 22:12:00 - INFO - __main__ - Step 49625: {'lr': 0.0003827717145915357, 'samples': 9528000, 'steps': 49624, 'loss/train': 2.1218557357788086} -08/30/2021 22:12:00 - INFO - __main__ - Step 49626: {'lr': 0.0003827672180648868, 'samples': 9528192, 'steps': 49625, 'loss/train': 1.7013319730758667} -08/30/2021 22:12:00 - INFO - __main__ - Step 49627: {'lr': 0.0003827627214784151, 'samples': 9528384, 'steps': 49626, 'loss/train': 0.7905079126358032} -08/30/2021 22:12:01 - INFO - __main__ - Step 49628: {'lr': 0.0003827582248321225, 'samples': 9528576, 'steps': 49627, 'loss/train': 1.1278719902038574} -08/30/2021 22:12:01 - INFO - __main__ - Step 49629: {'lr': 0.0003827537281260111, 'samples': 9528768, 'steps': 49628, 'loss/train': 0.26504695415496826} -08/30/2021 22:12:03 - INFO - __main__ - Step 49630: {'lr': 0.00038274923136008294, 'samples': 9528960, 'steps': 49629, 'loss/train': 1.3159563541412354} -08/30/2021 22:12:03 - INFO - __main__ - Step 49631: {'lr': 0.00038274473453434, 'samples': 9529152, 'steps': 49630, 'loss/train': 1.014441967010498} -08/30/2021 22:12:03 - INFO - __main__ - Step 49632: {'lr': 0.0003827402376487844, 'samples': 9529344, 'steps': 49631, 'loss/train': 1.3989652395248413} -08/30/2021 22:12:04 - INFO - __main__ - Step 49633: {'lr': 0.0003827357407034181, 'samples': 9529536, 'steps': 49632, 'loss/train': 1.4955639839172363} -08/30/2021 22:12:04 - INFO - __main__ - Step 49634: {'lr': 0.00038273124369824304, 'samples': 9529728, 'steps': 49633, 'loss/train': 1.5302200317382812} -08/30/2021 22:12:05 - INFO - __main__ - Step 49635: {'lr': 0.00038272674663326136, 'samples': 9529920, 'steps': 49634, 'loss/train': 1.4749906063079834} -08/30/2021 22:12:06 - INFO - __main__ - Step 49636: {'lr': 0.000382722249508475, 'samples': 9530112, 'steps': 49635, 'loss/train': 1.2865924835205078} -08/30/2021 22:12:06 - INFO - __main__ - Step 49637: {'lr': 0.00038271775232388616, 'samples': 9530304, 'steps': 49636, 'loss/train': 1.2680777311325073} -08/30/2021 22:12:07 - INFO - __main__ - Step 49638: {'lr': 0.00038271325507949666, 'samples': 9530496, 'steps': 49637, 'loss/train': 1.290576457977295} -08/30/2021 22:12:07 - INFO - __main__ - Step 49639: {'lr': 0.00038270875777530864, 'samples': 9530688, 'steps': 49638, 'loss/train': 1.6442703008651733} -08/30/2021 22:12:09 - INFO - __main__ - Step 49640: {'lr': 0.0003827042604113241, 'samples': 9530880, 'steps': 49639, 'loss/train': 1.3259234428405762} -08/30/2021 22:12:09 - INFO - __main__ - Step 49641: {'lr': 0.0003826997629875451, 'samples': 9531072, 'steps': 49640, 'loss/train': 1.1789066791534424} -08/30/2021 22:12:10 - INFO - __main__ - Step 49642: {'lr': 0.0003826952655039736, 'samples': 9531264, 'steps': 49641, 'loss/train': 1.4378935098648071} -08/30/2021 22:12:10 - INFO - __main__ - Step 49643: {'lr': 0.0003826907679606117, 'samples': 9531456, 'steps': 49642, 'loss/train': 1.1316323280334473} -08/30/2021 22:12:10 - INFO - __main__ - Step 49644: {'lr': 0.00038268627035746133, 'samples': 9531648, 'steps': 49643, 'loss/train': 0.5237854719161987} -08/30/2021 22:12:11 - INFO - __main__ - Step 49645: {'lr': 0.00038268177269452463, 'samples': 9531840, 'steps': 49644, 'loss/train': 1.2391196489334106} -08/30/2021 22:12:13 - INFO - __main__ - Step 49646: {'lr': 0.0003826772749718036, 'samples': 9532032, 'steps': 49645, 'loss/train': 0.7716188430786133} -08/30/2021 22:12:13 - INFO - __main__ - Step 49647: {'lr': 0.00038267277718930014, 'samples': 9532224, 'steps': 49646, 'loss/train': 1.127185344696045} -08/30/2021 22:12:13 - INFO - __main__ - Step 49648: {'lr': 0.0003826682793470164, 'samples': 9532416, 'steps': 49647, 'loss/train': 1.1896660327911377} -08/30/2021 22:12:14 - INFO - __main__ - Step 49649: {'lr': 0.0003826637814449544, 'samples': 9532608, 'steps': 49648, 'loss/train': 1.9542824029922485} -08/30/2021 22:12:14 - INFO - __main__ - Step 49650: {'lr': 0.00038265928348311614, 'samples': 9532800, 'steps': 49649, 'loss/train': 1.5729920864105225} -08/30/2021 22:12:16 - INFO - __main__ - Step 49651: {'lr': 0.0003826547854615037, 'samples': 9532992, 'steps': 49650, 'loss/train': 0.04735864698886871} -08/30/2021 22:12:16 - INFO - __main__ - Step 49652: {'lr': 0.000382650287380119, 'samples': 9533184, 'steps': 49651, 'loss/train': 1.5125199556350708} -08/30/2021 22:12:16 - INFO - __main__ - Step 49653: {'lr': 0.00038264578923896415, 'samples': 9533376, 'steps': 49652, 'loss/train': 1.7394583225250244} -08/30/2021 22:12:17 - INFO - __main__ - Step 49654: {'lr': 0.00038264129103804113, 'samples': 9533568, 'steps': 49653, 'loss/train': 1.409911036491394} -08/30/2021 22:12:17 - INFO - __main__ - Step 49655: {'lr': 0.00038263679277735196, 'samples': 9533760, 'steps': 49654, 'loss/train': 0.8430184721946716} -08/30/2021 22:12:19 - INFO - __main__ - Step 49656: {'lr': 0.0003826322944568988, 'samples': 9533952, 'steps': 49655, 'loss/train': 1.3635603189468384} -08/30/2021 22:12:19 - INFO - __main__ - Step 49657: {'lr': 0.00038262779607668354, 'samples': 9534144, 'steps': 49656, 'loss/train': 0.9720028042793274} -08/30/2021 22:12:19 - INFO - __main__ - Step 49658: {'lr': 0.0003826232976367082, 'samples': 9534336, 'steps': 49657, 'loss/train': 1.8901889324188232} -08/30/2021 22:12:20 - INFO - __main__ - Step 49659: {'lr': 0.0003826187991369749, 'samples': 9534528, 'steps': 49658, 'loss/train': 1.0283443927764893} -08/30/2021 22:12:20 - INFO - __main__ - Step 49660: {'lr': 0.00038261430057748557, 'samples': 9534720, 'steps': 49659, 'loss/train': 1.441989779472351} -08/30/2021 22:12:22 - INFO - __main__ - Step 49661: {'lr': 0.0003826098019582423, 'samples': 9534912, 'steps': 49660, 'loss/train': 0.9568517208099365} -08/30/2021 22:12:22 - INFO - __main__ - Step 49662: {'lr': 0.00038260530327924715, 'samples': 9535104, 'steps': 49661, 'loss/train': 1.2110334634780884} -08/30/2021 22:12:22 - INFO - __main__ - Step 49663: {'lr': 0.00038260080454050207, 'samples': 9535296, 'steps': 49662, 'loss/train': 0.420901894569397} -08/30/2021 22:12:23 - INFO - __main__ - Step 49664: {'lr': 0.00038259630574200904, 'samples': 9535488, 'steps': 49663, 'loss/train': 1.2216628789901733} -08/30/2021 22:12:23 - INFO - __main__ - Step 49665: {'lr': 0.0003825918068837702, 'samples': 9535680, 'steps': 49664, 'loss/train': 1.2758723497390747} -08/30/2021 22:12:25 - INFO - __main__ - Step 49666: {'lr': 0.00038258730796578757, 'samples': 9535872, 'steps': 49665, 'loss/train': 1.599077820777893} -08/30/2021 22:12:25 - INFO - __main__ - Step 49667: {'lr': 0.0003825828089880631, 'samples': 9536064, 'steps': 49666, 'loss/train': 0.9477130174636841} -08/30/2021 22:12:26 - INFO - __main__ - Step 49668: {'lr': 0.00038257830995059894, 'samples': 9536256, 'steps': 49667, 'loss/train': 1.3110496997833252} -08/30/2021 22:12:26 - INFO - __main__ - Step 49669: {'lr': 0.00038257381085339694, 'samples': 9536448, 'steps': 49668, 'loss/train': 0.9027947783470154} -08/30/2021 22:12:26 - INFO - __main__ - Step 49670: {'lr': 0.00038256931169645925, 'samples': 9536640, 'steps': 49669, 'loss/train': 1.4737378358840942} -08/30/2021 22:12:28 - INFO - __main__ - Step 49671: {'lr': 0.00038256481247978793, 'samples': 9536832, 'steps': 49670, 'loss/train': 1.3816382884979248} -08/30/2021 22:12:28 - INFO - __main__ - Step 49672: {'lr': 0.00038256031320338494, 'samples': 9537024, 'steps': 49671, 'loss/train': 1.2973017692565918} -08/30/2021 22:12:28 - INFO - __main__ - Step 49673: {'lr': 0.0003825558138672523, 'samples': 9537216, 'steps': 49672, 'loss/train': 0.9309566617012024} -08/30/2021 22:12:29 - INFO - __main__ - Step 49674: {'lr': 0.00038255131447139203, 'samples': 9537408, 'steps': 49673, 'loss/train': 1.5804880857467651} -08/30/2021 22:12:29 - INFO - __main__ - Step 49675: {'lr': 0.00038254681501580625, 'samples': 9537600, 'steps': 49674, 'loss/train': 1.2980644702911377} -08/30/2021 22:12:31 - INFO - __main__ - Step 49676: {'lr': 0.00038254231550049686, 'samples': 9537792, 'steps': 49675, 'loss/train': 1.7197462320327759} -08/30/2021 22:12:31 - INFO - __main__ - Step 49677: {'lr': 0.00038253781592546593, 'samples': 9537984, 'steps': 49676, 'loss/train': 0.36219343543052673} -08/30/2021 22:12:31 - INFO - __main__ - Step 49678: {'lr': 0.0003825333162907155, 'samples': 9538176, 'steps': 49677, 'loss/train': 0.4128420054912567} -08/30/2021 22:12:32 - INFO - __main__ - Step 49679: {'lr': 0.0003825288165962477, 'samples': 9538368, 'steps': 49678, 'loss/train': 1.2414288520812988} -08/30/2021 22:12:32 - INFO - __main__ - Step 49680: {'lr': 0.0003825243168420644, 'samples': 9538560, 'steps': 49679, 'loss/train': 1.3402949571609497} -08/30/2021 22:12:34 - INFO - __main__ - Step 49681: {'lr': 0.00038251981702816767, 'samples': 9538752, 'steps': 49680, 'loss/train': 1.510880947113037} -08/30/2021 22:12:34 - INFO - __main__ - Step 49682: {'lr': 0.00038251531715455955, 'samples': 9538944, 'steps': 49681, 'loss/train': 1.0666968822479248} -08/30/2021 22:12:34 - INFO - __main__ - Step 49683: {'lr': 0.00038251081722124214, 'samples': 9539136, 'steps': 49682, 'loss/train': 0.9895131587982178} -08/30/2021 22:12:35 - INFO - __main__ - Step 49684: {'lr': 0.0003825063172282174, 'samples': 9539328, 'steps': 49683, 'loss/train': 0.8254391551017761} -08/30/2021 22:12:35 - INFO - __main__ - Step 49685: {'lr': 0.00038250181717548726, 'samples': 9539520, 'steps': 49684, 'loss/train': 1.0771102905273438} -08/30/2021 22:12:37 - INFO - __main__ - Step 49686: {'lr': 0.0003824973170630539, 'samples': 9539712, 'steps': 49685, 'loss/train': 1.2612708806991577} -08/30/2021 22:12:37 - INFO - __main__ - Step 49687: {'lr': 0.0003824928168909193, 'samples': 9539904, 'steps': 49686, 'loss/train': 1.3444955348968506} -08/30/2021 22:12:37 - INFO - __main__ - Step 49688: {'lr': 0.00038248831665908546, 'samples': 9540096, 'steps': 49687, 'loss/train': 1.7309826612472534} -08/30/2021 22:12:38 - INFO - __main__ - Step 49689: {'lr': 0.0003824838163675545, 'samples': 9540288, 'steps': 49688, 'loss/train': 0.333211213350296} -08/30/2021 22:12:38 - INFO - __main__ - Step 49690: {'lr': 0.0003824793160163283, 'samples': 9540480, 'steps': 49689, 'loss/train': 1.595306158065796} -08/30/2021 22:12:40 - INFO - __main__ - Step 49691: {'lr': 0.000382474815605409, 'samples': 9540672, 'steps': 49690, 'loss/train': 0.7322412133216858} -08/30/2021 22:12:41 - INFO - __main__ - Step 49692: {'lr': 0.00038247031513479856, 'samples': 9540864, 'steps': 49691, 'loss/train': 0.041530169546604156} -08/30/2021 22:12:41 - INFO - __main__ - Step 49693: {'lr': 0.0003824658146044991, 'samples': 9541056, 'steps': 49692, 'loss/train': 1.3264636993408203} -08/30/2021 22:12:42 - INFO - __main__ - Step 49694: {'lr': 0.0003824613140145125, 'samples': 9541248, 'steps': 49693, 'loss/train': 1.4436217546463013} -08/30/2021 22:12:42 - INFO - __main__ - Step 49695: {'lr': 0.00038245681336484096, 'samples': 9541440, 'steps': 49694, 'loss/train': 1.6068975925445557} -08/30/2021 22:12:42 - INFO - __main__ - Step 49696: {'lr': 0.00038245231265548633, 'samples': 9541632, 'steps': 49695, 'loss/train': 0.9332612156867981} -08/30/2021 22:12:44 - INFO - __main__ - Step 49697: {'lr': 0.0003824478118864508, 'samples': 9541824, 'steps': 49696, 'loss/train': 0.031258419156074524} -08/30/2021 22:12:45 - INFO - __main__ - Step 49698: {'lr': 0.0003824433110577363, 'samples': 9542016, 'steps': 49697, 'loss/train': 1.2822026014328003} -08/30/2021 22:12:45 - INFO - __main__ - Step 49699: {'lr': 0.0003824388101693449, 'samples': 9542208, 'steps': 49698, 'loss/train': 0.2977379262447357} -08/30/2021 22:12:45 - INFO - __main__ - Step 49700: {'lr': 0.00038243430922127865, 'samples': 9542400, 'steps': 49699, 'loss/train': 1.7197608947753906} -08/30/2021 22:12:46 - INFO - __main__ - Step 49701: {'lr': 0.00038242980821353954, 'samples': 9542592, 'steps': 49700, 'loss/train': 1.38543701171875} -08/30/2021 22:12:46 - INFO - __main__ - Step 49702: {'lr': 0.00038242530714612953, 'samples': 9542784, 'steps': 49701, 'loss/train': 0.06924241781234741} -08/30/2021 22:12:47 - INFO - __main__ - Step 49703: {'lr': 0.00038242080601905083, 'samples': 9542976, 'steps': 49702, 'loss/train': 0.6161973476409912} -08/30/2021 22:12:48 - INFO - __main__ - Step 49704: {'lr': 0.0003824163048323053, 'samples': 9543168, 'steps': 49703, 'loss/train': 1.0991592407226562} -08/30/2021 22:12:48 - INFO - __main__ - Step 49705: {'lr': 0.000382411803585895, 'samples': 9543360, 'steps': 49704, 'loss/train': 1.4899581670761108} -08/30/2021 22:12:49 - INFO - __main__ - Step 49706: {'lr': 0.000382407302279822, 'samples': 9543552, 'steps': 49705, 'loss/train': 1.731083631515503} -08/30/2021 22:12:49 - INFO - __main__ - Step 49707: {'lr': 0.0003824028009140883, 'samples': 9543744, 'steps': 49706, 'loss/train': 1.0906201601028442} -08/30/2021 22:12:51 - INFO - __main__ - Step 49708: {'lr': 0.000382398299488696, 'samples': 9543936, 'steps': 49707, 'loss/train': 1.4632432460784912} -08/30/2021 22:12:51 - INFO - __main__ - Step 49709: {'lr': 0.000382393798003647, 'samples': 9544128, 'steps': 49708, 'loss/train': 1.1668860912322998} -08/30/2021 22:12:52 - INFO - __main__ - Step 49710: {'lr': 0.00038238929645894345, 'samples': 9544320, 'steps': 49709, 'loss/train': 0.9777527451515198} -08/30/2021 22:12:52 - INFO - __main__ - Step 49711: {'lr': 0.00038238479485458725, 'samples': 9544512, 'steps': 49710, 'loss/train': 1.2632591724395752} -08/30/2021 22:12:52 - INFO - __main__ - Step 49712: {'lr': 0.0003823802931905806, 'samples': 9544704, 'steps': 49711, 'loss/train': 1.6812973022460938} -08/30/2021 22:12:54 - INFO - __main__ - Step 49713: {'lr': 0.0003823757914669254, 'samples': 9544896, 'steps': 49712, 'loss/train': 1.3029990196228027} -08/30/2021 22:12:54 - INFO - __main__ - Step 49714: {'lr': 0.00038237128968362366, 'samples': 9545088, 'steps': 49713, 'loss/train': 0.8617534637451172} -08/30/2021 22:12:55 - INFO - __main__ - Step 49715: {'lr': 0.0003823667878406776, 'samples': 9545280, 'steps': 49714, 'loss/train': 0.7684113383293152} -08/30/2021 22:12:55 - INFO - __main__ - Step 49716: {'lr': 0.000382362285938089, 'samples': 9545472, 'steps': 49715, 'loss/train': 2.6685233116149902} -08/30/2021 22:12:55 - INFO - __main__ - Step 49717: {'lr': 0.00038235778397586, 'samples': 9545664, 'steps': 49716, 'loss/train': 1.2324090003967285} -08/30/2021 22:12:56 - INFO - __main__ - Step 49718: {'lr': 0.00038235328195399253, 'samples': 9545856, 'steps': 49717, 'loss/train': 1.503272533416748} -08/30/2021 22:12:57 - INFO - __main__ - Step 49719: {'lr': 0.0003823487798724888, 'samples': 9546048, 'steps': 49718, 'loss/train': 0.04580173268914223} -08/30/2021 22:12:58 - INFO - __main__ - Step 49720: {'lr': 0.00038234427773135084, 'samples': 9546240, 'steps': 49719, 'loss/train': 1.355670690536499} -08/30/2021 22:12:58 - INFO - __main__ - Step 49721: {'lr': 0.00038233977553058055, 'samples': 9546432, 'steps': 49720, 'loss/train': 2.0083348751068115} -08/30/2021 22:12:59 - INFO - __main__ - Step 49722: {'lr': 0.0003823352732701799, 'samples': 9546624, 'steps': 49721, 'loss/train': 1.3676416873931885} -08/30/2021 22:12:59 - INFO - __main__ - Step 49723: {'lr': 0.0003823307709501511, 'samples': 9546816, 'steps': 49722, 'loss/train': 1.2437701225280762} -08/30/2021 22:13:00 - INFO - __main__ - Step 49724: {'lr': 0.0003823262685704961, 'samples': 9547008, 'steps': 49723, 'loss/train': 0.050234027206897736} -08/30/2021 22:13:01 - INFO - __main__ - Step 49725: {'lr': 0.00038232176613121687, 'samples': 9547200, 'steps': 49724, 'loss/train': 0.9303320050239563} -08/30/2021 22:13:01 - INFO - __main__ - Step 49726: {'lr': 0.00038231726363231554, 'samples': 9547392, 'steps': 49725, 'loss/train': 1.0685924291610718} -08/30/2021 22:13:01 - INFO - __main__ - Step 49727: {'lr': 0.0003823127610737941, 'samples': 9547584, 'steps': 49726, 'loss/train': 0.8104143142700195} -08/30/2021 22:13:02 - INFO - __main__ - Step 49728: {'lr': 0.00038230825845565454, 'samples': 9547776, 'steps': 49727, 'loss/train': 0.8963868618011475} -08/30/2021 22:13:03 - INFO - __main__ - Step 49729: {'lr': 0.00038230375577789894, 'samples': 9547968, 'steps': 49728, 'loss/train': 1.4387993812561035} -08/30/2021 22:13:04 - INFO - __main__ - Step 49730: {'lr': 0.0003822992530405293, 'samples': 9548160, 'steps': 49729, 'loss/train': 1.1440261602401733} -08/30/2021 22:13:04 - INFO - __main__ - Step 49731: {'lr': 0.00038229475024354766, 'samples': 9548352, 'steps': 49730, 'loss/train': 1.3108282089233398} -08/30/2021 22:13:04 - INFO - __main__ - Step 49732: {'lr': 0.00038229024738695605, 'samples': 9548544, 'steps': 49731, 'loss/train': 1.523683786392212} -08/30/2021 22:13:05 - INFO - __main__ - Step 49733: {'lr': 0.0003822857444707565, 'samples': 9548736, 'steps': 49732, 'loss/train': 1.5838416814804077} -08/30/2021 22:13:06 - INFO - __main__ - Step 49734: {'lr': 0.00038228124149495104, 'samples': 9548928, 'steps': 49733, 'loss/train': 1.4662511348724365} -08/30/2021 22:13:07 - INFO - __main__ - Step 49735: {'lr': 0.0003822767384595417, 'samples': 9549120, 'steps': 49734, 'loss/train': 1.0484226942062378} -08/30/2021 22:13:07 - INFO - __main__ - Step 49736: {'lr': 0.0003822722353645305, 'samples': 9549312, 'steps': 49735, 'loss/train': 0.8739673495292664} -08/30/2021 22:13:07 - INFO - __main__ - Step 49737: {'lr': 0.00038226773220991937, 'samples': 9549504, 'steps': 49736, 'loss/train': 1.1348925828933716} -08/30/2021 22:13:08 - INFO - __main__ - Step 49738: {'lr': 0.0003822632289957105, 'samples': 9549696, 'steps': 49737, 'loss/train': 1.018144130706787} -08/30/2021 22:13:09 - INFO - __main__ - Step 49739: {'lr': 0.000382258725721906, 'samples': 9549888, 'steps': 49738, 'loss/train': 1.5319018363952637} -08/30/2021 22:13:10 - INFO - __main__ - Step 49740: {'lr': 0.0003822542223885076, 'samples': 9550080, 'steps': 49739, 'loss/train': 1.4723345041275024} -08/30/2021 22:13:10 - INFO - __main__ - Step 49741: {'lr': 0.0003822497189955175, 'samples': 9550272, 'steps': 49740, 'loss/train': 1.5046100616455078} -08/30/2021 22:13:11 - INFO - __main__ - Step 49742: {'lr': 0.0003822452155429378, 'samples': 9550464, 'steps': 49741, 'loss/train': 1.0838719606399536} -08/30/2021 22:13:11 - INFO - __main__ - Step 49743: {'lr': 0.0003822407120307704, 'samples': 9550656, 'steps': 49742, 'loss/train': 1.1902461051940918} -08/30/2021 22:13:12 - INFO - __main__ - Step 49744: {'lr': 0.0003822362084590174, 'samples': 9550848, 'steps': 49743, 'loss/train': 1.4791418313980103} -08/30/2021 22:13:13 - INFO - __main__ - Step 49745: {'lr': 0.0003822317048276808, 'samples': 9551040, 'steps': 49744, 'loss/train': 1.482893466949463} -08/30/2021 22:13:13 - INFO - __main__ - Step 49746: {'lr': 0.0003822272011367626, 'samples': 9551232, 'steps': 49745, 'loss/train': 0.046908844262361526} -08/30/2021 22:13:14 - INFO - __main__ - Step 49747: {'lr': 0.0003822226973862649, 'samples': 9551424, 'steps': 49746, 'loss/train': 1.421980619430542} -08/30/2021 22:13:14 - INFO - __main__ - Step 49748: {'lr': 0.00038221819357618967, 'samples': 9551616, 'steps': 49747, 'loss/train': 0.943286120891571} -08/30/2021 22:13:14 - INFO - __main__ - Step 49749: {'lr': 0.0003822136897065389, 'samples': 9551808, 'steps': 49748, 'loss/train': 0.44666239619255066} -08/30/2021 22:13:16 - INFO - __main__ - Step 49750: {'lr': 0.0003822091857773148, 'samples': 9552000, 'steps': 49749, 'loss/train': 1.1273568868637085} -08/30/2021 22:13:17 - INFO - __main__ - Step 49751: {'lr': 0.00038220468178851917, 'samples': 9552192, 'steps': 49750, 'loss/train': 2.1853973865509033} -08/30/2021 22:13:17 - INFO - __main__ - Step 49752: {'lr': 0.00038220017774015427, 'samples': 9552384, 'steps': 49751, 'loss/train': 1.0996079444885254} -08/30/2021 22:13:18 - INFO - __main__ - Step 49753: {'lr': 0.00038219567363222183, 'samples': 9552576, 'steps': 49752, 'loss/train': 0.9311907887458801} -08/30/2021 22:13:18 - INFO - __main__ - Step 49754: {'lr': 0.00038219116946472425, 'samples': 9552768, 'steps': 49753, 'loss/train': 1.5368413925170898} -08/30/2021 22:13:19 - INFO - __main__ - Step 49755: {'lr': 0.0003821866652376633, 'samples': 9552960, 'steps': 49754, 'loss/train': 1.522527813911438} -08/30/2021 22:13:20 - INFO - __main__ - Step 49756: {'lr': 0.0003821821609510411, 'samples': 9553152, 'steps': 49755, 'loss/train': 0.6353611946105957} -08/30/2021 22:13:20 - INFO - __main__ - Step 49757: {'lr': 0.0003821776566048596, 'samples': 9553344, 'steps': 49756, 'loss/train': 1.2988874912261963} -08/30/2021 22:13:21 - INFO - __main__ - Step 49758: {'lr': 0.0003821731521991209, 'samples': 9553536, 'steps': 49757, 'loss/train': 1.1676123142242432} -08/30/2021 22:13:21 - INFO - __main__ - Step 49759: {'lr': 0.00038216864773382703, 'samples': 9553728, 'steps': 49758, 'loss/train': 1.4098976850509644} -08/30/2021 22:13:23 - INFO - __main__ - Step 49760: {'lr': 0.00038216414320898004, 'samples': 9553920, 'steps': 49759, 'loss/train': 1.2838845252990723} -08/30/2021 22:13:23 - INFO - __main__ - Step 49761: {'lr': 0.0003821596386245819, 'samples': 9554112, 'steps': 49760, 'loss/train': 1.0469671487808228} -08/30/2021 22:13:23 - INFO - __main__ - Step 49762: {'lr': 0.00038215513398063465, 'samples': 9554304, 'steps': 49761, 'loss/train': 1.294045329093933} -08/30/2021 22:13:24 - INFO - __main__ - Step 49763: {'lr': 0.00038215062927714037, 'samples': 9554496, 'steps': 49762, 'loss/train': 1.5076699256896973} -08/30/2021 22:13:24 - INFO - __main__ - Step 49764: {'lr': 0.000382146124514101, 'samples': 9554688, 'steps': 49763, 'loss/train': 1.3536831140518188} -08/30/2021 22:13:26 - INFO - __main__ - Step 49765: {'lr': 0.00038214161969151865, 'samples': 9554880, 'steps': 49764, 'loss/train': 0.9425990581512451} -08/30/2021 22:13:26 - INFO - __main__ - Step 49766: {'lr': 0.0003821371148093954, 'samples': 9555072, 'steps': 49765, 'loss/train': 1.1800950765609741} -08/30/2021 22:13:27 - INFO - __main__ - Step 49767: {'lr': 0.0003821326098677331, 'samples': 9555264, 'steps': 49766, 'loss/train': 0.9455059766769409} -08/30/2021 22:13:27 - INFO - __main__ - Step 49768: {'lr': 0.00038212810486653394, 'samples': 9555456, 'steps': 49767, 'loss/train': 1.3309293985366821} -08/30/2021 22:13:28 - INFO - __main__ - Step 49769: {'lr': 0.0003821235998057999, 'samples': 9555648, 'steps': 49768, 'loss/train': 3.0551741123199463} -08/30/2021 22:13:28 - INFO - __main__ - Step 49770: {'lr': 0.00038211909468553295, 'samples': 9555840, 'steps': 49769, 'loss/train': 4.082547187805176} -08/30/2021 22:13:30 - INFO - __main__ - Step 49771: {'lr': 0.00038211458950573526, 'samples': 9556032, 'steps': 49770, 'loss/train': 1.1977760791778564} -08/30/2021 22:13:30 - INFO - __main__ - Step 49772: {'lr': 0.0003821100842664087, 'samples': 9556224, 'steps': 49771, 'loss/train': 1.6944628953933716} -08/30/2021 22:13:30 - INFO - __main__ - Step 49773: {'lr': 0.00038210557896755536, 'samples': 9556416, 'steps': 49772, 'loss/train': 0.04313196241855621} -08/30/2021 22:13:31 - INFO - __main__ - Step 49774: {'lr': 0.0003821010736091774, 'samples': 9556608, 'steps': 49773, 'loss/train': 1.4688575267791748} -08/30/2021 22:13:31 - INFO - __main__ - Step 49775: {'lr': 0.00038209656819127664, 'samples': 9556800, 'steps': 49774, 'loss/train': 1.7247586250305176} -08/30/2021 22:13:33 - INFO - __main__ - Step 49776: {'lr': 0.0003820920627138552, 'samples': 9556992, 'steps': 49775, 'loss/train': 0.9166179299354553} -08/30/2021 22:13:33 - INFO - __main__ - Step 49777: {'lr': 0.00038208755717691515, 'samples': 9557184, 'steps': 49776, 'loss/train': 1.9556865692138672} -08/30/2021 22:13:33 - INFO - __main__ - Step 49778: {'lr': 0.00038208305158045846, 'samples': 9557376, 'steps': 49777, 'loss/train': 1.462591528892517} -08/30/2021 22:13:34 - INFO - __main__ - Step 49779: {'lr': 0.0003820785459244872, 'samples': 9557568, 'steps': 49778, 'loss/train': 0.6248871684074402} -08/30/2021 22:13:34 - INFO - __main__ - Step 49780: {'lr': 0.00038207404020900343, 'samples': 9557760, 'steps': 49779, 'loss/train': 1.3465285301208496} -08/30/2021 22:13:36 - INFO - __main__ - Step 49781: {'lr': 0.0003820695344340091, 'samples': 9557952, 'steps': 49780, 'loss/train': 2.1117501258850098} -08/30/2021 22:13:36 - INFO - __main__ - Step 49782: {'lr': 0.00038206502859950624, 'samples': 9558144, 'steps': 49781, 'loss/train': 1.4538969993591309} -08/30/2021 22:13:37 - INFO - __main__ - Step 49783: {'lr': 0.000382060522705497, 'samples': 9558336, 'steps': 49782, 'loss/train': 1.5920535326004028} -08/30/2021 22:13:37 - INFO - __main__ - Step 49784: {'lr': 0.0003820560167519832, 'samples': 9558528, 'steps': 49783, 'loss/train': 1.7279406785964966} -08/30/2021 22:13:37 - INFO - __main__ - Step 49785: {'lr': 0.000382051510738967, 'samples': 9558720, 'steps': 49784, 'loss/train': 1.3205997943878174} -08/30/2021 22:13:38 - INFO - __main__ - Step 49786: {'lr': 0.0003820470046664506, 'samples': 9558912, 'steps': 49785, 'loss/train': 1.0998303890228271} -08/30/2021 22:13:39 - INFO - __main__ - Step 49787: {'lr': 0.0003820424985344357, 'samples': 9559104, 'steps': 49786, 'loss/train': 1.9888184070587158} -08/30/2021 22:13:40 - INFO - __main__ - Step 49788: {'lr': 0.0003820379923429246, 'samples': 9559296, 'steps': 49787, 'loss/train': 1.4241983890533447} -08/30/2021 22:13:40 - INFO - __main__ - Step 49789: {'lr': 0.00038203348609191915, 'samples': 9559488, 'steps': 49788, 'loss/train': 1.0431121587753296} -08/30/2021 22:13:40 - INFO - __main__ - Step 49790: {'lr': 0.00038202897978142144, 'samples': 9559680, 'steps': 49789, 'loss/train': 1.8512325286865234} -08/30/2021 22:13:41 - INFO - __main__ - Step 49791: {'lr': 0.00038202447341143355, 'samples': 9559872, 'steps': 49790, 'loss/train': 1.1772205829620361} -08/30/2021 22:13:42 - INFO - __main__ - Step 49792: {'lr': 0.0003820199669819574, 'samples': 9560064, 'steps': 49791, 'loss/train': 1.40646493434906} -08/30/2021 22:13:43 - INFO - __main__ - Step 49793: {'lr': 0.00038201546049299517, 'samples': 9560256, 'steps': 49792, 'loss/train': 1.4943504333496094} -08/30/2021 22:13:43 - INFO - __main__ - Step 49794: {'lr': 0.00038201095394454874, 'samples': 9560448, 'steps': 49793, 'loss/train': 0.9948331117630005} -08/30/2021 22:13:43 - INFO - __main__ - Step 49795: {'lr': 0.0003820064473366203, 'samples': 9560640, 'steps': 49794, 'loss/train': 1.3066593408584595} -08/30/2021 22:13:44 - INFO - __main__ - Step 49796: {'lr': 0.00038200194066921166, 'samples': 9560832, 'steps': 49795, 'loss/train': 1.463216781616211} -08/30/2021 22:13:45 - INFO - __main__ - Step 49797: {'lr': 0.00038199743394232513, 'samples': 9561024, 'steps': 49796, 'loss/train': 1.5691516399383545} -08/30/2021 22:13:46 - INFO - __main__ - Step 49798: {'lr': 0.0003819929271559625, 'samples': 9561216, 'steps': 49797, 'loss/train': 0.4486684203147888} -08/30/2021 22:13:46 - INFO - __main__ - Step 49799: {'lr': 0.00038198842031012594, 'samples': 9561408, 'steps': 49798, 'loss/train': 0.9006960988044739} -08/30/2021 22:13:46 - INFO - __main__ - Step 49800: {'lr': 0.00038198391340481735, 'samples': 9561600, 'steps': 49799, 'loss/train': 1.9151670932769775} -08/30/2021 22:13:47 - INFO - __main__ - Step 49801: {'lr': 0.0003819794064400389, 'samples': 9561792, 'steps': 49800, 'loss/train': 1.4824037551879883} -08/30/2021 22:13:49 - INFO - __main__ - Step 49802: {'lr': 0.00038197489941579264, 'samples': 9561984, 'steps': 49801, 'loss/train': 1.3782626390457153} -08/30/2021 22:13:49 - INFO - __main__ - Step 49803: {'lr': 0.00038197039233208043, 'samples': 9562176, 'steps': 49802, 'loss/train': 1.398019552230835} -08/30/2021 22:13:49 - INFO - __main__ - Step 49804: {'lr': 0.0003819658851889044, 'samples': 9562368, 'steps': 49803, 'loss/train': 1.6332396268844604} -08/30/2021 22:13:50 - INFO - __main__ - Step 49805: {'lr': 0.00038196137798626663, 'samples': 9562560, 'steps': 49804, 'loss/train': 1.5197279453277588} -08/30/2021 22:13:50 - INFO - __main__ - Step 49806: {'lr': 0.00038195687072416906, 'samples': 9562752, 'steps': 49805, 'loss/train': 1.3784159421920776} -08/30/2021 22:13:50 - INFO - __main__ - Step 49807: {'lr': 0.00038195236340261374, 'samples': 9562944, 'steps': 49806, 'loss/train': 1.3762362003326416} -08/30/2021 22:13:52 - INFO - __main__ - Step 49808: {'lr': 0.0003819478560216029, 'samples': 9563136, 'steps': 49807, 'loss/train': 1.9439811706542969} -08/30/2021 22:13:53 - INFO - __main__ - Step 49809: {'lr': 0.00038194334858113817, 'samples': 9563328, 'steps': 49808, 'loss/train': 1.3838212490081787} -08/30/2021 22:13:53 - INFO - __main__ - Step 49810: {'lr': 0.0003819388410812219, 'samples': 9563520, 'steps': 49809, 'loss/train': 1.0086147785186768} -08/30/2021 22:13:53 - INFO - __main__ - Step 49811: {'lr': 0.00038193433352185597, 'samples': 9563712, 'steps': 49810, 'loss/train': 1.0823484659194946} -08/30/2021 22:13:54 - INFO - __main__ - Step 49812: {'lr': 0.0003819298259030425, 'samples': 9563904, 'steps': 49811, 'loss/train': 1.707214593887329} -08/30/2021 22:13:55 - INFO - __main__ - Step 49813: {'lr': 0.00038192531822478347, 'samples': 9564096, 'steps': 49812, 'loss/train': 0.020786872133612633} -08/30/2021 22:13:56 - INFO - __main__ - Step 49814: {'lr': 0.000381920810487081, 'samples': 9564288, 'steps': 49813, 'loss/train': 0.21956177055835724} -08/30/2021 22:13:56 - INFO - __main__ - Step 49815: {'lr': 0.0003819163026899369, 'samples': 9564480, 'steps': 49814, 'loss/train': 2.2562546730041504} -08/30/2021 22:13:56 - INFO - __main__ - Step 49816: {'lr': 0.00038191179483335346, 'samples': 9564672, 'steps': 49815, 'loss/train': 1.0328961610794067} -08/30/2021 22:13:57 - INFO - __main__ - Step 49817: {'lr': 0.0003819072869173326, 'samples': 9564864, 'steps': 49816, 'loss/train': 1.1331558227539062} -08/30/2021 22:13:57 - INFO - __main__ - Step 49818: {'lr': 0.0003819027789418764, 'samples': 9565056, 'steps': 49817, 'loss/train': 0.9301910400390625} -08/30/2021 22:13:59 - INFO - __main__ - Step 49819: {'lr': 0.0003818982709069867, 'samples': 9565248, 'steps': 49818, 'loss/train': 1.204207181930542} -08/30/2021 22:13:59 - INFO - __main__ - Step 49820: {'lr': 0.00038189376281266575, 'samples': 9565440, 'steps': 49819, 'loss/train': 0.8300979137420654} -08/30/2021 22:14:00 - INFO - __main__ - Step 49821: {'lr': 0.00038188925465891554, 'samples': 9565632, 'steps': 49820, 'loss/train': 1.497221827507019} -08/30/2021 22:14:00 - INFO - __main__ - Step 49822: {'lr': 0.000381884746445738, 'samples': 9565824, 'steps': 49821, 'loss/train': 1.5963858366012573} -08/30/2021 22:14:00 - INFO - __main__ - Step 49823: {'lr': 0.0003818802381731353, 'samples': 9566016, 'steps': 49822, 'loss/train': 1.3128944635391235} -08/30/2021 22:14:02 - INFO - __main__ - Step 49824: {'lr': 0.00038187572984110937, 'samples': 9566208, 'steps': 49823, 'loss/train': 1.3278546333312988} -08/30/2021 22:14:02 - INFO - __main__ - Step 49825: {'lr': 0.00038187122144966225, 'samples': 9566400, 'steps': 49824, 'loss/train': 1.9274048805236816} -08/30/2021 22:14:03 - INFO - __main__ - Step 49826: {'lr': 0.000381866712998796, 'samples': 9566592, 'steps': 49825, 'loss/train': 1.241894006729126} -08/30/2021 22:14:03 - INFO - __main__ - Step 49827: {'lr': 0.0003818622044885126, 'samples': 9566784, 'steps': 49826, 'loss/train': 1.2455166578292847} -08/30/2021 22:14:03 - INFO - __main__ - Step 49828: {'lr': 0.00038185769591881426, 'samples': 9566976, 'steps': 49827, 'loss/train': 0.985876739025116} -08/30/2021 22:14:05 - INFO - __main__ - Step 49829: {'lr': 0.00038185318728970277, 'samples': 9567168, 'steps': 49828, 'loss/train': 2.085016965866089} -08/30/2021 22:14:06 - INFO - __main__ - Step 49830: {'lr': 0.00038184867860118036, 'samples': 9567360, 'steps': 49829, 'loss/train': 1.0317169427871704} -08/30/2021 22:14:06 - INFO - __main__ - Step 49831: {'lr': 0.0003818441698532488, 'samples': 9567552, 'steps': 49830, 'loss/train': 1.3614450693130493} -08/30/2021 22:14:06 - INFO - __main__ - Step 49832: {'lr': 0.00038183966104591037, 'samples': 9567744, 'steps': 49831, 'loss/train': 1.1619430780410767} -08/30/2021 22:14:07 - INFO - __main__ - Step 49833: {'lr': 0.0003818351521791671, 'samples': 9567936, 'steps': 49832, 'loss/train': 0.08117188513278961} -08/30/2021 22:14:08 - INFO - __main__ - Step 49834: {'lr': 0.0003818306432530209, 'samples': 9568128, 'steps': 49833, 'loss/train': 0.24984338879585266} -08/30/2021 22:14:09 - INFO - __main__ - Step 49835: {'lr': 0.0003818261342674738, 'samples': 9568320, 'steps': 49834, 'loss/train': 1.6425518989562988} -08/30/2021 22:14:09 - INFO - __main__ - Step 49836: {'lr': 0.00038182162522252795, 'samples': 9568512, 'steps': 49835, 'loss/train': 1.0567774772644043} -08/30/2021 22:14:09 - INFO - __main__ - Step 49837: {'lr': 0.0003818171161181853, 'samples': 9568704, 'steps': 49836, 'loss/train': 3.106945276260376} -08/30/2021 22:14:10 - INFO - __main__ - Step 49838: {'lr': 0.00038181260695444784, 'samples': 9568896, 'steps': 49837, 'loss/train': 1.4562439918518066} -08/30/2021 22:14:11 - INFO - __main__ - Step 49839: {'lr': 0.00038180809773131764, 'samples': 9569088, 'steps': 49838, 'loss/train': 1.548840880393982} -08/30/2021 22:14:12 - INFO - __main__ - Step 49840: {'lr': 0.0003818035884487968, 'samples': 9569280, 'steps': 49839, 'loss/train': 1.1457788944244385} -08/30/2021 22:14:12 - INFO - __main__ - Step 49841: {'lr': 0.0003817990791068873, 'samples': 9569472, 'steps': 49840, 'loss/train': 1.4783170223236084} -08/30/2021 22:14:12 - INFO - __main__ - Step 49842: {'lr': 0.00038179456970559116, 'samples': 9569664, 'steps': 49841, 'loss/train': 0.8052507042884827} -08/30/2021 22:14:13 - INFO - __main__ - Step 49843: {'lr': 0.0003817900602449104, 'samples': 9569856, 'steps': 49842, 'loss/train': 1.5514938831329346} -08/30/2021 22:14:14 - INFO - __main__ - Step 49844: {'lr': 0.0003817855507248471, 'samples': 9570048, 'steps': 49843, 'loss/train': 0.9434102773666382} -08/30/2021 22:14:15 - INFO - __main__ - Step 49845: {'lr': 0.00038178104114540326, 'samples': 9570240, 'steps': 49844, 'loss/train': 1.6355791091918945} -08/30/2021 22:14:15 - INFO - __main__ - Step 49846: {'lr': 0.0003817765315065809, 'samples': 9570432, 'steps': 49845, 'loss/train': 1.291693091392517} -08/30/2021 22:14:15 - INFO - __main__ - Step 49847: {'lr': 0.000381772021808382, 'samples': 9570624, 'steps': 49846, 'loss/train': 0.9509743452072144} -08/30/2021 22:14:16 - INFO - __main__ - Step 49848: {'lr': 0.00038176751205080885, 'samples': 9570816, 'steps': 49847, 'loss/train': 1.1592611074447632} -08/30/2021 22:14:17 - INFO - __main__ - Step 49849: {'lr': 0.00038176300223386313, 'samples': 9571008, 'steps': 49848, 'loss/train': 0.9572741389274597} -08/30/2021 22:14:18 - INFO - __main__ - Step 49850: {'lr': 0.00038175849235754704, 'samples': 9571200, 'steps': 49849, 'loss/train': 1.5450934171676636} -08/30/2021 22:14:18 - INFO - __main__ - Step 49851: {'lr': 0.00038175398242186264, 'samples': 9571392, 'steps': 49850, 'loss/train': 1.2566306591033936} -08/30/2021 22:14:18 - INFO - __main__ - Step 49852: {'lr': 0.00038174947242681194, 'samples': 9571584, 'steps': 49851, 'loss/train': 1.3757431507110596} -08/30/2021 22:14:19 - INFO - __main__ - Step 49853: {'lr': 0.000381744962372397, 'samples': 9571776, 'steps': 49852, 'loss/train': 0.3873279392719269} -08/30/2021 22:14:21 - INFO - __main__ - Step 49854: {'lr': 0.00038174045225861976, 'samples': 9571968, 'steps': 49853, 'loss/train': 1.4917348623275757} -08/30/2021 22:14:21 - INFO - __main__ - Step 49855: {'lr': 0.00038173594208548234, 'samples': 9572160, 'steps': 49854, 'loss/train': 1.7407726049423218} -08/30/2021 22:14:22 - INFO - __main__ - Step 49856: {'lr': 0.00038173143185298665, 'samples': 9572352, 'steps': 49855, 'loss/train': 0.6799062490463257} -08/30/2021 22:14:22 - INFO - __main__ - Step 49857: {'lr': 0.00038172692156113484, 'samples': 9572544, 'steps': 49856, 'loss/train': 2.867138385772705} -08/30/2021 22:14:22 - INFO - __main__ - Step 49858: {'lr': 0.000381722411209929, 'samples': 9572736, 'steps': 49857, 'loss/train': 0.786793053150177} -08/30/2021 22:14:23 - INFO - __main__ - Step 49859: {'lr': 0.00038171790079937097, 'samples': 9572928, 'steps': 49858, 'loss/train': 0.5406507849693298} -08/30/2021 22:14:24 - INFO - __main__ - Step 49860: {'lr': 0.000381713390329463, 'samples': 9573120, 'steps': 49859, 'loss/train': 0.47808048129081726} -08/30/2021 22:14:25 - INFO - __main__ - Step 49861: {'lr': 0.00038170887980020683, 'samples': 9573312, 'steps': 49860, 'loss/train': 1.080627202987671} -08/30/2021 22:14:25 - INFO - __main__ - Step 49862: {'lr': 0.0003817043692116049, 'samples': 9573504, 'steps': 49861, 'loss/train': 1.9295005798339844} -08/30/2021 22:14:25 - INFO - __main__ - Step 49863: {'lr': 0.00038169985856365885, 'samples': 9573696, 'steps': 49862, 'loss/train': 1.2276242971420288} -08/30/2021 22:14:26 - INFO - __main__ - Step 49864: {'lr': 0.00038169534785637097, 'samples': 9573888, 'steps': 49863, 'loss/train': 0.9743057489395142} -08/30/2021 22:14:27 - INFO - __main__ - Step 49865: {'lr': 0.00038169083708974313, 'samples': 9574080, 'steps': 49864, 'loss/train': 1.4043761491775513} -08/30/2021 22:14:28 - INFO - __main__ - Step 49866: {'lr': 0.0003816863262637774, 'samples': 9574272, 'steps': 49865, 'loss/train': 1.5645949840545654} -08/30/2021 22:14:28 - INFO - __main__ - Step 49867: {'lr': 0.0003816818153784759, 'samples': 9574464, 'steps': 49866, 'loss/train': 0.762726902961731} -08/30/2021 22:14:28 - INFO - __main__ - Step 49868: {'lr': 0.00038167730443384063, 'samples': 9574656, 'steps': 49867, 'loss/train': 1.2686876058578491} -08/30/2021 22:14:29 - INFO - __main__ - Step 49869: {'lr': 0.0003816727934298736, 'samples': 9574848, 'steps': 49868, 'loss/train': 1.263796329498291} -08/30/2021 22:14:30 - INFO - __main__ - Step 49870: {'lr': 0.0003816682823665768, 'samples': 9575040, 'steps': 49869, 'loss/train': 1.100020408630371} -08/30/2021 22:14:31 - INFO - __main__ - Step 49871: {'lr': 0.0003816637712439523, 'samples': 9575232, 'steps': 49870, 'loss/train': 1.3270772695541382} -08/30/2021 22:14:31 - INFO - __main__ - Step 49872: {'lr': 0.0003816592600620021, 'samples': 9575424, 'steps': 49871, 'loss/train': 5.723047733306885} -08/30/2021 22:14:31 - INFO - __main__ - Step 49873: {'lr': 0.0003816547488207284, 'samples': 9575616, 'steps': 49872, 'loss/train': 1.449615716934204} -08/30/2021 22:14:32 - INFO - __main__ - Step 49874: {'lr': 0.00038165023752013294, 'samples': 9575808, 'steps': 49873, 'loss/train': 1.69248628616333} -08/30/2021 22:14:33 - INFO - __main__ - Step 49875: {'lr': 0.00038164572616021807, 'samples': 9576000, 'steps': 49874, 'loss/train': 1.406014323234558} -08/30/2021 22:14:34 - INFO - __main__ - Step 49876: {'lr': 0.0003816412147409856, 'samples': 9576192, 'steps': 49875, 'loss/train': 1.1755253076553345} -08/30/2021 22:14:34 - INFO - __main__ - Step 49877: {'lr': 0.0003816367032624376, 'samples': 9576384, 'steps': 49876, 'loss/train': 0.09784774482250214} -08/30/2021 22:14:35 - INFO - __main__ - Step 49878: {'lr': 0.0003816321917245761, 'samples': 9576576, 'steps': 49877, 'loss/train': 1.019940733909607} -08/30/2021 22:14:35 - INFO - __main__ - Step 49879: {'lr': 0.00038162768012740323, 'samples': 9576768, 'steps': 49878, 'loss/train': 1.0620776414871216} -08/30/2021 22:14:37 - INFO - __main__ - Step 49880: {'lr': 0.00038162316847092096, 'samples': 9576960, 'steps': 49879, 'loss/train': 1.82549250125885} -08/30/2021 22:14:37 - INFO - __main__ - Step 49881: {'lr': 0.0003816186567551313, 'samples': 9577152, 'steps': 49880, 'loss/train': 0.7739014625549316} -08/30/2021 22:14:38 - INFO - __main__ - Step 49882: {'lr': 0.0003816141449800364, 'samples': 9577344, 'steps': 49881, 'loss/train': 1.5781736373901367} -08/30/2021 22:14:38 - INFO - __main__ - Step 49883: {'lr': 0.00038160963314563806, 'samples': 9577536, 'steps': 49882, 'loss/train': 2.0784504413604736} -08/30/2021 22:14:38 - INFO - __main__ - Step 49884: {'lr': 0.00038160512125193853, 'samples': 9577728, 'steps': 49883, 'loss/train': 1.4156413078308105} -08/30/2021 22:14:39 - INFO - __main__ - Step 49885: {'lr': 0.0003816006092989397, 'samples': 9577920, 'steps': 49884, 'loss/train': 4.68715763092041} -08/30/2021 22:14:40 - INFO - __main__ - Step 49886: {'lr': 0.0003815960972866437, 'samples': 9578112, 'steps': 49885, 'loss/train': 1.1393882036209106} -08/30/2021 22:14:41 - INFO - __main__ - Step 49887: {'lr': 0.00038159158521505255, 'samples': 9578304, 'steps': 49886, 'loss/train': 1.1316070556640625} -08/30/2021 22:14:41 - INFO - __main__ - Step 49888: {'lr': 0.0003815870730841683, 'samples': 9578496, 'steps': 49887, 'loss/train': 1.9979842901229858} -08/30/2021 22:14:41 - INFO - __main__ - Step 49889: {'lr': 0.00038158256089399287, 'samples': 9578688, 'steps': 49888, 'loss/train': 1.2268280982971191} -08/30/2021 22:14:42 - INFO - __main__ - Step 49890: {'lr': 0.0003815780486445284, 'samples': 9578880, 'steps': 49889, 'loss/train': 1.1332812309265137} -08/30/2021 22:14:43 - INFO - __main__ - Step 49891: {'lr': 0.00038157353633577686, 'samples': 9579072, 'steps': 49890, 'loss/train': 1.4598584175109863} -08/30/2021 22:14:44 - INFO - __main__ - Step 49892: {'lr': 0.0003815690239677403, 'samples': 9579264, 'steps': 49891, 'loss/train': 1.551299810409546} -08/30/2021 22:14:44 - INFO - __main__ - Step 49893: {'lr': 0.00038156451154042084, 'samples': 9579456, 'steps': 49892, 'loss/train': 2.0841121673583984} -08/30/2021 22:14:44 - INFO - __main__ - Step 49894: {'lr': 0.0003815599990538203, 'samples': 9579648, 'steps': 49893, 'loss/train': 3.4649205207824707} -08/30/2021 22:14:45 - INFO - __main__ - Step 49895: {'lr': 0.00038155548650794103, 'samples': 9579840, 'steps': 49894, 'loss/train': 0.7513778209686279} -08/30/2021 22:14:45 - INFO - __main__ - Step 49896: {'lr': 0.00038155097390278484, 'samples': 9580032, 'steps': 49895, 'loss/train': 0.6828315258026123} -08/30/2021 22:14:47 - INFO - __main__ - Step 49897: {'lr': 0.0003815464612383538, 'samples': 9580224, 'steps': 49896, 'loss/train': 1.1336301565170288} -08/30/2021 22:14:47 - INFO - __main__ - Step 49898: {'lr': 0.0003815419485146499, 'samples': 9580416, 'steps': 49897, 'loss/train': 1.6544756889343262} -08/30/2021 22:14:47 - INFO - __main__ - Step 49899: {'lr': 0.0003815374357316753, 'samples': 9580608, 'steps': 49898, 'loss/train': 0.8168324828147888} -08/30/2021 22:14:48 - INFO - __main__ - Step 49900: {'lr': 0.0003815329228894319, 'samples': 9580800, 'steps': 49899, 'loss/train': 1.5095332860946655} -08/30/2021 22:14:48 - INFO - __main__ - Step 49901: {'lr': 0.0003815284099879218, 'samples': 9580992, 'steps': 49900, 'loss/train': 1.1146937608718872} -08/30/2021 22:14:50 - INFO - __main__ - Step 49902: {'lr': 0.00038152389702714705, 'samples': 9581184, 'steps': 49901, 'loss/train': 1.2158877849578857} -08/30/2021 22:14:50 - INFO - __main__ - Step 49903: {'lr': 0.0003815193840071097, 'samples': 9581376, 'steps': 49902, 'loss/train': 1.292009711265564} -08/30/2021 22:14:50 - INFO - __main__ - Step 49904: {'lr': 0.0003815148709278117, 'samples': 9581568, 'steps': 49903, 'loss/train': 1.187833547592163} -08/30/2021 22:14:51 - INFO - __main__ - Step 49905: {'lr': 0.00038151035778925514, 'samples': 9581760, 'steps': 49904, 'loss/train': 1.393072247505188} -08/30/2021 22:14:51 - INFO - __main__ - Step 49906: {'lr': 0.000381505844591442, 'samples': 9581952, 'steps': 49905, 'loss/train': 1.677585244178772} -08/30/2021 22:14:53 - INFO - __main__ - Step 49907: {'lr': 0.0003815013313343744, 'samples': 9582144, 'steps': 49906, 'loss/train': 0.9656486511230469} -08/30/2021 22:14:53 - INFO - __main__ - Step 49908: {'lr': 0.0003814968180180544, 'samples': 9582336, 'steps': 49907, 'loss/train': 0.9414292573928833} -08/30/2021 22:14:54 - INFO - __main__ - Step 49909: {'lr': 0.00038149230464248386, 'samples': 9582528, 'steps': 49908, 'loss/train': 1.4174463748931885} -08/30/2021 22:14:54 - INFO - __main__ - Step 49910: {'lr': 0.000381487791207665, 'samples': 9582720, 'steps': 49909, 'loss/train': 1.4325464963912964} -08/30/2021 22:14:54 - INFO - __main__ - Step 49911: {'lr': 0.0003814832777135997, 'samples': 9582912, 'steps': 49910, 'loss/train': 1.3477137088775635} -08/30/2021 22:14:56 - INFO - __main__ - Step 49912: {'lr': 0.00038147876416029004, 'samples': 9583104, 'steps': 49911, 'loss/train': 1.5271865129470825} -08/30/2021 22:14:57 - INFO - __main__ - Step 49913: {'lr': 0.0003814742505477381, 'samples': 9583296, 'steps': 49912, 'loss/train': 1.6888169050216675} -08/30/2021 22:14:57 - INFO - __main__ - Step 49914: {'lr': 0.0003814697368759459, 'samples': 9583488, 'steps': 49913, 'loss/train': 1.732778787612915} -08/30/2021 22:14:57 - INFO - __main__ - Step 49915: {'lr': 0.0003814652231449155, 'samples': 9583680, 'steps': 49914, 'loss/train': 0.14118877053260803} -08/30/2021 22:14:58 - INFO - __main__ - Step 49916: {'lr': 0.0003814607093546489, 'samples': 9583872, 'steps': 49915, 'loss/train': 2.1029610633850098} -08/30/2021 22:14:58 - INFO - __main__ - Step 49917: {'lr': 0.0003814561955051481, 'samples': 9584064, 'steps': 49916, 'loss/train': 1.1900182962417603} -08/30/2021 22:15:00 - INFO - __main__ - Step 49918: {'lr': 0.00038145168159641515, 'samples': 9584256, 'steps': 49917, 'loss/train': 1.322786808013916} -08/30/2021 22:15:00 - INFO - __main__ - Step 49919: {'lr': 0.0003814471676284521, 'samples': 9584448, 'steps': 49918, 'loss/train': 1.9398250579833984} -08/30/2021 22:15:01 - INFO - __main__ - Step 49920: {'lr': 0.00038144265360126107, 'samples': 9584640, 'steps': 49919, 'loss/train': 0.888759434223175} -08/30/2021 22:15:01 - INFO - __main__ - Step 49921: {'lr': 0.00038143813951484396, 'samples': 9584832, 'steps': 49920, 'loss/train': 1.331196904182434} -08/30/2021 22:15:01 - INFO - __main__ - Step 49922: {'lr': 0.0003814336253692028, 'samples': 9585024, 'steps': 49921, 'loss/train': 1.416749119758606} -08/30/2021 22:15:03 - INFO - __main__ - Step 49923: {'lr': 0.0003814291111643397, 'samples': 9585216, 'steps': 49922, 'loss/train': 0.09901145100593567} -08/30/2021 22:15:03 - INFO - __main__ - Step 49924: {'lr': 0.00038142459690025665, 'samples': 9585408, 'steps': 49923, 'loss/train': 1.4845200777053833} -08/30/2021 22:15:04 - INFO - __main__ - Step 49925: {'lr': 0.0003814200825769558, 'samples': 9585600, 'steps': 49924, 'loss/train': 1.0127054452896118} -08/30/2021 22:15:04 - INFO - __main__ - Step 49926: {'lr': 0.000381415568194439, 'samples': 9585792, 'steps': 49925, 'loss/train': 2.016517162322998} -08/30/2021 22:15:04 - INFO - __main__ - Step 49927: {'lr': 0.00038141105375270846, 'samples': 9585984, 'steps': 49926, 'loss/train': 1.6244580745697021} -08/30/2021 22:15:06 - INFO - __main__ - Step 49928: {'lr': 0.00038140653925176606, 'samples': 9586176, 'steps': 49927, 'loss/train': 1.630874514579773} -08/30/2021 22:15:06 - INFO - __main__ - Step 49929: {'lr': 0.0003814020246916139, 'samples': 9586368, 'steps': 49928, 'loss/train': 0.8663868308067322} -08/30/2021 22:15:07 - INFO - __main__ - Step 49930: {'lr': 0.000381397510072254, 'samples': 9586560, 'steps': 49929, 'loss/train': 0.6792960166931152} -08/30/2021 22:15:07 - INFO - __main__ - Step 49931: {'lr': 0.0003813929953936884, 'samples': 9586752, 'steps': 49930, 'loss/train': 1.2131116390228271} -08/30/2021 22:15:07 - INFO - __main__ - Step 49932: {'lr': 0.00038138848065591923, 'samples': 9586944, 'steps': 49931, 'loss/train': 0.6229634881019592} -08/30/2021 22:15:09 - INFO - __main__ - Step 49933: {'lr': 0.00038138396585894843, 'samples': 9587136, 'steps': 49932, 'loss/train': 1.458230972290039} -08/30/2021 22:15:09 - INFO - __main__ - Step 49934: {'lr': 0.0003813794510027779, 'samples': 9587328, 'steps': 49933, 'loss/train': 0.5613172650337219} -08/30/2021 22:15:10 - INFO - __main__ - Step 49935: {'lr': 0.00038137493608741, 'samples': 9587520, 'steps': 49934, 'loss/train': 1.5147184133529663} -08/30/2021 22:15:10 - INFO - __main__ - Step 49936: {'lr': 0.0003813704211128465, 'samples': 9587712, 'steps': 49935, 'loss/train': 1.3081154823303223} -08/30/2021 22:15:10 - INFO - __main__ - Step 49937: {'lr': 0.0003813659060790895, 'samples': 9587904, 'steps': 49936, 'loss/train': 1.000442385673523} -08/30/2021 22:15:11 - INFO - __main__ - Step 49938: {'lr': 0.00038136139098614107, 'samples': 9588096, 'steps': 49937, 'loss/train': 1.4864379167556763} -08/30/2021 22:15:12 - INFO - __main__ - Step 49939: {'lr': 0.00038135687583400326, 'samples': 9588288, 'steps': 49938, 'loss/train': 1.852515697479248} -08/30/2021 22:15:13 - INFO - __main__ - Step 49940: {'lr': 0.000381352360622678, 'samples': 9588480, 'steps': 49939, 'loss/train': 1.3297425508499146} -08/30/2021 22:15:13 - INFO - __main__ - Step 49941: {'lr': 0.00038134784535216737, 'samples': 9588672, 'steps': 49940, 'loss/train': 1.7343114614486694} -08/30/2021 22:15:14 - INFO - __main__ - Step 49942: {'lr': 0.0003813433300224735, 'samples': 9588864, 'steps': 49941, 'loss/train': 0.04141373187303543} -08/30/2021 22:15:14 - INFO - __main__ - Step 49943: {'lr': 0.0003813388146335983, 'samples': 9589056, 'steps': 49942, 'loss/train': 1.479673981666565} -08/30/2021 22:15:14 - INFO - __main__ - Step 49944: {'lr': 0.00038133429918554395, 'samples': 9589248, 'steps': 49943, 'loss/train': 1.3206608295440674} -08/30/2021 22:15:16 - INFO - __main__ - Step 49945: {'lr': 0.00038132978367831226, 'samples': 9589440, 'steps': 49944, 'loss/train': 1.159934163093567} -08/30/2021 22:15:16 - INFO - __main__ - Step 49946: {'lr': 0.00038132526811190547, 'samples': 9589632, 'steps': 49945, 'loss/train': 0.05921933427453041} -08/30/2021 22:15:17 - INFO - __main__ - Step 49947: {'lr': 0.00038132075248632557, 'samples': 9589824, 'steps': 49946, 'loss/train': 2.090723991394043} -08/30/2021 22:15:17 - INFO - __main__ - Step 49948: {'lr': 0.0003813162368015745, 'samples': 9590016, 'steps': 49947, 'loss/train': 1.540015697479248} -08/30/2021 22:15:17 - INFO - __main__ - Step 49949: {'lr': 0.00038131172105765446, 'samples': 9590208, 'steps': 49948, 'loss/train': 1.2368717193603516} -08/30/2021 22:15:19 - INFO - __main__ - Step 49950: {'lr': 0.0003813072052545673, 'samples': 9590400, 'steps': 49949, 'loss/train': 1.4749137163162231} -08/30/2021 22:15:19 - INFO - __main__ - Step 49951: {'lr': 0.00038130268939231513, 'samples': 9590592, 'steps': 49950, 'loss/train': 1.6987398862838745} -08/30/2021 22:15:20 - INFO - __main__ - Step 49952: {'lr': 0.0003812981734709, 'samples': 9590784, 'steps': 49951, 'loss/train': 1.3168388605117798} -08/30/2021 22:15:20 - INFO - __main__ - Step 49953: {'lr': 0.00038129365749032395, 'samples': 9590976, 'steps': 49952, 'loss/train': 1.61680006980896} -08/30/2021 22:15:20 - INFO - __main__ - Step 49954: {'lr': 0.000381289141450589, 'samples': 9591168, 'steps': 49953, 'loss/train': 1.9050722122192383} -08/30/2021 22:15:21 - INFO - __main__ - Step 49955: {'lr': 0.00038128462535169715, 'samples': 9591360, 'steps': 49954, 'loss/train': 1.700305461883545} -08/30/2021 22:15:22 - INFO - __main__ - Step 49956: {'lr': 0.00038128010919365066, 'samples': 9591552, 'steps': 49955, 'loss/train': 1.3154253959655762} -08/30/2021 22:15:23 - INFO - __main__ - Step 49957: {'lr': 0.0003812755929764512, 'samples': 9591744, 'steps': 49956, 'loss/train': 0.9426714181900024} -08/30/2021 22:15:23 - INFO - __main__ - Step 49958: {'lr': 0.000381271076700101, 'samples': 9591936, 'steps': 49957, 'loss/train': 0.10984140634536743} -08/30/2021 22:15:24 - INFO - __main__ - Step 49959: {'lr': 0.00038126656036460206, 'samples': 9592128, 'steps': 49958, 'loss/train': 0.8538442254066467} -08/30/2021 22:15:24 - INFO - __main__ - Step 49960: {'lr': 0.0003812620439699565, 'samples': 9592320, 'steps': 49959, 'loss/train': 1.570562720298767} -08/30/2021 22:15:26 - INFO - __main__ - Step 49961: {'lr': 0.00038125752751616625, 'samples': 9592512, 'steps': 49960, 'loss/train': 0.10712048411369324} -08/30/2021 22:15:27 - INFO - __main__ - Step 49962: {'lr': 0.00038125301100323344, 'samples': 9592704, 'steps': 49961, 'loss/train': 0.9405786991119385} -08/30/2021 22:15:27 - INFO - __main__ - Step 49963: {'lr': 0.00038124849443116, 'samples': 9592896, 'steps': 49962, 'loss/train': 1.2084598541259766} -08/30/2021 22:15:28 - INFO - __main__ - Step 49964: {'lr': 0.000381243977799948, 'samples': 9593088, 'steps': 49963, 'loss/train': 1.7010899782180786} -08/30/2021 22:15:28 - INFO - __main__ - Step 49965: {'lr': 0.0003812394611095995, 'samples': 9593280, 'steps': 49964, 'loss/train': 1.2085901498794556} -08/30/2021 22:15:30 - INFO - __main__ - Step 49966: {'lr': 0.0003812349443601165, 'samples': 9593472, 'steps': 49965, 'loss/train': 1.409525752067566} -08/30/2021 22:15:30 - INFO - __main__ - Step 49967: {'lr': 0.0003812304275515012, 'samples': 9593664, 'steps': 49966, 'loss/train': 1.1673520803451538} -08/30/2021 22:15:31 - INFO - __main__ - Step 49968: {'lr': 0.00038122591068375536, 'samples': 9593856, 'steps': 49967, 'loss/train': 0.3900246024131775} -08/30/2021 22:15:31 - INFO - __main__ - Step 49969: {'lr': 0.00038122139375688116, 'samples': 9594048, 'steps': 49968, 'loss/train': 1.0771349668502808} -08/30/2021 22:15:32 - INFO - __main__ - Step 49970: {'lr': 0.0003812168767708807, 'samples': 9594240, 'steps': 49969, 'loss/train': 0.16064275801181793} -08/30/2021 22:15:32 - INFO - __main__ - Step 49971: {'lr': 0.0003812123597257559, 'samples': 9594432, 'steps': 49970, 'loss/train': 1.4943517446517944} -08/30/2021 22:15:33 - INFO - __main__ - Step 49972: {'lr': 0.00038120784262150875, 'samples': 9594624, 'steps': 49971, 'loss/train': 0.05315021425485611} -08/30/2021 22:15:34 - INFO - __main__ - Step 49973: {'lr': 0.0003812033254581414, 'samples': 9594816, 'steps': 49972, 'loss/train': 2.0069777965545654} -08/30/2021 22:15:34 - INFO - __main__ - Step 49974: {'lr': 0.0003811988082356559, 'samples': 9595008, 'steps': 49973, 'loss/train': 1.4596290588378906} -08/30/2021 22:15:34 - INFO - __main__ - Step 49975: {'lr': 0.0003811942909540542, 'samples': 9595200, 'steps': 49974, 'loss/train': 1.361367106437683} -08/30/2021 22:15:35 - INFO - __main__ - Step 49976: {'lr': 0.0003811897736133385, 'samples': 9595392, 'steps': 49975, 'loss/train': 1.651120901107788} -08/30/2021 22:15:36 - INFO - __main__ - Step 49977: {'lr': 0.0003811852562135106, 'samples': 9595584, 'steps': 49976, 'loss/train': 1.5983085632324219} -08/30/2021 22:15:37 - INFO - __main__ - Step 49978: {'lr': 0.0003811807387545727, 'samples': 9595776, 'steps': 49977, 'loss/train': 1.715244174003601} -08/30/2021 22:15:37 - INFO - __main__ - Step 49979: {'lr': 0.0003811762212365267, 'samples': 9595968, 'steps': 49978, 'loss/train': 1.5426217317581177} -08/30/2021 22:15:37 - INFO - __main__ - Step 49980: {'lr': 0.0003811717036593748, 'samples': 9596160, 'steps': 49979, 'loss/train': 1.709546685218811} -08/30/2021 22:15:38 - INFO - __main__ - Step 49981: {'lr': 0.00038116718602311896, 'samples': 9596352, 'steps': 49980, 'loss/train': 1.6222771406173706} -08/30/2021 22:15:39 - INFO - __main__ - Step 49982: {'lr': 0.00038116266832776113, 'samples': 9596544, 'steps': 49981, 'loss/train': 1.7393566370010376} -08/30/2021 22:15:40 - INFO - __main__ - Step 49983: {'lr': 0.0003811581505733035, 'samples': 9596736, 'steps': 49982, 'loss/train': 1.9680745601654053} -08/30/2021 22:15:40 - INFO - __main__ - Step 49984: {'lr': 0.000381153632759748, 'samples': 9596928, 'steps': 49983, 'loss/train': 1.2211098670959473} -08/30/2021 22:15:40 - INFO - __main__ - Step 49985: {'lr': 0.0003811491148870967, 'samples': 9597120, 'steps': 49984, 'loss/train': 1.4524140357971191} -08/30/2021 22:15:41 - INFO - __main__ - Step 49986: {'lr': 0.0003811445969553516, 'samples': 9597312, 'steps': 49985, 'loss/train': 1.1627111434936523} -08/30/2021 22:15:42 - INFO - __main__ - Step 49987: {'lr': 0.00038114007896451486, 'samples': 9597504, 'steps': 49986, 'loss/train': 1.5767033100128174} -08/30/2021 22:15:43 - INFO - __main__ - Step 49988: {'lr': 0.0003811355609145883, 'samples': 9597696, 'steps': 49987, 'loss/train': 1.5722547769546509} -08/30/2021 22:15:43 - INFO - __main__ - Step 49989: {'lr': 0.0003811310428055742, 'samples': 9597888, 'steps': 49988, 'loss/train': 0.6168616414070129} -08/30/2021 22:15:43 - INFO - __main__ - Step 49990: {'lr': 0.00038112652463747444, 'samples': 9598080, 'steps': 49989, 'loss/train': 1.0592572689056396} -08/30/2021 22:15:44 - INFO - __main__ - Step 49991: {'lr': 0.00038112200641029104, 'samples': 9598272, 'steps': 49990, 'loss/train': 1.398459792137146} -08/30/2021 22:15:45 - INFO - __main__ - Step 49992: {'lr': 0.00038111748812402616, 'samples': 9598464, 'steps': 49991, 'loss/train': 0.803909957408905} -08/30/2021 22:15:46 - INFO - __main__ - Step 49993: {'lr': 0.0003811129697786817, 'samples': 9598656, 'steps': 49992, 'loss/train': 1.50918710231781} -08/30/2021 22:15:46 - INFO - __main__ - Step 49994: {'lr': 0.00038110845137425976, 'samples': 9598848, 'steps': 49993, 'loss/train': 1.0690501928329468} -08/30/2021 22:15:46 - INFO - __main__ - Step 49995: {'lr': 0.0003811039329107624, 'samples': 9599040, 'steps': 49994, 'loss/train': 1.7483011484146118} -08/30/2021 22:15:47 - INFO - __main__ - Step 49996: {'lr': 0.00038109941438819165, 'samples': 9599232, 'steps': 49995, 'loss/train': 1.6299405097961426} -08/30/2021 22:15:47 - INFO - __main__ - Step 49997: {'lr': 0.00038109489580654955, 'samples': 9599424, 'steps': 49996, 'loss/train': 0.7644880414009094} -08/30/2021 22:15:49 - INFO - __main__ - Step 49998: {'lr': 0.00038109037716583806, 'samples': 9599616, 'steps': 49997, 'loss/train': 1.2841774225234985} -08/30/2021 22:15:50 - INFO - __main__ - Step 49999: {'lr': 0.0003810858584660593, 'samples': 9599808, 'steps': 49998, 'loss/train': 1.5746294260025024} -08/30/2021 22:15:50 - INFO - __main__ - Step 50000: {'lr': 0.0003810813397072152, 'samples': 9600000, 'steps': 49999, 'loss/train': 1.3064301013946533} -08/30/2021 22:15:50 - INFO - __main__ - Step 50001: {'lr': 0.00038107682088930797, 'samples': 9600192, 'steps': 50000, 'loss/train': 1.0298306941986084} -08/30/2021 22:15:51 - INFO - __main__ - Step 50002: {'lr': 0.00038107230201233944, 'samples': 9600384, 'steps': 50001, 'loss/train': 0.0941631868481636} -08/30/2021 22:15:52 - INFO - __main__ - Step 50003: {'lr': 0.00038106778307631187, 'samples': 9600576, 'steps': 50002, 'loss/train': 0.1259710192680359} -08/30/2021 22:15:53 - INFO - __main__ - Step 50004: {'lr': 0.0003810632640812271, 'samples': 9600768, 'steps': 50003, 'loss/train': 1.1675041913986206} -08/30/2021 22:15:53 - INFO - __main__ - Step 50005: {'lr': 0.00038105874502708726, 'samples': 9600960, 'steps': 50004, 'loss/train': 1.560531735420227} -08/30/2021 22:15:53 - INFO - __main__ - Step 50006: {'lr': 0.0003810542259138944, 'samples': 9601152, 'steps': 50005, 'loss/train': 1.4806926250457764} -08/30/2021 22:15:54 - INFO - __main__ - Step 50007: {'lr': 0.0003810497067416505, 'samples': 9601344, 'steps': 50006, 'loss/train': 1.1481035947799683} -08/30/2021 22:15:55 - INFO - __main__ - Step 50008: {'lr': 0.0003810451875103576, 'samples': 9601536, 'steps': 50007, 'loss/train': 1.7544904947280884} -08/30/2021 22:15:56 - INFO - __main__ - Step 50009: {'lr': 0.0003810406682200178, 'samples': 9601728, 'steps': 50008, 'loss/train': 1.4128069877624512} -08/30/2021 22:15:56 - INFO - __main__ - Step 50010: {'lr': 0.0003810361488706331, 'samples': 9601920, 'steps': 50009, 'loss/train': 0.9419867396354675} -08/30/2021 22:15:56 - INFO - __main__ - Step 50011: {'lr': 0.0003810316294622056, 'samples': 9602112, 'steps': 50010, 'loss/train': 0.8903459906578064} -08/30/2021 22:15:57 - INFO - __main__ - Step 50012: {'lr': 0.0003810271099947371, 'samples': 9602304, 'steps': 50011, 'loss/train': 1.6325072050094604} -08/30/2021 22:15:59 - INFO - __main__ - Step 50013: {'lr': 0.00038102259046822993, 'samples': 9602496, 'steps': 50012, 'loss/train': 1.376466155052185} -08/30/2021 22:15:59 - INFO - __main__ - Step 50014: {'lr': 0.00038101807088268595, 'samples': 9602688, 'steps': 50013, 'loss/train': 1.5262771844863892} -08/30/2021 22:16:00 - INFO - __main__ - Step 50015: {'lr': 0.00038101355123810733, 'samples': 9602880, 'steps': 50014, 'loss/train': 1.2302452325820923} -08/30/2021 22:16:00 - INFO - __main__ - Step 50016: {'lr': 0.00038100903153449596, 'samples': 9603072, 'steps': 50015, 'loss/train': 1.1891863346099854} -08/30/2021 22:16:00 - INFO - __main__ - Step 50017: {'lr': 0.00038100451177185395, 'samples': 9603264, 'steps': 50016, 'loss/train': 1.2596502304077148} -08/30/2021 22:16:02 - INFO - __main__ - Step 50018: {'lr': 0.0003809999919501833, 'samples': 9603456, 'steps': 50017, 'loss/train': 1.7209770679473877} -08/30/2021 22:16:03 - INFO - __main__ - Step 50019: {'lr': 0.00038099547206948617, 'samples': 9603648, 'steps': 50018, 'loss/train': 1.014421820640564} -08/30/2021 22:16:03 - INFO - __main__ - Step 50020: {'lr': 0.0003809909521297644, 'samples': 9603840, 'steps': 50019, 'loss/train': 1.2036447525024414} -08/30/2021 22:16:03 - INFO - __main__ - Step 50021: {'lr': 0.00038098643213102014, 'samples': 9604032, 'steps': 50020, 'loss/train': 0.49280133843421936} -08/30/2021 22:16:04 - INFO - __main__ - Step 50022: {'lr': 0.0003809819120732554, 'samples': 9604224, 'steps': 50021, 'loss/train': 1.688100814819336} -08/30/2021 22:16:04 - INFO - __main__ - Step 50023: {'lr': 0.00038097739195647233, 'samples': 9604416, 'steps': 50022, 'loss/train': 1.0814008712768555} -08/30/2021 22:16:05 - INFO - __main__ - Step 50024: {'lr': 0.0003809728717806728, 'samples': 9604608, 'steps': 50023, 'loss/train': 0.11027158796787262} -08/30/2021 22:16:06 - INFO - __main__ - Step 50025: {'lr': 0.00038096835154585897, 'samples': 9604800, 'steps': 50024, 'loss/train': 1.3086692094802856} -08/30/2021 22:16:06 - INFO - __main__ - Step 50026: {'lr': 0.0003809638312520327, 'samples': 9604992, 'steps': 50025, 'loss/train': 1.3395917415618896} -08/30/2021 22:16:07 - INFO - __main__ - Step 50027: {'lr': 0.0003809593108991962, 'samples': 9605184, 'steps': 50026, 'loss/train': 1.5631290674209595} -08/30/2021 22:16:07 - INFO - __main__ - Step 50028: {'lr': 0.0003809547904873515, 'samples': 9605376, 'steps': 50027, 'loss/train': 1.7063641548156738} -08/30/2021 22:16:09 - INFO - __main__ - Step 50029: {'lr': 0.0003809502700165006, 'samples': 9605568, 'steps': 50028, 'loss/train': 1.2550994157791138} -08/30/2021 22:16:09 - INFO - __main__ - Step 50030: {'lr': 0.00038094574948664554, 'samples': 9605760, 'steps': 50029, 'loss/train': 0.6143820881843567} -08/30/2021 22:16:10 - INFO - __main__ - Step 50031: {'lr': 0.00038094122889778824, 'samples': 9605952, 'steps': 50030, 'loss/train': 0.872804582118988} -08/30/2021 22:16:10 - INFO - __main__ - Step 50032: {'lr': 0.000380936708249931, 'samples': 9606144, 'steps': 50031, 'loss/train': 1.2021774053573608} -08/30/2021 22:16:10 - INFO - __main__ - Step 50033: {'lr': 0.0003809321875430756, 'samples': 9606336, 'steps': 50032, 'loss/train': 1.6694682836532593} -08/30/2021 22:16:12 - INFO - __main__ - Step 50034: {'lr': 0.0003809276667772241, 'samples': 9606528, 'steps': 50033, 'loss/train': 2.275981903076172} -08/30/2021 22:16:12 - INFO - __main__ - Step 50035: {'lr': 0.00038092314595237873, 'samples': 9606720, 'steps': 50034, 'loss/train': 1.3710722923278809} -08/30/2021 22:16:13 - INFO - __main__ - Step 50036: {'lr': 0.0003809186250685414, 'samples': 9606912, 'steps': 50035, 'loss/train': 1.6243427991867065} -08/30/2021 22:16:13 - INFO - __main__ - Step 50037: {'lr': 0.0003809141041257141, 'samples': 9607104, 'steps': 50036, 'loss/train': 0.24902775883674622} -08/30/2021 22:16:13 - INFO - __main__ - Step 50038: {'lr': 0.000380909583123899, 'samples': 9607296, 'steps': 50037, 'loss/train': 1.0140602588653564} -08/30/2021 22:16:14 - INFO - __main__ - Step 50039: {'lr': 0.00038090506206309805, 'samples': 9607488, 'steps': 50038, 'loss/train': 1.3978636264801025} -08/30/2021 22:16:16 - INFO - __main__ - Step 50040: {'lr': 0.00038090054094331324, 'samples': 9607680, 'steps': 50039, 'loss/train': 1.7784162759780884} -08/30/2021 22:16:16 - INFO - __main__ - Step 50041: {'lr': 0.0003808960197645467, 'samples': 9607872, 'steps': 50040, 'loss/train': 1.0483201742172241} -08/30/2021 22:16:16 - INFO - __main__ - Step 50042: {'lr': 0.00038089149852680036, 'samples': 9608064, 'steps': 50041, 'loss/train': 1.3781033754348755} -08/30/2021 22:16:17 - INFO - __main__ - Step 50043: {'lr': 0.00038088697723007647, 'samples': 9608256, 'steps': 50042, 'loss/train': 1.945577621459961} -08/30/2021 22:16:17 - INFO - __main__ - Step 50044: {'lr': 0.00038088245587437685, 'samples': 9608448, 'steps': 50043, 'loss/train': 0.03787803649902344} -08/30/2021 22:16:17 - INFO - __main__ - Step 50045: {'lr': 0.00038087793445970363, 'samples': 9608640, 'steps': 50044, 'loss/train': 1.1329152584075928} -08/30/2021 22:16:19 - INFO - __main__ - Step 50046: {'lr': 0.0003808734129860588, 'samples': 9608832, 'steps': 50045, 'loss/train': 1.4633455276489258} -08/30/2021 22:16:20 - INFO - __main__ - Step 50047: {'lr': 0.0003808688914534445, 'samples': 9609024, 'steps': 50046, 'loss/train': 0.5694299340248108} -08/30/2021 22:16:20 - INFO - __main__ - Step 50048: {'lr': 0.00038086436986186267, 'samples': 9609216, 'steps': 50047, 'loss/train': 1.269545555114746} -08/30/2021 22:16:20 - INFO - __main__ - Step 50049: {'lr': 0.00038085984821131536, 'samples': 9609408, 'steps': 50048, 'loss/train': 1.433971643447876} -08/30/2021 22:16:21 - INFO - __main__ - Step 50050: {'lr': 0.00038085532650180464, 'samples': 9609600, 'steps': 50049, 'loss/train': 1.0071122646331787} -08/30/2021 22:16:22 - INFO - __main__ - Step 50051: {'lr': 0.0003808508047333325, 'samples': 9609792, 'steps': 50050, 'loss/train': 0.8194466829299927} -08/30/2021 22:16:23 - INFO - __main__ - Step 50052: {'lr': 0.000380846282905901, 'samples': 9609984, 'steps': 50051, 'loss/train': 1.3815641403198242} -08/30/2021 22:16:23 - INFO - __main__ - Step 50053: {'lr': 0.0003808417610195122, 'samples': 9610176, 'steps': 50052, 'loss/train': 1.128920078277588} -08/30/2021 22:16:23 - INFO - __main__ - Step 50054: {'lr': 0.0003808372390741681, 'samples': 9610368, 'steps': 50053, 'loss/train': 0.8643597960472107} -08/30/2021 22:16:24 - INFO - __main__ - Step 50055: {'lr': 0.0003808327170698708, 'samples': 9610560, 'steps': 50054, 'loss/train': 1.538956642150879} -08/30/2021 22:16:25 - INFO - __main__ - Step 50056: {'lr': 0.0003808281950066223, 'samples': 9610752, 'steps': 50055, 'loss/train': 1.0728232860565186} -08/30/2021 22:16:26 - INFO - __main__ - Step 50057: {'lr': 0.0003808236728844246, 'samples': 9610944, 'steps': 50056, 'loss/train': 1.6719036102294922} -08/30/2021 22:16:26 - INFO - __main__ - Step 50058: {'lr': 0.0003808191507032798, 'samples': 9611136, 'steps': 50057, 'loss/train': 1.0060703754425049} -08/30/2021 22:16:26 - INFO - __main__ - Step 50059: {'lr': 0.00038081462846318984, 'samples': 9611328, 'steps': 50058, 'loss/train': 1.6246259212493896} -08/30/2021 22:16:27 - INFO - __main__ - Step 50060: {'lr': 0.000380810106164157, 'samples': 9611520, 'steps': 50059, 'loss/train': 1.2512034177780151} -08/30/2021 22:16:28 - INFO - __main__ - Step 50061: {'lr': 0.000380805583806183, 'samples': 9611712, 'steps': 50060, 'loss/train': 1.6808745861053467} -08/30/2021 22:16:29 - INFO - __main__ - Step 50062: {'lr': 0.00038080106138927, 'samples': 9611904, 'steps': 50061, 'loss/train': 0.9136414527893066} -08/30/2021 22:16:29 - INFO - __main__ - Step 50063: {'lr': 0.00038079653891342016, 'samples': 9612096, 'steps': 50062, 'loss/train': 2.0557808876037598} -08/30/2021 22:16:29 - INFO - __main__ - Step 50064: {'lr': 0.0003807920163786353, 'samples': 9612288, 'steps': 50063, 'loss/train': 1.7106549739837646} -08/30/2021 22:16:30 - INFO - __main__ - Step 50065: {'lr': 0.00038078749378491763, 'samples': 9612480, 'steps': 50064, 'loss/train': 1.437264323234558} -08/30/2021 22:16:31 - INFO - __main__ - Step 50066: {'lr': 0.00038078297113226925, 'samples': 9612672, 'steps': 50065, 'loss/train': 1.0924086570739746} -08/30/2021 22:16:32 - INFO - __main__ - Step 50067: {'lr': 0.00038077844842069193, 'samples': 9612864, 'steps': 50066, 'loss/train': 1.2689344882965088} -08/30/2021 22:16:32 - INFO - __main__ - Step 50068: {'lr': 0.00038077392565018784, 'samples': 9613056, 'steps': 50067, 'loss/train': 1.675586462020874} -08/30/2021 22:16:32 - INFO - __main__ - Step 50069: {'lr': 0.0003807694028207591, 'samples': 9613248, 'steps': 50068, 'loss/train': 1.4385607242584229} -08/30/2021 22:16:33 - INFO - __main__ - Step 50070: {'lr': 0.0003807648799324077, 'samples': 9613440, 'steps': 50069, 'loss/train': 1.1776790618896484} -08/30/2021 22:16:33 - INFO - __main__ - Step 50071: {'lr': 0.0003807603569851357, 'samples': 9613632, 'steps': 50070, 'loss/train': 0.06844732910394669} -08/30/2021 22:16:36 - INFO - __main__ - Step 50072: {'lr': 0.0003807558339789451, 'samples': 9613824, 'steps': 50071, 'loss/train': 1.8619381189346313} -08/30/2021 22:16:36 - INFO - __main__ - Step 50073: {'lr': 0.00038075131091383783, 'samples': 9614016, 'steps': 50072, 'loss/train': 1.88219153881073} -08/30/2021 22:16:37 - INFO - __main__ - Step 50074: {'lr': 0.0003807467877898161, 'samples': 9614208, 'steps': 50073, 'loss/train': 1.1046810150146484} -08/30/2021 22:16:37 - INFO - __main__ - Step 50075: {'lr': 0.00038074226460688186, 'samples': 9614400, 'steps': 50074, 'loss/train': 0.528259813785553} -08/30/2021 22:16:38 - INFO - __main__ - Step 50076: {'lr': 0.0003807377413650372, 'samples': 9614592, 'steps': 50075, 'loss/train': 0.4769894778728485} -08/30/2021 22:16:38 - INFO - __main__ - Step 50077: {'lr': 0.0003807332180642842, 'samples': 9614784, 'steps': 50076, 'loss/train': 1.3407303094863892} -08/30/2021 22:16:39 - INFO - __main__ - Step 50078: {'lr': 0.00038072869470462465, 'samples': 9614976, 'steps': 50077, 'loss/train': 0.6660121083259583} -08/30/2021 22:16:40 - INFO - __main__ - Step 50079: {'lr': 0.00038072417128606095, 'samples': 9615168, 'steps': 50078, 'loss/train': 1.3219343423843384} -08/30/2021 22:16:40 - INFO - __main__ - Step 50080: {'lr': 0.00038071964780859486, 'samples': 9615360, 'steps': 50079, 'loss/train': 1.218739628791809} -08/30/2021 22:16:41 - INFO - __main__ - Step 50081: {'lr': 0.0003807151242722285, 'samples': 9615552, 'steps': 50080, 'loss/train': 1.5216811895370483} -08/30/2021 22:16:41 - INFO - __main__ - Step 50082: {'lr': 0.00038071060067696393, 'samples': 9615744, 'steps': 50081, 'loss/train': 1.7325550317764282} -08/30/2021 22:16:43 - INFO - __main__ - Step 50083: {'lr': 0.00038070607702280325, 'samples': 9615936, 'steps': 50082, 'loss/train': 1.2911477088928223} -08/30/2021 22:16:43 - INFO - __main__ - Step 50084: {'lr': 0.00038070155330974844, 'samples': 9616128, 'steps': 50083, 'loss/train': 1.4418026208877563} -08/30/2021 22:16:43 - INFO - __main__ - Step 50085: {'lr': 0.0003806970295378014, 'samples': 9616320, 'steps': 50084, 'loss/train': 1.720677375793457} -08/30/2021 22:16:44 - INFO - __main__ - Step 50086: {'lr': 0.00038069250570696433, 'samples': 9616512, 'steps': 50085, 'loss/train': 1.7577153444290161} -08/30/2021 22:16:44 - INFO - __main__ - Step 50087: {'lr': 0.00038068798181723927, 'samples': 9616704, 'steps': 50086, 'loss/train': 1.112426996231079} -08/30/2021 22:16:46 - INFO - __main__ - Step 50088: {'lr': 0.00038068345786862825, 'samples': 9616896, 'steps': 50087, 'loss/train': 1.7923065423965454} -08/30/2021 22:16:46 - INFO - __main__ - Step 50089: {'lr': 0.0003806789338611333, 'samples': 9617088, 'steps': 50088, 'loss/train': 1.0503278970718384} -08/30/2021 22:16:47 - INFO - __main__ - Step 50090: {'lr': 0.00038067440979475635, 'samples': 9617280, 'steps': 50089, 'loss/train': 1.3894175291061401} -08/30/2021 22:16:47 - INFO - __main__ - Step 50091: {'lr': 0.0003806698856694996, 'samples': 9617472, 'steps': 50090, 'loss/train': 1.0337897539138794} -08/30/2021 22:16:47 - INFO - __main__ - Step 50092: {'lr': 0.00038066536148536495, 'samples': 9617664, 'steps': 50091, 'loss/train': 0.5578261613845825} -08/30/2021 22:16:48 - INFO - __main__ - Step 50093: {'lr': 0.00038066083724235455, 'samples': 9617856, 'steps': 50092, 'loss/train': 1.3270683288574219} -08/30/2021 22:16:49 - INFO - __main__ - Step 50094: {'lr': 0.00038065631294047035, 'samples': 9618048, 'steps': 50093, 'loss/train': 1.4695450067520142} -08/30/2021 22:16:50 - INFO - __main__ - Step 50095: {'lr': 0.0003806517885797145, 'samples': 9618240, 'steps': 50094, 'loss/train': 1.1843640804290771} -08/30/2021 22:16:50 - INFO - __main__ - Step 50096: {'lr': 0.0003806472641600889, 'samples': 9618432, 'steps': 50095, 'loss/train': 0.98862624168396} -08/30/2021 22:16:50 - INFO - __main__ - Step 50097: {'lr': 0.00038064273968159575, 'samples': 9618624, 'steps': 50096, 'loss/train': 1.46336030960083} -08/30/2021 22:16:51 - INFO - __main__ - Step 50098: {'lr': 0.00038063821514423694, 'samples': 9618816, 'steps': 50097, 'loss/train': 1.015445590019226} -08/30/2021 22:16:52 - INFO - __main__ - Step 50099: {'lr': 0.00038063369054801456, 'samples': 9619008, 'steps': 50098, 'loss/train': 2.0989749431610107} -08/30/2021 22:16:53 - INFO - __main__ - Step 50100: {'lr': 0.00038062916589293064, 'samples': 9619200, 'steps': 50099, 'loss/train': 0.8163864612579346} -08/30/2021 22:16:53 - INFO - __main__ - Step 50101: {'lr': 0.0003806246411789872, 'samples': 9619392, 'steps': 50100, 'loss/train': 1.8185945749282837} -08/30/2021 22:16:53 - INFO - __main__ - Step 50102: {'lr': 0.00038062011640618636, 'samples': 9619584, 'steps': 50101, 'loss/train': 1.1335031986236572} -08/30/2021 22:16:54 - INFO - __main__ - Step 50103: {'lr': 0.00038061559157453014, 'samples': 9619776, 'steps': 50102, 'loss/train': 1.093127727508545} -08/30/2021 22:16:55 - INFO - __main__ - Step 50104: {'lr': 0.00038061106668402055, 'samples': 9619968, 'steps': 50103, 'loss/train': 0.33705976605415344} -08/30/2021 22:16:56 - INFO - __main__ - Step 50105: {'lr': 0.0003806065417346596, 'samples': 9620160, 'steps': 50104, 'loss/train': 1.2665024995803833} -08/30/2021 22:16:56 - INFO - __main__ - Step 50106: {'lr': 0.00038060201672644934, 'samples': 9620352, 'steps': 50105, 'loss/train': 1.192352294921875} -08/30/2021 22:16:56 - INFO - __main__ - Step 50107: {'lr': 0.00038059749165939184, 'samples': 9620544, 'steps': 50106, 'loss/train': 1.0885837078094482} -08/30/2021 22:16:57 - INFO - __main__ - Step 50108: {'lr': 0.00038059296653348917, 'samples': 9620736, 'steps': 50107, 'loss/train': 1.464859962463379} -08/30/2021 22:16:58 - INFO - __main__ - Step 50109: {'lr': 0.00038058844134874326, 'samples': 9620928, 'steps': 50108, 'loss/train': 0.5432927012443542} -08/30/2021 22:16:59 - INFO - __main__ - Step 50110: {'lr': 0.0003805839161051563, 'samples': 9621120, 'steps': 50109, 'loss/train': 1.8091411590576172} -08/30/2021 22:16:59 - INFO - __main__ - Step 50111: {'lr': 0.00038057939080273016, 'samples': 9621312, 'steps': 50110, 'loss/train': 1.6873996257781982} -08/30/2021 22:16:59 - INFO - __main__ - Step 50112: {'lr': 0.00038057486544146703, 'samples': 9621504, 'steps': 50111, 'loss/train': 1.5108884572982788} -08/30/2021 22:17:00 - INFO - __main__ - Step 50113: {'lr': 0.0003805703400213688, 'samples': 9621696, 'steps': 50112, 'loss/train': 0.902436375617981} -08/30/2021 22:17:01 - INFO - __main__ - Step 50114: {'lr': 0.0003805658145424376, 'samples': 9621888, 'steps': 50113, 'loss/train': 1.0551910400390625} -08/30/2021 22:17:02 - INFO - __main__ - Step 50115: {'lr': 0.00038056128900467546, 'samples': 9622080, 'steps': 50114, 'loss/train': 0.05183906480669975} -08/30/2021 22:17:02 - INFO - __main__ - Step 50116: {'lr': 0.00038055676340808446, 'samples': 9622272, 'steps': 50115, 'loss/train': 1.3731881380081177} -08/30/2021 22:17:03 - INFO - __main__ - Step 50117: {'lr': 0.00038055223775266666, 'samples': 9622464, 'steps': 50116, 'loss/train': 1.4042104482650757} -08/30/2021 22:17:03 - INFO - __main__ - Step 50118: {'lr': 0.0003805477120384239, 'samples': 9622656, 'steps': 50117, 'loss/train': 1.8434213399887085} -08/30/2021 22:17:04 - INFO - __main__ - Step 50119: {'lr': 0.00038054318626535845, 'samples': 9622848, 'steps': 50118, 'loss/train': 0.9863468408584595} -08/30/2021 22:17:05 - INFO - __main__ - Step 50120: {'lr': 0.00038053866043347216, 'samples': 9623040, 'steps': 50119, 'loss/train': 1.615834355354309} -08/30/2021 22:17:05 - INFO - __main__ - Step 50121: {'lr': 0.00038053413454276725, 'samples': 9623232, 'steps': 50120, 'loss/train': 2.0354504585266113} -08/30/2021 22:17:06 - INFO - __main__ - Step 50122: {'lr': 0.00038052960859324557, 'samples': 9623424, 'steps': 50121, 'loss/train': 0.7636065483093262} -08/30/2021 22:17:06 - INFO - __main__ - Step 50123: {'lr': 0.0003805250825849094, 'samples': 9623616, 'steps': 50122, 'loss/train': 1.6923234462738037} -08/30/2021 22:17:08 - INFO - __main__ - Step 50124: {'lr': 0.0003805205565177606, 'samples': 9623808, 'steps': 50123, 'loss/train': 1.1398009061813354} -08/30/2021 22:17:08 - INFO - __main__ - Step 50125: {'lr': 0.0003805160303918013, 'samples': 9624000, 'steps': 50124, 'loss/train': 0.85948246717453} -08/30/2021 22:17:09 - INFO - __main__ - Step 50126: {'lr': 0.0003805115042070333, 'samples': 9624192, 'steps': 50125, 'loss/train': 1.2117767333984375} -08/30/2021 22:17:09 - INFO - __main__ - Step 50127: {'lr': 0.000380506977963459, 'samples': 9624384, 'steps': 50126, 'loss/train': 1.723537564277649} -08/30/2021 22:17:09 - INFO - __main__ - Step 50128: {'lr': 0.00038050245166108024, 'samples': 9624576, 'steps': 50127, 'loss/train': 1.4526232481002808} -08/30/2021 22:17:11 - INFO - __main__ - Step 50129: {'lr': 0.000380497925299899, 'samples': 9624768, 'steps': 50128, 'loss/train': 1.0510504245758057} -08/30/2021 22:17:12 - INFO - __main__ - Step 50130: {'lr': 0.0003804933988799175, 'samples': 9624960, 'steps': 50129, 'loss/train': 0.7681604623794556} -08/30/2021 22:17:12 - INFO - __main__ - Step 50131: {'lr': 0.0003804888724011377, 'samples': 9625152, 'steps': 50130, 'loss/train': 1.7104781866073608} -08/30/2021 22:17:12 - INFO - __main__ - Step 50132: {'lr': 0.00038048434586356164, 'samples': 9625344, 'steps': 50131, 'loss/train': 0.9986642599105835} -08/30/2021 22:17:13 - INFO - __main__ - Step 50133: {'lr': 0.0003804798192671912, 'samples': 9625536, 'steps': 50132, 'loss/train': 1.1631078720092773} -08/30/2021 22:17:15 - INFO - __main__ - Step 50134: {'lr': 0.00038047529261202876, 'samples': 9625728, 'steps': 50133, 'loss/train': 0.39178749918937683} -08/30/2021 22:17:15 - INFO - __main__ - Step 50135: {'lr': 0.0003804707658980761, 'samples': 9625920, 'steps': 50134, 'loss/train': 1.1198288202285767} -08/30/2021 22:17:16 - INFO - __main__ - Step 50136: {'lr': 0.0003804662391253352, 'samples': 9626112, 'steps': 50135, 'loss/train': 1.1382800340652466} -08/30/2021 22:17:16 - INFO - __main__ - Step 50137: {'lr': 0.00038046171229380837, 'samples': 9626304, 'steps': 50136, 'loss/train': 1.644508957862854} -08/30/2021 22:17:16 - INFO - __main__ - Step 50138: {'lr': 0.0003804571854034975, 'samples': 9626496, 'steps': 50137, 'loss/train': 0.9787462949752808} -08/30/2021 22:17:17 - INFO - __main__ - Step 50139: {'lr': 0.0003804526584544046, 'samples': 9626688, 'steps': 50138, 'loss/train': 0.9741015434265137} -08/30/2021 22:17:18 - INFO - __main__ - Step 50140: {'lr': 0.0003804481314465317, 'samples': 9626880, 'steps': 50139, 'loss/train': 0.9444351196289062} -08/30/2021 22:17:19 - INFO - __main__ - Step 50141: {'lr': 0.0003804436043798809, 'samples': 9627072, 'steps': 50140, 'loss/train': 1.2524003982543945} -08/30/2021 22:17:19 - INFO - __main__ - Step 50142: {'lr': 0.00038043907725445424, 'samples': 9627264, 'steps': 50141, 'loss/train': 1.5802050828933716} -08/30/2021 22:17:19 - INFO - __main__ - Step 50143: {'lr': 0.00038043455007025375, 'samples': 9627456, 'steps': 50142, 'loss/train': 1.3089563846588135} -08/30/2021 22:17:20 - INFO - __main__ - Step 50144: {'lr': 0.00038043002282728153, 'samples': 9627648, 'steps': 50143, 'loss/train': 1.042677879333496} -08/30/2021 22:17:21 - INFO - __main__ - Step 50145: {'lr': 0.00038042549552553954, 'samples': 9627840, 'steps': 50144, 'loss/train': 1.0575764179229736} -08/30/2021 22:17:22 - INFO - __main__ - Step 50146: {'lr': 0.00038042096816502967, 'samples': 9628032, 'steps': 50145, 'loss/train': 0.6534714698791504} -08/30/2021 22:17:22 - INFO - __main__ - Step 50147: {'lr': 0.0003804164407457543, 'samples': 9628224, 'steps': 50146, 'loss/train': 1.341222882270813} -08/30/2021 22:17:22 - INFO - __main__ - Step 50148: {'lr': 0.0003804119132677152, 'samples': 9628416, 'steps': 50147, 'loss/train': 1.072319746017456} -08/30/2021 22:17:23 - INFO - __main__ - Step 50149: {'lr': 0.0003804073857309145, 'samples': 9628608, 'steps': 50148, 'loss/train': 1.2148807048797607} -08/30/2021 22:17:24 - INFO - __main__ - Step 50150: {'lr': 0.00038040285813535434, 'samples': 9628800, 'steps': 50149, 'loss/train': 1.297415018081665} -08/30/2021 22:17:25 - INFO - __main__ - Step 50151: {'lr': 0.0003803983304810367, 'samples': 9628992, 'steps': 50150, 'loss/train': 1.0965957641601562} -08/30/2021 22:17:25 - INFO - __main__ - Step 50152: {'lr': 0.0003803938027679634, 'samples': 9629184, 'steps': 50151, 'loss/train': 1.2132761478424072} -08/30/2021 22:17:25 - INFO - __main__ - Step 50153: {'lr': 0.0003803892749961368, 'samples': 9629376, 'steps': 50152, 'loss/train': 1.1536738872528076} -08/30/2021 22:17:26 - INFO - __main__ - Step 50154: {'lr': 0.0003803847471655587, 'samples': 9629568, 'steps': 50153, 'loss/train': 1.0383530855178833} -08/30/2021 22:17:26 - INFO - __main__ - Step 50155: {'lr': 0.00038038021927623133, 'samples': 9629760, 'steps': 50154, 'loss/train': 5.870924472808838} -08/30/2021 22:17:28 - INFO - __main__ - Step 50156: {'lr': 0.00038037569132815663, 'samples': 9629952, 'steps': 50155, 'loss/train': 0.046317603439092636} -08/30/2021 22:17:28 - INFO - __main__ - Step 50157: {'lr': 0.0003803711633213367, 'samples': 9630144, 'steps': 50156, 'loss/train': 1.8635798692703247} -08/30/2021 22:17:29 - INFO - __main__ - Step 50158: {'lr': 0.0003803666352557735, 'samples': 9630336, 'steps': 50157, 'loss/train': 1.14349365234375} -08/30/2021 22:17:29 - INFO - __main__ - Step 50159: {'lr': 0.0003803621071314691, 'samples': 9630528, 'steps': 50158, 'loss/train': 0.5619362592697144} -08/30/2021 22:17:29 - INFO - __main__ - Step 50160: {'lr': 0.0003803575789484255, 'samples': 9630720, 'steps': 50159, 'loss/train': 1.2430082559585571} -08/30/2021 22:17:31 - INFO - __main__ - Step 50161: {'lr': 0.0003803530507066448, 'samples': 9630912, 'steps': 50160, 'loss/train': 1.3744922876358032} -08/30/2021 22:17:32 - INFO - __main__ - Step 50162: {'lr': 0.00038034852240612907, 'samples': 9631104, 'steps': 50161, 'loss/train': 1.3385076522827148} -08/30/2021 22:17:32 - INFO - __main__ - Step 50163: {'lr': 0.00038034399404688024, 'samples': 9631296, 'steps': 50162, 'loss/train': 0.037527214735746384} -08/30/2021 22:17:32 - INFO - __main__ - Step 50164: {'lr': 0.00038033946562890055, 'samples': 9631488, 'steps': 50163, 'loss/train': 1.4838230609893799} -08/30/2021 22:17:33 - INFO - __main__ - Step 50165: {'lr': 0.0003803349371521918, 'samples': 9631680, 'steps': 50164, 'loss/train': 1.676430106163025} -08/30/2021 22:17:33 - INFO - __main__ - Step 50166: {'lr': 0.00038033040861675617, 'samples': 9631872, 'steps': 50165, 'loss/train': 1.8885140419006348} -08/30/2021 22:17:33 - INFO - __main__ - Step 50167: {'lr': 0.0003803258800225956, 'samples': 9632064, 'steps': 50166, 'loss/train': 1.8753783702850342} -08/30/2021 22:17:35 - INFO - __main__ - Step 50168: {'lr': 0.0003803213513697123, 'samples': 9632256, 'steps': 50167, 'loss/train': 1.232132911682129} -08/30/2021 22:17:35 - INFO - __main__ - Step 50169: {'lr': 0.0003803168226581082, 'samples': 9632448, 'steps': 50168, 'loss/train': 1.1798596382141113} -08/30/2021 22:17:36 - INFO - __main__ - Step 50170: {'lr': 0.00038031229388778526, 'samples': 9632640, 'steps': 50169, 'loss/train': 1.291684627532959} -08/30/2021 22:17:36 - INFO - __main__ - Step 50171: {'lr': 0.00038030776505874577, 'samples': 9632832, 'steps': 50170, 'loss/train': 1.5367623567581177} -08/30/2021 22:17:36 - INFO - __main__ - Step 50172: {'lr': 0.0003803032361709915, 'samples': 9633024, 'steps': 50171, 'loss/train': 1.1160755157470703} -08/30/2021 22:17:38 - INFO - __main__ - Step 50173: {'lr': 0.00038029870722452455, 'samples': 9633216, 'steps': 50172, 'loss/train': 1.8505613803863525} -08/30/2021 22:17:38 - INFO - __main__ - Step 50174: {'lr': 0.0003802941782193471, 'samples': 9633408, 'steps': 50173, 'loss/train': 1.6613337993621826} -08/30/2021 22:17:39 - INFO - __main__ - Step 50175: {'lr': 0.00038028964915546107, 'samples': 9633600, 'steps': 50174, 'loss/train': 1.0176063776016235} -08/30/2021 22:17:39 - INFO - __main__ - Step 50176: {'lr': 0.00038028512003286853, 'samples': 9633792, 'steps': 50175, 'loss/train': 1.6487009525299072} -08/30/2021 22:17:39 - INFO - __main__ - Step 50177: {'lr': 0.00038028059085157165, 'samples': 9633984, 'steps': 50176, 'loss/train': 1.3987069129943848} -08/30/2021 22:17:40 - INFO - __main__ - Step 50178: {'lr': 0.0003802760616115722, 'samples': 9634176, 'steps': 50177, 'loss/train': 1.7523374557495117} -08/30/2021 22:17:42 - INFO - __main__ - Step 50179: {'lr': 0.0003802715323128724, 'samples': 9634368, 'steps': 50178, 'loss/train': 1.3484731912612915} -08/30/2021 22:17:42 - INFO - __main__ - Step 50180: {'lr': 0.00038026700295547424, 'samples': 9634560, 'steps': 50179, 'loss/train': 1.0260473489761353} -08/30/2021 22:17:42 - INFO - __main__ - Step 50181: {'lr': 0.0003802624735393798, 'samples': 9634752, 'steps': 50180, 'loss/train': 1.3888907432556152} -08/30/2021 22:17:43 - INFO - __main__ - Step 50182: {'lr': 0.00038025794406459115, 'samples': 9634944, 'steps': 50181, 'loss/train': 1.3685919046401978} -08/30/2021 22:17:43 - INFO - __main__ - Step 50183: {'lr': 0.00038025341453111017, 'samples': 9635136, 'steps': 50182, 'loss/train': 0.9743738174438477} -08/30/2021 22:17:45 - INFO - __main__ - Step 50184: {'lr': 0.0003802488849389391, 'samples': 9635328, 'steps': 50183, 'loss/train': 1.1471487283706665} -08/30/2021 22:17:45 - INFO - __main__ - Step 50185: {'lr': 0.0003802443552880799, 'samples': 9635520, 'steps': 50184, 'loss/train': 0.0739254504442215} -08/30/2021 22:17:46 - INFO - __main__ - Step 50186: {'lr': 0.00038023982557853456, 'samples': 9635712, 'steps': 50185, 'loss/train': 1.7395588159561157} -08/30/2021 22:17:46 - INFO - __main__ - Step 50187: {'lr': 0.00038023529581030516, 'samples': 9635904, 'steps': 50186, 'loss/train': 1.0424436330795288} -08/30/2021 22:17:46 - INFO - __main__ - Step 50188: {'lr': 0.00038023076598339375, 'samples': 9636096, 'steps': 50187, 'loss/train': 0.9814770817756653} -08/30/2021 22:17:48 - INFO - __main__ - Step 50189: {'lr': 0.0003802262360978024, 'samples': 9636288, 'steps': 50188, 'loss/train': 1.5759168863296509} -08/30/2021 22:17:48 - INFO - __main__ - Step 50190: {'lr': 0.00038022170615353314, 'samples': 9636480, 'steps': 50189, 'loss/train': 1.680824875831604} -08/30/2021 22:17:49 - INFO - __main__ - Step 50191: {'lr': 0.00038021717615058795, 'samples': 9636672, 'steps': 50190, 'loss/train': 1.755846619606018} -08/30/2021 22:17:49 - INFO - __main__ - Step 50192: {'lr': 0.00038021264608896884, 'samples': 9636864, 'steps': 50191, 'loss/train': 0.7993203997612} -08/30/2021 22:17:49 - INFO - __main__ - Step 50193: {'lr': 0.000380208115968678, 'samples': 9637056, 'steps': 50192, 'loss/train': 1.2606840133666992} -08/30/2021 22:17:51 - INFO - __main__ - Step 50194: {'lr': 0.00038020358578971737, 'samples': 9637248, 'steps': 50193, 'loss/train': 0.9867759346961975} -08/30/2021 22:17:51 - INFO - __main__ - Step 50195: {'lr': 0.000380199055552089, 'samples': 9637440, 'steps': 50194, 'loss/train': 0.3496303856372833} -08/30/2021 22:17:52 - INFO - __main__ - Step 50196: {'lr': 0.000380194525255795, 'samples': 9637632, 'steps': 50195, 'loss/train': 1.1464449167251587} -08/30/2021 22:17:52 - INFO - __main__ - Step 50197: {'lr': 0.0003801899949008373, 'samples': 9637824, 'steps': 50196, 'loss/train': 0.5101274847984314} -08/30/2021 22:17:52 - INFO - __main__ - Step 50198: {'lr': 0.000380185464487218, 'samples': 9638016, 'steps': 50197, 'loss/train': 1.5690900087356567} -08/30/2021 22:17:54 - INFO - __main__ - Step 50199: {'lr': 0.00038018093401493916, 'samples': 9638208, 'steps': 50198, 'loss/train': 0.6451753973960876} -08/30/2021 22:17:54 - INFO - __main__ - Step 50200: {'lr': 0.00038017640348400286, 'samples': 9638400, 'steps': 50199, 'loss/train': 1.6852253675460815} -08/30/2021 22:17:55 - INFO - __main__ - Step 50201: {'lr': 0.000380171872894411, 'samples': 9638592, 'steps': 50200, 'loss/train': 1.1046643257141113} -08/30/2021 22:17:55 - INFO - __main__ - Step 50202: {'lr': 0.00038016734224616565, 'samples': 9638784, 'steps': 50201, 'loss/train': 2.0317699909210205} -08/30/2021 22:17:55 - INFO - __main__ - Step 50203: {'lr': 0.000380162811539269, 'samples': 9638976, 'steps': 50202, 'loss/train': 1.5801845788955688} -08/30/2021 22:17:56 - INFO - __main__ - Step 50204: {'lr': 0.0003801582807737229, 'samples': 9639168, 'steps': 50203, 'loss/train': 1.3906358480453491} -08/30/2021 22:17:57 - INFO - __main__ - Step 50205: {'lr': 0.00038015374994952966, 'samples': 9639360, 'steps': 50204, 'loss/train': 1.4581975936889648} -08/30/2021 22:17:58 - INFO - __main__ - Step 50206: {'lr': 0.0003801492190666911, 'samples': 9639552, 'steps': 50205, 'loss/train': 1.3912845849990845} -08/30/2021 22:17:58 - INFO - __main__ - Step 50207: {'lr': 0.00038014468812520917, 'samples': 9639744, 'steps': 50206, 'loss/train': 1.1278738975524902} -08/30/2021 22:17:59 - INFO - __main__ - Step 50208: {'lr': 0.00038014015712508617, 'samples': 9639936, 'steps': 50207, 'loss/train': 1.8937790393829346} -08/30/2021 22:17:59 - INFO - __main__ - Step 50209: {'lr': 0.000380135626066324, 'samples': 9640128, 'steps': 50208, 'loss/train': 1.2781879901885986} -08/30/2021 22:18:00 - INFO - __main__ - Step 50210: {'lr': 0.00038013109494892467, 'samples': 9640320, 'steps': 50209, 'loss/train': 0.06123127415776253} -08/30/2021 22:18:01 - INFO - __main__ - Step 50211: {'lr': 0.00038012656377289035, 'samples': 9640512, 'steps': 50210, 'loss/train': 1.832229495048523} -08/30/2021 22:18:01 - INFO - __main__ - Step 50212: {'lr': 0.000380122032538223, 'samples': 9640704, 'steps': 50211, 'loss/train': 1.796499252319336} -08/30/2021 22:18:02 - INFO - __main__ - Step 50213: {'lr': 0.0003801175012449246, 'samples': 9640896, 'steps': 50212, 'loss/train': 1.6021469831466675} -08/30/2021 22:18:02 - INFO - __main__ - Step 50214: {'lr': 0.0003801129698929974, 'samples': 9641088, 'steps': 50213, 'loss/train': 0.9251230359077454} -08/30/2021 22:18:03 - INFO - __main__ - Step 50215: {'lr': 0.00038010843848244316, 'samples': 9641280, 'steps': 50214, 'loss/train': 1.1046028137207031} -08/30/2021 22:18:04 - INFO - __main__ - Step 50216: {'lr': 0.00038010390701326415, 'samples': 9641472, 'steps': 50215, 'loss/train': 1.921939730644226} -08/30/2021 22:18:04 - INFO - __main__ - Step 50217: {'lr': 0.00038009937548546223, 'samples': 9641664, 'steps': 50216, 'loss/train': 1.8867669105529785} -08/30/2021 22:18:04 - INFO - __main__ - Step 50218: {'lr': 0.0003800948438990397, 'samples': 9641856, 'steps': 50217, 'loss/train': 1.297231674194336} -08/30/2021 22:18:05 - INFO - __main__ - Step 50219: {'lr': 0.0003800903122539983, 'samples': 9642048, 'steps': 50218, 'loss/train': 3.336740016937256} -08/30/2021 22:18:06 - INFO - __main__ - Step 50220: {'lr': 0.00038008578055034024, 'samples': 9642240, 'steps': 50219, 'loss/train': 1.1903597116470337} -08/30/2021 22:18:07 - INFO - __main__ - Step 50221: {'lr': 0.0003800812487880676, 'samples': 9642432, 'steps': 50220, 'loss/train': 1.0843539237976074} -08/30/2021 22:18:07 - INFO - __main__ - Step 50222: {'lr': 0.00038007671696718226, 'samples': 9642624, 'steps': 50221, 'loss/train': 1.0503097772598267} -08/30/2021 22:18:07 - INFO - __main__ - Step 50223: {'lr': 0.0003800721850876864, 'samples': 9642816, 'steps': 50222, 'loss/train': 1.3597859144210815} -08/30/2021 22:18:08 - INFO - __main__ - Step 50224: {'lr': 0.00038006765314958205, 'samples': 9643008, 'steps': 50223, 'loss/train': 1.6349124908447266} -08/30/2021 22:18:09 - INFO - __main__ - Step 50225: {'lr': 0.00038006312115287125, 'samples': 9643200, 'steps': 50224, 'loss/train': 1.5726463794708252} -08/30/2021 22:18:10 - INFO - __main__ - Step 50226: {'lr': 0.00038005858909755596, 'samples': 9643392, 'steps': 50225, 'loss/train': 1.8197311162948608} -08/30/2021 22:18:10 - INFO - __main__ - Step 50227: {'lr': 0.00038005405698363824, 'samples': 9643584, 'steps': 50226, 'loss/train': 0.7995738387107849} -08/30/2021 22:18:10 - INFO - __main__ - Step 50228: {'lr': 0.0003800495248111202, 'samples': 9643776, 'steps': 50227, 'loss/train': 1.4944809675216675} -08/30/2021 22:18:11 - INFO - __main__ - Step 50229: {'lr': 0.00038004499258000393, 'samples': 9643968, 'steps': 50228, 'loss/train': 1.3478763103485107} -08/30/2021 22:18:11 - INFO - __main__ - Step 50230: {'lr': 0.0003800404602902913, 'samples': 9644160, 'steps': 50229, 'loss/train': 1.4178478717803955} -08/30/2021 22:18:12 - INFO - __main__ - Step 50231: {'lr': 0.0003800359279419845, 'samples': 9644352, 'steps': 50230, 'loss/train': 1.462038278579712} -08/30/2021 22:18:13 - INFO - __main__ - Step 50232: {'lr': 0.0003800313955350855, 'samples': 9644544, 'steps': 50231, 'loss/train': 2.0806963443756104} -08/30/2021 22:18:13 - INFO - __main__ - Step 50233: {'lr': 0.0003800268630695963, 'samples': 9644736, 'steps': 50232, 'loss/train': 1.3585331439971924} -08/30/2021 22:18:14 - INFO - __main__ - Step 50234: {'lr': 0.00038002233054551906, 'samples': 9644928, 'steps': 50233, 'loss/train': 1.4059019088745117} -08/30/2021 22:18:14 - INFO - __main__ - Step 50235: {'lr': 0.00038001779796285575, 'samples': 9645120, 'steps': 50234, 'loss/train': 1.7459365129470825} -08/30/2021 22:18:16 - INFO - __main__ - Step 50236: {'lr': 0.0003800132653216084, 'samples': 9645312, 'steps': 50235, 'loss/train': 1.4470959901809692} -08/30/2021 22:18:16 - INFO - __main__ - Step 50237: {'lr': 0.00038000873262177914, 'samples': 9645504, 'steps': 50236, 'loss/train': 1.6705679893493652} -08/30/2021 22:18:17 - INFO - __main__ - Step 50238: {'lr': 0.00038000419986336997, 'samples': 9645696, 'steps': 50237, 'loss/train': 1.4107708930969238} -08/30/2021 22:18:17 - INFO - __main__ - Step 50239: {'lr': 0.0003799996670463828, 'samples': 9645888, 'steps': 50238, 'loss/train': 1.6455039978027344} -08/30/2021 22:18:17 - INFO - __main__ - Step 50240: {'lr': 0.0003799951341708199, 'samples': 9646080, 'steps': 50239, 'loss/train': 1.4050010442733765} -08/30/2021 22:18:19 - INFO - __main__ - Step 50241: {'lr': 0.0003799906012366832, 'samples': 9646272, 'steps': 50240, 'loss/train': 1.0024943351745605} -08/30/2021 22:18:20 - INFO - __main__ - Step 50242: {'lr': 0.0003799860682439746, 'samples': 9646464, 'steps': 50241, 'loss/train': 0.7941561341285706} -08/30/2021 22:18:20 - INFO - __main__ - Step 50243: {'lr': 0.0003799815351926964, 'samples': 9646656, 'steps': 50242, 'loss/train': 0.028776539489626884} -08/30/2021 22:18:20 - INFO - __main__ - Step 50244: {'lr': 0.0003799770020828505, 'samples': 9646848, 'steps': 50243, 'loss/train': 1.7470147609710693} -08/30/2021 22:18:21 - INFO - __main__ - Step 50245: {'lr': 0.000379972468914439, 'samples': 9647040, 'steps': 50244, 'loss/train': 1.233689546585083} -08/30/2021 22:18:21 - INFO - __main__ - Step 50246: {'lr': 0.0003799679356874639, 'samples': 9647232, 'steps': 50245, 'loss/train': 4.052657604217529} -08/30/2021 22:18:23 - INFO - __main__ - Step 50247: {'lr': 0.0003799634024019272, 'samples': 9647424, 'steps': 50246, 'loss/train': 0.2852233946323395} -08/30/2021 22:18:23 - INFO - __main__ - Step 50248: {'lr': 0.0003799588690578311, 'samples': 9647616, 'steps': 50247, 'loss/train': 1.3783186674118042} -08/30/2021 22:18:23 - INFO - __main__ - Step 50249: {'lr': 0.0003799543356551773, 'samples': 9647808, 'steps': 50248, 'loss/train': 0.5411971807479858} -08/30/2021 22:18:24 - INFO - __main__ - Step 50250: {'lr': 0.00037994980219396835, 'samples': 9648000, 'steps': 50249, 'loss/train': 1.6253989934921265} -08/30/2021 22:18:24 - INFO - __main__ - Step 50251: {'lr': 0.00037994526867420595, 'samples': 9648192, 'steps': 50250, 'loss/train': 1.4940087795257568} -08/30/2021 22:18:26 - INFO - __main__ - Step 50252: {'lr': 0.0003799407350958922, 'samples': 9648384, 'steps': 50251, 'loss/train': 1.0193008184432983} -08/30/2021 22:18:26 - INFO - __main__ - Step 50253: {'lr': 0.00037993620145902914, 'samples': 9648576, 'steps': 50252, 'loss/train': 1.3059289455413818} -08/30/2021 22:18:26 - INFO - __main__ - Step 50254: {'lr': 0.00037993166776361883, 'samples': 9648768, 'steps': 50253, 'loss/train': 1.4135570526123047} -08/30/2021 22:18:27 - INFO - __main__ - Step 50255: {'lr': 0.0003799271340096633, 'samples': 9648960, 'steps': 50254, 'loss/train': 1.5801522731781006} -08/30/2021 22:18:27 - INFO - __main__ - Step 50256: {'lr': 0.00037992260019716463, 'samples': 9649152, 'steps': 50255, 'loss/train': 0.34532809257507324} -08/30/2021 22:18:29 - INFO - __main__ - Step 50257: {'lr': 0.00037991806632612485, 'samples': 9649344, 'steps': 50256, 'loss/train': 1.2366377115249634} -08/30/2021 22:18:29 - INFO - __main__ - Step 50258: {'lr': 0.000379913532396546, 'samples': 9649536, 'steps': 50257, 'loss/train': 1.3541903495788574} -08/30/2021 22:18:29 - INFO - __main__ - Step 50259: {'lr': 0.0003799089984084302, 'samples': 9649728, 'steps': 50258, 'loss/train': 0.9174428582191467} -08/30/2021 22:18:30 - INFO - __main__ - Step 50260: {'lr': 0.00037990446436177925, 'samples': 9649920, 'steps': 50259, 'loss/train': 1.7744241952896118} -08/30/2021 22:18:30 - INFO - __main__ - Step 50261: {'lr': 0.0003798999302565954, 'samples': 9650112, 'steps': 50260, 'loss/train': 0.7895450592041016} -08/30/2021 22:18:32 - INFO - __main__ - Step 50262: {'lr': 0.0003798953960928807, 'samples': 9650304, 'steps': 50261, 'loss/train': 1.240599274635315} -08/30/2021 22:18:32 - INFO - __main__ - Step 50263: {'lr': 0.0003798908618706371, 'samples': 9650496, 'steps': 50262, 'loss/train': 1.2873766422271729} -08/30/2021 22:18:32 - INFO - __main__ - Step 50264: {'lr': 0.0003798863275898667, 'samples': 9650688, 'steps': 50263, 'loss/train': 1.3467903137207031} -08/30/2021 22:18:33 - INFO - __main__ - Step 50265: {'lr': 0.00037988179325057156, 'samples': 9650880, 'steps': 50264, 'loss/train': 1.462780237197876} -08/30/2021 22:18:33 - INFO - __main__ - Step 50266: {'lr': 0.0003798772588527536, 'samples': 9651072, 'steps': 50265, 'loss/train': 1.1951463222503662} -08/30/2021 22:18:35 - INFO - __main__ - Step 50267: {'lr': 0.000379872724396415, 'samples': 9651264, 'steps': 50266, 'loss/train': 0.9749053716659546} -08/30/2021 22:18:35 - INFO - __main__ - Step 50268: {'lr': 0.00037986818988155775, 'samples': 9651456, 'steps': 50267, 'loss/train': 1.768110752105713} -08/30/2021 22:18:36 - INFO - __main__ - Step 50269: {'lr': 0.0003798636553081839, 'samples': 9651648, 'steps': 50268, 'loss/train': 1.5099670886993408} -08/30/2021 22:18:36 - INFO - __main__ - Step 50270: {'lr': 0.0003798591206762955, 'samples': 9651840, 'steps': 50269, 'loss/train': 1.041815996170044} -08/30/2021 22:18:36 - INFO - __main__ - Step 50271: {'lr': 0.0003798545859858945, 'samples': 9652032, 'steps': 50270, 'loss/train': 1.6618454456329346} -08/30/2021 22:18:37 - INFO - __main__ - Step 50272: {'lr': 0.0003798500512369832, 'samples': 9652224, 'steps': 50271, 'loss/train': 1.0841186046600342} -08/30/2021 22:18:38 - INFO - __main__ - Step 50273: {'lr': 0.00037984551642956336, 'samples': 9652416, 'steps': 50272, 'loss/train': 1.355236291885376} -08/30/2021 22:18:39 - INFO - __main__ - Step 50274: {'lr': 0.0003798409815636371, 'samples': 9652608, 'steps': 50273, 'loss/train': 1.4197198152542114} -08/30/2021 22:18:39 - INFO - __main__ - Step 50275: {'lr': 0.00037983644663920656, 'samples': 9652800, 'steps': 50274, 'loss/train': 1.5416332483291626} -08/30/2021 22:18:39 - INFO - __main__ - Step 50276: {'lr': 0.0003798319116562737, 'samples': 9652992, 'steps': 50275, 'loss/train': 1.149187684059143} -08/30/2021 22:18:40 - INFO - __main__ - Step 50277: {'lr': 0.00037982737661484056, 'samples': 9653184, 'steps': 50276, 'loss/train': 1.7272168397903442} -08/30/2021 22:18:41 - INFO - __main__ - Step 50278: {'lr': 0.00037982284151490933, 'samples': 9653376, 'steps': 50277, 'loss/train': 1.2712172269821167} -08/30/2021 22:18:41 - INFO - __main__ - Step 50279: {'lr': 0.00037981830635648177, 'samples': 9653568, 'steps': 50278, 'loss/train': 1.16634202003479} -08/30/2021 22:18:42 - INFO - __main__ - Step 50280: {'lr': 0.0003798137711395602, 'samples': 9653760, 'steps': 50279, 'loss/train': 1.7253309488296509} -08/30/2021 22:18:42 - INFO - __main__ - Step 50281: {'lr': 0.00037980923586414646, 'samples': 9653952, 'steps': 50280, 'loss/train': 1.3690147399902344} -08/30/2021 22:18:43 - INFO - __main__ - Step 50282: {'lr': 0.0003798047005302427, 'samples': 9654144, 'steps': 50281, 'loss/train': 1.2669169902801514} -08/30/2021 22:18:44 - INFO - __main__ - Step 50283: {'lr': 0.000379800165137851, 'samples': 9654336, 'steps': 50282, 'loss/train': 1.4882246255874634} -08/30/2021 22:18:45 - INFO - __main__ - Step 50284: {'lr': 0.00037979562968697324, 'samples': 9654528, 'steps': 50283, 'loss/train': 1.9820116758346558} -08/30/2021 22:18:45 - INFO - __main__ - Step 50285: {'lr': 0.0003797910941776117, 'samples': 9654720, 'steps': 50284, 'loss/train': 1.7118568420410156} -08/30/2021 22:18:46 - INFO - __main__ - Step 50286: {'lr': 0.00037978655860976826, 'samples': 9654912, 'steps': 50285, 'loss/train': 1.5190916061401367} -08/30/2021 22:18:46 - INFO - __main__ - Step 50287: {'lr': 0.00037978202298344496, 'samples': 9655104, 'steps': 50286, 'loss/train': 1.8288257122039795} -08/30/2021 22:18:48 - INFO - __main__ - Step 50288: {'lr': 0.0003797774872986439, 'samples': 9655296, 'steps': 50287, 'loss/train': 0.6033830642700195} -08/30/2021 22:18:49 - INFO - __main__ - Step 50289: {'lr': 0.00037977295155536706, 'samples': 9655488, 'steps': 50288, 'loss/train': 1.1985756158828735} -08/30/2021 22:18:49 - INFO - __main__ - Step 50290: {'lr': 0.00037976841575361665, 'samples': 9655680, 'steps': 50289, 'loss/train': 0.9769416451454163} -08/30/2021 22:18:49 - INFO - __main__ - Step 50291: {'lr': 0.00037976387989339445, 'samples': 9655872, 'steps': 50290, 'loss/train': 1.0939730405807495} -08/30/2021 22:18:50 - INFO - __main__ - Step 50292: {'lr': 0.0003797593439747028, 'samples': 9656064, 'steps': 50291, 'loss/train': 1.545101523399353} -08/30/2021 22:18:50 - INFO - __main__ - Step 50293: {'lr': 0.0003797548079975435, 'samples': 9656256, 'steps': 50292, 'loss/train': 1.7050976753234863} -08/30/2021 22:18:51 - INFO - __main__ - Step 50294: {'lr': 0.0003797502719619187, 'samples': 9656448, 'steps': 50293, 'loss/train': 0.9694483876228333} -08/30/2021 22:18:52 - INFO - __main__ - Step 50295: {'lr': 0.0003797457358678304, 'samples': 9656640, 'steps': 50294, 'loss/train': 2.092941999435425} -08/30/2021 22:18:52 - INFO - __main__ - Step 50296: {'lr': 0.0003797411997152807, 'samples': 9656832, 'steps': 50295, 'loss/train': 0.906765341758728} -08/30/2021 22:18:53 - INFO - __main__ - Step 50297: {'lr': 0.0003797366635042716, 'samples': 9657024, 'steps': 50296, 'loss/train': 1.4587798118591309} -08/30/2021 22:18:53 - INFO - __main__ - Step 50298: {'lr': 0.0003797321272348052, 'samples': 9657216, 'steps': 50297, 'loss/train': 1.3294745683670044} -08/30/2021 22:18:54 - INFO - __main__ - Step 50299: {'lr': 0.00037972759090688354, 'samples': 9657408, 'steps': 50298, 'loss/train': 1.305353045463562} -08/30/2021 22:18:55 - INFO - __main__ - Step 50300: {'lr': 0.0003797230545205086, 'samples': 9657600, 'steps': 50299, 'loss/train': 1.376690149307251} -08/30/2021 22:18:55 - INFO - __main__ - Step 50301: {'lr': 0.00037971851807568237, 'samples': 9657792, 'steps': 50300, 'loss/train': 1.4243135452270508} -08/30/2021 22:18:56 - INFO - __main__ - Step 50302: {'lr': 0.000379713981572407, 'samples': 9657984, 'steps': 50301, 'loss/train': 1.6837401390075684} -08/30/2021 22:18:56 - INFO - __main__ - Step 50303: {'lr': 0.0003797094450106846, 'samples': 9658176, 'steps': 50302, 'loss/train': 0.6461941599845886} -08/30/2021 22:18:57 - INFO - __main__ - Step 50304: {'lr': 0.00037970490839051707, 'samples': 9658368, 'steps': 50303, 'loss/train': 1.561486840248108} -08/30/2021 22:18:58 - INFO - __main__ - Step 50305: {'lr': 0.00037970037171190655, 'samples': 9658560, 'steps': 50304, 'loss/train': 1.327067494392395} -08/30/2021 22:18:58 - INFO - __main__ - Step 50306: {'lr': 0.000379695834974855, 'samples': 9658752, 'steps': 50305, 'loss/train': 1.5158920288085938} -08/30/2021 22:18:58 - INFO - __main__ - Step 50307: {'lr': 0.0003796912981793645, 'samples': 9658944, 'steps': 50306, 'loss/train': 1.2947555780410767} -08/30/2021 22:18:59 - INFO - __main__ - Step 50308: {'lr': 0.0003796867613254371, 'samples': 9659136, 'steps': 50307, 'loss/train': 1.4602837562561035} -08/30/2021 22:19:00 - INFO - __main__ - Step 50309: {'lr': 0.0003796822244130749, 'samples': 9659328, 'steps': 50308, 'loss/train': 1.7762531042099} -08/30/2021 22:19:01 - INFO - __main__ - Step 50310: {'lr': 0.00037967768744227984, 'samples': 9659520, 'steps': 50309, 'loss/train': 1.1557931900024414} -08/30/2021 22:19:01 - INFO - __main__ - Step 50311: {'lr': 0.000379673150413054, 'samples': 9659712, 'steps': 50310, 'loss/train': 1.5500409603118896} -08/30/2021 22:19:01 - INFO - __main__ - Step 50312: {'lr': 0.00037966861332539947, 'samples': 9659904, 'steps': 50311, 'loss/train': 1.2352476119995117} -08/30/2021 22:19:02 - INFO - __main__ - Step 50313: {'lr': 0.0003796640761793183, 'samples': 9660096, 'steps': 50312, 'loss/train': 1.4126312732696533} -08/30/2021 22:19:03 - INFO - __main__ - Step 50314: {'lr': 0.00037965953897481244, 'samples': 9660288, 'steps': 50313, 'loss/train': 1.2851961851119995} -08/30/2021 22:19:04 - INFO - __main__ - Step 50315: {'lr': 0.00037965500171188406, 'samples': 9660480, 'steps': 50314, 'loss/train': 0.9955987334251404} -08/30/2021 22:19:04 - INFO - __main__ - Step 50316: {'lr': 0.00037965046439053507, 'samples': 9660672, 'steps': 50315, 'loss/train': 1.4403796195983887} -08/30/2021 22:19:04 - INFO - __main__ - Step 50317: {'lr': 0.00037964592701076753, 'samples': 9660864, 'steps': 50316, 'loss/train': 0.4701976180076599} -08/30/2021 22:19:05 - INFO - __main__ - Step 50318: {'lr': 0.00037964138957258367, 'samples': 9661056, 'steps': 50317, 'loss/train': 1.1875450611114502} -08/30/2021 22:19:06 - INFO - __main__ - Step 50319: {'lr': 0.0003796368520759854, 'samples': 9661248, 'steps': 50318, 'loss/train': 1.6138051748275757} -08/30/2021 22:19:07 - INFO - __main__ - Step 50320: {'lr': 0.00037963231452097467, 'samples': 9661440, 'steps': 50319, 'loss/train': 0.9892135262489319} -08/30/2021 22:19:07 - INFO - __main__ - Step 50321: {'lr': 0.00037962777690755365, 'samples': 9661632, 'steps': 50320, 'loss/train': 1.0777478218078613} -08/30/2021 22:19:07 - INFO - __main__ - Step 50322: {'lr': 0.00037962323923572427, 'samples': 9661824, 'steps': 50321, 'loss/train': 1.306260347366333} -08/30/2021 22:19:08 - INFO - __main__ - Step 50323: {'lr': 0.0003796187015054888, 'samples': 9662016, 'steps': 50322, 'loss/train': 1.6018210649490356} -08/30/2021 22:19:09 - INFO - __main__ - Step 50324: {'lr': 0.00037961416371684907, 'samples': 9662208, 'steps': 50323, 'loss/train': 1.436275839805603} -08/30/2021 22:19:10 - INFO - __main__ - Step 50325: {'lr': 0.0003796096258698073, 'samples': 9662400, 'steps': 50324, 'loss/train': 5.0564165115356445} -08/30/2021 22:19:10 - INFO - __main__ - Step 50326: {'lr': 0.0003796050879643653, 'samples': 9662592, 'steps': 50325, 'loss/train': 0.43818843364715576} -08/30/2021 22:19:10 - INFO - __main__ - Step 50327: {'lr': 0.0003796005500005253, 'samples': 9662784, 'steps': 50326, 'loss/train': 1.1391857862472534} -08/30/2021 22:19:11 - INFO - __main__ - Step 50328: {'lr': 0.0003795960119782893, 'samples': 9662976, 'steps': 50327, 'loss/train': 0.9795698523521423} -08/30/2021 22:19:11 - INFO - __main__ - Step 50329: {'lr': 0.0003795914738976594, 'samples': 9663168, 'steps': 50328, 'loss/train': 1.904693841934204} -08/30/2021 22:19:13 - INFO - __main__ - Step 50330: {'lr': 0.00037958693575863747, 'samples': 9663360, 'steps': 50329, 'loss/train': 1.0364373922348022} -08/30/2021 22:19:13 - INFO - __main__ - Step 50331: {'lr': 0.0003795823975612257, 'samples': 9663552, 'steps': 50330, 'loss/train': 1.6892534494400024} -08/30/2021 22:19:13 - INFO - __main__ - Step 50332: {'lr': 0.0003795778593054261, 'samples': 9663744, 'steps': 50331, 'loss/train': 1.587531566619873} -08/30/2021 22:19:14 - INFO - __main__ - Step 50333: {'lr': 0.00037957332099124066, 'samples': 9663936, 'steps': 50332, 'loss/train': 1.622420072555542} -08/30/2021 22:19:14 - INFO - __main__ - Step 50334: {'lr': 0.00037956878261867163, 'samples': 9664128, 'steps': 50333, 'loss/train': 0.9953628182411194} -08/30/2021 22:19:16 - INFO - __main__ - Step 50335: {'lr': 0.0003795642441877208, 'samples': 9664320, 'steps': 50334, 'loss/train': 0.8345320224761963} -08/30/2021 22:19:16 - INFO - __main__ - Step 50336: {'lr': 0.0003795597056983903, 'samples': 9664512, 'steps': 50335, 'loss/train': 1.5275577306747437} -08/30/2021 22:19:17 - INFO - __main__ - Step 50337: {'lr': 0.0003795551671506823, 'samples': 9664704, 'steps': 50336, 'loss/train': 0.9670859575271606} -08/30/2021 22:19:17 - INFO - __main__ - Step 50338: {'lr': 0.0003795506285445987, 'samples': 9664896, 'steps': 50337, 'loss/train': 1.4572319984436035} -08/30/2021 22:19:18 - INFO - __main__ - Step 50339: {'lr': 0.0003795460898801415, 'samples': 9665088, 'steps': 50338, 'loss/train': 0.7685204148292542} -08/30/2021 22:19:18 - INFO - __main__ - Step 50340: {'lr': 0.00037954155115731294, 'samples': 9665280, 'steps': 50339, 'loss/train': 0.5451868772506714} -08/30/2021 22:19:20 - INFO - __main__ - Step 50341: {'lr': 0.0003795370123761149, 'samples': 9665472, 'steps': 50340, 'loss/train': 0.10526406764984131} -08/30/2021 22:19:20 - INFO - __main__ - Step 50342: {'lr': 0.00037953247353654946, 'samples': 9665664, 'steps': 50341, 'loss/train': 1.0455020666122437} -08/30/2021 22:19:21 - INFO - __main__ - Step 50343: {'lr': 0.00037952793463861867, 'samples': 9665856, 'steps': 50342, 'loss/train': 1.2337244749069214} -08/30/2021 22:19:21 - INFO - __main__ - Step 50344: {'lr': 0.0003795233956823246, 'samples': 9666048, 'steps': 50343, 'loss/train': 1.4961755275726318} -08/30/2021 22:19:21 - INFO - __main__ - Step 50345: {'lr': 0.0003795188566676694, 'samples': 9666240, 'steps': 50344, 'loss/train': 1.1911262273788452} -08/30/2021 22:19:23 - INFO - __main__ - Step 50346: {'lr': 0.00037951431759465496, 'samples': 9666432, 'steps': 50345, 'loss/train': 1.1223008632659912} -08/30/2021 22:19:23 - INFO - __main__ - Step 50347: {'lr': 0.0003795097784632833, 'samples': 9666624, 'steps': 50346, 'loss/train': 1.3112791776657104} -08/30/2021 22:19:24 - INFO - __main__ - Step 50348: {'lr': 0.00037950523927355657, 'samples': 9666816, 'steps': 50347, 'loss/train': 1.2560820579528809} -08/30/2021 22:19:24 - INFO - __main__ - Step 50349: {'lr': 0.0003795007000254768, 'samples': 9667008, 'steps': 50348, 'loss/train': 1.2496765851974487} -08/30/2021 22:19:24 - INFO - __main__ - Step 50350: {'lr': 0.00037949616071904593, 'samples': 9667200, 'steps': 50349, 'loss/train': 1.2681217193603516} -08/30/2021 22:19:26 - INFO - __main__ - Step 50351: {'lr': 0.0003794916213542662, 'samples': 9667392, 'steps': 50350, 'loss/train': 1.5068633556365967} -08/30/2021 22:19:26 - INFO - __main__ - Step 50352: {'lr': 0.00037948708193113947, 'samples': 9667584, 'steps': 50351, 'loss/train': 1.3616275787353516} -08/30/2021 22:19:27 - INFO - __main__ - Step 50353: {'lr': 0.00037948254244966786, 'samples': 9667776, 'steps': 50352, 'loss/train': 0.043509628623723984} -08/30/2021 22:19:27 - INFO - __main__ - Step 50354: {'lr': 0.00037947800290985344, 'samples': 9667968, 'steps': 50353, 'loss/train': 0.15662576258182526} -08/30/2021 22:19:27 - INFO - __main__ - Step 50355: {'lr': 0.00037947346331169816, 'samples': 9668160, 'steps': 50354, 'loss/train': 1.4839528799057007} -08/30/2021 22:19:29 - INFO - __main__ - Step 50356: {'lr': 0.00037946892365520423, 'samples': 9668352, 'steps': 50355, 'loss/train': 1.3777185678482056} -08/30/2021 22:19:29 - INFO - __main__ - Step 50357: {'lr': 0.00037946438394037356, 'samples': 9668544, 'steps': 50356, 'loss/train': 1.4273455142974854} -08/30/2021 22:19:30 - INFO - __main__ - Step 50358: {'lr': 0.00037945984416720826, 'samples': 9668736, 'steps': 50357, 'loss/train': 0.8957129716873169} -08/30/2021 22:19:30 - INFO - __main__ - Step 50359: {'lr': 0.0003794553043357104, 'samples': 9668928, 'steps': 50358, 'loss/train': 0.31405848264694214} -08/30/2021 22:19:30 - INFO - __main__ - Step 50360: {'lr': 0.0003794507644458819, 'samples': 9669120, 'steps': 50359, 'loss/train': 1.2366201877593994} -08/30/2021 22:19:32 - INFO - __main__ - Step 50361: {'lr': 0.00037944622449772485, 'samples': 9669312, 'steps': 50360, 'loss/train': 2.2917444705963135} -08/30/2021 22:19:33 - INFO - __main__ - Step 50362: {'lr': 0.0003794416844912414, 'samples': 9669504, 'steps': 50361, 'loss/train': 1.1970480680465698} -08/30/2021 22:19:33 - INFO - __main__ - Step 50363: {'lr': 0.0003794371444264335, 'samples': 9669696, 'steps': 50362, 'loss/train': 1.3240857124328613} -08/30/2021 22:19:33 - INFO - __main__ - Step 50364: {'lr': 0.00037943260430330317, 'samples': 9669888, 'steps': 50363, 'loss/train': 1.0201549530029297} -08/30/2021 22:19:34 - INFO - __main__ - Step 50365: {'lr': 0.00037942806412185254, 'samples': 9670080, 'steps': 50364, 'loss/train': 0.054349396377801895} -08/30/2021 22:19:35 - INFO - __main__ - Step 50366: {'lr': 0.0003794235238820837, 'samples': 9670272, 'steps': 50365, 'loss/train': 1.5971604585647583} -08/30/2021 22:19:35 - INFO - __main__ - Step 50367: {'lr': 0.0003794189835839985, 'samples': 9670464, 'steps': 50366, 'loss/train': 1.0613186359405518} -08/30/2021 22:19:36 - INFO - __main__ - Step 50368: {'lr': 0.0003794144432275992, 'samples': 9670656, 'steps': 50367, 'loss/train': 1.5632760524749756} -08/30/2021 22:19:36 - INFO - __main__ - Step 50369: {'lr': 0.0003794099028128877, 'samples': 9670848, 'steps': 50368, 'loss/train': 0.7975529432296753} -08/30/2021 22:19:37 - INFO - __main__ - Step 50370: {'lr': 0.0003794053623398661, 'samples': 9671040, 'steps': 50369, 'loss/train': 1.3893669843673706} -08/30/2021 22:19:37 - INFO - __main__ - Step 50371: {'lr': 0.00037940082180853643, 'samples': 9671232, 'steps': 50370, 'loss/train': 1.3412561416625977} -08/30/2021 22:19:38 - INFO - __main__ - Step 50372: {'lr': 0.0003793962812189008, 'samples': 9671424, 'steps': 50371, 'loss/train': 0.7391544580459595} -08/30/2021 22:19:39 - INFO - __main__ - Step 50373: {'lr': 0.00037939174057096114, 'samples': 9671616, 'steps': 50372, 'loss/train': 0.9940875768661499} -08/30/2021 22:19:39 - INFO - __main__ - Step 50374: {'lr': 0.0003793871998647196, 'samples': 9671808, 'steps': 50373, 'loss/train': 1.8421117067337036} -08/30/2021 22:19:40 - INFO - __main__ - Step 50375: {'lr': 0.00037938265910017813, 'samples': 9672000, 'steps': 50374, 'loss/train': 1.3282018899917603} -08/30/2021 22:19:40 - INFO - __main__ - Step 50376: {'lr': 0.0003793781182773388, 'samples': 9672192, 'steps': 50375, 'loss/train': 1.5118070840835571} -08/30/2021 22:19:41 - INFO - __main__ - Step 50377: {'lr': 0.00037937357739620383, 'samples': 9672384, 'steps': 50376, 'loss/train': 1.5946418046951294} -08/30/2021 22:19:42 - INFO - __main__ - Step 50378: {'lr': 0.000379369036456775, 'samples': 9672576, 'steps': 50377, 'loss/train': 1.3112256526947021} -08/30/2021 22:19:42 - INFO - __main__ - Step 50379: {'lr': 0.00037936449545905457, 'samples': 9672768, 'steps': 50378, 'loss/train': 1.4268401861190796} -08/30/2021 22:19:43 - INFO - __main__ - Step 50380: {'lr': 0.0003793599544030444, 'samples': 9672960, 'steps': 50379, 'loss/train': 1.6437456607818604} -08/30/2021 22:19:43 - INFO - __main__ - Step 50381: {'lr': 0.00037935541328874665, 'samples': 9673152, 'steps': 50380, 'loss/train': 1.082747459411621} -08/30/2021 22:19:45 - INFO - __main__ - Step 50382: {'lr': 0.0003793508721161634, 'samples': 9673344, 'steps': 50381, 'loss/train': 0.9482505321502686} -08/30/2021 22:19:45 - INFO - __main__ - Step 50383: {'lr': 0.00037934633088529656, 'samples': 9673536, 'steps': 50382, 'loss/train': 1.4113882780075073} -08/30/2021 22:19:45 - INFO - __main__ - Step 50384: {'lr': 0.00037934178959614834, 'samples': 9673728, 'steps': 50383, 'loss/train': 1.3113954067230225} -08/30/2021 22:19:46 - INFO - __main__ - Step 50385: {'lr': 0.00037933724824872067, 'samples': 9673920, 'steps': 50384, 'loss/train': 0.44477683305740356} -08/30/2021 22:19:46 - INFO - __main__ - Step 50386: {'lr': 0.00037933270684301567, 'samples': 9674112, 'steps': 50385, 'loss/train': 1.4813883304595947} -08/30/2021 22:19:46 - INFO - __main__ - Step 50387: {'lr': 0.00037932816537903535, 'samples': 9674304, 'steps': 50386, 'loss/train': 1.17421293258667} -08/30/2021 22:19:48 - INFO - __main__ - Step 50388: {'lr': 0.0003793236238567817, 'samples': 9674496, 'steps': 50387, 'loss/train': 0.2824392318725586} -08/30/2021 22:19:48 - INFO - __main__ - Step 50389: {'lr': 0.00037931908227625686, 'samples': 9674688, 'steps': 50388, 'loss/train': 1.0637861490249634} -08/30/2021 22:19:49 - INFO - __main__ - Step 50390: {'lr': 0.0003793145406374628, 'samples': 9674880, 'steps': 50389, 'loss/train': 2.0855588912963867} -08/30/2021 22:19:49 - INFO - __main__ - Step 50391: {'lr': 0.0003793099989404016, 'samples': 9675072, 'steps': 50390, 'loss/train': 2.438366651535034} -08/30/2021 22:19:50 - INFO - __main__ - Step 50392: {'lr': 0.00037930545718507536, 'samples': 9675264, 'steps': 50391, 'loss/train': 0.3896178603172302} -08/30/2021 22:19:51 - INFO - __main__ - Step 50393: {'lr': 0.000379300915371486, 'samples': 9675456, 'steps': 50392, 'loss/train': 0.053256504237651825} -08/30/2021 22:19:52 - INFO - __main__ - Step 50394: {'lr': 0.00037929637349963573, 'samples': 9675648, 'steps': 50393, 'loss/train': 1.3573461771011353} -08/30/2021 22:19:52 - INFO - __main__ - Step 50395: {'lr': 0.00037929183156952653, 'samples': 9675840, 'steps': 50394, 'loss/train': 1.1020805835723877} -08/30/2021 22:19:52 - INFO - __main__ - Step 50396: {'lr': 0.00037928728958116034, 'samples': 9676032, 'steps': 50395, 'loss/train': 1.466937780380249} -08/30/2021 22:19:53 - INFO - __main__ - Step 50397: {'lr': 0.0003792827475345393, 'samples': 9676224, 'steps': 50396, 'loss/train': 2.017697334289551} -08/30/2021 22:19:55 - INFO - __main__ - Step 50398: {'lr': 0.00037927820542966545, 'samples': 9676416, 'steps': 50397, 'loss/train': 0.3912416100502014} -08/30/2021 22:19:55 - INFO - __main__ - Step 50399: {'lr': 0.0003792736632665409, 'samples': 9676608, 'steps': 50398, 'loss/train': 0.9029219150543213} -08/30/2021 22:19:55 - INFO - __main__ - Step 50400: {'lr': 0.0003792691210451676, 'samples': 9676800, 'steps': 50399, 'loss/train': 1.422010064125061} -08/30/2021 22:19:56 - INFO - __main__ - Step 50401: {'lr': 0.0003792645787655476, 'samples': 9676992, 'steps': 50400, 'loss/train': 1.333550214767456} -08/30/2021 22:19:56 - INFO - __main__ - Step 50402: {'lr': 0.000379260036427683, 'samples': 9677184, 'steps': 50401, 'loss/train': 1.3777899742126465} -08/30/2021 22:19:58 - INFO - __main__ - Step 50403: {'lr': 0.0003792554940315758, 'samples': 9677376, 'steps': 50402, 'loss/train': 1.3697956800460815} -08/30/2021 22:19:58 - INFO - __main__ - Step 50404: {'lr': 0.00037925095157722807, 'samples': 9677568, 'steps': 50403, 'loss/train': 1.6141688823699951} -08/30/2021 22:19:59 - INFO - __main__ - Step 50405: {'lr': 0.0003792464090646419, 'samples': 9677760, 'steps': 50404, 'loss/train': 1.0716619491577148} -08/30/2021 22:19:59 - INFO - __main__ - Step 50406: {'lr': 0.00037924186649381924, 'samples': 9677952, 'steps': 50405, 'loss/train': 1.2296751737594604} -08/30/2021 22:19:59 - INFO - __main__ - Step 50407: {'lr': 0.00037923732386476225, 'samples': 9678144, 'steps': 50406, 'loss/train': 1.3345345258712769} -08/30/2021 22:20:01 - INFO - __main__ - Step 50408: {'lr': 0.0003792327811774728, 'samples': 9678336, 'steps': 50407, 'loss/train': 0.9169405698776245} -08/30/2021 22:20:01 - INFO - __main__ - Step 50409: {'lr': 0.00037922823843195317, 'samples': 9678528, 'steps': 50408, 'loss/train': 1.1381680965423584} -08/30/2021 22:20:02 - INFO - __main__ - Step 50410: {'lr': 0.00037922369562820525, 'samples': 9678720, 'steps': 50409, 'loss/train': 1.4404726028442383} -08/30/2021 22:20:02 - INFO - __main__ - Step 50411: {'lr': 0.00037921915276623106, 'samples': 9678912, 'steps': 50410, 'loss/train': 1.7571897506713867} -08/30/2021 22:20:02 - INFO - __main__ - Step 50412: {'lr': 0.00037921460984603284, 'samples': 9679104, 'steps': 50411, 'loss/train': 1.0104024410247803} -08/30/2021 22:20:03 - INFO - __main__ - Step 50413: {'lr': 0.0003792100668676125, 'samples': 9679296, 'steps': 50412, 'loss/train': 0.17325729131698608} -08/30/2021 22:20:04 - INFO - __main__ - Step 50414: {'lr': 0.000379205523830972, 'samples': 9679488, 'steps': 50413, 'loss/train': 1.3279976844787598} -08/30/2021 22:20:05 - INFO - __main__ - Step 50415: {'lr': 0.0003792009807361135, 'samples': 9679680, 'steps': 50414, 'loss/train': 1.4849002361297607} -08/30/2021 22:20:05 - INFO - __main__ - Step 50416: {'lr': 0.00037919643758303913, 'samples': 9679872, 'steps': 50415, 'loss/train': 1.2370009422302246} -08/30/2021 22:20:05 - INFO - __main__ - Step 50417: {'lr': 0.0003791918943717507, 'samples': 9680064, 'steps': 50416, 'loss/train': 0.8366214632987976} -08/30/2021 22:20:06 - INFO - __main__ - Step 50418: {'lr': 0.0003791873511022505, 'samples': 9680256, 'steps': 50417, 'loss/train': 0.03460828959941864} -08/30/2021 22:20:07 - INFO - __main__ - Step 50419: {'lr': 0.0003791828077745405, 'samples': 9680448, 'steps': 50418, 'loss/train': 1.2640575170516968} -08/30/2021 22:20:08 - INFO - __main__ - Step 50420: {'lr': 0.00037917826438862263, 'samples': 9680640, 'steps': 50419, 'loss/train': 1.0997360944747925} -08/30/2021 22:20:08 - INFO - __main__ - Step 50421: {'lr': 0.0003791737209444991, 'samples': 9680832, 'steps': 50420, 'loss/train': 0.8631041646003723} -08/30/2021 22:20:08 - INFO - __main__ - Step 50422: {'lr': 0.00037916917744217185, 'samples': 9681024, 'steps': 50421, 'loss/train': 1.4901387691497803} -08/30/2021 22:20:09 - INFO - __main__ - Step 50423: {'lr': 0.0003791646338816429, 'samples': 9681216, 'steps': 50422, 'loss/train': 1.4181979894638062} -08/30/2021 22:20:10 - INFO - __main__ - Step 50424: {'lr': 0.0003791600902629144, 'samples': 9681408, 'steps': 50423, 'loss/train': 1.0080450773239136} -08/30/2021 22:20:11 - INFO - __main__ - Step 50425: {'lr': 0.0003791555465859884, 'samples': 9681600, 'steps': 50424, 'loss/train': 1.7133841514587402} -08/30/2021 22:20:11 - INFO - __main__ - Step 50426: {'lr': 0.0003791510028508669, 'samples': 9681792, 'steps': 50425, 'loss/train': 1.6686477661132812} -08/30/2021 22:20:12 - INFO - __main__ - Step 50427: {'lr': 0.0003791464590575519, 'samples': 9681984, 'steps': 50426, 'loss/train': 1.200631022453308} -08/30/2021 22:20:12 - INFO - __main__ - Step 50428: {'lr': 0.0003791419152060455, 'samples': 9682176, 'steps': 50427, 'loss/train': 0.030982481315732002} -08/30/2021 22:20:12 - INFO - __main__ - Step 50429: {'lr': 0.00037913737129634977, 'samples': 9682368, 'steps': 50428, 'loss/train': 1.3544490337371826} -08/30/2021 22:20:14 - INFO - __main__ - Step 50430: {'lr': 0.00037913282732846676, 'samples': 9682560, 'steps': 50429, 'loss/train': 1.3566209077835083} -08/30/2021 22:20:14 - INFO - __main__ - Step 50431: {'lr': 0.0003791282833023985, 'samples': 9682752, 'steps': 50430, 'loss/train': 1.3717893362045288} -08/30/2021 22:20:15 - INFO - __main__ - Step 50432: {'lr': 0.0003791237392181469, 'samples': 9682944, 'steps': 50431, 'loss/train': 1.493273377418518} -08/30/2021 22:20:15 - INFO - __main__ - Step 50433: {'lr': 0.0003791191950757143, 'samples': 9683136, 'steps': 50432, 'loss/train': 1.629561424255371} -08/30/2021 22:20:15 - INFO - __main__ - Step 50434: {'lr': 0.0003791146508751025, 'samples': 9683328, 'steps': 50433, 'loss/train': 0.8616991639137268} -08/30/2021 22:20:17 - INFO - __main__ - Step 50435: {'lr': 0.00037911010661631364, 'samples': 9683520, 'steps': 50434, 'loss/train': 1.4288216829299927} -08/30/2021 22:20:17 - INFO - __main__ - Step 50436: {'lr': 0.0003791055622993498, 'samples': 9683712, 'steps': 50435, 'loss/train': 1.7565444707870483} -08/30/2021 22:20:18 - INFO - __main__ - Step 50437: {'lr': 0.0003791010179242129, 'samples': 9683904, 'steps': 50436, 'loss/train': 1.4624242782592773} -08/30/2021 22:20:18 - INFO - __main__ - Step 50438: {'lr': 0.0003790964734909051, 'samples': 9684096, 'steps': 50437, 'loss/train': 1.2148696184158325} -08/30/2021 22:20:18 - INFO - __main__ - Step 50439: {'lr': 0.00037909192899942846, 'samples': 9684288, 'steps': 50438, 'loss/train': 1.2736929655075073} -08/30/2021 22:20:20 - INFO - __main__ - Step 50440: {'lr': 0.00037908738444978495, 'samples': 9684480, 'steps': 50439, 'loss/train': 1.385855793952942} -08/30/2021 22:20:20 - INFO - __main__ - Step 50441: {'lr': 0.00037908283984197666, 'samples': 9684672, 'steps': 50440, 'loss/train': 0.09207213670015335} -08/30/2021 22:20:21 - INFO - __main__ - Step 50442: {'lr': 0.0003790782951760057, 'samples': 9684864, 'steps': 50441, 'loss/train': 1.4321266412734985} -08/30/2021 22:20:21 - INFO - __main__ - Step 50443: {'lr': 0.000379073750451874, 'samples': 9685056, 'steps': 50442, 'loss/train': 0.9199109077453613} -08/30/2021 22:20:21 - INFO - __main__ - Step 50444: {'lr': 0.00037906920566958363, 'samples': 9685248, 'steps': 50443, 'loss/train': 1.519266128540039} -08/30/2021 22:20:22 - INFO - __main__ - Step 50445: {'lr': 0.0003790646608291367, 'samples': 9685440, 'steps': 50444, 'loss/train': 1.294013500213623} -08/30/2021 22:20:23 - INFO - __main__ - Step 50446: {'lr': 0.00037906011593053527, 'samples': 9685632, 'steps': 50445, 'loss/train': 1.2787879705429077} -08/30/2021 22:20:24 - INFO - __main__ - Step 50447: {'lr': 0.00037905557097378127, 'samples': 9685824, 'steps': 50446, 'loss/train': 2.162569999694824} -08/30/2021 22:20:24 - INFO - __main__ - Step 50448: {'lr': 0.00037905102595887685, 'samples': 9686016, 'steps': 50447, 'loss/train': 0.8693594932556152} -08/30/2021 22:20:25 - INFO - __main__ - Step 50449: {'lr': 0.00037904648088582407, 'samples': 9686208, 'steps': 50448, 'loss/train': 1.4210799932479858} -08/30/2021 22:20:25 - INFO - __main__ - Step 50450: {'lr': 0.0003790419357546249, 'samples': 9686400, 'steps': 50449, 'loss/train': 1.338752269744873} -08/30/2021 22:20:27 - INFO - __main__ - Step 50451: {'lr': 0.0003790373905652814, 'samples': 9686592, 'steps': 50450, 'loss/train': 1.6669880151748657} -08/30/2021 22:20:28 - INFO - __main__ - Step 50452: {'lr': 0.0003790328453177957, 'samples': 9686784, 'steps': 50451, 'loss/train': 0.9682377576828003} -08/30/2021 22:20:28 - INFO - __main__ - Step 50453: {'lr': 0.0003790283000121697, 'samples': 9686976, 'steps': 50452, 'loss/train': 1.7377610206604004} -08/30/2021 22:20:28 - INFO - __main__ - Step 50454: {'lr': 0.0003790237546484056, 'samples': 9687168, 'steps': 50453, 'loss/train': 2.087350368499756} -08/30/2021 22:20:29 - INFO - __main__ - Step 50455: {'lr': 0.00037901920922650534, 'samples': 9687360, 'steps': 50454, 'loss/train': 0.06459533423185349} -08/30/2021 22:20:30 - INFO - __main__ - Step 50456: {'lr': 0.0003790146637464711, 'samples': 9687552, 'steps': 50455, 'loss/train': 1.022745132446289} -08/30/2021 22:20:31 - INFO - __main__ - Step 50457: {'lr': 0.0003790101182083048, 'samples': 9687744, 'steps': 50456, 'loss/train': 1.688386082649231} -08/30/2021 22:20:31 - INFO - __main__ - Step 50458: {'lr': 0.0003790055726120085, 'samples': 9687936, 'steps': 50457, 'loss/train': 1.0698438882827759} -08/30/2021 22:20:31 - INFO - __main__ - Step 50459: {'lr': 0.0003790010269575844, 'samples': 9688128, 'steps': 50458, 'loss/train': 1.3004378080368042} -08/30/2021 22:20:32 - INFO - __main__ - Step 50460: {'lr': 0.00037899648124503426, 'samples': 9688320, 'steps': 50459, 'loss/train': 1.3318828344345093} -08/30/2021 22:20:33 - INFO - __main__ - Step 50461: {'lr': 0.0003789919354743604, 'samples': 9688512, 'steps': 50460, 'loss/train': 1.0920735597610474} -08/30/2021 22:20:34 - INFO - __main__ - Step 50462: {'lr': 0.00037898738964556474, 'samples': 9688704, 'steps': 50461, 'loss/train': 1.713529109954834} -08/30/2021 22:20:34 - INFO - __main__ - Step 50463: {'lr': 0.0003789828437586494, 'samples': 9688896, 'steps': 50462, 'loss/train': 1.3665308952331543} -08/30/2021 22:20:34 - INFO - __main__ - Step 50464: {'lr': 0.0003789782978136163, 'samples': 9689088, 'steps': 50463, 'loss/train': 1.498956561088562} -08/30/2021 22:20:35 - INFO - __main__ - Step 50465: {'lr': 0.0003789737518104676, 'samples': 9689280, 'steps': 50464, 'loss/train': 2.150615930557251} -08/30/2021 22:20:36 - INFO - __main__ - Step 50466: {'lr': 0.0003789692057492053, 'samples': 9689472, 'steps': 50465, 'loss/train': 1.1512203216552734} -08/30/2021 22:20:37 - INFO - __main__ - Step 50467: {'lr': 0.0003789646596298315, 'samples': 9689664, 'steps': 50466, 'loss/train': 1.5628005266189575} -08/30/2021 22:20:37 - INFO - __main__ - Step 50468: {'lr': 0.0003789601134523482, 'samples': 9689856, 'steps': 50467, 'loss/train': 1.2388564348220825} -08/30/2021 22:20:37 - INFO - __main__ - Step 50469: {'lr': 0.0003789555672167575, 'samples': 9690048, 'steps': 50468, 'loss/train': 0.8184484839439392} -08/30/2021 22:20:38 - INFO - __main__ - Step 50470: {'lr': 0.00037895102092306134, 'samples': 9690240, 'steps': 50469, 'loss/train': 1.483014702796936} -08/30/2021 22:20:39 - INFO - __main__ - Step 50471: {'lr': 0.00037894647457126186, 'samples': 9690432, 'steps': 50470, 'loss/train': 1.4407098293304443} -08/30/2021 22:20:40 - INFO - __main__ - Step 50472: {'lr': 0.00037894192816136107, 'samples': 9690624, 'steps': 50471, 'loss/train': 1.1762523651123047} -08/30/2021 22:20:40 - INFO - __main__ - Step 50473: {'lr': 0.00037893738169336114, 'samples': 9690816, 'steps': 50472, 'loss/train': 1.4748085737228394} -08/30/2021 22:20:40 - INFO - __main__ - Step 50474: {'lr': 0.00037893283516726397, 'samples': 9691008, 'steps': 50473, 'loss/train': 1.5161131620407104} -08/30/2021 22:20:41 - INFO - __main__ - Step 50475: {'lr': 0.0003789282885830716, 'samples': 9691200, 'steps': 50474, 'loss/train': 1.1971051692962646} -08/30/2021 22:20:42 - INFO - __main__ - Step 50476: {'lr': 0.0003789237419407862, 'samples': 9691392, 'steps': 50475, 'loss/train': 1.5350041389465332} -08/30/2021 22:20:43 - INFO - __main__ - Step 50477: {'lr': 0.00037891919524040964, 'samples': 9691584, 'steps': 50476, 'loss/train': 1.3255949020385742} -08/30/2021 22:20:43 - INFO - __main__ - Step 50478: {'lr': 0.0003789146484819442, 'samples': 9691776, 'steps': 50477, 'loss/train': 1.07156240940094} -08/30/2021 22:20:43 - INFO - __main__ - Step 50479: {'lr': 0.00037891010166539175, 'samples': 9691968, 'steps': 50478, 'loss/train': 1.3630187511444092} -08/30/2021 22:20:44 - INFO - __main__ - Step 50480: {'lr': 0.00037890555479075437, 'samples': 9692160, 'steps': 50479, 'loss/train': 0.5146199464797974} -08/30/2021 22:20:44 - INFO - __main__ - Step 50481: {'lr': 0.0003789010078580342, 'samples': 9692352, 'steps': 50480, 'loss/train': 1.1166805028915405} -08/30/2021 22:20:46 - INFO - __main__ - Step 50482: {'lr': 0.00037889646086723325, 'samples': 9692544, 'steps': 50481, 'loss/train': 1.5784718990325928} -08/30/2021 22:20:46 - INFO - __main__ - Step 50483: {'lr': 0.0003788919138183534, 'samples': 9692736, 'steps': 50482, 'loss/train': 0.40377771854400635} -08/30/2021 22:20:46 - INFO - __main__ - Step 50484: {'lr': 0.000378887366711397, 'samples': 9692928, 'steps': 50483, 'loss/train': 0.8656853437423706} -08/30/2021 22:20:47 - INFO - __main__ - Step 50485: {'lr': 0.0003788828195463658, 'samples': 9693120, 'steps': 50484, 'loss/train': 1.388512134552002} -08/30/2021 22:20:47 - INFO - __main__ - Step 50486: {'lr': 0.0003788782723232621, 'samples': 9693312, 'steps': 50485, 'loss/train': 1.1282594203948975} -08/30/2021 22:20:49 - INFO - __main__ - Step 50487: {'lr': 0.00037887372504208784, 'samples': 9693504, 'steps': 50486, 'loss/train': 0.29486918449401855} -08/30/2021 22:20:49 - INFO - __main__ - Step 50488: {'lr': 0.000378869177702845, 'samples': 9693696, 'steps': 50487, 'loss/train': 0.04244080185890198} -08/30/2021 22:20:50 - INFO - __main__ - Step 50489: {'lr': 0.00037886463030553576, 'samples': 9693888, 'steps': 50488, 'loss/train': 1.0847463607788086} -08/30/2021 22:20:50 - INFO - __main__ - Step 50490: {'lr': 0.0003788600828501621, 'samples': 9694080, 'steps': 50489, 'loss/train': 1.067902684211731} -08/30/2021 22:20:51 - INFO - __main__ - Step 50491: {'lr': 0.000378855535336726, 'samples': 9694272, 'steps': 50490, 'loss/train': 1.4128140211105347} -08/30/2021 22:20:52 - INFO - __main__ - Step 50492: {'lr': 0.00037885098776522966, 'samples': 9694464, 'steps': 50491, 'loss/train': 1.4622515439987183} -08/30/2021 22:20:53 - INFO - __main__ - Step 50493: {'lr': 0.00037884644013567504, 'samples': 9694656, 'steps': 50492, 'loss/train': 1.5088398456573486} -08/30/2021 22:20:53 - INFO - __main__ - Step 50494: {'lr': 0.0003788418924480642, 'samples': 9694848, 'steps': 50493, 'loss/train': 1.3884984254837036} -08/30/2021 22:20:54 - INFO - __main__ - Step 50495: {'lr': 0.00037883734470239914, 'samples': 9695040, 'steps': 50494, 'loss/train': 1.083364725112915} -08/30/2021 22:20:54 - INFO - __main__ - Step 50496: {'lr': 0.00037883279689868203, 'samples': 9695232, 'steps': 50495, 'loss/train': 2.148885726928711} -08/30/2021 22:20:54 - INFO - __main__ - Step 50497: {'lr': 0.00037882824903691484, 'samples': 9695424, 'steps': 50496, 'loss/train': 1.3913482427597046} -08/30/2021 22:20:56 - INFO - __main__ - Step 50498: {'lr': 0.00037882370111709963, 'samples': 9695616, 'steps': 50497, 'loss/train': 1.215844750404358} -08/30/2021 22:20:57 - INFO - __main__ - Step 50499: {'lr': 0.00037881915313923845, 'samples': 9695808, 'steps': 50498, 'loss/train': 0.9273170232772827} -08/30/2021 22:20:57 - INFO - __main__ - Step 50500: {'lr': 0.0003788146051033333, 'samples': 9696000, 'steps': 50499, 'loss/train': 0.028722768649458885} -08/30/2021 22:20:57 - INFO - __main__ - Step 50501: {'lr': 0.0003788100570093863, 'samples': 9696192, 'steps': 50500, 'loss/train': 1.482971429824829} -08/30/2021 22:20:58 - INFO - __main__ - Step 50502: {'lr': 0.0003788055088573995, 'samples': 9696384, 'steps': 50501, 'loss/train': 0.9697481989860535} -08/30/2021 22:20:58 - INFO - __main__ - Step 50503: {'lr': 0.0003788009606473749, 'samples': 9696576, 'steps': 50502, 'loss/train': 1.6186118125915527} -08/30/2021 22:21:00 - INFO - __main__ - Step 50504: {'lr': 0.0003787964123793146, 'samples': 9696768, 'steps': 50503, 'loss/train': 0.5148093104362488} -08/30/2021 22:21:00 - INFO - __main__ - Step 50505: {'lr': 0.0003787918640532206, 'samples': 9696960, 'steps': 50504, 'loss/train': 1.8639370203018188} -08/30/2021 22:21:00 - INFO - __main__ - Step 50506: {'lr': 0.000378787315669095, 'samples': 9697152, 'steps': 50505, 'loss/train': 1.7922765016555786} -08/30/2021 22:21:01 - INFO - __main__ - Step 50507: {'lr': 0.00037878276722693984, 'samples': 9697344, 'steps': 50506, 'loss/train': 1.0665982961654663} -08/30/2021 22:21:01 - INFO - __main__ - Step 50508: {'lr': 0.00037877821872675705, 'samples': 9697536, 'steps': 50507, 'loss/train': 2.1430463790893555} -08/30/2021 22:21:03 - INFO - __main__ - Step 50509: {'lr': 0.00037877367016854886, 'samples': 9697728, 'steps': 50508, 'loss/train': 1.5658303499221802} -08/30/2021 22:21:04 - INFO - __main__ - Step 50510: {'lr': 0.00037876912155231725, 'samples': 9697920, 'steps': 50509, 'loss/train': 1.7043001651763916} -08/30/2021 22:21:04 - INFO - __main__ - Step 50511: {'lr': 0.0003787645728780642, 'samples': 9698112, 'steps': 50510, 'loss/train': 1.4626330137252808} -08/30/2021 22:21:05 - INFO - __main__ - Step 50512: {'lr': 0.0003787600241457918, 'samples': 9698304, 'steps': 50511, 'loss/train': 0.7246716618537903} -08/30/2021 22:21:05 - INFO - __main__ - Step 50513: {'lr': 0.0003787554753555022, 'samples': 9698496, 'steps': 50512, 'loss/train': 0.1511334329843521} -08/30/2021 22:21:05 - INFO - __main__ - Step 50514: {'lr': 0.00037875092650719737, 'samples': 9698688, 'steps': 50513, 'loss/train': 1.238606572151184} -08/30/2021 22:21:07 - INFO - __main__ - Step 50515: {'lr': 0.0003787463776008794, 'samples': 9698880, 'steps': 50514, 'loss/train': 1.3823033571243286} -08/30/2021 22:21:07 - INFO - __main__ - Step 50516: {'lr': 0.00037874182863655015, 'samples': 9699072, 'steps': 50515, 'loss/train': 1.6361545324325562} -08/30/2021 22:21:08 - INFO - __main__ - Step 50517: {'lr': 0.00037873727961421197, 'samples': 9699264, 'steps': 50516, 'loss/train': 0.05841180682182312} -08/30/2021 22:21:08 - INFO - __main__ - Step 50518: {'lr': 0.00037873273053386664, 'samples': 9699456, 'steps': 50517, 'loss/train': 1.4625422954559326} -08/30/2021 22:21:09 - INFO - __main__ - Step 50519: {'lr': 0.00037872818139551633, 'samples': 9699648, 'steps': 50518, 'loss/train': 1.781665563583374} -08/30/2021 22:21:10 - INFO - __main__ - Step 50520: {'lr': 0.0003787236321991632, 'samples': 9699840, 'steps': 50519, 'loss/train': 0.7029191851615906} -08/30/2021 22:21:11 - INFO - __main__ - Step 50521: {'lr': 0.0003787190829448092, 'samples': 9700032, 'steps': 50520, 'loss/train': 1.6387474536895752} -08/30/2021 22:21:11 - INFO - __main__ - Step 50522: {'lr': 0.00037871453363245625, 'samples': 9700224, 'steps': 50521, 'loss/train': 0.0813499167561531} -08/30/2021 22:21:12 - INFO - __main__ - Step 50523: {'lr': 0.0003787099842621066, 'samples': 9700416, 'steps': 50522, 'loss/train': 1.9128237962722778} -08/30/2021 22:21:12 - INFO - __main__ - Step 50524: {'lr': 0.0003787054348337621, 'samples': 9700608, 'steps': 50523, 'loss/train': 1.0082141160964966} -08/30/2021 22:21:13 - INFO - __main__ - Step 50525: {'lr': 0.000378700885347425, 'samples': 9700800, 'steps': 50524, 'loss/train': 1.7036052942276} -08/30/2021 22:21:14 - INFO - __main__ - Step 50526: {'lr': 0.0003786963358030973, 'samples': 9700992, 'steps': 50525, 'loss/train': 1.4115265607833862} -08/30/2021 22:21:14 - INFO - __main__ - Step 50527: {'lr': 0.000378691786200781, 'samples': 9701184, 'steps': 50526, 'loss/train': 0.047478705644607544} -08/30/2021 22:21:15 - INFO - __main__ - Step 50528: {'lr': 0.0003786872365404781, 'samples': 9701376, 'steps': 50527, 'loss/train': 1.170424222946167} -08/30/2021 22:21:15 - INFO - __main__ - Step 50529: {'lr': 0.00037868268682219073, 'samples': 9701568, 'steps': 50528, 'loss/train': 1.1574803590774536} -08/30/2021 22:21:16 - INFO - __main__ - Step 50530: {'lr': 0.000378678137045921, 'samples': 9701760, 'steps': 50529, 'loss/train': 0.46257394552230835} -08/30/2021 22:21:17 - INFO - __main__ - Step 50531: {'lr': 0.0003786735872116709, 'samples': 9701952, 'steps': 50530, 'loss/train': 1.9290759563446045} -08/30/2021 22:21:17 - INFO - __main__ - Step 50532: {'lr': 0.00037866903731944234, 'samples': 9702144, 'steps': 50531, 'loss/train': 1.5081276893615723} -08/30/2021 22:21:18 - INFO - __main__ - Step 50533: {'lr': 0.0003786644873692376, 'samples': 9702336, 'steps': 50532, 'loss/train': 1.5965487957000732} -08/30/2021 22:21:18 - INFO - __main__ - Step 50534: {'lr': 0.0003786599373610586, 'samples': 9702528, 'steps': 50533, 'loss/train': 0.8760868906974792} -08/30/2021 22:21:19 - INFO - __main__ - Step 50535: {'lr': 0.00037865538729490745, 'samples': 9702720, 'steps': 50534, 'loss/train': 0.978447675704956} -08/30/2021 22:21:20 - INFO - __main__ - Step 50536: {'lr': 0.00037865083717078605, 'samples': 9702912, 'steps': 50535, 'loss/train': 1.0426462888717651} -08/30/2021 22:21:20 - INFO - __main__ - Step 50537: {'lr': 0.00037864628698869676, 'samples': 9703104, 'steps': 50536, 'loss/train': 1.335335612297058} -08/30/2021 22:21:21 - INFO - __main__ - Step 50538: {'lr': 0.0003786417367486413, 'samples': 9703296, 'steps': 50537, 'loss/train': 1.4903407096862793} -08/30/2021 22:21:21 - INFO - __main__ - Step 50539: {'lr': 0.00037863718645062184, 'samples': 9703488, 'steps': 50538, 'loss/train': 1.087868332862854} -08/30/2021 22:21:23 - INFO - __main__ - Step 50540: {'lr': 0.00037863263609464056, 'samples': 9703680, 'steps': 50539, 'loss/train': 0.1528826504945755} -08/30/2021 22:21:23 - INFO - __main__ - Step 50541: {'lr': 0.00037862808568069935, 'samples': 9703872, 'steps': 50540, 'loss/train': 1.6069130897521973} -08/30/2021 22:21:23 - INFO - __main__ - Step 50542: {'lr': 0.00037862353520880026, 'samples': 9704064, 'steps': 50541, 'loss/train': 0.04344052076339722} -08/30/2021 22:21:24 - INFO - __main__ - Step 50543: {'lr': 0.0003786189846789454, 'samples': 9704256, 'steps': 50542, 'loss/train': 1.616071105003357} -08/30/2021 22:21:24 - INFO - __main__ - Step 50544: {'lr': 0.00037861443409113683, 'samples': 9704448, 'steps': 50543, 'loss/train': 0.6492910981178284} -08/30/2021 22:21:26 - INFO - __main__ - Step 50545: {'lr': 0.0003786098834453766, 'samples': 9704640, 'steps': 50544, 'loss/train': 1.0638542175292969} -08/30/2021 22:21:26 - INFO - __main__ - Step 50546: {'lr': 0.00037860533274166675, 'samples': 9704832, 'steps': 50545, 'loss/train': 0.8705479502677917} -08/30/2021 22:21:27 - INFO - __main__ - Step 50547: {'lr': 0.0003786007819800094, 'samples': 9705024, 'steps': 50546, 'loss/train': 1.601859211921692} -08/30/2021 22:21:27 - INFO - __main__ - Step 50548: {'lr': 0.00037859623116040633, 'samples': 9705216, 'steps': 50547, 'loss/train': 1.2495027780532837} -08/30/2021 22:21:27 - INFO - __main__ - Step 50549: {'lr': 0.00037859168028285984, 'samples': 9705408, 'steps': 50548, 'loss/train': 1.7164394855499268} -08/30/2021 22:21:29 - INFO - __main__ - Step 50550: {'lr': 0.000378587129347372, 'samples': 9705600, 'steps': 50549, 'loss/train': 0.05807496979832649} -08/30/2021 22:21:29 - INFO - __main__ - Step 50551: {'lr': 0.00037858257835394473, 'samples': 9705792, 'steps': 50550, 'loss/train': 1.4299025535583496} -08/30/2021 22:21:30 - INFO - __main__ - Step 50552: {'lr': 0.0003785780273025802, 'samples': 9705984, 'steps': 50551, 'loss/train': 2.5643904209136963} -08/30/2021 22:21:30 - INFO - __main__ - Step 50553: {'lr': 0.00037857347619328033, 'samples': 9706176, 'steps': 50552, 'loss/train': 1.5339922904968262} -08/30/2021 22:21:30 - INFO - __main__ - Step 50554: {'lr': 0.0003785689250260472, 'samples': 9706368, 'steps': 50553, 'loss/train': 1.4461265802383423} -08/30/2021 22:21:31 - INFO - __main__ - Step 50555: {'lr': 0.00037856437380088295, 'samples': 9706560, 'steps': 50554, 'loss/train': 0.8127725124359131} -08/30/2021 22:21:33 - INFO - __main__ - Step 50556: {'lr': 0.0003785598225177896, 'samples': 9706752, 'steps': 50555, 'loss/train': 1.147077202796936} -08/30/2021 22:21:33 - INFO - __main__ - Step 50557: {'lr': 0.0003785552711767691, 'samples': 9706944, 'steps': 50556, 'loss/train': 1.4499472379684448} -08/30/2021 22:21:33 - INFO - __main__ - Step 50558: {'lr': 0.0003785507197778236, 'samples': 9707136, 'steps': 50557, 'loss/train': 1.9343966245651245} -08/30/2021 22:21:34 - INFO - __main__ - Step 50559: {'lr': 0.0003785461683209552, 'samples': 9707328, 'steps': 50558, 'loss/train': 0.39147353172302246} -08/30/2021 22:21:34 - INFO - __main__ - Step 50560: {'lr': 0.00037854161680616586, 'samples': 9707520, 'steps': 50559, 'loss/train': 0.29870110750198364} -08/30/2021 22:21:36 - INFO - __main__ - Step 50561: {'lr': 0.00037853706523345766, 'samples': 9707712, 'steps': 50560, 'loss/train': 1.3760384321212769} -08/30/2021 22:21:37 - INFO - __main__ - Step 50562: {'lr': 0.0003785325136028326, 'samples': 9707904, 'steps': 50561, 'loss/train': 1.5541393756866455} -08/30/2021 22:21:37 - INFO - __main__ - Step 50563: {'lr': 0.0003785279619142927, 'samples': 9708096, 'steps': 50562, 'loss/train': 1.1044286489486694} -08/30/2021 22:21:37 - INFO - __main__ - Step 50564: {'lr': 0.0003785234101678402, 'samples': 9708288, 'steps': 50563, 'loss/train': 1.921372890472412} -08/30/2021 22:21:38 - INFO - __main__ - Step 50565: {'lr': 0.000378518858363477, 'samples': 9708480, 'steps': 50564, 'loss/train': 1.6993879079818726} -08/30/2021 22:21:40 - INFO - __main__ - Step 50566: {'lr': 0.00037851430650120516, 'samples': 9708672, 'steps': 50565, 'loss/train': 1.389115810394287} -08/30/2021 22:21:40 - INFO - __main__ - Step 50567: {'lr': 0.00037850975458102686, 'samples': 9708864, 'steps': 50566, 'loss/train': 1.2794448137283325} -08/30/2021 22:21:41 - INFO - __main__ - Step 50568: {'lr': 0.000378505202602944, 'samples': 9709056, 'steps': 50567, 'loss/train': 0.5103938579559326} -08/30/2021 22:21:41 - INFO - __main__ - Step 50569: {'lr': 0.0003785006505669586, 'samples': 9709248, 'steps': 50568, 'loss/train': 1.9048649072647095} -08/30/2021 22:21:42 - INFO - __main__ - Step 50570: {'lr': 0.0003784960984730728, 'samples': 9709440, 'steps': 50569, 'loss/train': 1.2146530151367188} -08/30/2021 22:21:42 - INFO - __main__ - Step 50571: {'lr': 0.00037849154632128867, 'samples': 9709632, 'steps': 50570, 'loss/train': 1.0356727838516235} -08/30/2021 22:21:43 - INFO - __main__ - Step 50572: {'lr': 0.0003784869941116082, 'samples': 9709824, 'steps': 50571, 'loss/train': 1.3006784915924072} -08/30/2021 22:21:44 - INFO - __main__ - Step 50573: {'lr': 0.00037848244184403356, 'samples': 9710016, 'steps': 50572, 'loss/train': 0.6703782677650452} -08/30/2021 22:21:44 - INFO - __main__ - Step 50574: {'lr': 0.0003784778895185667, 'samples': 9710208, 'steps': 50573, 'loss/train': 2.58648681640625} -08/30/2021 22:21:45 - INFO - __main__ - Step 50575: {'lr': 0.00037847333713520966, 'samples': 9710400, 'steps': 50574, 'loss/train': 1.1255229711532593} -08/30/2021 22:21:45 - INFO - __main__ - Step 50576: {'lr': 0.0003784687846939645, 'samples': 9710592, 'steps': 50575, 'loss/train': 1.249817967414856} -08/30/2021 22:21:45 - INFO - __main__ - Step 50577: {'lr': 0.00037846423219483325, 'samples': 9710784, 'steps': 50576, 'loss/train': 1.1773347854614258} -08/30/2021 22:21:47 - INFO - __main__ - Step 50578: {'lr': 0.00037845967963781807, 'samples': 9710976, 'steps': 50577, 'loss/train': 1.519844651222229} -08/30/2021 22:21:48 - INFO - __main__ - Step 50579: {'lr': 0.00037845512702292097, 'samples': 9711168, 'steps': 50578, 'loss/train': 0.25411728024482727} -08/30/2021 22:21:48 - INFO - __main__ - Step 50580: {'lr': 0.00037845057435014384, 'samples': 9711360, 'steps': 50579, 'loss/train': 1.3524072170257568} -08/30/2021 22:21:48 - INFO - __main__ - Step 50581: {'lr': 0.000378446021619489, 'samples': 9711552, 'steps': 50580, 'loss/train': 0.03329068422317505} -08/30/2021 22:21:49 - INFO - __main__ - Step 50582: {'lr': 0.0003784414688309583, 'samples': 9711744, 'steps': 50581, 'loss/train': 0.5245922803878784} -08/30/2021 22:21:49 - INFO - __main__ - Step 50583: {'lr': 0.0003784369159845539, 'samples': 9711936, 'steps': 50582, 'loss/train': 1.2498857975006104} -08/30/2021 22:21:50 - INFO - __main__ - Step 50584: {'lr': 0.00037843236308027776, 'samples': 9712128, 'steps': 50583, 'loss/train': 1.6137168407440186} -08/30/2021 22:21:51 - INFO - __main__ - Step 50585: {'lr': 0.000378427810118132, 'samples': 9712320, 'steps': 50584, 'loss/train': 1.053935170173645} -08/30/2021 22:21:51 - INFO - __main__ - Step 50586: {'lr': 0.0003784232570981186, 'samples': 9712512, 'steps': 50585, 'loss/train': 1.5806196928024292} -08/30/2021 22:21:52 - INFO - __main__ - Step 50587: {'lr': 0.0003784187040202398, 'samples': 9712704, 'steps': 50586, 'loss/train': 1.338905692100525} -08/30/2021 22:21:52 - INFO - __main__ - Step 50588: {'lr': 0.0003784141508844974, 'samples': 9712896, 'steps': 50587, 'loss/train': 0.5765265822410583} -08/30/2021 22:21:54 - INFO - __main__ - Step 50589: {'lr': 0.00037840959769089354, 'samples': 9713088, 'steps': 50588, 'loss/train': 1.534320592880249} -08/30/2021 22:21:54 - INFO - __main__ - Step 50590: {'lr': 0.00037840504443943033, 'samples': 9713280, 'steps': 50589, 'loss/train': 0.05563338100910187} -08/30/2021 22:21:54 - INFO - __main__ - Step 50591: {'lr': 0.00037840049113010976, 'samples': 9713472, 'steps': 50590, 'loss/train': 0.9809242486953735} -08/30/2021 22:21:55 - INFO - __main__ - Step 50592: {'lr': 0.000378395937762934, 'samples': 9713664, 'steps': 50591, 'loss/train': 0.6632370948791504} -08/30/2021 22:21:55 - INFO - __main__ - Step 50593: {'lr': 0.000378391384337905, 'samples': 9713856, 'steps': 50592, 'loss/train': 0.3154948949813843} -08/30/2021 22:21:57 - INFO - __main__ - Step 50594: {'lr': 0.00037838683085502473, 'samples': 9714048, 'steps': 50593, 'loss/train': 1.2037947177886963} -08/30/2021 22:21:57 - INFO - __main__ - Step 50595: {'lr': 0.0003783822773142954, 'samples': 9714240, 'steps': 50594, 'loss/train': 1.5460710525512695} -08/30/2021 22:21:58 - INFO - __main__ - Step 50596: {'lr': 0.00037837772371571897, 'samples': 9714432, 'steps': 50595, 'loss/train': 1.322776198387146} -08/30/2021 22:21:58 - INFO - __main__ - Step 50597: {'lr': 0.0003783731700592975, 'samples': 9714624, 'steps': 50596, 'loss/train': 1.6035116910934448} -08/30/2021 22:21:58 - INFO - __main__ - Step 50598: {'lr': 0.0003783686163450332, 'samples': 9714816, 'steps': 50597, 'loss/train': 1.2744885683059692} -08/30/2021 22:21:59 - INFO - __main__ - Step 50599: {'lr': 0.0003783640625729278, 'samples': 9715008, 'steps': 50598, 'loss/train': 2.1898765563964844} -08/30/2021 22:22:00 - INFO - __main__ - Step 50600: {'lr': 0.00037835950874298365, 'samples': 9715200, 'steps': 50599, 'loss/train': 1.3047624826431274} -08/30/2021 22:22:01 - INFO - __main__ - Step 50601: {'lr': 0.0003783549548552027, 'samples': 9715392, 'steps': 50600, 'loss/train': 1.4861668348312378} -08/30/2021 22:22:01 - INFO - __main__ - Step 50602: {'lr': 0.00037835040090958684, 'samples': 9715584, 'steps': 50601, 'loss/train': 1.672282338142395} -08/30/2021 22:22:02 - INFO - __main__ - Step 50603: {'lr': 0.0003783458469061384, 'samples': 9715776, 'steps': 50602, 'loss/train': 0.045012570917606354} -08/30/2021 22:22:02 - INFO - __main__ - Step 50604: {'lr': 0.0003783412928448593, 'samples': 9715968, 'steps': 50603, 'loss/train': 0.03242423012852669} -08/30/2021 22:22:02 - INFO - __main__ - Step 50605: {'lr': 0.00037833673872575153, 'samples': 9716160, 'steps': 50604, 'loss/train': 0.6731354594230652} -08/30/2021 22:22:04 - INFO - __main__ - Step 50606: {'lr': 0.00037833218454881725, 'samples': 9716352, 'steps': 50605, 'loss/train': 1.4134920835494995} -08/30/2021 22:22:04 - INFO - __main__ - Step 50607: {'lr': 0.0003783276303140584, 'samples': 9716544, 'steps': 50606, 'loss/train': 1.3130464553833008} -08/30/2021 22:22:05 - INFO - __main__ - Step 50608: {'lr': 0.0003783230760214772, 'samples': 9716736, 'steps': 50607, 'loss/train': 1.403700828552246} -08/30/2021 22:22:05 - INFO - __main__ - Step 50609: {'lr': 0.00037831852167107563, 'samples': 9716928, 'steps': 50608, 'loss/train': 0.7292937636375427} -08/30/2021 22:22:05 - INFO - __main__ - Step 50610: {'lr': 0.0003783139672628556, 'samples': 9717120, 'steps': 50609, 'loss/train': 1.15536630153656} -08/30/2021 22:22:07 - INFO - __main__ - Step 50611: {'lr': 0.0003783094127968193, 'samples': 9717312, 'steps': 50610, 'loss/train': 1.1272286176681519} -08/30/2021 22:22:07 - INFO - __main__ - Step 50612: {'lr': 0.0003783048582729688, 'samples': 9717504, 'steps': 50611, 'loss/train': 1.3782473802566528} -08/30/2021 22:22:08 - INFO - __main__ - Step 50613: {'lr': 0.0003783003036913061, 'samples': 9717696, 'steps': 50612, 'loss/train': 1.7438559532165527} -08/30/2021 22:22:08 - INFO - __main__ - Step 50614: {'lr': 0.0003782957490518332, 'samples': 9717888, 'steps': 50613, 'loss/train': 1.1090965270996094} -08/30/2021 22:22:08 - INFO - __main__ - Step 50615: {'lr': 0.00037829119435455226, 'samples': 9718080, 'steps': 50614, 'loss/train': 1.247815489768982} -08/30/2021 22:22:10 - INFO - __main__ - Step 50616: {'lr': 0.00037828663959946527, 'samples': 9718272, 'steps': 50615, 'loss/train': 0.22780205309391022} -08/30/2021 22:22:11 - INFO - __main__ - Step 50617: {'lr': 0.0003782820847865743, 'samples': 9718464, 'steps': 50616, 'loss/train': 0.8544297218322754} -08/30/2021 22:22:11 - INFO - __main__ - Step 50618: {'lr': 0.0003782775299158815, 'samples': 9718656, 'steps': 50617, 'loss/train': 1.479225516319275} -08/30/2021 22:22:12 - INFO - __main__ - Step 50619: {'lr': 0.0003782729749873887, 'samples': 9718848, 'steps': 50618, 'loss/train': 1.4865379333496094} -08/30/2021 22:22:12 - INFO - __main__ - Step 50620: {'lr': 0.0003782684200010981, 'samples': 9719040, 'steps': 50619, 'loss/train': 1.1960105895996094} -08/30/2021 22:22:12 - INFO - __main__ - Step 50621: {'lr': 0.0003782638649570118, 'samples': 9719232, 'steps': 50620, 'loss/train': 1.5717151165008545} -08/30/2021 22:22:14 - INFO - __main__ - Step 50622: {'lr': 0.00037825930985513177, 'samples': 9719424, 'steps': 50621, 'loss/train': 1.8007010221481323} -08/30/2021 22:22:15 - INFO - __main__ - Step 50623: {'lr': 0.00037825475469546, 'samples': 9719616, 'steps': 50622, 'loss/train': 0.6238455176353455} -08/30/2021 22:22:15 - INFO - __main__ - Step 50624: {'lr': 0.00037825019947799863, 'samples': 9719808, 'steps': 50623, 'loss/train': 1.347244143486023} -08/30/2021 22:22:15 - INFO - __main__ - Step 50625: {'lr': 0.0003782456442027498, 'samples': 9720000, 'steps': 50624, 'loss/train': 0.048339203000068665} -08/30/2021 22:22:16 - INFO - __main__ - Step 50626: {'lr': 0.0003782410888697153, 'samples': 9720192, 'steps': 50625, 'loss/train': 0.06834381073713303} -08/30/2021 22:22:16 - INFO - __main__ - Step 50627: {'lr': 0.00037823653347889745, 'samples': 9720384, 'steps': 50626, 'loss/train': 1.3234820365905762} -08/30/2021 22:22:18 - INFO - __main__ - Step 50628: {'lr': 0.0003782319780302982, 'samples': 9720576, 'steps': 50627, 'loss/train': 0.47812315821647644} -08/30/2021 22:22:18 - INFO - __main__ - Step 50629: {'lr': 0.00037822742252391963, 'samples': 9720768, 'steps': 50628, 'loss/train': 1.8109053373336792} -08/30/2021 22:22:18 - INFO - __main__ - Step 50630: {'lr': 0.0003782228669597637, 'samples': 9720960, 'steps': 50629, 'loss/train': 1.818223476409912} -08/30/2021 22:22:19 - INFO - __main__ - Step 50631: {'lr': 0.00037821831133783246, 'samples': 9721152, 'steps': 50630, 'loss/train': 1.5177974700927734} -08/30/2021 22:22:19 - INFO - __main__ - Step 50632: {'lr': 0.00037821375565812816, 'samples': 9721344, 'steps': 50631, 'loss/train': 1.5178747177124023} -08/30/2021 22:22:21 - INFO - __main__ - Step 50633: {'lr': 0.00037820919992065263, 'samples': 9721536, 'steps': 50632, 'loss/train': 0.8809749484062195} -08/30/2021 22:22:21 - INFO - __main__ - Step 50634: {'lr': 0.00037820464412540805, 'samples': 9721728, 'steps': 50633, 'loss/train': 1.5660545825958252} -08/30/2021 22:22:22 - INFO - __main__ - Step 50635: {'lr': 0.0003782000882723965, 'samples': 9721920, 'steps': 50634, 'loss/train': 1.637805700302124} -08/30/2021 22:22:22 - INFO - __main__ - Step 50636: {'lr': 0.00037819553236161985, 'samples': 9722112, 'steps': 50635, 'loss/train': 1.397648572921753} -08/30/2021 22:22:22 - INFO - __main__ - Step 50637: {'lr': 0.0003781909763930803, 'samples': 9722304, 'steps': 50636, 'loss/train': 0.9804012775421143} -08/30/2021 22:22:24 - INFO - __main__ - Step 50638: {'lr': 0.00037818642036677993, 'samples': 9722496, 'steps': 50637, 'loss/train': 0.0505664125084877} -08/30/2021 22:22:24 - INFO - __main__ - Step 50639: {'lr': 0.00037818186428272064, 'samples': 9722688, 'steps': 50638, 'loss/train': 1.3688198328018188} -08/30/2021 22:22:25 - INFO - __main__ - Step 50640: {'lr': 0.00037817730814090466, 'samples': 9722880, 'steps': 50639, 'loss/train': 1.3044573068618774} -08/30/2021 22:22:25 - INFO - __main__ - Step 50641: {'lr': 0.000378172751941334, 'samples': 9723072, 'steps': 50640, 'loss/train': 1.3556833267211914} -08/30/2021 22:22:25 - INFO - __main__ - Step 50642: {'lr': 0.0003781681956840106, 'samples': 9723264, 'steps': 50641, 'loss/train': 1.100357174873352} -08/30/2021 22:22:27 - INFO - __main__ - Step 50643: {'lr': 0.0003781636393689366, 'samples': 9723456, 'steps': 50642, 'loss/train': 1.4393939971923828} -08/30/2021 22:22:27 - INFO - __main__ - Step 50644: {'lr': 0.0003781590829961141, 'samples': 9723648, 'steps': 50643, 'loss/train': 1.3772292137145996} -08/30/2021 22:22:28 - INFO - __main__ - Step 50645: {'lr': 0.000378154526565545, 'samples': 9723840, 'steps': 50644, 'loss/train': 0.7441801428794861} -08/30/2021 22:22:28 - INFO - __main__ - Step 50646: {'lr': 0.00037814997007723153, 'samples': 9724032, 'steps': 50645, 'loss/train': 1.5719969272613525} -08/30/2021 22:22:28 - INFO - __main__ - Step 50647: {'lr': 0.0003781454135311756, 'samples': 9724224, 'steps': 50646, 'loss/train': 1.1818315982818604} -08/30/2021 22:22:29 - INFO - __main__ - Step 50648: {'lr': 0.0003781408569273794, 'samples': 9724416, 'steps': 50647, 'loss/train': 1.627143144607544} -08/30/2021 22:22:30 - INFO - __main__ - Step 50649: {'lr': 0.0003781363002658448, 'samples': 9724608, 'steps': 50648, 'loss/train': 1.5164395570755005} -08/30/2021 22:22:31 - INFO - __main__ - Step 50650: {'lr': 0.000378131743546574, 'samples': 9724800, 'steps': 50649, 'loss/train': 1.37466561794281} -08/30/2021 22:22:31 - INFO - __main__ - Step 50651: {'lr': 0.000378127186769569, 'samples': 9724992, 'steps': 50650, 'loss/train': 1.1438621282577515} -08/30/2021 22:22:32 - INFO - __main__ - Step 50652: {'lr': 0.00037812262993483194, 'samples': 9725184, 'steps': 50651, 'loss/train': 0.6153126358985901} -08/30/2021 22:22:32 - INFO - __main__ - Step 50653: {'lr': 0.0003781180730423648, 'samples': 9725376, 'steps': 50652, 'loss/train': 1.7729638814926147} -08/30/2021 22:22:34 - INFO - __main__ - Step 50654: {'lr': 0.00037811351609216956, 'samples': 9725568, 'steps': 50653, 'loss/train': 0.06994570046663284} -08/30/2021 22:22:34 - INFO - __main__ - Step 50655: {'lr': 0.00037810895908424837, 'samples': 9725760, 'steps': 50654, 'loss/train': 1.0513792037963867} -08/30/2021 22:22:35 - INFO - __main__ - Step 50656: {'lr': 0.0003781044020186033, 'samples': 9725952, 'steps': 50655, 'loss/train': 1.371777057647705} -08/30/2021 22:22:35 - INFO - __main__ - Step 50657: {'lr': 0.0003780998448952363, 'samples': 9726144, 'steps': 50656, 'loss/train': 1.4858083724975586} -08/30/2021 22:22:35 - INFO - __main__ - Step 50658: {'lr': 0.0003780952877141495, 'samples': 9726336, 'steps': 50657, 'loss/train': 1.456172227859497} -08/30/2021 22:22:36 - INFO - __main__ - Step 50659: {'lr': 0.0003780907304753449, 'samples': 9726528, 'steps': 50658, 'loss/train': 2.0115907192230225} -08/30/2021 22:22:37 - INFO - __main__ - Step 50660: {'lr': 0.0003780861731788247, 'samples': 9726720, 'steps': 50659, 'loss/train': 0.04644060879945755} -08/30/2021 22:22:38 - INFO - __main__ - Step 50661: {'lr': 0.0003780816158245908, 'samples': 9726912, 'steps': 50660, 'loss/train': 1.6447889804840088} -08/30/2021 22:22:38 - INFO - __main__ - Step 50662: {'lr': 0.0003780770584126453, 'samples': 9727104, 'steps': 50661, 'loss/train': 0.19531315565109253} -08/30/2021 22:22:39 - INFO - __main__ - Step 50663: {'lr': 0.0003780725009429903, 'samples': 9727296, 'steps': 50662, 'loss/train': 1.3399301767349243} -08/30/2021 22:22:39 - INFO - __main__ - Step 50664: {'lr': 0.00037806794341562773, 'samples': 9727488, 'steps': 50663, 'loss/train': 1.8560758829116821} -08/30/2021 22:22:39 - INFO - __main__ - Step 50665: {'lr': 0.00037806338583055976, 'samples': 9727680, 'steps': 50664, 'loss/train': 1.35336172580719} -08/30/2021 22:22:41 - INFO - __main__ - Step 50666: {'lr': 0.0003780588281877884, 'samples': 9727872, 'steps': 50665, 'loss/train': 1.3639845848083496} -08/30/2021 22:22:41 - INFO - __main__ - Step 50667: {'lr': 0.00037805427048731566, 'samples': 9728064, 'steps': 50666, 'loss/train': 1.2685130834579468} -08/30/2021 22:22:42 - INFO - __main__ - Step 50668: {'lr': 0.0003780497127291437, 'samples': 9728256, 'steps': 50667, 'loss/train': 1.0669279098510742} -08/30/2021 22:22:42 - INFO - __main__ - Step 50669: {'lr': 0.0003780451549132745, 'samples': 9728448, 'steps': 50668, 'loss/train': 1.935593843460083} -08/30/2021 22:22:42 - INFO - __main__ - Step 50670: {'lr': 0.00037804059703971016, 'samples': 9728640, 'steps': 50669, 'loss/train': 1.0550918579101562} -08/30/2021 22:22:44 - INFO - __main__ - Step 50671: {'lr': 0.00037803603910845264, 'samples': 9728832, 'steps': 50670, 'loss/train': 1.9273122549057007} -08/30/2021 22:22:44 - INFO - __main__ - Step 50672: {'lr': 0.00037803148111950407, 'samples': 9729024, 'steps': 50671, 'loss/train': 1.7545077800750732} -08/30/2021 22:22:45 - INFO - __main__ - Step 50673: {'lr': 0.0003780269230728665, 'samples': 9729216, 'steps': 50672, 'loss/train': 0.3329651653766632} -08/30/2021 22:22:45 - INFO - __main__ - Step 50674: {'lr': 0.000378022364968542, 'samples': 9729408, 'steps': 50673, 'loss/train': 1.3416147232055664} -08/30/2021 22:22:45 - INFO - __main__ - Step 50675: {'lr': 0.00037801780680653263, 'samples': 9729600, 'steps': 50674, 'loss/train': 1.5747259855270386} -08/30/2021 22:22:48 - INFO - __main__ - Step 50676: {'lr': 0.0003780132485868403, 'samples': 9729792, 'steps': 50675, 'loss/train': 0.9510841369628906} -08/30/2021 22:22:48 - INFO - __main__ - Step 50677: {'lr': 0.0003780086903094673, 'samples': 9729984, 'steps': 50676, 'loss/train': 0.2769656777381897} -08/30/2021 22:22:49 - INFO - __main__ - Step 50678: {'lr': 0.0003780041319744154, 'samples': 9730176, 'steps': 50677, 'loss/train': 1.0700489282608032} -08/30/2021 22:22:49 - INFO - __main__ - Step 50679: {'lr': 0.00037799957358168693, 'samples': 9730368, 'steps': 50678, 'loss/train': 0.45007649064064026} -08/30/2021 22:22:49 - INFO - __main__ - Step 50680: {'lr': 0.0003779950151312838, 'samples': 9730560, 'steps': 50679, 'loss/train': 0.2423430234193802} -08/30/2021 22:22:50 - INFO - __main__ - Step 50681: {'lr': 0.0003779904566232081, 'samples': 9730752, 'steps': 50680, 'loss/train': 1.6182368993759155} -08/30/2021 22:22:51 - INFO - __main__ - Step 50682: {'lr': 0.0003779858980574619, 'samples': 9730944, 'steps': 50681, 'loss/train': 1.6783785820007324} -08/30/2021 22:22:52 - INFO - __main__ - Step 50683: {'lr': 0.0003779813394340472, 'samples': 9731136, 'steps': 50682, 'loss/train': 1.2892950773239136} -08/30/2021 22:22:52 - INFO - __main__ - Step 50684: {'lr': 0.0003779767807529661, 'samples': 9731328, 'steps': 50683, 'loss/train': 1.0813039541244507} -08/30/2021 22:22:52 - INFO - __main__ - Step 50685: {'lr': 0.0003779722220142206, 'samples': 9731520, 'steps': 50684, 'loss/train': 1.3954010009765625} -08/30/2021 22:22:53 - INFO - __main__ - Step 50686: {'lr': 0.00037796766321781286, 'samples': 9731712, 'steps': 50685, 'loss/train': 1.099147915840149} -08/30/2021 22:22:53 - INFO - __main__ - Step 50687: {'lr': 0.00037796310436374474, 'samples': 9731904, 'steps': 50686, 'loss/train': 1.5850473642349243} -08/30/2021 22:22:55 - INFO - __main__ - Step 50688: {'lr': 0.0003779585454520186, 'samples': 9732096, 'steps': 50687, 'loss/train': 1.374234914779663} -08/30/2021 22:22:55 - INFO - __main__ - Step 50689: {'lr': 0.0003779539864826362, 'samples': 9732288, 'steps': 50688, 'loss/train': 1.4728293418884277} -08/30/2021 22:22:56 - INFO - __main__ - Step 50690: {'lr': 0.0003779494274555997, 'samples': 9732480, 'steps': 50689, 'loss/train': 0.2392479032278061} -08/30/2021 22:22:56 - INFO - __main__ - Step 50691: {'lr': 0.0003779448683709111, 'samples': 9732672, 'steps': 50690, 'loss/train': 1.3580857515335083} -08/30/2021 22:22:56 - INFO - __main__ - Step 50692: {'lr': 0.0003779403092285727, 'samples': 9732864, 'steps': 50691, 'loss/train': 1.157630205154419} -08/30/2021 22:22:58 - INFO - __main__ - Step 50693: {'lr': 0.00037793575002858625, 'samples': 9733056, 'steps': 50692, 'loss/train': 0.6986561417579651} -08/30/2021 22:22:58 - INFO - __main__ - Step 50694: {'lr': 0.00037793119077095396, 'samples': 9733248, 'steps': 50693, 'loss/train': 1.0183249711990356} -08/30/2021 22:22:59 - INFO - __main__ - Step 50695: {'lr': 0.00037792663145567784, 'samples': 9733440, 'steps': 50694, 'loss/train': 0.871319055557251} -08/30/2021 22:22:59 - INFO - __main__ - Step 50696: {'lr': 0.00037792207208275995, 'samples': 9733632, 'steps': 50695, 'loss/train': 1.73435640335083} -08/30/2021 22:23:00 - INFO - __main__ - Step 50697: {'lr': 0.0003779175126522023, 'samples': 9733824, 'steps': 50696, 'loss/train': 1.746621012687683} -08/30/2021 22:23:01 - INFO - __main__ - Step 50698: {'lr': 0.0003779129531640071, 'samples': 9734016, 'steps': 50697, 'loss/train': 1.3059147596359253} -08/30/2021 22:23:01 - INFO - __main__ - Step 50699: {'lr': 0.0003779083936181762, 'samples': 9734208, 'steps': 50698, 'loss/train': 1.700587511062622} -08/30/2021 22:23:02 - INFO - __main__ - Step 50700: {'lr': 0.0003779038340147118, 'samples': 9734400, 'steps': 50699, 'loss/train': 1.0194019079208374} -08/30/2021 22:23:02 - INFO - __main__ - Step 50701: {'lr': 0.0003778992743536159, 'samples': 9734592, 'steps': 50700, 'loss/train': 1.5755808353424072} -08/30/2021 22:23:02 - INFO - __main__ - Step 50702: {'lr': 0.0003778947146348906, 'samples': 9734784, 'steps': 50701, 'loss/train': 1.6223037242889404} -08/30/2021 22:23:04 - INFO - __main__ - Step 50703: {'lr': 0.00037789015485853786, 'samples': 9734976, 'steps': 50702, 'loss/train': 1.345376968383789} -08/30/2021 22:23:04 - INFO - __main__ - Step 50704: {'lr': 0.0003778855950245598, 'samples': 9735168, 'steps': 50703, 'loss/train': 1.318848729133606} -08/30/2021 22:23:05 - INFO - __main__ - Step 50705: {'lr': 0.00037788103513295844, 'samples': 9735360, 'steps': 50704, 'loss/train': 1.4883267879486084} -08/30/2021 22:23:05 - INFO - __main__ - Step 50706: {'lr': 0.00037787647518373586, 'samples': 9735552, 'steps': 50705, 'loss/train': 0.7998714447021484} -08/30/2021 22:23:05 - INFO - __main__ - Step 50707: {'lr': 0.0003778719151768941, 'samples': 9735744, 'steps': 50706, 'loss/train': 1.5309160947799683} -08/30/2021 22:23:07 - INFO - __main__ - Step 50708: {'lr': 0.0003778673551124353, 'samples': 9735936, 'steps': 50707, 'loss/train': 1.6601982116699219} -08/30/2021 22:23:07 - INFO - __main__ - Step 50709: {'lr': 0.0003778627949903615, 'samples': 9736128, 'steps': 50708, 'loss/train': 1.2267168760299683} -08/30/2021 22:23:08 - INFO - __main__ - Step 50710: {'lr': 0.00037785823481067455, 'samples': 9736320, 'steps': 50709, 'loss/train': 1.2138028144836426} -08/30/2021 22:23:08 - INFO - __main__ - Step 50711: {'lr': 0.0003778536745733767, 'samples': 9736512, 'steps': 50710, 'loss/train': 1.454527497291565} -08/30/2021 22:23:08 - INFO - __main__ - Step 50712: {'lr': 0.00037784911427846997, 'samples': 9736704, 'steps': 50711, 'loss/train': 1.4463690519332886} -08/30/2021 22:23:10 - INFO - __main__ - Step 50713: {'lr': 0.0003778445539259564, 'samples': 9736896, 'steps': 50712, 'loss/train': 1.2544445991516113} -08/30/2021 22:23:10 - INFO - __main__ - Step 50714: {'lr': 0.000377839993515838, 'samples': 9737088, 'steps': 50713, 'loss/train': 1.6325585842132568} -08/30/2021 22:23:11 - INFO - __main__ - Step 50715: {'lr': 0.000377835433048117, 'samples': 9737280, 'steps': 50714, 'loss/train': 1.6144853830337524} -08/30/2021 22:23:11 - INFO - __main__ - Step 50716: {'lr': 0.00037783087252279523, 'samples': 9737472, 'steps': 50715, 'loss/train': 1.4328558444976807} -08/30/2021 22:23:11 - INFO - __main__ - Step 50717: {'lr': 0.0003778263119398748, 'samples': 9737664, 'steps': 50716, 'loss/train': 4.1941819190979} -08/30/2021 22:23:13 - INFO - __main__ - Step 50718: {'lr': 0.00037782175129935793, 'samples': 9737856, 'steps': 50717, 'loss/train': 1.4083696603775024} -08/30/2021 22:23:13 - INFO - __main__ - Step 50719: {'lr': 0.0003778171906012464, 'samples': 9738048, 'steps': 50718, 'loss/train': 1.7509175539016724} -08/30/2021 22:23:14 - INFO - __main__ - Step 50720: {'lr': 0.0003778126298455425, 'samples': 9738240, 'steps': 50719, 'loss/train': 1.3796314001083374} -08/30/2021 22:23:14 - INFO - __main__ - Step 50721: {'lr': 0.0003778080690322483, 'samples': 9738432, 'steps': 50720, 'loss/train': 1.4508436918258667} -08/30/2021 22:23:14 - INFO - __main__ - Step 50722: {'lr': 0.0003778035081613656, 'samples': 9738624, 'steps': 50721, 'loss/train': 1.225346565246582} -08/30/2021 22:23:15 - INFO - __main__ - Step 50723: {'lr': 0.00037779894723289666, 'samples': 9738816, 'steps': 50722, 'loss/train': 1.5549176931381226} -08/30/2021 22:23:16 - INFO - __main__ - Step 50724: {'lr': 0.00037779438624684346, 'samples': 9739008, 'steps': 50723, 'loss/train': 1.0372271537780762} -08/30/2021 22:23:17 - INFO - __main__ - Step 50725: {'lr': 0.00037778982520320813, 'samples': 9739200, 'steps': 50724, 'loss/train': 1.463087797164917} -08/30/2021 22:23:17 - INFO - __main__ - Step 50726: {'lr': 0.00037778526410199266, 'samples': 9739392, 'steps': 50725, 'loss/train': 1.1884992122650146} -08/30/2021 22:23:17 - INFO - __main__ - Step 50727: {'lr': 0.0003777807029431992, 'samples': 9739584, 'steps': 50726, 'loss/train': 1.1037424802780151} -08/30/2021 22:23:18 - INFO - __main__ - Step 50728: {'lr': 0.0003777761417268296, 'samples': 9739776, 'steps': 50727, 'loss/train': 1.0655313730239868} -08/30/2021 22:23:20 - INFO - __main__ - Step 50729: {'lr': 0.00037777158045288606, 'samples': 9739968, 'steps': 50728, 'loss/train': 1.3737667798995972} -08/30/2021 22:23:20 - INFO - __main__ - Step 50730: {'lr': 0.00037776701912137066, 'samples': 9740160, 'steps': 50729, 'loss/train': 1.2113629579544067} -08/30/2021 22:23:20 - INFO - __main__ - Step 50731: {'lr': 0.00037776245773228547, 'samples': 9740352, 'steps': 50730, 'loss/train': 0.4998539388179779} -08/30/2021 22:23:21 - INFO - __main__ - Step 50732: {'lr': 0.0003777578962856324, 'samples': 9740544, 'steps': 50731, 'loss/train': 0.7186129093170166} -08/30/2021 22:23:21 - INFO - __main__ - Step 50733: {'lr': 0.0003777533347814136, 'samples': 9740736, 'steps': 50732, 'loss/train': 1.3341388702392578} -08/30/2021 22:23:23 - INFO - __main__ - Step 50734: {'lr': 0.0003777487732196312, 'samples': 9740928, 'steps': 50733, 'loss/train': 1.3012912273406982} -08/30/2021 22:23:24 - INFO - __main__ - Step 50735: {'lr': 0.00037774421160028705, 'samples': 9741120, 'steps': 50734, 'loss/train': 1.3807263374328613} -08/30/2021 22:23:24 - INFO - __main__ - Step 50736: {'lr': 0.0003777396499233834, 'samples': 9741312, 'steps': 50735, 'loss/train': 1.053460717201233} -08/30/2021 22:23:24 - INFO - __main__ - Step 50737: {'lr': 0.00037773508818892223, 'samples': 9741504, 'steps': 50736, 'loss/train': 0.1664726883172989} -08/30/2021 22:23:25 - INFO - __main__ - Step 50738: {'lr': 0.0003777305263969056, 'samples': 9741696, 'steps': 50737, 'loss/train': 0.3396371304988861} -08/30/2021 22:23:25 - INFO - __main__ - Step 50739: {'lr': 0.00037772596454733554, 'samples': 9741888, 'steps': 50738, 'loss/train': 0.07335926592350006} -08/30/2021 22:23:26 - INFO - __main__ - Step 50740: {'lr': 0.00037772140264021416, 'samples': 9742080, 'steps': 50739, 'loss/train': 1.772095799446106} -08/30/2021 22:23:27 - INFO - __main__ - Step 50741: {'lr': 0.00037771684067554345, 'samples': 9742272, 'steps': 50740, 'loss/train': 2.0000312328338623} -08/30/2021 22:23:27 - INFO - __main__ - Step 50742: {'lr': 0.0003777122786533255, 'samples': 9742464, 'steps': 50741, 'loss/train': 0.5390012860298157} -08/30/2021 22:23:28 - INFO - __main__ - Step 50743: {'lr': 0.0003777077165735625, 'samples': 9742656, 'steps': 50742, 'loss/train': 1.1910369396209717} -08/30/2021 22:23:28 - INFO - __main__ - Step 50744: {'lr': 0.0003777031544362562, 'samples': 9742848, 'steps': 50743, 'loss/train': 1.55131995677948} -08/30/2021 22:23:29 - INFO - __main__ - Step 50745: {'lr': 0.0003776985922414089, 'samples': 9743040, 'steps': 50744, 'loss/train': 1.2937159538269043} -08/30/2021 22:23:30 - INFO - __main__ - Step 50746: {'lr': 0.0003776940299890226, 'samples': 9743232, 'steps': 50745, 'loss/train': 1.1952322721481323} -08/30/2021 22:23:30 - INFO - __main__ - Step 50747: {'lr': 0.0003776894676790993, 'samples': 9743424, 'steps': 50746, 'loss/train': 0.9407305717468262} -08/30/2021 22:23:31 - INFO - __main__ - Step 50748: {'lr': 0.0003776849053116411, 'samples': 9743616, 'steps': 50747, 'loss/train': 1.1303645372390747} -08/30/2021 22:23:31 - INFO - __main__ - Step 50749: {'lr': 0.00037768034288665015, 'samples': 9743808, 'steps': 50748, 'loss/train': 0.8534497618675232} -08/30/2021 22:23:33 - INFO - __main__ - Step 50750: {'lr': 0.0003776757804041283, 'samples': 9744000, 'steps': 50749, 'loss/train': 0.7190511226654053} -08/30/2021 22:23:33 - INFO - __main__ - Step 50751: {'lr': 0.00037767121786407774, 'samples': 9744192, 'steps': 50750, 'loss/train': 1.504826545715332} -08/30/2021 22:23:33 - INFO - __main__ - Step 50752: {'lr': 0.00037766665526650054, 'samples': 9744384, 'steps': 50751, 'loss/train': 0.06696536391973495} -08/30/2021 22:23:34 - INFO - __main__ - Step 50753: {'lr': 0.0003776620926113986, 'samples': 9744576, 'steps': 50752, 'loss/train': 1.5380003452301025} -08/30/2021 22:23:34 - INFO - __main__ - Step 50754: {'lr': 0.0003776575298987742, 'samples': 9744768, 'steps': 50753, 'loss/train': 1.5041019916534424} -08/30/2021 22:23:34 - INFO - __main__ - Step 50755: {'lr': 0.00037765296712862927, 'samples': 9744960, 'steps': 50754, 'loss/train': 0.3582809269428253} -08/30/2021 22:23:36 - INFO - __main__ - Step 50756: {'lr': 0.00037764840430096593, 'samples': 9745152, 'steps': 50755, 'loss/train': 1.0493816137313843} -08/30/2021 22:23:37 - INFO - __main__ - Step 50757: {'lr': 0.0003776438414157861, 'samples': 9745344, 'steps': 50756, 'loss/train': 1.361534833908081} -08/30/2021 22:23:37 - INFO - __main__ - Step 50758: {'lr': 0.00037763927847309195, 'samples': 9745536, 'steps': 50757, 'loss/train': 0.1652563065290451} -08/30/2021 22:23:38 - INFO - __main__ - Step 50759: {'lr': 0.00037763471547288554, 'samples': 9745728, 'steps': 50758, 'loss/train': 0.8140980005264282} -08/30/2021 22:23:38 - INFO - __main__ - Step 50760: {'lr': 0.00037763015241516887, 'samples': 9745920, 'steps': 50759, 'loss/train': 0.7804386615753174} -08/30/2021 22:23:40 - INFO - __main__ - Step 50761: {'lr': 0.00037762558929994394, 'samples': 9746112, 'steps': 50760, 'loss/train': 0.8359727263450623} -08/30/2021 22:23:40 - INFO - __main__ - Step 50762: {'lr': 0.00037762102612721305, 'samples': 9746304, 'steps': 50761, 'loss/train': 0.09572537243366241} -08/30/2021 22:23:41 - INFO - __main__ - Step 50763: {'lr': 0.00037761646289697796, 'samples': 9746496, 'steps': 50762, 'loss/train': 0.6907109618186951} -08/30/2021 22:23:41 - INFO - __main__ - Step 50764: {'lr': 0.0003776118996092409, 'samples': 9746688, 'steps': 50763, 'loss/train': 0.20398925244808197} -08/30/2021 22:23:42 - INFO - __main__ - Step 50765: {'lr': 0.00037760733626400396, 'samples': 9746880, 'steps': 50764, 'loss/train': 1.4890995025634766} -08/30/2021 22:23:42 - INFO - __main__ - Step 50766: {'lr': 0.00037760277286126906, 'samples': 9747072, 'steps': 50765, 'loss/train': 1.0068615674972534} -08/30/2021 22:23:43 - INFO - __main__ - Step 50767: {'lr': 0.00037759820940103827, 'samples': 9747264, 'steps': 50766, 'loss/train': 1.196533203125} -08/30/2021 22:23:44 - INFO - __main__ - Step 50768: {'lr': 0.0003775936458833138, 'samples': 9747456, 'steps': 50767, 'loss/train': 1.5830824375152588} -08/30/2021 22:23:44 - INFO - __main__ - Step 50769: {'lr': 0.00037758908230809757, 'samples': 9747648, 'steps': 50768, 'loss/train': 1.7705957889556885} -08/30/2021 22:23:44 - INFO - __main__ - Step 50770: {'lr': 0.0003775845186753917, 'samples': 9747840, 'steps': 50769, 'loss/train': 1.1866025924682617} -08/30/2021 22:23:45 - INFO - __main__ - Step 50771: {'lr': 0.00037757995498519814, 'samples': 9748032, 'steps': 50770, 'loss/train': 2.459285020828247} -08/30/2021 22:23:46 - INFO - __main__ - Step 50772: {'lr': 0.00037757539123751906, 'samples': 9748224, 'steps': 50771, 'loss/train': 1.2626683712005615} -08/30/2021 22:23:47 - INFO - __main__ - Step 50773: {'lr': 0.00037757082743235644, 'samples': 9748416, 'steps': 50772, 'loss/train': 2.0133116245269775} -08/30/2021 22:23:47 - INFO - __main__ - Step 50774: {'lr': 0.00037756626356971236, 'samples': 9748608, 'steps': 50773, 'loss/train': 1.4486150741577148} -08/30/2021 22:23:47 - INFO - __main__ - Step 50775: {'lr': 0.00037756169964958897, 'samples': 9748800, 'steps': 50774, 'loss/train': 1.3006083965301514} -08/30/2021 22:23:48 - INFO - __main__ - Step 50776: {'lr': 0.00037755713567198823, 'samples': 9748992, 'steps': 50775, 'loss/train': 1.3877253532409668} -08/30/2021 22:23:48 - INFO - __main__ - Step 50777: {'lr': 0.00037755257163691214, 'samples': 9749184, 'steps': 50776, 'loss/train': 1.1668713092803955} -08/30/2021 22:23:50 - INFO - __main__ - Step 50778: {'lr': 0.00037754800754436293, 'samples': 9749376, 'steps': 50777, 'loss/train': 1.3054708242416382} -08/30/2021 22:23:50 - INFO - __main__ - Step 50779: {'lr': 0.0003775434433943425, 'samples': 9749568, 'steps': 50778, 'loss/train': 0.7419930696487427} -08/30/2021 22:23:51 - INFO - __main__ - Step 50780: {'lr': 0.00037753887918685295, 'samples': 9749760, 'steps': 50779, 'loss/train': 1.4362772703170776} -08/30/2021 22:23:51 - INFO - __main__ - Step 50781: {'lr': 0.0003775343149218964, 'samples': 9749952, 'steps': 50780, 'loss/train': 1.3387871980667114} -08/30/2021 22:23:51 - INFO - __main__ - Step 50782: {'lr': 0.0003775297505994748, 'samples': 9750144, 'steps': 50781, 'loss/train': 0.7080039381980896} -08/30/2021 22:23:53 - INFO - __main__ - Step 50783: {'lr': 0.0003775251862195903, 'samples': 9750336, 'steps': 50782, 'loss/train': 0.0829143077135086} -08/30/2021 22:23:53 - INFO - __main__ - Step 50784: {'lr': 0.0003775206217822449, 'samples': 9750528, 'steps': 50783, 'loss/train': 1.8504304885864258} -08/30/2021 22:23:54 - INFO - __main__ - Step 50785: {'lr': 0.00037751605728744063, 'samples': 9750720, 'steps': 50784, 'loss/train': 0.8786010146141052} -08/30/2021 22:23:54 - INFO - __main__ - Step 50786: {'lr': 0.0003775114927351797, 'samples': 9750912, 'steps': 50785, 'loss/train': 2.1746597290039062} -08/30/2021 22:23:54 - INFO - __main__ - Step 50787: {'lr': 0.00037750692812546396, 'samples': 9751104, 'steps': 50786, 'loss/train': 1.4306563138961792} -08/30/2021 22:23:56 - INFO - __main__ - Step 50788: {'lr': 0.00037750236345829557, 'samples': 9751296, 'steps': 50787, 'loss/train': 1.1955486536026} -08/30/2021 22:23:57 - INFO - __main__ - Step 50789: {'lr': 0.0003774977987336767, 'samples': 9751488, 'steps': 50788, 'loss/train': 1.3215488195419312} -08/30/2021 22:23:57 - INFO - __main__ - Step 50790: {'lr': 0.0003774932339516092, 'samples': 9751680, 'steps': 50789, 'loss/train': 1.497776746749878} -08/30/2021 22:23:58 - INFO - __main__ - Step 50791: {'lr': 0.00037748866911209525, 'samples': 9751872, 'steps': 50790, 'loss/train': 0.5976358652114868} -08/30/2021 22:23:58 - INFO - __main__ - Step 50792: {'lr': 0.00037748410421513677, 'samples': 9752064, 'steps': 50791, 'loss/train': 1.2239258289337158} -08/30/2021 22:24:00 - INFO - __main__ - Step 50793: {'lr': 0.000377479539260736, 'samples': 9752256, 'steps': 50792, 'loss/train': 0.9326513409614563} -08/30/2021 22:24:00 - INFO - __main__ - Step 50794: {'lr': 0.0003774749742488949, 'samples': 9752448, 'steps': 50793, 'loss/train': 1.2791025638580322} -08/30/2021 22:24:00 - INFO - __main__ - Step 50795: {'lr': 0.0003774704091796156, 'samples': 9752640, 'steps': 50794, 'loss/train': 1.532116413116455} -08/30/2021 22:24:01 - INFO - __main__ - Step 50796: {'lr': 0.00037746584405290006, 'samples': 9752832, 'steps': 50795, 'loss/train': 1.0717099905014038} -08/30/2021 22:24:01 - INFO - __main__ - Step 50797: {'lr': 0.00037746127886875035, 'samples': 9753024, 'steps': 50796, 'loss/train': 0.7889087796211243} -08/30/2021 22:24:03 - INFO - __main__ - Step 50798: {'lr': 0.0003774567136271686, 'samples': 9753216, 'steps': 50797, 'loss/train': 1.5086945295333862} -08/30/2021 22:24:03 - INFO - __main__ - Step 50799: {'lr': 0.0003774521483281568, 'samples': 9753408, 'steps': 50798, 'loss/train': 0.9860463738441467} -08/30/2021 22:24:03 - INFO - __main__ - Step 50800: {'lr': 0.00037744758297171706, 'samples': 9753600, 'steps': 50799, 'loss/train': 1.648983359336853} -08/30/2021 22:24:04 - INFO - __main__ - Step 50801: {'lr': 0.00037744301755785137, 'samples': 9753792, 'steps': 50800, 'loss/train': 1.3219642639160156} -08/30/2021 22:24:04 - INFO - __main__ - Step 50802: {'lr': 0.0003774384520865618, 'samples': 9753984, 'steps': 50801, 'loss/train': 2.6102852821350098} -08/30/2021 22:24:06 - INFO - __main__ - Step 50803: {'lr': 0.0003774338865578505, 'samples': 9754176, 'steps': 50802, 'loss/train': 1.436866283416748} -08/30/2021 22:24:06 - INFO - __main__ - Step 50804: {'lr': 0.00037742932097171945, 'samples': 9754368, 'steps': 50803, 'loss/train': 0.9029049277305603} -08/30/2021 22:24:07 - INFO - __main__ - Step 50805: {'lr': 0.0003774247553281707, 'samples': 9754560, 'steps': 50804, 'loss/train': 0.15741406381130219} -08/30/2021 22:24:07 - INFO - __main__ - Step 50806: {'lr': 0.00037742018962720625, 'samples': 9754752, 'steps': 50805, 'loss/train': 1.3621734380722046} -08/30/2021 22:24:07 - INFO - __main__ - Step 50807: {'lr': 0.0003774156238688282, 'samples': 9754944, 'steps': 50806, 'loss/train': 1.3569810390472412} -08/30/2021 22:24:09 - INFO - __main__ - Step 50808: {'lr': 0.00037741105805303874, 'samples': 9755136, 'steps': 50807, 'loss/train': 0.6315385103225708} -08/30/2021 22:24:09 - INFO - __main__ - Step 50809: {'lr': 0.0003774064921798399, 'samples': 9755328, 'steps': 50808, 'loss/train': 1.1026027202606201} -08/30/2021 22:24:10 - INFO - __main__ - Step 50810: {'lr': 0.00037740192624923354, 'samples': 9755520, 'steps': 50809, 'loss/train': 1.164373517036438} -08/30/2021 22:24:10 - INFO - __main__ - Step 50811: {'lr': 0.00037739736026122186, 'samples': 9755712, 'steps': 50810, 'loss/train': 1.2390820980072021} -08/30/2021 22:24:10 - INFO - __main__ - Step 50812: {'lr': 0.00037739279421580683, 'samples': 9755904, 'steps': 50811, 'loss/train': 1.2341911792755127} -08/30/2021 22:24:11 - INFO - __main__ - Step 50813: {'lr': 0.00037738822811299067, 'samples': 9756096, 'steps': 50812, 'loss/train': 1.5592031478881836} -08/30/2021 22:24:13 - INFO - __main__ - Step 50814: {'lr': 0.00037738366195277527, 'samples': 9756288, 'steps': 50813, 'loss/train': 0.9190251231193542} -08/30/2021 22:24:13 - INFO - __main__ - Step 50815: {'lr': 0.0003773790957351628, 'samples': 9756480, 'steps': 50814, 'loss/train': 1.2230150699615479} -08/30/2021 22:24:14 - INFO - __main__ - Step 50816: {'lr': 0.00037737452946015533, 'samples': 9756672, 'steps': 50815, 'loss/train': 1.4425054788589478} -08/30/2021 22:24:14 - INFO - __main__ - Step 50817: {'lr': 0.0003773699631277548, 'samples': 9756864, 'steps': 50816, 'loss/train': 1.3997374773025513} -08/30/2021 22:24:14 - INFO - __main__ - Step 50818: {'lr': 0.00037736539673796334, 'samples': 9757056, 'steps': 50817, 'loss/train': 1.0377663373947144} -08/30/2021 22:24:15 - INFO - __main__ - Step 50819: {'lr': 0.00037736083029078294, 'samples': 9757248, 'steps': 50818, 'loss/train': 0.18664397299289703} -08/30/2021 22:24:16 - INFO - __main__ - Step 50820: {'lr': 0.00037735626378621577, 'samples': 9757440, 'steps': 50819, 'loss/train': 0.09894146770238876} -08/30/2021 22:24:17 - INFO - __main__ - Step 50821: {'lr': 0.00037735169722426384, 'samples': 9757632, 'steps': 50820, 'loss/train': 1.3256279230117798} -08/30/2021 22:24:17 - INFO - __main__ - Step 50822: {'lr': 0.0003773471306049292, 'samples': 9757824, 'steps': 50821, 'loss/train': 0.5024879574775696} -08/30/2021 22:24:17 - INFO - __main__ - Step 50823: {'lr': 0.00037734256392821393, 'samples': 9758016, 'steps': 50822, 'loss/train': 1.3245830535888672} -08/30/2021 22:24:18 - INFO - __main__ - Step 50824: {'lr': 0.00037733799719411997, 'samples': 9758208, 'steps': 50823, 'loss/train': 1.5943431854248047} -08/30/2021 22:24:19 - INFO - __main__ - Step 50825: {'lr': 0.00037733343040264954, 'samples': 9758400, 'steps': 50824, 'loss/train': 1.8687024116516113} -08/30/2021 22:24:19 - INFO - __main__ - Step 50826: {'lr': 0.00037732886355380465, 'samples': 9758592, 'steps': 50825, 'loss/train': 1.554660439491272} -08/30/2021 22:24:20 - INFO - __main__ - Step 50827: {'lr': 0.00037732429664758725, 'samples': 9758784, 'steps': 50826, 'loss/train': 1.1154029369354248} -08/30/2021 22:24:20 - INFO - __main__ - Step 50828: {'lr': 0.0003773197296839996, 'samples': 9758976, 'steps': 50827, 'loss/train': 0.7243592739105225} -08/30/2021 22:24:21 - INFO - __main__ - Step 50829: {'lr': 0.00037731516266304355, 'samples': 9759168, 'steps': 50828, 'loss/train': 1.5961356163024902} -08/30/2021 22:24:22 - INFO - __main__ - Step 50830: {'lr': 0.00037731059558472136, 'samples': 9759360, 'steps': 50829, 'loss/train': 1.117758870124817} -08/30/2021 22:24:22 - INFO - __main__ - Step 50831: {'lr': 0.00037730602844903495, 'samples': 9759552, 'steps': 50830, 'loss/train': 1.626081943511963} -08/30/2021 22:24:23 - INFO - __main__ - Step 50832: {'lr': 0.00037730146125598634, 'samples': 9759744, 'steps': 50831, 'loss/train': 1.2703133821487427} -08/30/2021 22:24:23 - INFO - __main__ - Step 50833: {'lr': 0.0003772968940055777, 'samples': 9759936, 'steps': 50832, 'loss/train': 1.4722568988800049} -08/30/2021 22:24:24 - INFO - __main__ - Step 50834: {'lr': 0.000377292326697811, 'samples': 9760128, 'steps': 50833, 'loss/train': 2.081751585006714} -08/30/2021 22:24:25 - INFO - __main__ - Step 50835: {'lr': 0.00037728775933268844, 'samples': 9760320, 'steps': 50834, 'loss/train': 1.4873360395431519} -08/30/2021 22:24:26 - INFO - __main__ - Step 50836: {'lr': 0.0003772831919102119, 'samples': 9760512, 'steps': 50835, 'loss/train': 1.6102399826049805} -08/30/2021 22:24:26 - INFO - __main__ - Step 50837: {'lr': 0.00037727862443038353, 'samples': 9760704, 'steps': 50836, 'loss/train': 0.8270599842071533} -08/30/2021 22:24:26 - INFO - __main__ - Step 50838: {'lr': 0.00037727405689320535, 'samples': 9760896, 'steps': 50837, 'loss/train': 1.7081242799758911} -08/30/2021 22:24:27 - INFO - __main__ - Step 50839: {'lr': 0.00037726948929867955, 'samples': 9761088, 'steps': 50838, 'loss/train': 1.9270517826080322} -08/30/2021 22:24:29 - INFO - __main__ - Step 50840: {'lr': 0.00037726492164680796, 'samples': 9761280, 'steps': 50839, 'loss/train': 1.621097207069397} -08/30/2021 22:24:30 - INFO - __main__ - Step 50841: {'lr': 0.00037726035393759286, 'samples': 9761472, 'steps': 50840, 'loss/train': 0.26181456446647644} -08/30/2021 22:24:30 - INFO - __main__ - Step 50842: {'lr': 0.00037725578617103605, 'samples': 9761664, 'steps': 50841, 'loss/train': 0.050110358744859695} -08/30/2021 22:24:30 - INFO - __main__ - Step 50843: {'lr': 0.00037725121834713995, 'samples': 9761856, 'steps': 50842, 'loss/train': 1.1070399284362793} -08/30/2021 22:24:31 - INFO - __main__ - Step 50844: {'lr': 0.0003772466504659063, 'samples': 9762048, 'steps': 50843, 'loss/train': 2.2391281127929688} -08/30/2021 22:24:31 - INFO - __main__ - Step 50845: {'lr': 0.00037724208252733725, 'samples': 9762240, 'steps': 50844, 'loss/train': 1.3113831281661987} -08/30/2021 22:24:32 - INFO - __main__ - Step 50846: {'lr': 0.000377237514531435, 'samples': 9762432, 'steps': 50845, 'loss/train': 1.7394315004348755} -08/30/2021 22:24:33 - INFO - __main__ - Step 50847: {'lr': 0.0003772329464782014, 'samples': 9762624, 'steps': 50846, 'loss/train': 0.8904613852500916} -08/30/2021 22:24:33 - INFO - __main__ - Step 50848: {'lr': 0.00037722837836763856, 'samples': 9762816, 'steps': 50847, 'loss/train': 1.858169674873352} -08/30/2021 22:24:34 - INFO - __main__ - Step 50849: {'lr': 0.0003772238101997486, 'samples': 9763008, 'steps': 50848, 'loss/train': 1.2896208763122559} -08/30/2021 22:24:34 - INFO - __main__ - Step 50850: {'lr': 0.0003772192419745336, 'samples': 9763200, 'steps': 50849, 'loss/train': 1.2179913520812988} -08/30/2021 22:24:35 - INFO - __main__ - Step 50851: {'lr': 0.0003772146736919956, 'samples': 9763392, 'steps': 50850, 'loss/train': 1.60283625125885} -08/30/2021 22:24:36 - INFO - __main__ - Step 50852: {'lr': 0.0003772101053521366, 'samples': 9763584, 'steps': 50851, 'loss/train': 1.0214512348175049} -08/30/2021 22:24:36 - INFO - __main__ - Step 50853: {'lr': 0.0003772055369549586, 'samples': 9763776, 'steps': 50852, 'loss/train': 1.3520445823669434} -08/30/2021 22:24:37 - INFO - __main__ - Step 50854: {'lr': 0.0003772009685004638, 'samples': 9763968, 'steps': 50853, 'loss/train': 1.1115528345108032} -08/30/2021 22:24:37 - INFO - __main__ - Step 50855: {'lr': 0.0003771963999886543, 'samples': 9764160, 'steps': 50854, 'loss/train': 1.5564624071121216} -08/30/2021 22:24:38 - INFO - __main__ - Step 50856: {'lr': 0.000377191831419532, 'samples': 9764352, 'steps': 50855, 'loss/train': 1.6926746368408203} -08/30/2021 22:24:39 - INFO - __main__ - Step 50857: {'lr': 0.000377187262793099, 'samples': 9764544, 'steps': 50856, 'loss/train': 1.6538127660751343} -08/30/2021 22:24:39 - INFO - __main__ - Step 50858: {'lr': 0.0003771826941093574, 'samples': 9764736, 'steps': 50857, 'loss/train': 1.132995843887329} -08/30/2021 22:24:40 - INFO - __main__ - Step 50859: {'lr': 0.0003771781253683092, 'samples': 9764928, 'steps': 50858, 'loss/train': 1.0015689134597778} -08/30/2021 22:24:40 - INFO - __main__ - Step 50860: {'lr': 0.00037717355656995653, 'samples': 9765120, 'steps': 50859, 'loss/train': 1.5820631980895996} -08/30/2021 22:24:42 - INFO - __main__ - Step 50861: {'lr': 0.0003771689877143015, 'samples': 9765312, 'steps': 50860, 'loss/train': 1.3109848499298096} -08/30/2021 22:24:42 - INFO - __main__ - Step 50862: {'lr': 0.000377164418801346, 'samples': 9765504, 'steps': 50861, 'loss/train': 1.454015851020813} -08/30/2021 22:24:42 - INFO - __main__ - Step 50863: {'lr': 0.0003771598498310922, 'samples': 9765696, 'steps': 50862, 'loss/train': 0.051448971033096313} -08/30/2021 22:24:43 - INFO - __main__ - Step 50864: {'lr': 0.0003771552808035421, 'samples': 9765888, 'steps': 50863, 'loss/train': 1.291578769683838} -08/30/2021 22:24:43 - INFO - __main__ - Step 50865: {'lr': 0.0003771507117186978, 'samples': 9766080, 'steps': 50864, 'loss/train': 1.318737506866455} -08/30/2021 22:24:43 - INFO - __main__ - Step 50866: {'lr': 0.0003771461425765614, 'samples': 9766272, 'steps': 50865, 'loss/train': 1.200408697128296} -08/30/2021 22:24:45 - INFO - __main__ - Step 50867: {'lr': 0.00037714157337713483, 'samples': 9766464, 'steps': 50866, 'loss/train': 0.03980109468102455} -08/30/2021 22:24:45 - INFO - __main__ - Step 50868: {'lr': 0.0003771370041204203, 'samples': 9766656, 'steps': 50867, 'loss/train': 1.5331251621246338} -08/30/2021 22:24:46 - INFO - __main__ - Step 50869: {'lr': 0.0003771324348064198, 'samples': 9766848, 'steps': 50868, 'loss/train': 1.0888392925262451} -08/30/2021 22:24:46 - INFO - __main__ - Step 50870: {'lr': 0.00037712786543513534, 'samples': 9767040, 'steps': 50869, 'loss/train': 1.5546096563339233} -08/30/2021 22:24:46 - INFO - __main__ - Step 50871: {'lr': 0.000377123296006569, 'samples': 9767232, 'steps': 50870, 'loss/train': 0.9032530784606934} -08/30/2021 22:24:48 - INFO - __main__ - Step 50872: {'lr': 0.000377118726520723, 'samples': 9767424, 'steps': 50871, 'loss/train': 1.0285224914550781} -08/30/2021 22:24:48 - INFO - __main__ - Step 50873: {'lr': 0.0003771141569775991, 'samples': 9767616, 'steps': 50872, 'loss/train': 1.7842652797698975} -08/30/2021 22:24:49 - INFO - __main__ - Step 50874: {'lr': 0.0003771095873771996, 'samples': 9767808, 'steps': 50873, 'loss/train': 2.094590902328491} -08/30/2021 22:24:49 - INFO - __main__ - Step 50875: {'lr': 0.0003771050177195265, 'samples': 9768000, 'steps': 50874, 'loss/train': 1.2735671997070312} -08/30/2021 22:24:49 - INFO - __main__ - Step 50876: {'lr': 0.0003771004480045818, 'samples': 9768192, 'steps': 50875, 'loss/train': 0.539814829826355} -08/30/2021 22:24:51 - INFO - __main__ - Step 50877: {'lr': 0.00037709587823236767, 'samples': 9768384, 'steps': 50876, 'loss/train': 1.3838486671447754} -08/30/2021 22:24:52 - INFO - __main__ - Step 50878: {'lr': 0.00037709130840288605, 'samples': 9768576, 'steps': 50877, 'loss/train': 0.22401279211044312} -08/30/2021 22:24:52 - INFO - __main__ - Step 50879: {'lr': 0.00037708673851613903, 'samples': 9768768, 'steps': 50878, 'loss/train': 1.4722766876220703} -08/30/2021 22:24:52 - INFO - __main__ - Step 50880: {'lr': 0.00037708216857212863, 'samples': 9768960, 'steps': 50879, 'loss/train': 1.3142516613006592} -08/30/2021 22:24:53 - INFO - __main__ - Step 50881: {'lr': 0.0003770775985708571, 'samples': 9769152, 'steps': 50880, 'loss/train': 1.6077675819396973} -08/30/2021 22:24:54 - INFO - __main__ - Step 50882: {'lr': 0.0003770730285123263, 'samples': 9769344, 'steps': 50881, 'loss/train': 1.0561434030532837} -08/30/2021 22:24:55 - INFO - __main__ - Step 50883: {'lr': 0.0003770684583965384, 'samples': 9769536, 'steps': 50882, 'loss/train': 1.8479206562042236} -08/30/2021 22:24:55 - INFO - __main__ - Step 50884: {'lr': 0.0003770638882234953, 'samples': 9769728, 'steps': 50883, 'loss/train': 0.8280871510505676} -08/30/2021 22:24:55 - INFO - __main__ - Step 50885: {'lr': 0.0003770593179931993, 'samples': 9769920, 'steps': 50884, 'loss/train': 1.3128963708877563} -08/30/2021 22:24:56 - INFO - __main__ - Step 50886: {'lr': 0.00037705474770565215, 'samples': 9770112, 'steps': 50885, 'loss/train': 1.4274985790252686} -08/30/2021 22:24:56 - INFO - __main__ - Step 50887: {'lr': 0.00037705017736085623, 'samples': 9770304, 'steps': 50886, 'loss/train': 1.536376714706421} -08/30/2021 22:24:58 - INFO - __main__ - Step 50888: {'lr': 0.00037704560695881346, 'samples': 9770496, 'steps': 50887, 'loss/train': 1.8148274421691895} -08/30/2021 22:24:58 - INFO - __main__ - Step 50889: {'lr': 0.0003770410364995259, 'samples': 9770688, 'steps': 50888, 'loss/train': 0.20914511382579803} -08/30/2021 22:24:58 - INFO - __main__ - Step 50890: {'lr': 0.00037703646598299554, 'samples': 9770880, 'steps': 50889, 'loss/train': 1.3130958080291748} -08/30/2021 22:24:59 - INFO - __main__ - Step 50891: {'lr': 0.00037703189540922463, 'samples': 9771072, 'steps': 50890, 'loss/train': 1.4951297044754028} -08/30/2021 22:24:59 - INFO - __main__ - Step 50892: {'lr': 0.000377027324778215, 'samples': 9771264, 'steps': 50891, 'loss/train': 0.37270689010620117} -08/30/2021 22:25:02 - INFO - __main__ - Step 50893: {'lr': 0.0003770227540899689, 'samples': 9771456, 'steps': 50892, 'loss/train': 1.3048276901245117} -08/30/2021 22:25:02 - INFO - __main__ - Step 50894: {'lr': 0.0003770181833444882, 'samples': 9771648, 'steps': 50893, 'loss/train': 1.3916434049606323} -08/30/2021 22:25:02 - INFO - __main__ - Step 50895: {'lr': 0.0003770136125417751, 'samples': 9771840, 'steps': 50894, 'loss/train': 1.4974582195281982} -08/30/2021 22:25:03 - INFO - __main__ - Step 50896: {'lr': 0.0003770090416818317, 'samples': 9772032, 'steps': 50895, 'loss/train': 0.9585852026939392} -08/30/2021 22:25:03 - INFO - __main__ - Step 50897: {'lr': 0.00037700447076465996, 'samples': 9772224, 'steps': 50896, 'loss/train': 1.51726233959198} -08/30/2021 22:25:03 - INFO - __main__ - Step 50898: {'lr': 0.0003769998997902619, 'samples': 9772416, 'steps': 50897, 'loss/train': 1.329371690750122} -08/30/2021 22:25:05 - INFO - __main__ - Step 50899: {'lr': 0.00037699532875863976, 'samples': 9772608, 'steps': 50898, 'loss/train': 1.7552887201309204} -08/30/2021 22:25:05 - INFO - __main__ - Step 50900: {'lr': 0.0003769907576697954, 'samples': 9772800, 'steps': 50899, 'loss/train': 1.707064151763916} -08/30/2021 22:25:06 - INFO - __main__ - Step 50901: {'lr': 0.000376986186523731, 'samples': 9772992, 'steps': 50900, 'loss/train': 0.8977749943733215} -08/30/2021 22:25:06 - INFO - __main__ - Step 50902: {'lr': 0.0003769816153204485, 'samples': 9773184, 'steps': 50901, 'loss/train': 0.9819461107254028} -08/30/2021 22:25:06 - INFO - __main__ - Step 50903: {'lr': 0.00037697704405995015, 'samples': 9773376, 'steps': 50902, 'loss/train': 1.3400992155075073} -08/30/2021 22:25:08 - INFO - __main__ - Step 50904: {'lr': 0.0003769724727422379, 'samples': 9773568, 'steps': 50903, 'loss/train': 1.7477514743804932} -08/30/2021 22:25:09 - INFO - __main__ - Step 50905: {'lr': 0.0003769679013673137, 'samples': 9773760, 'steps': 50904, 'loss/train': 0.528209924697876} -08/30/2021 22:25:09 - INFO - __main__ - Step 50906: {'lr': 0.00037696332993517983, 'samples': 9773952, 'steps': 50905, 'loss/train': 1.5773422718048096} -08/30/2021 22:25:09 - INFO - __main__ - Step 50907: {'lr': 0.0003769587584458382, 'samples': 9774144, 'steps': 50906, 'loss/train': 0.6630872488021851} -08/30/2021 22:25:10 - INFO - __main__ - Step 50908: {'lr': 0.00037695418689929095, 'samples': 9774336, 'steps': 50907, 'loss/train': 1.2419148683547974} -08/30/2021 22:25:11 - INFO - __main__ - Step 50909: {'lr': 0.00037694961529554006, 'samples': 9774528, 'steps': 50908, 'loss/train': 1.29733407497406} -08/30/2021 22:25:11 - INFO - __main__ - Step 50910: {'lr': 0.0003769450436345877, 'samples': 9774720, 'steps': 50909, 'loss/train': 1.2948863506317139} -08/30/2021 22:25:12 - INFO - __main__ - Step 50911: {'lr': 0.00037694047191643576, 'samples': 9774912, 'steps': 50910, 'loss/train': 1.1586613655090332} -08/30/2021 22:25:12 - INFO - __main__ - Step 50912: {'lr': 0.00037693590014108646, 'samples': 9775104, 'steps': 50911, 'loss/train': 1.039445161819458} -08/30/2021 22:25:13 - INFO - __main__ - Step 50913: {'lr': 0.0003769313283085418, 'samples': 9775296, 'steps': 50912, 'loss/train': 1.25136137008667} -08/30/2021 22:25:14 - INFO - __main__ - Step 50914: {'lr': 0.0003769267564188038, 'samples': 9775488, 'steps': 50913, 'loss/train': 1.4407514333724976} -08/30/2021 22:25:15 - INFO - __main__ - Step 50915: {'lr': 0.0003769221844718746, 'samples': 9775680, 'steps': 50914, 'loss/train': 1.3715497255325317} -08/30/2021 22:25:15 - INFO - __main__ - Step 50916: {'lr': 0.00037691761246775625, 'samples': 9775872, 'steps': 50915, 'loss/train': 1.3548270463943481} -08/30/2021 22:25:15 - INFO - __main__ - Step 50917: {'lr': 0.00037691304040645074, 'samples': 9776064, 'steps': 50916, 'loss/train': 1.1928681135177612} -08/30/2021 22:25:16 - INFO - __main__ - Step 50918: {'lr': 0.00037690846828796024, 'samples': 9776256, 'steps': 50917, 'loss/train': 1.4730546474456787} -08/30/2021 22:25:17 - INFO - __main__ - Step 50919: {'lr': 0.00037690389611228664, 'samples': 9776448, 'steps': 50918, 'loss/train': 0.21903111040592194} -08/30/2021 22:25:18 - INFO - __main__ - Step 50920: {'lr': 0.00037689932387943216, 'samples': 9776640, 'steps': 50919, 'loss/train': 1.240023136138916} -08/30/2021 22:25:18 - INFO - __main__ - Step 50921: {'lr': 0.0003768947515893988, 'samples': 9776832, 'steps': 50920, 'loss/train': 1.4727351665496826} -08/30/2021 22:25:18 - INFO - __main__ - Step 50922: {'lr': 0.0003768901792421886, 'samples': 9777024, 'steps': 50921, 'loss/train': 0.9558790326118469} -08/30/2021 22:25:19 - INFO - __main__ - Step 50923: {'lr': 0.0003768856068378036, 'samples': 9777216, 'steps': 50922, 'loss/train': 1.3771542310714722} -08/30/2021 22:25:20 - INFO - __main__ - Step 50924: {'lr': 0.000376881034376246, 'samples': 9777408, 'steps': 50923, 'loss/train': 0.45340245962142944} -08/30/2021 22:25:21 - INFO - __main__ - Step 50925: {'lr': 0.0003768764618575178, 'samples': 9777600, 'steps': 50924, 'loss/train': 1.293688178062439} -08/30/2021 22:25:21 - INFO - __main__ - Step 50926: {'lr': 0.00037687188928162087, 'samples': 9777792, 'steps': 50925, 'loss/train': 1.6255319118499756} -08/30/2021 22:25:21 - INFO - __main__ - Step 50927: {'lr': 0.00037686731664855755, 'samples': 9777984, 'steps': 50926, 'loss/train': 1.837478756904602} -08/30/2021 22:25:22 - INFO - __main__ - Step 50928: {'lr': 0.0003768627439583297, 'samples': 9778176, 'steps': 50927, 'loss/train': 1.4847376346588135} -08/30/2021 22:25:22 - INFO - __main__ - Step 50929: {'lr': 0.00037685817121093946, 'samples': 9778368, 'steps': 50928, 'loss/train': 1.1166173219680786} -08/30/2021 22:25:24 - INFO - __main__ - Step 50930: {'lr': 0.000376853598406389, 'samples': 9778560, 'steps': 50929, 'loss/train': 1.0932608842849731} -08/30/2021 22:25:24 - INFO - __main__ - Step 50931: {'lr': 0.00037684902554468015, 'samples': 9778752, 'steps': 50930, 'loss/train': 1.0910321474075317} -08/30/2021 22:25:24 - INFO - __main__ - Step 50932: {'lr': 0.0003768444526258151, 'samples': 9778944, 'steps': 50931, 'loss/train': 1.4822059869766235} -08/30/2021 22:25:25 - INFO - __main__ - Step 50933: {'lr': 0.0003768398796497959, 'samples': 9779136, 'steps': 50932, 'loss/train': 0.870415985584259} -08/30/2021 22:25:25 - INFO - __main__ - Step 50934: {'lr': 0.00037683530661662457, 'samples': 9779328, 'steps': 50933, 'loss/train': 1.47185218334198} -08/30/2021 22:25:27 - INFO - __main__ - Step 50935: {'lr': 0.00037683073352630327, 'samples': 9779520, 'steps': 50934, 'loss/train': 1.5783512592315674} -08/30/2021 22:25:27 - INFO - __main__ - Step 50936: {'lr': 0.000376826160378834, 'samples': 9779712, 'steps': 50935, 'loss/train': 0.9159941673278809} -08/30/2021 22:25:27 - INFO - __main__ - Step 50937: {'lr': 0.0003768215871742188, 'samples': 9779904, 'steps': 50936, 'loss/train': 1.404692530632019} -08/30/2021 22:25:28 - INFO - __main__ - Step 50938: {'lr': 0.00037681701391245983, 'samples': 9780096, 'steps': 50937, 'loss/train': 1.6873672008514404} -08/30/2021 22:25:28 - INFO - __main__ - Step 50939: {'lr': 0.0003768124405935589, 'samples': 9780288, 'steps': 50938, 'loss/train': 1.4844799041748047} -08/30/2021 22:25:30 - INFO - __main__ - Step 50940: {'lr': 0.00037680786721751834, 'samples': 9780480, 'steps': 50939, 'loss/train': 1.6213657855987549} -08/30/2021 22:25:30 - INFO - __main__ - Step 50941: {'lr': 0.0003768032937843401, 'samples': 9780672, 'steps': 50940, 'loss/train': 0.6705363392829895} -08/30/2021 22:25:30 - INFO - __main__ - Step 50942: {'lr': 0.00037679872029402627, 'samples': 9780864, 'steps': 50941, 'loss/train': 0.8061746954917908} -08/30/2021 22:25:31 - INFO - __main__ - Step 50943: {'lr': 0.0003767941467465789, 'samples': 9781056, 'steps': 50942, 'loss/train': 1.5418555736541748} -08/30/2021 22:25:31 - INFO - __main__ - Step 50944: {'lr': 0.000376789573142, 'samples': 9781248, 'steps': 50943, 'loss/train': 1.365171194076538} -08/30/2021 22:25:33 - INFO - __main__ - Step 50945: {'lr': 0.0003767849994802918, 'samples': 9781440, 'steps': 50944, 'loss/train': 1.3933255672454834} -08/30/2021 22:25:33 - INFO - __main__ - Step 50946: {'lr': 0.0003767804257614561, 'samples': 9781632, 'steps': 50945, 'loss/train': 1.0017657279968262} -08/30/2021 22:25:34 - INFO - __main__ - Step 50947: {'lr': 0.00037677585198549516, 'samples': 9781824, 'steps': 50946, 'loss/train': 1.5424386262893677} -08/30/2021 22:25:34 - INFO - __main__ - Step 50948: {'lr': 0.00037677127815241086, 'samples': 9782016, 'steps': 50947, 'loss/train': 1.5783275365829468} -08/30/2021 22:25:34 - INFO - __main__ - Step 50949: {'lr': 0.00037676670426220547, 'samples': 9782208, 'steps': 50948, 'loss/train': 1.4499647617340088} -08/30/2021 22:25:35 - INFO - __main__ - Step 50950: {'lr': 0.00037676213031488095, 'samples': 9782400, 'steps': 50949, 'loss/train': 0.8235907554626465} -08/30/2021 22:25:37 - INFO - __main__ - Step 50951: {'lr': 0.0003767575563104394, 'samples': 9782592, 'steps': 50950, 'loss/train': 1.3277612924575806} -08/30/2021 22:25:37 - INFO - __main__ - Step 50952: {'lr': 0.00037675298224888287, 'samples': 9782784, 'steps': 50951, 'loss/train': 1.6856927871704102} -08/30/2021 22:25:37 - INFO - __main__ - Step 50953: {'lr': 0.0003767484081302133, 'samples': 9782976, 'steps': 50952, 'loss/train': 1.3247592449188232} -08/30/2021 22:25:38 - INFO - __main__ - Step 50954: {'lr': 0.000376743833954433, 'samples': 9783168, 'steps': 50953, 'loss/train': 1.1527340412139893} -08/30/2021 22:25:38 - INFO - __main__ - Step 50955: {'lr': 0.00037673925972154376, 'samples': 9783360, 'steps': 50954, 'loss/train': 0.8363124132156372} -08/30/2021 22:25:40 - INFO - __main__ - Step 50956: {'lr': 0.00037673468543154777, 'samples': 9783552, 'steps': 50955, 'loss/train': 1.054368257522583} -08/30/2021 22:25:40 - INFO - __main__ - Step 50957: {'lr': 0.0003767301110844472, 'samples': 9783744, 'steps': 50956, 'loss/train': 2.1103508472442627} -08/30/2021 22:25:41 - INFO - __main__ - Step 50958: {'lr': 0.0003767255366802439, 'samples': 9783936, 'steps': 50957, 'loss/train': 1.6950081586837769} -08/30/2021 22:25:41 - INFO - __main__ - Step 50959: {'lr': 0.00037672096221894004, 'samples': 9784128, 'steps': 50958, 'loss/train': 1.2313460111618042} -08/30/2021 22:25:41 - INFO - __main__ - Step 50960: {'lr': 0.0003767163877005376, 'samples': 9784320, 'steps': 50959, 'loss/train': 1.5555827617645264} -08/30/2021 22:25:43 - INFO - __main__ - Step 50961: {'lr': 0.0003767118131250388, 'samples': 9784512, 'steps': 50960, 'loss/train': 1.2279070615768433} -08/30/2021 22:25:43 - INFO - __main__ - Step 50962: {'lr': 0.00037670723849244557, 'samples': 9784704, 'steps': 50961, 'loss/train': 0.7368555665016174} -08/30/2021 22:25:44 - INFO - __main__ - Step 50963: {'lr': 0.0003767026638027601, 'samples': 9784896, 'steps': 50962, 'loss/train': 1.827950119972229} -08/30/2021 22:25:44 - INFO - __main__ - Step 50964: {'lr': 0.00037669808905598434, 'samples': 9785088, 'steps': 50963, 'loss/train': 1.7964262962341309} -08/30/2021 22:25:44 - INFO - __main__ - Step 50965: {'lr': 0.0003766935142521203, 'samples': 9785280, 'steps': 50964, 'loss/train': 0.9194609522819519} -08/30/2021 22:25:46 - INFO - __main__ - Step 50966: {'lr': 0.00037668893939117023, 'samples': 9785472, 'steps': 50965, 'loss/train': 1.1977851390838623} -08/30/2021 22:25:46 - INFO - __main__ - Step 50967: {'lr': 0.000376684364473136, 'samples': 9785664, 'steps': 50966, 'loss/train': 0.770944356918335} -08/30/2021 22:25:47 - INFO - __main__ - Step 50968: {'lr': 0.00037667978949801974, 'samples': 9785856, 'steps': 50967, 'loss/train': 1.216599464416504} -08/30/2021 22:25:47 - INFO - __main__ - Step 50969: {'lr': 0.00037667521446582355, 'samples': 9786048, 'steps': 50968, 'loss/train': 1.0586565732955933} -08/30/2021 22:25:47 - INFO - __main__ - Step 50970: {'lr': 0.00037667063937654944, 'samples': 9786240, 'steps': 50969, 'loss/train': 1.0758748054504395} -08/30/2021 22:25:49 - INFO - __main__ - Step 50971: {'lr': 0.00037666606423019956, 'samples': 9786432, 'steps': 50970, 'loss/train': 1.2091621160507202} -08/30/2021 22:25:49 - INFO - __main__ - Step 50972: {'lr': 0.00037666148902677576, 'samples': 9786624, 'steps': 50971, 'loss/train': 1.2704368829727173} -08/30/2021 22:25:50 - INFO - __main__ - Step 50973: {'lr': 0.0003766569137662804, 'samples': 9786816, 'steps': 50972, 'loss/train': 0.9434016942977905} -08/30/2021 22:25:50 - INFO - __main__ - Step 50974: {'lr': 0.00037665233844871534, 'samples': 9787008, 'steps': 50973, 'loss/train': 1.3591214418411255} -08/30/2021 22:25:50 - INFO - __main__ - Step 50975: {'lr': 0.0003766477630740827, 'samples': 9787200, 'steps': 50974, 'loss/train': 1.1668370962142944} -08/30/2021 22:25:52 - INFO - __main__ - Step 50976: {'lr': 0.00037664318764238445, 'samples': 9787392, 'steps': 50975, 'loss/train': 1.9410172700881958} -08/30/2021 22:25:52 - INFO - __main__ - Step 50977: {'lr': 0.0003766386121536228, 'samples': 9787584, 'steps': 50976, 'loss/train': 1.7867932319641113} -08/30/2021 22:25:52 - INFO - __main__ - Step 50978: {'lr': 0.00037663403660779984, 'samples': 9787776, 'steps': 50977, 'loss/train': 1.4452104568481445} -08/30/2021 22:25:53 - INFO - __main__ - Step 50979: {'lr': 0.00037662946100491736, 'samples': 9787968, 'steps': 50978, 'loss/train': 1.193568468093872} -08/30/2021 22:25:53 - INFO - __main__ - Step 50980: {'lr': 0.00037662488534497766, 'samples': 9788160, 'steps': 50979, 'loss/train': 0.6591973304748535} -08/30/2021 22:25:54 - INFO - __main__ - Step 50981: {'lr': 0.0003766203096279828, 'samples': 9788352, 'steps': 50980, 'loss/train': 1.4129118919372559} -08/30/2021 22:25:55 - INFO - __main__ - Step 50982: {'lr': 0.00037661573385393477, 'samples': 9788544, 'steps': 50981, 'loss/train': 1.5191997289657593} -08/30/2021 22:25:55 - INFO - __main__ - Step 50983: {'lr': 0.0003766111580228356, 'samples': 9788736, 'steps': 50982, 'loss/train': 1.4790685176849365} -08/30/2021 22:25:56 - INFO - __main__ - Step 50984: {'lr': 0.00037660658213468744, 'samples': 9788928, 'steps': 50983, 'loss/train': 2.0044775009155273} -08/30/2021 22:25:56 - INFO - __main__ - Step 50985: {'lr': 0.00037660200618949225, 'samples': 9789120, 'steps': 50984, 'loss/train': 1.2575911283493042} -08/30/2021 22:25:56 - INFO - __main__ - Step 50986: {'lr': 0.0003765974301872522, 'samples': 9789312, 'steps': 50985, 'loss/train': 1.569093942642212} -08/30/2021 22:25:58 - INFO - __main__ - Step 50987: {'lr': 0.0003765928541279693, 'samples': 9789504, 'steps': 50986, 'loss/train': 0.814099907875061} -08/30/2021 22:25:58 - INFO - __main__ - Step 50988: {'lr': 0.0003765882780116455, 'samples': 9789696, 'steps': 50987, 'loss/train': 1.704711675643921} -08/30/2021 22:25:59 - INFO - __main__ - Step 50989: {'lr': 0.0003765837018382831, 'samples': 9789888, 'steps': 50988, 'loss/train': 0.9379704594612122} -08/30/2021 22:25:59 - INFO - __main__ - Step 50990: {'lr': 0.0003765791256078841, 'samples': 9790080, 'steps': 50989, 'loss/train': 1.3221157789230347} -08/30/2021 22:25:59 - INFO - __main__ - Step 50991: {'lr': 0.00037657454932045036, 'samples': 9790272, 'steps': 50990, 'loss/train': 1.6199997663497925} -08/30/2021 22:26:02 - INFO - __main__ - Step 50992: {'lr': 0.00037656997297598417, 'samples': 9790464, 'steps': 50991, 'loss/train': 1.477184772491455} -08/30/2021 22:26:02 - INFO - __main__ - Step 50993: {'lr': 0.0003765653965744874, 'samples': 9790656, 'steps': 50992, 'loss/train': 0.8813958764076233} -08/30/2021 22:26:02 - INFO - __main__ - Step 50994: {'lr': 0.00037656082011596224, 'samples': 9790848, 'steps': 50993, 'loss/train': 1.374882698059082} -08/30/2021 22:26:03 - INFO - __main__ - Step 50995: {'lr': 0.00037655624360041084, 'samples': 9791040, 'steps': 50994, 'loss/train': 0.09208963811397552} -08/30/2021 22:26:03 - INFO - __main__ - Step 50996: {'lr': 0.00037655166702783507, 'samples': 9791232, 'steps': 50995, 'loss/train': 1.3419182300567627} -08/30/2021 22:26:05 - INFO - __main__ - Step 50997: {'lr': 0.0003765470903982371, 'samples': 9791424, 'steps': 50996, 'loss/train': 1.0198330879211426} -08/30/2021 22:26:05 - INFO - __main__ - Step 50998: {'lr': 0.0003765425137116189, 'samples': 9791616, 'steps': 50997, 'loss/train': 0.6795632243156433} -08/30/2021 22:26:06 - INFO - __main__ - Step 50999: {'lr': 0.00037653793696798267, 'samples': 9791808, 'steps': 50998, 'loss/train': 0.1587800830602646} -08/30/2021 22:26:06 - INFO - __main__ - Step 51000: {'lr': 0.0003765333601673303, 'samples': 9792000, 'steps': 50999, 'loss/train': 1.6997179985046387} -08/30/2021 22:26:07 - INFO - __main__ - Step 51001: {'lr': 0.0003765287833096641, 'samples': 9792192, 'steps': 51000, 'loss/train': 0.9439852833747864} -08/30/2021 22:26:07 - INFO - __main__ - Step 51002: {'lr': 0.00037652420639498583, 'samples': 9792384, 'steps': 51001, 'loss/train': 0.8181083798408508} -08/30/2021 22:26:09 - INFO - __main__ - Step 51003: {'lr': 0.00037651962942329784, 'samples': 9792576, 'steps': 51002, 'loss/train': 2.2781405448913574} -08/30/2021 22:26:10 - INFO - __main__ - Step 51004: {'lr': 0.0003765150523946019, 'samples': 9792768, 'steps': 51003, 'loss/train': 1.070449709892273} -08/30/2021 22:26:10 - INFO - __main__ - Step 51005: {'lr': 0.00037651047530890035, 'samples': 9792960, 'steps': 51004, 'loss/train': 1.507706880569458} -08/30/2021 22:26:10 - INFO - __main__ - Step 51006: {'lr': 0.0003765058981661952, 'samples': 9793152, 'steps': 51005, 'loss/train': 1.3608185052871704} -08/30/2021 22:26:11 - INFO - __main__ - Step 51007: {'lr': 0.0003765013209664883, 'samples': 9793344, 'steps': 51006, 'loss/train': 1.2262402772903442} -08/30/2021 22:26:12 - INFO - __main__ - Step 51008: {'lr': 0.00037649674370978195, 'samples': 9793536, 'steps': 51007, 'loss/train': 1.3377485275268555} -08/30/2021 22:26:13 - INFO - __main__ - Step 51009: {'lr': 0.000376492166396078, 'samples': 9793728, 'steps': 51008, 'loss/train': 1.5474079847335815} -08/30/2021 22:26:13 - INFO - __main__ - Step 51010: {'lr': 0.0003764875890253787, 'samples': 9793920, 'steps': 51009, 'loss/train': 1.4240821599960327} -08/30/2021 22:26:14 - INFO - __main__ - Step 51011: {'lr': 0.0003764830115976861, 'samples': 9794112, 'steps': 51010, 'loss/train': 0.49576616287231445} -08/30/2021 22:26:14 - INFO - __main__ - Step 51012: {'lr': 0.00037647843411300213, 'samples': 9794304, 'steps': 51011, 'loss/train': 0.06136703118681908} -08/30/2021 22:26:16 - INFO - __main__ - Step 51013: {'lr': 0.00037647385657132895, 'samples': 9794496, 'steps': 51012, 'loss/train': 1.6304805278778076} -08/30/2021 22:26:16 - INFO - __main__ - Step 51014: {'lr': 0.0003764692789726686, 'samples': 9794688, 'steps': 51013, 'loss/train': 1.4706993103027344} -08/30/2021 22:26:16 - INFO - __main__ - Step 51015: {'lr': 0.00037646470131702314, 'samples': 9794880, 'steps': 51014, 'loss/train': 0.032574210315942764} -08/30/2021 22:26:17 - INFO - __main__ - Step 51016: {'lr': 0.00037646012360439463, 'samples': 9795072, 'steps': 51015, 'loss/train': 1.276258945465088} -08/30/2021 22:26:17 - INFO - __main__ - Step 51017: {'lr': 0.0003764555458347851, 'samples': 9795264, 'steps': 51016, 'loss/train': 1.5600028038024902} -08/30/2021 22:26:17 - INFO - __main__ - Step 51018: {'lr': 0.00037645096800819684, 'samples': 9795456, 'steps': 51017, 'loss/train': 1.8636372089385986} -08/30/2021 22:26:19 - INFO - __main__ - Step 51019: {'lr': 0.00037644639012463155, 'samples': 9795648, 'steps': 51018, 'loss/train': 0.23138362169265747} -08/30/2021 22:26:19 - INFO - __main__ - Step 51020: {'lr': 0.00037644181218409156, 'samples': 9795840, 'steps': 51019, 'loss/train': 1.5921701192855835} -08/30/2021 22:26:20 - INFO - __main__ - Step 51021: {'lr': 0.0003764372341865788, 'samples': 9796032, 'steps': 51020, 'loss/train': 1.307142734527588} -08/30/2021 22:26:20 - INFO - __main__ - Step 51022: {'lr': 0.00037643265613209533, 'samples': 9796224, 'steps': 51021, 'loss/train': 1.2661389112472534} -08/30/2021 22:26:21 - INFO - __main__ - Step 51023: {'lr': 0.00037642807802064327, 'samples': 9796416, 'steps': 51022, 'loss/train': 0.9044985175132751} -08/30/2021 22:26:22 - INFO - __main__ - Step 51024: {'lr': 0.00037642349985222474, 'samples': 9796608, 'steps': 51023, 'loss/train': 0.41017019748687744} -08/30/2021 22:26:23 - INFO - __main__ - Step 51025: {'lr': 0.0003764189216268417, 'samples': 9796800, 'steps': 51024, 'loss/train': 1.484224796295166} -08/30/2021 22:26:23 - INFO - __main__ - Step 51026: {'lr': 0.0003764143433444962, 'samples': 9796992, 'steps': 51025, 'loss/train': 1.3008670806884766} -08/30/2021 22:26:23 - INFO - __main__ - Step 51027: {'lr': 0.00037640976500519035, 'samples': 9797184, 'steps': 51026, 'loss/train': 0.5754580497741699} -08/30/2021 22:26:24 - INFO - __main__ - Step 51028: {'lr': 0.0003764051866089262, 'samples': 9797376, 'steps': 51027, 'loss/train': 1.3381850719451904} -08/30/2021 22:26:25 - INFO - __main__ - Step 51029: {'lr': 0.00037640060815570585, 'samples': 9797568, 'steps': 51028, 'loss/train': 1.01432204246521} -08/30/2021 22:26:26 - INFO - __main__ - Step 51030: {'lr': 0.0003763960296455314, 'samples': 9797760, 'steps': 51029, 'loss/train': 1.67357337474823} -08/30/2021 22:26:26 - INFO - __main__ - Step 51031: {'lr': 0.0003763914510784048, 'samples': 9797952, 'steps': 51030, 'loss/train': 1.4265296459197998} -08/30/2021 22:26:27 - INFO - __main__ - Step 51032: {'lr': 0.00037638687245432817, 'samples': 9798144, 'steps': 51031, 'loss/train': 1.2338874340057373} -08/30/2021 22:26:27 - INFO - __main__ - Step 51033: {'lr': 0.00037638229377330356, 'samples': 9798336, 'steps': 51032, 'loss/train': 5.946896553039551} -08/30/2021 22:26:27 - INFO - __main__ - Step 51034: {'lr': 0.00037637771503533303, 'samples': 9798528, 'steps': 51033, 'loss/train': 5.8254241943359375} -08/30/2021 22:26:29 - INFO - __main__ - Step 51035: {'lr': 0.00037637313624041863, 'samples': 9798720, 'steps': 51034, 'loss/train': 1.847798466682434} -08/30/2021 22:26:29 - INFO - __main__ - Step 51036: {'lr': 0.00037636855738856247, 'samples': 9798912, 'steps': 51035, 'loss/train': 0.8923953175544739} -08/30/2021 22:26:30 - INFO - __main__ - Step 51037: {'lr': 0.00037636397847976656, 'samples': 9799104, 'steps': 51036, 'loss/train': 1.4600393772125244} -08/30/2021 22:26:30 - INFO - __main__ - Step 51038: {'lr': 0.00037635939951403307, 'samples': 9799296, 'steps': 51037, 'loss/train': 2.040217161178589} -08/30/2021 22:26:30 - INFO - __main__ - Step 51039: {'lr': 0.00037635482049136395, 'samples': 9799488, 'steps': 51038, 'loss/train': 1.0636835098266602} -08/30/2021 22:26:31 - INFO - __main__ - Step 51040: {'lr': 0.0003763502414117612, 'samples': 9799680, 'steps': 51039, 'loss/train': 1.5607802867889404} -08/30/2021 22:26:32 - INFO - __main__ - Step 51041: {'lr': 0.0003763456622752271, 'samples': 9799872, 'steps': 51040, 'loss/train': 1.3773200511932373} -08/30/2021 22:26:33 - INFO - __main__ - Step 51042: {'lr': 0.0003763410830817635, 'samples': 9800064, 'steps': 51041, 'loss/train': 0.6044677495956421} -08/30/2021 22:26:33 - INFO - __main__ - Step 51043: {'lr': 0.00037633650383137263, 'samples': 9800256, 'steps': 51042, 'loss/train': 1.3890656232833862} -08/30/2021 22:26:33 - INFO - __main__ - Step 51044: {'lr': 0.0003763319245240565, 'samples': 9800448, 'steps': 51043, 'loss/train': 0.9743980169296265} -08/30/2021 22:26:34 - INFO - __main__ - Step 51045: {'lr': 0.00037632734515981715, 'samples': 9800640, 'steps': 51044, 'loss/train': 1.0391114950180054} -08/30/2021 22:26:35 - INFO - __main__ - Step 51046: {'lr': 0.00037632276573865657, 'samples': 9800832, 'steps': 51045, 'loss/train': 1.7304145097732544} -08/30/2021 22:26:36 - INFO - __main__ - Step 51047: {'lr': 0.00037631818626057695, 'samples': 9801024, 'steps': 51046, 'loss/train': 0.8279850482940674} -08/30/2021 22:26:36 - INFO - __main__ - Step 51048: {'lr': 0.0003763136067255803, 'samples': 9801216, 'steps': 51047, 'loss/train': 1.1320995092391968} -08/30/2021 22:26:36 - INFO - __main__ - Step 51049: {'lr': 0.00037630902713366865, 'samples': 9801408, 'steps': 51048, 'loss/train': 1.310449242591858} -08/30/2021 22:26:37 - INFO - __main__ - Step 51050: {'lr': 0.00037630444748484415, 'samples': 9801600, 'steps': 51049, 'loss/train': 1.2691503763198853} -08/30/2021 22:26:38 - INFO - __main__ - Step 51051: {'lr': 0.00037629986777910885, 'samples': 9801792, 'steps': 51050, 'loss/train': 1.329351782798767} -08/30/2021 22:26:39 - INFO - __main__ - Step 51052: {'lr': 0.00037629528801646475, 'samples': 9801984, 'steps': 51051, 'loss/train': 1.1222641468048096} -08/30/2021 22:26:39 - INFO - __main__ - Step 51053: {'lr': 0.0003762907081969139, 'samples': 9802176, 'steps': 51052, 'loss/train': 1.2861281633377075} -08/30/2021 22:26:39 - INFO - __main__ - Step 51054: {'lr': 0.00037628612832045846, 'samples': 9802368, 'steps': 51053, 'loss/train': 1.512338638305664} -08/30/2021 22:26:40 - INFO - __main__ - Step 51055: {'lr': 0.0003762815483871004, 'samples': 9802560, 'steps': 51054, 'loss/train': 1.5725440979003906} -08/30/2021 22:26:42 - INFO - __main__ - Step 51056: {'lr': 0.00037627696839684176, 'samples': 9802752, 'steps': 51055, 'loss/train': 1.3401360511779785} -08/30/2021 22:26:42 - INFO - __main__ - Step 51057: {'lr': 0.0003762723883496848, 'samples': 9802944, 'steps': 51056, 'loss/train': 1.83293879032135} -08/30/2021 22:26:43 - INFO - __main__ - Step 51058: {'lr': 0.00037626780824563145, 'samples': 9803136, 'steps': 51057, 'loss/train': 1.2921923398971558} -08/30/2021 22:26:43 - INFO - __main__ - Step 51059: {'lr': 0.0003762632280846837, 'samples': 9803328, 'steps': 51058, 'loss/train': 1.3698080778121948} -08/30/2021 22:26:43 - INFO - __main__ - Step 51060: {'lr': 0.00037625864786684364, 'samples': 9803520, 'steps': 51059, 'loss/train': 0.8140104413032532} -08/30/2021 22:26:45 - INFO - __main__ - Step 51061: {'lr': 0.00037625406759211346, 'samples': 9803712, 'steps': 51060, 'loss/train': 1.9415984153747559} -08/30/2021 22:26:45 - INFO - __main__ - Step 51062: {'lr': 0.00037624948726049513, 'samples': 9803904, 'steps': 51061, 'loss/train': 0.5403301119804382} -08/30/2021 22:26:46 - INFO - __main__ - Step 51063: {'lr': 0.0003762449068719907, 'samples': 9804096, 'steps': 51062, 'loss/train': 0.5302300453186035} -08/30/2021 22:26:46 - INFO - __main__ - Step 51064: {'lr': 0.00037624032642660234, 'samples': 9804288, 'steps': 51063, 'loss/train': 0.9016693234443665} -08/30/2021 22:26:46 - INFO - __main__ - Step 51065: {'lr': 0.00037623574592433195, 'samples': 9804480, 'steps': 51064, 'loss/train': 1.92802095413208} -08/30/2021 22:26:48 - INFO - __main__ - Step 51066: {'lr': 0.00037623116536518176, 'samples': 9804672, 'steps': 51065, 'loss/train': 1.5189765691757202} -08/30/2021 22:26:48 - INFO - __main__ - Step 51067: {'lr': 0.00037622658474915373, 'samples': 9804864, 'steps': 51066, 'loss/train': 0.8574656248092651} -08/30/2021 22:26:49 - INFO - __main__ - Step 51068: {'lr': 0.0003762220040762499, 'samples': 9805056, 'steps': 51067, 'loss/train': 1.0047905445098877} -08/30/2021 22:26:49 - INFO - __main__ - Step 51069: {'lr': 0.0003762174233464724, 'samples': 9805248, 'steps': 51068, 'loss/train': 1.1985036134719849} -08/30/2021 22:26:49 - INFO - __main__ - Step 51070: {'lr': 0.00037621284255982324, 'samples': 9805440, 'steps': 51069, 'loss/train': 1.8381924629211426} -08/30/2021 22:26:51 - INFO - __main__ - Step 51071: {'lr': 0.0003762082617163046, 'samples': 9805632, 'steps': 51070, 'loss/train': 1.524709701538086} -08/30/2021 22:26:52 - INFO - __main__ - Step 51072: {'lr': 0.0003762036808159185, 'samples': 9805824, 'steps': 51071, 'loss/train': 1.2687848806381226} -08/30/2021 22:26:52 - INFO - __main__ - Step 51073: {'lr': 0.0003761990998586669, 'samples': 9806016, 'steps': 51072, 'loss/train': 0.7302113175392151} -08/30/2021 22:26:52 - INFO - __main__ - Step 51074: {'lr': 0.0003761945188445519, 'samples': 9806208, 'steps': 51073, 'loss/train': 1.64555823802948} -08/30/2021 22:26:53 - INFO - __main__ - Step 51075: {'lr': 0.00037618993777357567, 'samples': 9806400, 'steps': 51074, 'loss/train': 0.1517094522714615} -08/30/2021 22:26:54 - INFO - __main__ - Step 51076: {'lr': 0.00037618535664574014, 'samples': 9806592, 'steps': 51075, 'loss/train': 0.7418529391288757} -08/30/2021 22:26:55 - INFO - __main__ - Step 51077: {'lr': 0.0003761807754610475, 'samples': 9806784, 'steps': 51076, 'loss/train': 1.3080519437789917} -08/30/2021 22:26:55 - INFO - __main__ - Step 51078: {'lr': 0.0003761761942194997, 'samples': 9806976, 'steps': 51077, 'loss/train': 1.0140433311462402} -08/30/2021 22:26:55 - INFO - __main__ - Step 51079: {'lr': 0.00037617161292109887, 'samples': 9807168, 'steps': 51078, 'loss/train': 1.57699453830719} -08/30/2021 22:26:56 - INFO - __main__ - Step 51080: {'lr': 0.0003761670315658471, 'samples': 9807360, 'steps': 51079, 'loss/train': 1.6466772556304932} -08/30/2021 22:26:57 - INFO - __main__ - Step 51081: {'lr': 0.0003761624501537463, 'samples': 9807552, 'steps': 51080, 'loss/train': 1.5381520986557007} -08/30/2021 22:26:57 - INFO - __main__ - Step 51082: {'lr': 0.00037615786868479875, 'samples': 9807744, 'steps': 51081, 'loss/train': 1.18941330909729} -08/30/2021 22:26:58 - INFO - __main__ - Step 51083: {'lr': 0.0003761532871590063, 'samples': 9807936, 'steps': 51082, 'loss/train': 1.2548831701278687} -08/30/2021 22:26:58 - INFO - __main__ - Step 51084: {'lr': 0.0003761487055763713, 'samples': 9808128, 'steps': 51083, 'loss/train': 1.1112098693847656} -08/30/2021 22:26:59 - INFO - __main__ - Step 51085: {'lr': 0.0003761441239368955, 'samples': 9808320, 'steps': 51084, 'loss/train': 1.2736133337020874} -08/30/2021 22:27:00 - INFO - __main__ - Step 51086: {'lr': 0.0003761395422405811, 'samples': 9808512, 'steps': 51085, 'loss/train': 1.235261082649231} -08/30/2021 22:27:00 - INFO - __main__ - Step 51087: {'lr': 0.00037613496048743023, 'samples': 9808704, 'steps': 51086, 'loss/train': 1.9329742193222046} -08/30/2021 22:27:01 - INFO - __main__ - Step 51088: {'lr': 0.00037613037867744494, 'samples': 9808896, 'steps': 51087, 'loss/train': 1.3166897296905518} -08/30/2021 22:27:01 - INFO - __main__ - Step 51089: {'lr': 0.00037612579681062713, 'samples': 9809088, 'steps': 51088, 'loss/train': 1.9982270002365112} -08/30/2021 22:27:01 - INFO - __main__ - Step 51090: {'lr': 0.000376121214886979, 'samples': 9809280, 'steps': 51089, 'loss/train': 1.3550151586532593} -08/30/2021 22:27:03 - INFO - __main__ - Step 51091: {'lr': 0.00037611663290650267, 'samples': 9809472, 'steps': 51090, 'loss/train': 1.4045321941375732} -08/30/2021 22:27:03 - INFO - __main__ - Step 51092: {'lr': 0.0003761120508692001, 'samples': 9809664, 'steps': 51091, 'loss/train': 1.3623402118682861} -08/30/2021 22:27:04 - INFO - __main__ - Step 51093: {'lr': 0.00037610746877507343, 'samples': 9809856, 'steps': 51092, 'loss/train': 1.6759140491485596} -08/30/2021 22:27:04 - INFO - __main__ - Step 51094: {'lr': 0.0003761028866241246, 'samples': 9810048, 'steps': 51093, 'loss/train': 1.1017138957977295} -08/30/2021 22:27:04 - INFO - __main__ - Step 51095: {'lr': 0.00037609830441635573, 'samples': 9810240, 'steps': 51094, 'loss/train': 1.4433974027633667} -08/30/2021 22:27:05 - INFO - __main__ - Step 51096: {'lr': 0.00037609372215176897, 'samples': 9810432, 'steps': 51095, 'loss/train': 1.3323721885681152} -08/30/2021 22:27:06 - INFO - __main__ - Step 51097: {'lr': 0.0003760891398303663, 'samples': 9810624, 'steps': 51096, 'loss/train': 1.3992011547088623} -08/30/2021 22:27:07 - INFO - __main__ - Step 51098: {'lr': 0.0003760845574521499, 'samples': 9810816, 'steps': 51097, 'loss/train': 1.0762879848480225} -08/30/2021 22:27:07 - INFO - __main__ - Step 51099: {'lr': 0.00037607997501712165, 'samples': 9811008, 'steps': 51098, 'loss/train': 1.576791763305664} -08/30/2021 22:27:07 - INFO - __main__ - Step 51100: {'lr': 0.0003760753925252838, 'samples': 9811200, 'steps': 51099, 'loss/train': 1.6294625997543335} -08/30/2021 22:27:08 - INFO - __main__ - Step 51101: {'lr': 0.0003760708099766382, 'samples': 9811392, 'steps': 51100, 'loss/train': 1.4208580255508423} -08/30/2021 22:27:10 - INFO - __main__ - Step 51102: {'lr': 0.00037606622737118713, 'samples': 9811584, 'steps': 51101, 'loss/train': 1.3910399675369263} -08/30/2021 22:27:10 - INFO - __main__ - Step 51103: {'lr': 0.00037606164470893247, 'samples': 9811776, 'steps': 51102, 'loss/train': 1.2674756050109863} -08/30/2021 22:27:11 - INFO - __main__ - Step 51104: {'lr': 0.00037605706198987646, 'samples': 9811968, 'steps': 51103, 'loss/train': 1.0044111013412476} -08/30/2021 22:27:11 - INFO - __main__ - Step 51105: {'lr': 0.0003760524792140211, 'samples': 9812160, 'steps': 51104, 'loss/train': 1.3432573080062866} -08/30/2021 22:27:11 - INFO - __main__ - Step 51106: {'lr': 0.0003760478963813684, 'samples': 9812352, 'steps': 51105, 'loss/train': 0.8721525073051453} -08/30/2021 22:27:13 - INFO - __main__ - Step 51107: {'lr': 0.00037604331349192047, 'samples': 9812544, 'steps': 51106, 'loss/train': 1.1137263774871826} -08/30/2021 22:27:14 - INFO - __main__ - Step 51108: {'lr': 0.00037603873054567927, 'samples': 9812736, 'steps': 51107, 'loss/train': 1.4222512245178223} -08/30/2021 22:27:14 - INFO - __main__ - Step 51109: {'lr': 0.00037603414754264707, 'samples': 9812928, 'steps': 51108, 'loss/train': 1.319298267364502} -08/30/2021 22:27:15 - INFO - __main__ - Step 51110: {'lr': 0.00037602956448282577, 'samples': 9813120, 'steps': 51109, 'loss/train': 1.4606393575668335} -08/30/2021 22:27:15 - INFO - __main__ - Step 51111: {'lr': 0.00037602498136621754, 'samples': 9813312, 'steps': 51110, 'loss/train': 1.8039977550506592} -08/30/2021 22:27:15 - INFO - __main__ - Step 51112: {'lr': 0.00037602039819282444, 'samples': 9813504, 'steps': 51111, 'loss/train': 1.6095964908599854} -08/30/2021 22:27:16 - INFO - __main__ - Step 51113: {'lr': 0.00037601581496264847, 'samples': 9813696, 'steps': 51112, 'loss/train': 1.3599810600280762} -08/30/2021 22:27:18 - INFO - __main__ - Step 51114: {'lr': 0.0003760112316756917, 'samples': 9813888, 'steps': 51113, 'loss/train': 0.9863927960395813} -08/30/2021 22:27:18 - INFO - __main__ - Step 51115: {'lr': 0.0003760066483319562, 'samples': 9814080, 'steps': 51114, 'loss/train': 0.5862434506416321} -08/30/2021 22:27:19 - INFO - __main__ - Step 51116: {'lr': 0.000376002064931444, 'samples': 9814272, 'steps': 51115, 'loss/train': 2.3102502822875977} -08/30/2021 22:27:19 - INFO - __main__ - Step 51117: {'lr': 0.00037599748147415724, 'samples': 9814464, 'steps': 51116, 'loss/train': 1.5437085628509521} -08/30/2021 22:27:19 - INFO - __main__ - Step 51118: {'lr': 0.000375992897960098, 'samples': 9814656, 'steps': 51117, 'loss/train': 1.741047978401184} -08/30/2021 22:27:21 - INFO - __main__ - Step 51119: {'lr': 0.0003759883143892683, 'samples': 9814848, 'steps': 51118, 'loss/train': 1.3197335004806519} -08/30/2021 22:27:21 - INFO - __main__ - Step 51120: {'lr': 0.00037598373076167023, 'samples': 9815040, 'steps': 51119, 'loss/train': 1.4412221908569336} -08/30/2021 22:27:22 - INFO - __main__ - Step 51121: {'lr': 0.0003759791470773058, 'samples': 9815232, 'steps': 51120, 'loss/train': 1.1492435932159424} -08/30/2021 22:27:22 - INFO - __main__ - Step 51122: {'lr': 0.0003759745633361771, 'samples': 9815424, 'steps': 51121, 'loss/train': 1.8508864641189575} -08/30/2021 22:27:22 - INFO - __main__ - Step 51123: {'lr': 0.0003759699795382863, 'samples': 9815616, 'steps': 51122, 'loss/train': 1.3926717042922974} -08/30/2021 22:27:24 - INFO - __main__ - Step 51124: {'lr': 0.00037596539568363524, 'samples': 9815808, 'steps': 51123, 'loss/train': 1.5257015228271484} -08/30/2021 22:27:24 - INFO - __main__ - Step 51125: {'lr': 0.0003759608117722262, 'samples': 9816000, 'steps': 51124, 'loss/train': 0.9977713823318481} -08/30/2021 22:27:25 - INFO - __main__ - Step 51126: {'lr': 0.00037595622780406114, 'samples': 9816192, 'steps': 51125, 'loss/train': 1.4593037366867065} -08/30/2021 22:27:25 - INFO - __main__ - Step 51127: {'lr': 0.0003759516437791421, 'samples': 9816384, 'steps': 51126, 'loss/train': 1.0894402265548706} -08/30/2021 22:27:25 - INFO - __main__ - Step 51128: {'lr': 0.0003759470596974712, 'samples': 9816576, 'steps': 51127, 'loss/train': 1.4496800899505615} -08/30/2021 22:27:27 - INFO - __main__ - Step 51129: {'lr': 0.0003759424755590505, 'samples': 9816768, 'steps': 51128, 'loss/train': 1.4660627841949463} -08/30/2021 22:27:27 - INFO - __main__ - Step 51130: {'lr': 0.0003759378913638822, 'samples': 9816960, 'steps': 51129, 'loss/train': 1.0081418752670288} -08/30/2021 22:27:28 - INFO - __main__ - Step 51131: {'lr': 0.0003759333071119681, 'samples': 9817152, 'steps': 51130, 'loss/train': 1.3580737113952637} -08/30/2021 22:27:28 - INFO - __main__ - Step 51132: {'lr': 0.0003759287228033104, 'samples': 9817344, 'steps': 51131, 'loss/train': 1.2268321514129639} -08/30/2021 22:27:28 - INFO - __main__ - Step 51133: {'lr': 0.0003759241384379112, 'samples': 9817536, 'steps': 51132, 'loss/train': 1.9298758506774902} -08/30/2021 22:27:30 - INFO - __main__ - Step 51134: {'lr': 0.0003759195540157725, 'samples': 9817728, 'steps': 51133, 'loss/train': 1.9323010444641113} -08/30/2021 22:27:31 - INFO - __main__ - Step 51135: {'lr': 0.00037591496953689644, 'samples': 9817920, 'steps': 51134, 'loss/train': 1.1901570558547974} -08/30/2021 22:27:31 - INFO - __main__ - Step 51136: {'lr': 0.00037591038500128495, 'samples': 9818112, 'steps': 51135, 'loss/train': 1.7500919103622437} -08/30/2021 22:27:31 - INFO - __main__ - Step 51137: {'lr': 0.00037590580040894024, 'samples': 9818304, 'steps': 51136, 'loss/train': 1.491097331047058} -08/30/2021 22:27:32 - INFO - __main__ - Step 51138: {'lr': 0.0003759012157598643, 'samples': 9818496, 'steps': 51137, 'loss/train': 1.2977385520935059} -08/30/2021 22:27:32 - INFO - __main__ - Step 51139: {'lr': 0.00037589663105405924, 'samples': 9818688, 'steps': 51138, 'loss/train': 0.034214574843645096} -08/30/2021 22:27:34 - INFO - __main__ - Step 51140: {'lr': 0.00037589204629152705, 'samples': 9818880, 'steps': 51139, 'loss/train': 1.4670284986495972} -08/30/2021 22:27:34 - INFO - __main__ - Step 51141: {'lr': 0.00037588746147226994, 'samples': 9819072, 'steps': 51140, 'loss/train': 1.605432152748108} -08/30/2021 22:27:34 - INFO - __main__ - Step 51142: {'lr': 0.00037588287659628977, 'samples': 9819264, 'steps': 51141, 'loss/train': 1.2759867906570435} -08/30/2021 22:27:35 - INFO - __main__ - Step 51143: {'lr': 0.0003758782916635888, 'samples': 9819456, 'steps': 51142, 'loss/train': 1.6266380548477173} -08/30/2021 22:27:35 - INFO - __main__ - Step 51144: {'lr': 0.000375873706674169, 'samples': 9819648, 'steps': 51143, 'loss/train': 1.7305018901824951} -08/30/2021 22:27:37 - INFO - __main__ - Step 51145: {'lr': 0.0003758691216280324, 'samples': 9819840, 'steps': 51144, 'loss/train': 1.1952332258224487} -08/30/2021 22:27:37 - INFO - __main__ - Step 51146: {'lr': 0.00037586453652518117, 'samples': 9820032, 'steps': 51145, 'loss/train': 1.9703680276870728} -08/30/2021 22:27:37 - INFO - __main__ - Step 51147: {'lr': 0.00037585995136561734, 'samples': 9820224, 'steps': 51146, 'loss/train': 0.6473832726478577} -08/30/2021 22:27:38 - INFO - __main__ - Step 51148: {'lr': 0.0003758553661493429, 'samples': 9820416, 'steps': 51147, 'loss/train': 0.26936134696006775} -08/30/2021 22:27:38 - INFO - __main__ - Step 51149: {'lr': 0.00037585078087635994, 'samples': 9820608, 'steps': 51148, 'loss/train': 1.6861234903335571} -08/30/2021 22:27:40 - INFO - __main__ - Step 51150: {'lr': 0.00037584619554667065, 'samples': 9820800, 'steps': 51149, 'loss/train': 1.373807668685913} -08/30/2021 22:27:41 - INFO - __main__ - Step 51151: {'lr': 0.000375841610160277, 'samples': 9820992, 'steps': 51150, 'loss/train': 1.2162147760391235} -08/30/2021 22:27:41 - INFO - __main__ - Step 51152: {'lr': 0.00037583702471718106, 'samples': 9821184, 'steps': 51151, 'loss/train': 0.9273143410682678} -08/30/2021 22:27:41 - INFO - __main__ - Step 51153: {'lr': 0.00037583243921738484, 'samples': 9821376, 'steps': 51152, 'loss/train': 1.786708116531372} -08/30/2021 22:27:42 - INFO - __main__ - Step 51154: {'lr': 0.0003758278536608905, 'samples': 9821568, 'steps': 51153, 'loss/train': 1.7401949167251587} -08/30/2021 22:27:42 - INFO - __main__ - Step 51155: {'lr': 0.00037582326804770004, 'samples': 9821760, 'steps': 51154, 'loss/train': 1.1159836053848267} -08/30/2021 22:27:43 - INFO - __main__ - Step 51156: {'lr': 0.0003758186823778156, 'samples': 9821952, 'steps': 51155, 'loss/train': 1.6246800422668457} -08/30/2021 22:27:44 - INFO - __main__ - Step 51157: {'lr': 0.0003758140966512392, 'samples': 9822144, 'steps': 51156, 'loss/train': 1.1771578788757324} -08/30/2021 22:27:44 - INFO - __main__ - Step 51158: {'lr': 0.0003758095108679729, 'samples': 9822336, 'steps': 51157, 'loss/train': 1.7330979108810425} -08/30/2021 22:27:45 - INFO - __main__ - Step 51159: {'lr': 0.0003758049250280188, 'samples': 9822528, 'steps': 51158, 'loss/train': 0.45754772424697876} -08/30/2021 22:27:45 - INFO - __main__ - Step 51160: {'lr': 0.0003758003391313789, 'samples': 9822720, 'steps': 51159, 'loss/train': 1.5674817562103271} -08/30/2021 22:27:47 - INFO - __main__ - Step 51161: {'lr': 0.00037579575317805525, 'samples': 9822912, 'steps': 51160, 'loss/train': 0.47780969738960266} -08/30/2021 22:27:47 - INFO - __main__ - Step 51162: {'lr': 0.00037579116716805007, 'samples': 9823104, 'steps': 51161, 'loss/train': 1.261548399925232} -08/30/2021 22:27:47 - INFO - __main__ - Step 51163: {'lr': 0.00037578658110136535, 'samples': 9823296, 'steps': 51162, 'loss/train': 1.2016081809997559} -08/30/2021 22:27:48 - INFO - __main__ - Step 51164: {'lr': 0.00037578199497800304, 'samples': 9823488, 'steps': 51163, 'loss/train': 1.8022922277450562} -08/30/2021 22:27:48 - INFO - __main__ - Step 51165: {'lr': 0.0003757774087979654, 'samples': 9823680, 'steps': 51164, 'loss/train': 1.188241720199585} -08/30/2021 22:27:49 - INFO - __main__ - Step 51166: {'lr': 0.0003757728225612543, 'samples': 9823872, 'steps': 51165, 'loss/train': 1.1344610452651978} -08/30/2021 22:27:51 - INFO - __main__ - Step 51167: {'lr': 0.00037576823626787203, 'samples': 9824064, 'steps': 51166, 'loss/train': 1.4764689207077026} -08/30/2021 22:27:51 - INFO - __main__ - Step 51168: {'lr': 0.00037576364991782045, 'samples': 9824256, 'steps': 51167, 'loss/train': 1.1658306121826172} -08/30/2021 22:27:51 - INFO - __main__ - Step 51169: {'lr': 0.00037575906351110174, 'samples': 9824448, 'steps': 51168, 'loss/train': 1.5185136795043945} -08/30/2021 22:27:52 - INFO - __main__ - Step 51170: {'lr': 0.0003757544770477179, 'samples': 9824640, 'steps': 51169, 'loss/train': 1.618928074836731} -08/30/2021 22:27:52 - INFO - __main__ - Step 51171: {'lr': 0.00037574989052767106, 'samples': 9824832, 'steps': 51170, 'loss/train': 1.0890928506851196} -08/30/2021 22:27:54 - INFO - __main__ - Step 51172: {'lr': 0.0003757453039509633, 'samples': 9825024, 'steps': 51171, 'loss/train': 1.8198953866958618} -08/30/2021 22:27:54 - INFO - __main__ - Step 51173: {'lr': 0.0003757407173175966, 'samples': 9825216, 'steps': 51172, 'loss/train': 1.3152436017990112} -08/30/2021 22:27:55 - INFO - __main__ - Step 51174: {'lr': 0.00037573613062757304, 'samples': 9825408, 'steps': 51173, 'loss/train': 1.2258979082107544} -08/30/2021 22:27:55 - INFO - __main__ - Step 51175: {'lr': 0.00037573154388089483, 'samples': 9825600, 'steps': 51174, 'loss/train': 1.0650404691696167} -08/30/2021 22:27:55 - INFO - __main__ - Step 51176: {'lr': 0.00037572695707756385, 'samples': 9825792, 'steps': 51175, 'loss/train': 1.4242565631866455} -08/30/2021 22:27:57 - INFO - __main__ - Step 51177: {'lr': 0.0003757223702175822, 'samples': 9825984, 'steps': 51176, 'loss/train': 1.0386673212051392} -08/30/2021 22:27:57 - INFO - __main__ - Step 51178: {'lr': 0.00037571778330095206, 'samples': 9826176, 'steps': 51177, 'loss/train': 1.1864923238754272} -08/30/2021 22:27:58 - INFO - __main__ - Step 51179: {'lr': 0.00037571319632767543, 'samples': 9826368, 'steps': 51178, 'loss/train': 1.5223625898361206} -08/30/2021 22:27:58 - INFO - __main__ - Step 51180: {'lr': 0.0003757086092977544, 'samples': 9826560, 'steps': 51179, 'loss/train': 1.0784481763839722} -08/30/2021 22:27:58 - INFO - __main__ - Step 51181: {'lr': 0.00037570402221119093, 'samples': 9826752, 'steps': 51180, 'loss/train': 1.181361198425293} -08/30/2021 22:27:59 - INFO - __main__ - Step 51182: {'lr': 0.0003756994350679872, 'samples': 9826944, 'steps': 51181, 'loss/train': 1.0486514568328857} -08/30/2021 22:28:00 - INFO - __main__ - Step 51183: {'lr': 0.00037569484786814525, 'samples': 9827136, 'steps': 51182, 'loss/train': 0.5431240200996399} -08/30/2021 22:28:01 - INFO - __main__ - Step 51184: {'lr': 0.0003756902606116671, 'samples': 9827328, 'steps': 51183, 'loss/train': 0.3380163609981537} -08/30/2021 22:28:01 - INFO - __main__ - Step 51185: {'lr': 0.00037568567329855483, 'samples': 9827520, 'steps': 51184, 'loss/train': 1.1516462564468384} -08/30/2021 22:28:01 - INFO - __main__ - Step 51186: {'lr': 0.00037568108592881067, 'samples': 9827712, 'steps': 51185, 'loss/train': 1.8121020793914795} -08/30/2021 22:28:02 - INFO - __main__ - Step 51187: {'lr': 0.00037567649850243646, 'samples': 9827904, 'steps': 51186, 'loss/train': 1.3071725368499756} -08/30/2021 22:28:03 - INFO - __main__ - Step 51188: {'lr': 0.00037567191101943437, 'samples': 9828096, 'steps': 51187, 'loss/train': 0.9554001688957214} -08/30/2021 22:28:04 - INFO - __main__ - Step 51189: {'lr': 0.00037566732347980647, 'samples': 9828288, 'steps': 51188, 'loss/train': 1.4962131977081299} -08/30/2021 22:28:04 - INFO - __main__ - Step 51190: {'lr': 0.0003756627358835548, 'samples': 9828480, 'steps': 51189, 'loss/train': 2.084181070327759} -08/30/2021 22:28:05 - INFO - __main__ - Step 51191: {'lr': 0.00037565814823068143, 'samples': 9828672, 'steps': 51190, 'loss/train': 1.4744069576263428} -08/30/2021 22:28:05 - INFO - __main__ - Step 51192: {'lr': 0.0003756535605211885, 'samples': 9828864, 'steps': 51191, 'loss/train': 1.8504951000213623} -08/30/2021 22:28:06 - INFO - __main__ - Step 51193: {'lr': 0.000375648972755078, 'samples': 9829056, 'steps': 51192, 'loss/train': 0.9381686449050903} -08/30/2021 22:28:07 - INFO - __main__ - Step 51194: {'lr': 0.00037564438493235195, 'samples': 9829248, 'steps': 51193, 'loss/train': 1.825701355934143} -08/30/2021 22:28:07 - INFO - __main__ - Step 51195: {'lr': 0.0003756397970530125, 'samples': 9829440, 'steps': 51194, 'loss/train': 1.492292046546936} -08/30/2021 22:28:08 - INFO - __main__ - Step 51196: {'lr': 0.00037563520911706175, 'samples': 9829632, 'steps': 51195, 'loss/train': 1.1246968507766724} -08/30/2021 22:28:08 - INFO - __main__ - Step 51197: {'lr': 0.0003756306211245016, 'samples': 9829824, 'steps': 51196, 'loss/train': 1.5996488332748413} -08/30/2021 22:28:10 - INFO - __main__ - Step 51198: {'lr': 0.0003756260330753343, 'samples': 9830016, 'steps': 51197, 'loss/train': 0.8708871006965637} -08/30/2021 22:28:10 - INFO - __main__ - Step 51199: {'lr': 0.00037562144496956193, 'samples': 9830208, 'steps': 51198, 'loss/train': 1.4325201511383057} -08/30/2021 22:28:11 - INFO - __main__ - Step 51200: {'lr': 0.0003756168568071864, 'samples': 9830400, 'steps': 51199, 'loss/train': 1.40663480758667} -08/30/2021 22:28:11 - INFO - __main__ - Step 51201: {'lr': 0.0003756122685882098, 'samples': 9830592, 'steps': 51200, 'loss/train': 1.6266249418258667} -08/30/2021 22:28:11 - INFO - __main__ - Step 51202: {'lr': 0.00037560768031263427, 'samples': 9830784, 'steps': 51201, 'loss/train': 1.7748383283615112} -08/30/2021 22:28:12 - INFO - __main__ - Step 51203: {'lr': 0.0003756030919804619, 'samples': 9830976, 'steps': 51202, 'loss/train': 0.03139752894639969} -08/30/2021 22:28:13 - INFO - __main__ - Step 51204: {'lr': 0.00037559850359169465, 'samples': 9831168, 'steps': 51203, 'loss/train': 1.3134340047836304} -08/30/2021 22:28:14 - INFO - __main__ - Step 51205: {'lr': 0.0003755939151463347, 'samples': 9831360, 'steps': 51204, 'loss/train': 0.9820114970207214} -08/30/2021 22:28:14 - INFO - __main__ - Step 51206: {'lr': 0.0003755893266443842, 'samples': 9831552, 'steps': 51205, 'loss/train': 0.6933907270431519} -08/30/2021 22:28:14 - INFO - __main__ - Step 51207: {'lr': 0.0003755847380858449, 'samples': 9831744, 'steps': 51206, 'loss/train': 1.7568676471710205} -08/30/2021 22:28:15 - INFO - __main__ - Step 51208: {'lr': 0.0003755801494707191, 'samples': 9831936, 'steps': 51207, 'loss/train': 0.8567339777946472} -08/30/2021 22:28:15 - INFO - __main__ - Step 51209: {'lr': 0.00037557556079900886, 'samples': 9832128, 'steps': 51208, 'loss/train': 0.8565500974655151} -08/30/2021 22:28:17 - INFO - __main__ - Step 51210: {'lr': 0.0003755709720707161, 'samples': 9832320, 'steps': 51209, 'loss/train': 1.8114852905273438} -08/30/2021 22:28:17 - INFO - __main__ - Step 51211: {'lr': 0.00037556638328584314, 'samples': 9832512, 'steps': 51210, 'loss/train': 1.401003360748291} -08/30/2021 22:28:17 - INFO - __main__ - Step 51212: {'lr': 0.0003755617944443919, 'samples': 9832704, 'steps': 51211, 'loss/train': 1.4610581398010254} -08/30/2021 22:28:18 - INFO - __main__ - Step 51213: {'lr': 0.00037555720554636443, 'samples': 9832896, 'steps': 51212, 'loss/train': 1.4754494428634644} -08/30/2021 22:28:18 - INFO - __main__ - Step 51214: {'lr': 0.00037555261659176275, 'samples': 9833088, 'steps': 51213, 'loss/train': 1.045066475868225} -08/30/2021 22:28:20 - INFO - __main__ - Step 51215: {'lr': 0.00037554802758058903, 'samples': 9833280, 'steps': 51214, 'loss/train': 1.2011256217956543} -08/30/2021 22:28:20 - INFO - __main__ - Step 51216: {'lr': 0.0003755434385128453, 'samples': 9833472, 'steps': 51215, 'loss/train': 1.1464295387268066} -08/30/2021 22:28:21 - INFO - __main__ - Step 51217: {'lr': 0.00037553884938853365, 'samples': 9833664, 'steps': 51216, 'loss/train': 1.6095163822174072} -08/30/2021 22:28:21 - INFO - __main__ - Step 51218: {'lr': 0.0003755342602076561, 'samples': 9833856, 'steps': 51217, 'loss/train': 1.522133469581604} -08/30/2021 22:28:21 - INFO - __main__ - Step 51219: {'lr': 0.0003755296709702148, 'samples': 9834048, 'steps': 51218, 'loss/train': 1.2341580390930176} -08/30/2021 22:28:24 - INFO - __main__ - Step 51220: {'lr': 0.0003755250816762118, 'samples': 9834240, 'steps': 51219, 'loss/train': 0.7191727161407471} -08/30/2021 22:28:24 - INFO - __main__ - Step 51221: {'lr': 0.00037552049232564906, 'samples': 9834432, 'steps': 51220, 'loss/train': 1.31636643409729} -08/30/2021 22:28:25 - INFO - __main__ - Step 51222: {'lr': 0.0003755159029185288, 'samples': 9834624, 'steps': 51221, 'loss/train': 1.9489468336105347} -08/30/2021 22:28:25 - INFO - __main__ - Step 51223: {'lr': 0.0003755113134548529, 'samples': 9834816, 'steps': 51222, 'loss/train': 1.0711981058120728} -08/30/2021 22:28:25 - INFO - __main__ - Step 51224: {'lr': 0.00037550672393462357, 'samples': 9835008, 'steps': 51223, 'loss/train': 1.2760934829711914} -08/30/2021 22:28:27 - INFO - __main__ - Step 51225: {'lr': 0.0003755021343578429, 'samples': 9835200, 'steps': 51224, 'loss/train': 1.8748730421066284} -08/30/2021 22:28:27 - INFO - __main__ - Step 51226: {'lr': 0.0003754975447245129, 'samples': 9835392, 'steps': 51225, 'loss/train': 0.5550345778465271} -08/30/2021 22:28:28 - INFO - __main__ - Step 51227: {'lr': 0.00037549295503463563, 'samples': 9835584, 'steps': 51226, 'loss/train': 1.4395395517349243} -08/30/2021 22:28:28 - INFO - __main__ - Step 51228: {'lr': 0.0003754883652882132, 'samples': 9835776, 'steps': 51227, 'loss/train': 1.1457983255386353} -08/30/2021 22:28:28 - INFO - __main__ - Step 51229: {'lr': 0.00037548377548524755, 'samples': 9835968, 'steps': 51228, 'loss/train': 1.4728339910507202} -08/30/2021 22:28:29 - INFO - __main__ - Step 51230: {'lr': 0.0003754791856257409, 'samples': 9836160, 'steps': 51229, 'loss/train': 1.1951260566711426} -08/30/2021 22:28:30 - INFO - __main__ - Step 51231: {'lr': 0.00037547459570969527, 'samples': 9836352, 'steps': 51230, 'loss/train': 1.1749898195266724} -08/30/2021 22:28:31 - INFO - __main__ - Step 51232: {'lr': 0.0003754700057371127, 'samples': 9836544, 'steps': 51231, 'loss/train': 0.9670997858047485} -08/30/2021 22:28:31 - INFO - __main__ - Step 51233: {'lr': 0.0003754654157079954, 'samples': 9836736, 'steps': 51232, 'loss/train': 1.418890118598938} -08/30/2021 22:28:31 - INFO - __main__ - Step 51234: {'lr': 0.00037546082562234516, 'samples': 9836928, 'steps': 51233, 'loss/train': 1.05770742893219} -08/30/2021 22:28:33 - INFO - __main__ - Step 51235: {'lr': 0.00037545623548016426, 'samples': 9837120, 'steps': 51234, 'loss/train': 1.0730671882629395} -08/30/2021 22:28:34 - INFO - __main__ - Step 51236: {'lr': 0.00037545164528145474, 'samples': 9837312, 'steps': 51235, 'loss/train': 1.0975688695907593} -08/30/2021 22:28:34 - INFO - __main__ - Step 51237: {'lr': 0.00037544705502621866, 'samples': 9837504, 'steps': 51236, 'loss/train': 1.9775018692016602} -08/30/2021 22:28:34 - INFO - __main__ - Step 51238: {'lr': 0.000375442464714458, 'samples': 9837696, 'steps': 51237, 'loss/train': 0.09726051241159439} -08/30/2021 22:28:35 - INFO - __main__ - Step 51239: {'lr': 0.000375437874346175, 'samples': 9837888, 'steps': 51238, 'loss/train': 1.9660171270370483} -08/30/2021 22:28:35 - INFO - __main__ - Step 51240: {'lr': 0.0003754332839213716, 'samples': 9838080, 'steps': 51239, 'loss/train': 0.04566191881895065} -08/30/2021 22:28:36 - INFO - __main__ - Step 51241: {'lr': 0.00037542869344004987, 'samples': 9838272, 'steps': 51240, 'loss/train': 1.3567794561386108} -08/30/2021 22:28:37 - INFO - __main__ - Step 51242: {'lr': 0.0003754241029022119, 'samples': 9838464, 'steps': 51241, 'loss/train': 1.5516606569290161} -08/30/2021 22:28:37 - INFO - __main__ - Step 51243: {'lr': 0.00037541951230785975, 'samples': 9838656, 'steps': 51242, 'loss/train': 0.9326587915420532} -08/30/2021 22:28:38 - INFO - __main__ - Step 51244: {'lr': 0.00037541492165699554, 'samples': 9838848, 'steps': 51243, 'loss/train': 2.3089091777801514} -08/30/2021 22:28:38 - INFO - __main__ - Step 51245: {'lr': 0.0003754103309496213, 'samples': 9839040, 'steps': 51244, 'loss/train': 1.4722384214401245} -08/30/2021 22:28:40 - INFO - __main__ - Step 51246: {'lr': 0.00037540574018573913, 'samples': 9839232, 'steps': 51245, 'loss/train': 1.128090739250183} -08/30/2021 22:28:40 - INFO - __main__ - Step 51247: {'lr': 0.00037540114936535107, 'samples': 9839424, 'steps': 51246, 'loss/train': 0.14142058789730072} -08/30/2021 22:28:40 - INFO - __main__ - Step 51248: {'lr': 0.0003753965584884591, 'samples': 9839616, 'steps': 51247, 'loss/train': 1.6668299436569214} -08/30/2021 22:28:41 - INFO - __main__ - Step 51249: {'lr': 0.00037539196755506546, 'samples': 9839808, 'steps': 51248, 'loss/train': 1.832000732421875} -08/30/2021 22:28:41 - INFO - __main__ - Step 51250: {'lr': 0.0003753873765651721, 'samples': 9840000, 'steps': 51249, 'loss/train': 1.020297646522522} -08/30/2021 22:28:43 - INFO - __main__ - Step 51251: {'lr': 0.0003753827855187811, 'samples': 9840192, 'steps': 51250, 'loss/train': 1.5167356729507446} -08/30/2021 22:28:43 - INFO - __main__ - Step 51252: {'lr': 0.00037537819441589457, 'samples': 9840384, 'steps': 51251, 'loss/train': 1.5461879968643188} -08/30/2021 22:28:43 - INFO - __main__ - Step 51253: {'lr': 0.0003753736032565146, 'samples': 9840576, 'steps': 51252, 'loss/train': 1.443919062614441} -08/30/2021 22:28:44 - INFO - __main__ - Step 51254: {'lr': 0.0003753690120406432, 'samples': 9840768, 'steps': 51253, 'loss/train': 1.263695478439331} -08/30/2021 22:28:44 - INFO - __main__ - Step 51255: {'lr': 0.00037536442076828235, 'samples': 9840960, 'steps': 51254, 'loss/train': 0.6945824027061462} -08/30/2021 22:28:46 - INFO - __main__ - Step 51256: {'lr': 0.00037535982943943437, 'samples': 9841152, 'steps': 51255, 'loss/train': 1.1249960660934448} -08/30/2021 22:28:46 - INFO - __main__ - Step 51257: {'lr': 0.0003753552380541011, 'samples': 9841344, 'steps': 51256, 'loss/train': 1.596789002418518} -08/30/2021 22:28:46 - INFO - __main__ - Step 51258: {'lr': 0.00037535064661228476, 'samples': 9841536, 'steps': 51257, 'loss/train': 1.0218546390533447} -08/30/2021 22:28:47 - INFO - __main__ - Step 51259: {'lr': 0.00037534605511398736, 'samples': 9841728, 'steps': 51258, 'loss/train': 1.5047143697738647} -08/30/2021 22:28:47 - INFO - __main__ - Step 51260: {'lr': 0.0003753414635592109, 'samples': 9841920, 'steps': 51259, 'loss/train': 1.1775612831115723} -08/30/2021 22:28:49 - INFO - __main__ - Step 51261: {'lr': 0.0003753368719479575, 'samples': 9842112, 'steps': 51260, 'loss/train': 1.62895667552948} -08/30/2021 22:28:49 - INFO - __main__ - Step 51262: {'lr': 0.00037533228028022923, 'samples': 9842304, 'steps': 51261, 'loss/train': 1.2367775440216064} -08/30/2021 22:28:50 - INFO - __main__ - Step 51263: {'lr': 0.0003753276885560283, 'samples': 9842496, 'steps': 51262, 'loss/train': 1.105407476425171} -08/30/2021 22:28:50 - INFO - __main__ - Step 51264: {'lr': 0.0003753230967753566, 'samples': 9842688, 'steps': 51263, 'loss/train': 1.9365652799606323} -08/30/2021 22:28:50 - INFO - __main__ - Step 51265: {'lr': 0.00037531850493821616, 'samples': 9842880, 'steps': 51264, 'loss/train': 1.5902912616729736} -08/30/2021 22:28:52 - INFO - __main__ - Step 51266: {'lr': 0.00037531391304460916, 'samples': 9843072, 'steps': 51265, 'loss/train': 1.4760328531265259} -08/30/2021 22:28:52 - INFO - __main__ - Step 51267: {'lr': 0.00037530932109453767, 'samples': 9843264, 'steps': 51266, 'loss/train': 1.6036605834960938} -08/30/2021 22:28:53 - INFO - __main__ - Step 51268: {'lr': 0.00037530472908800375, 'samples': 9843456, 'steps': 51267, 'loss/train': 1.474384069442749} -08/30/2021 22:28:53 - INFO - __main__ - Step 51269: {'lr': 0.0003753001370250094, 'samples': 9843648, 'steps': 51268, 'loss/train': 1.5217070579528809} -08/30/2021 22:28:53 - INFO - __main__ - Step 51270: {'lr': 0.00037529554490555686, 'samples': 9843840, 'steps': 51269, 'loss/train': 0.9764329791069031} -08/30/2021 22:28:55 - INFO - __main__ - Step 51271: {'lr': 0.00037529095272964796, 'samples': 9844032, 'steps': 51270, 'loss/train': 1.4690406322479248} -08/30/2021 22:28:55 - INFO - __main__ - Step 51272: {'lr': 0.0003752863604972849, 'samples': 9844224, 'steps': 51271, 'loss/train': 1.3600951433181763} -08/30/2021 22:28:56 - INFO - __main__ - Step 51273: {'lr': 0.00037528176820846975, 'samples': 9844416, 'steps': 51272, 'loss/train': 1.4935764074325562} -08/30/2021 22:28:56 - INFO - __main__ - Step 51274: {'lr': 0.00037527717586320457, 'samples': 9844608, 'steps': 51273, 'loss/train': 1.0626734495162964} -08/30/2021 22:28:56 - INFO - __main__ - Step 51275: {'lr': 0.00037527258346149153, 'samples': 9844800, 'steps': 51274, 'loss/train': 1.2351486682891846} -08/30/2021 22:28:57 - INFO - __main__ - Step 51276: {'lr': 0.0003752679910033325, 'samples': 9844992, 'steps': 51275, 'loss/train': 1.9000072479248047} -08/30/2021 22:28:59 - INFO - __main__ - Step 51277: {'lr': 0.00037526339848872956, 'samples': 9845184, 'steps': 51276, 'loss/train': 1.7238506078720093} -08/30/2021 22:28:59 - INFO - __main__ - Step 51278: {'lr': 0.000375258805917685, 'samples': 9845376, 'steps': 51277, 'loss/train': 1.5105801820755005} -08/30/2021 22:29:00 - INFO - __main__ - Step 51279: {'lr': 0.0003752542132902007, 'samples': 9845568, 'steps': 51278, 'loss/train': 1.4521934986114502} -08/30/2021 22:29:00 - INFO - __main__ - Step 51280: {'lr': 0.00037524962060627885, 'samples': 9845760, 'steps': 51279, 'loss/train': 1.3687751293182373} -08/30/2021 22:29:00 - INFO - __main__ - Step 51281: {'lr': 0.0003752450278659214, 'samples': 9845952, 'steps': 51280, 'loss/train': 1.4386978149414062} -08/30/2021 22:29:02 - INFO - __main__ - Step 51282: {'lr': 0.00037524043506913045, 'samples': 9846144, 'steps': 51281, 'loss/train': 1.0775789022445679} -08/30/2021 22:29:02 - INFO - __main__ - Step 51283: {'lr': 0.0003752358422159081, 'samples': 9846336, 'steps': 51282, 'loss/train': 1.1652660369873047} -08/30/2021 22:29:03 - INFO - __main__ - Step 51284: {'lr': 0.0003752312493062564, 'samples': 9846528, 'steps': 51283, 'loss/train': 1.4689677953720093} -08/30/2021 22:29:03 - INFO - __main__ - Step 51285: {'lr': 0.0003752266563401775, 'samples': 9846720, 'steps': 51284, 'loss/train': 0.9760374426841736} -08/30/2021 22:29:04 - INFO - __main__ - Step 51286: {'lr': 0.00037522206331767335, 'samples': 9846912, 'steps': 51285, 'loss/train': 0.7064561247825623} -08/30/2021 22:29:05 - INFO - __main__ - Step 51287: {'lr': 0.00037521747023874606, 'samples': 9847104, 'steps': 51286, 'loss/train': 2.410125970840454} -08/30/2021 22:29:05 - INFO - __main__ - Step 51288: {'lr': 0.0003752128771033978, 'samples': 9847296, 'steps': 51287, 'loss/train': 1.2347930669784546} -08/30/2021 22:29:06 - INFO - __main__ - Step 51289: {'lr': 0.0003752082839116304, 'samples': 9847488, 'steps': 51288, 'loss/train': 0.9653266072273254} -08/30/2021 22:29:06 - INFO - __main__ - Step 51290: {'lr': 0.0003752036906634462, 'samples': 9847680, 'steps': 51289, 'loss/train': 1.2839741706848145} -08/30/2021 22:29:06 - INFO - __main__ - Step 51291: {'lr': 0.0003751990973588471, 'samples': 9847872, 'steps': 51290, 'loss/train': 1.5282231569290161} -08/30/2021 22:29:08 - INFO - __main__ - Step 51292: {'lr': 0.0003751945039978353, 'samples': 9848064, 'steps': 51291, 'loss/train': 1.4868710041046143} -08/30/2021 22:29:08 - INFO - __main__ - Step 51293: {'lr': 0.00037518991058041267, 'samples': 9848256, 'steps': 51292, 'loss/train': 1.5949047803878784} -08/30/2021 22:29:09 - INFO - __main__ - Step 51294: {'lr': 0.00037518531710658144, 'samples': 9848448, 'steps': 51293, 'loss/train': 1.6631672382354736} -08/30/2021 22:29:09 - INFO - __main__ - Step 51295: {'lr': 0.0003751807235763437, 'samples': 9848640, 'steps': 51294, 'loss/train': 1.4661540985107422} -08/30/2021 22:29:09 - INFO - __main__ - Step 51296: {'lr': 0.00037517612998970136, 'samples': 9848832, 'steps': 51295, 'loss/train': 1.4969547986984253} -08/30/2021 22:29:11 - INFO - __main__ - Step 51297: {'lr': 0.00037517153634665664, 'samples': 9849024, 'steps': 51296, 'loss/train': 1.6464662551879883} -08/30/2021 22:29:11 - INFO - __main__ - Step 51298: {'lr': 0.0003751669426472115, 'samples': 9849216, 'steps': 51297, 'loss/train': 0.9657031297683716} -08/30/2021 22:29:12 - INFO - __main__ - Step 51299: {'lr': 0.0003751623488913681, 'samples': 9849408, 'steps': 51298, 'loss/train': 1.131405234336853} -08/30/2021 22:29:12 - INFO - __main__ - Step 51300: {'lr': 0.00037515775507912855, 'samples': 9849600, 'steps': 51299, 'loss/train': 1.3076097965240479} -08/30/2021 22:29:12 - INFO - __main__ - Step 51301: {'lr': 0.0003751531612104948, 'samples': 9849792, 'steps': 51300, 'loss/train': 0.25848427414894104} -08/30/2021 22:29:14 - INFO - __main__ - Step 51302: {'lr': 0.00037514856728546893, 'samples': 9849984, 'steps': 51301, 'loss/train': 1.4348535537719727} -08/30/2021 22:29:14 - INFO - __main__ - Step 51303: {'lr': 0.00037514397330405306, 'samples': 9850176, 'steps': 51302, 'loss/train': 1.7946664094924927} -08/30/2021 22:29:15 - INFO - __main__ - Step 51304: {'lr': 0.00037513937926624924, 'samples': 9850368, 'steps': 51303, 'loss/train': 1.256117820739746} -08/30/2021 22:29:15 - INFO - __main__ - Step 51305: {'lr': 0.0003751347851720596, 'samples': 9850560, 'steps': 51304, 'loss/train': 1.2072410583496094} -08/30/2021 22:29:15 - INFO - __main__ - Step 51306: {'lr': 0.00037513019102148606, 'samples': 9850752, 'steps': 51305, 'loss/train': 0.5593969821929932} -08/30/2021 22:29:17 - INFO - __main__ - Step 51307: {'lr': 0.0003751255968145309, 'samples': 9850944, 'steps': 51306, 'loss/train': 1.917822241783142} -08/30/2021 22:29:18 - INFO - __main__ - Step 51308: {'lr': 0.00037512100255119603, 'samples': 9851136, 'steps': 51307, 'loss/train': 0.7802227139472961} -08/30/2021 22:29:18 - INFO - __main__ - Step 51309: {'lr': 0.0003751164082314835, 'samples': 9851328, 'steps': 51308, 'loss/train': 0.05756458640098572} -08/30/2021 22:29:18 - INFO - __main__ - Step 51310: {'lr': 0.00037511181385539553, 'samples': 9851520, 'steps': 51309, 'loss/train': 0.9711182117462158} -08/30/2021 22:29:19 - INFO - __main__ - Step 51311: {'lr': 0.00037510721942293415, 'samples': 9851712, 'steps': 51310, 'loss/train': 1.6188971996307373} -08/30/2021 22:29:19 - INFO - __main__ - Step 51312: {'lr': 0.0003751026249341013, 'samples': 9851904, 'steps': 51311, 'loss/train': 1.1854959726333618} -08/30/2021 22:29:21 - INFO - __main__ - Step 51313: {'lr': 0.0003750980303888991, 'samples': 9852096, 'steps': 51312, 'loss/train': 1.1292489767074585} -08/30/2021 22:29:21 - INFO - __main__ - Step 51314: {'lr': 0.0003750934357873298, 'samples': 9852288, 'steps': 51313, 'loss/train': 0.8393359780311584} -08/30/2021 22:29:22 - INFO - __main__ - Step 51315: {'lr': 0.00037508884112939523, 'samples': 9852480, 'steps': 51314, 'loss/train': 1.280697226524353} -08/30/2021 22:29:22 - INFO - __main__ - Step 51316: {'lr': 0.0003750842464150975, 'samples': 9852672, 'steps': 51315, 'loss/train': 1.4953235387802124} -08/30/2021 22:29:22 - INFO - __main__ - Step 51317: {'lr': 0.0003750796516444389, 'samples': 9852864, 'steps': 51316, 'loss/train': 1.2516376972198486} -08/30/2021 22:29:24 - INFO - __main__ - Step 51318: {'lr': 0.0003750750568174212, 'samples': 9853056, 'steps': 51317, 'loss/train': 1.1759735345840454} -08/30/2021 22:29:24 - INFO - __main__ - Step 51319: {'lr': 0.00037507046193404665, 'samples': 9853248, 'steps': 51318, 'loss/train': 1.674957275390625} -08/30/2021 22:29:25 - INFO - __main__ - Step 51320: {'lr': 0.0003750658669943173, 'samples': 9853440, 'steps': 51319, 'loss/train': 1.8563592433929443} -08/30/2021 22:29:25 - INFO - __main__ - Step 51321: {'lr': 0.00037506127199823523, 'samples': 9853632, 'steps': 51320, 'loss/train': 0.7560064792633057} -08/30/2021 22:29:25 - INFO - __main__ - Step 51322: {'lr': 0.00037505667694580244, 'samples': 9853824, 'steps': 51321, 'loss/train': 1.113816261291504} -08/30/2021 22:29:27 - INFO - __main__ - Step 51323: {'lr': 0.000375052081837021, 'samples': 9854016, 'steps': 51322, 'loss/train': 0.9332059621810913} -08/30/2021 22:29:27 - INFO - __main__ - Step 51324: {'lr': 0.0003750474866718931, 'samples': 9854208, 'steps': 51323, 'loss/train': 1.5627442598342896} -08/30/2021 22:29:28 - INFO - __main__ - Step 51325: {'lr': 0.0003750428914504207, 'samples': 9854400, 'steps': 51324, 'loss/train': 0.509478747844696} -08/30/2021 22:29:28 - INFO - __main__ - Step 51326: {'lr': 0.0003750382961726059, 'samples': 9854592, 'steps': 51325, 'loss/train': 1.2357443571090698} -08/30/2021 22:29:28 - INFO - __main__ - Step 51327: {'lr': 0.0003750337008384508, 'samples': 9854784, 'steps': 51326, 'loss/train': 1.1114829778671265} -08/30/2021 22:29:30 - INFO - __main__ - Step 51328: {'lr': 0.0003750291054479574, 'samples': 9854976, 'steps': 51327, 'loss/train': 1.0996270179748535} -08/30/2021 22:29:31 - INFO - __main__ - Step 51329: {'lr': 0.0003750245100011278, 'samples': 9855168, 'steps': 51328, 'loss/train': 1.6564158201217651} -08/30/2021 22:29:31 - INFO - __main__ - Step 51330: {'lr': 0.00037501991449796415, 'samples': 9855360, 'steps': 51329, 'loss/train': 2.057136297225952} -08/30/2021 22:29:32 - INFO - __main__ - Step 51331: {'lr': 0.0003750153189384684, 'samples': 9855552, 'steps': 51330, 'loss/train': 1.3453997373580933} -08/30/2021 22:29:32 - INFO - __main__ - Step 51332: {'lr': 0.00037501072332264267, 'samples': 9855744, 'steps': 51331, 'loss/train': 2.3266890048980713} -08/30/2021 22:29:33 - INFO - __main__ - Step 51333: {'lr': 0.0003750061276504891, 'samples': 9855936, 'steps': 51332, 'loss/train': 1.254947304725647} -08/30/2021 22:29:34 - INFO - __main__ - Step 51334: {'lr': 0.0003750015319220097, 'samples': 9856128, 'steps': 51333, 'loss/train': 1.49747633934021} -08/30/2021 22:29:34 - INFO - __main__ - Step 51335: {'lr': 0.0003749969361372065, 'samples': 9856320, 'steps': 51334, 'loss/train': 1.5871186256408691} -08/30/2021 22:29:35 - INFO - __main__ - Step 51336: {'lr': 0.0003749923402960816, 'samples': 9856512, 'steps': 51335, 'loss/train': 1.6737924814224243} -08/30/2021 22:29:35 - INFO - __main__ - Step 51337: {'lr': 0.00037498774439863704, 'samples': 9856704, 'steps': 51336, 'loss/train': 1.835592269897461} -08/30/2021 22:29:35 - INFO - __main__ - Step 51338: {'lr': 0.000374983148444875, 'samples': 9856896, 'steps': 51337, 'loss/train': 1.2666033506393433} -08/30/2021 22:29:37 - INFO - __main__ - Step 51339: {'lr': 0.00037497855243479744, 'samples': 9857088, 'steps': 51338, 'loss/train': 1.1092997789382935} -08/30/2021 22:29:37 - INFO - __main__ - Step 51340: {'lr': 0.0003749739563684065, 'samples': 9857280, 'steps': 51339, 'loss/train': 1.1301703453063965} -08/30/2021 22:29:38 - INFO - __main__ - Step 51341: {'lr': 0.00037496936024570426, 'samples': 9857472, 'steps': 51340, 'loss/train': 1.421207308769226} -08/30/2021 22:29:38 - INFO - __main__ - Step 51342: {'lr': 0.0003749647640666927, 'samples': 9857664, 'steps': 51341, 'loss/train': 1.42851984500885} -08/30/2021 22:29:38 - INFO - __main__ - Step 51343: {'lr': 0.000374960167831374, 'samples': 9857856, 'steps': 51342, 'loss/train': 1.6294177770614624} -08/30/2021 22:29:40 - INFO - __main__ - Step 51344: {'lr': 0.00037495557153975016, 'samples': 9858048, 'steps': 51343, 'loss/train': 1.4724314212799072} -08/30/2021 22:29:40 - INFO - __main__ - Step 51345: {'lr': 0.0003749509751918232, 'samples': 9858240, 'steps': 51344, 'loss/train': 1.4510048627853394} -08/30/2021 22:29:41 - INFO - __main__ - Step 51346: {'lr': 0.0003749463787875953, 'samples': 9858432, 'steps': 51345, 'loss/train': 1.2277531623840332} -08/30/2021 22:29:41 - INFO - __main__ - Step 51347: {'lr': 0.00037494178232706847, 'samples': 9858624, 'steps': 51346, 'loss/train': 1.0561978816986084} -08/30/2021 22:29:42 - INFO - __main__ - Step 51348: {'lr': 0.00037493718581024484, 'samples': 9858816, 'steps': 51347, 'loss/train': 1.7972724437713623} -08/30/2021 22:29:43 - INFO - __main__ - Step 51349: {'lr': 0.0003749325892371264, 'samples': 9859008, 'steps': 51348, 'loss/train': 1.624428391456604} -08/30/2021 22:29:44 - INFO - __main__ - Step 51350: {'lr': 0.0003749279926077153, 'samples': 9859200, 'steps': 51349, 'loss/train': 0.8268048763275146} -08/30/2021 22:29:44 - INFO - __main__ - Step 51351: {'lr': 0.0003749233959220136, 'samples': 9859392, 'steps': 51350, 'loss/train': 0.9024322032928467} -08/30/2021 22:29:44 - INFO - __main__ - Step 51352: {'lr': 0.00037491879918002323, 'samples': 9859584, 'steps': 51351, 'loss/train': 0.89680415391922} -08/30/2021 22:29:45 - INFO - __main__ - Step 51353: {'lr': 0.0003749142023817465, 'samples': 9859776, 'steps': 51352, 'loss/train': 1.2557790279388428} -08/30/2021 22:29:45 - INFO - __main__ - Step 51354: {'lr': 0.00037490960552718534, 'samples': 9859968, 'steps': 51353, 'loss/train': 5.8465094566345215} -08/30/2021 22:29:47 - INFO - __main__ - Step 51355: {'lr': 0.00037490500861634183, 'samples': 9860160, 'steps': 51354, 'loss/train': 1.375968337059021} -08/30/2021 22:29:47 - INFO - __main__ - Step 51356: {'lr': 0.00037490041164921803, 'samples': 9860352, 'steps': 51355, 'loss/train': 1.1428078413009644} -08/30/2021 22:29:48 - INFO - __main__ - Step 51357: {'lr': 0.000374895814625816, 'samples': 9860544, 'steps': 51356, 'loss/train': 0.0932147428393364} -08/30/2021 22:29:48 - INFO - __main__ - Step 51358: {'lr': 0.00037489121754613787, 'samples': 9860736, 'steps': 51357, 'loss/train': 1.2024534940719604} -08/30/2021 22:29:48 - INFO - __main__ - Step 51359: {'lr': 0.00037488662041018574, 'samples': 9860928, 'steps': 51358, 'loss/train': 1.1072344779968262} -08/30/2021 22:29:50 - INFO - __main__ - Step 51360: {'lr': 0.00037488202321796156, 'samples': 9861120, 'steps': 51359, 'loss/train': 1.6473231315612793} -08/30/2021 22:29:50 - INFO - __main__ - Step 51361: {'lr': 0.0003748774259694675, 'samples': 9861312, 'steps': 51360, 'loss/train': 1.4028126001358032} -08/30/2021 22:29:50 - INFO - __main__ - Step 51362: {'lr': 0.00037487282866470565, 'samples': 9861504, 'steps': 51361, 'loss/train': 0.8303579092025757} -08/30/2021 22:29:51 - INFO - __main__ - Step 51363: {'lr': 0.00037486823130367786, 'samples': 9861696, 'steps': 51362, 'loss/train': 1.4941444396972656} -08/30/2021 22:29:51 - INFO - __main__ - Step 51364: {'lr': 0.0003748636338863865, 'samples': 9861888, 'steps': 51363, 'loss/train': 1.4180796146392822} -08/30/2021 22:29:53 - INFO - __main__ - Step 51365: {'lr': 0.0003748590364128335, 'samples': 9862080, 'steps': 51364, 'loss/train': 0.11163672059774399} -08/30/2021 22:29:54 - INFO - __main__ - Step 51366: {'lr': 0.00037485443888302095, 'samples': 9862272, 'steps': 51365, 'loss/train': 1.5435107946395874} -08/30/2021 22:29:54 - INFO - __main__ - Step 51367: {'lr': 0.00037484984129695096, 'samples': 9862464, 'steps': 51366, 'loss/train': 1.807789921760559} -08/30/2021 22:29:54 - INFO - __main__ - Step 51368: {'lr': 0.00037484524365462545, 'samples': 9862656, 'steps': 51367, 'loss/train': 0.9509342312812805} -08/30/2021 22:29:55 - INFO - __main__ - Step 51369: {'lr': 0.0003748406459560466, 'samples': 9862848, 'steps': 51368, 'loss/train': 1.2699956893920898} -08/30/2021 22:29:55 - INFO - __main__ - Step 51370: {'lr': 0.0003748360482012166, 'samples': 9863040, 'steps': 51369, 'loss/train': 0.11819048970937729} -08/30/2021 22:29:56 - INFO - __main__ - Step 51371: {'lr': 0.00037483145039013735, 'samples': 9863232, 'steps': 51370, 'loss/train': 1.3368152379989624} -08/30/2021 22:29:57 - INFO - __main__ - Step 51372: {'lr': 0.0003748268525228109, 'samples': 9863424, 'steps': 51371, 'loss/train': 1.1307731866836548} -08/30/2021 22:29:57 - INFO - __main__ - Step 51373: {'lr': 0.00037482225459923945, 'samples': 9863616, 'steps': 51372, 'loss/train': 1.1255041360855103} -08/30/2021 22:29:58 - INFO - __main__ - Step 51374: {'lr': 0.00037481765661942506, 'samples': 9863808, 'steps': 51373, 'loss/train': 0.43376192450523376} -08/30/2021 22:29:58 - INFO - __main__ - Step 51375: {'lr': 0.0003748130585833697, 'samples': 9864000, 'steps': 51374, 'loss/train': 0.8339983820915222} -08/30/2021 22:29:59 - INFO - __main__ - Step 51376: {'lr': 0.0003748084604910755, 'samples': 9864192, 'steps': 51375, 'loss/train': 1.5910978317260742} -08/30/2021 22:30:00 - INFO - __main__ - Step 51377: {'lr': 0.0003748038623425446, 'samples': 9864384, 'steps': 51376, 'loss/train': 1.4316824674606323} -08/30/2021 22:30:00 - INFO - __main__ - Step 51378: {'lr': 0.00037479926413777896, 'samples': 9864576, 'steps': 51377, 'loss/train': 1.5871822834014893} -08/30/2021 22:30:01 - INFO - __main__ - Step 51379: {'lr': 0.0003747946658767807, 'samples': 9864768, 'steps': 51378, 'loss/train': 1.4499775171279907} -08/30/2021 22:30:01 - INFO - __main__ - Step 51380: {'lr': 0.0003747900675595519, 'samples': 9864960, 'steps': 51379, 'loss/train': 1.1597874164581299} -08/30/2021 22:30:03 - INFO - __main__ - Step 51381: {'lr': 0.00037478546918609464, 'samples': 9865152, 'steps': 51380, 'loss/train': 1.4608900547027588} -08/30/2021 22:30:03 - INFO - __main__ - Step 51382: {'lr': 0.00037478087075641095, 'samples': 9865344, 'steps': 51381, 'loss/train': 1.5292834043502808} -08/30/2021 22:30:03 - INFO - __main__ - Step 51383: {'lr': 0.00037477627227050286, 'samples': 9865536, 'steps': 51382, 'loss/train': 2.05181884765625} -08/30/2021 22:30:04 - INFO - __main__ - Step 51384: {'lr': 0.0003747716737283726, 'samples': 9865728, 'steps': 51383, 'loss/train': 0.7129995226860046} -08/30/2021 22:30:04 - INFO - __main__ - Step 51385: {'lr': 0.00037476707513002213, 'samples': 9865920, 'steps': 51384, 'loss/train': 1.353680968284607} -08/30/2021 22:30:06 - INFO - __main__ - Step 51386: {'lr': 0.0003747624764754535, 'samples': 9866112, 'steps': 51385, 'loss/train': 0.06397978961467743} -08/30/2021 22:30:07 - INFO - __main__ - Step 51387: {'lr': 0.00037475787776466887, 'samples': 9866304, 'steps': 51386, 'loss/train': 0.8257332444190979} -08/30/2021 22:30:07 - INFO - __main__ - Step 51388: {'lr': 0.00037475327899767026, 'samples': 9866496, 'steps': 51387, 'loss/train': 1.0156002044677734} -08/30/2021 22:30:07 - INFO - __main__ - Step 51389: {'lr': 0.0003747486801744597, 'samples': 9866688, 'steps': 51388, 'loss/train': 1.4870741367340088} -08/30/2021 22:30:08 - INFO - __main__ - Step 51390: {'lr': 0.0003747440812950393, 'samples': 9866880, 'steps': 51389, 'loss/train': 1.0778515338897705} -08/30/2021 22:30:10 - INFO - __main__ - Step 51391: {'lr': 0.0003747394823594112, 'samples': 9867072, 'steps': 51390, 'loss/train': 1.197513461112976} -08/30/2021 22:30:11 - INFO - __main__ - Step 51392: {'lr': 0.00037473488336757743, 'samples': 9867264, 'steps': 51391, 'loss/train': 1.507083535194397} -08/30/2021 22:30:11 - INFO - __main__ - Step 51393: {'lr': 0.00037473028431954006, 'samples': 9867456, 'steps': 51392, 'loss/train': 0.9903676509857178} -08/30/2021 22:30:11 - INFO - __main__ - Step 51394: {'lr': 0.00037472568521530107, 'samples': 9867648, 'steps': 51393, 'loss/train': 1.18123197555542} -08/30/2021 22:30:12 - INFO - __main__ - Step 51395: {'lr': 0.0003747210860548627, 'samples': 9867840, 'steps': 51394, 'loss/train': 1.7999238967895508} -08/30/2021 22:30:12 - INFO - __main__ - Step 51396: {'lr': 0.00037471648683822683, 'samples': 9868032, 'steps': 51395, 'loss/train': 1.7751226425170898} -08/30/2021 22:30:12 - INFO - __main__ - Step 51397: {'lr': 0.0003747118875653957, 'samples': 9868224, 'steps': 51396, 'loss/train': 1.803802728652954} -08/30/2021 22:30:13 - INFO - __main__ - Step 51398: {'lr': 0.00037470728823637135, 'samples': 9868416, 'steps': 51397, 'loss/train': 0.15961065888404846} -08/30/2021 22:30:14 - INFO - __main__ - Step 51399: {'lr': 0.0003747026888511558, 'samples': 9868608, 'steps': 51398, 'loss/train': 1.3193204402923584} -08/30/2021 22:30:15 - INFO - __main__ - Step 51400: {'lr': 0.00037469808940975106, 'samples': 9868800, 'steps': 51399, 'loss/train': 1.1885268688201904} -08/30/2021 22:30:15 - INFO - __main__ - Step 51401: {'lr': 0.00037469348991215934, 'samples': 9868992, 'steps': 51400, 'loss/train': 1.084804892539978} -08/30/2021 22:30:15 - INFO - __main__ - Step 51402: {'lr': 0.00037468889035838264, 'samples': 9869184, 'steps': 51401, 'loss/train': 1.316615343093872} -08/30/2021 22:30:16 - INFO - __main__ - Step 51403: {'lr': 0.0003746842907484231, 'samples': 9869376, 'steps': 51402, 'loss/train': 1.0453486442565918} -08/30/2021 22:30:17 - INFO - __main__ - Step 51404: {'lr': 0.0003746796910822827, 'samples': 9869568, 'steps': 51403, 'loss/train': 0.6009833812713623} -08/30/2021 22:30:18 - INFO - __main__ - Step 51405: {'lr': 0.0003746750913599636, 'samples': 9869760, 'steps': 51404, 'loss/train': 1.174621343612671} -08/30/2021 22:30:18 - INFO - __main__ - Step 51406: {'lr': 0.00037467049158146777, 'samples': 9869952, 'steps': 51405, 'loss/train': 1.8217114210128784} -08/30/2021 22:30:18 - INFO - __main__ - Step 51407: {'lr': 0.00037466589174679733, 'samples': 9870144, 'steps': 51406, 'loss/train': 1.3290667533874512} -08/30/2021 22:30:19 - INFO - __main__ - Step 51408: {'lr': 0.0003746612918559544, 'samples': 9870336, 'steps': 51407, 'loss/train': 1.3627574443817139} -08/30/2021 22:30:20 - INFO - __main__ - Step 51409: {'lr': 0.00037465669190894107, 'samples': 9870528, 'steps': 51408, 'loss/train': 1.7998628616333008} -08/30/2021 22:30:21 - INFO - __main__ - Step 51410: {'lr': 0.00037465209190575927, 'samples': 9870720, 'steps': 51409, 'loss/train': 0.9656294584274292} -08/30/2021 22:30:21 - INFO - __main__ - Step 51411: {'lr': 0.00037464749184641123, 'samples': 9870912, 'steps': 51410, 'loss/train': 1.280968427658081} -08/30/2021 22:30:22 - INFO - __main__ - Step 51412: {'lr': 0.0003746428917308989, 'samples': 9871104, 'steps': 51411, 'loss/train': 1.2487115859985352} -08/30/2021 22:30:22 - INFO - __main__ - Step 51413: {'lr': 0.0003746382915592244, 'samples': 9871296, 'steps': 51412, 'loss/train': 1.6149616241455078} -08/30/2021 22:30:22 - INFO - __main__ - Step 51414: {'lr': 0.0003746336913313898, 'samples': 9871488, 'steps': 51413, 'loss/train': 1.5198841094970703} -08/30/2021 22:30:24 - INFO - __main__ - Step 51415: {'lr': 0.0003746290910473973, 'samples': 9871680, 'steps': 51414, 'loss/train': 4.683076858520508} -08/30/2021 22:30:25 - INFO - __main__ - Step 51416: {'lr': 0.00037462449070724876, 'samples': 9871872, 'steps': 51415, 'loss/train': 1.9120951890945435} -08/30/2021 22:30:25 - INFO - __main__ - Step 51417: {'lr': 0.00037461989031094636, 'samples': 9872064, 'steps': 51416, 'loss/train': 1.7031983137130737} -08/30/2021 22:30:25 - INFO - __main__ - Step 51418: {'lr': 0.00037461528985849215, 'samples': 9872256, 'steps': 51417, 'loss/train': 0.8126934766769409} -08/30/2021 22:30:26 - INFO - __main__ - Step 51419: {'lr': 0.0003746106893498882, 'samples': 9872448, 'steps': 51418, 'loss/train': 1.5206992626190186} -08/30/2021 22:30:27 - INFO - __main__ - Step 51420: {'lr': 0.00037460608878513656, 'samples': 9872640, 'steps': 51419, 'loss/train': 1.5701783895492554} -08/30/2021 22:30:28 - INFO - __main__ - Step 51421: {'lr': 0.00037460148816423946, 'samples': 9872832, 'steps': 51420, 'loss/train': 1.339674472808838} -08/30/2021 22:30:28 - INFO - __main__ - Step 51422: {'lr': 0.0003745968874871988, 'samples': 9873024, 'steps': 51421, 'loss/train': 1.094204068183899} -08/30/2021 22:30:28 - INFO - __main__ - Step 51423: {'lr': 0.00037459228675401667, 'samples': 9873216, 'steps': 51422, 'loss/train': 0.7770503759384155} -08/30/2021 22:30:29 - INFO - __main__ - Step 51424: {'lr': 0.00037458768596469516, 'samples': 9873408, 'steps': 51423, 'loss/train': 1.3026182651519775} -08/30/2021 22:30:31 - INFO - __main__ - Step 51425: {'lr': 0.0003745830851192364, 'samples': 9873600, 'steps': 51424, 'loss/train': 0.05961012840270996} -08/30/2021 22:30:31 - INFO - __main__ - Step 51426: {'lr': 0.00037457848421764247, 'samples': 9873792, 'steps': 51425, 'loss/train': 1.2662992477416992} -08/30/2021 22:30:32 - INFO - __main__ - Step 51427: {'lr': 0.0003745738832599153, 'samples': 9873984, 'steps': 51426, 'loss/train': 0.8151814937591553} -08/30/2021 22:30:32 - INFO - __main__ - Step 51428: {'lr': 0.0003745692822460572, 'samples': 9874176, 'steps': 51427, 'loss/train': 1.4519838094711304} -08/30/2021 22:30:32 - INFO - __main__ - Step 51429: {'lr': 0.00037456468117607, 'samples': 9874368, 'steps': 51428, 'loss/train': 1.6214792728424072} -08/30/2021 22:30:33 - INFO - __main__ - Step 51430: {'lr': 0.0003745600800499559, 'samples': 9874560, 'steps': 51429, 'loss/train': 1.1946426630020142} -08/30/2021 22:30:34 - INFO - __main__ - Step 51431: {'lr': 0.0003745554788677169, 'samples': 9874752, 'steps': 51430, 'loss/train': 0.8256950378417969} -08/30/2021 22:30:35 - INFO - __main__ - Step 51432: {'lr': 0.0003745508776293551, 'samples': 9874944, 'steps': 51431, 'loss/train': 1.9110429286956787} -08/30/2021 22:30:35 - INFO - __main__ - Step 51433: {'lr': 0.0003745462763348727, 'samples': 9875136, 'steps': 51432, 'loss/train': 1.3494125604629517} -08/30/2021 22:30:35 - INFO - __main__ - Step 51434: {'lr': 0.00037454167498427165, 'samples': 9875328, 'steps': 51433, 'loss/train': 1.4760828018188477} -08/30/2021 22:30:36 - INFO - __main__ - Step 51435: {'lr': 0.0003745370735775541, 'samples': 9875520, 'steps': 51434, 'loss/train': 0.4241074323654175} -08/30/2021 22:30:36 - INFO - __main__ - Step 51436: {'lr': 0.00037453247211472195, 'samples': 9875712, 'steps': 51435, 'loss/train': 1.6919045448303223} -08/30/2021 22:30:38 - INFO - __main__ - Step 51437: {'lr': 0.0003745278705957774, 'samples': 9875904, 'steps': 51436, 'loss/train': 1.81698477268219} -08/30/2021 22:30:39 - INFO - __main__ - Step 51438: {'lr': 0.00037452326902072256, 'samples': 9876096, 'steps': 51437, 'loss/train': 1.704921841621399} -08/30/2021 22:30:39 - INFO - __main__ - Step 51439: {'lr': 0.0003745186673895594, 'samples': 9876288, 'steps': 51438, 'loss/train': 1.6699382066726685} -08/30/2021 22:30:39 - INFO - __main__ - Step 51440: {'lr': 0.0003745140657022901, 'samples': 9876480, 'steps': 51439, 'loss/train': 0.807083010673523} -08/30/2021 22:30:40 - INFO - __main__ - Step 51441: {'lr': 0.0003745094639589167, 'samples': 9876672, 'steps': 51440, 'loss/train': 1.2464178800582886} -08/30/2021 22:30:41 - INFO - __main__ - Step 51442: {'lr': 0.00037450486215944123, 'samples': 9876864, 'steps': 51441, 'loss/train': 0.7804450392723083} -08/30/2021 22:30:42 - INFO - __main__ - Step 51443: {'lr': 0.0003745002603038658, 'samples': 9877056, 'steps': 51442, 'loss/train': 1.2219847440719604} -08/30/2021 22:30:42 - INFO - __main__ - Step 51444: {'lr': 0.00037449565839219246, 'samples': 9877248, 'steps': 51443, 'loss/train': 1.6360878944396973} -08/30/2021 22:30:43 - INFO - __main__ - Step 51445: {'lr': 0.0003744910564244233, 'samples': 9877440, 'steps': 51444, 'loss/train': 0.06180236488580704} -08/30/2021 22:30:43 - INFO - __main__ - Step 51446: {'lr': 0.0003744864544005604, 'samples': 9877632, 'steps': 51445, 'loss/train': 2.03151273727417} -08/30/2021 22:30:44 - INFO - __main__ - Step 51447: {'lr': 0.0003744818523206058, 'samples': 9877824, 'steps': 51446, 'loss/train': 1.0139405727386475} -08/30/2021 22:30:45 - INFO - __main__ - Step 51448: {'lr': 0.00037447725018456167, 'samples': 9878016, 'steps': 51447, 'loss/train': 0.9331154227256775} -08/30/2021 22:30:45 - INFO - __main__ - Step 51449: {'lr': 0.00037447264799243, 'samples': 9878208, 'steps': 51448, 'loss/train': 1.5400375127792358} -08/30/2021 22:30:46 - INFO - __main__ - Step 51450: {'lr': 0.00037446804574421276, 'samples': 9878400, 'steps': 51449, 'loss/train': 1.3505369424819946} -08/30/2021 22:30:46 - INFO - __main__ - Step 51451: {'lr': 0.00037446344343991224, 'samples': 9878592, 'steps': 51450, 'loss/train': 1.5118086338043213} -08/30/2021 22:30:47 - INFO - __main__ - Step 51452: {'lr': 0.0003744588410795304, 'samples': 9878784, 'steps': 51451, 'loss/train': 0.2807227373123169} -08/30/2021 22:30:48 - INFO - __main__ - Step 51453: {'lr': 0.00037445423866306926, 'samples': 9878976, 'steps': 51452, 'loss/train': 1.968727707862854} -08/30/2021 22:30:48 - INFO - __main__ - Step 51454: {'lr': 0.00037444963619053103, 'samples': 9879168, 'steps': 51453, 'loss/train': 1.283005952835083} -08/30/2021 22:30:49 - INFO - __main__ - Step 51455: {'lr': 0.00037444503366191776, 'samples': 9879360, 'steps': 51454, 'loss/train': 1.7621018886566162} -08/30/2021 22:30:49 - INFO - __main__ - Step 51456: {'lr': 0.00037444043107723134, 'samples': 9879552, 'steps': 51455, 'loss/train': 1.3220256567001343} -08/30/2021 22:30:50 - INFO - __main__ - Step 51457: {'lr': 0.0003744358284364741, 'samples': 9879744, 'steps': 51456, 'loss/train': 0.8543890714645386} -08/30/2021 22:30:51 - INFO - __main__ - Step 51458: {'lr': 0.00037443122573964794, 'samples': 9879936, 'steps': 51457, 'loss/train': 1.2022067308425903} -08/30/2021 22:30:51 - INFO - __main__ - Step 51459: {'lr': 0.000374426622986755, 'samples': 9880128, 'steps': 51458, 'loss/train': 1.0412627458572388} -08/30/2021 22:30:51 - INFO - __main__ - Step 51460: {'lr': 0.0003744220201777974, 'samples': 9880320, 'steps': 51459, 'loss/train': 1.9175645112991333} -08/30/2021 22:30:52 - INFO - __main__ - Step 51461: {'lr': 0.0003744174173127771, 'samples': 9880512, 'steps': 51460, 'loss/train': 1.3595013618469238} -08/30/2021 22:30:53 - INFO - __main__ - Step 51462: {'lr': 0.00037441281439169624, 'samples': 9880704, 'steps': 51461, 'loss/train': 1.637851357460022} -08/30/2021 22:30:54 - INFO - __main__ - Step 51463: {'lr': 0.0003744082114145568, 'samples': 9880896, 'steps': 51462, 'loss/train': 1.3366448879241943} -08/30/2021 22:30:54 - INFO - __main__ - Step 51464: {'lr': 0.00037440360838136106, 'samples': 9881088, 'steps': 51463, 'loss/train': 1.0917524099349976} -08/30/2021 22:30:55 - INFO - __main__ - Step 51465: {'lr': 0.0003743990052921109, 'samples': 9881280, 'steps': 51464, 'loss/train': 1.0069018602371216} -08/30/2021 22:30:55 - INFO - __main__ - Step 51466: {'lr': 0.00037439440214680854, 'samples': 9881472, 'steps': 51465, 'loss/train': 0.7022767663002014} -08/30/2021 22:30:57 - INFO - __main__ - Step 51467: {'lr': 0.00037438979894545595, 'samples': 9881664, 'steps': 51466, 'loss/train': 1.1021631956100464} -08/30/2021 22:30:58 - INFO - __main__ - Step 51468: {'lr': 0.0003743851956880553, 'samples': 9881856, 'steps': 51467, 'loss/train': 1.211194396018982} -08/30/2021 22:30:58 - INFO - __main__ - Step 51469: {'lr': 0.00037438059237460846, 'samples': 9882048, 'steps': 51468, 'loss/train': 1.7911427021026611} -08/30/2021 22:30:58 - INFO - __main__ - Step 51470: {'lr': 0.0003743759890051177, 'samples': 9882240, 'steps': 51469, 'loss/train': 1.8580384254455566} -08/30/2021 22:30:59 - INFO - __main__ - Step 51471: {'lr': 0.00037437138557958505, 'samples': 9882432, 'steps': 51470, 'loss/train': 1.078689694404602} -08/30/2021 22:30:59 - INFO - __main__ - Step 51472: {'lr': 0.0003743667820980126, 'samples': 9882624, 'steps': 51471, 'loss/train': 0.030787423253059387} -08/30/2021 22:30:59 - INFO - __main__ - Step 51473: {'lr': 0.0003743621785604024, 'samples': 9882816, 'steps': 51472, 'loss/train': 2.127434253692627} -08/30/2021 22:31:01 - INFO - __main__ - Step 51474: {'lr': 0.00037435757496675646, 'samples': 9883008, 'steps': 51473, 'loss/train': 0.20036016404628754} -08/30/2021 22:31:01 - INFO - __main__ - Step 51475: {'lr': 0.000374352971317077, 'samples': 9883200, 'steps': 51474, 'loss/train': 0.9834887981414795} -08/30/2021 22:31:02 - INFO - __main__ - Step 51476: {'lr': 0.0003743483676113659, 'samples': 9883392, 'steps': 51475, 'loss/train': 1.5811645984649658} -08/30/2021 22:31:02 - INFO - __main__ - Step 51477: {'lr': 0.00037434376384962544, 'samples': 9883584, 'steps': 51476, 'loss/train': 1.6965177059173584} -08/30/2021 22:31:02 - INFO - __main__ - Step 51478: {'lr': 0.00037433916003185757, 'samples': 9883776, 'steps': 51477, 'loss/train': 1.8264700174331665} -08/30/2021 22:31:03 - INFO - __main__ - Step 51479: {'lr': 0.0003743345561580644, 'samples': 9883968, 'steps': 51478, 'loss/train': 1.6330749988555908} -08/30/2021 22:31:04 - INFO - __main__ - Step 51480: {'lr': 0.0003743299522282479, 'samples': 9884160, 'steps': 51479, 'loss/train': 1.5845221281051636} -08/30/2021 22:31:05 - INFO - __main__ - Step 51481: {'lr': 0.0003743253482424104, 'samples': 9884352, 'steps': 51480, 'loss/train': 1.718029260635376} -08/30/2021 22:31:05 - INFO - __main__ - Step 51482: {'lr': 0.00037432074420055376, 'samples': 9884544, 'steps': 51481, 'loss/train': 1.2749820947647095} -08/30/2021 22:31:05 - INFO - __main__ - Step 51483: {'lr': 0.00037431614010268013, 'samples': 9884736, 'steps': 51482, 'loss/train': 1.039206862449646} -08/30/2021 22:31:06 - INFO - __main__ - Step 51484: {'lr': 0.0003743115359487915, 'samples': 9884928, 'steps': 51483, 'loss/train': 1.1909019947052002} -08/30/2021 22:31:07 - INFO - __main__ - Step 51485: {'lr': 0.00037430693173889, 'samples': 9885120, 'steps': 51484, 'loss/train': 1.4576939344406128} -08/30/2021 22:31:08 - INFO - __main__ - Step 51486: {'lr': 0.00037430232747297774, 'samples': 9885312, 'steps': 51485, 'loss/train': 1.173467755317688} -08/30/2021 22:31:08 - INFO - __main__ - Step 51487: {'lr': 0.00037429772315105683, 'samples': 9885504, 'steps': 51486, 'loss/train': 1.9440302848815918} -08/30/2021 22:31:08 - INFO - __main__ - Step 51488: {'lr': 0.0003742931187731293, 'samples': 9885696, 'steps': 51487, 'loss/train': 1.4747331142425537} -08/30/2021 22:31:09 - INFO - __main__ - Step 51489: {'lr': 0.00037428851433919707, 'samples': 9885888, 'steps': 51488, 'loss/train': 1.3980581760406494} -08/30/2021 22:31:11 - INFO - __main__ - Step 51490: {'lr': 0.0003742839098492625, 'samples': 9886080, 'steps': 51489, 'loss/train': 1.4674938917160034} -08/30/2021 22:31:11 - INFO - __main__ - Step 51491: {'lr': 0.0003742793053033274, 'samples': 9886272, 'steps': 51490, 'loss/train': 1.2544020414352417} -08/30/2021 22:31:12 - INFO - __main__ - Step 51492: {'lr': 0.000374274700701394, 'samples': 9886464, 'steps': 51491, 'loss/train': 1.1741329431533813} -08/30/2021 22:31:12 - INFO - __main__ - Step 51493: {'lr': 0.00037427009604346437, 'samples': 9886656, 'steps': 51492, 'loss/train': 1.168109655380249} -08/30/2021 22:31:12 - INFO - __main__ - Step 51494: {'lr': 0.0003742654913295405, 'samples': 9886848, 'steps': 51493, 'loss/train': 0.13102193176746368} -08/30/2021 22:31:14 - INFO - __main__ - Step 51495: {'lr': 0.0003742608865596246, 'samples': 9887040, 'steps': 51494, 'loss/train': 1.9099037647247314} -08/30/2021 22:31:14 - INFO - __main__ - Step 51496: {'lr': 0.0003742562817337186, 'samples': 9887232, 'steps': 51495, 'loss/train': 1.4433385133743286} -08/30/2021 22:31:15 - INFO - __main__ - Step 51497: {'lr': 0.0003742516768518247, 'samples': 9887424, 'steps': 51496, 'loss/train': 1.8039155006408691} -08/30/2021 22:31:15 - INFO - __main__ - Step 51498: {'lr': 0.0003742470719139448, 'samples': 9887616, 'steps': 51497, 'loss/train': 1.3243900537490845} -08/30/2021 22:31:15 - INFO - __main__ - Step 51499: {'lr': 0.0003742424669200811, 'samples': 9887808, 'steps': 51498, 'loss/train': 1.358375072479248} -08/30/2021 22:31:17 - INFO - __main__ - Step 51500: {'lr': 0.00037423786187023574, 'samples': 9888000, 'steps': 51499, 'loss/train': 1.7329976558685303} -08/30/2021 22:31:17 - INFO - __main__ - Step 51501: {'lr': 0.00037423325676441064, 'samples': 9888192, 'steps': 51500, 'loss/train': 1.1874157190322876} -08/30/2021 22:31:18 - INFO - __main__ - Step 51502: {'lr': 0.0003742286516026081, 'samples': 9888384, 'steps': 51501, 'loss/train': 0.9082269668579102} -08/30/2021 22:31:18 - INFO - __main__ - Step 51503: {'lr': 0.0003742240463848299, 'samples': 9888576, 'steps': 51502, 'loss/train': 1.2705663442611694} -08/30/2021 22:31:18 - INFO - __main__ - Step 51504: {'lr': 0.0003742194411110783, 'samples': 9888768, 'steps': 51503, 'loss/train': 1.6481341123580933} -08/30/2021 22:31:19 - INFO - __main__ - Step 51505: {'lr': 0.00037421483578135536, 'samples': 9888960, 'steps': 51504, 'loss/train': 1.2350645065307617} -08/30/2021 22:31:20 - INFO - __main__ - Step 51506: {'lr': 0.0003742102303956631, 'samples': 9889152, 'steps': 51505, 'loss/train': 0.5643467307090759} -08/30/2021 22:31:21 - INFO - __main__ - Step 51507: {'lr': 0.0003742056249540036, 'samples': 9889344, 'steps': 51506, 'loss/train': 1.4980963468551636} -08/30/2021 22:31:21 - INFO - __main__ - Step 51508: {'lr': 0.00037420101945637906, 'samples': 9889536, 'steps': 51507, 'loss/train': 1.1526356935501099} -08/30/2021 22:31:21 - INFO - __main__ - Step 51509: {'lr': 0.00037419641390279136, 'samples': 9889728, 'steps': 51508, 'loss/train': 0.9649524688720703} -08/30/2021 22:31:22 - INFO - __main__ - Step 51510: {'lr': 0.00037419180829324273, 'samples': 9889920, 'steps': 51509, 'loss/train': 1.904329538345337} -08/30/2021 22:31:23 - INFO - __main__ - Step 51511: {'lr': 0.0003741872026277351, 'samples': 9890112, 'steps': 51510, 'loss/train': 0.3085313141345978} -08/30/2021 22:31:24 - INFO - __main__ - Step 51512: {'lr': 0.00037418259690627075, 'samples': 9890304, 'steps': 51511, 'loss/train': 1.0710434913635254} -08/30/2021 22:31:24 - INFO - __main__ - Step 51513: {'lr': 0.0003741779911288516, 'samples': 9890496, 'steps': 51512, 'loss/train': 1.2834514379501343} -08/30/2021 22:31:25 - INFO - __main__ - Step 51514: {'lr': 0.0003741733852954797, 'samples': 9890688, 'steps': 51513, 'loss/train': 1.7014063596725464} -08/30/2021 22:31:25 - INFO - __main__ - Step 51515: {'lr': 0.00037416877940615737, 'samples': 9890880, 'steps': 51514, 'loss/train': 1.2408925294876099} -08/30/2021 22:31:27 - INFO - __main__ - Step 51516: {'lr': 0.00037416417346088635, 'samples': 9891072, 'steps': 51515, 'loss/train': 1.4154435396194458} -08/30/2021 22:31:27 - INFO - __main__ - Step 51517: {'lr': 0.0003741595674596688, 'samples': 9891264, 'steps': 51516, 'loss/train': 1.280374526977539} -08/30/2021 22:31:27 - INFO - __main__ - Step 51518: {'lr': 0.000374154961402507, 'samples': 9891456, 'steps': 51517, 'loss/train': 5.858405113220215} -08/30/2021 22:31:28 - INFO - __main__ - Step 51519: {'lr': 0.00037415035528940284, 'samples': 9891648, 'steps': 51518, 'loss/train': 1.4920510053634644} -08/30/2021 22:31:28 - INFO - __main__ - Step 51520: {'lr': 0.00037414574912035845, 'samples': 9891840, 'steps': 51519, 'loss/train': 2.1044516563415527} -08/30/2021 22:31:28 - INFO - __main__ - Step 51521: {'lr': 0.0003741411428953759, 'samples': 9892032, 'steps': 51520, 'loss/train': 1.1028512716293335} -08/30/2021 22:31:30 - INFO - __main__ - Step 51522: {'lr': 0.00037413653661445736, 'samples': 9892224, 'steps': 51521, 'loss/train': 0.17945143580436707} -08/30/2021 22:31:31 - INFO - __main__ - Step 51523: {'lr': 0.00037413193027760466, 'samples': 9892416, 'steps': 51522, 'loss/train': 1.2250851392745972} -08/30/2021 22:31:31 - INFO - __main__ - Step 51524: {'lr': 0.00037412732388482015, 'samples': 9892608, 'steps': 51523, 'loss/train': 1.5527629852294922} -08/30/2021 22:31:31 - INFO - __main__ - Step 51525: {'lr': 0.0003741227174361057, 'samples': 9892800, 'steps': 51524, 'loss/train': 1.3103173971176147} -08/30/2021 22:31:32 - INFO - __main__ - Step 51526: {'lr': 0.00037411811093146345, 'samples': 9892992, 'steps': 51525, 'loss/train': 1.5848549604415894} -08/30/2021 22:31:34 - INFO - __main__ - Step 51527: {'lr': 0.0003741135043708956, 'samples': 9893184, 'steps': 51526, 'loss/train': 1.7637684345245361} -08/30/2021 22:31:34 - INFO - __main__ - Step 51528: {'lr': 0.000374108897754404, 'samples': 9893376, 'steps': 51527, 'loss/train': 1.4846374988555908} -08/30/2021 22:31:34 - INFO - __main__ - Step 51529: {'lr': 0.00037410429108199097, 'samples': 9893568, 'steps': 51528, 'loss/train': 1.4613293409347534} -08/30/2021 22:31:35 - INFO - __main__ - Step 51530: {'lr': 0.0003740996843536584, 'samples': 9893760, 'steps': 51529, 'loss/train': 0.06214777007699013} -08/30/2021 22:31:35 - INFO - __main__ - Step 51531: {'lr': 0.00037409507756940843, 'samples': 9893952, 'steps': 51530, 'loss/train': 1.5488176345825195} -08/30/2021 22:31:35 - INFO - __main__ - Step 51532: {'lr': 0.00037409047072924307, 'samples': 9894144, 'steps': 51531, 'loss/train': 0.15970462560653687} -08/30/2021 22:31:37 - INFO - __main__ - Step 51533: {'lr': 0.0003740858638331646, 'samples': 9894336, 'steps': 51532, 'loss/train': 0.24809174239635468} -08/30/2021 22:31:38 - INFO - __main__ - Step 51534: {'lr': 0.0003740812568811748, 'samples': 9894528, 'steps': 51533, 'loss/train': 0.7790964841842651} -08/30/2021 22:31:38 - INFO - __main__ - Step 51535: {'lr': 0.000374076649873276, 'samples': 9894720, 'steps': 51534, 'loss/train': 1.446571946144104} -08/30/2021 22:31:38 - INFO - __main__ - Step 51536: {'lr': 0.00037407204280947014, 'samples': 9894912, 'steps': 51535, 'loss/train': 1.1602075099945068} -08/30/2021 22:31:39 - INFO - __main__ - Step 51537: {'lr': 0.0003740674356897593, 'samples': 9895104, 'steps': 51536, 'loss/train': 1.8485909700393677} -08/30/2021 22:31:41 - INFO - __main__ - Step 51538: {'lr': 0.0003740628285141457, 'samples': 9895296, 'steps': 51537, 'loss/train': 1.1973363161087036} -08/30/2021 22:31:41 - INFO - __main__ - Step 51539: {'lr': 0.00037405822128263125, 'samples': 9895488, 'steps': 51538, 'loss/train': 1.3499199151992798} -08/30/2021 22:31:42 - INFO - __main__ - Step 51540: {'lr': 0.000374053613995218, 'samples': 9895680, 'steps': 51539, 'loss/train': 1.5263172388076782} -08/30/2021 22:31:42 - INFO - __main__ - Step 51541: {'lr': 0.0003740490066519082, 'samples': 9895872, 'steps': 51540, 'loss/train': 1.528464436531067} -08/30/2021 22:31:42 - INFO - __main__ - Step 51542: {'lr': 0.0003740443992527038, 'samples': 9896064, 'steps': 51541, 'loss/train': 1.3877899646759033} -08/30/2021 22:31:43 - INFO - __main__ - Step 51543: {'lr': 0.00037403979179760687, 'samples': 9896256, 'steps': 51542, 'loss/train': 0.10983399301767349} -08/30/2021 22:31:43 - INFO - __main__ - Step 51544: {'lr': 0.0003740351842866196, 'samples': 9896448, 'steps': 51543, 'loss/train': 1.4278217554092407} -08/30/2021 22:31:45 - INFO - __main__ - Step 51545: {'lr': 0.0003740305767197439, 'samples': 9896640, 'steps': 51544, 'loss/train': 1.0563499927520752} -08/30/2021 22:31:45 - INFO - __main__ - Step 51546: {'lr': 0.0003740259690969821, 'samples': 9896832, 'steps': 51545, 'loss/train': 1.3931564092636108} -08/30/2021 22:31:46 - INFO - __main__ - Step 51547: {'lr': 0.00037402136141833595, 'samples': 9897024, 'steps': 51546, 'loss/train': 1.6741191148757935} -08/30/2021 22:31:46 - INFO - __main__ - Step 51548: {'lr': 0.0003740167536838077, 'samples': 9897216, 'steps': 51547, 'loss/train': 1.303240418434143} -08/30/2021 22:31:46 - INFO - __main__ - Step 51549: {'lr': 0.0003740121458933995, 'samples': 9897408, 'steps': 51548, 'loss/train': 1.633860468864441} -08/30/2021 22:31:48 - INFO - __main__ - Step 51550: {'lr': 0.0003740075380471133, 'samples': 9897600, 'steps': 51549, 'loss/train': 1.4947450160980225} -08/30/2021 22:31:48 - INFO - __main__ - Step 51551: {'lr': 0.0003740029301449512, 'samples': 9897792, 'steps': 51550, 'loss/train': 1.934906005859375} -08/30/2021 22:31:49 - INFO - __main__ - Step 51552: {'lr': 0.0003739983221869153, 'samples': 9897984, 'steps': 51551, 'loss/train': 1.3299869298934937} -08/30/2021 22:31:49 - INFO - __main__ - Step 51553: {'lr': 0.00037399371417300766, 'samples': 9898176, 'steps': 51552, 'loss/train': 1.2477569580078125} -08/30/2021 22:31:50 - INFO - __main__ - Step 51554: {'lr': 0.00037398910610323034, 'samples': 9898368, 'steps': 51553, 'loss/train': 1.0288652181625366} -08/30/2021 22:31:50 - INFO - __main__ - Step 51555: {'lr': 0.0003739844979775855, 'samples': 9898560, 'steps': 51554, 'loss/train': 1.0303795337677002} -08/30/2021 22:31:51 - INFO - __main__ - Step 51556: {'lr': 0.0003739798897960752, 'samples': 9898752, 'steps': 51555, 'loss/train': 1.1251752376556396} -08/30/2021 22:31:52 - INFO - __main__ - Step 51557: {'lr': 0.00037397528155870134, 'samples': 9898944, 'steps': 51556, 'loss/train': 1.8401908874511719} -08/30/2021 22:31:52 - INFO - __main__ - Step 51558: {'lr': 0.00037397067326546616, 'samples': 9899136, 'steps': 51557, 'loss/train': 2.5792136192321777} -08/30/2021 22:31:53 - INFO - __main__ - Step 51559: {'lr': 0.0003739660649163718, 'samples': 9899328, 'steps': 51558, 'loss/train': 1.583563208580017} -08/30/2021 22:31:53 - INFO - __main__ - Step 51560: {'lr': 0.0003739614565114202, 'samples': 9899520, 'steps': 51559, 'loss/train': 1.0671730041503906} -08/30/2021 22:31:55 - INFO - __main__ - Step 51561: {'lr': 0.00037395684805061345, 'samples': 9899712, 'steps': 51560, 'loss/train': 1.0895830392837524} -08/30/2021 22:31:55 - INFO - __main__ - Step 51562: {'lr': 0.00037395223953395375, 'samples': 9899904, 'steps': 51561, 'loss/train': 0.8633602261543274} -08/30/2021 22:31:55 - INFO - __main__ - Step 51563: {'lr': 0.000373947630961443, 'samples': 9900096, 'steps': 51562, 'loss/train': 1.289513349533081} -08/30/2021 22:31:56 - INFO - __main__ - Step 51564: {'lr': 0.00037394302233308336, 'samples': 9900288, 'steps': 51563, 'loss/train': 0.9341845512390137} -08/30/2021 22:31:56 - INFO - __main__ - Step 51565: {'lr': 0.0003739384136488769, 'samples': 9900480, 'steps': 51564, 'loss/train': 1.650567889213562} -08/30/2021 22:31:58 - INFO - __main__ - Step 51566: {'lr': 0.00037393380490882575, 'samples': 9900672, 'steps': 51565, 'loss/train': 1.0414856672286987} -08/30/2021 22:31:58 - INFO - __main__ - Step 51567: {'lr': 0.0003739291961129319, 'samples': 9900864, 'steps': 51566, 'loss/train': 1.7716565132141113} -08/30/2021 22:31:58 - INFO - __main__ - Step 51568: {'lr': 0.0003739245872611975, 'samples': 9901056, 'steps': 51567, 'loss/train': 1.4202914237976074} -08/30/2021 22:31:59 - INFO - __main__ - Step 51569: {'lr': 0.0003739199783536246, 'samples': 9901248, 'steps': 51568, 'loss/train': 1.3330029249191284} -08/30/2021 22:31:59 - INFO - __main__ - Step 51570: {'lr': 0.0003739153693902152, 'samples': 9901440, 'steps': 51569, 'loss/train': 1.644285798072815} -08/30/2021 22:32:00 - INFO - __main__ - Step 51571: {'lr': 0.0003739107603709715, 'samples': 9901632, 'steps': 51570, 'loss/train': 1.5177286863327026} -08/30/2021 22:32:01 - INFO - __main__ - Step 51572: {'lr': 0.00037390615129589554, 'samples': 9901824, 'steps': 51571, 'loss/train': 1.6142197847366333} -08/30/2021 22:32:01 - INFO - __main__ - Step 51573: {'lr': 0.00037390154216498933, 'samples': 9902016, 'steps': 51572, 'loss/train': 1.4646210670471191} -08/30/2021 22:32:02 - INFO - __main__ - Step 51574: {'lr': 0.000373896932978255, 'samples': 9902208, 'steps': 51573, 'loss/train': 1.1083478927612305} -08/30/2021 22:32:02 - INFO - __main__ - Step 51575: {'lr': 0.00037389232373569463, 'samples': 9902400, 'steps': 51574, 'loss/train': 1.113458275794983} -08/30/2021 22:32:04 - INFO - __main__ - Step 51576: {'lr': 0.0003738877144373104, 'samples': 9902592, 'steps': 51575, 'loss/train': 1.0290260314941406} -08/30/2021 22:32:04 - INFO - __main__ - Step 51577: {'lr': 0.0003738831050831042, 'samples': 9902784, 'steps': 51576, 'loss/train': 1.7404829263687134} -08/30/2021 22:32:05 - INFO - __main__ - Step 51578: {'lr': 0.0003738784956730781, 'samples': 9902976, 'steps': 51577, 'loss/train': 1.306673288345337} -08/30/2021 22:32:05 - INFO - __main__ - Step 51579: {'lr': 0.0003738738862072343, 'samples': 9903168, 'steps': 51578, 'loss/train': 1.9081714153289795} -08/30/2021 22:32:05 - INFO - __main__ - Step 51580: {'lr': 0.00037386927668557493, 'samples': 9903360, 'steps': 51579, 'loss/train': 1.2259036302566528} -08/30/2021 22:32:07 - INFO - __main__ - Step 51581: {'lr': 0.0003738646671081019, 'samples': 9903552, 'steps': 51580, 'loss/train': 0.6796914935112} -08/30/2021 22:32:07 - INFO - __main__ - Step 51582: {'lr': 0.00037386005747481744, 'samples': 9903744, 'steps': 51581, 'loss/train': 1.4337469339370728} -08/30/2021 22:32:07 - INFO - __main__ - Step 51583: {'lr': 0.00037385544778572346, 'samples': 9903936, 'steps': 51582, 'loss/train': 1.0164211988449097} -08/30/2021 22:32:08 - INFO - __main__ - Step 51584: {'lr': 0.00037385083804082213, 'samples': 9904128, 'steps': 51583, 'loss/train': 1.9585940837860107} -08/30/2021 22:32:08 - INFO - __main__ - Step 51585: {'lr': 0.00037384622824011555, 'samples': 9904320, 'steps': 51584, 'loss/train': 2.0327370166778564} -08/30/2021 22:32:10 - INFO - __main__ - Step 51586: {'lr': 0.00037384161838360574, 'samples': 9904512, 'steps': 51585, 'loss/train': 1.8917208909988403} -08/30/2021 22:32:11 - INFO - __main__ - Step 51587: {'lr': 0.00037383700847129487, 'samples': 9904704, 'steps': 51586, 'loss/train': 0.3373853266239166} -08/30/2021 22:32:11 - INFO - __main__ - Step 51588: {'lr': 0.0003738323985031849, 'samples': 9904896, 'steps': 51587, 'loss/train': 0.38460031151771545} -08/30/2021 22:32:11 - INFO - __main__ - Step 51589: {'lr': 0.000373827788479278, 'samples': 9905088, 'steps': 51588, 'loss/train': 1.1099581718444824} -08/30/2021 22:32:12 - INFO - __main__ - Step 51590: {'lr': 0.0003738231783995762, 'samples': 9905280, 'steps': 51589, 'loss/train': 1.6286319494247437} -08/30/2021 22:32:12 - INFO - __main__ - Step 51591: {'lr': 0.00037381856826408156, 'samples': 9905472, 'steps': 51590, 'loss/train': 1.7703702449798584} -08/30/2021 22:32:12 - INFO - __main__ - Step 51592: {'lr': 0.00037381395807279625, 'samples': 9905664, 'steps': 51591, 'loss/train': 0.03311726450920105} -08/30/2021 22:32:14 - INFO - __main__ - Step 51593: {'lr': 0.0003738093478257222, 'samples': 9905856, 'steps': 51592, 'loss/train': 0.029038993641734123} -08/30/2021 22:32:14 - INFO - __main__ - Step 51594: {'lr': 0.0003738047375228616, 'samples': 9906048, 'steps': 51593, 'loss/train': 1.3370366096496582} -08/30/2021 22:32:15 - INFO - __main__ - Step 51595: {'lr': 0.00037380012716421647, 'samples': 9906240, 'steps': 51594, 'loss/train': 1.0302993059158325} -08/30/2021 22:32:15 - INFO - __main__ - Step 51596: {'lr': 0.00037379551674978896, 'samples': 9906432, 'steps': 51595, 'loss/train': 1.2916898727416992} -08/30/2021 22:32:15 - INFO - __main__ - Step 51597: {'lr': 0.0003737909062795811, 'samples': 9906624, 'steps': 51596, 'loss/train': 1.0558297634124756} -08/30/2021 22:32:17 - INFO - __main__ - Step 51598: {'lr': 0.00037378629575359493, 'samples': 9906816, 'steps': 51597, 'loss/train': 0.9440423250198364} -08/30/2021 22:32:18 - INFO - __main__ - Step 51599: {'lr': 0.0003737816851718326, 'samples': 9907008, 'steps': 51598, 'loss/train': 1.2873013019561768} -08/30/2021 22:32:18 - INFO - __main__ - Step 51600: {'lr': 0.0003737770745342961, 'samples': 9907200, 'steps': 51599, 'loss/train': 0.8846646547317505} -08/30/2021 22:32:19 - INFO - __main__ - Step 51601: {'lr': 0.0003737724638409876, 'samples': 9907392, 'steps': 51600, 'loss/train': 0.7183449268341064} -08/30/2021 22:32:19 - INFO - __main__ - Step 51602: {'lr': 0.00037376785309190913, 'samples': 9907584, 'steps': 51601, 'loss/train': 1.514360785484314} -08/30/2021 22:32:20 - INFO - __main__ - Step 51603: {'lr': 0.0003737632422870628, 'samples': 9907776, 'steps': 51602, 'loss/train': 1.33913254737854} -08/30/2021 22:32:21 - INFO - __main__ - Step 51604: {'lr': 0.00037375863142645064, 'samples': 9907968, 'steps': 51603, 'loss/train': 1.5239001512527466} -08/30/2021 22:32:21 - INFO - __main__ - Step 51605: {'lr': 0.00037375402051007477, 'samples': 9908160, 'steps': 51604, 'loss/train': 1.7382969856262207} -08/30/2021 22:32:22 - INFO - __main__ - Step 51606: {'lr': 0.00037374940953793724, 'samples': 9908352, 'steps': 51605, 'loss/train': 1.2390068769454956} -08/30/2021 22:32:22 - INFO - __main__ - Step 51607: {'lr': 0.00037374479851004006, 'samples': 9908544, 'steps': 51606, 'loss/train': 1.884042501449585} -08/30/2021 22:32:24 - INFO - __main__ - Step 51608: {'lr': 0.0003737401874263855, 'samples': 9908736, 'steps': 51607, 'loss/train': 1.6969270706176758} -08/30/2021 22:32:24 - INFO - __main__ - Step 51609: {'lr': 0.0003737355762869755, 'samples': 9908928, 'steps': 51608, 'loss/train': 0.8311616778373718} -08/30/2021 22:32:25 - INFO - __main__ - Step 51610: {'lr': 0.0003737309650918121, 'samples': 9909120, 'steps': 51609, 'loss/train': 0.01981472037732601} -08/30/2021 22:32:25 - INFO - __main__ - Step 51611: {'lr': 0.0003737263538408975, 'samples': 9909312, 'steps': 51610, 'loss/train': 1.2087864875793457} -08/30/2021 22:32:25 - INFO - __main__ - Step 51612: {'lr': 0.0003737217425342336, 'samples': 9909504, 'steps': 51611, 'loss/train': 0.050863899290561676} -08/30/2021 22:32:26 - INFO - __main__ - Step 51613: {'lr': 0.0003737171311718227, 'samples': 9909696, 'steps': 51612, 'loss/train': 1.2529886960983276} -08/30/2021 22:32:28 - INFO - __main__ - Step 51614: {'lr': 0.0003737125197536667, 'samples': 9909888, 'steps': 51613, 'loss/train': 0.04510089010000229} -08/30/2021 22:32:28 - INFO - __main__ - Step 51615: {'lr': 0.0003737079082797678, 'samples': 9910080, 'steps': 51614, 'loss/train': 1.7643711566925049} -08/30/2021 22:32:29 - INFO - __main__ - Step 51616: {'lr': 0.000373703296750128, 'samples': 9910272, 'steps': 51615, 'loss/train': 1.0789111852645874} -08/30/2021 22:32:29 - INFO - __main__ - Step 51617: {'lr': 0.0003736986851647495, 'samples': 9910464, 'steps': 51616, 'loss/train': 1.516789436340332} -08/30/2021 22:32:29 - INFO - __main__ - Step 51618: {'lr': 0.00037369407352363417, 'samples': 9910656, 'steps': 51617, 'loss/train': 0.03868023306131363} -08/30/2021 22:32:30 - INFO - __main__ - Step 51619: {'lr': 0.0003736894618267842, 'samples': 9910848, 'steps': 51618, 'loss/train': 0.22338785231113434} -08/30/2021 22:32:31 - INFO - __main__ - Step 51620: {'lr': 0.0003736848500742017, 'samples': 9911040, 'steps': 51619, 'loss/train': 1.5001274347305298} -08/30/2021 22:32:32 - INFO - __main__ - Step 51621: {'lr': 0.0003736802382658887, 'samples': 9911232, 'steps': 51620, 'loss/train': 1.1166435480117798} -08/30/2021 22:32:32 - INFO - __main__ - Step 51622: {'lr': 0.00037367562640184735, 'samples': 9911424, 'steps': 51621, 'loss/train': 0.5407716631889343} -08/30/2021 22:32:32 - INFO - __main__ - Step 51623: {'lr': 0.0003736710144820796, 'samples': 9911616, 'steps': 51622, 'loss/train': 1.6106802225112915} -08/30/2021 22:32:33 - INFO - __main__ - Step 51624: {'lr': 0.00037366640250658767, 'samples': 9911808, 'steps': 51623, 'loss/train': 1.1158663034439087} -08/30/2021 22:32:34 - INFO - __main__ - Step 51625: {'lr': 0.00037366179047537354, 'samples': 9912000, 'steps': 51624, 'loss/train': 1.6539461612701416} -08/30/2021 22:32:35 - INFO - __main__ - Step 51626: {'lr': 0.0003736571783884393, 'samples': 9912192, 'steps': 51625, 'loss/train': 0.9302570819854736} -08/30/2021 22:32:35 - INFO - __main__ - Step 51627: {'lr': 0.00037365256624578695, 'samples': 9912384, 'steps': 51626, 'loss/train': 1.5809532403945923} -08/30/2021 22:32:35 - INFO - __main__ - Step 51628: {'lr': 0.0003736479540474188, 'samples': 9912576, 'steps': 51627, 'loss/train': 1.4287220239639282} -08/30/2021 22:32:36 - INFO - __main__ - Step 51629: {'lr': 0.00037364334179333674, 'samples': 9912768, 'steps': 51628, 'loss/train': 1.338386058807373} -08/30/2021 22:32:37 - INFO - __main__ - Step 51630: {'lr': 0.00037363872948354294, 'samples': 9912960, 'steps': 51629, 'loss/train': 1.6858468055725098} -08/30/2021 22:32:38 - INFO - __main__ - Step 51631: {'lr': 0.00037363411711803935, 'samples': 9913152, 'steps': 51630, 'loss/train': 1.7678496837615967} -08/30/2021 22:32:38 - INFO - __main__ - Step 51632: {'lr': 0.0003736295046968282, 'samples': 9913344, 'steps': 51631, 'loss/train': 1.4017808437347412} -08/30/2021 22:32:38 - INFO - __main__ - Step 51633: {'lr': 0.0003736248922199115, 'samples': 9913536, 'steps': 51632, 'loss/train': 1.5283550024032593} -08/30/2021 22:32:39 - INFO - __main__ - Step 51634: {'lr': 0.0003736202796872913, 'samples': 9913728, 'steps': 51633, 'loss/train': 1.1208016872406006} -08/30/2021 22:32:40 - INFO - __main__ - Step 51635: {'lr': 0.00037361566709896964, 'samples': 9913920, 'steps': 51634, 'loss/train': 1.4629861116409302} -08/30/2021 22:32:41 - INFO - __main__ - Step 51636: {'lr': 0.00037361105445494884, 'samples': 9914112, 'steps': 51635, 'loss/train': 0.7506587505340576} -08/30/2021 22:32:41 - INFO - __main__ - Step 51637: {'lr': 0.0003736064417552307, 'samples': 9914304, 'steps': 51636, 'loss/train': 1.307244062423706} -08/30/2021 22:32:41 - INFO - __main__ - Step 51638: {'lr': 0.0003736018289998174, 'samples': 9914496, 'steps': 51637, 'loss/train': 1.3700740337371826} -08/30/2021 22:32:42 - INFO - __main__ - Step 51639: {'lr': 0.00037359721618871107, 'samples': 9914688, 'steps': 51638, 'loss/train': 1.2720520496368408} -08/30/2021 22:32:43 - INFO - __main__ - Step 51640: {'lr': 0.0003735926033219137, 'samples': 9914880, 'steps': 51639, 'loss/train': 1.3028295040130615} -08/30/2021 22:32:44 - INFO - __main__ - Step 51641: {'lr': 0.00037358799039942744, 'samples': 9915072, 'steps': 51640, 'loss/train': 1.4700137376785278} -08/30/2021 22:32:44 - INFO - __main__ - Step 51642: {'lr': 0.00037358337742125433, 'samples': 9915264, 'steps': 51641, 'loss/train': 1.4409149885177612} -08/30/2021 22:32:44 - INFO - __main__ - Step 51643: {'lr': 0.0003735787643873965, 'samples': 9915456, 'steps': 51642, 'loss/train': 1.2647240161895752} -08/30/2021 22:32:45 - INFO - __main__ - Step 51644: {'lr': 0.00037357415129785586, 'samples': 9915648, 'steps': 51643, 'loss/train': 1.546258807182312} -08/30/2021 22:32:46 - INFO - __main__ - Step 51645: {'lr': 0.00037356953815263473, 'samples': 9915840, 'steps': 51644, 'loss/train': 1.5272432565689087} -08/30/2021 22:32:47 - INFO - __main__ - Step 51646: {'lr': 0.00037356492495173505, 'samples': 9916032, 'steps': 51645, 'loss/train': 1.1103973388671875} -08/30/2021 22:32:47 - INFO - __main__ - Step 51647: {'lr': 0.00037356031169515894, 'samples': 9916224, 'steps': 51646, 'loss/train': 1.0418039560317993} -08/30/2021 22:32:47 - INFO - __main__ - Step 51648: {'lr': 0.0003735556983829084, 'samples': 9916416, 'steps': 51647, 'loss/train': 1.464951992034912} -08/30/2021 22:32:48 - INFO - __main__ - Step 51649: {'lr': 0.00037355108501498557, 'samples': 9916608, 'steps': 51648, 'loss/train': 0.9551159143447876} -08/30/2021 22:32:49 - INFO - __main__ - Step 51650: {'lr': 0.0003735464715913926, 'samples': 9916800, 'steps': 51649, 'loss/train': 1.679457426071167} -08/30/2021 22:32:50 - INFO - __main__ - Step 51651: {'lr': 0.00037354185811213145, 'samples': 9916992, 'steps': 51650, 'loss/train': 1.5624104738235474} -08/30/2021 22:32:50 - INFO - __main__ - Step 51652: {'lr': 0.0003735372445772042, 'samples': 9917184, 'steps': 51651, 'loss/train': 1.495266318321228} -08/30/2021 22:32:50 - INFO - __main__ - Step 51653: {'lr': 0.00037353263098661304, 'samples': 9917376, 'steps': 51652, 'loss/train': 1.7803412675857544} -08/30/2021 22:32:51 - INFO - __main__ - Step 51654: {'lr': 0.00037352801734036, 'samples': 9917568, 'steps': 51653, 'loss/train': 1.6657036542892456} -08/30/2021 22:32:51 - INFO - __main__ - Step 51655: {'lr': 0.00037352340363844706, 'samples': 9917760, 'steps': 51654, 'loss/train': 1.3105398416519165} -08/30/2021 22:32:53 - INFO - __main__ - Step 51656: {'lr': 0.00037351878988087646, 'samples': 9917952, 'steps': 51655, 'loss/train': 1.1532460451126099} -08/30/2021 22:32:54 - INFO - __main__ - Step 51657: {'lr': 0.0003735141760676501, 'samples': 9918144, 'steps': 51656, 'loss/train': 1.3362302780151367} -08/30/2021 22:32:54 - INFO - __main__ - Step 51658: {'lr': 0.0003735095621987703, 'samples': 9918336, 'steps': 51657, 'loss/train': 0.12950551509857178} -08/30/2021 22:32:55 - INFO - __main__ - Step 51659: {'lr': 0.00037350494827423884, 'samples': 9918528, 'steps': 51658, 'loss/train': 0.2063923329114914} -08/30/2021 22:32:55 - INFO - __main__ - Step 51660: {'lr': 0.00037350033429405806, 'samples': 9918720, 'steps': 51659, 'loss/train': 1.121277928352356} -08/30/2021 22:32:57 - INFO - __main__ - Step 51661: {'lr': 0.0003734957202582299, 'samples': 9918912, 'steps': 51660, 'loss/train': 1.0919702053070068} -08/30/2021 22:32:57 - INFO - __main__ - Step 51662: {'lr': 0.00037349110616675653, 'samples': 9919104, 'steps': 51661, 'loss/train': 1.8586196899414062} -08/30/2021 22:32:57 - INFO - __main__ - Step 51663: {'lr': 0.0003734864920196399, 'samples': 9919296, 'steps': 51662, 'loss/train': 1.7960128784179688} -08/30/2021 22:32:58 - INFO - __main__ - Step 51664: {'lr': 0.0003734818778168823, 'samples': 9919488, 'steps': 51663, 'loss/train': 0.9504808187484741} -08/30/2021 22:32:58 - INFO - __main__ - Step 51665: {'lr': 0.0003734772635584855, 'samples': 9919680, 'steps': 51664, 'loss/train': 1.0689635276794434} -08/30/2021 22:32:59 - INFO - __main__ - Step 51666: {'lr': 0.0003734726492444518, 'samples': 9919872, 'steps': 51665, 'loss/train': 1.3270063400268555} -08/30/2021 22:33:00 - INFO - __main__ - Step 51667: {'lr': 0.00037346803487478325, 'samples': 9920064, 'steps': 51666, 'loss/train': 1.2435252666473389} -08/30/2021 22:33:00 - INFO - __main__ - Step 51668: {'lr': 0.0003734634204494819, 'samples': 9920256, 'steps': 51667, 'loss/train': 1.430754542350769} -08/30/2021 22:33:01 - INFO - __main__ - Step 51669: {'lr': 0.0003734588059685499, 'samples': 9920448, 'steps': 51668, 'loss/train': 0.7625913619995117} -08/30/2021 22:33:01 - INFO - __main__ - Step 51670: {'lr': 0.0003734541914319892, 'samples': 9920640, 'steps': 51669, 'loss/train': 1.5677143335342407} -08/30/2021 22:33:03 - INFO - __main__ - Step 51671: {'lr': 0.0003734495768398019, 'samples': 9920832, 'steps': 51670, 'loss/train': 1.373456358909607} -08/30/2021 22:33:03 - INFO - __main__ - Step 51672: {'lr': 0.00037344496219199016, 'samples': 9921024, 'steps': 51671, 'loss/train': 1.219123363494873} -08/30/2021 22:33:04 - INFO - __main__ - Step 51673: {'lr': 0.0003734403474885561, 'samples': 9921216, 'steps': 51672, 'loss/train': 1.0996557474136353} -08/30/2021 22:33:04 - INFO - __main__ - Step 51674: {'lr': 0.00037343573272950167, 'samples': 9921408, 'steps': 51673, 'loss/train': 1.3817435503005981} -08/30/2021 22:33:04 - INFO - __main__ - Step 51675: {'lr': 0.00037343111791482897, 'samples': 9921600, 'steps': 51674, 'loss/train': 0.978774905204773} -08/30/2021 22:33:05 - INFO - __main__ - Step 51676: {'lr': 0.0003734265030445401, 'samples': 9921792, 'steps': 51675, 'loss/train': 1.0237514972686768} -08/30/2021 22:33:05 - INFO - __main__ - Step 51677: {'lr': 0.0003734218881186372, 'samples': 9921984, 'steps': 51676, 'loss/train': 0.02279912680387497} -08/30/2021 22:33:07 - INFO - __main__ - Step 51678: {'lr': 0.00037341727313712237, 'samples': 9922176, 'steps': 51677, 'loss/train': 0.025808101519942284} -08/30/2021 22:33:07 - INFO - __main__ - Step 51679: {'lr': 0.0003734126580999975, 'samples': 9922368, 'steps': 51678, 'loss/train': 1.399193286895752} -08/30/2021 22:33:07 - INFO - __main__ - Step 51680: {'lr': 0.0003734080430072649, 'samples': 9922560, 'steps': 51679, 'loss/train': 0.9727354049682617} -08/30/2021 22:33:08 - INFO - __main__ - Step 51681: {'lr': 0.0003734034278589265, 'samples': 9922752, 'steps': 51680, 'loss/train': 1.0413569211959839} -08/30/2021 22:33:08 - INFO - __main__ - Step 51682: {'lr': 0.0003733988126549843, 'samples': 9922944, 'steps': 51681, 'loss/train': 1.3695199489593506} -08/30/2021 22:33:09 - INFO - __main__ - Step 51683: {'lr': 0.0003733941973954407, 'samples': 9923136, 'steps': 51682, 'loss/train': 1.441453218460083} -08/30/2021 22:33:10 - INFO - __main__ - Step 51684: {'lr': 0.00037338958208029744, 'samples': 9923328, 'steps': 51683, 'loss/train': 4.008942604064941} -08/30/2021 22:33:10 - INFO - __main__ - Step 51685: {'lr': 0.0003733849667095568, 'samples': 9923520, 'steps': 51684, 'loss/train': 1.1269786357879639} -08/30/2021 22:33:11 - INFO - __main__ - Step 51686: {'lr': 0.00037338035128322075, 'samples': 9923712, 'steps': 51685, 'loss/train': 1.1578725576400757} -08/30/2021 22:33:11 - INFO - __main__ - Step 51687: {'lr': 0.00037337573580129143, 'samples': 9923904, 'steps': 51686, 'loss/train': 1.2276599407196045} -08/30/2021 22:33:12 - INFO - __main__ - Step 51688: {'lr': 0.0003733711202637709, 'samples': 9924096, 'steps': 51687, 'loss/train': 1.360328197479248} -08/30/2021 22:33:13 - INFO - __main__ - Step 51689: {'lr': 0.00037336650467066125, 'samples': 9924288, 'steps': 51688, 'loss/train': 1.8080074787139893} -08/30/2021 22:33:13 - INFO - __main__ - Step 51690: {'lr': 0.0003733618890219646, 'samples': 9924480, 'steps': 51689, 'loss/train': 1.5439468622207642} -08/30/2021 22:33:14 - INFO - __main__ - Step 51691: {'lr': 0.000373357273317683, 'samples': 9924672, 'steps': 51690, 'loss/train': 1.2663969993591309} -08/30/2021 22:33:14 - INFO - __main__ - Step 51692: {'lr': 0.00037335265755781844, 'samples': 9924864, 'steps': 51691, 'loss/train': 1.1125068664550781} -08/30/2021 22:33:14 - INFO - __main__ - Step 51693: {'lr': 0.00037334804174237314, 'samples': 9925056, 'steps': 51692, 'loss/train': 1.7361685037612915} -08/30/2021 22:33:16 - INFO - __main__ - Step 51694: {'lr': 0.0003733434258713491, 'samples': 9925248, 'steps': 51693, 'loss/train': 1.3808708190917969} -08/30/2021 22:33:16 - INFO - __main__ - Step 51695: {'lr': 0.00037333880994474834, 'samples': 9925440, 'steps': 51694, 'loss/train': 0.7133839130401611} -08/30/2021 22:33:17 - INFO - __main__ - Step 51696: {'lr': 0.00037333419396257307, 'samples': 9925632, 'steps': 51695, 'loss/train': 1.6381560564041138} -08/30/2021 22:33:17 - INFO - __main__ - Step 51697: {'lr': 0.00037332957792482534, 'samples': 9925824, 'steps': 51696, 'loss/train': 1.2527058124542236} -08/30/2021 22:33:17 - INFO - __main__ - Step 51698: {'lr': 0.0003733249618315072, 'samples': 9926016, 'steps': 51697, 'loss/train': 2.36087965965271} -08/30/2021 22:33:19 - INFO - __main__ - Step 51699: {'lr': 0.0003733203456826207, 'samples': 9926208, 'steps': 51698, 'loss/train': 1.3819410800933838} -08/30/2021 22:33:19 - INFO - __main__ - Step 51700: {'lr': 0.000373315729478168, 'samples': 9926400, 'steps': 51699, 'loss/train': 1.3410474061965942} -08/30/2021 22:33:20 - INFO - __main__ - Step 51701: {'lr': 0.0003733111132181511, 'samples': 9926592, 'steps': 51700, 'loss/train': 1.00484037399292} -08/30/2021 22:33:20 - INFO - __main__ - Step 51702: {'lr': 0.0003733064969025721, 'samples': 9926784, 'steps': 51701, 'loss/train': 1.4844087362289429} -08/30/2021 22:33:20 - INFO - __main__ - Step 51703: {'lr': 0.00037330188053143323, 'samples': 9926976, 'steps': 51702, 'loss/train': 0.9071732759475708} -08/30/2021 22:33:22 - INFO - __main__ - Step 51704: {'lr': 0.0003732972641047363, 'samples': 9927168, 'steps': 51703, 'loss/train': 0.8955970406532288} -08/30/2021 22:33:22 - INFO - __main__ - Step 51705: {'lr': 0.0003732926476224835, 'samples': 9927360, 'steps': 51704, 'loss/train': 1.646584391593933} -08/30/2021 22:33:23 - INFO - __main__ - Step 51706: {'lr': 0.00037328803108467704, 'samples': 9927552, 'steps': 51705, 'loss/train': 1.074128270149231} -08/30/2021 22:33:23 - INFO - __main__ - Step 51707: {'lr': 0.0003732834144913188, 'samples': 9927744, 'steps': 51706, 'loss/train': 1.4815008640289307} -08/30/2021 22:33:23 - INFO - __main__ - Step 51708: {'lr': 0.00037327879784241095, 'samples': 9927936, 'steps': 51707, 'loss/train': 0.9861049652099609} -08/30/2021 22:33:26 - INFO - __main__ - Step 51709: {'lr': 0.00037327418113795565, 'samples': 9928128, 'steps': 51708, 'loss/train': 1.559061050415039} -08/30/2021 22:33:26 - INFO - __main__ - Step 51710: {'lr': 0.0003732695643779549, 'samples': 9928320, 'steps': 51709, 'loss/train': 1.484695553779602} -08/30/2021 22:33:27 - INFO - __main__ - Step 51711: {'lr': 0.0003732649475624108, 'samples': 9928512, 'steps': 51710, 'loss/train': 0.01932797208428383} -08/30/2021 22:33:27 - INFO - __main__ - Step 51712: {'lr': 0.0003732603306913254, 'samples': 9928704, 'steps': 51711, 'loss/train': 1.8199025392532349} -08/30/2021 22:33:27 - INFO - __main__ - Step 51713: {'lr': 0.00037325571376470074, 'samples': 9928896, 'steps': 51712, 'loss/train': 0.43242818117141724} -08/30/2021 22:33:28 - INFO - __main__ - Step 51714: {'lr': 0.00037325109678253897, 'samples': 9929088, 'steps': 51713, 'loss/train': 1.3795090913772583} -08/30/2021 22:33:29 - INFO - __main__ - Step 51715: {'lr': 0.0003732464797448422, 'samples': 9929280, 'steps': 51714, 'loss/train': 2.0980629920959473} -08/30/2021 22:33:30 - INFO - __main__ - Step 51716: {'lr': 0.0003732418626516125, 'samples': 9929472, 'steps': 51715, 'loss/train': 1.4240823984146118} -08/30/2021 22:33:30 - INFO - __main__ - Step 51717: {'lr': 0.0003732372455028519, 'samples': 9929664, 'steps': 51716, 'loss/train': 0.6917343735694885} -08/30/2021 22:33:30 - INFO - __main__ - Step 51718: {'lr': 0.00037323262829856246, 'samples': 9929856, 'steps': 51717, 'loss/train': 1.3072789907455444} -08/30/2021 22:33:31 - INFO - __main__ - Step 51719: {'lr': 0.00037322801103874633, 'samples': 9930048, 'steps': 51718, 'loss/train': 0.7716614007949829} -08/30/2021 22:33:32 - INFO - __main__ - Step 51720: {'lr': 0.00037322339372340555, 'samples': 9930240, 'steps': 51719, 'loss/train': 1.0582247972488403} -08/30/2021 22:33:33 - INFO - __main__ - Step 51721: {'lr': 0.0003732187763525421, 'samples': 9930432, 'steps': 51720, 'loss/train': 1.6641348600387573} -08/30/2021 22:33:33 - INFO - __main__ - Step 51722: {'lr': 0.00037321415892615833, 'samples': 9930624, 'steps': 51721, 'loss/train': 0.6993993520736694} -08/30/2021 22:33:33 - INFO - __main__ - Step 51723: {'lr': 0.0003732095414442561, 'samples': 9930816, 'steps': 51722, 'loss/train': 1.1004928350448608} -08/30/2021 22:33:34 - INFO - __main__ - Step 51724: {'lr': 0.00037320492390683756, 'samples': 9931008, 'steps': 51723, 'loss/train': 0.07755095511674881} -08/30/2021 22:33:35 - INFO - __main__ - Step 51725: {'lr': 0.00037320030631390476, 'samples': 9931200, 'steps': 51724, 'loss/train': 1.4266318082809448} -08/30/2021 22:33:36 - INFO - __main__ - Step 51726: {'lr': 0.00037319568866545983, 'samples': 9931392, 'steps': 51725, 'loss/train': 0.8921300768852234} -08/30/2021 22:33:36 - INFO - __main__ - Step 51727: {'lr': 0.00037319107096150483, 'samples': 9931584, 'steps': 51726, 'loss/train': 0.575541615486145} -08/30/2021 22:33:37 - INFO - __main__ - Step 51728: {'lr': 0.00037318645320204183, 'samples': 9931776, 'steps': 51727, 'loss/train': 1.354965329170227} -08/30/2021 22:33:37 - INFO - __main__ - Step 51729: {'lr': 0.0003731818353870729, 'samples': 9931968, 'steps': 51728, 'loss/train': 3.0695176124572754} -08/30/2021 22:33:37 - INFO - __main__ - Step 51730: {'lr': 0.00037317721751660014, 'samples': 9932160, 'steps': 51729, 'loss/train': 3.347961187362671} -08/30/2021 22:33:39 - INFO - __main__ - Step 51731: {'lr': 0.00037317259959062564, 'samples': 9932352, 'steps': 51730, 'loss/train': 0.39453622698783875} -08/30/2021 22:33:39 - INFO - __main__ - Step 51732: {'lr': 0.0003731679816091514, 'samples': 9932544, 'steps': 51731, 'loss/train': 1.9897546768188477} -08/30/2021 22:33:40 - INFO - __main__ - Step 51733: {'lr': 0.00037316336357217966, 'samples': 9932736, 'steps': 51732, 'loss/train': 1.697346568107605} -08/30/2021 22:33:40 - INFO - __main__ - Step 51734: {'lr': 0.0003731587454797124, 'samples': 9932928, 'steps': 51733, 'loss/train': 1.220609188079834} -08/30/2021 22:33:40 - INFO - __main__ - Step 51735: {'lr': 0.0003731541273317517, 'samples': 9933120, 'steps': 51734, 'loss/train': 1.3236980438232422} -08/30/2021 22:33:42 - INFO - __main__ - Step 51736: {'lr': 0.0003731495091282996, 'samples': 9933312, 'steps': 51735, 'loss/train': 1.49858558177948} -08/30/2021 22:33:42 - INFO - __main__ - Step 51737: {'lr': 0.0003731448908693583, 'samples': 9933504, 'steps': 51736, 'loss/train': 1.320495367050171} -08/30/2021 22:33:43 - INFO - __main__ - Step 51738: {'lr': 0.0003731402725549298, 'samples': 9933696, 'steps': 51737, 'loss/train': 1.24888277053833} -08/30/2021 22:33:43 - INFO - __main__ - Step 51739: {'lr': 0.0003731356541850162, 'samples': 9933888, 'steps': 51738, 'loss/train': 1.5330533981323242} -08/30/2021 22:33:43 - INFO - __main__ - Step 51740: {'lr': 0.0003731310357596195, 'samples': 9934080, 'steps': 51739, 'loss/train': 1.260166883468628} -08/30/2021 22:33:45 - INFO - __main__ - Step 51741: {'lr': 0.0003731264172787419, 'samples': 9934272, 'steps': 51740, 'loss/train': 1.1915870904922485} -08/30/2021 22:33:45 - INFO - __main__ - Step 51742: {'lr': 0.0003731217987423854, 'samples': 9934464, 'steps': 51741, 'loss/train': 1.5375360250473022} -08/30/2021 22:33:46 - INFO - __main__ - Step 51743: {'lr': 0.00037311718015055215, 'samples': 9934656, 'steps': 51742, 'loss/train': 1.421510934829712} -08/30/2021 22:33:46 - INFO - __main__ - Step 51744: {'lr': 0.0003731125615032442, 'samples': 9934848, 'steps': 51743, 'loss/train': 1.353835105895996} -08/30/2021 22:33:46 - INFO - __main__ - Step 51745: {'lr': 0.0003731079428004637, 'samples': 9935040, 'steps': 51744, 'loss/train': 1.5584110021591187} -08/30/2021 22:33:47 - INFO - __main__ - Step 51746: {'lr': 0.00037310332404221256, 'samples': 9935232, 'steps': 51745, 'loss/train': 1.5493760108947754} -08/30/2021 22:33:49 - INFO - __main__ - Step 51747: {'lr': 0.000373098705228493, 'samples': 9935424, 'steps': 51746, 'loss/train': 1.2706648111343384} -08/30/2021 22:33:49 - INFO - __main__ - Step 51748: {'lr': 0.00037309408635930705, 'samples': 9935616, 'steps': 51747, 'loss/train': 0.3625568747520447} -08/30/2021 22:33:49 - INFO - __main__ - Step 51749: {'lr': 0.0003730894674346568, 'samples': 9935808, 'steps': 51748, 'loss/train': 1.7290058135986328} -08/30/2021 22:33:50 - INFO - __main__ - Step 51750: {'lr': 0.00037308484845454434, 'samples': 9936000, 'steps': 51749, 'loss/train': 1.467778205871582} -08/30/2021 22:33:50 - INFO - __main__ - Step 51751: {'lr': 0.0003730802294189718, 'samples': 9936192, 'steps': 51750, 'loss/train': 1.6475639343261719} -08/30/2021 22:33:51 - INFO - __main__ - Step 51752: {'lr': 0.00037307561032794113, 'samples': 9936384, 'steps': 51751, 'loss/train': 0.9193523526191711} -08/30/2021 22:33:52 - INFO - __main__ - Step 51753: {'lr': 0.0003730709911814545, 'samples': 9936576, 'steps': 51752, 'loss/train': 1.5737004280090332} -08/30/2021 22:33:52 - INFO - __main__ - Step 51754: {'lr': 0.000373066371979514, 'samples': 9936768, 'steps': 51753, 'loss/train': 1.540323257446289} -08/30/2021 22:33:53 - INFO - __main__ - Step 51755: {'lr': 0.00037306175272212166, 'samples': 9936960, 'steps': 51754, 'loss/train': 1.3289436101913452} -08/30/2021 22:33:53 - INFO - __main__ - Step 51756: {'lr': 0.0003730571334092796, 'samples': 9937152, 'steps': 51755, 'loss/train': 0.7925437092781067} -08/30/2021 22:33:54 - INFO - __main__ - Step 51757: {'lr': 0.00037305251404099, 'samples': 9937344, 'steps': 51756, 'loss/train': 0.5316606163978577} -08/30/2021 22:33:55 - INFO - __main__ - Step 51758: {'lr': 0.00037304789461725473, 'samples': 9937536, 'steps': 51757, 'loss/train': 1.3171734809875488} -08/30/2021 22:33:55 - INFO - __main__ - Step 51759: {'lr': 0.000373043275138076, 'samples': 9937728, 'steps': 51758, 'loss/train': 0.9147374629974365} -08/30/2021 22:33:56 - INFO - __main__ - Step 51760: {'lr': 0.00037303865560345587, 'samples': 9937920, 'steps': 51759, 'loss/train': 1.0636916160583496} -08/30/2021 22:33:56 - INFO - __main__ - Step 51761: {'lr': 0.00037303403601339643, 'samples': 9938112, 'steps': 51760, 'loss/train': 0.508759081363678} -08/30/2021 22:33:58 - INFO - __main__ - Step 51762: {'lr': 0.0003730294163678997, 'samples': 9938304, 'steps': 51761, 'loss/train': 1.5808589458465576} -08/30/2021 22:33:58 - INFO - __main__ - Step 51763: {'lr': 0.00037302479666696787, 'samples': 9938496, 'steps': 51762, 'loss/train': 1.274237871170044} -08/30/2021 22:33:58 - INFO - __main__ - Step 51764: {'lr': 0.000373020176910603, 'samples': 9938688, 'steps': 51763, 'loss/train': 0.7507188320159912} -08/30/2021 22:33:59 - INFO - __main__ - Step 51765: {'lr': 0.00037301555709880706, 'samples': 9938880, 'steps': 51764, 'loss/train': 1.6534377336502075} -08/30/2021 22:33:59 - INFO - __main__ - Step 51766: {'lr': 0.00037301093723158223, 'samples': 9939072, 'steps': 51765, 'loss/train': 0.9131073355674744} -08/30/2021 22:33:59 - INFO - __main__ - Step 51767: {'lr': 0.0003730063173089306, 'samples': 9939264, 'steps': 51766, 'loss/train': 2.0918335914611816} -08/30/2021 22:34:02 - INFO - __main__ - Step 51768: {'lr': 0.0003730016973308542, 'samples': 9939456, 'steps': 51767, 'loss/train': 1.227973222732544} -08/30/2021 22:34:02 - INFO - __main__ - Step 51769: {'lr': 0.0003729970772973551, 'samples': 9939648, 'steps': 51768, 'loss/train': 1.1515026092529297} -08/30/2021 22:34:02 - INFO - __main__ - Step 51770: {'lr': 0.00037299245720843544, 'samples': 9939840, 'steps': 51769, 'loss/train': 1.055242657661438} -08/30/2021 22:34:03 - INFO - __main__ - Step 51771: {'lr': 0.0003729878370640973, 'samples': 9940032, 'steps': 51770, 'loss/train': 0.9286774396896362} -08/30/2021 22:34:03 - INFO - __main__ - Step 51772: {'lr': 0.0003729832168643428, 'samples': 9940224, 'steps': 51771, 'loss/train': 1.4751461744308472} -08/30/2021 22:34:06 - INFO - __main__ - Step 51773: {'lr': 0.00037297859660917384, 'samples': 9940416, 'steps': 51772, 'loss/train': 1.6746792793273926} -08/30/2021 22:34:06 - INFO - __main__ - Step 51774: {'lr': 0.00037297397629859266, 'samples': 9940608, 'steps': 51773, 'loss/train': 1.4278478622436523} -08/30/2021 22:34:07 - INFO - __main__ - Step 51775: {'lr': 0.0003729693559326013, 'samples': 9940800, 'steps': 51774, 'loss/train': 1.2316800355911255} -08/30/2021 22:34:07 - INFO - __main__ - Step 51776: {'lr': 0.00037296473551120185, 'samples': 9940992, 'steps': 51775, 'loss/train': 1.0251357555389404} -08/30/2021 22:34:07 - INFO - __main__ - Step 51777: {'lr': 0.00037296011503439643, 'samples': 9941184, 'steps': 51776, 'loss/train': 1.8975722789764404} -08/30/2021 22:34:08 - INFO - __main__ - Step 51778: {'lr': 0.00037295549450218704, 'samples': 9941376, 'steps': 51777, 'loss/train': 0.37099891901016235} -08/30/2021 22:34:08 - INFO - __main__ - Step 51779: {'lr': 0.0003729508739145758, 'samples': 9941568, 'steps': 51778, 'loss/train': 0.3667130172252655} -08/30/2021 22:34:10 - INFO - __main__ - Step 51780: {'lr': 0.0003729462532715648, 'samples': 9941760, 'steps': 51779, 'loss/train': 0.33669188618659973} -08/30/2021 22:34:10 - INFO - __main__ - Step 51781: {'lr': 0.0003729416325731561, 'samples': 9941952, 'steps': 51780, 'loss/train': 2.044456720352173} -08/30/2021 22:34:10 - INFO - __main__ - Step 51782: {'lr': 0.0003729370118193518, 'samples': 9942144, 'steps': 51781, 'loss/train': 1.579751968383789} -08/30/2021 22:34:11 - INFO - __main__ - Step 51783: {'lr': 0.00037293239101015397, 'samples': 9942336, 'steps': 51782, 'loss/train': 0.8203944563865662} -08/30/2021 22:34:11 - INFO - __main__ - Step 51784: {'lr': 0.0003729277701455648, 'samples': 9942528, 'steps': 51783, 'loss/train': 1.1906901597976685} -08/30/2021 22:34:12 - INFO - __main__ - Step 51785: {'lr': 0.00037292314922558615, 'samples': 9942720, 'steps': 51784, 'loss/train': 1.8912532329559326} -08/30/2021 22:34:13 - INFO - __main__ - Step 51786: {'lr': 0.0003729185282502203, 'samples': 9942912, 'steps': 51785, 'loss/train': 0.4631793797016144} -08/30/2021 22:34:13 - INFO - __main__ - Step 51787: {'lr': 0.00037291390721946914, 'samples': 9943104, 'steps': 51786, 'loss/train': 1.1479171514511108} -08/30/2021 22:34:14 - INFO - __main__ - Step 51788: {'lr': 0.00037290928613333495, 'samples': 9943296, 'steps': 51787, 'loss/train': 1.2784167528152466} -08/30/2021 22:34:14 - INFO - __main__ - Step 51789: {'lr': 0.00037290466499181977, 'samples': 9943488, 'steps': 51788, 'loss/train': 0.28819194436073303} -08/30/2021 22:34:14 - INFO - __main__ - Step 51790: {'lr': 0.0003729000437949256, 'samples': 9943680, 'steps': 51789, 'loss/train': 1.7119340896606445} -08/30/2021 22:34:16 - INFO - __main__ - Step 51791: {'lr': 0.0003728954225426546, 'samples': 9943872, 'steps': 51790, 'loss/train': 1.2977453470230103} -08/30/2021 22:34:17 - INFO - __main__ - Step 51792: {'lr': 0.00037289080123500886, 'samples': 9944064, 'steps': 51791, 'loss/train': 1.437566876411438} -08/30/2021 22:34:17 - INFO - __main__ - Step 51793: {'lr': 0.0003728861798719903, 'samples': 9944256, 'steps': 51792, 'loss/train': 0.8412335515022278} -08/30/2021 22:34:17 - INFO - __main__ - Step 51794: {'lr': 0.00037288155845360116, 'samples': 9944448, 'steps': 51793, 'loss/train': 1.403337836265564} -08/30/2021 22:34:18 - INFO - __main__ - Step 51795: {'lr': 0.00037287693697984355, 'samples': 9944640, 'steps': 51794, 'loss/train': 1.5479451417922974} -08/30/2021 22:34:19 - INFO - __main__ - Step 51796: {'lr': 0.0003728723154507195, 'samples': 9944832, 'steps': 51795, 'loss/train': 1.93978750705719} -08/30/2021 22:34:20 - INFO - __main__ - Step 51797: {'lr': 0.000372867693866231, 'samples': 9945024, 'steps': 51796, 'loss/train': 1.2946497201919556} -08/30/2021 22:34:20 - INFO - __main__ - Step 51798: {'lr': 0.0003728630722263803, 'samples': 9945216, 'steps': 51797, 'loss/train': 1.226035714149475} -08/30/2021 22:34:20 - INFO - __main__ - Step 51799: {'lr': 0.0003728584505311693, 'samples': 9945408, 'steps': 51798, 'loss/train': 1.3603320121765137} -08/30/2021 22:34:21 - INFO - __main__ - Step 51800: {'lr': 0.0003728538287806002, 'samples': 9945600, 'steps': 51799, 'loss/train': 1.6623071432113647} -08/30/2021 22:34:22 - INFO - __main__ - Step 51801: {'lr': 0.00037284920697467505, 'samples': 9945792, 'steps': 51800, 'loss/train': 1.3876612186431885} -08/30/2021 22:34:23 - INFO - __main__ - Step 51802: {'lr': 0.00037284458511339604, 'samples': 9945984, 'steps': 51801, 'loss/train': 1.4863940477371216} -08/30/2021 22:34:23 - INFO - __main__ - Step 51803: {'lr': 0.00037283996319676505, 'samples': 9946176, 'steps': 51802, 'loss/train': 1.1048009395599365} -08/30/2021 22:34:23 - INFO - __main__ - Step 51804: {'lr': 0.0003728353412247843, 'samples': 9946368, 'steps': 51803, 'loss/train': 1.4630974531173706} -08/30/2021 22:34:24 - INFO - __main__ - Step 51805: {'lr': 0.0003728307191974558, 'samples': 9946560, 'steps': 51804, 'loss/train': 1.4835635423660278} -08/30/2021 22:34:25 - INFO - __main__ - Step 51806: {'lr': 0.00037282609711478175, 'samples': 9946752, 'steps': 51805, 'loss/train': 1.3914366960525513} -08/30/2021 22:34:26 - INFO - __main__ - Step 51807: {'lr': 0.00037282147497676415, 'samples': 9946944, 'steps': 51806, 'loss/train': 1.6220390796661377} -08/30/2021 22:34:26 - INFO - __main__ - Step 51808: {'lr': 0.000372816852783405, 'samples': 9947136, 'steps': 51807, 'loss/train': 1.3874956369400024} -08/30/2021 22:34:26 - INFO - __main__ - Step 51809: {'lr': 0.0003728122305347066, 'samples': 9947328, 'steps': 51808, 'loss/train': 1.1157251596450806} -08/30/2021 22:34:27 - INFO - __main__ - Step 51810: {'lr': 0.00037280760823067086, 'samples': 9947520, 'steps': 51809, 'loss/train': 1.3168820142745972} -08/30/2021 22:34:28 - INFO - __main__ - Step 51811: {'lr': 0.00037280298587129984, 'samples': 9947712, 'steps': 51810, 'loss/train': 0.6487297415733337} -08/30/2021 22:34:29 - INFO - __main__ - Step 51812: {'lr': 0.0003727983634565958, 'samples': 9947904, 'steps': 51811, 'loss/train': 1.470218300819397} -08/30/2021 22:34:29 - INFO - __main__ - Step 51813: {'lr': 0.0003727937409865606, 'samples': 9948096, 'steps': 51812, 'loss/train': 0.892719566822052} -08/30/2021 22:34:29 - INFO - __main__ - Step 51814: {'lr': 0.0003727891184611965, 'samples': 9948288, 'steps': 51813, 'loss/train': 1.0866458415985107} -08/30/2021 22:34:30 - INFO - __main__ - Step 51815: {'lr': 0.0003727844958805055, 'samples': 9948480, 'steps': 51814, 'loss/train': 1.1836897134780884} -08/30/2021 22:34:31 - INFO - __main__ - Step 51816: {'lr': 0.0003727798732444897, 'samples': 9948672, 'steps': 51815, 'loss/train': 1.414215087890625} -08/30/2021 22:34:32 - INFO - __main__ - Step 51817: {'lr': 0.00037277525055315114, 'samples': 9948864, 'steps': 51816, 'loss/train': 2.360086441040039} -08/30/2021 22:34:32 - INFO - __main__ - Step 51818: {'lr': 0.0003727706278064921, 'samples': 9949056, 'steps': 51817, 'loss/train': 1.2951818704605103} -08/30/2021 22:34:32 - INFO - __main__ - Step 51819: {'lr': 0.00037276600500451434, 'samples': 9949248, 'steps': 51818, 'loss/train': 1.3951317071914673} -08/30/2021 22:34:33 - INFO - __main__ - Step 51820: {'lr': 0.00037276138214722016, 'samples': 9949440, 'steps': 51819, 'loss/train': 1.3718186616897583} -08/30/2021 22:34:33 - INFO - __main__ - Step 51821: {'lr': 0.0003727567592346116, 'samples': 9949632, 'steps': 51820, 'loss/train': 0.9237263202667236} -08/30/2021 22:34:35 - INFO - __main__ - Step 51822: {'lr': 0.00037275213626669076, 'samples': 9949824, 'steps': 51821, 'loss/train': 1.4530959129333496} -08/30/2021 22:34:36 - INFO - __main__ - Step 51823: {'lr': 0.00037274751324345966, 'samples': 9950016, 'steps': 51822, 'loss/train': 1.5151957273483276} -08/30/2021 22:34:36 - INFO - __main__ - Step 51824: {'lr': 0.0003727428901649205, 'samples': 9950208, 'steps': 51823, 'loss/train': 1.773315668106079} -08/30/2021 22:34:36 - INFO - __main__ - Step 51825: {'lr': 0.00037273826703107527, 'samples': 9950400, 'steps': 51824, 'loss/train': 1.4654994010925293} -08/30/2021 22:34:37 - INFO - __main__ - Step 51826: {'lr': 0.000372733643841926, 'samples': 9950592, 'steps': 51825, 'loss/train': 1.6336032152175903} -08/30/2021 22:34:39 - INFO - __main__ - Step 51827: {'lr': 0.00037272902059747487, 'samples': 9950784, 'steps': 51826, 'loss/train': 0.771109402179718} -08/30/2021 22:34:39 - INFO - __main__ - Step 51828: {'lr': 0.00037272439729772397, 'samples': 9950976, 'steps': 51827, 'loss/train': 1.550333023071289} -08/30/2021 22:34:40 - INFO - __main__ - Step 51829: {'lr': 0.00037271977394267534, 'samples': 9951168, 'steps': 51828, 'loss/train': 0.03464927524328232} -08/30/2021 22:34:40 - INFO - __main__ - Step 51830: {'lr': 0.0003727151505323311, 'samples': 9951360, 'steps': 51829, 'loss/train': 0.025755373761057854} -08/30/2021 22:34:40 - INFO - __main__ - Step 51831: {'lr': 0.0003727105270666933, 'samples': 9951552, 'steps': 51830, 'loss/train': 1.8752171993255615} -08/30/2021 22:34:41 - INFO - __main__ - Step 51832: {'lr': 0.00037270590354576396, 'samples': 9951744, 'steps': 51831, 'loss/train': 1.1250269412994385} -08/30/2021 22:34:42 - INFO - __main__ - Step 51833: {'lr': 0.0003727012799695453, 'samples': 9951936, 'steps': 51832, 'loss/train': 1.627541184425354} -08/30/2021 22:34:43 - INFO - __main__ - Step 51834: {'lr': 0.0003726966563380393, 'samples': 9952128, 'steps': 51833, 'loss/train': 1.692149043083191} -08/30/2021 22:34:43 - INFO - __main__ - Step 51835: {'lr': 0.00037269203265124807, 'samples': 9952320, 'steps': 51834, 'loss/train': 1.229498267173767} -08/30/2021 22:34:44 - INFO - __main__ - Step 51836: {'lr': 0.00037268740890917374, 'samples': 9952512, 'steps': 51835, 'loss/train': 0.7132439613342285} -08/30/2021 22:34:44 - INFO - __main__ - Step 51837: {'lr': 0.0003726827851118183, 'samples': 9952704, 'steps': 51836, 'loss/train': 1.7350763082504272} -08/30/2021 22:34:44 - INFO - __main__ - Step 51838: {'lr': 0.00037267816125918394, 'samples': 9952896, 'steps': 51837, 'loss/train': 1.4118082523345947} -08/30/2021 22:34:46 - INFO - __main__ - Step 51839: {'lr': 0.00037267353735127276, 'samples': 9953088, 'steps': 51838, 'loss/train': 0.5707834959030151} -08/30/2021 22:34:46 - INFO - __main__ - Step 51840: {'lr': 0.00037266891338808667, 'samples': 9953280, 'steps': 51839, 'loss/train': 1.6818580627441406} -08/30/2021 22:34:47 - INFO - __main__ - Step 51841: {'lr': 0.00037266428936962785, 'samples': 9953472, 'steps': 51840, 'loss/train': 1.5431554317474365} -08/30/2021 22:34:47 - INFO - __main__ - Step 51842: {'lr': 0.00037265966529589846, 'samples': 9953664, 'steps': 51841, 'loss/train': 1.2983708381652832} -08/30/2021 22:34:47 - INFO - __main__ - Step 51843: {'lr': 0.0003726550411669005, 'samples': 9953856, 'steps': 51842, 'loss/train': 1.130833625793457} -08/30/2021 22:34:49 - INFO - __main__ - Step 51844: {'lr': 0.000372650416982636, 'samples': 9954048, 'steps': 51843, 'loss/train': 1.2864400148391724} -08/30/2021 22:34:50 - INFO - __main__ - Step 51845: {'lr': 0.0003726457927431073, 'samples': 9954240, 'steps': 51844, 'loss/train': 1.660396695137024} -08/30/2021 22:34:50 - INFO - __main__ - Step 51846: {'lr': 0.0003726411684483161, 'samples': 9954432, 'steps': 51845, 'loss/train': 0.02651946246623993} -08/30/2021 22:34:51 - INFO - __main__ - Step 51847: {'lr': 0.0003726365440982648, 'samples': 9954624, 'steps': 51846, 'loss/train': 0.06892168521881104} -08/30/2021 22:34:51 - INFO - __main__ - Step 51848: {'lr': 0.00037263191969295537, 'samples': 9954816, 'steps': 51847, 'loss/train': 2.1675353050231934} -08/30/2021 22:34:51 - INFO - __main__ - Step 51849: {'lr': 0.0003726272952323898, 'samples': 9955008, 'steps': 51848, 'loss/train': 0.35434576869010925} -08/30/2021 22:34:53 - INFO - __main__ - Step 51850: {'lr': 0.0003726226707165703, 'samples': 9955200, 'steps': 51849, 'loss/train': 1.1533006429672241} -08/30/2021 22:34:53 - INFO - __main__ - Step 51851: {'lr': 0.000372618046145499, 'samples': 9955392, 'steps': 51850, 'loss/train': 1.7156795263290405} -08/30/2021 22:34:54 - INFO - __main__ - Step 51852: {'lr': 0.0003726134215191778, 'samples': 9955584, 'steps': 51851, 'loss/train': 0.8948954939842224} -08/30/2021 22:34:54 - INFO - __main__ - Step 51853: {'lr': 0.0003726087968376089, 'samples': 9955776, 'steps': 51852, 'loss/train': 1.0862714052200317} -08/30/2021 22:34:55 - INFO - __main__ - Step 51854: {'lr': 0.0003726041721007944, 'samples': 9955968, 'steps': 51853, 'loss/train': 1.7077580690383911} -08/30/2021 22:34:56 - INFO - __main__ - Step 51855: {'lr': 0.0003725995473087363, 'samples': 9956160, 'steps': 51854, 'loss/train': 1.6299303770065308} -08/30/2021 22:34:57 - INFO - __main__ - Step 51856: {'lr': 0.0003725949224614368, 'samples': 9956352, 'steps': 51855, 'loss/train': 1.7085137367248535} -08/30/2021 22:34:57 - INFO - __main__ - Step 51857: {'lr': 0.00037259029755889783, 'samples': 9956544, 'steps': 51856, 'loss/train': 1.4361802339553833} -08/30/2021 22:34:58 - INFO - __main__ - Step 51858: {'lr': 0.00037258567260112165, 'samples': 9956736, 'steps': 51857, 'loss/train': 0.0754077360033989} -08/30/2021 22:34:58 - INFO - __main__ - Step 51859: {'lr': 0.00037258104758811024, 'samples': 9956928, 'steps': 51858, 'loss/train': 1.4254209995269775} -08/30/2021 22:34:59 - INFO - __main__ - Step 51860: {'lr': 0.00037257642251986567, 'samples': 9957120, 'steps': 51859, 'loss/train': 0.05069465562701225} -08/30/2021 22:35:00 - INFO - __main__ - Step 51861: {'lr': 0.00037257179739639006, 'samples': 9957312, 'steps': 51860, 'loss/train': 1.6155613660812378} -08/30/2021 22:35:00 - INFO - __main__ - Step 51862: {'lr': 0.00037256717221768556, 'samples': 9957504, 'steps': 51861, 'loss/train': 1.1297948360443115} -08/30/2021 22:35:01 - INFO - __main__ - Step 51863: {'lr': 0.0003725625469837541, 'samples': 9957696, 'steps': 51862, 'loss/train': 1.1255016326904297} -08/30/2021 22:35:01 - INFO - __main__ - Step 51864: {'lr': 0.00037255792169459785, 'samples': 9957888, 'steps': 51863, 'loss/train': 1.4773226976394653} -08/30/2021 22:35:01 - INFO - __main__ - Step 51865: {'lr': 0.00037255329635021896, 'samples': 9958080, 'steps': 51864, 'loss/train': 1.4688013792037964} -08/30/2021 22:35:03 - INFO - __main__ - Step 51866: {'lr': 0.0003725486709506194, 'samples': 9958272, 'steps': 51865, 'loss/train': 1.5012935400009155} -08/30/2021 22:35:04 - INFO - __main__ - Step 51867: {'lr': 0.0003725440454958013, 'samples': 9958464, 'steps': 51866, 'loss/train': 1.6771867275238037} -08/30/2021 22:35:04 - INFO - __main__ - Step 51868: {'lr': 0.0003725394199857667, 'samples': 9958656, 'steps': 51867, 'loss/train': 0.592327356338501} -08/30/2021 22:35:04 - INFO - __main__ - Step 51869: {'lr': 0.0003725347944205178, 'samples': 9958848, 'steps': 51868, 'loss/train': 0.18364876508712769} -08/30/2021 22:35:05 - INFO - __main__ - Step 51870: {'lr': 0.0003725301688000566, 'samples': 9959040, 'steps': 51869, 'loss/train': 0.5639804005622864} -08/30/2021 22:35:06 - INFO - __main__ - Step 51871: {'lr': 0.0003725255431243852, 'samples': 9959232, 'steps': 51870, 'loss/train': 1.3463943004608154} -08/30/2021 22:35:07 - INFO - __main__ - Step 51872: {'lr': 0.00037252091739350566, 'samples': 9959424, 'steps': 51871, 'loss/train': 0.9146784543991089} -08/30/2021 22:35:07 - INFO - __main__ - Step 51873: {'lr': 0.0003725162916074201, 'samples': 9959616, 'steps': 51872, 'loss/train': 1.3303477764129639} -08/30/2021 22:35:07 - INFO - __main__ - Step 51874: {'lr': 0.0003725116657661306, 'samples': 9959808, 'steps': 51873, 'loss/train': 1.2069082260131836} -08/30/2021 22:35:08 - INFO - __main__ - Step 51875: {'lr': 0.00037250703986963917, 'samples': 9960000, 'steps': 51874, 'loss/train': 0.5643643736839294} -08/30/2021 22:35:10 - INFO - __main__ - Step 51876: {'lr': 0.000372502413917948, 'samples': 9960192, 'steps': 51875, 'loss/train': 1.7402911186218262} -08/30/2021 22:35:10 - INFO - __main__ - Step 51877: {'lr': 0.00037249778791105916, 'samples': 9960384, 'steps': 51876, 'loss/train': 1.5554461479187012} -08/30/2021 22:35:10 - INFO - __main__ - Step 51878: {'lr': 0.0003724931618489747, 'samples': 9960576, 'steps': 51877, 'loss/train': 1.2836854457855225} -08/30/2021 22:35:11 - INFO - __main__ - Step 51879: {'lr': 0.0003724885357316967, 'samples': 9960768, 'steps': 51878, 'loss/train': 0.6971196532249451} -08/30/2021 22:35:11 - INFO - __main__ - Step 51880: {'lr': 0.00037248390955922726, 'samples': 9960960, 'steps': 51879, 'loss/train': 1.4496119022369385} -08/30/2021 22:35:13 - INFO - __main__ - Step 51881: {'lr': 0.00037247928333156844, 'samples': 9961152, 'steps': 51880, 'loss/train': 1.3063400983810425} -08/30/2021 22:35:13 - INFO - __main__ - Step 51882: {'lr': 0.0003724746570487223, 'samples': 9961344, 'steps': 51881, 'loss/train': 1.3679530620574951} -08/30/2021 22:35:14 - INFO - __main__ - Step 51883: {'lr': 0.00037247003071069106, 'samples': 9961536, 'steps': 51882, 'loss/train': 1.1247488260269165} -08/30/2021 22:35:14 - INFO - __main__ - Step 51884: {'lr': 0.0003724654043174767, 'samples': 9961728, 'steps': 51883, 'loss/train': 1.2774298191070557} -08/30/2021 22:35:14 - INFO - __main__ - Step 51885: {'lr': 0.0003724607778690813, 'samples': 9961920, 'steps': 51884, 'loss/train': 1.5299878120422363} -08/30/2021 22:35:15 - INFO - __main__ - Step 51886: {'lr': 0.00037245615136550695, 'samples': 9962112, 'steps': 51885, 'loss/train': 1.7156078815460205} -08/30/2021 22:35:16 - INFO - __main__ - Step 51887: {'lr': 0.00037245152480675577, 'samples': 9962304, 'steps': 51886, 'loss/train': 0.4460705816745758} -08/30/2021 22:35:17 - INFO - __main__ - Step 51888: {'lr': 0.0003724468981928298, 'samples': 9962496, 'steps': 51887, 'loss/train': 1.4482715129852295} -08/30/2021 22:35:17 - INFO - __main__ - Step 51889: {'lr': 0.00037244227152373113, 'samples': 9962688, 'steps': 51888, 'loss/train': 0.8630905151367188} -08/30/2021 22:35:17 - INFO - __main__ - Step 51890: {'lr': 0.0003724376447994619, 'samples': 9962880, 'steps': 51889, 'loss/train': 1.7183257341384888} -08/30/2021 22:35:18 - INFO - __main__ - Step 51891: {'lr': 0.00037243301802002414, 'samples': 9963072, 'steps': 51890, 'loss/train': 1.396705150604248} -08/30/2021 22:35:19 - INFO - __main__ - Step 51892: {'lr': 0.00037242839118542, 'samples': 9963264, 'steps': 51891, 'loss/train': 1.525964617729187} -08/30/2021 22:35:20 - INFO - __main__ - Step 51893: {'lr': 0.00037242376429565143, 'samples': 9963456, 'steps': 51892, 'loss/train': 0.7317933440208435} -08/30/2021 22:35:20 - INFO - __main__ - Step 51894: {'lr': 0.0003724191373507206, 'samples': 9963648, 'steps': 51893, 'loss/train': 0.027184000238776207} -08/30/2021 22:35:21 - INFO - __main__ - Step 51895: {'lr': 0.00037241451035062965, 'samples': 9963840, 'steps': 51894, 'loss/train': 1.7417263984680176} -08/30/2021 22:35:21 - INFO - __main__ - Step 51896: {'lr': 0.0003724098832953806, 'samples': 9964032, 'steps': 51895, 'loss/train': 1.6496121883392334} -08/30/2021 22:35:22 - INFO - __main__ - Step 51897: {'lr': 0.00037240525618497555, 'samples': 9964224, 'steps': 51896, 'loss/train': 1.286798357963562} -08/30/2021 22:35:23 - INFO - __main__ - Step 51898: {'lr': 0.00037240062901941663, 'samples': 9964416, 'steps': 51897, 'loss/train': 1.3271620273590088} -08/30/2021 22:35:23 - INFO - __main__ - Step 51899: {'lr': 0.0003723960017987058, 'samples': 9964608, 'steps': 51898, 'loss/train': 1.5280787944793701} -08/30/2021 22:35:24 - INFO - __main__ - Step 51900: {'lr': 0.00037239137452284527, 'samples': 9964800, 'steps': 51899, 'loss/train': 2.311554193496704} -08/30/2021 22:35:24 - INFO - __main__ - Step 51901: {'lr': 0.0003723867471918371, 'samples': 9964992, 'steps': 51900, 'loss/train': 1.63205885887146} -08/30/2021 22:35:26 - INFO - __main__ - Step 51902: {'lr': 0.00037238211980568326, 'samples': 9965184, 'steps': 51901, 'loss/train': 1.3498841524124146} -08/30/2021 22:35:26 - INFO - __main__ - Step 51903: {'lr': 0.00037237749236438593, 'samples': 9965376, 'steps': 51902, 'loss/train': 1.3161925077438354} -08/30/2021 22:35:26 - INFO - __main__ - Step 51904: {'lr': 0.0003723728648679472, 'samples': 9965568, 'steps': 51903, 'loss/train': 0.850733757019043} -08/30/2021 22:35:27 - INFO - __main__ - Step 51905: {'lr': 0.0003723682373163693, 'samples': 9965760, 'steps': 51904, 'loss/train': 1.23153817653656} -08/30/2021 22:35:27 - INFO - __main__ - Step 51906: {'lr': 0.0003723636097096539, 'samples': 9965952, 'steps': 51905, 'loss/train': 1.7081217765808105} -08/30/2021 22:35:27 - INFO - __main__ - Step 51907: {'lr': 0.00037235898204780347, 'samples': 9966144, 'steps': 51906, 'loss/train': 0.5396932363510132} -08/30/2021 22:35:29 - INFO - __main__ - Step 51908: {'lr': 0.00037235435433082004, 'samples': 9966336, 'steps': 51907, 'loss/train': 1.856209397315979} -08/30/2021 22:35:29 - INFO - __main__ - Step 51909: {'lr': 0.0003723497265587055, 'samples': 9966528, 'steps': 51908, 'loss/train': 1.919226884841919} -08/30/2021 22:35:30 - INFO - __main__ - Step 51910: {'lr': 0.0003723450987314622, 'samples': 9966720, 'steps': 51909, 'loss/train': 1.2813091278076172} -08/30/2021 22:35:30 - INFO - __main__ - Step 51911: {'lr': 0.00037234047084909195, 'samples': 9966912, 'steps': 51910, 'loss/train': 1.027509331703186} -08/30/2021 22:35:31 - INFO - __main__ - Step 51912: {'lr': 0.0003723358429115971, 'samples': 9967104, 'steps': 51911, 'loss/train': 1.440931797027588} -08/30/2021 22:35:32 - INFO - __main__ - Step 51913: {'lr': 0.00037233121491897953, 'samples': 9967296, 'steps': 51912, 'loss/train': 1.0619441270828247} -08/30/2021 22:35:33 - INFO - __main__ - Step 51914: {'lr': 0.00037232658687124135, 'samples': 9967488, 'steps': 51913, 'loss/train': 0.057625818997621536} -08/30/2021 22:35:33 - INFO - __main__ - Step 51915: {'lr': 0.00037232195876838484, 'samples': 9967680, 'steps': 51914, 'loss/train': 1.4565588235855103} -08/30/2021 22:35:33 - INFO - __main__ - Step 51916: {'lr': 0.00037231733061041176, 'samples': 9967872, 'steps': 51915, 'loss/train': 0.8500802516937256} -08/30/2021 22:35:34 - INFO - __main__ - Step 51917: {'lr': 0.0003723127023973245, 'samples': 9968064, 'steps': 51916, 'loss/train': 2.0979974269866943} -08/30/2021 22:35:35 - INFO - __main__ - Step 51918: {'lr': 0.00037230807412912505, 'samples': 9968256, 'steps': 51917, 'loss/train': 1.2710801362991333} -08/30/2021 22:35:36 - INFO - __main__ - Step 51919: {'lr': 0.00037230344580581543, 'samples': 9968448, 'steps': 51918, 'loss/train': 1.476787805557251} -08/30/2021 22:35:36 - INFO - __main__ - Step 51920: {'lr': 0.00037229881742739776, 'samples': 9968640, 'steps': 51919, 'loss/train': 1.0626276731491089} -08/30/2021 22:35:36 - INFO - __main__ - Step 51921: {'lr': 0.0003722941889938741, 'samples': 9968832, 'steps': 51920, 'loss/train': 0.6248576641082764} -08/30/2021 22:35:37 - INFO - __main__ - Step 51922: {'lr': 0.0003722895605052466, 'samples': 9969024, 'steps': 51921, 'loss/train': 0.8725528717041016} -08/30/2021 22:35:37 - INFO - __main__ - Step 51923: {'lr': 0.0003722849319615173, 'samples': 9969216, 'steps': 51922, 'loss/train': 1.7207883596420288} -08/30/2021 22:35:39 - INFO - __main__ - Step 51924: {'lr': 0.0003722803033626883, 'samples': 9969408, 'steps': 51923, 'loss/train': 1.4032286405563354} -08/30/2021 22:35:39 - INFO - __main__ - Step 51925: {'lr': 0.0003722756747087617, 'samples': 9969600, 'steps': 51924, 'loss/train': 1.3273437023162842} -08/30/2021 22:35:40 - INFO - __main__ - Step 51926: {'lr': 0.0003722710459997395, 'samples': 9969792, 'steps': 51925, 'loss/train': 0.8548556566238403} -08/30/2021 22:35:40 - INFO - __main__ - Step 51927: {'lr': 0.00037226641723562393, 'samples': 9969984, 'steps': 51926, 'loss/train': 1.0427029132843018} -08/30/2021 22:35:40 - INFO - __main__ - Step 51928: {'lr': 0.000372261788416417, 'samples': 9970176, 'steps': 51927, 'loss/train': 0.09846016764640808} -08/30/2021 22:35:42 - INFO - __main__ - Step 51929: {'lr': 0.00037225715954212075, 'samples': 9970368, 'steps': 51928, 'loss/train': 0.4199332892894745} -08/30/2021 22:35:42 - INFO - __main__ - Step 51930: {'lr': 0.00037225253061273734, 'samples': 9970560, 'steps': 51929, 'loss/train': 1.4638190269470215} -08/30/2021 22:35:43 - INFO - __main__ - Step 51931: {'lr': 0.0003722479016282688, 'samples': 9970752, 'steps': 51930, 'loss/train': 0.0759798064827919} -08/30/2021 22:35:43 - INFO - __main__ - Step 51932: {'lr': 0.00037224327258871724, 'samples': 9970944, 'steps': 51931, 'loss/train': 1.5944095849990845} -08/30/2021 22:35:43 - INFO - __main__ - Step 51933: {'lr': 0.00037223864349408484, 'samples': 9971136, 'steps': 51932, 'loss/train': 1.1476593017578125} -08/30/2021 22:35:44 - INFO - __main__ - Step 51934: {'lr': 0.0003722340143443735, 'samples': 9971328, 'steps': 51933, 'loss/train': 1.0609651803970337} -08/30/2021 22:35:46 - INFO - __main__ - Step 51935: {'lr': 0.0003722293851395854, 'samples': 9971520, 'steps': 51934, 'loss/train': 1.1517436504364014} -08/30/2021 22:35:46 - INFO - __main__ - Step 51936: {'lr': 0.00037222475587972263, 'samples': 9971712, 'steps': 51935, 'loss/train': 0.8537135720252991} -08/30/2021 22:35:47 - INFO - __main__ - Step 51937: {'lr': 0.00037222012656478733, 'samples': 9971904, 'steps': 51936, 'loss/train': 0.8171143531799316} -08/30/2021 22:35:47 - INFO - __main__ - Step 51938: {'lr': 0.00037221549719478145, 'samples': 9972096, 'steps': 51937, 'loss/train': 1.122235655784607} -08/30/2021 22:35:48 - INFO - __main__ - Step 51939: {'lr': 0.0003722108677697072, 'samples': 9972288, 'steps': 51938, 'loss/train': 0.7304782867431641} -08/30/2021 22:35:49 - INFO - __main__ - Step 51940: {'lr': 0.00037220623828956655, 'samples': 9972480, 'steps': 51939, 'loss/train': 1.3031141757965088} -08/30/2021 22:35:50 - INFO - __main__ - Step 51941: {'lr': 0.00037220160875436176, 'samples': 9972672, 'steps': 51940, 'loss/train': 1.3918569087982178} -08/30/2021 22:35:50 - INFO - __main__ - Step 51942: {'lr': 0.0003721969791640948, 'samples': 9972864, 'steps': 51941, 'loss/train': 1.4810817241668701} -08/30/2021 22:35:50 - INFO - __main__ - Step 51943: {'lr': 0.0003721923495187677, 'samples': 9973056, 'steps': 51942, 'loss/train': 1.3126007318496704} -08/30/2021 22:35:51 - INFO - __main__ - Step 51944: {'lr': 0.00037218771981838264, 'samples': 9973248, 'steps': 51943, 'loss/train': 1.2253798246383667} -08/30/2021 22:35:51 - INFO - __main__ - Step 51945: {'lr': 0.0003721830900629416, 'samples': 9973440, 'steps': 51944, 'loss/train': 2.083449363708496} -08/30/2021 22:35:53 - INFO - __main__ - Step 51946: {'lr': 0.00037217846025244686, 'samples': 9973632, 'steps': 51945, 'loss/train': 1.0989153385162354} -08/30/2021 22:35:53 - INFO - __main__ - Step 51947: {'lr': 0.0003721738303869004, 'samples': 9973824, 'steps': 51946, 'loss/train': 1.8225184679031372} -08/30/2021 22:35:53 - INFO - __main__ - Step 51948: {'lr': 0.0003721692004663042, 'samples': 9974016, 'steps': 51947, 'loss/train': 0.9767679572105408} -08/30/2021 22:35:54 - INFO - __main__ - Step 51949: {'lr': 0.0003721645704906605, 'samples': 9974208, 'steps': 51948, 'loss/train': 1.4346401691436768} -08/30/2021 22:35:54 - INFO - __main__ - Step 51950: {'lr': 0.0003721599404599713, 'samples': 9974400, 'steps': 51949, 'loss/train': 0.3948131501674652} -08/30/2021 22:35:56 - INFO - __main__ - Step 51951: {'lr': 0.0003721553103742388, 'samples': 9974592, 'steps': 51950, 'loss/train': 1.1726425886154175} -08/30/2021 22:35:56 - INFO - __main__ - Step 51952: {'lr': 0.00037215068023346495, 'samples': 9974784, 'steps': 51951, 'loss/train': 1.3587422370910645} -08/30/2021 22:35:57 - INFO - __main__ - Step 51953: {'lr': 0.0003721460500376518, 'samples': 9974976, 'steps': 51952, 'loss/train': 1.444991111755371} -08/30/2021 22:35:57 - INFO - __main__ - Step 51954: {'lr': 0.00037214141978680166, 'samples': 9975168, 'steps': 51953, 'loss/train': 1.0682071447372437} -08/30/2021 22:35:57 - INFO - __main__ - Step 51955: {'lr': 0.00037213678948091637, 'samples': 9975360, 'steps': 51954, 'loss/train': 1.6608946323394775} -08/30/2021 22:35:59 - INFO - __main__ - Step 51956: {'lr': 0.0003721321591199982, 'samples': 9975552, 'steps': 51955, 'loss/train': 0.06225641071796417} -08/30/2021 22:36:00 - INFO - __main__ - Step 51957: {'lr': 0.00037212752870404917, 'samples': 9975744, 'steps': 51956, 'loss/train': 1.4211546182632446} -08/30/2021 22:36:00 - INFO - __main__ - Step 51958: {'lr': 0.0003721228982330713, 'samples': 9975936, 'steps': 51957, 'loss/train': 1.5941846370697021} -08/30/2021 22:36:00 - INFO - __main__ - Step 51959: {'lr': 0.0003721182677070668, 'samples': 9976128, 'steps': 51958, 'loss/train': 0.2025655210018158} -08/30/2021 22:36:01 - INFO - __main__ - Step 51960: {'lr': 0.00037211363712603767, 'samples': 9976320, 'steps': 51959, 'loss/train': 1.375752329826355} -08/30/2021 22:36:02 - INFO - __main__ - Step 51961: {'lr': 0.00037210900648998604, 'samples': 9976512, 'steps': 51960, 'loss/train': 0.9909582734107971} -08/30/2021 22:36:03 - INFO - __main__ - Step 51962: {'lr': 0.0003721043757989139, 'samples': 9976704, 'steps': 51961, 'loss/train': 1.0279664993286133} -08/30/2021 22:36:03 - INFO - __main__ - Step 51963: {'lr': 0.0003720997450528235, 'samples': 9976896, 'steps': 51962, 'loss/train': 1.1620796918869019} -08/30/2021 22:36:03 - INFO - __main__ - Step 51964: {'lr': 0.0003720951142517168, 'samples': 9977088, 'steps': 51963, 'loss/train': 1.258919596672058} -08/30/2021 22:36:04 - INFO - __main__ - Step 51965: {'lr': 0.0003720904833955959, 'samples': 9977280, 'steps': 51964, 'loss/train': 1.443966031074524} -08/30/2021 22:36:05 - INFO - __main__ - Step 51966: {'lr': 0.000372085852484463, 'samples': 9977472, 'steps': 51965, 'loss/train': 1.1282204389572144} -08/30/2021 22:36:06 - INFO - __main__ - Step 51967: {'lr': 0.00037208122151832004, 'samples': 9977664, 'steps': 51966, 'loss/train': 1.1799874305725098} -08/30/2021 22:36:06 - INFO - __main__ - Step 51968: {'lr': 0.0003720765904971691, 'samples': 9977856, 'steps': 51967, 'loss/train': 1.1374404430389404} -08/30/2021 22:36:06 - INFO - __main__ - Step 51969: {'lr': 0.0003720719594210124, 'samples': 9978048, 'steps': 51968, 'loss/train': 2.00117826461792} -08/30/2021 22:36:07 - INFO - __main__ - Step 51970: {'lr': 0.00037206732828985197, 'samples': 9978240, 'steps': 51969, 'loss/train': 0.6365982294082642} -08/30/2021 22:36:08 - INFO - __main__ - Step 51971: {'lr': 0.00037206269710368987, 'samples': 9978432, 'steps': 51970, 'loss/train': 1.8698856830596924} -08/30/2021 22:36:09 - INFO - __main__ - Step 51972: {'lr': 0.0003720580658625282, 'samples': 9978624, 'steps': 51971, 'loss/train': 1.4233675003051758} -08/30/2021 22:36:09 - INFO - __main__ - Step 51973: {'lr': 0.00037205343456636907, 'samples': 9978816, 'steps': 51972, 'loss/train': 1.457370638847351} -08/30/2021 22:36:10 - INFO - __main__ - Step 51974: {'lr': 0.0003720488032152145, 'samples': 9979008, 'steps': 51973, 'loss/train': 0.949581503868103} -08/30/2021 22:36:10 - INFO - __main__ - Step 51975: {'lr': 0.0003720441718090667, 'samples': 9979200, 'steps': 51974, 'loss/train': 0.05510852485895157} -08/30/2021 22:36:12 - INFO - __main__ - Step 51976: {'lr': 0.0003720395403479276, 'samples': 9979392, 'steps': 51975, 'loss/train': 1.61943781375885} -08/30/2021 22:36:12 - INFO - __main__ - Step 51977: {'lr': 0.00037203490883179935, 'samples': 9979584, 'steps': 51976, 'loss/train': 1.7899806499481201} -08/30/2021 22:36:12 - INFO - __main__ - Step 51978: {'lr': 0.0003720302772606841, 'samples': 9979776, 'steps': 51977, 'loss/train': 1.0794782638549805} -08/30/2021 22:36:13 - INFO - __main__ - Step 51979: {'lr': 0.00037202564563458394, 'samples': 9979968, 'steps': 51978, 'loss/train': 1.0243253707885742} -08/30/2021 22:36:13 - INFO - __main__ - Step 51980: {'lr': 0.00037202101395350084, 'samples': 9980160, 'steps': 51979, 'loss/train': 1.1207071542739868} -08/30/2021 22:36:13 - INFO - __main__ - Step 51981: {'lr': 0.0003720163822174369, 'samples': 9980352, 'steps': 51980, 'loss/train': 1.4508756399154663} -08/30/2021 22:36:15 - INFO - __main__ - Step 51982: {'lr': 0.0003720117504263944, 'samples': 9980544, 'steps': 51981, 'loss/train': 0.9407844543457031} -08/30/2021 22:36:15 - INFO - __main__ - Step 51983: {'lr': 0.0003720071185803752, 'samples': 9980736, 'steps': 51982, 'loss/train': 1.5013949871063232} -08/30/2021 22:36:16 - INFO - __main__ - Step 51984: {'lr': 0.00037200248667938155, 'samples': 9980928, 'steps': 51983, 'loss/train': 1.2867027521133423} -08/30/2021 22:36:16 - INFO - __main__ - Step 51985: {'lr': 0.00037199785472341536, 'samples': 9981120, 'steps': 51984, 'loss/train': 0.037992969155311584} -08/30/2021 22:36:16 - INFO - __main__ - Step 51986: {'lr': 0.00037199322271247887, 'samples': 9981312, 'steps': 51985, 'loss/train': 0.4052225947380066} -08/30/2021 22:36:19 - INFO - __main__ - Step 51987: {'lr': 0.00037198859064657415, 'samples': 9981504, 'steps': 51986, 'loss/train': 1.1930993795394897} -08/30/2021 22:36:19 - INFO - __main__ - Step 51988: {'lr': 0.0003719839585257032, 'samples': 9981696, 'steps': 51987, 'loss/train': 1.5854802131652832} -08/30/2021 22:36:19 - INFO - __main__ - Step 51989: {'lr': 0.0003719793263498681, 'samples': 9981888, 'steps': 51988, 'loss/train': 0.11612052470445633} -08/30/2021 22:36:20 - INFO - __main__ - Step 51990: {'lr': 0.00037197469411907115, 'samples': 9982080, 'steps': 51989, 'loss/train': 1.6547197103500366} -08/30/2021 22:36:20 - INFO - __main__ - Step 51991: {'lr': 0.0003719700618333142, 'samples': 9982272, 'steps': 51990, 'loss/train': 1.1363204717636108} -08/30/2021 22:36:20 - INFO - __main__ - Step 51992: {'lr': 0.0003719654294925994, 'samples': 9982464, 'steps': 51991, 'loss/train': 0.4997813105583191} -08/30/2021 22:36:22 - INFO - __main__ - Step 51993: {'lr': 0.00037196079709692894, 'samples': 9982656, 'steps': 51992, 'loss/train': 1.7195322513580322} -08/30/2021 22:36:23 - INFO - __main__ - Step 51994: {'lr': 0.0003719561646463048, 'samples': 9982848, 'steps': 51993, 'loss/train': 1.1932653188705444} -08/30/2021 22:36:23 - INFO - __main__ - Step 51995: {'lr': 0.00037195153214072903, 'samples': 9983040, 'steps': 51994, 'loss/train': 1.6880711317062378} -08/30/2021 22:36:23 - INFO - __main__ - Step 51996: {'lr': 0.0003719468995802038, 'samples': 9983232, 'steps': 51995, 'loss/train': 0.8421748280525208} -08/30/2021 22:36:24 - INFO - __main__ - Step 51997: {'lr': 0.0003719422669647312, 'samples': 9983424, 'steps': 51996, 'loss/train': 1.7453234195709229} -08/30/2021 22:36:25 - INFO - __main__ - Step 51998: {'lr': 0.0003719376342943133, 'samples': 9983616, 'steps': 51997, 'loss/train': 1.647517442703247} -08/30/2021 22:36:26 - INFO - __main__ - Step 51999: {'lr': 0.00037193300156895223, 'samples': 9983808, 'steps': 51998, 'loss/train': 1.2749403715133667} -08/30/2021 22:36:26 - INFO - __main__ - Step 52000: {'lr': 0.00037192836878864995, 'samples': 9984000, 'steps': 51999, 'loss/train': 0.9716050624847412} -08/30/2021 22:36:26 - INFO - __main__ - Step 52001: {'lr': 0.00037192373595340864, 'samples': 9984192, 'steps': 52000, 'loss/train': 1.064461350440979} -08/30/2021 22:36:27 - INFO - __main__ - Step 52002: {'lr': 0.0003719191030632304, 'samples': 9984384, 'steps': 52001, 'loss/train': 0.6413258910179138} -08/30/2021 22:36:28 - INFO - __main__ - Step 52003: {'lr': 0.0003719144701181173, 'samples': 9984576, 'steps': 52002, 'loss/train': 2.2944822311401367} -08/30/2021 22:36:29 - INFO - __main__ - Step 52004: {'lr': 0.0003719098371180714, 'samples': 9984768, 'steps': 52003, 'loss/train': 1.0969287157058716} -08/30/2021 22:36:29 - INFO - __main__ - Step 52005: {'lr': 0.00037190520406309483, 'samples': 9984960, 'steps': 52004, 'loss/train': 0.8896622061729431} -08/30/2021 22:36:29 - INFO - __main__ - Step 52006: {'lr': 0.00037190057095318966, 'samples': 9985152, 'steps': 52005, 'loss/train': 1.1797174215316772} -08/30/2021 22:36:30 - INFO - __main__ - Step 52007: {'lr': 0.00037189593778835794, 'samples': 9985344, 'steps': 52006, 'loss/train': 1.0873112678527832} -08/30/2021 22:36:30 - INFO - __main__ - Step 52008: {'lr': 0.0003718913045686018, 'samples': 9985536, 'steps': 52007, 'loss/train': 1.479310154914856} -08/30/2021 22:36:33 - INFO - __main__ - Step 52009: {'lr': 0.0003718866712939233, 'samples': 9985728, 'steps': 52008, 'loss/train': 0.2769359350204468} -08/30/2021 22:36:33 - INFO - __main__ - Step 52010: {'lr': 0.00037188203796432464, 'samples': 9985920, 'steps': 52009, 'loss/train': 1.4753742218017578} -08/30/2021 22:36:34 - INFO - __main__ - Step 52011: {'lr': 0.00037187740457980776, 'samples': 9986112, 'steps': 52010, 'loss/train': 0.6255351901054382} -08/30/2021 22:36:34 - INFO - __main__ - Step 52012: {'lr': 0.0003718727711403748, 'samples': 9986304, 'steps': 52011, 'loss/train': 1.1509250402450562} -08/30/2021 22:36:34 - INFO - __main__ - Step 52013: {'lr': 0.00037186813764602785, 'samples': 9986496, 'steps': 52012, 'loss/train': 1.5531744956970215} -08/30/2021 22:36:35 - INFO - __main__ - Step 52014: {'lr': 0.00037186350409676894, 'samples': 9986688, 'steps': 52013, 'loss/train': 1.7630598545074463} -08/30/2021 22:36:35 - INFO - __main__ - Step 52015: {'lr': 0.00037185887049260023, 'samples': 9986880, 'steps': 52014, 'loss/train': 0.562222421169281} -08/30/2021 22:36:37 - INFO - __main__ - Step 52016: {'lr': 0.0003718542368335239, 'samples': 9987072, 'steps': 52015, 'loss/train': 0.5183826088905334} -08/30/2021 22:36:37 - INFO - __main__ - Step 52017: {'lr': 0.0003718496031195419, 'samples': 9987264, 'steps': 52016, 'loss/train': 1.7556639909744263} -08/30/2021 22:36:37 - INFO - __main__ - Step 52018: {'lr': 0.00037184496935065625, 'samples': 9987456, 'steps': 52017, 'loss/train': 1.5615830421447754} -08/30/2021 22:36:38 - INFO - __main__ - Step 52019: {'lr': 0.0003718403355268692, 'samples': 9987648, 'steps': 52018, 'loss/train': 0.07880722731351852} -08/30/2021 22:36:38 - INFO - __main__ - Step 52020: {'lr': 0.0003718357016481828, 'samples': 9987840, 'steps': 52019, 'loss/train': 0.891784131526947} -08/30/2021 22:36:40 - INFO - __main__ - Step 52021: {'lr': 0.00037183106771459905, 'samples': 9988032, 'steps': 52020, 'loss/train': 1.7741683721542358} -08/30/2021 22:36:40 - INFO - __main__ - Step 52022: {'lr': 0.00037182643372612014, 'samples': 9988224, 'steps': 52021, 'loss/train': 1.2698322534561157} -08/30/2021 22:36:40 - INFO - __main__ - Step 52023: {'lr': 0.00037182179968274807, 'samples': 9988416, 'steps': 52022, 'loss/train': 4.820176124572754} -08/30/2021 22:36:41 - INFO - __main__ - Step 52024: {'lr': 0.00037181716558448507, 'samples': 9988608, 'steps': 52023, 'loss/train': 1.3155553340911865} -08/30/2021 22:36:41 - INFO - __main__ - Step 52025: {'lr': 0.0003718125314313331, 'samples': 9988800, 'steps': 52024, 'loss/train': 1.8372255563735962} -08/30/2021 22:36:42 - INFO - __main__ - Step 52026: {'lr': 0.0003718078972232943, 'samples': 9988992, 'steps': 52025, 'loss/train': 1.7179555892944336} -08/30/2021 22:36:43 - INFO - __main__ - Step 52027: {'lr': 0.0003718032629603707, 'samples': 9989184, 'steps': 52026, 'loss/train': 1.6634650230407715} -08/30/2021 22:36:43 - INFO - __main__ - Step 52028: {'lr': 0.00037179862864256444, 'samples': 9989376, 'steps': 52027, 'loss/train': 1.3627899885177612} -08/30/2021 22:36:44 - INFO - __main__ - Step 52029: {'lr': 0.00037179399426987757, 'samples': 9989568, 'steps': 52028, 'loss/train': 0.6802630424499512} -08/30/2021 22:36:44 - INFO - __main__ - Step 52030: {'lr': 0.0003717893598423122, 'samples': 9989760, 'steps': 52029, 'loss/train': 1.467929720878601} -08/30/2021 22:36:45 - INFO - __main__ - Step 52031: {'lr': 0.0003717847253598705, 'samples': 9989952, 'steps': 52030, 'loss/train': 1.5111241340637207} -08/30/2021 22:36:46 - INFO - __main__ - Step 52032: {'lr': 0.0003717800908225544, 'samples': 9990144, 'steps': 52031, 'loss/train': 0.6221545338630676} -08/30/2021 22:36:46 - INFO - __main__ - Step 52033: {'lr': 0.0003717754562303661, 'samples': 9990336, 'steps': 52032, 'loss/train': 1.3588640689849854} -08/30/2021 22:36:47 - INFO - __main__ - Step 52034: {'lr': 0.00037177082158330773, 'samples': 9990528, 'steps': 52033, 'loss/train': 1.880616307258606} -08/30/2021 22:36:47 - INFO - __main__ - Step 52035: {'lr': 0.0003717661868813812, 'samples': 9990720, 'steps': 52034, 'loss/train': 1.8729760646820068} -08/30/2021 22:36:49 - INFO - __main__ - Step 52036: {'lr': 0.00037176155212458875, 'samples': 9990912, 'steps': 52035, 'loss/train': 1.0188407897949219} -08/30/2021 22:36:49 - INFO - __main__ - Step 52037: {'lr': 0.0003717569173129324, 'samples': 9991104, 'steps': 52036, 'loss/train': 1.1100980043411255} -08/30/2021 22:36:50 - INFO - __main__ - Step 52038: {'lr': 0.0003717522824464143, 'samples': 9991296, 'steps': 52037, 'loss/train': 1.7405463457107544} -08/30/2021 22:36:50 - INFO - __main__ - Step 52039: {'lr': 0.0003717476475250365, 'samples': 9991488, 'steps': 52038, 'loss/train': 1.369011640548706} -08/30/2021 22:36:50 - INFO - __main__ - Step 52040: {'lr': 0.0003717430125488011, 'samples': 9991680, 'steps': 52039, 'loss/train': 1.4352734088897705} -08/30/2021 22:36:51 - INFO - __main__ - Step 52041: {'lr': 0.0003717383775177101, 'samples': 9991872, 'steps': 52040, 'loss/train': 1.677634835243225} -08/30/2021 22:36:52 - INFO - __main__ - Step 52042: {'lr': 0.0003717337424317657, 'samples': 9992064, 'steps': 52041, 'loss/train': 1.1222599744796753} -08/30/2021 22:36:53 - INFO - __main__ - Step 52043: {'lr': 0.00037172910729097006, 'samples': 9992256, 'steps': 52042, 'loss/train': 1.6967636346817017} -08/30/2021 22:36:53 - INFO - __main__ - Step 52044: {'lr': 0.000371724472095325, 'samples': 9992448, 'steps': 52043, 'loss/train': 1.6835474967956543} -08/30/2021 22:36:54 - INFO - __main__ - Step 52045: {'lr': 0.00037171983684483286, 'samples': 9992640, 'steps': 52044, 'loss/train': 1.676937222480774} -08/30/2021 22:36:54 - INFO - __main__ - Step 52046: {'lr': 0.00037171520153949565, 'samples': 9992832, 'steps': 52045, 'loss/train': 1.9934661388397217} -08/30/2021 22:36:54 - INFO - __main__ - Step 52047: {'lr': 0.00037171056617931543, 'samples': 9993024, 'steps': 52046, 'loss/train': 1.194975733757019} -08/30/2021 22:36:56 - INFO - __main__ - Step 52048: {'lr': 0.00037170593076429426, 'samples': 9993216, 'steps': 52047, 'loss/train': 0.9336037039756775} -08/30/2021 22:36:57 - INFO - __main__ - Step 52049: {'lr': 0.00037170129529443436, 'samples': 9993408, 'steps': 52048, 'loss/train': 1.780676245689392} -08/30/2021 22:36:57 - INFO - __main__ - Step 52050: {'lr': 0.0003716966597697377, 'samples': 9993600, 'steps': 52049, 'loss/train': 1.480969786643982} -08/30/2021 22:36:58 - INFO - __main__ - Step 52051: {'lr': 0.0003716920241902064, 'samples': 9993792, 'steps': 52050, 'loss/train': 1.4542555809020996} -08/30/2021 22:36:58 - INFO - __main__ - Step 52052: {'lr': 0.0003716873885558425, 'samples': 9993984, 'steps': 52051, 'loss/train': 1.0908305644989014} -08/30/2021 22:37:00 - INFO - __main__ - Step 52053: {'lr': 0.0003716827528666482, 'samples': 9994176, 'steps': 52052, 'loss/train': 1.7947149276733398} -08/30/2021 22:37:00 - INFO - __main__ - Step 52054: {'lr': 0.0003716781171226255, 'samples': 9994368, 'steps': 52053, 'loss/train': 1.534867286682129} -08/30/2021 22:37:00 - INFO - __main__ - Step 52055: {'lr': 0.00037167348132377656, 'samples': 9994560, 'steps': 52054, 'loss/train': 1.3611438274383545} -08/30/2021 22:37:01 - INFO - __main__ - Step 52056: {'lr': 0.0003716688454701034, 'samples': 9994752, 'steps': 52055, 'loss/train': 1.6660186052322388} -08/30/2021 22:37:01 - INFO - __main__ - Step 52057: {'lr': 0.00037166420956160815, 'samples': 9994944, 'steps': 52056, 'loss/train': 1.7995336055755615} -08/30/2021 22:37:03 - INFO - __main__ - Step 52058: {'lr': 0.0003716595735982928, 'samples': 9995136, 'steps': 52057, 'loss/train': 0.8728925585746765} -08/30/2021 22:37:03 - INFO - __main__ - Step 52059: {'lr': 0.0003716549375801597, 'samples': 9995328, 'steps': 52058, 'loss/train': 1.3943653106689453} -08/30/2021 22:37:04 - INFO - __main__ - Step 52060: {'lr': 0.0003716503015072106, 'samples': 9995520, 'steps': 52059, 'loss/train': 1.5521290302276611} -08/30/2021 22:37:04 - INFO - __main__ - Step 52061: {'lr': 0.00037164566537944776, 'samples': 9995712, 'steps': 52060, 'loss/train': 1.5097190141677856} -08/30/2021 22:37:04 - INFO - __main__ - Step 52062: {'lr': 0.00037164102919687335, 'samples': 9995904, 'steps': 52061, 'loss/train': 1.5647640228271484} -08/30/2021 22:37:06 - INFO - __main__ - Step 52063: {'lr': 0.00037163639295948933, 'samples': 9996096, 'steps': 52062, 'loss/train': 0.07066015899181366} -08/30/2021 22:37:07 - INFO - __main__ - Step 52064: {'lr': 0.0003716317566672978, 'samples': 9996288, 'steps': 52063, 'loss/train': 1.2351046800613403} -08/30/2021 22:37:07 - INFO - __main__ - Step 52065: {'lr': 0.00037162712032030095, 'samples': 9996480, 'steps': 52064, 'loss/train': 1.1107736825942993} -08/30/2021 22:37:07 - INFO - __main__ - Step 52066: {'lr': 0.00037162248391850076, 'samples': 9996672, 'steps': 52065, 'loss/train': 1.7825418710708618} -08/30/2021 22:37:08 - INFO - __main__ - Step 52067: {'lr': 0.0003716178474618993, 'samples': 9996864, 'steps': 52066, 'loss/train': 0.6627397537231445} -08/30/2021 22:37:09 - INFO - __main__ - Step 52068: {'lr': 0.0003716132109504988, 'samples': 9997056, 'steps': 52067, 'loss/train': 1.4266213178634644} -08/30/2021 22:37:10 - INFO - __main__ - Step 52069: {'lr': 0.0003716085743843012, 'samples': 9997248, 'steps': 52068, 'loss/train': 1.1553900241851807} -08/30/2021 22:37:10 - INFO - __main__ - Step 52070: {'lr': 0.0003716039377633087, 'samples': 9997440, 'steps': 52069, 'loss/train': 1.0581462383270264} -08/30/2021 22:37:10 - INFO - __main__ - Step 52071: {'lr': 0.00037159930108752326, 'samples': 9997632, 'steps': 52070, 'loss/train': 1.471582055091858} -08/30/2021 22:37:11 - INFO - __main__ - Step 52072: {'lr': 0.0003715946643569471, 'samples': 9997824, 'steps': 52071, 'loss/train': 1.2319146394729614} -08/30/2021 22:37:11 - INFO - __main__ - Step 52073: {'lr': 0.0003715900275715823, 'samples': 9998016, 'steps': 52072, 'loss/train': 1.4516321420669556} -08/30/2021 22:37:12 - INFO - __main__ - Step 52074: {'lr': 0.0003715853907314309, 'samples': 9998208, 'steps': 52073, 'loss/train': 1.4245095252990723} -08/30/2021 22:37:13 - INFO - __main__ - Step 52075: {'lr': 0.0003715807538364949, 'samples': 9998400, 'steps': 52074, 'loss/train': 1.6345106363296509} -08/30/2021 22:37:13 - INFO - __main__ - Step 52076: {'lr': 0.00037157611688677666, 'samples': 9998592, 'steps': 52075, 'loss/train': 0.7477751970291138} -08/30/2021 22:37:14 - INFO - __main__ - Step 52077: {'lr': 0.000371571479882278, 'samples': 9998784, 'steps': 52076, 'loss/train': 1.1907473802566528} -08/30/2021 22:37:14 - INFO - __main__ - Step 52078: {'lr': 0.00037156684282300105, 'samples': 9998976, 'steps': 52077, 'loss/train': 0.293177992105484} -08/30/2021 22:37:15 - INFO - __main__ - Step 52079: {'lr': 0.00037156220570894806, 'samples': 9999168, 'steps': 52078, 'loss/train': 1.0104323625564575} -08/30/2021 22:37:16 - INFO - __main__ - Step 52080: {'lr': 0.00037155756854012097, 'samples': 9999360, 'steps': 52079, 'loss/train': 1.7753924131393433} -08/30/2021 22:37:16 - INFO - __main__ - Step 52081: {'lr': 0.000371552931316522, 'samples': 9999552, 'steps': 52080, 'loss/train': 1.3313931226730347} -08/30/2021 22:37:17 - INFO - __main__ - Step 52082: {'lr': 0.00037154829403815307, 'samples': 9999744, 'steps': 52081, 'loss/train': 0.6239817142486572} -08/30/2021 22:37:17 - INFO - __main__ - Step 52083: {'lr': 0.0003715436567050163, 'samples': 9999936, 'steps': 52082, 'loss/train': 1.0077084302902222} -08/30/2021 22:37:18 - INFO - __main__ - Step 52084: {'lr': 0.0003715390193171139, 'samples': 10000128, 'steps': 52083, 'loss/train': 1.0066760778427124} -08/30/2021 22:37:19 - INFO - __main__ - Step 52085: {'lr': 0.0003715343818744479, 'samples': 10000320, 'steps': 52084, 'loss/train': 1.5821036100387573} -08/30/2021 22:37:19 - INFO - __main__ - Step 52086: {'lr': 0.0003715297443770203, 'samples': 10000512, 'steps': 52085, 'loss/train': 1.5655094385147095} -08/30/2021 22:37:20 - INFO - __main__ - Step 52087: {'lr': 0.0003715251068248334, 'samples': 10000704, 'steps': 52086, 'loss/train': 1.7501640319824219} -08/30/2021 22:37:20 - INFO - __main__ - Step 52088: {'lr': 0.00037152046921788906, 'samples': 10000896, 'steps': 52087, 'loss/train': 1.6460504531860352} -08/30/2021 22:37:21 - INFO - __main__ - Step 52089: {'lr': 0.00037151583155618957, 'samples': 10001088, 'steps': 52088, 'loss/train': 1.6560243368148804} -08/30/2021 22:37:22 - INFO - __main__ - Step 52090: {'lr': 0.00037151119383973684, 'samples': 10001280, 'steps': 52089, 'loss/train': 1.2341288328170776} -08/30/2021 22:37:22 - INFO - __main__ - Step 52091: {'lr': 0.0003715065560685331, 'samples': 10001472, 'steps': 52090, 'loss/train': 0.990084171295166} -08/30/2021 22:37:23 - INFO - __main__ - Step 52092: {'lr': 0.00037150191824258027, 'samples': 10001664, 'steps': 52091, 'loss/train': 1.0835883617401123} -08/30/2021 22:37:23 - INFO - __main__ - Step 52093: {'lr': 0.00037149728036188067, 'samples': 10001856, 'steps': 52092, 'loss/train': 1.2725456953048706} -08/30/2021 22:37:25 - INFO - __main__ - Step 52094: {'lr': 0.0003714926424264363, 'samples': 10002048, 'steps': 52093, 'loss/train': 1.4082059860229492} -08/30/2021 22:37:25 - INFO - __main__ - Step 52095: {'lr': 0.00037148800443624906, 'samples': 10002240, 'steps': 52094, 'loss/train': 1.820439100265503} -08/30/2021 22:37:25 - INFO - __main__ - Step 52096: {'lr': 0.0003714833663913213, 'samples': 10002432, 'steps': 52095, 'loss/train': 1.0115790367126465} -08/30/2021 22:37:26 - INFO - __main__ - Step 52097: {'lr': 0.00037147872829165497, 'samples': 10002624, 'steps': 52096, 'loss/train': 1.428789734840393} -08/30/2021 22:37:26 - INFO - __main__ - Step 52098: {'lr': 0.00037147409013725226, 'samples': 10002816, 'steps': 52097, 'loss/train': 1.3908092975616455} -08/30/2021 22:37:29 - INFO - __main__ - Step 52099: {'lr': 0.00037146945192811513, 'samples': 10003008, 'steps': 52098, 'loss/train': 1.1992634534835815} -08/30/2021 22:37:29 - INFO - __main__ - Step 52100: {'lr': 0.00037146481366424585, 'samples': 10003200, 'steps': 52099, 'loss/train': 2.1207642555236816} -08/30/2021 22:37:29 - INFO - __main__ - Step 52101: {'lr': 0.0003714601753456463, 'samples': 10003392, 'steps': 52100, 'loss/train': 1.0706340074539185} -08/30/2021 22:37:30 - INFO - __main__ - Step 52102: {'lr': 0.0003714555369723187, 'samples': 10003584, 'steps': 52101, 'loss/train': 1.0396418571472168} -08/30/2021 22:37:30 - INFO - __main__ - Step 52103: {'lr': 0.00037145089854426504, 'samples': 10003776, 'steps': 52102, 'loss/train': 1.6776082515716553} -08/30/2021 22:37:30 - INFO - __main__ - Step 52104: {'lr': 0.0003714462600614876, 'samples': 10003968, 'steps': 52103, 'loss/train': 1.7215911149978638} -08/30/2021 22:37:31 - INFO - __main__ - Step 52105: {'lr': 0.0003714416215239883, 'samples': 10004160, 'steps': 52104, 'loss/train': 1.7245113849639893} -08/30/2021 22:37:32 - INFO - __main__ - Step 52106: {'lr': 0.00037143698293176923, 'samples': 10004352, 'steps': 52105, 'loss/train': 1.390758752822876} -08/30/2021 22:37:33 - INFO - __main__ - Step 52107: {'lr': 0.0003714323442848326, 'samples': 10004544, 'steps': 52106, 'loss/train': 1.1921907663345337} -08/30/2021 22:37:33 - INFO - __main__ - Step 52108: {'lr': 0.0003714277055831804, 'samples': 10004736, 'steps': 52107, 'loss/train': 0.7346904277801514} -08/30/2021 22:37:33 - INFO - __main__ - Step 52109: {'lr': 0.00037142306682681476, 'samples': 10004928, 'steps': 52108, 'loss/train': 1.2465084791183472} -08/30/2021 22:37:34 - INFO - __main__ - Step 52110: {'lr': 0.00037141842801573775, 'samples': 10005120, 'steps': 52109, 'loss/train': 1.4384232759475708} -08/30/2021 22:37:35 - INFO - __main__ - Step 52111: {'lr': 0.00037141378914995146, 'samples': 10005312, 'steps': 52110, 'loss/train': 1.146830439567566} -08/30/2021 22:37:36 - INFO - __main__ - Step 52112: {'lr': 0.000371409150229458, 'samples': 10005504, 'steps': 52111, 'loss/train': 1.3251440525054932} -08/30/2021 22:37:36 - INFO - __main__ - Step 52113: {'lr': 0.00037140451125425945, 'samples': 10005696, 'steps': 52112, 'loss/train': 1.4773778915405273} -08/30/2021 22:37:36 - INFO - __main__ - Step 52114: {'lr': 0.0003713998722243579, 'samples': 10005888, 'steps': 52113, 'loss/train': 1.0111289024353027} -08/30/2021 22:37:37 - INFO - __main__ - Step 52115: {'lr': 0.00037139523313975544, 'samples': 10006080, 'steps': 52114, 'loss/train': 1.1920995712280273} -08/30/2021 22:37:38 - INFO - __main__ - Step 52116: {'lr': 0.00037139059400045416, 'samples': 10006272, 'steps': 52115, 'loss/train': 1.3523542881011963} -08/30/2021 22:37:39 - INFO - __main__ - Step 52117: {'lr': 0.00037138595480645613, 'samples': 10006464, 'steps': 52116, 'loss/train': 1.4828168153762817} -08/30/2021 22:37:39 - INFO - __main__ - Step 52118: {'lr': 0.0003713813155577635, 'samples': 10006656, 'steps': 52117, 'loss/train': 1.3772011995315552} -08/30/2021 22:37:39 - INFO - __main__ - Step 52119: {'lr': 0.0003713766762543783, 'samples': 10006848, 'steps': 52118, 'loss/train': 0.9362785220146179} -08/30/2021 22:37:40 - INFO - __main__ - Step 52120: {'lr': 0.0003713720368963027, 'samples': 10007040, 'steps': 52119, 'loss/train': 0.9265331029891968} -08/30/2021 22:37:41 - INFO - __main__ - Step 52121: {'lr': 0.0003713673974835387, 'samples': 10007232, 'steps': 52120, 'loss/train': 1.0374274253845215} -08/30/2021 22:37:42 - INFO - __main__ - Step 52122: {'lr': 0.0003713627580160884, 'samples': 10007424, 'steps': 52121, 'loss/train': 0.9954937696456909} -08/30/2021 22:37:42 - INFO - __main__ - Step 52123: {'lr': 0.0003713581184939539, 'samples': 10007616, 'steps': 52122, 'loss/train': 0.8861151933670044} -08/30/2021 22:37:42 - INFO - __main__ - Step 52124: {'lr': 0.00037135347891713733, 'samples': 10007808, 'steps': 52123, 'loss/train': 1.0496761798858643} -08/30/2021 22:37:43 - INFO - __main__ - Step 52125: {'lr': 0.00037134883928564074, 'samples': 10008000, 'steps': 52124, 'loss/train': 0.9004316926002502} -08/30/2021 22:37:44 - INFO - __main__ - Step 52126: {'lr': 0.00037134419959946626, 'samples': 10008192, 'steps': 52125, 'loss/train': 0.8226781487464905} -08/30/2021 22:37:45 - INFO - __main__ - Step 52127: {'lr': 0.00037133955985861595, 'samples': 10008384, 'steps': 52126, 'loss/train': 1.577428936958313} -08/30/2021 22:37:45 - INFO - __main__ - Step 52128: {'lr': 0.00037133492006309187, 'samples': 10008576, 'steps': 52127, 'loss/train': 1.1534955501556396} -08/30/2021 22:37:45 - INFO - __main__ - Step 52129: {'lr': 0.00037133028021289625, 'samples': 10008768, 'steps': 52128, 'loss/train': 1.4131879806518555} -08/30/2021 22:37:46 - INFO - __main__ - Step 52130: {'lr': 0.000371325640308031, 'samples': 10008960, 'steps': 52129, 'loss/train': 1.516191840171814} -08/30/2021 22:37:47 - INFO - __main__ - Step 52131: {'lr': 0.0003713210003484982, 'samples': 10009152, 'steps': 52130, 'loss/train': 0.9559731483459473} -08/30/2021 22:37:48 - INFO - __main__ - Step 52132: {'lr': 0.00037131636033430017, 'samples': 10009344, 'steps': 52131, 'loss/train': 1.8400068283081055} -08/30/2021 22:37:48 - INFO - __main__ - Step 52133: {'lr': 0.0003713117202654388, 'samples': 10009536, 'steps': 52132, 'loss/train': 1.833272933959961} -08/30/2021 22:37:49 - INFO - __main__ - Step 52134: {'lr': 0.0003713070801419163, 'samples': 10009728, 'steps': 52133, 'loss/train': 0.6838832497596741} -08/30/2021 22:37:49 - INFO - __main__ - Step 52135: {'lr': 0.00037130243996373466, 'samples': 10009920, 'steps': 52134, 'loss/train': 1.1680952310562134} -08/30/2021 22:37:50 - INFO - __main__ - Step 52136: {'lr': 0.00037129779973089596, 'samples': 10010112, 'steps': 52135, 'loss/train': 0.8663227558135986} -08/30/2021 22:37:51 - INFO - __main__ - Step 52137: {'lr': 0.0003712931594434024, 'samples': 10010304, 'steps': 52136, 'loss/train': 0.971187174320221} -08/30/2021 22:37:51 - INFO - __main__ - Step 52138: {'lr': 0.000371288519101256, 'samples': 10010496, 'steps': 52137, 'loss/train': 1.7072018384933472} -08/30/2021 22:37:52 - INFO - __main__ - Step 52139: {'lr': 0.00037128387870445883, 'samples': 10010688, 'steps': 52138, 'loss/train': 1.5136617422103882} -08/30/2021 22:37:52 - INFO - __main__ - Step 52140: {'lr': 0.00037127923825301315, 'samples': 10010880, 'steps': 52139, 'loss/train': 1.391979694366455} -08/30/2021 22:37:53 - INFO - __main__ - Step 52141: {'lr': 0.0003712745977469208, 'samples': 10011072, 'steps': 52140, 'loss/train': 1.9358543157577515} -08/30/2021 22:37:54 - INFO - __main__ - Step 52142: {'lr': 0.000371269957186184, 'samples': 10011264, 'steps': 52141, 'loss/train': 1.4657580852508545} -08/30/2021 22:37:54 - INFO - __main__ - Step 52143: {'lr': 0.0003712653165708048, 'samples': 10011456, 'steps': 52142, 'loss/train': 1.6507071256637573} -08/30/2021 22:37:55 - INFO - __main__ - Step 52144: {'lr': 0.00037126067590078537, 'samples': 10011648, 'steps': 52143, 'loss/train': 1.2737295627593994} -08/30/2021 22:37:55 - INFO - __main__ - Step 52145: {'lr': 0.00037125603517612773, 'samples': 10011840, 'steps': 52144, 'loss/train': 1.0407233238220215} -08/30/2021 22:37:55 - INFO - __main__ - Step 52146: {'lr': 0.00037125139439683405, 'samples': 10012032, 'steps': 52145, 'loss/train': 1.5681606531143188} -08/30/2021 22:37:57 - INFO - __main__ - Step 52147: {'lr': 0.00037124675356290635, 'samples': 10012224, 'steps': 52146, 'loss/train': 1.1434236764907837} -08/30/2021 22:37:57 - INFO - __main__ - Step 52148: {'lr': 0.00037124211267434667, 'samples': 10012416, 'steps': 52147, 'loss/train': 0.8472527861595154} -08/30/2021 22:37:58 - INFO - __main__ - Step 52149: {'lr': 0.0003712374717311572, 'samples': 10012608, 'steps': 52148, 'loss/train': 0.7128331065177917} -08/30/2021 22:37:58 - INFO - __main__ - Step 52150: {'lr': 0.00037123283073333996, 'samples': 10012800, 'steps': 52149, 'loss/train': 1.4185506105422974} -08/30/2021 22:37:59 - INFO - __main__ - Step 52151: {'lr': 0.0003712281896808971, 'samples': 10012992, 'steps': 52150, 'loss/train': 0.8081114888191223} -08/30/2021 22:38:01 - INFO - __main__ - Step 52152: {'lr': 0.0003712235485738307, 'samples': 10013184, 'steps': 52151, 'loss/train': 1.2397840023040771} -08/30/2021 22:38:01 - INFO - __main__ - Step 52153: {'lr': 0.0003712189074121428, 'samples': 10013376, 'steps': 52152, 'loss/train': 1.8307979106903076} -08/30/2021 22:38:01 - INFO - __main__ - Step 52154: {'lr': 0.0003712142661958356, 'samples': 10013568, 'steps': 52153, 'loss/train': 1.4430568218231201} -08/30/2021 22:38:02 - INFO - __main__ - Step 52155: {'lr': 0.0003712096249249111, 'samples': 10013760, 'steps': 52154, 'loss/train': 1.2210968732833862} -08/30/2021 22:38:02 - INFO - __main__ - Step 52156: {'lr': 0.00037120498359937136, 'samples': 10013952, 'steps': 52155, 'loss/train': 1.3309707641601562} -08/30/2021 22:38:04 - INFO - __main__ - Step 52157: {'lr': 0.0003712003422192186, 'samples': 10014144, 'steps': 52156, 'loss/train': 1.5481278896331787} -08/30/2021 22:38:04 - INFO - __main__ - Step 52158: {'lr': 0.00037119570078445477, 'samples': 10014336, 'steps': 52157, 'loss/train': 0.0915670245885849} -08/30/2021 22:38:05 - INFO - __main__ - Step 52159: {'lr': 0.00037119105929508207, 'samples': 10014528, 'steps': 52158, 'loss/train': 1.116216778755188} -08/30/2021 22:38:05 - INFO - __main__ - Step 52160: {'lr': 0.0003711864177511025, 'samples': 10014720, 'steps': 52159, 'loss/train': 1.5935803651809692} -08/30/2021 22:38:05 - INFO - __main__ - Step 52161: {'lr': 0.0003711817761525183, 'samples': 10014912, 'steps': 52160, 'loss/train': 1.2124431133270264} -08/30/2021 22:38:07 - INFO - __main__ - Step 52162: {'lr': 0.00037117713449933136, 'samples': 10015104, 'steps': 52161, 'loss/train': 1.8988696336746216} -08/30/2021 22:38:08 - INFO - __main__ - Step 52163: {'lr': 0.0003711724927915439, 'samples': 10015296, 'steps': 52162, 'loss/train': 0.6315200328826904} -08/30/2021 22:38:08 - INFO - __main__ - Step 52164: {'lr': 0.000371167851029158, 'samples': 10015488, 'steps': 52163, 'loss/train': 1.9108906984329224} -08/30/2021 22:38:08 - INFO - __main__ - Step 52165: {'lr': 0.0003711632092121757, 'samples': 10015680, 'steps': 52164, 'loss/train': 0.9522110223770142} -08/30/2021 22:38:09 - INFO - __main__ - Step 52166: {'lr': 0.00037115856734059916, 'samples': 10015872, 'steps': 52165, 'loss/train': 1.7165749073028564} -08/30/2021 22:38:09 - INFO - __main__ - Step 52167: {'lr': 0.0003711539254144305, 'samples': 10016064, 'steps': 52166, 'loss/train': 2.210855484008789} -08/30/2021 22:38:10 - INFO - __main__ - Step 52168: {'lr': 0.0003711492834336717, 'samples': 10016256, 'steps': 52167, 'loss/train': 1.2202154397964478} -08/30/2021 22:38:11 - INFO - __main__ - Step 52169: {'lr': 0.00037114464139832487, 'samples': 10016448, 'steps': 52168, 'loss/train': 1.1902647018432617} -08/30/2021 22:38:11 - INFO - __main__ - Step 52170: {'lr': 0.00037113999930839215, 'samples': 10016640, 'steps': 52169, 'loss/train': 1.1605207920074463} -08/30/2021 22:38:12 - INFO - __main__ - Step 52171: {'lr': 0.00037113535716387565, 'samples': 10016832, 'steps': 52170, 'loss/train': 0.37961018085479736} -08/30/2021 22:38:12 - INFO - __main__ - Step 52172: {'lr': 0.00037113071496477733, 'samples': 10017024, 'steps': 52171, 'loss/train': 2.154611349105835} -08/30/2021 22:38:13 - INFO - __main__ - Step 52173: {'lr': 0.0003711260727110995, 'samples': 10017216, 'steps': 52172, 'loss/train': 1.8900772333145142} -08/30/2021 22:38:14 - INFO - __main__ - Step 52174: {'lr': 0.0003711214304028441, 'samples': 10017408, 'steps': 52173, 'loss/train': 1.3742018938064575} -08/30/2021 22:38:14 - INFO - __main__ - Step 52175: {'lr': 0.00037111678804001324, 'samples': 10017600, 'steps': 52174, 'loss/train': 0.8828253149986267} -08/30/2021 22:38:15 - INFO - __main__ - Step 52176: {'lr': 0.00037111214562260896, 'samples': 10017792, 'steps': 52175, 'loss/train': 1.2733354568481445} -08/30/2021 22:38:15 - INFO - __main__ - Step 52177: {'lr': 0.0003711075031506335, 'samples': 10017984, 'steps': 52176, 'loss/train': 1.278172254562378} -08/30/2021 22:38:17 - INFO - __main__ - Step 52178: {'lr': 0.0003711028606240888, 'samples': 10018176, 'steps': 52177, 'loss/train': 1.385245680809021} -08/30/2021 22:38:17 - INFO - __main__ - Step 52179: {'lr': 0.00037109821804297706, 'samples': 10018368, 'steps': 52178, 'loss/train': 1.2209218740463257} -08/30/2021 22:38:17 - INFO - __main__ - Step 52180: {'lr': 0.00037109357540730033, 'samples': 10018560, 'steps': 52179, 'loss/train': 0.7813698649406433} -08/30/2021 22:38:18 - INFO - __main__ - Step 52181: {'lr': 0.00037108893271706075, 'samples': 10018752, 'steps': 52180, 'loss/train': 1.4978376626968384} -08/30/2021 22:38:18 - INFO - __main__ - Step 52182: {'lr': 0.0003710842899722603, 'samples': 10018944, 'steps': 52181, 'loss/train': 1.4047669172286987} -08/30/2021 22:38:20 - INFO - __main__ - Step 52183: {'lr': 0.00037107964717290117, 'samples': 10019136, 'steps': 52182, 'loss/train': 1.5158789157867432} -08/30/2021 22:38:20 - INFO - __main__ - Step 52184: {'lr': 0.0003710750043189854, 'samples': 10019328, 'steps': 52183, 'loss/train': 1.3145015239715576} -08/30/2021 22:38:20 - INFO - __main__ - Step 52185: {'lr': 0.0003710703614105151, 'samples': 10019520, 'steps': 52184, 'loss/train': 1.0919619798660278} -08/30/2021 22:38:21 - INFO - __main__ - Step 52186: {'lr': 0.0003710657184474924, 'samples': 10019712, 'steps': 52185, 'loss/train': 1.3718923330307007} -08/30/2021 22:38:21 - INFO - __main__ - Step 52187: {'lr': 0.00037106107542991937, 'samples': 10019904, 'steps': 52186, 'loss/train': 1.3808432817459106} -08/30/2021 22:38:23 - INFO - __main__ - Step 52188: {'lr': 0.00037105643235779803, 'samples': 10020096, 'steps': 52187, 'loss/train': 1.8743278980255127} -08/30/2021 22:38:23 - INFO - __main__ - Step 52189: {'lr': 0.0003710517892311305, 'samples': 10020288, 'steps': 52188, 'loss/train': 1.4995646476745605} -08/30/2021 22:38:23 - INFO - __main__ - Step 52190: {'lr': 0.00037104714604991896, 'samples': 10020480, 'steps': 52189, 'loss/train': 1.7942461967468262} -08/30/2021 22:38:24 - INFO - __main__ - Step 52191: {'lr': 0.0003710425028141654, 'samples': 10020672, 'steps': 52190, 'loss/train': 0.6056779623031616} -08/30/2021 22:38:24 - INFO - __main__ - Step 52192: {'lr': 0.000371037859523872, 'samples': 10020864, 'steps': 52191, 'loss/train': 0.7994875311851501} -08/30/2021 22:38:25 - INFO - __main__ - Step 52193: {'lr': 0.00037103321617904076, 'samples': 10021056, 'steps': 52192, 'loss/train': 2.1128311157226562} -08/30/2021 22:38:26 - INFO - __main__ - Step 52194: {'lr': 0.00037102857277967387, 'samples': 10021248, 'steps': 52193, 'loss/train': 0.6603522896766663} -08/30/2021 22:38:26 - INFO - __main__ - Step 52195: {'lr': 0.0003710239293257734, 'samples': 10021440, 'steps': 52194, 'loss/train': 1.5604076385498047} -08/30/2021 22:38:27 - INFO - __main__ - Step 52196: {'lr': 0.00037101928581734136, 'samples': 10021632, 'steps': 52195, 'loss/train': 1.013862133026123} -08/30/2021 22:38:27 - INFO - __main__ - Step 52197: {'lr': 0.00037101464225437986, 'samples': 10021824, 'steps': 52196, 'loss/train': 1.314492106437683} -08/30/2021 22:38:28 - INFO - __main__ - Step 52198: {'lr': 0.0003710099986368911, 'samples': 10022016, 'steps': 52197, 'loss/train': 1.556799292564392} -08/30/2021 22:38:29 - INFO - __main__ - Step 52199: {'lr': 0.0003710053549648771, 'samples': 10022208, 'steps': 52198, 'loss/train': 1.0115553140640259} -08/30/2021 22:38:29 - INFO - __main__ - Step 52200: {'lr': 0.00037100071123833994, 'samples': 10022400, 'steps': 52199, 'loss/train': 1.64149808883667} -08/30/2021 22:38:30 - INFO - __main__ - Step 52201: {'lr': 0.0003709960674572817, 'samples': 10022592, 'steps': 52200, 'loss/train': 1.6783696413040161} -08/30/2021 22:38:30 - INFO - __main__ - Step 52202: {'lr': 0.00037099142362170454, 'samples': 10022784, 'steps': 52201, 'loss/train': 1.3250700235366821} -08/30/2021 22:38:32 - INFO - __main__ - Step 52203: {'lr': 0.0003709867797316105, 'samples': 10022976, 'steps': 52202, 'loss/train': 1.408653974533081} -08/30/2021 22:38:32 - INFO - __main__ - Step 52204: {'lr': 0.0003709821357870016, 'samples': 10023168, 'steps': 52203, 'loss/train': 1.126314640045166} -08/30/2021 22:38:33 - INFO - __main__ - Step 52205: {'lr': 0.0003709774917878802, 'samples': 10023360, 'steps': 52204, 'loss/train': 1.7212632894515991} -08/30/2021 22:38:33 - INFO - __main__ - Step 52206: {'lr': 0.00037097284773424805, 'samples': 10023552, 'steps': 52205, 'loss/train': 0.5544514060020447} -08/30/2021 22:38:33 - INFO - __main__ - Step 52207: {'lr': 0.0003709682036261075, 'samples': 10023744, 'steps': 52206, 'loss/train': 0.03223726153373718} -08/30/2021 22:38:34 - INFO - __main__ - Step 52208: {'lr': 0.00037096355946346045, 'samples': 10023936, 'steps': 52207, 'loss/train': 1.404617190361023} -08/30/2021 22:38:36 - INFO - __main__ - Step 52209: {'lr': 0.00037095891524630914, 'samples': 10024128, 'steps': 52208, 'loss/train': 1.5098602771759033} -08/30/2021 22:38:36 - INFO - __main__ - Step 52210: {'lr': 0.00037095427097465564, 'samples': 10024320, 'steps': 52209, 'loss/train': 1.3243461847305298} -08/30/2021 22:38:37 - INFO - __main__ - Step 52211: {'lr': 0.00037094962664850194, 'samples': 10024512, 'steps': 52210, 'loss/train': 1.4143859148025513} -08/30/2021 22:38:37 - INFO - __main__ - Step 52212: {'lr': 0.00037094498226785023, 'samples': 10024704, 'steps': 52211, 'loss/train': 0.0280526801943779} -08/30/2021 22:38:37 - INFO - __main__ - Step 52213: {'lr': 0.00037094033783270256, 'samples': 10024896, 'steps': 52212, 'loss/train': 1.2864248752593994} -08/30/2021 22:38:39 - INFO - __main__ - Step 52214: {'lr': 0.0003709356933430611, 'samples': 10025088, 'steps': 52213, 'loss/train': 0.8989865779876709} -08/30/2021 22:38:39 - INFO - __main__ - Step 52215: {'lr': 0.00037093104879892786, 'samples': 10025280, 'steps': 52214, 'loss/train': 1.8137493133544922} -08/30/2021 22:38:40 - INFO - __main__ - Step 52216: {'lr': 0.000370926404200305, 'samples': 10025472, 'steps': 52215, 'loss/train': 1.4083799123764038} -08/30/2021 22:38:40 - INFO - __main__ - Step 52217: {'lr': 0.0003709217595471945, 'samples': 10025664, 'steps': 52216, 'loss/train': 0.9888001680374146} -08/30/2021 22:38:40 - INFO - __main__ - Step 52218: {'lr': 0.0003709171148395985, 'samples': 10025856, 'steps': 52217, 'loss/train': 1.1968246698379517} -08/30/2021 22:38:41 - INFO - __main__ - Step 52219: {'lr': 0.00037091247007751916, 'samples': 10026048, 'steps': 52218, 'loss/train': 1.0894849300384521} -08/30/2021 22:38:42 - INFO - __main__ - Step 52220: {'lr': 0.0003709078252609585, 'samples': 10026240, 'steps': 52219, 'loss/train': 1.170340895652771} -08/30/2021 22:38:43 - INFO - __main__ - Step 52221: {'lr': 0.0003709031803899187, 'samples': 10026432, 'steps': 52220, 'loss/train': 0.9565987586975098} -08/30/2021 22:38:43 - INFO - __main__ - Step 52222: {'lr': 0.0003708985354644017, 'samples': 10026624, 'steps': 52221, 'loss/train': 1.477920413017273} -08/30/2021 22:38:43 - INFO - __main__ - Step 52223: {'lr': 0.00037089389048440975, 'samples': 10026816, 'steps': 52222, 'loss/train': 1.4444735050201416} -08/30/2021 22:38:44 - INFO - __main__ - Step 52224: {'lr': 0.0003708892454499448, 'samples': 10027008, 'steps': 52223, 'loss/train': 0.848482608795166} -08/30/2021 22:38:45 - INFO - __main__ - Step 52225: {'lr': 0.00037088460036100915, 'samples': 10027200, 'steps': 52224, 'loss/train': 1.201964259147644} -08/30/2021 22:38:46 - INFO - __main__ - Step 52226: {'lr': 0.0003708799552176046, 'samples': 10027392, 'steps': 52225, 'loss/train': 1.1147754192352295} -08/30/2021 22:38:46 - INFO - __main__ - Step 52227: {'lr': 0.0003708753100197336, 'samples': 10027584, 'steps': 52226, 'loss/train': 1.2671598196029663} -08/30/2021 22:38:46 - INFO - __main__ - Step 52228: {'lr': 0.00037087066476739795, 'samples': 10027776, 'steps': 52227, 'loss/train': 0.6710507869720459} -08/30/2021 22:38:47 - INFO - __main__ - Step 52229: {'lr': 0.0003708660194605998, 'samples': 10027968, 'steps': 52228, 'loss/train': 0.7408491969108582} -08/30/2021 22:38:48 - INFO - __main__ - Step 52230: {'lr': 0.0003708613740993414, 'samples': 10028160, 'steps': 52229, 'loss/train': 0.5190768837928772} -08/30/2021 22:38:49 - INFO - __main__ - Step 52231: {'lr': 0.00037085672868362464, 'samples': 10028352, 'steps': 52230, 'loss/train': 1.8946200609207153} -08/30/2021 22:38:49 - INFO - __main__ - Step 52232: {'lr': 0.0003708520832134518, 'samples': 10028544, 'steps': 52231, 'loss/train': 1.4070595502853394} -08/30/2021 22:38:49 - INFO - __main__ - Step 52233: {'lr': 0.00037084743768882474, 'samples': 10028736, 'steps': 52232, 'loss/train': 1.028970718383789} -08/30/2021 22:38:50 - INFO - __main__ - Step 52234: {'lr': 0.00037084279210974577, 'samples': 10028928, 'steps': 52233, 'loss/train': 0.7259479761123657} -08/30/2021 22:38:51 - INFO - __main__ - Step 52235: {'lr': 0.00037083814647621686, 'samples': 10029120, 'steps': 52234, 'loss/train': 0.802712082862854} -08/30/2021 22:38:52 - INFO - __main__ - Step 52236: {'lr': 0.0003708335007882402, 'samples': 10029312, 'steps': 52235, 'loss/train': 1.1849919557571411} -08/30/2021 22:38:52 - INFO - __main__ - Step 52237: {'lr': 0.00037082885504581775, 'samples': 10029504, 'steps': 52236, 'loss/train': 1.521113634109497} -08/30/2021 22:38:52 - INFO - __main__ - Step 52238: {'lr': 0.0003708242092489518, 'samples': 10029696, 'steps': 52237, 'loss/train': 1.4894156455993652} -08/30/2021 22:38:53 - INFO - __main__ - Step 52239: {'lr': 0.0003708195633976442, 'samples': 10029888, 'steps': 52238, 'loss/train': 1.1013530492782593} -08/30/2021 22:38:54 - INFO - __main__ - Step 52240: {'lr': 0.0003708149174918972, 'samples': 10030080, 'steps': 52239, 'loss/train': 1.670696496963501} -08/30/2021 22:38:55 - INFO - __main__ - Step 52241: {'lr': 0.000370810271531713, 'samples': 10030272, 'steps': 52240, 'loss/train': 2.102803945541382} -08/30/2021 22:38:55 - INFO - __main__ - Step 52242: {'lr': 0.0003708056255170934, 'samples': 10030464, 'steps': 52241, 'loss/train': 0.8963179588317871} -08/30/2021 22:38:55 - INFO - __main__ - Step 52243: {'lr': 0.0003708009794480407, 'samples': 10030656, 'steps': 52242, 'loss/train': 1.285918951034546} -08/30/2021 22:38:56 - INFO - __main__ - Step 52244: {'lr': 0.0003707963333245569, 'samples': 10030848, 'steps': 52243, 'loss/train': 1.614464521408081} -08/30/2021 22:38:57 - INFO - __main__ - Step 52245: {'lr': 0.0003707916871466442, 'samples': 10031040, 'steps': 52244, 'loss/train': 1.2795166969299316} -08/30/2021 22:38:58 - INFO - __main__ - Step 52246: {'lr': 0.0003707870409143046, 'samples': 10031232, 'steps': 52245, 'loss/train': 1.3110697269439697} -08/30/2021 22:38:58 - INFO - __main__ - Step 52247: {'lr': 0.00037078239462754023, 'samples': 10031424, 'steps': 52246, 'loss/train': 1.2178854942321777} -08/30/2021 22:38:59 - INFO - __main__ - Step 52248: {'lr': 0.0003707777482863532, 'samples': 10031616, 'steps': 52247, 'loss/train': 0.05008105933666229} -08/30/2021 22:38:59 - INFO - __main__ - Step 52249: {'lr': 0.00037077310189074554, 'samples': 10031808, 'steps': 52248, 'loss/train': 1.2083594799041748} -08/30/2021 22:39:00 - INFO - __main__ - Step 52250: {'lr': 0.0003707684554407194, 'samples': 10032000, 'steps': 52249, 'loss/train': 1.4056837558746338} -08/30/2021 22:39:01 - INFO - __main__ - Step 52251: {'lr': 0.0003707638089362769, 'samples': 10032192, 'steps': 52250, 'loss/train': 1.2372404336929321} -08/30/2021 22:39:01 - INFO - __main__ - Step 52252: {'lr': 0.00037075916237742, 'samples': 10032384, 'steps': 52251, 'loss/train': 0.036106839776039124} -08/30/2021 22:39:02 - INFO - __main__ - Step 52253: {'lr': 0.00037075451576415095, 'samples': 10032576, 'steps': 52252, 'loss/train': 1.2156604528427124} -08/30/2021 22:39:02 - INFO - __main__ - Step 52254: {'lr': 0.00037074986909647173, 'samples': 10032768, 'steps': 52253, 'loss/train': 1.2154524326324463} -08/30/2021 22:39:02 - INFO - __main__ - Step 52255: {'lr': 0.00037074522237438455, 'samples': 10032960, 'steps': 52254, 'loss/train': 1.1037936210632324} -08/30/2021 22:39:04 - INFO - __main__ - Step 52256: {'lr': 0.0003707405755978914, 'samples': 10033152, 'steps': 52255, 'loss/train': 0.24889405071735382} -08/30/2021 22:39:04 - INFO - __main__ - Step 52257: {'lr': 0.00037073592876699443, 'samples': 10033344, 'steps': 52256, 'loss/train': 1.2274162769317627} -08/30/2021 22:39:05 - INFO - __main__ - Step 52258: {'lr': 0.0003707312818816956, 'samples': 10033536, 'steps': 52257, 'loss/train': 1.145326018333435} -08/30/2021 22:39:05 - INFO - __main__ - Step 52259: {'lr': 0.00037072663494199724, 'samples': 10033728, 'steps': 52258, 'loss/train': 1.2771406173706055} -08/30/2021 22:39:05 - INFO - __main__ - Step 52260: {'lr': 0.0003707219879479013, 'samples': 10033920, 'steps': 52259, 'loss/train': 1.2544595003128052} -08/30/2021 22:39:08 - INFO - __main__ - Step 52261: {'lr': 0.0003707173408994099, 'samples': 10034112, 'steps': 52260, 'loss/train': 1.2631003856658936} -08/30/2021 22:39:08 - INFO - __main__ - Step 52262: {'lr': 0.0003707126937965251, 'samples': 10034304, 'steps': 52261, 'loss/train': 2.133697509765625} -08/30/2021 22:39:08 - INFO - __main__ - Step 52263: {'lr': 0.0003707080466392491, 'samples': 10034496, 'steps': 52262, 'loss/train': 1.2249665260314941} -08/30/2021 22:39:09 - INFO - __main__ - Step 52264: {'lr': 0.0003707033994275838, 'samples': 10034688, 'steps': 52263, 'loss/train': 1.5853255987167358} -08/30/2021 22:39:09 - INFO - __main__ - Step 52265: {'lr': 0.0003706987521615315, 'samples': 10034880, 'steps': 52264, 'loss/train': 1.1202856302261353} -08/30/2021 22:39:11 - INFO - __main__ - Step 52266: {'lr': 0.0003706941048410941, 'samples': 10035072, 'steps': 52265, 'loss/train': 1.6441651582717896} -08/30/2021 22:39:11 - INFO - __main__ - Step 52267: {'lr': 0.0003706894574662739, 'samples': 10035264, 'steps': 52266, 'loss/train': 1.4115123748779297} -08/30/2021 22:39:12 - INFO - __main__ - Step 52268: {'lr': 0.0003706848100370729, 'samples': 10035456, 'steps': 52267, 'loss/train': 1.4814977645874023} -08/30/2021 22:39:12 - INFO - __main__ - Step 52269: {'lr': 0.00037068016255349315, 'samples': 10035648, 'steps': 52268, 'loss/train': 1.3032234907150269} -08/30/2021 22:39:12 - INFO - __main__ - Step 52270: {'lr': 0.0003706755150155368, 'samples': 10035840, 'steps': 52269, 'loss/train': 1.1801214218139648} -08/30/2021 22:39:14 - INFO - __main__ - Step 52271: {'lr': 0.0003706708674232059, 'samples': 10036032, 'steps': 52270, 'loss/train': 2.0028908252716064} -08/30/2021 22:39:14 - INFO - __main__ - Step 52272: {'lr': 0.0003706662197765025, 'samples': 10036224, 'steps': 52271, 'loss/train': 1.1603450775146484} -08/30/2021 22:39:15 - INFO - __main__ - Step 52273: {'lr': 0.00037066157207542885, 'samples': 10036416, 'steps': 52272, 'loss/train': 0.9355124831199646} -08/30/2021 22:39:15 - INFO - __main__ - Step 52274: {'lr': 0.00037065692431998695, 'samples': 10036608, 'steps': 52273, 'loss/train': 1.1618053913116455} -08/30/2021 22:39:15 - INFO - __main__ - Step 52275: {'lr': 0.00037065227651017897, 'samples': 10036800, 'steps': 52274, 'loss/train': 1.3768295049667358} -08/30/2021 22:39:17 - INFO - __main__ - Step 52276: {'lr': 0.0003706476286460068, 'samples': 10036992, 'steps': 52275, 'loss/train': 1.458606481552124} -08/30/2021 22:39:17 - INFO - __main__ - Step 52277: {'lr': 0.0003706429807274728, 'samples': 10037184, 'steps': 52276, 'loss/train': 0.9733828902244568} -08/30/2021 22:39:18 - INFO - __main__ - Step 52278: {'lr': 0.0003706383327545788, 'samples': 10037376, 'steps': 52277, 'loss/train': 0.6269864439964294} -08/30/2021 22:39:18 - INFO - __main__ - Step 52279: {'lr': 0.0003706336847273271, 'samples': 10037568, 'steps': 52278, 'loss/train': 1.1764856576919556} -08/30/2021 22:39:18 - INFO - __main__ - Step 52280: {'lr': 0.00037062903664571975, 'samples': 10037760, 'steps': 52279, 'loss/train': 1.7229739427566528} -08/30/2021 22:39:19 - INFO - __main__ - Step 52281: {'lr': 0.00037062438850975877, 'samples': 10037952, 'steps': 52280, 'loss/train': 0.32705265283584595} -08/30/2021 22:39:20 - INFO - __main__ - Step 52282: {'lr': 0.00037061974031944635, 'samples': 10038144, 'steps': 52281, 'loss/train': 1.6630194187164307} -08/30/2021 22:39:21 - INFO - __main__ - Step 52283: {'lr': 0.0003706150920747845, 'samples': 10038336, 'steps': 52282, 'loss/train': 1.8692938089370728} -08/30/2021 22:39:21 - INFO - __main__ - Step 52284: {'lr': 0.00037061044377577535, 'samples': 10038528, 'steps': 52283, 'loss/train': 1.044979453086853} -08/30/2021 22:39:21 - INFO - __main__ - Step 52285: {'lr': 0.00037060579542242094, 'samples': 10038720, 'steps': 52284, 'loss/train': 1.1428381204605103} -08/30/2021 22:39:22 - INFO - __main__ - Step 52286: {'lr': 0.00037060114701472355, 'samples': 10038912, 'steps': 52285, 'loss/train': 1.7768486738204956} -08/30/2021 22:39:23 - INFO - __main__ - Step 52287: {'lr': 0.00037059649855268503, 'samples': 10039104, 'steps': 52286, 'loss/train': 1.559008002281189} -08/30/2021 22:39:24 - INFO - __main__ - Step 52288: {'lr': 0.0003705918500363077, 'samples': 10039296, 'steps': 52287, 'loss/train': 1.487499475479126} -08/30/2021 22:39:24 - INFO - __main__ - Step 52289: {'lr': 0.0003705872014655934, 'samples': 10039488, 'steps': 52288, 'loss/train': 1.2089561223983765} -08/30/2021 22:39:24 - INFO - __main__ - Step 52290: {'lr': 0.0003705825528405445, 'samples': 10039680, 'steps': 52289, 'loss/train': 1.0980134010314941} -08/30/2021 22:39:25 - INFO - __main__ - Step 52291: {'lr': 0.0003705779041611629, 'samples': 10039872, 'steps': 52290, 'loss/train': 0.9486036896705627} -08/30/2021 22:39:27 - INFO - __main__ - Step 52292: {'lr': 0.00037057325542745075, 'samples': 10040064, 'steps': 52291, 'loss/train': 0.9440996646881104} -08/30/2021 22:39:27 - INFO - __main__ - Step 52293: {'lr': 0.00037056860663941014, 'samples': 10040256, 'steps': 52292, 'loss/train': 1.1637372970581055} -08/30/2021 22:39:28 - INFO - __main__ - Step 52294: {'lr': 0.0003705639577970432, 'samples': 10040448, 'steps': 52293, 'loss/train': 0.6139895915985107} -08/30/2021 22:39:28 - INFO - __main__ - Step 52295: {'lr': 0.00037055930890035203, 'samples': 10040640, 'steps': 52294, 'loss/train': 1.789811372756958} -08/30/2021 22:39:28 - INFO - __main__ - Step 52296: {'lr': 0.00037055465994933866, 'samples': 10040832, 'steps': 52295, 'loss/train': 1.6707935333251953} -08/30/2021 22:39:29 - INFO - __main__ - Step 52297: {'lr': 0.00037055001094400523, 'samples': 10041024, 'steps': 52296, 'loss/train': 0.9426714181900024} -08/30/2021 22:39:29 - INFO - __main__ - Step 52298: {'lr': 0.0003705453618843538, 'samples': 10041216, 'steps': 52297, 'loss/train': 1.2685478925704956} -08/30/2021 22:39:31 - INFO - __main__ - Step 52299: {'lr': 0.00037054071277038654, 'samples': 10041408, 'steps': 52298, 'loss/train': 1.4617962837219238} -08/30/2021 22:39:31 - INFO - __main__ - Step 52300: {'lr': 0.00037053606360210544, 'samples': 10041600, 'steps': 52299, 'loss/train': 1.7167713642120361} -08/30/2021 22:39:32 - INFO - __main__ - Step 52301: {'lr': 0.00037053141437951264, 'samples': 10041792, 'steps': 52300, 'loss/train': 1.043386459350586} -08/30/2021 22:39:32 - INFO - __main__ - Step 52302: {'lr': 0.00037052676510261043, 'samples': 10041984, 'steps': 52301, 'loss/train': 1.5842963457107544} -08/30/2021 22:39:32 - INFO - __main__ - Step 52303: {'lr': 0.00037052211577140047, 'samples': 10042176, 'steps': 52302, 'loss/train': 0.8494521975517273} -08/30/2021 22:39:34 - INFO - __main__ - Step 52304: {'lr': 0.00037051746638588526, 'samples': 10042368, 'steps': 52303, 'loss/train': 1.5008400678634644} -08/30/2021 22:39:34 - INFO - __main__ - Step 52305: {'lr': 0.00037051281694606666, 'samples': 10042560, 'steps': 52304, 'loss/train': 1.7783734798431396} -08/30/2021 22:39:35 - INFO - __main__ - Step 52306: {'lr': 0.00037050816745194686, 'samples': 10042752, 'steps': 52305, 'loss/train': 1.68411386013031} -08/30/2021 22:39:35 - INFO - __main__ - Step 52307: {'lr': 0.00037050351790352795, 'samples': 10042944, 'steps': 52306, 'loss/train': 1.420371174812317} -08/30/2021 22:39:35 - INFO - __main__ - Step 52308: {'lr': 0.00037049886830081203, 'samples': 10043136, 'steps': 52307, 'loss/train': 1.277109980583191} -08/30/2021 22:39:37 - INFO - __main__ - Step 52309: {'lr': 0.00037049421864380116, 'samples': 10043328, 'steps': 52308, 'loss/train': 0.07898920774459839} -08/30/2021 22:39:37 - INFO - __main__ - Step 52310: {'lr': 0.00037048956893249746, 'samples': 10043520, 'steps': 52309, 'loss/train': 1.2166470289230347} -08/30/2021 22:39:38 - INFO - __main__ - Step 52311: {'lr': 0.00037048491916690304, 'samples': 10043712, 'steps': 52310, 'loss/train': 1.446404218673706} -08/30/2021 22:39:38 - INFO - __main__ - Step 52312: {'lr': 0.00037048026934701997, 'samples': 10043904, 'steps': 52311, 'loss/train': 0.5290502309799194} -08/30/2021 22:39:38 - INFO - __main__ - Step 52313: {'lr': 0.0003704756194728503, 'samples': 10044096, 'steps': 52312, 'loss/train': 0.045182596892118454} -08/30/2021 22:39:40 - INFO - __main__ - Step 52314: {'lr': 0.0003704709695443962, 'samples': 10044288, 'steps': 52313, 'loss/train': 1.4563908576965332} -08/30/2021 22:39:41 - INFO - __main__ - Step 52315: {'lr': 0.00037046631956165975, 'samples': 10044480, 'steps': 52314, 'loss/train': 1.4502958059310913} -08/30/2021 22:39:41 - INFO - __main__ - Step 52316: {'lr': 0.00037046166952464307, 'samples': 10044672, 'steps': 52315, 'loss/train': 3.084468126296997} -08/30/2021 22:39:42 - INFO - __main__ - Step 52317: {'lr': 0.00037045701943334814, 'samples': 10044864, 'steps': 52316, 'loss/train': 0.8483191728591919} -08/30/2021 22:39:42 - INFO - __main__ - Step 52318: {'lr': 0.0003704523692877772, 'samples': 10045056, 'steps': 52317, 'loss/train': 1.269869327545166} -08/30/2021 22:39:43 - INFO - __main__ - Step 52319: {'lr': 0.00037044771908793225, 'samples': 10045248, 'steps': 52318, 'loss/train': 4.282064914703369} -08/30/2021 22:39:44 - INFO - __main__ - Step 52320: {'lr': 0.0003704430688338154, 'samples': 10045440, 'steps': 52319, 'loss/train': 0.5108669996261597} -08/30/2021 22:39:44 - INFO - __main__ - Step 52321: {'lr': 0.0003704384185254288, 'samples': 10045632, 'steps': 52320, 'loss/train': 0.8352671265602112} -08/30/2021 22:39:45 - INFO - __main__ - Step 52322: {'lr': 0.00037043376816277453, 'samples': 10045824, 'steps': 52321, 'loss/train': 1.8320648670196533} -08/30/2021 22:39:45 - INFO - __main__ - Step 52323: {'lr': 0.00037042911774585465, 'samples': 10046016, 'steps': 52322, 'loss/train': 1.0616240501403809} -08/30/2021 22:39:45 - INFO - __main__ - Step 52324: {'lr': 0.0003704244672746712, 'samples': 10046208, 'steps': 52323, 'loss/train': 0.8754017949104309} -08/30/2021 22:39:47 - INFO - __main__ - Step 52325: {'lr': 0.00037041981674922644, 'samples': 10046400, 'steps': 52324, 'loss/train': 1.6019108295440674} -08/30/2021 22:39:47 - INFO - __main__ - Step 52326: {'lr': 0.00037041516616952223, 'samples': 10046592, 'steps': 52325, 'loss/train': 0.7316842675209045} -08/30/2021 22:39:48 - INFO - __main__ - Step 52327: {'lr': 0.0003704105155355609, 'samples': 10046784, 'steps': 52326, 'loss/train': 1.4071804285049438} -08/30/2021 22:39:48 - INFO - __main__ - Step 52328: {'lr': 0.0003704058648473445, 'samples': 10046976, 'steps': 52327, 'loss/train': 1.074450135231018} -08/30/2021 22:39:48 - INFO - __main__ - Step 52329: {'lr': 0.000370401214104875, 'samples': 10047168, 'steps': 52328, 'loss/train': 2.788742780685425} -08/30/2021 22:39:50 - INFO - __main__ - Step 52330: {'lr': 0.0003703965633081546, 'samples': 10047360, 'steps': 52329, 'loss/train': 1.180933952331543} -08/30/2021 22:39:50 - INFO - __main__ - Step 52331: {'lr': 0.00037039191245718536, 'samples': 10047552, 'steps': 52330, 'loss/train': 1.1655426025390625} -08/30/2021 22:39:51 - INFO - __main__ - Step 52332: {'lr': 0.00037038726155196934, 'samples': 10047744, 'steps': 52331, 'loss/train': 0.07808967679738998} -08/30/2021 22:39:51 - INFO - __main__ - Step 52333: {'lr': 0.00037038261059250873, 'samples': 10047936, 'steps': 52332, 'loss/train': 1.2504870891571045} -08/30/2021 22:39:51 - INFO - __main__ - Step 52334: {'lr': 0.0003703779595788056, 'samples': 10048128, 'steps': 52333, 'loss/train': 1.4041295051574707} -08/30/2021 22:39:53 - INFO - __main__ - Step 52335: {'lr': 0.00037037330851086194, 'samples': 10048320, 'steps': 52334, 'loss/train': 1.4801279306411743} -08/30/2021 22:39:53 - INFO - __main__ - Step 52336: {'lr': 0.00037036865738868, 'samples': 10048512, 'steps': 52335, 'loss/train': 1.13273024559021} -08/30/2021 22:39:54 - INFO - __main__ - Step 52337: {'lr': 0.00037036400621226175, 'samples': 10048704, 'steps': 52336, 'loss/train': 1.8517225980758667} -08/30/2021 22:39:54 - INFO - __main__ - Step 52338: {'lr': 0.00037035935498160933, 'samples': 10048896, 'steps': 52337, 'loss/train': 1.3364348411560059} -08/30/2021 22:39:54 - INFO - __main__ - Step 52339: {'lr': 0.00037035470369672484, 'samples': 10049088, 'steps': 52338, 'loss/train': 0.5864757299423218} -08/30/2021 22:39:56 - INFO - __main__ - Step 52340: {'lr': 0.0003703500523576104, 'samples': 10049280, 'steps': 52339, 'loss/train': 1.467815637588501} -08/30/2021 22:39:56 - INFO - __main__ - Step 52341: {'lr': 0.0003703454009642681, 'samples': 10049472, 'steps': 52340, 'loss/train': 1.2310173511505127} -08/30/2021 22:39:57 - INFO - __main__ - Step 52342: {'lr': 0.0003703407495167, 'samples': 10049664, 'steps': 52341, 'loss/train': 1.3627800941467285} -08/30/2021 22:39:57 - INFO - __main__ - Step 52343: {'lr': 0.0003703360980149082, 'samples': 10049856, 'steps': 52342, 'loss/train': 1.3972407579421997} -08/30/2021 22:39:57 - INFO - __main__ - Step 52344: {'lr': 0.00037033144645889487, 'samples': 10050048, 'steps': 52343, 'loss/train': 1.2970020771026611} -08/30/2021 22:39:59 - INFO - __main__ - Step 52345: {'lr': 0.000370326794848662, 'samples': 10050240, 'steps': 52344, 'loss/train': 1.2972080707550049} -08/30/2021 22:39:59 - INFO - __main__ - Step 52346: {'lr': 0.00037032214318421174, 'samples': 10050432, 'steps': 52345, 'loss/train': 1.8222229480743408} -08/30/2021 22:40:00 - INFO - __main__ - Step 52347: {'lr': 0.00037031749146554616, 'samples': 10050624, 'steps': 52346, 'loss/train': 1.2135664224624634} -08/30/2021 22:40:00 - INFO - __main__ - Step 52348: {'lr': 0.00037031283969266737, 'samples': 10050816, 'steps': 52347, 'loss/train': 1.1267591714859009} -08/30/2021 22:40:00 - INFO - __main__ - Step 52349: {'lr': 0.0003703081878655775, 'samples': 10051008, 'steps': 52348, 'loss/train': 1.8772066831588745} -08/30/2021 22:40:02 - INFO - __main__ - Step 52350: {'lr': 0.00037030353598427866, 'samples': 10051200, 'steps': 52349, 'loss/train': 1.3223580121994019} -08/30/2021 22:40:02 - INFO - __main__ - Step 52351: {'lr': 0.0003702988840487728, 'samples': 10051392, 'steps': 52350, 'loss/train': 1.4786609411239624} -08/30/2021 22:40:03 - INFO - __main__ - Step 52352: {'lr': 0.0003702942320590622, 'samples': 10051584, 'steps': 52351, 'loss/train': 1.244758129119873} -08/30/2021 22:40:03 - INFO - __main__ - Step 52353: {'lr': 0.00037028958001514886, 'samples': 10051776, 'steps': 52352, 'loss/train': 1.202074646949768} -08/30/2021 22:40:03 - INFO - __main__ - Step 52354: {'lr': 0.00037028492791703484, 'samples': 10051968, 'steps': 52353, 'loss/train': 0.9333009123802185} -08/30/2021 22:40:05 - INFO - __main__ - Step 52355: {'lr': 0.0003702802757647223, 'samples': 10052160, 'steps': 52354, 'loss/train': 0.4106811583042145} -08/30/2021 22:40:05 - INFO - __main__ - Step 52356: {'lr': 0.0003702756235582134, 'samples': 10052352, 'steps': 52355, 'loss/train': 1.2768062353134155} -08/30/2021 22:40:06 - INFO - __main__ - Step 52357: {'lr': 0.00037027097129751016, 'samples': 10052544, 'steps': 52356, 'loss/train': 0.8792566061019897} -08/30/2021 22:40:06 - INFO - __main__ - Step 52358: {'lr': 0.0003702663189826146, 'samples': 10052736, 'steps': 52357, 'loss/train': 1.7622770071029663} -08/30/2021 22:40:06 - INFO - __main__ - Step 52359: {'lr': 0.0003702616666135289, 'samples': 10052928, 'steps': 52358, 'loss/train': 1.0969775915145874} -08/30/2021 22:40:08 - INFO - __main__ - Step 52360: {'lr': 0.0003702570141902552, 'samples': 10053120, 'steps': 52359, 'loss/train': 1.6986440420150757} -08/30/2021 22:40:08 - INFO - __main__ - Step 52361: {'lr': 0.00037025236171279546, 'samples': 10053312, 'steps': 52360, 'loss/train': 1.5727958679199219} -08/30/2021 22:40:08 - INFO - __main__ - Step 52362: {'lr': 0.000370247709181152, 'samples': 10053504, 'steps': 52361, 'loss/train': 1.4509665966033936} -08/30/2021 22:40:09 - INFO - __main__ - Step 52363: {'lr': 0.00037024305659532665, 'samples': 10053696, 'steps': 52362, 'loss/train': 1.1041913032531738} -08/30/2021 22:40:09 - INFO - __main__ - Step 52364: {'lr': 0.00037023840395532167, 'samples': 10053888, 'steps': 52363, 'loss/train': 1.389992594718933} -08/30/2021 22:40:10 - INFO - __main__ - Step 52365: {'lr': 0.0003702337512611391, 'samples': 10054080, 'steps': 52364, 'loss/train': 1.3814351558685303} -08/30/2021 22:40:11 - INFO - __main__ - Step 52366: {'lr': 0.00037022909851278107, 'samples': 10054272, 'steps': 52365, 'loss/train': 0.6395887136459351} -08/30/2021 22:40:11 - INFO - __main__ - Step 52367: {'lr': 0.0003702244457102497, 'samples': 10054464, 'steps': 52366, 'loss/train': 1.6485730409622192} -08/30/2021 22:40:12 - INFO - __main__ - Step 52368: {'lr': 0.000370219792853547, 'samples': 10054656, 'steps': 52367, 'loss/train': 1.6054531335830688} -08/30/2021 22:40:12 - INFO - __main__ - Step 52369: {'lr': 0.0003702151399426752, 'samples': 10054848, 'steps': 52368, 'loss/train': 1.5226519107818604} -08/30/2021 22:40:13 - INFO - __main__ - Step 52370: {'lr': 0.0003702104869776362, 'samples': 10055040, 'steps': 52369, 'loss/train': 1.3941231966018677} -08/30/2021 22:40:14 - INFO - __main__ - Step 52371: {'lr': 0.0003702058339584323, 'samples': 10055232, 'steps': 52370, 'loss/train': 1.1772795915603638} -08/30/2021 22:40:15 - INFO - __main__ - Step 52372: {'lr': 0.00037020118088506546, 'samples': 10055424, 'steps': 52371, 'loss/train': 1.3694539070129395} -08/30/2021 22:40:15 - INFO - __main__ - Step 52373: {'lr': 0.0003701965277575378, 'samples': 10055616, 'steps': 52372, 'loss/train': 1.0295183658599854} -08/30/2021 22:40:16 - INFO - __main__ - Step 52374: {'lr': 0.0003701918745758515, 'samples': 10055808, 'steps': 52373, 'loss/train': 1.2487298250198364} -08/30/2021 22:40:16 - INFO - __main__ - Step 52375: {'lr': 0.00037018722134000856, 'samples': 10056000, 'steps': 52374, 'loss/train': 1.340018391609192} -08/30/2021 22:40:18 - INFO - __main__ - Step 52376: {'lr': 0.00037018256805001115, 'samples': 10056192, 'steps': 52375, 'loss/train': 0.907055139541626} -08/30/2021 22:40:18 - INFO - __main__ - Step 52377: {'lr': 0.00037017791470586126, 'samples': 10056384, 'steps': 52376, 'loss/train': 0.720424234867096} -08/30/2021 22:40:18 - INFO - __main__ - Step 52378: {'lr': 0.0003701732613075611, 'samples': 10056576, 'steps': 52377, 'loss/train': 1.5016816854476929} -08/30/2021 22:40:19 - INFO - __main__ - Step 52379: {'lr': 0.00037016860785511274, 'samples': 10056768, 'steps': 52378, 'loss/train': 1.357456922531128} -08/30/2021 22:40:19 - INFO - __main__ - Step 52380: {'lr': 0.00037016395434851825, 'samples': 10056960, 'steps': 52379, 'loss/train': 1.652008056640625} -08/30/2021 22:40:21 - INFO - __main__ - Step 52381: {'lr': 0.0003701593007877797, 'samples': 10057152, 'steps': 52380, 'loss/train': 1.3944809436798096} -08/30/2021 22:40:21 - INFO - __main__ - Step 52382: {'lr': 0.00037015464717289924, 'samples': 10057344, 'steps': 52381, 'loss/train': 1.0370922088623047} -08/30/2021 22:40:21 - INFO - __main__ - Step 52383: {'lr': 0.000370149993503879, 'samples': 10057536, 'steps': 52382, 'loss/train': 1.397559404373169} -08/30/2021 22:40:22 - INFO - __main__ - Step 52384: {'lr': 0.000370145339780721, 'samples': 10057728, 'steps': 52383, 'loss/train': 0.9382269382476807} -08/30/2021 22:40:22 - INFO - __main__ - Step 52385: {'lr': 0.0003701406860034273, 'samples': 10057920, 'steps': 52384, 'loss/train': 0.9200490713119507} -08/30/2021 22:40:24 - INFO - __main__ - Step 52386: {'lr': 0.0003701360321720001, 'samples': 10058112, 'steps': 52385, 'loss/train': 1.21071457862854} -08/30/2021 22:40:24 - INFO - __main__ - Step 52387: {'lr': 0.0003701313782864415, 'samples': 10058304, 'steps': 52386, 'loss/train': 1.793806552886963} -08/30/2021 22:40:24 - INFO - __main__ - Step 52388: {'lr': 0.0003701267243467535, 'samples': 10058496, 'steps': 52387, 'loss/train': 1.447556734085083} -08/30/2021 22:40:25 - INFO - __main__ - Step 52389: {'lr': 0.00037012207035293834, 'samples': 10058688, 'steps': 52388, 'loss/train': 0.9450122117996216} -08/30/2021 22:40:25 - INFO - __main__ - Step 52390: {'lr': 0.00037011741630499796, 'samples': 10058880, 'steps': 52389, 'loss/train': 0.9967343807220459} -08/30/2021 22:40:27 - INFO - __main__ - Step 52391: {'lr': 0.00037011276220293447, 'samples': 10059072, 'steps': 52390, 'loss/train': 0.8369120955467224} -08/30/2021 22:40:27 - INFO - __main__ - Step 52392: {'lr': 0.0003701081080467501, 'samples': 10059264, 'steps': 52391, 'loss/train': 1.4139078855514526} -08/30/2021 22:40:28 - INFO - __main__ - Step 52393: {'lr': 0.0003701034538364468, 'samples': 10059456, 'steps': 52392, 'loss/train': 1.3424862623214722} -08/30/2021 22:40:28 - INFO - __main__ - Step 52394: {'lr': 0.0003700987995720269, 'samples': 10059648, 'steps': 52393, 'loss/train': 0.15181411802768707} -08/30/2021 22:40:28 - INFO - __main__ - Step 52395: {'lr': 0.0003700941452534922, 'samples': 10059840, 'steps': 52394, 'loss/train': 1.1930989027023315} -08/30/2021 22:40:30 - INFO - __main__ - Step 52396: {'lr': 0.0003700894908808449, 'samples': 10060032, 'steps': 52395, 'loss/train': 1.1837990283966064} -08/30/2021 22:40:30 - INFO - __main__ - Step 52397: {'lr': 0.0003700848364540872, 'samples': 10060224, 'steps': 52396, 'loss/train': 1.0149868726730347} -08/30/2021 22:40:31 - INFO - __main__ - Step 52398: {'lr': 0.0003700801819732211, 'samples': 10060416, 'steps': 52397, 'loss/train': 1.2782669067382812} -08/30/2021 22:40:31 - INFO - __main__ - Step 52399: {'lr': 0.0003700755274382487, 'samples': 10060608, 'steps': 52398, 'loss/train': 1.7821123600006104} -08/30/2021 22:40:31 - INFO - __main__ - Step 52400: {'lr': 0.0003700708728491722, 'samples': 10060800, 'steps': 52399, 'loss/train': 1.3672199249267578} -08/30/2021 22:40:32 - INFO - __main__ - Step 52401: {'lr': 0.0003700662182059936, 'samples': 10060992, 'steps': 52400, 'loss/train': 1.58430814743042} -08/30/2021 22:40:33 - INFO - __main__ - Step 52402: {'lr': 0.0003700615635087149, 'samples': 10061184, 'steps': 52401, 'loss/train': 1.5426716804504395} -08/30/2021 22:40:34 - INFO - __main__ - Step 52403: {'lr': 0.00037005690875733843, 'samples': 10061376, 'steps': 52402, 'loss/train': 1.6156574487686157} -08/30/2021 22:40:34 - INFO - __main__ - Step 52404: {'lr': 0.00037005225395186616, 'samples': 10061568, 'steps': 52403, 'loss/train': 0.9607453942298889} -08/30/2021 22:40:34 - INFO - __main__ - Step 52405: {'lr': 0.00037004759909230016, 'samples': 10061760, 'steps': 52404, 'loss/train': 1.4426928758621216} -08/30/2021 22:40:35 - INFO - __main__ - Step 52406: {'lr': 0.0003700429441786426, 'samples': 10061952, 'steps': 52405, 'loss/train': 2.022247791290283} -08/30/2021 22:40:36 - INFO - __main__ - Step 52407: {'lr': 0.0003700382892108955, 'samples': 10062144, 'steps': 52406, 'loss/train': 1.1005101203918457} -08/30/2021 22:40:37 - INFO - __main__ - Step 52408: {'lr': 0.000370033634189061, 'samples': 10062336, 'steps': 52407, 'loss/train': 1.1651203632354736} -08/30/2021 22:40:37 - INFO - __main__ - Step 52409: {'lr': 0.00037002897911314126, 'samples': 10062528, 'steps': 52408, 'loss/train': 1.8726836442947388} -08/30/2021 22:40:37 - INFO - __main__ - Step 52410: {'lr': 0.0003700243239831382, 'samples': 10062720, 'steps': 52409, 'loss/train': 1.4716858863830566} -08/30/2021 22:40:38 - INFO - __main__ - Step 52411: {'lr': 0.00037001966879905414, 'samples': 10062912, 'steps': 52410, 'loss/train': 0.6313852071762085} -08/30/2021 22:40:39 - INFO - __main__ - Step 52412: {'lr': 0.00037001501356089103, 'samples': 10063104, 'steps': 52411, 'loss/train': 0.39188385009765625} -08/30/2021 22:40:40 - INFO - __main__ - Step 52413: {'lr': 0.00037001035826865096, 'samples': 10063296, 'steps': 52412, 'loss/train': 1.2267366647720337} -08/30/2021 22:40:40 - INFO - __main__ - Step 52414: {'lr': 0.00037000570292233613, 'samples': 10063488, 'steps': 52413, 'loss/train': 1.1633687019348145} -08/30/2021 22:40:40 - INFO - __main__ - Step 52415: {'lr': 0.00037000104752194857, 'samples': 10063680, 'steps': 52414, 'loss/train': 1.654394507408142} -08/30/2021 22:40:41 - INFO - __main__ - Step 52416: {'lr': 0.0003699963920674905, 'samples': 10063872, 'steps': 52415, 'loss/train': 0.7835513949394226} -08/30/2021 22:40:42 - INFO - __main__ - Step 52417: {'lr': 0.00036999173655896374, 'samples': 10064064, 'steps': 52416, 'loss/train': 0.6513194441795349} -08/30/2021 22:40:43 - INFO - __main__ - Step 52418: {'lr': 0.00036998708099637064, 'samples': 10064256, 'steps': 52417, 'loss/train': 1.0289289951324463} -08/30/2021 22:40:43 - INFO - __main__ - Step 52419: {'lr': 0.00036998242537971315, 'samples': 10064448, 'steps': 52418, 'loss/train': 1.5378395318984985} -08/30/2021 22:40:43 - INFO - __main__ - Step 52420: {'lr': 0.00036997776970899344, 'samples': 10064640, 'steps': 52419, 'loss/train': 0.5900610089302063} -08/30/2021 22:40:44 - INFO - __main__ - Step 52421: {'lr': 0.0003699731139842136, 'samples': 10064832, 'steps': 52420, 'loss/train': 1.4941169023513794} -08/30/2021 22:40:46 - INFO - __main__ - Step 52422: {'lr': 0.0003699684582053758, 'samples': 10065024, 'steps': 52421, 'loss/train': 1.9544343948364258} -08/30/2021 22:40:46 - INFO - __main__ - Step 52423: {'lr': 0.00036996380237248205, 'samples': 10065216, 'steps': 52422, 'loss/train': 1.8961485624313354} -08/30/2021 22:40:46 - INFO - __main__ - Step 52424: {'lr': 0.0003699591464855344, 'samples': 10065408, 'steps': 52423, 'loss/train': 1.8910959959030151} -08/30/2021 22:40:47 - INFO - __main__ - Step 52425: {'lr': 0.00036995449054453503, 'samples': 10065600, 'steps': 52424, 'loss/train': 1.1313529014587402} -08/30/2021 22:40:47 - INFO - __main__ - Step 52426: {'lr': 0.00036994983454948605, 'samples': 10065792, 'steps': 52425, 'loss/train': 1.0586100816726685} -08/30/2021 22:40:48 - INFO - __main__ - Step 52427: {'lr': 0.0003699451785003895, 'samples': 10065984, 'steps': 52426, 'loss/train': 0.24465444684028625} -08/30/2021 22:40:49 - INFO - __main__ - Step 52428: {'lr': 0.0003699405223972475, 'samples': 10066176, 'steps': 52427, 'loss/train': 1.4322913885116577} -08/30/2021 22:40:49 - INFO - __main__ - Step 52429: {'lr': 0.0003699358662400622, 'samples': 10066368, 'steps': 52428, 'loss/train': 1.0574884414672852} -08/30/2021 22:40:50 - INFO - __main__ - Step 52430: {'lr': 0.00036993121002883557, 'samples': 10066560, 'steps': 52429, 'loss/train': 1.6161199808120728} -08/30/2021 22:40:50 - INFO - __main__ - Step 52431: {'lr': 0.0003699265537635698, 'samples': 10066752, 'steps': 52430, 'loss/train': 1.2440955638885498} -08/30/2021 22:40:50 - INFO - __main__ - Step 52432: {'lr': 0.000369921897444267, 'samples': 10066944, 'steps': 52431, 'loss/train': 1.5929423570632935} -08/30/2021 22:40:52 - INFO - __main__ - Step 52433: {'lr': 0.00036991724107092927, 'samples': 10067136, 'steps': 52432, 'loss/train': 0.774193525314331} -08/30/2021 22:40:53 - INFO - __main__ - Step 52434: {'lr': 0.00036991258464355863, 'samples': 10067328, 'steps': 52433, 'loss/train': 1.5099691152572632} -08/30/2021 22:40:53 - INFO - __main__ - Step 52435: {'lr': 0.00036990792816215726, 'samples': 10067520, 'steps': 52434, 'loss/train': 0.6877488493919373} -08/30/2021 22:40:53 - INFO - __main__ - Step 52436: {'lr': 0.0003699032716267273, 'samples': 10067712, 'steps': 52435, 'loss/train': 1.5035206079483032} -08/30/2021 22:40:54 - INFO - __main__ - Step 52437: {'lr': 0.00036989861503727064, 'samples': 10067904, 'steps': 52436, 'loss/train': 0.06316174566745758} -08/30/2021 22:40:56 - INFO - __main__ - Step 52438: {'lr': 0.0003698939583937896, 'samples': 10068096, 'steps': 52437, 'loss/train': 1.3215692043304443} -08/30/2021 22:40:56 - INFO - __main__ - Step 52439: {'lr': 0.0003698893016962861, 'samples': 10068288, 'steps': 52438, 'loss/train': 1.4051921367645264} -08/30/2021 22:40:57 - INFO - __main__ - Step 52440: {'lr': 0.00036988464494476243, 'samples': 10068480, 'steps': 52439, 'loss/train': 1.5172953605651855} -08/30/2021 22:40:57 - INFO - __main__ - Step 52441: {'lr': 0.0003698799881392205, 'samples': 10068672, 'steps': 52440, 'loss/train': 2.1231069564819336} -08/30/2021 22:40:57 - INFO - __main__ - Step 52442: {'lr': 0.00036987533127966253, 'samples': 10068864, 'steps': 52441, 'loss/train': 2.6003541946411133} -08/30/2021 22:40:58 - INFO - __main__ - Step 52443: {'lr': 0.0003698706743660907, 'samples': 10069056, 'steps': 52442, 'loss/train': 1.0377814769744873} -08/30/2021 22:40:59 - INFO - __main__ - Step 52444: {'lr': 0.0003698660173985069, 'samples': 10069248, 'steps': 52443, 'loss/train': 1.5682061910629272} -08/30/2021 22:41:00 - INFO - __main__ - Step 52445: {'lr': 0.0003698613603769133, 'samples': 10069440, 'steps': 52444, 'loss/train': 0.562687873840332} -08/30/2021 22:41:00 - INFO - __main__ - Step 52446: {'lr': 0.00036985670330131205, 'samples': 10069632, 'steps': 52445, 'loss/train': 0.48358389735221863} -08/30/2021 22:41:01 - INFO - __main__ - Step 52447: {'lr': 0.0003698520461717052, 'samples': 10069824, 'steps': 52446, 'loss/train': 1.5141595602035522} -08/30/2021 22:41:01 - INFO - __main__ - Step 52448: {'lr': 0.0003698473889880949, 'samples': 10070016, 'steps': 52447, 'loss/train': 1.0403631925582886} -08/30/2021 22:41:01 - INFO - __main__ - Step 52449: {'lr': 0.0003698427317504832, 'samples': 10070208, 'steps': 52448, 'loss/train': 1.3709241151809692} -08/30/2021 22:41:03 - INFO - __main__ - Step 52450: {'lr': 0.00036983807445887217, 'samples': 10070400, 'steps': 52449, 'loss/train': 1.142431378364563} -08/30/2021 22:41:04 - INFO - __main__ - Step 52451: {'lr': 0.00036983341711326403, 'samples': 10070592, 'steps': 52450, 'loss/train': 0.9625751972198486} -08/30/2021 22:41:04 - INFO - __main__ - Step 52452: {'lr': 0.00036982875971366074, 'samples': 10070784, 'steps': 52451, 'loss/train': 0.9042155146598816} -08/30/2021 22:41:04 - INFO - __main__ - Step 52453: {'lr': 0.00036982410226006445, 'samples': 10070976, 'steps': 52452, 'loss/train': 0.9322705864906311} -08/30/2021 22:41:05 - INFO - __main__ - Step 52454: {'lr': 0.0003698194447524773, 'samples': 10071168, 'steps': 52453, 'loss/train': 0.038686178624629974} -08/30/2021 22:41:06 - INFO - __main__ - Step 52455: {'lr': 0.0003698147871909014, 'samples': 10071360, 'steps': 52454, 'loss/train': 1.4055453538894653} -08/30/2021 22:41:07 - INFO - __main__ - Step 52456: {'lr': 0.0003698101295753388, 'samples': 10071552, 'steps': 52455, 'loss/train': 0.5228376388549805} -08/30/2021 22:41:07 - INFO - __main__ - Step 52457: {'lr': 0.00036980547190579153, 'samples': 10071744, 'steps': 52456, 'loss/train': 2.513827085494995} -08/30/2021 22:41:07 - INFO - __main__ - Step 52458: {'lr': 0.0003698008141822618, 'samples': 10071936, 'steps': 52457, 'loss/train': 0.13966025412082672} -08/30/2021 22:41:08 - INFO - __main__ - Step 52459: {'lr': 0.00036979615640475165, 'samples': 10072128, 'steps': 52458, 'loss/train': 1.3464133739471436} -08/30/2021 22:41:10 - INFO - __main__ - Step 52460: {'lr': 0.0003697914985732632, 'samples': 10072320, 'steps': 52459, 'loss/train': 1.2128422260284424} -08/30/2021 22:41:10 - INFO - __main__ - Step 52461: {'lr': 0.0003697868406877986, 'samples': 10072512, 'steps': 52460, 'loss/train': 0.7102416157722473} -08/30/2021 22:41:11 - INFO - __main__ - Step 52462: {'lr': 0.00036978218274835993, 'samples': 10072704, 'steps': 52461, 'loss/train': 1.5965269804000854} -08/30/2021 22:41:11 - INFO - __main__ - Step 52463: {'lr': 0.0003697775247549492, 'samples': 10072896, 'steps': 52462, 'loss/train': 1.4233697652816772} -08/30/2021 22:41:11 - INFO - __main__ - Step 52464: {'lr': 0.00036977286670756854, 'samples': 10073088, 'steps': 52463, 'loss/train': 0.836117148399353} -08/30/2021 22:41:12 - INFO - __main__ - Step 52465: {'lr': 0.00036976820860622005, 'samples': 10073280, 'steps': 52464, 'loss/train': 1.2603391408920288} -08/30/2021 22:41:13 - INFO - __main__ - Step 52466: {'lr': 0.00036976355045090594, 'samples': 10073472, 'steps': 52465, 'loss/train': 0.262428879737854} -08/30/2021 22:41:14 - INFO - __main__ - Step 52467: {'lr': 0.00036975889224162816, 'samples': 10073664, 'steps': 52466, 'loss/train': 1.2860455513000488} -08/30/2021 22:41:14 - INFO - __main__ - Step 52468: {'lr': 0.000369754233978389, 'samples': 10073856, 'steps': 52467, 'loss/train': 1.350841760635376} -08/30/2021 22:41:14 - INFO - __main__ - Step 52469: {'lr': 0.00036974957566119027, 'samples': 10074048, 'steps': 52468, 'loss/train': 1.792843222618103} -08/30/2021 22:41:15 - INFO - __main__ - Step 52470: {'lr': 0.00036974491729003427, 'samples': 10074240, 'steps': 52469, 'loss/train': 1.0194296836853027} -08/30/2021 22:41:15 - INFO - __main__ - Step 52471: {'lr': 0.00036974025886492306, 'samples': 10074432, 'steps': 52470, 'loss/train': 1.2405890226364136} -08/30/2021 22:41:16 - INFO - __main__ - Step 52472: {'lr': 0.00036973560038585876, 'samples': 10074624, 'steps': 52471, 'loss/train': 0.6181724071502686} -08/30/2021 22:41:17 - INFO - __main__ - Step 52473: {'lr': 0.0003697309418528435, 'samples': 10074816, 'steps': 52472, 'loss/train': 1.273592472076416} -08/30/2021 22:41:17 - INFO - __main__ - Step 52474: {'lr': 0.0003697262832658792, 'samples': 10075008, 'steps': 52473, 'loss/train': 1.6522210836410522} -08/30/2021 22:41:18 - INFO - __main__ - Step 52475: {'lr': 0.00036972162462496817, 'samples': 10075200, 'steps': 52474, 'loss/train': 1.5360100269317627} -08/30/2021 22:41:18 - INFO - __main__ - Step 52476: {'lr': 0.0003697169659301124, 'samples': 10075392, 'steps': 52475, 'loss/train': 1.3837968111038208} -08/30/2021 22:41:20 - INFO - __main__ - Step 52477: {'lr': 0.000369712307181314, 'samples': 10075584, 'steps': 52476, 'loss/train': 0.6994937658309937} -08/30/2021 22:41:20 - INFO - __main__ - Step 52478: {'lr': 0.00036970764837857505, 'samples': 10075776, 'steps': 52477, 'loss/train': 1.1775614023208618} -08/30/2021 22:41:21 - INFO - __main__ - Step 52479: {'lr': 0.0003697029895218978, 'samples': 10075968, 'steps': 52478, 'loss/train': 0.9720891118049622} -08/30/2021 22:41:21 - INFO - __main__ - Step 52480: {'lr': 0.0003696983306112842, 'samples': 10076160, 'steps': 52479, 'loss/train': 1.5918302536010742} -08/30/2021 22:41:21 - INFO - __main__ - Step 52481: {'lr': 0.00036969367164673626, 'samples': 10076352, 'steps': 52480, 'loss/train': 1.1739903688430786} -08/30/2021 22:41:23 - INFO - __main__ - Step 52482: {'lr': 0.0003696890126282563, 'samples': 10076544, 'steps': 52481, 'loss/train': 1.0913363695144653} -08/30/2021 22:41:24 - INFO - __main__ - Step 52483: {'lr': 0.0003696843535558463, 'samples': 10076736, 'steps': 52482, 'loss/train': 1.670129656791687} -08/30/2021 22:41:24 - INFO - __main__ - Step 52484: {'lr': 0.0003696796944295084, 'samples': 10076928, 'steps': 52483, 'loss/train': 1.112436294555664} -08/30/2021 22:41:25 - INFO - __main__ - Step 52485: {'lr': 0.00036967503524924463, 'samples': 10077120, 'steps': 52484, 'loss/train': 1.0224189758300781} -08/30/2021 22:41:25 - INFO - __main__ - Step 52486: {'lr': 0.00036967037601505715, 'samples': 10077312, 'steps': 52485, 'loss/train': 0.052959855645895004} -08/30/2021 22:41:27 - INFO - __main__ - Step 52487: {'lr': 0.000369665716726948, 'samples': 10077504, 'steps': 52486, 'loss/train': 0.562862753868103} -08/30/2021 22:41:27 - INFO - __main__ - Step 52488: {'lr': 0.0003696610573849194, 'samples': 10077696, 'steps': 52487, 'loss/train': 1.8712139129638672} -08/30/2021 22:41:28 - INFO - __main__ - Step 52489: {'lr': 0.0003696563979889733, 'samples': 10077888, 'steps': 52488, 'loss/train': 1.3993226289749146} -08/30/2021 22:41:28 - INFO - __main__ - Step 52490: {'lr': 0.00036965173853911195, 'samples': 10078080, 'steps': 52489, 'loss/train': 1.3976120948791504} -08/30/2021 22:41:28 - INFO - __main__ - Step 52491: {'lr': 0.0003696470790353373, 'samples': 10078272, 'steps': 52490, 'loss/train': 0.6348013281822205} -08/30/2021 22:41:29 - INFO - __main__ - Step 52492: {'lr': 0.0003696424194776516, 'samples': 10078464, 'steps': 52491, 'loss/train': 0.23405209183692932} -08/30/2021 22:41:30 - INFO - __main__ - Step 52493: {'lr': 0.0003696377598660569, 'samples': 10078656, 'steps': 52492, 'loss/train': 1.1613837480545044} -08/30/2021 22:41:31 - INFO - __main__ - Step 52494: {'lr': 0.0003696331002005551, 'samples': 10078848, 'steps': 52493, 'loss/train': 1.0103240013122559} -08/30/2021 22:41:31 - INFO - __main__ - Step 52495: {'lr': 0.00036962844048114856, 'samples': 10079040, 'steps': 52494, 'loss/train': 0.973655104637146} -08/30/2021 22:41:31 - INFO - __main__ - Step 52496: {'lr': 0.0003696237807078393, 'samples': 10079232, 'steps': 52495, 'loss/train': 1.0134670734405518} -08/30/2021 22:41:32 - INFO - __main__ - Step 52497: {'lr': 0.00036961912088062947, 'samples': 10079424, 'steps': 52496, 'loss/train': 1.5024104118347168} -08/30/2021 22:41:33 - INFO - __main__ - Step 52498: {'lr': 0.00036961446099952104, 'samples': 10079616, 'steps': 52497, 'loss/train': 0.07937592267990112} -08/30/2021 22:41:34 - INFO - __main__ - Step 52499: {'lr': 0.0003696098010645162, 'samples': 10079808, 'steps': 52498, 'loss/train': 1.2193210124969482} -08/30/2021 22:41:34 - INFO - __main__ - Step 52500: {'lr': 0.00036960514107561707, 'samples': 10080000, 'steps': 52499, 'loss/train': 1.5616309642791748} -08/30/2021 22:41:34 - INFO - __main__ - Step 52501: {'lr': 0.00036960048103282564, 'samples': 10080192, 'steps': 52500, 'loss/train': 1.1157374382019043} -08/30/2021 22:41:35 - INFO - __main__ - Step 52502: {'lr': 0.00036959582093614406, 'samples': 10080384, 'steps': 52501, 'loss/train': 0.07532504945993423} -08/30/2021 22:41:37 - INFO - __main__ - Step 52503: {'lr': 0.00036959116078557453, 'samples': 10080576, 'steps': 52502, 'loss/train': 1.396376132965088} -08/30/2021 22:41:37 - INFO - __main__ - Step 52504: {'lr': 0.000369586500581119, 'samples': 10080768, 'steps': 52503, 'loss/train': 1.2233335971832275} -08/30/2021 22:41:37 - INFO - __main__ - Step 52505: {'lr': 0.00036958184032277974, 'samples': 10080960, 'steps': 52504, 'loss/train': 3.483546018600464} -08/30/2021 22:41:38 - INFO - __main__ - Step 52506: {'lr': 0.0003695771800105586, 'samples': 10081152, 'steps': 52505, 'loss/train': 1.3218752145767212} -08/30/2021 22:41:38 - INFO - __main__ - Step 52507: {'lr': 0.0003695725196444579, 'samples': 10081344, 'steps': 52506, 'loss/train': 1.6886030435562134} -08/30/2021 22:41:39 - INFO - __main__ - Step 52508: {'lr': 0.0003695678592244797, 'samples': 10081536, 'steps': 52507, 'loss/train': 1.9253101348876953} -08/30/2021 22:41:40 - INFO - __main__ - Step 52509: {'lr': 0.00036956319875062604, 'samples': 10081728, 'steps': 52508, 'loss/train': 1.2918356657028198} -08/30/2021 22:41:40 - INFO - __main__ - Step 52510: {'lr': 0.0003695585382228991, 'samples': 10081920, 'steps': 52509, 'loss/train': 1.4245799779891968} -08/30/2021 22:41:40 - INFO - __main__ - Step 52511: {'lr': 0.0003695538776413009, 'samples': 10082112, 'steps': 52510, 'loss/train': 0.7877821326255798} -08/30/2021 22:41:41 - INFO - __main__ - Step 52512: {'lr': 0.0003695492170058335, 'samples': 10082304, 'steps': 52511, 'loss/train': 1.5490591526031494} -08/30/2021 22:41:41 - INFO - __main__ - Step 52513: {'lr': 0.0003695445563164991, 'samples': 10082496, 'steps': 52512, 'loss/train': 1.1672179698944092} -08/30/2021 22:41:43 - INFO - __main__ - Step 52514: {'lr': 0.00036953989557329976, 'samples': 10082688, 'steps': 52513, 'loss/train': 0.7706567049026489} -08/30/2021 22:41:43 - INFO - __main__ - Step 52515: {'lr': 0.0003695352347762376, 'samples': 10082880, 'steps': 52514, 'loss/train': 0.786012589931488} -08/30/2021 22:41:44 - INFO - __main__ - Step 52516: {'lr': 0.00036953057392531474, 'samples': 10083072, 'steps': 52515, 'loss/train': 0.6681938767433167} -08/30/2021 22:41:44 - INFO - __main__ - Step 52517: {'lr': 0.00036952591302053325, 'samples': 10083264, 'steps': 52516, 'loss/train': 1.8670202493667603} -08/30/2021 22:41:44 - INFO - __main__ - Step 52518: {'lr': 0.00036952125206189516, 'samples': 10083456, 'steps': 52517, 'loss/train': 1.0553967952728271} -08/30/2021 22:41:46 - INFO - __main__ - Step 52519: {'lr': 0.00036951659104940274, 'samples': 10083648, 'steps': 52518, 'loss/train': 1.5796645879745483} -08/30/2021 22:41:46 - INFO - __main__ - Step 52520: {'lr': 0.0003695119299830579, 'samples': 10083840, 'steps': 52519, 'loss/train': 0.9981122016906738} -08/30/2021 22:41:47 - INFO - __main__ - Step 52521: {'lr': 0.0003695072688628628, 'samples': 10084032, 'steps': 52520, 'loss/train': 1.8536217212677002} -08/30/2021 22:41:47 - INFO - __main__ - Step 52522: {'lr': 0.00036950260768881963, 'samples': 10084224, 'steps': 52521, 'loss/train': 1.5423587560653687} -08/30/2021 22:41:47 - INFO - __main__ - Step 52523: {'lr': 0.00036949794646093045, 'samples': 10084416, 'steps': 52522, 'loss/train': 1.0003702640533447} -08/30/2021 22:41:49 - INFO - __main__ - Step 52524: {'lr': 0.00036949328517919735, 'samples': 10084608, 'steps': 52523, 'loss/train': 0.9841527938842773} -08/30/2021 22:41:49 - INFO - __main__ - Step 52525: {'lr': 0.0003694886238436224, 'samples': 10084800, 'steps': 52524, 'loss/train': 1.6726547479629517} -08/30/2021 22:41:50 - INFO - __main__ - Step 52526: {'lr': 0.0003694839624542077, 'samples': 10084992, 'steps': 52525, 'loss/train': 1.4632002115249634} -08/30/2021 22:41:50 - INFO - __main__ - Step 52527: {'lr': 0.0003694793010109553, 'samples': 10085184, 'steps': 52526, 'loss/train': 1.161631464958191} -08/30/2021 22:41:50 - INFO - __main__ - Step 52528: {'lr': 0.00036947463951386743, 'samples': 10085376, 'steps': 52527, 'loss/train': 1.6286373138427734} -08/30/2021 22:41:52 - INFO - __main__ - Step 52529: {'lr': 0.0003694699779629461, 'samples': 10085568, 'steps': 52528, 'loss/train': 1.0300238132476807} -08/30/2021 22:41:52 - INFO - __main__ - Step 52530: {'lr': 0.0003694653163581936, 'samples': 10085760, 'steps': 52529, 'loss/train': 1.3218671083450317} -08/30/2021 22:41:52 - INFO - __main__ - Step 52531: {'lr': 0.0003694606546996117, 'samples': 10085952, 'steps': 52530, 'loss/train': 1.1095834970474243} -08/30/2021 22:41:53 - INFO - __main__ - Step 52532: {'lr': 0.0003694559929872028, 'samples': 10086144, 'steps': 52531, 'loss/train': 1.039170265197754} -08/30/2021 22:41:53 - INFO - __main__ - Step 52533: {'lr': 0.00036945133122096875, 'samples': 10086336, 'steps': 52532, 'loss/train': 1.1130396127700806} -08/30/2021 22:41:56 - INFO - __main__ - Step 52534: {'lr': 0.0003694466694009118, 'samples': 10086528, 'steps': 52533, 'loss/train': 1.0446165800094604} -08/30/2021 22:41:56 - INFO - __main__ - Step 52535: {'lr': 0.00036944200752703405, 'samples': 10086720, 'steps': 52534, 'loss/train': 0.8081503510475159} -08/30/2021 22:41:56 - INFO - __main__ - Step 52536: {'lr': 0.0003694373455993376, 'samples': 10086912, 'steps': 52535, 'loss/train': 1.6280200481414795} -08/30/2021 22:41:57 - INFO - __main__ - Step 52537: {'lr': 0.0003694326836178245, 'samples': 10087104, 'steps': 52536, 'loss/train': 1.4756191968917847} -08/30/2021 22:41:57 - INFO - __main__ - Step 52538: {'lr': 0.0003694280215824969, 'samples': 10087296, 'steps': 52537, 'loss/train': 1.6719201803207397} -08/30/2021 22:41:59 - INFO - __main__ - Step 52539: {'lr': 0.0003694233594933568, 'samples': 10087488, 'steps': 52538, 'loss/train': 0.06519880890846252} -08/30/2021 22:41:59 - INFO - __main__ - Step 52540: {'lr': 0.00036941869735040647, 'samples': 10087680, 'steps': 52539, 'loss/train': 1.1394243240356445} -08/30/2021 22:41:59 - INFO - __main__ - Step 52541: {'lr': 0.0003694140351536479, 'samples': 10087872, 'steps': 52540, 'loss/train': 0.9822244048118591} -08/30/2021 22:42:00 - INFO - __main__ - Step 52542: {'lr': 0.00036940937290308315, 'samples': 10088064, 'steps': 52541, 'loss/train': 0.8806066513061523} -08/30/2021 22:42:00 - INFO - __main__ - Step 52543: {'lr': 0.0003694047105987144, 'samples': 10088256, 'steps': 52542, 'loss/train': 0.9883493185043335} -08/30/2021 22:42:01 - INFO - __main__ - Step 52544: {'lr': 0.00036940004824054376, 'samples': 10088448, 'steps': 52543, 'loss/train': 1.0795314311981201} -08/30/2021 22:42:02 - INFO - __main__ - Step 52545: {'lr': 0.0003693953858285733, 'samples': 10088640, 'steps': 52544, 'loss/train': 1.1583116054534912} -08/30/2021 22:42:02 - INFO - __main__ - Step 52546: {'lr': 0.0003693907233628051, 'samples': 10088832, 'steps': 52545, 'loss/train': 1.451675534248352} -08/30/2021 22:42:03 - INFO - __main__ - Step 52547: {'lr': 0.00036938606084324123, 'samples': 10089024, 'steps': 52546, 'loss/train': 1.2852673530578613} -08/30/2021 22:42:03 - INFO - __main__ - Step 52548: {'lr': 0.00036938139826988393, 'samples': 10089216, 'steps': 52547, 'loss/train': 0.8709478378295898} -08/30/2021 22:42:03 - INFO - __main__ - Step 52549: {'lr': 0.0003693767356427352, 'samples': 10089408, 'steps': 52548, 'loss/train': 2.075584650039673} -08/30/2021 22:42:05 - INFO - __main__ - Step 52550: {'lr': 0.00036937207296179717, 'samples': 10089600, 'steps': 52549, 'loss/train': 1.4703457355499268} -08/30/2021 22:42:06 - INFO - __main__ - Step 52551: {'lr': 0.0003693674102270719, 'samples': 10089792, 'steps': 52550, 'loss/train': 4.392197608947754} -08/30/2021 22:42:06 - INFO - __main__ - Step 52552: {'lr': 0.0003693627474385615, 'samples': 10089984, 'steps': 52551, 'loss/train': 1.2339626550674438} -08/30/2021 22:42:06 - INFO - __main__ - Step 52553: {'lr': 0.00036935808459626806, 'samples': 10090176, 'steps': 52552, 'loss/train': 0.08571885526180267} -08/30/2021 22:42:07 - INFO - __main__ - Step 52554: {'lr': 0.00036935342170019375, 'samples': 10090368, 'steps': 52553, 'loss/train': 0.11021265387535095} -08/30/2021 22:42:07 - INFO - __main__ - Step 52555: {'lr': 0.00036934875875034063, 'samples': 10090560, 'steps': 52554, 'loss/train': 0.6586523652076721} -08/30/2021 22:42:09 - INFO - __main__ - Step 52556: {'lr': 0.0003693440957467108, 'samples': 10090752, 'steps': 52555, 'loss/train': 1.1877292394638062} -08/30/2021 22:42:09 - INFO - __main__ - Step 52557: {'lr': 0.00036933943268930636, 'samples': 10090944, 'steps': 52556, 'loss/train': 1.6580500602722168} -08/30/2021 22:42:09 - INFO - __main__ - Step 52558: {'lr': 0.00036933476957812944, 'samples': 10091136, 'steps': 52557, 'loss/train': 1.4758145809173584} -08/30/2021 22:42:10 - INFO - __main__ - Step 52559: {'lr': 0.0003693301064131821, 'samples': 10091328, 'steps': 52558, 'loss/train': 1.507752537727356} -08/30/2021 22:42:10 - INFO - __main__ - Step 52560: {'lr': 0.0003693254431944664, 'samples': 10091520, 'steps': 52559, 'loss/train': 1.9612290859222412} -08/30/2021 22:42:10 - INFO - __main__ - Step 52561: {'lr': 0.00036932077992198455, 'samples': 10091712, 'steps': 52560, 'loss/train': 0.7714027762413025} -08/30/2021 22:42:12 - INFO - __main__ - Step 52562: {'lr': 0.0003693161165957386, 'samples': 10091904, 'steps': 52561, 'loss/train': 0.5221697688102722} -08/30/2021 22:42:12 - INFO - __main__ - Step 52563: {'lr': 0.0003693114532157306, 'samples': 10092096, 'steps': 52562, 'loss/train': 1.4347823858261108} -08/30/2021 22:42:13 - INFO - __main__ - Step 52564: {'lr': 0.00036930678978196283, 'samples': 10092288, 'steps': 52563, 'loss/train': 1.3313177824020386} -08/30/2021 22:42:13 - INFO - __main__ - Step 52565: {'lr': 0.00036930212629443716, 'samples': 10092480, 'steps': 52564, 'loss/train': 1.804288625717163} -08/30/2021 22:42:13 - INFO - __main__ - Step 52566: {'lr': 0.00036929746275315577, 'samples': 10092672, 'steps': 52565, 'loss/train': 1.411015510559082} -08/30/2021 22:42:15 - INFO - __main__ - Step 52567: {'lr': 0.0003692927991581208, 'samples': 10092864, 'steps': 52566, 'loss/train': 1.4452924728393555} -08/30/2021 22:42:15 - INFO - __main__ - Step 52568: {'lr': 0.0003692881355093344, 'samples': 10093056, 'steps': 52567, 'loss/train': 1.1412122249603271} -08/30/2021 22:42:16 - INFO - __main__ - Step 52569: {'lr': 0.00036928347180679847, 'samples': 10093248, 'steps': 52568, 'loss/train': 1.6784499883651733} -08/30/2021 22:42:16 - INFO - __main__ - Step 52570: {'lr': 0.0003692788080505154, 'samples': 10093440, 'steps': 52569, 'loss/train': 1.5619900226593018} -08/30/2021 22:42:16 - INFO - __main__ - Step 52571: {'lr': 0.0003692741442404871, 'samples': 10093632, 'steps': 52570, 'loss/train': 1.658601999282837} -08/30/2021 22:42:18 - INFO - __main__ - Step 52572: {'lr': 0.0003692694803767157, 'samples': 10093824, 'steps': 52571, 'loss/train': 1.1120797395706177} -08/30/2021 22:42:19 - INFO - __main__ - Step 52573: {'lr': 0.0003692648164592033, 'samples': 10094016, 'steps': 52572, 'loss/train': 1.9891489744186401} -08/30/2021 22:42:19 - INFO - __main__ - Step 52574: {'lr': 0.00036926015248795195, 'samples': 10094208, 'steps': 52573, 'loss/train': 1.211263656616211} -08/30/2021 22:42:19 - INFO - __main__ - Step 52575: {'lr': 0.0003692554884629639, 'samples': 10094400, 'steps': 52574, 'loss/train': 1.5121631622314453} -08/30/2021 22:42:20 - INFO - __main__ - Step 52576: {'lr': 0.00036925082438424116, 'samples': 10094592, 'steps': 52575, 'loss/train': 0.8200514912605286} -08/30/2021 22:42:21 - INFO - __main__ - Step 52577: {'lr': 0.00036924616025178585, 'samples': 10094784, 'steps': 52576, 'loss/train': 1.1563302278518677} -08/30/2021 22:42:22 - INFO - __main__ - Step 52578: {'lr': 0.0003692414960656, 'samples': 10094976, 'steps': 52577, 'loss/train': 1.3313965797424316} -08/30/2021 22:42:22 - INFO - __main__ - Step 52579: {'lr': 0.00036923683182568586, 'samples': 10095168, 'steps': 52578, 'loss/train': 1.2651478052139282} -08/30/2021 22:42:22 - INFO - __main__ - Step 52580: {'lr': 0.00036923216753204536, 'samples': 10095360, 'steps': 52579, 'loss/train': 1.4931687116622925} -08/30/2021 22:42:23 - INFO - __main__ - Step 52581: {'lr': 0.00036922750318468074, 'samples': 10095552, 'steps': 52580, 'loss/train': 1.0046278238296509} -08/30/2021 22:42:24 - INFO - __main__ - Step 52582: {'lr': 0.00036922283878359396, 'samples': 10095744, 'steps': 52581, 'loss/train': 0.8828812837600708} -08/30/2021 22:42:25 - INFO - __main__ - Step 52583: {'lr': 0.0003692181743287873, 'samples': 10095936, 'steps': 52582, 'loss/train': 0.6817058324813843} -08/30/2021 22:42:25 - INFO - __main__ - Step 52584: {'lr': 0.0003692135098202628, 'samples': 10096128, 'steps': 52583, 'loss/train': 1.639438271522522} -08/30/2021 22:42:25 - INFO - __main__ - Step 52585: {'lr': 0.0003692088452580225, 'samples': 10096320, 'steps': 52584, 'loss/train': 1.2934675216674805} -08/30/2021 22:42:26 - INFO - __main__ - Step 52586: {'lr': 0.00036920418064206845, 'samples': 10096512, 'steps': 52585, 'loss/train': 1.506569266319275} -08/30/2021 22:42:28 - INFO - __main__ - Step 52587: {'lr': 0.0003691995159724029, 'samples': 10096704, 'steps': 52586, 'loss/train': 1.4008046388626099} -08/30/2021 22:42:28 - INFO - __main__ - Step 52588: {'lr': 0.00036919485124902785, 'samples': 10096896, 'steps': 52587, 'loss/train': 0.9199028015136719} -08/30/2021 22:42:28 - INFO - __main__ - Step 52589: {'lr': 0.00036919018647194545, 'samples': 10097088, 'steps': 52588, 'loss/train': 1.547400712966919} -08/30/2021 22:42:29 - INFO - __main__ - Step 52590: {'lr': 0.0003691855216411578, 'samples': 10097280, 'steps': 52589, 'loss/train': 1.3237316608428955} -08/30/2021 22:42:29 - INFO - __main__ - Step 52591: {'lr': 0.00036918085675666706, 'samples': 10097472, 'steps': 52590, 'loss/train': 0.9180843234062195} -08/30/2021 22:42:30 - INFO - __main__ - Step 52592: {'lr': 0.00036917619181847525, 'samples': 10097664, 'steps': 52591, 'loss/train': 1.5750412940979004} -08/30/2021 22:42:31 - INFO - __main__ - Step 52593: {'lr': 0.00036917152682658437, 'samples': 10097856, 'steps': 52592, 'loss/train': 0.6543641090393066} -08/30/2021 22:42:32 - INFO - __main__ - Step 52594: {'lr': 0.0003691668617809968, 'samples': 10098048, 'steps': 52593, 'loss/train': 1.0030410289764404} -08/30/2021 22:42:32 - INFO - __main__ - Step 52595: {'lr': 0.00036916219668171435, 'samples': 10098240, 'steps': 52594, 'loss/train': 0.15339718759059906} -08/30/2021 22:42:33 - INFO - __main__ - Step 52596: {'lr': 0.0003691575315287393, 'samples': 10098432, 'steps': 52595, 'loss/train': 1.2302451133728027} -08/30/2021 22:42:33 - INFO - __main__ - Step 52597: {'lr': 0.00036915286632207374, 'samples': 10098624, 'steps': 52596, 'loss/train': 1.6820393800735474} -08/30/2021 22:42:34 - INFO - __main__ - Step 52598: {'lr': 0.0003691482010617197, 'samples': 10098816, 'steps': 52597, 'loss/train': 0.985542893409729} -08/30/2021 22:42:35 - INFO - __main__ - Step 52599: {'lr': 0.00036914353574767935, 'samples': 10099008, 'steps': 52598, 'loss/train': 1.9780583381652832} -08/30/2021 22:42:35 - INFO - __main__ - Step 52600: {'lr': 0.0003691388703799547, 'samples': 10099200, 'steps': 52599, 'loss/train': 1.3220382928848267} -08/30/2021 22:42:36 - INFO - __main__ - Step 52601: {'lr': 0.00036913420495854793, 'samples': 10099392, 'steps': 52600, 'loss/train': 1.5783418416976929} -08/30/2021 22:42:36 - INFO - __main__ - Step 52602: {'lr': 0.00036912953948346115, 'samples': 10099584, 'steps': 52601, 'loss/train': 1.1676360368728638} -08/30/2021 22:42:38 - INFO - __main__ - Step 52603: {'lr': 0.00036912487395469645, 'samples': 10099776, 'steps': 52602, 'loss/train': 1.9210675954818726} -08/30/2021 22:42:38 - INFO - __main__ - Step 52604: {'lr': 0.0003691202083722559, 'samples': 10099968, 'steps': 52603, 'loss/train': 1.2477043867111206} -08/30/2021 22:42:39 - INFO - __main__ - Step 52605: {'lr': 0.0003691155427361416, 'samples': 10100160, 'steps': 52604, 'loss/train': 0.9537261724472046} -08/30/2021 22:42:39 - INFO - __main__ - Step 52606: {'lr': 0.0003691108770463557, 'samples': 10100352, 'steps': 52605, 'loss/train': 1.6194697618484497} -08/30/2021 22:42:39 - INFO - __main__ - Step 52607: {'lr': 0.00036910621130290027, 'samples': 10100544, 'steps': 52606, 'loss/train': 1.5384349822998047} -08/30/2021 22:42:41 - INFO - __main__ - Step 52608: {'lr': 0.0003691015455057775, 'samples': 10100736, 'steps': 52607, 'loss/train': 0.14303551614284515} -08/30/2021 22:42:42 - INFO - __main__ - Step 52609: {'lr': 0.0003690968796549893, 'samples': 10100928, 'steps': 52608, 'loss/train': 1.1941648721694946} -08/30/2021 22:42:42 - INFO - __main__ - Step 52610: {'lr': 0.0003690922137505379, 'samples': 10101120, 'steps': 52609, 'loss/train': 1.174319863319397} -08/30/2021 22:42:42 - INFO - __main__ - Step 52611: {'lr': 0.00036908754779242545, 'samples': 10101312, 'steps': 52610, 'loss/train': 0.8619337677955627} -08/30/2021 22:42:43 - INFO - __main__ - Step 52612: {'lr': 0.00036908288178065393, 'samples': 10101504, 'steps': 52611, 'loss/train': 1.4088321924209595} -08/30/2021 22:42:43 - INFO - __main__ - Step 52613: {'lr': 0.00036907821571522553, 'samples': 10101696, 'steps': 52612, 'loss/train': 1.6077200174331665} -08/30/2021 22:42:45 - INFO - __main__ - Step 52614: {'lr': 0.0003690735495961423, 'samples': 10101888, 'steps': 52613, 'loss/train': 1.0514719486236572} -08/30/2021 22:42:45 - INFO - __main__ - Step 52615: {'lr': 0.0003690688834234064, 'samples': 10102080, 'steps': 52614, 'loss/train': 1.4516382217407227} -08/30/2021 22:42:45 - INFO - __main__ - Step 52616: {'lr': 0.0003690642171970198, 'samples': 10102272, 'steps': 52615, 'loss/train': 1.3071733713150024} -08/30/2021 22:42:46 - INFO - __main__ - Step 52617: {'lr': 0.0003690595509169848, 'samples': 10102464, 'steps': 52616, 'loss/train': 1.0561918020248413} -08/30/2021 22:42:46 - INFO - __main__ - Step 52618: {'lr': 0.00036905488458330337, 'samples': 10102656, 'steps': 52617, 'loss/train': 0.8344602584838867} -08/30/2021 22:42:48 - INFO - __main__ - Step 52619: {'lr': 0.00036905021819597767, 'samples': 10102848, 'steps': 52618, 'loss/train': 1.8325072526931763} -08/30/2021 22:42:48 - INFO - __main__ - Step 52620: {'lr': 0.00036904555175500977, 'samples': 10103040, 'steps': 52619, 'loss/train': 1.5285195112228394} -08/30/2021 22:42:49 - INFO - __main__ - Step 52621: {'lr': 0.00036904088526040177, 'samples': 10103232, 'steps': 52620, 'loss/train': 0.07646815478801727} -08/30/2021 22:42:49 - INFO - __main__ - Step 52622: {'lr': 0.00036903621871215575, 'samples': 10103424, 'steps': 52621, 'loss/train': 1.5410460233688354} -08/30/2021 22:42:49 - INFO - __main__ - Step 52623: {'lr': 0.0003690315521102739, 'samples': 10103616, 'steps': 52622, 'loss/train': 1.5301294326782227} -08/30/2021 22:42:51 - INFO - __main__ - Step 52624: {'lr': 0.0003690268854547583, 'samples': 10103808, 'steps': 52623, 'loss/train': 0.24799980223178864} -08/30/2021 22:42:51 - INFO - __main__ - Step 52625: {'lr': 0.00036902221874561097, 'samples': 10104000, 'steps': 52624, 'loss/train': 1.080647587776184} -08/30/2021 22:42:52 - INFO - __main__ - Step 52626: {'lr': 0.00036901755198283403, 'samples': 10104192, 'steps': 52625, 'loss/train': 2.303861379623413} -08/30/2021 22:42:52 - INFO - __main__ - Step 52627: {'lr': 0.0003690128851664297, 'samples': 10104384, 'steps': 52626, 'loss/train': 0.7482075691223145} -08/30/2021 22:42:52 - INFO - __main__ - Step 52628: {'lr': 0.0003690082182964, 'samples': 10104576, 'steps': 52627, 'loss/train': 1.6616662740707397} -08/30/2021 22:42:54 - INFO - __main__ - Step 52629: {'lr': 0.00036900355137274696, 'samples': 10104768, 'steps': 52628, 'loss/train': 1.4044233560562134} -08/30/2021 22:42:54 - INFO - __main__ - Step 52630: {'lr': 0.00036899888439547276, 'samples': 10104960, 'steps': 52629, 'loss/train': 1.37495756149292} -08/30/2021 22:42:55 - INFO - __main__ - Step 52631: {'lr': 0.00036899421736457955, 'samples': 10105152, 'steps': 52630, 'loss/train': 1.475831151008606} -08/30/2021 22:42:55 - INFO - __main__ - Step 52632: {'lr': 0.00036898955028006936, 'samples': 10105344, 'steps': 52631, 'loss/train': 1.1597403287887573} -08/30/2021 22:42:55 - INFO - __main__ - Step 52633: {'lr': 0.0003689848831419443, 'samples': 10105536, 'steps': 52632, 'loss/train': 0.05094965919852257} -08/30/2021 22:42:57 - INFO - __main__ - Step 52634: {'lr': 0.0003689802159502065, 'samples': 10105728, 'steps': 52633, 'loss/train': 1.598905086517334} -08/30/2021 22:42:58 - INFO - __main__ - Step 52635: {'lr': 0.00036897554870485804, 'samples': 10105920, 'steps': 52634, 'loss/train': 1.7844258546829224} -08/30/2021 22:42:58 - INFO - __main__ - Step 52636: {'lr': 0.000368970881405901, 'samples': 10106112, 'steps': 52635, 'loss/train': 1.5041440725326538} -08/30/2021 22:42:58 - INFO - __main__ - Step 52637: {'lr': 0.0003689662140533376, 'samples': 10106304, 'steps': 52636, 'loss/train': 1.1380068063735962} -08/30/2021 22:42:59 - INFO - __main__ - Step 52638: {'lr': 0.00036896154664716987, 'samples': 10106496, 'steps': 52637, 'loss/train': 1.655505895614624} -08/30/2021 22:43:01 - INFO - __main__ - Step 52639: {'lr': 0.00036895687918739984, 'samples': 10106688, 'steps': 52638, 'loss/train': 1.340161919593811} -08/30/2021 22:43:01 - INFO - __main__ - Step 52640: {'lr': 0.0003689522116740296, 'samples': 10106880, 'steps': 52639, 'loss/train': 1.5741502046585083} -08/30/2021 22:43:02 - INFO - __main__ - Step 52641: {'lr': 0.0003689475441070615, 'samples': 10107072, 'steps': 52640, 'loss/train': 0.921815037727356} -08/30/2021 22:43:02 - INFO - __main__ - Step 52642: {'lr': 0.0003689428764864974, 'samples': 10107264, 'steps': 52641, 'loss/train': 1.598400354385376} -08/30/2021 22:43:02 - INFO - __main__ - Step 52643: {'lr': 0.0003689382088123394, 'samples': 10107456, 'steps': 52642, 'loss/train': 1.4491839408874512} -08/30/2021 22:43:03 - INFO - __main__ - Step 52644: {'lr': 0.0003689335410845898, 'samples': 10107648, 'steps': 52643, 'loss/train': 0.5983690023422241} -08/30/2021 22:43:05 - INFO - __main__ - Step 52645: {'lr': 0.00036892887330325054, 'samples': 10107840, 'steps': 52644, 'loss/train': 1.2478861808776855} -08/30/2021 22:43:05 - INFO - __main__ - Step 52646: {'lr': 0.00036892420546832375, 'samples': 10108032, 'steps': 52645, 'loss/train': 1.0929803848266602} -08/30/2021 22:43:05 - INFO - __main__ - Step 52647: {'lr': 0.0003689195375798115, 'samples': 10108224, 'steps': 52646, 'loss/train': 2.4148240089416504} -08/30/2021 22:43:06 - INFO - __main__ - Step 52648: {'lr': 0.00036891486963771603, 'samples': 10108416, 'steps': 52647, 'loss/train': 1.5363584756851196} -08/30/2021 22:43:06 - INFO - __main__ - Step 52649: {'lr': 0.00036891020164203924, 'samples': 10108608, 'steps': 52648, 'loss/train': 1.0536298751831055} -08/30/2021 22:43:07 - INFO - __main__ - Step 52650: {'lr': 0.00036890553359278345, 'samples': 10108800, 'steps': 52649, 'loss/train': 0.6469190716743469} -08/30/2021 22:43:08 - INFO - __main__ - Step 52651: {'lr': 0.0003689008654899507, 'samples': 10108992, 'steps': 52650, 'loss/train': 5.747594356536865} -08/30/2021 22:43:08 - INFO - __main__ - Step 52652: {'lr': 0.00036889619733354297, 'samples': 10109184, 'steps': 52651, 'loss/train': 1.6629053354263306} -08/30/2021 22:43:09 - INFO - __main__ - Step 52653: {'lr': 0.0003688915291235625, 'samples': 10109376, 'steps': 52652, 'loss/train': 1.4267748594284058} -08/30/2021 22:43:09 - INFO - __main__ - Step 52654: {'lr': 0.0003688868608600113, 'samples': 10109568, 'steps': 52653, 'loss/train': 0.9135183095932007} -08/30/2021 22:43:09 - INFO - __main__ - Step 52655: {'lr': 0.00036888219254289147, 'samples': 10109760, 'steps': 52654, 'loss/train': 1.3949719667434692} -08/30/2021 22:43:11 - INFO - __main__ - Step 52656: {'lr': 0.0003688775241722052, 'samples': 10109952, 'steps': 52655, 'loss/train': 0.8932076096534729} -08/30/2021 22:43:11 - INFO - __main__ - Step 52657: {'lr': 0.0003688728557479546, 'samples': 10110144, 'steps': 52656, 'loss/train': 1.6523542404174805} -08/30/2021 22:43:12 - INFO - __main__ - Step 52658: {'lr': 0.00036886818727014173, 'samples': 10110336, 'steps': 52657, 'loss/train': 1.1122334003448486} -08/30/2021 22:43:12 - INFO - __main__ - Step 52659: {'lr': 0.0003688635187387686, 'samples': 10110528, 'steps': 52658, 'loss/train': 1.2266416549682617} -08/30/2021 22:43:12 - INFO - __main__ - Step 52660: {'lr': 0.0003688588501538375, 'samples': 10110720, 'steps': 52659, 'loss/train': 1.3486294746398926} -08/30/2021 22:43:14 - INFO - __main__ - Step 52661: {'lr': 0.00036885418151535033, 'samples': 10110912, 'steps': 52660, 'loss/train': 0.9828211665153503} -08/30/2021 22:43:15 - INFO - __main__ - Step 52662: {'lr': 0.00036884951282330935, 'samples': 10111104, 'steps': 52661, 'loss/train': 0.13739511370658875} -08/30/2021 22:43:15 - INFO - __main__ - Step 52663: {'lr': 0.00036884484407771664, 'samples': 10111296, 'steps': 52662, 'loss/train': 0.30096691846847534} -08/30/2021 22:43:15 - INFO - __main__ - Step 52664: {'lr': 0.00036884017527857426, 'samples': 10111488, 'steps': 52663, 'loss/train': 0.5852181911468506} -08/30/2021 22:43:16 - INFO - __main__ - Step 52665: {'lr': 0.0003688355064258844, 'samples': 10111680, 'steps': 52664, 'loss/train': 1.3313403129577637} -08/30/2021 22:43:16 - INFO - __main__ - Step 52666: {'lr': 0.00036883083751964896, 'samples': 10111872, 'steps': 52665, 'loss/train': 1.8639763593673706} -08/30/2021 22:43:17 - INFO - __main__ - Step 52667: {'lr': 0.00036882616855987027, 'samples': 10112064, 'steps': 52666, 'loss/train': 0.8944418430328369} -08/30/2021 22:43:18 - INFO - __main__ - Step 52668: {'lr': 0.0003688214995465503, 'samples': 10112256, 'steps': 52667, 'loss/train': 1.2589043378829956} -08/30/2021 22:43:18 - INFO - __main__ - Step 52669: {'lr': 0.00036881683047969115, 'samples': 10112448, 'steps': 52668, 'loss/train': 1.3450703620910645} -08/30/2021 22:43:19 - INFO - __main__ - Step 52670: {'lr': 0.00036881216135929506, 'samples': 10112640, 'steps': 52669, 'loss/train': 1.783084750175476} -08/30/2021 22:43:19 - INFO - __main__ - Step 52671: {'lr': 0.0003688074921853641, 'samples': 10112832, 'steps': 52670, 'loss/train': 0.8529743552207947} -08/30/2021 22:43:20 - INFO - __main__ - Step 52672: {'lr': 0.0003688028229579002, 'samples': 10113024, 'steps': 52671, 'loss/train': 1.4379161596298218} -08/30/2021 22:43:21 - INFO - __main__ - Step 52673: {'lr': 0.0003687981536769056, 'samples': 10113216, 'steps': 52672, 'loss/train': 1.2739863395690918} -08/30/2021 22:43:21 - INFO - __main__ - Step 52674: {'lr': 0.00036879348434238235, 'samples': 10113408, 'steps': 52673, 'loss/train': 0.9519485831260681} -08/30/2021 22:43:22 - INFO - __main__ - Step 52675: {'lr': 0.00036878881495433264, 'samples': 10113600, 'steps': 52674, 'loss/train': 1.9314029216766357} -08/30/2021 22:43:22 - INFO - __main__ - Step 52676: {'lr': 0.0003687841455127585, 'samples': 10113792, 'steps': 52675, 'loss/train': 1.0641555786132812} -08/30/2021 22:43:23 - INFO - __main__ - Step 52677: {'lr': 0.0003687794760176621, 'samples': 10113984, 'steps': 52676, 'loss/train': 1.4101535081863403} -08/30/2021 22:43:24 - INFO - __main__ - Step 52678: {'lr': 0.0003687748064690455, 'samples': 10114176, 'steps': 52677, 'loss/train': 0.6032649278640747} -08/30/2021 22:43:24 - INFO - __main__ - Step 52679: {'lr': 0.0003687701368669108, 'samples': 10114368, 'steps': 52678, 'loss/train': 0.7004330158233643} -08/30/2021 22:43:25 - INFO - __main__ - Step 52680: {'lr': 0.0003687654672112601, 'samples': 10114560, 'steps': 52679, 'loss/train': 0.7790058255195618} -08/30/2021 22:43:25 - INFO - __main__ - Step 52681: {'lr': 0.00036876079750209544, 'samples': 10114752, 'steps': 52680, 'loss/train': 1.4016163349151611} -08/30/2021 22:43:25 - INFO - __main__ - Step 52682: {'lr': 0.00036875612773941906, 'samples': 10114944, 'steps': 52681, 'loss/train': 1.2279847860336304} -08/30/2021 22:43:27 - INFO - __main__ - Step 52683: {'lr': 0.00036875145792323303, 'samples': 10115136, 'steps': 52682, 'loss/train': 1.1010525226593018} -08/30/2021 22:43:27 - INFO - __main__ - Step 52684: {'lr': 0.0003687467880535394, 'samples': 10115328, 'steps': 52683, 'loss/train': 0.8829358816146851} -08/30/2021 22:43:28 - INFO - __main__ - Step 52685: {'lr': 0.00036874211813034034, 'samples': 10115520, 'steps': 52684, 'loss/train': 0.8388954401016235} -08/30/2021 22:43:28 - INFO - __main__ - Step 52686: {'lr': 0.00036873744815363785, 'samples': 10115712, 'steps': 52685, 'loss/train': 1.8235160112380981} -08/30/2021 22:43:28 - INFO - __main__ - Step 52687: {'lr': 0.0003687327781234341, 'samples': 10115904, 'steps': 52686, 'loss/train': 1.9645105600357056} -08/30/2021 22:43:30 - INFO - __main__ - Step 52688: {'lr': 0.0003687281080397312, 'samples': 10116096, 'steps': 52687, 'loss/train': 0.9194105267524719} -08/30/2021 22:43:30 - INFO - __main__ - Step 52689: {'lr': 0.0003687234379025313, 'samples': 10116288, 'steps': 52688, 'loss/train': 1.5918776988983154} -08/30/2021 22:43:31 - INFO - __main__ - Step 52690: {'lr': 0.00036871876771183635, 'samples': 10116480, 'steps': 52689, 'loss/train': 1.2447401285171509} -08/30/2021 22:43:31 - INFO - __main__ - Step 52691: {'lr': 0.0003687140974676486, 'samples': 10116672, 'steps': 52690, 'loss/train': 1.4222571849822998} -08/30/2021 22:43:31 - INFO - __main__ - Step 52692: {'lr': 0.0003687094271699702, 'samples': 10116864, 'steps': 52691, 'loss/train': 1.7469810247421265} -08/30/2021 22:43:33 - INFO - __main__ - Step 52693: {'lr': 0.00036870475681880313, 'samples': 10117056, 'steps': 52692, 'loss/train': 0.7537859082221985} -08/30/2021 22:43:33 - INFO - __main__ - Step 52694: {'lr': 0.00036870008641414945, 'samples': 10117248, 'steps': 52693, 'loss/train': 1.3100506067276} -08/30/2021 22:43:34 - INFO - __main__ - Step 52695: {'lr': 0.0003686954159560114, 'samples': 10117440, 'steps': 52694, 'loss/train': 0.9604321718215942} -08/30/2021 22:43:34 - INFO - __main__ - Step 52696: {'lr': 0.00036869074544439097, 'samples': 10117632, 'steps': 52695, 'loss/train': 0.7988246083259583} -08/30/2021 22:43:34 - INFO - __main__ - Step 52697: {'lr': 0.00036868607487929034, 'samples': 10117824, 'steps': 52696, 'loss/train': 1.2913399934768677} -08/30/2021 22:43:37 - INFO - __main__ - Step 52698: {'lr': 0.00036868140426071165, 'samples': 10118016, 'steps': 52697, 'loss/train': 2.644193649291992} -08/30/2021 22:43:37 - INFO - __main__ - Step 52699: {'lr': 0.00036867673358865696, 'samples': 10118208, 'steps': 52698, 'loss/train': 1.2751719951629639} -08/30/2021 22:43:37 - INFO - __main__ - Step 52700: {'lr': 0.0003686720628631283, 'samples': 10118400, 'steps': 52699, 'loss/train': 1.481706976890564} -08/30/2021 22:43:38 - INFO - __main__ - Step 52701: {'lr': 0.0003686673920841278, 'samples': 10118592, 'steps': 52700, 'loss/train': 1.2402658462524414} -08/30/2021 22:43:38 - INFO - __main__ - Step 52702: {'lr': 0.0003686627212516577, 'samples': 10118784, 'steps': 52701, 'loss/train': 1.3068758249282837} -08/30/2021 22:43:40 - INFO - __main__ - Step 52703: {'lr': 0.0003686580503657199, 'samples': 10118976, 'steps': 52702, 'loss/train': 1.7609869241714478} -08/30/2021 22:43:40 - INFO - __main__ - Step 52704: {'lr': 0.00036865337942631674, 'samples': 10119168, 'steps': 52703, 'loss/train': 0.024495387449860573} -08/30/2021 22:43:41 - INFO - __main__ - Step 52705: {'lr': 0.00036864870843345015, 'samples': 10119360, 'steps': 52704, 'loss/train': 0.024711281061172485} -08/30/2021 22:43:41 - INFO - __main__ - Step 52706: {'lr': 0.00036864403738712226, 'samples': 10119552, 'steps': 52705, 'loss/train': 1.6923173666000366} -08/30/2021 22:43:41 - INFO - __main__ - Step 52707: {'lr': 0.00036863936628733524, 'samples': 10119744, 'steps': 52706, 'loss/train': 1.699450135231018} -08/30/2021 22:43:42 - INFO - __main__ - Step 52708: {'lr': 0.0003686346951340911, 'samples': 10119936, 'steps': 52707, 'loss/train': 1.4208524227142334} -08/30/2021 22:43:43 - INFO - __main__ - Step 52709: {'lr': 0.000368630023927392, 'samples': 10120128, 'steps': 52708, 'loss/train': 1.3344050645828247} -08/30/2021 22:43:44 - INFO - __main__ - Step 52710: {'lr': 0.00036862535266724006, 'samples': 10120320, 'steps': 52709, 'loss/train': 1.0172569751739502} -08/30/2021 22:43:44 - INFO - __main__ - Step 52711: {'lr': 0.0003686206813536374, 'samples': 10120512, 'steps': 52710, 'loss/train': 1.1167689561843872} -08/30/2021 22:43:44 - INFO - __main__ - Step 52712: {'lr': 0.0003686160099865861, 'samples': 10120704, 'steps': 52711, 'loss/train': 1.4729176759719849} -08/30/2021 22:43:45 - INFO - __main__ - Step 52713: {'lr': 0.00036861133856608817, 'samples': 10120896, 'steps': 52712, 'loss/train': 1.7260874509811401} -08/30/2021 22:43:46 - INFO - __main__ - Step 52714: {'lr': 0.0003686066670921459, 'samples': 10121088, 'steps': 52713, 'loss/train': 0.37413209676742554} -08/30/2021 22:43:47 - INFO - __main__ - Step 52715: {'lr': 0.00036860199556476125, 'samples': 10121280, 'steps': 52714, 'loss/train': 1.3504774570465088} -08/30/2021 22:43:47 - INFO - __main__ - Step 52716: {'lr': 0.0003685973239839364, 'samples': 10121472, 'steps': 52715, 'loss/train': 1.494686484336853} -08/30/2021 22:43:47 - INFO - __main__ - Step 52717: {'lr': 0.0003685926523496733, 'samples': 10121664, 'steps': 52716, 'loss/train': 1.6282421350479126} -08/30/2021 22:43:48 - INFO - __main__ - Step 52718: {'lr': 0.0003685879806619743, 'samples': 10121856, 'steps': 52717, 'loss/train': 1.5516606569290161} -08/30/2021 22:43:50 - INFO - __main__ - Step 52719: {'lr': 0.0003685833089208414, 'samples': 10122048, 'steps': 52718, 'loss/train': 1.2628803253173828} -08/30/2021 22:43:50 - INFO - __main__ - Step 52720: {'lr': 0.00036857863712627664, 'samples': 10122240, 'steps': 52719, 'loss/train': 1.076051950454712} -08/30/2021 22:43:50 - INFO - __main__ - Step 52721: {'lr': 0.0003685739652782822, 'samples': 10122432, 'steps': 52720, 'loss/train': 1.0960218906402588} -08/30/2021 22:43:51 - INFO - __main__ - Step 52722: {'lr': 0.00036856929337686015, 'samples': 10122624, 'steps': 52721, 'loss/train': 1.4360874891281128} -08/30/2021 22:43:51 - INFO - __main__ - Step 52723: {'lr': 0.0003685646214220126, 'samples': 10122816, 'steps': 52722, 'loss/train': 1.5417126417160034} -08/30/2021 22:43:52 - INFO - __main__ - Step 52724: {'lr': 0.00036855994941374165, 'samples': 10123008, 'steps': 52723, 'loss/train': 0.7886225581169128} -08/30/2021 22:43:53 - INFO - __main__ - Step 52725: {'lr': 0.0003685552773520495, 'samples': 10123200, 'steps': 52724, 'loss/train': 0.16519133746623993} -08/30/2021 22:43:54 - INFO - __main__ - Step 52726: {'lr': 0.0003685506052369381, 'samples': 10123392, 'steps': 52725, 'loss/train': 1.3718961477279663} -08/30/2021 22:43:54 - INFO - __main__ - Step 52727: {'lr': 0.00036854593306840955, 'samples': 10123584, 'steps': 52726, 'loss/train': 2.813539505004883} -08/30/2021 22:43:54 - INFO - __main__ - Step 52728: {'lr': 0.0003685412608464661, 'samples': 10123776, 'steps': 52727, 'loss/train': 0.997939944267273} -08/30/2021 22:43:55 - INFO - __main__ - Step 52729: {'lr': 0.00036853658857110986, 'samples': 10123968, 'steps': 52728, 'loss/train': 1.1285297870635986} -08/30/2021 22:43:56 - INFO - __main__ - Step 52730: {'lr': 0.0003685319162423428, 'samples': 10124160, 'steps': 52729, 'loss/train': 1.2043447494506836} -08/30/2021 22:43:57 - INFO - __main__ - Step 52731: {'lr': 0.0003685272438601671, 'samples': 10124352, 'steps': 52730, 'loss/train': 1.3782126903533936} -08/30/2021 22:43:57 - INFO - __main__ - Step 52732: {'lr': 0.0003685225714245848, 'samples': 10124544, 'steps': 52731, 'loss/train': 0.021239491179585457} -08/30/2021 22:43:58 - INFO - __main__ - Step 52733: {'lr': 0.0003685178989355981, 'samples': 10124736, 'steps': 52732, 'loss/train': 1.3095142841339111} -08/30/2021 22:43:58 - INFO - __main__ - Step 52734: {'lr': 0.00036851322639320903, 'samples': 10124928, 'steps': 52733, 'loss/train': 1.214749813079834} -08/30/2021 22:43:58 - INFO - __main__ - Step 52735: {'lr': 0.00036850855379741984, 'samples': 10125120, 'steps': 52734, 'loss/train': 1.3897874355316162} -08/30/2021 22:44:00 - INFO - __main__ - Step 52736: {'lr': 0.0003685038811482324, 'samples': 10125312, 'steps': 52735, 'loss/train': 0.20550435781478882} -08/30/2021 22:44:00 - INFO - __main__ - Step 52737: {'lr': 0.00036849920844564903, 'samples': 10125504, 'steps': 52736, 'loss/train': 1.525870442390442} -08/30/2021 22:44:01 - INFO - __main__ - Step 52738: {'lr': 0.00036849453568967174, 'samples': 10125696, 'steps': 52737, 'loss/train': 1.565938949584961} -08/30/2021 22:44:01 - INFO - __main__ - Step 52739: {'lr': 0.0003684898628803026, 'samples': 10125888, 'steps': 52738, 'loss/train': 1.300466537475586} -08/30/2021 22:44:01 - INFO - __main__ - Step 52740: {'lr': 0.00036848519001754374, 'samples': 10126080, 'steps': 52739, 'loss/train': 1.3676319122314453} -08/30/2021 22:44:03 - INFO - __main__ - Step 52741: {'lr': 0.0003684805171013973, 'samples': 10126272, 'steps': 52740, 'loss/train': 1.0476268529891968} -08/30/2021 22:44:03 - INFO - __main__ - Step 52742: {'lr': 0.00036847584413186537, 'samples': 10126464, 'steps': 52741, 'loss/train': 0.9034698605537415} -08/30/2021 22:44:04 - INFO - __main__ - Step 52743: {'lr': 0.0003684711711089501, 'samples': 10126656, 'steps': 52742, 'loss/train': 1.2026904821395874} -08/30/2021 22:44:04 - INFO - __main__ - Step 52744: {'lr': 0.00036846649803265344, 'samples': 10126848, 'steps': 52743, 'loss/train': 1.3953644037246704} -08/30/2021 22:44:04 - INFO - __main__ - Step 52745: {'lr': 0.0003684618249029776, 'samples': 10127040, 'steps': 52744, 'loss/train': 1.542578935623169} -08/30/2021 22:44:07 - INFO - __main__ - Step 52746: {'lr': 0.0003684571517199248, 'samples': 10127232, 'steps': 52745, 'loss/train': 1.8095014095306396} -08/30/2021 22:44:07 - INFO - __main__ - Step 52747: {'lr': 0.000368452478483497, 'samples': 10127424, 'steps': 52746, 'loss/train': 0.9871047735214233} -08/30/2021 22:44:07 - INFO - __main__ - Step 52748: {'lr': 0.0003684478051936964, 'samples': 10127616, 'steps': 52747, 'loss/train': 0.023514069616794586} -08/30/2021 22:44:08 - INFO - __main__ - Step 52749: {'lr': 0.0003684431318505249, 'samples': 10127808, 'steps': 52748, 'loss/train': 0.7879209518432617} -08/30/2021 22:44:08 - INFO - __main__ - Step 52750: {'lr': 0.0003684384584539848, 'samples': 10128000, 'steps': 52749, 'loss/train': 1.3596289157867432} -08/30/2021 22:44:09 - INFO - __main__ - Step 52751: {'lr': 0.0003684337850040782, 'samples': 10128192, 'steps': 52750, 'loss/train': 1.2347923517227173} -08/30/2021 22:44:09 - INFO - __main__ - Step 52752: {'lr': 0.00036842911150080716, 'samples': 10128384, 'steps': 52751, 'loss/train': 0.4994010627269745} -08/30/2021 22:44:09 - INFO - __main__ - Step 52753: {'lr': 0.0003684244379441738, 'samples': 10128576, 'steps': 52752, 'loss/train': 0.3623597025871277} -08/30/2021 22:44:11 - INFO - __main__ - Step 52754: {'lr': 0.00036841976433418024, 'samples': 10128768, 'steps': 52753, 'loss/train': 0.3428556025028229} -08/30/2021 22:44:12 - INFO - __main__ - Step 52755: {'lr': 0.0003684150906708285, 'samples': 10128960, 'steps': 52754, 'loss/train': 1.9974740743637085} -08/30/2021 22:44:12 - INFO - __main__ - Step 52756: {'lr': 0.00036841041695412076, 'samples': 10129152, 'steps': 52755, 'loss/train': 1.3867050409317017} -08/30/2021 22:44:12 - INFO - __main__ - Step 52757: {'lr': 0.00036840574318405914, 'samples': 10129344, 'steps': 52756, 'loss/train': 1.2944309711456299} -08/30/2021 22:44:13 - INFO - __main__ - Step 52758: {'lr': 0.00036840106936064567, 'samples': 10129536, 'steps': 52757, 'loss/train': 0.9662535190582275} -08/30/2021 22:44:14 - INFO - __main__ - Step 52759: {'lr': 0.0003683963954838826, 'samples': 10129728, 'steps': 52758, 'loss/train': 1.1422621011734009} -08/30/2021 22:44:15 - INFO - __main__ - Step 52760: {'lr': 0.00036839172155377184, 'samples': 10129920, 'steps': 52759, 'loss/train': 1.7032216787338257} -08/30/2021 22:44:15 - INFO - __main__ - Step 52761: {'lr': 0.0003683870475703156, 'samples': 10130112, 'steps': 52760, 'loss/train': 0.7078521847724915} -08/30/2021 22:44:15 - INFO - __main__ - Step 52762: {'lr': 0.000368382373533516, 'samples': 10130304, 'steps': 52761, 'loss/train': 0.4826919138431549} -08/30/2021 22:44:16 - INFO - __main__ - Step 52763: {'lr': 0.0003683776994433752, 'samples': 10130496, 'steps': 52762, 'loss/train': 0.8229062557220459} -08/30/2021 22:44:17 - INFO - __main__ - Step 52764: {'lr': 0.0003683730252998951, 'samples': 10130688, 'steps': 52763, 'loss/train': 1.6432713270187378} -08/30/2021 22:44:18 - INFO - __main__ - Step 52765: {'lr': 0.00036836835110307803, 'samples': 10130880, 'steps': 52764, 'loss/train': 1.085395336151123} -08/30/2021 22:44:18 - INFO - __main__ - Step 52766: {'lr': 0.00036836367685292605, 'samples': 10131072, 'steps': 52765, 'loss/train': 0.8023868799209595} -08/30/2021 22:44:18 - INFO - __main__ - Step 52767: {'lr': 0.00036835900254944114, 'samples': 10131264, 'steps': 52766, 'loss/train': 1.3463640213012695} -08/30/2021 22:44:19 - INFO - __main__ - Step 52768: {'lr': 0.0003683543281926255, 'samples': 10131456, 'steps': 52767, 'loss/train': 1.7986454963684082} -08/30/2021 22:44:20 - INFO - __main__ - Step 52769: {'lr': 0.0003683496537824813, 'samples': 10131648, 'steps': 52768, 'loss/train': 0.844243586063385} -08/30/2021 22:44:20 - INFO - __main__ - Step 52770: {'lr': 0.0003683449793190105, 'samples': 10131840, 'steps': 52769, 'loss/train': 1.4779090881347656} -08/30/2021 22:44:21 - INFO - __main__ - Step 52771: {'lr': 0.0003683403048022153, 'samples': 10132032, 'steps': 52770, 'loss/train': 1.3560630083084106} -08/30/2021 22:44:21 - INFO - __main__ - Step 52772: {'lr': 0.0003683356302320978, 'samples': 10132224, 'steps': 52771, 'loss/train': 1.6022785902023315} -08/30/2021 22:44:22 - INFO - __main__ - Step 52773: {'lr': 0.00036833095560866007, 'samples': 10132416, 'steps': 52772, 'loss/train': 1.4472960233688354} -08/30/2021 22:44:24 - INFO - __main__ - Step 52774: {'lr': 0.00036832628093190424, 'samples': 10132608, 'steps': 52773, 'loss/train': 1.2739747762680054} -08/30/2021 22:44:24 - INFO - __main__ - Step 52775: {'lr': 0.0003683216062018324, 'samples': 10132800, 'steps': 52774, 'loss/train': 0.766843318939209} -08/30/2021 22:44:24 - INFO - __main__ - Step 52776: {'lr': 0.0003683169314184467, 'samples': 10132992, 'steps': 52775, 'loss/train': 1.2117451429367065} -08/30/2021 22:44:25 - INFO - __main__ - Step 52777: {'lr': 0.00036831225658174915, 'samples': 10133184, 'steps': 52776, 'loss/train': 1.4466413259506226} -08/30/2021 22:44:25 - INFO - __main__ - Step 52778: {'lr': 0.000368307581691742, 'samples': 10133376, 'steps': 52777, 'loss/train': 6.41992712020874} -08/30/2021 22:44:26 - INFO - __main__ - Step 52779: {'lr': 0.0003683029067484273, 'samples': 10133568, 'steps': 52778, 'loss/train': 0.06106307730078697} -08/30/2021 22:44:27 - INFO - __main__ - Step 52780: {'lr': 0.0003682982317518071, 'samples': 10133760, 'steps': 52779, 'loss/train': 1.038874626159668} -08/30/2021 22:44:28 - INFO - __main__ - Step 52781: {'lr': 0.00036829355670188355, 'samples': 10133952, 'steps': 52780, 'loss/train': 1.8153637647628784} -08/30/2021 22:44:28 - INFO - __main__ - Step 52782: {'lr': 0.0003682888815986587, 'samples': 10134144, 'steps': 52781, 'loss/train': 1.672353744506836} -08/30/2021 22:44:28 - INFO - __main__ - Step 52783: {'lr': 0.00036828420644213474, 'samples': 10134336, 'steps': 52782, 'loss/train': 1.8601869344711304} -08/30/2021 22:44:29 - INFO - __main__ - Step 52784: {'lr': 0.00036827953123231373, 'samples': 10134528, 'steps': 52783, 'loss/train': 1.755374789237976} -08/30/2021 22:44:29 - INFO - __main__ - Step 52785: {'lr': 0.00036827485596919773, 'samples': 10134720, 'steps': 52784, 'loss/train': 1.6547623872756958} -08/30/2021 22:44:30 - INFO - __main__ - Step 52786: {'lr': 0.00036827018065278903, 'samples': 10134912, 'steps': 52785, 'loss/train': 1.2991185188293457} -08/30/2021 22:44:31 - INFO - __main__ - Step 52787: {'lr': 0.00036826550528308956, 'samples': 10135104, 'steps': 52786, 'loss/train': 1.0934385061264038} -08/30/2021 22:44:31 - INFO - __main__ - Step 52788: {'lr': 0.00036826082986010145, 'samples': 10135296, 'steps': 52787, 'loss/train': 1.4156596660614014} -08/30/2021 22:44:32 - INFO - __main__ - Step 52789: {'lr': 0.00036825615438382687, 'samples': 10135488, 'steps': 52788, 'loss/train': 1.6095339059829712} -08/30/2021 22:44:32 - INFO - __main__ - Step 52790: {'lr': 0.00036825147885426786, 'samples': 10135680, 'steps': 52789, 'loss/train': 1.0748971700668335} -08/30/2021 22:44:34 - INFO - __main__ - Step 52791: {'lr': 0.00036824680327142656, 'samples': 10135872, 'steps': 52790, 'loss/train': 1.3358403444290161} -08/30/2021 22:44:34 - INFO - __main__ - Step 52792: {'lr': 0.0003682421276353051, 'samples': 10136064, 'steps': 52791, 'loss/train': 1.1452604532241821} -08/30/2021 22:44:34 - INFO - __main__ - Step 52793: {'lr': 0.0003682374519459056, 'samples': 10136256, 'steps': 52792, 'loss/train': 1.3747785091400146} -08/30/2021 22:44:35 - INFO - __main__ - Step 52794: {'lr': 0.00036823277620323, 'samples': 10136448, 'steps': 52793, 'loss/train': 1.704042673110962} -08/30/2021 22:44:35 - INFO - __main__ - Step 52795: {'lr': 0.00036822810040728065, 'samples': 10136640, 'steps': 52794, 'loss/train': 1.478071928024292} -08/30/2021 22:44:36 - INFO - __main__ - Step 52796: {'lr': 0.00036822342455805954, 'samples': 10136832, 'steps': 52795, 'loss/train': 1.4351744651794434} -08/30/2021 22:44:37 - INFO - __main__ - Step 52797: {'lr': 0.0003682187486555687, 'samples': 10137024, 'steps': 52796, 'loss/train': 1.449101209640503} -08/30/2021 22:44:37 - INFO - __main__ - Step 52798: {'lr': 0.0003682140726998104, 'samples': 10137216, 'steps': 52797, 'loss/train': 1.6020257472991943} -08/30/2021 22:44:38 - INFO - __main__ - Step 52799: {'lr': 0.0003682093966907867, 'samples': 10137408, 'steps': 52798, 'loss/train': 0.8282920718193054} -08/30/2021 22:44:38 - INFO - __main__ - Step 52800: {'lr': 0.00036820472062849954, 'samples': 10137600, 'steps': 52799, 'loss/train': 1.7056143283843994} -08/30/2021 22:44:40 - INFO - __main__ - Step 52801: {'lr': 0.0003682000445129512, 'samples': 10137792, 'steps': 52800, 'loss/train': 1.5834660530090332} -08/30/2021 22:44:40 - INFO - __main__ - Step 52802: {'lr': 0.00036819536834414374, 'samples': 10137984, 'steps': 52801, 'loss/train': 1.1081442832946777} -08/30/2021 22:44:40 - INFO - __main__ - Step 52803: {'lr': 0.00036819069212207933, 'samples': 10138176, 'steps': 52802, 'loss/train': 1.2475008964538574} -08/30/2021 22:44:41 - INFO - __main__ - Step 52804: {'lr': 0.00036818601584675994, 'samples': 10138368, 'steps': 52803, 'loss/train': 1.6573153734207153} -08/30/2021 22:44:41 - INFO - __main__ - Step 52805: {'lr': 0.0003681813395181878, 'samples': 10138560, 'steps': 52804, 'loss/train': 1.216860294342041} -08/30/2021 22:44:43 - INFO - __main__ - Step 52806: {'lr': 0.000368176663136365, 'samples': 10138752, 'steps': 52805, 'loss/train': 1.4358131885528564} -08/30/2021 22:44:44 - INFO - __main__ - Step 52807: {'lr': 0.00036817198670129357, 'samples': 10138944, 'steps': 52806, 'loss/train': 1.004723072052002} -08/30/2021 22:44:44 - INFO - __main__ - Step 52808: {'lr': 0.00036816731021297567, 'samples': 10139136, 'steps': 52807, 'loss/train': 1.0727159976959229} -08/30/2021 22:44:45 - INFO - __main__ - Step 52809: {'lr': 0.0003681626336714134, 'samples': 10139328, 'steps': 52808, 'loss/train': 2.0693864822387695} -08/30/2021 22:44:45 - INFO - __main__ - Step 52810: {'lr': 0.00036815795707660886, 'samples': 10139520, 'steps': 52809, 'loss/train': 0.33582019805908203} -08/30/2021 22:44:45 - INFO - __main__ - Step 52811: {'lr': 0.00036815328042856424, 'samples': 10139712, 'steps': 52810, 'loss/train': 1.613366961479187} -08/30/2021 22:44:47 - INFO - __main__ - Step 52812: {'lr': 0.0003681486037272815, 'samples': 10139904, 'steps': 52811, 'loss/train': 1.600266933441162} -08/30/2021 22:44:47 - INFO - __main__ - Step 52813: {'lr': 0.0003681439269727629, 'samples': 10140096, 'steps': 52812, 'loss/train': 1.3165990114212036} -08/30/2021 22:44:48 - INFO - __main__ - Step 52814: {'lr': 0.00036813925016501036, 'samples': 10140288, 'steps': 52813, 'loss/train': 1.8699873685836792} -08/30/2021 22:44:48 - INFO - __main__ - Step 52815: {'lr': 0.00036813457330402616, 'samples': 10140480, 'steps': 52814, 'loss/train': 1.1939752101898193} -08/30/2021 22:44:48 - INFO - __main__ - Step 52816: {'lr': 0.0003681298963898124, 'samples': 10140672, 'steps': 52815, 'loss/train': 1.0365192890167236} -08/30/2021 22:44:50 - INFO - __main__ - Step 52817: {'lr': 0.000368125219422371, 'samples': 10140864, 'steps': 52816, 'loss/train': 1.1778470277786255} -08/30/2021 22:44:50 - INFO - __main__ - Step 52818: {'lr': 0.00036812054240170427, 'samples': 10141056, 'steps': 52817, 'loss/train': 2.0488033294677734} -08/30/2021 22:44:51 - INFO - __main__ - Step 52819: {'lr': 0.00036811586532781425, 'samples': 10141248, 'steps': 52818, 'loss/train': 0.12901750206947327} -08/30/2021 22:44:51 - INFO - __main__ - Step 52820: {'lr': 0.0003681111882007031, 'samples': 10141440, 'steps': 52819, 'loss/train': 1.6754236221313477} -08/30/2021 22:44:51 - INFO - __main__ - Step 52821: {'lr': 0.0003681065110203728, 'samples': 10141632, 'steps': 52820, 'loss/train': 1.4286178350448608} -08/30/2021 22:44:53 - INFO - __main__ - Step 52822: {'lr': 0.0003681018337868255, 'samples': 10141824, 'steps': 52821, 'loss/train': 1.1651772260665894} -08/30/2021 22:44:54 - INFO - __main__ - Step 52823: {'lr': 0.00036809715650006335, 'samples': 10142016, 'steps': 52822, 'loss/train': 1.5365095138549805} -08/30/2021 22:44:54 - INFO - __main__ - Step 52824: {'lr': 0.0003680924791600885, 'samples': 10142208, 'steps': 52823, 'loss/train': 1.7767486572265625} -08/30/2021 22:44:54 - INFO - __main__ - Step 52825: {'lr': 0.000368087801766903, 'samples': 10142400, 'steps': 52824, 'loss/train': 0.14912737905979156} -08/30/2021 22:44:55 - INFO - __main__ - Step 52826: {'lr': 0.0003680831243205089, 'samples': 10142592, 'steps': 52825, 'loss/train': 0.8397039175033569} -08/30/2021 22:44:56 - INFO - __main__ - Step 52827: {'lr': 0.00036807844682090843, 'samples': 10142784, 'steps': 52826, 'loss/train': 0.9851338863372803} -08/30/2021 22:44:57 - INFO - __main__ - Step 52828: {'lr': 0.0003680737692681036, 'samples': 10142976, 'steps': 52827, 'loss/train': 1.3993828296661377} -08/30/2021 22:44:57 - INFO - __main__ - Step 52829: {'lr': 0.0003680690916620966, 'samples': 10143168, 'steps': 52828, 'loss/train': 1.6471260786056519} -08/30/2021 22:44:57 - INFO - __main__ - Step 52830: {'lr': 0.00036806441400288935, 'samples': 10143360, 'steps': 52829, 'loss/train': 0.07215423882007599} -08/30/2021 22:44:58 - INFO - __main__ - Step 52831: {'lr': 0.00036805973629048416, 'samples': 10143552, 'steps': 52830, 'loss/train': 3.7563297748565674} -08/30/2021 22:44:58 - INFO - __main__ - Step 52832: {'lr': 0.0003680550585248831, 'samples': 10143744, 'steps': 52831, 'loss/train': 1.5225003957748413} -08/30/2021 22:45:00 - INFO - __main__ - Step 52833: {'lr': 0.0003680503807060883, 'samples': 10143936, 'steps': 52832, 'loss/train': 0.7888264060020447} -08/30/2021 22:45:00 - INFO - __main__ - Step 52834: {'lr': 0.0003680457028341018, 'samples': 10144128, 'steps': 52833, 'loss/train': 1.6530288457870483} -08/30/2021 22:45:01 - INFO - __main__ - Step 52835: {'lr': 0.00036804102490892567, 'samples': 10144320, 'steps': 52834, 'loss/train': 1.5260083675384521} -08/30/2021 22:45:01 - INFO - __main__ - Step 52836: {'lr': 0.0003680363469305621, 'samples': 10144512, 'steps': 52835, 'loss/train': 1.8343027830123901} -08/30/2021 22:45:01 - INFO - __main__ - Step 52837: {'lr': 0.00036803166889901316, 'samples': 10144704, 'steps': 52836, 'loss/train': 1.5902246236801147} -08/30/2021 22:45:03 - INFO - __main__ - Step 52838: {'lr': 0.000368026990814281, 'samples': 10144896, 'steps': 52837, 'loss/train': 1.5834227800369263} -08/30/2021 22:45:03 - INFO - __main__ - Step 52839: {'lr': 0.00036802231267636773, 'samples': 10145088, 'steps': 52838, 'loss/train': 0.12509818375110626} -08/30/2021 22:45:04 - INFO - __main__ - Step 52840: {'lr': 0.0003680176344852754, 'samples': 10145280, 'steps': 52839, 'loss/train': 1.5758237838745117} -08/30/2021 22:45:04 - INFO - __main__ - Step 52841: {'lr': 0.00036801295624100616, 'samples': 10145472, 'steps': 52840, 'loss/train': 0.2538892328739166} -08/30/2021 22:45:04 - INFO - __main__ - Step 52842: {'lr': 0.00036800827794356206, 'samples': 10145664, 'steps': 52841, 'loss/train': 2.8197221755981445} -08/30/2021 22:45:06 - INFO - __main__ - Step 52843: {'lr': 0.0003680035995929453, 'samples': 10145856, 'steps': 52842, 'loss/train': 1.5177109241485596} -08/30/2021 22:45:06 - INFO - __main__ - Step 52844: {'lr': 0.00036799892118915785, 'samples': 10146048, 'steps': 52843, 'loss/train': 1.5815762281417847} -08/30/2021 22:45:07 - INFO - __main__ - Step 52845: {'lr': 0.0003679942427322019, 'samples': 10146240, 'steps': 52844, 'loss/train': 0.985563337802887} -08/30/2021 22:45:07 - INFO - __main__ - Step 52846: {'lr': 0.00036798956422207975, 'samples': 10146432, 'steps': 52845, 'loss/train': 0.5850203037261963} -08/30/2021 22:45:07 - INFO - __main__ - Step 52847: {'lr': 0.0003679848856587932, 'samples': 10146624, 'steps': 52846, 'loss/train': 1.5630192756652832} -08/30/2021 22:45:09 - INFO - __main__ - Step 52848: {'lr': 0.0003679802070423445, 'samples': 10146816, 'steps': 52847, 'loss/train': 1.2434501647949219} -08/30/2021 22:45:10 - INFO - __main__ - Step 52849: {'lr': 0.0003679755283727357, 'samples': 10147008, 'steps': 52848, 'loss/train': 4.8473052978515625} -08/30/2021 22:45:10 - INFO - __main__ - Step 52850: {'lr': 0.0003679708496499689, 'samples': 10147200, 'steps': 52849, 'loss/train': 0.43993982672691345} -08/30/2021 22:45:10 - INFO - __main__ - Step 52851: {'lr': 0.0003679661708740463, 'samples': 10147392, 'steps': 52850, 'loss/train': 1.4335788488388062} -08/30/2021 22:45:11 - INFO - __main__ - Step 52852: {'lr': 0.00036796149204497, 'samples': 10147584, 'steps': 52851, 'loss/train': 1.569490909576416} -08/30/2021 22:45:11 - INFO - __main__ - Step 52853: {'lr': 0.0003679568131627421, 'samples': 10147776, 'steps': 52852, 'loss/train': 1.167616605758667} -08/30/2021 22:45:13 - INFO - __main__ - Step 52854: {'lr': 0.0003679521342273647, 'samples': 10147968, 'steps': 52853, 'loss/train': 1.3393454551696777} -08/30/2021 22:45:13 - INFO - __main__ - Step 52855: {'lr': 0.00036794745523883977, 'samples': 10148160, 'steps': 52854, 'loss/train': 1.5885943174362183} -08/30/2021 22:45:14 - INFO - __main__ - Step 52856: {'lr': 0.0003679427761971696, 'samples': 10148352, 'steps': 52855, 'loss/train': 0.5337668061256409} -08/30/2021 22:45:14 - INFO - __main__ - Step 52857: {'lr': 0.0003679380971023562, 'samples': 10148544, 'steps': 52856, 'loss/train': 0.060671236366033554} -08/30/2021 22:45:14 - INFO - __main__ - Step 52858: {'lr': 0.00036793341795440175, 'samples': 10148736, 'steps': 52857, 'loss/train': 1.6230326890945435} -08/30/2021 22:45:16 - INFO - __main__ - Step 52859: {'lr': 0.00036792873875330837, 'samples': 10148928, 'steps': 52858, 'loss/train': 0.6809663772583008} -08/30/2021 22:45:16 - INFO - __main__ - Step 52860: {'lr': 0.000367924059499078, 'samples': 10149120, 'steps': 52859, 'loss/train': 1.2868061065673828} -08/30/2021 22:45:17 - INFO - __main__ - Step 52861: {'lr': 0.000367919380191713, 'samples': 10149312, 'steps': 52860, 'loss/train': 1.0583810806274414} -08/30/2021 22:45:17 - INFO - __main__ - Step 52862: {'lr': 0.0003679147008312153, 'samples': 10149504, 'steps': 52861, 'loss/train': 2.0262184143066406} -08/30/2021 22:45:17 - INFO - __main__ - Step 52863: {'lr': 0.000367910021417587, 'samples': 10149696, 'steps': 52862, 'loss/train': 1.402963399887085} -08/30/2021 22:45:19 - INFO - __main__ - Step 52864: {'lr': 0.0003679053419508303, 'samples': 10149888, 'steps': 52863, 'loss/train': 0.9775792360305786} -08/30/2021 22:45:20 - INFO - __main__ - Step 52865: {'lr': 0.0003679006624309472, 'samples': 10150080, 'steps': 52864, 'loss/train': 0.4156869649887085} -08/30/2021 22:45:20 - INFO - __main__ - Step 52866: {'lr': 0.00036789598285794003, 'samples': 10150272, 'steps': 52865, 'loss/train': 1.5188993215560913} -08/30/2021 22:45:20 - INFO - __main__ - Step 52867: {'lr': 0.0003678913032318107, 'samples': 10150464, 'steps': 52866, 'loss/train': 1.3779767751693726} -08/30/2021 22:45:21 - INFO - __main__ - Step 52868: {'lr': 0.0003678866235525613, 'samples': 10150656, 'steps': 52867, 'loss/train': 0.6728357076644897} -08/30/2021 22:45:21 - INFO - __main__ - Step 52869: {'lr': 0.00036788194382019406, 'samples': 10150848, 'steps': 52868, 'loss/train': 1.3757350444793701} -08/30/2021 22:45:23 - INFO - __main__ - Step 52870: {'lr': 0.000367877264034711, 'samples': 10151040, 'steps': 52869, 'loss/train': 1.8382889032363892} -08/30/2021 22:45:23 - INFO - __main__ - Step 52871: {'lr': 0.0003678725841961144, 'samples': 10151232, 'steps': 52870, 'loss/train': 1.571977138519287} -08/30/2021 22:45:23 - INFO - __main__ - Step 52872: {'lr': 0.00036786790430440606, 'samples': 10151424, 'steps': 52871, 'loss/train': 1.1862865686416626} -08/30/2021 22:45:24 - INFO - __main__ - Step 52873: {'lr': 0.0003678632243595883, 'samples': 10151616, 'steps': 52872, 'loss/train': 1.3522124290466309} -08/30/2021 22:45:24 - INFO - __main__ - Step 52874: {'lr': 0.0003678585443616632, 'samples': 10151808, 'steps': 52873, 'loss/train': 1.2177828550338745} -08/30/2021 22:45:26 - INFO - __main__ - Step 52875: {'lr': 0.0003678538643106329, 'samples': 10152000, 'steps': 52874, 'loss/train': 0.6633574962615967} -08/30/2021 22:45:26 - INFO - __main__ - Step 52876: {'lr': 0.0003678491842064995, 'samples': 10152192, 'steps': 52875, 'loss/train': 1.3696953058242798} -08/30/2021 22:45:26 - INFO - __main__ - Step 52877: {'lr': 0.00036784450404926493, 'samples': 10152384, 'steps': 52876, 'loss/train': 1.2297606468200684} -08/30/2021 22:45:27 - INFO - __main__ - Step 52878: {'lr': 0.00036783982383893155, 'samples': 10152576, 'steps': 52877, 'loss/train': 1.6480772495269775} -08/30/2021 22:45:27 - INFO - __main__ - Step 52879: {'lr': 0.0003678351435755014, 'samples': 10152768, 'steps': 52878, 'loss/train': 1.6736863851547241} -08/30/2021 22:45:29 - INFO - __main__ - Step 52880: {'lr': 0.0003678304632589764, 'samples': 10152960, 'steps': 52879, 'loss/train': 1.8834729194641113} -08/30/2021 22:45:29 - INFO - __main__ - Step 52881: {'lr': 0.00036782578288935893, 'samples': 10153152, 'steps': 52880, 'loss/train': 1.7674905061721802} -08/30/2021 22:45:30 - INFO - __main__ - Step 52882: {'lr': 0.000367821102466651, 'samples': 10153344, 'steps': 52881, 'loss/train': 1.6400136947631836} -08/30/2021 22:45:30 - INFO - __main__ - Step 52883: {'lr': 0.0003678164219908546, 'samples': 10153536, 'steps': 52882, 'loss/train': 9.2638578414917} -08/30/2021 22:45:30 - INFO - __main__ - Step 52884: {'lr': 0.00036781174146197207, 'samples': 10153728, 'steps': 52883, 'loss/train': 2.1339919567108154} -08/30/2021 22:45:31 - INFO - __main__ - Step 52885: {'lr': 0.00036780706088000524, 'samples': 10153920, 'steps': 52884, 'loss/train': 1.4225355386734009} -08/30/2021 22:45:32 - INFO - __main__ - Step 52886: {'lr': 0.0003678023802449564, 'samples': 10154112, 'steps': 52885, 'loss/train': 1.3051801919937134} -08/30/2021 22:45:33 - INFO - __main__ - Step 52887: {'lr': 0.0003677976995568277, 'samples': 10154304, 'steps': 52886, 'loss/train': 0.088077612221241} -08/30/2021 22:45:33 - INFO - __main__ - Step 52888: {'lr': 0.00036779301881562115, 'samples': 10154496, 'steps': 52887, 'loss/train': 1.0581823587417603} -08/30/2021 22:45:33 - INFO - __main__ - Step 52889: {'lr': 0.00036778833802133886, 'samples': 10154688, 'steps': 52888, 'loss/train': 1.6545796394348145} -08/30/2021 22:45:34 - INFO - __main__ - Step 52890: {'lr': 0.000367783657173983, 'samples': 10154880, 'steps': 52889, 'loss/train': 1.7570533752441406} -08/30/2021 22:45:35 - INFO - __main__ - Step 52891: {'lr': 0.0003677789762735556, 'samples': 10155072, 'steps': 52890, 'loss/train': 1.131620168685913} -08/30/2021 22:45:36 - INFO - __main__ - Step 52892: {'lr': 0.0003677742953200588, 'samples': 10155264, 'steps': 52891, 'loss/train': 1.521576166152954} -08/30/2021 22:45:36 - INFO - __main__ - Step 52893: {'lr': 0.0003677696143134948, 'samples': 10155456, 'steps': 52892, 'loss/train': 1.0028271675109863} -08/30/2021 22:45:36 - INFO - __main__ - Step 52894: {'lr': 0.00036776493325386554, 'samples': 10155648, 'steps': 52893, 'loss/train': 4.157871246337891} -08/30/2021 22:45:37 - INFO - __main__ - Step 52895: {'lr': 0.00036776025214117325, 'samples': 10155840, 'steps': 52894, 'loss/train': 2.172318935394287} -08/30/2021 22:45:38 - INFO - __main__ - Step 52896: {'lr': 0.00036775557097542, 'samples': 10156032, 'steps': 52895, 'loss/train': 1.2730040550231934} -08/30/2021 22:45:39 - INFO - __main__ - Step 52897: {'lr': 0.00036775088975660793, 'samples': 10156224, 'steps': 52896, 'loss/train': 1.6778171062469482} -08/30/2021 22:45:39 - INFO - __main__ - Step 52898: {'lr': 0.0003677462084847391, 'samples': 10156416, 'steps': 52897, 'loss/train': 1.2212762832641602} -08/30/2021 22:45:40 - INFO - __main__ - Step 52899: {'lr': 0.0003677415271598157, 'samples': 10156608, 'steps': 52898, 'loss/train': 0.9911786317825317} -08/30/2021 22:45:40 - INFO - __main__ - Step 52900: {'lr': 0.00036773684578183976, 'samples': 10156800, 'steps': 52899, 'loss/train': 1.7771943807601929} -08/30/2021 22:45:42 - INFO - __main__ - Step 52901: {'lr': 0.00036773216435081335, 'samples': 10156992, 'steps': 52900, 'loss/train': 1.9092345237731934} -08/30/2021 22:45:42 - INFO - __main__ - Step 52902: {'lr': 0.00036772748286673866, 'samples': 10157184, 'steps': 52901, 'loss/train': 1.510646104812622} -08/30/2021 22:45:42 - INFO - __main__ - Step 52903: {'lr': 0.00036772280132961786, 'samples': 10157376, 'steps': 52902, 'loss/train': 1.662872076034546} -08/30/2021 22:45:43 - INFO - __main__ - Step 52904: {'lr': 0.0003677181197394529, 'samples': 10157568, 'steps': 52903, 'loss/train': 1.9470168352127075} -08/30/2021 22:45:43 - INFO - __main__ - Step 52905: {'lr': 0.000367713438096246, 'samples': 10157760, 'steps': 52904, 'loss/train': 1.2834594249725342} -08/30/2021 22:45:44 - INFO - __main__ - Step 52906: {'lr': 0.00036770875639999923, 'samples': 10157952, 'steps': 52905, 'loss/train': 1.3543715476989746} -08/30/2021 22:45:45 - INFO - __main__ - Step 52907: {'lr': 0.0003677040746507148, 'samples': 10158144, 'steps': 52906, 'loss/train': 0.7779142260551453} -08/30/2021 22:45:45 - INFO - __main__ - Step 52908: {'lr': 0.00036769939284839463, 'samples': 10158336, 'steps': 52907, 'loss/train': 1.8947523832321167} -08/30/2021 22:45:46 - INFO - __main__ - Step 52909: {'lr': 0.000367694710993041, 'samples': 10158528, 'steps': 52908, 'loss/train': 1.7517786026000977} -08/30/2021 22:45:46 - INFO - __main__ - Step 52910: {'lr': 0.00036769002908465585, 'samples': 10158720, 'steps': 52909, 'loss/train': 1.7450008392333984} -08/30/2021 22:45:46 - INFO - __main__ - Step 52911: {'lr': 0.0003676853471232415, 'samples': 10158912, 'steps': 52910, 'loss/train': 1.2192262411117554} -08/30/2021 22:45:48 - INFO - __main__ - Step 52912: {'lr': 0.00036768066510879985, 'samples': 10159104, 'steps': 52911, 'loss/train': 1.3875399827957153} -08/30/2021 22:45:48 - INFO - __main__ - Step 52913: {'lr': 0.0003676759830413332, 'samples': 10159296, 'steps': 52912, 'loss/train': 0.710380494594574} -08/30/2021 22:45:49 - INFO - __main__ - Step 52914: {'lr': 0.0003676713009208435, 'samples': 10159488, 'steps': 52913, 'loss/train': 1.0504858493804932} -08/30/2021 22:45:49 - INFO - __main__ - Step 52915: {'lr': 0.000367666618747333, 'samples': 10159680, 'steps': 52914, 'loss/train': 2.033491373062134} -08/30/2021 22:45:49 - INFO - __main__ - Step 52916: {'lr': 0.0003676619365208036, 'samples': 10159872, 'steps': 52915, 'loss/train': 1.360023021697998} -08/30/2021 22:45:51 - INFO - __main__ - Step 52917: {'lr': 0.0003676572542412576, 'samples': 10160064, 'steps': 52916, 'loss/train': 1.6952009201049805} -08/30/2021 22:45:51 - INFO - __main__ - Step 52918: {'lr': 0.00036765257190869715, 'samples': 10160256, 'steps': 52917, 'loss/train': 1.649714708328247} -08/30/2021 22:45:52 - INFO - __main__ - Step 52919: {'lr': 0.0003676478895231242, 'samples': 10160448, 'steps': 52918, 'loss/train': 1.833362340927124} -08/30/2021 22:45:52 - INFO - __main__ - Step 52920: {'lr': 0.00036764320708454094, 'samples': 10160640, 'steps': 52919, 'loss/train': 2.5058720111846924} -08/30/2021 22:45:52 - INFO - __main__ - Step 52921: {'lr': 0.0003676385245929494, 'samples': 10160832, 'steps': 52920, 'loss/train': 1.0672963857650757} -08/30/2021 22:45:55 - INFO - __main__ - Step 52922: {'lr': 0.00036763384204835186, 'samples': 10161024, 'steps': 52921, 'loss/train': 1.3552619218826294} -08/30/2021 22:45:55 - INFO - __main__ - Step 52923: {'lr': 0.0003676291594507503, 'samples': 10161216, 'steps': 52922, 'loss/train': 1.1720116138458252} -08/30/2021 22:45:55 - INFO - __main__ - Step 52924: {'lr': 0.0003676244768001468, 'samples': 10161408, 'steps': 52923, 'loss/train': 1.8418108224868774} -08/30/2021 22:45:56 - INFO - __main__ - Step 52925: {'lr': 0.00036761979409654353, 'samples': 10161600, 'steps': 52924, 'loss/train': 1.462021827697754} -08/30/2021 22:45:56 - INFO - __main__ - Step 52926: {'lr': 0.0003676151113399427, 'samples': 10161792, 'steps': 52925, 'loss/train': 1.1038837432861328} -08/30/2021 22:45:57 - INFO - __main__ - Step 52927: {'lr': 0.0003676104285303463, 'samples': 10161984, 'steps': 52926, 'loss/train': 0.15758973360061646} -08/30/2021 22:45:58 - INFO - __main__ - Step 52928: {'lr': 0.00036760574566775634, 'samples': 10162176, 'steps': 52927, 'loss/train': 1.0593544244766235} -08/30/2021 22:45:58 - INFO - __main__ - Step 52929: {'lr': 0.0003676010627521751, 'samples': 10162368, 'steps': 52928, 'loss/train': 1.4163261651992798} -08/30/2021 22:45:59 - INFO - __main__ - Step 52930: {'lr': 0.00036759637978360467, 'samples': 10162560, 'steps': 52929, 'loss/train': 1.3818470239639282} -08/30/2021 22:45:59 - INFO - __main__ - Step 52931: {'lr': 0.00036759169676204705, 'samples': 10162752, 'steps': 52930, 'loss/train': 1.3914273977279663} -08/30/2021 22:45:59 - INFO - __main__ - Step 52932: {'lr': 0.0003675870136875045, 'samples': 10162944, 'steps': 52931, 'loss/train': 1.4438437223434448} -08/30/2021 22:46:01 - INFO - __main__ - Step 52933: {'lr': 0.00036758233055997905, 'samples': 10163136, 'steps': 52932, 'loss/train': 1.2895777225494385} -08/30/2021 22:46:01 - INFO - __main__ - Step 52934: {'lr': 0.0003675776473794728, 'samples': 10163328, 'steps': 52933, 'loss/train': 0.2727830410003662} -08/30/2021 22:46:02 - INFO - __main__ - Step 52935: {'lr': 0.00036757296414598786, 'samples': 10163520, 'steps': 52934, 'loss/train': 1.4995088577270508} -08/30/2021 22:46:02 - INFO - __main__ - Step 52936: {'lr': 0.00036756828085952637, 'samples': 10163712, 'steps': 52935, 'loss/train': 1.610569953918457} -08/30/2021 22:46:02 - INFO - __main__ - Step 52937: {'lr': 0.0003675635975200904, 'samples': 10163904, 'steps': 52936, 'loss/train': 0.9813700318336487} -08/30/2021 22:46:04 - INFO - __main__ - Step 52938: {'lr': 0.0003675589141276821, 'samples': 10164096, 'steps': 52937, 'loss/train': 2.048440456390381} -08/30/2021 22:46:04 - INFO - __main__ - Step 52939: {'lr': 0.0003675542306823036, 'samples': 10164288, 'steps': 52938, 'loss/train': 1.1392234563827515} -08/30/2021 22:46:05 - INFO - __main__ - Step 52940: {'lr': 0.000367549547183957, 'samples': 10164480, 'steps': 52939, 'loss/train': 1.495479941368103} -08/30/2021 22:46:05 - INFO - __main__ - Step 52941: {'lr': 0.0003675448636326443, 'samples': 10164672, 'steps': 52940, 'loss/train': 1.6654627323150635} -08/30/2021 22:46:05 - INFO - __main__ - Step 52942: {'lr': 0.0003675401800283678, 'samples': 10164864, 'steps': 52941, 'loss/train': 1.827637791633606} -08/30/2021 22:46:07 - INFO - __main__ - Step 52943: {'lr': 0.0003675354963711294, 'samples': 10165056, 'steps': 52942, 'loss/train': 1.5564132928848267} -08/30/2021 22:46:08 - INFO - __main__ - Step 52944: {'lr': 0.00036753081266093136, 'samples': 10165248, 'steps': 52943, 'loss/train': 0.9640160202980042} -08/30/2021 22:46:08 - INFO - __main__ - Step 52945: {'lr': 0.00036752612889777577, 'samples': 10165440, 'steps': 52944, 'loss/train': 1.2663378715515137} -08/30/2021 22:46:08 - INFO - __main__ - Step 52946: {'lr': 0.0003675214450816647, 'samples': 10165632, 'steps': 52945, 'loss/train': 2.169135332107544} -08/30/2021 22:46:09 - INFO - __main__ - Step 52947: {'lr': 0.00036751676121260035, 'samples': 10165824, 'steps': 52946, 'loss/train': 0.6767752170562744} -08/30/2021 22:46:10 - INFO - __main__ - Step 52948: {'lr': 0.00036751207729058465, 'samples': 10166016, 'steps': 52947, 'loss/train': 1.3219033479690552} -08/30/2021 22:46:10 - INFO - __main__ - Step 52949: {'lr': 0.00036750739331561986, 'samples': 10166208, 'steps': 52948, 'loss/train': 1.090736746788025} -08/30/2021 22:46:11 - INFO - __main__ - Step 52950: {'lr': 0.0003675027092877081, 'samples': 10166400, 'steps': 52949, 'loss/train': 1.9434583187103271} -08/30/2021 22:46:11 - INFO - __main__ - Step 52951: {'lr': 0.0003674980252068514, 'samples': 10166592, 'steps': 52950, 'loss/train': 0.6372240781784058} -08/30/2021 22:46:12 - INFO - __main__ - Step 52952: {'lr': 0.0003674933410730519, 'samples': 10166784, 'steps': 52951, 'loss/train': 1.5540742874145508} -08/30/2021 22:46:13 - INFO - __main__ - Step 52953: {'lr': 0.00036748865688631175, 'samples': 10166976, 'steps': 52952, 'loss/train': 1.0596449375152588} -08/30/2021 22:46:13 - INFO - __main__ - Step 52954: {'lr': 0.000367483972646633, 'samples': 10167168, 'steps': 52953, 'loss/train': 1.7599678039550781} -08/30/2021 22:46:14 - INFO - __main__ - Step 52955: {'lr': 0.00036747928835401773, 'samples': 10167360, 'steps': 52954, 'loss/train': 1.2872885465621948} -08/30/2021 22:46:14 - INFO - __main__ - Step 52956: {'lr': 0.00036747460400846815, 'samples': 10167552, 'steps': 52955, 'loss/train': 1.8222973346710205} -08/30/2021 22:46:14 - INFO - __main__ - Step 52957: {'lr': 0.00036746991960998635, 'samples': 10167744, 'steps': 52956, 'loss/train': 1.5619595050811768} -08/30/2021 22:46:16 - INFO - __main__ - Step 52958: {'lr': 0.00036746523515857434, 'samples': 10167936, 'steps': 52957, 'loss/train': 1.4632941484451294} -08/30/2021 22:46:16 - INFO - __main__ - Step 52959: {'lr': 0.00036746055065423435, 'samples': 10168128, 'steps': 52958, 'loss/train': 1.4835357666015625} -08/30/2021 22:46:17 - INFO - __main__ - Step 52960: {'lr': 0.0003674558660969685, 'samples': 10168320, 'steps': 52959, 'loss/train': 1.514636516571045} -08/30/2021 22:46:17 - INFO - __main__ - Step 52961: {'lr': 0.0003674511814867788, 'samples': 10168512, 'steps': 52960, 'loss/train': 1.3876765966415405} -08/30/2021 22:46:18 - INFO - __main__ - Step 52962: {'lr': 0.00036744649682366744, 'samples': 10168704, 'steps': 52961, 'loss/train': 1.4712228775024414} -08/30/2021 22:46:18 - INFO - __main__ - Step 52963: {'lr': 0.0003674418121076365, 'samples': 10168896, 'steps': 52962, 'loss/train': 0.9659256339073181} -08/30/2021 22:46:19 - INFO - __main__ - Step 52964: {'lr': 0.00036743712733868807, 'samples': 10169088, 'steps': 52963, 'loss/train': 0.9840158224105835} -08/30/2021 22:46:20 - INFO - __main__ - Step 52965: {'lr': 0.00036743244251682424, 'samples': 10169280, 'steps': 52964, 'loss/train': 1.1047409772872925} -08/30/2021 22:46:20 - INFO - __main__ - Step 52966: {'lr': 0.00036742775764204717, 'samples': 10169472, 'steps': 52965, 'loss/train': 1.4516327381134033} -08/30/2021 22:46:21 - INFO - __main__ - Step 52967: {'lr': 0.000367423072714359, 'samples': 10169664, 'steps': 52966, 'loss/train': 1.3878978490829468} -08/30/2021 22:46:21 - INFO - __main__ - Step 52968: {'lr': 0.00036741838773376187, 'samples': 10169856, 'steps': 52967, 'loss/train': 1.4295021295547485} -08/30/2021 22:46:23 - INFO - __main__ - Step 52969: {'lr': 0.00036741370270025776, 'samples': 10170048, 'steps': 52968, 'loss/train': 1.4250948429107666} -08/30/2021 22:46:23 - INFO - __main__ - Step 52970: {'lr': 0.0003674090176138488, 'samples': 10170240, 'steps': 52969, 'loss/train': 1.7038239240646362} -08/30/2021 22:46:23 - INFO - __main__ - Step 52971: {'lr': 0.0003674043324745372, 'samples': 10170432, 'steps': 52970, 'loss/train': 1.3187508583068848} -08/30/2021 22:46:24 - INFO - __main__ - Step 52972: {'lr': 0.000367399647282325, 'samples': 10170624, 'steps': 52971, 'loss/train': 1.6203367710113525} -08/30/2021 22:46:24 - INFO - __main__ - Step 52973: {'lr': 0.0003673949620372143, 'samples': 10170816, 'steps': 52972, 'loss/train': 1.4784064292907715} -08/30/2021 22:46:26 - INFO - __main__ - Step 52974: {'lr': 0.0003673902767392074, 'samples': 10171008, 'steps': 52973, 'loss/train': 1.2993137836456299} -08/30/2021 22:46:26 - INFO - __main__ - Step 52975: {'lr': 0.00036738559138830613, 'samples': 10171200, 'steps': 52974, 'loss/train': 1.7943003177642822} -08/30/2021 22:46:26 - INFO - __main__ - Step 52976: {'lr': 0.0003673809059845127, 'samples': 10171392, 'steps': 52975, 'loss/train': 1.8203996419906616} -08/30/2021 22:46:27 - INFO - __main__ - Step 52977: {'lr': 0.00036737622052782933, 'samples': 10171584, 'steps': 52976, 'loss/train': 1.5651434659957886} -08/30/2021 22:46:27 - INFO - __main__ - Step 52978: {'lr': 0.000367371535018258, 'samples': 10171776, 'steps': 52977, 'loss/train': 1.6012505292892456} -08/30/2021 22:46:28 - INFO - __main__ - Step 52979: {'lr': 0.00036736684945580083, 'samples': 10171968, 'steps': 52978, 'loss/train': 0.6337563395500183} -08/30/2021 22:46:29 - INFO - __main__ - Step 52980: {'lr': 0.00036736216384046, 'samples': 10172160, 'steps': 52979, 'loss/train': 1.217097520828247} -08/30/2021 22:46:30 - INFO - __main__ - Step 52981: {'lr': 0.00036735747817223766, 'samples': 10172352, 'steps': 52980, 'loss/train': 1.2732174396514893} -08/30/2021 22:46:30 - INFO - __main__ - Step 52982: {'lr': 0.00036735279245113573, 'samples': 10172544, 'steps': 52981, 'loss/train': 1.4605273008346558} -08/30/2021 22:46:31 - INFO - __main__ - Step 52983: {'lr': 0.0003673481066771565, 'samples': 10172736, 'steps': 52982, 'loss/train': 1.8992276191711426} -08/30/2021 22:46:31 - INFO - __main__ - Step 52984: {'lr': 0.00036734342085030205, 'samples': 10172928, 'steps': 52983, 'loss/train': 1.651639461517334} -08/30/2021 22:46:32 - INFO - __main__ - Step 52985: {'lr': 0.0003673387349705744, 'samples': 10173120, 'steps': 52984, 'loss/train': 1.3642909526824951} -08/30/2021 22:46:33 - INFO - __main__ - Step 52986: {'lr': 0.00036733404903797575, 'samples': 10173312, 'steps': 52985, 'loss/train': 1.6846660375595093} -08/30/2021 22:46:33 - INFO - __main__ - Step 52987: {'lr': 0.00036732936305250826, 'samples': 10173504, 'steps': 52986, 'loss/train': 0.7596871852874756} -08/30/2021 22:46:34 - INFO - __main__ - Step 52988: {'lr': 0.00036732467701417387, 'samples': 10173696, 'steps': 52987, 'loss/train': 1.7918012142181396} -08/30/2021 22:46:34 - INFO - __main__ - Step 52989: {'lr': 0.00036731999092297487, 'samples': 10173888, 'steps': 52988, 'loss/train': 0.9866682291030884} -08/30/2021 22:46:36 - INFO - __main__ - Step 52990: {'lr': 0.0003673153047789132, 'samples': 10174080, 'steps': 52989, 'loss/train': 1.1140183210372925} -08/30/2021 22:46:36 - INFO - __main__ - Step 52991: {'lr': 0.0003673106185819911, 'samples': 10174272, 'steps': 52990, 'loss/train': 1.376823902130127} -08/30/2021 22:46:36 - INFO - __main__ - Step 52992: {'lr': 0.00036730593233221074, 'samples': 10174464, 'steps': 52991, 'loss/train': 1.2224533557891846} -08/30/2021 22:46:37 - INFO - __main__ - Step 52993: {'lr': 0.000367301246029574, 'samples': 10174656, 'steps': 52992, 'loss/train': 1.5230166912078857} -08/30/2021 22:46:37 - INFO - __main__ - Step 52994: {'lr': 0.00036729655967408326, 'samples': 10174848, 'steps': 52993, 'loss/train': 0.0942855179309845} -08/30/2021 22:46:39 - INFO - __main__ - Step 52995: {'lr': 0.00036729187326574043, 'samples': 10175040, 'steps': 52994, 'loss/train': 1.4928103685379028} -08/30/2021 22:46:39 - INFO - __main__ - Step 52996: {'lr': 0.00036728718680454763, 'samples': 10175232, 'steps': 52995, 'loss/train': 1.3302651643753052} -08/30/2021 22:46:40 - INFO - __main__ - Step 52997: {'lr': 0.0003672825002905071, 'samples': 10175424, 'steps': 52996, 'loss/train': 2.0062875747680664} -08/30/2021 22:46:40 - INFO - __main__ - Step 52998: {'lr': 0.0003672778137236209, 'samples': 10175616, 'steps': 52997, 'loss/train': 1.104461908340454} -08/30/2021 22:46:40 - INFO - __main__ - Step 52999: {'lr': 0.0003672731271038911, 'samples': 10175808, 'steps': 52998, 'loss/train': 1.7488676309585571} -08/30/2021 22:46:42 - INFO - __main__ - Step 53000: {'lr': 0.0003672684404313199, 'samples': 10176000, 'steps': 52999, 'loss/train': 1.5353302955627441} -08/30/2021 22:46:42 - INFO - __main__ - Step 53001: {'lr': 0.00036726375370590926, 'samples': 10176192, 'steps': 53000, 'loss/train': 1.9689027070999146} -08/30/2021 22:46:43 - INFO - __main__ - Step 53002: {'lr': 0.0003672590669276614, 'samples': 10176384, 'steps': 53001, 'loss/train': 1.2587339878082275} -08/30/2021 22:46:43 - INFO - __main__ - Step 53003: {'lr': 0.0003672543800965784, 'samples': 10176576, 'steps': 53002, 'loss/train': 0.8535210490226746} -08/30/2021 22:46:43 - INFO - __main__ - Step 53004: {'lr': 0.00036724969321266245, 'samples': 10176768, 'steps': 53003, 'loss/train': 1.713154911994934} -08/30/2021 22:46:44 - INFO - __main__ - Step 53005: {'lr': 0.0003672450062759156, 'samples': 10176960, 'steps': 53004, 'loss/train': 1.4972234964370728} -08/30/2021 22:46:45 - INFO - __main__ - Step 53006: {'lr': 0.00036724031928633995, 'samples': 10177152, 'steps': 53005, 'loss/train': 3.3697025775909424} -08/30/2021 22:46:46 - INFO - __main__ - Step 53007: {'lr': 0.00036723563224393753, 'samples': 10177344, 'steps': 53006, 'loss/train': 1.5223716497421265} -08/30/2021 22:46:46 - INFO - __main__ - Step 53008: {'lr': 0.0003672309451487106, 'samples': 10177536, 'steps': 53007, 'loss/train': 1.276400089263916} -08/30/2021 22:46:46 - INFO - __main__ - Step 53009: {'lr': 0.0003672262580006612, 'samples': 10177728, 'steps': 53008, 'loss/train': 1.304882287979126} -08/30/2021 22:46:47 - INFO - __main__ - Step 53010: {'lr': 0.00036722157079979153, 'samples': 10177920, 'steps': 53009, 'loss/train': 1.6667906045913696} -08/30/2021 22:46:48 - INFO - __main__ - Step 53011: {'lr': 0.0003672168835461036, 'samples': 10178112, 'steps': 53010, 'loss/train': 1.0986615419387817} -08/30/2021 22:46:49 - INFO - __main__ - Step 53012: {'lr': 0.00036721219623959956, 'samples': 10178304, 'steps': 53011, 'loss/train': 1.2280393838882446} -08/30/2021 22:46:49 - INFO - __main__ - Step 53013: {'lr': 0.00036720750888028143, 'samples': 10178496, 'steps': 53012, 'loss/train': 1.118146300315857} -08/30/2021 22:46:50 - INFO - __main__ - Step 53014: {'lr': 0.0003672028214681515, 'samples': 10178688, 'steps': 53013, 'loss/train': 0.0921279564499855} -08/30/2021 22:46:50 - INFO - __main__ - Step 53015: {'lr': 0.00036719813400321174, 'samples': 10178880, 'steps': 53014, 'loss/train': 1.11503005027771} -08/30/2021 22:46:52 - INFO - __main__ - Step 53016: {'lr': 0.0003671934464854643, 'samples': 10179072, 'steps': 53015, 'loss/train': 1.5488438606262207} -08/30/2021 22:46:52 - INFO - __main__ - Step 53017: {'lr': 0.00036718875891491134, 'samples': 10179264, 'steps': 53016, 'loss/train': 0.9068090915679932} -08/30/2021 22:46:52 - INFO - __main__ - Step 53018: {'lr': 0.0003671840712915549, 'samples': 10179456, 'steps': 53017, 'loss/train': 1.3363335132598877} -08/30/2021 22:46:53 - INFO - __main__ - Step 53019: {'lr': 0.0003671793836153972, 'samples': 10179648, 'steps': 53018, 'loss/train': 1.0532034635543823} -08/30/2021 22:46:53 - INFO - __main__ - Step 53020: {'lr': 0.00036717469588644017, 'samples': 10179840, 'steps': 53019, 'loss/train': 1.3713171482086182} -08/30/2021 22:46:54 - INFO - __main__ - Step 53021: {'lr': 0.000367170008104686, 'samples': 10180032, 'steps': 53020, 'loss/train': 1.546654224395752} -08/30/2021 22:46:55 - INFO - __main__ - Step 53022: {'lr': 0.000367165320270137, 'samples': 10180224, 'steps': 53021, 'loss/train': 1.233120322227478} -08/30/2021 22:46:55 - INFO - __main__ - Step 53023: {'lr': 0.000367160632382795, 'samples': 10180416, 'steps': 53022, 'loss/train': 1.8887003660202026} -08/30/2021 22:46:56 - INFO - __main__ - Step 53024: {'lr': 0.00036715594444266224, 'samples': 10180608, 'steps': 53023, 'loss/train': 2.006420612335205} -08/30/2021 22:46:56 - INFO - __main__ - Step 53025: {'lr': 0.0003671512564497408, 'samples': 10180800, 'steps': 53024, 'loss/train': 1.4312664270401} -08/30/2021 22:46:58 - INFO - __main__ - Step 53026: {'lr': 0.0003671465684040328, 'samples': 10180992, 'steps': 53025, 'loss/train': 1.4332363605499268} -08/30/2021 22:46:58 - INFO - __main__ - Step 53027: {'lr': 0.00036714188030554046, 'samples': 10181184, 'steps': 53026, 'loss/train': 1.1092573404312134} -08/30/2021 22:46:58 - INFO - __main__ - Step 53028: {'lr': 0.00036713719215426577, 'samples': 10181376, 'steps': 53027, 'loss/train': 0.8608169555664062} -08/30/2021 22:46:59 - INFO - __main__ - Step 53029: {'lr': 0.0003671325039502108, 'samples': 10181568, 'steps': 53028, 'loss/train': 1.4866570234298706} -08/30/2021 22:46:59 - INFO - __main__ - Step 53030: {'lr': 0.0003671278156933778, 'samples': 10181760, 'steps': 53029, 'loss/train': 0.697790801525116} -08/30/2021 22:46:59 - INFO - __main__ - Step 53031: {'lr': 0.00036712312738376875, 'samples': 10181952, 'steps': 53030, 'loss/train': 0.49303168058395386} -08/30/2021 22:47:01 - INFO - __main__ - Step 53032: {'lr': 0.00036711843902138586, 'samples': 10182144, 'steps': 53031, 'loss/train': 1.3356133699417114} -08/30/2021 22:47:02 - INFO - __main__ - Step 53033: {'lr': 0.0003671137506062312, 'samples': 10182336, 'steps': 53032, 'loss/train': 1.5197365283966064} -08/30/2021 22:47:02 - INFO - __main__ - Step 53034: {'lr': 0.000367109062138307, 'samples': 10182528, 'steps': 53033, 'loss/train': 1.443939447402954} -08/30/2021 22:47:03 - INFO - __main__ - Step 53035: {'lr': 0.00036710437361761513, 'samples': 10182720, 'steps': 53034, 'loss/train': 1.565474033355713} -08/30/2021 22:47:03 - INFO - __main__ - Step 53036: {'lr': 0.00036709968504415786, 'samples': 10182912, 'steps': 53035, 'loss/train': 1.7932683229446411} -08/30/2021 22:47:05 - INFO - __main__ - Step 53037: {'lr': 0.00036709499641793725, 'samples': 10183104, 'steps': 53036, 'loss/train': 1.0941112041473389} -08/30/2021 22:47:05 - INFO - __main__ - Step 53038: {'lr': 0.00036709030773895545, 'samples': 10183296, 'steps': 53037, 'loss/train': 0.04810842499136925} -08/30/2021 22:47:05 - INFO - __main__ - Step 53039: {'lr': 0.0003670856190072146, 'samples': 10183488, 'steps': 53038, 'loss/train': 1.2002418041229248} -08/30/2021 22:47:06 - INFO - __main__ - Step 53040: {'lr': 0.00036708093022271677, 'samples': 10183680, 'steps': 53039, 'loss/train': 0.39169299602508545} -08/30/2021 22:47:06 - INFO - __main__ - Step 53041: {'lr': 0.0003670762413854641, 'samples': 10183872, 'steps': 53040, 'loss/train': 1.084177017211914} -08/30/2021 22:47:08 - INFO - __main__ - Step 53042: {'lr': 0.0003670715524954587, 'samples': 10184064, 'steps': 53041, 'loss/train': 1.513096570968628} -08/30/2021 22:47:08 - INFO - __main__ - Step 53043: {'lr': 0.0003670668635527026, 'samples': 10184256, 'steps': 53042, 'loss/train': 1.4138253927230835} -08/30/2021 22:47:09 - INFO - __main__ - Step 53044: {'lr': 0.00036706217455719805, 'samples': 10184448, 'steps': 53043, 'loss/train': 0.12862081825733185} -08/30/2021 22:47:09 - INFO - __main__ - Step 53045: {'lr': 0.000367057485508947, 'samples': 10184640, 'steps': 53044, 'loss/train': 0.04579971358180046} -08/30/2021 22:47:10 - INFO - __main__ - Step 53046: {'lr': 0.0003670527964079517, 'samples': 10184832, 'steps': 53045, 'loss/train': 1.066494345664978} -08/30/2021 22:47:10 - INFO - __main__ - Step 53047: {'lr': 0.0003670481072542142, 'samples': 10185024, 'steps': 53046, 'loss/train': 0.6270720362663269} -08/30/2021 22:47:11 - INFO - __main__ - Step 53048: {'lr': 0.0003670434180477367, 'samples': 10185216, 'steps': 53047, 'loss/train': 1.6485673189163208} -08/30/2021 22:47:12 - INFO - __main__ - Step 53049: {'lr': 0.00036703872878852115, 'samples': 10185408, 'steps': 53048, 'loss/train': 1.623889446258545} -08/30/2021 22:47:12 - INFO - __main__ - Step 53050: {'lr': 0.00036703403947656977, 'samples': 10185600, 'steps': 53049, 'loss/train': 1.3428325653076172} -08/30/2021 22:47:12 - INFO - __main__ - Step 53051: {'lr': 0.0003670293501118847, 'samples': 10185792, 'steps': 53050, 'loss/train': 0.9774247407913208} -08/30/2021 22:47:13 - INFO - __main__ - Step 53052: {'lr': 0.00036702466069446797, 'samples': 10185984, 'steps': 53051, 'loss/train': 1.6507772207260132} -08/30/2021 22:47:15 - INFO - __main__ - Step 53053: {'lr': 0.00036701997122432173, 'samples': 10186176, 'steps': 53052, 'loss/train': 0.6613092422485352} -08/30/2021 22:47:15 - INFO - __main__ - Step 53054: {'lr': 0.00036701528170144813, 'samples': 10186368, 'steps': 53053, 'loss/train': 1.5881325006484985} -08/30/2021 22:47:16 - INFO - __main__ - Step 53055: {'lr': 0.0003670105921258493, 'samples': 10186560, 'steps': 53054, 'loss/train': 0.9100768566131592} -08/30/2021 22:47:16 - INFO - __main__ - Step 53056: {'lr': 0.0003670059024975272, 'samples': 10186752, 'steps': 53055, 'loss/train': 0.02837066724896431} -08/30/2021 22:47:16 - INFO - __main__ - Step 53057: {'lr': 0.00036700121281648415, 'samples': 10186944, 'steps': 53056, 'loss/train': 1.1765162944793701} -08/30/2021 22:47:17 - INFO - __main__ - Step 53058: {'lr': 0.000366996523082722, 'samples': 10187136, 'steps': 53057, 'loss/train': 1.3230974674224854} -08/30/2021 22:47:19 - INFO - __main__ - Step 53059: {'lr': 0.00036699183329624315, 'samples': 10187328, 'steps': 53058, 'loss/train': 0.1231624037027359} -08/30/2021 22:47:19 - INFO - __main__ - Step 53060: {'lr': 0.00036698714345704956, 'samples': 10187520, 'steps': 53059, 'loss/train': 1.0395394563674927} -08/30/2021 22:47:20 - INFO - __main__ - Step 53061: {'lr': 0.00036698245356514336, 'samples': 10187712, 'steps': 53060, 'loss/train': 1.0675544738769531} -08/30/2021 22:47:20 - INFO - __main__ - Step 53062: {'lr': 0.0003669777636205267, 'samples': 10187904, 'steps': 53061, 'loss/train': 0.022404806688427925} -08/30/2021 22:47:20 - INFO - __main__ - Step 53063: {'lr': 0.00036697307362320165, 'samples': 10188096, 'steps': 53062, 'loss/train': 0.022075502201914787} -08/30/2021 22:47:21 - INFO - __main__ - Step 53064: {'lr': 0.0003669683835731703, 'samples': 10188288, 'steps': 53063, 'loss/train': 1.3558034896850586} -08/30/2021 22:47:21 - INFO - __main__ - Step 53065: {'lr': 0.00036696369347043477, 'samples': 10188480, 'steps': 53064, 'loss/train': 1.1132031679153442} -08/30/2021 22:47:22 - INFO - __main__ - Step 53066: {'lr': 0.00036695900331499735, 'samples': 10188672, 'steps': 53065, 'loss/train': 0.710574746131897} -08/30/2021 22:47:23 - INFO - __main__ - Step 53067: {'lr': 0.0003669543131068599, 'samples': 10188864, 'steps': 53066, 'loss/train': 1.6990859508514404} -08/30/2021 22:47:23 - INFO - __main__ - Step 53068: {'lr': 0.0003669496228460247, 'samples': 10189056, 'steps': 53067, 'loss/train': 1.8454500436782837} -08/30/2021 22:47:24 - INFO - __main__ - Step 53069: {'lr': 0.00036694493253249373, 'samples': 10189248, 'steps': 53068, 'loss/train': 1.8786671161651611} -08/30/2021 22:47:24 - INFO - __main__ - Step 53070: {'lr': 0.0003669402421662692, 'samples': 10189440, 'steps': 53069, 'loss/train': 1.2989208698272705} -08/30/2021 22:47:26 - INFO - __main__ - Step 53071: {'lr': 0.0003669355517473532, 'samples': 10189632, 'steps': 53070, 'loss/train': 1.2290717363357544} -08/30/2021 22:47:26 - INFO - __main__ - Step 53072: {'lr': 0.0003669308612757479, 'samples': 10189824, 'steps': 53071, 'loss/train': 1.2725080251693726} -08/30/2021 22:47:27 - INFO - __main__ - Step 53073: {'lr': 0.0003669261707514553, 'samples': 10190016, 'steps': 53072, 'loss/train': 0.49253711104393005} -08/30/2021 22:47:27 - INFO - __main__ - Step 53074: {'lr': 0.0003669214801744776, 'samples': 10190208, 'steps': 53073, 'loss/train': 1.5833349227905273} -08/30/2021 22:47:27 - INFO - __main__ - Step 53075: {'lr': 0.0003669167895448169, 'samples': 10190400, 'steps': 53074, 'loss/train': 1.4562004804611206} -08/30/2021 22:47:29 - INFO - __main__ - Step 53076: {'lr': 0.0003669120988624752, 'samples': 10190592, 'steps': 53075, 'loss/train': 1.7953530550003052} -08/30/2021 22:47:29 - INFO - __main__ - Step 53077: {'lr': 0.0003669074081274548, 'samples': 10190784, 'steps': 53076, 'loss/train': 1.2561743259429932} -08/30/2021 22:47:30 - INFO - __main__ - Step 53078: {'lr': 0.0003669027173397577, 'samples': 10190976, 'steps': 53077, 'loss/train': 1.3289263248443604} -08/30/2021 22:47:30 - INFO - __main__ - Step 53079: {'lr': 0.00036689802649938607, 'samples': 10191168, 'steps': 53078, 'loss/train': 0.41601547598838806} -08/30/2021 22:47:30 - INFO - __main__ - Step 53080: {'lr': 0.00036689333560634195, 'samples': 10191360, 'steps': 53079, 'loss/train': 1.1768739223480225} -08/30/2021 22:47:32 - INFO - __main__ - Step 53081: {'lr': 0.00036688864466062756, 'samples': 10191552, 'steps': 53080, 'loss/train': 1.187766432762146} -08/30/2021 22:47:32 - INFO - __main__ - Step 53082: {'lr': 0.0003668839536622449, 'samples': 10191744, 'steps': 53081, 'loss/train': 1.200555682182312} -08/30/2021 22:47:33 - INFO - __main__ - Step 53083: {'lr': 0.0003668792626111962, 'samples': 10191936, 'steps': 53082, 'loss/train': 1.66214120388031} -08/30/2021 22:47:33 - INFO - __main__ - Step 53084: {'lr': 0.0003668745715074834, 'samples': 10192128, 'steps': 53083, 'loss/train': 1.0854735374450684} -08/30/2021 22:47:33 - INFO - __main__ - Step 53085: {'lr': 0.00036686988035110877, 'samples': 10192320, 'steps': 53084, 'loss/train': 0.23303203284740448} -08/30/2021 22:47:35 - INFO - __main__ - Step 53086: {'lr': 0.0003668651891420744, 'samples': 10192512, 'steps': 53085, 'loss/train': 1.7780293226242065} -08/30/2021 22:47:35 - INFO - __main__ - Step 53087: {'lr': 0.0003668604978803823, 'samples': 10192704, 'steps': 53086, 'loss/train': 0.5159832239151001} -08/30/2021 22:47:36 - INFO - __main__ - Step 53088: {'lr': 0.0003668558065660348, 'samples': 10192896, 'steps': 53087, 'loss/train': 1.6527228355407715} -08/30/2021 22:47:36 - INFO - __main__ - Step 53089: {'lr': 0.0003668511151990338, 'samples': 10193088, 'steps': 53088, 'loss/train': 1.2927652597427368} -08/30/2021 22:47:36 - INFO - __main__ - Step 53090: {'lr': 0.0003668464237793815, 'samples': 10193280, 'steps': 53089, 'loss/train': 1.52219557762146} -08/30/2021 22:47:37 - INFO - __main__ - Step 53091: {'lr': 0.00036684173230707996, 'samples': 10193472, 'steps': 53090, 'loss/train': 2.626725673675537} -08/30/2021 22:47:39 - INFO - __main__ - Step 53092: {'lr': 0.00036683704078213137, 'samples': 10193664, 'steps': 53091, 'loss/train': 1.0025660991668701} -08/30/2021 22:47:39 - INFO - __main__ - Step 53093: {'lr': 0.00036683234920453783, 'samples': 10193856, 'steps': 53092, 'loss/train': 0.6256605982780457} -08/30/2021 22:47:40 - INFO - __main__ - Step 53094: {'lr': 0.0003668276575743014, 'samples': 10194048, 'steps': 53093, 'loss/train': 1.2839723825454712} -08/30/2021 22:47:40 - INFO - __main__ - Step 53095: {'lr': 0.0003668229658914243, 'samples': 10194240, 'steps': 53094, 'loss/train': 1.1742956638336182} -08/30/2021 22:47:40 - INFO - __main__ - Step 53096: {'lr': 0.0003668182741559085, 'samples': 10194432, 'steps': 53095, 'loss/train': 1.7711315155029297} -08/30/2021 22:47:42 - INFO - __main__ - Step 53097: {'lr': 0.00036681358236775625, 'samples': 10194624, 'steps': 53096, 'loss/train': 1.163830280303955} -08/30/2021 22:47:42 - INFO - __main__ - Step 53098: {'lr': 0.00036680889052696954, 'samples': 10194816, 'steps': 53097, 'loss/train': 1.4291363954544067} -08/30/2021 22:47:43 - INFO - __main__ - Step 53099: {'lr': 0.00036680419863355056, 'samples': 10195008, 'steps': 53098, 'loss/train': 1.1183979511260986} -08/30/2021 22:47:43 - INFO - __main__ - Step 53100: {'lr': 0.0003667995066875014, 'samples': 10195200, 'steps': 53099, 'loss/train': 1.6739184856414795} -08/30/2021 22:47:43 - INFO - __main__ - Step 53101: {'lr': 0.00036679481468882425, 'samples': 10195392, 'steps': 53100, 'loss/train': 1.6509748697280884} -08/30/2021 22:47:45 - INFO - __main__ - Step 53102: {'lr': 0.00036679012263752115, 'samples': 10195584, 'steps': 53101, 'loss/train': 1.403045654296875} -08/30/2021 22:47:45 - INFO - __main__ - Step 53103: {'lr': 0.00036678543053359413, 'samples': 10195776, 'steps': 53102, 'loss/train': 1.9423904418945312} -08/30/2021 22:47:46 - INFO - __main__ - Step 53104: {'lr': 0.0003667807383770455, 'samples': 10195968, 'steps': 53103, 'loss/train': 1.424591302871704} -08/30/2021 22:47:46 - INFO - __main__ - Step 53105: {'lr': 0.00036677604616787717, 'samples': 10196160, 'steps': 53104, 'loss/train': 0.9685341119766235} -08/30/2021 22:47:47 - INFO - __main__ - Step 53106: {'lr': 0.00036677135390609145, 'samples': 10196352, 'steps': 53105, 'loss/train': 2.101757287979126} -08/30/2021 22:47:48 - INFO - __main__ - Step 53107: {'lr': 0.0003667666615916903, 'samples': 10196544, 'steps': 53106, 'loss/train': 0.03861301764845848} -08/30/2021 22:47:49 - INFO - __main__ - Step 53108: {'lr': 0.00036676196922467595, 'samples': 10196736, 'steps': 53107, 'loss/train': 0.8503670692443848} -08/30/2021 22:47:49 - INFO - __main__ - Step 53109: {'lr': 0.00036675727680505045, 'samples': 10196928, 'steps': 53108, 'loss/train': 1.0691540241241455} -08/30/2021 22:47:49 - INFO - __main__ - Step 53110: {'lr': 0.0003667525843328159, 'samples': 10197120, 'steps': 53109, 'loss/train': 1.2914034128189087} -08/30/2021 22:47:50 - INFO - __main__ - Step 53111: {'lr': 0.0003667478918079744, 'samples': 10197312, 'steps': 53110, 'loss/train': 1.4227043390274048} -08/30/2021 22:47:51 - INFO - __main__ - Step 53112: {'lr': 0.0003667431992305281, 'samples': 10197504, 'steps': 53111, 'loss/train': 1.1425765752792358} -08/30/2021 22:47:52 - INFO - __main__ - Step 53113: {'lr': 0.0003667385066004792, 'samples': 10197696, 'steps': 53112, 'loss/train': 1.0420361757278442} -08/30/2021 22:47:52 - INFO - __main__ - Step 53114: {'lr': 0.0003667338139178297, 'samples': 10197888, 'steps': 53113, 'loss/train': 0.8898513913154602} -08/30/2021 22:47:52 - INFO - __main__ - Step 53115: {'lr': 0.0003667291211825817, 'samples': 10198080, 'steps': 53114, 'loss/train': 1.3359873294830322} -08/30/2021 22:47:53 - INFO - __main__ - Step 53116: {'lr': 0.0003667244283947374, 'samples': 10198272, 'steps': 53115, 'loss/train': 1.20332670211792} -08/30/2021 22:47:53 - INFO - __main__ - Step 53117: {'lr': 0.0003667197355542989, 'samples': 10198464, 'steps': 53116, 'loss/train': 0.6552751660346985} -08/30/2021 22:47:55 - INFO - __main__ - Step 53118: {'lr': 0.0003667150426612682, 'samples': 10198656, 'steps': 53117, 'loss/train': 1.5831595659255981} -08/30/2021 22:47:55 - INFO - __main__ - Step 53119: {'lr': 0.0003667103497156475, 'samples': 10198848, 'steps': 53118, 'loss/train': 1.1328293085098267} -08/30/2021 22:47:55 - INFO - __main__ - Step 53120: {'lr': 0.00036670565671743905, 'samples': 10199040, 'steps': 53119, 'loss/train': 1.2508949041366577} -08/30/2021 22:47:56 - INFO - __main__ - Step 53121: {'lr': 0.0003667009636666447, 'samples': 10199232, 'steps': 53120, 'loss/train': 1.647360920906067} -08/30/2021 22:47:56 - INFO - __main__ - Step 53122: {'lr': 0.00036669627056326685, 'samples': 10199424, 'steps': 53121, 'loss/train': 0.7447426915168762} -08/30/2021 22:47:58 - INFO - __main__ - Step 53123: {'lr': 0.0003666915774073073, 'samples': 10199616, 'steps': 53122, 'loss/train': 1.2288435697555542} -08/30/2021 22:47:58 - INFO - __main__ - Step 53124: {'lr': 0.00036668688419876837, 'samples': 10199808, 'steps': 53123, 'loss/train': 0.4710957407951355} -08/30/2021 22:47:58 - INFO - __main__ - Step 53125: {'lr': 0.0003666821909376522, 'samples': 10200000, 'steps': 53124, 'loss/train': 1.7645479440689087} -08/30/2021 22:47:59 - INFO - __main__ - Step 53126: {'lr': 0.00036667749762396074, 'samples': 10200192, 'steps': 53125, 'loss/train': 1.1250778436660767} -08/30/2021 22:47:59 - INFO - __main__ - Step 53127: {'lr': 0.0003666728042576962, 'samples': 10200384, 'steps': 53126, 'loss/train': 1.566033959388733} -08/30/2021 22:48:01 - INFO - __main__ - Step 53128: {'lr': 0.0003666681108388608, 'samples': 10200576, 'steps': 53127, 'loss/train': 1.7354872226715088} -08/30/2021 22:48:01 - INFO - __main__ - Step 53129: {'lr': 0.0003666634173674565, 'samples': 10200768, 'steps': 53128, 'loss/train': 1.3731133937835693} -08/30/2021 22:48:01 - INFO - __main__ - Step 53130: {'lr': 0.00036665872384348543, 'samples': 10200960, 'steps': 53129, 'loss/train': 1.2538998126983643} -08/30/2021 22:48:02 - INFO - __main__ - Step 53131: {'lr': 0.00036665403026694976, 'samples': 10201152, 'steps': 53130, 'loss/train': 0.9703413844108582} -08/30/2021 22:48:02 - INFO - __main__ - Step 53132: {'lr': 0.0003666493366378516, 'samples': 10201344, 'steps': 53131, 'loss/train': 1.2547544240951538} -08/30/2021 22:48:04 - INFO - __main__ - Step 53133: {'lr': 0.00036664464295619296, 'samples': 10201536, 'steps': 53132, 'loss/train': 1.7632980346679688} -08/30/2021 22:48:04 - INFO - __main__ - Step 53134: {'lr': 0.0003666399492219762, 'samples': 10201728, 'steps': 53133, 'loss/train': 1.574918508529663} -08/30/2021 22:48:05 - INFO - __main__ - Step 53135: {'lr': 0.0003666352554352032, 'samples': 10201920, 'steps': 53134, 'loss/train': 1.9045681953430176} -08/30/2021 22:48:05 - INFO - __main__ - Step 53136: {'lr': 0.00036663056159587614, 'samples': 10202112, 'steps': 53135, 'loss/train': 0.059278469532728195} -08/30/2021 22:48:05 - INFO - __main__ - Step 53137: {'lr': 0.0003666258677039971, 'samples': 10202304, 'steps': 53136, 'loss/train': 1.2600656747817993} -08/30/2021 22:48:06 - INFO - __main__ - Step 53138: {'lr': 0.00036662117375956834, 'samples': 10202496, 'steps': 53137, 'loss/train': 1.1118632555007935} -08/30/2021 22:48:07 - INFO - __main__ - Step 53139: {'lr': 0.00036661647976259185, 'samples': 10202688, 'steps': 53138, 'loss/train': 1.5370559692382812} -08/30/2021 22:48:08 - INFO - __main__ - Step 53140: {'lr': 0.0003666117857130698, 'samples': 10202880, 'steps': 53139, 'loss/train': 1.055375337600708} -08/30/2021 22:48:08 - INFO - __main__ - Step 53141: {'lr': 0.00036660709161100423, 'samples': 10203072, 'steps': 53140, 'loss/train': 1.829869270324707} -08/30/2021 22:48:08 - INFO - __main__ - Step 53142: {'lr': 0.0003666023974563973, 'samples': 10203264, 'steps': 53141, 'loss/train': 1.3564083576202393} -08/30/2021 22:48:09 - INFO - __main__ - Step 53143: {'lr': 0.0003665977032492511, 'samples': 10203456, 'steps': 53142, 'loss/train': 1.0254392623901367} -08/30/2021 22:48:11 - INFO - __main__ - Step 53144: {'lr': 0.00036659300898956784, 'samples': 10203648, 'steps': 53143, 'loss/train': 1.7108354568481445} -08/30/2021 22:48:11 - INFO - __main__ - Step 53145: {'lr': 0.0003665883146773496, 'samples': 10203840, 'steps': 53144, 'loss/train': 1.274196743965149} -08/30/2021 22:48:11 - INFO - __main__ - Step 53146: {'lr': 0.0003665836203125984, 'samples': 10204032, 'steps': 53145, 'loss/train': 1.2545244693756104} -08/30/2021 22:48:12 - INFO - __main__ - Step 53147: {'lr': 0.0003665789258953164, 'samples': 10204224, 'steps': 53146, 'loss/train': 1.4287270307540894} -08/30/2021 22:48:12 - INFO - __main__ - Step 53148: {'lr': 0.00036657423142550576, 'samples': 10204416, 'steps': 53147, 'loss/train': 1.3680726289749146} -08/30/2021 22:48:14 - INFO - __main__ - Step 53149: {'lr': 0.00036656953690316865, 'samples': 10204608, 'steps': 53148, 'loss/train': 2.4107770919799805} -08/30/2021 22:48:14 - INFO - __main__ - Step 53150: {'lr': 0.000366564842328307, 'samples': 10204800, 'steps': 53149, 'loss/train': 1.1396530866622925} -08/30/2021 22:48:14 - INFO - __main__ - Step 53151: {'lr': 0.0003665601477009231, 'samples': 10204992, 'steps': 53150, 'loss/train': 0.936739981174469} -08/30/2021 22:48:15 - INFO - __main__ - Step 53152: {'lr': 0.00036655545302101894, 'samples': 10205184, 'steps': 53151, 'loss/train': 2.040178060531616} -08/30/2021 22:48:15 - INFO - __main__ - Step 53153: {'lr': 0.00036655075828859673, 'samples': 10205376, 'steps': 53152, 'loss/train': 0.8591750264167786} -08/30/2021 22:48:17 - INFO - __main__ - Step 53154: {'lr': 0.0003665460635036585, 'samples': 10205568, 'steps': 53153, 'loss/train': 1.7109917402267456} -08/30/2021 22:48:17 - INFO - __main__ - Step 53155: {'lr': 0.00036654136866620646, 'samples': 10205760, 'steps': 53154, 'loss/train': 1.1160075664520264} -08/30/2021 22:48:17 - INFO - __main__ - Step 53156: {'lr': 0.0003665366737762427, 'samples': 10205952, 'steps': 53155, 'loss/train': 1.077751874923706} -08/30/2021 22:48:18 - INFO - __main__ - Step 53157: {'lr': 0.0003665319788337692, 'samples': 10206144, 'steps': 53156, 'loss/train': 1.0127267837524414} -08/30/2021 22:48:18 - INFO - __main__ - Step 53158: {'lr': 0.0003665272838387883, 'samples': 10206336, 'steps': 53157, 'loss/train': 1.58287513256073} -08/30/2021 22:48:20 - INFO - __main__ - Step 53159: {'lr': 0.00036652258879130194, 'samples': 10206528, 'steps': 53158, 'loss/train': 1.1335201263427734} -08/30/2021 22:48:20 - INFO - __main__ - Step 53160: {'lr': 0.0003665178936913123, 'samples': 10206720, 'steps': 53159, 'loss/train': 0.8323636651039124} -08/30/2021 22:48:21 - INFO - __main__ - Step 53161: {'lr': 0.0003665131985388215, 'samples': 10206912, 'steps': 53160, 'loss/train': 1.0658328533172607} -08/30/2021 22:48:21 - INFO - __main__ - Step 53162: {'lr': 0.00036650850333383174, 'samples': 10207104, 'steps': 53161, 'loss/train': 1.0367801189422607} -08/30/2021 22:48:21 - INFO - __main__ - Step 53163: {'lr': 0.000366503808076345, 'samples': 10207296, 'steps': 53162, 'loss/train': 1.3140429258346558} -08/30/2021 22:48:22 - INFO - __main__ - Step 53164: {'lr': 0.00036649911276636336, 'samples': 10207488, 'steps': 53163, 'loss/train': 1.3835654258728027} -08/30/2021 22:48:23 - INFO - __main__ - Step 53165: {'lr': 0.0003664944174038891, 'samples': 10207680, 'steps': 53164, 'loss/train': 2.0678176879882812} -08/30/2021 22:48:24 - INFO - __main__ - Step 53166: {'lr': 0.0003664897219889242, 'samples': 10207872, 'steps': 53165, 'loss/train': 1.299597978591919} -08/30/2021 22:48:24 - INFO - __main__ - Step 53167: {'lr': 0.0003664850265214709, 'samples': 10208064, 'steps': 53166, 'loss/train': 1.2662023305892944} -08/30/2021 22:48:24 - INFO - __main__ - Step 53168: {'lr': 0.00036648033100153117, 'samples': 10208256, 'steps': 53167, 'loss/train': 1.2045398950576782} -08/30/2021 22:48:25 - INFO - __main__ - Step 53169: {'lr': 0.0003664756354291073, 'samples': 10208448, 'steps': 53168, 'loss/train': 1.1443707942962646} -08/30/2021 22:48:26 - INFO - __main__ - Step 53170: {'lr': 0.0003664709398042012, 'samples': 10208640, 'steps': 53169, 'loss/train': 0.04853302612900734} -08/30/2021 22:48:27 - INFO - __main__ - Step 53171: {'lr': 0.00036646624412681514, 'samples': 10208832, 'steps': 53170, 'loss/train': 1.3704601526260376} -08/30/2021 22:48:27 - INFO - __main__ - Step 53172: {'lr': 0.0003664615483969511, 'samples': 10209024, 'steps': 53171, 'loss/train': 1.043784260749817} -08/30/2021 22:48:27 - INFO - __main__ - Step 53173: {'lr': 0.0003664568526146114, 'samples': 10209216, 'steps': 53172, 'loss/train': 1.3911161422729492} -08/30/2021 22:48:28 - INFO - __main__ - Step 53174: {'lr': 0.000366452156779798, 'samples': 10209408, 'steps': 53173, 'loss/train': 1.2773371934890747} -08/30/2021 22:48:29 - INFO - __main__ - Step 53175: {'lr': 0.000366447460892513, 'samples': 10209600, 'steps': 53174, 'loss/train': 1.1461070775985718} -08/30/2021 22:48:29 - INFO - __main__ - Step 53176: {'lr': 0.0003664427649527587, 'samples': 10209792, 'steps': 53175, 'loss/train': 1.1184347867965698} -08/30/2021 22:48:30 - INFO - __main__ - Step 53177: {'lr': 0.000366438068960537, 'samples': 10209984, 'steps': 53176, 'loss/train': 1.164221167564392} -08/30/2021 22:48:30 - INFO - __main__ - Step 53178: {'lr': 0.0003664333729158501, 'samples': 10210176, 'steps': 53177, 'loss/train': 1.2854918241500854} -08/30/2021 22:48:31 - INFO - __main__ - Step 53179: {'lr': 0.0003664286768187002, 'samples': 10210368, 'steps': 53178, 'loss/train': 1.6035661697387695} -08/30/2021 22:48:32 - INFO - __main__ - Step 53180: {'lr': 0.0003664239806690892, 'samples': 10210560, 'steps': 53179, 'loss/train': 0.7715705037117004} -08/30/2021 22:48:32 - INFO - __main__ - Step 53181: {'lr': 0.00036641928446701943, 'samples': 10210752, 'steps': 53180, 'loss/train': 1.0717874765396118} -08/30/2021 22:48:33 - INFO - __main__ - Step 53182: {'lr': 0.00036641458821249295, 'samples': 10210944, 'steps': 53181, 'loss/train': 1.0671672821044922} -08/30/2021 22:48:33 - INFO - __main__ - Step 53183: {'lr': 0.00036640989190551184, 'samples': 10211136, 'steps': 53182, 'loss/train': 1.3902512788772583} -08/30/2021 22:48:33 - INFO - __main__ - Step 53184: {'lr': 0.00036640519554607823, 'samples': 10211328, 'steps': 53183, 'loss/train': 1.3211222887039185} -08/30/2021 22:48:35 - INFO - __main__ - Step 53185: {'lr': 0.00036640049913419417, 'samples': 10211520, 'steps': 53184, 'loss/train': 1.404670238494873} -08/30/2021 22:48:35 - INFO - __main__ - Step 53186: {'lr': 0.00036639580266986183, 'samples': 10211712, 'steps': 53185, 'loss/train': 1.5652908086776733} -08/30/2021 22:48:36 - INFO - __main__ - Step 53187: {'lr': 0.00036639110615308343, 'samples': 10211904, 'steps': 53186, 'loss/train': 1.5481977462768555} -08/30/2021 22:48:36 - INFO - __main__ - Step 53188: {'lr': 0.0003663864095838609, 'samples': 10212096, 'steps': 53187, 'loss/train': 0.6847036480903625} -08/30/2021 22:48:36 - INFO - __main__ - Step 53189: {'lr': 0.0003663817129621966, 'samples': 10212288, 'steps': 53188, 'loss/train': 0.2752286493778229} -08/30/2021 22:48:38 - INFO - __main__ - Step 53190: {'lr': 0.0003663770162880924, 'samples': 10212480, 'steps': 53189, 'loss/train': 1.2976406812667847} -08/30/2021 22:48:39 - INFO - __main__ - Step 53191: {'lr': 0.00036637231956155046, 'samples': 10212672, 'steps': 53190, 'loss/train': 2.2436041831970215} -08/30/2021 22:48:39 - INFO - __main__ - Step 53192: {'lr': 0.000366367622782573, 'samples': 10212864, 'steps': 53191, 'loss/train': 1.1812256574630737} -08/30/2021 22:48:39 - INFO - __main__ - Step 53193: {'lr': 0.0003663629259511621, 'samples': 10213056, 'steps': 53192, 'loss/train': 1.5116875171661377} -08/30/2021 22:48:40 - INFO - __main__ - Step 53194: {'lr': 0.00036635822906731986, 'samples': 10213248, 'steps': 53193, 'loss/train': 1.1701563596725464} -08/30/2021 22:48:40 - INFO - __main__ - Step 53195: {'lr': 0.0003663535321310484, 'samples': 10213440, 'steps': 53194, 'loss/train': 1.5494961738586426} -08/30/2021 22:48:42 - INFO - __main__ - Step 53196: {'lr': 0.00036634883514234987, 'samples': 10213632, 'steps': 53195, 'loss/train': 1.2427462339401245} -08/30/2021 22:48:42 - INFO - __main__ - Step 53197: {'lr': 0.00036634413810122626, 'samples': 10213824, 'steps': 53196, 'loss/train': 1.6782783269882202} -08/30/2021 22:48:42 - INFO - __main__ - Step 53198: {'lr': 0.0003663394410076798, 'samples': 10214016, 'steps': 53197, 'loss/train': 1.3597197532653809} -08/30/2021 22:48:43 - INFO - __main__ - Step 53199: {'lr': 0.00036633474386171263, 'samples': 10214208, 'steps': 53198, 'loss/train': 0.4300593137741089} -08/30/2021 22:48:43 - INFO - __main__ - Step 53200: {'lr': 0.00036633004666332674, 'samples': 10214400, 'steps': 53199, 'loss/train': 1.6808253526687622} -08/30/2021 22:48:45 - INFO - __main__ - Step 53201: {'lr': 0.0003663253494125244, 'samples': 10214592, 'steps': 53200, 'loss/train': 1.1583746671676636} -08/30/2021 22:48:46 - INFO - __main__ - Step 53202: {'lr': 0.0003663206521093076, 'samples': 10214784, 'steps': 53201, 'loss/train': 2.1961965560913086} -08/30/2021 22:48:46 - INFO - __main__ - Step 53203: {'lr': 0.00036631595475367855, 'samples': 10214976, 'steps': 53202, 'loss/train': 1.0480351448059082} -08/30/2021 22:48:46 - INFO - __main__ - Step 53204: {'lr': 0.0003663112573456393, 'samples': 10215168, 'steps': 53203, 'loss/train': 1.6802586317062378} -08/30/2021 22:48:47 - INFO - __main__ - Step 53205: {'lr': 0.00036630655988519203, 'samples': 10215360, 'steps': 53204, 'loss/train': 1.7026524543762207} -08/30/2021 22:48:48 - INFO - __main__ - Step 53206: {'lr': 0.00036630186237233877, 'samples': 10215552, 'steps': 53205, 'loss/train': 1.1888130903244019} -08/30/2021 22:48:49 - INFO - __main__ - Step 53207: {'lr': 0.00036629716480708174, 'samples': 10215744, 'steps': 53206, 'loss/train': 1.4900892972946167} -08/30/2021 22:48:49 - INFO - __main__ - Step 53208: {'lr': 0.00036629246718942294, 'samples': 10215936, 'steps': 53207, 'loss/train': 0.8244256377220154} -08/30/2021 22:48:49 - INFO - __main__ - Step 53209: {'lr': 0.0003662877695193646, 'samples': 10216128, 'steps': 53208, 'loss/train': 1.4629201889038086} -08/30/2021 22:48:50 - INFO - __main__ - Step 53210: {'lr': 0.00036628307179690877, 'samples': 10216320, 'steps': 53209, 'loss/train': 0.2627696692943573} -08/30/2021 22:48:52 - INFO - __main__ - Step 53211: {'lr': 0.0003662783740220576, 'samples': 10216512, 'steps': 53210, 'loss/train': 1.0426281690597534} -08/30/2021 22:48:53 - INFO - __main__ - Step 53212: {'lr': 0.00036627367619481316, 'samples': 10216704, 'steps': 53211, 'loss/train': 1.1042983531951904} -08/30/2021 22:48:53 - INFO - __main__ - Step 53213: {'lr': 0.00036626897831517756, 'samples': 10216896, 'steps': 53212, 'loss/train': 1.2236188650131226} -08/30/2021 22:48:53 - INFO - __main__ - Step 53214: {'lr': 0.000366264280383153, 'samples': 10217088, 'steps': 53213, 'loss/train': 1.517566204071045} -08/30/2021 22:48:54 - INFO - __main__ - Step 53215: {'lr': 0.00036625958239874156, 'samples': 10217280, 'steps': 53214, 'loss/train': 0.4312618374824524} -08/30/2021 22:48:54 - INFO - __main__ - Step 53216: {'lr': 0.0003662548843619454, 'samples': 10217472, 'steps': 53215, 'loss/train': 0.4052829444408417} -08/30/2021 22:48:54 - INFO - __main__ - Step 53217: {'lr': 0.00036625018627276646, 'samples': 10217664, 'steps': 53216, 'loss/train': 1.099495768547058} -08/30/2021 22:48:56 - INFO - __main__ - Step 53218: {'lr': 0.0003662454881312071, 'samples': 10217856, 'steps': 53217, 'loss/train': 1.353546380996704} -08/30/2021 22:48:56 - INFO - __main__ - Step 53219: {'lr': 0.0003662407899372692, 'samples': 10218048, 'steps': 53218, 'loss/train': 1.8712952136993408} -08/30/2021 22:48:56 - INFO - __main__ - Step 53220: {'lr': 0.000366236091690955, 'samples': 10218240, 'steps': 53219, 'loss/train': 1.2671988010406494} -08/30/2021 22:48:57 - INFO - __main__ - Step 53221: {'lr': 0.00036623139339226664, 'samples': 10218432, 'steps': 53220, 'loss/train': 1.942024827003479} -08/30/2021 22:48:57 - INFO - __main__ - Step 53222: {'lr': 0.00036622669504120627, 'samples': 10218624, 'steps': 53221, 'loss/train': 1.6858413219451904} -08/30/2021 22:48:59 - INFO - __main__ - Step 53223: {'lr': 0.0003662219966377759, 'samples': 10218816, 'steps': 53222, 'loss/train': 1.6491044759750366} -08/30/2021 22:48:59 - INFO - __main__ - Step 53224: {'lr': 0.0003662172981819777, 'samples': 10219008, 'steps': 53223, 'loss/train': 1.4158514738082886} -08/30/2021 22:49:00 - INFO - __main__ - Step 53225: {'lr': 0.00036621259967381374, 'samples': 10219200, 'steps': 53224, 'loss/train': 0.0857100561261177} -08/30/2021 22:49:00 - INFO - __main__ - Step 53226: {'lr': 0.0003662079011132862, 'samples': 10219392, 'steps': 53225, 'loss/train': 2.865140199661255} -08/30/2021 22:49:00 - INFO - __main__ - Step 53227: {'lr': 0.0003662032025003972, 'samples': 10219584, 'steps': 53226, 'loss/train': 1.760138750076294} -08/30/2021 22:49:02 - INFO - __main__ - Step 53228: {'lr': 0.0003661985038351488, 'samples': 10219776, 'steps': 53227, 'loss/train': 1.2502361536026} -08/30/2021 22:49:02 - INFO - __main__ - Step 53229: {'lr': 0.0003661938051175432, 'samples': 10219968, 'steps': 53228, 'loss/train': 0.8863047957420349} -08/30/2021 22:49:03 - INFO - __main__ - Step 53230: {'lr': 0.0003661891063475824, 'samples': 10220160, 'steps': 53229, 'loss/train': 1.418977975845337} -08/30/2021 22:49:03 - INFO - __main__ - Step 53231: {'lr': 0.0003661844075252686, 'samples': 10220352, 'steps': 53230, 'loss/train': 1.4624571800231934} -08/30/2021 22:49:03 - INFO - __main__ - Step 53232: {'lr': 0.0003661797086506039, 'samples': 10220544, 'steps': 53231, 'loss/train': 1.3781826496124268} -08/30/2021 22:49:05 - INFO - __main__ - Step 53233: {'lr': 0.0003661750097235904, 'samples': 10220736, 'steps': 53232, 'loss/train': 1.2332086563110352} -08/30/2021 22:49:06 - INFO - __main__ - Step 53234: {'lr': 0.00036617031074423023, 'samples': 10220928, 'steps': 53233, 'loss/train': 1.2848411798477173} -08/30/2021 22:49:06 - INFO - __main__ - Step 53235: {'lr': 0.00036616561171252547, 'samples': 10221120, 'steps': 53234, 'loss/train': 1.5117601156234741} -08/30/2021 22:49:06 - INFO - __main__ - Step 53236: {'lr': 0.0003661609126284784, 'samples': 10221312, 'steps': 53235, 'loss/train': 1.5077972412109375} -08/30/2021 22:49:07 - INFO - __main__ - Step 53237: {'lr': 0.00036615621349209094, 'samples': 10221504, 'steps': 53236, 'loss/train': 0.6492274403572083} -08/30/2021 22:49:07 - INFO - __main__ - Step 53238: {'lr': 0.00036615151430336536, 'samples': 10221696, 'steps': 53237, 'loss/train': 1.3716254234313965} -08/30/2021 22:49:08 - INFO - __main__ - Step 53239: {'lr': 0.0003661468150623036, 'samples': 10221888, 'steps': 53238, 'loss/train': 1.6493276357650757} -08/30/2021 22:49:09 - INFO - __main__ - Step 53240: {'lr': 0.0003661421157689079, 'samples': 10222080, 'steps': 53239, 'loss/train': 0.5903933048248291} -08/30/2021 22:49:09 - INFO - __main__ - Step 53241: {'lr': 0.00036613741642318033, 'samples': 10222272, 'steps': 53240, 'loss/train': 0.7079034447669983} -08/30/2021 22:49:10 - INFO - __main__ - Step 53242: {'lr': 0.00036613271702512306, 'samples': 10222464, 'steps': 53241, 'loss/train': 1.8750361204147339} -08/30/2021 22:49:10 - INFO - __main__ - Step 53243: {'lr': 0.00036612801757473823, 'samples': 10222656, 'steps': 53242, 'loss/train': 1.4853777885437012} -08/30/2021 22:49:11 - INFO - __main__ - Step 53244: {'lr': 0.00036612331807202785, 'samples': 10222848, 'steps': 53243, 'loss/train': 1.665930986404419} -08/30/2021 22:49:12 - INFO - __main__ - Step 53245: {'lr': 0.00036611861851699415, 'samples': 10223040, 'steps': 53244, 'loss/train': 1.3020669221878052} -08/30/2021 22:49:12 - INFO - __main__ - Step 53246: {'lr': 0.00036611391890963913, 'samples': 10223232, 'steps': 53245, 'loss/train': 1.5422465801239014} -08/30/2021 22:49:13 - INFO - __main__ - Step 53247: {'lr': 0.000366109219249965, 'samples': 10223424, 'steps': 53246, 'loss/train': 1.1618731021881104} -08/30/2021 22:49:13 - INFO - __main__ - Step 53248: {'lr': 0.00036610451953797386, 'samples': 10223616, 'steps': 53247, 'loss/train': 1.1686583757400513} -08/30/2021 22:49:14 - INFO - __main__ - Step 53249: {'lr': 0.0003660998197736677, 'samples': 10223808, 'steps': 53248, 'loss/train': 1.0477544069290161} -08/30/2021 22:49:15 - INFO - __main__ - Step 53250: {'lr': 0.00036609511995704894, 'samples': 10224000, 'steps': 53249, 'loss/train': 0.7289081811904907} -08/30/2021 22:49:15 - INFO - __main__ - Step 53251: {'lr': 0.0003660904200881194, 'samples': 10224192, 'steps': 53250, 'loss/train': 1.335196852684021} -08/30/2021 22:49:16 - INFO - __main__ - Step 53252: {'lr': 0.00036608572016688136, 'samples': 10224384, 'steps': 53251, 'loss/train': 1.3050537109375} -08/30/2021 22:49:16 - INFO - __main__ - Step 53253: {'lr': 0.00036608102019333684, 'samples': 10224576, 'steps': 53252, 'loss/train': 1.310990571975708} -08/30/2021 22:49:18 - INFO - __main__ - Step 53254: {'lr': 0.00036607632016748796, 'samples': 10224768, 'steps': 53253, 'loss/train': 1.2805341482162476} -08/30/2021 22:49:19 - INFO - __main__ - Step 53255: {'lr': 0.00036607162008933696, 'samples': 10224960, 'steps': 53254, 'loss/train': 1.602102518081665} -08/30/2021 22:49:19 - INFO - __main__ - Step 53256: {'lr': 0.00036606691995888594, 'samples': 10225152, 'steps': 53255, 'loss/train': 1.5757710933685303} -08/30/2021 22:49:19 - INFO - __main__ - Step 53257: {'lr': 0.00036606221977613686, 'samples': 10225344, 'steps': 53256, 'loss/train': 0.6729387640953064} -08/30/2021 22:49:20 - INFO - __main__ - Step 53258: {'lr': 0.0003660575195410919, 'samples': 10225536, 'steps': 53257, 'loss/train': 1.706623911857605} -08/30/2021 22:49:20 - INFO - __main__ - Step 53259: {'lr': 0.0003660528192537533, 'samples': 10225728, 'steps': 53258, 'loss/train': 1.0621718168258667} -08/30/2021 22:49:21 - INFO - __main__ - Step 53260: {'lr': 0.00036604811891412296, 'samples': 10225920, 'steps': 53259, 'loss/train': 1.0937594175338745} -08/30/2021 22:49:22 - INFO - __main__ - Step 53261: {'lr': 0.00036604341852220325, 'samples': 10226112, 'steps': 53260, 'loss/train': 1.6766093969345093} -08/30/2021 22:49:22 - INFO - __main__ - Step 53262: {'lr': 0.00036603871807799616, 'samples': 10226304, 'steps': 53261, 'loss/train': 0.7190766930580139} -08/30/2021 22:49:23 - INFO - __main__ - Step 53263: {'lr': 0.0003660340175815038, 'samples': 10226496, 'steps': 53262, 'loss/train': 1.536271095275879} -08/30/2021 22:49:23 - INFO - __main__ - Step 53264: {'lr': 0.0003660293170327283, 'samples': 10226688, 'steps': 53263, 'loss/train': 0.6218279600143433} -08/30/2021 22:49:24 - INFO - __main__ - Step 53265: {'lr': 0.0003660246164316717, 'samples': 10226880, 'steps': 53264, 'loss/train': 1.1906983852386475} -08/30/2021 22:49:25 - INFO - __main__ - Step 53266: {'lr': 0.00036601991577833634, 'samples': 10227072, 'steps': 53265, 'loss/train': 1.0640814304351807} -08/30/2021 22:49:25 - INFO - __main__ - Step 53267: {'lr': 0.00036601521507272414, 'samples': 10227264, 'steps': 53266, 'loss/train': 0.5387945175170898} -08/30/2021 22:49:26 - INFO - __main__ - Step 53268: {'lr': 0.00036601051431483725, 'samples': 10227456, 'steps': 53267, 'loss/train': 1.8342547416687012} -08/30/2021 22:49:26 - INFO - __main__ - Step 53269: {'lr': 0.0003660058135046778, 'samples': 10227648, 'steps': 53268, 'loss/train': 1.051466941833496} -08/30/2021 22:49:27 - INFO - __main__ - Step 53270: {'lr': 0.000366001112642248, 'samples': 10227840, 'steps': 53269, 'loss/train': 0.9883494973182678} -08/30/2021 22:49:28 - INFO - __main__ - Step 53271: {'lr': 0.00036599641172754984, 'samples': 10228032, 'steps': 53270, 'loss/train': 1.3072794675827026} -08/30/2021 22:49:28 - INFO - __main__ - Step 53272: {'lr': 0.0003659917107605854, 'samples': 10228224, 'steps': 53271, 'loss/train': 1.2601321935653687} -08/30/2021 22:49:29 - INFO - __main__ - Step 53273: {'lr': 0.000365987009741357, 'samples': 10228416, 'steps': 53272, 'loss/train': 1.71773099899292} -08/30/2021 22:49:29 - INFO - __main__ - Step 53274: {'lr': 0.0003659823086698666, 'samples': 10228608, 'steps': 53273, 'loss/train': 1.490798830986023} -08/30/2021 22:49:30 - INFO - __main__ - Step 53275: {'lr': 0.0003659776075461164, 'samples': 10228800, 'steps': 53274, 'loss/train': 1.0880540609359741} -08/30/2021 22:49:31 - INFO - __main__ - Step 53276: {'lr': 0.0003659729063701084, 'samples': 10228992, 'steps': 53275, 'loss/train': 1.42315673828125} -08/30/2021 22:49:31 - INFO - __main__ - Step 53277: {'lr': 0.00036596820514184485, 'samples': 10229184, 'steps': 53276, 'loss/train': 1.5079480409622192} -08/30/2021 22:49:32 - INFO - __main__ - Step 53278: {'lr': 0.00036596350386132784, 'samples': 10229376, 'steps': 53277, 'loss/train': 1.35906183719635} -08/30/2021 22:49:32 - INFO - __main__ - Step 53279: {'lr': 0.0003659588025285594, 'samples': 10229568, 'steps': 53278, 'loss/train': 1.203540325164795} -08/30/2021 22:49:33 - INFO - __main__ - Step 53280: {'lr': 0.0003659541011435418, 'samples': 10229760, 'steps': 53279, 'loss/train': 0.21066060662269592} -08/30/2021 22:49:34 - INFO - __main__ - Step 53281: {'lr': 0.00036594939970627704, 'samples': 10229952, 'steps': 53280, 'loss/train': 0.9715648889541626} -08/30/2021 22:49:34 - INFO - __main__ - Step 53282: {'lr': 0.0003659446982167672, 'samples': 10230144, 'steps': 53281, 'loss/train': 0.45380842685699463} -08/30/2021 22:49:35 - INFO - __main__ - Step 53283: {'lr': 0.00036593999667501457, 'samples': 10230336, 'steps': 53282, 'loss/train': 1.51667320728302} -08/30/2021 22:49:35 - INFO - __main__ - Step 53284: {'lr': 0.0003659352950810211, 'samples': 10230528, 'steps': 53283, 'loss/train': 1.5380358695983887} -08/30/2021 22:49:36 - INFO - __main__ - Step 53285: {'lr': 0.00036593059343478904, 'samples': 10230720, 'steps': 53284, 'loss/train': 1.4115374088287354} -08/30/2021 22:49:37 - INFO - __main__ - Step 53286: {'lr': 0.0003659258917363204, 'samples': 10230912, 'steps': 53285, 'loss/train': 1.128061056137085} -08/30/2021 22:49:37 - INFO - __main__ - Step 53287: {'lr': 0.0003659211899856173, 'samples': 10231104, 'steps': 53286, 'loss/train': 1.0784072875976562} -08/30/2021 22:49:37 - INFO - __main__ - Step 53288: {'lr': 0.0003659164881826819, 'samples': 10231296, 'steps': 53287, 'loss/train': 1.7698003053665161} -08/30/2021 22:49:38 - INFO - __main__ - Step 53289: {'lr': 0.00036591178632751635, 'samples': 10231488, 'steps': 53288, 'loss/train': 1.0029443502426147} -08/30/2021 22:49:40 - INFO - __main__ - Step 53290: {'lr': 0.00036590708442012275, 'samples': 10231680, 'steps': 53289, 'loss/train': 1.8331496715545654} -08/30/2021 22:49:40 - INFO - __main__ - Step 53291: {'lr': 0.0003659023824605033, 'samples': 10231872, 'steps': 53290, 'loss/train': 1.4333231449127197} -08/30/2021 22:49:41 - INFO - __main__ - Step 53292: {'lr': 0.0003658976804486599, 'samples': 10232064, 'steps': 53291, 'loss/train': 0.10715776681900024} -08/30/2021 22:49:41 - INFO - __main__ - Step 53293: {'lr': 0.0003658929783845948, 'samples': 10232256, 'steps': 53292, 'loss/train': 1.3528579473495483} -08/30/2021 22:49:41 - INFO - __main__ - Step 53294: {'lr': 0.0003658882762683101, 'samples': 10232448, 'steps': 53293, 'loss/train': 2.088239908218384} -08/30/2021 22:49:43 - INFO - __main__ - Step 53295: {'lr': 0.000365883574099808, 'samples': 10232640, 'steps': 53294, 'loss/train': 1.1306835412979126} -08/30/2021 22:49:43 - INFO - __main__ - Step 53296: {'lr': 0.00036587887187909045, 'samples': 10232832, 'steps': 53295, 'loss/train': 1.503839135169983} -08/30/2021 22:49:44 - INFO - __main__ - Step 53297: {'lr': 0.0003658741696061598, 'samples': 10233024, 'steps': 53296, 'loss/train': 1.6324217319488525} -08/30/2021 22:49:44 - INFO - __main__ - Step 53298: {'lr': 0.0003658694672810179, 'samples': 10233216, 'steps': 53297, 'loss/train': 1.487068772315979} -08/30/2021 22:49:44 - INFO - __main__ - Step 53299: {'lr': 0.00036586476490366713, 'samples': 10233408, 'steps': 53298, 'loss/train': 1.649052619934082} -08/30/2021 22:49:46 - INFO - __main__ - Step 53300: {'lr': 0.0003658600624741094, 'samples': 10233600, 'steps': 53299, 'loss/train': 0.8337749242782593} -08/30/2021 22:49:47 - INFO - __main__ - Step 53301: {'lr': 0.00036585535999234697, 'samples': 10233792, 'steps': 53300, 'loss/train': 1.2434320449829102} -08/30/2021 22:49:47 - INFO - __main__ - Step 53302: {'lr': 0.0003658506574583819, 'samples': 10233984, 'steps': 53301, 'loss/train': 1.61161208152771} -08/30/2021 22:49:47 - INFO - __main__ - Step 53303: {'lr': 0.0003658459548722163, 'samples': 10234176, 'steps': 53302, 'loss/train': 0.10066486150026321} -08/30/2021 22:49:48 - INFO - __main__ - Step 53304: {'lr': 0.00036584125223385224, 'samples': 10234368, 'steps': 53303, 'loss/train': 1.3928028345108032} -08/30/2021 22:49:49 - INFO - __main__ - Step 53305: {'lr': 0.0003658365495432919, 'samples': 10234560, 'steps': 53304, 'loss/train': 0.902204692363739} -08/30/2021 22:49:50 - INFO - __main__ - Step 53306: {'lr': 0.0003658318468005375, 'samples': 10234752, 'steps': 53305, 'loss/train': 1.4073790311813354} -08/30/2021 22:49:50 - INFO - __main__ - Step 53307: {'lr': 0.000365827144005591, 'samples': 10234944, 'steps': 53306, 'loss/train': 0.7341249585151672} -08/30/2021 22:49:50 - INFO - __main__ - Step 53308: {'lr': 0.0003658224411584545, 'samples': 10235136, 'steps': 53307, 'loss/train': 1.2515068054199219} -08/30/2021 22:49:51 - INFO - __main__ - Step 53309: {'lr': 0.0003658177382591303, 'samples': 10235328, 'steps': 53308, 'loss/train': 1.8078511953353882} -08/30/2021 22:49:51 - INFO - __main__ - Step 53310: {'lr': 0.0003658130353076204, 'samples': 10235520, 'steps': 53309, 'loss/train': 1.35354745388031} -08/30/2021 22:49:53 - INFO - __main__ - Step 53311: {'lr': 0.00036580833230392696, 'samples': 10235712, 'steps': 53310, 'loss/train': 1.947704792022705} -08/30/2021 22:49:54 - INFO - __main__ - Step 53312: {'lr': 0.00036580362924805204, 'samples': 10235904, 'steps': 53311, 'loss/train': 1.1198803186416626} -08/30/2021 22:49:54 - INFO - __main__ - Step 53313: {'lr': 0.0003657989261399978, 'samples': 10236096, 'steps': 53312, 'loss/train': 1.2369558811187744} -08/30/2021 22:49:54 - INFO - __main__ - Step 53314: {'lr': 0.0003657942229797663, 'samples': 10236288, 'steps': 53313, 'loss/train': 1.7686184644699097} -08/30/2021 22:49:55 - INFO - __main__ - Step 53315: {'lr': 0.00036578951976735973, 'samples': 10236480, 'steps': 53314, 'loss/train': 1.7382127046585083} -08/30/2021 22:49:57 - INFO - __main__ - Step 53316: {'lr': 0.00036578481650278023, 'samples': 10236672, 'steps': 53315, 'loss/train': 1.2438435554504395} -08/30/2021 22:49:57 - INFO - __main__ - Step 53317: {'lr': 0.0003657801131860299, 'samples': 10236864, 'steps': 53316, 'loss/train': 1.2964054346084595} -08/30/2021 22:49:57 - INFO - __main__ - Step 53318: {'lr': 0.0003657754098171108, 'samples': 10237056, 'steps': 53317, 'loss/train': 0.5095234513282776} -08/30/2021 22:49:58 - INFO - __main__ - Step 53319: {'lr': 0.0003657707063960251, 'samples': 10237248, 'steps': 53318, 'loss/train': 0.06290942430496216} -08/30/2021 22:49:58 - INFO - __main__ - Step 53320: {'lr': 0.00036576600292277477, 'samples': 10237440, 'steps': 53319, 'loss/train': 1.496840238571167} -08/30/2021 22:50:00 - INFO - __main__ - Step 53321: {'lr': 0.0003657612993973622, 'samples': 10237632, 'steps': 53320, 'loss/train': 0.04907238483428955} -08/30/2021 22:50:01 - INFO - __main__ - Step 53322: {'lr': 0.00036575659581978935, 'samples': 10237824, 'steps': 53321, 'loss/train': 1.3841993808746338} -08/30/2021 22:50:01 - INFO - __main__ - Step 53323: {'lr': 0.0003657518921900583, 'samples': 10238016, 'steps': 53322, 'loss/train': 1.1822389364242554} -08/30/2021 22:50:01 - INFO - __main__ - Step 53324: {'lr': 0.0003657471885081714, 'samples': 10238208, 'steps': 53323, 'loss/train': 1.4025685787200928} -08/30/2021 22:50:02 - INFO - __main__ - Step 53325: {'lr': 0.0003657424847741305, 'samples': 10238400, 'steps': 53324, 'loss/train': 0.6211552023887634} -08/30/2021 22:50:03 - INFO - __main__ - Step 53326: {'lr': 0.0003657377809879378, 'samples': 10238592, 'steps': 53325, 'loss/train': 0.05562727153301239} -08/30/2021 22:50:03 - INFO - __main__ - Step 53327: {'lr': 0.0003657330771495955, 'samples': 10238784, 'steps': 53326, 'loss/train': 1.2233649492263794} -08/30/2021 22:50:04 - INFO - __main__ - Step 53328: {'lr': 0.0003657283732591056, 'samples': 10238976, 'steps': 53327, 'loss/train': 0.9608726501464844} -08/30/2021 22:50:04 - INFO - __main__ - Step 53329: {'lr': 0.00036572366931647034, 'samples': 10239168, 'steps': 53328, 'loss/train': 1.360880732536316} -08/30/2021 22:50:05 - INFO - __main__ - Step 53330: {'lr': 0.0003657189653216918, 'samples': 10239360, 'steps': 53329, 'loss/train': 1.8871315717697144} -08/30/2021 22:50:05 - INFO - __main__ - Step 53331: {'lr': 0.000365714261274772, 'samples': 10239552, 'steps': 53330, 'loss/train': 0.4087035059928894} -08/30/2021 22:50:06 - INFO - __main__ - Step 53332: {'lr': 0.00036570955717571315, 'samples': 10239744, 'steps': 53331, 'loss/train': 1.1405770778656006} -08/30/2021 22:50:07 - INFO - __main__ - Step 53333: {'lr': 0.0003657048530245174, 'samples': 10239936, 'steps': 53332, 'loss/train': 1.3580645322799683} -08/30/2021 22:50:07 - INFO - __main__ - Step 53334: {'lr': 0.0003657001488211868, 'samples': 10240128, 'steps': 53333, 'loss/train': 1.4621342420578003} -08/30/2021 22:50:08 - INFO - __main__ - Step 53335: {'lr': 0.00036569544456572346, 'samples': 10240320, 'steps': 53334, 'loss/train': 1.2501530647277832} -08/30/2021 22:50:08 - INFO - __main__ - Step 53336: {'lr': 0.0003656907402581296, 'samples': 10240512, 'steps': 53335, 'loss/train': 1.380635142326355} -08/30/2021 22:50:09 - INFO - __main__ - Step 53337: {'lr': 0.00036568603589840734, 'samples': 10240704, 'steps': 53336, 'loss/train': 1.2424951791763306} -08/30/2021 22:50:10 - INFO - __main__ - Step 53338: {'lr': 0.00036568133148655855, 'samples': 10240896, 'steps': 53337, 'loss/train': 0.7611114382743835} -08/30/2021 22:50:10 - INFO - __main__ - Step 53339: {'lr': 0.0003656766270225857, 'samples': 10241088, 'steps': 53338, 'loss/train': 1.4231979846954346} -08/30/2021 22:50:11 - INFO - __main__ - Step 53340: {'lr': 0.00036567192250649066, 'samples': 10241280, 'steps': 53339, 'loss/train': 1.501531720161438} -08/30/2021 22:50:11 - INFO - __main__ - Step 53341: {'lr': 0.0003656672179382757, 'samples': 10241472, 'steps': 53340, 'loss/train': 1.5909029245376587} -08/30/2021 22:50:12 - INFO - __main__ - Step 53342: {'lr': 0.00036566251331794284, 'samples': 10241664, 'steps': 53341, 'loss/train': 1.3575444221496582} -08/30/2021 22:50:13 - INFO - __main__ - Step 53343: {'lr': 0.00036565780864549423, 'samples': 10241856, 'steps': 53342, 'loss/train': 0.8783314824104309} -08/30/2021 22:50:13 - INFO - __main__ - Step 53344: {'lr': 0.00036565310392093204, 'samples': 10242048, 'steps': 53343, 'loss/train': 0.6195229291915894} -08/30/2021 22:50:14 - INFO - __main__ - Step 53345: {'lr': 0.0003656483991442583, 'samples': 10242240, 'steps': 53344, 'loss/train': 0.7540102005004883} -08/30/2021 22:50:14 - INFO - __main__ - Step 53346: {'lr': 0.0003656436943154752, 'samples': 10242432, 'steps': 53345, 'loss/train': 1.4529738426208496} -08/30/2021 22:50:16 - INFO - __main__ - Step 53347: {'lr': 0.0003656389894345848, 'samples': 10242624, 'steps': 53346, 'loss/train': 1.165108323097229} -08/30/2021 22:50:16 - INFO - __main__ - Step 53348: {'lr': 0.0003656342845015893, 'samples': 10242816, 'steps': 53347, 'loss/train': 0.38638120889663696} -08/30/2021 22:50:17 - INFO - __main__ - Step 53349: {'lr': 0.00036562957951649075, 'samples': 10243008, 'steps': 53348, 'loss/train': 2.063819169998169} -08/30/2021 22:50:17 - INFO - __main__ - Step 53350: {'lr': 0.00036562487447929133, 'samples': 10243200, 'steps': 53349, 'loss/train': 1.6993876695632935} -08/30/2021 22:50:17 - INFO - __main__ - Step 53351: {'lr': 0.0003656201693899931, 'samples': 10243392, 'steps': 53350, 'loss/train': 1.561079978942871} -08/30/2021 22:50:18 - INFO - __main__ - Step 53352: {'lr': 0.0003656154642485982, 'samples': 10243584, 'steps': 53351, 'loss/train': 1.5431150197982788} -08/30/2021 22:50:19 - INFO - __main__ - Step 53353: {'lr': 0.00036561075905510874, 'samples': 10243776, 'steps': 53352, 'loss/train': 1.9697879552841187} -08/30/2021 22:50:20 - INFO - __main__ - Step 53354: {'lr': 0.00036560605380952686, 'samples': 10243968, 'steps': 53353, 'loss/train': 1.225656270980835} -08/30/2021 22:50:20 - INFO - __main__ - Step 53355: {'lr': 0.00036560134851185475, 'samples': 10244160, 'steps': 53354, 'loss/train': 1.7060719728469849} -08/30/2021 22:50:20 - INFO - __main__ - Step 53356: {'lr': 0.00036559664316209437, 'samples': 10244352, 'steps': 53355, 'loss/train': 2.1476950645446777} -08/30/2021 22:50:21 - INFO - __main__ - Step 53357: {'lr': 0.00036559193776024794, 'samples': 10244544, 'steps': 53356, 'loss/train': 1.9014744758605957} -08/30/2021 22:50:22 - INFO - __main__ - Step 53358: {'lr': 0.00036558723230631764, 'samples': 10244736, 'steps': 53357, 'loss/train': 1.180708885192871} -08/30/2021 22:50:23 - INFO - __main__ - Step 53359: {'lr': 0.00036558252680030546, 'samples': 10244928, 'steps': 53358, 'loss/train': 1.5608084201812744} -08/30/2021 22:50:23 - INFO - __main__ - Step 53360: {'lr': 0.0003655778212422135, 'samples': 10245120, 'steps': 53359, 'loss/train': 1.2837883234024048} -08/30/2021 22:50:23 - INFO - __main__ - Step 53361: {'lr': 0.0003655731156320441, 'samples': 10245312, 'steps': 53360, 'loss/train': 1.1438615322113037} -08/30/2021 22:50:24 - INFO - __main__ - Step 53362: {'lr': 0.00036556840996979914, 'samples': 10245504, 'steps': 53361, 'loss/train': 0.6098493337631226} -08/30/2021 22:50:26 - INFO - __main__ - Step 53363: {'lr': 0.0003655637042554809, 'samples': 10245696, 'steps': 53362, 'loss/train': 1.3798049688339233} -08/30/2021 22:50:26 - INFO - __main__ - Step 53364: {'lr': 0.0003655589984890914, 'samples': 10245888, 'steps': 53363, 'loss/train': 0.43864381313323975} -08/30/2021 22:50:26 - INFO - __main__ - Step 53365: {'lr': 0.00036555429267063277, 'samples': 10246080, 'steps': 53364, 'loss/train': 1.6588486433029175} -08/30/2021 22:50:27 - INFO - __main__ - Step 53366: {'lr': 0.0003655495868001072, 'samples': 10246272, 'steps': 53365, 'loss/train': 0.6482540965080261} -08/30/2021 22:50:27 - INFO - __main__ - Step 53367: {'lr': 0.00036554488087751674, 'samples': 10246464, 'steps': 53366, 'loss/train': 1.4537341594696045} -08/30/2021 22:50:29 - INFO - __main__ - Step 53368: {'lr': 0.00036554017490286354, 'samples': 10246656, 'steps': 53367, 'loss/train': 0.735163688659668} -08/30/2021 22:50:29 - INFO - __main__ - Step 53369: {'lr': 0.0003655354688761498, 'samples': 10246848, 'steps': 53368, 'loss/train': 1.0079963207244873} -08/30/2021 22:50:29 - INFO - __main__ - Step 53370: {'lr': 0.00036553076279737743, 'samples': 10247040, 'steps': 53369, 'loss/train': 2.027679204940796} -08/30/2021 22:50:30 - INFO - __main__ - Step 53371: {'lr': 0.0003655260566665488, 'samples': 10247232, 'steps': 53370, 'loss/train': 1.3684278726577759} -08/30/2021 22:50:30 - INFO - __main__ - Step 53372: {'lr': 0.0003655213504836659, 'samples': 10247424, 'steps': 53371, 'loss/train': 0.054646577686071396} -08/30/2021 22:50:32 - INFO - __main__ - Step 53373: {'lr': 0.00036551664424873084, 'samples': 10247616, 'steps': 53372, 'loss/train': 0.9775164723396301} -08/30/2021 22:50:32 - INFO - __main__ - Step 53374: {'lr': 0.00036551193796174577, 'samples': 10247808, 'steps': 53373, 'loss/train': 0.478732705116272} -08/30/2021 22:50:32 - INFO - __main__ - Step 53375: {'lr': 0.0003655072316227127, 'samples': 10248000, 'steps': 53374, 'loss/train': 1.375588059425354} -08/30/2021 22:50:33 - INFO - __main__ - Step 53376: {'lr': 0.000365502525231634, 'samples': 10248192, 'steps': 53375, 'loss/train': 1.2375893592834473} -08/30/2021 22:50:33 - INFO - __main__ - Step 53377: {'lr': 0.00036549781878851155, 'samples': 10248384, 'steps': 53376, 'loss/train': 1.5337711572647095} -08/30/2021 22:50:36 - INFO - __main__ - Step 53378: {'lr': 0.0003654931122933476, 'samples': 10248576, 'steps': 53377, 'loss/train': 0.7631622552871704} -08/30/2021 22:50:36 - INFO - __main__ - Step 53379: {'lr': 0.0003654884057461443, 'samples': 10248768, 'steps': 53378, 'loss/train': 0.9616112112998962} -08/30/2021 22:50:36 - INFO - __main__ - Step 53380: {'lr': 0.0003654836991469036, 'samples': 10248960, 'steps': 53379, 'loss/train': 1.5635032653808594} -08/30/2021 22:50:37 - INFO - __main__ - Step 53381: {'lr': 0.00036547899249562776, 'samples': 10249152, 'steps': 53380, 'loss/train': 1.335044503211975} -08/30/2021 22:50:37 - INFO - __main__ - Step 53382: {'lr': 0.00036547428579231886, 'samples': 10249344, 'steps': 53381, 'loss/train': 0.7292966246604919} -08/30/2021 22:50:38 - INFO - __main__ - Step 53383: {'lr': 0.000365469579036979, 'samples': 10249536, 'steps': 53382, 'loss/train': 0.7539511919021606} -08/30/2021 22:50:38 - INFO - __main__ - Step 53384: {'lr': 0.00036546487222961045, 'samples': 10249728, 'steps': 53383, 'loss/train': 0.9448441863059998} -08/30/2021 22:50:39 - INFO - __main__ - Step 53385: {'lr': 0.0003654601653702151, 'samples': 10249920, 'steps': 53384, 'loss/train': 1.141711711883545} -08/30/2021 22:50:40 - INFO - __main__ - Step 53386: {'lr': 0.0003654554584587952, 'samples': 10250112, 'steps': 53385, 'loss/train': 0.6322513222694397} -08/30/2021 22:50:40 - INFO - __main__ - Step 53387: {'lr': 0.0003654507514953529, 'samples': 10250304, 'steps': 53386, 'loss/train': 1.5990222692489624} -08/30/2021 22:50:41 - INFO - __main__ - Step 53388: {'lr': 0.0003654460444798902, 'samples': 10250496, 'steps': 53387, 'loss/train': 1.595096468925476} -08/30/2021 22:50:41 - INFO - __main__ - Step 53389: {'lr': 0.00036544133741240936, 'samples': 10250688, 'steps': 53388, 'loss/train': 1.534311294555664} -08/30/2021 22:50:42 - INFO - __main__ - Step 53390: {'lr': 0.0003654366302929124, 'samples': 10250880, 'steps': 53389, 'loss/train': 1.4573383331298828} -08/30/2021 22:50:43 - INFO - __main__ - Step 53391: {'lr': 0.0003654319231214015, 'samples': 10251072, 'steps': 53390, 'loss/train': 1.0705103874206543} -08/30/2021 22:50:43 - INFO - __main__ - Step 53392: {'lr': 0.00036542721589787877, 'samples': 10251264, 'steps': 53391, 'loss/train': 1.228500485420227} -08/30/2021 22:50:44 - INFO - __main__ - Step 53393: {'lr': 0.0003654225086223463, 'samples': 10251456, 'steps': 53392, 'loss/train': 1.6676151752471924} -08/30/2021 22:50:44 - INFO - __main__ - Step 53394: {'lr': 0.00036541780129480616, 'samples': 10251648, 'steps': 53393, 'loss/train': 1.5204026699066162} -08/30/2021 22:50:44 - INFO - __main__ - Step 53395: {'lr': 0.00036541309391526064, 'samples': 10251840, 'steps': 53394, 'loss/train': 0.040608614683151245} -08/30/2021 22:50:46 - INFO - __main__ - Step 53396: {'lr': 0.0003654083864837117, 'samples': 10252032, 'steps': 53395, 'loss/train': 0.45272374153137207} -08/30/2021 22:50:46 - INFO - __main__ - Step 53397: {'lr': 0.0003654036790001616, 'samples': 10252224, 'steps': 53396, 'loss/train': 1.3975297212600708} -08/30/2021 22:50:46 - INFO - __main__ - Step 53398: {'lr': 0.00036539897146461227, 'samples': 10252416, 'steps': 53397, 'loss/train': 0.8202672600746155} -08/30/2021 22:50:47 - INFO - __main__ - Step 53399: {'lr': 0.000365394263877066, 'samples': 10252608, 'steps': 53398, 'loss/train': 1.1654084920883179} -08/30/2021 22:50:47 - INFO - __main__ - Step 53400: {'lr': 0.0003653895562375248, 'samples': 10252800, 'steps': 53399, 'loss/train': 1.170444369316101} -08/30/2021 22:50:49 - INFO - __main__ - Step 53401: {'lr': 0.0003653848485459909, 'samples': 10252992, 'steps': 53400, 'loss/train': 1.4426257610321045} -08/30/2021 22:50:49 - INFO - __main__ - Step 53402: {'lr': 0.0003653801408024664, 'samples': 10253184, 'steps': 53401, 'loss/train': 1.434010624885559} -08/30/2021 22:50:49 - INFO - __main__ - Step 53403: {'lr': 0.00036537543300695335, 'samples': 10253376, 'steps': 53402, 'loss/train': 1.500929355621338} -08/30/2021 22:50:50 - INFO - __main__ - Step 53404: {'lr': 0.0003653707251594539, 'samples': 10253568, 'steps': 53403, 'loss/train': 1.3784416913986206} -08/30/2021 22:50:50 - INFO - __main__ - Step 53405: {'lr': 0.0003653660172599702, 'samples': 10253760, 'steps': 53404, 'loss/train': 1.2231831550598145} -08/30/2021 22:50:52 - INFO - __main__ - Step 53406: {'lr': 0.00036536130930850435, 'samples': 10253952, 'steps': 53405, 'loss/train': 1.5195879936218262} -08/30/2021 22:50:52 - INFO - __main__ - Step 53407: {'lr': 0.0003653566013050585, 'samples': 10254144, 'steps': 53406, 'loss/train': 0.8204035758972168} -08/30/2021 22:50:52 - INFO - __main__ - Step 53408: {'lr': 0.0003653518932496347, 'samples': 10254336, 'steps': 53407, 'loss/train': 0.37187647819519043} -08/30/2021 22:50:53 - INFO - __main__ - Step 53409: {'lr': 0.00036534718514223517, 'samples': 10254528, 'steps': 53408, 'loss/train': 1.2747961282730103} -08/30/2021 22:50:53 - INFO - __main__ - Step 53410: {'lr': 0.00036534247698286195, 'samples': 10254720, 'steps': 53409, 'loss/train': 0.8585013747215271} -08/30/2021 22:50:55 - INFO - __main__ - Step 53411: {'lr': 0.0003653377687715171, 'samples': 10254912, 'steps': 53410, 'loss/train': 1.2029095888137817} -08/30/2021 22:50:55 - INFO - __main__ - Step 53412: {'lr': 0.00036533306050820296, 'samples': 10255104, 'steps': 53411, 'loss/train': 1.298954725265503} -08/30/2021 22:50:56 - INFO - __main__ - Step 53413: {'lr': 0.00036532835219292147, 'samples': 10255296, 'steps': 53412, 'loss/train': 1.1649186611175537} -08/30/2021 22:50:56 - INFO - __main__ - Step 53414: {'lr': 0.0003653236438256748, 'samples': 10255488, 'steps': 53413, 'loss/train': 1.058119535446167} -08/30/2021 22:50:56 - INFO - __main__ - Step 53415: {'lr': 0.0003653189354064652, 'samples': 10255680, 'steps': 53414, 'loss/train': 0.74858158826828} -08/30/2021 22:50:57 - INFO - __main__ - Step 53416: {'lr': 0.0003653142269352945, 'samples': 10255872, 'steps': 53415, 'loss/train': 1.3596488237380981} -08/30/2021 22:50:58 - INFO - __main__ - Step 53417: {'lr': 0.00036530951841216505, 'samples': 10256064, 'steps': 53416, 'loss/train': 1.2551789283752441} -08/30/2021 22:50:59 - INFO - __main__ - Step 53418: {'lr': 0.00036530480983707885, 'samples': 10256256, 'steps': 53417, 'loss/train': 1.7117927074432373} -08/30/2021 22:50:59 - INFO - __main__ - Step 53419: {'lr': 0.0003653001012100382, 'samples': 10256448, 'steps': 53418, 'loss/train': 0.9548460841178894} -08/30/2021 22:50:59 - INFO - __main__ - Step 53420: {'lr': 0.00036529539253104507, 'samples': 10256640, 'steps': 53419, 'loss/train': 1.1545995473861694} -08/30/2021 22:51:00 - INFO - __main__ - Step 53421: {'lr': 0.00036529068380010155, 'samples': 10256832, 'steps': 53420, 'loss/train': 1.5638716220855713} -08/30/2021 22:51:02 - INFO - __main__ - Step 53422: {'lr': 0.00036528597501720984, 'samples': 10257024, 'steps': 53421, 'loss/train': 1.3269634246826172} -08/30/2021 22:51:02 - INFO - __main__ - Step 53423: {'lr': 0.00036528126618237206, 'samples': 10257216, 'steps': 53422, 'loss/train': 0.14268846809864044} -08/30/2021 22:51:03 - INFO - __main__ - Step 53424: {'lr': 0.00036527655729559036, 'samples': 10257408, 'steps': 53423, 'loss/train': 0.7545961141586304} -08/30/2021 22:51:03 - INFO - __main__ - Step 53425: {'lr': 0.0003652718483568668, 'samples': 10257600, 'steps': 53424, 'loss/train': 2.6051790714263916} -08/30/2021 22:51:03 - INFO - __main__ - Step 53426: {'lr': 0.00036526713936620354, 'samples': 10257792, 'steps': 53425, 'loss/train': 1.2532936334609985} -08/30/2021 22:51:05 - INFO - __main__ - Step 53427: {'lr': 0.00036526243032360264, 'samples': 10257984, 'steps': 53426, 'loss/train': 0.9665814638137817} -08/30/2021 22:51:05 - INFO - __main__ - Step 53428: {'lr': 0.0003652577212290663, 'samples': 10258176, 'steps': 53427, 'loss/train': 1.752152919769287} -08/30/2021 22:51:06 - INFO - __main__ - Step 53429: {'lr': 0.0003652530120825966, 'samples': 10258368, 'steps': 53428, 'loss/train': 1.6265177726745605} -08/30/2021 22:51:06 - INFO - __main__ - Step 53430: {'lr': 0.0003652483028841956, 'samples': 10258560, 'steps': 53429, 'loss/train': 1.3366334438323975} -08/30/2021 22:51:06 - INFO - __main__ - Step 53431: {'lr': 0.0003652435936338656, 'samples': 10258752, 'steps': 53430, 'loss/train': 1.371620535850525} -08/30/2021 22:51:08 - INFO - __main__ - Step 53432: {'lr': 0.00036523888433160864, 'samples': 10258944, 'steps': 53431, 'loss/train': 1.4021217823028564} -08/30/2021 22:51:08 - INFO - __main__ - Step 53433: {'lr': 0.00036523417497742673, 'samples': 10259136, 'steps': 53432, 'loss/train': 1.6641066074371338} -08/30/2021 22:51:09 - INFO - __main__ - Step 53434: {'lr': 0.00036522946557132206, 'samples': 10259328, 'steps': 53433, 'loss/train': 1.2567930221557617} -08/30/2021 22:51:09 - INFO - __main__ - Step 53435: {'lr': 0.00036522475611329685, 'samples': 10259520, 'steps': 53434, 'loss/train': 1.4252620935440063} -08/30/2021 22:51:09 - INFO - __main__ - Step 53436: {'lr': 0.00036522004660335304, 'samples': 10259712, 'steps': 53435, 'loss/train': 0.14292070269584656} -08/30/2021 22:51:11 - INFO - __main__ - Step 53437: {'lr': 0.000365215337041493, 'samples': 10259904, 'steps': 53436, 'loss/train': 1.4430783987045288} -08/30/2021 22:51:12 - INFO - __main__ - Step 53438: {'lr': 0.00036521062742771865, 'samples': 10260096, 'steps': 53437, 'loss/train': 1.1252435445785522} -08/30/2021 22:51:12 - INFO - __main__ - Step 53439: {'lr': 0.0003652059177620322, 'samples': 10260288, 'steps': 53438, 'loss/train': 1.7982990741729736} -08/30/2021 22:51:12 - INFO - __main__ - Step 53440: {'lr': 0.00036520120804443563, 'samples': 10260480, 'steps': 53439, 'loss/train': 1.3511203527450562} -08/30/2021 22:51:13 - INFO - __main__ - Step 53441: {'lr': 0.00036519649827493117, 'samples': 10260672, 'steps': 53440, 'loss/train': 0.39136233925819397} -08/30/2021 22:51:14 - INFO - __main__ - Step 53442: {'lr': 0.000365191788453521, 'samples': 10260864, 'steps': 53441, 'loss/train': 1.3825815916061401} -08/30/2021 22:51:15 - INFO - __main__ - Step 53443: {'lr': 0.0003651870785802072, 'samples': 10261056, 'steps': 53442, 'loss/train': 0.5633563995361328} -08/30/2021 22:51:15 - INFO - __main__ - Step 53444: {'lr': 0.00036518236865499187, 'samples': 10261248, 'steps': 53443, 'loss/train': 1.306609869003296} -08/30/2021 22:51:15 - INFO - __main__ - Step 53445: {'lr': 0.0003651776586778772, 'samples': 10261440, 'steps': 53444, 'loss/train': 1.2627437114715576} -08/30/2021 22:51:16 - INFO - __main__ - Step 53446: {'lr': 0.00036517294864886517, 'samples': 10261632, 'steps': 53445, 'loss/train': 0.8276983499526978} -08/30/2021 22:51:16 - INFO - __main__ - Step 53447: {'lr': 0.00036516823856795806, 'samples': 10261824, 'steps': 53446, 'loss/train': 1.5608497858047485} -08/30/2021 22:51:17 - INFO - __main__ - Step 53448: {'lr': 0.0003651635284351579, 'samples': 10262016, 'steps': 53447, 'loss/train': 1.156587839126587} -08/30/2021 22:51:18 - INFO - __main__ - Step 53449: {'lr': 0.00036515881825046676, 'samples': 10262208, 'steps': 53448, 'loss/train': 1.5529667139053345} -08/30/2021 22:51:18 - INFO - __main__ - Step 53450: {'lr': 0.00036515410801388686, 'samples': 10262400, 'steps': 53449, 'loss/train': 0.9423414468765259} -08/30/2021 22:51:19 - INFO - __main__ - Step 53451: {'lr': 0.0003651493977254204, 'samples': 10262592, 'steps': 53450, 'loss/train': 0.8619718551635742} -08/30/2021 22:51:20 - INFO - __main__ - Step 53452: {'lr': 0.0003651446873850693, 'samples': 10262784, 'steps': 53451, 'loss/train': 0.8839391469955444} -08/30/2021 22:51:21 - INFO - __main__ - Step 53453: {'lr': 0.0003651399769928358, 'samples': 10262976, 'steps': 53452, 'loss/train': 1.1584831476211548} -08/30/2021 22:51:21 - INFO - __main__ - Step 53454: {'lr': 0.000365135266548722, 'samples': 10263168, 'steps': 53453, 'loss/train': 1.6461392641067505} -08/30/2021 22:51:21 - INFO - __main__ - Step 53455: {'lr': 0.00036513055605273, 'samples': 10263360, 'steps': 53454, 'loss/train': 1.6310418844223022} -08/30/2021 22:51:22 - INFO - __main__ - Step 53456: {'lr': 0.0003651258455048619, 'samples': 10263552, 'steps': 53455, 'loss/train': 0.8739601969718933} -08/30/2021 22:51:22 - INFO - __main__ - Step 53457: {'lr': 0.00036512113490512, 'samples': 10263744, 'steps': 53456, 'loss/train': 1.4671311378479004} -08/30/2021 22:51:23 - INFO - __main__ - Step 53458: {'lr': 0.00036511642425350626, 'samples': 10263936, 'steps': 53457, 'loss/train': 0.11801846325397491} -08/30/2021 22:51:24 - INFO - __main__ - Step 53459: {'lr': 0.00036511171355002283, 'samples': 10264128, 'steps': 53458, 'loss/train': 0.5840108394622803} -08/30/2021 22:51:24 - INFO - __main__ - Step 53460: {'lr': 0.0003651070027946718, 'samples': 10264320, 'steps': 53459, 'loss/train': 1.3782750368118286} -08/30/2021 22:51:25 - INFO - __main__ - Step 53461: {'lr': 0.0003651022919874554, 'samples': 10264512, 'steps': 53460, 'loss/train': 1.2199827432632446} -08/30/2021 22:51:25 - INFO - __main__ - Step 53462: {'lr': 0.0003650975811283756, 'samples': 10264704, 'steps': 53461, 'loss/train': 1.2753008604049683} -08/30/2021 22:51:26 - INFO - __main__ - Step 53463: {'lr': 0.00036509287021743465, 'samples': 10264896, 'steps': 53462, 'loss/train': 1.5252403020858765} -08/30/2021 22:51:27 - INFO - __main__ - Step 53464: {'lr': 0.00036508815925463456, 'samples': 10265088, 'steps': 53463, 'loss/train': 0.8326263427734375} -08/30/2021 22:51:27 - INFO - __main__ - Step 53465: {'lr': 0.0003650834482399776, 'samples': 10265280, 'steps': 53464, 'loss/train': 0.8398168087005615} -08/30/2021 22:51:28 - INFO - __main__ - Step 53466: {'lr': 0.00036507873717346584, 'samples': 10265472, 'steps': 53465, 'loss/train': 1.22458815574646} -08/30/2021 22:51:28 - INFO - __main__ - Step 53467: {'lr': 0.00036507402605510134, 'samples': 10265664, 'steps': 53466, 'loss/train': 1.3852087259292603} -08/30/2021 22:51:30 - INFO - __main__ - Step 53468: {'lr': 0.00036506931488488627, 'samples': 10265856, 'steps': 53467, 'loss/train': 1.3797937631607056} -08/30/2021 22:51:30 - INFO - __main__ - Step 53469: {'lr': 0.0003650646036628227, 'samples': 10266048, 'steps': 53468, 'loss/train': 1.412377119064331} -08/30/2021 22:51:30 - INFO - __main__ - Step 53470: {'lr': 0.0003650598923889128, 'samples': 10266240, 'steps': 53469, 'loss/train': 0.08793564140796661} -08/30/2021 22:51:31 - INFO - __main__ - Step 53471: {'lr': 0.0003650551810631587, 'samples': 10266432, 'steps': 53470, 'loss/train': 1.978947401046753} -08/30/2021 22:51:31 - INFO - __main__ - Step 53472: {'lr': 0.00036505046968556253, 'samples': 10266624, 'steps': 53471, 'loss/train': 1.0977704524993896} -08/30/2021 22:51:33 - INFO - __main__ - Step 53473: {'lr': 0.0003650457582561264, 'samples': 10266816, 'steps': 53472, 'loss/train': 1.2934050559997559} -08/30/2021 22:51:34 - INFO - __main__ - Step 53474: {'lr': 0.0003650410467748524, 'samples': 10267008, 'steps': 53473, 'loss/train': 1.2697805166244507} -08/30/2021 22:51:34 - INFO - __main__ - Step 53475: {'lr': 0.0003650363352417427, 'samples': 10267200, 'steps': 53474, 'loss/train': 1.6234385967254639} -08/30/2021 22:51:35 - INFO - __main__ - Step 53476: {'lr': 0.00036503162365679936, 'samples': 10267392, 'steps': 53475, 'loss/train': 0.7800869941711426} -08/30/2021 22:51:35 - INFO - __main__ - Step 53477: {'lr': 0.00036502691202002456, 'samples': 10267584, 'steps': 53476, 'loss/train': 1.6124154329299927} -08/30/2021 22:51:35 - INFO - __main__ - Step 53478: {'lr': 0.00036502220033142045, 'samples': 10267776, 'steps': 53477, 'loss/train': 1.523951768875122} -08/30/2021 22:51:37 - INFO - __main__ - Step 53479: {'lr': 0.0003650174885909891, 'samples': 10267968, 'steps': 53478, 'loss/train': 1.639223337173462} -08/30/2021 22:51:38 - INFO - __main__ - Step 53480: {'lr': 0.0003650127767987326, 'samples': 10268160, 'steps': 53479, 'loss/train': 0.05455992743372917} -08/30/2021 22:51:38 - INFO - __main__ - Step 53481: {'lr': 0.00036500806495465315, 'samples': 10268352, 'steps': 53480, 'loss/train': 0.4502923786640167} -08/30/2021 22:51:38 - INFO - __main__ - Step 53482: {'lr': 0.0003650033530587529, 'samples': 10268544, 'steps': 53481, 'loss/train': 1.1247785091400146} -08/30/2021 22:51:39 - INFO - __main__ - Step 53483: {'lr': 0.00036499864111103384, 'samples': 10268736, 'steps': 53482, 'loss/train': 0.3981146812438965} -08/30/2021 22:51:40 - INFO - __main__ - Step 53484: {'lr': 0.00036499392911149817, 'samples': 10268928, 'steps': 53483, 'loss/train': 1.386189579963684} -08/30/2021 22:51:41 - INFO - __main__ - Step 53485: {'lr': 0.00036498921706014804, 'samples': 10269120, 'steps': 53484, 'loss/train': 1.434557318687439} -08/30/2021 22:51:41 - INFO - __main__ - Step 53486: {'lr': 0.00036498450495698557, 'samples': 10269312, 'steps': 53485, 'loss/train': 1.1038395166397095} -08/30/2021 22:51:41 - INFO - __main__ - Step 53487: {'lr': 0.00036497979280201276, 'samples': 10269504, 'steps': 53486, 'loss/train': 1.2938913106918335} -08/30/2021 22:51:42 - INFO - __main__ - Step 53488: {'lr': 0.0003649750805952319, 'samples': 10269696, 'steps': 53487, 'loss/train': 1.657962441444397} -08/30/2021 22:51:43 - INFO - __main__ - Step 53489: {'lr': 0.000364970368336645, 'samples': 10269888, 'steps': 53488, 'loss/train': 2.8993301391601562} -08/30/2021 22:51:44 - INFO - __main__ - Step 53490: {'lr': 0.0003649656560262542, 'samples': 10270080, 'steps': 53489, 'loss/train': 1.1926651000976562} -08/30/2021 22:51:44 - INFO - __main__ - Step 53491: {'lr': 0.00036496094366406166, 'samples': 10270272, 'steps': 53490, 'loss/train': 0.9238526225090027} -08/30/2021 22:51:45 - INFO - __main__ - Step 53492: {'lr': 0.0003649562312500696, 'samples': 10270464, 'steps': 53491, 'loss/train': 1.444689154624939} -08/30/2021 22:51:45 - INFO - __main__ - Step 53493: {'lr': 0.00036495151878427994, 'samples': 10270656, 'steps': 53492, 'loss/train': 1.4126598834991455} -08/30/2021 22:51:46 - INFO - __main__ - Step 53494: {'lr': 0.00036494680626669495, 'samples': 10270848, 'steps': 53493, 'loss/train': 1.0082255601882935} -08/30/2021 22:51:47 - INFO - __main__ - Step 53495: {'lr': 0.00036494209369731666, 'samples': 10271040, 'steps': 53494, 'loss/train': 0.8961471319198608} -08/30/2021 22:51:47 - INFO - __main__ - Step 53496: {'lr': 0.0003649373810761473, 'samples': 10271232, 'steps': 53495, 'loss/train': 0.65122389793396} -08/30/2021 22:51:48 - INFO - __main__ - Step 53497: {'lr': 0.00036493266840318886, 'samples': 10271424, 'steps': 53496, 'loss/train': 1.2869007587432861} -08/30/2021 22:51:48 - INFO - __main__ - Step 53498: {'lr': 0.0003649279556784436, 'samples': 10271616, 'steps': 53497, 'loss/train': 0.5302497744560242} -08/30/2021 22:51:49 - INFO - __main__ - Step 53499: {'lr': 0.0003649232429019135, 'samples': 10271808, 'steps': 53498, 'loss/train': 1.598929524421692} -08/30/2021 22:51:50 - INFO - __main__ - Step 53500: {'lr': 0.0003649185300736008, 'samples': 10272000, 'steps': 53499, 'loss/train': 1.7576169967651367} -08/30/2021 22:51:50 - INFO - __main__ - Step 53501: {'lr': 0.0003649138171935076, 'samples': 10272192, 'steps': 53500, 'loss/train': 1.0426875352859497} -08/30/2021 22:51:51 - INFO - __main__ - Step 53502: {'lr': 0.0003649091042616359, 'samples': 10272384, 'steps': 53501, 'loss/train': 1.349707007408142} -08/30/2021 22:51:51 - INFO - __main__ - Step 53503: {'lr': 0.000364904391277988, 'samples': 10272576, 'steps': 53502, 'loss/train': 1.4303089380264282} -08/30/2021 22:51:51 - INFO - __main__ - Step 53504: {'lr': 0.00036489967824256597, 'samples': 10272768, 'steps': 53503, 'loss/train': 3.495563507080078} -08/30/2021 22:51:53 - INFO - __main__ - Step 53505: {'lr': 0.000364894965155372, 'samples': 10272960, 'steps': 53504, 'loss/train': 1.4231292009353638} -08/30/2021 22:51:54 - INFO - __main__ - Step 53506: {'lr': 0.000364890252016408, 'samples': 10273152, 'steps': 53505, 'loss/train': 1.551091194152832} -08/30/2021 22:51:54 - INFO - __main__ - Step 53507: {'lr': 0.0003648855388256763, 'samples': 10273344, 'steps': 53506, 'loss/train': 1.722885012626648} -08/30/2021 22:51:54 - INFO - __main__ - Step 53508: {'lr': 0.0003648808255831789, 'samples': 10273536, 'steps': 53507, 'loss/train': 1.0195305347442627} -08/30/2021 22:51:55 - INFO - __main__ - Step 53509: {'lr': 0.00036487611228891805, 'samples': 10273728, 'steps': 53508, 'loss/train': 1.283014178276062} -08/30/2021 22:51:56 - INFO - __main__ - Step 53510: {'lr': 0.00036487139894289566, 'samples': 10273920, 'steps': 53509, 'loss/train': 1.020158052444458} -08/30/2021 22:51:57 - INFO - __main__ - Step 53511: {'lr': 0.0003648666855451141, 'samples': 10274112, 'steps': 53510, 'loss/train': 1.0939558744430542} -08/30/2021 22:51:57 - INFO - __main__ - Step 53512: {'lr': 0.0003648619720955754, 'samples': 10274304, 'steps': 53511, 'loss/train': 2.010610818862915} -08/30/2021 22:51:57 - INFO - __main__ - Step 53513: {'lr': 0.00036485725859428163, 'samples': 10274496, 'steps': 53512, 'loss/train': 1.1178526878356934} -08/30/2021 22:51:58 - INFO - __main__ - Step 53514: {'lr': 0.00036485254504123495, 'samples': 10274688, 'steps': 53513, 'loss/train': 1.5793871879577637} -08/30/2021 22:51:59 - INFO - __main__ - Step 53515: {'lr': 0.00036484783143643745, 'samples': 10274880, 'steps': 53514, 'loss/train': 1.0669639110565186} -08/30/2021 22:52:00 - INFO - __main__ - Step 53516: {'lr': 0.0003648431177798913, 'samples': 10275072, 'steps': 53515, 'loss/train': 2.1173694133758545} -08/30/2021 22:52:00 - INFO - __main__ - Step 53517: {'lr': 0.00036483840407159864, 'samples': 10275264, 'steps': 53516, 'loss/train': 1.7722991704940796} -08/30/2021 22:52:00 - INFO - __main__ - Step 53518: {'lr': 0.0003648336903115616, 'samples': 10275456, 'steps': 53517, 'loss/train': 1.443000078201294} -08/30/2021 22:52:01 - INFO - __main__ - Step 53519: {'lr': 0.0003648289764997823, 'samples': 10275648, 'steps': 53518, 'loss/train': 1.2102855443954468} -08/30/2021 22:52:02 - INFO - __main__ - Step 53520: {'lr': 0.00036482426263626265, 'samples': 10275840, 'steps': 53519, 'loss/train': 1.4799578189849854} -08/30/2021 22:52:03 - INFO - __main__ - Step 53521: {'lr': 0.0003648195487210051, 'samples': 10276032, 'steps': 53520, 'loss/train': 1.193872094154358} -08/30/2021 22:52:03 - INFO - __main__ - Step 53522: {'lr': 0.0003648148347540116, 'samples': 10276224, 'steps': 53521, 'loss/train': 1.3264586925506592} -08/30/2021 22:52:03 - INFO - __main__ - Step 53523: {'lr': 0.0003648101207352843, 'samples': 10276416, 'steps': 53522, 'loss/train': 1.4574564695358276} -08/30/2021 22:52:04 - INFO - __main__ - Step 53524: {'lr': 0.00036480540666482535, 'samples': 10276608, 'steps': 53523, 'loss/train': 1.1356863975524902} -08/30/2021 22:52:06 - INFO - __main__ - Step 53525: {'lr': 0.00036480069254263693, 'samples': 10276800, 'steps': 53524, 'loss/train': 0.6236507296562195} -08/30/2021 22:52:07 - INFO - __main__ - Step 53526: {'lr': 0.000364795978368721, 'samples': 10276992, 'steps': 53525, 'loss/train': 1.2939671277999878} -08/30/2021 22:52:07 - INFO - __main__ - Step 53527: {'lr': 0.0003647912641430798, 'samples': 10277184, 'steps': 53526, 'loss/train': 0.9056761264801025} -08/30/2021 22:52:07 - INFO - __main__ - Step 53528: {'lr': 0.0003647865498657154, 'samples': 10277376, 'steps': 53527, 'loss/train': 1.0268940925598145} -08/30/2021 22:52:08 - INFO - __main__ - Step 53529: {'lr': 0.0003647818355366299, 'samples': 10277568, 'steps': 53528, 'loss/train': 2.517875909805298} -08/30/2021 22:52:08 - INFO - __main__ - Step 53530: {'lr': 0.00036477712115582555, 'samples': 10277760, 'steps': 53529, 'loss/train': 1.992435336112976} -08/30/2021 22:52:10 - INFO - __main__ - Step 53531: {'lr': 0.0003647724067233044, 'samples': 10277952, 'steps': 53530, 'loss/train': 0.8576481938362122} -08/30/2021 22:52:10 - INFO - __main__ - Step 53532: {'lr': 0.00036476769223906864, 'samples': 10278144, 'steps': 53531, 'loss/train': 1.5434718132019043} -08/30/2021 22:52:11 - INFO - __main__ - Step 53533: {'lr': 0.0003647629777031202, 'samples': 10278336, 'steps': 53532, 'loss/train': 1.200901985168457} -08/30/2021 22:52:11 - INFO - __main__ - Step 53534: {'lr': 0.0003647582631154614, 'samples': 10278528, 'steps': 53533, 'loss/train': 1.8989466428756714} -08/30/2021 22:52:11 - INFO - __main__ - Step 53535: {'lr': 0.00036475354847609434, 'samples': 10278720, 'steps': 53534, 'loss/train': 1.4029427766799927} -08/30/2021 22:52:13 - INFO - __main__ - Step 53536: {'lr': 0.000364748833785021, 'samples': 10278912, 'steps': 53535, 'loss/train': 1.9528943300247192} -08/30/2021 22:52:13 - INFO - __main__ - Step 53537: {'lr': 0.0003647441190422437, 'samples': 10279104, 'steps': 53536, 'loss/train': 1.6159769296646118} -08/30/2021 22:52:14 - INFO - __main__ - Step 53538: {'lr': 0.00036473940424776443, 'samples': 10279296, 'steps': 53537, 'loss/train': 1.4012949466705322} -08/30/2021 22:52:14 - INFO - __main__ - Step 53539: {'lr': 0.0003647346894015853, 'samples': 10279488, 'steps': 53538, 'loss/train': 1.6042912006378174} -08/30/2021 22:52:14 - INFO - __main__ - Step 53540: {'lr': 0.0003647299745037085, 'samples': 10279680, 'steps': 53539, 'loss/train': 1.0776602029800415} -08/30/2021 22:52:16 - INFO - __main__ - Step 53541: {'lr': 0.00036472525955413626, 'samples': 10279872, 'steps': 53540, 'loss/train': 1.5056815147399902} -08/30/2021 22:52:16 - INFO - __main__ - Step 53542: {'lr': 0.00036472054455287053, 'samples': 10280064, 'steps': 53541, 'loss/train': 1.3808598518371582} -08/30/2021 22:52:17 - INFO - __main__ - Step 53543: {'lr': 0.00036471582949991347, 'samples': 10280256, 'steps': 53542, 'loss/train': 2.001156806945801} -08/30/2021 22:52:17 - INFO - __main__ - Step 53544: {'lr': 0.0003647111143952672, 'samples': 10280448, 'steps': 53543, 'loss/train': 1.7043068408966064} -08/30/2021 22:52:17 - INFO - __main__ - Step 53545: {'lr': 0.0003647063992389339, 'samples': 10280640, 'steps': 53544, 'loss/train': 1.573975682258606} -08/30/2021 22:52:19 - INFO - __main__ - Step 53546: {'lr': 0.00036470168403091567, 'samples': 10280832, 'steps': 53545, 'loss/train': 1.301865577697754} -08/30/2021 22:52:20 - INFO - __main__ - Step 53547: {'lr': 0.00036469696877121464, 'samples': 10281024, 'steps': 53546, 'loss/train': 1.6805670261383057} -08/30/2021 22:52:20 - INFO - __main__ - Step 53548: {'lr': 0.000364692253459833, 'samples': 10281216, 'steps': 53547, 'loss/train': 0.7505008578300476} -08/30/2021 22:52:20 - INFO - __main__ - Step 53549: {'lr': 0.0003646875380967727, 'samples': 10281408, 'steps': 53548, 'loss/train': 1.2794783115386963} -08/30/2021 22:52:21 - INFO - __main__ - Step 53550: {'lr': 0.00036468282268203595, 'samples': 10281600, 'steps': 53549, 'loss/train': 2.3715789318084717} -08/30/2021 22:52:21 - INFO - __main__ - Step 53551: {'lr': 0.0003646781072156249, 'samples': 10281792, 'steps': 53550, 'loss/train': 1.349063515663147} -08/30/2021 22:52:23 - INFO - __main__ - Step 53552: {'lr': 0.00036467339169754173, 'samples': 10281984, 'steps': 53551, 'loss/train': 0.6878082752227783} -08/30/2021 22:52:23 - INFO - __main__ - Step 53553: {'lr': 0.0003646686761277884, 'samples': 10282176, 'steps': 53552, 'loss/train': 1.3104041814804077} -08/30/2021 22:52:23 - INFO - __main__ - Step 53554: {'lr': 0.00036466396050636725, 'samples': 10282368, 'steps': 53553, 'loss/train': 1.3920091390609741} -08/30/2021 22:52:24 - INFO - __main__ - Step 53555: {'lr': 0.0003646592448332802, 'samples': 10282560, 'steps': 53554, 'loss/train': 0.8019581437110901} -08/30/2021 22:52:24 - INFO - __main__ - Step 53556: {'lr': 0.00036465452910852946, 'samples': 10282752, 'steps': 53555, 'loss/train': 1.3756120204925537} -08/30/2021 22:52:26 - INFO - __main__ - Step 53557: {'lr': 0.00036464981333211724, 'samples': 10282944, 'steps': 53556, 'loss/train': 1.5004515647888184} -08/30/2021 22:52:26 - INFO - __main__ - Step 53558: {'lr': 0.0003646450975040455, 'samples': 10283136, 'steps': 53557, 'loss/train': 1.5661299228668213} -08/30/2021 22:52:27 - INFO - __main__ - Step 53559: {'lr': 0.00036464038162431657, 'samples': 10283328, 'steps': 53558, 'loss/train': 1.9571486711502075} -08/30/2021 22:52:27 - INFO - __main__ - Step 53560: {'lr': 0.00036463566569293235, 'samples': 10283520, 'steps': 53559, 'loss/train': 1.5035619735717773} -08/30/2021 22:52:27 - INFO - __main__ - Step 53561: {'lr': 0.0003646309497098951, 'samples': 10283712, 'steps': 53560, 'loss/train': 1.8263338804244995} -08/30/2021 22:52:28 - INFO - __main__ - Step 53562: {'lr': 0.00036462623367520684, 'samples': 10283904, 'steps': 53561, 'loss/train': 1.520851731300354} -08/30/2021 22:52:29 - INFO - __main__ - Step 53563: {'lr': 0.00036462151758886985, 'samples': 10284096, 'steps': 53562, 'loss/train': 2.425801992416382} -08/30/2021 22:52:30 - INFO - __main__ - Step 53564: {'lr': 0.0003646168014508861, 'samples': 10284288, 'steps': 53563, 'loss/train': 1.1778380870819092} -08/30/2021 22:52:30 - INFO - __main__ - Step 53565: {'lr': 0.00036461208526125785, 'samples': 10284480, 'steps': 53564, 'loss/train': 1.2143785953521729} -08/30/2021 22:52:31 - INFO - __main__ - Step 53566: {'lr': 0.0003646073690199872, 'samples': 10284672, 'steps': 53565, 'loss/train': 1.1335147619247437} -08/30/2021 22:52:31 - INFO - __main__ - Step 53567: {'lr': 0.00036460265272707617, 'samples': 10284864, 'steps': 53566, 'loss/train': 1.2677206993103027} -08/30/2021 22:52:32 - INFO - __main__ - Step 53568: {'lr': 0.000364597936382527, 'samples': 10285056, 'steps': 53567, 'loss/train': 1.5351126194000244} -08/30/2021 22:52:33 - INFO - __main__ - Step 53569: {'lr': 0.0003645932199863417, 'samples': 10285248, 'steps': 53568, 'loss/train': 1.2966172695159912} -08/30/2021 22:52:33 - INFO - __main__ - Step 53570: {'lr': 0.00036458850353852246, 'samples': 10285440, 'steps': 53569, 'loss/train': 0.4543309807777405} -08/30/2021 22:52:33 - INFO - __main__ - Step 53571: {'lr': 0.0003645837870390715, 'samples': 10285632, 'steps': 53570, 'loss/train': 1.1566879749298096} -08/30/2021 22:52:34 - INFO - __main__ - Step 53572: {'lr': 0.00036457907048799084, 'samples': 10285824, 'steps': 53571, 'loss/train': 1.687994360923767} -08/30/2021 22:52:36 - INFO - __main__ - Step 53573: {'lr': 0.00036457435388528257, 'samples': 10286016, 'steps': 53572, 'loss/train': 0.6456499099731445} -08/30/2021 22:52:36 - INFO - __main__ - Step 53574: {'lr': 0.0003645696372309488, 'samples': 10286208, 'steps': 53573, 'loss/train': 1.6295289993286133} -08/30/2021 22:52:36 - INFO - __main__ - Step 53575: {'lr': 0.00036456492052499185, 'samples': 10286400, 'steps': 53574, 'loss/train': 1.1518089771270752} -08/30/2021 22:52:37 - INFO - __main__ - Step 53576: {'lr': 0.00036456020376741363, 'samples': 10286592, 'steps': 53575, 'loss/train': 1.277836561203003} -08/30/2021 22:52:37 - INFO - __main__ - Step 53577: {'lr': 0.0003645554869582164, 'samples': 10286784, 'steps': 53576, 'loss/train': 0.33677440881729126} -08/30/2021 22:52:37 - INFO - __main__ - Step 53578: {'lr': 0.0003645507700974022, 'samples': 10286976, 'steps': 53577, 'loss/train': 1.091191053390503} -08/30/2021 22:52:38 - INFO - __main__ - Step 53579: {'lr': 0.00036454605318497323, 'samples': 10287168, 'steps': 53578, 'loss/train': 1.3166148662567139} -08/30/2021 22:52:39 - INFO - __main__ - Step 53580: {'lr': 0.00036454133622093154, 'samples': 10287360, 'steps': 53579, 'loss/train': 0.6587302684783936} -08/30/2021 22:52:40 - INFO - __main__ - Step 53581: {'lr': 0.00036453661920527933, 'samples': 10287552, 'steps': 53580, 'loss/train': 1.1824767589569092} -08/30/2021 22:52:40 - INFO - __main__ - Step 53582: {'lr': 0.0003645319021380186, 'samples': 10287744, 'steps': 53581, 'loss/train': 1.2667876482009888} -08/30/2021 22:52:40 - INFO - __main__ - Step 53583: {'lr': 0.00036452718501915165, 'samples': 10287936, 'steps': 53582, 'loss/train': 0.3757949769496918} -08/30/2021 22:52:41 - INFO - __main__ - Step 53584: {'lr': 0.00036452246784868047, 'samples': 10288128, 'steps': 53583, 'loss/train': 0.5303133130073547} -08/30/2021 22:52:43 - INFO - __main__ - Step 53585: {'lr': 0.0003645177506266072, 'samples': 10288320, 'steps': 53584, 'loss/train': 1.7345420122146606} -08/30/2021 22:52:43 - INFO - __main__ - Step 53586: {'lr': 0.0003645130333529342, 'samples': 10288512, 'steps': 53585, 'loss/train': 1.2740157842636108} -08/30/2021 22:52:44 - INFO - __main__ - Step 53587: {'lr': 0.0003645083160276632, 'samples': 10288704, 'steps': 53586, 'loss/train': 1.4862607717514038} -08/30/2021 22:52:44 - INFO - __main__ - Step 53588: {'lr': 0.0003645035986507966, 'samples': 10288896, 'steps': 53587, 'loss/train': 1.404309630393982} -08/30/2021 22:52:44 - INFO - __main__ - Step 53589: {'lr': 0.00036449888122233636, 'samples': 10289088, 'steps': 53588, 'loss/train': 1.5585339069366455} -08/30/2021 22:52:46 - INFO - __main__ - Step 53590: {'lr': 0.00036449416374228474, 'samples': 10289280, 'steps': 53589, 'loss/train': 1.390363335609436} -08/30/2021 22:52:47 - INFO - __main__ - Step 53591: {'lr': 0.00036448944621064386, 'samples': 10289472, 'steps': 53590, 'loss/train': 2.0829086303710938} -08/30/2021 22:52:47 - INFO - __main__ - Step 53592: {'lr': 0.00036448472862741577, 'samples': 10289664, 'steps': 53591, 'loss/train': 1.330190658569336} -08/30/2021 22:52:47 - INFO - __main__ - Step 53593: {'lr': 0.0003644800109926026, 'samples': 10289856, 'steps': 53592, 'loss/train': 1.5439928770065308} -08/30/2021 22:52:48 - INFO - __main__ - Step 53594: {'lr': 0.00036447529330620653, 'samples': 10290048, 'steps': 53593, 'loss/train': 0.9738254547119141} -08/30/2021 22:52:49 - INFO - __main__ - Step 53595: {'lr': 0.0003644705755682296, 'samples': 10290240, 'steps': 53594, 'loss/train': 1.4617013931274414} -08/30/2021 22:52:50 - INFO - __main__ - Step 53596: {'lr': 0.00036446585777867406, 'samples': 10290432, 'steps': 53595, 'loss/train': 1.7266370058059692} -08/30/2021 22:52:50 - INFO - __main__ - Step 53597: {'lr': 0.0003644611399375419, 'samples': 10290624, 'steps': 53596, 'loss/train': 1.4301815032958984} -08/30/2021 22:52:50 - INFO - __main__ - Step 53598: {'lr': 0.0003644564220448354, 'samples': 10290816, 'steps': 53597, 'loss/train': 1.1844182014465332} -08/30/2021 22:52:51 - INFO - __main__ - Step 53599: {'lr': 0.0003644517041005566, 'samples': 10291008, 'steps': 53598, 'loss/train': 1.2154752016067505} -08/30/2021 22:52:52 - INFO - __main__ - Step 53600: {'lr': 0.0003644469861047076, 'samples': 10291200, 'steps': 53599, 'loss/train': 1.3206616640090942} -08/30/2021 22:52:53 - INFO - __main__ - Step 53601: {'lr': 0.0003644422680572906, 'samples': 10291392, 'steps': 53600, 'loss/train': 0.04915463551878929} -08/30/2021 22:52:53 - INFO - __main__ - Step 53602: {'lr': 0.00036443754995830763, 'samples': 10291584, 'steps': 53601, 'loss/train': 0.9714437127113342} -08/30/2021 22:52:53 - INFO - __main__ - Step 53603: {'lr': 0.0003644328318077609, 'samples': 10291776, 'steps': 53602, 'loss/train': 1.9094164371490479} -08/30/2021 22:52:54 - INFO - __main__ - Step 53604: {'lr': 0.0003644281136056524, 'samples': 10291968, 'steps': 53603, 'loss/train': 1.4263784885406494} -08/30/2021 22:52:55 - INFO - __main__ - Step 53605: {'lr': 0.00036442339535198444, 'samples': 10292160, 'steps': 53604, 'loss/train': 1.1671565771102905} -08/30/2021 22:52:56 - INFO - __main__ - Step 53606: {'lr': 0.00036441867704675913, 'samples': 10292352, 'steps': 53605, 'loss/train': 1.1522252559661865} -08/30/2021 22:52:56 - INFO - __main__ - Step 53607: {'lr': 0.00036441395868997843, 'samples': 10292544, 'steps': 53606, 'loss/train': 0.9276661276817322} -08/30/2021 22:52:56 - INFO - __main__ - Step 53608: {'lr': 0.00036440924028164457, 'samples': 10292736, 'steps': 53607, 'loss/train': 1.4873414039611816} -08/30/2021 22:52:57 - INFO - __main__ - Step 53609: {'lr': 0.0003644045218217597, 'samples': 10292928, 'steps': 53608, 'loss/train': 1.9295828342437744} -08/30/2021 22:52:57 - INFO - __main__ - Step 53610: {'lr': 0.000364399803310326, 'samples': 10293120, 'steps': 53609, 'loss/train': 1.6021238565444946} -08/30/2021 22:52:59 - INFO - __main__ - Step 53611: {'lr': 0.0003643950847473453, 'samples': 10293312, 'steps': 53610, 'loss/train': 1.492674708366394} -08/30/2021 22:52:59 - INFO - __main__ - Step 53612: {'lr': 0.0003643903661328201, 'samples': 10293504, 'steps': 53611, 'loss/train': 0.8950345516204834} -08/30/2021 22:52:59 - INFO - __main__ - Step 53613: {'lr': 0.0003643856474667524, 'samples': 10293696, 'steps': 53612, 'loss/train': 1.5756936073303223} -08/30/2021 22:53:00 - INFO - __main__ - Step 53614: {'lr': 0.0003643809287491442, 'samples': 10293888, 'steps': 53613, 'loss/train': 2.132282257080078} -08/30/2021 22:53:00 - INFO - __main__ - Step 53615: {'lr': 0.00036437620997999777, 'samples': 10294080, 'steps': 53614, 'loss/train': 1.177676796913147} -08/30/2021 22:53:02 - INFO - __main__ - Step 53616: {'lr': 0.0003643714911593151, 'samples': 10294272, 'steps': 53615, 'loss/train': 1.4318127632141113} -08/30/2021 22:53:02 - INFO - __main__ - Step 53617: {'lr': 0.00036436677228709845, 'samples': 10294464, 'steps': 53616, 'loss/train': 1.320518970489502} -08/30/2021 22:53:02 - INFO - __main__ - Step 53618: {'lr': 0.00036436205336334995, 'samples': 10294656, 'steps': 53617, 'loss/train': 1.4042026996612549} -08/30/2021 22:53:03 - INFO - __main__ - Step 53619: {'lr': 0.0003643573343880716, 'samples': 10294848, 'steps': 53618, 'loss/train': 1.5927362442016602} -08/30/2021 22:53:03 - INFO - __main__ - Step 53620: {'lr': 0.00036435261536126566, 'samples': 10295040, 'steps': 53619, 'loss/train': 1.2768652439117432} -08/30/2021 22:53:05 - INFO - __main__ - Step 53621: {'lr': 0.0003643478962829342, 'samples': 10295232, 'steps': 53620, 'loss/train': 1.4479957818984985} -08/30/2021 22:53:05 - INFO - __main__ - Step 53622: {'lr': 0.0003643431771530793, 'samples': 10295424, 'steps': 53621, 'loss/train': 0.927509069442749} -08/30/2021 22:53:05 - INFO - __main__ - Step 53623: {'lr': 0.0003643384579717031, 'samples': 10295616, 'steps': 53622, 'loss/train': 1.726568579673767} -08/30/2021 22:53:06 - INFO - __main__ - Step 53624: {'lr': 0.0003643337387388078, 'samples': 10295808, 'steps': 53623, 'loss/train': 1.381607174873352} -08/30/2021 22:53:06 - INFO - __main__ - Step 53625: {'lr': 0.00036432901945439544, 'samples': 10296000, 'steps': 53624, 'loss/train': 1.8157492876052856} -08/30/2021 22:53:08 - INFO - __main__ - Step 53626: {'lr': 0.0003643243001184683, 'samples': 10296192, 'steps': 53625, 'loss/train': 0.9247584939002991} -08/30/2021 22:53:08 - INFO - __main__ - Step 53627: {'lr': 0.00036431958073102825, 'samples': 10296384, 'steps': 53626, 'loss/train': 1.437009334564209} -08/30/2021 22:53:08 - INFO - __main__ - Step 53628: {'lr': 0.00036431486129207767, 'samples': 10296576, 'steps': 53627, 'loss/train': 1.3408094644546509} -08/30/2021 22:53:09 - INFO - __main__ - Step 53629: {'lr': 0.00036431014180161853, 'samples': 10296768, 'steps': 53628, 'loss/train': 1.5201278924942017} -08/30/2021 22:53:09 - INFO - __main__ - Step 53630: {'lr': 0.000364305422259653, 'samples': 10296960, 'steps': 53629, 'loss/train': 1.462058424949646} -08/30/2021 22:53:11 - INFO - __main__ - Step 53631: {'lr': 0.0003643007026661832, 'samples': 10297152, 'steps': 53630, 'loss/train': 1.388784646987915} -08/30/2021 22:53:11 - INFO - __main__ - Step 53632: {'lr': 0.0003642959830212113, 'samples': 10297344, 'steps': 53631, 'loss/train': 0.9494279623031616} -08/30/2021 22:53:12 - INFO - __main__ - Step 53633: {'lr': 0.0003642912633247394, 'samples': 10297536, 'steps': 53632, 'loss/train': 1.1987769603729248} -08/30/2021 22:53:12 - INFO - __main__ - Step 53634: {'lr': 0.0003642865435767696, 'samples': 10297728, 'steps': 53633, 'loss/train': 2.458717107772827} -08/30/2021 22:53:12 - INFO - __main__ - Step 53635: {'lr': 0.00036428182377730407, 'samples': 10297920, 'steps': 53634, 'loss/train': 1.3919092416763306} -08/30/2021 22:53:13 - INFO - __main__ - Step 53636: {'lr': 0.00036427710392634483, 'samples': 10298112, 'steps': 53635, 'loss/train': 0.031980302184820175} -08/30/2021 22:53:15 - INFO - __main__ - Step 53637: {'lr': 0.0003642723840238942, 'samples': 10298304, 'steps': 53636, 'loss/train': 1.202775001525879} -08/30/2021 22:53:16 - INFO - __main__ - Step 53638: {'lr': 0.0003642676640699542, 'samples': 10298496, 'steps': 53637, 'loss/train': 1.4996012449264526} -08/30/2021 22:53:16 - INFO - __main__ - Step 53639: {'lr': 0.0003642629440645269, 'samples': 10298688, 'steps': 53638, 'loss/train': 1.7215982675552368} -08/30/2021 22:53:16 - INFO - __main__ - Step 53640: {'lr': 0.00036425822400761444, 'samples': 10298880, 'steps': 53639, 'loss/train': 1.4854384660720825} -08/30/2021 22:53:17 - INFO - __main__ - Step 53641: {'lr': 0.000364253503899219, 'samples': 10299072, 'steps': 53640, 'loss/train': 1.1110572814941406} -08/30/2021 22:53:18 - INFO - __main__ - Step 53642: {'lr': 0.00036424878373934275, 'samples': 10299264, 'steps': 53641, 'loss/train': 1.4678090810775757} -08/30/2021 22:53:19 - INFO - __main__ - Step 53643: {'lr': 0.0003642440635279877, 'samples': 10299456, 'steps': 53642, 'loss/train': 1.320936679840088} -08/30/2021 22:53:19 - INFO - __main__ - Step 53644: {'lr': 0.0003642393432651561, 'samples': 10299648, 'steps': 53643, 'loss/train': 2.0022051334381104} -08/30/2021 22:53:19 - INFO - __main__ - Step 53645: {'lr': 0.00036423462295085, 'samples': 10299840, 'steps': 53644, 'loss/train': 0.9051774740219116} -08/30/2021 22:53:20 - INFO - __main__ - Step 53646: {'lr': 0.00036422990258507155, 'samples': 10300032, 'steps': 53645, 'loss/train': 0.39250320196151733} -08/30/2021 22:53:21 - INFO - __main__ - Step 53647: {'lr': 0.00036422518216782285, 'samples': 10300224, 'steps': 53646, 'loss/train': 1.6496013402938843} -08/30/2021 22:53:22 - INFO - __main__ - Step 53648: {'lr': 0.00036422046169910604, 'samples': 10300416, 'steps': 53647, 'loss/train': 1.0909745693206787} -08/30/2021 22:53:22 - INFO - __main__ - Step 53649: {'lr': 0.00036421574117892323, 'samples': 10300608, 'steps': 53648, 'loss/train': 0.055397044867277145} -08/30/2021 22:53:23 - INFO - __main__ - Step 53650: {'lr': 0.0003642110206072766, 'samples': 10300800, 'steps': 53649, 'loss/train': 0.6435099244117737} -08/30/2021 22:53:23 - INFO - __main__ - Step 53651: {'lr': 0.0003642062999841682, 'samples': 10300992, 'steps': 53650, 'loss/train': 1.5886059999465942} -08/30/2021 22:53:24 - INFO - __main__ - Step 53652: {'lr': 0.00036420157930960027, 'samples': 10301184, 'steps': 53651, 'loss/train': 0.5165435075759888} -08/30/2021 22:53:25 - INFO - __main__ - Step 53653: {'lr': 0.00036419685858357485, 'samples': 10301376, 'steps': 53652, 'loss/train': 1.1679151058197021} -08/30/2021 22:53:25 - INFO - __main__ - Step 53654: {'lr': 0.0003641921378060941, 'samples': 10301568, 'steps': 53653, 'loss/train': 1.5994067192077637} -08/30/2021 22:53:25 - INFO - __main__ - Step 53655: {'lr': 0.00036418741697716013, 'samples': 10301760, 'steps': 53654, 'loss/train': 0.8237423896789551} -08/30/2021 22:53:26 - INFO - __main__ - Step 53656: {'lr': 0.00036418269609677506, 'samples': 10301952, 'steps': 53655, 'loss/train': 1.3924806118011475} -08/30/2021 22:53:27 - INFO - __main__ - Step 53657: {'lr': 0.000364177975164941, 'samples': 10302144, 'steps': 53656, 'loss/train': 0.8165030479431152} -08/30/2021 22:53:28 - INFO - __main__ - Step 53658: {'lr': 0.0003641732541816601, 'samples': 10302336, 'steps': 53657, 'loss/train': 1.3477058410644531} -08/30/2021 22:53:28 - INFO - __main__ - Step 53659: {'lr': 0.0003641685331469346, 'samples': 10302528, 'steps': 53658, 'loss/train': 1.491005539894104} -08/30/2021 22:53:28 - INFO - __main__ - Step 53660: {'lr': 0.0003641638120607665, 'samples': 10302720, 'steps': 53659, 'loss/train': 1.7326476573944092} -08/30/2021 22:53:29 - INFO - __main__ - Step 53661: {'lr': 0.00036415909092315786, 'samples': 10302912, 'steps': 53660, 'loss/train': 0.343622624874115} -08/30/2021 22:53:29 - INFO - __main__ - Step 53662: {'lr': 0.00036415436973411095, 'samples': 10303104, 'steps': 53661, 'loss/train': 1.4072625637054443} -08/30/2021 22:53:31 - INFO - __main__ - Step 53663: {'lr': 0.0003641496484936278, 'samples': 10303296, 'steps': 53662, 'loss/train': 0.9885417819023132} -08/30/2021 22:53:31 - INFO - __main__ - Step 53664: {'lr': 0.0003641449272017106, 'samples': 10303488, 'steps': 53663, 'loss/train': 0.91515052318573} -08/30/2021 22:53:32 - INFO - __main__ - Step 53665: {'lr': 0.00036414020585836144, 'samples': 10303680, 'steps': 53664, 'loss/train': 1.0116825103759766} -08/30/2021 22:53:32 - INFO - __main__ - Step 53666: {'lr': 0.00036413548446358255, 'samples': 10303872, 'steps': 53665, 'loss/train': 0.559353232383728} -08/30/2021 22:53:32 - INFO - __main__ - Step 53667: {'lr': 0.0003641307630173759, 'samples': 10304064, 'steps': 53666, 'loss/train': 1.0364325046539307} -08/30/2021 22:53:34 - INFO - __main__ - Step 53668: {'lr': 0.0003641260415197437, 'samples': 10304256, 'steps': 53667, 'loss/train': 1.8374452590942383} -08/30/2021 22:53:34 - INFO - __main__ - Step 53669: {'lr': 0.0003641213199706881, 'samples': 10304448, 'steps': 53668, 'loss/train': 1.1233552694320679} -08/30/2021 22:53:35 - INFO - __main__ - Step 53670: {'lr': 0.0003641165983702111, 'samples': 10304640, 'steps': 53669, 'loss/train': 1.882941722869873} -08/30/2021 22:53:35 - INFO - __main__ - Step 53671: {'lr': 0.000364111876718315, 'samples': 10304832, 'steps': 53670, 'loss/train': 0.7725663185119629} -08/30/2021 22:53:36 - INFO - __main__ - Step 53672: {'lr': 0.0003641071550150019, 'samples': 10305024, 'steps': 53671, 'loss/train': 0.8464277386665344} -08/30/2021 22:53:36 - INFO - __main__ - Step 53673: {'lr': 0.00036410243326027373, 'samples': 10305216, 'steps': 53672, 'loss/train': 1.7000603675842285} -08/30/2021 22:53:38 - INFO - __main__ - Step 53674: {'lr': 0.0003640977114541328, 'samples': 10305408, 'steps': 53673, 'loss/train': 1.5568926334381104} -08/30/2021 22:53:38 - INFO - __main__ - Step 53675: {'lr': 0.0003640929895965813, 'samples': 10305600, 'steps': 53674, 'loss/train': 0.826578676700592} -08/30/2021 22:53:39 - INFO - __main__ - Step 53676: {'lr': 0.0003640882676876212, 'samples': 10305792, 'steps': 53675, 'loss/train': 1.554081678390503} -08/30/2021 22:53:39 - INFO - __main__ - Step 53677: {'lr': 0.0003640835457272547, 'samples': 10305984, 'steps': 53676, 'loss/train': 1.6683779954910278} -08/30/2021 22:53:39 - INFO - __main__ - Step 53678: {'lr': 0.00036407882371548394, 'samples': 10306176, 'steps': 53677, 'loss/train': 1.8408193588256836} -08/30/2021 22:53:41 - INFO - __main__ - Step 53679: {'lr': 0.00036407410165231096, 'samples': 10306368, 'steps': 53678, 'loss/train': 0.4423947334289551} -08/30/2021 22:53:41 - INFO - __main__ - Step 53680: {'lr': 0.000364069379537738, 'samples': 10306560, 'steps': 53679, 'loss/train': 1.6478915214538574} -08/30/2021 22:53:42 - INFO - __main__ - Step 53681: {'lr': 0.0003640646573717671, 'samples': 10306752, 'steps': 53680, 'loss/train': 1.6639094352722168} -08/30/2021 22:53:42 - INFO - __main__ - Step 53682: {'lr': 0.00036405993515440044, 'samples': 10306944, 'steps': 53681, 'loss/train': 0.8151056170463562} -08/30/2021 22:53:42 - INFO - __main__ - Step 53683: {'lr': 0.0003640552128856401, 'samples': 10307136, 'steps': 53682, 'loss/train': 1.445812702178955} -08/30/2021 22:53:44 - INFO - __main__ - Step 53684: {'lr': 0.00036405049056548834, 'samples': 10307328, 'steps': 53683, 'loss/train': 1.7645049095153809} -08/30/2021 22:53:45 - INFO - __main__ - Step 53685: {'lr': 0.0003640457681939471, 'samples': 10307520, 'steps': 53684, 'loss/train': 1.2873436212539673} -08/30/2021 22:53:45 - INFO - __main__ - Step 53686: {'lr': 0.0003640410457710186, 'samples': 10307712, 'steps': 53685, 'loss/train': 1.4765723943710327} -08/30/2021 22:53:45 - INFO - __main__ - Step 53687: {'lr': 0.000364036323296705, 'samples': 10307904, 'steps': 53686, 'loss/train': 1.4670441150665283} -08/30/2021 22:53:46 - INFO - __main__ - Step 53688: {'lr': 0.0003640316007710084, 'samples': 10308096, 'steps': 53687, 'loss/train': 1.1963099241256714} -08/30/2021 22:53:46 - INFO - __main__ - Step 53689: {'lr': 0.0003640268781939309, 'samples': 10308288, 'steps': 53688, 'loss/train': 1.2051911354064941} -08/30/2021 22:53:48 - INFO - __main__ - Step 53690: {'lr': 0.0003640221555654747, 'samples': 10308480, 'steps': 53689, 'loss/train': 0.9849037528038025} -08/30/2021 22:53:48 - INFO - __main__ - Step 53691: {'lr': 0.0003640174328856418, 'samples': 10308672, 'steps': 53690, 'loss/train': 1.4371440410614014} -08/30/2021 22:53:48 - INFO - __main__ - Step 53692: {'lr': 0.0003640127101544344, 'samples': 10308864, 'steps': 53691, 'loss/train': 1.3826385736465454} -08/30/2021 22:53:49 - INFO - __main__ - Step 53693: {'lr': 0.00036400798737185465, 'samples': 10309056, 'steps': 53692, 'loss/train': 1.2004871368408203} -08/30/2021 22:53:49 - INFO - __main__ - Step 53694: {'lr': 0.0003640032645379047, 'samples': 10309248, 'steps': 53693, 'loss/train': 0.4266481399536133} -08/30/2021 22:53:51 - INFO - __main__ - Step 53695: {'lr': 0.0003639985416525866, 'samples': 10309440, 'steps': 53694, 'loss/train': 1.4924750328063965} -08/30/2021 22:53:52 - INFO - __main__ - Step 53696: {'lr': 0.00036399381871590254, 'samples': 10309632, 'steps': 53695, 'loss/train': 0.5292871594429016} -08/30/2021 22:53:52 - INFO - __main__ - Step 53697: {'lr': 0.0003639890957278546, 'samples': 10309824, 'steps': 53696, 'loss/train': 1.360403060913086} -08/30/2021 22:53:52 - INFO - __main__ - Step 53698: {'lr': 0.0003639843726884449, 'samples': 10310016, 'steps': 53697, 'loss/train': 1.595663070678711} -08/30/2021 22:53:53 - INFO - __main__ - Step 53699: {'lr': 0.0003639796495976757, 'samples': 10310208, 'steps': 53698, 'loss/train': 1.8290520906448364} -08/30/2021 22:53:55 - INFO - __main__ - Step 53700: {'lr': 0.000363974926455549, 'samples': 10310400, 'steps': 53699, 'loss/train': 1.1834489107131958} -08/30/2021 22:53:55 - INFO - __main__ - Step 53701: {'lr': 0.0003639702032620669, 'samples': 10310592, 'steps': 53700, 'loss/train': 1.1344308853149414} -08/30/2021 22:53:55 - INFO - __main__ - Step 53702: {'lr': 0.00036396548001723164, 'samples': 10310784, 'steps': 53701, 'loss/train': 1.1612474918365479} -08/30/2021 22:53:56 - INFO - __main__ - Step 53703: {'lr': 0.00036396075672104523, 'samples': 10310976, 'steps': 53702, 'loss/train': 1.5016802549362183} -08/30/2021 22:53:56 - INFO - __main__ - Step 53704: {'lr': 0.00036395603337350987, 'samples': 10311168, 'steps': 53703, 'loss/train': 0.2191607803106308} -08/30/2021 22:53:58 - INFO - __main__ - Step 53705: {'lr': 0.0003639513099746277, 'samples': 10311360, 'steps': 53704, 'loss/train': 1.7161669731140137} -08/30/2021 22:53:58 - INFO - __main__ - Step 53706: {'lr': 0.0003639465865244008, 'samples': 10311552, 'steps': 53705, 'loss/train': 0.9623885750770569} -08/30/2021 22:53:59 - INFO - __main__ - Step 53707: {'lr': 0.0003639418630228314, 'samples': 10311744, 'steps': 53706, 'loss/train': 0.3749837279319763} -08/30/2021 22:53:59 - INFO - __main__ - Step 53708: {'lr': 0.00036393713946992156, 'samples': 10311936, 'steps': 53707, 'loss/train': 1.331856369972229} -08/30/2021 22:53:59 - INFO - __main__ - Step 53709: {'lr': 0.0003639324158656733, 'samples': 10312128, 'steps': 53708, 'loss/train': 1.3522496223449707} -08/30/2021 22:54:01 - INFO - __main__ - Step 53710: {'lr': 0.00036392769221008895, 'samples': 10312320, 'steps': 53709, 'loss/train': 1.4969886541366577} -08/30/2021 22:54:02 - INFO - __main__ - Step 53711: {'lr': 0.0003639229685031705, 'samples': 10312512, 'steps': 53710, 'loss/train': 1.0851818323135376} -08/30/2021 22:54:02 - INFO - __main__ - Step 53712: {'lr': 0.0003639182447449201, 'samples': 10312704, 'steps': 53711, 'loss/train': 1.4043091535568237} -08/30/2021 22:54:02 - INFO - __main__ - Step 53713: {'lr': 0.00036391352093533995, 'samples': 10312896, 'steps': 53712, 'loss/train': 1.6672462224960327} -08/30/2021 22:54:03 - INFO - __main__ - Step 53714: {'lr': 0.0003639087970744321, 'samples': 10313088, 'steps': 53713, 'loss/train': 1.19981050491333} -08/30/2021 22:54:03 - INFO - __main__ - Step 53715: {'lr': 0.00036390407316219865, 'samples': 10313280, 'steps': 53714, 'loss/train': 1.2523813247680664} -08/30/2021 22:54:04 - INFO - __main__ - Step 53716: {'lr': 0.0003638993491986419, 'samples': 10313472, 'steps': 53715, 'loss/train': 1.0711724758148193} -08/30/2021 22:54:05 - INFO - __main__ - Step 53717: {'lr': 0.0003638946251837637, 'samples': 10313664, 'steps': 53716, 'loss/train': 0.2546384632587433} -08/30/2021 22:54:05 - INFO - __main__ - Step 53718: {'lr': 0.0003638899011175664, 'samples': 10313856, 'steps': 53717, 'loss/train': 1.007988452911377} -08/30/2021 22:54:06 - INFO - __main__ - Step 53719: {'lr': 0.00036388517700005214, 'samples': 10314048, 'steps': 53718, 'loss/train': 2.3122098445892334} -08/30/2021 22:54:06 - INFO - __main__ - Step 53720: {'lr': 0.00036388045283122295, 'samples': 10314240, 'steps': 53719, 'loss/train': 1.3735408782958984} -08/30/2021 22:54:07 - INFO - __main__ - Step 53721: {'lr': 0.00036387572861108097, 'samples': 10314432, 'steps': 53720, 'loss/train': 1.0783125162124634} -08/30/2021 22:54:08 - INFO - __main__ - Step 53722: {'lr': 0.0003638710043396283, 'samples': 10314624, 'steps': 53721, 'loss/train': 1.3310192823410034} -08/30/2021 22:54:08 - INFO - __main__ - Step 53723: {'lr': 0.0003638662800168672, 'samples': 10314816, 'steps': 53722, 'loss/train': 1.37336003780365} -08/30/2021 22:54:09 - INFO - __main__ - Step 53724: {'lr': 0.00036386155564279967, 'samples': 10315008, 'steps': 53723, 'loss/train': 1.2942947149276733} -08/30/2021 22:54:09 - INFO - __main__ - Step 53725: {'lr': 0.00036385683121742786, 'samples': 10315200, 'steps': 53724, 'loss/train': 1.5524836778640747} -08/30/2021 22:54:11 - INFO - __main__ - Step 53726: {'lr': 0.00036385210674075394, 'samples': 10315392, 'steps': 53725, 'loss/train': 1.1527496576309204} -08/30/2021 22:54:11 - INFO - __main__ - Step 53727: {'lr': 0.00036384738221278, 'samples': 10315584, 'steps': 53726, 'loss/train': 0.9081522822380066} -08/30/2021 22:54:11 - INFO - __main__ - Step 53728: {'lr': 0.0003638426576335082, 'samples': 10315776, 'steps': 53727, 'loss/train': 1.3712269067764282} -08/30/2021 22:54:12 - INFO - __main__ - Step 53729: {'lr': 0.00036383793300294063, 'samples': 10315968, 'steps': 53728, 'loss/train': 1.0714738368988037} -08/30/2021 22:54:12 - INFO - __main__ - Step 53730: {'lr': 0.00036383320832107945, 'samples': 10316160, 'steps': 53729, 'loss/train': 0.9009466171264648} -08/30/2021 22:54:14 - INFO - __main__ - Step 53731: {'lr': 0.0003638284835879268, 'samples': 10316352, 'steps': 53730, 'loss/train': 1.203413963317871} -08/30/2021 22:54:14 - INFO - __main__ - Step 53732: {'lr': 0.0003638237588034848, 'samples': 10316544, 'steps': 53731, 'loss/train': 1.6881147623062134} -08/30/2021 22:54:14 - INFO - __main__ - Step 53733: {'lr': 0.00036381903396775556, 'samples': 10316736, 'steps': 53732, 'loss/train': 1.3158241510391235} -08/30/2021 22:54:15 - INFO - __main__ - Step 53734: {'lr': 0.00036381430908074126, 'samples': 10316928, 'steps': 53733, 'loss/train': 1.3051568269729614} -08/30/2021 22:54:15 - INFO - __main__ - Step 53735: {'lr': 0.00036380958414244393, 'samples': 10317120, 'steps': 53734, 'loss/train': 1.6689780950546265} -08/30/2021 22:54:16 - INFO - __main__ - Step 53736: {'lr': 0.0003638048591528658, 'samples': 10317312, 'steps': 53735, 'loss/train': 1.6852327585220337} -08/30/2021 22:54:17 - INFO - __main__ - Step 53737: {'lr': 0.0003638001341120089, 'samples': 10317504, 'steps': 53736, 'loss/train': 1.3018109798431396} -08/30/2021 22:54:17 - INFO - __main__ - Step 53738: {'lr': 0.00036379540901987546, 'samples': 10317696, 'steps': 53737, 'loss/train': 1.543308138847351} -08/30/2021 22:54:18 - INFO - __main__ - Step 53739: {'lr': 0.0003637906838764675, 'samples': 10317888, 'steps': 53738, 'loss/train': 1.4458061456680298} -08/30/2021 22:54:18 - INFO - __main__ - Step 53740: {'lr': 0.00036378595868178737, 'samples': 10318080, 'steps': 53739, 'loss/train': 1.2234148979187012} -08/30/2021 22:54:18 - INFO - __main__ - Step 53741: {'lr': 0.00036378123343583694, 'samples': 10318272, 'steps': 53740, 'loss/train': 1.3705779314041138} -08/30/2021 22:54:20 - INFO - __main__ - Step 53742: {'lr': 0.0003637765081386184, 'samples': 10318464, 'steps': 53741, 'loss/train': 1.3987308740615845} -08/30/2021 22:54:20 - INFO - __main__ - Step 53743: {'lr': 0.000363771782790134, 'samples': 10318656, 'steps': 53742, 'loss/train': 1.2078702449798584} -08/30/2021 22:54:21 - INFO - __main__ - Step 53744: {'lr': 0.0003637670573903857, 'samples': 10318848, 'steps': 53743, 'loss/train': 1.135398030281067} -08/30/2021 22:54:21 - INFO - __main__ - Step 53745: {'lr': 0.0003637623319393758, 'samples': 10319040, 'steps': 53744, 'loss/train': 1.2414087057113647} -08/30/2021 22:54:21 - INFO - __main__ - Step 53746: {'lr': 0.0003637576064371063, 'samples': 10319232, 'steps': 53745, 'loss/train': 1.2687788009643555} -08/30/2021 22:54:23 - INFO - __main__ - Step 53747: {'lr': 0.0003637528808835794, 'samples': 10319424, 'steps': 53746, 'loss/train': 1.3661324977874756} -08/30/2021 22:54:24 - INFO - __main__ - Step 53748: {'lr': 0.00036374815527879725, 'samples': 10319616, 'steps': 53747, 'loss/train': 1.5377265214920044} -08/30/2021 22:54:24 - INFO - __main__ - Step 53749: {'lr': 0.0003637434296227619, 'samples': 10319808, 'steps': 53748, 'loss/train': 1.4059460163116455} -08/30/2021 22:54:25 - INFO - __main__ - Step 53750: {'lr': 0.0003637387039154755, 'samples': 10320000, 'steps': 53749, 'loss/train': 1.0428352355957031} -08/30/2021 22:54:25 - INFO - __main__ - Step 53751: {'lr': 0.0003637339781569402, 'samples': 10320192, 'steps': 53750, 'loss/train': 1.9516690969467163} -08/30/2021 22:54:27 - INFO - __main__ - Step 53752: {'lr': 0.0003637292523471581, 'samples': 10320384, 'steps': 53751, 'loss/train': 1.1140462160110474} -08/30/2021 22:54:27 - INFO - __main__ - Step 53753: {'lr': 0.0003637245264861314, 'samples': 10320576, 'steps': 53752, 'loss/train': 1.531790018081665} -08/30/2021 22:54:27 - INFO - __main__ - Step 53754: {'lr': 0.0003637198005738622, 'samples': 10320768, 'steps': 53753, 'loss/train': 0.9442309141159058} -08/30/2021 22:54:28 - INFO - __main__ - Step 53755: {'lr': 0.0003637150746103526, 'samples': 10320960, 'steps': 53754, 'loss/train': 1.8018577098846436} -08/30/2021 22:54:28 - INFO - __main__ - Step 53756: {'lr': 0.0003637103485956047, 'samples': 10321152, 'steps': 53755, 'loss/train': 0.9417364597320557} -08/30/2021 22:54:30 - INFO - __main__ - Step 53757: {'lr': 0.0003637056225296207, 'samples': 10321344, 'steps': 53756, 'loss/train': 0.40262842178344727} -08/30/2021 22:54:30 - INFO - __main__ - Step 53758: {'lr': 0.00036370089641240264, 'samples': 10321536, 'steps': 53757, 'loss/train': 1.619067907333374} -08/30/2021 22:54:30 - INFO - __main__ - Step 53759: {'lr': 0.0003636961702439527, 'samples': 10321728, 'steps': 53758, 'loss/train': 0.3672869801521301} -08/30/2021 22:54:31 - INFO - __main__ - Step 53760: {'lr': 0.0003636914440242732, 'samples': 10321920, 'steps': 53759, 'loss/train': 1.1589772701263428} -08/30/2021 22:54:31 - INFO - __main__ - Step 53761: {'lr': 0.00036368671775336597, 'samples': 10322112, 'steps': 53760, 'loss/train': 1.4277900457382202} -08/30/2021 22:54:33 - INFO - __main__ - Step 53762: {'lr': 0.00036368199143123326, 'samples': 10322304, 'steps': 53761, 'loss/train': 1.608929991722107} -08/30/2021 22:54:33 - INFO - __main__ - Step 53763: {'lr': 0.0003636772650578772, 'samples': 10322496, 'steps': 53762, 'loss/train': 1.774794578552246} -08/30/2021 22:54:33 - INFO - __main__ - Step 53764: {'lr': 0.0003636725386332999, 'samples': 10322688, 'steps': 53763, 'loss/train': 1.3371376991271973} -08/30/2021 22:54:34 - INFO - __main__ - Step 53765: {'lr': 0.00036366781215750355, 'samples': 10322880, 'steps': 53764, 'loss/train': 0.15669012069702148} -08/30/2021 22:54:34 - INFO - __main__ - Step 53766: {'lr': 0.0003636630856304902, 'samples': 10323072, 'steps': 53765, 'loss/train': 1.6438034772872925} -08/30/2021 22:54:34 - INFO - __main__ - Step 53767: {'lr': 0.0003636583590522621, 'samples': 10323264, 'steps': 53766, 'loss/train': 1.8038415908813477} -08/30/2021 22:54:36 - INFO - __main__ - Step 53768: {'lr': 0.00036365363242282117, 'samples': 10323456, 'steps': 53767, 'loss/train': 0.9586418271064758} -08/30/2021 22:54:36 - INFO - __main__ - Step 53769: {'lr': 0.00036364890574216974, 'samples': 10323648, 'steps': 53768, 'loss/train': 1.5184835195541382} -08/30/2021 22:54:37 - INFO - __main__ - Step 53770: {'lr': 0.0003636441790103098, 'samples': 10323840, 'steps': 53769, 'loss/train': 0.9286397695541382} -08/30/2021 22:54:37 - INFO - __main__ - Step 53771: {'lr': 0.00036363945222724363, 'samples': 10324032, 'steps': 53770, 'loss/train': 0.04186157509684563} -08/30/2021 22:54:37 - INFO - __main__ - Step 53772: {'lr': 0.0003636347253929733, 'samples': 10324224, 'steps': 53771, 'loss/train': 1.4541516304016113} -08/30/2021 22:54:39 - INFO - __main__ - Step 53773: {'lr': 0.0003636299985075008, 'samples': 10324416, 'steps': 53772, 'loss/train': 1.3696902990341187} -08/30/2021 22:54:40 - INFO - __main__ - Step 53774: {'lr': 0.00036362527157082845, 'samples': 10324608, 'steps': 53773, 'loss/train': 0.9283785223960876} -08/30/2021 22:54:40 - INFO - __main__ - Step 53775: {'lr': 0.00036362054458295836, 'samples': 10324800, 'steps': 53774, 'loss/train': 4.218986988067627} -08/30/2021 22:54:40 - INFO - __main__ - Step 53776: {'lr': 0.0003636158175438925, 'samples': 10324992, 'steps': 53775, 'loss/train': 1.4279903173446655} -08/30/2021 22:54:41 - INFO - __main__ - Step 53777: {'lr': 0.00036361109045363315, 'samples': 10325184, 'steps': 53776, 'loss/train': 0.647429347038269} -08/30/2021 22:54:42 - INFO - __main__ - Step 53778: {'lr': 0.0003636063633121824, 'samples': 10325376, 'steps': 53777, 'loss/train': 1.633341670036316} -08/30/2021 22:54:43 - INFO - __main__ - Step 53779: {'lr': 0.0003636016361195423, 'samples': 10325568, 'steps': 53778, 'loss/train': 1.1774834394454956} -08/30/2021 22:54:43 - INFO - __main__ - Step 53780: {'lr': 0.0003635969088757152, 'samples': 10325760, 'steps': 53779, 'loss/train': 1.7628194093704224} -08/30/2021 22:54:43 - INFO - __main__ - Step 53781: {'lr': 0.000363592181580703, 'samples': 10325952, 'steps': 53780, 'loss/train': 1.734178066253662} -08/30/2021 22:54:44 - INFO - __main__ - Step 53782: {'lr': 0.00036358745423450793, 'samples': 10326144, 'steps': 53781, 'loss/train': 1.1131432056427002} -08/30/2021 22:54:45 - INFO - __main__ - Step 53783: {'lr': 0.00036358272683713214, 'samples': 10326336, 'steps': 53782, 'loss/train': 0.9000319242477417} -08/30/2021 22:54:46 - INFO - __main__ - Step 53784: {'lr': 0.00036357799938857766, 'samples': 10326528, 'steps': 53783, 'loss/train': 1.101102352142334} -08/30/2021 22:54:46 - INFO - __main__ - Step 53785: {'lr': 0.0003635732718888467, 'samples': 10326720, 'steps': 53784, 'loss/train': 1.3329943418502808} -08/30/2021 22:54:46 - INFO - __main__ - Step 53786: {'lr': 0.0003635685443379414, 'samples': 10326912, 'steps': 53785, 'loss/train': 1.4994231462478638} -08/30/2021 22:54:47 - INFO - __main__ - Step 53787: {'lr': 0.0003635638167358639, 'samples': 10327104, 'steps': 53786, 'loss/train': 1.1487504243850708} -08/30/2021 22:54:48 - INFO - __main__ - Step 53788: {'lr': 0.00036355908908261624, 'samples': 10327296, 'steps': 53787, 'loss/train': 1.141757607460022} -08/30/2021 22:54:49 - INFO - __main__ - Step 53789: {'lr': 0.0003635543613782006, 'samples': 10327488, 'steps': 53788, 'loss/train': 1.693282961845398} -08/30/2021 22:54:49 - INFO - __main__ - Step 53790: {'lr': 0.0003635496336226192, 'samples': 10327680, 'steps': 53789, 'loss/train': 1.257690668106079} -08/30/2021 22:54:49 - INFO - __main__ - Step 53791: {'lr': 0.00036354490581587396, 'samples': 10327872, 'steps': 53790, 'loss/train': 1.3951411247253418} -08/30/2021 22:54:50 - INFO - __main__ - Step 53792: {'lr': 0.0003635401779579672, 'samples': 10328064, 'steps': 53791, 'loss/train': 1.1577696800231934} -08/30/2021 22:54:50 - INFO - __main__ - Step 53793: {'lr': 0.000363535450048901, 'samples': 10328256, 'steps': 53792, 'loss/train': 1.5145190954208374} -08/30/2021 22:54:52 - INFO - __main__ - Step 53794: {'lr': 0.00036353072208867746, 'samples': 10328448, 'steps': 53793, 'loss/train': 1.4275929927825928} -08/30/2021 22:54:52 - INFO - __main__ - Step 53795: {'lr': 0.00036352599407729873, 'samples': 10328640, 'steps': 53794, 'loss/train': 0.7977818846702576} -08/30/2021 22:54:53 - INFO - __main__ - Step 53796: {'lr': 0.00036352126601476697, 'samples': 10328832, 'steps': 53795, 'loss/train': 1.3475801944732666} -08/30/2021 22:54:53 - INFO - __main__ - Step 53797: {'lr': 0.0003635165379010842, 'samples': 10329024, 'steps': 53796, 'loss/train': 0.8868166208267212} -08/30/2021 22:54:53 - INFO - __main__ - Step 53798: {'lr': 0.0003635118097362528, 'samples': 10329216, 'steps': 53797, 'loss/train': 1.4683239459991455} -08/30/2021 22:54:56 - INFO - __main__ - Step 53799: {'lr': 0.0003635070815202746, 'samples': 10329408, 'steps': 53798, 'loss/train': 1.843313455581665} -08/30/2021 22:54:56 - INFO - __main__ - Step 53800: {'lr': 0.0003635023532531518, 'samples': 10329600, 'steps': 53799, 'loss/train': 1.0365461111068726} -08/30/2021 22:54:57 - INFO - __main__ - Step 53801: {'lr': 0.00036349762493488667, 'samples': 10329792, 'steps': 53800, 'loss/train': 1.181510090827942} -08/30/2021 22:54:57 - INFO - __main__ - Step 53802: {'lr': 0.0003634928965654813, 'samples': 10329984, 'steps': 53801, 'loss/train': 1.5654984712600708} -08/30/2021 22:54:57 - INFO - __main__ - Step 53803: {'lr': 0.0003634881681449377, 'samples': 10330176, 'steps': 53802, 'loss/train': 1.6878654956817627} -08/30/2021 22:54:58 - INFO - __main__ - Step 53804: {'lr': 0.00036348343967325814, 'samples': 10330368, 'steps': 53803, 'loss/train': 1.4503865242004395} -08/30/2021 22:55:00 - INFO - __main__ - Step 53805: {'lr': 0.00036347871115044466, 'samples': 10330560, 'steps': 53804, 'loss/train': 0.06338923424482346} -08/30/2021 22:55:00 - INFO - __main__ - Step 53806: {'lr': 0.0003634739825764995, 'samples': 10330752, 'steps': 53805, 'loss/train': 1.5886942148208618} -08/30/2021 22:55:01 - INFO - __main__ - Step 53807: {'lr': 0.00036346925395142467, 'samples': 10330944, 'steps': 53806, 'loss/train': 0.026798652485013008} -08/30/2021 22:55:01 - INFO - __main__ - Step 53808: {'lr': 0.00036346452527522233, 'samples': 10331136, 'steps': 53807, 'loss/train': 1.2169519662857056} -08/30/2021 22:55:01 - INFO - __main__ - Step 53809: {'lr': 0.0003634597965478946, 'samples': 10331328, 'steps': 53808, 'loss/train': 1.4164702892303467} -08/30/2021 22:55:02 - INFO - __main__ - Step 53810: {'lr': 0.00036345506776944364, 'samples': 10331520, 'steps': 53809, 'loss/train': 1.6290335655212402} -08/30/2021 22:55:03 - INFO - __main__ - Step 53811: {'lr': 0.00036345033893987164, 'samples': 10331712, 'steps': 53810, 'loss/train': 1.6554316282272339} -08/30/2021 22:55:03 - INFO - __main__ - Step 53812: {'lr': 0.00036344561005918064, 'samples': 10331904, 'steps': 53811, 'loss/train': 0.05251317471265793} -08/30/2021 22:55:04 - INFO - __main__ - Step 53813: {'lr': 0.00036344088112737276, 'samples': 10332096, 'steps': 53812, 'loss/train': 1.0993233919143677} -08/30/2021 22:55:04 - INFO - __main__ - Step 53814: {'lr': 0.0003634361521444502, 'samples': 10332288, 'steps': 53813, 'loss/train': 1.4712518453598022} -08/30/2021 22:55:04 - INFO - __main__ - Step 53815: {'lr': 0.00036343142311041503, 'samples': 10332480, 'steps': 53814, 'loss/train': 1.4359511137008667} -08/30/2021 22:55:06 - INFO - __main__ - Step 53816: {'lr': 0.00036342669402526946, 'samples': 10332672, 'steps': 53815, 'loss/train': 1.2964413166046143} -08/30/2021 22:55:06 - INFO - __main__ - Step 53817: {'lr': 0.0003634219648890156, 'samples': 10332864, 'steps': 53816, 'loss/train': 0.898953914642334} -08/30/2021 22:55:07 - INFO - __main__ - Step 53818: {'lr': 0.00036341723570165545, 'samples': 10333056, 'steps': 53817, 'loss/train': 0.24019961059093475} -08/30/2021 22:55:07 - INFO - __main__ - Step 53819: {'lr': 0.0003634125064631913, 'samples': 10333248, 'steps': 53818, 'loss/train': 1.1429471969604492} -08/30/2021 22:55:07 - INFO - __main__ - Step 53820: {'lr': 0.0003634077771736252, 'samples': 10333440, 'steps': 53819, 'loss/train': 1.3382513523101807} -08/30/2021 22:55:09 - INFO - __main__ - Step 53821: {'lr': 0.00036340304783295937, 'samples': 10333632, 'steps': 53820, 'loss/train': 1.240190029144287} -08/30/2021 22:55:09 - INFO - __main__ - Step 53822: {'lr': 0.0003633983184411958, 'samples': 10333824, 'steps': 53821, 'loss/train': 1.386380672454834} -08/30/2021 22:55:10 - INFO - __main__ - Step 53823: {'lr': 0.00036339358899833675, 'samples': 10334016, 'steps': 53822, 'loss/train': 1.5180798768997192} -08/30/2021 22:55:10 - INFO - __main__ - Step 53824: {'lr': 0.00036338885950438425, 'samples': 10334208, 'steps': 53823, 'loss/train': 1.8599827289581299} -08/30/2021 22:55:10 - INFO - __main__ - Step 53825: {'lr': 0.00036338412995934056, 'samples': 10334400, 'steps': 53824, 'loss/train': 1.0703608989715576} -08/30/2021 22:55:11 - INFO - __main__ - Step 53826: {'lr': 0.00036337940036320764, 'samples': 10334592, 'steps': 53825, 'loss/train': 1.29691481590271} -08/30/2021 22:55:12 - INFO - __main__ - Step 53827: {'lr': 0.0003633746707159877, 'samples': 10334784, 'steps': 53826, 'loss/train': 1.7954680919647217} -08/30/2021 22:55:13 - INFO - __main__ - Step 53828: {'lr': 0.00036336994101768304, 'samples': 10334976, 'steps': 53827, 'loss/train': 1.0407906770706177} -08/30/2021 22:55:13 - INFO - __main__ - Step 53829: {'lr': 0.00036336521126829554, 'samples': 10335168, 'steps': 53828, 'loss/train': 1.5656089782714844} -08/30/2021 22:55:14 - INFO - __main__ - Step 53830: {'lr': 0.00036336048146782743, 'samples': 10335360, 'steps': 53829, 'loss/train': 1.61233651638031} -08/30/2021 22:55:14 - INFO - __main__ - Step 53831: {'lr': 0.00036335575161628076, 'samples': 10335552, 'steps': 53830, 'loss/train': 1.5402565002441406} -08/30/2021 22:55:16 - INFO - __main__ - Step 53832: {'lr': 0.0003633510217136578, 'samples': 10335744, 'steps': 53831, 'loss/train': 2.119866371154785} -08/30/2021 22:55:16 - INFO - __main__ - Step 53833: {'lr': 0.0003633462917599606, 'samples': 10335936, 'steps': 53832, 'loss/train': 0.0717109814286232} -08/30/2021 22:55:16 - INFO - __main__ - Step 53834: {'lr': 0.0003633415617551914, 'samples': 10336128, 'steps': 53833, 'loss/train': 1.3708863258361816} -08/30/2021 22:55:17 - INFO - __main__ - Step 53835: {'lr': 0.0003633368316993521, 'samples': 10336320, 'steps': 53834, 'loss/train': 0.06664194911718369} -08/30/2021 22:55:17 - INFO - __main__ - Step 53836: {'lr': 0.0003633321015924451, 'samples': 10336512, 'steps': 53835, 'loss/train': 1.407045841217041} -08/30/2021 22:55:18 - INFO - __main__ - Step 53837: {'lr': 0.0003633273714344723, 'samples': 10336704, 'steps': 53836, 'loss/train': 1.3898102045059204} -08/30/2021 22:55:19 - INFO - __main__ - Step 53838: {'lr': 0.00036332264122543594, 'samples': 10336896, 'steps': 53837, 'loss/train': 1.17030668258667} -08/30/2021 22:55:19 - INFO - __main__ - Step 53839: {'lr': 0.00036331791096533815, 'samples': 10337088, 'steps': 53838, 'loss/train': 2.188324213027954} -08/30/2021 22:55:20 - INFO - __main__ - Step 53840: {'lr': 0.0003633131806541811, 'samples': 10337280, 'steps': 53839, 'loss/train': 2.024200439453125} -08/30/2021 22:55:20 - INFO - __main__ - Step 53841: {'lr': 0.000363308450291967, 'samples': 10337472, 'steps': 53840, 'loss/train': 1.4124239683151245} -08/30/2021 22:55:22 - INFO - __main__ - Step 53842: {'lr': 0.0003633037198786977, 'samples': 10337664, 'steps': 53841, 'loss/train': 1.634394884109497} -08/30/2021 22:55:22 - INFO - __main__ - Step 53843: {'lr': 0.0003632989894143755, 'samples': 10337856, 'steps': 53842, 'loss/train': 0.44994378089904785} -08/30/2021 22:55:22 - INFO - __main__ - Step 53844: {'lr': 0.0003632942588990025, 'samples': 10338048, 'steps': 53843, 'loss/train': 1.3941727876663208} -08/30/2021 22:55:23 - INFO - __main__ - Step 53845: {'lr': 0.00036328952833258096, 'samples': 10338240, 'steps': 53844, 'loss/train': 1.7511320114135742} -08/30/2021 22:55:23 - INFO - __main__ - Step 53846: {'lr': 0.0003632847977151128, 'samples': 10338432, 'steps': 53845, 'loss/train': 0.9932016730308533} -08/30/2021 22:55:25 - INFO - __main__ - Step 53847: {'lr': 0.0003632800670466003, 'samples': 10338624, 'steps': 53846, 'loss/train': 1.3834797143936157} -08/30/2021 22:55:25 - INFO - __main__ - Step 53848: {'lr': 0.0003632753363270456, 'samples': 10338816, 'steps': 53847, 'loss/train': 1.1966313123703003} -08/30/2021 22:55:26 - INFO - __main__ - Step 53849: {'lr': 0.00036327060555645075, 'samples': 10339008, 'steps': 53848, 'loss/train': 1.1063379049301147} -08/30/2021 22:55:26 - INFO - __main__ - Step 53850: {'lr': 0.0003632658747348179, 'samples': 10339200, 'steps': 53849, 'loss/train': 1.4359912872314453} -08/30/2021 22:55:26 - INFO - __main__ - Step 53851: {'lr': 0.0003632611438621492, 'samples': 10339392, 'steps': 53850, 'loss/train': 1.3796417713165283} -08/30/2021 22:55:27 - INFO - __main__ - Step 53852: {'lr': 0.00036325641293844674, 'samples': 10339584, 'steps': 53851, 'loss/train': 1.2238281965255737} -08/30/2021 22:55:28 - INFO - __main__ - Step 53853: {'lr': 0.0003632516819637127, 'samples': 10339776, 'steps': 53852, 'loss/train': 0.28428390622138977} -08/30/2021 22:55:29 - INFO - __main__ - Step 53854: {'lr': 0.0003632469509379492, 'samples': 10339968, 'steps': 53853, 'loss/train': 1.5513300895690918} -08/30/2021 22:55:29 - INFO - __main__ - Step 53855: {'lr': 0.00036324221986115847, 'samples': 10340160, 'steps': 53854, 'loss/train': 1.444474697113037} -08/30/2021 22:55:30 - INFO - __main__ - Step 53856: {'lr': 0.00036323748873334246, 'samples': 10340352, 'steps': 53855, 'loss/train': 0.8947063684463501} -08/30/2021 22:55:30 - INFO - __main__ - Step 53857: {'lr': 0.00036323275755450335, 'samples': 10340544, 'steps': 53856, 'loss/train': 0.8642876148223877} -08/30/2021 22:55:32 - INFO - __main__ - Step 53858: {'lr': 0.00036322802632464336, 'samples': 10340736, 'steps': 53857, 'loss/train': 0.17101213335990906} -08/30/2021 22:55:32 - INFO - __main__ - Step 53859: {'lr': 0.00036322329504376457, 'samples': 10340928, 'steps': 53858, 'loss/train': 1.3581503629684448} -08/30/2021 22:55:33 - INFO - __main__ - Step 53860: {'lr': 0.0003632185637118691, 'samples': 10341120, 'steps': 53859, 'loss/train': 1.2883199453353882} -08/30/2021 22:55:33 - INFO - __main__ - Step 53861: {'lr': 0.0003632138323289591, 'samples': 10341312, 'steps': 53860, 'loss/train': 1.0590550899505615} -08/30/2021 22:55:34 - INFO - __main__ - Step 53862: {'lr': 0.00036320910089503665, 'samples': 10341504, 'steps': 53861, 'loss/train': 0.952043354511261} -08/30/2021 22:55:35 - INFO - __main__ - Step 53863: {'lr': 0.00036320436941010396, 'samples': 10341696, 'steps': 53862, 'loss/train': 0.9984175562858582} -08/30/2021 22:55:35 - INFO - __main__ - Step 53864: {'lr': 0.00036319963787416313, 'samples': 10341888, 'steps': 53863, 'loss/train': 1.4564708471298218} -08/30/2021 22:55:36 - INFO - __main__ - Step 53865: {'lr': 0.0003631949062872163, 'samples': 10342080, 'steps': 53864, 'loss/train': 1.277030110359192} -08/30/2021 22:55:36 - INFO - __main__ - Step 53866: {'lr': 0.0003631901746492656, 'samples': 10342272, 'steps': 53865, 'loss/train': 0.8510956168174744} -08/30/2021 22:55:36 - INFO - __main__ - Step 53867: {'lr': 0.0003631854429603131, 'samples': 10342464, 'steps': 53866, 'loss/train': 0.8105121850967407} -08/30/2021 22:55:38 - INFO - __main__ - Step 53868: {'lr': 0.00036318071122036104, 'samples': 10342656, 'steps': 53867, 'loss/train': 1.434144377708435} -08/30/2021 22:55:38 - INFO - __main__ - Step 53869: {'lr': 0.0003631759794294115, 'samples': 10342848, 'steps': 53868, 'loss/train': 1.513204574584961} -08/30/2021 22:55:39 - INFO - __main__ - Step 53870: {'lr': 0.00036317124758746656, 'samples': 10343040, 'steps': 53869, 'loss/train': 0.8377476930618286} -08/30/2021 22:55:39 - INFO - __main__ - Step 53871: {'lr': 0.0003631665156945284, 'samples': 10343232, 'steps': 53870, 'loss/train': 1.0416661500930786} -08/30/2021 22:55:39 - INFO - __main__ - Step 53872: {'lr': 0.0003631617837505992, 'samples': 10343424, 'steps': 53871, 'loss/train': 1.3112215995788574} -08/30/2021 22:55:41 - INFO - __main__ - Step 53873: {'lr': 0.00036315705175568103, 'samples': 10343616, 'steps': 53872, 'loss/train': 1.3337771892547607} -08/30/2021 22:55:42 - INFO - __main__ - Step 53874: {'lr': 0.000363152319709776, 'samples': 10343808, 'steps': 53873, 'loss/train': 1.4580767154693604} -08/30/2021 22:55:42 - INFO - __main__ - Step 53875: {'lr': 0.00036314758761288643, 'samples': 10344000, 'steps': 53874, 'loss/train': 0.9202516674995422} -08/30/2021 22:55:42 - INFO - __main__ - Step 53876: {'lr': 0.00036314285546501415, 'samples': 10344192, 'steps': 53875, 'loss/train': 1.021802544593811} -08/30/2021 22:55:43 - INFO - __main__ - Step 53877: {'lr': 0.0003631381232661615, 'samples': 10344384, 'steps': 53876, 'loss/train': 0.9923377633094788} -08/30/2021 22:55:44 - INFO - __main__ - Step 53878: {'lr': 0.0003631333910163305, 'samples': 10344576, 'steps': 53877, 'loss/train': 1.2320740222930908} -08/30/2021 22:55:44 - INFO - __main__ - Step 53879: {'lr': 0.0003631286587155234, 'samples': 10344768, 'steps': 53878, 'loss/train': 1.076094627380371} -08/30/2021 22:55:45 - INFO - __main__ - Step 53880: {'lr': 0.00036312392636374225, 'samples': 10344960, 'steps': 53879, 'loss/train': 2.010040044784546} -08/30/2021 22:55:45 - INFO - __main__ - Step 53881: {'lr': 0.00036311919396098927, 'samples': 10345152, 'steps': 53880, 'loss/train': 0.6335082650184631} -08/30/2021 22:55:46 - INFO - __main__ - Step 53882: {'lr': 0.0003631144615072665, 'samples': 10345344, 'steps': 53881, 'loss/train': 1.3972604274749756} -08/30/2021 22:55:46 - INFO - __main__ - Step 53883: {'lr': 0.000363109729002576, 'samples': 10345536, 'steps': 53882, 'loss/train': 0.9202935099601746} -08/30/2021 22:55:47 - INFO - __main__ - Step 53884: {'lr': 0.0003631049964469201, 'samples': 10345728, 'steps': 53883, 'loss/train': 0.7065900564193726} -08/30/2021 22:55:48 - INFO - __main__ - Step 53885: {'lr': 0.0003631002638403008, 'samples': 10345920, 'steps': 53884, 'loss/train': 1.275734543800354} -08/30/2021 22:55:48 - INFO - __main__ - Step 53886: {'lr': 0.0003630955311827202, 'samples': 10346112, 'steps': 53885, 'loss/train': 1.6717591285705566} -08/30/2021 22:55:49 - INFO - __main__ - Step 53887: {'lr': 0.0003630907984741806, 'samples': 10346304, 'steps': 53886, 'loss/train': 1.4089205265045166} -08/30/2021 22:55:49 - INFO - __main__ - Step 53888: {'lr': 0.00036308606571468406, 'samples': 10346496, 'steps': 53887, 'loss/train': 0.8983347415924072} -08/30/2021 22:55:50 - INFO - __main__ - Step 53889: {'lr': 0.00036308133290423257, 'samples': 10346688, 'steps': 53888, 'loss/train': 1.1579469442367554} -08/30/2021 22:55:51 - INFO - __main__ - Step 53890: {'lr': 0.00036307660004282846, 'samples': 10346880, 'steps': 53889, 'loss/train': 1.1339261531829834} -08/30/2021 22:55:51 - INFO - __main__ - Step 53891: {'lr': 0.0003630718671304737, 'samples': 10347072, 'steps': 53890, 'loss/train': 1.322121500968933} -08/30/2021 22:55:52 - INFO - __main__ - Step 53892: {'lr': 0.0003630671341671705, 'samples': 10347264, 'steps': 53891, 'loss/train': 1.0415552854537964} -08/30/2021 22:55:52 - INFO - __main__ - Step 53893: {'lr': 0.0003630624011529211, 'samples': 10347456, 'steps': 53892, 'loss/train': 1.352339744567871} -08/30/2021 22:55:53 - INFO - __main__ - Step 53894: {'lr': 0.00036305766808772746, 'samples': 10347648, 'steps': 53893, 'loss/train': 0.7083971500396729} -08/30/2021 22:55:54 - INFO - __main__ - Step 53895: {'lr': 0.0003630529349715918, 'samples': 10347840, 'steps': 53894, 'loss/train': 0.7098364233970642} -08/30/2021 22:55:54 - INFO - __main__ - Step 53896: {'lr': 0.0003630482018045163, 'samples': 10348032, 'steps': 53895, 'loss/train': 1.2295888662338257} -08/30/2021 22:55:55 - INFO - __main__ - Step 53897: {'lr': 0.0003630434685865029, 'samples': 10348224, 'steps': 53896, 'loss/train': 0.9266245365142822} -08/30/2021 22:55:55 - INFO - __main__ - Step 53898: {'lr': 0.0003630387353175539, 'samples': 10348416, 'steps': 53897, 'loss/train': 0.2742985486984253} -08/30/2021 22:55:57 - INFO - __main__ - Step 53899: {'lr': 0.0003630340019976713, 'samples': 10348608, 'steps': 53898, 'loss/train': 1.3300591707229614} -08/30/2021 22:55:57 - INFO - __main__ - Step 53900: {'lr': 0.0003630292686268575, 'samples': 10348800, 'steps': 53899, 'loss/train': 0.9842734932899475} -08/30/2021 22:55:57 - INFO - __main__ - Step 53901: {'lr': 0.00036302453520511437, 'samples': 10348992, 'steps': 53900, 'loss/train': 1.2373638153076172} -08/30/2021 22:55:58 - INFO - __main__ - Step 53902: {'lr': 0.0003630198017324441, 'samples': 10349184, 'steps': 53901, 'loss/train': 1.3236435651779175} -08/30/2021 22:55:58 - INFO - __main__ - Step 53903: {'lr': 0.0003630150682088489, 'samples': 10349376, 'steps': 53902, 'loss/train': 0.3450353741645813} -08/30/2021 22:56:00 - INFO - __main__ - Step 53904: {'lr': 0.00036301033463433086, 'samples': 10349568, 'steps': 53903, 'loss/train': 1.9662925004959106} -08/30/2021 22:56:00 - INFO - __main__ - Step 53905: {'lr': 0.0003630056010088921, 'samples': 10349760, 'steps': 53904, 'loss/train': 1.322086215019226} -08/30/2021 22:56:00 - INFO - __main__ - Step 53906: {'lr': 0.00036300086733253466, 'samples': 10349952, 'steps': 53905, 'loss/train': 1.309656023979187} -08/30/2021 22:56:01 - INFO - __main__ - Step 53907: {'lr': 0.0003629961336052609, 'samples': 10350144, 'steps': 53906, 'loss/train': 1.6261889934539795} -08/30/2021 22:56:01 - INFO - __main__ - Step 53908: {'lr': 0.0003629913998270728, 'samples': 10350336, 'steps': 53907, 'loss/train': 1.274661660194397} -08/30/2021 22:56:02 - INFO - __main__ - Step 53909: {'lr': 0.00036298666599797247, 'samples': 10350528, 'steps': 53908, 'loss/train': 1.071433186531067} -08/30/2021 22:56:04 - INFO - __main__ - Step 53910: {'lr': 0.00036298193211796215, 'samples': 10350720, 'steps': 53909, 'loss/train': 1.5784220695495605} -08/30/2021 22:56:04 - INFO - __main__ - Step 53911: {'lr': 0.0003629771981870439, 'samples': 10350912, 'steps': 53910, 'loss/train': 1.6543148756027222} -08/30/2021 22:56:05 - INFO - __main__ - Step 53912: {'lr': 0.0003629724642052198, 'samples': 10351104, 'steps': 53911, 'loss/train': 0.030927233397960663} -08/30/2021 22:56:05 - INFO - __main__ - Step 53913: {'lr': 0.00036296773017249214, 'samples': 10351296, 'steps': 53912, 'loss/train': 0.40828219056129456} -08/30/2021 22:56:05 - INFO - __main__ - Step 53914: {'lr': 0.0003629629960888629, 'samples': 10351488, 'steps': 53913, 'loss/train': 1.3829665184020996} -08/30/2021 22:56:06 - INFO - __main__ - Step 53915: {'lr': 0.00036295826195433434, 'samples': 10351680, 'steps': 53914, 'loss/train': 1.3375792503356934} -08/30/2021 22:56:07 - INFO - __main__ - Step 53916: {'lr': 0.0003629535277689085, 'samples': 10351872, 'steps': 53915, 'loss/train': 1.258182168006897} -08/30/2021 22:56:08 - INFO - __main__ - Step 53917: {'lr': 0.00036294879353258755, 'samples': 10352064, 'steps': 53916, 'loss/train': 1.6508598327636719} -08/30/2021 22:56:08 - INFO - __main__ - Step 53918: {'lr': 0.0003629440592453736, 'samples': 10352256, 'steps': 53917, 'loss/train': 1.5212675333023071} -08/30/2021 22:56:08 - INFO - __main__ - Step 53919: {'lr': 0.0003629393249072688, 'samples': 10352448, 'steps': 53918, 'loss/train': 1.06631600856781} -08/30/2021 22:56:09 - INFO - __main__ - Step 53920: {'lr': 0.00036293459051827526, 'samples': 10352640, 'steps': 53919, 'loss/train': 1.6450555324554443} -08/30/2021 22:56:10 - INFO - __main__ - Step 53921: {'lr': 0.0003629298560783952, 'samples': 10352832, 'steps': 53920, 'loss/train': 1.2475587129592896} -08/30/2021 22:56:11 - INFO - __main__ - Step 53922: {'lr': 0.0003629251215876307, 'samples': 10353024, 'steps': 53921, 'loss/train': 0.6523019075393677} -08/30/2021 22:56:11 - INFO - __main__ - Step 53923: {'lr': 0.0003629203870459838, 'samples': 10353216, 'steps': 53922, 'loss/train': 1.228450059890747} -08/30/2021 22:56:11 - INFO - __main__ - Step 53924: {'lr': 0.00036291565245345677, 'samples': 10353408, 'steps': 53923, 'loss/train': 2.0210907459259033} -08/30/2021 22:56:12 - INFO - __main__ - Step 53925: {'lr': 0.0003629109178100516, 'samples': 10353600, 'steps': 53924, 'loss/train': 1.5081448554992676} -08/30/2021 22:56:13 - INFO - __main__ - Step 53926: {'lr': 0.0003629061831157706, 'samples': 10353792, 'steps': 53925, 'loss/train': 0.6194517612457275} -08/30/2021 22:56:14 - INFO - __main__ - Step 53927: {'lr': 0.00036290144837061586, 'samples': 10353984, 'steps': 53926, 'loss/train': 0.7502023577690125} -08/30/2021 22:56:14 - INFO - __main__ - Step 53928: {'lr': 0.00036289671357458937, 'samples': 10354176, 'steps': 53927, 'loss/train': 1.3222026824951172} -08/30/2021 22:56:14 - INFO - __main__ - Step 53929: {'lr': 0.00036289197872769346, 'samples': 10354368, 'steps': 53928, 'loss/train': 1.545782446861267} -08/30/2021 22:56:15 - INFO - __main__ - Step 53930: {'lr': 0.0003628872438299301, 'samples': 10354560, 'steps': 53929, 'loss/train': 1.1636182069778442} -08/30/2021 22:56:16 - INFO - __main__ - Step 53931: {'lr': 0.0003628825088813015, 'samples': 10354752, 'steps': 53930, 'loss/train': 1.2877557277679443} -08/30/2021 22:56:17 - INFO - __main__ - Step 53932: {'lr': 0.00036287777388180977, 'samples': 10354944, 'steps': 53931, 'loss/train': 1.791764497756958} -08/30/2021 22:56:17 - INFO - __main__ - Step 53933: {'lr': 0.00036287303883145703, 'samples': 10355136, 'steps': 53932, 'loss/train': 1.1045094728469849} -08/30/2021 22:56:17 - INFO - __main__ - Step 53934: {'lr': 0.00036286830373024546, 'samples': 10355328, 'steps': 53933, 'loss/train': 1.4776878356933594} -08/30/2021 22:56:18 - INFO - __main__ - Step 53935: {'lr': 0.00036286356857817727, 'samples': 10355520, 'steps': 53934, 'loss/train': 0.37960898876190186} -08/30/2021 22:56:19 - INFO - __main__ - Step 53936: {'lr': 0.0003628588333752544, 'samples': 10355712, 'steps': 53935, 'loss/train': 0.4761931896209717} -08/30/2021 22:56:20 - INFO - __main__ - Step 53937: {'lr': 0.0003628540981214791, 'samples': 10355904, 'steps': 53936, 'loss/train': 0.9485270380973816} -08/30/2021 22:56:20 - INFO - __main__ - Step 53938: {'lr': 0.00036284936281685354, 'samples': 10356096, 'steps': 53937, 'loss/train': 1.2968593835830688} -08/30/2021 22:56:20 - INFO - __main__ - Step 53939: {'lr': 0.0003628446274613797, 'samples': 10356288, 'steps': 53938, 'loss/train': 1.0184592008590698} -08/30/2021 22:56:21 - INFO - __main__ - Step 53940: {'lr': 0.00036283989205505987, 'samples': 10356480, 'steps': 53939, 'loss/train': 1.2882018089294434} -08/30/2021 22:56:22 - INFO - __main__ - Step 53941: {'lr': 0.00036283515659789615, 'samples': 10356672, 'steps': 53940, 'loss/train': 1.6255367994308472} -08/30/2021 22:56:23 - INFO - __main__ - Step 53942: {'lr': 0.0003628304210898906, 'samples': 10356864, 'steps': 53941, 'loss/train': 1.82087242603302} -08/30/2021 22:56:23 - INFO - __main__ - Step 53943: {'lr': 0.00036282568553104545, 'samples': 10357056, 'steps': 53942, 'loss/train': 1.032686710357666} -08/30/2021 22:56:23 - INFO - __main__ - Step 53944: {'lr': 0.00036282094992136273, 'samples': 10357248, 'steps': 53943, 'loss/train': 1.8840587139129639} -08/30/2021 22:56:24 - INFO - __main__ - Step 53945: {'lr': 0.00036281621426084465, 'samples': 10357440, 'steps': 53944, 'loss/train': 1.3175116777420044} -08/30/2021 22:56:26 - INFO - __main__ - Step 53946: {'lr': 0.0003628114785494934, 'samples': 10357632, 'steps': 53945, 'loss/train': 1.7962939739227295} -08/30/2021 22:56:26 - INFO - __main__ - Step 53947: {'lr': 0.00036280674278731096, 'samples': 10357824, 'steps': 53946, 'loss/train': 0.9019666910171509} -08/30/2021 22:56:27 - INFO - __main__ - Step 53948: {'lr': 0.00036280200697429957, 'samples': 10358016, 'steps': 53947, 'loss/train': 1.2212061882019043} -08/30/2021 22:56:27 - INFO - __main__ - Step 53949: {'lr': 0.00036279727111046127, 'samples': 10358208, 'steps': 53948, 'loss/train': 0.2895715534687042} -08/30/2021 22:56:27 - INFO - __main__ - Step 53950: {'lr': 0.0003627925351957983, 'samples': 10358400, 'steps': 53949, 'loss/train': 1.3136773109436035} -08/30/2021 22:56:28 - INFO - __main__ - Step 53951: {'lr': 0.0003627877992303128, 'samples': 10358592, 'steps': 53950, 'loss/train': 0.860072672367096} -08/30/2021 22:56:29 - INFO - __main__ - Step 53952: {'lr': 0.0003627830632140068, 'samples': 10358784, 'steps': 53951, 'loss/train': 1.6536394357681274} -08/30/2021 22:56:30 - INFO - __main__ - Step 53953: {'lr': 0.0003627783271468825, 'samples': 10358976, 'steps': 53952, 'loss/train': 1.5553181171417236} -08/30/2021 22:56:30 - INFO - __main__ - Step 53954: {'lr': 0.0003627735910289421, 'samples': 10359168, 'steps': 53953, 'loss/train': 1.3697348833084106} -08/30/2021 22:56:30 - INFO - __main__ - Step 53955: {'lr': 0.0003627688548601876, 'samples': 10359360, 'steps': 53954, 'loss/train': 1.366170883178711} -08/30/2021 22:56:31 - INFO - __main__ - Step 53956: {'lr': 0.00036276411864062116, 'samples': 10359552, 'steps': 53955, 'loss/train': 0.8351635336875916} -08/30/2021 22:56:31 - INFO - __main__ - Step 53957: {'lr': 0.00036275938237024505, 'samples': 10359744, 'steps': 53956, 'loss/train': 0.4959670305252075} -08/30/2021 22:56:33 - INFO - __main__ - Step 53958: {'lr': 0.00036275464604906116, 'samples': 10359936, 'steps': 53957, 'loss/train': 0.8398715257644653} -08/30/2021 22:56:34 - INFO - __main__ - Step 53959: {'lr': 0.0003627499096770719, 'samples': 10360128, 'steps': 53958, 'loss/train': 0.6449087262153625} -08/30/2021 22:56:34 - INFO - __main__ - Step 53960: {'lr': 0.0003627451732542791, 'samples': 10360320, 'steps': 53959, 'loss/train': 1.228438138961792} -08/30/2021 22:56:35 - INFO - __main__ - Step 53961: {'lr': 0.00036274043678068526, 'samples': 10360512, 'steps': 53960, 'loss/train': 2.020247459411621} -08/30/2021 22:56:35 - INFO - __main__ - Step 53962: {'lr': 0.0003627357002562923, 'samples': 10360704, 'steps': 53961, 'loss/train': 1.0533267259597778} -08/30/2021 22:56:37 - INFO - __main__ - Step 53963: {'lr': 0.0003627309636811023, 'samples': 10360896, 'steps': 53962, 'loss/train': 1.6192445755004883} -08/30/2021 22:56:37 - INFO - __main__ - Step 53964: {'lr': 0.00036272622705511745, 'samples': 10361088, 'steps': 53963, 'loss/train': 1.4473854303359985} -08/30/2021 22:56:38 - INFO - __main__ - Step 53965: {'lr': 0.0003627214903783399, 'samples': 10361280, 'steps': 53964, 'loss/train': 1.6189736127853394} -08/30/2021 22:56:38 - INFO - __main__ - Step 53966: {'lr': 0.00036271675365077185, 'samples': 10361472, 'steps': 53965, 'loss/train': 1.1956008672714233} -08/30/2021 22:56:38 - INFO - __main__ - Step 53967: {'lr': 0.0003627120168724153, 'samples': 10361664, 'steps': 53966, 'loss/train': 1.1789737939834595} -08/30/2021 22:56:40 - INFO - __main__ - Step 53968: {'lr': 0.00036270728004327246, 'samples': 10361856, 'steps': 53967, 'loss/train': 1.464616060256958} -08/30/2021 22:56:41 - INFO - __main__ - Step 53969: {'lr': 0.0003627025431633455, 'samples': 10362048, 'steps': 53968, 'loss/train': 1.041573166847229} -08/30/2021 22:56:41 - INFO - __main__ - Step 53970: {'lr': 0.00036269780623263647, 'samples': 10362240, 'steps': 53969, 'loss/train': 0.054159682244062424} -08/30/2021 22:56:41 - INFO - __main__ - Step 53971: {'lr': 0.00036269306925114765, 'samples': 10362432, 'steps': 53970, 'loss/train': 1.5363587141036987} -08/30/2021 22:56:42 - INFO - __main__ - Step 53972: {'lr': 0.000362688332218881, 'samples': 10362624, 'steps': 53971, 'loss/train': 1.858013391494751} -08/30/2021 22:56:43 - INFO - __main__ - Step 53973: {'lr': 0.0003626835951358387, 'samples': 10362816, 'steps': 53972, 'loss/train': 1.1408942937850952} -08/30/2021 22:56:44 - INFO - __main__ - Step 53974: {'lr': 0.00036267885800202296, 'samples': 10363008, 'steps': 53973, 'loss/train': 1.701961636543274} -08/30/2021 22:56:44 - INFO - __main__ - Step 53975: {'lr': 0.00036267412081743576, 'samples': 10363200, 'steps': 53974, 'loss/train': 1.3819730281829834} -08/30/2021 22:56:45 - INFO - __main__ - Step 53976: {'lr': 0.00036266938358207944, 'samples': 10363392, 'steps': 53975, 'loss/train': 1.580741047859192} -08/30/2021 22:56:45 - INFO - __main__ - Step 53977: {'lr': 0.0003626646462959561, 'samples': 10363584, 'steps': 53976, 'loss/train': 1.0083789825439453} -08/30/2021 22:56:46 - INFO - __main__ - Step 53978: {'lr': 0.00036265990895906767, 'samples': 10363776, 'steps': 53977, 'loss/train': 0.06872133910655975} -08/30/2021 22:56:47 - INFO - __main__ - Step 53979: {'lr': 0.0003626551715714165, 'samples': 10363968, 'steps': 53978, 'loss/train': 1.282861351966858} -08/30/2021 22:56:47 - INFO - __main__ - Step 53980: {'lr': 0.00036265043413300456, 'samples': 10364160, 'steps': 53979, 'loss/train': 1.0948063135147095} -08/30/2021 22:56:47 - INFO - __main__ - Step 53981: {'lr': 0.0003626456966438342, 'samples': 10364352, 'steps': 53980, 'loss/train': 0.9879094958305359} -08/30/2021 22:56:48 - INFO - __main__ - Step 53982: {'lr': 0.00036264095910390736, 'samples': 10364544, 'steps': 53981, 'loss/train': 0.9718050360679626} -08/30/2021 22:56:48 - INFO - __main__ - Step 53983: {'lr': 0.0003626362215132263, 'samples': 10364736, 'steps': 53982, 'loss/train': 1.7662581205368042} -08/30/2021 22:56:50 - INFO - __main__ - Step 53984: {'lr': 0.00036263148387179303, 'samples': 10364928, 'steps': 53983, 'loss/train': 1.705222725868225} -08/30/2021 22:56:50 - INFO - __main__ - Step 53985: {'lr': 0.0003626267461796097, 'samples': 10365120, 'steps': 53984, 'loss/train': 1.0252137184143066} -08/30/2021 22:56:51 - INFO - __main__ - Step 53986: {'lr': 0.0003626220084366786, 'samples': 10365312, 'steps': 53985, 'loss/train': 1.329757571220398} -08/30/2021 22:56:51 - INFO - __main__ - Step 53987: {'lr': 0.0003626172706430017, 'samples': 10365504, 'steps': 53986, 'loss/train': 1.3617582321166992} -08/30/2021 22:56:51 - INFO - __main__ - Step 53988: {'lr': 0.0003626125327985812, 'samples': 10365696, 'steps': 53987, 'loss/train': 1.3035142421722412} -08/30/2021 22:56:53 - INFO - __main__ - Step 53989: {'lr': 0.0003626077949034193, 'samples': 10365888, 'steps': 53988, 'loss/train': 1.2522143125534058} -08/30/2021 22:56:53 - INFO - __main__ - Step 53990: {'lr': 0.000362603056957518, 'samples': 10366080, 'steps': 53989, 'loss/train': 0.7440615296363831} -08/30/2021 22:56:54 - INFO - __main__ - Step 53991: {'lr': 0.0003625983189608795, 'samples': 10366272, 'steps': 53990, 'loss/train': 1.0405722856521606} -08/30/2021 22:56:54 - INFO - __main__ - Step 53992: {'lr': 0.00036259358091350597, 'samples': 10366464, 'steps': 53991, 'loss/train': 0.7481604218482971} -08/30/2021 22:56:54 - INFO - __main__ - Step 53993: {'lr': 0.0003625888428153995, 'samples': 10366656, 'steps': 53992, 'loss/train': 1.3331502676010132} -08/30/2021 22:56:56 - INFO - __main__ - Step 53994: {'lr': 0.0003625841046665622, 'samples': 10366848, 'steps': 53993, 'loss/train': 0.9002139568328857} -08/30/2021 22:56:57 - INFO - __main__ - Step 53995: {'lr': 0.00036257936646699626, 'samples': 10367040, 'steps': 53994, 'loss/train': 1.5377739667892456} -08/30/2021 22:56:57 - INFO - __main__ - Step 53996: {'lr': 0.00036257462821670387, 'samples': 10367232, 'steps': 53995, 'loss/train': 1.515584111213684} -08/30/2021 22:56:57 - INFO - __main__ - Step 53997: {'lr': 0.00036256988991568696, 'samples': 10367424, 'steps': 53996, 'loss/train': 1.3562283515930176} -08/30/2021 22:56:58 - INFO - __main__ - Step 53998: {'lr': 0.0003625651515639479, 'samples': 10367616, 'steps': 53997, 'loss/train': 1.437071681022644} -08/30/2021 22:57:00 - INFO - __main__ - Step 53999: {'lr': 0.00036256041316148864, 'samples': 10367808, 'steps': 53998, 'loss/train': 1.1273692846298218} -08/30/2021 22:57:00 - INFO - __main__ - Step 54000: {'lr': 0.0003625556747083114, 'samples': 10368000, 'steps': 53999, 'loss/train': 0.9582331776618958} -08/30/2021 22:57:01 - INFO - __main__ - Step 54001: {'lr': 0.0003625509362044183, 'samples': 10368192, 'steps': 54000, 'loss/train': 0.9439205527305603} -08/30/2021 22:57:01 - INFO - __main__ - Step 54002: {'lr': 0.00036254619764981155, 'samples': 10368384, 'steps': 54001, 'loss/train': 1.3519387245178223} -08/30/2021 22:57:01 - INFO - __main__ - Step 54003: {'lr': 0.0003625414590444932, 'samples': 10368576, 'steps': 54002, 'loss/train': 1.909079670906067} -08/30/2021 22:57:02 - INFO - __main__ - Step 54004: {'lr': 0.0003625367203884654, 'samples': 10368768, 'steps': 54003, 'loss/train': 1.7615684270858765} -08/30/2021 22:57:04 - INFO - __main__ - Step 54005: {'lr': 0.0003625319816817303, 'samples': 10368960, 'steps': 54004, 'loss/train': 1.708850622177124} -08/30/2021 22:57:04 - INFO - __main__ - Step 54006: {'lr': 0.00036252724292429, 'samples': 10369152, 'steps': 54005, 'loss/train': 1.1089848279953003} -08/30/2021 22:57:04 - INFO - __main__ - Step 54007: {'lr': 0.00036252250411614666, 'samples': 10369344, 'steps': 54006, 'loss/train': 1.6467301845550537} -08/30/2021 22:57:05 - INFO - __main__ - Step 54008: {'lr': 0.0003625177652573024, 'samples': 10369536, 'steps': 54007, 'loss/train': 1.2013165950775146} -08/30/2021 22:57:05 - INFO - __main__ - Step 54009: {'lr': 0.0003625130263477595, 'samples': 10369728, 'steps': 54008, 'loss/train': 1.2774794101715088} -08/30/2021 22:57:05 - INFO - __main__ - Step 54010: {'lr': 0.00036250828738751986, 'samples': 10369920, 'steps': 54009, 'loss/train': 2.4317800998687744} -08/30/2021 22:57:07 - INFO - __main__ - Step 54011: {'lr': 0.0003625035483765857, 'samples': 10370112, 'steps': 54010, 'loss/train': 1.6654589176177979} -08/30/2021 22:57:08 - INFO - __main__ - Step 54012: {'lr': 0.00036249880931495923, 'samples': 10370304, 'steps': 54011, 'loss/train': 1.2266253232955933} -08/30/2021 22:57:08 - INFO - __main__ - Step 54013: {'lr': 0.00036249407020264246, 'samples': 10370496, 'steps': 54012, 'loss/train': 1.8434330224990845} -08/30/2021 22:57:08 - INFO - __main__ - Step 54014: {'lr': 0.00036248933103963767, 'samples': 10370688, 'steps': 54013, 'loss/train': 0.9791733622550964} -08/30/2021 22:57:09 - INFO - __main__ - Step 54015: {'lr': 0.0003624845918259469, 'samples': 10370880, 'steps': 54014, 'loss/train': 1.4361388683319092} -08/30/2021 22:57:09 - INFO - __main__ - Step 54016: {'lr': 0.00036247985256157236, 'samples': 10371072, 'steps': 54015, 'loss/train': 1.578568458557129} -08/30/2021 22:57:11 - INFO - __main__ - Step 54017: {'lr': 0.0003624751132465161, 'samples': 10371264, 'steps': 54016, 'loss/train': 1.1097666025161743} -08/30/2021 22:57:12 - INFO - __main__ - Step 54018: {'lr': 0.00036247037388078017, 'samples': 10371456, 'steps': 54017, 'loss/train': 1.1587128639221191} -08/30/2021 22:57:12 - INFO - __main__ - Step 54019: {'lr': 0.00036246563446436697, 'samples': 10371648, 'steps': 54018, 'loss/train': 1.7240855693817139} -08/30/2021 22:57:12 - INFO - __main__ - Step 54020: {'lr': 0.00036246089499727843, 'samples': 10371840, 'steps': 54019, 'loss/train': 1.9333378076553345} -08/30/2021 22:57:13 - INFO - __main__ - Step 54021: {'lr': 0.0003624561554795168, 'samples': 10372032, 'steps': 54020, 'loss/train': 1.7124807834625244} -08/30/2021 22:57:14 - INFO - __main__ - Step 54022: {'lr': 0.0003624514159110841, 'samples': 10372224, 'steps': 54021, 'loss/train': 0.33069729804992676} -08/30/2021 22:57:15 - INFO - __main__ - Step 54023: {'lr': 0.0003624466762919826, 'samples': 10372416, 'steps': 54022, 'loss/train': 1.3345967531204224} -08/30/2021 22:57:15 - INFO - __main__ - Step 54024: {'lr': 0.00036244193662221427, 'samples': 10372608, 'steps': 54023, 'loss/train': 1.2936688661575317} -08/30/2021 22:57:16 - INFO - __main__ - Step 54025: {'lr': 0.0003624371969017814, 'samples': 10372800, 'steps': 54024, 'loss/train': 1.475222110748291} -08/30/2021 22:57:16 - INFO - __main__ - Step 54026: {'lr': 0.000362432457130686, 'samples': 10372992, 'steps': 54025, 'loss/train': 1.2372760772705078} -08/30/2021 22:57:17 - INFO - __main__ - Step 54027: {'lr': 0.0003624277173089303, 'samples': 10373184, 'steps': 54026, 'loss/train': 1.0800518989562988} -08/30/2021 22:57:18 - INFO - __main__ - Step 54028: {'lr': 0.0003624229774365165, 'samples': 10373376, 'steps': 54027, 'loss/train': 1.245154619216919} -08/30/2021 22:57:18 - INFO - __main__ - Step 54029: {'lr': 0.00036241823751344656, 'samples': 10373568, 'steps': 54028, 'loss/train': 1.5563030242919922} -08/30/2021 22:57:18 - INFO - __main__ - Step 54030: {'lr': 0.0003624134975397227, 'samples': 10373760, 'steps': 54029, 'loss/train': 1.5903006792068481} -08/30/2021 22:57:19 - INFO - __main__ - Step 54031: {'lr': 0.0003624087575153471, 'samples': 10373952, 'steps': 54030, 'loss/train': 1.2951852083206177} -08/30/2021 22:57:20 - INFO - __main__ - Step 54032: {'lr': 0.00036240401744032174, 'samples': 10374144, 'steps': 54031, 'loss/train': 0.353877991437912} -08/30/2021 22:57:21 - INFO - __main__ - Step 54033: {'lr': 0.00036239927731464896, 'samples': 10374336, 'steps': 54032, 'loss/train': 0.9869309067726135} -08/30/2021 22:57:21 - INFO - __main__ - Step 54034: {'lr': 0.0003623945371383307, 'samples': 10374528, 'steps': 54033, 'loss/train': 1.4709755182266235} -08/30/2021 22:57:22 - INFO - __main__ - Step 54035: {'lr': 0.0003623897969113693, 'samples': 10374720, 'steps': 54034, 'loss/train': 3.0739753246307373} -08/30/2021 22:57:22 - INFO - __main__ - Step 54036: {'lr': 0.00036238505663376675, 'samples': 10374912, 'steps': 54035, 'loss/train': 1.386664867401123} -08/30/2021 22:57:22 - INFO - __main__ - Step 54037: {'lr': 0.00036238031630552527, 'samples': 10375104, 'steps': 54036, 'loss/train': 1.0370498895645142} -08/30/2021 22:57:24 - INFO - __main__ - Step 54038: {'lr': 0.0003623755759266469, 'samples': 10375296, 'steps': 54037, 'loss/train': 0.8300610780715942} -08/30/2021 22:57:24 - INFO - __main__ - Step 54039: {'lr': 0.00036237083549713387, 'samples': 10375488, 'steps': 54038, 'loss/train': 1.830101490020752} -08/30/2021 22:57:25 - INFO - __main__ - Step 54040: {'lr': 0.0003623660950169882, 'samples': 10375680, 'steps': 54039, 'loss/train': 1.7232962846755981} -08/30/2021 22:57:25 - INFO - __main__ - Step 54041: {'lr': 0.00036236135448621215, 'samples': 10375872, 'steps': 54040, 'loss/train': 1.449582815170288} -08/30/2021 22:57:25 - INFO - __main__ - Step 54042: {'lr': 0.0003623566139048078, 'samples': 10376064, 'steps': 54041, 'loss/train': 1.3240938186645508} -08/30/2021 22:57:27 - INFO - __main__ - Step 54043: {'lr': 0.00036235187327277735, 'samples': 10376256, 'steps': 54042, 'loss/train': 1.7063496112823486} -08/30/2021 22:57:27 - INFO - __main__ - Step 54044: {'lr': 0.0003623471325901228, 'samples': 10376448, 'steps': 54043, 'loss/train': 0.9686894416809082} -08/30/2021 22:57:28 - INFO - __main__ - Step 54045: {'lr': 0.00036234239185684643, 'samples': 10376640, 'steps': 54044, 'loss/train': 1.565123200416565} -08/30/2021 22:57:28 - INFO - __main__ - Step 54046: {'lr': 0.00036233765107295023, 'samples': 10376832, 'steps': 54045, 'loss/train': 1.407694935798645} -08/30/2021 22:57:28 - INFO - __main__ - Step 54047: {'lr': 0.00036233291023843653, 'samples': 10377024, 'steps': 54046, 'loss/train': 1.0453904867172241} -08/30/2021 22:57:30 - INFO - __main__ - Step 54048: {'lr': 0.00036232816935330723, 'samples': 10377216, 'steps': 54047, 'loss/train': 1.4748709201812744} -08/30/2021 22:57:30 - INFO - __main__ - Step 54049: {'lr': 0.00036232342841756467, 'samples': 10377408, 'steps': 54048, 'loss/train': 1.144144058227539} -08/30/2021 22:57:31 - INFO - __main__ - Step 54050: {'lr': 0.00036231868743121095, 'samples': 10377600, 'steps': 54049, 'loss/train': 1.3348273038864136} -08/30/2021 22:57:31 - INFO - __main__ - Step 54051: {'lr': 0.0003623139463942481, 'samples': 10377792, 'steps': 54050, 'loss/train': 0.9061219096183777} -08/30/2021 22:57:32 - INFO - __main__ - Step 54052: {'lr': 0.0003623092053066783, 'samples': 10377984, 'steps': 54051, 'loss/train': 2.7090871334075928} -08/30/2021 22:57:33 - INFO - __main__ - Step 54053: {'lr': 0.0003623044641685037, 'samples': 10378176, 'steps': 54052, 'loss/train': 1.5605658292770386} -08/30/2021 22:57:34 - INFO - __main__ - Step 54054: {'lr': 0.00036229972297972644, 'samples': 10378368, 'steps': 54053, 'loss/train': 1.7433743476867676} -08/30/2021 22:57:34 - INFO - __main__ - Step 54055: {'lr': 0.00036229498174034867, 'samples': 10378560, 'steps': 54054, 'loss/train': 2.418992042541504} -08/30/2021 22:57:34 - INFO - __main__ - Step 54056: {'lr': 0.00036229024045037264, 'samples': 10378752, 'steps': 54055, 'loss/train': 1.3381084203720093} -08/30/2021 22:57:35 - INFO - __main__ - Step 54057: {'lr': 0.00036228549910980026, 'samples': 10378944, 'steps': 54056, 'loss/train': 1.6885634660720825} -08/30/2021 22:57:35 - INFO - __main__ - Step 54058: {'lr': 0.0003622807577186337, 'samples': 10379136, 'steps': 54057, 'loss/train': 1.3403220176696777} -08/30/2021 22:57:37 - INFO - __main__ - Step 54059: {'lr': 0.0003622760162768752, 'samples': 10379328, 'steps': 54058, 'loss/train': 1.2096168994903564} -08/30/2021 22:57:37 - INFO - __main__ - Step 54060: {'lr': 0.0003622712747845269, 'samples': 10379520, 'steps': 54059, 'loss/train': 1.6528197526931763} -08/30/2021 22:57:37 - INFO - __main__ - Step 54061: {'lr': 0.0003622665332415909, 'samples': 10379712, 'steps': 54060, 'loss/train': 0.06437007337808609} -08/30/2021 22:57:38 - INFO - __main__ - Step 54062: {'lr': 0.00036226179164806926, 'samples': 10379904, 'steps': 54061, 'loss/train': 1.6419748067855835} -08/30/2021 22:57:38 - INFO - __main__ - Step 54063: {'lr': 0.00036225705000396424, 'samples': 10380096, 'steps': 54062, 'loss/train': 0.9441823959350586} -08/30/2021 22:57:40 - INFO - __main__ - Step 54064: {'lr': 0.000362252308309278, 'samples': 10380288, 'steps': 54063, 'loss/train': 1.6567384004592896} -08/30/2021 22:57:40 - INFO - __main__ - Step 54065: {'lr': 0.00036224756656401245, 'samples': 10380480, 'steps': 54064, 'loss/train': 1.1339386701583862} -08/30/2021 22:57:40 - INFO - __main__ - Step 54066: {'lr': 0.0003622428247681699, 'samples': 10380672, 'steps': 54065, 'loss/train': 1.6598219871520996} -08/30/2021 22:57:41 - INFO - __main__ - Step 54067: {'lr': 0.0003622380829217526, 'samples': 10380864, 'steps': 54066, 'loss/train': 1.626612663269043} -08/30/2021 22:57:41 - INFO - __main__ - Step 54068: {'lr': 0.00036223334102476247, 'samples': 10381056, 'steps': 54067, 'loss/train': 1.0829334259033203} -08/30/2021 22:57:43 - INFO - __main__ - Step 54069: {'lr': 0.00036222859907720167, 'samples': 10381248, 'steps': 54068, 'loss/train': 0.7254710793495178} -08/30/2021 22:57:43 - INFO - __main__ - Step 54070: {'lr': 0.00036222385707907254, 'samples': 10381440, 'steps': 54069, 'loss/train': 1.5907626152038574} -08/30/2021 22:57:43 - INFO - __main__ - Step 54071: {'lr': 0.000362219115030377, 'samples': 10381632, 'steps': 54070, 'loss/train': 1.2088876962661743} -08/30/2021 22:57:44 - INFO - __main__ - Step 54072: {'lr': 0.0003622143729311172, 'samples': 10381824, 'steps': 54071, 'loss/train': 1.6792110204696655} -08/30/2021 22:57:44 - INFO - __main__ - Step 54073: {'lr': 0.00036220963078129536, 'samples': 10382016, 'steps': 54072, 'loss/train': 1.7058193683624268} -08/30/2021 22:57:46 - INFO - __main__ - Step 54074: {'lr': 0.0003622048885809136, 'samples': 10382208, 'steps': 54073, 'loss/train': 1.7429540157318115} -08/30/2021 22:57:47 - INFO - __main__ - Step 54075: {'lr': 0.0003622001463299741, 'samples': 10382400, 'steps': 54074, 'loss/train': 1.2515110969543457} -08/30/2021 22:57:47 - INFO - __main__ - Step 54076: {'lr': 0.0003621954040284789, 'samples': 10382592, 'steps': 54075, 'loss/train': 0.630169689655304} -08/30/2021 22:57:47 - INFO - __main__ - Step 54077: {'lr': 0.00036219066167643015, 'samples': 10382784, 'steps': 54076, 'loss/train': 1.4024375677108765} -08/30/2021 22:57:48 - INFO - __main__ - Step 54078: {'lr': 0.00036218591927383, 'samples': 10382976, 'steps': 54077, 'loss/train': 1.435202956199646} -08/30/2021 22:57:49 - INFO - __main__ - Step 54079: {'lr': 0.00036218117682068076, 'samples': 10383168, 'steps': 54078, 'loss/train': 0.29466712474823} -08/30/2021 22:57:50 - INFO - __main__ - Step 54080: {'lr': 0.0003621764343169843, 'samples': 10383360, 'steps': 54079, 'loss/train': 1.1778478622436523} -08/30/2021 22:57:50 - INFO - __main__ - Step 54081: {'lr': 0.0003621716917627429, 'samples': 10383552, 'steps': 54080, 'loss/train': 0.09834454953670502} -08/30/2021 22:57:50 - INFO - __main__ - Step 54082: {'lr': 0.0003621669491579587, 'samples': 10383744, 'steps': 54081, 'loss/train': 1.401611089706421} -08/30/2021 22:57:51 - INFO - __main__ - Step 54083: {'lr': 0.0003621622065026337, 'samples': 10383936, 'steps': 54082, 'loss/train': 1.4323993921279907} -08/30/2021 22:57:52 - INFO - __main__ - Step 54084: {'lr': 0.0003621574637967702, 'samples': 10384128, 'steps': 54083, 'loss/train': 1.2989877462387085} -08/30/2021 22:57:53 - INFO - __main__ - Step 54085: {'lr': 0.00036215272104037023, 'samples': 10384320, 'steps': 54084, 'loss/train': 1.7603942155838013} -08/30/2021 22:57:53 - INFO - __main__ - Step 54086: {'lr': 0.0003621479782334361, 'samples': 10384512, 'steps': 54085, 'loss/train': 1.627334475517273} -08/30/2021 22:57:53 - INFO - __main__ - Step 54087: {'lr': 0.00036214323537596974, 'samples': 10384704, 'steps': 54086, 'loss/train': 1.3577144145965576} -08/30/2021 22:57:54 - INFO - __main__ - Step 54088: {'lr': 0.0003621384924679733, 'samples': 10384896, 'steps': 54087, 'loss/train': 1.2363277673721313} -08/30/2021 22:57:54 - INFO - __main__ - Step 54089: {'lr': 0.00036213374950944913, 'samples': 10385088, 'steps': 54088, 'loss/train': 1.3616971969604492} -08/30/2021 22:57:55 - INFO - __main__ - Step 54090: {'lr': 0.0003621290065003991, 'samples': 10385280, 'steps': 54089, 'loss/train': 1.0444917678833008} -08/30/2021 22:57:56 - INFO - __main__ - Step 54091: {'lr': 0.00036212426344082554, 'samples': 10385472, 'steps': 54090, 'loss/train': 1.1713694334030151} -08/30/2021 22:57:56 - INFO - __main__ - Step 54092: {'lr': 0.0003621195203307305, 'samples': 10385664, 'steps': 54091, 'loss/train': 1.3787810802459717} -08/30/2021 22:57:57 - INFO - __main__ - Step 54093: {'lr': 0.0003621147771701161, 'samples': 10385856, 'steps': 54092, 'loss/train': 1.375692367553711} -08/30/2021 22:57:57 - INFO - __main__ - Step 54094: {'lr': 0.00036211003395898456, 'samples': 10386048, 'steps': 54093, 'loss/train': 1.5688828229904175} -08/30/2021 22:57:59 - INFO - __main__ - Step 54095: {'lr': 0.0003621052906973379, 'samples': 10386240, 'steps': 54094, 'loss/train': 1.0351804494857788} -08/30/2021 22:57:59 - INFO - __main__ - Step 54096: {'lr': 0.0003621005473851784, 'samples': 10386432, 'steps': 54095, 'loss/train': 0.8776874542236328} -08/30/2021 22:57:59 - INFO - __main__ - Step 54097: {'lr': 0.0003620958040225081, 'samples': 10386624, 'steps': 54096, 'loss/train': 1.390691876411438} -08/30/2021 22:58:00 - INFO - __main__ - Step 54098: {'lr': 0.0003620910606093292, 'samples': 10386816, 'steps': 54097, 'loss/train': 1.2313324213027954} -08/30/2021 22:58:00 - INFO - __main__ - Step 54099: {'lr': 0.0003620863171456437, 'samples': 10387008, 'steps': 54098, 'loss/train': 0.034721489995718} -08/30/2021 22:58:02 - INFO - __main__ - Step 54100: {'lr': 0.0003620815736314539, 'samples': 10387200, 'steps': 54099, 'loss/train': 0.8360977172851562} -08/30/2021 22:58:02 - INFO - __main__ - Step 54101: {'lr': 0.0003620768300667618, 'samples': 10387392, 'steps': 54100, 'loss/train': 0.8581121563911438} -08/30/2021 22:58:03 - INFO - __main__ - Step 54102: {'lr': 0.00036207208645156977, 'samples': 10387584, 'steps': 54101, 'loss/train': 0.03505820780992508} -08/30/2021 22:58:03 - INFO - __main__ - Step 54103: {'lr': 0.00036206734278587964, 'samples': 10387776, 'steps': 54102, 'loss/train': 1.4135011434555054} -08/30/2021 22:58:04 - INFO - __main__ - Step 54104: {'lr': 0.0003620625990696937, 'samples': 10387968, 'steps': 54103, 'loss/train': 1.3703819513320923} -08/30/2021 22:58:04 - INFO - __main__ - Step 54105: {'lr': 0.00036205785530301417, 'samples': 10388160, 'steps': 54104, 'loss/train': 1.5602731704711914} -08/30/2021 22:58:05 - INFO - __main__ - Step 54106: {'lr': 0.00036205311148584306, 'samples': 10388352, 'steps': 54105, 'loss/train': 1.3221800327301025} -08/30/2021 22:58:06 - INFO - __main__ - Step 54107: {'lr': 0.00036204836761818255, 'samples': 10388544, 'steps': 54106, 'loss/train': 1.3876063823699951} -08/30/2021 22:58:06 - INFO - __main__ - Step 54108: {'lr': 0.00036204362370003475, 'samples': 10388736, 'steps': 54107, 'loss/train': 0.9098288416862488} -08/30/2021 22:58:07 - INFO - __main__ - Step 54109: {'lr': 0.00036203887973140184, 'samples': 10388928, 'steps': 54108, 'loss/train': 1.562433123588562} -08/30/2021 22:58:07 - INFO - __main__ - Step 54110: {'lr': 0.000362034135712286, 'samples': 10389120, 'steps': 54109, 'loss/train': 1.390947937965393} -08/30/2021 22:58:08 - INFO - __main__ - Step 54111: {'lr': 0.00036202939164268924, 'samples': 10389312, 'steps': 54110, 'loss/train': 1.441522240638733} -08/30/2021 22:58:09 - INFO - __main__ - Step 54112: {'lr': 0.0003620246475226138, 'samples': 10389504, 'steps': 54111, 'loss/train': 1.498203158378601} -08/30/2021 22:58:09 - INFO - __main__ - Step 54113: {'lr': 0.0003620199033520617, 'samples': 10389696, 'steps': 54112, 'loss/train': 1.418110966682434} -08/30/2021 22:58:09 - INFO - __main__ - Step 54114: {'lr': 0.0003620151591310352, 'samples': 10389888, 'steps': 54113, 'loss/train': 1.5095621347427368} -08/30/2021 22:58:10 - INFO - __main__ - Step 54115: {'lr': 0.0003620104148595364, 'samples': 10390080, 'steps': 54114, 'loss/train': 1.5566352605819702} -08/30/2021 22:58:11 - INFO - __main__ - Step 54116: {'lr': 0.00036200567053756746, 'samples': 10390272, 'steps': 54115, 'loss/train': 1.2761110067367554} -08/30/2021 22:58:12 - INFO - __main__ - Step 54117: {'lr': 0.0003620009261651305, 'samples': 10390464, 'steps': 54116, 'loss/train': 1.213962197303772} -08/30/2021 22:58:12 - INFO - __main__ - Step 54118: {'lr': 0.0003619961817422276, 'samples': 10390656, 'steps': 54117, 'loss/train': 1.5254822969436646} -08/30/2021 22:58:12 - INFO - __main__ - Step 54119: {'lr': 0.00036199143726886097, 'samples': 10390848, 'steps': 54118, 'loss/train': 1.5034877061843872} -08/30/2021 22:58:13 - INFO - __main__ - Step 54120: {'lr': 0.00036198669274503274, 'samples': 10391040, 'steps': 54119, 'loss/train': 1.5984971523284912} -08/30/2021 22:58:15 - INFO - __main__ - Step 54121: {'lr': 0.00036198194817074503, 'samples': 10391232, 'steps': 54120, 'loss/train': 1.1868547201156616} -08/30/2021 22:58:15 - INFO - __main__ - Step 54122: {'lr': 0.00036197720354599997, 'samples': 10391424, 'steps': 54121, 'loss/train': 1.0521479845046997} -08/30/2021 22:58:15 - INFO - __main__ - Step 54123: {'lr': 0.0003619724588707997, 'samples': 10391616, 'steps': 54122, 'loss/train': 1.8686732053756714} -08/30/2021 22:58:16 - INFO - __main__ - Step 54124: {'lr': 0.00036196771414514643, 'samples': 10391808, 'steps': 54123, 'loss/train': 1.7459044456481934} -08/30/2021 22:58:16 - INFO - __main__ - Step 54125: {'lr': 0.0003619629693690422, 'samples': 10392000, 'steps': 54124, 'loss/train': 0.03861915320158005} -08/30/2021 22:58:17 - INFO - __main__ - Step 54126: {'lr': 0.00036195822454248916, 'samples': 10392192, 'steps': 54125, 'loss/train': 0.7102423906326294} -08/30/2021 22:58:17 - INFO - __main__ - Step 54127: {'lr': 0.00036195347966548955, 'samples': 10392384, 'steps': 54126, 'loss/train': 1.558639407157898} -08/30/2021 22:58:19 - INFO - __main__ - Step 54128: {'lr': 0.0003619487347380454, 'samples': 10392576, 'steps': 54127, 'loss/train': 2.4915640354156494} -08/30/2021 22:58:20 - INFO - __main__ - Step 54129: {'lr': 0.00036194398976015875, 'samples': 10392768, 'steps': 54128, 'loss/train': 0.8673027157783508} -08/30/2021 22:58:20 - INFO - __main__ - Step 54130: {'lr': 0.00036193924473183205, 'samples': 10392960, 'steps': 54129, 'loss/train': 1.2030518054962158} -08/30/2021 22:58:20 - INFO - __main__ - Step 54131: {'lr': 0.00036193449965306714, 'samples': 10393152, 'steps': 54130, 'loss/train': 1.3709392547607422} -08/30/2021 22:58:21 - INFO - __main__ - Step 54132: {'lr': 0.0003619297545238663, 'samples': 10393344, 'steps': 54131, 'loss/train': 1.8056080341339111} -08/30/2021 22:58:22 - INFO - __main__ - Step 54133: {'lr': 0.00036192500934423163, 'samples': 10393536, 'steps': 54132, 'loss/train': 0.1497471034526825} -08/30/2021 22:58:23 - INFO - __main__ - Step 54134: {'lr': 0.0003619202641141652, 'samples': 10393728, 'steps': 54133, 'loss/train': 1.1492186784744263} -08/30/2021 22:58:23 - INFO - __main__ - Step 54135: {'lr': 0.00036191551883366937, 'samples': 10393920, 'steps': 54134, 'loss/train': 1.6520380973815918} -08/30/2021 22:58:23 - INFO - __main__ - Step 54136: {'lr': 0.000361910773502746, 'samples': 10394112, 'steps': 54135, 'loss/train': 0.6784459352493286} -08/30/2021 22:58:24 - INFO - __main__ - Step 54137: {'lr': 0.00036190602812139757, 'samples': 10394304, 'steps': 54136, 'loss/train': 1.8451042175292969} -08/30/2021 22:58:26 - INFO - __main__ - Step 54138: {'lr': 0.00036190128268962586, 'samples': 10394496, 'steps': 54137, 'loss/train': 0.33997997641563416} -08/30/2021 22:58:26 - INFO - __main__ - Step 54139: {'lr': 0.00036189653720743317, 'samples': 10394688, 'steps': 54138, 'loss/train': 1.1718989610671997} -08/30/2021 22:58:26 - INFO - __main__ - Step 54140: {'lr': 0.0003618917916748216, 'samples': 10394880, 'steps': 54139, 'loss/train': 1.874208927154541} -08/30/2021 22:58:27 - INFO - __main__ - Step 54141: {'lr': 0.00036188704609179333, 'samples': 10395072, 'steps': 54140, 'loss/train': 0.07980351895093918} -08/30/2021 22:58:27 - INFO - __main__ - Step 54142: {'lr': 0.00036188230045835053, 'samples': 10395264, 'steps': 54141, 'loss/train': 1.3706554174423218} -08/30/2021 22:58:29 - INFO - __main__ - Step 54143: {'lr': 0.00036187755477449525, 'samples': 10395456, 'steps': 54142, 'loss/train': 0.09378743171691895} -08/30/2021 22:58:29 - INFO - __main__ - Step 54144: {'lr': 0.00036187280904022973, 'samples': 10395648, 'steps': 54143, 'loss/train': 1.2493839263916016} -08/30/2021 22:58:30 - INFO - __main__ - Step 54145: {'lr': 0.000361868063255556, 'samples': 10395840, 'steps': 54144, 'loss/train': 1.3576929569244385} -08/30/2021 22:58:30 - INFO - __main__ - Step 54146: {'lr': 0.00036186331742047627, 'samples': 10396032, 'steps': 54145, 'loss/train': 1.3930189609527588} -08/30/2021 22:58:30 - INFO - __main__ - Step 54147: {'lr': 0.0003618585715349926, 'samples': 10396224, 'steps': 54146, 'loss/train': 0.05383821204304695} -08/30/2021 22:58:32 - INFO - __main__ - Step 54148: {'lr': 0.00036185382559910723, 'samples': 10396416, 'steps': 54147, 'loss/train': 1.3092625141143799} -08/30/2021 22:58:32 - INFO - __main__ - Step 54149: {'lr': 0.0003618490796128222, 'samples': 10396608, 'steps': 54148, 'loss/train': 0.9480769038200378} -08/30/2021 22:58:33 - INFO - __main__ - Step 54150: {'lr': 0.0003618443335761398, 'samples': 10396800, 'steps': 54149, 'loss/train': 1.4428114891052246} -08/30/2021 22:58:33 - INFO - __main__ - Step 54151: {'lr': 0.00036183958748906204, 'samples': 10396992, 'steps': 54150, 'loss/train': 1.3658024072647095} -08/30/2021 22:58:33 - INFO - __main__ - Step 54152: {'lr': 0.00036183484135159105, 'samples': 10397184, 'steps': 54151, 'loss/train': 1.4825936555862427} -08/30/2021 22:58:35 - INFO - __main__ - Step 54153: {'lr': 0.000361830095163729, 'samples': 10397376, 'steps': 54152, 'loss/train': 1.2851667404174805} -08/30/2021 22:58:35 - INFO - __main__ - Step 54154: {'lr': 0.000361825348925478, 'samples': 10397568, 'steps': 54153, 'loss/train': 1.2316964864730835} -08/30/2021 22:58:36 - INFO - __main__ - Step 54155: {'lr': 0.0003618206026368403, 'samples': 10397760, 'steps': 54154, 'loss/train': 1.2137839794158936} -08/30/2021 22:58:36 - INFO - __main__ - Step 54156: {'lr': 0.00036181585629781795, 'samples': 10397952, 'steps': 54155, 'loss/train': 1.1795769929885864} -08/30/2021 22:58:36 - INFO - __main__ - Step 54157: {'lr': 0.0003618111099084131, 'samples': 10398144, 'steps': 54156, 'loss/train': 1.2153394222259521} -08/30/2021 22:58:37 - INFO - __main__ - Step 54158: {'lr': 0.00036180636346862786, 'samples': 10398336, 'steps': 54157, 'loss/train': 1.553842544555664} -08/30/2021 22:58:38 - INFO - __main__ - Step 54159: {'lr': 0.0003618016169784645, 'samples': 10398528, 'steps': 54158, 'loss/train': 1.4840449094772339} -08/30/2021 22:58:39 - INFO - __main__ - Step 54160: {'lr': 0.0003617968704379249, 'samples': 10398720, 'steps': 54159, 'loss/train': 1.10103440284729} -08/30/2021 22:58:39 - INFO - __main__ - Step 54161: {'lr': 0.0003617921238470114, 'samples': 10398912, 'steps': 54160, 'loss/train': 1.065316081047058} -08/30/2021 22:58:40 - INFO - __main__ - Step 54162: {'lr': 0.00036178737720572615, 'samples': 10399104, 'steps': 54161, 'loss/train': 0.03477616608142853} -08/30/2021 22:58:40 - INFO - __main__ - Step 54163: {'lr': 0.0003617826305140712, 'samples': 10399296, 'steps': 54162, 'loss/train': 0.9488590359687805} -08/30/2021 22:58:41 - INFO - __main__ - Step 54164: {'lr': 0.0003617778837720488, 'samples': 10399488, 'steps': 54163, 'loss/train': 2.0428566932678223} -08/30/2021 22:58:42 - INFO - __main__ - Step 54165: {'lr': 0.00036177313697966087, 'samples': 10399680, 'steps': 54164, 'loss/train': 0.647103488445282} -08/30/2021 22:58:42 - INFO - __main__ - Step 54166: {'lr': 0.00036176839013690975, 'samples': 10399872, 'steps': 54165, 'loss/train': 0.9498745799064636} -08/30/2021 22:58:43 - INFO - __main__ - Step 54167: {'lr': 0.0003617636432437975, 'samples': 10400064, 'steps': 54166, 'loss/train': 1.2474161386489868} -08/30/2021 22:58:43 - INFO - __main__ - Step 54168: {'lr': 0.00036175889630032633, 'samples': 10400256, 'steps': 54167, 'loss/train': 1.1814148426055908} -08/30/2021 22:58:44 - INFO - __main__ - Step 54169: {'lr': 0.0003617541493064983, 'samples': 10400448, 'steps': 54168, 'loss/train': 1.4715523719787598} -08/30/2021 22:58:45 - INFO - __main__ - Step 54170: {'lr': 0.00036174940226231555, 'samples': 10400640, 'steps': 54169, 'loss/train': 1.2243895530700684} -08/30/2021 22:58:45 - INFO - __main__ - Step 54171: {'lr': 0.0003617446551677803, 'samples': 10400832, 'steps': 54170, 'loss/train': 0.5915573239326477} -08/30/2021 22:58:46 - INFO - __main__ - Step 54172: {'lr': 0.0003617399080228946, 'samples': 10401024, 'steps': 54171, 'loss/train': 1.074485421180725} -08/30/2021 22:58:46 - INFO - __main__ - Step 54173: {'lr': 0.0003617351608276606, 'samples': 10401216, 'steps': 54172, 'loss/train': 1.0588046312332153} -08/30/2021 22:58:48 - INFO - __main__ - Step 54174: {'lr': 0.00036173041358208047, 'samples': 10401408, 'steps': 54173, 'loss/train': 1.5918129682540894} -08/30/2021 22:58:49 - INFO - __main__ - Step 54175: {'lr': 0.0003617256662861563, 'samples': 10401600, 'steps': 54174, 'loss/train': 1.5564087629318237} -08/30/2021 22:58:49 - INFO - __main__ - Step 54176: {'lr': 0.00036172091893989033, 'samples': 10401792, 'steps': 54175, 'loss/train': 1.3992847204208374} -08/30/2021 22:58:50 - INFO - __main__ - Step 54177: {'lr': 0.0003617161715432847, 'samples': 10401984, 'steps': 54176, 'loss/train': 1.37216055393219} -08/30/2021 22:58:50 - INFO - __main__ - Step 54178: {'lr': 0.0003617114240963414, 'samples': 10402176, 'steps': 54177, 'loss/train': 1.7359832525253296} -08/30/2021 22:58:50 - INFO - __main__ - Step 54179: {'lr': 0.00036170667659906263, 'samples': 10402368, 'steps': 54178, 'loss/train': 0.7494610548019409} -08/30/2021 22:58:51 - INFO - __main__ - Step 54180: {'lr': 0.0003617019290514506, 'samples': 10402560, 'steps': 54179, 'loss/train': 0.42284879088401794} -08/30/2021 22:58:53 - INFO - __main__ - Step 54181: {'lr': 0.0003616971814535074, 'samples': 10402752, 'steps': 54180, 'loss/train': 0.35809949040412903} -08/30/2021 22:58:53 - INFO - __main__ - Step 54182: {'lr': 0.0003616924338052352, 'samples': 10402944, 'steps': 54181, 'loss/train': 1.7498009204864502} -08/30/2021 22:58:54 - INFO - __main__ - Step 54183: {'lr': 0.00036168768610663605, 'samples': 10403136, 'steps': 54182, 'loss/train': 1.431233525276184} -08/30/2021 22:58:54 - INFO - __main__ - Step 54184: {'lr': 0.0003616829383577123, 'samples': 10403328, 'steps': 54183, 'loss/train': 1.1427468061447144} -08/30/2021 22:58:54 - INFO - __main__ - Step 54185: {'lr': 0.00036167819055846575, 'samples': 10403520, 'steps': 54184, 'loss/train': 1.3367365598678589} -08/30/2021 22:58:56 - INFO - __main__ - Step 54186: {'lr': 0.0003616734427088988, 'samples': 10403712, 'steps': 54185, 'loss/train': 0.16596487164497375} -08/30/2021 22:58:56 - INFO - __main__ - Step 54187: {'lr': 0.00036166869480901354, 'samples': 10403904, 'steps': 54186, 'loss/train': 1.194364309310913} -08/30/2021 22:58:57 - INFO - __main__ - Step 54188: {'lr': 0.0003616639468588121, 'samples': 10404096, 'steps': 54187, 'loss/train': 1.3934091329574585} -08/30/2021 22:58:57 - INFO - __main__ - Step 54189: {'lr': 0.00036165919885829654, 'samples': 10404288, 'steps': 54188, 'loss/train': 0.9677462577819824} -08/30/2021 22:58:57 - INFO - __main__ - Step 54190: {'lr': 0.0003616544508074691, 'samples': 10404480, 'steps': 54189, 'loss/train': 1.6321250200271606} -08/30/2021 22:58:59 - INFO - __main__ - Step 54191: {'lr': 0.00036164970270633195, 'samples': 10404672, 'steps': 54190, 'loss/train': 0.7174428105354309} -08/30/2021 22:58:59 - INFO - __main__ - Step 54192: {'lr': 0.0003616449545548871, 'samples': 10404864, 'steps': 54191, 'loss/train': 1.8042601346969604} -08/30/2021 22:59:00 - INFO - __main__ - Step 54193: {'lr': 0.00036164020635313677, 'samples': 10405056, 'steps': 54192, 'loss/train': 1.4498096704483032} -08/30/2021 22:59:00 - INFO - __main__ - Step 54194: {'lr': 0.0003616354581010831, 'samples': 10405248, 'steps': 54193, 'loss/train': 1.6507689952850342} -08/30/2021 22:59:00 - INFO - __main__ - Step 54195: {'lr': 0.0003616307097987282, 'samples': 10405440, 'steps': 54194, 'loss/train': 1.632206916809082} -08/30/2021 22:59:02 - INFO - __main__ - Step 54196: {'lr': 0.00036162596144607425, 'samples': 10405632, 'steps': 54195, 'loss/train': 1.4007915258407593} -08/30/2021 22:59:03 - INFO - __main__ - Step 54197: {'lr': 0.00036162121304312336, 'samples': 10405824, 'steps': 54196, 'loss/train': 1.2193647623062134} -08/30/2021 22:59:03 - INFO - __main__ - Step 54198: {'lr': 0.0003616164645898776, 'samples': 10406016, 'steps': 54197, 'loss/train': 1.065858006477356} -08/30/2021 22:59:03 - INFO - __main__ - Step 54199: {'lr': 0.0003616117160863393, 'samples': 10406208, 'steps': 54198, 'loss/train': 1.6092778444290161} -08/30/2021 22:59:04 - INFO - __main__ - Step 54200: {'lr': 0.00036160696753251043, 'samples': 10406400, 'steps': 54199, 'loss/train': 3.4266304969787598} -08/30/2021 22:59:04 - INFO - __main__ - Step 54201: {'lr': 0.0003616022189283932, 'samples': 10406592, 'steps': 54200, 'loss/train': 1.0664523839950562} -08/30/2021 22:59:05 - INFO - __main__ - Step 54202: {'lr': 0.00036159747027398963, 'samples': 10406784, 'steps': 54201, 'loss/train': 0.6084858775138855} -08/30/2021 22:59:06 - INFO - __main__ - Step 54203: {'lr': 0.0003615927215693021, 'samples': 10406976, 'steps': 54202, 'loss/train': 0.879784107208252} -08/30/2021 22:59:06 - INFO - __main__ - Step 54204: {'lr': 0.0003615879728143325, 'samples': 10407168, 'steps': 54203, 'loss/train': 1.2554460763931274} -08/30/2021 22:59:07 - INFO - __main__ - Step 54205: {'lr': 0.00036158322400908316, 'samples': 10407360, 'steps': 54204, 'loss/train': 1.0786643028259277} -08/30/2021 22:59:07 - INFO - __main__ - Step 54206: {'lr': 0.00036157847515355614, 'samples': 10407552, 'steps': 54205, 'loss/train': 0.7475901246070862} -08/30/2021 22:59:09 - INFO - __main__ - Step 54207: {'lr': 0.0003615737262477535, 'samples': 10407744, 'steps': 54206, 'loss/train': 1.323480486869812} -08/30/2021 22:59:10 - INFO - __main__ - Step 54208: {'lr': 0.0003615689772916776, 'samples': 10407936, 'steps': 54207, 'loss/train': 0.803510844707489} -08/30/2021 22:59:10 - INFO - __main__ - Step 54209: {'lr': 0.00036156422828533035, 'samples': 10408128, 'steps': 54208, 'loss/train': 0.7921726703643799} -08/30/2021 22:59:11 - INFO - __main__ - Step 54210: {'lr': 0.000361559479228714, 'samples': 10408320, 'steps': 54209, 'loss/train': 1.9012155532836914} -08/30/2021 22:59:11 - INFO - __main__ - Step 54211: {'lr': 0.00036155473012183066, 'samples': 10408512, 'steps': 54210, 'loss/train': 1.127052903175354} -08/30/2021 22:59:11 - INFO - __main__ - Step 54212: {'lr': 0.00036154998096468244, 'samples': 10408704, 'steps': 54211, 'loss/train': 1.3459440469741821} -08/30/2021 22:59:12 - INFO - __main__ - Step 54213: {'lr': 0.00036154523175727153, 'samples': 10408896, 'steps': 54212, 'loss/train': 1.5702800750732422} -08/30/2021 22:59:13 - INFO - __main__ - Step 54214: {'lr': 0.00036154048249960015, 'samples': 10409088, 'steps': 54213, 'loss/train': 1.400362253189087} -08/30/2021 22:59:14 - INFO - __main__ - Step 54215: {'lr': 0.0003615357331916703, 'samples': 10409280, 'steps': 54214, 'loss/train': 1.5849727392196655} -08/30/2021 22:59:14 - INFO - __main__ - Step 54216: {'lr': 0.0003615309838334841, 'samples': 10409472, 'steps': 54215, 'loss/train': 1.2600560188293457} -08/30/2021 22:59:15 - INFO - __main__ - Step 54217: {'lr': 0.00036152623442504386, 'samples': 10409664, 'steps': 54216, 'loss/train': 1.2272979021072388} -08/30/2021 22:59:15 - INFO - __main__ - Step 54218: {'lr': 0.0003615214849663516, 'samples': 10409856, 'steps': 54217, 'loss/train': 0.1535966694355011} -08/30/2021 22:59:16 - INFO - __main__ - Step 54219: {'lr': 0.0003615167354574094, 'samples': 10410048, 'steps': 54218, 'loss/train': 1.2791833877563477} -08/30/2021 22:59:17 - INFO - __main__ - Step 54220: {'lr': 0.0003615119858982196, 'samples': 10410240, 'steps': 54219, 'loss/train': 1.2066028118133545} -08/30/2021 22:59:17 - INFO - __main__ - Step 54221: {'lr': 0.0003615072362887841, 'samples': 10410432, 'steps': 54220, 'loss/train': 1.60999596118927} -08/30/2021 22:59:18 - INFO - __main__ - Step 54222: {'lr': 0.0003615024866291052, 'samples': 10410624, 'steps': 54221, 'loss/train': 0.7926939129829407} -08/30/2021 22:59:18 - INFO - __main__ - Step 54223: {'lr': 0.0003614977369191851, 'samples': 10410816, 'steps': 54222, 'loss/train': 1.4695885181427002} -08/30/2021 22:59:19 - INFO - __main__ - Step 54224: {'lr': 0.00036149298715902573, 'samples': 10411008, 'steps': 54223, 'loss/train': 1.1728781461715698} -08/30/2021 22:59:20 - INFO - __main__ - Step 54225: {'lr': 0.00036148823734862934, 'samples': 10411200, 'steps': 54224, 'loss/train': 1.0331125259399414} -08/30/2021 22:59:20 - INFO - __main__ - Step 54226: {'lr': 0.00036148348748799816, 'samples': 10411392, 'steps': 54225, 'loss/train': 1.4559595584869385} -08/30/2021 22:59:21 - INFO - __main__ - Step 54227: {'lr': 0.00036147873757713417, 'samples': 10411584, 'steps': 54226, 'loss/train': 1.544517159461975} -08/30/2021 22:59:21 - INFO - __main__ - Step 54228: {'lr': 0.0003614739876160396, 'samples': 10411776, 'steps': 54227, 'loss/train': 1.3546228408813477} -08/30/2021 22:59:23 - INFO - __main__ - Step 54229: {'lr': 0.0003614692376047165, 'samples': 10411968, 'steps': 54228, 'loss/train': 1.2377036809921265} -08/30/2021 22:59:23 - INFO - __main__ - Step 54230: {'lr': 0.00036146448754316717, 'samples': 10412160, 'steps': 54229, 'loss/train': 1.2535866498947144} -08/30/2021 22:59:23 - INFO - __main__ - Step 54231: {'lr': 0.0003614597374313937, 'samples': 10412352, 'steps': 54230, 'loss/train': 1.4869279861450195} -08/30/2021 22:59:24 - INFO - __main__ - Step 54232: {'lr': 0.00036145498726939806, 'samples': 10412544, 'steps': 54231, 'loss/train': 0.9444723129272461} -08/30/2021 22:59:24 - INFO - __main__ - Step 54233: {'lr': 0.0003614502370571826, 'samples': 10412736, 'steps': 54232, 'loss/train': 0.5442521572113037} -08/30/2021 22:59:24 - INFO - __main__ - Step 54234: {'lr': 0.00036144548679474943, 'samples': 10412928, 'steps': 54233, 'loss/train': 0.5774440765380859} -08/30/2021 22:59:26 - INFO - __main__ - Step 54235: {'lr': 0.0003614407364821005, 'samples': 10413120, 'steps': 54234, 'loss/train': 3.4268136024475098} -08/30/2021 22:59:27 - INFO - __main__ - Step 54236: {'lr': 0.0003614359861192382, 'samples': 10413312, 'steps': 54235, 'loss/train': 1.2223607301712036} -08/30/2021 22:59:27 - INFO - __main__ - Step 54237: {'lr': 0.00036143123570616455, 'samples': 10413504, 'steps': 54236, 'loss/train': 1.7738897800445557} -08/30/2021 22:59:27 - INFO - __main__ - Step 54238: {'lr': 0.0003614264852428817, 'samples': 10413696, 'steps': 54237, 'loss/train': 1.0485506057739258} -08/30/2021 22:59:28 - INFO - __main__ - Step 54239: {'lr': 0.0003614217347293918, 'samples': 10413888, 'steps': 54238, 'loss/train': 0.057003192603588104} -08/30/2021 22:59:28 - INFO - __main__ - Step 54240: {'lr': 0.000361416984165697, 'samples': 10414080, 'steps': 54239, 'loss/train': 1.8271238803863525} -08/30/2021 22:59:30 - INFO - __main__ - Step 54241: {'lr': 0.0003614122335517994, 'samples': 10414272, 'steps': 54240, 'loss/train': 1.7151165008544922} -08/30/2021 22:59:31 - INFO - __main__ - Step 54242: {'lr': 0.0003614074828877012, 'samples': 10414464, 'steps': 54241, 'loss/train': 1.3838129043579102} -08/30/2021 22:59:31 - INFO - __main__ - Step 54243: {'lr': 0.00036140273217340446, 'samples': 10414656, 'steps': 54242, 'loss/train': 1.9005241394042969} -08/30/2021 22:59:31 - INFO - __main__ - Step 54244: {'lr': 0.00036139798140891134, 'samples': 10414848, 'steps': 54243, 'loss/train': 1.2426371574401855} -08/30/2021 22:59:32 - INFO - __main__ - Step 54245: {'lr': 0.0003613932305942241, 'samples': 10415040, 'steps': 54244, 'loss/train': 1.113200306892395} -08/30/2021 22:59:33 - INFO - __main__ - Step 54246: {'lr': 0.00036138847972934477, 'samples': 10415232, 'steps': 54245, 'loss/train': 1.407149076461792} -08/30/2021 22:59:34 - INFO - __main__ - Step 54247: {'lr': 0.0003613837288142755, 'samples': 10415424, 'steps': 54246, 'loss/train': 1.5452519655227661} -08/30/2021 22:59:34 - INFO - __main__ - Step 54248: {'lr': 0.00036137897784901843, 'samples': 10415616, 'steps': 54247, 'loss/train': 0.7409790754318237} -08/30/2021 22:59:34 - INFO - __main__ - Step 54249: {'lr': 0.00036137422683357566, 'samples': 10415808, 'steps': 54248, 'loss/train': 1.4738839864730835} -08/30/2021 22:59:35 - INFO - __main__ - Step 54250: {'lr': 0.00036136947576794945, 'samples': 10416000, 'steps': 54249, 'loss/train': 1.518761396408081} -08/30/2021 22:59:36 - INFO - __main__ - Step 54251: {'lr': 0.00036136472465214187, 'samples': 10416192, 'steps': 54250, 'loss/train': 1.5369452238082886} -08/30/2021 22:59:37 - INFO - __main__ - Step 54252: {'lr': 0.00036135997348615503, 'samples': 10416384, 'steps': 54251, 'loss/train': 1.0127211809158325} -08/30/2021 22:59:37 - INFO - __main__ - Step 54253: {'lr': 0.00036135522226999115, 'samples': 10416576, 'steps': 54252, 'loss/train': 0.9309428930282593} -08/30/2021 22:59:37 - INFO - __main__ - Step 54254: {'lr': 0.00036135047100365223, 'samples': 10416768, 'steps': 54253, 'loss/train': 0.9776472449302673} -08/30/2021 22:59:38 - INFO - __main__ - Step 54255: {'lr': 0.00036134571968714056, 'samples': 10416960, 'steps': 54254, 'loss/train': 0.6639416813850403} -08/30/2021 22:59:38 - INFO - __main__ - Step 54256: {'lr': 0.00036134096832045825, 'samples': 10417152, 'steps': 54255, 'loss/train': 1.078926682472229} -08/30/2021 22:59:40 - INFO - __main__ - Step 54257: {'lr': 0.0003613362169036074, 'samples': 10417344, 'steps': 54256, 'loss/train': 1.7038991451263428} -08/30/2021 22:59:40 - INFO - __main__ - Step 54258: {'lr': 0.00036133146543659026, 'samples': 10417536, 'steps': 54257, 'loss/train': 1.41621994972229} -08/30/2021 22:59:40 - INFO - __main__ - Step 54259: {'lr': 0.00036132671391940875, 'samples': 10417728, 'steps': 54258, 'loss/train': 1.4720511436462402} -08/30/2021 22:59:41 - INFO - __main__ - Step 54260: {'lr': 0.0003613219623520652, 'samples': 10417920, 'steps': 54259, 'loss/train': 1.2003247737884521} -08/30/2021 22:59:41 - INFO - __main__ - Step 54261: {'lr': 0.00036131721073456163, 'samples': 10418112, 'steps': 54260, 'loss/train': 1.0252692699432373} -08/30/2021 22:59:43 - INFO - __main__ - Step 54262: {'lr': 0.0003613124590669003, 'samples': 10418304, 'steps': 54261, 'loss/train': 0.974557101726532} -08/30/2021 22:59:43 - INFO - __main__ - Step 54263: {'lr': 0.0003613077073490832, 'samples': 10418496, 'steps': 54262, 'loss/train': 1.3212673664093018} -08/30/2021 22:59:44 - INFO - __main__ - Step 54264: {'lr': 0.0003613029555811127, 'samples': 10418688, 'steps': 54263, 'loss/train': 0.159384086728096} -08/30/2021 22:59:44 - INFO - __main__ - Step 54265: {'lr': 0.0003612982037629908, 'samples': 10418880, 'steps': 54264, 'loss/train': 1.466238260269165} -08/30/2021 22:59:44 - INFO - __main__ - Step 54266: {'lr': 0.0003612934518947196, 'samples': 10419072, 'steps': 54265, 'loss/train': 1.327729344367981} -08/30/2021 22:59:46 - INFO - __main__ - Step 54267: {'lr': 0.00036128869997630134, 'samples': 10419264, 'steps': 54266, 'loss/train': 1.7651138305664062} -08/30/2021 22:59:46 - INFO - __main__ - Step 54268: {'lr': 0.000361283948007738, 'samples': 10419456, 'steps': 54267, 'loss/train': 1.2321785688400269} -08/30/2021 22:59:47 - INFO - __main__ - Step 54269: {'lr': 0.00036127919598903186, 'samples': 10419648, 'steps': 54268, 'loss/train': 1.2316728830337524} -08/30/2021 22:59:47 - INFO - __main__ - Step 54270: {'lr': 0.00036127444392018503, 'samples': 10419840, 'steps': 54269, 'loss/train': 1.0768077373504639} -08/30/2021 22:59:47 - INFO - __main__ - Step 54271: {'lr': 0.00036126969180119977, 'samples': 10420032, 'steps': 54270, 'loss/train': 2.1287810802459717} -08/30/2021 22:59:49 - INFO - __main__ - Step 54272: {'lr': 0.000361264939632078, 'samples': 10420224, 'steps': 54271, 'loss/train': 0.8181988596916199} -08/30/2021 22:59:50 - INFO - __main__ - Step 54273: {'lr': 0.00036126018741282194, 'samples': 10420416, 'steps': 54272, 'loss/train': 1.167194128036499} -08/30/2021 22:59:50 - INFO - __main__ - Step 54274: {'lr': 0.0003612554351434338, 'samples': 10420608, 'steps': 54273, 'loss/train': 1.6690635681152344} -08/30/2021 22:59:50 - INFO - __main__ - Step 54275: {'lr': 0.0003612506828239157, 'samples': 10420800, 'steps': 54274, 'loss/train': 1.6225290298461914} -08/30/2021 22:59:51 - INFO - __main__ - Step 54276: {'lr': 0.00036124593045426973, 'samples': 10420992, 'steps': 54275, 'loss/train': 1.4091507196426392} -08/30/2021 22:59:51 - INFO - __main__ - Step 54277: {'lr': 0.00036124117803449805, 'samples': 10421184, 'steps': 54276, 'loss/train': 1.0258644819259644} -08/30/2021 22:59:53 - INFO - __main__ - Step 54278: {'lr': 0.00036123642556460284, 'samples': 10421376, 'steps': 54277, 'loss/train': 0.03130926191806793} -08/30/2021 22:59:53 - INFO - __main__ - Step 54279: {'lr': 0.0003612316730445862, 'samples': 10421568, 'steps': 54278, 'loss/train': 1.3339954614639282} -08/30/2021 22:59:53 - INFO - __main__ - Step 54280: {'lr': 0.00036122692047445027, 'samples': 10421760, 'steps': 54279, 'loss/train': 0.13934817910194397} -08/30/2021 22:59:54 - INFO - __main__ - Step 54281: {'lr': 0.00036122216785419725, 'samples': 10421952, 'steps': 54280, 'loss/train': 1.2006418704986572} -08/30/2021 22:59:54 - INFO - __main__ - Step 54282: {'lr': 0.00036121741518382915, 'samples': 10422144, 'steps': 54281, 'loss/train': 1.534908413887024} -08/30/2021 22:59:56 - INFO - __main__ - Step 54283: {'lr': 0.00036121266246334825, 'samples': 10422336, 'steps': 54282, 'loss/train': 1.3351444005966187} -08/30/2021 22:59:56 - INFO - __main__ - Step 54284: {'lr': 0.00036120790969275667, 'samples': 10422528, 'steps': 54283, 'loss/train': 1.4599113464355469} -08/30/2021 22:59:56 - INFO - __main__ - Step 54285: {'lr': 0.0003612031568720565, 'samples': 10422720, 'steps': 54284, 'loss/train': 1.071659803390503} -08/30/2021 22:59:57 - INFO - __main__ - Step 54286: {'lr': 0.0003611984040012499, 'samples': 10422912, 'steps': 54285, 'loss/train': 0.8707094192504883} -08/30/2021 22:59:57 - INFO - __main__ - Step 54287: {'lr': 0.000361193651080339, 'samples': 10423104, 'steps': 54286, 'loss/train': 1.6434024572372437} -08/30/2021 22:59:59 - INFO - __main__ - Step 54288: {'lr': 0.000361188898109326, 'samples': 10423296, 'steps': 54287, 'loss/train': 1.622084617614746} -08/30/2021 22:59:59 - INFO - __main__ - Step 54289: {'lr': 0.00036118414508821295, 'samples': 10423488, 'steps': 54288, 'loss/train': 1.411124587059021} -08/30/2021 22:59:59 - INFO - __main__ - Step 54290: {'lr': 0.0003611793920170021, 'samples': 10423680, 'steps': 54289, 'loss/train': 1.420058012008667} -08/30/2021 23:00:00 - INFO - __main__ - Step 54291: {'lr': 0.0003611746388956955, 'samples': 10423872, 'steps': 54290, 'loss/train': 1.2150386571884155} -08/30/2021 23:00:00 - INFO - __main__ - Step 54292: {'lr': 0.00036116988572429534, 'samples': 10424064, 'steps': 54291, 'loss/train': 1.2232204675674438} -08/30/2021 23:00:02 - INFO - __main__ - Step 54293: {'lr': 0.0003611651325028037, 'samples': 10424256, 'steps': 54292, 'loss/train': 0.9685659408569336} -08/30/2021 23:00:03 - INFO - __main__ - Step 54294: {'lr': 0.0003611603792312228, 'samples': 10424448, 'steps': 54293, 'loss/train': 1.0455782413482666} -08/30/2021 23:00:03 - INFO - __main__ - Step 54295: {'lr': 0.0003611556259095547, 'samples': 10424640, 'steps': 54294, 'loss/train': 1.7435473203659058} -08/30/2021 23:00:04 - INFO - __main__ - Step 54296: {'lr': 0.00036115087253780164, 'samples': 10424832, 'steps': 54295, 'loss/train': 1.2525943517684937} -08/30/2021 23:00:04 - INFO - __main__ - Step 54297: {'lr': 0.0003611461191159657, 'samples': 10425024, 'steps': 54296, 'loss/train': 1.840232014656067} -08/30/2021 23:00:04 - INFO - __main__ - Step 54298: {'lr': 0.00036114136564404905, 'samples': 10425216, 'steps': 54297, 'loss/train': 0.4785672128200531} -08/30/2021 23:00:06 - INFO - __main__ - Step 54299: {'lr': 0.0003611366121220538, 'samples': 10425408, 'steps': 54298, 'loss/train': 1.0064611434936523} -08/30/2021 23:00:06 - INFO - __main__ - Step 54300: {'lr': 0.0003611318585499821, 'samples': 10425600, 'steps': 54299, 'loss/train': 1.299284815788269} -08/30/2021 23:00:07 - INFO - __main__ - Step 54301: {'lr': 0.00036112710492783605, 'samples': 10425792, 'steps': 54300, 'loss/train': 0.7138924598693848} -08/30/2021 23:00:07 - INFO - __main__ - Step 54302: {'lr': 0.0003611223512556179, 'samples': 10425984, 'steps': 54301, 'loss/train': 0.9210470914840698} -08/30/2021 23:00:07 - INFO - __main__ - Step 54303: {'lr': 0.0003611175975333297, 'samples': 10426176, 'steps': 54302, 'loss/train': 1.1328192949295044} -08/30/2021 23:00:09 - INFO - __main__ - Step 54304: {'lr': 0.0003611128437609737, 'samples': 10426368, 'steps': 54303, 'loss/train': 1.5380455255508423} -08/30/2021 23:00:09 - INFO - __main__ - Step 54305: {'lr': 0.00036110808993855195, 'samples': 10426560, 'steps': 54304, 'loss/train': 1.72883939743042} -08/30/2021 23:00:10 - INFO - __main__ - Step 54306: {'lr': 0.0003611033360660666, 'samples': 10426752, 'steps': 54305, 'loss/train': 1.994649887084961} -08/30/2021 23:00:10 - INFO - __main__ - Step 54307: {'lr': 0.00036109858214351977, 'samples': 10426944, 'steps': 54306, 'loss/train': 0.8268476724624634} -08/30/2021 23:00:10 - INFO - __main__ - Step 54308: {'lr': 0.0003610938281709136, 'samples': 10427136, 'steps': 54307, 'loss/train': 3.1488285064697266} -08/30/2021 23:00:12 - INFO - __main__ - Step 54309: {'lr': 0.0003610890741482503, 'samples': 10427328, 'steps': 54308, 'loss/train': 0.8107359409332275} -08/30/2021 23:00:12 - INFO - __main__ - Step 54310: {'lr': 0.000361084320075532, 'samples': 10427520, 'steps': 54309, 'loss/train': 1.6099568605422974} -08/30/2021 23:00:13 - INFO - __main__ - Step 54311: {'lr': 0.00036107956595276083, 'samples': 10427712, 'steps': 54310, 'loss/train': 1.3700376749038696} -08/30/2021 23:00:13 - INFO - __main__ - Step 54312: {'lr': 0.00036107481177993897, 'samples': 10427904, 'steps': 54311, 'loss/train': 0.1530822068452835} -08/30/2021 23:00:14 - INFO - __main__ - Step 54313: {'lr': 0.0003610700575570684, 'samples': 10428096, 'steps': 54312, 'loss/train': 1.2222754955291748} -08/30/2021 23:00:15 - INFO - __main__ - Step 54314: {'lr': 0.00036106530328415136, 'samples': 10428288, 'steps': 54313, 'loss/train': 1.2541207075119019} -08/30/2021 23:00:15 - INFO - __main__ - Step 54315: {'lr': 0.0003610605489611901, 'samples': 10428480, 'steps': 54314, 'loss/train': 0.7728841304779053} -08/30/2021 23:00:16 - INFO - __main__ - Step 54316: {'lr': 0.0003610557945881866, 'samples': 10428672, 'steps': 54315, 'loss/train': 1.279334545135498} -08/30/2021 23:00:16 - INFO - __main__ - Step 54317: {'lr': 0.0003610510401651431, 'samples': 10428864, 'steps': 54316, 'loss/train': 1.0612679719924927} -08/30/2021 23:00:17 - INFO - __main__ - Step 54318: {'lr': 0.00036104628569206176, 'samples': 10429056, 'steps': 54317, 'loss/train': 0.7022980451583862} -08/30/2021 23:00:17 - INFO - __main__ - Step 54319: {'lr': 0.00036104153116894465, 'samples': 10429248, 'steps': 54318, 'loss/train': 0.8806092143058777} -08/30/2021 23:00:18 - INFO - __main__ - Step 54320: {'lr': 0.00036103677659579393, 'samples': 10429440, 'steps': 54319, 'loss/train': 1.2294496297836304} -08/30/2021 23:00:19 - INFO - __main__ - Step 54321: {'lr': 0.0003610320219726118, 'samples': 10429632, 'steps': 54320, 'loss/train': 1.6851475238800049} -08/30/2021 23:00:19 - INFO - __main__ - Step 54322: {'lr': 0.00036102726729940026, 'samples': 10429824, 'steps': 54321, 'loss/train': 1.4001877307891846} -08/30/2021 23:00:19 - INFO - __main__ - Step 54323: {'lr': 0.0003610225125761616, 'samples': 10430016, 'steps': 54322, 'loss/train': 1.3912405967712402} -08/30/2021 23:00:20 - INFO - __main__ - Step 54324: {'lr': 0.0003610177578028979, 'samples': 10430208, 'steps': 54323, 'loss/train': 1.9676052331924438} -08/30/2021 23:00:21 - INFO - __main__ - Step 54325: {'lr': 0.0003610130029796114, 'samples': 10430400, 'steps': 54324, 'loss/train': 1.4980096817016602} -08/30/2021 23:00:22 - INFO - __main__ - Step 54326: {'lr': 0.000361008248106304, 'samples': 10430592, 'steps': 54325, 'loss/train': 1.413459300994873} -08/30/2021 23:00:22 - INFO - __main__ - Step 54327: {'lr': 0.0003610034931829781, 'samples': 10430784, 'steps': 54326, 'loss/train': 1.151256799697876} -08/30/2021 23:00:22 - INFO - __main__ - Step 54328: {'lr': 0.0003609987382096357, 'samples': 10430976, 'steps': 54327, 'loss/train': 1.3196914196014404} -08/30/2021 23:00:23 - INFO - __main__ - Step 54329: {'lr': 0.00036099398318627896, 'samples': 10431168, 'steps': 54328, 'loss/train': 1.2981704473495483} -08/30/2021 23:00:24 - INFO - __main__ - Step 54330: {'lr': 0.00036098922811291, 'samples': 10431360, 'steps': 54329, 'loss/train': 1.1940737962722778} -08/30/2021 23:00:25 - INFO - __main__ - Step 54331: {'lr': 0.00036098447298953107, 'samples': 10431552, 'steps': 54330, 'loss/train': 1.2637882232666016} -08/30/2021 23:00:25 - INFO - __main__ - Step 54332: {'lr': 0.00036097971781614435, 'samples': 10431744, 'steps': 54331, 'loss/train': 1.6388776302337646} -08/30/2021 23:00:25 - INFO - __main__ - Step 54333: {'lr': 0.0003609749625927518, 'samples': 10431936, 'steps': 54332, 'loss/train': 1.606168508529663} -08/30/2021 23:00:26 - INFO - __main__ - Step 54334: {'lr': 0.0003609702073193556, 'samples': 10432128, 'steps': 54333, 'loss/train': 0.9753102660179138} -08/30/2021 23:00:27 - INFO - __main__ - Step 54335: {'lr': 0.000360965451995958, 'samples': 10432320, 'steps': 54334, 'loss/train': 1.518958330154419} -08/30/2021 23:00:28 - INFO - __main__ - Step 54336: {'lr': 0.000360960696622561, 'samples': 10432512, 'steps': 54335, 'loss/train': 0.04328807443380356} -08/30/2021 23:00:28 - INFO - __main__ - Step 54337: {'lr': 0.0003609559411991669, 'samples': 10432704, 'steps': 54336, 'loss/train': 0.8732128739356995} -08/30/2021 23:00:29 - INFO - __main__ - Step 54338: {'lr': 0.00036095118572577773, 'samples': 10432896, 'steps': 54337, 'loss/train': 0.049343254417181015} -08/30/2021 23:00:29 - INFO - __main__ - Step 54339: {'lr': 0.00036094643020239564, 'samples': 10433088, 'steps': 54338, 'loss/train': 1.0345513820648193} -08/30/2021 23:00:30 - INFO - __main__ - Step 54340: {'lr': 0.0003609416746290228, 'samples': 10433280, 'steps': 54339, 'loss/train': 1.2922474145889282} -08/30/2021 23:00:31 - INFO - __main__ - Step 54341: {'lr': 0.00036093691900566146, 'samples': 10433472, 'steps': 54340, 'loss/train': 1.583540678024292} -08/30/2021 23:00:31 - INFO - __main__ - Step 54342: {'lr': 0.00036093216333231356, 'samples': 10433664, 'steps': 54341, 'loss/train': 1.385217308998108} -08/30/2021 23:00:32 - INFO - __main__ - Step 54343: {'lr': 0.0003609274076089813, 'samples': 10433856, 'steps': 54342, 'loss/train': 1.4844633340835571} -08/30/2021 23:00:32 - INFO - __main__ - Step 54344: {'lr': 0.00036092265183566705, 'samples': 10434048, 'steps': 54343, 'loss/train': 1.3687350749969482} -08/30/2021 23:00:33 - INFO - __main__ - Step 54345: {'lr': 0.0003609178960123726, 'samples': 10434240, 'steps': 54344, 'loss/train': 0.6998049020767212} -08/30/2021 23:00:34 - INFO - __main__ - Step 54346: {'lr': 0.0003609131401391003, 'samples': 10434432, 'steps': 54345, 'loss/train': 1.0882056951522827} -08/30/2021 23:00:34 - INFO - __main__ - Step 54347: {'lr': 0.00036090838421585223, 'samples': 10434624, 'steps': 54346, 'loss/train': 1.3963369131088257} -08/30/2021 23:00:34 - INFO - __main__ - Step 54348: {'lr': 0.0003609036282426306, 'samples': 10434816, 'steps': 54347, 'loss/train': 1.0777093172073364} -08/30/2021 23:00:35 - INFO - __main__ - Step 54349: {'lr': 0.0003608988722194375, 'samples': 10435008, 'steps': 54348, 'loss/train': 1.2569193840026855} -08/30/2021 23:00:37 - INFO - __main__ - Step 54350: {'lr': 0.000360894116146275, 'samples': 10435200, 'steps': 54349, 'loss/train': 1.5837812423706055} -08/30/2021 23:00:37 - INFO - __main__ - Step 54351: {'lr': 0.0003608893600231454, 'samples': 10435392, 'steps': 54350, 'loss/train': 1.5440295934677124} -08/30/2021 23:00:38 - INFO - __main__ - Step 54352: {'lr': 0.00036088460385005076, 'samples': 10435584, 'steps': 54351, 'loss/train': 0.9434706568717957} -08/30/2021 23:00:38 - INFO - __main__ - Step 54353: {'lr': 0.00036087984762699316, 'samples': 10435776, 'steps': 54352, 'loss/train': 1.3542704582214355} -08/30/2021 23:00:38 - INFO - __main__ - Step 54354: {'lr': 0.00036087509135397487, 'samples': 10435968, 'steps': 54353, 'loss/train': 0.21786858141422272} -08/30/2021 23:00:40 - INFO - __main__ - Step 54355: {'lr': 0.00036087033503099796, 'samples': 10436160, 'steps': 54354, 'loss/train': 1.5578293800354004} -08/30/2021 23:00:40 - INFO - __main__ - Step 54356: {'lr': 0.00036086557865806464, 'samples': 10436352, 'steps': 54355, 'loss/train': 1.0738296508789062} -08/30/2021 23:00:41 - INFO - __main__ - Step 54357: {'lr': 0.000360860822235177, 'samples': 10436544, 'steps': 54356, 'loss/train': 1.2405059337615967} -08/30/2021 23:00:41 - INFO - __main__ - Step 54358: {'lr': 0.0003608560657623371, 'samples': 10436736, 'steps': 54357, 'loss/train': 0.8637553453445435} -08/30/2021 23:00:41 - INFO - __main__ - Step 54359: {'lr': 0.0003608513092395472, 'samples': 10436928, 'steps': 54358, 'loss/train': 1.900701880455017} -08/30/2021 23:00:43 - INFO - __main__ - Step 54360: {'lr': 0.00036084655266680946, 'samples': 10437120, 'steps': 54359, 'loss/train': 0.2656385004520416} -08/30/2021 23:00:43 - INFO - __main__ - Step 54361: {'lr': 0.00036084179604412594, 'samples': 10437312, 'steps': 54360, 'loss/train': 1.4094173908233643} -08/30/2021 23:00:44 - INFO - __main__ - Step 54362: {'lr': 0.00036083703937149877, 'samples': 10437504, 'steps': 54361, 'loss/train': 1.896064043045044} -08/30/2021 23:00:44 - INFO - __main__ - Step 54363: {'lr': 0.0003608322826489302, 'samples': 10437696, 'steps': 54362, 'loss/train': 0.8309762477874756} -08/30/2021 23:00:44 - INFO - __main__ - Step 54364: {'lr': 0.00036082752587642225, 'samples': 10437888, 'steps': 54363, 'loss/train': 0.1629410833120346} -08/30/2021 23:00:45 - INFO - __main__ - Step 54365: {'lr': 0.00036082276905397714, 'samples': 10438080, 'steps': 54364, 'loss/train': 0.3419945538043976} -08/30/2021 23:00:46 - INFO - __main__ - Step 54366: {'lr': 0.0003608180121815971, 'samples': 10438272, 'steps': 54365, 'loss/train': 1.1949297189712524} -08/30/2021 23:00:47 - INFO - __main__ - Step 54367: {'lr': 0.0003608132552592841, 'samples': 10438464, 'steps': 54366, 'loss/train': 1.0680665969848633} -08/30/2021 23:00:47 - INFO - __main__ - Step 54368: {'lr': 0.0003608084982870404, 'samples': 10438656, 'steps': 54367, 'loss/train': 0.6926573514938354} -08/30/2021 23:00:47 - INFO - __main__ - Step 54369: {'lr': 0.00036080374126486804, 'samples': 10438848, 'steps': 54368, 'loss/train': 1.5133802890777588} -08/30/2021 23:00:48 - INFO - __main__ - Step 54370: {'lr': 0.00036079898419276923, 'samples': 10439040, 'steps': 54369, 'loss/train': 1.3536357879638672} -08/30/2021 23:00:49 - INFO - __main__ - Step 54371: {'lr': 0.0003607942270707461, 'samples': 10439232, 'steps': 54370, 'loss/train': 0.04309569299221039} -08/30/2021 23:00:50 - INFO - __main__ - Step 54372: {'lr': 0.0003607894698988009, 'samples': 10439424, 'steps': 54371, 'loss/train': 0.8834048509597778} -08/30/2021 23:00:50 - INFO - __main__ - Step 54373: {'lr': 0.0003607847126769356, 'samples': 10439616, 'steps': 54372, 'loss/train': 0.8419795036315918} -08/30/2021 23:00:50 - INFO - __main__ - Step 54374: {'lr': 0.0003607799554051524, 'samples': 10439808, 'steps': 54373, 'loss/train': 1.3162957429885864} -08/30/2021 23:00:51 - INFO - __main__ - Step 54375: {'lr': 0.0003607751980834535, 'samples': 10440000, 'steps': 54374, 'loss/train': 0.9299314618110657} -08/30/2021 23:00:51 - INFO - __main__ - Step 54376: {'lr': 0.00036077044071184094, 'samples': 10440192, 'steps': 54375, 'loss/train': 1.0959758758544922} -08/30/2021 23:00:53 - INFO - __main__ - Step 54377: {'lr': 0.00036076568329031694, 'samples': 10440384, 'steps': 54376, 'loss/train': 1.0444085597991943} -08/30/2021 23:00:53 - INFO - __main__ - Step 54378: {'lr': 0.0003607609258188837, 'samples': 10440576, 'steps': 54377, 'loss/train': 1.097976803779602} -08/30/2021 23:00:53 - INFO - __main__ - Step 54379: {'lr': 0.00036075616829754333, 'samples': 10440768, 'steps': 54378, 'loss/train': 1.7999595403671265} -08/30/2021 23:00:54 - INFO - __main__ - Step 54380: {'lr': 0.0003607514107262978, 'samples': 10440960, 'steps': 54379, 'loss/train': 1.6188349723815918} -08/30/2021 23:00:54 - INFO - __main__ - Step 54381: {'lr': 0.0003607466531051495, 'samples': 10441152, 'steps': 54380, 'loss/train': 1.3003886938095093} -08/30/2021 23:00:55 - INFO - __main__ - Step 54382: {'lr': 0.0003607418954341004, 'samples': 10441344, 'steps': 54381, 'loss/train': 2.1505913734436035} -08/30/2021 23:00:56 - INFO - __main__ - Step 54383: {'lr': 0.00036073713771315276, 'samples': 10441536, 'steps': 54382, 'loss/train': 1.0358531475067139} -08/30/2021 23:00:56 - INFO - __main__ - Step 54384: {'lr': 0.00036073237994230863, 'samples': 10441728, 'steps': 54383, 'loss/train': 1.5749377012252808} -08/30/2021 23:00:57 - INFO - __main__ - Step 54385: {'lr': 0.0003607276221215702, 'samples': 10441920, 'steps': 54384, 'loss/train': 0.6855916380882263} -08/30/2021 23:00:57 - INFO - __main__ - Step 54386: {'lr': 0.0003607228642509397, 'samples': 10442112, 'steps': 54385, 'loss/train': 0.33559802174568176} -08/30/2021 23:00:59 - INFO - __main__ - Step 54387: {'lr': 0.00036071810633041913, 'samples': 10442304, 'steps': 54386, 'loss/train': 2.230074882507324} -08/30/2021 23:00:59 - INFO - __main__ - Step 54388: {'lr': 0.0003607133483600107, 'samples': 10442496, 'steps': 54387, 'loss/train': 1.9957389831542969} -08/30/2021 23:00:59 - INFO - __main__ - Step 54389: {'lr': 0.00036070859033971646, 'samples': 10442688, 'steps': 54388, 'loss/train': 0.13232050836086273} -08/30/2021 23:01:00 - INFO - __main__ - Step 54390: {'lr': 0.00036070383226953875, 'samples': 10442880, 'steps': 54389, 'loss/train': 1.6840497255325317} -08/30/2021 23:01:00 - INFO - __main__ - Step 54391: {'lr': 0.0003606990741494795, 'samples': 10443072, 'steps': 54390, 'loss/train': 1.5031099319458008} -08/30/2021 23:01:02 - INFO - __main__ - Step 54392: {'lr': 0.00036069431597954103, 'samples': 10443264, 'steps': 54391, 'loss/train': 1.273067831993103} -08/30/2021 23:01:03 - INFO - __main__ - Step 54393: {'lr': 0.0003606895577597254, 'samples': 10443456, 'steps': 54392, 'loss/train': 0.6100627779960632} -08/30/2021 23:01:03 - INFO - __main__ - Step 54394: {'lr': 0.0003606847994900347, 'samples': 10443648, 'steps': 54393, 'loss/train': 1.554357886314392} -08/30/2021 23:01:03 - INFO - __main__ - Step 54395: {'lr': 0.00036068004117047127, 'samples': 10443840, 'steps': 54394, 'loss/train': 1.1624020338058472} -08/30/2021 23:01:04 - INFO - __main__ - Step 54396: {'lr': 0.000360675282801037, 'samples': 10444032, 'steps': 54395, 'loss/train': 1.2031679153442383} -08/30/2021 23:01:04 - INFO - __main__ - Step 54397: {'lr': 0.0003606705243817342, 'samples': 10444224, 'steps': 54396, 'loss/train': 1.2400147914886475} -08/30/2021 23:01:06 - INFO - __main__ - Step 54398: {'lr': 0.00036066576591256496, 'samples': 10444416, 'steps': 54397, 'loss/train': 1.6306027173995972} -08/30/2021 23:01:06 - INFO - __main__ - Step 54399: {'lr': 0.00036066100739353145, 'samples': 10444608, 'steps': 54398, 'loss/train': 1.288132905960083} -08/30/2021 23:01:06 - INFO - __main__ - Step 54400: {'lr': 0.0003606562488246358, 'samples': 10444800, 'steps': 54399, 'loss/train': 1.6223887205123901} -08/30/2021 23:01:07 - INFO - __main__ - Step 54401: {'lr': 0.00036065149020588015, 'samples': 10444992, 'steps': 54400, 'loss/train': 0.9524000287055969} -08/30/2021 23:01:07 - INFO - __main__ - Step 54402: {'lr': 0.00036064673153726664, 'samples': 10445184, 'steps': 54401, 'loss/train': 1.3720989227294922} -08/30/2021 23:01:09 - INFO - __main__ - Step 54403: {'lr': 0.0003606419728187974, 'samples': 10445376, 'steps': 54402, 'loss/train': 1.35567307472229} -08/30/2021 23:01:10 - INFO - __main__ - Step 54404: {'lr': 0.00036063721405047463, 'samples': 10445568, 'steps': 54403, 'loss/train': 1.614539623260498} -08/30/2021 23:01:10 - INFO - __main__ - Step 54405: {'lr': 0.00036063245523230037, 'samples': 10445760, 'steps': 54404, 'loss/train': 1.5119376182556152} -08/30/2021 23:01:10 - INFO - __main__ - Step 54406: {'lr': 0.0003606276963642769, 'samples': 10445952, 'steps': 54405, 'loss/train': 1.8646962642669678} -08/30/2021 23:01:11 - INFO - __main__ - Step 54407: {'lr': 0.00036062293744640637, 'samples': 10446144, 'steps': 54406, 'loss/train': 1.4430432319641113} -08/30/2021 23:01:11 - INFO - __main__ - Step 54408: {'lr': 0.0003606181784786907, 'samples': 10446336, 'steps': 54407, 'loss/train': 0.9834067821502686} -08/30/2021 23:01:13 - INFO - __main__ - Step 54409: {'lr': 0.00036061341946113225, 'samples': 10446528, 'steps': 54408, 'loss/train': 0.208884134888649} -08/30/2021 23:01:13 - INFO - __main__ - Step 54410: {'lr': 0.0003606086603937331, 'samples': 10446720, 'steps': 54409, 'loss/train': 1.9072211980819702} -08/30/2021 23:01:14 - INFO - __main__ - Step 54411: {'lr': 0.00036060390127649536, 'samples': 10446912, 'steps': 54410, 'loss/train': 0.8430742025375366} -08/30/2021 23:01:14 - INFO - __main__ - Step 54412: {'lr': 0.00036059914210942126, 'samples': 10447104, 'steps': 54411, 'loss/train': 2.041823387145996} -08/30/2021 23:01:14 - INFO - __main__ - Step 54413: {'lr': 0.0003605943828925129, 'samples': 10447296, 'steps': 54412, 'loss/train': 0.1184265986084938} -08/30/2021 23:01:16 - INFO - __main__ - Step 54414: {'lr': 0.0003605896236257724, 'samples': 10447488, 'steps': 54413, 'loss/train': 1.146912693977356} -08/30/2021 23:01:16 - INFO - __main__ - Step 54415: {'lr': 0.0003605848643092019, 'samples': 10447680, 'steps': 54414, 'loss/train': 0.8741188049316406} -08/30/2021 23:01:17 - INFO - __main__ - Step 54416: {'lr': 0.00036058010494280357, 'samples': 10447872, 'steps': 54415, 'loss/train': 0.8910341262817383} -08/30/2021 23:01:17 - INFO - __main__ - Step 54417: {'lr': 0.00036057534552657954, 'samples': 10448064, 'steps': 54416, 'loss/train': 0.7433121204376221} -08/30/2021 23:01:17 - INFO - __main__ - Step 54418: {'lr': 0.000360570586060532, 'samples': 10448256, 'steps': 54417, 'loss/train': 1.8967901468276978} -08/30/2021 23:01:19 - INFO - __main__ - Step 54419: {'lr': 0.0003605658265446631, 'samples': 10448448, 'steps': 54418, 'loss/train': 0.9716705679893494} -08/30/2021 23:01:19 - INFO - __main__ - Step 54420: {'lr': 0.00036056106697897485, 'samples': 10448640, 'steps': 54419, 'loss/train': 0.08413762599229813} -08/30/2021 23:01:20 - INFO - __main__ - Step 54421: {'lr': 0.0003605563073634696, 'samples': 10448832, 'steps': 54420, 'loss/train': 1.1478928327560425} -08/30/2021 23:01:20 - INFO - __main__ - Step 54422: {'lr': 0.00036055154769814923, 'samples': 10449024, 'steps': 54421, 'loss/train': 1.341420292854309} -08/30/2021 23:01:20 - INFO - __main__ - Step 54423: {'lr': 0.0003605467879830161, 'samples': 10449216, 'steps': 54422, 'loss/train': 1.4099433422088623} -08/30/2021 23:01:21 - INFO - __main__ - Step 54424: {'lr': 0.00036054202821807235, 'samples': 10449408, 'steps': 54423, 'loss/train': 1.181523323059082} -08/30/2021 23:01:22 - INFO - __main__ - Step 54425: {'lr': 0.00036053726840332004, 'samples': 10449600, 'steps': 54424, 'loss/train': 0.3803408741950989} -08/30/2021 23:01:23 - INFO - __main__ - Step 54426: {'lr': 0.00036053250853876134, 'samples': 10449792, 'steps': 54425, 'loss/train': 1.6077316999435425} -08/30/2021 23:01:23 - INFO - __main__ - Step 54427: {'lr': 0.0003605277486243984, 'samples': 10449984, 'steps': 54426, 'loss/train': 1.8009928464889526} -08/30/2021 23:01:23 - INFO - __main__ - Step 54428: {'lr': 0.0003605229886602334, 'samples': 10450176, 'steps': 54427, 'loss/train': 0.8881281614303589} -08/30/2021 23:01:24 - INFO - __main__ - Step 54429: {'lr': 0.0003605182286462683, 'samples': 10450368, 'steps': 54428, 'loss/train': 1.1170265674591064} -08/30/2021 23:01:25 - INFO - __main__ - Step 54430: {'lr': 0.00036051346858250556, 'samples': 10450560, 'steps': 54429, 'loss/train': 1.2654304504394531} -08/30/2021 23:01:26 - INFO - __main__ - Step 54431: {'lr': 0.0003605087084689471, 'samples': 10450752, 'steps': 54430, 'loss/train': 1.262196660041809} -08/30/2021 23:01:26 - INFO - __main__ - Step 54432: {'lr': 0.0003605039483055951, 'samples': 10450944, 'steps': 54431, 'loss/train': 1.9821951389312744} -08/30/2021 23:01:26 - INFO - __main__ - Step 54433: {'lr': 0.00036049918809245173, 'samples': 10451136, 'steps': 54432, 'loss/train': 1.5487759113311768} -08/30/2021 23:01:27 - INFO - __main__ - Step 54434: {'lr': 0.00036049442782951915, 'samples': 10451328, 'steps': 54433, 'loss/train': 1.6200807094573975} -08/30/2021 23:01:28 - INFO - __main__ - Step 54435: {'lr': 0.00036048966751679945, 'samples': 10451520, 'steps': 54434, 'loss/train': 2.2839179039001465} -08/30/2021 23:01:29 - INFO - __main__ - Step 54436: {'lr': 0.0003604849071542948, 'samples': 10451712, 'steps': 54435, 'loss/train': 1.0905177593231201} -08/30/2021 23:01:29 - INFO - __main__ - Step 54437: {'lr': 0.0003604801467420074, 'samples': 10451904, 'steps': 54436, 'loss/train': 1.3238178491592407} -08/30/2021 23:01:29 - INFO - __main__ - Step 54438: {'lr': 0.00036047538627993937, 'samples': 10452096, 'steps': 54437, 'loss/train': 1.1375893354415894} -08/30/2021 23:01:30 - INFO - __main__ - Step 54439: {'lr': 0.00036047062576809283, 'samples': 10452288, 'steps': 54438, 'loss/train': 1.2887464761734009} -08/30/2021 23:01:32 - INFO - __main__ - Step 54440: {'lr': 0.0003604658652064699, 'samples': 10452480, 'steps': 54439, 'loss/train': 1.3201395273208618} -08/30/2021 23:01:33 - INFO - __main__ - Step 54441: {'lr': 0.00036046110459507275, 'samples': 10452672, 'steps': 54440, 'loss/train': 1.0068236589431763} -08/30/2021 23:01:33 - INFO - __main__ - Step 54442: {'lr': 0.00036045634393390354, 'samples': 10452864, 'steps': 54441, 'loss/train': 1.1214576959609985} -08/30/2021 23:01:33 - INFO - __main__ - Step 54443: {'lr': 0.0003604515832229644, 'samples': 10453056, 'steps': 54442, 'loss/train': 1.3695833683013916} -08/30/2021 23:01:34 - INFO - __main__ - Step 54444: {'lr': 0.0003604468224622575, 'samples': 10453248, 'steps': 54443, 'loss/train': 0.32771575450897217} -08/30/2021 23:01:34 - INFO - __main__ - Step 54445: {'lr': 0.00036044206165178496, 'samples': 10453440, 'steps': 54444, 'loss/train': 2.2965939044952393} -08/30/2021 23:01:34 - INFO - __main__ - Step 54446: {'lr': 0.00036043730079154897, 'samples': 10453632, 'steps': 54445, 'loss/train': 2.2613685131073} -08/30/2021 23:01:36 - INFO - __main__ - Step 54447: {'lr': 0.00036043253988155157, 'samples': 10453824, 'steps': 54446, 'loss/train': 0.7324656248092651} -08/30/2021 23:01:37 - INFO - __main__ - Step 54448: {'lr': 0.00036042777892179503, 'samples': 10454016, 'steps': 54447, 'loss/train': 1.4372731447219849} -08/30/2021 23:01:37 - INFO - __main__ - Step 54449: {'lr': 0.0003604230179122814, 'samples': 10454208, 'steps': 54448, 'loss/train': 1.3258905410766602} -08/30/2021 23:01:38 - INFO - __main__ - Step 54450: {'lr': 0.0003604182568530128, 'samples': 10454400, 'steps': 54449, 'loss/train': 1.7881958484649658} -08/30/2021 23:01:38 - INFO - __main__ - Step 54451: {'lr': 0.0003604134957439915, 'samples': 10454592, 'steps': 54450, 'loss/train': 1.5566935539245605} -08/30/2021 23:01:40 - INFO - __main__ - Step 54452: {'lr': 0.00036040873458521963, 'samples': 10454784, 'steps': 54451, 'loss/train': 1.0344430208206177} -08/30/2021 23:01:40 - INFO - __main__ - Step 54453: {'lr': 0.0003604039733766992, 'samples': 10454976, 'steps': 54452, 'loss/train': 1.550994634628296} -08/30/2021 23:01:41 - INFO - __main__ - Step 54454: {'lr': 0.00036039921211843254, 'samples': 10455168, 'steps': 54453, 'loss/train': 1.847101092338562} -08/30/2021 23:01:41 - INFO - __main__ - Step 54455: {'lr': 0.0003603944508104216, 'samples': 10455360, 'steps': 54454, 'loss/train': 0.6563199758529663} -08/30/2021 23:01:41 - INFO - __main__ - Step 54456: {'lr': 0.0003603896894526687, 'samples': 10455552, 'steps': 54455, 'loss/train': 1.5809701681137085} -08/30/2021 23:01:42 - INFO - __main__ - Step 54457: {'lr': 0.00036038492804517586, 'samples': 10455744, 'steps': 54456, 'loss/train': 1.3193213939666748} -08/30/2021 23:01:44 - INFO - __main__ - Step 54458: {'lr': 0.00036038016658794525, 'samples': 10455936, 'steps': 54457, 'loss/train': 1.637620210647583} -08/30/2021 23:01:44 - INFO - __main__ - Step 54459: {'lr': 0.0003603754050809791, 'samples': 10456128, 'steps': 54458, 'loss/train': 0.02939906343817711} -08/30/2021 23:01:44 - INFO - __main__ - Step 54460: {'lr': 0.0003603706435242795, 'samples': 10456320, 'steps': 54459, 'loss/train': 1.4809588193893433} -08/30/2021 23:01:45 - INFO - __main__ - Step 54461: {'lr': 0.00036036588191784856, 'samples': 10456512, 'steps': 54460, 'loss/train': 1.7653968334197998} -08/30/2021 23:01:45 - INFO - __main__ - Step 54462: {'lr': 0.0003603611202616885, 'samples': 10456704, 'steps': 54461, 'loss/train': 1.6733763217926025} -08/30/2021 23:01:45 - INFO - __main__ - Step 54463: {'lr': 0.0003603563585558014, 'samples': 10456896, 'steps': 54462, 'loss/train': 1.5711159706115723} -08/30/2021 23:01:47 - INFO - __main__ - Step 54464: {'lr': 0.00036035159680018937, 'samples': 10457088, 'steps': 54463, 'loss/train': 1.2288029193878174} -08/30/2021 23:01:47 - INFO - __main__ - Step 54465: {'lr': 0.00036034683499485467, 'samples': 10457280, 'steps': 54464, 'loss/train': 1.8389629125595093} -08/30/2021 23:01:48 - INFO - __main__ - Step 54466: {'lr': 0.0003603420731397994, 'samples': 10457472, 'steps': 54465, 'loss/train': 0.7039991021156311} -08/30/2021 23:01:48 - INFO - __main__ - Step 54467: {'lr': 0.00036033731123502567, 'samples': 10457664, 'steps': 54466, 'loss/train': 1.7743483781814575} -08/30/2021 23:01:49 - INFO - __main__ - Step 54468: {'lr': 0.00036033254928053565, 'samples': 10457856, 'steps': 54467, 'loss/train': 1.220398187637329} -08/30/2021 23:01:51 - INFO - __main__ - Step 54469: {'lr': 0.0003603277872763315, 'samples': 10458048, 'steps': 54468, 'loss/train': 1.172669768333435} -08/30/2021 23:01:51 - INFO - __main__ - Step 54470: {'lr': 0.0003603230252224153, 'samples': 10458240, 'steps': 54469, 'loss/train': 1.4810055494308472} -08/30/2021 23:01:52 - INFO - __main__ - Step 54471: {'lr': 0.0003603182631187893, 'samples': 10458432, 'steps': 54470, 'loss/train': 1.2743890285491943} -08/30/2021 23:01:52 - INFO - __main__ - Step 54472: {'lr': 0.00036031350096545555, 'samples': 10458624, 'steps': 54471, 'loss/train': 1.6858956813812256} -08/30/2021 23:01:52 - INFO - __main__ - Step 54473: {'lr': 0.0003603087387624163, 'samples': 10458816, 'steps': 54472, 'loss/train': 1.0888733863830566} -08/30/2021 23:01:53 - INFO - __main__ - Step 54474: {'lr': 0.0003603039765096736, 'samples': 10459008, 'steps': 54473, 'loss/train': 1.8485932350158691} -08/30/2021 23:01:53 - INFO - __main__ - Step 54475: {'lr': 0.00036029921420722966, 'samples': 10459200, 'steps': 54474, 'loss/train': 0.028074083849787712} -08/30/2021 23:01:55 - INFO - __main__ - Step 54476: {'lr': 0.0003602944518550866, 'samples': 10459392, 'steps': 54475, 'loss/train': 0.024364106357097626} -08/30/2021 23:01:55 - INFO - __main__ - Step 54477: {'lr': 0.00036028968945324647, 'samples': 10459584, 'steps': 54476, 'loss/train': 1.4906941652297974} -08/30/2021 23:01:55 - INFO - __main__ - Step 54478: {'lr': 0.00036028492700171166, 'samples': 10459776, 'steps': 54477, 'loss/train': 1.7284191846847534} -08/30/2021 23:01:56 - INFO - __main__ - Step 54479: {'lr': 0.0003602801645004841, 'samples': 10459968, 'steps': 54478, 'loss/train': 1.2206257581710815} -08/30/2021 23:01:56 - INFO - __main__ - Step 54480: {'lr': 0.00036027540194956593, 'samples': 10460160, 'steps': 54479, 'loss/train': 0.6962655186653137} -08/30/2021 23:01:58 - INFO - __main__ - Step 54481: {'lr': 0.00036027063934895935, 'samples': 10460352, 'steps': 54480, 'loss/train': 1.462016224861145} -08/30/2021 23:01:58 - INFO - __main__ - Step 54482: {'lr': 0.0003602658766986666, 'samples': 10460544, 'steps': 54481, 'loss/train': 0.15552367269992828} -08/30/2021 23:01:58 - INFO - __main__ - Step 54483: {'lr': 0.00036026111399868973, 'samples': 10460736, 'steps': 54482, 'loss/train': 1.1515041589736938} -08/30/2021 23:01:59 - INFO - __main__ - Step 54484: {'lr': 0.00036025635124903093, 'samples': 10460928, 'steps': 54483, 'loss/train': 1.2796595096588135} -08/30/2021 23:01:59 - INFO - __main__ - Step 54485: {'lr': 0.0003602515884496923, 'samples': 10461120, 'steps': 54484, 'loss/train': 1.388633370399475} -08/30/2021 23:01:59 - INFO - __main__ - Step 54486: {'lr': 0.00036024682560067603, 'samples': 10461312, 'steps': 54485, 'loss/train': 1.4794923067092896} -08/30/2021 23:02:01 - INFO - __main__ - Step 54487: {'lr': 0.00036024206270198416, 'samples': 10461504, 'steps': 54486, 'loss/train': 1.326303482055664} -08/30/2021 23:02:02 - INFO - __main__ - Step 54488: {'lr': 0.00036023729975361897, 'samples': 10461696, 'steps': 54487, 'loss/train': 1.296088695526123} -08/30/2021 23:02:02 - INFO - __main__ - Step 54489: {'lr': 0.00036023253675558257, 'samples': 10461888, 'steps': 54488, 'loss/train': 1.447489857673645} -08/30/2021 23:02:02 - INFO - __main__ - Step 54490: {'lr': 0.0003602277737078771, 'samples': 10462080, 'steps': 54489, 'loss/train': 1.4102386236190796} -08/30/2021 23:02:03 - INFO - __main__ - Step 54491: {'lr': 0.00036022301061050467, 'samples': 10462272, 'steps': 54490, 'loss/train': 1.5670452117919922} -08/30/2021 23:02:04 - INFO - __main__ - Step 54492: {'lr': 0.00036021824746346746, 'samples': 10462464, 'steps': 54491, 'loss/train': 1.3059052228927612} -08/30/2021 23:02:05 - INFO - __main__ - Step 54493: {'lr': 0.00036021348426676754, 'samples': 10462656, 'steps': 54492, 'loss/train': 0.5022376179695129} -08/30/2021 23:02:05 - INFO - __main__ - Step 54494: {'lr': 0.00036020872102040727, 'samples': 10462848, 'steps': 54493, 'loss/train': 1.5012847185134888} -08/30/2021 23:02:05 - INFO - __main__ - Step 54495: {'lr': 0.00036020395772438853, 'samples': 10463040, 'steps': 54494, 'loss/train': 0.9884690642356873} -08/30/2021 23:02:06 - INFO - __main__ - Step 54496: {'lr': 0.00036019919437871355, 'samples': 10463232, 'steps': 54495, 'loss/train': 1.2300623655319214} -08/30/2021 23:02:07 - INFO - __main__ - Step 54497: {'lr': 0.0003601944309833846, 'samples': 10463424, 'steps': 54496, 'loss/train': 1.1033459901809692} -08/30/2021 23:02:08 - INFO - __main__ - Step 54498: {'lr': 0.0003601896675384037, 'samples': 10463616, 'steps': 54497, 'loss/train': 0.9350084066390991} -08/30/2021 23:02:08 - INFO - __main__ - Step 54499: {'lr': 0.0003601849040437731, 'samples': 10463808, 'steps': 54498, 'loss/train': 1.571579933166504} -08/30/2021 23:02:08 - INFO - __main__ - Step 54500: {'lr': 0.0003601801404994949, 'samples': 10464000, 'steps': 54499, 'loss/train': 1.4422886371612549} -08/30/2021 23:02:09 - INFO - __main__ - Step 54501: {'lr': 0.0003601753769055711, 'samples': 10464192, 'steps': 54500, 'loss/train': 1.3957128524780273} -08/30/2021 23:02:09 - INFO - __main__ - Step 54502: {'lr': 0.00036017061326200405, 'samples': 10464384, 'steps': 54501, 'loss/train': 1.102375864982605} -08/30/2021 23:02:11 - INFO - __main__ - Step 54503: {'lr': 0.0003601658495687958, 'samples': 10464576, 'steps': 54502, 'loss/train': 1.2521449327468872} -08/30/2021 23:02:11 - INFO - __main__ - Step 54504: {'lr': 0.0003601610858259485, 'samples': 10464768, 'steps': 54503, 'loss/train': 1.0305943489074707} -08/30/2021 23:02:12 - INFO - __main__ - Step 54505: {'lr': 0.0003601563220334644, 'samples': 10464960, 'steps': 54504, 'loss/train': 1.1198049783706665} -08/30/2021 23:02:12 - INFO - __main__ - Step 54506: {'lr': 0.0003601515581913455, 'samples': 10465152, 'steps': 54505, 'loss/train': 1.1192988157272339} -08/30/2021 23:02:12 - INFO - __main__ - Step 54507: {'lr': 0.0003601467942995941, 'samples': 10465344, 'steps': 54506, 'loss/train': 0.694641649723053} -08/30/2021 23:02:14 - INFO - __main__ - Step 54508: {'lr': 0.00036014203035821213, 'samples': 10465536, 'steps': 54507, 'loss/train': 1.024565577507019} -08/30/2021 23:02:15 - INFO - __main__ - Step 54509: {'lr': 0.0003601372663672019, 'samples': 10465728, 'steps': 54508, 'loss/train': 0.6277898550033569} -08/30/2021 23:02:15 - INFO - __main__ - Step 54510: {'lr': 0.00036013250232656553, 'samples': 10465920, 'steps': 54509, 'loss/train': 1.8217884302139282} -08/30/2021 23:02:16 - INFO - __main__ - Step 54511: {'lr': 0.0003601277382363051, 'samples': 10466112, 'steps': 54510, 'loss/train': 1.3990466594696045} -08/30/2021 23:02:16 - INFO - __main__ - Step 54512: {'lr': 0.0003601229740964229, 'samples': 10466304, 'steps': 54511, 'loss/train': 1.249825119972229} -08/30/2021 23:02:17 - INFO - __main__ - Step 54513: {'lr': 0.000360118209906921, 'samples': 10466496, 'steps': 54512, 'loss/train': 1.5219441652297974} -08/30/2021 23:02:18 - INFO - __main__ - Step 54514: {'lr': 0.0003601134456678014, 'samples': 10466688, 'steps': 54513, 'loss/train': 2.0387253761291504} -08/30/2021 23:02:18 - INFO - __main__ - Step 54515: {'lr': 0.0003601086813790665, 'samples': 10466880, 'steps': 54514, 'loss/train': 1.3793940544128418} -08/30/2021 23:02:19 - INFO - __main__ - Step 54516: {'lr': 0.00036010391704071823, 'samples': 10467072, 'steps': 54515, 'loss/train': 1.2549033164978027} -08/30/2021 23:02:19 - INFO - __main__ - Step 54517: {'lr': 0.0003600991526527589, 'samples': 10467264, 'steps': 54516, 'loss/train': 1.8614650964736938} -08/30/2021 23:02:20 - INFO - __main__ - Step 54518: {'lr': 0.00036009438821519056, 'samples': 10467456, 'steps': 54517, 'loss/train': 1.3409873247146606} -08/30/2021 23:02:21 - INFO - __main__ - Step 54519: {'lr': 0.0003600896237280154, 'samples': 10467648, 'steps': 54518, 'loss/train': 1.1305326223373413} -08/30/2021 23:02:21 - INFO - __main__ - Step 54520: {'lr': 0.0003600848591912356, 'samples': 10467840, 'steps': 54519, 'loss/train': 1.3710821866989136} -08/30/2021 23:02:21 - INFO - __main__ - Step 54521: {'lr': 0.00036008009460485323, 'samples': 10468032, 'steps': 54520, 'loss/train': 1.0729775428771973} -08/30/2021 23:02:22 - INFO - __main__ - Step 54522: {'lr': 0.00036007532996887043, 'samples': 10468224, 'steps': 54521, 'loss/train': 0.0646027997136116} -08/30/2021 23:02:23 - INFO - __main__ - Step 54523: {'lr': 0.0003600705652832894, 'samples': 10468416, 'steps': 54522, 'loss/train': 1.3067927360534668} -08/30/2021 23:02:24 - INFO - __main__ - Step 54524: {'lr': 0.00036006580054811235, 'samples': 10468608, 'steps': 54523, 'loss/train': 1.1525671482086182} -08/30/2021 23:02:24 - INFO - __main__ - Step 54525: {'lr': 0.00036006103576334124, 'samples': 10468800, 'steps': 54524, 'loss/train': 2.3152549266815186} -08/30/2021 23:02:24 - INFO - __main__ - Step 54526: {'lr': 0.00036005627092897835, 'samples': 10468992, 'steps': 54525, 'loss/train': 1.1291697025299072} -08/30/2021 23:02:25 - INFO - __main__ - Step 54527: {'lr': 0.0003600515060450259, 'samples': 10469184, 'steps': 54526, 'loss/train': 1.5302352905273438} -08/30/2021 23:02:26 - INFO - __main__ - Step 54528: {'lr': 0.0003600467411114858, 'samples': 10469376, 'steps': 54527, 'loss/train': 0.7366635203361511} -08/30/2021 23:02:27 - INFO - __main__ - Step 54529: {'lr': 0.00036004197612836045, 'samples': 10469568, 'steps': 54528, 'loss/train': 1.5393773317337036} -08/30/2021 23:02:27 - INFO - __main__ - Step 54530: {'lr': 0.0003600372110956518, 'samples': 10469760, 'steps': 54529, 'loss/train': 0.6021180152893066} -08/30/2021 23:02:27 - INFO - __main__ - Step 54531: {'lr': 0.0003600324460133621, 'samples': 10469952, 'steps': 54530, 'loss/train': 1.0634032487869263} -08/30/2021 23:02:28 - INFO - __main__ - Step 54532: {'lr': 0.0003600276808814935, 'samples': 10470144, 'steps': 54531, 'loss/train': 1.748326301574707} -08/30/2021 23:02:30 - INFO - __main__ - Step 54533: {'lr': 0.00036002291570004806, 'samples': 10470336, 'steps': 54532, 'loss/train': 0.1036919355392456} -08/30/2021 23:02:30 - INFO - __main__ - Step 54534: {'lr': 0.0003600181504690281, 'samples': 10470528, 'steps': 54533, 'loss/train': 1.3171173334121704} -08/30/2021 23:02:30 - INFO - __main__ - Step 54535: {'lr': 0.00036001338518843563, 'samples': 10470720, 'steps': 54534, 'loss/train': 0.883816123008728} -08/30/2021 23:02:31 - INFO - __main__ - Step 54536: {'lr': 0.0003600086198582728, 'samples': 10470912, 'steps': 54535, 'loss/train': 1.1281777620315552} -08/30/2021 23:02:31 - INFO - __main__ - Step 54537: {'lr': 0.00036000385447854176, 'samples': 10471104, 'steps': 54536, 'loss/train': 1.4809339046478271} -08/30/2021 23:02:31 - INFO - __main__ - Step 54538: {'lr': 0.0003599990890492447, 'samples': 10471296, 'steps': 54537, 'loss/train': 1.6544737815856934} -08/30/2021 23:02:33 - INFO - __main__ - Step 54539: {'lr': 0.00035999432357038374, 'samples': 10471488, 'steps': 54538, 'loss/train': 0.8396620750427246} -08/30/2021 23:02:34 - INFO - __main__ - Step 54540: {'lr': 0.0003599895580419611, 'samples': 10471680, 'steps': 54539, 'loss/train': 0.5185154676437378} -08/30/2021 23:02:34 - INFO - __main__ - Step 54541: {'lr': 0.0003599847924639788, 'samples': 10471872, 'steps': 54540, 'loss/train': 1.1997580528259277} -08/30/2021 23:02:34 - INFO - __main__ - Step 54542: {'lr': 0.00035998002683643903, 'samples': 10472064, 'steps': 54541, 'loss/train': 1.8566733598709106} -08/30/2021 23:02:35 - INFO - __main__ - Step 54543: {'lr': 0.00035997526115934405, 'samples': 10472256, 'steps': 54542, 'loss/train': 1.5253015756607056} -08/30/2021 23:02:35 - INFO - __main__ - Step 54544: {'lr': 0.00035997049543269583, 'samples': 10472448, 'steps': 54543, 'loss/train': 0.7787737250328064} -08/30/2021 23:02:37 - INFO - __main__ - Step 54545: {'lr': 0.0003599657296564966, 'samples': 10472640, 'steps': 54544, 'loss/train': 1.1299768686294556} -08/30/2021 23:02:37 - INFO - __main__ - Step 54546: {'lr': 0.00035996096383074855, 'samples': 10472832, 'steps': 54545, 'loss/train': 1.0124627351760864} -08/30/2021 23:02:38 - INFO - __main__ - Step 54547: {'lr': 0.0003599561979554538, 'samples': 10473024, 'steps': 54546, 'loss/train': 0.45943358540534973} -08/30/2021 23:02:38 - INFO - __main__ - Step 54548: {'lr': 0.0003599514320306144, 'samples': 10473216, 'steps': 54547, 'loss/train': 0.040136393159627914} -08/30/2021 23:02:38 - INFO - __main__ - Step 54549: {'lr': 0.0003599466660562327, 'samples': 10473408, 'steps': 54548, 'loss/train': 1.3302639722824097} -08/30/2021 23:02:40 - INFO - __main__ - Step 54550: {'lr': 0.00035994190003231063, 'samples': 10473600, 'steps': 54549, 'loss/train': 0.9709994792938232} -08/30/2021 23:02:40 - INFO - __main__ - Step 54551: {'lr': 0.0003599371339588505, 'samples': 10473792, 'steps': 54550, 'loss/train': 1.1999484300613403} -08/30/2021 23:02:40 - INFO - __main__ - Step 54552: {'lr': 0.00035993236783585437, 'samples': 10473984, 'steps': 54551, 'loss/train': 1.5302873849868774} -08/30/2021 23:02:41 - INFO - __main__ - Step 54553: {'lr': 0.00035992760166332437, 'samples': 10474176, 'steps': 54552, 'loss/train': 1.2610130310058594} -08/30/2021 23:02:41 - INFO - __main__ - Step 54554: {'lr': 0.00035992283544126276, 'samples': 10474368, 'steps': 54553, 'loss/train': 1.8108878135681152} -08/30/2021 23:02:43 - INFO - __main__ - Step 54555: {'lr': 0.00035991806916967154, 'samples': 10474560, 'steps': 54554, 'loss/train': 1.02792489528656} -08/30/2021 23:02:43 - INFO - __main__ - Step 54556: {'lr': 0.000359913302848553, 'samples': 10474752, 'steps': 54555, 'loss/train': 0.6806752681732178} -08/30/2021 23:02:43 - INFO - __main__ - Step 54557: {'lr': 0.0003599085364779092, 'samples': 10474944, 'steps': 54556, 'loss/train': 1.5947924852371216} -08/30/2021 23:02:44 - INFO - __main__ - Step 54558: {'lr': 0.0003599037700577423, 'samples': 10475136, 'steps': 54557, 'loss/train': 1.4165140390396118} -08/30/2021 23:02:44 - INFO - __main__ - Step 54559: {'lr': 0.0003598990035880545, 'samples': 10475328, 'steps': 54558, 'loss/train': 1.9224787950515747} -08/30/2021 23:02:46 - INFO - __main__ - Step 54560: {'lr': 0.0003598942370688479, 'samples': 10475520, 'steps': 54559, 'loss/train': 1.3067187070846558} -08/30/2021 23:02:47 - INFO - __main__ - Step 54561: {'lr': 0.0003598894705001246, 'samples': 10475712, 'steps': 54560, 'loss/train': 0.4878981411457062} -08/30/2021 23:02:47 - INFO - __main__ - Step 54562: {'lr': 0.00035988470388188684, 'samples': 10475904, 'steps': 54561, 'loss/train': 0.5279180407524109} -08/30/2021 23:02:47 - INFO - __main__ - Step 54563: {'lr': 0.0003598799372141367, 'samples': 10476096, 'steps': 54562, 'loss/train': 1.3532823324203491} -08/30/2021 23:02:48 - INFO - __main__ - Step 54564: {'lr': 0.00035987517049687633, 'samples': 10476288, 'steps': 54563, 'loss/train': 1.0842735767364502} -08/30/2021 23:02:48 - INFO - __main__ - Step 54565: {'lr': 0.0003598704037301079, 'samples': 10476480, 'steps': 54564, 'loss/train': 1.6678783893585205} -08/30/2021 23:02:50 - INFO - __main__ - Step 54566: {'lr': 0.00035986563691383364, 'samples': 10476672, 'steps': 54565, 'loss/train': 1.3109883069992065} -08/30/2021 23:02:50 - INFO - __main__ - Step 54567: {'lr': 0.0003598608700480556, 'samples': 10476864, 'steps': 54566, 'loss/train': 1.0542044639587402} -08/30/2021 23:02:50 - INFO - __main__ - Step 54568: {'lr': 0.00035985610313277595, 'samples': 10477056, 'steps': 54567, 'loss/train': 1.556660532951355} -08/30/2021 23:02:51 - INFO - __main__ - Step 54569: {'lr': 0.0003598513361679968, 'samples': 10477248, 'steps': 54568, 'loss/train': 0.9612125754356384} -08/30/2021 23:02:51 - INFO - __main__ - Step 54570: {'lr': 0.00035984656915372034, 'samples': 10477440, 'steps': 54569, 'loss/train': 1.0310747623443604} -08/30/2021 23:02:53 - INFO - __main__ - Step 54571: {'lr': 0.0003598418020899487, 'samples': 10477632, 'steps': 54570, 'loss/train': 1.6246334314346313} -08/30/2021 23:02:53 - INFO - __main__ - Step 54572: {'lr': 0.0003598370349766841, 'samples': 10477824, 'steps': 54571, 'loss/train': 0.3843275308609009} -08/30/2021 23:02:53 - INFO - __main__ - Step 54573: {'lr': 0.0003598322678139285, 'samples': 10478016, 'steps': 54572, 'loss/train': 1.4062119722366333} -08/30/2021 23:02:54 - INFO - __main__ - Step 54574: {'lr': 0.00035982750060168436, 'samples': 10478208, 'steps': 54573, 'loss/train': 1.4864474534988403} -08/30/2021 23:02:54 - INFO - __main__ - Step 54575: {'lr': 0.0003598227333399535, 'samples': 10478400, 'steps': 54574, 'loss/train': 1.512558937072754} -08/30/2021 23:02:56 - INFO - __main__ - Step 54576: {'lr': 0.00035981796602873825, 'samples': 10478592, 'steps': 54575, 'loss/train': 1.2762151956558228} -08/30/2021 23:02:56 - INFO - __main__ - Step 54577: {'lr': 0.00035981319866804074, 'samples': 10478784, 'steps': 54576, 'loss/train': 1.2455973625183105} -08/30/2021 23:02:56 - INFO - __main__ - Step 54578: {'lr': 0.00035980843125786306, 'samples': 10478976, 'steps': 54577, 'loss/train': 1.2093178033828735} -08/30/2021 23:02:57 - INFO - __main__ - Step 54579: {'lr': 0.0003598036637982074, 'samples': 10479168, 'steps': 54578, 'loss/train': 5.774199485778809} -08/30/2021 23:02:57 - INFO - __main__ - Step 54580: {'lr': 0.00035979889628907593, 'samples': 10479360, 'steps': 54579, 'loss/train': 1.66202712059021} -08/30/2021 23:02:58 - INFO - __main__ - Step 54581: {'lr': 0.0003597941287304708, 'samples': 10479552, 'steps': 54580, 'loss/train': 1.4471526145935059} -08/30/2021 23:02:59 - INFO - __main__ - Step 54582: {'lr': 0.0003597893611223941, 'samples': 10479744, 'steps': 54581, 'loss/train': 1.4222338199615479} -08/30/2021 23:02:59 - INFO - __main__ - Step 54583: {'lr': 0.00035978459346484794, 'samples': 10479936, 'steps': 54582, 'loss/train': 1.6904886960983276} -08/30/2021 23:03:00 - INFO - __main__ - Step 54584: {'lr': 0.0003597798257578346, 'samples': 10480128, 'steps': 54583, 'loss/train': 1.4182924032211304} -08/30/2021 23:03:00 - INFO - __main__ - Step 54585: {'lr': 0.0003597750580013561, 'samples': 10480320, 'steps': 54584, 'loss/train': 1.649872064590454} -08/30/2021 23:03:00 - INFO - __main__ - Step 54586: {'lr': 0.0003597702901954147, 'samples': 10480512, 'steps': 54585, 'loss/train': 1.757237195968628} -08/30/2021 23:03:02 - INFO - __main__ - Step 54587: {'lr': 0.00035976552234001256, 'samples': 10480704, 'steps': 54586, 'loss/train': 1.4790384769439697} -08/30/2021 23:03:02 - INFO - __main__ - Step 54588: {'lr': 0.00035976075443515176, 'samples': 10480896, 'steps': 54587, 'loss/train': 0.1956343799829483} -08/30/2021 23:03:03 - INFO - __main__ - Step 54589: {'lr': 0.0003597559864808344, 'samples': 10481088, 'steps': 54588, 'loss/train': 0.8604037761688232} -08/30/2021 23:03:03 - INFO - __main__ - Step 54590: {'lr': 0.0003597512184770627, 'samples': 10481280, 'steps': 54589, 'loss/train': 2.722109317779541} -08/30/2021 23:03:04 - INFO - __main__ - Step 54591: {'lr': 0.0003597464504238388, 'samples': 10481472, 'steps': 54590, 'loss/train': 1.6503816843032837} -08/30/2021 23:03:05 - INFO - __main__ - Step 54592: {'lr': 0.00035974168232116486, 'samples': 10481664, 'steps': 54591, 'loss/train': 1.8491023778915405} -08/30/2021 23:03:05 - INFO - __main__ - Step 54593: {'lr': 0.00035973691416904297, 'samples': 10481856, 'steps': 54592, 'loss/train': 1.453162670135498} -08/30/2021 23:03:06 - INFO - __main__ - Step 54594: {'lr': 0.0003597321459674754, 'samples': 10482048, 'steps': 54593, 'loss/train': 1.3821334838867188} -08/30/2021 23:03:06 - INFO - __main__ - Step 54595: {'lr': 0.0003597273777164641, 'samples': 10482240, 'steps': 54594, 'loss/train': 1.3869150876998901} -08/30/2021 23:03:07 - INFO - __main__ - Step 54596: {'lr': 0.00035972260941601145, 'samples': 10482432, 'steps': 54595, 'loss/train': 0.9404004216194153} -08/30/2021 23:03:08 - INFO - __main__ - Step 54597: {'lr': 0.0003597178410661194, 'samples': 10482624, 'steps': 54596, 'loss/train': 1.1494826078414917} -08/30/2021 23:03:08 - INFO - __main__ - Step 54598: {'lr': 0.00035971307266679023, 'samples': 10482816, 'steps': 54597, 'loss/train': 1.094840168952942} -08/30/2021 23:03:09 - INFO - __main__ - Step 54599: {'lr': 0.000359708304218026, 'samples': 10483008, 'steps': 54598, 'loss/train': 1.6898934841156006} -08/30/2021 23:03:09 - INFO - __main__ - Step 54600: {'lr': 0.00035970353571982897, 'samples': 10483200, 'steps': 54599, 'loss/train': 1.682647705078125} -08/30/2021 23:03:09 - INFO - __main__ - Step 54601: {'lr': 0.0003596987671722012, 'samples': 10483392, 'steps': 54600, 'loss/train': 1.36082923412323} -08/30/2021 23:03:11 - INFO - __main__ - Step 54602: {'lr': 0.00035969399857514484, 'samples': 10483584, 'steps': 54601, 'loss/train': 0.7325038313865662} -08/30/2021 23:03:11 - INFO - __main__ - Step 54603: {'lr': 0.00035968922992866205, 'samples': 10483776, 'steps': 54602, 'loss/train': 1.1663405895233154} -08/30/2021 23:03:12 - INFO - __main__ - Step 54604: {'lr': 0.00035968446123275493, 'samples': 10483968, 'steps': 54603, 'loss/train': 1.9017565250396729} -08/30/2021 23:03:12 - INFO - __main__ - Step 54605: {'lr': 0.00035967969248742576, 'samples': 10484160, 'steps': 54604, 'loss/train': 1.2085704803466797} -08/30/2021 23:03:12 - INFO - __main__ - Step 54606: {'lr': 0.00035967492369267664, 'samples': 10484352, 'steps': 54605, 'loss/train': 1.9153189659118652} -08/30/2021 23:03:13 - INFO - __main__ - Step 54607: {'lr': 0.00035967015484850964, 'samples': 10484544, 'steps': 54606, 'loss/train': 1.165961503982544} -08/30/2021 23:03:14 - INFO - __main__ - Step 54608: {'lr': 0.000359665385954927, 'samples': 10484736, 'steps': 54607, 'loss/train': 1.1614915132522583} -08/30/2021 23:03:15 - INFO - __main__ - Step 54609: {'lr': 0.00035966061701193073, 'samples': 10484928, 'steps': 54608, 'loss/train': 0.6280215978622437} -08/30/2021 23:03:15 - INFO - __main__ - Step 54610: {'lr': 0.00035965584801952316, 'samples': 10485120, 'steps': 54609, 'loss/train': 1.087389349937439} -08/30/2021 23:03:16 - INFO - __main__ - Step 54611: {'lr': 0.0003596510789777064, 'samples': 10485312, 'steps': 54610, 'loss/train': 1.3975533246994019} -08/30/2021 23:03:16 - INFO - __main__ - Step 54612: {'lr': 0.0003596463098864825, 'samples': 10485504, 'steps': 54611, 'loss/train': 1.3112858533859253} -08/30/2021 23:03:18 - INFO - __main__ - Step 54613: {'lr': 0.00035964154074585365, 'samples': 10485696, 'steps': 54612, 'loss/train': 1.4799295663833618} -08/30/2021 23:03:18 - INFO - __main__ - Step 54614: {'lr': 0.00035963677155582204, 'samples': 10485888, 'steps': 54613, 'loss/train': 1.3409079313278198} -08/30/2021 23:03:19 - INFO - __main__ - Step 54615: {'lr': 0.0003596320023163898, 'samples': 10486080, 'steps': 54614, 'loss/train': 0.8664289116859436} -08/30/2021 23:03:19 - INFO - __main__ - Step 54616: {'lr': 0.000359627233027559, 'samples': 10486272, 'steps': 54615, 'loss/train': 0.8100765943527222} -08/30/2021 23:03:20 - INFO - __main__ - Step 54617: {'lr': 0.0003596224636893319, 'samples': 10486464, 'steps': 54616, 'loss/train': 1.4202203750610352} -08/30/2021 23:03:21 - INFO - __main__ - Step 54618: {'lr': 0.0003596176943017107, 'samples': 10486656, 'steps': 54617, 'loss/train': 1.6955711841583252} -08/30/2021 23:03:22 - INFO - __main__ - Step 54619: {'lr': 0.0003596129248646974, 'samples': 10486848, 'steps': 54618, 'loss/train': 1.487973690032959} -08/30/2021 23:03:22 - INFO - __main__ - Step 54620: {'lr': 0.0003596081553782942, 'samples': 10487040, 'steps': 54619, 'loss/train': 1.3339719772338867} -08/30/2021 23:03:23 - INFO - __main__ - Step 54621: {'lr': 0.0003596033858425032, 'samples': 10487232, 'steps': 54620, 'loss/train': 1.9933583736419678} -08/30/2021 23:03:23 - INFO - __main__ - Step 54622: {'lr': 0.00035959861625732667, 'samples': 10487424, 'steps': 54621, 'loss/train': 1.547165870666504} -08/30/2021 23:03:24 - INFO - __main__ - Step 54623: {'lr': 0.0003595938466227667, 'samples': 10487616, 'steps': 54622, 'loss/train': 1.145972728729248} -08/30/2021 23:03:25 - INFO - __main__ - Step 54624: {'lr': 0.0003595890769388254, 'samples': 10487808, 'steps': 54623, 'loss/train': 1.2730042934417725} -08/30/2021 23:03:25 - INFO - __main__ - Step 54625: {'lr': 0.00035958430720550494, 'samples': 10488000, 'steps': 54624, 'loss/train': 1.6948461532592773} -08/30/2021 23:03:26 - INFO - __main__ - Step 54626: {'lr': 0.00035957953742280754, 'samples': 10488192, 'steps': 54625, 'loss/train': 1.0461784601211548} -08/30/2021 23:03:26 - INFO - __main__ - Step 54627: {'lr': 0.0003595747675907352, 'samples': 10488384, 'steps': 54626, 'loss/train': 1.3459765911102295} -08/30/2021 23:03:27 - INFO - __main__ - Step 54628: {'lr': 0.0003595699977092902, 'samples': 10488576, 'steps': 54627, 'loss/train': 1.5525670051574707} -08/30/2021 23:03:28 - INFO - __main__ - Step 54629: {'lr': 0.00035956522777847474, 'samples': 10488768, 'steps': 54628, 'loss/train': 1.1322119235992432} -08/30/2021 23:03:28 - INFO - __main__ - Step 54630: {'lr': 0.00035956045779829085, 'samples': 10488960, 'steps': 54629, 'loss/train': 1.0116513967514038} -08/30/2021 23:03:29 - INFO - __main__ - Step 54631: {'lr': 0.00035955568776874057, 'samples': 10489152, 'steps': 54630, 'loss/train': 1.490096926689148} -08/30/2021 23:03:29 - INFO - __main__ - Step 54632: {'lr': 0.0003595509176898263, 'samples': 10489344, 'steps': 54631, 'loss/train': 1.4106022119522095} -08/30/2021 23:03:31 - INFO - __main__ - Step 54633: {'lr': 0.0003595461475615501, 'samples': 10489536, 'steps': 54632, 'loss/train': 1.5777695178985596} -08/30/2021 23:03:31 - INFO - __main__ - Step 54634: {'lr': 0.00035954137738391405, 'samples': 10489728, 'steps': 54633, 'loss/train': 1.5173395872116089} -08/30/2021 23:03:32 - INFO - __main__ - Step 54635: {'lr': 0.00035953660715692037, 'samples': 10489920, 'steps': 54634, 'loss/train': 1.6186579465866089} -08/30/2021 23:03:32 - INFO - __main__ - Step 54636: {'lr': 0.0003595318368805711, 'samples': 10490112, 'steps': 54635, 'loss/train': 1.632763385772705} -08/30/2021 23:03:32 - INFO - __main__ - Step 54637: {'lr': 0.00035952706655486855, 'samples': 10490304, 'steps': 54636, 'loss/train': 1.479754090309143} -08/30/2021 23:03:33 - INFO - __main__ - Step 54638: {'lr': 0.0003595222961798148, 'samples': 10490496, 'steps': 54637, 'loss/train': 1.2317792177200317} -08/30/2021 23:03:34 - INFO - __main__ - Step 54639: {'lr': 0.000359517525755412, 'samples': 10490688, 'steps': 54638, 'loss/train': 1.6764943599700928} -08/30/2021 23:03:35 - INFO - __main__ - Step 54640: {'lr': 0.0003595127552816623, 'samples': 10490880, 'steps': 54639, 'loss/train': 0.9140795469284058} -08/30/2021 23:03:35 - INFO - __main__ - Step 54641: {'lr': 0.00035950798475856783, 'samples': 10491072, 'steps': 54640, 'loss/train': 1.450689435005188} -08/30/2021 23:03:35 - INFO - __main__ - Step 54642: {'lr': 0.0003595032141861307, 'samples': 10491264, 'steps': 54641, 'loss/train': 1.4408491849899292} -08/30/2021 23:03:36 - INFO - __main__ - Step 54643: {'lr': 0.00035949844356435314, 'samples': 10491456, 'steps': 54642, 'loss/train': 1.7538901567459106} -08/30/2021 23:03:37 - INFO - __main__ - Step 54644: {'lr': 0.00035949367289323723, 'samples': 10491648, 'steps': 54643, 'loss/train': 1.5709326267242432} -08/30/2021 23:03:37 - INFO - __main__ - Step 54645: {'lr': 0.00035948890217278525, 'samples': 10491840, 'steps': 54644, 'loss/train': 1.1291842460632324} -08/30/2021 23:03:38 - INFO - __main__ - Step 54646: {'lr': 0.0003594841314029992, 'samples': 10492032, 'steps': 54645, 'loss/train': 0.7814945578575134} -08/30/2021 23:03:38 - INFO - __main__ - Step 54647: {'lr': 0.00035947936058388134, 'samples': 10492224, 'steps': 54646, 'loss/train': 1.2533886432647705} -08/30/2021 23:03:39 - INFO - __main__ - Step 54648: {'lr': 0.00035947458971543375, 'samples': 10492416, 'steps': 54647, 'loss/train': 1.6516329050064087} -08/30/2021 23:03:40 - INFO - __main__ - Step 54649: {'lr': 0.00035946981879765854, 'samples': 10492608, 'steps': 54648, 'loss/train': 1.001318335533142} -08/30/2021 23:03:40 - INFO - __main__ - Step 54650: {'lr': 0.000359465047830558, 'samples': 10492800, 'steps': 54649, 'loss/train': 0.6158228516578674} -08/30/2021 23:03:41 - INFO - __main__ - Step 54651: {'lr': 0.0003594602768141342, 'samples': 10492992, 'steps': 54650, 'loss/train': 1.5872671604156494} -08/30/2021 23:03:41 - INFO - __main__ - Step 54652: {'lr': 0.0003594555057483892, 'samples': 10493184, 'steps': 54651, 'loss/train': 0.7219210267066956} -08/30/2021 23:03:41 - INFO - __main__ - Step 54653: {'lr': 0.0003594507346333253, 'samples': 10493376, 'steps': 54652, 'loss/train': 1.807542085647583} -08/30/2021 23:03:43 - INFO - __main__ - Step 54654: {'lr': 0.00035944596346894456, 'samples': 10493568, 'steps': 54653, 'loss/train': 0.4334940016269684} -08/30/2021 23:03:44 - INFO - __main__ - Step 54655: {'lr': 0.00035944119225524916, 'samples': 10493760, 'steps': 54654, 'loss/train': 0.6189199686050415} -08/30/2021 23:03:44 - INFO - __main__ - Step 54656: {'lr': 0.00035943642099224126, 'samples': 10493952, 'steps': 54655, 'loss/train': 1.6385068893432617} -08/30/2021 23:03:44 - INFO - __main__ - Step 54657: {'lr': 0.00035943164967992304, 'samples': 10494144, 'steps': 54656, 'loss/train': 1.5558799505233765} -08/30/2021 23:03:45 - INFO - __main__ - Step 54658: {'lr': 0.00035942687831829655, 'samples': 10494336, 'steps': 54657, 'loss/train': 1.5776126384735107} -08/30/2021 23:03:45 - INFO - __main__ - Step 54659: {'lr': 0.000359422106907364, 'samples': 10494528, 'steps': 54658, 'loss/train': 1.2401173114776611} -08/30/2021 23:03:46 - INFO - __main__ - Step 54660: {'lr': 0.00035941733544712755, 'samples': 10494720, 'steps': 54659, 'loss/train': 1.4024578332901} -08/30/2021 23:03:47 - INFO - __main__ - Step 54661: {'lr': 0.0003594125639375894, 'samples': 10494912, 'steps': 54660, 'loss/train': 1.390967845916748} -08/30/2021 23:03:47 - INFO - __main__ - Step 54662: {'lr': 0.00035940779237875154, 'samples': 10495104, 'steps': 54661, 'loss/train': 1.1025558710098267} -08/30/2021 23:03:47 - INFO - __main__ - Step 54663: {'lr': 0.00035940302077061624, 'samples': 10495296, 'steps': 54662, 'loss/train': 1.749678134918213} -08/30/2021 23:03:48 - INFO - __main__ - Step 54664: {'lr': 0.0003593982491131857, 'samples': 10495488, 'steps': 54663, 'loss/train': 1.2479114532470703} -08/30/2021 23:03:49 - INFO - __main__ - Step 54665: {'lr': 0.00035939347740646186, 'samples': 10495680, 'steps': 54664, 'loss/train': 1.4891436100006104} -08/30/2021 23:03:50 - INFO - __main__ - Step 54666: {'lr': 0.00035938870565044713, 'samples': 10495872, 'steps': 54665, 'loss/train': 1.5442767143249512} -08/30/2021 23:03:50 - INFO - __main__ - Step 54667: {'lr': 0.0003593839338451435, 'samples': 10496064, 'steps': 54666, 'loss/train': 1.1562092304229736} -08/30/2021 23:03:51 - INFO - __main__ - Step 54668: {'lr': 0.0003593791619905532, 'samples': 10496256, 'steps': 54667, 'loss/train': 1.853531002998352} -08/30/2021 23:03:51 - INFO - __main__ - Step 54669: {'lr': 0.00035937439008667827, 'samples': 10496448, 'steps': 54668, 'loss/train': 1.4185580015182495} -08/30/2021 23:03:53 - INFO - __main__ - Step 54670: {'lr': 0.00035936961813352094, 'samples': 10496640, 'steps': 54669, 'loss/train': 0.33569204807281494} -08/30/2021 23:03:54 - INFO - __main__ - Step 54671: {'lr': 0.0003593648461310833, 'samples': 10496832, 'steps': 54670, 'loss/train': 1.240635633468628} -08/30/2021 23:03:54 - INFO - __main__ - Step 54672: {'lr': 0.0003593600740793676, 'samples': 10497024, 'steps': 54671, 'loss/train': 1.147263526916504} -08/30/2021 23:03:55 - INFO - __main__ - Step 54673: {'lr': 0.00035935530197837596, 'samples': 10497216, 'steps': 54672, 'loss/train': 0.6365401744842529} -08/30/2021 23:03:55 - INFO - __main__ - Step 54674: {'lr': 0.00035935052982811046, 'samples': 10497408, 'steps': 54673, 'loss/train': 0.9249856472015381} -08/30/2021 23:03:57 - INFO - __main__ - Step 54675: {'lr': 0.00035934575762857333, 'samples': 10497600, 'steps': 54674, 'loss/train': 1.630801796913147} -08/30/2021 23:03:57 - INFO - __main__ - Step 54676: {'lr': 0.00035934098537976675, 'samples': 10497792, 'steps': 54675, 'loss/train': 1.8333457708358765} -08/30/2021 23:03:58 - INFO - __main__ - Step 54677: {'lr': 0.00035933621308169273, 'samples': 10497984, 'steps': 54676, 'loss/train': 0.16368624567985535} -08/30/2021 23:03:58 - INFO - __main__ - Step 54678: {'lr': 0.0003593314407343535, 'samples': 10498176, 'steps': 54677, 'loss/train': 0.24434149265289307} -08/30/2021 23:03:58 - INFO - __main__ - Step 54679: {'lr': 0.00035932666833775117, 'samples': 10498368, 'steps': 54678, 'loss/train': 1.4497014284133911} -08/30/2021 23:03:59 - INFO - __main__ - Step 54680: {'lr': 0.00035932189589188803, 'samples': 10498560, 'steps': 54679, 'loss/train': 1.4546630382537842} -08/30/2021 23:04:00 - INFO - __main__ - Step 54681: {'lr': 0.00035931712339676617, 'samples': 10498752, 'steps': 54680, 'loss/train': 0.8067395091056824} -08/30/2021 23:04:00 - INFO - __main__ - Step 54682: {'lr': 0.00035931235085238754, 'samples': 10498944, 'steps': 54681, 'loss/train': 1.4721364974975586} -08/30/2021 23:04:01 - INFO - __main__ - Step 54683: {'lr': 0.0003593075782587545, 'samples': 10499136, 'steps': 54682, 'loss/train': 0.8990991115570068} -08/30/2021 23:04:01 - INFO - __main__ - Step 54684: {'lr': 0.0003593028056158692, 'samples': 10499328, 'steps': 54683, 'loss/train': 1.0903825759887695} -08/30/2021 23:04:02 - INFO - __main__ - Step 54685: {'lr': 0.0003592980329237337, 'samples': 10499520, 'steps': 54684, 'loss/train': 1.6617538928985596} -08/30/2021 23:04:03 - INFO - __main__ - Step 54686: {'lr': 0.0003592932601823502, 'samples': 10499712, 'steps': 54685, 'loss/train': 0.9660040736198425} -08/30/2021 23:04:04 - INFO - __main__ - Step 54687: {'lr': 0.0003592884873917209, 'samples': 10499904, 'steps': 54686, 'loss/train': 1.1456538438796997} -08/30/2021 23:04:04 - INFO - __main__ - Step 54688: {'lr': 0.0003592837145518479, 'samples': 10500096, 'steps': 54687, 'loss/train': 2.5816855430603027} -08/30/2021 23:04:04 - INFO - __main__ - Step 54689: {'lr': 0.00035927894166273323, 'samples': 10500288, 'steps': 54688, 'loss/train': 0.042873017489910126} -08/30/2021 23:04:05 - INFO - __main__ - Step 54690: {'lr': 0.0003592741687243792, 'samples': 10500480, 'steps': 54689, 'loss/train': 0.6734894514083862} -08/30/2021 23:04:06 - INFO - __main__ - Step 54691: {'lr': 0.00035926939573678796, 'samples': 10500672, 'steps': 54690, 'loss/train': 0.19261178374290466} -08/30/2021 23:04:07 - INFO - __main__ - Step 54692: {'lr': 0.0003592646226999616, 'samples': 10500864, 'steps': 54691, 'loss/train': 1.3513233661651611} -08/30/2021 23:04:07 - INFO - __main__ - Step 54693: {'lr': 0.0003592598496139023, 'samples': 10501056, 'steps': 54692, 'loss/train': 0.6984632015228271} -08/30/2021 23:04:07 - INFO - __main__ - Step 54694: {'lr': 0.0003592550764786122, 'samples': 10501248, 'steps': 54693, 'loss/train': 1.274774432182312} -08/30/2021 23:04:08 - INFO - __main__ - Step 54695: {'lr': 0.00035925030329409343, 'samples': 10501440, 'steps': 54694, 'loss/train': 1.4966890811920166} -08/30/2021 23:04:08 - INFO - __main__ - Step 54696: {'lr': 0.0003592455300603481, 'samples': 10501632, 'steps': 54695, 'loss/train': 1.3233423233032227} -08/30/2021 23:04:09 - INFO - __main__ - Step 54697: {'lr': 0.0003592407567773785, 'samples': 10501824, 'steps': 54696, 'loss/train': 1.7010083198547363} -08/30/2021 23:04:10 - INFO - __main__ - Step 54698: {'lr': 0.0003592359834451866, 'samples': 10502016, 'steps': 54697, 'loss/train': 1.6510733366012573} -08/30/2021 23:04:10 - INFO - __main__ - Step 54699: {'lr': 0.0003592312100637748, 'samples': 10502208, 'steps': 54698, 'loss/train': 1.4536194801330566} -08/30/2021 23:04:11 - INFO - __main__ - Step 54700: {'lr': 0.00035922643663314504, 'samples': 10502400, 'steps': 54699, 'loss/train': 1.4917083978652954} -08/30/2021 23:04:11 - INFO - __main__ - Step 54701: {'lr': 0.00035922166315329954, 'samples': 10502592, 'steps': 54700, 'loss/train': 1.3184608221054077} -08/30/2021 23:04:13 - INFO - __main__ - Step 54702: {'lr': 0.0003592168896242404, 'samples': 10502784, 'steps': 54701, 'loss/train': 0.8541215062141418} -08/30/2021 23:04:13 - INFO - __main__ - Step 54703: {'lr': 0.00035921211604596985, 'samples': 10502976, 'steps': 54702, 'loss/train': 0.5011487007141113} -08/30/2021 23:04:13 - INFO - __main__ - Step 54704: {'lr': 0.00035920734241849, 'samples': 10503168, 'steps': 54703, 'loss/train': 1.5765939950942993} -08/30/2021 23:04:14 - INFO - __main__ - Step 54705: {'lr': 0.00035920256874180304, 'samples': 10503360, 'steps': 54704, 'loss/train': 0.9782493710517883} -08/30/2021 23:04:14 - INFO - __main__ - Step 54706: {'lr': 0.00035919779501591097, 'samples': 10503552, 'steps': 54705, 'loss/train': 1.5047963857650757} -08/30/2021 23:04:15 - INFO - __main__ - Step 54707: {'lr': 0.00035919302124081613, 'samples': 10503744, 'steps': 54706, 'loss/train': 1.508135199546814} -08/30/2021 23:04:16 - INFO - __main__ - Step 54708: {'lr': 0.0003591882474165207, 'samples': 10503936, 'steps': 54707, 'loss/train': 1.7539702653884888} -08/30/2021 23:04:16 - INFO - __main__ - Step 54709: {'lr': 0.00035918347354302663, 'samples': 10504128, 'steps': 54708, 'loss/train': 1.267782211303711} -08/30/2021 23:04:17 - INFO - __main__ - Step 54710: {'lr': 0.00035917869962033615, 'samples': 10504320, 'steps': 54709, 'loss/train': 1.2069759368896484} -08/30/2021 23:04:17 - INFO - __main__ - Step 54711: {'lr': 0.00035917392564845146, 'samples': 10504512, 'steps': 54710, 'loss/train': 0.7255215644836426} -08/30/2021 23:04:18 - INFO - __main__ - Step 54712: {'lr': 0.00035916915162737467, 'samples': 10504704, 'steps': 54711, 'loss/train': 1.448610782623291} -08/30/2021 23:04:19 - INFO - __main__ - Step 54713: {'lr': 0.00035916437755710795, 'samples': 10504896, 'steps': 54712, 'loss/train': 1.2432438135147095} -08/30/2021 23:04:19 - INFO - __main__ - Step 54714: {'lr': 0.0003591596034376535, 'samples': 10505088, 'steps': 54713, 'loss/train': 1.4643007516860962} -08/30/2021 23:04:20 - INFO - __main__ - Step 54715: {'lr': 0.0003591548292690134, 'samples': 10505280, 'steps': 54714, 'loss/train': 1.5806128978729248} -08/30/2021 23:04:20 - INFO - __main__ - Step 54716: {'lr': 0.0003591500550511898, 'samples': 10505472, 'steps': 54715, 'loss/train': 1.3093656301498413} -08/30/2021 23:04:21 - INFO - __main__ - Step 54717: {'lr': 0.00035914528078418486, 'samples': 10505664, 'steps': 54716, 'loss/train': 1.8600953817367554} -08/30/2021 23:04:22 - INFO - __main__ - Step 54718: {'lr': 0.0003591405064680007, 'samples': 10505856, 'steps': 54717, 'loss/train': 1.120902419090271} -08/30/2021 23:04:22 - INFO - __main__ - Step 54719: {'lr': 0.0003591357321026396, 'samples': 10506048, 'steps': 54718, 'loss/train': 1.6283214092254639} -08/30/2021 23:04:23 - INFO - __main__ - Step 54720: {'lr': 0.00035913095768810356, 'samples': 10506240, 'steps': 54719, 'loss/train': 1.5333529710769653} -08/30/2021 23:04:23 - INFO - __main__ - Step 54721: {'lr': 0.00035912618322439483, 'samples': 10506432, 'steps': 54720, 'loss/train': 1.8235855102539062} -08/30/2021 23:04:25 - INFO - __main__ - Step 54722: {'lr': 0.00035912140871151554, 'samples': 10506624, 'steps': 54721, 'loss/train': 1.3883310556411743} -08/30/2021 23:04:26 - INFO - __main__ - Step 54723: {'lr': 0.0003591166341494678, 'samples': 10506816, 'steps': 54722, 'loss/train': 0.9013878703117371} -08/30/2021 23:04:26 - INFO - __main__ - Step 54724: {'lr': 0.00035911185953825373, 'samples': 10507008, 'steps': 54723, 'loss/train': 1.7986218929290771} -08/30/2021 23:04:26 - INFO - __main__ - Step 54725: {'lr': 0.0003591070848778756, 'samples': 10507200, 'steps': 54724, 'loss/train': 1.0796217918395996} -08/30/2021 23:04:27 - INFO - __main__ - Step 54726: {'lr': 0.0003591023101683355, 'samples': 10507392, 'steps': 54725, 'loss/train': 1.3720126152038574} -08/30/2021 23:04:27 - INFO - __main__ - Step 54727: {'lr': 0.0003590975354096356, 'samples': 10507584, 'steps': 54726, 'loss/train': 1.1427823305130005} -08/30/2021 23:04:29 - INFO - __main__ - Step 54728: {'lr': 0.000359092760601778, 'samples': 10507776, 'steps': 54727, 'loss/train': 0.9771320819854736} -08/30/2021 23:04:29 - INFO - __main__ - Step 54729: {'lr': 0.0003590879857447649, 'samples': 10507968, 'steps': 54728, 'loss/train': 1.170641303062439} -08/30/2021 23:04:30 - INFO - __main__ - Step 54730: {'lr': 0.0003590832108385985, 'samples': 10508160, 'steps': 54729, 'loss/train': 1.526761770248413} -08/30/2021 23:04:30 - INFO - __main__ - Step 54731: {'lr': 0.0003590784358832808, 'samples': 10508352, 'steps': 54730, 'loss/train': 0.8689559698104858} -08/30/2021 23:04:30 - INFO - __main__ - Step 54732: {'lr': 0.00035907366087881403, 'samples': 10508544, 'steps': 54731, 'loss/train': 1.3794056177139282} -08/30/2021 23:04:32 - INFO - __main__ - Step 54733: {'lr': 0.00035906888582520034, 'samples': 10508736, 'steps': 54732, 'loss/train': 2.078857421875} -08/30/2021 23:04:32 - INFO - __main__ - Step 54734: {'lr': 0.000359064110722442, 'samples': 10508928, 'steps': 54733, 'loss/train': 1.4995900392532349} -08/30/2021 23:04:33 - INFO - __main__ - Step 54735: {'lr': 0.00035905933557054103, 'samples': 10509120, 'steps': 54734, 'loss/train': 1.1124764680862427} -08/30/2021 23:04:33 - INFO - __main__ - Step 54736: {'lr': 0.0003590545603694996, 'samples': 10509312, 'steps': 54735, 'loss/train': 0.06038980185985565} -08/30/2021 23:04:33 - INFO - __main__ - Step 54737: {'lr': 0.0003590497851193198, 'samples': 10509504, 'steps': 54736, 'loss/train': 1.0883455276489258} -08/30/2021 23:04:35 - INFO - __main__ - Step 54738: {'lr': 0.00035904500982000386, 'samples': 10509696, 'steps': 54737, 'loss/train': 0.20443525910377502} -08/30/2021 23:04:36 - INFO - __main__ - Step 54739: {'lr': 0.0003590402344715539, 'samples': 10509888, 'steps': 54738, 'loss/train': 1.583376169204712} -08/30/2021 23:04:36 - INFO - __main__ - Step 54740: {'lr': 0.00035903545907397215, 'samples': 10510080, 'steps': 54739, 'loss/train': 0.8244765996932983} -08/30/2021 23:04:36 - INFO - __main__ - Step 54741: {'lr': 0.0003590306836272608, 'samples': 10510272, 'steps': 54740, 'loss/train': 1.1616321802139282} -08/30/2021 23:04:37 - INFO - __main__ - Step 54742: {'lr': 0.0003590259081314218, 'samples': 10510464, 'steps': 54741, 'loss/train': 1.4172818660736084} -08/30/2021 23:04:37 - INFO - __main__ - Step 54743: {'lr': 0.00035902113258645733, 'samples': 10510656, 'steps': 54742, 'loss/train': 0.019485360011458397} -08/30/2021 23:04:39 - INFO - __main__ - Step 54744: {'lr': 0.0003590163569923697, 'samples': 10510848, 'steps': 54743, 'loss/train': 1.5700057744979858} -08/30/2021 23:04:40 - INFO - __main__ - Step 54745: {'lr': 0.000359011581349161, 'samples': 10511040, 'steps': 54744, 'loss/train': 1.7024787664413452} -08/30/2021 23:04:40 - INFO - __main__ - Step 54746: {'lr': 0.00035900680565683333, 'samples': 10511232, 'steps': 54745, 'loss/train': 1.552464246749878} -08/30/2021 23:04:41 - INFO - __main__ - Step 54747: {'lr': 0.00035900202991538894, 'samples': 10511424, 'steps': 54746, 'loss/train': 0.4057244062423706} -08/30/2021 23:04:41 - INFO - __main__ - Step 54748: {'lr': 0.00035899725412482985, 'samples': 10511616, 'steps': 54747, 'loss/train': 0.37845394015312195} -08/30/2021 23:04:41 - INFO - __main__ - Step 54749: {'lr': 0.00035899247828515837, 'samples': 10511808, 'steps': 54748, 'loss/train': 0.3141857385635376} -08/30/2021 23:04:43 - INFO - __main__ - Step 54750: {'lr': 0.0003589877023963765, 'samples': 10512000, 'steps': 54749, 'loss/train': 1.2904633283615112} -08/30/2021 23:04:43 - INFO - __main__ - Step 54751: {'lr': 0.0003589829264584864, 'samples': 10512192, 'steps': 54750, 'loss/train': 1.0025943517684937} -08/30/2021 23:04:44 - INFO - __main__ - Step 54752: {'lr': 0.00035897815047149033, 'samples': 10512384, 'steps': 54751, 'loss/train': 1.240922212600708} -08/30/2021 23:04:44 - INFO - __main__ - Step 54753: {'lr': 0.00035897337443539036, 'samples': 10512576, 'steps': 54752, 'loss/train': 1.5903171300888062} -08/30/2021 23:04:44 - INFO - __main__ - Step 54754: {'lr': 0.0003589685983501887, 'samples': 10512768, 'steps': 54753, 'loss/train': 0.7101109027862549} -08/30/2021 23:04:45 - INFO - __main__ - Step 54755: {'lr': 0.0003589638222158874, 'samples': 10512960, 'steps': 54754, 'loss/train': 1.090273141860962} -08/30/2021 23:04:46 - INFO - __main__ - Step 54756: {'lr': 0.00035895904603248875, 'samples': 10513152, 'steps': 54755, 'loss/train': 1.601698875427246} -08/30/2021 23:04:47 - INFO - __main__ - Step 54757: {'lr': 0.0003589542697999948, 'samples': 10513344, 'steps': 54756, 'loss/train': 3.522212028503418} -08/30/2021 23:04:47 - INFO - __main__ - Step 54758: {'lr': 0.00035894949351840784, 'samples': 10513536, 'steps': 54757, 'loss/train': 2.6060585975646973} -08/30/2021 23:04:47 - INFO - __main__ - Step 54759: {'lr': 0.0003589447171877298, 'samples': 10513728, 'steps': 54758, 'loss/train': 1.4959547519683838} -08/30/2021 23:04:48 - INFO - __main__ - Step 54760: {'lr': 0.000358939940807963, 'samples': 10513920, 'steps': 54759, 'loss/train': 0.6446624994277954} -08/30/2021 23:04:49 - INFO - __main__ - Step 54761: {'lr': 0.00035893516437910956, 'samples': 10514112, 'steps': 54760, 'loss/train': 1.4268418550491333} -08/30/2021 23:04:50 - INFO - __main__ - Step 54762: {'lr': 0.00035893038790117156, 'samples': 10514304, 'steps': 54761, 'loss/train': 1.3592456579208374} -08/30/2021 23:04:50 - INFO - __main__ - Step 54763: {'lr': 0.0003589256113741513, 'samples': 10514496, 'steps': 54762, 'loss/train': 1.4319016933441162} -08/30/2021 23:04:51 - INFO - __main__ - Step 54764: {'lr': 0.00035892083479805077, 'samples': 10514688, 'steps': 54763, 'loss/train': 1.1870619058609009} -08/30/2021 23:04:51 - INFO - __main__ - Step 54765: {'lr': 0.0003589160581728722, 'samples': 10514880, 'steps': 54764, 'loss/train': 1.6153000593185425} -08/30/2021 23:04:53 - INFO - __main__ - Step 54766: {'lr': 0.0003589112814986177, 'samples': 10515072, 'steps': 54765, 'loss/train': 0.8619815707206726} -08/30/2021 23:04:53 - INFO - __main__ - Step 54767: {'lr': 0.00035890650477528953, 'samples': 10515264, 'steps': 54766, 'loss/train': 0.8369243144989014} -08/30/2021 23:04:53 - INFO - __main__ - Step 54768: {'lr': 0.00035890172800288965, 'samples': 10515456, 'steps': 54767, 'loss/train': 1.1500431299209595} -08/30/2021 23:04:54 - INFO - __main__ - Step 54769: {'lr': 0.0003588969511814205, 'samples': 10515648, 'steps': 54768, 'loss/train': 1.7910209894180298} -08/30/2021 23:04:54 - INFO - __main__ - Step 54770: {'lr': 0.00035889217431088396, 'samples': 10515840, 'steps': 54769, 'loss/train': 1.439741849899292} -08/30/2021 23:04:56 - INFO - __main__ - Step 54771: {'lr': 0.00035888739739128227, 'samples': 10516032, 'steps': 54770, 'loss/train': 0.945563554763794} -08/30/2021 23:04:56 - INFO - __main__ - Step 54772: {'lr': 0.00035888262042261767, 'samples': 10516224, 'steps': 54771, 'loss/train': 1.5466349124908447} -08/30/2021 23:04:57 - INFO - __main__ - Step 54773: {'lr': 0.0003588778434048922, 'samples': 10516416, 'steps': 54772, 'loss/train': 1.614445447921753} -08/30/2021 23:04:57 - INFO - __main__ - Step 54774: {'lr': 0.0003588730663381081, 'samples': 10516608, 'steps': 54773, 'loss/train': 1.1095051765441895} -08/30/2021 23:04:57 - INFO - __main__ - Step 54775: {'lr': 0.00035886828922226737, 'samples': 10516800, 'steps': 54774, 'loss/train': 0.934881329536438} -08/30/2021 23:04:58 - INFO - __main__ - Step 54776: {'lr': 0.00035886351205737237, 'samples': 10516992, 'steps': 54775, 'loss/train': 0.8662691712379456} -08/30/2021 23:04:59 - INFO - __main__ - Step 54777: {'lr': 0.00035885873484342514, 'samples': 10517184, 'steps': 54776, 'loss/train': 0.26917487382888794} -08/30/2021 23:05:00 - INFO - __main__ - Step 54778: {'lr': 0.00035885395758042784, 'samples': 10517376, 'steps': 54777, 'loss/train': 1.4882285594940186} -08/30/2021 23:05:00 - INFO - __main__ - Step 54779: {'lr': 0.0003588491802683826, 'samples': 10517568, 'steps': 54778, 'loss/train': 1.3917410373687744} -08/30/2021 23:05:00 - INFO - __main__ - Step 54780: {'lr': 0.0003588444029072916, 'samples': 10517760, 'steps': 54779, 'loss/train': 0.669773280620575} -08/30/2021 23:05:01 - INFO - __main__ - Step 54781: {'lr': 0.000358839625497157, 'samples': 10517952, 'steps': 54780, 'loss/train': 0.9478147625923157} -08/30/2021 23:05:03 - INFO - __main__ - Step 54782: {'lr': 0.0003588348480379809, 'samples': 10518144, 'steps': 54781, 'loss/train': 1.8828073740005493} -08/30/2021 23:05:03 - INFO - __main__ - Step 54783: {'lr': 0.0003588300705297656, 'samples': 10518336, 'steps': 54782, 'loss/train': 0.32478082180023193} -08/30/2021 23:05:04 - INFO - __main__ - Step 54784: {'lr': 0.0003588252929725131, 'samples': 10518528, 'steps': 54783, 'loss/train': 1.2364157438278198} -08/30/2021 23:05:04 - INFO - __main__ - Step 54785: {'lr': 0.0003588205153662256, 'samples': 10518720, 'steps': 54784, 'loss/train': 0.6688212752342224} -08/30/2021 23:05:04 - INFO - __main__ - Step 54786: {'lr': 0.0003588157377109052, 'samples': 10518912, 'steps': 54785, 'loss/train': 1.8014135360717773} -08/30/2021 23:05:06 - INFO - __main__ - Step 54787: {'lr': 0.0003588109600065541, 'samples': 10519104, 'steps': 54786, 'loss/train': 1.2262176275253296} -08/30/2021 23:05:06 - INFO - __main__ - Step 54788: {'lr': 0.0003588061822531745, 'samples': 10519296, 'steps': 54787, 'loss/train': 1.5536518096923828} -08/30/2021 23:05:07 - INFO - __main__ - Step 54789: {'lr': 0.00035880140445076857, 'samples': 10519488, 'steps': 54788, 'loss/train': 1.193449854850769} -08/30/2021 23:05:07 - INFO - __main__ - Step 54790: {'lr': 0.0003587966265993384, 'samples': 10519680, 'steps': 54789, 'loss/train': 1.524629831314087} -08/30/2021 23:05:07 - INFO - __main__ - Step 54791: {'lr': 0.0003587918486988861, 'samples': 10519872, 'steps': 54790, 'loss/train': 1.247126579284668} -08/30/2021 23:05:09 - INFO - __main__ - Step 54792: {'lr': 0.0003587870707494139, 'samples': 10520064, 'steps': 54791, 'loss/train': 1.4787753820419312} -08/30/2021 23:05:09 - INFO - __main__ - Step 54793: {'lr': 0.0003587822927509239, 'samples': 10520256, 'steps': 54792, 'loss/train': 2.1730892658233643} -08/30/2021 23:05:10 - INFO - __main__ - Step 54794: {'lr': 0.00035877751470341824, 'samples': 10520448, 'steps': 54793, 'loss/train': 1.630399465560913} -08/30/2021 23:05:10 - INFO - __main__ - Step 54795: {'lr': 0.00035877273660689916, 'samples': 10520640, 'steps': 54794, 'loss/train': 1.3768742084503174} -08/30/2021 23:05:10 - INFO - __main__ - Step 54796: {'lr': 0.0003587679584613688, 'samples': 10520832, 'steps': 54795, 'loss/train': 1.5608149766921997} -08/30/2021 23:05:12 - INFO - __main__ - Step 54797: {'lr': 0.00035876318026682925, 'samples': 10521024, 'steps': 54796, 'loss/train': 0.5692048072814941} -08/30/2021 23:05:12 - INFO - __main__ - Step 54798: {'lr': 0.0003587584020232827, 'samples': 10521216, 'steps': 54797, 'loss/train': 1.264999508857727} -08/30/2021 23:05:13 - INFO - __main__ - Step 54799: {'lr': 0.00035875362373073125, 'samples': 10521408, 'steps': 54798, 'loss/train': 1.406759262084961} -08/30/2021 23:05:13 - INFO - __main__ - Step 54800: {'lr': 0.00035874884538917705, 'samples': 10521600, 'steps': 54799, 'loss/train': 1.4888978004455566} -08/30/2021 23:05:13 - INFO - __main__ - Step 54801: {'lr': 0.0003587440669986224, 'samples': 10521792, 'steps': 54800, 'loss/train': 1.008644938468933} -08/30/2021 23:05:15 - INFO - __main__ - Step 54802: {'lr': 0.00035873928855906933, 'samples': 10521984, 'steps': 54801, 'loss/train': 0.9551413655281067} -08/30/2021 23:05:15 - INFO - __main__ - Step 54803: {'lr': 0.00035873451007052, 'samples': 10522176, 'steps': 54802, 'loss/train': 1.6367748975753784} -08/30/2021 23:05:16 - INFO - __main__ - Step 54804: {'lr': 0.00035872973153297657, 'samples': 10522368, 'steps': 54803, 'loss/train': 1.3025861978530884} -08/30/2021 23:05:16 - INFO - __main__ - Step 54805: {'lr': 0.0003587249529464412, 'samples': 10522560, 'steps': 54804, 'loss/train': 1.1687612533569336} -08/30/2021 23:05:16 - INFO - __main__ - Step 54806: {'lr': 0.00035872017431091605, 'samples': 10522752, 'steps': 54805, 'loss/train': 1.6905964612960815} -08/30/2021 23:05:18 - INFO - __main__ - Step 54807: {'lr': 0.0003587153956264033, 'samples': 10522944, 'steps': 54806, 'loss/train': 1.4622339010238647} -08/30/2021 23:05:18 - INFO - __main__ - Step 54808: {'lr': 0.00035871061689290496, 'samples': 10523136, 'steps': 54807, 'loss/train': 1.3033421039581299} -08/30/2021 23:05:19 - INFO - __main__ - Step 54809: {'lr': 0.00035870583811042347, 'samples': 10523328, 'steps': 54808, 'loss/train': 1.251278042793274} -08/30/2021 23:05:19 - INFO - __main__ - Step 54810: {'lr': 0.0003587010592789607, 'samples': 10523520, 'steps': 54809, 'loss/train': 0.07526694238185883} -08/30/2021 23:05:19 - INFO - __main__ - Step 54811: {'lr': 0.0003586962803985189, 'samples': 10523712, 'steps': 54810, 'loss/train': 1.7876299619674683} -08/30/2021 23:05:21 - INFO - __main__ - Step 54812: {'lr': 0.00035869150146910025, 'samples': 10523904, 'steps': 54811, 'loss/train': 0.04926743730902672} -08/30/2021 23:05:21 - INFO - __main__ - Step 54813: {'lr': 0.00035868672249070684, 'samples': 10524096, 'steps': 54812, 'loss/train': 1.7865430116653442} -08/30/2021 23:05:22 - INFO - __main__ - Step 54814: {'lr': 0.00035868194346334094, 'samples': 10524288, 'steps': 54813, 'loss/train': 0.6404796838760376} -08/30/2021 23:05:22 - INFO - __main__ - Step 54815: {'lr': 0.0003586771643870046, 'samples': 10524480, 'steps': 54814, 'loss/train': 1.2337820529937744} -08/30/2021 23:05:22 - INFO - __main__ - Step 54816: {'lr': 0.0003586723852617, 'samples': 10524672, 'steps': 54815, 'loss/train': 1.2930505275726318} -08/30/2021 23:05:24 - INFO - __main__ - Step 54817: {'lr': 0.00035866760608742934, 'samples': 10524864, 'steps': 54816, 'loss/train': 2.1130659580230713} -08/30/2021 23:05:25 - INFO - __main__ - Step 54818: {'lr': 0.0003586628268641947, 'samples': 10525056, 'steps': 54817, 'loss/train': 1.547697901725769} -08/30/2021 23:05:25 - INFO - __main__ - Step 54819: {'lr': 0.00035865804759199825, 'samples': 10525248, 'steps': 54818, 'loss/train': 1.5298622846603394} -08/30/2021 23:05:25 - INFO - __main__ - Step 54820: {'lr': 0.00035865326827084224, 'samples': 10525440, 'steps': 54819, 'loss/train': 0.06545507907867432} -08/30/2021 23:05:26 - INFO - __main__ - Step 54821: {'lr': 0.00035864848890072864, 'samples': 10525632, 'steps': 54820, 'loss/train': 1.5919142961502075} -08/30/2021 23:05:26 - INFO - __main__ - Step 54822: {'lr': 0.0003586437094816598, 'samples': 10525824, 'steps': 54821, 'loss/train': 1.3524130582809448} -08/30/2021 23:05:28 - INFO - __main__ - Step 54823: {'lr': 0.00035863893001363776, 'samples': 10526016, 'steps': 54822, 'loss/train': 1.1815134286880493} -08/30/2021 23:05:28 - INFO - __main__ - Step 54824: {'lr': 0.0003586341504966647, 'samples': 10526208, 'steps': 54823, 'loss/train': 1.728411078453064} -08/30/2021 23:05:28 - INFO - __main__ - Step 54825: {'lr': 0.00035862937093074273, 'samples': 10526400, 'steps': 54824, 'loss/train': 1.0831817388534546} -08/30/2021 23:05:29 - INFO - __main__ - Step 54826: {'lr': 0.000358624591315874, 'samples': 10526592, 'steps': 54825, 'loss/train': 1.2711889743804932} -08/30/2021 23:05:29 - INFO - __main__ - Step 54827: {'lr': 0.0003586198116520608, 'samples': 10526784, 'steps': 54826, 'loss/train': 1.3327785730361938} -08/30/2021 23:05:31 - INFO - __main__ - Step 54828: {'lr': 0.0003586150319393051, 'samples': 10526976, 'steps': 54827, 'loss/train': 1.2027246952056885} -08/30/2021 23:05:32 - INFO - __main__ - Step 54829: {'lr': 0.00035861025217760924, 'samples': 10527168, 'steps': 54828, 'loss/train': 0.3271122872829437} -08/30/2021 23:05:32 - INFO - __main__ - Step 54830: {'lr': 0.00035860547236697525, 'samples': 10527360, 'steps': 54829, 'loss/train': 0.8940494060516357} -08/30/2021 23:05:32 - INFO - __main__ - Step 54831: {'lr': 0.0003586006925074053, 'samples': 10527552, 'steps': 54830, 'loss/train': 0.4592224955558777} -08/30/2021 23:05:33 - INFO - __main__ - Step 54832: {'lr': 0.0003585959125989015, 'samples': 10527744, 'steps': 54831, 'loss/train': 0.039446692913770676} -08/30/2021 23:05:34 - INFO - __main__ - Step 54833: {'lr': 0.00035859113264146607, 'samples': 10527936, 'steps': 54832, 'loss/train': 1.3696197271347046} -08/30/2021 23:05:35 - INFO - __main__ - Step 54834: {'lr': 0.00035858635263510117, 'samples': 10528128, 'steps': 54833, 'loss/train': 0.044821009039878845} -08/30/2021 23:05:35 - INFO - __main__ - Step 54835: {'lr': 0.00035858157257980894, 'samples': 10528320, 'steps': 54834, 'loss/train': 2.080129861831665} -08/30/2021 23:05:36 - INFO - __main__ - Step 54836: {'lr': 0.0003585767924755916, 'samples': 10528512, 'steps': 54835, 'loss/train': 1.3405967950820923} -08/30/2021 23:05:36 - INFO - __main__ - Step 54837: {'lr': 0.0003585720123224512, 'samples': 10528704, 'steps': 54836, 'loss/train': 0.7504355311393738} -08/30/2021 23:05:38 - INFO - __main__ - Step 54838: {'lr': 0.00035856723212038987, 'samples': 10528896, 'steps': 54837, 'loss/train': 1.0238993167877197} -08/30/2021 23:05:38 - INFO - __main__ - Step 54839: {'lr': 0.0003585624518694098, 'samples': 10529088, 'steps': 54838, 'loss/train': 1.0686841011047363} -08/30/2021 23:05:39 - INFO - __main__ - Step 54840: {'lr': 0.00035855767156951323, 'samples': 10529280, 'steps': 54839, 'loss/train': 1.5319374799728394} -08/30/2021 23:05:39 - INFO - __main__ - Step 54841: {'lr': 0.0003585528912207022, 'samples': 10529472, 'steps': 54840, 'loss/train': 0.13145770132541656} -08/30/2021 23:05:39 - INFO - __main__ - Step 54842: {'lr': 0.0003585481108229789, 'samples': 10529664, 'steps': 54841, 'loss/train': 1.5246318578720093} -08/30/2021 23:05:41 - INFO - __main__ - Step 54843: {'lr': 0.0003585433303763456, 'samples': 10529856, 'steps': 54842, 'loss/train': 1.3429349660873413} -08/30/2021 23:05:41 - INFO - __main__ - Step 54844: {'lr': 0.0003585385498808043, 'samples': 10530048, 'steps': 54843, 'loss/train': 1.8032245635986328} -08/30/2021 23:05:42 - INFO - __main__ - Step 54845: {'lr': 0.00035853376933635717, 'samples': 10530240, 'steps': 54844, 'loss/train': 1.2749818563461304} -08/30/2021 23:05:42 - INFO - __main__ - Step 54846: {'lr': 0.0003585289887430064, 'samples': 10530432, 'steps': 54845, 'loss/train': 1.229638695716858} -08/30/2021 23:05:42 - INFO - __main__ - Step 54847: {'lr': 0.0003585242081007542, 'samples': 10530624, 'steps': 54846, 'loss/train': 0.7809693217277527} -08/30/2021 23:05:43 - INFO - __main__ - Step 54848: {'lr': 0.0003585194274096026, 'samples': 10530816, 'steps': 54847, 'loss/train': 1.448364019393921} -08/30/2021 23:05:44 - INFO - __main__ - Step 54849: {'lr': 0.00035851464666955383, 'samples': 10531008, 'steps': 54848, 'loss/train': 0.1762140840291977} -08/30/2021 23:05:45 - INFO - __main__ - Step 54850: {'lr': 0.0003585098658806101, 'samples': 10531200, 'steps': 54849, 'loss/train': 0.20571884512901306} -08/30/2021 23:05:45 - INFO - __main__ - Step 54851: {'lr': 0.00035850508504277345, 'samples': 10531392, 'steps': 54850, 'loss/train': 1.350258469581604} -08/30/2021 23:05:45 - INFO - __main__ - Step 54852: {'lr': 0.0003585003041560461, 'samples': 10531584, 'steps': 54851, 'loss/train': 0.23520395159721375} -08/30/2021 23:05:46 - INFO - __main__ - Step 54853: {'lr': 0.00035849552322043016, 'samples': 10531776, 'steps': 54852, 'loss/train': 1.3796825408935547} -08/30/2021 23:05:47 - INFO - __main__ - Step 54854: {'lr': 0.0003584907422359278, 'samples': 10531968, 'steps': 54853, 'loss/train': 1.9507673978805542} -08/30/2021 23:05:48 - INFO - __main__ - Step 54855: {'lr': 0.00035848596120254125, 'samples': 10532160, 'steps': 54854, 'loss/train': 1.103347659111023} -08/30/2021 23:05:48 - INFO - __main__ - Step 54856: {'lr': 0.0003584811801202726, 'samples': 10532352, 'steps': 54855, 'loss/train': 1.323451042175293} -08/30/2021 23:05:49 - INFO - __main__ - Step 54857: {'lr': 0.00035847639898912395, 'samples': 10532544, 'steps': 54856, 'loss/train': 1.736045241355896} -08/30/2021 23:05:49 - INFO - __main__ - Step 54858: {'lr': 0.00035847161780909746, 'samples': 10532736, 'steps': 54857, 'loss/train': 0.24536152184009552} -08/30/2021 23:05:50 - INFO - __main__ - Step 54859: {'lr': 0.0003584668365801954, 'samples': 10532928, 'steps': 54858, 'loss/train': 1.7416924238204956} -08/30/2021 23:05:51 - INFO - __main__ - Step 54860: {'lr': 0.00035846205530241985, 'samples': 10533120, 'steps': 54859, 'loss/train': 1.98043692111969} -08/30/2021 23:05:51 - INFO - __main__ - Step 54861: {'lr': 0.00035845727397577296, 'samples': 10533312, 'steps': 54860, 'loss/train': 1.6187208890914917} -08/30/2021 23:05:51 - INFO - __main__ - Step 54862: {'lr': 0.0003584524926002569, 'samples': 10533504, 'steps': 54861, 'loss/train': 1.2378475666046143} -08/30/2021 23:05:52 - INFO - __main__ - Step 54863: {'lr': 0.00035844771117587396, 'samples': 10533696, 'steps': 54862, 'loss/train': 1.2186185121536255} -08/30/2021 23:05:53 - INFO - __main__ - Step 54864: {'lr': 0.0003584429297026259, 'samples': 10533888, 'steps': 54863, 'loss/train': 1.3283289670944214} -08/30/2021 23:05:54 - INFO - __main__ - Step 54865: {'lr': 0.00035843814818051537, 'samples': 10534080, 'steps': 54864, 'loss/train': 1.1565790176391602} -08/30/2021 23:05:54 - INFO - __main__ - Step 54866: {'lr': 0.0003584333666095441, 'samples': 10534272, 'steps': 54865, 'loss/train': 1.7562763690948486} -08/30/2021 23:05:54 - INFO - __main__ - Step 54867: {'lr': 0.0003584285849897145, 'samples': 10534464, 'steps': 54866, 'loss/train': 1.3092586994171143} -08/30/2021 23:05:55 - INFO - __main__ - Step 54868: {'lr': 0.00035842380332102864, 'samples': 10534656, 'steps': 54867, 'loss/train': 0.49937012791633606} -08/30/2021 23:05:56 - INFO - __main__ - Step 54869: {'lr': 0.0003584190216034887, 'samples': 10534848, 'steps': 54868, 'loss/train': 1.8234986066818237} -08/30/2021 23:05:57 - INFO - __main__ - Step 54870: {'lr': 0.0003584142398370969, 'samples': 10535040, 'steps': 54869, 'loss/train': 1.2728663682937622} -08/30/2021 23:05:57 - INFO - __main__ - Step 54871: {'lr': 0.0003584094580218552, 'samples': 10535232, 'steps': 54870, 'loss/train': 0.6441253423690796} -08/30/2021 23:05:57 - INFO - __main__ - Step 54872: {'lr': 0.00035840467615776584, 'samples': 10535424, 'steps': 54871, 'loss/train': 1.3929755687713623} -08/30/2021 23:05:58 - INFO - __main__ - Step 54873: {'lr': 0.0003583998942448311, 'samples': 10535616, 'steps': 54872, 'loss/train': 1.5756875276565552} -08/30/2021 23:05:58 - INFO - __main__ - Step 54874: {'lr': 0.000358395112283053, 'samples': 10535808, 'steps': 54873, 'loss/train': 1.4279135465621948} -08/30/2021 23:06:00 - INFO - __main__ - Step 54875: {'lr': 0.00035839033027243374, 'samples': 10536000, 'steps': 54874, 'loss/train': 0.47282174229621887} -08/30/2021 23:06:00 - INFO - __main__ - Step 54876: {'lr': 0.0003583855482129755, 'samples': 10536192, 'steps': 54875, 'loss/train': 3.4893805980682373} -08/30/2021 23:06:01 - INFO - __main__ - Step 54877: {'lr': 0.0003583807661046804, 'samples': 10536384, 'steps': 54876, 'loss/train': 1.4225763082504272} -08/30/2021 23:06:01 - INFO - __main__ - Step 54878: {'lr': 0.0003583759839475506, 'samples': 10536576, 'steps': 54877, 'loss/train': 1.8133624792099} -08/30/2021 23:06:01 - INFO - __main__ - Step 54879: {'lr': 0.00035837120174158824, 'samples': 10536768, 'steps': 54878, 'loss/train': 1.230550765991211} -08/30/2021 23:06:03 - INFO - __main__ - Step 54880: {'lr': 0.00035836641948679544, 'samples': 10536960, 'steps': 54879, 'loss/train': 1.5679596662521362} -08/30/2021 23:06:03 - INFO - __main__ - Step 54881: {'lr': 0.0003583616371831745, 'samples': 10537152, 'steps': 54880, 'loss/train': 1.2508623600006104} -08/30/2021 23:06:03 - INFO - __main__ - Step 54882: {'lr': 0.0003583568548307274, 'samples': 10537344, 'steps': 54881, 'loss/train': 1.2757011651992798} -08/30/2021 23:06:04 - INFO - __main__ - Step 54883: {'lr': 0.0003583520724294564, 'samples': 10537536, 'steps': 54882, 'loss/train': 1.3630807399749756} -08/30/2021 23:06:04 - INFO - __main__ - Step 54884: {'lr': 0.0003583472899793636, 'samples': 10537728, 'steps': 54883, 'loss/train': 1.0713759660720825} -08/30/2021 23:06:06 - INFO - __main__ - Step 54885: {'lr': 0.0003583425074804512, 'samples': 10537920, 'steps': 54884, 'loss/train': 1.2241028547286987} -08/30/2021 23:06:07 - INFO - __main__ - Step 54886: {'lr': 0.0003583377249327213, 'samples': 10538112, 'steps': 54885, 'loss/train': 1.2938129901885986} -08/30/2021 23:06:07 - INFO - __main__ - Step 54887: {'lr': 0.00035833294233617626, 'samples': 10538304, 'steps': 54886, 'loss/train': 1.2591966390609741} -08/30/2021 23:06:07 - INFO - __main__ - Step 54888: {'lr': 0.0003583281596908179, 'samples': 10538496, 'steps': 54887, 'loss/train': 1.1956291198730469} -08/30/2021 23:06:08 - INFO - __main__ - Step 54889: {'lr': 0.00035832337699664865, 'samples': 10538688, 'steps': 54888, 'loss/train': 0.8087176084518433} -08/30/2021 23:06:08 - INFO - __main__ - Step 54890: {'lr': 0.0003583185942536704, 'samples': 10538880, 'steps': 54889, 'loss/train': 1.428797960281372} -08/30/2021 23:06:10 - INFO - __main__ - Step 54891: {'lr': 0.00035831381146188556, 'samples': 10539072, 'steps': 54890, 'loss/train': 1.2802742719650269} -08/30/2021 23:06:10 - INFO - __main__ - Step 54892: {'lr': 0.00035830902862129627, 'samples': 10539264, 'steps': 54891, 'loss/train': 1.5453442335128784} -08/30/2021 23:06:10 - INFO - __main__ - Step 54893: {'lr': 0.0003583042457319045, 'samples': 10539456, 'steps': 54892, 'loss/train': 1.4810283184051514} -08/30/2021 23:06:11 - INFO - __main__ - Step 54894: {'lr': 0.0003582994627937125, 'samples': 10539648, 'steps': 54893, 'loss/train': 1.3638290166854858} -08/30/2021 23:06:11 - INFO - __main__ - Step 54895: {'lr': 0.00035829467980672247, 'samples': 10539840, 'steps': 54894, 'loss/train': 0.5878710746765137} -08/30/2021 23:06:13 - INFO - __main__ - Step 54896: {'lr': 0.00035828989677093656, 'samples': 10540032, 'steps': 54895, 'loss/train': 1.2077194452285767} -08/30/2021 23:06:13 - INFO - __main__ - Step 54897: {'lr': 0.00035828511368635684, 'samples': 10540224, 'steps': 54896, 'loss/train': 1.7178305387496948} -08/30/2021 23:06:14 - INFO - __main__ - Step 54898: {'lr': 0.0003582803305529856, 'samples': 10540416, 'steps': 54897, 'loss/train': 1.2981431484222412} -08/30/2021 23:06:14 - INFO - __main__ - Step 54899: {'lr': 0.0003582755473708248, 'samples': 10540608, 'steps': 54898, 'loss/train': 2.0900206565856934} -08/30/2021 23:06:14 - INFO - __main__ - Step 54900: {'lr': 0.00035827076413987675, 'samples': 10540800, 'steps': 54899, 'loss/train': 0.36701083183288574} -08/30/2021 23:06:16 - INFO - __main__ - Step 54901: {'lr': 0.00035826598086014357, 'samples': 10540992, 'steps': 54900, 'loss/train': 1.1260123252868652} -08/30/2021 23:06:16 - INFO - __main__ - Step 54902: {'lr': 0.0003582611975316274, 'samples': 10541184, 'steps': 54901, 'loss/train': 1.3970805406570435} -08/30/2021 23:06:16 - INFO - __main__ - Step 54903: {'lr': 0.00035825641415433045, 'samples': 10541376, 'steps': 54902, 'loss/train': 0.8591406345367432} -08/30/2021 23:06:17 - INFO - __main__ - Step 54904: {'lr': 0.0003582516307282548, 'samples': 10541568, 'steps': 54903, 'loss/train': 1.7223007678985596} -08/30/2021 23:06:17 - INFO - __main__ - Step 54905: {'lr': 0.00035824684725340263, 'samples': 10541760, 'steps': 54904, 'loss/train': 1.793871521949768} -08/30/2021 23:06:18 - INFO - __main__ - Step 54906: {'lr': 0.00035824206372977606, 'samples': 10541952, 'steps': 54905, 'loss/train': 1.8346998691558838} -08/30/2021 23:06:19 - INFO - __main__ - Step 54907: {'lr': 0.00035823728015737735, 'samples': 10542144, 'steps': 54906, 'loss/train': 1.0726392269134521} -08/30/2021 23:06:20 - INFO - __main__ - Step 54908: {'lr': 0.0003582324965362086, 'samples': 10542336, 'steps': 54907, 'loss/train': 1.670105218887329} -08/30/2021 23:06:20 - INFO - __main__ - Step 54909: {'lr': 0.0003582277128662719, 'samples': 10542528, 'steps': 54908, 'loss/train': 1.3964343070983887} -08/30/2021 23:06:20 - INFO - __main__ - Step 54910: {'lr': 0.00035822292914756954, 'samples': 10542720, 'steps': 54909, 'loss/train': 5.732332706451416} -08/30/2021 23:06:21 - INFO - __main__ - Step 54911: {'lr': 0.00035821814538010356, 'samples': 10542912, 'steps': 54910, 'loss/train': 1.5952101945877075} -08/30/2021 23:06:21 - INFO - __main__ - Step 54912: {'lr': 0.00035821336156387614, 'samples': 10543104, 'steps': 54911, 'loss/train': 1.186787724494934} -08/30/2021 23:06:23 - INFO - __main__ - Step 54913: {'lr': 0.00035820857769888943, 'samples': 10543296, 'steps': 54912, 'loss/train': 1.4470399618148804} -08/30/2021 23:06:23 - INFO - __main__ - Step 54914: {'lr': 0.0003582037937851456, 'samples': 10543488, 'steps': 54913, 'loss/train': 1.3439602851867676} -08/30/2021 23:06:24 - INFO - __main__ - Step 54915: {'lr': 0.00035819900982264684, 'samples': 10543680, 'steps': 54914, 'loss/train': 0.03276611492037773} -08/30/2021 23:06:24 - INFO - __main__ - Step 54916: {'lr': 0.0003581942258113953, 'samples': 10543872, 'steps': 54915, 'loss/train': 0.13259555399417877} -08/30/2021 23:06:24 - INFO - __main__ - Step 54917: {'lr': 0.00035818944175139314, 'samples': 10544064, 'steps': 54916, 'loss/train': 1.2883217334747314} -08/30/2021 23:06:25 - INFO - __main__ - Step 54918: {'lr': 0.0003581846576426423, 'samples': 10544256, 'steps': 54917, 'loss/train': 2.121966600418091} -08/30/2021 23:06:26 - INFO - __main__ - Step 54919: {'lr': 0.0003581798734851453, 'samples': 10544448, 'steps': 54918, 'loss/train': 1.3454232215881348} -08/30/2021 23:06:27 - INFO - __main__ - Step 54920: {'lr': 0.00035817508927890406, 'samples': 10544640, 'steps': 54919, 'loss/train': 0.8300412893295288} -08/30/2021 23:06:27 - INFO - __main__ - Step 54921: {'lr': 0.00035817030502392083, 'samples': 10544832, 'steps': 54920, 'loss/train': 0.5394120812416077} -08/30/2021 23:06:27 - INFO - __main__ - Step 54922: {'lr': 0.0003581655207201977, 'samples': 10545024, 'steps': 54921, 'loss/train': 1.1002658605575562} -08/30/2021 23:06:28 - INFO - __main__ - Step 54923: {'lr': 0.00035816073636773686, 'samples': 10545216, 'steps': 54922, 'loss/train': 1.1501874923706055} -08/30/2021 23:06:29 - INFO - __main__ - Step 54924: {'lr': 0.0003581559519665405, 'samples': 10545408, 'steps': 54923, 'loss/train': 1.3494172096252441} -08/30/2021 23:06:30 - INFO - __main__ - Step 54925: {'lr': 0.0003581511675166107, 'samples': 10545600, 'steps': 54924, 'loss/train': 0.944462239742279} -08/30/2021 23:06:30 - INFO - __main__ - Step 54926: {'lr': 0.00035814638301794966, 'samples': 10545792, 'steps': 54925, 'loss/train': 1.0862692594528198} -08/30/2021 23:06:30 - INFO - __main__ - Step 54927: {'lr': 0.0003581415984705595, 'samples': 10545984, 'steps': 54926, 'loss/train': 1.0773601531982422} -08/30/2021 23:06:31 - INFO - __main__ - Step 54928: {'lr': 0.0003581368138744424, 'samples': 10546176, 'steps': 54927, 'loss/train': 1.6194422245025635} -08/30/2021 23:06:32 - INFO - __main__ - Step 54929: {'lr': 0.00035813202922960056, 'samples': 10546368, 'steps': 54928, 'loss/train': 1.0069372653961182} -08/30/2021 23:06:33 - INFO - __main__ - Step 54930: {'lr': 0.00035812724453603614, 'samples': 10546560, 'steps': 54929, 'loss/train': 1.9901037216186523} -08/30/2021 23:06:33 - INFO - __main__ - Step 54931: {'lr': 0.00035812245979375114, 'samples': 10546752, 'steps': 54930, 'loss/train': 1.2745238542556763} -08/30/2021 23:06:33 - INFO - __main__ - Step 54932: {'lr': 0.0003581176750027479, 'samples': 10546944, 'steps': 54931, 'loss/train': 1.440755009651184} -08/30/2021 23:06:34 - INFO - __main__ - Step 54933: {'lr': 0.00035811289016302847, 'samples': 10547136, 'steps': 54932, 'loss/train': 1.6475715637207031} -08/30/2021 23:06:35 - INFO - __main__ - Step 54934: {'lr': 0.000358108105274595, 'samples': 10547328, 'steps': 54933, 'loss/train': 1.3965115547180176} -08/30/2021 23:06:36 - INFO - __main__ - Step 54935: {'lr': 0.0003581033203374498, 'samples': 10547520, 'steps': 54934, 'loss/train': 1.4318008422851562} -08/30/2021 23:06:36 - INFO - __main__ - Step 54936: {'lr': 0.0003580985353515948, 'samples': 10547712, 'steps': 54935, 'loss/train': 0.05075906962156296} -08/30/2021 23:06:36 - INFO - __main__ - Step 54937: {'lr': 0.0003580937503170324, 'samples': 10547904, 'steps': 54936, 'loss/train': 1.081440806388855} -08/30/2021 23:06:37 - INFO - __main__ - Step 54938: {'lr': 0.00035808896523376456, 'samples': 10548096, 'steps': 54937, 'loss/train': 1.7787302732467651} -08/30/2021 23:06:37 - INFO - __main__ - Step 54939: {'lr': 0.00035808418010179345, 'samples': 10548288, 'steps': 54938, 'loss/train': 1.4462049007415771} -08/30/2021 23:06:39 - INFO - __main__ - Step 54940: {'lr': 0.0003580793949211213, 'samples': 10548480, 'steps': 54939, 'loss/train': 1.5302996635437012} -08/30/2021 23:06:39 - INFO - __main__ - Step 54941: {'lr': 0.00035807460969175027, 'samples': 10548672, 'steps': 54940, 'loss/train': 0.3005818724632263} -08/30/2021 23:06:39 - INFO - __main__ - Step 54942: {'lr': 0.0003580698244136825, 'samples': 10548864, 'steps': 54941, 'loss/train': 1.421354055404663} -08/30/2021 23:06:40 - INFO - __main__ - Step 54943: {'lr': 0.0003580650390869201, 'samples': 10549056, 'steps': 54942, 'loss/train': 1.8839118480682373} -08/30/2021 23:06:40 - INFO - __main__ - Step 54944: {'lr': 0.0003580602537114653, 'samples': 10549248, 'steps': 54943, 'loss/train': 1.4408870935440063} -08/30/2021 23:06:42 - INFO - __main__ - Step 54945: {'lr': 0.0003580554682873202, 'samples': 10549440, 'steps': 54944, 'loss/train': 0.9393563866615295} -08/30/2021 23:06:43 - INFO - __main__ - Step 54946: {'lr': 0.00035805068281448687, 'samples': 10549632, 'steps': 54945, 'loss/train': 1.4167850017547607} -08/30/2021 23:06:43 - INFO - __main__ - Step 54947: {'lr': 0.00035804589729296766, 'samples': 10549824, 'steps': 54946, 'loss/train': 1.6197949647903442} -08/30/2021 23:06:43 - INFO - __main__ - Step 54948: {'lr': 0.00035804111172276464, 'samples': 10550016, 'steps': 54947, 'loss/train': 1.4808942079544067} -08/30/2021 23:06:44 - INFO - __main__ - Step 54949: {'lr': 0.00035803632610388, 'samples': 10550208, 'steps': 54948, 'loss/train': 1.371775507926941} -08/30/2021 23:06:45 - INFO - __main__ - Step 54950: {'lr': 0.0003580315404363158, 'samples': 10550400, 'steps': 54949, 'loss/train': 1.5300039052963257} -08/30/2021 23:06:46 - INFO - __main__ - Step 54951: {'lr': 0.0003580267547200743, 'samples': 10550592, 'steps': 54950, 'loss/train': 1.7046653032302856} -08/30/2021 23:06:46 - INFO - __main__ - Step 54952: {'lr': 0.00035802196895515757, 'samples': 10550784, 'steps': 54951, 'loss/train': 2.027310371398926} -08/30/2021 23:06:46 - INFO - __main__ - Step 54953: {'lr': 0.00035801718314156785, 'samples': 10550976, 'steps': 54952, 'loss/train': 1.3124637603759766} -08/30/2021 23:06:47 - INFO - __main__ - Step 54954: {'lr': 0.00035801239727930716, 'samples': 10551168, 'steps': 54953, 'loss/train': 1.684937834739685} -08/30/2021 23:06:48 - INFO - __main__ - Step 54955: {'lr': 0.00035800761136837783, 'samples': 10551360, 'steps': 54954, 'loss/train': 1.320955753326416} -08/30/2021 23:06:49 - INFO - __main__ - Step 54956: {'lr': 0.0003580028254087819, 'samples': 10551552, 'steps': 54955, 'loss/train': 1.2315248250961304} -08/30/2021 23:06:49 - INFO - __main__ - Step 54957: {'lr': 0.00035799803940052163, 'samples': 10551744, 'steps': 54956, 'loss/train': 0.8882100582122803} -08/30/2021 23:06:50 - INFO - __main__ - Step 54958: {'lr': 0.00035799325334359906, 'samples': 10551936, 'steps': 54957, 'loss/train': 1.4985897541046143} -08/30/2021 23:06:50 - INFO - __main__ - Step 54959: {'lr': 0.00035798846723801635, 'samples': 10552128, 'steps': 54958, 'loss/train': 1.1715972423553467} -08/30/2021 23:06:51 - INFO - __main__ - Step 54960: {'lr': 0.0003579836810837758, 'samples': 10552320, 'steps': 54959, 'loss/train': 0.6490328311920166} -08/30/2021 23:06:52 - INFO - __main__ - Step 54961: {'lr': 0.0003579788948808794, 'samples': 10552512, 'steps': 54960, 'loss/train': 1.6627075672149658} -08/30/2021 23:06:52 - INFO - __main__ - Step 54962: {'lr': 0.0003579741086293294, 'samples': 10552704, 'steps': 54961, 'loss/train': 1.0530335903167725} -08/30/2021 23:06:52 - INFO - __main__ - Step 54963: {'lr': 0.00035796932232912793, 'samples': 10552896, 'steps': 54962, 'loss/train': 1.2151793241500854} -08/30/2021 23:06:53 - INFO - __main__ - Step 54964: {'lr': 0.00035796453598027725, 'samples': 10553088, 'steps': 54963, 'loss/train': 1.501438856124878} -08/30/2021 23:06:55 - INFO - __main__ - Step 54965: {'lr': 0.0003579597495827793, 'samples': 10553280, 'steps': 54964, 'loss/train': 1.1869953870773315} -08/30/2021 23:06:55 - INFO - __main__ - Step 54966: {'lr': 0.0003579549631366363, 'samples': 10553472, 'steps': 54965, 'loss/train': 1.5104602575302124} -08/30/2021 23:06:55 - INFO - __main__ - Step 54967: {'lr': 0.0003579501766418505, 'samples': 10553664, 'steps': 54966, 'loss/train': 0.08363619446754456} -08/30/2021 23:06:56 - INFO - __main__ - Step 54968: {'lr': 0.0003579453900984241, 'samples': 10553856, 'steps': 54967, 'loss/train': 1.1528701782226562} -08/30/2021 23:06:56 - INFO - __main__ - Step 54969: {'lr': 0.0003579406035063591, 'samples': 10554048, 'steps': 54968, 'loss/train': 1.2789623737335205} -08/30/2021 23:06:58 - INFO - __main__ - Step 54970: {'lr': 0.0003579358168656577, 'samples': 10554240, 'steps': 54969, 'loss/train': 1.9498343467712402} -08/30/2021 23:06:58 - INFO - __main__ - Step 54971: {'lr': 0.00035793103017632224, 'samples': 10554432, 'steps': 54970, 'loss/train': 0.9954383969306946} -08/30/2021 23:06:58 - INFO - __main__ - Step 54972: {'lr': 0.0003579262434383546, 'samples': 10554624, 'steps': 54971, 'loss/train': 1.353716254234314} -08/30/2021 23:06:59 - INFO - __main__ - Step 54973: {'lr': 0.0003579214566517571, 'samples': 10554816, 'steps': 54972, 'loss/train': 1.2005674839019775} -08/30/2021 23:06:59 - INFO - __main__ - Step 54974: {'lr': 0.00035791666981653184, 'samples': 10555008, 'steps': 54973, 'loss/train': 1.0817415714263916} -08/30/2021 23:06:59 - INFO - __main__ - Step 54975: {'lr': 0.00035791188293268094, 'samples': 10555200, 'steps': 54974, 'loss/train': 0.9809725284576416} -08/30/2021 23:07:01 - INFO - __main__ - Step 54976: {'lr': 0.00035790709600020667, 'samples': 10555392, 'steps': 54975, 'loss/train': 1.1118978261947632} -08/30/2021 23:07:02 - INFO - __main__ - Step 54977: {'lr': 0.00035790230901911114, 'samples': 10555584, 'steps': 54976, 'loss/train': 0.5985836386680603} -08/30/2021 23:07:02 - INFO - __main__ - Step 54978: {'lr': 0.00035789752198939646, 'samples': 10555776, 'steps': 54977, 'loss/train': 1.522956371307373} -08/30/2021 23:07:02 - INFO - __main__ - Step 54979: {'lr': 0.00035789273491106485, 'samples': 10555968, 'steps': 54978, 'loss/train': 1.1329950094223022} -08/30/2021 23:07:03 - INFO - __main__ - Step 54980: {'lr': 0.00035788794778411837, 'samples': 10556160, 'steps': 54979, 'loss/train': 1.0635946989059448} -08/30/2021 23:07:04 - INFO - __main__ - Step 54981: {'lr': 0.0003578831606085593, 'samples': 10556352, 'steps': 54980, 'loss/train': 1.4733490943908691} -08/30/2021 23:07:04 - INFO - __main__ - Step 54982: {'lr': 0.00035787837338438976, 'samples': 10556544, 'steps': 54981, 'loss/train': 1.2858651876449585} -08/30/2021 23:07:05 - INFO - __main__ - Step 54983: {'lr': 0.00035787358611161186, 'samples': 10556736, 'steps': 54982, 'loss/train': 1.5461442470550537} -08/30/2021 23:07:05 - INFO - __main__ - Step 54984: {'lr': 0.0003578687987902278, 'samples': 10556928, 'steps': 54983, 'loss/train': 1.275929570198059} -08/30/2021 23:07:06 - INFO - __main__ - Step 54985: {'lr': 0.00035786401142023975, 'samples': 10557120, 'steps': 54984, 'loss/train': 1.9827232360839844} -08/30/2021 23:07:07 - INFO - __main__ - Step 54986: {'lr': 0.00035785922400164983, 'samples': 10557312, 'steps': 54985, 'loss/train': 0.40761321783065796} -08/30/2021 23:07:07 - INFO - __main__ - Step 54987: {'lr': 0.00035785443653446017, 'samples': 10557504, 'steps': 54986, 'loss/train': 1.1394426822662354} -08/30/2021 23:07:08 - INFO - __main__ - Step 54988: {'lr': 0.000357849649018673, 'samples': 10557696, 'steps': 54987, 'loss/train': 1.377744197845459} -08/30/2021 23:07:08 - INFO - __main__ - Step 54989: {'lr': 0.0003578448614542904, 'samples': 10557888, 'steps': 54988, 'loss/train': 3.8520419597625732} -08/30/2021 23:07:09 - INFO - __main__ - Step 54990: {'lr': 0.0003578400738413146, 'samples': 10558080, 'steps': 54989, 'loss/train': 1.7007616758346558} -08/30/2021 23:07:09 - INFO - __main__ - Step 54991: {'lr': 0.00035783528617974774, 'samples': 10558272, 'steps': 54990, 'loss/train': 1.5789684057235718} -08/30/2021 23:07:10 - INFO - __main__ - Step 54992: {'lr': 0.000357830498469592, 'samples': 10558464, 'steps': 54991, 'loss/train': 1.027137279510498} -08/30/2021 23:07:11 - INFO - __main__ - Step 54993: {'lr': 0.0003578257107108494, 'samples': 10558656, 'steps': 54992, 'loss/train': 1.401201605796814} -08/30/2021 23:07:11 - INFO - __main__ - Step 54994: {'lr': 0.0003578209229035222, 'samples': 10558848, 'steps': 54993, 'loss/train': 0.49661901593208313} -08/30/2021 23:07:12 - INFO - __main__ - Step 54995: {'lr': 0.0003578161350476127, 'samples': 10559040, 'steps': 54994, 'loss/train': 1.6620147228240967} -08/30/2021 23:07:12 - INFO - __main__ - Step 54996: {'lr': 0.00035781134714312277, 'samples': 10559232, 'steps': 54995, 'loss/train': 1.3671543598175049} -08/30/2021 23:07:14 - INFO - __main__ - Step 54997: {'lr': 0.0003578065591900548, 'samples': 10559424, 'steps': 54996, 'loss/train': 1.5685914754867554} -08/30/2021 23:07:15 - INFO - __main__ - Step 54998: {'lr': 0.0003578017711884108, 'samples': 10559616, 'steps': 54997, 'loss/train': 1.2992208003997803} -08/30/2021 23:07:15 - INFO - __main__ - Step 54999: {'lr': 0.000357796983138193, 'samples': 10559808, 'steps': 54998, 'loss/train': 2.0973896980285645} -08/30/2021 23:07:15 - INFO - __main__ - Step 55000: {'lr': 0.0003577921950394035, 'samples': 10560000, 'steps': 54999, 'loss/train': 1.237603783607483} -08/30/2021 23:07:16 - INFO - __main__ - Step 55001: {'lr': 0.00035778740689204456, 'samples': 10560192, 'steps': 55000, 'loss/train': 1.12308669090271} -08/30/2021 23:07:18 - INFO - __main__ - Step 55002: {'lr': 0.0003577826186961183, 'samples': 10560384, 'steps': 55001, 'loss/train': 1.4274318218231201} -08/30/2021 23:07:18 - INFO - __main__ - Step 55003: {'lr': 0.0003577778304516268, 'samples': 10560576, 'steps': 55002, 'loss/train': 1.2917907238006592} -08/30/2021 23:07:18 - INFO - __main__ - Step 55004: {'lr': 0.0003577730421585723, 'samples': 10560768, 'steps': 55003, 'loss/train': 1.1044116020202637} -08/30/2021 23:07:19 - INFO - __main__ - Step 55005: {'lr': 0.00035776825381695693, 'samples': 10560960, 'steps': 55004, 'loss/train': 0.7519664764404297} -08/30/2021 23:07:19 - INFO - __main__ - Step 55006: {'lr': 0.0003577634654267828, 'samples': 10561152, 'steps': 55005, 'loss/train': 1.126876711845398} -08/30/2021 23:07:19 - INFO - __main__ - Step 55007: {'lr': 0.0003577586769880522, 'samples': 10561344, 'steps': 55006, 'loss/train': 0.052810702472925186} -08/30/2021 23:07:21 - INFO - __main__ - Step 55008: {'lr': 0.00035775388850076714, 'samples': 10561536, 'steps': 55007, 'loss/train': 0.6534317135810852} -08/30/2021 23:07:21 - INFO - __main__ - Step 55009: {'lr': 0.0003577490999649298, 'samples': 10561728, 'steps': 55008, 'loss/train': 1.0166409015655518} -08/30/2021 23:07:22 - INFO - __main__ - Step 55010: {'lr': 0.0003577443113805425, 'samples': 10561920, 'steps': 55009, 'loss/train': 1.301195740699768} -08/30/2021 23:07:22 - INFO - __main__ - Step 55011: {'lr': 0.00035773952274760723, 'samples': 10562112, 'steps': 55010, 'loss/train': 1.6746796369552612} -08/30/2021 23:07:22 - INFO - __main__ - Step 55012: {'lr': 0.00035773473406612615, 'samples': 10562304, 'steps': 55011, 'loss/train': 1.20713472366333} -08/30/2021 23:07:24 - INFO - __main__ - Step 55013: {'lr': 0.0003577299453361015, 'samples': 10562496, 'steps': 55012, 'loss/train': 0.48610928654670715} -08/30/2021 23:07:25 - INFO - __main__ - Step 55014: {'lr': 0.00035772515655753536, 'samples': 10562688, 'steps': 55013, 'loss/train': 0.7487718462944031} -08/30/2021 23:07:25 - INFO - __main__ - Step 55015: {'lr': 0.00035772036773042994, 'samples': 10562880, 'steps': 55014, 'loss/train': 1.2261285781860352} -08/30/2021 23:07:26 - INFO - __main__ - Step 55016: {'lr': 0.00035771557885478744, 'samples': 10563072, 'steps': 55015, 'loss/train': 0.030547644942998886} -08/30/2021 23:07:26 - INFO - __main__ - Step 55017: {'lr': 0.0003577107899306099, 'samples': 10563264, 'steps': 55016, 'loss/train': 0.028325550258159637} -08/30/2021 23:07:26 - INFO - __main__ - Step 55018: {'lr': 0.00035770600095789957, 'samples': 10563456, 'steps': 55017, 'loss/train': 1.2087516784667969} -08/30/2021 23:07:28 - INFO - __main__ - Step 55019: {'lr': 0.0003577012119366586, 'samples': 10563648, 'steps': 55018, 'loss/train': 1.76043701171875} -08/30/2021 23:07:29 - INFO - __main__ - Step 55020: {'lr': 0.00035769642286688903, 'samples': 10563840, 'steps': 55019, 'loss/train': 1.0970418453216553} -08/30/2021 23:07:29 - INFO - __main__ - Step 55021: {'lr': 0.00035769163374859325, 'samples': 10564032, 'steps': 55020, 'loss/train': 0.07455174624919891} -08/30/2021 23:07:29 - INFO - __main__ - Step 55022: {'lr': 0.0003576868445817732, 'samples': 10564224, 'steps': 55021, 'loss/train': 1.4707401990890503} -08/30/2021 23:07:30 - INFO - __main__ - Step 55023: {'lr': 0.0003576820553664311, 'samples': 10564416, 'steps': 55022, 'loss/train': 0.24428652226924896} -08/30/2021 23:07:31 - INFO - __main__ - Step 55024: {'lr': 0.0003576772661025691, 'samples': 10564608, 'steps': 55023, 'loss/train': 1.034194827079773} -08/30/2021 23:07:32 - INFO - __main__ - Step 55025: {'lr': 0.0003576724767901895, 'samples': 10564800, 'steps': 55024, 'loss/train': 1.277866005897522} -08/30/2021 23:07:32 - INFO - __main__ - Step 55026: {'lr': 0.00035766768742929436, 'samples': 10564992, 'steps': 55025, 'loss/train': 0.9819884896278381} -08/30/2021 23:07:32 - INFO - __main__ - Step 55027: {'lr': 0.00035766289801988574, 'samples': 10565184, 'steps': 55026, 'loss/train': 1.26042640209198} -08/30/2021 23:07:33 - INFO - __main__ - Step 55028: {'lr': 0.00035765810856196585, 'samples': 10565376, 'steps': 55027, 'loss/train': 1.7677744626998901} -08/30/2021 23:07:33 - INFO - __main__ - Step 55029: {'lr': 0.00035765331905553686, 'samples': 10565568, 'steps': 55028, 'loss/train': 1.4031389951705933} -08/30/2021 23:07:35 - INFO - __main__ - Step 55030: {'lr': 0.000357648529500601, 'samples': 10565760, 'steps': 55029, 'loss/train': 1.2488181591033936} -08/30/2021 23:07:35 - INFO - __main__ - Step 55031: {'lr': 0.00035764373989716035, 'samples': 10565952, 'steps': 55030, 'loss/train': 1.5468528270721436} -08/30/2021 23:07:35 - INFO - __main__ - Step 55032: {'lr': 0.0003576389502452172, 'samples': 10566144, 'steps': 55031, 'loss/train': 1.3943970203399658} -08/30/2021 23:07:36 - INFO - __main__ - Step 55033: {'lr': 0.0003576341605447735, 'samples': 10566336, 'steps': 55032, 'loss/train': 1.2777832746505737} -08/30/2021 23:07:36 - INFO - __main__ - Step 55034: {'lr': 0.0003576293707958315, 'samples': 10566528, 'steps': 55033, 'loss/train': 1.7076354026794434} -08/30/2021 23:07:38 - INFO - __main__ - Step 55035: {'lr': 0.0003576245809983934, 'samples': 10566720, 'steps': 55034, 'loss/train': 1.0923969745635986} -08/30/2021 23:07:38 - INFO - __main__ - Step 55036: {'lr': 0.0003576197911524613, 'samples': 10566912, 'steps': 55035, 'loss/train': 0.9455087780952454} -08/30/2021 23:07:38 - INFO - __main__ - Step 55037: {'lr': 0.0003576150012580374, 'samples': 10567104, 'steps': 55036, 'loss/train': 0.31596988439559937} -08/30/2021 23:07:39 - INFO - __main__ - Step 55038: {'lr': 0.00035761021131512383, 'samples': 10567296, 'steps': 55037, 'loss/train': 1.116105556488037} -08/30/2021 23:07:39 - INFO - __main__ - Step 55039: {'lr': 0.00035760542132372275, 'samples': 10567488, 'steps': 55038, 'loss/train': 1.5040106773376465} -08/30/2021 23:07:41 - INFO - __main__ - Step 55040: {'lr': 0.00035760063128383637, 'samples': 10567680, 'steps': 55039, 'loss/train': 1.1676915884017944} -08/30/2021 23:07:41 - INFO - __main__ - Step 55041: {'lr': 0.0003575958411954668, 'samples': 10567872, 'steps': 55040, 'loss/train': 1.7205227613449097} -08/30/2021 23:07:41 - INFO - __main__ - Step 55042: {'lr': 0.00035759105105861614, 'samples': 10568064, 'steps': 55041, 'loss/train': 0.3357863426208496} -08/30/2021 23:07:42 - INFO - __main__ - Step 55043: {'lr': 0.00035758626087328664, 'samples': 10568256, 'steps': 55042, 'loss/train': 1.2908999919891357} -08/30/2021 23:07:42 - INFO - __main__ - Step 55044: {'lr': 0.00035758147063948056, 'samples': 10568448, 'steps': 55043, 'loss/train': 1.5278897285461426} -08/30/2021 23:07:44 - INFO - __main__ - Step 55045: {'lr': 0.00035757668035719974, 'samples': 10568640, 'steps': 55044, 'loss/train': 1.9774776697158813} -08/30/2021 23:07:44 - INFO - __main__ - Step 55046: {'lr': 0.00035757189002644664, 'samples': 10568832, 'steps': 55045, 'loss/train': 1.4386043548583984} -08/30/2021 23:07:44 - INFO - __main__ - Step 55047: {'lr': 0.00035756709964722324, 'samples': 10569024, 'steps': 55046, 'loss/train': 0.4118565320968628} -08/30/2021 23:07:45 - INFO - __main__ - Step 55048: {'lr': 0.00035756230921953183, 'samples': 10569216, 'steps': 55047, 'loss/train': 1.394034504890442} -08/30/2021 23:07:45 - INFO - __main__ - Step 55049: {'lr': 0.0003575575187433744, 'samples': 10569408, 'steps': 55048, 'loss/train': 1.6256165504455566} -08/30/2021 23:07:47 - INFO - __main__ - Step 55050: {'lr': 0.0003575527282187533, 'samples': 10569600, 'steps': 55049, 'loss/train': 1.8410624265670776} -08/30/2021 23:07:47 - INFO - __main__ - Step 55051: {'lr': 0.00035754793764567063, 'samples': 10569792, 'steps': 55050, 'loss/train': 0.6237562894821167} -08/30/2021 23:07:48 - INFO - __main__ - Step 55052: {'lr': 0.0003575431470241285, 'samples': 10569984, 'steps': 55051, 'loss/train': 0.8426141142845154} -08/30/2021 23:07:48 - INFO - __main__ - Step 55053: {'lr': 0.000357538356354129, 'samples': 10570176, 'steps': 55052, 'loss/train': 1.5356061458587646} -08/30/2021 23:07:48 - INFO - __main__ - Step 55054: {'lr': 0.0003575335656356744, 'samples': 10570368, 'steps': 55053, 'loss/train': 1.3171186447143555} -08/30/2021 23:07:49 - INFO - __main__ - Step 55055: {'lr': 0.0003575287748687669, 'samples': 10570560, 'steps': 55054, 'loss/train': 1.7285407781600952} -08/30/2021 23:07:51 - INFO - __main__ - Step 55056: {'lr': 0.0003575239840534086, 'samples': 10570752, 'steps': 55055, 'loss/train': 1.579219102859497} -08/30/2021 23:07:51 - INFO - __main__ - Step 55057: {'lr': 0.00035751919318960157, 'samples': 10570944, 'steps': 55056, 'loss/train': 1.2343171834945679} -08/30/2021 23:07:51 - INFO - __main__ - Step 55058: {'lr': 0.0003575144022773481, 'samples': 10571136, 'steps': 55057, 'loss/train': 1.174000859260559} -08/30/2021 23:07:52 - INFO - __main__ - Step 55059: {'lr': 0.00035750961131665034, 'samples': 10571328, 'steps': 55058, 'loss/train': 0.9515050053596497} -08/30/2021 23:07:52 - INFO - __main__ - Step 55060: {'lr': 0.0003575048203075103, 'samples': 10571520, 'steps': 55059, 'loss/train': 1.121878981590271} -08/30/2021 23:07:53 - INFO - __main__ - Step 55061: {'lr': 0.0003575000292499303, 'samples': 10571712, 'steps': 55060, 'loss/train': 0.8917629718780518} -08/30/2021 23:07:54 - INFO - __main__ - Step 55062: {'lr': 0.0003574952381439125, 'samples': 10571904, 'steps': 55061, 'loss/train': 0.8872008323669434} -08/30/2021 23:07:54 - INFO - __main__ - Step 55063: {'lr': 0.0003574904469894589, 'samples': 10572096, 'steps': 55062, 'loss/train': 1.0737521648406982} -08/30/2021 23:07:55 - INFO - __main__ - Step 55064: {'lr': 0.00035748565578657185, 'samples': 10572288, 'steps': 55063, 'loss/train': 1.4406421184539795} -08/30/2021 23:07:55 - INFO - __main__ - Step 55065: {'lr': 0.0003574808645352534, 'samples': 10572480, 'steps': 55064, 'loss/train': 1.4197230339050293} -08/30/2021 23:07:57 - INFO - __main__ - Step 55066: {'lr': 0.00035747607323550573, 'samples': 10572672, 'steps': 55065, 'loss/train': 1.5644071102142334} -08/30/2021 23:07:57 - INFO - __main__ - Step 55067: {'lr': 0.000357471281887331, 'samples': 10572864, 'steps': 55066, 'loss/train': 0.8464855551719666} -08/30/2021 23:07:58 - INFO - __main__ - Step 55068: {'lr': 0.0003574664904907314, 'samples': 10573056, 'steps': 55067, 'loss/train': 1.206516981124878} -08/30/2021 23:07:58 - INFO - __main__ - Step 55069: {'lr': 0.00035746169904570896, 'samples': 10573248, 'steps': 55068, 'loss/train': 0.5651645660400391} -08/30/2021 23:07:58 - INFO - __main__ - Step 55070: {'lr': 0.000357456907552266, 'samples': 10573440, 'steps': 55069, 'loss/train': 1.661095380783081} -08/30/2021 23:08:00 - INFO - __main__ - Step 55071: {'lr': 0.00035745211601040464, 'samples': 10573632, 'steps': 55070, 'loss/train': 1.5638982057571411} -08/30/2021 23:08:00 - INFO - __main__ - Step 55072: {'lr': 0.000357447324420127, 'samples': 10573824, 'steps': 55071, 'loss/train': 0.7424582839012146} -08/30/2021 23:08:00 - INFO - __main__ - Step 55073: {'lr': 0.00035744253278143526, 'samples': 10574016, 'steps': 55072, 'loss/train': 0.4229337275028229} -08/30/2021 23:08:01 - INFO - __main__ - Step 55074: {'lr': 0.0003574377410943315, 'samples': 10574208, 'steps': 55073, 'loss/train': 1.8057987689971924} -08/30/2021 23:08:01 - INFO - __main__ - Step 55075: {'lr': 0.00035743294935881804, 'samples': 10574400, 'steps': 55074, 'loss/train': 2.08233904838562} -08/30/2021 23:08:02 - INFO - __main__ - Step 55076: {'lr': 0.0003574281575748969, 'samples': 10574592, 'steps': 55075, 'loss/train': 1.3846652507781982} -08/30/2021 23:08:03 - INFO - __main__ - Step 55077: {'lr': 0.0003574233657425703, 'samples': 10574784, 'steps': 55076, 'loss/train': 1.3039796352386475} -08/30/2021 23:08:04 - INFO - __main__ - Step 55078: {'lr': 0.0003574185738618404, 'samples': 10574976, 'steps': 55077, 'loss/train': 0.7944549322128296} -08/30/2021 23:08:04 - INFO - __main__ - Step 55079: {'lr': 0.00035741378193270934, 'samples': 10575168, 'steps': 55078, 'loss/train': 1.7391003370285034} -08/30/2021 23:08:04 - INFO - __main__ - Step 55080: {'lr': 0.00035740898995517933, 'samples': 10575360, 'steps': 55079, 'loss/train': 1.6497116088867188} -08/30/2021 23:08:06 - INFO - __main__ - Step 55081: {'lr': 0.00035740419792925244, 'samples': 10575552, 'steps': 55080, 'loss/train': 1.5516760349273682} -08/30/2021 23:08:06 - INFO - __main__ - Step 55082: {'lr': 0.0003573994058549309, 'samples': 10575744, 'steps': 55081, 'loss/train': 1.091497540473938} -08/30/2021 23:08:07 - INFO - __main__ - Step 55083: {'lr': 0.00035739461373221677, 'samples': 10575936, 'steps': 55082, 'loss/train': 1.3975498676300049} -08/30/2021 23:08:07 - INFO - __main__ - Step 55084: {'lr': 0.00035738982156111233, 'samples': 10576128, 'steps': 55083, 'loss/train': 1.4310529232025146} -08/30/2021 23:08:07 - INFO - __main__ - Step 55085: {'lr': 0.0003573850293416198, 'samples': 10576320, 'steps': 55084, 'loss/train': 1.4916080236434937} -08/30/2021 23:08:08 - INFO - __main__ - Step 55086: {'lr': 0.00035738023707374114, 'samples': 10576512, 'steps': 55085, 'loss/train': 1.1713804006576538} -08/30/2021 23:08:09 - INFO - __main__ - Step 55087: {'lr': 0.0003573754447574785, 'samples': 10576704, 'steps': 55086, 'loss/train': 1.2049801349639893} -08/30/2021 23:08:10 - INFO - __main__ - Step 55088: {'lr': 0.0003573706523928343, 'samples': 10576896, 'steps': 55087, 'loss/train': 2.430856466293335} -08/30/2021 23:08:10 - INFO - __main__ - Step 55089: {'lr': 0.00035736585997981046, 'samples': 10577088, 'steps': 55088, 'loss/train': 1.8722506761550903} -08/30/2021 23:08:11 - INFO - __main__ - Step 55090: {'lr': 0.00035736106751840926, 'samples': 10577280, 'steps': 55089, 'loss/train': 0.03832166641950607} -08/30/2021 23:08:11 - INFO - __main__ - Step 55091: {'lr': 0.00035735627500863275, 'samples': 10577472, 'steps': 55090, 'loss/train': 1.4132860898971558} -08/30/2021 23:08:12 - INFO - __main__ - Step 55092: {'lr': 0.00035735148245048326, 'samples': 10577664, 'steps': 55091, 'loss/train': 1.1814210414886475} -08/30/2021 23:08:13 - INFO - __main__ - Step 55093: {'lr': 0.0003573466898439628, 'samples': 10577856, 'steps': 55092, 'loss/train': 0.3999745845794678} -08/30/2021 23:08:13 - INFO - __main__ - Step 55094: {'lr': 0.00035734189718907364, 'samples': 10578048, 'steps': 55093, 'loss/train': 1.448533058166504} -08/30/2021 23:08:14 - INFO - __main__ - Step 55095: {'lr': 0.00035733710448581773, 'samples': 10578240, 'steps': 55094, 'loss/train': 0.6460314989089966} -08/30/2021 23:08:14 - INFO - __main__ - Step 55096: {'lr': 0.0003573323117341975, 'samples': 10578432, 'steps': 55095, 'loss/train': 1.314246416091919} -08/30/2021 23:08:16 - INFO - __main__ - Step 55097: {'lr': 0.00035732751893421494, 'samples': 10578624, 'steps': 55096, 'loss/train': 1.3325467109680176} -08/30/2021 23:08:16 - INFO - __main__ - Step 55098: {'lr': 0.0003573227260858723, 'samples': 10578816, 'steps': 55097, 'loss/train': 0.9245617985725403} -08/30/2021 23:08:16 - INFO - __main__ - Step 55099: {'lr': 0.00035731793318917167, 'samples': 10579008, 'steps': 55098, 'loss/train': 1.5939275026321411} -08/30/2021 23:08:17 - INFO - __main__ - Step 55100: {'lr': 0.0003573131402441152, 'samples': 10579200, 'steps': 55099, 'loss/train': 1.321107268333435} -08/30/2021 23:08:17 - INFO - __main__ - Step 55101: {'lr': 0.0003573083472507051, 'samples': 10579392, 'steps': 55100, 'loss/train': 1.3674732446670532} -08/30/2021 23:08:19 - INFO - __main__ - Step 55102: {'lr': 0.00035730355420894355, 'samples': 10579584, 'steps': 55101, 'loss/train': 0.9711707830429077} -08/30/2021 23:08:20 - INFO - __main__ - Step 55103: {'lr': 0.00035729876111883265, 'samples': 10579776, 'steps': 55102, 'loss/train': 1.4389941692352295} -08/30/2021 23:08:20 - INFO - __main__ - Step 55104: {'lr': 0.0003572939679803746, 'samples': 10579968, 'steps': 55103, 'loss/train': 5.5494465827941895} -08/30/2021 23:08:20 - INFO - __main__ - Step 55105: {'lr': 0.00035728917479357154, 'samples': 10580160, 'steps': 55104, 'loss/train': 1.235867977142334} -08/30/2021 23:08:21 - INFO - __main__ - Step 55106: {'lr': 0.00035728438155842556, 'samples': 10580352, 'steps': 55105, 'loss/train': 1.4290612936019897} -08/30/2021 23:08:21 - INFO - __main__ - Step 55107: {'lr': 0.000357279588274939, 'samples': 10580544, 'steps': 55106, 'loss/train': 1.3626823425292969} -08/30/2021 23:08:21 - INFO - __main__ - Step 55108: {'lr': 0.00035727479494311387, 'samples': 10580736, 'steps': 55107, 'loss/train': 0.023736894130706787} -08/30/2021 23:08:23 - INFO - __main__ - Step 55109: {'lr': 0.0003572700015629524, 'samples': 10580928, 'steps': 55108, 'loss/train': 0.3429291844367981} -08/30/2021 23:08:24 - INFO - __main__ - Step 55110: {'lr': 0.0003572652081344566, 'samples': 10581120, 'steps': 55109, 'loss/train': 1.2814936637878418} -08/30/2021 23:08:24 - INFO - __main__ - Step 55111: {'lr': 0.00035726041465762885, 'samples': 10581312, 'steps': 55110, 'loss/train': 1.0668532848358154} -08/30/2021 23:08:25 - INFO - __main__ - Step 55112: {'lr': 0.0003572556211324713, 'samples': 10581504, 'steps': 55111, 'loss/train': 1.3139017820358276} -08/30/2021 23:08:25 - INFO - __main__ - Step 55113: {'lr': 0.0003572508275589859, 'samples': 10581696, 'steps': 55112, 'loss/train': 0.03465397283434868} -08/30/2021 23:08:26 - INFO - __main__ - Step 55114: {'lr': 0.00035724603393717493, 'samples': 10581888, 'steps': 55113, 'loss/train': 0.9880599975585938} -08/30/2021 23:08:27 - INFO - __main__ - Step 55115: {'lr': 0.00035724124026704064, 'samples': 10582080, 'steps': 55114, 'loss/train': 0.9760531187057495} -08/30/2021 23:08:27 - INFO - __main__ - Step 55116: {'lr': 0.000357236446548585, 'samples': 10582272, 'steps': 55115, 'loss/train': 1.3435084819793701} -08/30/2021 23:08:28 - INFO - __main__ - Step 55117: {'lr': 0.0003572316527818103, 'samples': 10582464, 'steps': 55116, 'loss/train': 0.9737823009490967} -08/30/2021 23:08:28 - INFO - __main__ - Step 55118: {'lr': 0.00035722685896671876, 'samples': 10582656, 'steps': 55117, 'loss/train': 0.9305632710456848} -08/30/2021 23:08:30 - INFO - __main__ - Step 55119: {'lr': 0.00035722206510331237, 'samples': 10582848, 'steps': 55118, 'loss/train': 1.0313795804977417} -08/30/2021 23:08:30 - INFO - __main__ - Step 55120: {'lr': 0.0003572172711915934, 'samples': 10583040, 'steps': 55119, 'loss/train': 1.3543974161148071} -08/30/2021 23:08:31 - INFO - __main__ - Step 55121: {'lr': 0.0003572124772315639, 'samples': 10583232, 'steps': 55120, 'loss/train': 0.037722066044807434} -08/30/2021 23:08:31 - INFO - __main__ - Step 55122: {'lr': 0.0003572076832232262, 'samples': 10583424, 'steps': 55121, 'loss/train': 0.018370719626545906} -08/30/2021 23:08:31 - INFO - __main__ - Step 55123: {'lr': 0.0003572028891665823, 'samples': 10583616, 'steps': 55122, 'loss/train': 1.138566255569458} -08/30/2021 23:08:32 - INFO - __main__ - Step 55124: {'lr': 0.00035719809506163454, 'samples': 10583808, 'steps': 55123, 'loss/train': 1.4620976448059082} -08/30/2021 23:08:33 - INFO - __main__ - Step 55125: {'lr': 0.0003571933009083849, 'samples': 10584000, 'steps': 55124, 'loss/train': 1.9055577516555786} -08/30/2021 23:08:34 - INFO - __main__ - Step 55126: {'lr': 0.00035718850670683565, 'samples': 10584192, 'steps': 55125, 'loss/train': 0.9276150465011597} -08/30/2021 23:08:34 - INFO - __main__ - Step 55127: {'lr': 0.00035718371245698887, 'samples': 10584384, 'steps': 55126, 'loss/train': 1.2083185911178589} -08/30/2021 23:08:34 - INFO - __main__ - Step 55128: {'lr': 0.0003571789181588468, 'samples': 10584576, 'steps': 55127, 'loss/train': 1.5655773878097534} -08/30/2021 23:08:35 - INFO - __main__ - Step 55129: {'lr': 0.00035717412381241153, 'samples': 10584768, 'steps': 55128, 'loss/train': 1.1169935464859009} -08/30/2021 23:08:36 - INFO - __main__ - Step 55130: {'lr': 0.00035716932941768525, 'samples': 10584960, 'steps': 55129, 'loss/train': 1.4624617099761963} -08/30/2021 23:08:37 - INFO - __main__ - Step 55131: {'lr': 0.0003571645349746702, 'samples': 10585152, 'steps': 55130, 'loss/train': 0.9173088073730469} -08/30/2021 23:08:37 - INFO - __main__ - Step 55132: {'lr': 0.00035715974048336843, 'samples': 10585344, 'steps': 55131, 'loss/train': 0.3494126796722412} -08/30/2021 23:08:37 - INFO - __main__ - Step 55133: {'lr': 0.0003571549459437821, 'samples': 10585536, 'steps': 55132, 'loss/train': 2.1418423652648926} -08/30/2021 23:08:38 - INFO - __main__ - Step 55134: {'lr': 0.00035715015135591346, 'samples': 10585728, 'steps': 55133, 'loss/train': 0.3453420400619507} -08/30/2021 23:08:39 - INFO - __main__ - Step 55135: {'lr': 0.0003571453567197645, 'samples': 10585920, 'steps': 55134, 'loss/train': 0.8115973472595215} -08/30/2021 23:08:40 - INFO - __main__ - Step 55136: {'lr': 0.0003571405620353376, 'samples': 10586112, 'steps': 55135, 'loss/train': 0.6397712826728821} -08/30/2021 23:08:40 - INFO - __main__ - Step 55137: {'lr': 0.00035713576730263475, 'samples': 10586304, 'steps': 55136, 'loss/train': 1.467289924621582} -08/30/2021 23:08:40 - INFO - __main__ - Step 55138: {'lr': 0.0003571309725216582, 'samples': 10586496, 'steps': 55137, 'loss/train': 1.0287584066390991} -08/30/2021 23:08:41 - INFO - __main__ - Step 55139: {'lr': 0.0003571261776924102, 'samples': 10586688, 'steps': 55138, 'loss/train': 1.2748109102249146} -08/30/2021 23:08:42 - INFO - __main__ - Step 55140: {'lr': 0.00035712138281489264, 'samples': 10586880, 'steps': 55139, 'loss/train': 1.642458200454712} -08/30/2021 23:08:43 - INFO - __main__ - Step 55141: {'lr': 0.0003571165878891079, 'samples': 10587072, 'steps': 55140, 'loss/train': 1.6107332706451416} -08/30/2021 23:08:43 - INFO - __main__ - Step 55142: {'lr': 0.00035711179291505806, 'samples': 10587264, 'steps': 55141, 'loss/train': 1.0473591089248657} -08/30/2021 23:08:43 - INFO - __main__ - Step 55143: {'lr': 0.0003571069978927453, 'samples': 10587456, 'steps': 55142, 'loss/train': 1.4788432121276855} -08/30/2021 23:08:44 - INFO - __main__ - Step 55144: {'lr': 0.00035710220282217175, 'samples': 10587648, 'steps': 55143, 'loss/train': 0.8276771903038025} -08/30/2021 23:08:45 - INFO - __main__ - Step 55145: {'lr': 0.0003570974077033397, 'samples': 10587840, 'steps': 55144, 'loss/train': 1.0953863859176636} -08/30/2021 23:08:46 - INFO - __main__ - Step 55146: {'lr': 0.00035709261253625115, 'samples': 10588032, 'steps': 55145, 'loss/train': 1.3230887651443481} -08/30/2021 23:08:46 - INFO - __main__ - Step 55147: {'lr': 0.00035708781732090835, 'samples': 10588224, 'steps': 55146, 'loss/train': 1.5432312488555908} -08/30/2021 23:08:46 - INFO - __main__ - Step 55148: {'lr': 0.00035708302205731334, 'samples': 10588416, 'steps': 55147, 'loss/train': 0.7514558434486389} -08/30/2021 23:08:47 - INFO - __main__ - Step 55149: {'lr': 0.00035707822674546847, 'samples': 10588608, 'steps': 55148, 'loss/train': 1.9047784805297852} -08/30/2021 23:08:48 - INFO - __main__ - Step 55150: {'lr': 0.00035707343138537584, 'samples': 10588800, 'steps': 55149, 'loss/train': 0.6529859304428101} -08/30/2021 23:08:49 - INFO - __main__ - Step 55151: {'lr': 0.00035706863597703746, 'samples': 10588992, 'steps': 55150, 'loss/train': 1.2995728254318237} -08/30/2021 23:08:49 - INFO - __main__ - Step 55152: {'lr': 0.00035706384052045567, 'samples': 10589184, 'steps': 55151, 'loss/train': 1.429237723350525} -08/30/2021 23:08:49 - INFO - __main__ - Step 55153: {'lr': 0.0003570590450156325, 'samples': 10589376, 'steps': 55152, 'loss/train': 1.0988893508911133} -08/30/2021 23:08:50 - INFO - __main__ - Step 55154: {'lr': 0.00035705424946257027, 'samples': 10589568, 'steps': 55153, 'loss/train': 1.1754755973815918} -08/30/2021 23:08:51 - INFO - __main__ - Step 55155: {'lr': 0.000357049453861271, 'samples': 10589760, 'steps': 55154, 'loss/train': 1.3264036178588867} -08/30/2021 23:08:52 - INFO - __main__ - Step 55156: {'lr': 0.00035704465821173695, 'samples': 10589952, 'steps': 55155, 'loss/train': 1.3289949893951416} -08/30/2021 23:08:52 - INFO - __main__ - Step 55157: {'lr': 0.00035703986251397015, 'samples': 10590144, 'steps': 55156, 'loss/train': 0.5880630016326904} -08/30/2021 23:08:52 - INFO - __main__ - Step 55158: {'lr': 0.00035703506676797284, 'samples': 10590336, 'steps': 55157, 'loss/train': 1.032106637954712} -08/30/2021 23:08:53 - INFO - __main__ - Step 55159: {'lr': 0.00035703027097374717, 'samples': 10590528, 'steps': 55158, 'loss/train': 2.063770055770874} -08/30/2021 23:08:53 - INFO - __main__ - Step 55160: {'lr': 0.00035702547513129533, 'samples': 10590720, 'steps': 55159, 'loss/train': 1.5039185285568237} -08/30/2021 23:08:54 - INFO - __main__ - Step 55161: {'lr': 0.0003570206792406195, 'samples': 10590912, 'steps': 55160, 'loss/train': 0.9168261885643005} -08/30/2021 23:08:55 - INFO - __main__ - Step 55162: {'lr': 0.0003570158833017219, 'samples': 10591104, 'steps': 55161, 'loss/train': 1.7124944925308228} -08/30/2021 23:08:55 - INFO - __main__ - Step 55163: {'lr': 0.0003570110873146044, 'samples': 10591296, 'steps': 55162, 'loss/train': 1.1841684579849243} -08/30/2021 23:08:56 - INFO - __main__ - Step 55164: {'lr': 0.0003570062912792694, 'samples': 10591488, 'steps': 55163, 'loss/train': 1.186103105545044} -08/30/2021 23:08:56 - INFO - __main__ - Step 55165: {'lr': 0.0003570014951957191, 'samples': 10591680, 'steps': 55164, 'loss/train': 1.5367989540100098} -08/30/2021 23:08:58 - INFO - __main__ - Step 55166: {'lr': 0.00035699669906395554, 'samples': 10591872, 'steps': 55165, 'loss/train': 2.0744001865386963} -08/30/2021 23:08:58 - INFO - __main__ - Step 55167: {'lr': 0.00035699190288398093, 'samples': 10592064, 'steps': 55166, 'loss/train': 1.5010182857513428} -08/30/2021 23:08:59 - INFO - __main__ - Step 55168: {'lr': 0.0003569871066557974, 'samples': 10592256, 'steps': 55167, 'loss/train': 0.8028724789619446} -08/30/2021 23:08:59 - INFO - __main__ - Step 55169: {'lr': 0.0003569823103794071, 'samples': 10592448, 'steps': 55168, 'loss/train': 1.589728832244873} -08/30/2021 23:08:59 - INFO - __main__ - Step 55170: {'lr': 0.0003569775140548122, 'samples': 10592640, 'steps': 55169, 'loss/train': 2.010615587234497} -08/30/2021 23:09:01 - INFO - __main__ - Step 55171: {'lr': 0.00035697271768201494, 'samples': 10592832, 'steps': 55170, 'loss/train': 1.6273012161254883} -08/30/2021 23:09:02 - INFO - __main__ - Step 55172: {'lr': 0.0003569679212610175, 'samples': 10593024, 'steps': 55171, 'loss/train': 1.2307910919189453} -08/30/2021 23:09:02 - INFO - __main__ - Step 55173: {'lr': 0.00035696312479182186, 'samples': 10593216, 'steps': 55172, 'loss/train': 0.07663355022668839} -08/30/2021 23:09:02 - INFO - __main__ - Step 55174: {'lr': 0.0003569583282744303, 'samples': 10593408, 'steps': 55173, 'loss/train': 1.1500461101531982} -08/30/2021 23:09:03 - INFO - __main__ - Step 55175: {'lr': 0.00035695353170884494, 'samples': 10593600, 'steps': 55174, 'loss/train': 1.2212440967559814} -08/30/2021 23:09:04 - INFO - __main__ - Step 55176: {'lr': 0.000356948735095068, 'samples': 10593792, 'steps': 55175, 'loss/train': 0.7729575634002686} -08/30/2021 23:09:05 - INFO - __main__ - Step 55177: {'lr': 0.0003569439384331016, 'samples': 10593984, 'steps': 55176, 'loss/train': 0.9950864911079407} -08/30/2021 23:09:05 - INFO - __main__ - Step 55178: {'lr': 0.00035693914172294796, 'samples': 10594176, 'steps': 55177, 'loss/train': 1.153062343597412} -08/30/2021 23:09:05 - INFO - __main__ - Step 55179: {'lr': 0.0003569343449646092, 'samples': 10594368, 'steps': 55178, 'loss/train': 1.444591760635376} -08/30/2021 23:09:06 - INFO - __main__ - Step 55180: {'lr': 0.0003569295481580874, 'samples': 10594560, 'steps': 55179, 'loss/train': 1.8953707218170166} -08/30/2021 23:09:08 - INFO - __main__ - Step 55181: {'lr': 0.0003569247513033848, 'samples': 10594752, 'steps': 55180, 'loss/train': 1.341706395149231} -08/30/2021 23:09:08 - INFO - __main__ - Step 55182: {'lr': 0.00035691995440050364, 'samples': 10594944, 'steps': 55181, 'loss/train': 1.5464110374450684} -08/30/2021 23:09:08 - INFO - __main__ - Step 55183: {'lr': 0.0003569151574494459, 'samples': 10595136, 'steps': 55182, 'loss/train': 1.1986277103424072} -08/30/2021 23:09:09 - INFO - __main__ - Step 55184: {'lr': 0.00035691036045021384, 'samples': 10595328, 'steps': 55183, 'loss/train': 0.5342109799385071} -08/30/2021 23:09:09 - INFO - __main__ - Step 55185: {'lr': 0.0003569055634028097, 'samples': 10595520, 'steps': 55184, 'loss/train': 1.1683378219604492} -08/30/2021 23:09:09 - INFO - __main__ - Step 55186: {'lr': 0.00035690076630723555, 'samples': 10595712, 'steps': 55185, 'loss/train': 1.2338920831680298} -08/30/2021 23:09:11 - INFO - __main__ - Step 55187: {'lr': 0.0003568959691634935, 'samples': 10595904, 'steps': 55186, 'loss/train': 1.3028740882873535} -08/30/2021 23:09:11 - INFO - __main__ - Step 55188: {'lr': 0.0003568911719715858, 'samples': 10596096, 'steps': 55187, 'loss/train': 1.3566453456878662} -08/30/2021 23:09:12 - INFO - __main__ - Step 55189: {'lr': 0.00035688637473151464, 'samples': 10596288, 'steps': 55188, 'loss/train': 1.7473326921463013} -08/30/2021 23:09:12 - INFO - __main__ - Step 55190: {'lr': 0.0003568815774432821, 'samples': 10596480, 'steps': 55189, 'loss/train': 1.631582498550415} -08/30/2021 23:09:12 - INFO - __main__ - Step 55191: {'lr': 0.00035687678010689033, 'samples': 10596672, 'steps': 55190, 'loss/train': 1.0861504077911377} -08/30/2021 23:09:14 - INFO - __main__ - Step 55192: {'lr': 0.00035687198272234163, 'samples': 10596864, 'steps': 55191, 'loss/train': 1.4811815023422241} -08/30/2021 23:09:14 - INFO - __main__ - Step 55193: {'lr': 0.00035686718528963804, 'samples': 10597056, 'steps': 55192, 'loss/train': 1.5605378150939941} -08/30/2021 23:09:15 - INFO - __main__ - Step 55194: {'lr': 0.00035686238780878167, 'samples': 10597248, 'steps': 55193, 'loss/train': 1.0274966955184937} -08/30/2021 23:09:15 - INFO - __main__ - Step 55195: {'lr': 0.0003568575902797748, 'samples': 10597440, 'steps': 55194, 'loss/train': 1.2675894498825073} -08/30/2021 23:09:15 - INFO - __main__ - Step 55196: {'lr': 0.0003568527927026195, 'samples': 10597632, 'steps': 55195, 'loss/train': 1.0265432596206665} -08/30/2021 23:09:17 - INFO - __main__ - Step 55197: {'lr': 0.000356847995077318, 'samples': 10597824, 'steps': 55196, 'loss/train': 1.2248847484588623} -08/30/2021 23:09:18 - INFO - __main__ - Step 55198: {'lr': 0.0003568431974038725, 'samples': 10598016, 'steps': 55197, 'loss/train': 1.6994012594223022} -08/30/2021 23:09:18 - INFO - __main__ - Step 55199: {'lr': 0.0003568383996822851, 'samples': 10598208, 'steps': 55198, 'loss/train': 1.3403412103652954} -08/30/2021 23:09:18 - INFO - __main__ - Step 55200: {'lr': 0.0003568336019125579, 'samples': 10598400, 'steps': 55199, 'loss/train': 0.9988178014755249} -08/30/2021 23:09:19 - INFO - __main__ - Step 55201: {'lr': 0.0003568288040946931, 'samples': 10598592, 'steps': 55200, 'loss/train': 1.150381326675415} -08/30/2021 23:09:20 - INFO - __main__ - Step 55202: {'lr': 0.000356824006228693, 'samples': 10598784, 'steps': 55201, 'loss/train': 0.30949753522872925} -08/30/2021 23:09:21 - INFO - __main__ - Step 55203: {'lr': 0.0003568192083145596, 'samples': 10598976, 'steps': 55202, 'loss/train': 0.9256338477134705} -08/30/2021 23:09:21 - INFO - __main__ - Step 55204: {'lr': 0.0003568144103522951, 'samples': 10599168, 'steps': 55203, 'loss/train': 1.4142298698425293} -08/30/2021 23:09:22 - INFO - __main__ - Step 55205: {'lr': 0.00035680961234190166, 'samples': 10599360, 'steps': 55204, 'loss/train': 0.08180546015501022} -08/30/2021 23:09:22 - INFO - __main__ - Step 55206: {'lr': 0.00035680481428338156, 'samples': 10599552, 'steps': 55205, 'loss/train': 1.1518126726150513} -08/30/2021 23:09:24 - INFO - __main__ - Step 55207: {'lr': 0.0003568000161767368, 'samples': 10599744, 'steps': 55206, 'loss/train': 1.2232271432876587} -08/30/2021 23:09:24 - INFO - __main__ - Step 55208: {'lr': 0.0003567952180219696, 'samples': 10599936, 'steps': 55207, 'loss/train': 1.1638550758361816} -08/30/2021 23:09:24 - INFO - __main__ - Step 55209: {'lr': 0.00035679041981908206, 'samples': 10600128, 'steps': 55208, 'loss/train': 1.3882882595062256} -08/30/2021 23:09:25 - INFO - __main__ - Step 55210: {'lr': 0.0003567856215680765, 'samples': 10600320, 'steps': 55209, 'loss/train': 0.9962772727012634} -08/30/2021 23:09:25 - INFO - __main__ - Step 55211: {'lr': 0.0003567808232689549, 'samples': 10600512, 'steps': 55210, 'loss/train': 1.2523547410964966} -08/30/2021 23:09:27 - INFO - __main__ - Step 55212: {'lr': 0.00035677602492171953, 'samples': 10600704, 'steps': 55211, 'loss/train': 1.8029344081878662} -08/30/2021 23:09:27 - INFO - __main__ - Step 55213: {'lr': 0.0003567712265263726, 'samples': 10600896, 'steps': 55212, 'loss/train': 1.1729871034622192} -08/30/2021 23:09:27 - INFO - __main__ - Step 55214: {'lr': 0.0003567664280829161, 'samples': 10601088, 'steps': 55213, 'loss/train': 1.4841314554214478} -08/30/2021 23:09:28 - INFO - __main__ - Step 55215: {'lr': 0.0003567616295913524, 'samples': 10601280, 'steps': 55214, 'loss/train': 1.266242265701294} -08/30/2021 23:09:28 - INFO - __main__ - Step 55216: {'lr': 0.0003567568310516834, 'samples': 10601472, 'steps': 55215, 'loss/train': 0.7293866276741028} -08/30/2021 23:09:28 - INFO - __main__ - Step 55217: {'lr': 0.0003567520324639116, 'samples': 10601664, 'steps': 55216, 'loss/train': 0.7984895706176758} -08/30/2021 23:09:30 - INFO - __main__ - Step 55218: {'lr': 0.0003567472338280389, 'samples': 10601856, 'steps': 55217, 'loss/train': 1.240403413772583} -08/30/2021 23:09:31 - INFO - __main__ - Step 55219: {'lr': 0.00035674243514406754, 'samples': 10602048, 'steps': 55218, 'loss/train': 0.9931859970092773} -08/30/2021 23:09:31 - INFO - __main__ - Step 55220: {'lr': 0.00035673763641199974, 'samples': 10602240, 'steps': 55219, 'loss/train': 1.7366400957107544} -08/30/2021 23:09:32 - INFO - __main__ - Step 55221: {'lr': 0.0003567328376318375, 'samples': 10602432, 'steps': 55220, 'loss/train': 1.8007313013076782} -08/30/2021 23:09:32 - INFO - __main__ - Step 55222: {'lr': 0.0003567280388035832, 'samples': 10602624, 'steps': 55221, 'loss/train': 1.0405681133270264} -08/30/2021 23:09:34 - INFO - __main__ - Step 55223: {'lr': 0.0003567232399272388, 'samples': 10602816, 'steps': 55222, 'loss/train': 1.0924535989761353} -08/30/2021 23:09:34 - INFO - __main__ - Step 55224: {'lr': 0.0003567184410028066, 'samples': 10603008, 'steps': 55223, 'loss/train': 0.13639983534812927} -08/30/2021 23:09:35 - INFO - __main__ - Step 55225: {'lr': 0.0003567136420302887, 'samples': 10603200, 'steps': 55224, 'loss/train': 1.3539752960205078} -08/30/2021 23:09:35 - INFO - __main__ - Step 55226: {'lr': 0.00035670884300968735, 'samples': 10603392, 'steps': 55225, 'loss/train': 1.052544355392456} -08/30/2021 23:09:35 - INFO - __main__ - Step 55227: {'lr': 0.0003567040439410046, 'samples': 10603584, 'steps': 55226, 'loss/train': 1.6347931623458862} -08/30/2021 23:09:37 - INFO - __main__ - Step 55228: {'lr': 0.0003566992448242427, 'samples': 10603776, 'steps': 55227, 'loss/train': 1.0890344381332397} -08/30/2021 23:09:37 - INFO - __main__ - Step 55229: {'lr': 0.0003566944456594036, 'samples': 10603968, 'steps': 55228, 'loss/train': 1.7391352653503418} -08/30/2021 23:09:38 - INFO - __main__ - Step 55230: {'lr': 0.00035668964644648975, 'samples': 10604160, 'steps': 55229, 'loss/train': 0.8697241544723511} -08/30/2021 23:09:38 - INFO - __main__ - Step 55231: {'lr': 0.0003566848471855032, 'samples': 10604352, 'steps': 55230, 'loss/train': 0.6922517418861389} -08/30/2021 23:09:38 - INFO - __main__ - Step 55232: {'lr': 0.0003566800478764461, 'samples': 10604544, 'steps': 55231, 'loss/train': 0.861565351486206} -08/30/2021 23:09:40 - INFO - __main__ - Step 55233: {'lr': 0.00035667524851932066, 'samples': 10604736, 'steps': 55232, 'loss/train': 1.5160175561904907} -08/30/2021 23:09:40 - INFO - __main__ - Step 55234: {'lr': 0.0003566704491141289, 'samples': 10604928, 'steps': 55233, 'loss/train': 1.7381420135498047} -08/30/2021 23:09:41 - INFO - __main__ - Step 55235: {'lr': 0.0003566656496608731, 'samples': 10605120, 'steps': 55234, 'loss/train': 1.8258566856384277} -08/30/2021 23:09:41 - INFO - __main__ - Step 55236: {'lr': 0.0003566608501595554, 'samples': 10605312, 'steps': 55235, 'loss/train': 1.2742383480072021} -08/30/2021 23:09:41 - INFO - __main__ - Step 55237: {'lr': 0.000356656050610178, 'samples': 10605504, 'steps': 55236, 'loss/train': 1.397837519645691} -08/30/2021 23:09:43 - INFO - __main__ - Step 55238: {'lr': 0.000356651251012743, 'samples': 10605696, 'steps': 55237, 'loss/train': 1.0106456279754639} -08/30/2021 23:09:43 - INFO - __main__ - Step 55239: {'lr': 0.0003566464513672527, 'samples': 10605888, 'steps': 55238, 'loss/train': 1.1335854530334473} -08/30/2021 23:09:44 - INFO - __main__ - Step 55240: {'lr': 0.00035664165167370907, 'samples': 10606080, 'steps': 55239, 'loss/train': 1.4258606433868408} -08/30/2021 23:09:44 - INFO - __main__ - Step 55241: {'lr': 0.0003566368519321144, 'samples': 10606272, 'steps': 55240, 'loss/train': 1.9990119934082031} -08/30/2021 23:09:44 - INFO - __main__ - Step 55242: {'lr': 0.0003566320521424707, 'samples': 10606464, 'steps': 55241, 'loss/train': 1.1276401281356812} -08/30/2021 23:09:46 - INFO - __main__ - Step 55243: {'lr': 0.0003566272523047803, 'samples': 10606656, 'steps': 55242, 'loss/train': 1.390738606452942} -08/30/2021 23:09:46 - INFO - __main__ - Step 55244: {'lr': 0.00035662245241904533, 'samples': 10606848, 'steps': 55243, 'loss/train': 1.3159795999526978} -08/30/2021 23:09:47 - INFO - __main__ - Step 55245: {'lr': 0.0003566176524852679, 'samples': 10607040, 'steps': 55244, 'loss/train': 0.6738126873970032} -08/30/2021 23:09:47 - INFO - __main__ - Step 55246: {'lr': 0.00035661285250345023, 'samples': 10607232, 'steps': 55245, 'loss/train': 0.24185334146022797} -08/30/2021 23:09:47 - INFO - __main__ - Step 55247: {'lr': 0.00035660805247359444, 'samples': 10607424, 'steps': 55246, 'loss/train': 1.2494441270828247} -08/30/2021 23:09:49 - INFO - __main__ - Step 55248: {'lr': 0.0003566032523957027, 'samples': 10607616, 'steps': 55247, 'loss/train': 1.6309080123901367} -08/30/2021 23:09:49 - INFO - __main__ - Step 55249: {'lr': 0.00035659845226977715, 'samples': 10607808, 'steps': 55248, 'loss/train': 1.243443489074707} -08/30/2021 23:09:50 - INFO - __main__ - Step 55250: {'lr': 0.00035659365209582004, 'samples': 10608000, 'steps': 55249, 'loss/train': 1.7340915203094482} -08/30/2021 23:09:50 - INFO - __main__ - Step 55251: {'lr': 0.00035658885187383343, 'samples': 10608192, 'steps': 55250, 'loss/train': 0.9365938305854797} -08/30/2021 23:09:50 - INFO - __main__ - Step 55252: {'lr': 0.0003565840516038196, 'samples': 10608384, 'steps': 55251, 'loss/train': 1.5120447874069214} -08/30/2021 23:09:52 - INFO - __main__ - Step 55253: {'lr': 0.00035657925128578064, 'samples': 10608576, 'steps': 55252, 'loss/train': 1.5985994338989258} -08/30/2021 23:09:52 - INFO - __main__ - Step 55254: {'lr': 0.00035657445091971863, 'samples': 10608768, 'steps': 55253, 'loss/train': 1.6367053985595703} -08/30/2021 23:09:53 - INFO - __main__ - Step 55255: {'lr': 0.00035656965050563584, 'samples': 10608960, 'steps': 55254, 'loss/train': 0.8891958594322205} -08/30/2021 23:09:53 - INFO - __main__ - Step 55256: {'lr': 0.0003565648500435344, 'samples': 10609152, 'steps': 55255, 'loss/train': 1.3963193893432617} -08/30/2021 23:09:53 - INFO - __main__ - Step 55257: {'lr': 0.0003565600495334165, 'samples': 10609344, 'steps': 55256, 'loss/train': 0.7875350713729858} -08/30/2021 23:09:54 - INFO - __main__ - Step 55258: {'lr': 0.0003565552489752843, 'samples': 10609536, 'steps': 55257, 'loss/train': 1.0236879587173462} -08/30/2021 23:09:55 - INFO - __main__ - Step 55259: {'lr': 0.0003565504483691399, 'samples': 10609728, 'steps': 55258, 'loss/train': 1.2806881666183472} -08/30/2021 23:09:56 - INFO - __main__ - Step 55260: {'lr': 0.0003565456477149856, 'samples': 10609920, 'steps': 55259, 'loss/train': 1.293763279914856} -08/30/2021 23:09:56 - INFO - __main__ - Step 55261: {'lr': 0.0003565408470128234, 'samples': 10610112, 'steps': 55260, 'loss/train': 1.6316332817077637} -08/30/2021 23:09:56 - INFO - __main__ - Step 55262: {'lr': 0.00035653604626265556, 'samples': 10610304, 'steps': 55261, 'loss/train': 1.100925087928772} -08/30/2021 23:09:57 - INFO - __main__ - Step 55263: {'lr': 0.00035653124546448423, 'samples': 10610496, 'steps': 55262, 'loss/train': 1.580403208732605} -08/30/2021 23:09:58 - INFO - __main__ - Step 55264: {'lr': 0.0003565264446183116, 'samples': 10610688, 'steps': 55263, 'loss/train': 1.4981789588928223} -08/30/2021 23:09:58 - INFO - __main__ - Step 55265: {'lr': 0.00035652164372413975, 'samples': 10610880, 'steps': 55264, 'loss/train': 1.0928590297698975} -08/30/2021 23:09:59 - INFO - __main__ - Step 55266: {'lr': 0.0003565168427819709, 'samples': 10611072, 'steps': 55265, 'loss/train': 0.9962037801742554} -08/30/2021 23:09:59 - INFO - __main__ - Step 55267: {'lr': 0.00035651204179180723, 'samples': 10611264, 'steps': 55266, 'loss/train': 1.5822793245315552} -08/30/2021 23:10:00 - INFO - __main__ - Step 55268: {'lr': 0.00035650724075365084, 'samples': 10611456, 'steps': 55267, 'loss/train': 1.0196447372436523} -08/30/2021 23:10:02 - INFO - __main__ - Step 55269: {'lr': 0.000356502439667504, 'samples': 10611648, 'steps': 55268, 'loss/train': 1.847999930381775} -08/30/2021 23:10:02 - INFO - __main__ - Step 55270: {'lr': 0.0003564976385333687, 'samples': 10611840, 'steps': 55269, 'loss/train': 1.2942416667938232} -08/30/2021 23:10:02 - INFO - __main__ - Step 55271: {'lr': 0.00035649283735124723, 'samples': 10612032, 'steps': 55270, 'loss/train': 2.068279266357422} -08/30/2021 23:10:03 - INFO - __main__ - Step 55272: {'lr': 0.0003564880361211418, 'samples': 10612224, 'steps': 55271, 'loss/train': 1.2610375881195068} -08/30/2021 23:10:03 - INFO - __main__ - Step 55273: {'lr': 0.00035648323484305445, 'samples': 10612416, 'steps': 55272, 'loss/train': 1.0171916484832764} -08/30/2021 23:10:05 - INFO - __main__ - Step 55274: {'lr': 0.00035647843351698736, 'samples': 10612608, 'steps': 55273, 'loss/train': 0.059180378913879395} -08/30/2021 23:10:05 - INFO - __main__ - Step 55275: {'lr': 0.0003564736321429428, 'samples': 10612800, 'steps': 55274, 'loss/train': 0.7148613929748535} -08/30/2021 23:10:05 - INFO - __main__ - Step 55276: {'lr': 0.00035646883072092285, 'samples': 10612992, 'steps': 55275, 'loss/train': 1.365022897720337} -08/30/2021 23:10:06 - INFO - __main__ - Step 55277: {'lr': 0.00035646402925092966, 'samples': 10613184, 'steps': 55276, 'loss/train': 1.5075931549072266} -08/30/2021 23:10:06 - INFO - __main__ - Step 55278: {'lr': 0.00035645922773296546, 'samples': 10613376, 'steps': 55277, 'loss/train': 1.8225433826446533} -08/30/2021 23:10:07 - INFO - __main__ - Step 55279: {'lr': 0.0003564544261670324, 'samples': 10613568, 'steps': 55278, 'loss/train': 1.1647119522094727} -08/30/2021 23:10:08 - INFO - __main__ - Step 55280: {'lr': 0.0003564496245531326, 'samples': 10613760, 'steps': 55279, 'loss/train': 1.2166565656661987} -08/30/2021 23:10:08 - INFO - __main__ - Step 55281: {'lr': 0.0003564448228912682, 'samples': 10613952, 'steps': 55280, 'loss/train': 1.0484657287597656} -08/30/2021 23:10:09 - INFO - __main__ - Step 55282: {'lr': 0.0003564400211814414, 'samples': 10614144, 'steps': 55281, 'loss/train': 1.6991456747055054} -08/30/2021 23:10:09 - INFO - __main__ - Step 55283: {'lr': 0.0003564352194236544, 'samples': 10614336, 'steps': 55282, 'loss/train': 0.7457453012466431} -08/30/2021 23:10:11 - INFO - __main__ - Step 55284: {'lr': 0.00035643041761790936, 'samples': 10614528, 'steps': 55283, 'loss/train': 1.294876217842102} -08/30/2021 23:10:11 - INFO - __main__ - Step 55285: {'lr': 0.00035642561576420834, 'samples': 10614720, 'steps': 55284, 'loss/train': 0.3047093152999878} -08/30/2021 23:10:11 - INFO - __main__ - Step 55286: {'lr': 0.00035642081386255366, 'samples': 10614912, 'steps': 55285, 'loss/train': 1.044171690940857} -08/30/2021 23:10:12 - INFO - __main__ - Step 55287: {'lr': 0.0003564160119129473, 'samples': 10615104, 'steps': 55286, 'loss/train': 1.004141926765442} -08/30/2021 23:10:12 - INFO - __main__ - Step 55288: {'lr': 0.0003564112099153916, 'samples': 10615296, 'steps': 55287, 'loss/train': 1.2524629831314087} -08/30/2021 23:10:13 - INFO - __main__ - Step 55289: {'lr': 0.00035640640786988866, 'samples': 10615488, 'steps': 55288, 'loss/train': 0.9085763096809387} -08/30/2021 23:10:14 - INFO - __main__ - Step 55290: {'lr': 0.0003564016057764406, 'samples': 10615680, 'steps': 55289, 'loss/train': 1.1156152486801147} -08/30/2021 23:10:14 - INFO - __main__ - Step 55291: {'lr': 0.00035639680363504965, 'samples': 10615872, 'steps': 55290, 'loss/train': 1.3552489280700684} -08/30/2021 23:10:15 - INFO - __main__ - Step 55292: {'lr': 0.0003563920014457179, 'samples': 10616064, 'steps': 55291, 'loss/train': 0.042330436408519745} -08/30/2021 23:10:15 - INFO - __main__ - Step 55293: {'lr': 0.0003563871992084476, 'samples': 10616256, 'steps': 55292, 'loss/train': 1.5442012548446655} -08/30/2021 23:10:17 - INFO - __main__ - Step 55294: {'lr': 0.0003563823969232409, 'samples': 10616448, 'steps': 55293, 'loss/train': 1.1046733856201172} -08/30/2021 23:10:17 - INFO - __main__ - Step 55295: {'lr': 0.0003563775945900999, 'samples': 10616640, 'steps': 55294, 'loss/train': 1.1372112035751343} -08/30/2021 23:10:18 - INFO - __main__ - Step 55296: {'lr': 0.00035637279220902677, 'samples': 10616832, 'steps': 55295, 'loss/train': 1.1792093515396118} -08/30/2021 23:10:18 - INFO - __main__ - Step 55297: {'lr': 0.00035636798978002374, 'samples': 10617024, 'steps': 55296, 'loss/train': 1.0071793794631958} -08/30/2021 23:10:18 - INFO - __main__ - Step 55298: {'lr': 0.00035636318730309285, 'samples': 10617216, 'steps': 55297, 'loss/train': 1.6232167482376099} -08/30/2021 23:10:20 - INFO - __main__ - Step 55299: {'lr': 0.0003563583847782364, 'samples': 10617408, 'steps': 55298, 'loss/train': 1.3834015130996704} -08/30/2021 23:10:21 - INFO - __main__ - Step 55300: {'lr': 0.0003563535822054565, 'samples': 10617600, 'steps': 55299, 'loss/train': 0.7916845083236694} -08/30/2021 23:10:21 - INFO - __main__ - Step 55301: {'lr': 0.00035634877958475535, 'samples': 10617792, 'steps': 55300, 'loss/train': 1.506651520729065} -08/30/2021 23:10:21 - INFO - __main__ - Step 55302: {'lr': 0.0003563439769161351, 'samples': 10617984, 'steps': 55301, 'loss/train': 1.3220170736312866} -08/30/2021 23:10:22 - INFO - __main__ - Step 55303: {'lr': 0.00035633917419959784, 'samples': 10618176, 'steps': 55302, 'loss/train': 1.0774294137954712} -08/30/2021 23:10:22 - INFO - __main__ - Step 55304: {'lr': 0.0003563343714351458, 'samples': 10618368, 'steps': 55303, 'loss/train': 2.262615203857422} -08/30/2021 23:10:23 - INFO - __main__ - Step 55305: {'lr': 0.0003563295686227811, 'samples': 10618560, 'steps': 55304, 'loss/train': 1.303059697151184} -08/30/2021 23:10:24 - INFO - __main__ - Step 55306: {'lr': 0.000356324765762506, 'samples': 10618752, 'steps': 55305, 'loss/train': 0.9564140439033508} -08/30/2021 23:10:24 - INFO - __main__ - Step 55307: {'lr': 0.0003563199628543226, 'samples': 10618944, 'steps': 55306, 'loss/train': 1.0562925338745117} -08/30/2021 23:10:25 - INFO - __main__ - Step 55308: {'lr': 0.00035631515989823306, 'samples': 10619136, 'steps': 55307, 'loss/train': 1.583857774734497} -08/30/2021 23:10:25 - INFO - __main__ - Step 55309: {'lr': 0.0003563103568942395, 'samples': 10619328, 'steps': 55308, 'loss/train': 1.736372947692871} -08/30/2021 23:10:26 - INFO - __main__ - Step 55310: {'lr': 0.0003563055538423441, 'samples': 10619520, 'steps': 55309, 'loss/train': 0.5877330303192139} -08/30/2021 23:10:27 - INFO - __main__ - Step 55311: {'lr': 0.00035630075074254917, 'samples': 10619712, 'steps': 55310, 'loss/train': 1.0950294733047485} -08/30/2021 23:10:27 - INFO - __main__ - Step 55312: {'lr': 0.0003562959475948567, 'samples': 10619904, 'steps': 55311, 'loss/train': 0.3165510892868042} -08/30/2021 23:10:28 - INFO - __main__ - Step 55313: {'lr': 0.00035629114439926897, 'samples': 10620096, 'steps': 55312, 'loss/train': 1.2183908224105835} -08/30/2021 23:10:28 - INFO - __main__ - Step 55314: {'lr': 0.00035628634115578806, 'samples': 10620288, 'steps': 55313, 'loss/train': 1.3466416597366333} -08/30/2021 23:10:29 - INFO - __main__ - Step 55315: {'lr': 0.00035628153786441616, 'samples': 10620480, 'steps': 55314, 'loss/train': 1.0653544664382935} -08/30/2021 23:10:30 - INFO - __main__ - Step 55316: {'lr': 0.0003562767345251554, 'samples': 10620672, 'steps': 55315, 'loss/train': 0.7332490682601929} -08/30/2021 23:10:30 - INFO - __main__ - Step 55317: {'lr': 0.00035627193113800797, 'samples': 10620864, 'steps': 55316, 'loss/train': 0.8477377891540527} -08/30/2021 23:10:31 - INFO - __main__ - Step 55318: {'lr': 0.0003562671277029761, 'samples': 10621056, 'steps': 55317, 'loss/train': 1.7145271301269531} -08/30/2021 23:10:31 - INFO - __main__ - Step 55319: {'lr': 0.00035626232422006186, 'samples': 10621248, 'steps': 55318, 'loss/train': 1.4092390537261963} -08/30/2021 23:10:33 - INFO - __main__ - Step 55320: {'lr': 0.0003562575206892676, 'samples': 10621440, 'steps': 55319, 'loss/train': 1.437728762626648} -08/30/2021 23:10:34 - INFO - __main__ - Step 55321: {'lr': 0.0003562527171105952, 'samples': 10621632, 'steps': 55320, 'loss/train': 0.6264386177062988} -08/30/2021 23:10:34 - INFO - __main__ - Step 55322: {'lr': 0.000356247913484047, 'samples': 10621824, 'steps': 55321, 'loss/train': 1.5079323053359985} -08/30/2021 23:10:34 - INFO - __main__ - Step 55323: {'lr': 0.00035624310980962516, 'samples': 10622016, 'steps': 55322, 'loss/train': 1.302291989326477} -08/30/2021 23:10:35 - INFO - __main__ - Step 55324: {'lr': 0.0003562383060873318, 'samples': 10622208, 'steps': 55323, 'loss/train': 1.4527934789657593} -08/30/2021 23:10:35 - INFO - __main__ - Step 55325: {'lr': 0.000356233502317169, 'samples': 10622400, 'steps': 55324, 'loss/train': 1.5112656354904175} -08/30/2021 23:10:37 - INFO - __main__ - Step 55326: {'lr': 0.00035622869849913916, 'samples': 10622592, 'steps': 55325, 'loss/train': 0.46029818058013916} -08/30/2021 23:10:37 - INFO - __main__ - Step 55327: {'lr': 0.00035622389463324424, 'samples': 10622784, 'steps': 55326, 'loss/train': 0.0676017478108406} -08/30/2021 23:10:38 - INFO - __main__ - Step 55328: {'lr': 0.0003562190907194865, 'samples': 10622976, 'steps': 55327, 'loss/train': 0.026389867067337036} -08/30/2021 23:10:38 - INFO - __main__ - Step 55329: {'lr': 0.00035621428675786804, 'samples': 10623168, 'steps': 55328, 'loss/train': 1.9485284090042114} -08/30/2021 23:10:39 - INFO - __main__ - Step 55330: {'lr': 0.0003562094827483911, 'samples': 10623360, 'steps': 55329, 'loss/train': 1.7217789888381958} -08/30/2021 23:10:39 - INFO - __main__ - Step 55331: {'lr': 0.0003562046786910578, 'samples': 10623552, 'steps': 55330, 'loss/train': 1.1546274423599243} -08/30/2021 23:10:40 - INFO - __main__ - Step 55332: {'lr': 0.0003561998745858703, 'samples': 10623744, 'steps': 55331, 'loss/train': 0.8172891139984131} -08/30/2021 23:10:41 - INFO - __main__ - Step 55333: {'lr': 0.00035619507043283075, 'samples': 10623936, 'steps': 55332, 'loss/train': 0.809817373752594} -08/30/2021 23:10:41 - INFO - __main__ - Step 55334: {'lr': 0.0003561902662319414, 'samples': 10624128, 'steps': 55333, 'loss/train': 1.9766159057617188} -08/30/2021 23:10:42 - INFO - __main__ - Step 55335: {'lr': 0.00035618546198320426, 'samples': 10624320, 'steps': 55334, 'loss/train': 1.3971039056777954} -08/30/2021 23:10:42 - INFO - __main__ - Step 55336: {'lr': 0.0003561806576866217, 'samples': 10624512, 'steps': 55335, 'loss/train': 0.38044917583465576} -08/30/2021 23:10:44 - INFO - __main__ - Step 55337: {'lr': 0.0003561758533421957, 'samples': 10624704, 'steps': 55336, 'loss/train': 1.1008824110031128} -08/30/2021 23:10:44 - INFO - __main__ - Step 55338: {'lr': 0.00035617104894992854, 'samples': 10624896, 'steps': 55337, 'loss/train': 1.2946010828018188} -08/30/2021 23:10:45 - INFO - __main__ - Step 55339: {'lr': 0.00035616624450982227, 'samples': 10625088, 'steps': 55338, 'loss/train': 1.4345452785491943} -08/30/2021 23:10:45 - INFO - __main__ - Step 55340: {'lr': 0.0003561614400218792, 'samples': 10625280, 'steps': 55339, 'loss/train': 1.0193989276885986} -08/30/2021 23:10:45 - INFO - __main__ - Step 55341: {'lr': 0.00035615663548610145, 'samples': 10625472, 'steps': 55340, 'loss/train': 0.01815672777593136} -08/30/2021 23:10:46 - INFO - __main__ - Step 55342: {'lr': 0.0003561518309024911, 'samples': 10625664, 'steps': 55341, 'loss/train': 1.6040068864822388} -08/30/2021 23:10:46 - INFO - __main__ - Step 55343: {'lr': 0.0003561470262710504, 'samples': 10625856, 'steps': 55342, 'loss/train': 0.7478710412979126} -08/30/2021 23:10:48 - INFO - __main__ - Step 55344: {'lr': 0.00035614222159178143, 'samples': 10626048, 'steps': 55343, 'loss/train': 1.6130714416503906} -08/30/2021 23:10:48 - INFO - __main__ - Step 55345: {'lr': 0.00035613741686468646, 'samples': 10626240, 'steps': 55344, 'loss/train': 1.321609616279602} -08/30/2021 23:10:48 - INFO - __main__ - Step 55346: {'lr': 0.0003561326120897676, 'samples': 10626432, 'steps': 55345, 'loss/train': 0.9996790289878845} -08/30/2021 23:10:49 - INFO - __main__ - Step 55347: {'lr': 0.00035612780726702707, 'samples': 10626624, 'steps': 55346, 'loss/train': 1.4161497354507446} -08/30/2021 23:10:49 - INFO - __main__ - Step 55348: {'lr': 0.00035612300239646694, 'samples': 10626816, 'steps': 55347, 'loss/train': 1.2000510692596436} -08/30/2021 23:10:51 - INFO - __main__ - Step 55349: {'lr': 0.00035611819747808943, 'samples': 10627008, 'steps': 55348, 'loss/train': 1.8668888807296753} -08/30/2021 23:10:51 - INFO - __main__ - Step 55350: {'lr': 0.00035611339251189665, 'samples': 10627200, 'steps': 55349, 'loss/train': 1.280078411102295} -08/30/2021 23:10:52 - INFO - __main__ - Step 55351: {'lr': 0.0003561085874978909, 'samples': 10627392, 'steps': 55350, 'loss/train': 1.2095434665679932} -08/30/2021 23:10:52 - INFO - __main__ - Step 55352: {'lr': 0.00035610378243607424, 'samples': 10627584, 'steps': 55351, 'loss/train': 1.4801084995269775} -08/30/2021 23:10:52 - INFO - __main__ - Step 55353: {'lr': 0.0003560989773264488, 'samples': 10627776, 'steps': 55352, 'loss/train': 1.151530385017395} -08/30/2021 23:10:54 - INFO - __main__ - Step 55354: {'lr': 0.00035609417216901683, 'samples': 10627968, 'steps': 55353, 'loss/train': 0.8998567461967468} -08/30/2021 23:10:55 - INFO - __main__ - Step 55355: {'lr': 0.00035608936696378046, 'samples': 10628160, 'steps': 55354, 'loss/train': 1.4569636583328247} -08/30/2021 23:10:55 - INFO - __main__ - Step 55356: {'lr': 0.0003560845617107419, 'samples': 10628352, 'steps': 55355, 'loss/train': 0.854587197303772} -08/30/2021 23:10:56 - INFO - __main__ - Step 55357: {'lr': 0.0003560797564099032, 'samples': 10628544, 'steps': 55356, 'loss/train': 0.018760357052087784} -08/30/2021 23:10:56 - INFO - __main__ - Step 55358: {'lr': 0.00035607495106126664, 'samples': 10628736, 'steps': 55357, 'loss/train': 1.4873825311660767} -08/30/2021 23:10:56 - INFO - __main__ - Step 55359: {'lr': 0.0003560701456648343, 'samples': 10628928, 'steps': 55358, 'loss/train': 1.258956789970398} -08/30/2021 23:10:58 - INFO - __main__ - Step 55360: {'lr': 0.0003560653402206085, 'samples': 10629120, 'steps': 55359, 'loss/train': 1.7666727304458618} -08/30/2021 23:10:58 - INFO - __main__ - Step 55361: {'lr': 0.0003560605347285912, 'samples': 10629312, 'steps': 55360, 'loss/train': 1.3753219842910767} -08/30/2021 23:10:59 - INFO - __main__ - Step 55362: {'lr': 0.0003560557291887847, 'samples': 10629504, 'steps': 55361, 'loss/train': 1.6132206916809082} -08/30/2021 23:10:59 - INFO - __main__ - Step 55363: {'lr': 0.0003560509236011911, 'samples': 10629696, 'steps': 55362, 'loss/train': 1.3108277320861816} -08/30/2021 23:10:59 - INFO - __main__ - Step 55364: {'lr': 0.0003560461179658125, 'samples': 10629888, 'steps': 55363, 'loss/train': 1.2954736948013306} -08/30/2021 23:11:01 - INFO - __main__ - Step 55365: {'lr': 0.0003560413122826513, 'samples': 10630080, 'steps': 55364, 'loss/train': 1.3421114683151245} -08/30/2021 23:11:01 - INFO - __main__ - Step 55366: {'lr': 0.0003560365065517095, 'samples': 10630272, 'steps': 55365, 'loss/train': 0.8554668426513672} -08/30/2021 23:11:01 - INFO - __main__ - Step 55367: {'lr': 0.0003560317007729893, 'samples': 10630464, 'steps': 55366, 'loss/train': 0.07721702009439468} -08/30/2021 23:11:02 - INFO - __main__ - Step 55368: {'lr': 0.00035602689494649274, 'samples': 10630656, 'steps': 55367, 'loss/train': 1.06834876537323} -08/30/2021 23:11:02 - INFO - __main__ - Step 55369: {'lr': 0.0003560220890722222, 'samples': 10630848, 'steps': 55368, 'loss/train': 1.087509274482727} -08/30/2021 23:11:04 - INFO - __main__ - Step 55370: {'lr': 0.00035601728315017966, 'samples': 10631040, 'steps': 55369, 'loss/train': 1.802738070487976} -08/30/2021 23:11:04 - INFO - __main__ - Step 55371: {'lr': 0.00035601247718036744, 'samples': 10631232, 'steps': 55370, 'loss/train': 1.0252283811569214} -08/30/2021 23:11:04 - INFO - __main__ - Step 55372: {'lr': 0.00035600767116278765, 'samples': 10631424, 'steps': 55371, 'loss/train': 1.8033604621887207} -08/30/2021 23:11:05 - INFO - __main__ - Step 55373: {'lr': 0.0003560028650974424, 'samples': 10631616, 'steps': 55372, 'loss/train': 1.3439714908599854} -08/30/2021 23:11:05 - INFO - __main__ - Step 55374: {'lr': 0.0003559980589843339, 'samples': 10631808, 'steps': 55373, 'loss/train': 1.2238050699234009} -08/30/2021 23:11:07 - INFO - __main__ - Step 55375: {'lr': 0.0003559932528234643, 'samples': 10632000, 'steps': 55374, 'loss/train': 0.7990780472755432} -08/30/2021 23:11:07 - INFO - __main__ - Step 55376: {'lr': 0.0003559884466148358, 'samples': 10632192, 'steps': 55375, 'loss/train': 1.2638812065124512} -08/30/2021 23:11:07 - INFO - __main__ - Step 55377: {'lr': 0.0003559836403584505, 'samples': 10632384, 'steps': 55376, 'loss/train': 1.2138592004776} -08/30/2021 23:11:08 - INFO - __main__ - Step 55378: {'lr': 0.00035597883405431066, 'samples': 10632576, 'steps': 55377, 'loss/train': 1.200518012046814} -08/30/2021 23:11:08 - INFO - __main__ - Step 55379: {'lr': 0.0003559740277024183, 'samples': 10632768, 'steps': 55378, 'loss/train': 1.6666280031204224} -08/30/2021 23:11:10 - INFO - __main__ - Step 55380: {'lr': 0.0003559692213027758, 'samples': 10632960, 'steps': 55379, 'loss/train': 1.1910959482192993} -08/30/2021 23:11:11 - INFO - __main__ - Step 55381: {'lr': 0.00035596441485538513, 'samples': 10633152, 'steps': 55380, 'loss/train': 1.3170758485794067} -08/30/2021 23:11:11 - INFO - __main__ - Step 55382: {'lr': 0.00035595960836024856, 'samples': 10633344, 'steps': 55381, 'loss/train': 1.7013992071151733} -08/30/2021 23:11:11 - INFO - __main__ - Step 55383: {'lr': 0.00035595480181736816, 'samples': 10633536, 'steps': 55382, 'loss/train': 1.2633439302444458} -08/30/2021 23:11:12 - INFO - __main__ - Step 55384: {'lr': 0.0003559499952267462, 'samples': 10633728, 'steps': 55383, 'loss/train': 1.5431526899337769} -08/30/2021 23:11:12 - INFO - __main__ - Step 55385: {'lr': 0.00035594518858838485, 'samples': 10633920, 'steps': 55384, 'loss/train': 1.5441824197769165} -08/30/2021 23:11:14 - INFO - __main__ - Step 55386: {'lr': 0.0003559403819022862, 'samples': 10634112, 'steps': 55385, 'loss/train': 1.0448249578475952} -08/30/2021 23:11:14 - INFO - __main__ - Step 55387: {'lr': 0.0003559355751684525, 'samples': 10634304, 'steps': 55386, 'loss/train': 1.5194307565689087} -08/30/2021 23:11:15 - INFO - __main__ - Step 55388: {'lr': 0.00035593076838688576, 'samples': 10634496, 'steps': 55387, 'loss/train': 0.6773468852043152} -08/30/2021 23:11:15 - INFO - __main__ - Step 55389: {'lr': 0.0003559259615575883, 'samples': 10634688, 'steps': 55388, 'loss/train': 0.06502977013587952} -08/30/2021 23:11:15 - INFO - __main__ - Step 55390: {'lr': 0.00035592115468056223, 'samples': 10634880, 'steps': 55389, 'loss/train': 1.2024701833724976} -08/30/2021 23:11:17 - INFO - __main__ - Step 55391: {'lr': 0.0003559163477558098, 'samples': 10635072, 'steps': 55390, 'loss/train': 1.704396367073059} -08/30/2021 23:11:18 - INFO - __main__ - Step 55392: {'lr': 0.000355911540783333, 'samples': 10635264, 'steps': 55391, 'loss/train': 0.7037349939346313} -08/30/2021 23:11:18 - INFO - __main__ - Step 55393: {'lr': 0.0003559067337631341, 'samples': 10635456, 'steps': 55392, 'loss/train': 1.6579787731170654} -08/30/2021 23:11:18 - INFO - __main__ - Step 55394: {'lr': 0.0003559019266952153, 'samples': 10635648, 'steps': 55393, 'loss/train': 1.601279616355896} -08/30/2021 23:11:19 - INFO - __main__ - Step 55395: {'lr': 0.0003558971195795787, 'samples': 10635840, 'steps': 55394, 'loss/train': 1.461321234703064} -08/30/2021 23:11:21 - INFO - __main__ - Step 55396: {'lr': 0.00035589231241622653, 'samples': 10636032, 'steps': 55395, 'loss/train': 1.3567804098129272} -08/30/2021 23:11:21 - INFO - __main__ - Step 55397: {'lr': 0.0003558875052051609, 'samples': 10636224, 'steps': 55396, 'loss/train': 0.5615561008453369} -08/30/2021 23:11:22 - INFO - __main__ - Step 55398: {'lr': 0.000355882697946384, 'samples': 10636416, 'steps': 55397, 'loss/train': 1.4395231008529663} -08/30/2021 23:11:22 - INFO - __main__ - Step 55399: {'lr': 0.00035587789063989793, 'samples': 10636608, 'steps': 55398, 'loss/train': 1.357488751411438} -08/30/2021 23:11:22 - INFO - __main__ - Step 55400: {'lr': 0.0003558730832857049, 'samples': 10636800, 'steps': 55399, 'loss/train': 1.5035920143127441} -08/30/2021 23:11:23 - INFO - __main__ - Step 55401: {'lr': 0.00035586827588380724, 'samples': 10636992, 'steps': 55400, 'loss/train': 0.9984560608863831} -08/30/2021 23:11:24 - INFO - __main__ - Step 55402: {'lr': 0.00035586346843420694, 'samples': 10637184, 'steps': 55401, 'loss/train': 0.8850058913230896} -08/30/2021 23:11:25 - INFO - __main__ - Step 55403: {'lr': 0.0003558586609369061, 'samples': 10637376, 'steps': 55402, 'loss/train': 1.0557961463928223} -08/30/2021 23:11:25 - INFO - __main__ - Step 55404: {'lr': 0.000355853853391907, 'samples': 10637568, 'steps': 55403, 'loss/train': 1.8525205850601196} -08/30/2021 23:11:25 - INFO - __main__ - Step 55405: {'lr': 0.0003558490457992118, 'samples': 10637760, 'steps': 55404, 'loss/train': 1.0172795057296753} -08/30/2021 23:11:26 - INFO - __main__ - Step 55406: {'lr': 0.00035584423815882265, 'samples': 10637952, 'steps': 55405, 'loss/train': 0.7502500414848328} -08/30/2021 23:11:27 - INFO - __main__ - Step 55407: {'lr': 0.00035583943047074173, 'samples': 10638144, 'steps': 55406, 'loss/train': 0.35627129673957825} -08/30/2021 23:11:28 - INFO - __main__ - Step 55408: {'lr': 0.00035583462273497125, 'samples': 10638336, 'steps': 55407, 'loss/train': 1.2644280195236206} -08/30/2021 23:11:28 - INFO - __main__ - Step 55409: {'lr': 0.0003558298149515132, 'samples': 10638528, 'steps': 55408, 'loss/train': 1.445717453956604} -08/30/2021 23:11:28 - INFO - __main__ - Step 55410: {'lr': 0.00035582500712037, 'samples': 10638720, 'steps': 55409, 'loss/train': 1.1638656854629517} -08/30/2021 23:11:29 - INFO - __main__ - Step 55411: {'lr': 0.0003558201992415436, 'samples': 10638912, 'steps': 55410, 'loss/train': 1.0031850337982178} -08/30/2021 23:11:30 - INFO - __main__ - Step 55412: {'lr': 0.00035581539131503625, 'samples': 10639104, 'steps': 55411, 'loss/train': 1.0247963666915894} -08/30/2021 23:11:31 - INFO - __main__ - Step 55413: {'lr': 0.00035581058334085015, 'samples': 10639296, 'steps': 55412, 'loss/train': 1.5131694078445435} -08/30/2021 23:11:31 - INFO - __main__ - Step 55414: {'lr': 0.00035580577531898745, 'samples': 10639488, 'steps': 55413, 'loss/train': 1.1767997741699219} -08/30/2021 23:11:31 - INFO - __main__ - Step 55415: {'lr': 0.00035580096724945027, 'samples': 10639680, 'steps': 55414, 'loss/train': 2.3571736812591553} -08/30/2021 23:11:32 - INFO - __main__ - Step 55416: {'lr': 0.00035579615913224077, 'samples': 10639872, 'steps': 55415, 'loss/train': 1.2972009181976318} -08/30/2021 23:11:33 - INFO - __main__ - Step 55417: {'lr': 0.0003557913509673612, 'samples': 10640064, 'steps': 55416, 'loss/train': 1.812063455581665} -08/30/2021 23:11:34 - INFO - __main__ - Step 55418: {'lr': 0.0003557865427548137, 'samples': 10640256, 'steps': 55417, 'loss/train': 1.5160012245178223} -08/30/2021 23:11:34 - INFO - __main__ - Step 55419: {'lr': 0.0003557817344946004, 'samples': 10640448, 'steps': 55418, 'loss/train': 1.3852494955062866} -08/30/2021 23:11:35 - INFO - __main__ - Step 55420: {'lr': 0.0003557769261867235, 'samples': 10640640, 'steps': 55419, 'loss/train': 1.396045207977295} -08/30/2021 23:11:35 - INFO - __main__ - Step 55421: {'lr': 0.0003557721178311851, 'samples': 10640832, 'steps': 55420, 'loss/train': 1.4583454132080078} -08/30/2021 23:11:36 - INFO - __main__ - Step 55422: {'lr': 0.0003557673094279874, 'samples': 10641024, 'steps': 55421, 'loss/train': 1.254266381263733} -08/30/2021 23:11:37 - INFO - __main__ - Step 55423: {'lr': 0.00035576250097713263, 'samples': 10641216, 'steps': 55422, 'loss/train': 1.3631420135498047} -08/30/2021 23:11:37 - INFO - __main__ - Step 55424: {'lr': 0.00035575769247862295, 'samples': 10641408, 'steps': 55423, 'loss/train': 0.8063216209411621} -08/30/2021 23:11:38 - INFO - __main__ - Step 55425: {'lr': 0.0003557528839324604, 'samples': 10641600, 'steps': 55424, 'loss/train': 1.1090645790100098} -08/30/2021 23:11:38 - INFO - __main__ - Step 55426: {'lr': 0.0003557480753386473, 'samples': 10641792, 'steps': 55425, 'loss/train': 1.2671951055526733} -08/30/2021 23:11:39 - INFO - __main__ - Step 55427: {'lr': 0.0003557432666971857, 'samples': 10641984, 'steps': 55426, 'loss/train': 0.8759759068489075} -08/30/2021 23:11:40 - INFO - __main__ - Step 55428: {'lr': 0.0003557384580080778, 'samples': 10642176, 'steps': 55427, 'loss/train': 0.041155535727739334} -08/30/2021 23:11:40 - INFO - __main__ - Step 55429: {'lr': 0.0003557336492713258, 'samples': 10642368, 'steps': 55428, 'loss/train': 1.3602029085159302} -08/30/2021 23:11:40 - INFO - __main__ - Step 55430: {'lr': 0.00035572884048693193, 'samples': 10642560, 'steps': 55429, 'loss/train': 1.2522928714752197} -08/30/2021 23:11:41 - INFO - __main__ - Step 55431: {'lr': 0.0003557240316548982, 'samples': 10642752, 'steps': 55430, 'loss/train': 1.0957622528076172} -08/30/2021 23:11:43 - INFO - __main__ - Step 55432: {'lr': 0.0003557192227752268, 'samples': 10642944, 'steps': 55431, 'loss/train': 0.9033432006835938} -08/30/2021 23:11:44 - INFO - __main__ - Step 55433: {'lr': 0.00035571441384792005, 'samples': 10643136, 'steps': 55432, 'loss/train': 1.8867671489715576} -08/30/2021 23:11:44 - INFO - __main__ - Step 55434: {'lr': 0.00035570960487298, 'samples': 10643328, 'steps': 55433, 'loss/train': 1.381144642829895} -08/30/2021 23:11:44 - INFO - __main__ - Step 55435: {'lr': 0.00035570479585040883, 'samples': 10643520, 'steps': 55434, 'loss/train': 0.932345986366272} -08/30/2021 23:11:45 - INFO - __main__ - Step 55436: {'lr': 0.00035569998678020866, 'samples': 10643712, 'steps': 55435, 'loss/train': 1.2663263082504272} -08/30/2021 23:11:45 - INFO - __main__ - Step 55437: {'lr': 0.0003556951776623817, 'samples': 10643904, 'steps': 55436, 'loss/train': 1.147674798965454} -08/30/2021 23:11:46 - INFO - __main__ - Step 55438: {'lr': 0.0003556903684969302, 'samples': 10644096, 'steps': 55437, 'loss/train': 0.4004209041595459} -08/30/2021 23:11:46 - INFO - __main__ - Step 55439: {'lr': 0.0003556855592838562, 'samples': 10644288, 'steps': 55438, 'loss/train': 0.02406122162938118} -08/30/2021 23:11:47 - INFO - __main__ - Step 55440: {'lr': 0.00035568075002316194, 'samples': 10644480, 'steps': 55439, 'loss/train': 1.3831521272659302} -08/30/2021 23:11:48 - INFO - __main__ - Step 55441: {'lr': 0.0003556759407148496, 'samples': 10644672, 'steps': 55440, 'loss/train': 1.5924197435379028} -08/30/2021 23:11:48 - INFO - __main__ - Step 55442: {'lr': 0.00035567113135892125, 'samples': 10644864, 'steps': 55441, 'loss/train': 1.2679743766784668} -08/30/2021 23:11:49 - INFO - __main__ - Step 55443: {'lr': 0.0003556663219553791, 'samples': 10645056, 'steps': 55442, 'loss/train': 1.531531572341919} -08/30/2021 23:11:49 - INFO - __main__ - Step 55444: {'lr': 0.00035566151250422543, 'samples': 10645248, 'steps': 55443, 'loss/train': 1.22312593460083} -08/30/2021 23:11:51 - INFO - __main__ - Step 55445: {'lr': 0.0003556567030054622, 'samples': 10645440, 'steps': 55444, 'loss/train': 1.1894237995147705} -08/30/2021 23:11:51 - INFO - __main__ - Step 55446: {'lr': 0.00035565189345909177, 'samples': 10645632, 'steps': 55445, 'loss/train': 1.5968416929244995} -08/30/2021 23:11:51 - INFO - __main__ - Step 55447: {'lr': 0.0003556470838651162, 'samples': 10645824, 'steps': 55446, 'loss/train': 1.0069166421890259} -08/30/2021 23:11:52 - INFO - __main__ - Step 55448: {'lr': 0.0003556422742235377, 'samples': 10646016, 'steps': 55447, 'loss/train': 1.3170974254608154} -08/30/2021 23:11:52 - INFO - __main__ - Step 55449: {'lr': 0.0003556374645343584, 'samples': 10646208, 'steps': 55448, 'loss/train': 0.7269425392150879} -08/30/2021 23:11:53 - INFO - __main__ - Step 55450: {'lr': 0.0003556326547975805, 'samples': 10646400, 'steps': 55449, 'loss/train': 1.6099789142608643} -08/30/2021 23:11:54 - INFO - __main__ - Step 55451: {'lr': 0.0003556278450132062, 'samples': 10646592, 'steps': 55450, 'loss/train': 0.9493165016174316} -08/30/2021 23:11:54 - INFO - __main__ - Step 55452: {'lr': 0.0003556230351812375, 'samples': 10646784, 'steps': 55451, 'loss/train': 1.639000415802002} -08/30/2021 23:11:55 - INFO - __main__ - Step 55453: {'lr': 0.00035561822530167677, 'samples': 10646976, 'steps': 55452, 'loss/train': 1.3469408750534058} -08/30/2021 23:11:55 - INFO - __main__ - Step 55454: {'lr': 0.0003556134153745261, 'samples': 10647168, 'steps': 55453, 'loss/train': 1.2902514934539795} -08/30/2021 23:11:56 - INFO - __main__ - Step 55455: {'lr': 0.0003556086053997877, 'samples': 10647360, 'steps': 55454, 'loss/train': 1.410627841949463} -08/30/2021 23:11:57 - INFO - __main__ - Step 55456: {'lr': 0.0003556037953774636, 'samples': 10647552, 'steps': 55455, 'loss/train': 1.404201865196228} -08/30/2021 23:11:57 - INFO - __main__ - Step 55457: {'lr': 0.0003555989853075561, 'samples': 10647744, 'steps': 55456, 'loss/train': 0.5927403569221497} -08/30/2021 23:11:58 - INFO - __main__ - Step 55458: {'lr': 0.0003555941751900673, 'samples': 10647936, 'steps': 55457, 'loss/train': 1.3797026872634888} -08/30/2021 23:11:58 - INFO - __main__ - Step 55459: {'lr': 0.00035558936502499944, 'samples': 10648128, 'steps': 55458, 'loss/train': 1.6795721054077148} -08/30/2021 23:12:00 - INFO - __main__ - Step 55460: {'lr': 0.00035558455481235463, 'samples': 10648320, 'steps': 55459, 'loss/train': 0.06003996729850769} -08/30/2021 23:12:00 - INFO - __main__ - Step 55461: {'lr': 0.000355579744552135, 'samples': 10648512, 'steps': 55460, 'loss/train': 1.2382827997207642} -08/30/2021 23:12:01 - INFO - __main__ - Step 55462: {'lr': 0.00035557493424434285, 'samples': 10648704, 'steps': 55461, 'loss/train': 1.3931047916412354} -08/30/2021 23:12:01 - INFO - __main__ - Step 55463: {'lr': 0.0003555701238889802, 'samples': 10648896, 'steps': 55462, 'loss/train': 1.2699464559555054} -08/30/2021 23:12:01 - INFO - __main__ - Step 55464: {'lr': 0.0003555653134860493, 'samples': 10649088, 'steps': 55463, 'loss/train': 1.0769644975662231} -08/30/2021 23:12:02 - INFO - __main__ - Step 55465: {'lr': 0.00035556050303555233, 'samples': 10649280, 'steps': 55464, 'loss/train': 0.04139209911227226} -08/30/2021 23:12:03 - INFO - __main__ - Step 55466: {'lr': 0.00035555569253749135, 'samples': 10649472, 'steps': 55465, 'loss/train': 0.0201834999024868} -08/30/2021 23:12:04 - INFO - __main__ - Step 55467: {'lr': 0.0003555508819918687, 'samples': 10649664, 'steps': 55466, 'loss/train': 0.6248383522033691} -08/30/2021 23:12:04 - INFO - __main__ - Step 55468: {'lr': 0.0003555460713986864, 'samples': 10649856, 'steps': 55467, 'loss/train': 1.3763900995254517} -08/30/2021 23:12:04 - INFO - __main__ - Step 55469: {'lr': 0.00035554126075794666, 'samples': 10650048, 'steps': 55468, 'loss/train': 0.9383394718170166} -08/30/2021 23:12:05 - INFO - __main__ - Step 55470: {'lr': 0.0003555364500696517, 'samples': 10650240, 'steps': 55469, 'loss/train': 1.3142777681350708} -08/30/2021 23:12:06 - INFO - __main__ - Step 55471: {'lr': 0.0003555316393338036, 'samples': 10650432, 'steps': 55470, 'loss/train': 1.1927725076675415} -08/30/2021 23:12:07 - INFO - __main__ - Step 55472: {'lr': 0.0003555268285504045, 'samples': 10650624, 'steps': 55471, 'loss/train': 0.09798042476177216} -08/30/2021 23:12:07 - INFO - __main__ - Step 55473: {'lr': 0.00035552201771945675, 'samples': 10650816, 'steps': 55472, 'loss/train': 0.5897518396377563} -08/30/2021 23:12:08 - INFO - __main__ - Step 55474: {'lr': 0.0003555172068409624, 'samples': 10651008, 'steps': 55473, 'loss/train': 1.325345754623413} -08/30/2021 23:12:08 - INFO - __main__ - Step 55475: {'lr': 0.0003555123959149236, 'samples': 10651200, 'steps': 55474, 'loss/train': 0.7527827620506287} -08/30/2021 23:12:10 - INFO - __main__ - Step 55476: {'lr': 0.00035550758494134257, 'samples': 10651392, 'steps': 55475, 'loss/train': 0.890178382396698} -08/30/2021 23:12:10 - INFO - __main__ - Step 55477: {'lr': 0.0003555027739202214, 'samples': 10651584, 'steps': 55476, 'loss/train': 1.0366718769073486} -08/30/2021 23:12:10 - INFO - __main__ - Step 55478: {'lr': 0.00035549796285156234, 'samples': 10651776, 'steps': 55477, 'loss/train': 0.7136321663856506} -08/30/2021 23:12:11 - INFO - __main__ - Step 55479: {'lr': 0.0003554931517353675, 'samples': 10651968, 'steps': 55478, 'loss/train': 1.4436877965927124} -08/30/2021 23:12:11 - INFO - __main__ - Step 55480: {'lr': 0.0003554883405716391, 'samples': 10652160, 'steps': 55479, 'loss/train': 1.5136303901672363} -08/30/2021 23:12:13 - INFO - __main__ - Step 55481: {'lr': 0.0003554835293603793, 'samples': 10652352, 'steps': 55480, 'loss/train': 0.7693046927452087} -08/30/2021 23:12:13 - INFO - __main__ - Step 55482: {'lr': 0.0003554787181015903, 'samples': 10652544, 'steps': 55481, 'loss/train': 0.10480514913797379} -08/30/2021 23:12:13 - INFO - __main__ - Step 55483: {'lr': 0.0003554739067952741, 'samples': 10652736, 'steps': 55482, 'loss/train': 1.1686795949935913} -08/30/2021 23:12:14 - INFO - __main__ - Step 55484: {'lr': 0.00035546909544143304, 'samples': 10652928, 'steps': 55483, 'loss/train': 2.042349338531494} -08/30/2021 23:12:14 - INFO - __main__ - Step 55485: {'lr': 0.00035546428404006913, 'samples': 10653120, 'steps': 55484, 'loss/train': 1.565883755683899} -08/30/2021 23:12:14 - INFO - __main__ - Step 55486: {'lr': 0.0003554594725911848, 'samples': 10653312, 'steps': 55485, 'loss/train': 1.542165756225586} -08/30/2021 23:12:17 - INFO - __main__ - Step 55487: {'lr': 0.00035545466109478195, 'samples': 10653504, 'steps': 55486, 'loss/train': 0.9397889375686646} -08/30/2021 23:12:17 - INFO - __main__ - Step 55488: {'lr': 0.00035544984955086296, 'samples': 10653696, 'steps': 55487, 'loss/train': 0.05148085579276085} -08/30/2021 23:12:18 - INFO - __main__ - Step 55489: {'lr': 0.00035544503795942984, 'samples': 10653888, 'steps': 55488, 'loss/train': 1.193132758140564} -08/30/2021 23:12:18 - INFO - __main__ - Step 55490: {'lr': 0.00035544022632048476, 'samples': 10654080, 'steps': 55489, 'loss/train': 1.1140227317810059} -08/30/2021 23:12:18 - INFO - __main__ - Step 55491: {'lr': 0.00035543541463402994, 'samples': 10654272, 'steps': 55490, 'loss/train': 1.3388952016830444} -08/30/2021 23:12:20 - INFO - __main__ - Step 55492: {'lr': 0.0003554306029000676, 'samples': 10654464, 'steps': 55491, 'loss/train': 1.8331475257873535} -08/30/2021 23:12:21 - INFO - __main__ - Step 55493: {'lr': 0.00035542579111859986, 'samples': 10654656, 'steps': 55492, 'loss/train': 1.1105254888534546} -08/30/2021 23:12:21 - INFO - __main__ - Step 55494: {'lr': 0.0003554209792896289, 'samples': 10654848, 'steps': 55493, 'loss/train': 0.9644830822944641} -08/30/2021 23:12:21 - INFO - __main__ - Step 55495: {'lr': 0.00035541616741315685, 'samples': 10655040, 'steps': 55494, 'loss/train': 1.385136365890503} -08/30/2021 23:12:22 - INFO - __main__ - Step 55496: {'lr': 0.0003554113554891859, 'samples': 10655232, 'steps': 55495, 'loss/train': 0.09133853763341904} -08/30/2021 23:12:23 - INFO - __main__ - Step 55497: {'lr': 0.0003554065435177183, 'samples': 10655424, 'steps': 55496, 'loss/train': 0.07849901914596558} -08/30/2021 23:12:23 - INFO - __main__ - Step 55498: {'lr': 0.00035540173149875597, 'samples': 10655616, 'steps': 55497, 'loss/train': 1.8646738529205322} -08/30/2021 23:12:24 - INFO - __main__ - Step 55499: {'lr': 0.00035539691943230135, 'samples': 10655808, 'steps': 55498, 'loss/train': 1.2672700881958008} -08/30/2021 23:12:24 - INFO - __main__ - Step 55500: {'lr': 0.00035539210731835646, 'samples': 10656000, 'steps': 55499, 'loss/train': 1.5393143892288208} -08/30/2021 23:12:25 - INFO - __main__ - Step 55501: {'lr': 0.00035538729515692356, 'samples': 10656192, 'steps': 55500, 'loss/train': 1.4273806810379028} -08/30/2021 23:12:27 - INFO - __main__ - Step 55502: {'lr': 0.0003553824829480048, 'samples': 10656384, 'steps': 55501, 'loss/train': 1.3791733980178833} -08/30/2021 23:12:27 - INFO - __main__ - Step 55503: {'lr': 0.00035537767069160234, 'samples': 10656576, 'steps': 55502, 'loss/train': 1.339461088180542} -08/30/2021 23:12:28 - INFO - __main__ - Step 55504: {'lr': 0.00035537285838771823, 'samples': 10656768, 'steps': 55503, 'loss/train': 1.4004014730453491} -08/30/2021 23:12:28 - INFO - __main__ - Step 55505: {'lr': 0.00035536804603635474, 'samples': 10656960, 'steps': 55504, 'loss/train': 1.37777841091156} -08/30/2021 23:12:28 - INFO - __main__ - Step 55506: {'lr': 0.00035536323363751405, 'samples': 10657152, 'steps': 55505, 'loss/train': 1.558566689491272} -08/30/2021 23:12:29 - INFO - __main__ - Step 55507: {'lr': 0.0003553584211911983, 'samples': 10657344, 'steps': 55506, 'loss/train': 1.4632781744003296} -08/30/2021 23:12:29 - INFO - __main__ - Step 55508: {'lr': 0.00035535360869740973, 'samples': 10657536, 'steps': 55507, 'loss/train': 1.114112377166748} -08/30/2021 23:12:31 - INFO - __main__ - Step 55509: {'lr': 0.00035534879615615046, 'samples': 10657728, 'steps': 55508, 'loss/train': 1.3278900384902954} -08/30/2021 23:12:31 - INFO - __main__ - Step 55510: {'lr': 0.0003553439835674226, 'samples': 10657920, 'steps': 55509, 'loss/train': 1.4269146919250488} -08/30/2021 23:12:31 - INFO - __main__ - Step 55511: {'lr': 0.00035533917093122835, 'samples': 10658112, 'steps': 55510, 'loss/train': 1.3330708742141724} -08/30/2021 23:12:32 - INFO - __main__ - Step 55512: {'lr': 0.00035533435824756986, 'samples': 10658304, 'steps': 55511, 'loss/train': 0.44845032691955566} -08/30/2021 23:12:32 - INFO - __main__ - Step 55513: {'lr': 0.00035532954551644944, 'samples': 10658496, 'steps': 55512, 'loss/train': 1.5402897596359253} -08/30/2021 23:12:34 - INFO - __main__ - Step 55514: {'lr': 0.0003553247327378691, 'samples': 10658688, 'steps': 55513, 'loss/train': 1.9340276718139648} -08/30/2021 23:12:35 - INFO - __main__ - Step 55515: {'lr': 0.0003553199199118311, 'samples': 10658880, 'steps': 55514, 'loss/train': 5.878765106201172} -08/30/2021 23:12:35 - INFO - __main__ - Step 55516: {'lr': 0.00035531510703833754, 'samples': 10659072, 'steps': 55515, 'loss/train': 5.910140514373779} -08/30/2021 23:12:35 - INFO - __main__ - Step 55517: {'lr': 0.00035531029411739056, 'samples': 10659264, 'steps': 55516, 'loss/train': 5.913590431213379} -08/30/2021 23:12:36 - INFO - __main__ - Step 55518: {'lr': 0.00035530548114899243, 'samples': 10659456, 'steps': 55517, 'loss/train': 1.2726004123687744} -08/30/2021 23:12:36 - INFO - __main__ - Step 55519: {'lr': 0.00035530066813314534, 'samples': 10659648, 'steps': 55518, 'loss/train': 1.4622379541397095} -08/30/2021 23:12:37 - INFO - __main__ - Step 55520: {'lr': 0.0003552958550698513, 'samples': 10659840, 'steps': 55519, 'loss/train': 1.734806776046753} -08/30/2021 23:12:38 - INFO - __main__ - Step 55521: {'lr': 0.00035529104195911255, 'samples': 10660032, 'steps': 55520, 'loss/train': 1.0233968496322632} -08/30/2021 23:12:38 - INFO - __main__ - Step 55522: {'lr': 0.00035528622880093145, 'samples': 10660224, 'steps': 55521, 'loss/train': 1.0475138425827026} -08/30/2021 23:12:39 - INFO - __main__ - Step 55523: {'lr': 0.00035528141559530984, 'samples': 10660416, 'steps': 55522, 'loss/train': 1.530788779258728} -08/30/2021 23:12:39 - INFO - __main__ - Step 55524: {'lr': 0.0003552766023422501, 'samples': 10660608, 'steps': 55523, 'loss/train': 1.2065110206604004} -08/30/2021 23:12:39 - INFO - __main__ - Step 55525: {'lr': 0.00035527178904175435, 'samples': 10660800, 'steps': 55524, 'loss/train': 0.8463578820228577} -08/30/2021 23:12:41 - INFO - __main__ - Step 55526: {'lr': 0.0003552669756938247, 'samples': 10660992, 'steps': 55525, 'loss/train': 1.3025094270706177} -08/30/2021 23:12:41 - INFO - __main__ - Step 55527: {'lr': 0.0003552621622984634, 'samples': 10661184, 'steps': 55526, 'loss/train': 0.4661639332771301} -08/30/2021 23:12:42 - INFO - __main__ - Step 55528: {'lr': 0.00035525734885567275, 'samples': 10661376, 'steps': 55527, 'loss/train': 1.4807226657867432} -08/30/2021 23:12:42 - INFO - __main__ - Step 55529: {'lr': 0.0003552525353654546, 'samples': 10661568, 'steps': 55528, 'loss/train': 0.054604776203632355} -08/30/2021 23:12:42 - INFO - __main__ - Step 55530: {'lr': 0.0003552477218278113, 'samples': 10661760, 'steps': 55529, 'loss/train': 0.7658342123031616} -08/30/2021 23:12:43 - INFO - __main__ - Step 55531: {'lr': 0.00035524290824274504, 'samples': 10661952, 'steps': 55530, 'loss/train': 1.4331191778182983} -08/30/2021 23:12:44 - INFO - __main__ - Step 55532: {'lr': 0.0003552380946102579, 'samples': 10662144, 'steps': 55531, 'loss/train': 1.0050603151321411} -08/30/2021 23:12:45 - INFO - __main__ - Step 55533: {'lr': 0.0003552332809303521, 'samples': 10662336, 'steps': 55532, 'loss/train': 1.4581477642059326} -08/30/2021 23:12:45 - INFO - __main__ - Step 55534: {'lr': 0.0003552284672030298, 'samples': 10662528, 'steps': 55533, 'loss/train': 1.2428696155548096} -08/30/2021 23:12:46 - INFO - __main__ - Step 55535: {'lr': 0.0003552236534282933, 'samples': 10662720, 'steps': 55534, 'loss/train': 1.391614317893982} -08/30/2021 23:12:46 - INFO - __main__ - Step 55536: {'lr': 0.00035521883960614456, 'samples': 10662912, 'steps': 55535, 'loss/train': 1.3651405572891235} -08/30/2021 23:12:48 - INFO - __main__ - Step 55537: {'lr': 0.0003552140257365858, 'samples': 10663104, 'steps': 55536, 'loss/train': 0.24041101336479187} -08/30/2021 23:12:48 - INFO - __main__ - Step 55538: {'lr': 0.00035520921181961924, 'samples': 10663296, 'steps': 55537, 'loss/train': 1.1786699295043945} -08/30/2021 23:12:48 - INFO - __main__ - Step 55539: {'lr': 0.00035520439785524703, 'samples': 10663488, 'steps': 55538, 'loss/train': 0.39626067876815796} -08/30/2021 23:12:49 - INFO - __main__ - Step 55540: {'lr': 0.00035519958384347134, 'samples': 10663680, 'steps': 55539, 'loss/train': 1.8849173784255981} -08/30/2021 23:12:49 - INFO - __main__ - Step 55541: {'lr': 0.00035519476978429433, 'samples': 10663872, 'steps': 55540, 'loss/train': 1.102056860923767} -08/30/2021 23:12:51 - INFO - __main__ - Step 55542: {'lr': 0.0003551899556777183, 'samples': 10664064, 'steps': 55541, 'loss/train': 1.7890520095825195} -08/30/2021 23:12:52 - INFO - __main__ - Step 55543: {'lr': 0.00035518514152374514, 'samples': 10664256, 'steps': 55542, 'loss/train': 1.18366277217865} -08/30/2021 23:12:52 - INFO - __main__ - Step 55544: {'lr': 0.00035518032732237724, 'samples': 10664448, 'steps': 55543, 'loss/train': 1.1753648519515991} -08/30/2021 23:12:52 - INFO - __main__ - Step 55545: {'lr': 0.00035517551307361674, 'samples': 10664640, 'steps': 55544, 'loss/train': 6.13233757019043} -08/30/2021 23:12:53 - INFO - __main__ - Step 55546: {'lr': 0.0003551706987774657, 'samples': 10664832, 'steps': 55545, 'loss/train': 1.3345859050750732} -08/30/2021 23:12:53 - INFO - __main__ - Step 55547: {'lr': 0.00035516588443392644, 'samples': 10665024, 'steps': 55546, 'loss/train': 3.279421091079712} -08/30/2021 23:12:55 - INFO - __main__ - Step 55548: {'lr': 0.00035516107004300107, 'samples': 10665216, 'steps': 55547, 'loss/train': 1.5045636892318726} -08/30/2021 23:12:55 - INFO - __main__ - Step 55549: {'lr': 0.00035515625560469174, 'samples': 10665408, 'steps': 55548, 'loss/train': 1.1609314680099487} -08/30/2021 23:12:56 - INFO - __main__ - Step 55550: {'lr': 0.00035515144111900054, 'samples': 10665600, 'steps': 55549, 'loss/train': 2.206282138824463} -08/30/2021 23:12:56 - INFO - __main__ - Step 55551: {'lr': 0.00035514662658592977, 'samples': 10665792, 'steps': 55550, 'loss/train': 0.7513319849967957} -08/30/2021 23:12:56 - INFO - __main__ - Step 55552: {'lr': 0.0003551418120054816, 'samples': 10665984, 'steps': 55551, 'loss/train': 0.7058324217796326} -08/30/2021 23:12:58 - INFO - __main__ - Step 55553: {'lr': 0.0003551369973776581, 'samples': 10666176, 'steps': 55552, 'loss/train': 1.3419108390808105} -08/30/2021 23:12:58 - INFO - __main__ - Step 55554: {'lr': 0.0003551321827024615, 'samples': 10666368, 'steps': 55553, 'loss/train': 1.0806262493133545} -08/30/2021 23:12:59 - INFO - __main__ - Step 55555: {'lr': 0.0003551273679798939, 'samples': 10666560, 'steps': 55554, 'loss/train': 1.4196597337722778} -08/30/2021 23:12:59 - INFO - __main__ - Step 55556: {'lr': 0.00035512255320995764, 'samples': 10666752, 'steps': 55555, 'loss/train': 0.7956951856613159} -08/30/2021 23:12:59 - INFO - __main__ - Step 55557: {'lr': 0.0003551177383926547, 'samples': 10666944, 'steps': 55556, 'loss/train': 1.6736340522766113} -08/30/2021 23:13:01 - INFO - __main__ - Step 55558: {'lr': 0.00035511292352798736, 'samples': 10667136, 'steps': 55557, 'loss/train': 1.126220703125} -08/30/2021 23:13:01 - INFO - __main__ - Step 55559: {'lr': 0.0003551081086159578, 'samples': 10667328, 'steps': 55558, 'loss/train': 1.382939100265503} -08/30/2021 23:13:02 - INFO - __main__ - Step 55560: {'lr': 0.0003551032936565681, 'samples': 10667520, 'steps': 55559, 'loss/train': 1.303977608680725} -08/30/2021 23:13:02 - INFO - __main__ - Step 55561: {'lr': 0.0003550984786498205, 'samples': 10667712, 'steps': 55560, 'loss/train': 1.3649529218673706} -08/30/2021 23:13:02 - INFO - __main__ - Step 55562: {'lr': 0.0003550936635957171, 'samples': 10667904, 'steps': 55561, 'loss/train': 1.1614124774932861} -08/30/2021 23:13:04 - INFO - __main__ - Step 55563: {'lr': 0.00035508884849426014, 'samples': 10668096, 'steps': 55562, 'loss/train': 1.6265507936477661} -08/30/2021 23:13:04 - INFO - __main__ - Step 55564: {'lr': 0.0003550840333454518, 'samples': 10668288, 'steps': 55563, 'loss/train': 1.1556559801101685} -08/30/2021 23:13:05 - INFO - __main__ - Step 55565: {'lr': 0.00035507921814929415, 'samples': 10668480, 'steps': 55564, 'loss/train': 0.9558085799217224} -08/30/2021 23:13:05 - INFO - __main__ - Step 55566: {'lr': 0.0003550744029057895, 'samples': 10668672, 'steps': 55565, 'loss/train': 2.92163348197937} -08/30/2021 23:13:05 - INFO - __main__ - Step 55567: {'lr': 0.0003550695876149399, 'samples': 10668864, 'steps': 55566, 'loss/train': 1.0279262065887451} -08/30/2021 23:13:07 - INFO - __main__ - Step 55568: {'lr': 0.00035506477227674753, 'samples': 10669056, 'steps': 55567, 'loss/train': 0.048378534615039825} -08/30/2021 23:13:07 - INFO - __main__ - Step 55569: {'lr': 0.0003550599568912147, 'samples': 10669248, 'steps': 55568, 'loss/train': 0.9692768454551697} -08/30/2021 23:13:08 - INFO - __main__ - Step 55570: {'lr': 0.00035505514145834337, 'samples': 10669440, 'steps': 55569, 'loss/train': 0.4592815041542053} -08/30/2021 23:13:08 - INFO - __main__ - Step 55571: {'lr': 0.0003550503259781359, 'samples': 10669632, 'steps': 55570, 'loss/train': 2.1162960529327393} -08/30/2021 23:13:08 - INFO - __main__ - Step 55572: {'lr': 0.0003550455104505943, 'samples': 10669824, 'steps': 55571, 'loss/train': 1.6123930215835571} -08/30/2021 23:13:09 - INFO - __main__ - Step 55573: {'lr': 0.00035504069487572086, 'samples': 10670016, 'steps': 55572, 'loss/train': 2.04437255859375} -08/30/2021 23:13:10 - INFO - __main__ - Step 55574: {'lr': 0.00035503587925351767, 'samples': 10670208, 'steps': 55573, 'loss/train': 0.9854397177696228} -08/30/2021 23:13:11 - INFO - __main__ - Step 55575: {'lr': 0.00035503106358398694, 'samples': 10670400, 'steps': 55574, 'loss/train': 1.2532223463058472} -08/30/2021 23:13:11 - INFO - __main__ - Step 55576: {'lr': 0.0003550262478671309, 'samples': 10670592, 'steps': 55575, 'loss/train': 1.0182878971099854} -08/30/2021 23:13:11 - INFO - __main__ - Step 55577: {'lr': 0.00035502143210295163, 'samples': 10670784, 'steps': 55576, 'loss/train': 1.5405141115188599} -08/30/2021 23:13:12 - INFO - __main__ - Step 55578: {'lr': 0.0003550166162914513, 'samples': 10670976, 'steps': 55577, 'loss/train': 0.820939302444458} -08/30/2021 23:13:13 - INFO - __main__ - Step 55579: {'lr': 0.00035501180043263203, 'samples': 10671168, 'steps': 55578, 'loss/train': 1.1022518873214722} -08/30/2021 23:13:14 - INFO - __main__ - Step 55580: {'lr': 0.00035500698452649613, 'samples': 10671360, 'steps': 55579, 'loss/train': 1.6348439455032349} -08/30/2021 23:13:14 - INFO - __main__ - Step 55581: {'lr': 0.00035500216857304575, 'samples': 10671552, 'steps': 55580, 'loss/train': 0.8381043076515198} -08/30/2021 23:13:14 - INFO - __main__ - Step 55582: {'lr': 0.000354997352572283, 'samples': 10671744, 'steps': 55581, 'loss/train': 0.9342495799064636} -08/30/2021 23:13:15 - INFO - __main__ - Step 55583: {'lr': 0.00035499253652421, 'samples': 10671936, 'steps': 55582, 'loss/train': 1.182405948638916} -08/30/2021 23:13:16 - INFO - __main__ - Step 55584: {'lr': 0.000354987720428829, 'samples': 10672128, 'steps': 55583, 'loss/train': 1.4739466905593872} -08/30/2021 23:13:17 - INFO - __main__ - Step 55585: {'lr': 0.00035498290428614217, 'samples': 10672320, 'steps': 55584, 'loss/train': 1.0474975109100342} -08/30/2021 23:13:17 - INFO - __main__ - Step 55586: {'lr': 0.0003549780880961516, 'samples': 10672512, 'steps': 55585, 'loss/train': 1.4440350532531738} -08/30/2021 23:13:17 - INFO - __main__ - Step 55587: {'lr': 0.00035497327185885966, 'samples': 10672704, 'steps': 55586, 'loss/train': 0.9955775737762451} -08/30/2021 23:13:18 - INFO - __main__ - Step 55588: {'lr': 0.00035496845557426824, 'samples': 10672896, 'steps': 55587, 'loss/train': 0.3096802830696106} -08/30/2021 23:13:19 - INFO - __main__ - Step 55589: {'lr': 0.0003549636392423798, 'samples': 10673088, 'steps': 55588, 'loss/train': 1.285921335220337} -08/30/2021 23:13:20 - INFO - __main__ - Step 55590: {'lr': 0.00035495882286319625, 'samples': 10673280, 'steps': 55589, 'loss/train': 1.078321933746338} -08/30/2021 23:13:20 - INFO - __main__ - Step 55591: {'lr': 0.0003549540064367199, 'samples': 10673472, 'steps': 55590, 'loss/train': 0.3283541798591614} -08/30/2021 23:13:20 - INFO - __main__ - Step 55592: {'lr': 0.0003549491899629529, 'samples': 10673664, 'steps': 55591, 'loss/train': 1.2631309032440186} -08/30/2021 23:13:21 - INFO - __main__ - Step 55593: {'lr': 0.00035494437344189746, 'samples': 10673856, 'steps': 55592, 'loss/train': 1.4361330270767212} -08/30/2021 23:13:22 - INFO - __main__ - Step 55594: {'lr': 0.0003549395568735556, 'samples': 10674048, 'steps': 55593, 'loss/train': 1.1085577011108398} -08/30/2021 23:13:23 - INFO - __main__ - Step 55595: {'lr': 0.00035493474025792966, 'samples': 10674240, 'steps': 55594, 'loss/train': 1.2822076082229614} -08/30/2021 23:13:23 - INFO - __main__ - Step 55596: {'lr': 0.0003549299235950218, 'samples': 10674432, 'steps': 55595, 'loss/train': 1.6605780124664307} -08/30/2021 23:13:23 - INFO - __main__ - Step 55597: {'lr': 0.000354925106884834, 'samples': 10674624, 'steps': 55596, 'loss/train': 0.48490074276924133} -08/30/2021 23:13:24 - INFO - __main__ - Step 55598: {'lr': 0.0003549202901273687, 'samples': 10674816, 'steps': 55597, 'loss/train': 1.458268404006958} -08/30/2021 23:13:26 - INFO - __main__ - Step 55599: {'lr': 0.00035491547332262786, 'samples': 10675008, 'steps': 55598, 'loss/train': 1.5057588815689087} -08/30/2021 23:13:26 - INFO - __main__ - Step 55600: {'lr': 0.00035491065647061377, 'samples': 10675200, 'steps': 55599, 'loss/train': 1.568816900253296} -08/30/2021 23:13:27 - INFO - __main__ - Step 55601: {'lr': 0.0003549058395713285, 'samples': 10675392, 'steps': 55600, 'loss/train': 1.5766630172729492} -08/30/2021 23:13:27 - INFO - __main__ - Step 55602: {'lr': 0.00035490102262477436, 'samples': 10675584, 'steps': 55601, 'loss/train': 1.638654112815857} -08/30/2021 23:13:27 - INFO - __main__ - Step 55603: {'lr': 0.0003548962056309534, 'samples': 10675776, 'steps': 55602, 'loss/train': 1.4436196088790894} -08/30/2021 23:13:29 - INFO - __main__ - Step 55604: {'lr': 0.0003548913885898678, 'samples': 10675968, 'steps': 55603, 'loss/train': 1.1649856567382812} -08/30/2021 23:13:29 - INFO - __main__ - Step 55605: {'lr': 0.0003548865715015198, 'samples': 10676160, 'steps': 55604, 'loss/train': 2.042722702026367} -08/30/2021 23:13:30 - INFO - __main__ - Step 55606: {'lr': 0.00035488175436591146, 'samples': 10676352, 'steps': 55605, 'loss/train': 1.488159418106079} -08/30/2021 23:13:30 - INFO - __main__ - Step 55607: {'lr': 0.00035487693718304504, 'samples': 10676544, 'steps': 55606, 'loss/train': 1.6831434965133667} -08/30/2021 23:13:30 - INFO - __main__ - Step 55608: {'lr': 0.00035487211995292276, 'samples': 10676736, 'steps': 55607, 'loss/train': 1.2747161388397217} -08/30/2021 23:13:31 - INFO - __main__ - Step 55609: {'lr': 0.00035486730267554666, 'samples': 10676928, 'steps': 55608, 'loss/train': 1.5266501903533936} -08/30/2021 23:13:32 - INFO - __main__ - Step 55610: {'lr': 0.000354862485350919, 'samples': 10677120, 'steps': 55609, 'loss/train': 0.7851687669754028} -08/30/2021 23:13:33 - INFO - __main__ - Step 55611: {'lr': 0.0003548576679790419, 'samples': 10677312, 'steps': 55610, 'loss/train': 1.3484630584716797} -08/30/2021 23:13:33 - INFO - __main__ - Step 55612: {'lr': 0.00035485285055991754, 'samples': 10677504, 'steps': 55611, 'loss/train': 0.7398014664649963} -08/30/2021 23:13:33 - INFO - __main__ - Step 55613: {'lr': 0.00035484803309354814, 'samples': 10677696, 'steps': 55612, 'loss/train': 1.5234750509262085} -08/30/2021 23:13:35 - INFO - __main__ - Step 55614: {'lr': 0.0003548432155799358, 'samples': 10677888, 'steps': 55613, 'loss/train': 1.6633076667785645} -08/30/2021 23:13:35 - INFO - __main__ - Step 55615: {'lr': 0.00035483839801908276, 'samples': 10678080, 'steps': 55614, 'loss/train': 0.8639807105064392} -08/30/2021 23:13:36 - INFO - __main__ - Step 55616: {'lr': 0.00035483358041099117, 'samples': 10678272, 'steps': 55615, 'loss/train': 1.6672723293304443} -08/30/2021 23:13:36 - INFO - __main__ - Step 55617: {'lr': 0.00035482876275566317, 'samples': 10678464, 'steps': 55616, 'loss/train': 1.2261906862258911} -08/30/2021 23:13:36 - INFO - __main__ - Step 55618: {'lr': 0.00035482394505310087, 'samples': 10678656, 'steps': 55617, 'loss/train': 0.7856540083885193} -08/30/2021 23:13:37 - INFO - __main__ - Step 55619: {'lr': 0.0003548191273033066, 'samples': 10678848, 'steps': 55618, 'loss/train': 1.6973035335540771} -08/30/2021 23:13:38 - INFO - __main__ - Step 55620: {'lr': 0.0003548143095062825, 'samples': 10679040, 'steps': 55619, 'loss/train': 1.1280386447906494} -08/30/2021 23:13:39 - INFO - __main__ - Step 55621: {'lr': 0.00035480949166203057, 'samples': 10679232, 'steps': 55620, 'loss/train': 0.9099001884460449} -08/30/2021 23:13:39 - INFO - __main__ - Step 55622: {'lr': 0.00035480467377055314, 'samples': 10679424, 'steps': 55621, 'loss/train': 1.3519760370254517} -08/30/2021 23:13:39 - INFO - __main__ - Step 55623: {'lr': 0.00035479985583185237, 'samples': 10679616, 'steps': 55622, 'loss/train': 0.9619577527046204} -08/30/2021 23:13:40 - INFO - __main__ - Step 55624: {'lr': 0.0003547950378459304, 'samples': 10679808, 'steps': 55623, 'loss/train': 1.2956039905548096} -08/30/2021 23:13:41 - INFO - __main__ - Step 55625: {'lr': 0.00035479021981278935, 'samples': 10680000, 'steps': 55624, 'loss/train': 1.389266014099121} -08/30/2021 23:13:42 - INFO - __main__ - Step 55626: {'lr': 0.0003547854017324315, 'samples': 10680192, 'steps': 55625, 'loss/train': 1.6224184036254883} -08/30/2021 23:13:42 - INFO - __main__ - Step 55627: {'lr': 0.000354780583604859, 'samples': 10680384, 'steps': 55626, 'loss/train': 0.5724973678588867} -08/30/2021 23:13:42 - INFO - __main__ - Step 55628: {'lr': 0.0003547757654300739, 'samples': 10680576, 'steps': 55627, 'loss/train': 1.5860828161239624} -08/30/2021 23:13:43 - INFO - __main__ - Step 55629: {'lr': 0.0003547709472080785, 'samples': 10680768, 'steps': 55628, 'loss/train': 1.051838755607605} -08/30/2021 23:13:44 - INFO - __main__ - Step 55630: {'lr': 0.00035476612893887494, 'samples': 10680960, 'steps': 55629, 'loss/train': 1.8453034162521362} -08/30/2021 23:13:45 - INFO - __main__ - Step 55631: {'lr': 0.0003547613106224653, 'samples': 10681152, 'steps': 55630, 'loss/train': 1.211069107055664} -08/30/2021 23:13:45 - INFO - __main__ - Step 55632: {'lr': 0.0003547564922588519, 'samples': 10681344, 'steps': 55631, 'loss/train': 1.1199408769607544} -08/30/2021 23:13:45 - INFO - __main__ - Step 55633: {'lr': 0.0003547516738480369, 'samples': 10681536, 'steps': 55632, 'loss/train': 0.511131763458252} -08/30/2021 23:13:46 - INFO - __main__ - Step 55634: {'lr': 0.0003547468553900223, 'samples': 10681728, 'steps': 55633, 'loss/train': 1.5302780866622925} -08/30/2021 23:13:47 - INFO - __main__ - Step 55635: {'lr': 0.0003547420368848104, 'samples': 10681920, 'steps': 55634, 'loss/train': 1.2150541543960571} -08/30/2021 23:13:48 - INFO - __main__ - Step 55636: {'lr': 0.0003547372183324034, 'samples': 10682112, 'steps': 55635, 'loss/train': 0.9853528141975403} -08/30/2021 23:13:48 - INFO - __main__ - Step 55637: {'lr': 0.0003547323997328034, 'samples': 10682304, 'steps': 55636, 'loss/train': 1.2307056188583374} -08/30/2021 23:13:48 - INFO - __main__ - Step 55638: {'lr': 0.0003547275810860126, 'samples': 10682496, 'steps': 55637, 'loss/train': 0.9249447584152222} -08/30/2021 23:13:49 - INFO - __main__ - Step 55639: {'lr': 0.00035472276239203315, 'samples': 10682688, 'steps': 55638, 'loss/train': 1.2306729555130005} -08/30/2021 23:13:50 - INFO - __main__ - Step 55640: {'lr': 0.00035471794365086724, 'samples': 10682880, 'steps': 55639, 'loss/train': 1.4465547800064087} -08/30/2021 23:13:51 - INFO - __main__ - Step 55641: {'lr': 0.00035471312486251707, 'samples': 10683072, 'steps': 55640, 'loss/train': 1.8672592639923096} -08/30/2021 23:13:51 - INFO - __main__ - Step 55642: {'lr': 0.0003547083060269848, 'samples': 10683264, 'steps': 55641, 'loss/train': 1.3993582725524902} -08/30/2021 23:13:52 - INFO - __main__ - Step 55643: {'lr': 0.00035470348714427256, 'samples': 10683456, 'steps': 55642, 'loss/train': 1.5673904418945312} -08/30/2021 23:13:52 - INFO - __main__ - Step 55644: {'lr': 0.0003546986682143825, 'samples': 10683648, 'steps': 55643, 'loss/train': 1.1614502668380737} -08/30/2021 23:13:52 - INFO - __main__ - Step 55645: {'lr': 0.0003546938492373169, 'samples': 10683840, 'steps': 55644, 'loss/train': 0.09984840452671051} -08/30/2021 23:13:54 - INFO - __main__ - Step 55646: {'lr': 0.0003546890302130778, 'samples': 10684032, 'steps': 55645, 'loss/train': 0.0841052308678627} -08/30/2021 23:13:54 - INFO - __main__ - Step 55647: {'lr': 0.0003546842111416675, 'samples': 10684224, 'steps': 55646, 'loss/train': 0.9936304092407227} -08/30/2021 23:13:55 - INFO - __main__ - Step 55648: {'lr': 0.0003546793920230881, 'samples': 10684416, 'steps': 55647, 'loss/train': 1.5294994115829468} -08/30/2021 23:13:55 - INFO - __main__ - Step 55649: {'lr': 0.0003546745728573418, 'samples': 10684608, 'steps': 55648, 'loss/train': 0.883396565914154} -08/30/2021 23:13:55 - INFO - __main__ - Step 55650: {'lr': 0.0003546697536444307, 'samples': 10684800, 'steps': 55649, 'loss/train': 1.0118926763534546} -08/30/2021 23:13:57 - INFO - __main__ - Step 55651: {'lr': 0.00035466493438435703, 'samples': 10684992, 'steps': 55650, 'loss/train': 0.9946087002754211} -08/30/2021 23:13:58 - INFO - __main__ - Step 55652: {'lr': 0.000354660115077123, 'samples': 10685184, 'steps': 55651, 'loss/train': 1.253925085067749} -08/30/2021 23:13:58 - INFO - __main__ - Step 55653: {'lr': 0.0003546552957227307, 'samples': 10685376, 'steps': 55652, 'loss/train': 0.864951491355896} -08/30/2021 23:13:58 - INFO - __main__ - Step 55654: {'lr': 0.0003546504763211823, 'samples': 10685568, 'steps': 55653, 'loss/train': 0.3088420033454895} -08/30/2021 23:13:59 - INFO - __main__ - Step 55655: {'lr': 0.0003546456568724801, 'samples': 10685760, 'steps': 55654, 'loss/train': 1.0639262199401855} -08/30/2021 23:13:59 - INFO - __main__ - Step 55656: {'lr': 0.0003546408373766262, 'samples': 10685952, 'steps': 55655, 'loss/train': 0.39806151390075684} -08/30/2021 23:14:01 - INFO - __main__ - Step 55657: {'lr': 0.0003546360178336226, 'samples': 10686144, 'steps': 55656, 'loss/train': 0.05974964052438736} -08/30/2021 23:14:02 - INFO - __main__ - Step 55658: {'lr': 0.0003546311982434717, 'samples': 10686336, 'steps': 55657, 'loss/train': 1.8015832901000977} -08/30/2021 23:14:02 - INFO - __main__ - Step 55659: {'lr': 0.00035462637860617563, 'samples': 10686528, 'steps': 55658, 'loss/train': 0.8492950797080994} -08/30/2021 23:14:02 - INFO - __main__ - Step 55660: {'lr': 0.00035462155892173654, 'samples': 10686720, 'steps': 55659, 'loss/train': 1.9669959545135498} -08/30/2021 23:14:03 - INFO - __main__ - Step 55661: {'lr': 0.0003546167391901566, 'samples': 10686912, 'steps': 55660, 'loss/train': 0.8186646699905396} -08/30/2021 23:14:04 - INFO - __main__ - Step 55662: {'lr': 0.0003546119194114379, 'samples': 10687104, 'steps': 55661, 'loss/train': 1.4092613458633423} -08/30/2021 23:14:05 - INFO - __main__ - Step 55663: {'lr': 0.00035460709958558273, 'samples': 10687296, 'steps': 55662, 'loss/train': 1.1991801261901855} -08/30/2021 23:14:05 - INFO - __main__ - Step 55664: {'lr': 0.0003546022797125932, 'samples': 10687488, 'steps': 55663, 'loss/train': 1.2259601354599} -08/30/2021 23:14:05 - INFO - __main__ - Step 55665: {'lr': 0.00035459745979247146, 'samples': 10687680, 'steps': 55664, 'loss/train': 1.7016760110855103} -08/30/2021 23:14:06 - INFO - __main__ - Step 55666: {'lr': 0.00035459263982521975, 'samples': 10687872, 'steps': 55665, 'loss/train': 0.9808220863342285} -08/30/2021 23:14:07 - INFO - __main__ - Step 55667: {'lr': 0.00035458781981084026, 'samples': 10688064, 'steps': 55666, 'loss/train': 1.1275321245193481} -08/30/2021 23:14:08 - INFO - __main__ - Step 55668: {'lr': 0.00035458299974933506, 'samples': 10688256, 'steps': 55667, 'loss/train': 1.314697265625} -08/30/2021 23:14:08 - INFO - __main__ - Step 55669: {'lr': 0.00035457817964070637, 'samples': 10688448, 'steps': 55668, 'loss/train': 1.503603219985962} -08/30/2021 23:14:09 - INFO - __main__ - Step 55670: {'lr': 0.0003545733594849564, 'samples': 10688640, 'steps': 55669, 'loss/train': 1.1797946691513062} -08/30/2021 23:14:09 - INFO - __main__ - Step 55671: {'lr': 0.0003545685392820873, 'samples': 10688832, 'steps': 55670, 'loss/train': 1.623259425163269} -08/30/2021 23:14:10 - INFO - __main__ - Step 55672: {'lr': 0.0003545637190321012, 'samples': 10689024, 'steps': 55671, 'loss/train': 1.3980627059936523} -08/30/2021 23:14:11 - INFO - __main__ - Step 55673: {'lr': 0.00035455889873500026, 'samples': 10689216, 'steps': 55672, 'loss/train': 1.5831059217453003} -08/30/2021 23:14:11 - INFO - __main__ - Step 55674: {'lr': 0.00035455407839078673, 'samples': 10689408, 'steps': 55673, 'loss/train': 1.4477463960647583} -08/30/2021 23:14:12 - INFO - __main__ - Step 55675: {'lr': 0.00035454925799946273, 'samples': 10689600, 'steps': 55674, 'loss/train': 1.7354828119277954} -08/30/2021 23:14:12 - INFO - __main__ - Step 55676: {'lr': 0.0003545444375610306, 'samples': 10689792, 'steps': 55675, 'loss/train': 1.2588073015213013} -08/30/2021 23:14:12 - INFO - __main__ - Step 55677: {'lr': 0.0003545396170754922, 'samples': 10689984, 'steps': 55676, 'loss/train': 1.2677406072616577} -08/30/2021 23:14:14 - INFO - __main__ - Step 55678: {'lr': 0.0003545347965428498, 'samples': 10690176, 'steps': 55677, 'loss/train': 1.289686918258667} -08/30/2021 23:14:15 - INFO - __main__ - Step 55679: {'lr': 0.00035452997596310576, 'samples': 10690368, 'steps': 55678, 'loss/train': 0.6954678893089294} -08/30/2021 23:14:15 - INFO - __main__ - Step 55680: {'lr': 0.00035452515533626204, 'samples': 10690560, 'steps': 55679, 'loss/train': 1.1525535583496094} -08/30/2021 23:14:15 - INFO - __main__ - Step 55681: {'lr': 0.00035452033466232095, 'samples': 10690752, 'steps': 55680, 'loss/train': 1.5572208166122437} -08/30/2021 23:14:16 - INFO - __main__ - Step 55682: {'lr': 0.0003545155139412847, 'samples': 10690944, 'steps': 55681, 'loss/train': 0.6655292510986328} -08/30/2021 23:14:17 - INFO - __main__ - Step 55683: {'lr': 0.00035451069317315526, 'samples': 10691136, 'steps': 55682, 'loss/train': 1.54902982711792} -08/30/2021 23:14:18 - INFO - __main__ - Step 55684: {'lr': 0.00035450587235793493, 'samples': 10691328, 'steps': 55683, 'loss/train': 1.3780467510223389} -08/30/2021 23:14:18 - INFO - __main__ - Step 55685: {'lr': 0.0003545010514956258, 'samples': 10691520, 'steps': 55684, 'loss/train': 1.3956325054168701} -08/30/2021 23:14:18 - INFO - __main__ - Step 55686: {'lr': 0.0003544962305862302, 'samples': 10691712, 'steps': 55685, 'loss/train': 2.8110406398773193} -08/30/2021 23:14:19 - INFO - __main__ - Step 55687: {'lr': 0.0003544914096297502, 'samples': 10691904, 'steps': 55686, 'loss/train': 1.5897676944732666} -08/30/2021 23:14:20 - INFO - __main__ - Step 55688: {'lr': 0.000354486588626188, 'samples': 10692096, 'steps': 55687, 'loss/train': 1.5517693758010864} -08/30/2021 23:14:21 - INFO - __main__ - Step 55689: {'lr': 0.00035448176757554574, 'samples': 10692288, 'steps': 55688, 'loss/train': 1.3772660493850708} -08/30/2021 23:14:21 - INFO - __main__ - Step 55690: {'lr': 0.0003544769464778256, 'samples': 10692480, 'steps': 55689, 'loss/train': 0.22232332825660706} -08/30/2021 23:14:21 - INFO - __main__ - Step 55691: {'lr': 0.00035447212533302975, 'samples': 10692672, 'steps': 55690, 'loss/train': 1.047350525856018} -08/30/2021 23:14:22 - INFO - __main__ - Step 55692: {'lr': 0.00035446730414116036, 'samples': 10692864, 'steps': 55691, 'loss/train': 1.302718162536621} -08/30/2021 23:14:23 - INFO - __main__ - Step 55693: {'lr': 0.00035446248290221967, 'samples': 10693056, 'steps': 55692, 'loss/train': 1.6574903726577759} -08/30/2021 23:14:24 - INFO - __main__ - Step 55694: {'lr': 0.00035445766161620976, 'samples': 10693248, 'steps': 55693, 'loss/train': 1.5358338356018066} -08/30/2021 23:14:24 - INFO - __main__ - Step 55695: {'lr': 0.00035445284028313284, 'samples': 10693440, 'steps': 55694, 'loss/train': 2.3100669384002686} -08/30/2021 23:14:24 - INFO - __main__ - Step 55696: {'lr': 0.00035444801890299103, 'samples': 10693632, 'steps': 55695, 'loss/train': 1.6347917318344116} -08/30/2021 23:14:25 - INFO - __main__ - Step 55697: {'lr': 0.0003544431974757866, 'samples': 10693824, 'steps': 55696, 'loss/train': 0.661130964756012} -08/30/2021 23:14:26 - INFO - __main__ - Step 55698: {'lr': 0.00035443837600152174, 'samples': 10694016, 'steps': 55697, 'loss/train': 1.2135374546051025} -08/30/2021 23:14:26 - INFO - __main__ - Step 55699: {'lr': 0.00035443355448019854, 'samples': 10694208, 'steps': 55698, 'loss/train': 1.3254491090774536} -08/30/2021 23:14:27 - INFO - __main__ - Step 55700: {'lr': 0.0003544287329118191, 'samples': 10694400, 'steps': 55699, 'loss/train': 1.1920199394226074} -08/30/2021 23:14:27 - INFO - __main__ - Step 55701: {'lr': 0.0003544239112963857, 'samples': 10694592, 'steps': 55700, 'loss/train': 1.1277209520339966} -08/30/2021 23:14:27 - INFO - __main__ - Step 55702: {'lr': 0.0003544190896339006, 'samples': 10694784, 'steps': 55701, 'loss/train': 0.9427372217178345} -08/30/2021 23:14:28 - INFO - __main__ - Step 55703: {'lr': 0.00035441426792436574, 'samples': 10694976, 'steps': 55702, 'loss/train': 0.8381898403167725} -08/30/2021 23:14:30 - INFO - __main__ - Step 55704: {'lr': 0.0003544094461677836, 'samples': 10695168, 'steps': 55703, 'loss/train': 0.9238675236701965} -08/30/2021 23:14:30 - INFO - __main__ - Step 55705: {'lr': 0.000354404624364156, 'samples': 10695360, 'steps': 55704, 'loss/train': 0.638308584690094} -08/30/2021 23:14:31 - INFO - __main__ - Step 55706: {'lr': 0.00035439980251348533, 'samples': 10695552, 'steps': 55705, 'loss/train': 1.2406498193740845} -08/30/2021 23:14:31 - INFO - __main__ - Step 55707: {'lr': 0.0003543949806157738, 'samples': 10695744, 'steps': 55706, 'loss/train': 0.041314493864774704} -08/30/2021 23:14:31 - INFO - __main__ - Step 55708: {'lr': 0.0003543901586710234, 'samples': 10695936, 'steps': 55707, 'loss/train': 1.1343141794204712} -08/30/2021 23:14:33 - INFO - __main__ - Step 55709: {'lr': 0.00035438533667923644, 'samples': 10696128, 'steps': 55708, 'loss/train': 0.538677990436554} -08/30/2021 23:14:33 - INFO - __main__ - Step 55710: {'lr': 0.0003543805146404151, 'samples': 10696320, 'steps': 55709, 'loss/train': 1.5439282655715942} -08/30/2021 23:14:34 - INFO - __main__ - Step 55711: {'lr': 0.0003543756925545615, 'samples': 10696512, 'steps': 55710, 'loss/train': 1.7141923904418945} -08/30/2021 23:14:34 - INFO - __main__ - Step 55712: {'lr': 0.0003543708704216778, 'samples': 10696704, 'steps': 55711, 'loss/train': 1.2219743728637695} -08/30/2021 23:14:34 - INFO - __main__ - Step 55713: {'lr': 0.00035436604824176616, 'samples': 10696896, 'steps': 55712, 'loss/train': 0.8718641400337219} -08/30/2021 23:14:36 - INFO - __main__ - Step 55714: {'lr': 0.0003543612260148288, 'samples': 10697088, 'steps': 55713, 'loss/train': 1.0926668643951416} -08/30/2021 23:14:37 - INFO - __main__ - Step 55715: {'lr': 0.0003543564037408679, 'samples': 10697280, 'steps': 55714, 'loss/train': 1.4930851459503174} -08/30/2021 23:14:37 - INFO - __main__ - Step 55716: {'lr': 0.00035435158141988564, 'samples': 10697472, 'steps': 55715, 'loss/train': 0.6779083609580994} -08/30/2021 23:14:37 - INFO - __main__ - Step 55717: {'lr': 0.0003543467590518842, 'samples': 10697664, 'steps': 55716, 'loss/train': 1.1186442375183105} -08/30/2021 23:14:38 - INFO - __main__ - Step 55718: {'lr': 0.00035434193663686566, 'samples': 10697856, 'steps': 55717, 'loss/train': 0.6522392630577087} -08/30/2021 23:14:39 - INFO - __main__ - Step 55719: {'lr': 0.0003543371141748323, 'samples': 10698048, 'steps': 55718, 'loss/train': 1.231892704963684} -08/30/2021 23:14:40 - INFO - __main__ - Step 55720: {'lr': 0.0003543322916657862, 'samples': 10698240, 'steps': 55719, 'loss/train': 1.8002524375915527} -08/30/2021 23:14:40 - INFO - __main__ - Step 55721: {'lr': 0.0003543274691097295, 'samples': 10698432, 'steps': 55720, 'loss/train': 0.7160958647727966} -08/30/2021 23:14:41 - INFO - __main__ - Step 55722: {'lr': 0.00035432264650666457, 'samples': 10698624, 'steps': 55721, 'loss/train': 1.4103093147277832} -08/30/2021 23:14:41 - INFO - __main__ - Step 55723: {'lr': 0.0003543178238565935, 'samples': 10698816, 'steps': 55722, 'loss/train': 1.3467888832092285} -08/30/2021 23:14:43 - INFO - __main__ - Step 55724: {'lr': 0.0003543130011595183, 'samples': 10699008, 'steps': 55723, 'loss/train': 1.4478784799575806} -08/30/2021 23:14:43 - INFO - __main__ - Step 55725: {'lr': 0.0003543081784154414, 'samples': 10699200, 'steps': 55724, 'loss/train': 1.8630198240280151} -08/30/2021 23:14:43 - INFO - __main__ - Step 55726: {'lr': 0.00035430335562436474, 'samples': 10699392, 'steps': 55725, 'loss/train': 0.8415594100952148} -08/30/2021 23:14:44 - INFO - __main__ - Step 55727: {'lr': 0.00035429853278629063, 'samples': 10699584, 'steps': 55726, 'loss/train': 0.14067301154136658} -08/30/2021 23:14:44 - INFO - __main__ - Step 55728: {'lr': 0.00035429370990122124, 'samples': 10699776, 'steps': 55727, 'loss/train': 1.494025707244873} -08/30/2021 23:14:46 - INFO - __main__ - Step 55729: {'lr': 0.0003542888869691586, 'samples': 10699968, 'steps': 55728, 'loss/train': 1.278326153755188} -08/30/2021 23:14:46 - INFO - __main__ - Step 55730: {'lr': 0.00035428406399010516, 'samples': 10700160, 'steps': 55729, 'loss/train': 0.7158213257789612} -08/30/2021 23:14:46 - INFO - __main__ - Step 55731: {'lr': 0.00035427924096406287, 'samples': 10700352, 'steps': 55730, 'loss/train': 2.846364736557007} -08/30/2021 23:14:47 - INFO - __main__ - Step 55732: {'lr': 0.00035427441789103397, 'samples': 10700544, 'steps': 55731, 'loss/train': 0.8122023344039917} -08/30/2021 23:14:47 - INFO - __main__ - Step 55733: {'lr': 0.0003542695947710206, 'samples': 10700736, 'steps': 55732, 'loss/train': 1.566859483718872} -08/30/2021 23:14:47 - INFO - __main__ - Step 55734: {'lr': 0.00035426477160402495, 'samples': 10700928, 'steps': 55733, 'loss/train': 1.5851231813430786} -08/30/2021 23:14:49 - INFO - __main__ - Step 55735: {'lr': 0.0003542599483900492, 'samples': 10701120, 'steps': 55734, 'loss/train': 1.6320836544036865} -08/30/2021 23:14:49 - INFO - __main__ - Step 55736: {'lr': 0.00035425512512909555, 'samples': 10701312, 'steps': 55735, 'loss/train': 1.3067712783813477} -08/30/2021 23:14:50 - INFO - __main__ - Step 55737: {'lr': 0.00035425030182116617, 'samples': 10701504, 'steps': 55736, 'loss/train': 1.2268667221069336} -08/30/2021 23:14:50 - INFO - __main__ - Step 55738: {'lr': 0.0003542454784662632, 'samples': 10701696, 'steps': 55737, 'loss/train': 1.8341413736343384} -08/30/2021 23:14:50 - INFO - __main__ - Step 55739: {'lr': 0.00035424065506438877, 'samples': 10701888, 'steps': 55738, 'loss/train': 0.8880284428596497} -08/30/2021 23:14:52 - INFO - __main__ - Step 55740: {'lr': 0.0003542358316155452, 'samples': 10702080, 'steps': 55739, 'loss/train': 1.4299170970916748} -08/30/2021 23:14:53 - INFO - __main__ - Step 55741: {'lr': 0.00035423100811973453, 'samples': 10702272, 'steps': 55740, 'loss/train': 1.304391622543335} -08/30/2021 23:14:53 - INFO - __main__ - Step 55742: {'lr': 0.00035422618457695893, 'samples': 10702464, 'steps': 55741, 'loss/train': 1.3320468664169312} -08/30/2021 23:14:54 - INFO - __main__ - Step 55743: {'lr': 0.0003542213609872207, 'samples': 10702656, 'steps': 55742, 'loss/train': 1.636850118637085} -08/30/2021 23:14:54 - INFO - __main__ - Step 55744: {'lr': 0.0003542165373505219, 'samples': 10702848, 'steps': 55743, 'loss/train': 1.6292940378189087} -08/30/2021 23:14:55 - INFO - __main__ - Step 55745: {'lr': 0.0003542117136668647, 'samples': 10703040, 'steps': 55744, 'loss/train': 0.8332457542419434} -08/30/2021 23:14:55 - INFO - __main__ - Step 55746: {'lr': 0.0003542068899362514, 'samples': 10703232, 'steps': 55745, 'loss/train': 1.1777420043945312} -08/30/2021 23:14:57 - INFO - __main__ - Step 55747: {'lr': 0.000354202066158684, 'samples': 10703424, 'steps': 55746, 'loss/train': 1.5863596200942993} -08/30/2021 23:14:57 - INFO - __main__ - Step 55748: {'lr': 0.0003541972423341648, 'samples': 10703616, 'steps': 55747, 'loss/train': 1.2048829793930054} -08/30/2021 23:14:57 - INFO - __main__ - Step 55749: {'lr': 0.0003541924184626959, 'samples': 10703808, 'steps': 55748, 'loss/train': 1.4137334823608398} -08/30/2021 23:14:58 - INFO - __main__ - Step 55750: {'lr': 0.00035418759454427953, 'samples': 10704000, 'steps': 55749, 'loss/train': 1.1200039386749268} -08/30/2021 23:14:58 - INFO - __main__ - Step 55751: {'lr': 0.00035418277057891776, 'samples': 10704192, 'steps': 55750, 'loss/train': 0.7291431427001953} -08/30/2021 23:15:00 - INFO - __main__ - Step 55752: {'lr': 0.00035417794656661297, 'samples': 10704384, 'steps': 55751, 'loss/train': 1.0747979879379272} -08/30/2021 23:15:00 - INFO - __main__ - Step 55753: {'lr': 0.0003541731225073671, 'samples': 10704576, 'steps': 55752, 'loss/train': 1.8460533618927002} -08/30/2021 23:15:00 - INFO - __main__ - Step 55754: {'lr': 0.0003541682984011825, 'samples': 10704768, 'steps': 55753, 'loss/train': 0.9102686047554016} -08/30/2021 23:15:01 - INFO - __main__ - Step 55755: {'lr': 0.00035416347424806124, 'samples': 10704960, 'steps': 55754, 'loss/train': 1.715810775756836} -08/30/2021 23:15:01 - INFO - __main__ - Step 55756: {'lr': 0.00035415865004800553, 'samples': 10705152, 'steps': 55755, 'loss/train': 1.778009295463562} -08/30/2021 23:15:03 - INFO - __main__ - Step 55757: {'lr': 0.00035415382580101753, 'samples': 10705344, 'steps': 55756, 'loss/train': 2.1117496490478516} -08/30/2021 23:15:03 - INFO - __main__ - Step 55758: {'lr': 0.00035414900150709946, 'samples': 10705536, 'steps': 55757, 'loss/train': 1.0899864435195923} -08/30/2021 23:15:03 - INFO - __main__ - Step 55759: {'lr': 0.00035414417716625343, 'samples': 10705728, 'steps': 55758, 'loss/train': 1.1682169437408447} -08/30/2021 23:15:04 - INFO - __main__ - Step 55760: {'lr': 0.00035413935277848156, 'samples': 10705920, 'steps': 55759, 'loss/train': 0.08942674845457077} -08/30/2021 23:15:04 - INFO - __main__ - Step 55761: {'lr': 0.00035413452834378624, 'samples': 10706112, 'steps': 55760, 'loss/train': 1.2167680263519287} -08/30/2021 23:15:06 - INFO - __main__ - Step 55762: {'lr': 0.0003541297038621694, 'samples': 10706304, 'steps': 55761, 'loss/train': 1.4061381816864014} -08/30/2021 23:15:07 - INFO - __main__ - Step 55763: {'lr': 0.00035412487933363335, 'samples': 10706496, 'steps': 55762, 'loss/train': 1.9082527160644531} -08/30/2021 23:15:07 - INFO - __main__ - Step 55764: {'lr': 0.00035412005475818033, 'samples': 10706688, 'steps': 55763, 'loss/train': 1.1674234867095947} -08/30/2021 23:15:07 - INFO - __main__ - Step 55765: {'lr': 0.0003541152301358124, 'samples': 10706880, 'steps': 55764, 'loss/train': 1.508541226387024} -08/30/2021 23:15:08 - INFO - __main__ - Step 55766: {'lr': 0.0003541104054665316, 'samples': 10707072, 'steps': 55765, 'loss/train': 1.5136747360229492} -08/30/2021 23:15:09 - INFO - __main__ - Step 55767: {'lr': 0.0003541055807503404, 'samples': 10707264, 'steps': 55766, 'loss/train': 1.5840827226638794} -08/30/2021 23:15:10 - INFO - __main__ - Step 55768: {'lr': 0.0003541007559872408, 'samples': 10707456, 'steps': 55767, 'loss/train': 1.5111762285232544} -08/30/2021 23:15:10 - INFO - __main__ - Step 55769: {'lr': 0.000354095931177235, 'samples': 10707648, 'steps': 55768, 'loss/train': 1.3580626249313354} -08/30/2021 23:15:10 - INFO - __main__ - Step 55770: {'lr': 0.0003540911063203252, 'samples': 10707840, 'steps': 55769, 'loss/train': 1.2443751096725464} -08/30/2021 23:15:11 - INFO - __main__ - Step 55771: {'lr': 0.00035408628141651356, 'samples': 10708032, 'steps': 55770, 'loss/train': 0.5195919275283813} -08/30/2021 23:15:12 - INFO - __main__ - Step 55772: {'lr': 0.0003540814564658022, 'samples': 10708224, 'steps': 55771, 'loss/train': 0.8362556099891663} -08/30/2021 23:15:13 - INFO - __main__ - Step 55773: {'lr': 0.00035407663146819337, 'samples': 10708416, 'steps': 55772, 'loss/train': 1.8281182050704956} -08/30/2021 23:15:13 - INFO - __main__ - Step 55774: {'lr': 0.0003540718064236892, 'samples': 10708608, 'steps': 55773, 'loss/train': 0.7100035548210144} -08/30/2021 23:15:14 - INFO - __main__ - Step 55775: {'lr': 0.0003540669813322919, 'samples': 10708800, 'steps': 55774, 'loss/train': 1.6116893291473389} -08/30/2021 23:15:14 - INFO - __main__ - Step 55776: {'lr': 0.00035406215619400357, 'samples': 10708992, 'steps': 55775, 'loss/train': 0.6807646751403809} -08/30/2021 23:15:15 - INFO - __main__ - Step 55777: {'lr': 0.00035405733100882654, 'samples': 10709184, 'steps': 55776, 'loss/train': 1.3845784664154053} -08/30/2021 23:15:16 - INFO - __main__ - Step 55778: {'lr': 0.0003540525057767628, 'samples': 10709376, 'steps': 55777, 'loss/train': 1.4464852809906006} -08/30/2021 23:15:16 - INFO - __main__ - Step 55779: {'lr': 0.0003540476804978146, 'samples': 10709568, 'steps': 55778, 'loss/train': 1.1956968307495117} -08/30/2021 23:15:17 - INFO - __main__ - Step 55780: {'lr': 0.00035404285517198417, 'samples': 10709760, 'steps': 55779, 'loss/train': 1.3396869897842407} -08/30/2021 23:15:17 - INFO - __main__ - Step 55781: {'lr': 0.00035403802979927355, 'samples': 10709952, 'steps': 55780, 'loss/train': 2.1580255031585693} -08/30/2021 23:15:17 - INFO - __main__ - Step 55782: {'lr': 0.0003540332043796851, 'samples': 10710144, 'steps': 55781, 'loss/train': 1.0538784265518188} -08/30/2021 23:15:19 - INFO - __main__ - Step 55783: {'lr': 0.00035402837891322083, 'samples': 10710336, 'steps': 55782, 'loss/train': 1.8561463356018066} -08/30/2021 23:15:19 - INFO - __main__ - Step 55784: {'lr': 0.00035402355339988307, 'samples': 10710528, 'steps': 55783, 'loss/train': 1.161104679107666} -08/30/2021 23:15:19 - INFO - __main__ - Step 55785: {'lr': 0.00035401872783967384, 'samples': 10710720, 'steps': 55784, 'loss/train': 1.2689498662948608} -08/30/2021 23:15:20 - INFO - __main__ - Step 55786: {'lr': 0.00035401390223259536, 'samples': 10710912, 'steps': 55785, 'loss/train': 1.2551660537719727} -08/30/2021 23:15:20 - INFO - __main__ - Step 55787: {'lr': 0.0003540090765786498, 'samples': 10711104, 'steps': 55786, 'loss/train': 0.769989550113678} -08/30/2021 23:15:22 - INFO - __main__ - Step 55788: {'lr': 0.0003540042508778394, 'samples': 10711296, 'steps': 55787, 'loss/train': 0.9293236136436462} -08/30/2021 23:15:23 - INFO - __main__ - Step 55789: {'lr': 0.00035399942513016623, 'samples': 10711488, 'steps': 55788, 'loss/train': 0.7601248025894165} -08/30/2021 23:15:23 - INFO - __main__ - Step 55790: {'lr': 0.0003539945993356326, 'samples': 10711680, 'steps': 55789, 'loss/train': 1.398922085762024} -08/30/2021 23:15:23 - INFO - __main__ - Step 55791: {'lr': 0.0003539897734942406, 'samples': 10711872, 'steps': 55790, 'loss/train': 1.108388066291809} -08/30/2021 23:15:24 - INFO - __main__ - Step 55792: {'lr': 0.00035398494760599243, 'samples': 10712064, 'steps': 55791, 'loss/train': 1.6827489137649536} -08/30/2021 23:15:24 - INFO - __main__ - Step 55793: {'lr': 0.00035398012167089016, 'samples': 10712256, 'steps': 55792, 'loss/train': 2.2388172149658203} -08/30/2021 23:15:25 - INFO - __main__ - Step 55794: {'lr': 0.0003539752956889361, 'samples': 10712448, 'steps': 55793, 'loss/train': 1.8627614974975586} -08/30/2021 23:15:26 - INFO - __main__ - Step 55795: {'lr': 0.00035397046966013235, 'samples': 10712640, 'steps': 55794, 'loss/train': 0.41283100843429565} -08/30/2021 23:15:26 - INFO - __main__ - Step 55796: {'lr': 0.00035396564358448115, 'samples': 10712832, 'steps': 55795, 'loss/train': 1.7279332876205444} -08/30/2021 23:15:27 - INFO - __main__ - Step 55797: {'lr': 0.00035396081746198467, 'samples': 10713024, 'steps': 55796, 'loss/train': 1.4764454364776611} -08/30/2021 23:15:27 - INFO - __main__ - Step 55798: {'lr': 0.000353955991292645, 'samples': 10713216, 'steps': 55797, 'loss/train': 1.5802695751190186} -08/30/2021 23:15:29 - INFO - __main__ - Step 55799: {'lr': 0.00035395116507646435, 'samples': 10713408, 'steps': 55798, 'loss/train': 1.715330958366394} -08/30/2021 23:15:29 - INFO - __main__ - Step 55800: {'lr': 0.00035394633881344497, 'samples': 10713600, 'steps': 55799, 'loss/train': 0.9424576163291931} -08/30/2021 23:15:29 - INFO - __main__ - Step 55801: {'lr': 0.00035394151250358886, 'samples': 10713792, 'steps': 55800, 'loss/train': 1.2360484600067139} -08/30/2021 23:15:30 - INFO - __main__ - Step 55802: {'lr': 0.00035393668614689837, 'samples': 10713984, 'steps': 55801, 'loss/train': 1.7449965476989746} -08/30/2021 23:15:30 - INFO - __main__ - Step 55803: {'lr': 0.00035393185974337565, 'samples': 10714176, 'steps': 55802, 'loss/train': 1.1759607791900635} -08/30/2021 23:15:32 - INFO - __main__ - Step 55804: {'lr': 0.0003539270332930228, 'samples': 10714368, 'steps': 55803, 'loss/train': 1.5261110067367554} -08/30/2021 23:15:32 - INFO - __main__ - Step 55805: {'lr': 0.00035392220679584206, 'samples': 10714560, 'steps': 55804, 'loss/train': 1.4128800630569458} -08/30/2021 23:15:32 - INFO - __main__ - Step 55806: {'lr': 0.0003539173802518356, 'samples': 10714752, 'steps': 55805, 'loss/train': 1.658766508102417} -08/30/2021 23:15:33 - INFO - __main__ - Step 55807: {'lr': 0.0003539125536610055, 'samples': 10714944, 'steps': 55806, 'loss/train': 1.805196762084961} -08/30/2021 23:15:33 - INFO - __main__ - Step 55808: {'lr': 0.00035390772702335405, 'samples': 10715136, 'steps': 55807, 'loss/train': 1.1509133577346802} -08/30/2021 23:15:35 - INFO - __main__ - Step 55809: {'lr': 0.0003539029003388833, 'samples': 10715328, 'steps': 55808, 'loss/train': 1.3984332084655762} -08/30/2021 23:15:35 - INFO - __main__ - Step 55810: {'lr': 0.0003538980736075956, 'samples': 10715520, 'steps': 55809, 'loss/train': 0.8859710693359375} -08/30/2021 23:15:35 - INFO - __main__ - Step 55811: {'lr': 0.0003538932468294931, 'samples': 10715712, 'steps': 55810, 'loss/train': 0.07919716089963913} -08/30/2021 23:15:36 - INFO - __main__ - Step 55812: {'lr': 0.0003538884200045778, 'samples': 10715904, 'steps': 55811, 'loss/train': 1.267533779144287} -08/30/2021 23:15:36 - INFO - __main__ - Step 55813: {'lr': 0.00035388359313285196, 'samples': 10716096, 'steps': 55812, 'loss/train': 1.0388505458831787} -08/30/2021 23:15:38 - INFO - __main__ - Step 55814: {'lr': 0.0003538787662143178, 'samples': 10716288, 'steps': 55813, 'loss/train': 1.569204568862915} -08/30/2021 23:15:38 - INFO - __main__ - Step 55815: {'lr': 0.00035387393924897747, 'samples': 10716480, 'steps': 55814, 'loss/train': 1.1774855852127075} -08/30/2021 23:15:38 - INFO - __main__ - Step 55816: {'lr': 0.0003538691122368332, 'samples': 10716672, 'steps': 55815, 'loss/train': 2.1934115886688232} -08/30/2021 23:15:39 - INFO - __main__ - Step 55817: {'lr': 0.00035386428517788707, 'samples': 10716864, 'steps': 55816, 'loss/train': 1.1093050241470337} -08/30/2021 23:15:39 - INFO - __main__ - Step 55818: {'lr': 0.00035385945807214124, 'samples': 10717056, 'steps': 55817, 'loss/train': 1.2497345209121704} -08/30/2021 23:15:39 - INFO - __main__ - Step 55819: {'lr': 0.000353854630919598, 'samples': 10717248, 'steps': 55818, 'loss/train': 1.3594471216201782} -08/30/2021 23:15:41 - INFO - __main__ - Step 55820: {'lr': 0.0003538498037202595, 'samples': 10717440, 'steps': 55819, 'loss/train': 0.9753965139389038} -08/30/2021 23:15:42 - INFO - __main__ - Step 55821: {'lr': 0.0003538449764741278, 'samples': 10717632, 'steps': 55820, 'loss/train': 1.3397353887557983} -08/30/2021 23:15:42 - INFO - __main__ - Step 55822: {'lr': 0.00035384014918120527, 'samples': 10717824, 'steps': 55821, 'loss/train': 1.1480140686035156} -08/30/2021 23:15:42 - INFO - __main__ - Step 55823: {'lr': 0.00035383532184149393, 'samples': 10718016, 'steps': 55822, 'loss/train': 0.8578100204467773} -08/30/2021 23:15:43 - INFO - __main__ - Step 55824: {'lr': 0.00035383049445499596, 'samples': 10718208, 'steps': 55823, 'loss/train': 0.9850677847862244} -08/30/2021 23:15:44 - INFO - __main__ - Step 55825: {'lr': 0.0003538256670217135, 'samples': 10718400, 'steps': 55824, 'loss/train': 0.15087755024433136} -08/30/2021 23:15:45 - INFO - __main__ - Step 55826: {'lr': 0.0003538208395416489, 'samples': 10718592, 'steps': 55825, 'loss/train': 1.3199774026870728} -08/30/2021 23:15:45 - INFO - __main__ - Step 55827: {'lr': 0.00035381601201480426, 'samples': 10718784, 'steps': 55826, 'loss/train': 1.394762635231018} -08/30/2021 23:15:45 - INFO - __main__ - Step 55828: {'lr': 0.00035381118444118167, 'samples': 10718976, 'steps': 55827, 'loss/train': 0.9617253541946411} -08/30/2021 23:15:46 - INFO - __main__ - Step 55829: {'lr': 0.00035380635682078334, 'samples': 10719168, 'steps': 55828, 'loss/train': 1.202509880065918} -08/30/2021 23:15:47 - INFO - __main__ - Step 55830: {'lr': 0.00035380152915361144, 'samples': 10719360, 'steps': 55829, 'loss/train': 1.505242109298706} -08/30/2021 23:15:48 - INFO - __main__ - Step 55831: {'lr': 0.00035379670143966826, 'samples': 10719552, 'steps': 55830, 'loss/train': 1.1661467552185059} -08/30/2021 23:15:48 - INFO - __main__ - Step 55832: {'lr': 0.00035379187367895584, 'samples': 10719744, 'steps': 55831, 'loss/train': 1.1387711763381958} -08/30/2021 23:15:48 - INFO - __main__ - Step 55833: {'lr': 0.0003537870458714765, 'samples': 10719936, 'steps': 55832, 'loss/train': 1.4760973453521729} -08/30/2021 23:15:49 - INFO - __main__ - Step 55834: {'lr': 0.0003537822180172322, 'samples': 10720128, 'steps': 55833, 'loss/train': 2.007533073425293} -08/30/2021 23:15:50 - INFO - __main__ - Step 55835: {'lr': 0.00035377739011622524, 'samples': 10720320, 'steps': 55834, 'loss/train': 1.4700040817260742} -08/30/2021 23:15:51 - INFO - __main__ - Step 55836: {'lr': 0.0003537725621684578, 'samples': 10720512, 'steps': 55835, 'loss/train': 0.4767780900001526} -08/30/2021 23:15:51 - INFO - __main__ - Step 55837: {'lr': 0.0003537677341739321, 'samples': 10720704, 'steps': 55836, 'loss/train': 0.8098054528236389} -08/30/2021 23:15:51 - INFO - __main__ - Step 55838: {'lr': 0.0003537629061326503, 'samples': 10720896, 'steps': 55837, 'loss/train': 1.8151724338531494} -08/30/2021 23:15:52 - INFO - __main__ - Step 55839: {'lr': 0.0003537580780446144, 'samples': 10721088, 'steps': 55838, 'loss/train': 1.3703428506851196} -08/30/2021 23:15:53 - INFO - __main__ - Step 55840: {'lr': 0.0003537532499098268, 'samples': 10721280, 'steps': 55839, 'loss/train': 1.0196481943130493} -08/30/2021 23:15:54 - INFO - __main__ - Step 55841: {'lr': 0.0003537484217282895, 'samples': 10721472, 'steps': 55840, 'loss/train': 1.4531360864639282} -08/30/2021 23:15:54 - INFO - __main__ - Step 55842: {'lr': 0.00035374359350000484, 'samples': 10721664, 'steps': 55841, 'loss/train': 1.2399746179580688} -08/30/2021 23:15:54 - INFO - __main__ - Step 55843: {'lr': 0.0003537387652249749, 'samples': 10721856, 'steps': 55842, 'loss/train': 0.21520744264125824} -08/30/2021 23:15:55 - INFO - __main__ - Step 55844: {'lr': 0.0003537339369032019, 'samples': 10722048, 'steps': 55843, 'loss/train': 1.1945297718048096} -08/30/2021 23:15:56 - INFO - __main__ - Step 55845: {'lr': 0.0003537291085346879, 'samples': 10722240, 'steps': 55844, 'loss/train': 1.0215296745300293} -08/30/2021 23:15:57 - INFO - __main__ - Step 55846: {'lr': 0.0003537242801194353, 'samples': 10722432, 'steps': 55845, 'loss/train': 0.8148331642150879} -08/30/2021 23:15:57 - INFO - __main__ - Step 55847: {'lr': 0.000353719451657446, 'samples': 10722624, 'steps': 55846, 'loss/train': 1.0143702030181885} -08/30/2021 23:15:57 - INFO - __main__ - Step 55848: {'lr': 0.0003537146231487224, 'samples': 10722816, 'steps': 55847, 'loss/train': 1.4620976448059082} -08/30/2021 23:15:58 - INFO - __main__ - Step 55849: {'lr': 0.0003537097945932666, 'samples': 10723008, 'steps': 55848, 'loss/train': 1.8522289991378784} -08/30/2021 23:15:58 - INFO - __main__ - Step 55850: {'lr': 0.00035370496599108073, 'samples': 10723200, 'steps': 55849, 'loss/train': 1.8698945045471191} -08/30/2021 23:16:00 - INFO - __main__ - Step 55851: {'lr': 0.00035370013734216697, 'samples': 10723392, 'steps': 55850, 'loss/train': 1.5686043500900269} -08/30/2021 23:16:00 - INFO - __main__ - Step 55852: {'lr': 0.0003536953086465276, 'samples': 10723584, 'steps': 55851, 'loss/train': 1.6252377033233643} -08/30/2021 23:16:00 - INFO - __main__ - Step 55853: {'lr': 0.0003536904799041647, 'samples': 10723776, 'steps': 55852, 'loss/train': 0.36260825395584106} -08/30/2021 23:16:01 - INFO - __main__ - Step 55854: {'lr': 0.00035368565111508043, 'samples': 10723968, 'steps': 55853, 'loss/train': 1.5042622089385986} -08/30/2021 23:16:01 - INFO - __main__ - Step 55855: {'lr': 0.000353680822279277, 'samples': 10724160, 'steps': 55854, 'loss/train': 1.1740037202835083} -08/30/2021 23:16:03 - INFO - __main__ - Step 55856: {'lr': 0.00035367599339675664, 'samples': 10724352, 'steps': 55855, 'loss/train': 1.195548415184021} -08/30/2021 23:16:03 - INFO - __main__ - Step 55857: {'lr': 0.0003536711644675215, 'samples': 10724544, 'steps': 55856, 'loss/train': 0.34780389070510864} -08/30/2021 23:16:04 - INFO - __main__ - Step 55858: {'lr': 0.0003536663354915737, 'samples': 10724736, 'steps': 55857, 'loss/train': 1.343656301498413} -08/30/2021 23:16:04 - INFO - __main__ - Step 55859: {'lr': 0.00035366150646891543, 'samples': 10724928, 'steps': 55858, 'loss/train': 0.7453269362449646} -08/30/2021 23:16:04 - INFO - __main__ - Step 55860: {'lr': 0.0003536566773995489, 'samples': 10725120, 'steps': 55859, 'loss/train': 0.6729212999343872} -08/30/2021 23:16:07 - INFO - __main__ - Step 55861: {'lr': 0.0003536518482834763, 'samples': 10725312, 'steps': 55860, 'loss/train': 1.1075812578201294} -08/30/2021 23:16:07 - INFO - __main__ - Step 55862: {'lr': 0.0003536470191206997, 'samples': 10725504, 'steps': 55861, 'loss/train': 1.1422550678253174} -08/30/2021 23:16:07 - INFO - __main__ - Step 55863: {'lr': 0.00035364218991122145, 'samples': 10725696, 'steps': 55862, 'loss/train': 1.2442809343338013} -08/30/2021 23:16:08 - INFO - __main__ - Step 55864: {'lr': 0.00035363736065504355, 'samples': 10725888, 'steps': 55863, 'loss/train': 1.4324740171432495} -08/30/2021 23:16:08 - INFO - __main__ - Step 55865: {'lr': 0.0003536325313521683, 'samples': 10726080, 'steps': 55864, 'loss/train': 1.1130757331848145} -08/30/2021 23:16:10 - INFO - __main__ - Step 55866: {'lr': 0.0003536277020025978, 'samples': 10726272, 'steps': 55865, 'loss/train': 0.3150434195995331} -08/30/2021 23:16:10 - INFO - __main__ - Step 55867: {'lr': 0.0003536228726063343, 'samples': 10726464, 'steps': 55866, 'loss/train': 1.6082249879837036} -08/30/2021 23:16:10 - INFO - __main__ - Step 55868: {'lr': 0.00035361804316337987, 'samples': 10726656, 'steps': 55867, 'loss/train': 1.2010414600372314} -08/30/2021 23:16:11 - INFO - __main__ - Step 55869: {'lr': 0.00035361321367373676, 'samples': 10726848, 'steps': 55868, 'loss/train': 1.2699295282363892} -08/30/2021 23:16:11 - INFO - __main__ - Step 55870: {'lr': 0.00035360838413740715, 'samples': 10727040, 'steps': 55869, 'loss/train': 6.135015964508057} -08/30/2021 23:16:12 - INFO - __main__ - Step 55871: {'lr': 0.0003536035545543933, 'samples': 10727232, 'steps': 55870, 'loss/train': 0.6468329429626465} -08/30/2021 23:16:13 - INFO - __main__ - Step 55872: {'lr': 0.00035359872492469715, 'samples': 10727424, 'steps': 55871, 'loss/train': 1.0681915283203125} -08/30/2021 23:16:13 - INFO - __main__ - Step 55873: {'lr': 0.0003535938952483211, 'samples': 10727616, 'steps': 55872, 'loss/train': 1.4447047710418701} -08/30/2021 23:16:14 - INFO - __main__ - Step 55874: {'lr': 0.00035358906552526714, 'samples': 10727808, 'steps': 55873, 'loss/train': 0.7339169383049011} -08/30/2021 23:16:14 - INFO - __main__ - Step 55875: {'lr': 0.0003535842357555376, 'samples': 10728000, 'steps': 55874, 'loss/train': 1.700046420097351} -08/30/2021 23:16:14 - INFO - __main__ - Step 55876: {'lr': 0.0003535794059391346, 'samples': 10728192, 'steps': 55875, 'loss/train': 1.1830312013626099} -08/30/2021 23:16:16 - INFO - __main__ - Step 55877: {'lr': 0.00035357457607606034, 'samples': 10728384, 'steps': 55876, 'loss/train': 1.050166130065918} -08/30/2021 23:16:17 - INFO - __main__ - Step 55878: {'lr': 0.00035356974616631697, 'samples': 10728576, 'steps': 55877, 'loss/train': 0.2922050952911377} -08/30/2021 23:16:17 - INFO - __main__ - Step 55879: {'lr': 0.00035356491620990667, 'samples': 10728768, 'steps': 55878, 'loss/train': 1.3382513523101807} -08/30/2021 23:16:17 - INFO - __main__ - Step 55880: {'lr': 0.0003535600862068316, 'samples': 10728960, 'steps': 55879, 'loss/train': 1.0374191999435425} -08/30/2021 23:16:18 - INFO - __main__ - Step 55881: {'lr': 0.00035355525615709393, 'samples': 10729152, 'steps': 55880, 'loss/train': 0.9945430755615234} -08/30/2021 23:16:19 - INFO - __main__ - Step 55882: {'lr': 0.0003535504260606959, 'samples': 10729344, 'steps': 55881, 'loss/train': 0.8950099349021912} -08/30/2021 23:16:20 - INFO - __main__ - Step 55883: {'lr': 0.00035354559591763965, 'samples': 10729536, 'steps': 55882, 'loss/train': 1.1675432920455933} -08/30/2021 23:16:20 - INFO - __main__ - Step 55884: {'lr': 0.0003535407657279273, 'samples': 10729728, 'steps': 55883, 'loss/train': 1.177507758140564} -08/30/2021 23:16:21 - INFO - __main__ - Step 55885: {'lr': 0.00035353593549156115, 'samples': 10729920, 'steps': 55884, 'loss/train': 1.4942655563354492} -08/30/2021 23:16:21 - INFO - __main__ - Step 55886: {'lr': 0.00035353110520854324, 'samples': 10730112, 'steps': 55885, 'loss/train': 1.0644011497497559} -08/30/2021 23:16:22 - INFO - __main__ - Step 55887: {'lr': 0.0003535262748788759, 'samples': 10730304, 'steps': 55886, 'loss/train': 0.5848406553268433} -08/30/2021 23:16:23 - INFO - __main__ - Step 55888: {'lr': 0.00035352144450256115, 'samples': 10730496, 'steps': 55887, 'loss/train': 1.3748239278793335} -08/30/2021 23:16:23 - INFO - __main__ - Step 55889: {'lr': 0.00035351661407960125, 'samples': 10730688, 'steps': 55888, 'loss/train': 1.9253418445587158} -08/30/2021 23:16:24 - INFO - __main__ - Step 55890: {'lr': 0.0003535117836099983, 'samples': 10730880, 'steps': 55889, 'loss/train': 0.8561276793479919} -08/30/2021 23:16:24 - INFO - __main__ - Step 55891: {'lr': 0.00035350695309375465, 'samples': 10731072, 'steps': 55890, 'loss/train': 2.533564567565918} -08/30/2021 23:16:25 - INFO - __main__ - Step 55892: {'lr': 0.00035350212253087233, 'samples': 10731264, 'steps': 55891, 'loss/train': 1.2324904203414917} -08/30/2021 23:16:26 - INFO - __main__ - Step 55893: {'lr': 0.0003534972919213535, 'samples': 10731456, 'steps': 55892, 'loss/train': 1.5151067972183228} -08/30/2021 23:16:26 - INFO - __main__ - Step 55894: {'lr': 0.0003534924612652004, 'samples': 10731648, 'steps': 55893, 'loss/train': 1.3352891206741333} -08/30/2021 23:16:26 - INFO - __main__ - Step 55895: {'lr': 0.00035348763056241515, 'samples': 10731840, 'steps': 55894, 'loss/train': 1.1198841333389282} -08/30/2021 23:16:27 - INFO - __main__ - Step 55896: {'lr': 0.0003534827998130001, 'samples': 10732032, 'steps': 55895, 'loss/train': 0.7932049632072449} -08/30/2021 23:16:27 - INFO - __main__ - Step 55897: {'lr': 0.00035347796901695716, 'samples': 10732224, 'steps': 55896, 'loss/train': 1.6382561922073364} -08/30/2021 23:16:29 - INFO - __main__ - Step 55898: {'lr': 0.0003534731381742888, 'samples': 10732416, 'steps': 55897, 'loss/train': 1.0531342029571533} -08/30/2021 23:16:29 - INFO - __main__ - Step 55899: {'lr': 0.0003534683072849969, 'samples': 10732608, 'steps': 55898, 'loss/train': 1.0077290534973145} -08/30/2021 23:16:30 - INFO - __main__ - Step 55900: {'lr': 0.0003534634763490838, 'samples': 10732800, 'steps': 55899, 'loss/train': 0.5583030581474304} -08/30/2021 23:16:30 - INFO - __main__ - Step 55901: {'lr': 0.0003534586453665517, 'samples': 10732992, 'steps': 55900, 'loss/train': 1.0922681093215942} -08/30/2021 23:16:30 - INFO - __main__ - Step 55902: {'lr': 0.00035345381433740273, 'samples': 10733184, 'steps': 55901, 'loss/train': 1.7224851846694946} -08/30/2021 23:16:32 - INFO - __main__ - Step 55903: {'lr': 0.00035344898326163907, 'samples': 10733376, 'steps': 55902, 'loss/train': 1.4505985975265503} -08/30/2021 23:16:33 - INFO - __main__ - Step 55904: {'lr': 0.00035344415213926284, 'samples': 10733568, 'steps': 55903, 'loss/train': 0.9378485679626465} -08/30/2021 23:16:33 - INFO - __main__ - Step 55905: {'lr': 0.0003534393209702764, 'samples': 10733760, 'steps': 55904, 'loss/train': 0.7283466458320618} -08/30/2021 23:16:33 - INFO - __main__ - Step 55906: {'lr': 0.0003534344897546816, 'samples': 10733952, 'steps': 55905, 'loss/train': 0.4423246681690216} -08/30/2021 23:16:34 - INFO - __main__ - Step 55907: {'lr': 0.00035342965849248097, 'samples': 10734144, 'steps': 55906, 'loss/train': 1.1748298406600952} -08/30/2021 23:16:35 - INFO - __main__ - Step 55908: {'lr': 0.00035342482718367645, 'samples': 10734336, 'steps': 55907, 'loss/train': 1.6168564558029175} -08/30/2021 23:16:36 - INFO - __main__ - Step 55909: {'lr': 0.0003534199958282703, 'samples': 10734528, 'steps': 55908, 'loss/train': 1.5999308824539185} -08/30/2021 23:16:36 - INFO - __main__ - Step 55910: {'lr': 0.00035341516442626475, 'samples': 10734720, 'steps': 55909, 'loss/train': 1.3619261980056763} -08/30/2021 23:16:37 - INFO - __main__ - Step 55911: {'lr': 0.0003534103329776619, 'samples': 10734912, 'steps': 55910, 'loss/train': 0.03599366545677185} -08/30/2021 23:16:37 - INFO - __main__ - Step 55912: {'lr': 0.000353405501482464, 'samples': 10735104, 'steps': 55911, 'loss/train': 1.2787939310073853} -08/30/2021 23:16:37 - INFO - __main__ - Step 55913: {'lr': 0.0003534006699406731, 'samples': 10735296, 'steps': 55912, 'loss/train': 1.267722725868225} -08/30/2021 23:16:38 - INFO - __main__ - Step 55914: {'lr': 0.0003533958383522915, 'samples': 10735488, 'steps': 55913, 'loss/train': 0.19397404789924622} -08/30/2021 23:16:40 - INFO - __main__ - Step 55915: {'lr': 0.0003533910067173213, 'samples': 10735680, 'steps': 55914, 'loss/train': 1.641342282295227} -08/30/2021 23:16:40 - INFO - __main__ - Step 55916: {'lr': 0.0003533861750357647, 'samples': 10735872, 'steps': 55915, 'loss/train': 1.713496208190918} -08/30/2021 23:16:40 - INFO - __main__ - Step 55917: {'lr': 0.0003533813433076239, 'samples': 10736064, 'steps': 55916, 'loss/train': 1.640536904335022} -08/30/2021 23:16:41 - INFO - __main__ - Step 55918: {'lr': 0.00035337651153290113, 'samples': 10736256, 'steps': 55917, 'loss/train': 1.3281631469726562} -08/30/2021 23:16:41 - INFO - __main__ - Step 55919: {'lr': 0.00035337167971159837, 'samples': 10736448, 'steps': 55918, 'loss/train': 1.2087630033493042} -08/30/2021 23:16:43 - INFO - __main__ - Step 55920: {'lr': 0.000353366847843718, 'samples': 10736640, 'steps': 55919, 'loss/train': 1.74284827709198} -08/30/2021 23:16:43 - INFO - __main__ - Step 55921: {'lr': 0.0003533620159292621, 'samples': 10736832, 'steps': 55920, 'loss/train': 1.6198315620422363} -08/30/2021 23:16:44 - INFO - __main__ - Step 55922: {'lr': 0.0003533571839682329, 'samples': 10737024, 'steps': 55921, 'loss/train': 1.3473113775253296} -08/30/2021 23:16:44 - INFO - __main__ - Step 55923: {'lr': 0.00035335235196063254, 'samples': 10737216, 'steps': 55922, 'loss/train': 3.014082431793213} -08/30/2021 23:16:44 - INFO - __main__ - Step 55924: {'lr': 0.0003533475199064632, 'samples': 10737408, 'steps': 55923, 'loss/train': 0.45372748374938965} -08/30/2021 23:16:46 - INFO - __main__ - Step 55925: {'lr': 0.00035334268780572707, 'samples': 10737600, 'steps': 55924, 'loss/train': 1.1645843982696533} -08/30/2021 23:16:47 - INFO - __main__ - Step 55926: {'lr': 0.0003533378556584263, 'samples': 10737792, 'steps': 55925, 'loss/train': 1.228293776512146} -08/30/2021 23:16:47 - INFO - __main__ - Step 55927: {'lr': 0.0003533330234645631, 'samples': 10737984, 'steps': 55926, 'loss/train': 1.7800734043121338} -08/30/2021 23:16:47 - INFO - __main__ - Step 55928: {'lr': 0.00035332819122413963, 'samples': 10738176, 'steps': 55927, 'loss/train': 0.6804536581039429} -08/30/2021 23:16:48 - INFO - __main__ - Step 55929: {'lr': 0.00035332335893715805, 'samples': 10738368, 'steps': 55928, 'loss/train': 1.5049625635147095} -08/30/2021 23:16:48 - INFO - __main__ - Step 55930: {'lr': 0.00035331852660362055, 'samples': 10738560, 'steps': 55929, 'loss/train': 0.024609217420220375} -08/30/2021 23:16:50 - INFO - __main__ - Step 55931: {'lr': 0.00035331369422352937, 'samples': 10738752, 'steps': 55930, 'loss/train': 1.2362762689590454} -08/30/2021 23:16:50 - INFO - __main__ - Step 55932: {'lr': 0.00035330886179688666, 'samples': 10738944, 'steps': 55931, 'loss/train': 1.341709852218628} -08/30/2021 23:16:50 - INFO - __main__ - Step 55933: {'lr': 0.0003533040293236945, 'samples': 10739136, 'steps': 55932, 'loss/train': 1.4676406383514404} -08/30/2021 23:16:51 - INFO - __main__ - Step 55934: {'lr': 0.0003532991968039552, 'samples': 10739328, 'steps': 55933, 'loss/train': 1.3624273538589478} -08/30/2021 23:16:51 - INFO - __main__ - Step 55935: {'lr': 0.0003532943642376708, 'samples': 10739520, 'steps': 55934, 'loss/train': 1.358296275138855} -08/30/2021 23:16:53 - INFO - __main__ - Step 55936: {'lr': 0.00035328953162484355, 'samples': 10739712, 'steps': 55935, 'loss/train': 1.3077239990234375} -08/30/2021 23:16:53 - INFO - __main__ - Step 55937: {'lr': 0.00035328469896547566, 'samples': 10739904, 'steps': 55936, 'loss/train': 1.3262988328933716} -08/30/2021 23:16:53 - INFO - __main__ - Step 55938: {'lr': 0.0003532798662595693, 'samples': 10740096, 'steps': 55937, 'loss/train': 1.6996756792068481} -08/30/2021 23:16:54 - INFO - __main__ - Step 55939: {'lr': 0.00035327503350712666, 'samples': 10740288, 'steps': 55938, 'loss/train': 1.3272464275360107} -08/30/2021 23:16:54 - INFO - __main__ - Step 55940: {'lr': 0.0003532702007081498, 'samples': 10740480, 'steps': 55939, 'loss/train': 1.7512575387954712} -08/30/2021 23:16:54 - INFO - __main__ - Step 55941: {'lr': 0.000353265367862641, 'samples': 10740672, 'steps': 55940, 'loss/train': 1.2952749729156494} -08/30/2021 23:16:56 - INFO - __main__ - Step 55942: {'lr': 0.0003532605349706025, 'samples': 10740864, 'steps': 55941, 'loss/train': 1.7662429809570312} -08/30/2021 23:16:56 - INFO - __main__ - Step 55943: {'lr': 0.00035325570203203626, 'samples': 10741056, 'steps': 55942, 'loss/train': 1.521077036857605} -08/30/2021 23:16:57 - INFO - __main__ - Step 55944: {'lr': 0.0003532508690469447, 'samples': 10741248, 'steps': 55943, 'loss/train': 0.4328659474849701} -08/30/2021 23:16:57 - INFO - __main__ - Step 55945: {'lr': 0.0003532460360153299, 'samples': 10741440, 'steps': 55944, 'loss/train': 2.03222918510437} -08/30/2021 23:16:57 - INFO - __main__ - Step 55946: {'lr': 0.000353241202937194, 'samples': 10741632, 'steps': 55945, 'loss/train': 0.24276189506053925} -08/30/2021 23:16:59 - INFO - __main__ - Step 55947: {'lr': 0.00035323636981253914, 'samples': 10741824, 'steps': 55946, 'loss/train': 0.6861918568611145} -08/30/2021 23:16:59 - INFO - __main__ - Step 55948: {'lr': 0.00035323153664136765, 'samples': 10742016, 'steps': 55947, 'loss/train': 0.6402886509895325} -08/30/2021 23:17:00 - INFO - __main__ - Step 55949: {'lr': 0.00035322670342368155, 'samples': 10742208, 'steps': 55948, 'loss/train': 0.5976836681365967} -08/30/2021 23:17:00 - INFO - __main__ - Step 55950: {'lr': 0.0003532218701594832, 'samples': 10742400, 'steps': 55949, 'loss/train': 1.0029876232147217} -08/30/2021 23:17:00 - INFO - __main__ - Step 55951: {'lr': 0.0003532170368487746, 'samples': 10742592, 'steps': 55950, 'loss/train': 1.2363777160644531} -08/30/2021 23:17:01 - INFO - __main__ - Step 55952: {'lr': 0.00035321220349155796, 'samples': 10742784, 'steps': 55951, 'loss/train': 1.3930597305297852} -08/30/2021 23:17:02 - INFO - __main__ - Step 55953: {'lr': 0.00035320737008783556, 'samples': 10742976, 'steps': 55952, 'loss/train': 1.1704849004745483} -08/30/2021 23:17:03 - INFO - __main__ - Step 55954: {'lr': 0.0003532025366376095, 'samples': 10743168, 'steps': 55953, 'loss/train': 1.309885859489441} -08/30/2021 23:17:03 - INFO - __main__ - Step 55955: {'lr': 0.0003531977031408819, 'samples': 10743360, 'steps': 55954, 'loss/train': 0.8559950590133667} -08/30/2021 23:17:03 - INFO - __main__ - Step 55956: {'lr': 0.0003531928695976551, 'samples': 10743552, 'steps': 55955, 'loss/train': 0.036718856543302536} -08/30/2021 23:17:04 - INFO - __main__ - Step 55957: {'lr': 0.00035318803600793117, 'samples': 10743744, 'steps': 55956, 'loss/train': 1.1626948118209839} -08/30/2021 23:17:05 - INFO - __main__ - Step 55958: {'lr': 0.00035318320237171224, 'samples': 10743936, 'steps': 55957, 'loss/train': 1.7497190237045288} -08/30/2021 23:17:06 - INFO - __main__ - Step 55959: {'lr': 0.0003531783686890006, 'samples': 10744128, 'steps': 55958, 'loss/train': 1.4779517650604248} -08/30/2021 23:17:06 - INFO - __main__ - Step 55960: {'lr': 0.0003531735349597984, 'samples': 10744320, 'steps': 55959, 'loss/train': 1.5500249862670898} -08/30/2021 23:17:06 - INFO - __main__ - Step 55961: {'lr': 0.0003531687011841077, 'samples': 10744512, 'steps': 55960, 'loss/train': 1.1005122661590576} -08/30/2021 23:17:07 - INFO - __main__ - Step 55962: {'lr': 0.0003531638673619309, 'samples': 10744704, 'steps': 55961, 'loss/train': 2.1470508575439453} -08/30/2021 23:17:08 - INFO - __main__ - Step 55963: {'lr': 0.00035315903349327, 'samples': 10744896, 'steps': 55962, 'loss/train': 4.586358070373535} -08/30/2021 23:17:09 - INFO - __main__ - Step 55964: {'lr': 0.00035315419957812725, 'samples': 10745088, 'steps': 55963, 'loss/train': 1.56167733669281} -08/30/2021 23:17:09 - INFO - __main__ - Step 55965: {'lr': 0.0003531493656165047, 'samples': 10745280, 'steps': 55964, 'loss/train': 1.7028981447219849} -08/30/2021 23:17:10 - INFO - __main__ - Step 55966: {'lr': 0.00035314453160840476, 'samples': 10745472, 'steps': 55965, 'loss/train': 1.1989740133285522} -08/30/2021 23:17:10 - INFO - __main__ - Step 55967: {'lr': 0.00035313969755382946, 'samples': 10745664, 'steps': 55966, 'loss/train': 1.065708875656128} -08/30/2021 23:17:11 - INFO - __main__ - Step 55968: {'lr': 0.000353134863452781, 'samples': 10745856, 'steps': 55967, 'loss/train': 0.7986748814582825} -08/30/2021 23:17:12 - INFO - __main__ - Step 55969: {'lr': 0.00035313002930526156, 'samples': 10746048, 'steps': 55968, 'loss/train': 1.3339710235595703} -08/30/2021 23:17:12 - INFO - __main__ - Step 55970: {'lr': 0.00035312519511127325, 'samples': 10746240, 'steps': 55969, 'loss/train': 0.46650388836860657} -08/30/2021 23:17:13 - INFO - __main__ - Step 55971: {'lr': 0.0003531203608708184, 'samples': 10746432, 'steps': 55970, 'loss/train': 1.0030601024627686} -08/30/2021 23:17:13 - INFO - __main__ - Step 55972: {'lr': 0.00035311552658389914, 'samples': 10746624, 'steps': 55971, 'loss/train': 0.7478862404823303} -08/30/2021 23:17:13 - INFO - __main__ - Step 55973: {'lr': 0.00035311069225051755, 'samples': 10746816, 'steps': 55972, 'loss/train': 1.30539870262146} -08/30/2021 23:17:15 - INFO - __main__ - Step 55974: {'lr': 0.0003531058578706759, 'samples': 10747008, 'steps': 55973, 'loss/train': 1.0208511352539062} -08/30/2021 23:17:16 - INFO - __main__ - Step 55975: {'lr': 0.00035310102344437636, 'samples': 10747200, 'steps': 55974, 'loss/train': 2.058894634246826} -08/30/2021 23:17:16 - INFO - __main__ - Step 55976: {'lr': 0.00035309618897162097, 'samples': 10747392, 'steps': 55975, 'loss/train': 1.3556779623031616} -08/30/2021 23:17:17 - INFO - __main__ - Step 55977: {'lr': 0.0003530913544524121, 'samples': 10747584, 'steps': 55976, 'loss/train': 1.1167582273483276} -08/30/2021 23:17:17 - INFO - __main__ - Step 55978: {'lr': 0.00035308651988675194, 'samples': 10747776, 'steps': 55977, 'loss/train': 0.8025023937225342} -08/30/2021 23:17:19 - INFO - __main__ - Step 55979: {'lr': 0.0003530816852746426, 'samples': 10747968, 'steps': 55978, 'loss/train': 1.558971881866455} -08/30/2021 23:17:19 - INFO - __main__ - Step 55980: {'lr': 0.00035307685061608605, 'samples': 10748160, 'steps': 55979, 'loss/train': 2.797186851501465} -08/30/2021 23:17:19 - INFO - __main__ - Step 55981: {'lr': 0.00035307201591108485, 'samples': 10748352, 'steps': 55980, 'loss/train': 0.6650704145431519} -08/30/2021 23:17:20 - INFO - __main__ - Step 55982: {'lr': 0.0003530671811596409, 'samples': 10748544, 'steps': 55981, 'loss/train': 0.13816869258880615} -08/30/2021 23:17:20 - INFO - __main__ - Step 55983: {'lr': 0.00035306234636175646, 'samples': 10748736, 'steps': 55982, 'loss/train': 0.6538945436477661} -08/30/2021 23:17:20 - INFO - __main__ - Step 55984: {'lr': 0.0003530575115174337, 'samples': 10748928, 'steps': 55983, 'loss/train': 0.9080739617347717} -08/30/2021 23:17:22 - INFO - __main__ - Step 55985: {'lr': 0.00035305267662667485, 'samples': 10749120, 'steps': 55984, 'loss/train': 5.056089401245117} -08/30/2021 23:17:23 - INFO - __main__ - Step 55986: {'lr': 0.0003530478416894821, 'samples': 10749312, 'steps': 55985, 'loss/train': 1.0960655212402344} -08/30/2021 23:17:23 - INFO - __main__ - Step 55987: {'lr': 0.00035304300670585754, 'samples': 10749504, 'steps': 55986, 'loss/train': 1.725856900215149} -08/30/2021 23:17:23 - INFO - __main__ - Step 55988: {'lr': 0.0003530381716758034, 'samples': 10749696, 'steps': 55987, 'loss/train': 1.5876543521881104} -08/30/2021 23:17:24 - INFO - __main__ - Step 55989: {'lr': 0.00035303333659932187, 'samples': 10749888, 'steps': 55988, 'loss/train': 1.1360228061676025} -08/30/2021 23:17:25 - INFO - __main__ - Step 55990: {'lr': 0.000353028501476415, 'samples': 10750080, 'steps': 55989, 'loss/train': 1.5563544034957886} -08/30/2021 23:17:26 - INFO - __main__ - Step 55991: {'lr': 0.0003530236663070852, 'samples': 10750272, 'steps': 55990, 'loss/train': 1.1620291471481323} -08/30/2021 23:17:26 - INFO - __main__ - Step 55992: {'lr': 0.00035301883109133456, 'samples': 10750464, 'steps': 55991, 'loss/train': 0.83155357837677} -08/30/2021 23:17:26 - INFO - __main__ - Step 55993: {'lr': 0.0003530139958291651, 'samples': 10750656, 'steps': 55992, 'loss/train': 0.9680225849151611} -08/30/2021 23:17:27 - INFO - __main__ - Step 55994: {'lr': 0.0003530091605205792, 'samples': 10750848, 'steps': 55993, 'loss/train': 1.6920452117919922} -08/30/2021 23:17:28 - INFO - __main__ - Step 55995: {'lr': 0.0003530043251655789, 'samples': 10751040, 'steps': 55994, 'loss/train': 1.4270563125610352} -08/30/2021 23:17:29 - INFO - __main__ - Step 55996: {'lr': 0.00035299948976416645, 'samples': 10751232, 'steps': 55995, 'loss/train': 1.6408499479293823} -08/30/2021 23:17:29 - INFO - __main__ - Step 55997: {'lr': 0.00035299465431634403, 'samples': 10751424, 'steps': 55996, 'loss/train': 1.7302969694137573} -08/30/2021 23:17:29 - INFO - __main__ - Step 55998: {'lr': 0.00035298981882211385, 'samples': 10751616, 'steps': 55997, 'loss/train': 1.7459830045700073} -08/30/2021 23:17:30 - INFO - __main__ - Step 55999: {'lr': 0.00035298498328147803, 'samples': 10751808, 'steps': 55998, 'loss/train': 1.2702487707138062} -08/30/2021 23:17:31 - INFO - __main__ - Step 56000: {'lr': 0.00035298014769443874, 'samples': 10752000, 'steps': 55999, 'loss/train': 2.059731960296631} -08/30/2021 23:17:32 - INFO - __main__ - Step 56001: {'lr': 0.0003529753120609982, 'samples': 10752192, 'steps': 56000, 'loss/train': 1.4488636255264282} -08/30/2021 23:17:32 - INFO - __main__ - Step 56002: {'lr': 0.0003529704763811585, 'samples': 10752384, 'steps': 56001, 'loss/train': 2.2082808017730713} -08/30/2021 23:17:32 - INFO - __main__ - Step 56003: {'lr': 0.000352965640654922, 'samples': 10752576, 'steps': 56002, 'loss/train': 0.9415165781974792} -08/30/2021 23:17:33 - INFO - __main__ - Step 56004: {'lr': 0.0003529608048822908, 'samples': 10752768, 'steps': 56003, 'loss/train': 1.3292121887207031} -08/30/2021 23:17:34 - INFO - __main__ - Step 56005: {'lr': 0.0003529559690632669, 'samples': 10752960, 'steps': 56004, 'loss/train': 1.4700969457626343} -08/30/2021 23:17:35 - INFO - __main__ - Step 56006: {'lr': 0.00035295113319785276, 'samples': 10753152, 'steps': 56005, 'loss/train': 1.6381988525390625} -08/30/2021 23:17:35 - INFO - __main__ - Step 56007: {'lr': 0.0003529462972860504, 'samples': 10753344, 'steps': 56006, 'loss/train': 1.5033495426177979} -08/30/2021 23:17:35 - INFO - __main__ - Step 56008: {'lr': 0.000352941461327862, 'samples': 10753536, 'steps': 56007, 'loss/train': 1.196776270866394} -08/30/2021 23:17:36 - INFO - __main__ - Step 56009: {'lr': 0.0003529366253232897, 'samples': 10753728, 'steps': 56008, 'loss/train': 1.2818739414215088} -08/30/2021 23:17:37 - INFO - __main__ - Step 56010: {'lr': 0.00035293178927233587, 'samples': 10753920, 'steps': 56009, 'loss/train': 0.7002621293067932} -08/30/2021 23:17:38 - INFO - __main__ - Step 56011: {'lr': 0.0003529269531750025, 'samples': 10754112, 'steps': 56010, 'loss/train': 0.8729087114334106} -08/30/2021 23:17:38 - INFO - __main__ - Step 56012: {'lr': 0.0003529221170312919, 'samples': 10754304, 'steps': 56011, 'loss/train': 1.4013751745224} -08/30/2021 23:17:39 - INFO - __main__ - Step 56013: {'lr': 0.0003529172808412061, 'samples': 10754496, 'steps': 56012, 'loss/train': 1.402565836906433} -08/30/2021 23:17:39 - INFO - __main__ - Step 56014: {'lr': 0.0003529124446047474, 'samples': 10754688, 'steps': 56013, 'loss/train': 1.1653759479522705} -08/30/2021 23:17:39 - INFO - __main__ - Step 56015: {'lr': 0.0003529076083219179, 'samples': 10754880, 'steps': 56014, 'loss/train': 0.6954762935638428} -08/30/2021 23:17:41 - INFO - __main__ - Step 56016: {'lr': 0.0003529027719927199, 'samples': 10755072, 'steps': 56015, 'loss/train': 1.5562806129455566} -08/30/2021 23:17:41 - INFO - __main__ - Step 56017: {'lr': 0.00035289793561715544, 'samples': 10755264, 'steps': 56016, 'loss/train': 1.1072672605514526} -08/30/2021 23:17:42 - INFO - __main__ - Step 56018: {'lr': 0.0003528930991952267, 'samples': 10755456, 'steps': 56017, 'loss/train': 1.633586049079895} -08/30/2021 23:17:42 - INFO - __main__ - Step 56019: {'lr': 0.00035288826272693606, 'samples': 10755648, 'steps': 56018, 'loss/train': 1.2012773752212524} -08/30/2021 23:17:42 - INFO - __main__ - Step 56020: {'lr': 0.0003528834262122855, 'samples': 10755840, 'steps': 56019, 'loss/train': 1.118121862411499} -08/30/2021 23:17:44 - INFO - __main__ - Step 56021: {'lr': 0.00035287858965127723, 'samples': 10756032, 'steps': 56020, 'loss/train': 1.5564519166946411} -08/30/2021 23:17:44 - INFO - __main__ - Step 56022: {'lr': 0.00035287375304391343, 'samples': 10756224, 'steps': 56021, 'loss/train': 1.4478741884231567} -08/30/2021 23:17:45 - INFO - __main__ - Step 56023: {'lr': 0.00035286891639019636, 'samples': 10756416, 'steps': 56022, 'loss/train': 1.6184475421905518} -08/30/2021 23:17:45 - INFO - __main__ - Step 56024: {'lr': 0.00035286407969012813, 'samples': 10756608, 'steps': 56023, 'loss/train': 0.6426447629928589} -08/30/2021 23:17:45 - INFO - __main__ - Step 56025: {'lr': 0.00035285924294371085, 'samples': 10756800, 'steps': 56024, 'loss/train': 1.3158751726150513} -08/30/2021 23:17:47 - INFO - __main__ - Step 56026: {'lr': 0.00035285440615094696, 'samples': 10756992, 'steps': 56025, 'loss/train': 1.6479753255844116} -08/30/2021 23:17:48 - INFO - __main__ - Step 56027: {'lr': 0.0003528495693118383, 'samples': 10757184, 'steps': 56026, 'loss/train': 1.2189514636993408} -08/30/2021 23:17:48 - INFO - __main__ - Step 56028: {'lr': 0.0003528447324263873, 'samples': 10757376, 'steps': 56027, 'loss/train': 1.6366844177246094} -08/30/2021 23:17:48 - INFO - __main__ - Step 56029: {'lr': 0.000352839895494596, 'samples': 10757568, 'steps': 56028, 'loss/train': 1.5302352905273438} -08/30/2021 23:17:49 - INFO - __main__ - Step 56030: {'lr': 0.00035283505851646665, 'samples': 10757760, 'steps': 56029, 'loss/train': 1.88230562210083} -08/30/2021 23:17:50 - INFO - __main__ - Step 56031: {'lr': 0.0003528302214920014, 'samples': 10757952, 'steps': 56030, 'loss/train': 1.1060776710510254} -08/30/2021 23:17:51 - INFO - __main__ - Step 56032: {'lr': 0.0003528253844212024, 'samples': 10758144, 'steps': 56031, 'loss/train': 1.2878245115280151} -08/30/2021 23:17:51 - INFO - __main__ - Step 56033: {'lr': 0.00035282054730407196, 'samples': 10758336, 'steps': 56032, 'loss/train': 1.1769263744354248} -08/30/2021 23:17:51 - INFO - __main__ - Step 56034: {'lr': 0.00035281571014061214, 'samples': 10758528, 'steps': 56033, 'loss/train': 1.1614952087402344} -08/30/2021 23:17:52 - INFO - __main__ - Step 56035: {'lr': 0.0003528108729308251, 'samples': 10758720, 'steps': 56034, 'loss/train': 1.446807622909546} -08/30/2021 23:17:53 - INFO - __main__ - Step 56036: {'lr': 0.0003528060356747131, 'samples': 10758912, 'steps': 56035, 'loss/train': 1.337592363357544} -08/30/2021 23:17:54 - INFO - __main__ - Step 56037: {'lr': 0.0003528011983722783, 'samples': 10759104, 'steps': 56036, 'loss/train': 0.8057197332382202} -08/30/2021 23:17:54 - INFO - __main__ - Step 56038: {'lr': 0.0003527963610235229, 'samples': 10759296, 'steps': 56037, 'loss/train': 1.2137131690979004} -08/30/2021 23:17:55 - INFO - __main__ - Step 56039: {'lr': 0.000352791523628449, 'samples': 10759488, 'steps': 56038, 'loss/train': 1.5632894039154053} -08/30/2021 23:17:55 - INFO - __main__ - Step 56040: {'lr': 0.0003527866861870588, 'samples': 10759680, 'steps': 56039, 'loss/train': 1.262122392654419} -08/30/2021 23:17:55 - INFO - __main__ - Step 56041: {'lr': 0.00035278184869935454, 'samples': 10759872, 'steps': 56040, 'loss/train': 1.5366052389144897} -08/30/2021 23:17:57 - INFO - __main__ - Step 56042: {'lr': 0.0003527770111653383, 'samples': 10760064, 'steps': 56041, 'loss/train': 0.9623920917510986} -08/30/2021 23:17:58 - INFO - __main__ - Step 56043: {'lr': 0.0003527721735850124, 'samples': 10760256, 'steps': 56042, 'loss/train': 1.455899715423584} -08/30/2021 23:17:58 - INFO - __main__ - Step 56044: {'lr': 0.0003527673359583789, 'samples': 10760448, 'steps': 56043, 'loss/train': 0.3491433560848236} -08/30/2021 23:17:59 - INFO - __main__ - Step 56045: {'lr': 0.00035276249828544004, 'samples': 10760640, 'steps': 56044, 'loss/train': 1.0315723419189453} -08/30/2021 23:17:59 - INFO - __main__ - Step 56046: {'lr': 0.0003527576605661981, 'samples': 10760832, 'steps': 56045, 'loss/train': 1.898078441619873} -08/30/2021 23:17:59 - INFO - __main__ - Step 56047: {'lr': 0.00035275282280065493, 'samples': 10761024, 'steps': 56046, 'loss/train': 0.8580057621002197} -08/30/2021 23:18:01 - INFO - __main__ - Step 56048: {'lr': 0.00035274798498881305, 'samples': 10761216, 'steps': 56047, 'loss/train': 0.8985004425048828} -08/30/2021 23:18:01 - INFO - __main__ - Step 56049: {'lr': 0.00035274314713067454, 'samples': 10761408, 'steps': 56048, 'loss/train': 1.4637941122055054} -08/30/2021 23:18:02 - INFO - __main__ - Step 56050: {'lr': 0.00035273830922624147, 'samples': 10761600, 'steps': 56049, 'loss/train': 1.1327402591705322} -08/30/2021 23:18:02 - INFO - __main__ - Step 56051: {'lr': 0.00035273347127551616, 'samples': 10761792, 'steps': 56050, 'loss/train': 1.7856755256652832} -08/30/2021 23:18:02 - INFO - __main__ - Step 56052: {'lr': 0.00035272863327850067, 'samples': 10761984, 'steps': 56051, 'loss/train': 1.7522681951522827} -08/30/2021 23:18:03 - INFO - __main__ - Step 56053: {'lr': 0.00035272379523519734, 'samples': 10762176, 'steps': 56052, 'loss/train': 1.6141204833984375} -08/30/2021 23:18:04 - INFO - __main__ - Step 56054: {'lr': 0.0003527189571456082, 'samples': 10762368, 'steps': 56053, 'loss/train': 1.451524257659912} -08/30/2021 23:18:05 - INFO - __main__ - Step 56055: {'lr': 0.00035271411900973545, 'samples': 10762560, 'steps': 56054, 'loss/train': 1.6046028137207031} -08/30/2021 23:18:05 - INFO - __main__ - Step 56056: {'lr': 0.00035270928082758134, 'samples': 10762752, 'steps': 56055, 'loss/train': 1.204519510269165} -08/30/2021 23:18:05 - INFO - __main__ - Step 56057: {'lr': 0.00035270444259914794, 'samples': 10762944, 'steps': 56056, 'loss/train': 1.9650378227233887} -08/30/2021 23:18:06 - INFO - __main__ - Step 56058: {'lr': 0.0003526996043244376, 'samples': 10763136, 'steps': 56057, 'loss/train': 1.672080397605896} -08/30/2021 23:18:07 - INFO - __main__ - Step 56059: {'lr': 0.0003526947660034524, 'samples': 10763328, 'steps': 56058, 'loss/train': 0.6025868058204651} -08/30/2021 23:18:08 - INFO - __main__ - Step 56060: {'lr': 0.0003526899276361945, 'samples': 10763520, 'steps': 56059, 'loss/train': 1.8122081756591797} -08/30/2021 23:18:08 - INFO - __main__ - Step 56061: {'lr': 0.00035268508922266614, 'samples': 10763712, 'steps': 56060, 'loss/train': 1.5484557151794434} -08/30/2021 23:18:09 - INFO - __main__ - Step 56062: {'lr': 0.00035268025076286936, 'samples': 10763904, 'steps': 56061, 'loss/train': 1.7149593830108643} -08/30/2021 23:18:09 - INFO - __main__ - Step 56063: {'lr': 0.00035267541225680654, 'samples': 10764096, 'steps': 56062, 'loss/train': 1.268869400024414} -08/30/2021 23:18:10 - INFO - __main__ - Step 56064: {'lr': 0.00035267057370447967, 'samples': 10764288, 'steps': 56063, 'loss/train': 1.5896377563476562} -08/30/2021 23:18:11 - INFO - __main__ - Step 56065: {'lr': 0.00035266573510589114, 'samples': 10764480, 'steps': 56064, 'loss/train': 0.9475966095924377} -08/30/2021 23:18:11 - INFO - __main__ - Step 56066: {'lr': 0.00035266089646104296, 'samples': 10764672, 'steps': 56065, 'loss/train': 1.5359894037246704} -08/30/2021 23:18:12 - INFO - __main__ - Step 56067: {'lr': 0.00035265605776993735, 'samples': 10764864, 'steps': 56066, 'loss/train': 1.6587549448013306} -08/30/2021 23:18:12 - INFO - __main__ - Step 56068: {'lr': 0.0003526512190325765, 'samples': 10765056, 'steps': 56067, 'loss/train': 0.628121554851532} -08/30/2021 23:18:14 - INFO - __main__ - Step 56069: {'lr': 0.0003526463802489626, 'samples': 10765248, 'steps': 56068, 'loss/train': 1.3799668550491333} -08/30/2021 23:18:14 - INFO - __main__ - Step 56070: {'lr': 0.00035264154141909787, 'samples': 10765440, 'steps': 56069, 'loss/train': 1.812149167060852} -08/30/2021 23:18:15 - INFO - __main__ - Step 56071: {'lr': 0.00035263670254298443, 'samples': 10765632, 'steps': 56070, 'loss/train': 1.2185698747634888} -08/30/2021 23:18:15 - INFO - __main__ - Step 56072: {'lr': 0.0003526318636206244, 'samples': 10765824, 'steps': 56071, 'loss/train': 1.196087121963501} -08/30/2021 23:18:15 - INFO - __main__ - Step 56073: {'lr': 0.0003526270246520201, 'samples': 10766016, 'steps': 56072, 'loss/train': 1.5084068775177002} -08/30/2021 23:18:17 - INFO - __main__ - Step 56074: {'lr': 0.0003526221856371737, 'samples': 10766208, 'steps': 56073, 'loss/train': 0.15835455060005188} -08/30/2021 23:18:17 - INFO - __main__ - Step 56075: {'lr': 0.0003526173465760872, 'samples': 10766400, 'steps': 56074, 'loss/train': 1.6262229681015015} -08/30/2021 23:18:18 - INFO - __main__ - Step 56076: {'lr': 0.000352612507468763, 'samples': 10766592, 'steps': 56075, 'loss/train': 0.9375470876693726} -08/30/2021 23:18:18 - INFO - __main__ - Step 56077: {'lr': 0.00035260766831520315, 'samples': 10766784, 'steps': 56076, 'loss/train': 1.4606602191925049} -08/30/2021 23:18:18 - INFO - __main__ - Step 56078: {'lr': 0.0003526028291154099, 'samples': 10766976, 'steps': 56077, 'loss/train': 1.2322391271591187} -08/30/2021 23:18:19 - INFO - __main__ - Step 56079: {'lr': 0.00035259798986938537, 'samples': 10767168, 'steps': 56078, 'loss/train': 1.2986236810684204} -08/30/2021 23:18:21 - INFO - __main__ - Step 56080: {'lr': 0.00035259315057713177, 'samples': 10767360, 'steps': 56079, 'loss/train': 1.610724925994873} -08/30/2021 23:18:22 - INFO - __main__ - Step 56081: {'lr': 0.0003525883112386513, 'samples': 10767552, 'steps': 56080, 'loss/train': 0.18006126582622528} -08/30/2021 23:18:22 - INFO - __main__ - Step 56082: {'lr': 0.00035258347185394606, 'samples': 10767744, 'steps': 56081, 'loss/train': 1.3237583637237549} -08/30/2021 23:18:22 - INFO - __main__ - Step 56083: {'lr': 0.00035257863242301834, 'samples': 10767936, 'steps': 56082, 'loss/train': 1.254301905632019} -08/30/2021 23:18:23 - INFO - __main__ - Step 56084: {'lr': 0.0003525737929458703, 'samples': 10768128, 'steps': 56083, 'loss/train': 1.6901192665100098} -08/30/2021 23:18:24 - INFO - __main__ - Step 56085: {'lr': 0.0003525689534225041, 'samples': 10768320, 'steps': 56084, 'loss/train': 0.5801014304161072} -08/30/2021 23:18:25 - INFO - __main__ - Step 56086: {'lr': 0.00035256411385292186, 'samples': 10768512, 'steps': 56085, 'loss/train': 0.875618040561676} -08/30/2021 23:18:25 - INFO - __main__ - Step 56087: {'lr': 0.0003525592742371258, 'samples': 10768704, 'steps': 56086, 'loss/train': 1.3801052570343018} -08/30/2021 23:18:25 - INFO - __main__ - Step 56088: {'lr': 0.0003525544345751182, 'samples': 10768896, 'steps': 56087, 'loss/train': 1.2382384538650513} -08/30/2021 23:18:26 - INFO - __main__ - Step 56089: {'lr': 0.00035254959486690103, 'samples': 10769088, 'steps': 56088, 'loss/train': 1.844489336013794} -08/30/2021 23:18:28 - INFO - __main__ - Step 56090: {'lr': 0.0003525447551124766, 'samples': 10769280, 'steps': 56089, 'loss/train': 1.1721967458724976} -08/30/2021 23:18:28 - INFO - __main__ - Step 56091: {'lr': 0.0003525399153118472, 'samples': 10769472, 'steps': 56090, 'loss/train': 1.5204496383666992} -08/30/2021 23:18:28 - INFO - __main__ - Step 56092: {'lr': 0.00035253507546501484, 'samples': 10769664, 'steps': 56091, 'loss/train': 1.4560885429382324} -08/30/2021 23:18:29 - INFO - __main__ - Step 56093: {'lr': 0.0003525302355719818, 'samples': 10769856, 'steps': 56092, 'loss/train': 0.09196337312459946} -08/30/2021 23:18:29 - INFO - __main__ - Step 56094: {'lr': 0.0003525253956327501, 'samples': 10770048, 'steps': 56093, 'loss/train': 1.0260504484176636} -08/30/2021 23:18:31 - INFO - __main__ - Step 56095: {'lr': 0.0003525205556473221, 'samples': 10770240, 'steps': 56094, 'loss/train': 1.2777884006500244} -08/30/2021 23:18:31 - INFO - __main__ - Step 56096: {'lr': 0.0003525157156157, 'samples': 10770432, 'steps': 56095, 'loss/train': 0.978280246257782} -08/30/2021 23:18:32 - INFO - __main__ - Step 56097: {'lr': 0.00035251087553788584, 'samples': 10770624, 'steps': 56096, 'loss/train': 0.2951096296310425} -08/30/2021 23:18:32 - INFO - __main__ - Step 56098: {'lr': 0.00035250603541388183, 'samples': 10770816, 'steps': 56097, 'loss/train': 1.4409778118133545} -08/30/2021 23:18:32 - INFO - __main__ - Step 56099: {'lr': 0.00035250119524369016, 'samples': 10771008, 'steps': 56098, 'loss/train': 1.1865261793136597} -08/30/2021 23:18:34 - INFO - __main__ - Step 56100: {'lr': 0.00035249635502731315, 'samples': 10771200, 'steps': 56099, 'loss/train': 1.577815055847168} -08/30/2021 23:18:34 - INFO - __main__ - Step 56101: {'lr': 0.0003524915147647528, 'samples': 10771392, 'steps': 56100, 'loss/train': 0.9136101603507996} -08/30/2021 23:18:35 - INFO - __main__ - Step 56102: {'lr': 0.00035248667445601133, 'samples': 10771584, 'steps': 56101, 'loss/train': 1.368881344795227} -08/30/2021 23:18:35 - INFO - __main__ - Step 56103: {'lr': 0.00035248183410109096, 'samples': 10771776, 'steps': 56102, 'loss/train': 1.2927809953689575} -08/30/2021 23:18:35 - INFO - __main__ - Step 56104: {'lr': 0.0003524769936999939, 'samples': 10771968, 'steps': 56103, 'loss/train': 1.1680505275726318} -08/30/2021 23:18:37 - INFO - __main__ - Step 56105: {'lr': 0.0003524721532527222, 'samples': 10772160, 'steps': 56104, 'loss/train': 0.5859238505363464} -08/30/2021 23:18:38 - INFO - __main__ - Step 56106: {'lr': 0.0003524673127592782, 'samples': 10772352, 'steps': 56105, 'loss/train': 1.632218837738037} -08/30/2021 23:18:38 - INFO - __main__ - Step 56107: {'lr': 0.000352462472219664, 'samples': 10772544, 'steps': 56106, 'loss/train': 1.3636125326156616} -08/30/2021 23:18:38 - INFO - __main__ - Step 56108: {'lr': 0.0003524576316338818, 'samples': 10772736, 'steps': 56107, 'loss/train': 1.5793567895889282} -08/30/2021 23:18:39 - INFO - __main__ - Step 56109: {'lr': 0.0003524527910019337, 'samples': 10772928, 'steps': 56108, 'loss/train': 0.7637110352516174} -08/30/2021 23:18:39 - INFO - __main__ - Step 56110: {'lr': 0.00035244795032382206, 'samples': 10773120, 'steps': 56109, 'loss/train': 1.433558702468872} -08/30/2021 23:18:41 - INFO - __main__ - Step 56111: {'lr': 0.00035244310959954886, 'samples': 10773312, 'steps': 56110, 'loss/train': 1.1827833652496338} -08/30/2021 23:18:41 - INFO - __main__ - Step 56112: {'lr': 0.0003524382688291164, 'samples': 10773504, 'steps': 56111, 'loss/train': 1.3213157653808594} -08/30/2021 23:18:41 - INFO - __main__ - Step 56113: {'lr': 0.0003524334280125269, 'samples': 10773696, 'steps': 56112, 'loss/train': 1.2803272008895874} -08/30/2021 23:18:42 - INFO - __main__ - Step 56114: {'lr': 0.0003524285871497824, 'samples': 10773888, 'steps': 56113, 'loss/train': 1.3229001760482788} -08/30/2021 23:18:42 - INFO - __main__ - Step 56115: {'lr': 0.0003524237462408852, 'samples': 10774080, 'steps': 56114, 'loss/train': 1.3458489179611206} -08/30/2021 23:18:43 - INFO - __main__ - Step 56116: {'lr': 0.0003524189052858374, 'samples': 10774272, 'steps': 56115, 'loss/train': 1.4338762760162354} -08/30/2021 23:18:44 - INFO - __main__ - Step 56117: {'lr': 0.0003524140642846413, 'samples': 10774464, 'steps': 56116, 'loss/train': 0.9339413046836853} -08/30/2021 23:18:44 - INFO - __main__ - Step 56118: {'lr': 0.0003524092232372989, 'samples': 10774656, 'steps': 56117, 'loss/train': 1.4327658414840698} -08/30/2021 23:18:45 - INFO - __main__ - Step 56119: {'lr': 0.00035240438214381253, 'samples': 10774848, 'steps': 56118, 'loss/train': 0.6079670190811157} -08/30/2021 23:18:45 - INFO - __main__ - Step 56120: {'lr': 0.00035239954100418436, 'samples': 10775040, 'steps': 56119, 'loss/train': 1.5516875982284546} -08/30/2021 23:18:47 - INFO - __main__ - Step 56121: {'lr': 0.00035239469981841656, 'samples': 10775232, 'steps': 56120, 'loss/train': 1.196666955947876} -08/30/2021 23:18:47 - INFO - __main__ - Step 56122: {'lr': 0.0003523898585865112, 'samples': 10775424, 'steps': 56121, 'loss/train': 0.13357695937156677} -08/30/2021 23:18:48 - INFO - __main__ - Step 56123: {'lr': 0.0003523850173084706, 'samples': 10775616, 'steps': 56122, 'loss/train': 0.09028620272874832} -08/30/2021 23:18:48 - INFO - __main__ - Step 56124: {'lr': 0.00035238017598429686, 'samples': 10775808, 'steps': 56123, 'loss/train': 1.5310717821121216} -08/30/2021 23:18:48 - INFO - __main__ - Step 56125: {'lr': 0.0003523753346139922, 'samples': 10776000, 'steps': 56124, 'loss/train': 0.033919867128133774} -08/30/2021 23:18:50 - INFO - __main__ - Step 56126: {'lr': 0.0003523704931975588, 'samples': 10776192, 'steps': 56125, 'loss/train': 1.2060437202453613} -08/30/2021 23:18:50 - INFO - __main__ - Step 56127: {'lr': 0.0003523656517349989, 'samples': 10776384, 'steps': 56126, 'loss/train': 0.9775595664978027} -08/30/2021 23:18:51 - INFO - __main__ - Step 56128: {'lr': 0.0003523608102263145, 'samples': 10776576, 'steps': 56127, 'loss/train': 1.4229363203048706} -08/30/2021 23:18:51 - INFO - __main__ - Step 56129: {'lr': 0.00035235596867150797, 'samples': 10776768, 'steps': 56128, 'loss/train': 1.6255919933319092} -08/30/2021 23:18:51 - INFO - __main__ - Step 56130: {'lr': 0.0003523511270705814, 'samples': 10776960, 'steps': 56129, 'loss/train': 1.526809811592102} -08/30/2021 23:18:53 - INFO - __main__ - Step 56131: {'lr': 0.000352346285423537, 'samples': 10777152, 'steps': 56130, 'loss/train': 1.7387748956680298} -08/30/2021 23:18:54 - INFO - __main__ - Step 56132: {'lr': 0.0003523414437303769, 'samples': 10777344, 'steps': 56131, 'loss/train': 1.50251042842865} -08/30/2021 23:18:54 - INFO - __main__ - Step 56133: {'lr': 0.0003523366019911035, 'samples': 10777536, 'steps': 56132, 'loss/train': 1.5491119623184204} -08/30/2021 23:18:54 - INFO - __main__ - Step 56134: {'lr': 0.00035233176020571863, 'samples': 10777728, 'steps': 56133, 'loss/train': 1.5228233337402344} -08/30/2021 23:18:55 - INFO - __main__ - Step 56135: {'lr': 0.0003523269183742246, 'samples': 10777920, 'steps': 56134, 'loss/train': 0.19605764746665955} -08/30/2021 23:18:57 - INFO - __main__ - Step 56136: {'lr': 0.0003523220764966238, 'samples': 10778112, 'steps': 56135, 'loss/train': 0.9463578462600708} -08/30/2021 23:18:57 - INFO - __main__ - Step 56137: {'lr': 0.00035231723457291816, 'samples': 10778304, 'steps': 56136, 'loss/train': 1.3300654888153076} -08/30/2021 23:18:58 - INFO - __main__ - Step 56138: {'lr': 0.00035231239260311, 'samples': 10778496, 'steps': 56137, 'loss/train': 1.4234219789505005} -08/30/2021 23:18:58 - INFO - __main__ - Step 56139: {'lr': 0.0003523075505872014, 'samples': 10778688, 'steps': 56138, 'loss/train': 1.4116520881652832} -08/30/2021 23:18:58 - INFO - __main__ - Step 56140: {'lr': 0.00035230270852519465, 'samples': 10778880, 'steps': 56139, 'loss/train': 1.6587998867034912} -08/30/2021 23:19:00 - INFO - __main__ - Step 56141: {'lr': 0.00035229786641709183, 'samples': 10779072, 'steps': 56140, 'loss/train': 1.2101954221725464} -08/30/2021 23:19:00 - INFO - __main__ - Step 56142: {'lr': 0.00035229302426289524, 'samples': 10779264, 'steps': 56141, 'loss/train': 1.4990845918655396} -08/30/2021 23:19:01 - INFO - __main__ - Step 56143: {'lr': 0.00035228818206260693, 'samples': 10779456, 'steps': 56142, 'loss/train': 0.03902850300073624} -08/30/2021 23:19:01 - INFO - __main__ - Step 56144: {'lr': 0.00035228333981622914, 'samples': 10779648, 'steps': 56143, 'loss/train': 1.2967021465301514} -08/30/2021 23:19:02 - INFO - __main__ - Step 56145: {'lr': 0.0003522784975237641, 'samples': 10779840, 'steps': 56144, 'loss/train': 2.1445465087890625} -08/30/2021 23:19:02 - INFO - __main__ - Step 56146: {'lr': 0.00035227365518521387, 'samples': 10780032, 'steps': 56145, 'loss/train': 1.4401345252990723} -08/30/2021 23:19:02 - INFO - __main__ - Step 56147: {'lr': 0.00035226881280058084, 'samples': 10780224, 'steps': 56146, 'loss/train': 2.1475000381469727} -08/30/2021 23:19:04 - INFO - __main__ - Step 56148: {'lr': 0.00035226397036986694, 'samples': 10780416, 'steps': 56147, 'loss/train': 0.6699005365371704} -08/30/2021 23:19:04 - INFO - __main__ - Step 56149: {'lr': 0.0003522591278930745, 'samples': 10780608, 'steps': 56148, 'loss/train': 1.2636817693710327} -08/30/2021 23:19:05 - INFO - __main__ - Step 56150: {'lr': 0.0003522542853702057, 'samples': 10780800, 'steps': 56149, 'loss/train': 1.2275676727294922} -08/30/2021 23:19:05 - INFO - __main__ - Step 56151: {'lr': 0.0003522494428012627, 'samples': 10780992, 'steps': 56150, 'loss/train': 1.235756754875183} -08/30/2021 23:19:05 - INFO - __main__ - Step 56152: {'lr': 0.0003522446001862476, 'samples': 10781184, 'steps': 56151, 'loss/train': 0.8936092853546143} -08/30/2021 23:19:07 - INFO - __main__ - Step 56153: {'lr': 0.00035223975752516273, 'samples': 10781376, 'steps': 56152, 'loss/train': 1.486735463142395} -08/30/2021 23:19:07 - INFO - __main__ - Step 56154: {'lr': 0.0003522349148180103, 'samples': 10781568, 'steps': 56153, 'loss/train': 1.398812174797058} -08/30/2021 23:19:08 - INFO - __main__ - Step 56155: {'lr': 0.00035223007206479226, 'samples': 10781760, 'steps': 56154, 'loss/train': 1.2574031352996826} -08/30/2021 23:19:08 - INFO - __main__ - Step 56156: {'lr': 0.00035222522926551094, 'samples': 10781952, 'steps': 56155, 'loss/train': 1.2187272310256958} -08/30/2021 23:19:08 - INFO - __main__ - Step 56157: {'lr': 0.0003522203864201685, 'samples': 10782144, 'steps': 56156, 'loss/train': 1.5818597078323364} -08/30/2021 23:19:10 - INFO - __main__ - Step 56158: {'lr': 0.00035221554352876715, 'samples': 10782336, 'steps': 56157, 'loss/train': 1.8235902786254883} -08/30/2021 23:19:10 - INFO - __main__ - Step 56159: {'lr': 0.00035221070059130913, 'samples': 10782528, 'steps': 56158, 'loss/train': 0.8171112537384033} -08/30/2021 23:19:11 - INFO - __main__ - Step 56160: {'lr': 0.0003522058576077965, 'samples': 10782720, 'steps': 56159, 'loss/train': 1.5544496774673462} -08/30/2021 23:19:11 - INFO - __main__ - Step 56161: {'lr': 0.00035220101457823143, 'samples': 10782912, 'steps': 56160, 'loss/train': 0.9186850786209106} -08/30/2021 23:19:11 - INFO - __main__ - Step 56162: {'lr': 0.0003521961715026162, 'samples': 10783104, 'steps': 56161, 'loss/train': 0.8501166105270386} -08/30/2021 23:19:13 - INFO - __main__ - Step 56163: {'lr': 0.0003521913283809529, 'samples': 10783296, 'steps': 56162, 'loss/train': 0.8954331278800964} -08/30/2021 23:19:14 - INFO - __main__ - Step 56164: {'lr': 0.00035218648521324387, 'samples': 10783488, 'steps': 56163, 'loss/train': 0.6433175206184387} -08/30/2021 23:19:14 - INFO - __main__ - Step 56165: {'lr': 0.0003521816419994911, 'samples': 10783680, 'steps': 56164, 'loss/train': 1.3150888681411743} -08/30/2021 23:19:14 - INFO - __main__ - Step 56166: {'lr': 0.0003521767987396969, 'samples': 10783872, 'steps': 56165, 'loss/train': 0.16733968257904053} -08/30/2021 23:19:15 - INFO - __main__ - Step 56167: {'lr': 0.00035217195543386345, 'samples': 10784064, 'steps': 56166, 'loss/train': 0.23477235436439514} -08/30/2021 23:19:16 - INFO - __main__ - Step 56168: {'lr': 0.0003521671120819928, 'samples': 10784256, 'steps': 56167, 'loss/train': 2.9166364669799805} -08/30/2021 23:19:17 - INFO - __main__ - Step 56169: {'lr': 0.0003521622686840873, 'samples': 10784448, 'steps': 56168, 'loss/train': 1.4661478996276855} -08/30/2021 23:19:17 - INFO - __main__ - Step 56170: {'lr': 0.000352157425240149, 'samples': 10784640, 'steps': 56169, 'loss/train': 1.411795973777771} -08/30/2021 23:19:17 - INFO - __main__ - Step 56171: {'lr': 0.00035215258175018015, 'samples': 10784832, 'steps': 56170, 'loss/train': 1.772681713104248} -08/30/2021 23:19:18 - INFO - __main__ - Step 56172: {'lr': 0.00035214773821418295, 'samples': 10785024, 'steps': 56171, 'loss/train': 1.4317295551300049} -08/30/2021 23:19:19 - INFO - __main__ - Step 56173: {'lr': 0.00035214289463215954, 'samples': 10785216, 'steps': 56172, 'loss/train': 1.6848418712615967} -08/30/2021 23:19:20 - INFO - __main__ - Step 56174: {'lr': 0.00035213805100411217, 'samples': 10785408, 'steps': 56173, 'loss/train': 1.1198793649673462} -08/30/2021 23:19:20 - INFO - __main__ - Step 56175: {'lr': 0.00035213320733004297, 'samples': 10785600, 'steps': 56174, 'loss/train': 1.8251439332962036} -08/30/2021 23:19:20 - INFO - __main__ - Step 56176: {'lr': 0.00035212836360995405, 'samples': 10785792, 'steps': 56175, 'loss/train': 1.3288264274597168} -08/30/2021 23:19:21 - INFO - __main__ - Step 56177: {'lr': 0.0003521235198438477, 'samples': 10785984, 'steps': 56176, 'loss/train': 1.2904421091079712} -08/30/2021 23:19:21 - INFO - __main__ - Step 56178: {'lr': 0.000352118676031726, 'samples': 10786176, 'steps': 56177, 'loss/train': 1.4400594234466553} -08/30/2021 23:19:23 - INFO - __main__ - Step 56179: {'lr': 0.0003521138321735913, 'samples': 10786368, 'steps': 56178, 'loss/train': 1.3378797769546509} -08/30/2021 23:19:23 - INFO - __main__ - Step 56180: {'lr': 0.0003521089882694456, 'samples': 10786560, 'steps': 56179, 'loss/train': 1.5753055810928345} -08/30/2021 23:19:23 - INFO - __main__ - Step 56181: {'lr': 0.0003521041443192913, 'samples': 10786752, 'steps': 56180, 'loss/train': 1.7837469577789307} -08/30/2021 23:19:24 - INFO - __main__ - Step 56182: {'lr': 0.00035209930032313033, 'samples': 10786944, 'steps': 56181, 'loss/train': 1.1433008909225464} -08/30/2021 23:19:24 - INFO - __main__ - Step 56183: {'lr': 0.000352094456280965, 'samples': 10787136, 'steps': 56182, 'loss/train': 1.3171823024749756} -08/30/2021 23:19:26 - INFO - __main__ - Step 56184: {'lr': 0.0003520896121927975, 'samples': 10787328, 'steps': 56183, 'loss/train': 1.5922255516052246} -08/30/2021 23:19:26 - INFO - __main__ - Step 56185: {'lr': 0.00035208476805863, 'samples': 10787520, 'steps': 56184, 'loss/train': 0.9351261258125305} -08/30/2021 23:19:26 - INFO - __main__ - Step 56186: {'lr': 0.00035207992387846466, 'samples': 10787712, 'steps': 56185, 'loss/train': 1.7132059335708618} -08/30/2021 23:19:27 - INFO - __main__ - Step 56187: {'lr': 0.0003520750796523037, 'samples': 10787904, 'steps': 56186, 'loss/train': 1.6543177366256714} -08/30/2021 23:19:27 - INFO - __main__ - Step 56188: {'lr': 0.0003520702353801493, 'samples': 10788096, 'steps': 56187, 'loss/train': 1.239197850227356} -08/30/2021 23:19:28 - INFO - __main__ - Step 56189: {'lr': 0.0003520653910620036, 'samples': 10788288, 'steps': 56188, 'loss/train': 0.5263615846633911} -08/30/2021 23:19:29 - INFO - __main__ - Step 56190: {'lr': 0.0003520605466978688, 'samples': 10788480, 'steps': 56189, 'loss/train': 1.5944441556930542} -08/30/2021 23:19:30 - INFO - __main__ - Step 56191: {'lr': 0.00035205570228774715, 'samples': 10788672, 'steps': 56190, 'loss/train': 1.3017621040344238} -08/30/2021 23:19:30 - INFO - __main__ - Step 56192: {'lr': 0.0003520508578316407, 'samples': 10788864, 'steps': 56191, 'loss/train': 1.1193162202835083} -08/30/2021 23:19:31 - INFO - __main__ - Step 56193: {'lr': 0.0003520460133295518, 'samples': 10789056, 'steps': 56192, 'loss/train': 0.788877010345459} -08/30/2021 23:19:31 - INFO - __main__ - Step 56194: {'lr': 0.0003520411687814825, 'samples': 10789248, 'steps': 56193, 'loss/train': 1.5324747562408447} -08/30/2021 23:19:33 - INFO - __main__ - Step 56195: {'lr': 0.000352036324187435, 'samples': 10789440, 'steps': 56194, 'loss/train': 1.3240686655044556} -08/30/2021 23:19:33 - INFO - __main__ - Step 56196: {'lr': 0.0003520314795474115, 'samples': 10789632, 'steps': 56195, 'loss/train': 0.29671040177345276} -08/30/2021 23:19:34 - INFO - __main__ - Step 56197: {'lr': 0.00035202663486141417, 'samples': 10789824, 'steps': 56196, 'loss/train': 0.5146790146827698} -08/30/2021 23:19:34 - INFO - __main__ - Step 56198: {'lr': 0.00035202179012944527, 'samples': 10790016, 'steps': 56197, 'loss/train': 1.2441060543060303} -08/30/2021 23:19:34 - INFO - __main__ - Step 56199: {'lr': 0.0003520169453515069, 'samples': 10790208, 'steps': 56198, 'loss/train': 0.26361212134361267} -08/30/2021 23:19:36 - INFO - __main__ - Step 56200: {'lr': 0.00035201210052760123, 'samples': 10790400, 'steps': 56199, 'loss/train': 0.14536148309707642} -08/30/2021 23:19:36 - INFO - __main__ - Step 56201: {'lr': 0.0003520072556577306, 'samples': 10790592, 'steps': 56200, 'loss/train': 1.5028141736984253} -08/30/2021 23:19:37 - INFO - __main__ - Step 56202: {'lr': 0.000352002410741897, 'samples': 10790784, 'steps': 56201, 'loss/train': 0.7295525074005127} -08/30/2021 23:19:37 - INFO - __main__ - Step 56203: {'lr': 0.00035199756578010267, 'samples': 10790976, 'steps': 56202, 'loss/train': 1.3582055568695068} -08/30/2021 23:19:38 - INFO - __main__ - Step 56204: {'lr': 0.0003519927207723498, 'samples': 10791168, 'steps': 56203, 'loss/train': 0.6318374276161194} -08/30/2021 23:19:39 - INFO - __main__ - Step 56205: {'lr': 0.00035198787571864067, 'samples': 10791360, 'steps': 56204, 'loss/train': 0.31698113679885864} -08/30/2021 23:19:40 - INFO - __main__ - Step 56206: {'lr': 0.0003519830306189773, 'samples': 10791552, 'steps': 56205, 'loss/train': 1.2460066080093384} -08/30/2021 23:19:40 - INFO - __main__ - Step 56207: {'lr': 0.000351978185473362, 'samples': 10791744, 'steps': 56206, 'loss/train': 1.2279210090637207} -08/30/2021 23:19:40 - INFO - __main__ - Step 56208: {'lr': 0.0003519733402817968, 'samples': 10791936, 'steps': 56207, 'loss/train': 1.6996444463729858} -08/30/2021 23:19:41 - INFO - __main__ - Step 56209: {'lr': 0.0003519684950442841, 'samples': 10792128, 'steps': 56208, 'loss/train': 1.4328835010528564} -08/30/2021 23:19:42 - INFO - __main__ - Step 56210: {'lr': 0.00035196364976082593, 'samples': 10792320, 'steps': 56209, 'loss/train': 1.3060847520828247} -08/30/2021 23:19:43 - INFO - __main__ - Step 56211: {'lr': 0.0003519588044314245, 'samples': 10792512, 'steps': 56210, 'loss/train': 0.7972104549407959} -08/30/2021 23:19:43 - INFO - __main__ - Step 56212: {'lr': 0.000351953959056082, 'samples': 10792704, 'steps': 56211, 'loss/train': 1.6470961570739746} -08/30/2021 23:19:43 - INFO - __main__ - Step 56213: {'lr': 0.0003519491136348006, 'samples': 10792896, 'steps': 56212, 'loss/train': 1.480650544166565} -08/30/2021 23:19:44 - INFO - __main__ - Step 56214: {'lr': 0.0003519442681675826, 'samples': 10793088, 'steps': 56213, 'loss/train': 1.7162854671478271} -08/30/2021 23:19:45 - INFO - __main__ - Step 56215: {'lr': 0.00035193942265443, 'samples': 10793280, 'steps': 56214, 'loss/train': 1.61748468875885} -08/30/2021 23:19:46 - INFO - __main__ - Step 56216: {'lr': 0.0003519345770953452, 'samples': 10793472, 'steps': 56215, 'loss/train': 1.6915357112884521} -08/30/2021 23:19:46 - INFO - __main__ - Step 56217: {'lr': 0.00035192973149033007, 'samples': 10793664, 'steps': 56216, 'loss/train': 1.4703187942504883} -08/30/2021 23:19:46 - INFO - __main__ - Step 56218: {'lr': 0.0003519248858393871, 'samples': 10793856, 'steps': 56217, 'loss/train': 0.48813164234161377} -08/30/2021 23:19:47 - INFO - __main__ - Step 56219: {'lr': 0.0003519200401425183, 'samples': 10794048, 'steps': 56218, 'loss/train': 0.8728643655776978} -08/30/2021 23:19:49 - INFO - __main__ - Step 56220: {'lr': 0.0003519151943997259, 'samples': 10794240, 'steps': 56219, 'loss/train': 1.487473487854004} -08/30/2021 23:19:49 - INFO - __main__ - Step 56221: {'lr': 0.0003519103486110121, 'samples': 10794432, 'steps': 56220, 'loss/train': 1.0937063694000244} -08/30/2021 23:19:49 - INFO - __main__ - Step 56222: {'lr': 0.0003519055027763791, 'samples': 10794624, 'steps': 56221, 'loss/train': 0.11141691356897354} -08/30/2021 23:19:50 - INFO - __main__ - Step 56223: {'lr': 0.00035190065689582895, 'samples': 10794816, 'steps': 56222, 'loss/train': 0.18188953399658203} -08/30/2021 23:19:50 - INFO - __main__ - Step 56224: {'lr': 0.00035189581096936395, 'samples': 10795008, 'steps': 56223, 'loss/train': 0.844398021697998} -08/30/2021 23:19:50 - INFO - __main__ - Step 56225: {'lr': 0.0003518909649969864, 'samples': 10795200, 'steps': 56224, 'loss/train': 1.4655299186706543} -08/30/2021 23:19:52 - INFO - __main__ - Step 56226: {'lr': 0.00035188611897869824, 'samples': 10795392, 'steps': 56225, 'loss/train': 1.1828337907791138} -08/30/2021 23:19:52 - INFO - __main__ - Step 56227: {'lr': 0.00035188127291450183, 'samples': 10795584, 'steps': 56226, 'loss/train': 1.137499451637268} -08/30/2021 23:19:53 - INFO - __main__ - Step 56228: {'lr': 0.00035187642680439927, 'samples': 10795776, 'steps': 56227, 'loss/train': 0.6767659783363342} -08/30/2021 23:19:53 - INFO - __main__ - Step 56229: {'lr': 0.0003518715806483928, 'samples': 10795968, 'steps': 56228, 'loss/train': 1.9900949001312256} -08/30/2021 23:19:53 - INFO - __main__ - Step 56230: {'lr': 0.0003518667344464845, 'samples': 10796160, 'steps': 56229, 'loss/train': 1.5314913988113403} -08/30/2021 23:19:55 - INFO - __main__ - Step 56231: {'lr': 0.00035186188819867663, 'samples': 10796352, 'steps': 56230, 'loss/train': 1.2715846300125122} -08/30/2021 23:19:56 - INFO - __main__ - Step 56232: {'lr': 0.00035185704190497137, 'samples': 10796544, 'steps': 56231, 'loss/train': 1.6737961769104004} -08/30/2021 23:19:56 - INFO - __main__ - Step 56233: {'lr': 0.0003518521955653709, 'samples': 10796736, 'steps': 56232, 'loss/train': 1.781301498413086} -08/30/2021 23:19:56 - INFO - __main__ - Step 56234: {'lr': 0.0003518473491798774, 'samples': 10796928, 'steps': 56233, 'loss/train': 1.2351044416427612} -08/30/2021 23:19:57 - INFO - __main__ - Step 56235: {'lr': 0.00035184250274849306, 'samples': 10797120, 'steps': 56234, 'loss/train': 1.651589274406433} -08/30/2021 23:19:58 - INFO - __main__ - Step 56236: {'lr': 0.0003518376562712201, 'samples': 10797312, 'steps': 56235, 'loss/train': 0.6935270428657532} -08/30/2021 23:19:59 - INFO - __main__ - Step 56237: {'lr': 0.00035183280974806065, 'samples': 10797504, 'steps': 56236, 'loss/train': 0.6373516321182251} -08/30/2021 23:19:59 - INFO - __main__ - Step 56238: {'lr': 0.0003518279631790169, 'samples': 10797696, 'steps': 56237, 'loss/train': 1.2254695892333984} -08/30/2021 23:19:59 - INFO - __main__ - Step 56239: {'lr': 0.000351823116564091, 'samples': 10797888, 'steps': 56238, 'loss/train': 0.9763191342353821} -08/30/2021 23:20:00 - INFO - __main__ - Step 56240: {'lr': 0.0003518182699032852, 'samples': 10798080, 'steps': 56239, 'loss/train': 0.75439453125} -08/30/2021 23:20:01 - INFO - __main__ - Step 56241: {'lr': 0.0003518134231966017, 'samples': 10798272, 'steps': 56240, 'loss/train': 1.5486811399459839} -08/30/2021 23:20:02 - INFO - __main__ - Step 56242: {'lr': 0.0003518085764440426, 'samples': 10798464, 'steps': 56241, 'loss/train': 1.3664119243621826} -08/30/2021 23:20:02 - INFO - __main__ - Step 56243: {'lr': 0.00035180372964561013, 'samples': 10798656, 'steps': 56242, 'loss/train': 1.2818729877471924} -08/30/2021 23:20:02 - INFO - __main__ - Step 56244: {'lr': 0.00035179888280130646, 'samples': 10798848, 'steps': 56243, 'loss/train': 1.0736815929412842} -08/30/2021 23:20:03 - INFO - __main__ - Step 56245: {'lr': 0.00035179403591113377, 'samples': 10799040, 'steps': 56244, 'loss/train': 1.0455563068389893} -08/30/2021 23:20:05 - INFO - __main__ - Step 56246: {'lr': 0.0003517891889750943, 'samples': 10799232, 'steps': 56245, 'loss/train': 1.1921799182891846} -08/30/2021 23:20:05 - INFO - __main__ - Step 56247: {'lr': 0.0003517843419931902, 'samples': 10799424, 'steps': 56246, 'loss/train': 0.8170264959335327} -08/30/2021 23:20:06 - INFO - __main__ - Step 56248: {'lr': 0.0003517794949654236, 'samples': 10799616, 'steps': 56247, 'loss/train': 1.2851195335388184} -08/30/2021 23:20:06 - INFO - __main__ - Step 56249: {'lr': 0.00035177464789179675, 'samples': 10799808, 'steps': 56248, 'loss/train': 1.3435691595077515} -08/30/2021 23:20:06 - INFO - __main__ - Step 56250: {'lr': 0.0003517698007723118, 'samples': 10800000, 'steps': 56249, 'loss/train': 1.5542590618133545} -08/30/2021 23:20:08 - INFO - __main__ - Step 56251: {'lr': 0.00035176495360697096, 'samples': 10800192, 'steps': 56250, 'loss/train': 1.3107409477233887} -08/30/2021 23:20:08 - INFO - __main__ - Step 56252: {'lr': 0.0003517601063957764, 'samples': 10800384, 'steps': 56251, 'loss/train': 0.9203411340713501} -08/30/2021 23:20:09 - INFO - __main__ - Step 56253: {'lr': 0.0003517552591387303, 'samples': 10800576, 'steps': 56252, 'loss/train': 1.6615418195724487} -08/30/2021 23:20:09 - INFO - __main__ - Step 56254: {'lr': 0.0003517504118358349, 'samples': 10800768, 'steps': 56253, 'loss/train': 1.0183117389678955} -08/30/2021 23:20:09 - INFO - __main__ - Step 56255: {'lr': 0.0003517455644870923, 'samples': 10800960, 'steps': 56254, 'loss/train': 1.3904917240142822} -08/30/2021 23:20:11 - INFO - __main__ - Step 56256: {'lr': 0.00035174071709250475, 'samples': 10801152, 'steps': 56255, 'loss/train': 0.9888782501220703} -08/30/2021 23:20:11 - INFO - __main__ - Step 56257: {'lr': 0.00035173586965207436, 'samples': 10801344, 'steps': 56256, 'loss/train': 1.1724299192428589} -08/30/2021 23:20:12 - INFO - __main__ - Step 56258: {'lr': 0.0003517310221658033, 'samples': 10801536, 'steps': 56257, 'loss/train': 1.6633081436157227} -08/30/2021 23:20:12 - INFO - __main__ - Step 56259: {'lr': 0.00035172617463369397, 'samples': 10801728, 'steps': 56258, 'loss/train': 1.1430174112319946} -08/30/2021 23:20:12 - INFO - __main__ - Step 56260: {'lr': 0.0003517213270557482, 'samples': 10801920, 'steps': 56259, 'loss/train': 1.0456026792526245} -08/30/2021 23:20:14 - INFO - __main__ - Step 56261: {'lr': 0.00035171647943196854, 'samples': 10802112, 'steps': 56260, 'loss/train': 0.9139151573181152} -08/30/2021 23:20:14 - INFO - __main__ - Step 56262: {'lr': 0.00035171163176235694, 'samples': 10802304, 'steps': 56261, 'loss/train': 1.6453360319137573} -08/30/2021 23:20:15 - INFO - __main__ - Step 56263: {'lr': 0.00035170678404691563, 'samples': 10802496, 'steps': 56262, 'loss/train': 0.6549670100212097} -08/30/2021 23:20:15 - INFO - __main__ - Step 56264: {'lr': 0.00035170193628564683, 'samples': 10802688, 'steps': 56263, 'loss/train': 1.2884488105773926} -08/30/2021 23:20:15 - INFO - __main__ - Step 56265: {'lr': 0.0003516970884785527, 'samples': 10802880, 'steps': 56264, 'loss/train': 1.3687598705291748} -08/30/2021 23:20:17 - INFO - __main__ - Step 56266: {'lr': 0.00035169224062563543, 'samples': 10803072, 'steps': 56265, 'loss/train': 1.206392765045166} -08/30/2021 23:20:18 - INFO - __main__ - Step 56267: {'lr': 0.0003516873927268972, 'samples': 10803264, 'steps': 56266, 'loss/train': 1.0268909931182861} -08/30/2021 23:20:18 - INFO - __main__ - Step 56268: {'lr': 0.0003516825447823403, 'samples': 10803456, 'steps': 56267, 'loss/train': 0.7114416360855103} -08/30/2021 23:20:19 - INFO - __main__ - Step 56269: {'lr': 0.0003516776967919667, 'samples': 10803648, 'steps': 56268, 'loss/train': 0.028562083840370178} -08/30/2021 23:20:19 - INFO - __main__ - Step 56270: {'lr': 0.0003516728487557787, 'samples': 10803840, 'steps': 56269, 'loss/train': 3.810262441635132} -08/30/2021 23:20:19 - INFO - __main__ - Step 56271: {'lr': 0.00035166800067377855, 'samples': 10804032, 'steps': 56270, 'loss/train': 0.9921672344207764} -08/30/2021 23:20:20 - INFO - __main__ - Step 56272: {'lr': 0.00035166315254596826, 'samples': 10804224, 'steps': 56271, 'loss/train': 1.1992790699005127} -08/30/2021 23:20:21 - INFO - __main__ - Step 56273: {'lr': 0.0003516583043723502, 'samples': 10804416, 'steps': 56272, 'loss/train': 1.5328330993652344} -08/30/2021 23:20:22 - INFO - __main__ - Step 56274: {'lr': 0.0003516534561529264, 'samples': 10804608, 'steps': 56273, 'loss/train': 0.9591448307037354} -08/30/2021 23:20:22 - INFO - __main__ - Step 56275: {'lr': 0.00035164860788769925, 'samples': 10804800, 'steps': 56274, 'loss/train': 1.5115023851394653} -08/30/2021 23:20:22 - INFO - __main__ - Step 56276: {'lr': 0.0003516437595766708, 'samples': 10804992, 'steps': 56275, 'loss/train': 1.0127558708190918} -08/30/2021 23:20:23 - INFO - __main__ - Step 56277: {'lr': 0.00035163891121984316, 'samples': 10805184, 'steps': 56276, 'loss/train': 1.7689074277877808} -08/30/2021 23:20:24 - INFO - __main__ - Step 56278: {'lr': 0.0003516340628172186, 'samples': 10805376, 'steps': 56277, 'loss/train': 1.2849451303482056} -08/30/2021 23:20:25 - INFO - __main__ - Step 56279: {'lr': 0.0003516292143687993, 'samples': 10805568, 'steps': 56278, 'loss/train': 1.4143896102905273} -08/30/2021 23:20:25 - INFO - __main__ - Step 56280: {'lr': 0.00035162436587458744, 'samples': 10805760, 'steps': 56279, 'loss/train': 0.24738809466362} -08/30/2021 23:20:25 - INFO - __main__ - Step 56281: {'lr': 0.0003516195173345853, 'samples': 10805952, 'steps': 56280, 'loss/train': 0.4486299157142639} -08/30/2021 23:20:26 - INFO - __main__ - Step 56282: {'lr': 0.0003516146687487949, 'samples': 10806144, 'steps': 56281, 'loss/train': 0.7672046422958374} -08/30/2021 23:20:28 - INFO - __main__ - Step 56283: {'lr': 0.0003516098201172185, 'samples': 10806336, 'steps': 56282, 'loss/train': 0.9187241792678833} -08/30/2021 23:20:28 - INFO - __main__ - Step 56284: {'lr': 0.00035160497143985823, 'samples': 10806528, 'steps': 56283, 'loss/train': 1.5133743286132812} -08/30/2021 23:20:28 - INFO - __main__ - Step 56285: {'lr': 0.0003516001227167164, 'samples': 10806720, 'steps': 56284, 'loss/train': 0.8918207883834839} -08/30/2021 23:20:29 - INFO - __main__ - Step 56286: {'lr': 0.0003515952739477951, 'samples': 10806912, 'steps': 56285, 'loss/train': 0.6635756492614746} -08/30/2021 23:20:29 - INFO - __main__ - Step 56287: {'lr': 0.0003515904251330965, 'samples': 10807104, 'steps': 56286, 'loss/train': 0.9633187651634216} -08/30/2021 23:20:31 - INFO - __main__ - Step 56288: {'lr': 0.00035158557627262295, 'samples': 10807296, 'steps': 56287, 'loss/train': 1.0384821891784668} -08/30/2021 23:20:31 - INFO - __main__ - Step 56289: {'lr': 0.00035158072736637643, 'samples': 10807488, 'steps': 56288, 'loss/train': 1.444690465927124} -08/30/2021 23:20:31 - INFO - __main__ - Step 56290: {'lr': 0.0003515758784143592, 'samples': 10807680, 'steps': 56289, 'loss/train': 0.9422166347503662} -08/30/2021 23:20:32 - INFO - __main__ - Step 56291: {'lr': 0.00035157102941657336, 'samples': 10807872, 'steps': 56290, 'loss/train': 1.3602656126022339} -08/30/2021 23:20:32 - INFO - __main__ - Step 56292: {'lr': 0.0003515661803730213, 'samples': 10808064, 'steps': 56291, 'loss/train': 0.9585633873939514} -08/30/2021 23:20:32 - INFO - __main__ - Step 56293: {'lr': 0.000351561331283705, 'samples': 10808256, 'steps': 56292, 'loss/train': 1.4210909605026245} -08/30/2021 23:20:34 - INFO - __main__ - Step 56294: {'lr': 0.0003515564821486268, 'samples': 10808448, 'steps': 56293, 'loss/train': 1.1082032918930054} -08/30/2021 23:20:35 - INFO - __main__ - Step 56295: {'lr': 0.00035155163296778883, 'samples': 10808640, 'steps': 56294, 'loss/train': 1.853243112564087} -08/30/2021 23:20:35 - INFO - __main__ - Step 56296: {'lr': 0.0003515467837411932, 'samples': 10808832, 'steps': 56295, 'loss/train': 1.3389308452606201} -08/30/2021 23:20:35 - INFO - __main__ - Step 56297: {'lr': 0.0003515419344688422, 'samples': 10809024, 'steps': 56296, 'loss/train': 1.6399043798446655} -08/30/2021 23:20:36 - INFO - __main__ - Step 56298: {'lr': 0.00035153708515073793, 'samples': 10809216, 'steps': 56297, 'loss/train': 1.5292176008224487} -08/30/2021 23:20:38 - INFO - __main__ - Step 56299: {'lr': 0.00035153223578688263, 'samples': 10809408, 'steps': 56298, 'loss/train': 0.882011890411377} -08/30/2021 23:20:39 - INFO - __main__ - Step 56300: {'lr': 0.0003515273863772785, 'samples': 10809600, 'steps': 56299, 'loss/train': 0.8975883722305298} -08/30/2021 23:20:39 - INFO - __main__ - Step 56301: {'lr': 0.00035152253692192765, 'samples': 10809792, 'steps': 56300, 'loss/train': 1.4098734855651855} -08/30/2021 23:20:39 - INFO - __main__ - Step 56302: {'lr': 0.0003515176874208324, 'samples': 10809984, 'steps': 56301, 'loss/train': 1.7833385467529297} -08/30/2021 23:20:40 - INFO - __main__ - Step 56303: {'lr': 0.0003515128378739948, 'samples': 10810176, 'steps': 56302, 'loss/train': 1.7411781549453735} -08/30/2021 23:20:42 - INFO - __main__ - Step 56304: {'lr': 0.0003515079882814171, 'samples': 10810368, 'steps': 56303, 'loss/train': 1.065727949142456} -08/30/2021 23:20:42 - INFO - __main__ - Step 56305: {'lr': 0.00035150313864310137, 'samples': 10810560, 'steps': 56304, 'loss/train': 1.5781422853469849} -08/30/2021 23:20:42 - INFO - __main__ - Step 56306: {'lr': 0.00035149828895904994, 'samples': 10810752, 'steps': 56305, 'loss/train': 1.477195382118225} -08/30/2021 23:20:43 - INFO - __main__ - Step 56307: {'lr': 0.00035149343922926497, 'samples': 10810944, 'steps': 56306, 'loss/train': 0.04176757112145424} -08/30/2021 23:20:43 - INFO - __main__ - Step 56308: {'lr': 0.0003514885894537486, 'samples': 10811136, 'steps': 56307, 'loss/train': 0.04284767806529999} -08/30/2021 23:20:43 - INFO - __main__ - Step 56309: {'lr': 0.00035148373963250307, 'samples': 10811328, 'steps': 56308, 'loss/train': 1.548675537109375} -08/30/2021 23:20:44 - INFO - __main__ - Step 56310: {'lr': 0.0003514788897655305, 'samples': 10811520, 'steps': 56309, 'loss/train': 1.342390537261963} -08/30/2021 23:20:46 - INFO - __main__ - Step 56311: {'lr': 0.0003514740398528331, 'samples': 10811712, 'steps': 56310, 'loss/train': 1.5789802074432373} -08/30/2021 23:20:46 - INFO - __main__ - Step 56312: {'lr': 0.0003514691898944131, 'samples': 10811904, 'steps': 56311, 'loss/train': 0.7250506281852722} -08/30/2021 23:20:46 - INFO - __main__ - Step 56313: {'lr': 0.0003514643398902727, 'samples': 10812096, 'steps': 56312, 'loss/train': 0.9135230779647827} -08/30/2021 23:20:47 - INFO - __main__ - Step 56314: {'lr': 0.00035145948984041393, 'samples': 10812288, 'steps': 56313, 'loss/train': 1.0178760290145874} -08/30/2021 23:20:47 - INFO - __main__ - Step 56315: {'lr': 0.00035145463974483915, 'samples': 10812480, 'steps': 56314, 'loss/train': 0.05449938401579857} -08/30/2021 23:20:48 - INFO - __main__ - Step 56316: {'lr': 0.00035144978960355045, 'samples': 10812672, 'steps': 56315, 'loss/train': 1.1534762382507324} -08/30/2021 23:20:49 - INFO - __main__ - Step 56317: {'lr': 0.00035144493941655, 'samples': 10812864, 'steps': 56316, 'loss/train': 0.04490484297275543} -08/30/2021 23:20:49 - INFO - __main__ - Step 56318: {'lr': 0.00035144008918384006, 'samples': 10813056, 'steps': 56317, 'loss/train': 0.7149926424026489} -08/30/2021 23:20:50 - INFO - __main__ - Step 56319: {'lr': 0.0003514352389054228, 'samples': 10813248, 'steps': 56318, 'loss/train': 1.9637274742126465} -08/30/2021 23:20:50 - INFO - __main__ - Step 56320: {'lr': 0.00035143038858130034, 'samples': 10813440, 'steps': 56319, 'loss/train': 1.1326920986175537} -08/30/2021 23:20:50 - INFO - __main__ - Step 56321: {'lr': 0.00035142553821147494, 'samples': 10813632, 'steps': 56320, 'loss/train': 0.5537501573562622} -08/30/2021 23:20:52 - INFO - __main__ - Step 56322: {'lr': 0.00035142068779594885, 'samples': 10813824, 'steps': 56321, 'loss/train': 1.706468939781189} -08/30/2021 23:20:52 - INFO - __main__ - Step 56323: {'lr': 0.00035141583733472407, 'samples': 10814016, 'steps': 56322, 'loss/train': 0.6052045822143555} -08/30/2021 23:20:53 - INFO - __main__ - Step 56324: {'lr': 0.0003514109868278028, 'samples': 10814208, 'steps': 56323, 'loss/train': 0.7911117076873779} -08/30/2021 23:20:53 - INFO - __main__ - Step 56325: {'lr': 0.0003514061362751874, 'samples': 10814400, 'steps': 56324, 'loss/train': 1.2599706649780273} -08/30/2021 23:20:54 - INFO - __main__ - Step 56326: {'lr': 0.0003514012856768799, 'samples': 10814592, 'steps': 56325, 'loss/train': 1.321623682975769} -08/30/2021 23:20:55 - INFO - __main__ - Step 56327: {'lr': 0.0003513964350328826, 'samples': 10814784, 'steps': 56326, 'loss/train': 2.7075531482696533} -08/30/2021 23:20:55 - INFO - __main__ - Step 56328: {'lr': 0.0003513915843431977, 'samples': 10814976, 'steps': 56327, 'loss/train': 1.152888536453247} -08/30/2021 23:20:56 - INFO - __main__ - Step 56329: {'lr': 0.0003513867336078272, 'samples': 10815168, 'steps': 56328, 'loss/train': 1.200417399406433} -08/30/2021 23:20:56 - INFO - __main__ - Step 56330: {'lr': 0.00035138188282677344, 'samples': 10815360, 'steps': 56329, 'loss/train': 1.5218689441680908} -08/30/2021 23:20:56 - INFO - __main__ - Step 56331: {'lr': 0.00035137703200003857, 'samples': 10815552, 'steps': 56330, 'loss/train': 1.597712516784668} -08/30/2021 23:20:58 - INFO - __main__ - Step 56332: {'lr': 0.00035137218112762475, 'samples': 10815744, 'steps': 56331, 'loss/train': 0.7616521120071411} -08/30/2021 23:20:58 - INFO - __main__ - Step 56333: {'lr': 0.0003513673302095342, 'samples': 10815936, 'steps': 56332, 'loss/train': 1.5828900337219238} -08/30/2021 23:20:59 - INFO - __main__ - Step 56334: {'lr': 0.0003513624792457691, 'samples': 10816128, 'steps': 56333, 'loss/train': 1.4141948223114014} -08/30/2021 23:20:59 - INFO - __main__ - Step 56335: {'lr': 0.00035135762823633167, 'samples': 10816320, 'steps': 56334, 'loss/train': 1.3798741102218628} -08/30/2021 23:20:59 - INFO - __main__ - Step 56336: {'lr': 0.00035135277718122403, 'samples': 10816512, 'steps': 56335, 'loss/train': 1.0160465240478516} -08/30/2021 23:21:01 - INFO - __main__ - Step 56337: {'lr': 0.0003513479260804484, 'samples': 10816704, 'steps': 56336, 'loss/train': 1.274591326713562} -08/30/2021 23:21:01 - INFO - __main__ - Step 56338: {'lr': 0.0003513430749340069, 'samples': 10816896, 'steps': 56337, 'loss/train': 0.8275808691978455} -08/30/2021 23:21:02 - INFO - __main__ - Step 56339: {'lr': 0.0003513382237419018, 'samples': 10817088, 'steps': 56338, 'loss/train': 1.0999596118927002} -08/30/2021 23:21:02 - INFO - __main__ - Step 56340: {'lr': 0.00035133337250413534, 'samples': 10817280, 'steps': 56339, 'loss/train': 1.9294317960739136} -08/30/2021 23:21:02 - INFO - __main__ - Step 56341: {'lr': 0.00035132852122070953, 'samples': 10817472, 'steps': 56340, 'loss/train': 0.9169614911079407} -08/30/2021 23:21:03 - INFO - __main__ - Step 56342: {'lr': 0.0003513236698916267, 'samples': 10817664, 'steps': 56341, 'loss/train': 1.5714478492736816} -08/30/2021 23:21:05 - INFO - __main__ - Step 56343: {'lr': 0.00035131881851688896, 'samples': 10817856, 'steps': 56342, 'loss/train': 0.48499056696891785} -08/30/2021 23:21:05 - INFO - __main__ - Step 56344: {'lr': 0.00035131396709649855, 'samples': 10818048, 'steps': 56343, 'loss/train': 1.3771110773086548} -08/30/2021 23:21:06 - INFO - __main__ - Step 56345: {'lr': 0.00035130911563045764, 'samples': 10818240, 'steps': 56344, 'loss/train': 1.4886866807937622} -08/30/2021 23:21:06 - INFO - __main__ - Step 56346: {'lr': 0.00035130426411876834, 'samples': 10818432, 'steps': 56345, 'loss/train': 0.8399190306663513} -08/30/2021 23:21:06 - INFO - __main__ - Step 56347: {'lr': 0.00035129941256143295, 'samples': 10818624, 'steps': 56346, 'loss/train': 2.588120222091675} -08/30/2021 23:21:07 - INFO - __main__ - Step 56348: {'lr': 0.0003512945609584536, 'samples': 10818816, 'steps': 56347, 'loss/train': 0.9279683232307434} -08/30/2021 23:21:09 - INFO - __main__ - Step 56349: {'lr': 0.0003512897093098325, 'samples': 10819008, 'steps': 56348, 'loss/train': 0.05068553611636162} -08/30/2021 23:21:09 - INFO - __main__ - Step 56350: {'lr': 0.0003512848576155718, 'samples': 10819200, 'steps': 56349, 'loss/train': 1.3194245100021362} -08/30/2021 23:21:09 - INFO - __main__ - Step 56351: {'lr': 0.0003512800058756738, 'samples': 10819392, 'steps': 56350, 'loss/train': 0.02751103788614273} -08/30/2021 23:21:10 - INFO - __main__ - Step 56352: {'lr': 0.00035127515409014046, 'samples': 10819584, 'steps': 56351, 'loss/train': 1.3289200067520142} -08/30/2021 23:21:10 - INFO - __main__ - Step 56353: {'lr': 0.00035127030225897413, 'samples': 10819776, 'steps': 56352, 'loss/train': 1.2871557474136353} -08/30/2021 23:21:10 - INFO - __main__ - Step 56354: {'lr': 0.000351265450382177, 'samples': 10819968, 'steps': 56353, 'loss/train': 1.5532402992248535} -08/30/2021 23:21:12 - INFO - __main__ - Step 56355: {'lr': 0.0003512605984597512, 'samples': 10820160, 'steps': 56354, 'loss/train': 1.0814402103424072} -08/30/2021 23:21:12 - INFO - __main__ - Step 56356: {'lr': 0.00035125574649169894, 'samples': 10820352, 'steps': 56355, 'loss/train': 1.309942364692688} -08/30/2021 23:21:13 - INFO - __main__ - Step 56357: {'lr': 0.0003512508944780224, 'samples': 10820544, 'steps': 56356, 'loss/train': 0.991716742515564} -08/30/2021 23:21:13 - INFO - __main__ - Step 56358: {'lr': 0.0003512460424187237, 'samples': 10820736, 'steps': 56357, 'loss/train': 1.267741322517395} -08/30/2021 23:21:13 - INFO - __main__ - Step 56359: {'lr': 0.00035124119031380526, 'samples': 10820928, 'steps': 56358, 'loss/train': 1.6119405031204224} -08/30/2021 23:21:15 - INFO - __main__ - Step 56360: {'lr': 0.000351236338163269, 'samples': 10821120, 'steps': 56359, 'loss/train': 1.0107890367507935} -08/30/2021 23:21:16 - INFO - __main__ - Step 56361: {'lr': 0.00035123148596711716, 'samples': 10821312, 'steps': 56360, 'loss/train': 0.6051582098007202} -08/30/2021 23:21:16 - INFO - __main__ - Step 56362: {'lr': 0.0003512266337253521, 'samples': 10821504, 'steps': 56361, 'loss/train': 1.6000652313232422} -08/30/2021 23:21:16 - INFO - __main__ - Step 56363: {'lr': 0.0003512217814379758, 'samples': 10821696, 'steps': 56362, 'loss/train': 1.2335125207901} -08/30/2021 23:21:17 - INFO - __main__ - Step 56364: {'lr': 0.0003512169291049905, 'samples': 10821888, 'steps': 56363, 'loss/train': 1.6763275861740112} -08/30/2021 23:21:18 - INFO - __main__ - Step 56365: {'lr': 0.0003512120767263985, 'samples': 10822080, 'steps': 56364, 'loss/train': 1.0438852310180664} -08/30/2021 23:21:19 - INFO - __main__ - Step 56366: {'lr': 0.0003512072243022018, 'samples': 10822272, 'steps': 56365, 'loss/train': 1.2271020412445068} -08/30/2021 23:21:19 - INFO - __main__ - Step 56367: {'lr': 0.00035120237183240276, 'samples': 10822464, 'steps': 56366, 'loss/train': 0.9846289157867432} -08/30/2021 23:21:19 - INFO - __main__ - Step 56368: {'lr': 0.00035119751931700344, 'samples': 10822656, 'steps': 56367, 'loss/train': 1.552603006362915} -08/30/2021 23:21:20 - INFO - __main__ - Step 56369: {'lr': 0.00035119266675600615, 'samples': 10822848, 'steps': 56368, 'loss/train': 1.2388850450515747} -08/30/2021 23:21:21 - INFO - __main__ - Step 56370: {'lr': 0.00035118781414941296, 'samples': 10823040, 'steps': 56369, 'loss/train': 1.216059923171997} -08/30/2021 23:21:22 - INFO - __main__ - Step 56371: {'lr': 0.00035118296149722614, 'samples': 10823232, 'steps': 56370, 'loss/train': 2.545923948287964} -08/30/2021 23:21:22 - INFO - __main__ - Step 56372: {'lr': 0.0003511781087994478, 'samples': 10823424, 'steps': 56371, 'loss/train': 0.9165162444114685} -08/30/2021 23:21:23 - INFO - __main__ - Step 56373: {'lr': 0.00035117325605608013, 'samples': 10823616, 'steps': 56372, 'loss/train': 1.1739851236343384} -08/30/2021 23:21:23 - INFO - __main__ - Step 56374: {'lr': 0.0003511684032671254, 'samples': 10823808, 'steps': 56373, 'loss/train': 0.2769080102443695} -08/30/2021 23:21:23 - INFO - __main__ - Step 56375: {'lr': 0.0003511635504325857, 'samples': 10824000, 'steps': 56374, 'loss/train': 1.0504651069641113} -08/30/2021 23:21:25 - INFO - __main__ - Step 56376: {'lr': 0.0003511586975524634, 'samples': 10824192, 'steps': 56375, 'loss/train': 1.4656623601913452} -08/30/2021 23:21:26 - INFO - __main__ - Step 56377: {'lr': 0.0003511538446267604, 'samples': 10824384, 'steps': 56376, 'loss/train': 1.472334384918213} -08/30/2021 23:21:26 - INFO - __main__ - Step 56378: {'lr': 0.00035114899165547916, 'samples': 10824576, 'steps': 56377, 'loss/train': 1.6079140901565552} -08/30/2021 23:21:26 - INFO - __main__ - Step 56379: {'lr': 0.00035114413863862164, 'samples': 10824768, 'steps': 56378, 'loss/train': 0.03344573825597763} -08/30/2021 23:21:27 - INFO - __main__ - Step 56380: {'lr': 0.0003511392855761902, 'samples': 10824960, 'steps': 56379, 'loss/train': 0.03081243485212326} -08/30/2021 23:21:28 - INFO - __main__ - Step 56381: {'lr': 0.0003511344324681869, 'samples': 10825152, 'steps': 56380, 'loss/train': 1.1805614233016968} -08/30/2021 23:21:28 - INFO - __main__ - Step 56382: {'lr': 0.00035112957931461407, 'samples': 10825344, 'steps': 56381, 'loss/train': 1.4443172216415405} -08/30/2021 23:21:29 - INFO - __main__ - Step 56383: {'lr': 0.00035112472611547376, 'samples': 10825536, 'steps': 56382, 'loss/train': 1.27548086643219} -08/30/2021 23:21:29 - INFO - __main__ - Step 56384: {'lr': 0.0003511198728707682, 'samples': 10825728, 'steps': 56383, 'loss/train': 1.2274144887924194} -08/30/2021 23:21:30 - INFO - __main__ - Step 56385: {'lr': 0.0003511150195804996, 'samples': 10825920, 'steps': 56384, 'loss/train': 1.4640270471572876} -08/30/2021 23:21:31 - INFO - __main__ - Step 56386: {'lr': 0.00035111016624467007, 'samples': 10826112, 'steps': 56385, 'loss/train': 1.3278813362121582} -08/30/2021 23:21:31 - INFO - __main__ - Step 56387: {'lr': 0.00035110531286328193, 'samples': 10826304, 'steps': 56386, 'loss/train': 1.2180472612380981} -08/30/2021 23:21:32 - INFO - __main__ - Step 56388: {'lr': 0.0003511004594363373, 'samples': 10826496, 'steps': 56387, 'loss/train': 1.208565592765808} -08/30/2021 23:21:32 - INFO - __main__ - Step 56389: {'lr': 0.0003510956059638384, 'samples': 10826688, 'steps': 56388, 'loss/train': 1.4527655839920044} -08/30/2021 23:21:33 - INFO - __main__ - Step 56390: {'lr': 0.0003510907524457873, 'samples': 10826880, 'steps': 56389, 'loss/train': 1.8823432922363281} -08/30/2021 23:21:34 - INFO - __main__ - Step 56391: {'lr': 0.0003510858988821863, 'samples': 10827072, 'steps': 56390, 'loss/train': 1.5455334186553955} -08/30/2021 23:21:34 - INFO - __main__ - Step 56392: {'lr': 0.00035108104527303754, 'samples': 10827264, 'steps': 56391, 'loss/train': 1.289292812347412} -08/30/2021 23:21:35 - INFO - __main__ - Step 56393: {'lr': 0.0003510761916183432, 'samples': 10827456, 'steps': 56392, 'loss/train': 1.3379442691802979} -08/30/2021 23:21:35 - INFO - __main__ - Step 56394: {'lr': 0.00035107133791810555, 'samples': 10827648, 'steps': 56393, 'loss/train': 1.9926207065582275} -08/30/2021 23:21:36 - INFO - __main__ - Step 56395: {'lr': 0.00035106648417232666, 'samples': 10827840, 'steps': 56394, 'loss/train': 1.126552700996399} -08/30/2021 23:21:36 - INFO - __main__ - Step 56396: {'lr': 0.0003510616303810088, 'samples': 10828032, 'steps': 56395, 'loss/train': 2.8981428146362305} -08/30/2021 23:21:38 - INFO - __main__ - Step 56397: {'lr': 0.00035105677654415416, 'samples': 10828224, 'steps': 56396, 'loss/train': 1.3787848949432373} -08/30/2021 23:21:38 - INFO - __main__ - Step 56398: {'lr': 0.0003510519226617648, 'samples': 10828416, 'steps': 56397, 'loss/train': 1.388511061668396} -08/30/2021 23:21:38 - INFO - __main__ - Step 56399: {'lr': 0.00035104706873384305, 'samples': 10828608, 'steps': 56398, 'loss/train': 1.3289058208465576} -08/30/2021 23:21:39 - INFO - __main__ - Step 56400: {'lr': 0.0003510422147603911, 'samples': 10828800, 'steps': 56399, 'loss/train': 0.04551689699292183} -08/30/2021 23:21:39 - INFO - __main__ - Step 56401: {'lr': 0.00035103736074141103, 'samples': 10828992, 'steps': 56400, 'loss/train': 1.2905093431472778} -08/30/2021 23:21:41 - INFO - __main__ - Step 56402: {'lr': 0.0003510325066769051, 'samples': 10829184, 'steps': 56401, 'loss/train': 1.3818747997283936} -08/30/2021 23:21:41 - INFO - __main__ - Step 56403: {'lr': 0.00035102765256687555, 'samples': 10829376, 'steps': 56402, 'loss/train': 5.8501877784729} -08/30/2021 23:21:41 - INFO - __main__ - Step 56404: {'lr': 0.0003510227984113244, 'samples': 10829568, 'steps': 56403, 'loss/train': 0.8995800018310547} -08/30/2021 23:21:42 - INFO - __main__ - Step 56405: {'lr': 0.00035101794421025395, 'samples': 10829760, 'steps': 56404, 'loss/train': 1.3171738386154175} -08/30/2021 23:21:42 - INFO - __main__ - Step 56406: {'lr': 0.00035101308996366635, 'samples': 10829952, 'steps': 56405, 'loss/train': 1.2439517974853516} -08/30/2021 23:21:44 - INFO - __main__ - Step 56407: {'lr': 0.00035100823567156385, 'samples': 10830144, 'steps': 56406, 'loss/train': 1.37333345413208} -08/30/2021 23:21:44 - INFO - __main__ - Step 56408: {'lr': 0.0003510033813339486, 'samples': 10830336, 'steps': 56407, 'loss/train': 1.2654346227645874} -08/30/2021 23:21:44 - INFO - __main__ - Step 56409: {'lr': 0.00035099852695082286, 'samples': 10830528, 'steps': 56408, 'loss/train': 1.1296823024749756} -08/30/2021 23:21:45 - INFO - __main__ - Step 56410: {'lr': 0.0003509936725221886, 'samples': 10830720, 'steps': 56409, 'loss/train': 1.2942525148391724} -08/30/2021 23:21:45 - INFO - __main__ - Step 56411: {'lr': 0.0003509888180480483, 'samples': 10830912, 'steps': 56410, 'loss/train': 1.6736493110656738} -08/30/2021 23:21:45 - INFO - __main__ - Step 56412: {'lr': 0.00035098396352840384, 'samples': 10831104, 'steps': 56411, 'loss/train': 1.037999153137207} -08/30/2021 23:21:48 - INFO - __main__ - Step 56413: {'lr': 0.00035097910896325765, 'samples': 10831296, 'steps': 56412, 'loss/train': 1.4722040891647339} -08/30/2021 23:21:48 - INFO - __main__ - Step 56414: {'lr': 0.0003509742543526118, 'samples': 10831488, 'steps': 56413, 'loss/train': 1.3150835037231445} -08/30/2021 23:21:48 - INFO - __main__ - Step 56415: {'lr': 0.00035096939969646854, 'samples': 10831680, 'steps': 56414, 'loss/train': 0.40805065631866455} -08/30/2021 23:21:49 - INFO - __main__ - Step 56416: {'lr': 0.00035096454499483, 'samples': 10831872, 'steps': 56415, 'loss/train': 0.9750242233276367} -08/30/2021 23:21:49 - INFO - __main__ - Step 56417: {'lr': 0.0003509596902476985, 'samples': 10832064, 'steps': 56416, 'loss/train': 1.2096073627471924} -08/30/2021 23:21:51 - INFO - __main__ - Step 56418: {'lr': 0.000350954835455076, 'samples': 10832256, 'steps': 56417, 'loss/train': 1.6839812994003296} -08/30/2021 23:21:51 - INFO - __main__ - Step 56419: {'lr': 0.00035094998061696483, 'samples': 10832448, 'steps': 56418, 'loss/train': 1.9249850511550903} -08/30/2021 23:21:52 - INFO - __main__ - Step 56420: {'lr': 0.0003509451257333671, 'samples': 10832640, 'steps': 56419, 'loss/train': 0.9475346803665161} -08/30/2021 23:21:52 - INFO - __main__ - Step 56421: {'lr': 0.00035094027080428514, 'samples': 10832832, 'steps': 56420, 'loss/train': 1.3457587957382202} -08/30/2021 23:21:52 - INFO - __main__ - Step 56422: {'lr': 0.00035093541582972105, 'samples': 10833024, 'steps': 56421, 'loss/train': 0.9765965342521667} -08/30/2021 23:21:54 - INFO - __main__ - Step 56423: {'lr': 0.000350930560809677, 'samples': 10833216, 'steps': 56422, 'loss/train': 1.2351179122924805} -08/30/2021 23:21:54 - INFO - __main__ - Step 56424: {'lr': 0.0003509257057441552, 'samples': 10833408, 'steps': 56423, 'loss/train': 1.6799372434616089} -08/30/2021 23:21:55 - INFO - __main__ - Step 56425: {'lr': 0.00035092085063315783, 'samples': 10833600, 'steps': 56424, 'loss/train': 1.5770337581634521} -08/30/2021 23:21:55 - INFO - __main__ - Step 56426: {'lr': 0.00035091599547668707, 'samples': 10833792, 'steps': 56425, 'loss/train': 1.8400212526321411} -08/30/2021 23:21:55 - INFO - __main__ - Step 56427: {'lr': 0.00035091114027474514, 'samples': 10833984, 'steps': 56426, 'loss/train': 1.5495290756225586} -08/30/2021 23:21:56 - INFO - __main__ - Step 56428: {'lr': 0.0003509062850273342, 'samples': 10834176, 'steps': 56427, 'loss/train': 0.5808155536651611} -08/30/2021 23:21:57 - INFO - __main__ - Step 56429: {'lr': 0.0003509014297344565, 'samples': 10834368, 'steps': 56428, 'loss/train': 1.4561634063720703} -08/30/2021 23:21:58 - INFO - __main__ - Step 56430: {'lr': 0.0003508965743961141, 'samples': 10834560, 'steps': 56429, 'loss/train': 0.9111874103546143} -08/30/2021 23:21:58 - INFO - __main__ - Step 56431: {'lr': 0.00035089171901230926, 'samples': 10834752, 'steps': 56430, 'loss/train': 1.1718239784240723} -08/30/2021 23:21:59 - INFO - __main__ - Step 56432: {'lr': 0.0003508868635830442, 'samples': 10834944, 'steps': 56431, 'loss/train': 1.7609952688217163} -08/30/2021 23:21:59 - INFO - __main__ - Step 56433: {'lr': 0.00035088200810832104, 'samples': 10835136, 'steps': 56432, 'loss/train': 0.9224588871002197} -08/30/2021 23:22:00 - INFO - __main__ - Step 56434: {'lr': 0.00035087715258814203, 'samples': 10835328, 'steps': 56433, 'loss/train': 0.3581213653087616} -08/30/2021 23:22:01 - INFO - __main__ - Step 56435: {'lr': 0.00035087229702250936, 'samples': 10835520, 'steps': 56434, 'loss/train': 1.6546635627746582} -08/30/2021 23:22:01 - INFO - __main__ - Step 56436: {'lr': 0.00035086744141142514, 'samples': 10835712, 'steps': 56435, 'loss/train': 0.5147892236709595} -08/30/2021 23:22:02 - INFO - __main__ - Step 56437: {'lr': 0.0003508625857548916, 'samples': 10835904, 'steps': 56436, 'loss/train': 0.7432236671447754} -08/30/2021 23:22:02 - INFO - __main__ - Step 56438: {'lr': 0.000350857730052911, 'samples': 10836096, 'steps': 56437, 'loss/train': 1.392895221710205} -08/30/2021 23:22:04 - INFO - __main__ - Step 56439: {'lr': 0.0003508528743054854, 'samples': 10836288, 'steps': 56438, 'loss/train': 1.4067773818969727} -08/30/2021 23:22:04 - INFO - __main__ - Step 56440: {'lr': 0.00035084801851261707, 'samples': 10836480, 'steps': 56439, 'loss/train': 1.563826322555542} -08/30/2021 23:22:04 - INFO - __main__ - Step 56441: {'lr': 0.00035084316267430815, 'samples': 10836672, 'steps': 56440, 'loss/train': 1.4754047393798828} -08/30/2021 23:22:05 - INFO - __main__ - Step 56442: {'lr': 0.0003508383067905609, 'samples': 10836864, 'steps': 56441, 'loss/train': 1.0166155099868774} -08/30/2021 23:22:05 - INFO - __main__ - Step 56443: {'lr': 0.0003508334508613775, 'samples': 10837056, 'steps': 56442, 'loss/train': 0.9441992044448853} -08/30/2021 23:22:07 - INFO - __main__ - Step 56444: {'lr': 0.00035082859488676005, 'samples': 10837248, 'steps': 56443, 'loss/train': 1.2128995656967163} -08/30/2021 23:22:07 - INFO - __main__ - Step 56445: {'lr': 0.0003508237388667108, 'samples': 10837440, 'steps': 56444, 'loss/train': 1.2033194303512573} -08/30/2021 23:22:08 - INFO - __main__ - Step 56446: {'lr': 0.00035081888280123194, 'samples': 10837632, 'steps': 56445, 'loss/train': 1.7337194681167603} -08/30/2021 23:22:08 - INFO - __main__ - Step 56447: {'lr': 0.0003508140266903256, 'samples': 10837824, 'steps': 56446, 'loss/train': 0.08774230629205704} -08/30/2021 23:22:08 - INFO - __main__ - Step 56448: {'lr': 0.0003508091705339941, 'samples': 10838016, 'steps': 56447, 'loss/train': 1.4886800050735474} -08/30/2021 23:22:09 - INFO - __main__ - Step 56449: {'lr': 0.00035080431433223946, 'samples': 10838208, 'steps': 56448, 'loss/train': 0.8500186800956726} -08/30/2021 23:22:10 - INFO - __main__ - Step 56450: {'lr': 0.000350799458085064, 'samples': 10838400, 'steps': 56449, 'loss/train': 1.0560827255249023} -08/30/2021 23:22:11 - INFO - __main__ - Step 56451: {'lr': 0.00035079460179246984, 'samples': 10838592, 'steps': 56450, 'loss/train': 1.252631664276123} -08/30/2021 23:22:11 - INFO - __main__ - Step 56452: {'lr': 0.0003507897454544592, 'samples': 10838784, 'steps': 56451, 'loss/train': 0.3698769509792328} -08/30/2021 23:22:11 - INFO - __main__ - Step 56453: {'lr': 0.0003507848890710342, 'samples': 10838976, 'steps': 56452, 'loss/train': 1.3823071718215942} -08/30/2021 23:22:12 - INFO - __main__ - Step 56454: {'lr': 0.00035078003264219713, 'samples': 10839168, 'steps': 56453, 'loss/train': 1.3327810764312744} -08/30/2021 23:22:13 - INFO - __main__ - Step 56455: {'lr': 0.0003507751761679502, 'samples': 10839360, 'steps': 56454, 'loss/train': 1.5613362789154053} -08/30/2021 23:22:14 - INFO - __main__ - Step 56456: {'lr': 0.0003507703196482955, 'samples': 10839552, 'steps': 56455, 'loss/train': 1.0154962539672852} -08/30/2021 23:22:14 - INFO - __main__ - Step 56457: {'lr': 0.0003507654630832352, 'samples': 10839744, 'steps': 56456, 'loss/train': 1.4267102479934692} -08/30/2021 23:22:14 - INFO - __main__ - Step 56458: {'lr': 0.0003507606064727715, 'samples': 10839936, 'steps': 56457, 'loss/train': 1.0416288375854492} -08/30/2021 23:22:15 - INFO - __main__ - Step 56459: {'lr': 0.0003507557498169067, 'samples': 10840128, 'steps': 56458, 'loss/train': 1.4540621042251587} -08/30/2021 23:22:16 - INFO - __main__ - Step 56460: {'lr': 0.0003507508931156429, 'samples': 10840320, 'steps': 56459, 'loss/train': 1.6540557146072388} -08/30/2021 23:22:17 - INFO - __main__ - Step 56461: {'lr': 0.0003507460363689823, 'samples': 10840512, 'steps': 56460, 'loss/train': 1.3665308952331543} -08/30/2021 23:22:17 - INFO - __main__ - Step 56462: {'lr': 0.00035074117957692707, 'samples': 10840704, 'steps': 56461, 'loss/train': 1.4076887369155884} -08/30/2021 23:22:18 - INFO - __main__ - Step 56463: {'lr': 0.0003507363227394795, 'samples': 10840896, 'steps': 56462, 'loss/train': 1.3722600936889648} -08/30/2021 23:22:18 - INFO - __main__ - Step 56464: {'lr': 0.00035073146585664163, 'samples': 10841088, 'steps': 56463, 'loss/train': 1.7906204462051392} -08/30/2021 23:22:20 - INFO - __main__ - Step 56465: {'lr': 0.00035072660892841566, 'samples': 10841280, 'steps': 56464, 'loss/train': 1.2597562074661255} -08/30/2021 23:22:21 - INFO - __main__ - Step 56466: {'lr': 0.0003507217519548039, 'samples': 10841472, 'steps': 56465, 'loss/train': 0.7803432941436768} -08/30/2021 23:22:21 - INFO - __main__ - Step 56467: {'lr': 0.00035071689493580845, 'samples': 10841664, 'steps': 56466, 'loss/train': 1.1418205499649048} -08/30/2021 23:22:21 - INFO - __main__ - Step 56468: {'lr': 0.0003507120378714315, 'samples': 10841856, 'steps': 56467, 'loss/train': 1.3491010665893555} -08/30/2021 23:22:22 - INFO - __main__ - Step 56469: {'lr': 0.0003507071807616753, 'samples': 10842048, 'steps': 56468, 'loss/train': 1.0862956047058105} -08/30/2021 23:22:22 - INFO - __main__ - Step 56470: {'lr': 0.0003507023236065421, 'samples': 10842240, 'steps': 56469, 'loss/train': 1.5986477136611938} -08/30/2021 23:22:23 - INFO - __main__ - Step 56471: {'lr': 0.0003506974664060338, 'samples': 10842432, 'steps': 56470, 'loss/train': 0.05688268691301346} -08/30/2021 23:22:24 - INFO - __main__ - Step 56472: {'lr': 0.00035069260916015287, 'samples': 10842624, 'steps': 56471, 'loss/train': 1.4795644283294678} -08/30/2021 23:22:24 - INFO - __main__ - Step 56473: {'lr': 0.0003506877518689014, 'samples': 10842816, 'steps': 56472, 'loss/train': 1.4247878789901733} -08/30/2021 23:22:25 - INFO - __main__ - Step 56474: {'lr': 0.0003506828945322816, 'samples': 10843008, 'steps': 56473, 'loss/train': 1.583120584487915} -08/30/2021 23:22:25 - INFO - __main__ - Step 56475: {'lr': 0.0003506780371502956, 'samples': 10843200, 'steps': 56474, 'loss/train': 0.48261404037475586} -08/30/2021 23:22:27 - INFO - __main__ - Step 56476: {'lr': 0.00035067317972294564, 'samples': 10843392, 'steps': 56475, 'loss/train': 0.9055414199829102} -08/30/2021 23:22:27 - INFO - __main__ - Step 56477: {'lr': 0.00035066832225023393, 'samples': 10843584, 'steps': 56476, 'loss/train': 1.215675950050354} -08/30/2021 23:22:27 - INFO - __main__ - Step 56478: {'lr': 0.0003506634647321626, 'samples': 10843776, 'steps': 56477, 'loss/train': 0.32339316606521606} -08/30/2021 23:22:28 - INFO - __main__ - Step 56479: {'lr': 0.0003506586071687338, 'samples': 10843968, 'steps': 56478, 'loss/train': 0.07090987265110016} -08/30/2021 23:22:28 - INFO - __main__ - Step 56480: {'lr': 0.0003506537495599499, 'samples': 10844160, 'steps': 56479, 'loss/train': 1.2480740547180176} -08/30/2021 23:22:30 - INFO - __main__ - Step 56481: {'lr': 0.0003506488919058129, 'samples': 10844352, 'steps': 56480, 'loss/train': 1.4660922288894653} -08/30/2021 23:22:30 - INFO - __main__ - Step 56482: {'lr': 0.00035064403420632505, 'samples': 10844544, 'steps': 56481, 'loss/train': 0.5766159296035767} -08/30/2021 23:22:31 - INFO - __main__ - Step 56483: {'lr': 0.0003506391764614887, 'samples': 10844736, 'steps': 56482, 'loss/train': 0.8548250794410706} -08/30/2021 23:22:31 - INFO - __main__ - Step 56484: {'lr': 0.00035063431867130576, 'samples': 10844928, 'steps': 56483, 'loss/train': 1.335131287574768} -08/30/2021 23:22:31 - INFO - __main__ - Step 56485: {'lr': 0.00035062946083577853, 'samples': 10845120, 'steps': 56484, 'loss/train': 1.0710281133651733} -08/30/2021 23:22:33 - INFO - __main__ - Step 56486: {'lr': 0.00035062460295490926, 'samples': 10845312, 'steps': 56485, 'loss/train': 0.9134763479232788} -08/30/2021 23:22:33 - INFO - __main__ - Step 56487: {'lr': 0.00035061974502870007, 'samples': 10845504, 'steps': 56486, 'loss/train': 1.432463526725769} -08/30/2021 23:22:34 - INFO - __main__ - Step 56488: {'lr': 0.0003506148870571533, 'samples': 10845696, 'steps': 56487, 'loss/train': 1.6364357471466064} -08/30/2021 23:22:34 - INFO - __main__ - Step 56489: {'lr': 0.00035061002904027084, 'samples': 10845888, 'steps': 56488, 'loss/train': 1.7500250339508057} -08/30/2021 23:22:34 - INFO - __main__ - Step 56490: {'lr': 0.0003506051709780551, 'samples': 10846080, 'steps': 56489, 'loss/train': 1.61838698387146} -08/30/2021 23:22:36 - INFO - __main__ - Step 56491: {'lr': 0.0003506003128705083, 'samples': 10846272, 'steps': 56490, 'loss/train': 1.5849438905715942} -08/30/2021 23:22:36 - INFO - __main__ - Step 56492: {'lr': 0.0003505954547176325, 'samples': 10846464, 'steps': 56491, 'loss/train': 1.2359497547149658} -08/30/2021 23:22:37 - INFO - __main__ - Step 56493: {'lr': 0.00035059059651942995, 'samples': 10846656, 'steps': 56492, 'loss/train': 1.3019310235977173} -08/30/2021 23:22:37 - INFO - __main__ - Step 56494: {'lr': 0.00035058573827590286, 'samples': 10846848, 'steps': 56493, 'loss/train': 1.1675150394439697} -08/30/2021 23:22:37 - INFO - __main__ - Step 56495: {'lr': 0.0003505808799870533, 'samples': 10847040, 'steps': 56494, 'loss/train': 0.03174806386232376} -08/30/2021 23:22:38 - INFO - __main__ - Step 56496: {'lr': 0.0003505760216528836, 'samples': 10847232, 'steps': 56495, 'loss/train': 1.9629825353622437} -08/30/2021 23:22:40 - INFO - __main__ - Step 56497: {'lr': 0.0003505711632733959, 'samples': 10847424, 'steps': 56496, 'loss/train': 1.8223012685775757} -08/30/2021 23:22:40 - INFO - __main__ - Step 56498: {'lr': 0.00035056630484859235, 'samples': 10847616, 'steps': 56497, 'loss/train': 1.0175421237945557} -08/30/2021 23:22:40 - INFO - __main__ - Step 56499: {'lr': 0.00035056144637847525, 'samples': 10847808, 'steps': 56498, 'loss/train': 0.28747323155403137} -08/30/2021 23:22:41 - INFO - __main__ - Step 56500: {'lr': 0.0003505565878630467, 'samples': 10848000, 'steps': 56499, 'loss/train': 1.129755973815918} -08/30/2021 23:22:41 - INFO - __main__ - Step 56501: {'lr': 0.0003505517293023088, 'samples': 10848192, 'steps': 56500, 'loss/train': 1.0732613801956177} -08/30/2021 23:22:43 - INFO - __main__ - Step 56502: {'lr': 0.0003505468706962639, 'samples': 10848384, 'steps': 56501, 'loss/train': 0.10525637865066528} -08/30/2021 23:22:43 - INFO - __main__ - Step 56503: {'lr': 0.00035054201204491413, 'samples': 10848576, 'steps': 56502, 'loss/train': 1.207919955253601} -08/30/2021 23:22:43 - INFO - __main__ - Step 56504: {'lr': 0.00035053715334826176, 'samples': 10848768, 'steps': 56503, 'loss/train': 1.325360655784607} -08/30/2021 23:22:44 - INFO - __main__ - Step 56505: {'lr': 0.0003505322946063089, 'samples': 10848960, 'steps': 56504, 'loss/train': 1.4062741994857788} -08/30/2021 23:22:44 - INFO - __main__ - Step 56506: {'lr': 0.0003505274358190576, 'samples': 10849152, 'steps': 56505, 'loss/train': 1.12855863571167} -08/30/2021 23:22:46 - INFO - __main__ - Step 56507: {'lr': 0.00035052257698651025, 'samples': 10849344, 'steps': 56506, 'loss/train': 1.360582709312439} -08/30/2021 23:22:46 - INFO - __main__ - Step 56508: {'lr': 0.000350517718108669, 'samples': 10849536, 'steps': 56507, 'loss/train': 1.701041579246521} -08/30/2021 23:22:46 - INFO - __main__ - Step 56509: {'lr': 0.000350512859185536, 'samples': 10849728, 'steps': 56508, 'loss/train': 1.7182844877243042} -08/30/2021 23:22:47 - INFO - __main__ - Step 56510: {'lr': 0.00035050800021711346, 'samples': 10849920, 'steps': 56509, 'loss/train': 1.9650938510894775} -08/30/2021 23:22:47 - INFO - __main__ - Step 56511: {'lr': 0.00035050314120340357, 'samples': 10850112, 'steps': 56510, 'loss/train': 1.4075977802276611} -08/30/2021 23:22:49 - INFO - __main__ - Step 56512: {'lr': 0.00035049828214440856, 'samples': 10850304, 'steps': 56511, 'loss/train': 1.6018834114074707} -08/30/2021 23:22:49 - INFO - __main__ - Step 56513: {'lr': 0.00035049342304013055, 'samples': 10850496, 'steps': 56512, 'loss/train': 1.0976426601409912} -08/30/2021 23:22:49 - INFO - __main__ - Step 56514: {'lr': 0.0003504885638905717, 'samples': 10850688, 'steps': 56513, 'loss/train': 1.7953767776489258} -08/30/2021 23:22:50 - INFO - __main__ - Step 56515: {'lr': 0.0003504837046957343, 'samples': 10850880, 'steps': 56514, 'loss/train': 1.3804914951324463} -08/30/2021 23:22:50 - INFO - __main__ - Step 56516: {'lr': 0.0003504788454556205, 'samples': 10851072, 'steps': 56515, 'loss/train': 1.636925220489502} -08/30/2021 23:22:51 - INFO - __main__ - Step 56517: {'lr': 0.00035047398617023246, 'samples': 10851264, 'steps': 56516, 'loss/train': 0.7687824368476868} -08/30/2021 23:22:53 - INFO - __main__ - Step 56518: {'lr': 0.0003504691268395724, 'samples': 10851456, 'steps': 56517, 'loss/train': 1.6216387748718262} -08/30/2021 23:22:53 - INFO - __main__ - Step 56519: {'lr': 0.00035046426746364247, 'samples': 10851648, 'steps': 56518, 'loss/train': 1.1298202276229858} -08/30/2021 23:22:53 - INFO - __main__ - Step 56520: {'lr': 0.0003504594080424449, 'samples': 10851840, 'steps': 56519, 'loss/train': 1.0394850969314575} -08/30/2021 23:22:54 - INFO - __main__ - Step 56521: {'lr': 0.00035045454857598194, 'samples': 10852032, 'steps': 56520, 'loss/train': 1.0864089727401733} -08/30/2021 23:22:54 - INFO - __main__ - Step 56522: {'lr': 0.0003504496890642556, 'samples': 10852224, 'steps': 56521, 'loss/train': 1.5368640422821045} -08/30/2021 23:22:56 - INFO - __main__ - Step 56523: {'lr': 0.0003504448295072683, 'samples': 10852416, 'steps': 56522, 'loss/train': 1.122554898262024} -08/30/2021 23:22:56 - INFO - __main__ - Step 56524: {'lr': 0.00035043996990502204, 'samples': 10852608, 'steps': 56523, 'loss/train': 1.0034229755401611} -08/30/2021 23:22:56 - INFO - __main__ - Step 56525: {'lr': 0.00035043511025751906, 'samples': 10852800, 'steps': 56524, 'loss/train': 1.3032256364822388} -08/30/2021 23:22:57 - INFO - __main__ - Step 56526: {'lr': 0.00035043025056476164, 'samples': 10852992, 'steps': 56525, 'loss/train': 0.8567964434623718} -08/30/2021 23:22:57 - INFO - __main__ - Step 56527: {'lr': 0.00035042539082675184, 'samples': 10853184, 'steps': 56526, 'loss/train': 2.180180311203003} -08/30/2021 23:22:59 - INFO - __main__ - Step 56528: {'lr': 0.00035042053104349195, 'samples': 10853376, 'steps': 56527, 'loss/train': 1.3048216104507446} -08/30/2021 23:22:59 - INFO - __main__ - Step 56529: {'lr': 0.00035041567121498406, 'samples': 10853568, 'steps': 56528, 'loss/train': 1.3458185195922852} -08/30/2021 23:23:00 - INFO - __main__ - Step 56530: {'lr': 0.0003504108113412305, 'samples': 10853760, 'steps': 56529, 'loss/train': 0.025860119611024857} -08/30/2021 23:23:00 - INFO - __main__ - Step 56531: {'lr': 0.0003504059514222333, 'samples': 10853952, 'steps': 56530, 'loss/train': 1.1303489208221436} -08/30/2021 23:23:00 - INFO - __main__ - Step 56532: {'lr': 0.00035040109145799474, 'samples': 10854144, 'steps': 56531, 'loss/train': 1.4384759664535522} -08/30/2021 23:23:01 - INFO - __main__ - Step 56533: {'lr': 0.0003503962314485171, 'samples': 10854336, 'steps': 56532, 'loss/train': 1.4004967212677002} -08/30/2021 23:23:02 - INFO - __main__ - Step 56534: {'lr': 0.00035039137139380235, 'samples': 10854528, 'steps': 56533, 'loss/train': 1.4151445627212524} -08/30/2021 23:23:03 - INFO - __main__ - Step 56535: {'lr': 0.0003503865112938528, 'samples': 10854720, 'steps': 56534, 'loss/train': 1.4511741399765015} -08/30/2021 23:23:03 - INFO - __main__ - Step 56536: {'lr': 0.00035038165114867066, 'samples': 10854912, 'steps': 56535, 'loss/train': 1.2138116359710693} -08/30/2021 23:23:04 - INFO - __main__ - Step 56537: {'lr': 0.00035037679095825815, 'samples': 10855104, 'steps': 56536, 'loss/train': 1.4829049110412598} -08/30/2021 23:23:04 - INFO - __main__ - Step 56538: {'lr': 0.00035037193072261734, 'samples': 10855296, 'steps': 56537, 'loss/train': 0.8143882155418396} -08/30/2021 23:23:05 - INFO - __main__ - Step 56539: {'lr': 0.00035036707044175055, 'samples': 10855488, 'steps': 56538, 'loss/train': 0.9588643312454224} -08/30/2021 23:23:06 - INFO - __main__ - Step 56540: {'lr': 0.00035036221011565985, 'samples': 10855680, 'steps': 56539, 'loss/train': 0.704169511795044} -08/30/2021 23:23:06 - INFO - __main__ - Step 56541: {'lr': 0.00035035734974434745, 'samples': 10855872, 'steps': 56540, 'loss/train': 1.5803643465042114} -08/30/2021 23:23:06 - INFO - __main__ - Step 56542: {'lr': 0.00035035248932781564, 'samples': 10856064, 'steps': 56541, 'loss/train': 1.4250285625457764} -08/30/2021 23:23:07 - INFO - __main__ - Step 56543: {'lr': 0.0003503476288660665, 'samples': 10856256, 'steps': 56542, 'loss/train': 1.3363053798675537} -08/30/2021 23:23:08 - INFO - __main__ - Step 56544: {'lr': 0.0003503427683591024, 'samples': 10856448, 'steps': 56543, 'loss/train': 1.5413345098495483} -08/30/2021 23:23:09 - INFO - __main__ - Step 56545: {'lr': 0.00035033790780692527, 'samples': 10856640, 'steps': 56544, 'loss/train': 0.9046850800514221} -08/30/2021 23:23:09 - INFO - __main__ - Step 56546: {'lr': 0.0003503330472095375, 'samples': 10856832, 'steps': 56545, 'loss/train': 0.8477411866188049} -08/30/2021 23:23:10 - INFO - __main__ - Step 56547: {'lr': 0.0003503281865669411, 'samples': 10857024, 'steps': 56546, 'loss/train': 1.3381098508834839} -08/30/2021 23:23:10 - INFO - __main__ - Step 56548: {'lr': 0.00035032332587913844, 'samples': 10857216, 'steps': 56547, 'loss/train': 2.5551445484161377} -08/30/2021 23:23:10 - INFO - __main__ - Step 56549: {'lr': 0.00035031846514613164, 'samples': 10857408, 'steps': 56548, 'loss/train': 1.2439919710159302} -08/30/2021 23:23:12 - INFO - __main__ - Step 56550: {'lr': 0.00035031360436792294, 'samples': 10857600, 'steps': 56549, 'loss/train': 1.2165690660476685} -08/30/2021 23:23:12 - INFO - __main__ - Step 56551: {'lr': 0.00035030874354451434, 'samples': 10857792, 'steps': 56550, 'loss/train': 1.7179961204528809} -08/30/2021 23:23:13 - INFO - __main__ - Step 56552: {'lr': 0.0003503038826759083, 'samples': 10857984, 'steps': 56551, 'loss/train': 1.5298376083374023} -08/30/2021 23:23:13 - INFO - __main__ - Step 56553: {'lr': 0.00035029902176210675, 'samples': 10858176, 'steps': 56552, 'loss/train': 0.7448773980140686} -08/30/2021 23:23:13 - INFO - __main__ - Step 56554: {'lr': 0.0003502941608031121, 'samples': 10858368, 'steps': 56553, 'loss/train': 0.826343297958374} -08/30/2021 23:23:15 - INFO - __main__ - Step 56555: {'lr': 0.00035028929979892645, 'samples': 10858560, 'steps': 56554, 'loss/train': 1.3980389833450317} -08/30/2021 23:23:15 - INFO - __main__ - Step 56556: {'lr': 0.00035028443874955196, 'samples': 10858752, 'steps': 56555, 'loss/train': 1.7466596364974976} -08/30/2021 23:23:16 - INFO - __main__ - Step 56557: {'lr': 0.00035027957765499084, 'samples': 10858944, 'steps': 56556, 'loss/train': 1.0910674333572388} -08/30/2021 23:23:16 - INFO - __main__ - Step 56558: {'lr': 0.00035027471651524533, 'samples': 10859136, 'steps': 56557, 'loss/train': 0.9672409296035767} -08/30/2021 23:23:16 - INFO - __main__ - Step 56559: {'lr': 0.00035026985533031754, 'samples': 10859328, 'steps': 56558, 'loss/train': 1.0487531423568726} -08/30/2021 23:23:18 - INFO - __main__ - Step 56560: {'lr': 0.00035026499410020974, 'samples': 10859520, 'steps': 56559, 'loss/train': 1.6387578248977661} -08/30/2021 23:23:18 - INFO - __main__ - Step 56561: {'lr': 0.00035026013282492404, 'samples': 10859712, 'steps': 56560, 'loss/train': 1.244329810142517} -08/30/2021 23:23:18 - INFO - __main__ - Step 56562: {'lr': 0.0003502552715044627, 'samples': 10859904, 'steps': 56561, 'loss/train': 1.9325666427612305} -08/30/2021 23:23:19 - INFO - __main__ - Step 56563: {'lr': 0.0003502504101388279, 'samples': 10860096, 'steps': 56562, 'loss/train': 1.1325589418411255} -08/30/2021 23:23:19 - INFO - __main__ - Step 56564: {'lr': 0.0003502455487280218, 'samples': 10860288, 'steps': 56563, 'loss/train': 0.8093452453613281} -08/30/2021 23:23:21 - INFO - __main__ - Step 56565: {'lr': 0.00035024068727204655, 'samples': 10860480, 'steps': 56564, 'loss/train': 0.7579498887062073} -08/30/2021 23:23:21 - INFO - __main__ - Step 56566: {'lr': 0.0003502358257709044, 'samples': 10860672, 'steps': 56565, 'loss/train': 0.9509707093238831} -08/30/2021 23:23:22 - INFO - __main__ - Step 56567: {'lr': 0.00035023096422459756, 'samples': 10860864, 'steps': 56566, 'loss/train': 1.457160234451294} -08/30/2021 23:23:22 - INFO - __main__ - Step 56568: {'lr': 0.0003502261026331282, 'samples': 10861056, 'steps': 56567, 'loss/train': 1.0944246053695679} -08/30/2021 23:23:22 - INFO - __main__ - Step 56569: {'lr': 0.0003502212409964985, 'samples': 10861248, 'steps': 56568, 'loss/train': 1.9922066926956177} -08/30/2021 23:23:24 - INFO - __main__ - Step 56570: {'lr': 0.00035021637931471075, 'samples': 10861440, 'steps': 56569, 'loss/train': 0.17963860929012299} -08/30/2021 23:23:24 - INFO - __main__ - Step 56571: {'lr': 0.00035021151758776693, 'samples': 10861632, 'steps': 56570, 'loss/train': 0.925829291343689} -08/30/2021 23:23:25 - INFO - __main__ - Step 56572: {'lr': 0.00035020665581566934, 'samples': 10861824, 'steps': 56571, 'loss/train': 1.26144540309906} -08/30/2021 23:23:25 - INFO - __main__ - Step 56573: {'lr': 0.0003502017939984202, 'samples': 10862016, 'steps': 56572, 'loss/train': 0.13490994274616241} -08/30/2021 23:23:25 - INFO - __main__ - Step 56574: {'lr': 0.0003501969321360217, 'samples': 10862208, 'steps': 56573, 'loss/train': 1.880601167678833} -08/30/2021 23:23:27 - INFO - __main__ - Step 56575: {'lr': 0.00035019207022847596, 'samples': 10862400, 'steps': 56574, 'loss/train': 1.5790601968765259} -08/30/2021 23:23:28 - INFO - __main__ - Step 56576: {'lr': 0.0003501872082757852, 'samples': 10862592, 'steps': 56575, 'loss/train': 2.4476702213287354} -08/30/2021 23:23:28 - INFO - __main__ - Step 56577: {'lr': 0.0003501823462779518, 'samples': 10862784, 'steps': 56576, 'loss/train': 1.4351774454116821} -08/30/2021 23:23:29 - INFO - __main__ - Step 56578: {'lr': 0.00035017748423497766, 'samples': 10862976, 'steps': 56577, 'loss/train': 5.935507297515869} -08/30/2021 23:23:29 - INFO - __main__ - Step 56579: {'lr': 0.00035017262214686505, 'samples': 10863168, 'steps': 56578, 'loss/train': 1.0497462749481201} -08/30/2021 23:23:29 - INFO - __main__ - Step 56580: {'lr': 0.00035016776001361625, 'samples': 10863360, 'steps': 56579, 'loss/train': 0.9540074467658997} -08/30/2021 23:23:31 - INFO - __main__ - Step 56581: {'lr': 0.00035016289783523335, 'samples': 10863552, 'steps': 56580, 'loss/train': 0.8396463990211487} -08/30/2021 23:23:31 - INFO - __main__ - Step 56582: {'lr': 0.00035015803561171864, 'samples': 10863744, 'steps': 56581, 'loss/train': 1.3876549005508423} -08/30/2021 23:23:32 - INFO - __main__ - Step 56583: {'lr': 0.0003501531733430743, 'samples': 10863936, 'steps': 56582, 'loss/train': 1.3443472385406494} -08/30/2021 23:23:32 - INFO - __main__ - Step 56584: {'lr': 0.00035014831102930246, 'samples': 10864128, 'steps': 56583, 'loss/train': 1.109544277191162} -08/30/2021 23:23:32 - INFO - __main__ - Step 56585: {'lr': 0.0003501434486704053, 'samples': 10864320, 'steps': 56584, 'loss/train': 1.376772403717041} -08/30/2021 23:23:34 - INFO - __main__ - Step 56586: {'lr': 0.0003501385862663851, 'samples': 10864512, 'steps': 56585, 'loss/train': 1.4383704662322998} -08/30/2021 23:23:35 - INFO - __main__ - Step 56587: {'lr': 0.00035013372381724397, 'samples': 10864704, 'steps': 56586, 'loss/train': 0.9084556698799133} -08/30/2021 23:23:35 - INFO - __main__ - Step 56588: {'lr': 0.00035012886132298413, 'samples': 10864896, 'steps': 56587, 'loss/train': 1.3339368104934692} -08/30/2021 23:23:35 - INFO - __main__ - Step 56589: {'lr': 0.0003501239987836078, 'samples': 10865088, 'steps': 56588, 'loss/train': 0.8530402183532715} -08/30/2021 23:23:36 - INFO - __main__ - Step 56590: {'lr': 0.00035011913619911706, 'samples': 10865280, 'steps': 56589, 'loss/train': 0.7599702477455139} -08/30/2021 23:23:37 - INFO - __main__ - Step 56591: {'lr': 0.0003501142735695143, 'samples': 10865472, 'steps': 56590, 'loss/train': 1.4078866243362427} -08/30/2021 23:23:38 - INFO - __main__ - Step 56592: {'lr': 0.0003501094108948015, 'samples': 10865664, 'steps': 56591, 'loss/train': 1.8844475746154785} -08/30/2021 23:23:38 - INFO - __main__ - Step 56593: {'lr': 0.000350104548174981, 'samples': 10865856, 'steps': 56592, 'loss/train': 1.167657494544983} -08/30/2021 23:23:38 - INFO - __main__ - Step 56594: {'lr': 0.00035009968541005487, 'samples': 10866048, 'steps': 56593, 'loss/train': 1.3433687686920166} -08/30/2021 23:23:39 - INFO - __main__ - Step 56595: {'lr': 0.00035009482260002544, 'samples': 10866240, 'steps': 56594, 'loss/train': 1.2328038215637207} -08/30/2021 23:23:40 - INFO - __main__ - Step 56596: {'lr': 0.00035008995974489477, 'samples': 10866432, 'steps': 56595, 'loss/train': 1.149763822555542} -08/30/2021 23:23:41 - INFO - __main__ - Step 56597: {'lr': 0.0003500850968446652, 'samples': 10866624, 'steps': 56596, 'loss/train': 1.0382232666015625} -08/30/2021 23:23:41 - INFO - __main__ - Step 56598: {'lr': 0.00035008023389933876, 'samples': 10866816, 'steps': 56597, 'loss/train': 1.346388816833496} -08/30/2021 23:23:41 - INFO - __main__ - Step 56599: {'lr': 0.00035007537090891766, 'samples': 10867008, 'steps': 56598, 'loss/train': 1.5968866348266602} -08/30/2021 23:23:42 - INFO - __main__ - Step 56600: {'lr': 0.0003500705078734042, 'samples': 10867200, 'steps': 56599, 'loss/train': 1.2582712173461914} -08/30/2021 23:23:43 - INFO - __main__ - Step 56601: {'lr': 0.0003500656447928005, 'samples': 10867392, 'steps': 56600, 'loss/train': 1.04105544090271} -08/30/2021 23:23:44 - INFO - __main__ - Step 56602: {'lr': 0.00035006078166710877, 'samples': 10867584, 'steps': 56601, 'loss/train': 0.8569434285163879} -08/30/2021 23:23:44 - INFO - __main__ - Step 56603: {'lr': 0.00035005591849633123, 'samples': 10867776, 'steps': 56602, 'loss/train': 1.3504642248153687} -08/30/2021 23:23:44 - INFO - __main__ - Step 56604: {'lr': 0.00035005105528047, 'samples': 10867968, 'steps': 56603, 'loss/train': 1.5873371362686157} -08/30/2021 23:23:45 - INFO - __main__ - Step 56605: {'lr': 0.00035004619201952736, 'samples': 10868160, 'steps': 56604, 'loss/train': 1.3577191829681396} -08/30/2021 23:23:46 - INFO - __main__ - Step 56606: {'lr': 0.00035004132871350535, 'samples': 10868352, 'steps': 56605, 'loss/train': 1.0760232210159302} -08/30/2021 23:23:47 - INFO - __main__ - Step 56607: {'lr': 0.0003500364653624063, 'samples': 10868544, 'steps': 56606, 'loss/train': 1.4970009326934814} -08/30/2021 23:23:47 - INFO - __main__ - Step 56608: {'lr': 0.0003500316019662324, 'samples': 10868736, 'steps': 56607, 'loss/train': 0.9397467374801636} -08/30/2021 23:23:47 - INFO - __main__ - Step 56609: {'lr': 0.00035002673852498577, 'samples': 10868928, 'steps': 56608, 'loss/train': 1.0903841257095337} -08/30/2021 23:23:48 - INFO - __main__ - Step 56610: {'lr': 0.0003500218750386687, 'samples': 10869120, 'steps': 56609, 'loss/train': 1.455434799194336} -08/30/2021 23:23:48 - INFO - __main__ - Step 56611: {'lr': 0.0003500170115072833, 'samples': 10869312, 'steps': 56610, 'loss/train': 0.5159206986427307} -08/30/2021 23:23:50 - INFO - __main__ - Step 56612: {'lr': 0.00035001214793083167, 'samples': 10869504, 'steps': 56611, 'loss/train': 1.6880433559417725} -08/30/2021 23:23:50 - INFO - __main__ - Step 56613: {'lr': 0.00035000728430931616, 'samples': 10869696, 'steps': 56612, 'loss/train': 1.370440125465393} -08/30/2021 23:23:51 - INFO - __main__ - Step 56614: {'lr': 0.000350002420642739, 'samples': 10869888, 'steps': 56613, 'loss/train': 0.8158270716667175} -08/30/2021 23:23:51 - INFO - __main__ - Step 56615: {'lr': 0.0003499975569311022, 'samples': 10870080, 'steps': 56614, 'loss/train': 1.3353149890899658} -08/30/2021 23:23:51 - INFO - __main__ - Step 56616: {'lr': 0.00034999269317440804, 'samples': 10870272, 'steps': 56615, 'loss/train': 1.0273514986038208} -08/30/2021 23:23:53 - INFO - __main__ - Step 56617: {'lr': 0.0003499878293726588, 'samples': 10870464, 'steps': 56616, 'loss/train': 1.0854586362838745} -08/30/2021 23:23:53 - INFO - __main__ - Step 56618: {'lr': 0.0003499829655258565, 'samples': 10870656, 'steps': 56617, 'loss/train': 1.2031031847000122} -08/30/2021 23:23:54 - INFO - __main__ - Step 56619: {'lr': 0.00034997810163400343, 'samples': 10870848, 'steps': 56618, 'loss/train': 1.568880558013916} -08/30/2021 23:23:54 - INFO - __main__ - Step 56620: {'lr': 0.0003499732376971018, 'samples': 10871040, 'steps': 56619, 'loss/train': 1.4042338132858276} -08/30/2021 23:23:54 - INFO - __main__ - Step 56621: {'lr': 0.0003499683737151538, 'samples': 10871232, 'steps': 56620, 'loss/train': 0.9379310607910156} -08/30/2021 23:23:56 - INFO - __main__ - Step 56622: {'lr': 0.0003499635096881615, 'samples': 10871424, 'steps': 56621, 'loss/train': 1.0947391986846924} -08/30/2021 23:23:57 - INFO - __main__ - Step 56623: {'lr': 0.0003499586456161273, 'samples': 10871616, 'steps': 56622, 'loss/train': 1.7475011348724365} -08/30/2021 23:23:57 - INFO - __main__ - Step 56624: {'lr': 0.0003499537814990532, 'samples': 10871808, 'steps': 56623, 'loss/train': 0.9848609566688538} -08/30/2021 23:23:58 - INFO - __main__ - Step 56625: {'lr': 0.0003499489173369415, 'samples': 10872000, 'steps': 56624, 'loss/train': 1.363951563835144} -08/30/2021 23:23:58 - INFO - __main__ - Step 56626: {'lr': 0.00034994405312979433, 'samples': 10872192, 'steps': 56625, 'loss/train': 0.3817296326160431} -08/30/2021 23:23:58 - INFO - __main__ - Step 56627: {'lr': 0.00034993918887761386, 'samples': 10872384, 'steps': 56626, 'loss/train': 1.5850646495819092} -08/30/2021 23:24:00 - INFO - __main__ - Step 56628: {'lr': 0.0003499343245804025, 'samples': 10872576, 'steps': 56627, 'loss/train': 0.09053673595190048} -08/30/2021 23:24:01 - INFO - __main__ - Step 56629: {'lr': 0.00034992946023816216, 'samples': 10872768, 'steps': 56628, 'loss/train': 1.0626736879348755} -08/30/2021 23:24:01 - INFO - __main__ - Step 56630: {'lr': 0.00034992459585089515, 'samples': 10872960, 'steps': 56629, 'loss/train': 1.168748378753662} -08/30/2021 23:24:02 - INFO - __main__ - Step 56631: {'lr': 0.00034991973141860366, 'samples': 10873152, 'steps': 56630, 'loss/train': 0.9976434707641602} -08/30/2021 23:24:02 - INFO - __main__ - Step 56632: {'lr': 0.00034991486694128986, 'samples': 10873344, 'steps': 56631, 'loss/train': 1.0813840627670288} -08/30/2021 23:24:03 - INFO - __main__ - Step 56633: {'lr': 0.000349910002418956, 'samples': 10873536, 'steps': 56632, 'loss/train': 0.950526773929596} -08/30/2021 23:24:04 - INFO - __main__ - Step 56634: {'lr': 0.0003499051378516043, 'samples': 10873728, 'steps': 56633, 'loss/train': 3.013725996017456} -08/30/2021 23:24:04 - INFO - __main__ - Step 56635: {'lr': 0.0003499002732392368, 'samples': 10873920, 'steps': 56634, 'loss/train': 1.4134043455123901} -08/30/2021 23:24:05 - INFO - __main__ - Step 56636: {'lr': 0.0003498954085818558, 'samples': 10874112, 'steps': 56635, 'loss/train': 1.0327482223510742} -08/30/2021 23:24:05 - INFO - __main__ - Step 56637: {'lr': 0.00034989054387946344, 'samples': 10874304, 'steps': 56636, 'loss/train': 1.5457371473312378} -08/30/2021 23:24:07 - INFO - __main__ - Step 56638: {'lr': 0.000349885679132062, 'samples': 10874496, 'steps': 56637, 'loss/train': 1.0211865901947021} -08/30/2021 23:24:07 - INFO - __main__ - Step 56639: {'lr': 0.00034988081433965355, 'samples': 10874688, 'steps': 56638, 'loss/train': 1.5246831178665161} -08/30/2021 23:24:07 - INFO - __main__ - Step 56640: {'lr': 0.00034987594950224043, 'samples': 10874880, 'steps': 56639, 'loss/train': 1.2874032258987427} -08/30/2021 23:24:08 - INFO - __main__ - Step 56641: {'lr': 0.0003498710846198247, 'samples': 10875072, 'steps': 56640, 'loss/train': 1.2398040294647217} -08/30/2021 23:24:08 - INFO - __main__ - Step 56642: {'lr': 0.0003498662196924086, 'samples': 10875264, 'steps': 56641, 'loss/train': 1.2766425609588623} -08/30/2021 23:24:08 - INFO - __main__ - Step 56643: {'lr': 0.00034986135471999424, 'samples': 10875456, 'steps': 56642, 'loss/train': 1.6594924926757812} -08/30/2021 23:24:10 - INFO - __main__ - Step 56644: {'lr': 0.00034985648970258404, 'samples': 10875648, 'steps': 56643, 'loss/train': 0.2604610025882721} -08/30/2021 23:24:10 - INFO - __main__ - Step 56645: {'lr': 0.00034985162464018, 'samples': 10875840, 'steps': 56644, 'loss/train': 1.013767123222351} -08/30/2021 23:24:11 - INFO - __main__ - Step 56646: {'lr': 0.00034984675953278433, 'samples': 10876032, 'steps': 56645, 'loss/train': 1.6603326797485352} -08/30/2021 23:24:11 - INFO - __main__ - Step 56647: {'lr': 0.00034984189438039926, 'samples': 10876224, 'steps': 56646, 'loss/train': 1.3607041835784912} -08/30/2021 23:24:11 - INFO - __main__ - Step 56648: {'lr': 0.00034983702918302696, 'samples': 10876416, 'steps': 56647, 'loss/train': 1.0277810096740723} -08/30/2021 23:24:13 - INFO - __main__ - Step 56649: {'lr': 0.00034983216394066964, 'samples': 10876608, 'steps': 56648, 'loss/train': 1.5826700925827026} -08/30/2021 23:24:13 - INFO - __main__ - Step 56650: {'lr': 0.00034982729865332953, 'samples': 10876800, 'steps': 56649, 'loss/train': 0.9722830057144165} -08/30/2021 23:24:14 - INFO - __main__ - Step 56651: {'lr': 0.0003498224333210087, 'samples': 10876992, 'steps': 56650, 'loss/train': 1.1788796186447144} -08/30/2021 23:24:14 - INFO - __main__ - Step 56652: {'lr': 0.0003498175679437095, 'samples': 10877184, 'steps': 56651, 'loss/train': 1.1582777500152588} -08/30/2021 23:24:14 - INFO - __main__ - Step 56653: {'lr': 0.00034981270252143406, 'samples': 10877376, 'steps': 56652, 'loss/train': 1.3549057245254517} -08/30/2021 23:24:16 - INFO - __main__ - Step 56654: {'lr': 0.0003498078370541845, 'samples': 10877568, 'steps': 56653, 'loss/train': 0.986901044845581} -08/30/2021 23:24:16 - INFO - __main__ - Step 56655: {'lr': 0.00034980297154196306, 'samples': 10877760, 'steps': 56654, 'loss/train': 0.9739421606063843} -08/30/2021 23:24:17 - INFO - __main__ - Step 56656: {'lr': 0.0003497981059847719, 'samples': 10877952, 'steps': 56655, 'loss/train': 2.0031135082244873} -08/30/2021 23:24:17 - INFO - __main__ - Step 56657: {'lr': 0.00034979324038261327, 'samples': 10878144, 'steps': 56656, 'loss/train': 1.2580126523971558} -08/30/2021 23:24:17 - INFO - __main__ - Step 56658: {'lr': 0.00034978837473548946, 'samples': 10878336, 'steps': 56657, 'loss/train': 1.0706145763397217} -08/30/2021 23:24:19 - INFO - __main__ - Step 56659: {'lr': 0.0003497835090434025, 'samples': 10878528, 'steps': 56658, 'loss/train': 0.9589179754257202} -08/30/2021 23:24:19 - INFO - __main__ - Step 56660: {'lr': 0.00034977864330635455, 'samples': 10878720, 'steps': 56659, 'loss/train': 1.719821810722351} -08/30/2021 23:24:20 - INFO - __main__ - Step 56661: {'lr': 0.00034977377752434797, 'samples': 10878912, 'steps': 56660, 'loss/train': 1.4731706380844116} -08/30/2021 23:24:20 - INFO - __main__ - Step 56662: {'lr': 0.0003497689116973848, 'samples': 10879104, 'steps': 56661, 'loss/train': 1.4630749225616455} -08/30/2021 23:24:20 - INFO - __main__ - Step 56663: {'lr': 0.00034976404582546736, 'samples': 10879296, 'steps': 56662, 'loss/train': 1.4608070850372314} -08/30/2021 23:24:22 - INFO - __main__ - Step 56664: {'lr': 0.00034975917990859773, 'samples': 10879488, 'steps': 56663, 'loss/train': 1.4274542331695557} -08/30/2021 23:24:22 - INFO - __main__ - Step 56665: {'lr': 0.00034975431394677827, 'samples': 10879680, 'steps': 56664, 'loss/train': 1.1619678735733032} -08/30/2021 23:24:23 - INFO - __main__ - Step 56666: {'lr': 0.0003497494479400109, 'samples': 10879872, 'steps': 56665, 'loss/train': 3.0610134601593018} -08/30/2021 23:24:23 - INFO - __main__ - Step 56667: {'lr': 0.00034974458188829805, 'samples': 10880064, 'steps': 56666, 'loss/train': 1.2682088613510132} -08/30/2021 23:24:23 - INFO - __main__ - Step 56668: {'lr': 0.0003497397157916418, 'samples': 10880256, 'steps': 56667, 'loss/train': 1.2507548332214355} -08/30/2021 23:24:25 - INFO - __main__ - Step 56669: {'lr': 0.00034973484965004437, 'samples': 10880448, 'steps': 56668, 'loss/train': 1.1496018171310425} -08/30/2021 23:24:26 - INFO - __main__ - Step 56670: {'lr': 0.0003497299834635079, 'samples': 10880640, 'steps': 56669, 'loss/train': 1.297471046447754} -08/30/2021 23:24:26 - INFO - __main__ - Step 56671: {'lr': 0.0003497251172320348, 'samples': 10880832, 'steps': 56670, 'loss/train': 0.5607073903083801} -08/30/2021 23:24:26 - INFO - __main__ - Step 56672: {'lr': 0.00034972025095562697, 'samples': 10881024, 'steps': 56671, 'loss/train': 1.6480882167816162} -08/30/2021 23:24:27 - INFO - __main__ - Step 56673: {'lr': 0.00034971538463428683, 'samples': 10881216, 'steps': 56672, 'loss/train': 0.019913876429200172} -08/30/2021 23:24:27 - INFO - __main__ - Step 56674: {'lr': 0.0003497105182680164, 'samples': 10881408, 'steps': 56673, 'loss/train': 1.1580127477645874} -08/30/2021 23:24:28 - INFO - __main__ - Step 56675: {'lr': 0.00034970565185681794, 'samples': 10881600, 'steps': 56674, 'loss/train': 1.5405628681182861} -08/30/2021 23:24:29 - INFO - __main__ - Step 56676: {'lr': 0.0003497007854006937, 'samples': 10881792, 'steps': 56675, 'loss/train': 1.0766236782073975} -08/30/2021 23:24:30 - INFO - __main__ - Step 56677: {'lr': 0.0003496959188996458, 'samples': 10881984, 'steps': 56676, 'loss/train': 1.1496772766113281} -08/30/2021 23:24:30 - INFO - __main__ - Step 56678: {'lr': 0.00034969105235367647, 'samples': 10882176, 'steps': 56677, 'loss/train': 2.5835843086242676} -08/30/2021 23:24:31 - INFO - __main__ - Step 56679: {'lr': 0.0003496861857627879, 'samples': 10882368, 'steps': 56678, 'loss/train': 1.807704210281372} -08/30/2021 23:24:31 - INFO - __main__ - Step 56680: {'lr': 0.0003496813191269822, 'samples': 10882560, 'steps': 56679, 'loss/train': 1.1195123195648193} -08/30/2021 23:24:31 - INFO - __main__ - Step 56681: {'lr': 0.0003496764524462617, 'samples': 10882752, 'steps': 56680, 'loss/train': 0.673947274684906} -08/30/2021 23:24:33 - INFO - __main__ - Step 56682: {'lr': 0.00034967158572062854, 'samples': 10882944, 'steps': 56681, 'loss/train': 1.3062444925308228} -08/30/2021 23:24:34 - INFO - __main__ - Step 56683: {'lr': 0.00034966671895008485, 'samples': 10883136, 'steps': 56682, 'loss/train': 1.4439219236373901} -08/30/2021 23:24:34 - INFO - __main__ - Step 56684: {'lr': 0.0003496618521346329, 'samples': 10883328, 'steps': 56683, 'loss/train': 1.268198847770691} -08/30/2021 23:24:35 - INFO - __main__ - Step 56685: {'lr': 0.00034965698527427493, 'samples': 10883520, 'steps': 56684, 'loss/train': 1.6766000986099243} -08/30/2021 23:24:35 - INFO - __main__ - Step 56686: {'lr': 0.00034965211836901293, 'samples': 10883712, 'steps': 56685, 'loss/train': 1.562535047531128} -08/30/2021 23:24:37 - INFO - __main__ - Step 56687: {'lr': 0.00034964725141884936, 'samples': 10883904, 'steps': 56686, 'loss/train': 1.2752197980880737} -08/30/2021 23:24:37 - INFO - __main__ - Step 56688: {'lr': 0.00034964238442378615, 'samples': 10884096, 'steps': 56687, 'loss/train': 1.4188339710235596} -08/30/2021 23:24:38 - INFO - __main__ - Step 56689: {'lr': 0.00034963751738382564, 'samples': 10884288, 'steps': 56688, 'loss/train': 0.740077018737793} -08/30/2021 23:24:38 - INFO - __main__ - Step 56690: {'lr': 0.00034963265029897006, 'samples': 10884480, 'steps': 56689, 'loss/train': 0.5276865363121033} -08/30/2021 23:24:39 - INFO - __main__ - Step 56691: {'lr': 0.00034962778316922156, 'samples': 10884672, 'steps': 56690, 'loss/train': 1.2058615684509277} -08/30/2021 23:24:40 - INFO - __main__ - Step 56692: {'lr': 0.0003496229159945823, 'samples': 10884864, 'steps': 56691, 'loss/train': 1.067211627960205} -08/30/2021 23:24:40 - INFO - __main__ - Step 56693: {'lr': 0.0003496180487750544, 'samples': 10885056, 'steps': 56692, 'loss/train': 0.30880534648895264} -08/30/2021 23:24:41 - INFO - __main__ - Step 56694: {'lr': 0.00034961318151064026, 'samples': 10885248, 'steps': 56693, 'loss/train': 1.328700065612793} -08/30/2021 23:24:41 - INFO - __main__ - Step 56695: {'lr': 0.00034960831420134187, 'samples': 10885440, 'steps': 56694, 'loss/train': 0.9614832401275635} -08/30/2021 23:24:41 - INFO - __main__ - Step 56696: {'lr': 0.0003496034468471616, 'samples': 10885632, 'steps': 56695, 'loss/train': 1.3397225141525269} -08/30/2021 23:24:43 - INFO - __main__ - Step 56697: {'lr': 0.00034959857944810144, 'samples': 10885824, 'steps': 56696, 'loss/train': 1.4187637567520142} -08/30/2021 23:24:43 - INFO - __main__ - Step 56698: {'lr': 0.0003495937120041638, 'samples': 10886016, 'steps': 56697, 'loss/train': 1.4306093454360962} -08/30/2021 23:24:44 - INFO - __main__ - Step 56699: {'lr': 0.00034958884451535073, 'samples': 10886208, 'steps': 56698, 'loss/train': 1.4021881818771362} -08/30/2021 23:24:44 - INFO - __main__ - Step 56700: {'lr': 0.00034958397698166445, 'samples': 10886400, 'steps': 56699, 'loss/train': 1.840881586074829} -08/30/2021 23:24:44 - INFO - __main__ - Step 56701: {'lr': 0.00034957910940310716, 'samples': 10886592, 'steps': 56700, 'loss/train': 0.26254332065582275} -08/30/2021 23:24:46 - INFO - __main__ - Step 56702: {'lr': 0.00034957424177968114, 'samples': 10886784, 'steps': 56701, 'loss/train': 1.6205044984817505} -08/30/2021 23:24:46 - INFO - __main__ - Step 56703: {'lr': 0.0003495693741113884, 'samples': 10886976, 'steps': 56702, 'loss/train': 1.2337194681167603} -08/30/2021 23:24:47 - INFO - __main__ - Step 56704: {'lr': 0.00034956450639823125, 'samples': 10887168, 'steps': 56703, 'loss/train': 1.2526735067367554} -08/30/2021 23:24:47 - INFO - __main__ - Step 56705: {'lr': 0.00034955963864021194, 'samples': 10887360, 'steps': 56704, 'loss/train': 0.7252885103225708} -08/30/2021 23:24:47 - INFO - __main__ - Step 56706: {'lr': 0.00034955477083733257, 'samples': 10887552, 'steps': 56705, 'loss/train': 0.5901670455932617} -08/30/2021 23:24:49 - INFO - __main__ - Step 56707: {'lr': 0.0003495499029895953, 'samples': 10887744, 'steps': 56706, 'loss/train': 1.3329631090164185} -08/30/2021 23:24:49 - INFO - __main__ - Step 56708: {'lr': 0.00034954503509700244, 'samples': 10887936, 'steps': 56707, 'loss/train': 1.696196436882019} -08/30/2021 23:24:50 - INFO - __main__ - Step 56709: {'lr': 0.0003495401671595561, 'samples': 10888128, 'steps': 56708, 'loss/train': 1.3466346263885498} -08/30/2021 23:24:50 - INFO - __main__ - Step 56710: {'lr': 0.0003495352991772585, 'samples': 10888320, 'steps': 56709, 'loss/train': 1.4730360507965088} -08/30/2021 23:24:50 - INFO - __main__ - Step 56711: {'lr': 0.0003495304311501118, 'samples': 10888512, 'steps': 56710, 'loss/train': 1.1673533916473389} -08/30/2021 23:24:52 - INFO - __main__ - Step 56712: {'lr': 0.0003495255630781183, 'samples': 10888704, 'steps': 56711, 'loss/train': 1.339542269706726} -08/30/2021 23:24:52 - INFO - __main__ - Step 56713: {'lr': 0.00034952069496128007, 'samples': 10888896, 'steps': 56712, 'loss/train': 1.0222094058990479} -08/30/2021 23:24:53 - INFO - __main__ - Step 56714: {'lr': 0.0003495158267995994, 'samples': 10889088, 'steps': 56713, 'loss/train': 1.2242183685302734} -08/30/2021 23:24:53 - INFO - __main__ - Step 56715: {'lr': 0.0003495109585930784, 'samples': 10889280, 'steps': 56714, 'loss/train': 1.646255612373352} -08/30/2021 23:24:53 - INFO - __main__ - Step 56716: {'lr': 0.0003495060903417192, 'samples': 10889472, 'steps': 56715, 'loss/train': 1.3751050233840942} -08/30/2021 23:24:55 - INFO - __main__ - Step 56717: {'lr': 0.00034950122204552417, 'samples': 10889664, 'steps': 56716, 'loss/train': 1.5611677169799805} -08/30/2021 23:24:55 - INFO - __main__ - Step 56718: {'lr': 0.00034949635370449546, 'samples': 10889856, 'steps': 56717, 'loss/train': 1.5401617288589478} -08/30/2021 23:24:56 - INFO - __main__ - Step 56719: {'lr': 0.00034949148531863517, 'samples': 10890048, 'steps': 56718, 'loss/train': 1.436754822731018} -08/30/2021 23:24:56 - INFO - __main__ - Step 56720: {'lr': 0.0003494866168879456, 'samples': 10890240, 'steps': 56719, 'loss/train': 1.4176748991012573} -08/30/2021 23:24:56 - INFO - __main__ - Step 56721: {'lr': 0.0003494817484124289, 'samples': 10890432, 'steps': 56720, 'loss/train': 1.3382786512374878} -08/30/2021 23:24:57 - INFO - __main__ - Step 56722: {'lr': 0.0003494768798920872, 'samples': 10890624, 'steps': 56721, 'loss/train': 1.5689197778701782} -08/30/2021 23:24:59 - INFO - __main__ - Step 56723: {'lr': 0.0003494720113269227, 'samples': 10890816, 'steps': 56722, 'loss/train': 1.1819244623184204} -08/30/2021 23:24:59 - INFO - __main__ - Step 56724: {'lr': 0.00034946714271693783, 'samples': 10891008, 'steps': 56723, 'loss/train': 1.3029106855392456} -08/30/2021 23:25:00 - INFO - __main__ - Step 56725: {'lr': 0.0003494622740621345, 'samples': 10891200, 'steps': 56724, 'loss/train': 1.4662553071975708} -08/30/2021 23:25:00 - INFO - __main__ - Step 56726: {'lr': 0.00034945740536251505, 'samples': 10891392, 'steps': 56725, 'loss/train': 1.4535045623779297} -08/30/2021 23:25:00 - INFO - __main__ - Step 56727: {'lr': 0.0003494525366180815, 'samples': 10891584, 'steps': 56726, 'loss/train': 0.8776691555976868} -08/30/2021 23:25:01 - INFO - __main__ - Step 56728: {'lr': 0.0003494476678288363, 'samples': 10891776, 'steps': 56727, 'loss/train': 0.9184784293174744} -08/30/2021 23:25:02 - INFO - __main__ - Step 56729: {'lr': 0.00034944279899478146, 'samples': 10891968, 'steps': 56728, 'loss/train': 0.019302329048514366} -08/30/2021 23:25:03 - INFO - __main__ - Step 56730: {'lr': 0.00034943793011591926, 'samples': 10892160, 'steps': 56729, 'loss/train': 1.2300323247909546} -08/30/2021 23:25:03 - INFO - __main__ - Step 56731: {'lr': 0.0003494330611922518, 'samples': 10892352, 'steps': 56730, 'loss/train': 1.545109510421753} -08/30/2021 23:25:03 - INFO - __main__ - Step 56732: {'lr': 0.0003494281922237814, 'samples': 10892544, 'steps': 56731, 'loss/train': 0.9021186232566833} -08/30/2021 23:25:04 - INFO - __main__ - Step 56733: {'lr': 0.0003494233232105102, 'samples': 10892736, 'steps': 56732, 'loss/train': 1.418137550354004} -08/30/2021 23:25:06 - INFO - __main__ - Step 56734: {'lr': 0.0003494184541524403, 'samples': 10892928, 'steps': 56733, 'loss/train': 1.6505248546600342} -08/30/2021 23:25:06 - INFO - __main__ - Step 56735: {'lr': 0.0003494135850495741, 'samples': 10893120, 'steps': 56734, 'loss/train': 1.2418785095214844} -08/30/2021 23:25:07 - INFO - __main__ - Step 56736: {'lr': 0.0003494087159019136, 'samples': 10893312, 'steps': 56735, 'loss/train': 1.7590183019638062} -08/30/2021 23:25:07 - INFO - __main__ - Step 56737: {'lr': 0.0003494038467094611, 'samples': 10893504, 'steps': 56736, 'loss/train': 0.854834258556366} -08/30/2021 23:25:07 - INFO - __main__ - Step 56738: {'lr': 0.00034939897747221873, 'samples': 10893696, 'steps': 56737, 'loss/train': 0.8972604870796204} -08/30/2021 23:25:09 - INFO - __main__ - Step 56739: {'lr': 0.00034939410819018874, 'samples': 10893888, 'steps': 56738, 'loss/train': 1.434583067893982} -08/30/2021 23:25:09 - INFO - __main__ - Step 56740: {'lr': 0.0003493892388633733, 'samples': 10894080, 'steps': 56739, 'loss/train': 1.1860287189483643} -08/30/2021 23:25:10 - INFO - __main__ - Step 56741: {'lr': 0.0003493843694917745, 'samples': 10894272, 'steps': 56740, 'loss/train': 1.689272403717041} -08/30/2021 23:25:10 - INFO - __main__ - Step 56742: {'lr': 0.00034937950007539475, 'samples': 10894464, 'steps': 56741, 'loss/train': 1.592295527458191} -08/30/2021 23:25:10 - INFO - __main__ - Step 56743: {'lr': 0.0003493746306142361, 'samples': 10894656, 'steps': 56742, 'loss/train': 1.311223030090332} -08/30/2021 23:25:12 - INFO - __main__ - Step 56744: {'lr': 0.00034936976110830077, 'samples': 10894848, 'steps': 56743, 'loss/train': 1.7671316862106323} -08/30/2021 23:25:12 - INFO - __main__ - Step 56745: {'lr': 0.000349364891557591, 'samples': 10895040, 'steps': 56744, 'loss/train': 1.3961111307144165} -08/30/2021 23:25:13 - INFO - __main__ - Step 56746: {'lr': 0.00034936002196210895, 'samples': 10895232, 'steps': 56745, 'loss/train': 0.8962607383728027} -08/30/2021 23:25:13 - INFO - __main__ - Step 56747: {'lr': 0.0003493551523218567, 'samples': 10895424, 'steps': 56746, 'loss/train': 1.892096996307373} -08/30/2021 23:25:13 - INFO - __main__ - Step 56748: {'lr': 0.0003493502826368366, 'samples': 10895616, 'steps': 56747, 'loss/train': 1.541806697845459} -08/30/2021 23:25:15 - INFO - __main__ - Step 56749: {'lr': 0.0003493454129070508, 'samples': 10895808, 'steps': 56748, 'loss/train': 0.867680013179779} -08/30/2021 23:25:15 - INFO - __main__ - Step 56750: {'lr': 0.0003493405431325015, 'samples': 10896000, 'steps': 56749, 'loss/train': 0.8825818300247192} -08/30/2021 23:25:16 - INFO - __main__ - Step 56751: {'lr': 0.0003493356733131909, 'samples': 10896192, 'steps': 56750, 'loss/train': 1.3202054500579834} -08/30/2021 23:25:16 - INFO - __main__ - Step 56752: {'lr': 0.0003493308034491212, 'samples': 10896384, 'steps': 56751, 'loss/train': 1.2743120193481445} -08/30/2021 23:25:16 - INFO - __main__ - Step 56753: {'lr': 0.00034932593354029454, 'samples': 10896576, 'steps': 56752, 'loss/train': 1.5536842346191406} -08/30/2021 23:25:17 - INFO - __main__ - Step 56754: {'lr': 0.00034932106358671314, 'samples': 10896768, 'steps': 56753, 'loss/train': 0.7229862809181213} -08/30/2021 23:25:19 - INFO - __main__ - Step 56755: {'lr': 0.0003493161935883792, 'samples': 10896960, 'steps': 56754, 'loss/train': 1.5224770307540894} -08/30/2021 23:25:19 - INFO - __main__ - Step 56756: {'lr': 0.0003493113235452949, 'samples': 10897152, 'steps': 56755, 'loss/train': 1.5602049827575684} -08/30/2021 23:25:19 - INFO - __main__ - Step 56757: {'lr': 0.00034930645345746246, 'samples': 10897344, 'steps': 56756, 'loss/train': 0.06777407974004745} -08/30/2021 23:25:20 - INFO - __main__ - Step 56758: {'lr': 0.0003493015833248841, 'samples': 10897536, 'steps': 56757, 'loss/train': 0.028674036264419556} -08/30/2021 23:25:20 - INFO - __main__ - Step 56759: {'lr': 0.00034929671314756197, 'samples': 10897728, 'steps': 56758, 'loss/train': 1.5826789140701294} -08/30/2021 23:25:20 - INFO - __main__ - Step 56760: {'lr': 0.0003492918429254983, 'samples': 10897920, 'steps': 56759, 'loss/train': 1.2855006456375122} -08/30/2021 23:25:22 - INFO - __main__ - Step 56761: {'lr': 0.00034928697265869515, 'samples': 10898112, 'steps': 56760, 'loss/train': 1.0997174978256226} -08/30/2021 23:25:23 - INFO - __main__ - Step 56762: {'lr': 0.00034928210234715497, 'samples': 10898304, 'steps': 56761, 'loss/train': 1.3132038116455078} -08/30/2021 23:25:23 - INFO - __main__ - Step 56763: {'lr': 0.0003492772319908797, 'samples': 10898496, 'steps': 56762, 'loss/train': 1.33661687374115} -08/30/2021 23:25:24 - INFO - __main__ - Step 56764: {'lr': 0.0003492723615898716, 'samples': 10898688, 'steps': 56763, 'loss/train': 1.5947891473770142} -08/30/2021 23:25:24 - INFO - __main__ - Step 56765: {'lr': 0.000349267491144133, 'samples': 10898880, 'steps': 56764, 'loss/train': 1.292133092880249} -08/30/2021 23:25:24 - INFO - __main__ - Step 56766: {'lr': 0.00034926262065366597, 'samples': 10899072, 'steps': 56765, 'loss/train': 0.025055456906557083} -08/30/2021 23:25:26 - INFO - __main__ - Step 56767: {'lr': 0.0003492577501184727, 'samples': 10899264, 'steps': 56766, 'loss/train': 1.1451060771942139} -08/30/2021 23:25:26 - INFO - __main__ - Step 56768: {'lr': 0.0003492528795385556, 'samples': 10899456, 'steps': 56767, 'loss/train': 1.6359162330627441} -08/30/2021 23:25:26 - INFO - __main__ - Step 56769: {'lr': 0.00034924800891391645, 'samples': 10899648, 'steps': 56768, 'loss/train': 1.3535114526748657} -08/30/2021 23:25:27 - INFO - __main__ - Step 56770: {'lr': 0.0003492431382445578, 'samples': 10899840, 'steps': 56769, 'loss/train': 1.6838936805725098} -08/30/2021 23:25:27 - INFO - __main__ - Step 56771: {'lr': 0.00034923826753048163, 'samples': 10900032, 'steps': 56770, 'loss/train': 1.3130229711532593} -08/30/2021 23:25:29 - INFO - __main__ - Step 56772: {'lr': 0.00034923339677169033, 'samples': 10900224, 'steps': 56771, 'loss/train': 1.0998550653457642} -08/30/2021 23:25:29 - INFO - __main__ - Step 56773: {'lr': 0.000349228525968186, 'samples': 10900416, 'steps': 56772, 'loss/train': 0.7550140619277954} -08/30/2021 23:25:30 - INFO - __main__ - Step 56774: {'lr': 0.0003492236551199707, 'samples': 10900608, 'steps': 56773, 'loss/train': 1.5905202627182007} -08/30/2021 23:25:30 - INFO - __main__ - Step 56775: {'lr': 0.0003492187842270469, 'samples': 10900800, 'steps': 56774, 'loss/train': 1.6662850379943848} -08/30/2021 23:25:30 - INFO - __main__ - Step 56776: {'lr': 0.00034921391328941655, 'samples': 10900992, 'steps': 56775, 'loss/train': 1.7697941064834595} -08/30/2021 23:25:31 - INFO - __main__ - Step 56777: {'lr': 0.00034920904230708195, 'samples': 10901184, 'steps': 56776, 'loss/train': 1.188982605934143} -08/30/2021 23:25:32 - INFO - __main__ - Step 56778: {'lr': 0.0003492041712800453, 'samples': 10901376, 'steps': 56777, 'loss/train': 1.1459029912948608} -08/30/2021 23:25:33 - INFO - __main__ - Step 56779: {'lr': 0.0003491993002083088, 'samples': 10901568, 'steps': 56778, 'loss/train': 1.34610915184021} -08/30/2021 23:25:33 - INFO - __main__ - Step 56780: {'lr': 0.00034919442909187465, 'samples': 10901760, 'steps': 56779, 'loss/train': 1.0940742492675781} -08/30/2021 23:25:33 - INFO - __main__ - Step 56781: {'lr': 0.000349189557930745, 'samples': 10901952, 'steps': 56780, 'loss/train': 1.2429697513580322} -08/30/2021 23:25:34 - INFO - __main__ - Step 56782: {'lr': 0.000349184686724922, 'samples': 10902144, 'steps': 56781, 'loss/train': 1.6308033466339111} -08/30/2021 23:25:35 - INFO - __main__ - Step 56783: {'lr': 0.00034917981547440797, 'samples': 10902336, 'steps': 56782, 'loss/train': 1.8578672409057617} -08/30/2021 23:25:36 - INFO - __main__ - Step 56784: {'lr': 0.00034917494417920504, 'samples': 10902528, 'steps': 56783, 'loss/train': 1.044552206993103} -08/30/2021 23:25:36 - INFO - __main__ - Step 56785: {'lr': 0.0003491700728393154, 'samples': 10902720, 'steps': 56784, 'loss/train': 1.0783411264419556} -08/30/2021 23:25:36 - INFO - __main__ - Step 56786: {'lr': 0.0003491652014547413, 'samples': 10902912, 'steps': 56785, 'loss/train': 1.473204493522644} -08/30/2021 23:25:37 - INFO - __main__ - Step 56787: {'lr': 0.00034916033002548486, 'samples': 10903104, 'steps': 56786, 'loss/train': 1.4723454713821411} -08/30/2021 23:25:38 - INFO - __main__ - Step 56788: {'lr': 0.00034915545855154827, 'samples': 10903296, 'steps': 56787, 'loss/train': 1.5283957719802856} -08/30/2021 23:25:39 - INFO - __main__ - Step 56789: {'lr': 0.00034915058703293377, 'samples': 10903488, 'steps': 56788, 'loss/train': 1.1729637384414673} -08/30/2021 23:25:39 - INFO - __main__ - Step 56790: {'lr': 0.0003491457154696436, 'samples': 10903680, 'steps': 56789, 'loss/train': 1.6620131731033325} -08/30/2021 23:25:40 - INFO - __main__ - Step 56791: {'lr': 0.0003491408438616798, 'samples': 10903872, 'steps': 56790, 'loss/train': 1.578089714050293} -08/30/2021 23:25:40 - INFO - __main__ - Step 56792: {'lr': 0.0003491359722090448, 'samples': 10904064, 'steps': 56791, 'loss/train': 0.05951777100563049} -08/30/2021 23:25:42 - INFO - __main__ - Step 56793: {'lr': 0.00034913110051174056, 'samples': 10904256, 'steps': 56792, 'loss/train': 1.0769128799438477} -08/30/2021 23:25:42 - INFO - __main__ - Step 56794: {'lr': 0.0003491262287697694, 'samples': 10904448, 'steps': 56793, 'loss/train': 1.943314552307129} -08/30/2021 23:25:43 - INFO - __main__ - Step 56795: {'lr': 0.0003491213569831335, 'samples': 10904640, 'steps': 56794, 'loss/train': 0.9825982451438904} -08/30/2021 23:25:43 - INFO - __main__ - Step 56796: {'lr': 0.000349116485151835, 'samples': 10904832, 'steps': 56795, 'loss/train': 0.2731589078903198} -08/30/2021 23:25:44 - INFO - __main__ - Step 56797: {'lr': 0.00034911161327587625, 'samples': 10905024, 'steps': 56796, 'loss/train': 0.3056858479976654} -08/30/2021 23:25:45 - INFO - __main__ - Step 56798: {'lr': 0.00034910674135525926, 'samples': 10905216, 'steps': 56797, 'loss/train': 1.4800364971160889} -08/30/2021 23:25:46 - INFO - __main__ - Step 56799: {'lr': 0.0003491018693899863, 'samples': 10905408, 'steps': 56798, 'loss/train': 1.1802165508270264} -08/30/2021 23:25:46 - INFO - __main__ - Step 56800: {'lr': 0.00034909699738005964, 'samples': 10905600, 'steps': 56799, 'loss/train': 1.3026938438415527} -08/30/2021 23:25:46 - INFO - __main__ - Step 56801: {'lr': 0.0003490921253254813, 'samples': 10905792, 'steps': 56800, 'loss/train': 1.7394874095916748} -08/30/2021 23:25:47 - INFO - __main__ - Step 56802: {'lr': 0.00034908725322625365, 'samples': 10905984, 'steps': 56801, 'loss/train': 1.2614617347717285} -08/30/2021 23:25:47 - INFO - __main__ - Step 56803: {'lr': 0.0003490823810823788, 'samples': 10906176, 'steps': 56802, 'loss/train': 1.4205695390701294} -08/30/2021 23:25:48 - INFO - __main__ - Step 56804: {'lr': 0.0003490775088938589, 'samples': 10906368, 'steps': 56803, 'loss/train': 1.3422627449035645} -08/30/2021 23:25:49 - INFO - __main__ - Step 56805: {'lr': 0.00034907263666069624, 'samples': 10906560, 'steps': 56804, 'loss/train': 1.2066166400909424} -08/30/2021 23:25:49 - INFO - __main__ - Step 56806: {'lr': 0.000349067764382893, 'samples': 10906752, 'steps': 56805, 'loss/train': 1.4579092264175415} -08/30/2021 23:25:50 - INFO - __main__ - Step 56807: {'lr': 0.0003490628920604513, 'samples': 10906944, 'steps': 56806, 'loss/train': 1.0985229015350342} -08/30/2021 23:25:50 - INFO - __main__ - Step 56808: {'lr': 0.00034905801969337347, 'samples': 10907136, 'steps': 56807, 'loss/train': 1.2382231950759888} -08/30/2021 23:25:51 - INFO - __main__ - Step 56809: {'lr': 0.0003490531472816616, 'samples': 10907328, 'steps': 56808, 'loss/train': 1.6478755474090576} -08/30/2021 23:25:52 - INFO - __main__ - Step 56810: {'lr': 0.00034904827482531785, 'samples': 10907520, 'steps': 56809, 'loss/train': 1.44677734375} -08/30/2021 23:25:52 - INFO - __main__ - Step 56811: {'lr': 0.0003490434023243445, 'samples': 10907712, 'steps': 56810, 'loss/train': 0.957885205745697} -08/30/2021 23:25:53 - INFO - __main__ - Step 56812: {'lr': 0.0003490385297787438, 'samples': 10907904, 'steps': 56811, 'loss/train': 1.7826210260391235} -08/30/2021 23:25:53 - INFO - __main__ - Step 56813: {'lr': 0.00034903365718851775, 'samples': 10908096, 'steps': 56812, 'loss/train': 1.4312103986740112} -08/30/2021 23:25:55 - INFO - __main__ - Step 56814: {'lr': 0.00034902878455366876, 'samples': 10908288, 'steps': 56813, 'loss/train': 1.0159746408462524} -08/30/2021 23:25:55 - INFO - __main__ - Step 56815: {'lr': 0.0003490239118741989, 'samples': 10908480, 'steps': 56814, 'loss/train': 1.5728769302368164} -08/30/2021 23:25:56 - INFO - __main__ - Step 56816: {'lr': 0.00034901903915011035, 'samples': 10908672, 'steps': 56815, 'loss/train': 0.8968613147735596} -08/30/2021 23:25:56 - INFO - __main__ - Step 56817: {'lr': 0.0003490141663814054, 'samples': 10908864, 'steps': 56816, 'loss/train': 1.3985726833343506} -08/30/2021 23:25:56 - INFO - __main__ - Step 56818: {'lr': 0.00034900929356808613, 'samples': 10909056, 'steps': 56817, 'loss/train': 0.9104251861572266} -08/30/2021 23:25:58 - INFO - __main__ - Step 56819: {'lr': 0.00034900442071015485, 'samples': 10909248, 'steps': 56818, 'loss/train': 0.7776812314987183} -08/30/2021 23:25:59 - INFO - __main__ - Step 56820: {'lr': 0.00034899954780761373, 'samples': 10909440, 'steps': 56819, 'loss/train': 0.6282814741134644} -08/30/2021 23:25:59 - INFO - __main__ - Step 56821: {'lr': 0.00034899467486046486, 'samples': 10909632, 'steps': 56820, 'loss/train': 0.8602657318115234} -08/30/2021 23:25:59 - INFO - __main__ - Step 56822: {'lr': 0.0003489898018687106, 'samples': 10909824, 'steps': 56821, 'loss/train': 3.6292970180511475} -08/30/2021 23:26:00 - INFO - __main__ - Step 56823: {'lr': 0.000348984928832353, 'samples': 10910016, 'steps': 56822, 'loss/train': 5.065361976623535} -08/30/2021 23:26:00 - INFO - __main__ - Step 56824: {'lr': 0.00034898005575139437, 'samples': 10910208, 'steps': 56823, 'loss/train': 0.7015039920806885} -08/30/2021 23:26:02 - INFO - __main__ - Step 56825: {'lr': 0.00034897518262583683, 'samples': 10910400, 'steps': 56824, 'loss/train': 1.567171573638916} -08/30/2021 23:26:02 - INFO - __main__ - Step 56826: {'lr': 0.00034897030945568264, 'samples': 10910592, 'steps': 56825, 'loss/train': 0.8680390119552612} -08/30/2021 23:26:02 - INFO - __main__ - Step 56827: {'lr': 0.0003489654362409339, 'samples': 10910784, 'steps': 56826, 'loss/train': 1.1843427419662476} -08/30/2021 23:26:03 - INFO - __main__ - Step 56828: {'lr': 0.00034896056298159287, 'samples': 10910976, 'steps': 56827, 'loss/train': 1.2504146099090576} -08/30/2021 23:26:03 - INFO - __main__ - Step 56829: {'lr': 0.0003489556896776618, 'samples': 10911168, 'steps': 56828, 'loss/train': 0.038397036492824554} -08/30/2021 23:26:05 - INFO - __main__ - Step 56830: {'lr': 0.00034895081632914274, 'samples': 10911360, 'steps': 56829, 'loss/train': 1.4052339792251587} -08/30/2021 23:26:05 - INFO - __main__ - Step 56831: {'lr': 0.000348945942936038, 'samples': 10911552, 'steps': 56830, 'loss/train': 0.9070042967796326} -08/30/2021 23:26:05 - INFO - __main__ - Step 56832: {'lr': 0.0003489410694983497, 'samples': 10911744, 'steps': 56831, 'loss/train': 1.30417001247406} -08/30/2021 23:26:06 - INFO - __main__ - Step 56833: {'lr': 0.00034893619601608015, 'samples': 10911936, 'steps': 56832, 'loss/train': 1.014424443244934} -08/30/2021 23:26:06 - INFO - __main__ - Step 56834: {'lr': 0.0003489313224892314, 'samples': 10912128, 'steps': 56833, 'loss/train': 1.1177945137023926} -08/30/2021 23:26:08 - INFO - __main__ - Step 56835: {'lr': 0.0003489264489178058, 'samples': 10912320, 'steps': 56834, 'loss/train': 1.3818050622940063} -08/30/2021 23:26:08 - INFO - __main__ - Step 56836: {'lr': 0.00034892157530180546, 'samples': 10912512, 'steps': 56835, 'loss/train': 0.2655915915966034} -08/30/2021 23:26:09 - INFO - __main__ - Step 56837: {'lr': 0.0003489167016412326, 'samples': 10912704, 'steps': 56836, 'loss/train': 2.8492355346679688} -08/30/2021 23:26:09 - INFO - __main__ - Step 56838: {'lr': 0.00034891182793608935, 'samples': 10912896, 'steps': 56837, 'loss/train': 1.2801843881607056} -08/30/2021 23:26:09 - INFO - __main__ - Step 56839: {'lr': 0.000348906954186378, 'samples': 10913088, 'steps': 56838, 'loss/train': 0.9203802347183228} -08/30/2021 23:26:11 - INFO - __main__ - Step 56840: {'lr': 0.0003489020803921007, 'samples': 10913280, 'steps': 56839, 'loss/train': 2.1670665740966797} -08/30/2021 23:26:11 - INFO - __main__ - Step 56841: {'lr': 0.00034889720655325955, 'samples': 10913472, 'steps': 56840, 'loss/train': 1.4316847324371338} -08/30/2021 23:26:12 - INFO - __main__ - Step 56842: {'lr': 0.000348892332669857, 'samples': 10913664, 'steps': 56841, 'loss/train': 1.415387511253357} -08/30/2021 23:26:12 - INFO - __main__ - Step 56843: {'lr': 0.000348887458741895, 'samples': 10913856, 'steps': 56842, 'loss/train': 1.4527703523635864} -08/30/2021 23:26:12 - INFO - __main__ - Step 56844: {'lr': 0.0003488825847693758, 'samples': 10914048, 'steps': 56843, 'loss/train': 1.2186700105667114} -08/30/2021 23:26:14 - INFO - __main__ - Step 56845: {'lr': 0.0003488777107523017, 'samples': 10914240, 'steps': 56844, 'loss/train': 1.547472596168518} -08/30/2021 23:26:15 - INFO - __main__ - Step 56846: {'lr': 0.0003488728366906748, 'samples': 10914432, 'steps': 56845, 'loss/train': 0.6210740208625793} -08/30/2021 23:26:15 - INFO - __main__ - Step 56847: {'lr': 0.0003488679625844974, 'samples': 10914624, 'steps': 56846, 'loss/train': 1.1037166118621826} -08/30/2021 23:26:16 - INFO - __main__ - Step 56848: {'lr': 0.0003488630884337715, 'samples': 10914816, 'steps': 56847, 'loss/train': 0.44309526681900024} -08/30/2021 23:26:16 - INFO - __main__ - Step 56849: {'lr': 0.0003488582142384995, 'samples': 10915008, 'steps': 56848, 'loss/train': 1.3238654136657715} -08/30/2021 23:26:16 - INFO - __main__ - Step 56850: {'lr': 0.00034885333999868344, 'samples': 10915200, 'steps': 56849, 'loss/train': 1.545961618423462} -08/30/2021 23:26:18 - INFO - __main__ - Step 56851: {'lr': 0.0003488484657143257, 'samples': 10915392, 'steps': 56850, 'loss/train': 1.3489965200424194} -08/30/2021 23:26:18 - INFO - __main__ - Step 56852: {'lr': 0.00034884359138542825, 'samples': 10915584, 'steps': 56851, 'loss/train': 0.876106858253479} -08/30/2021 23:26:19 - INFO - __main__ - Step 56853: {'lr': 0.0003488387170119935, 'samples': 10915776, 'steps': 56852, 'loss/train': 1.4807602167129517} -08/30/2021 23:26:19 - INFO - __main__ - Step 56854: {'lr': 0.0003488338425940235, 'samples': 10915968, 'steps': 56853, 'loss/train': 1.5972204208374023} -08/30/2021 23:26:19 - INFO - __main__ - Step 56855: {'lr': 0.00034882896813152056, 'samples': 10916160, 'steps': 56854, 'loss/train': 1.1075756549835205} -08/30/2021 23:26:21 - INFO - __main__ - Step 56856: {'lr': 0.0003488240936244867, 'samples': 10916352, 'steps': 56855, 'loss/train': 1.2491711378097534} -08/30/2021 23:26:21 - INFO - __main__ - Step 56857: {'lr': 0.0003488192190729243, 'samples': 10916544, 'steps': 56856, 'loss/train': 0.11716333776712418} -08/30/2021 23:26:22 - INFO - __main__ - Step 56858: {'lr': 0.0003488143444768355, 'samples': 10916736, 'steps': 56857, 'loss/train': 1.8950672149658203} -08/30/2021 23:26:22 - INFO - __main__ - Step 56859: {'lr': 0.0003488094698362224, 'samples': 10916928, 'steps': 56858, 'loss/train': 1.0557746887207031} -08/30/2021 23:26:22 - INFO - __main__ - Step 56860: {'lr': 0.00034880459515108735, 'samples': 10917120, 'steps': 56859, 'loss/train': 1.2659811973571777} -08/30/2021 23:26:24 - INFO - __main__ - Step 56861: {'lr': 0.0003487997204214325, 'samples': 10917312, 'steps': 56860, 'loss/train': 1.2838890552520752} -08/30/2021 23:26:25 - INFO - __main__ - Step 56862: {'lr': 0.00034879484564725993, 'samples': 10917504, 'steps': 56861, 'loss/train': 1.4361438751220703} -08/30/2021 23:26:25 - INFO - __main__ - Step 56863: {'lr': 0.00034878997082857195, 'samples': 10917696, 'steps': 56862, 'loss/train': 1.1798934936523438} -08/30/2021 23:26:25 - INFO - __main__ - Step 56864: {'lr': 0.0003487850959653708, 'samples': 10917888, 'steps': 56863, 'loss/train': 1.8737319707870483} -08/30/2021 23:26:26 - INFO - __main__ - Step 56865: {'lr': 0.0003487802210576585, 'samples': 10918080, 'steps': 56864, 'loss/train': 0.5395573973655701} -08/30/2021 23:26:27 - INFO - __main__ - Step 56866: {'lr': 0.0003487753461054375, 'samples': 10918272, 'steps': 56865, 'loss/train': 1.3379285335540771} -08/30/2021 23:26:28 - INFO - __main__ - Step 56867: {'lr': 0.00034877047110870975, 'samples': 10918464, 'steps': 56866, 'loss/train': 0.8064634799957275} -08/30/2021 23:26:28 - INFO - __main__ - Step 56868: {'lr': 0.0003487655960674776, 'samples': 10918656, 'steps': 56867, 'loss/train': 1.0082318782806396} -08/30/2021 23:26:28 - INFO - __main__ - Step 56869: {'lr': 0.00034876072098174315, 'samples': 10918848, 'steps': 56868, 'loss/train': 1.1583197116851807} -08/30/2021 23:26:29 - INFO - __main__ - Step 56870: {'lr': 0.00034875584585150864, 'samples': 10919040, 'steps': 56869, 'loss/train': 1.3216029405593872} -08/30/2021 23:26:30 - INFO - __main__ - Step 56871: {'lr': 0.0003487509706767763, 'samples': 10919232, 'steps': 56870, 'loss/train': 1.0175455808639526} -08/30/2021 23:26:31 - INFO - __main__ - Step 56872: {'lr': 0.00034874609545754826, 'samples': 10919424, 'steps': 56871, 'loss/train': 1.420638918876648} -08/30/2021 23:26:31 - INFO - __main__ - Step 56873: {'lr': 0.00034874122019382684, 'samples': 10919616, 'steps': 56872, 'loss/train': 1.0788238048553467} -08/30/2021 23:26:31 - INFO - __main__ - Step 56874: {'lr': 0.0003487363448856141, 'samples': 10919808, 'steps': 56873, 'loss/train': 1.0165424346923828} -08/30/2021 23:26:32 - INFO - __main__ - Step 56875: {'lr': 0.00034873146953291224, 'samples': 10920000, 'steps': 56874, 'loss/train': 2.25630521774292} -08/30/2021 23:26:33 - INFO - __main__ - Step 56876: {'lr': 0.0003487265941357236, 'samples': 10920192, 'steps': 56875, 'loss/train': 1.7111485004425049} -08/30/2021 23:26:34 - INFO - __main__ - Step 56877: {'lr': 0.00034872171869405015, 'samples': 10920384, 'steps': 56876, 'loss/train': 0.8773935437202454} -08/30/2021 23:26:34 - INFO - __main__ - Step 56878: {'lr': 0.0003487168432078943, 'samples': 10920576, 'steps': 56877, 'loss/train': 1.4601478576660156} -08/30/2021 23:26:34 - INFO - __main__ - Step 56879: {'lr': 0.0003487119676772582, 'samples': 10920768, 'steps': 56878, 'loss/train': 1.274673342704773} -08/30/2021 23:26:35 - INFO - __main__ - Step 56880: {'lr': 0.00034870709210214397, 'samples': 10920960, 'steps': 56879, 'loss/train': 1.341761589050293} -08/30/2021 23:26:35 - INFO - __main__ - Step 56881: {'lr': 0.00034870221648255383, 'samples': 10921152, 'steps': 56880, 'loss/train': 1.0112030506134033} -08/30/2021 23:26:37 - INFO - __main__ - Step 56882: {'lr': 0.00034869734081849, 'samples': 10921344, 'steps': 56881, 'loss/train': 0.8431229591369629} -08/30/2021 23:26:37 - INFO - __main__ - Step 56883: {'lr': 0.0003486924651099547, 'samples': 10921536, 'steps': 56882, 'loss/train': 1.5484871864318848} -08/30/2021 23:26:37 - INFO - __main__ - Step 56884: {'lr': 0.00034868758935695, 'samples': 10921728, 'steps': 56883, 'loss/train': 1.8331186771392822} -08/30/2021 23:26:38 - INFO - __main__ - Step 56885: {'lr': 0.0003486827135594783, 'samples': 10921920, 'steps': 56884, 'loss/train': 0.8448839783668518} -08/30/2021 23:26:38 - INFO - __main__ - Step 56886: {'lr': 0.0003486778377175417, 'samples': 10922112, 'steps': 56885, 'loss/train': 1.600650668144226} -08/30/2021 23:26:40 - INFO - __main__ - Step 56887: {'lr': 0.00034867296183114236, 'samples': 10922304, 'steps': 56886, 'loss/train': 0.9846146106719971} -08/30/2021 23:26:40 - INFO - __main__ - Step 56888: {'lr': 0.0003486680859002825, 'samples': 10922496, 'steps': 56887, 'loss/train': 0.8097743391990662} -08/30/2021 23:26:40 - INFO - __main__ - Step 56889: {'lr': 0.00034866320992496427, 'samples': 10922688, 'steps': 56888, 'loss/train': 1.458606481552124} -08/30/2021 23:26:41 - INFO - __main__ - Step 56890: {'lr': 0.00034865833390518996, 'samples': 10922880, 'steps': 56889, 'loss/train': 1.0616099834442139} -08/30/2021 23:26:41 - INFO - __main__ - Step 56891: {'lr': 0.0003486534578409618, 'samples': 10923072, 'steps': 56890, 'loss/train': 1.6899924278259277} -08/30/2021 23:26:43 - INFO - __main__ - Step 56892: {'lr': 0.0003486485817322819, 'samples': 10923264, 'steps': 56891, 'loss/train': 1.4150826930999756} -08/30/2021 23:26:43 - INFO - __main__ - Step 56893: {'lr': 0.0003486437055791524, 'samples': 10923456, 'steps': 56892, 'loss/train': 1.5813283920288086} -08/30/2021 23:26:43 - INFO - __main__ - Step 56894: {'lr': 0.00034863882938157553, 'samples': 10923648, 'steps': 56893, 'loss/train': 1.9637569189071655} -08/30/2021 23:26:44 - INFO - __main__ - Step 56895: {'lr': 0.0003486339531395536, 'samples': 10923840, 'steps': 56894, 'loss/train': 1.0609982013702393} -08/30/2021 23:26:44 - INFO - __main__ - Step 56896: {'lr': 0.0003486290768530887, 'samples': 10924032, 'steps': 56895, 'loss/train': 2.417832374572754} -08/30/2021 23:26:46 - INFO - __main__ - Step 56897: {'lr': 0.00034862420052218313, 'samples': 10924224, 'steps': 56896, 'loss/train': 1.2900514602661133} -08/30/2021 23:26:46 - INFO - __main__ - Step 56898: {'lr': 0.00034861932414683897, 'samples': 10924416, 'steps': 56897, 'loss/train': 1.1638840436935425} -08/30/2021 23:26:46 - INFO - __main__ - Step 56899: {'lr': 0.00034861444772705846, 'samples': 10924608, 'steps': 56898, 'loss/train': 0.8779194951057434} -08/30/2021 23:26:47 - INFO - __main__ - Step 56900: {'lr': 0.0003486095712628438, 'samples': 10924800, 'steps': 56899, 'loss/train': 1.247465968132019} -08/30/2021 23:26:47 - INFO - __main__ - Step 56901: {'lr': 0.00034860469475419723, 'samples': 10924992, 'steps': 56900, 'loss/train': 2.773620128631592} -08/30/2021 23:26:49 - INFO - __main__ - Step 56902: {'lr': 0.00034859981820112084, 'samples': 10925184, 'steps': 56901, 'loss/train': 0.9942734837532043} -08/30/2021 23:26:50 - INFO - __main__ - Step 56903: {'lr': 0.00034859494160361694, 'samples': 10925376, 'steps': 56902, 'loss/train': 1.575143814086914} -08/30/2021 23:26:50 - INFO - __main__ - Step 56904: {'lr': 0.00034859006496168764, 'samples': 10925568, 'steps': 56903, 'loss/train': 1.643119215965271} -08/30/2021 23:26:50 - INFO - __main__ - Step 56905: {'lr': 0.0003485851882753352, 'samples': 10925760, 'steps': 56904, 'loss/train': 1.9424742460250854} -08/30/2021 23:26:51 - INFO - __main__ - Step 56906: {'lr': 0.00034858031154456177, 'samples': 10925952, 'steps': 56905, 'loss/train': 0.7926269769668579} -08/30/2021 23:26:51 - INFO - __main__ - Step 56907: {'lr': 0.0003485754347693696, 'samples': 10926144, 'steps': 56906, 'loss/train': 2.12726092338562} -08/30/2021 23:26:53 - INFO - __main__ - Step 56908: {'lr': 0.0003485705579497609, 'samples': 10926336, 'steps': 56907, 'loss/train': 0.6451771259307861} -08/30/2021 23:26:53 - INFO - __main__ - Step 56909: {'lr': 0.0003485656810857378, 'samples': 10926528, 'steps': 56908, 'loss/train': 1.4209744930267334} -08/30/2021 23:26:53 - INFO - __main__ - Step 56910: {'lr': 0.00034856080417730253, 'samples': 10926720, 'steps': 56909, 'loss/train': 1.2591547966003418} -08/30/2021 23:26:54 - INFO - __main__ - Step 56911: {'lr': 0.0003485559272244572, 'samples': 10926912, 'steps': 56910, 'loss/train': 0.6976348161697388} -08/30/2021 23:26:54 - INFO - __main__ - Step 56912: {'lr': 0.0003485510502272042, 'samples': 10927104, 'steps': 56911, 'loss/train': 1.039771556854248} -08/30/2021 23:26:56 - INFO - __main__ - Step 56913: {'lr': 0.0003485461731855456, 'samples': 10927296, 'steps': 56912, 'loss/train': 1.0598288774490356} -08/30/2021 23:26:56 - INFO - __main__ - Step 56914: {'lr': 0.0003485412960994836, 'samples': 10927488, 'steps': 56913, 'loss/train': 1.3684484958648682} -08/30/2021 23:26:57 - INFO - __main__ - Step 56915: {'lr': 0.0003485364189690203, 'samples': 10927680, 'steps': 56914, 'loss/train': 1.4023346900939941} -08/30/2021 23:26:57 - INFO - __main__ - Step 56916: {'lr': 0.0003485315417941581, 'samples': 10927872, 'steps': 56915, 'loss/train': 0.8421781659126282} -08/30/2021 23:26:57 - INFO - __main__ - Step 56917: {'lr': 0.00034852666457489917, 'samples': 10928064, 'steps': 56916, 'loss/train': 2.3677730560302734} -08/30/2021 23:26:59 - INFO - __main__ - Step 56918: {'lr': 0.00034852178731124557, 'samples': 10928256, 'steps': 56917, 'loss/train': 1.5544217824935913} -08/30/2021 23:26:59 - INFO - __main__ - Step 56919: {'lr': 0.00034851691000319963, 'samples': 10928448, 'steps': 56918, 'loss/train': 1.5356897115707397} -08/30/2021 23:27:00 - INFO - __main__ - Step 56920: {'lr': 0.0003485120326507635, 'samples': 10928640, 'steps': 56919, 'loss/train': 1.115616798400879} -08/30/2021 23:27:00 - INFO - __main__ - Step 56921: {'lr': 0.0003485071552539393, 'samples': 10928832, 'steps': 56920, 'loss/train': 1.0191221237182617} -08/30/2021 23:27:00 - INFO - __main__ - Step 56922: {'lr': 0.0003485022778127293, 'samples': 10929024, 'steps': 56921, 'loss/train': 0.8920819163322449} -08/30/2021 23:27:02 - INFO - __main__ - Step 56923: {'lr': 0.0003484974003271357, 'samples': 10929216, 'steps': 56922, 'loss/train': 1.4527028799057007} -08/30/2021 23:27:03 - INFO - __main__ - Step 56924: {'lr': 0.0003484925227971607, 'samples': 10929408, 'steps': 56923, 'loss/train': 1.4513757228851318} -08/30/2021 23:27:03 - INFO - __main__ - Step 56925: {'lr': 0.0003484876452228065, 'samples': 10929600, 'steps': 56924, 'loss/train': 0.3260684311389923} -08/30/2021 23:27:03 - INFO - __main__ - Step 56926: {'lr': 0.00034848276760407525, 'samples': 10929792, 'steps': 56925, 'loss/train': 0.9382138848304749} -08/30/2021 23:27:04 - INFO - __main__ - Step 56927: {'lr': 0.0003484778899409693, 'samples': 10929984, 'steps': 56926, 'loss/train': 1.441593885421753} -08/30/2021 23:27:04 - INFO - __main__ - Step 56928: {'lr': 0.0003484730122334906, 'samples': 10930176, 'steps': 56927, 'loss/train': 1.32077956199646} -08/30/2021 23:27:06 - INFO - __main__ - Step 56929: {'lr': 0.00034846813448164153, 'samples': 10930368, 'steps': 56928, 'loss/train': 1.025976300239563} -08/30/2021 23:27:06 - INFO - __main__ - Step 56930: {'lr': 0.00034846325668542425, 'samples': 10930560, 'steps': 56929, 'loss/train': 0.12417766451835632} -08/30/2021 23:27:07 - INFO - __main__ - Step 56931: {'lr': 0.00034845837884484086, 'samples': 10930752, 'steps': 56930, 'loss/train': 1.356216311454773} -08/30/2021 23:27:07 - INFO - __main__ - Step 56932: {'lr': 0.00034845350095989377, 'samples': 10930944, 'steps': 56931, 'loss/train': 0.8414885401725769} -08/30/2021 23:27:07 - INFO - __main__ - Step 56933: {'lr': 0.000348448623030585, 'samples': 10931136, 'steps': 56932, 'loss/train': 1.196163296699524} -08/30/2021 23:27:09 - INFO - __main__ - Step 56934: {'lr': 0.00034844374505691686, 'samples': 10931328, 'steps': 56933, 'loss/train': 1.2735474109649658} -08/30/2021 23:27:09 - INFO - __main__ - Step 56935: {'lr': 0.0003484388670388914, 'samples': 10931520, 'steps': 56934, 'loss/train': 0.7008181214332581} -08/30/2021 23:27:10 - INFO - __main__ - Step 56936: {'lr': 0.0003484339889765109, 'samples': 10931712, 'steps': 56935, 'loss/train': 1.571568250656128} -08/30/2021 23:27:10 - INFO - __main__ - Step 56937: {'lr': 0.0003484291108697776, 'samples': 10931904, 'steps': 56936, 'loss/train': 0.09991992264986038} -08/30/2021 23:27:10 - INFO - __main__ - Step 56938: {'lr': 0.0003484242327186936, 'samples': 10932096, 'steps': 56937, 'loss/train': 0.8290556073188782} -08/30/2021 23:27:12 - INFO - __main__ - Step 56939: {'lr': 0.0003484193545232612, 'samples': 10932288, 'steps': 56938, 'loss/train': 1.17635977268219} -08/30/2021 23:27:12 - INFO - __main__ - Step 56940: {'lr': 0.00034841447628348267, 'samples': 10932480, 'steps': 56939, 'loss/train': 1.0960227251052856} -08/30/2021 23:27:13 - INFO - __main__ - Step 56941: {'lr': 0.00034840959799936, 'samples': 10932672, 'steps': 56940, 'loss/train': 0.6932271718978882} -08/30/2021 23:27:13 - INFO - __main__ - Step 56942: {'lr': 0.0003484047196708955, 'samples': 10932864, 'steps': 56941, 'loss/train': 1.5163533687591553} -08/30/2021 23:27:13 - INFO - __main__ - Step 56943: {'lr': 0.00034839984129809125, 'samples': 10933056, 'steps': 56942, 'loss/train': 0.9830710291862488} -08/30/2021 23:27:15 - INFO - __main__ - Step 56944: {'lr': 0.00034839496288094964, 'samples': 10933248, 'steps': 56943, 'loss/train': 1.827366590499878} -08/30/2021 23:27:16 - INFO - __main__ - Step 56945: {'lr': 0.0003483900844194728, 'samples': 10933440, 'steps': 56944, 'loss/train': 2.0420448780059814} -08/30/2021 23:27:16 - INFO - __main__ - Step 56946: {'lr': 0.00034838520591366285, 'samples': 10933632, 'steps': 56945, 'loss/train': 1.186514139175415} -08/30/2021 23:27:16 - INFO - __main__ - Step 56947: {'lr': 0.0003483803273635221, 'samples': 10933824, 'steps': 56946, 'loss/train': 1.5188438892364502} -08/30/2021 23:27:17 - INFO - __main__ - Step 56948: {'lr': 0.0003483754487690527, 'samples': 10934016, 'steps': 56947, 'loss/train': 1.1046955585479736} -08/30/2021 23:27:19 - INFO - __main__ - Step 56949: {'lr': 0.0003483705701302567, 'samples': 10934208, 'steps': 56948, 'loss/train': 0.31348347663879395} -08/30/2021 23:27:19 - INFO - __main__ - Step 56950: {'lr': 0.0003483656914471366, 'samples': 10934400, 'steps': 56949, 'loss/train': 1.2855521440505981} -08/30/2021 23:27:19 - INFO - __main__ - Step 56951: {'lr': 0.00034836081271969436, 'samples': 10934592, 'steps': 56950, 'loss/train': 1.785689115524292} -08/30/2021 23:27:20 - INFO - __main__ - Step 56952: {'lr': 0.0003483559339479323, 'samples': 10934784, 'steps': 56951, 'loss/train': 0.675041139125824} -08/30/2021 23:27:20 - INFO - __main__ - Step 56953: {'lr': 0.00034835105513185253, 'samples': 10934976, 'steps': 56952, 'loss/train': 0.06716547906398773} -08/30/2021 23:27:20 - INFO - __main__ - Step 56954: {'lr': 0.00034834617627145737, 'samples': 10935168, 'steps': 56953, 'loss/train': 1.3539644479751587} -08/30/2021 23:27:22 - INFO - __main__ - Step 56955: {'lr': 0.00034834129736674885, 'samples': 10935360, 'steps': 56954, 'loss/train': 1.0353893041610718} -08/30/2021 23:27:23 - INFO - __main__ - Step 56956: {'lr': 0.0003483364184177293, 'samples': 10935552, 'steps': 56955, 'loss/train': 1.4986668825149536} -08/30/2021 23:27:23 - INFO - __main__ - Step 56957: {'lr': 0.0003483315394244009, 'samples': 10935744, 'steps': 56956, 'loss/train': 1.6922856569290161} -08/30/2021 23:27:23 - INFO - __main__ - Step 56958: {'lr': 0.00034832666038676576, 'samples': 10935936, 'steps': 56957, 'loss/train': 1.0952831506729126} -08/30/2021 23:27:24 - INFO - __main__ - Step 56959: {'lr': 0.0003483217813048262, 'samples': 10936128, 'steps': 56958, 'loss/train': 1.5478628873825073} -08/30/2021 23:27:25 - INFO - __main__ - Step 56960: {'lr': 0.0003483169021785844, 'samples': 10936320, 'steps': 56959, 'loss/train': 1.2977089881896973} -08/30/2021 23:27:26 - INFO - __main__ - Step 56961: {'lr': 0.00034831202300804245, 'samples': 10936512, 'steps': 56960, 'loss/train': 0.5518299341201782} -08/30/2021 23:27:26 - INFO - __main__ - Step 56962: {'lr': 0.0003483071437932026, 'samples': 10936704, 'steps': 56961, 'loss/train': 0.92521733045578} -08/30/2021 23:27:27 - INFO - __main__ - Step 56963: {'lr': 0.0003483022645340671, 'samples': 10936896, 'steps': 56962, 'loss/train': 1.1264383792877197} -08/30/2021 23:27:27 - INFO - __main__ - Step 56964: {'lr': 0.0003482973852306381, 'samples': 10937088, 'steps': 56963, 'loss/train': 1.4245665073394775} -08/30/2021 23:27:29 - INFO - __main__ - Step 56965: {'lr': 0.00034829250588291785, 'samples': 10937280, 'steps': 56964, 'loss/train': 0.8493406772613525} -08/30/2021 23:27:29 - INFO - __main__ - Step 56966: {'lr': 0.00034828762649090843, 'samples': 10937472, 'steps': 56965, 'loss/train': 1.405874252319336} -08/30/2021 23:27:29 - INFO - __main__ - Step 56967: {'lr': 0.0003482827470546123, 'samples': 10937664, 'steps': 56966, 'loss/train': 1.0573389530181885} -08/30/2021 23:27:30 - INFO - __main__ - Step 56968: {'lr': 0.00034827786757403136, 'samples': 10937856, 'steps': 56967, 'loss/train': 1.6176581382751465} -08/30/2021 23:27:30 - INFO - __main__ - Step 56969: {'lr': 0.00034827298804916793, 'samples': 10938048, 'steps': 56968, 'loss/train': 1.7509671449661255} -08/30/2021 23:27:31 - INFO - __main__ - Step 56970: {'lr': 0.00034826810848002416, 'samples': 10938240, 'steps': 56969, 'loss/train': 1.8563398122787476} -08/30/2021 23:27:32 - INFO - __main__ - Step 56971: {'lr': 0.00034826322886660234, 'samples': 10938432, 'steps': 56970, 'loss/train': 0.7419421076774597} -08/30/2021 23:27:33 - INFO - __main__ - Step 56972: {'lr': 0.00034825834920890463, 'samples': 10938624, 'steps': 56971, 'loss/train': 3.262617588043213} -08/30/2021 23:27:33 - INFO - __main__ - Step 56973: {'lr': 0.00034825346950693325, 'samples': 10938816, 'steps': 56972, 'loss/train': 1.5513989925384521} -08/30/2021 23:27:33 - INFO - __main__ - Step 56974: {'lr': 0.00034824858976069043, 'samples': 10939008, 'steps': 56973, 'loss/train': 1.1741607189178467} -08/30/2021 23:27:34 - INFO - __main__ - Step 56975: {'lr': 0.00034824370997017817, 'samples': 10939200, 'steps': 56974, 'loss/train': 1.5733639001846313} -08/30/2021 23:27:35 - INFO - __main__ - Step 56976: {'lr': 0.0003482388301353989, 'samples': 10939392, 'steps': 56975, 'loss/train': 1.2643074989318848} -08/30/2021 23:27:36 - INFO - __main__ - Step 56977: {'lr': 0.0003482339502563547, 'samples': 10939584, 'steps': 56976, 'loss/train': 1.3019770383834839} -08/30/2021 23:27:36 - INFO - __main__ - Step 56978: {'lr': 0.0003482290703330478, 'samples': 10939776, 'steps': 56977, 'loss/train': 1.7001034021377563} -08/30/2021 23:27:36 - INFO - __main__ - Step 56979: {'lr': 0.0003482241903654804, 'samples': 10939968, 'steps': 56978, 'loss/train': 1.3058631420135498} -08/30/2021 23:27:37 - INFO - __main__ - Step 56980: {'lr': 0.00034821931035365465, 'samples': 10940160, 'steps': 56979, 'loss/train': 1.4733809232711792} -08/30/2021 23:27:37 - INFO - __main__ - Step 56981: {'lr': 0.0003482144302975729, 'samples': 10940352, 'steps': 56980, 'loss/train': 1.1822497844696045} -08/30/2021 23:27:38 - INFO - __main__ - Step 56982: {'lr': 0.0003482095501972372, 'samples': 10940544, 'steps': 56981, 'loss/train': 0.8622186779975891} -08/30/2021 23:27:39 - INFO - __main__ - Step 56983: {'lr': 0.0003482046700526498, 'samples': 10940736, 'steps': 56982, 'loss/train': 1.3584232330322266} -08/30/2021 23:27:39 - INFO - __main__ - Step 56984: {'lr': 0.0003481997898638128, 'samples': 10940928, 'steps': 56983, 'loss/train': 0.6189478635787964} -08/30/2021 23:27:40 - INFO - __main__ - Step 56985: {'lr': 0.0003481949096307285, 'samples': 10941120, 'steps': 56984, 'loss/train': 1.907167673110962} -08/30/2021 23:27:40 - INFO - __main__ - Step 56986: {'lr': 0.0003481900293533992, 'samples': 10941312, 'steps': 56985, 'loss/train': 1.4248418807983398} -08/30/2021 23:27:42 - INFO - __main__ - Step 56987: {'lr': 0.00034818514903182696, 'samples': 10941504, 'steps': 56986, 'loss/train': 1.3281067609786987} -08/30/2021 23:27:42 - INFO - __main__ - Step 56988: {'lr': 0.000348180268666014, 'samples': 10941696, 'steps': 56987, 'loss/train': 0.9966983199119568} -08/30/2021 23:27:43 - INFO - __main__ - Step 56989: {'lr': 0.00034817538825596253, 'samples': 10941888, 'steps': 56988, 'loss/train': 0.027598761022090912} -08/30/2021 23:27:43 - INFO - __main__ - Step 56990: {'lr': 0.0003481705078016747, 'samples': 10942080, 'steps': 56989, 'loss/train': 1.2920674085617065} -08/30/2021 23:27:43 - INFO - __main__ - Step 56991: {'lr': 0.0003481656273031527, 'samples': 10942272, 'steps': 56990, 'loss/train': 0.04102129861712456} -08/30/2021 23:27:44 - INFO - __main__ - Step 56992: {'lr': 0.0003481607467603989, 'samples': 10942464, 'steps': 56991, 'loss/train': 1.7848039865493774} -08/30/2021 23:27:45 - INFO - __main__ - Step 56993: {'lr': 0.00034815586617341533, 'samples': 10942656, 'steps': 56992, 'loss/train': 1.2939101457595825} -08/30/2021 23:27:46 - INFO - __main__ - Step 56994: {'lr': 0.0003481509855422043, 'samples': 10942848, 'steps': 56993, 'loss/train': 1.4614652395248413} -08/30/2021 23:27:46 - INFO - __main__ - Step 56995: {'lr': 0.0003481461048667679, 'samples': 10943040, 'steps': 56994, 'loss/train': 1.739587426185608} -08/30/2021 23:27:46 - INFO - __main__ - Step 56996: {'lr': 0.00034814122414710837, 'samples': 10943232, 'steps': 56995, 'loss/train': 1.281952977180481} -08/30/2021 23:27:47 - INFO - __main__ - Step 56997: {'lr': 0.0003481363433832279, 'samples': 10943424, 'steps': 56996, 'loss/train': 1.574078917503357} -08/30/2021 23:27:48 - INFO - __main__ - Step 56998: {'lr': 0.00034813146257512876, 'samples': 10943616, 'steps': 56997, 'loss/train': 1.3837085962295532} -08/30/2021 23:27:49 - INFO - __main__ - Step 56999: {'lr': 0.0003481265817228131, 'samples': 10943808, 'steps': 56998, 'loss/train': 0.921924889087677} -08/30/2021 23:27:49 - INFO - __main__ - Step 57000: {'lr': 0.00034812170082628303, 'samples': 10944000, 'steps': 56999, 'loss/train': 0.2893299460411072} -08/30/2021 23:27:49 - INFO - __main__ - Step 57001: {'lr': 0.00034811681988554095, 'samples': 10944192, 'steps': 57000, 'loss/train': 1.6056768894195557} -08/30/2021 23:27:50 - INFO - __main__ - Step 57002: {'lr': 0.0003481119389005889, 'samples': 10944384, 'steps': 57001, 'loss/train': 1.6358243227005005} -08/30/2021 23:27:51 - INFO - __main__ - Step 57003: {'lr': 0.0003481070578714291, 'samples': 10944576, 'steps': 57002, 'loss/train': 0.12685905396938324} -08/30/2021 23:27:52 - INFO - __main__ - Step 57004: {'lr': 0.0003481021767980638, 'samples': 10944768, 'steps': 57003, 'loss/train': 1.4461734294891357} -08/30/2021 23:27:52 - INFO - __main__ - Step 57005: {'lr': 0.00034809729568049513, 'samples': 10944960, 'steps': 57004, 'loss/train': 1.7054307460784912} -08/30/2021 23:27:52 - INFO - __main__ - Step 57006: {'lr': 0.0003480924145187254, 'samples': 10945152, 'steps': 57005, 'loss/train': 1.0822632312774658} -08/30/2021 23:27:53 - INFO - __main__ - Step 57007: {'lr': 0.0003480875333127567, 'samples': 10945344, 'steps': 57006, 'loss/train': 1.6099203824996948} -08/30/2021 23:27:54 - INFO - __main__ - Step 57008: {'lr': 0.0003480826520625913, 'samples': 10945536, 'steps': 57007, 'loss/train': 1.3697259426116943} -08/30/2021 23:27:55 - INFO - __main__ - Step 57009: {'lr': 0.0003480777707682313, 'samples': 10945728, 'steps': 57008, 'loss/train': 1.7698712348937988} -08/30/2021 23:27:55 - INFO - __main__ - Step 57010: {'lr': 0.00034807288942967905, 'samples': 10945920, 'steps': 57009, 'loss/train': 1.7093955278396606} -08/30/2021 23:27:55 - INFO - __main__ - Step 57011: {'lr': 0.0003480680080469366, 'samples': 10946112, 'steps': 57010, 'loss/train': 2.058028221130371} -08/30/2021 23:27:56 - INFO - __main__ - Step 57012: {'lr': 0.0003480631266200063, 'samples': 10946304, 'steps': 57011, 'loss/train': 1.3001831769943237} -08/30/2021 23:27:58 - INFO - __main__ - Step 57013: {'lr': 0.0003480582451488902, 'samples': 10946496, 'steps': 57012, 'loss/train': 0.9852659702301025} -08/30/2021 23:27:58 - INFO - __main__ - Step 57014: {'lr': 0.00034805336363359066, 'samples': 10946688, 'steps': 57013, 'loss/train': 1.2243127822875977} -08/30/2021 23:27:59 - INFO - __main__ - Step 57015: {'lr': 0.00034804848207410974, 'samples': 10946880, 'steps': 57014, 'loss/train': 1.3231433629989624} -08/30/2021 23:27:59 - INFO - __main__ - Step 57016: {'lr': 0.00034804360047044965, 'samples': 10947072, 'steps': 57015, 'loss/train': 1.360616683959961} -08/30/2021 23:27:59 - INFO - __main__ - Step 57017: {'lr': 0.0003480387188226126, 'samples': 10947264, 'steps': 57016, 'loss/train': 1.3785102367401123} -08/30/2021 23:28:01 - INFO - __main__ - Step 57018: {'lr': 0.0003480338371306009, 'samples': 10947456, 'steps': 57017, 'loss/train': 0.46699249744415283} -08/30/2021 23:28:01 - INFO - __main__ - Step 57019: {'lr': 0.0003480289553944166, 'samples': 10947648, 'steps': 57018, 'loss/train': 1.6604140996932983} -08/30/2021 23:28:02 - INFO - __main__ - Step 57020: {'lr': 0.000348024073614062, 'samples': 10947840, 'steps': 57019, 'loss/train': 1.2705460786819458} -08/30/2021 23:28:02 - INFO - __main__ - Step 57021: {'lr': 0.0003480191917895393, 'samples': 10948032, 'steps': 57020, 'loss/train': 1.3671238422393799} -08/30/2021 23:28:03 - INFO - __main__ - Step 57022: {'lr': 0.0003480143099208506, 'samples': 10948224, 'steps': 57021, 'loss/train': 1.883851170539856} -08/30/2021 23:28:03 - INFO - __main__ - Step 57023: {'lr': 0.00034800942800799817, 'samples': 10948416, 'steps': 57022, 'loss/train': 0.9469725489616394} -08/30/2021 23:28:04 - INFO - __main__ - Step 57024: {'lr': 0.00034800454605098417, 'samples': 10948608, 'steps': 57023, 'loss/train': 1.3060386180877686} -08/30/2021 23:28:05 - INFO - __main__ - Step 57025: {'lr': 0.00034799966404981095, 'samples': 10948800, 'steps': 57024, 'loss/train': 1.7397828102111816} -08/30/2021 23:28:05 - INFO - __main__ - Step 57026: {'lr': 0.00034799478200448056, 'samples': 10948992, 'steps': 57025, 'loss/train': 1.2919104099273682} -08/30/2021 23:28:05 - INFO - __main__ - Step 57027: {'lr': 0.0003479898999149952, 'samples': 10949184, 'steps': 57026, 'loss/train': 1.7795907258987427} -08/30/2021 23:28:06 - INFO - __main__ - Step 57028: {'lr': 0.00034798501778135704, 'samples': 10949376, 'steps': 57027, 'loss/train': 1.0661389827728271} -08/30/2021 23:28:07 - INFO - __main__ - Step 57029: {'lr': 0.0003479801356035684, 'samples': 10949568, 'steps': 57028, 'loss/train': 1.827704668045044} -08/30/2021 23:28:08 - INFO - __main__ - Step 57030: {'lr': 0.0003479752533816315, 'samples': 10949760, 'steps': 57029, 'loss/train': 1.6550542116165161} -08/30/2021 23:28:08 - INFO - __main__ - Step 57031: {'lr': 0.0003479703711155484, 'samples': 10949952, 'steps': 57030, 'loss/train': 1.2261172533035278} -08/30/2021 23:28:08 - INFO - __main__ - Step 57032: {'lr': 0.00034796548880532135, 'samples': 10950144, 'steps': 57031, 'loss/train': 1.2753974199295044} -08/30/2021 23:28:09 - INFO - __main__ - Step 57033: {'lr': 0.0003479606064509526, 'samples': 10950336, 'steps': 57032, 'loss/train': 1.0902739763259888} -08/30/2021 23:28:10 - INFO - __main__ - Step 57034: {'lr': 0.00034795572405244425, 'samples': 10950528, 'steps': 57033, 'loss/train': 1.6735591888427734} -08/30/2021 23:28:11 - INFO - __main__ - Step 57035: {'lr': 0.0003479508416097986, 'samples': 10950720, 'steps': 57034, 'loss/train': 0.887643575668335} -08/30/2021 23:28:11 - INFO - __main__ - Step 57036: {'lr': 0.0003479459591230177, 'samples': 10950912, 'steps': 57035, 'loss/train': 1.2060307264328003} -08/30/2021 23:28:12 - INFO - __main__ - Step 57037: {'lr': 0.0003479410765921041, 'samples': 10951104, 'steps': 57036, 'loss/train': 1.460170030593872} -08/30/2021 23:28:12 - INFO - __main__ - Step 57038: {'lr': 0.0003479361940170596, 'samples': 10951296, 'steps': 57037, 'loss/train': 1.211076259613037} -08/30/2021 23:28:13 - INFO - __main__ - Step 57039: {'lr': 0.0003479313113978866, 'samples': 10951488, 'steps': 57038, 'loss/train': 1.531976342201233} -08/30/2021 23:28:14 - INFO - __main__ - Step 57040: {'lr': 0.00034792642873458725, 'samples': 10951680, 'steps': 57039, 'loss/train': 0.9424772262573242} -08/30/2021 23:28:14 - INFO - __main__ - Step 57041: {'lr': 0.00034792154602716376, 'samples': 10951872, 'steps': 57040, 'loss/train': 1.2763078212738037} -08/30/2021 23:28:15 - INFO - __main__ - Step 57042: {'lr': 0.0003479166632756184, 'samples': 10952064, 'steps': 57041, 'loss/train': 1.8003580570220947} -08/30/2021 23:28:15 - INFO - __main__ - Step 57043: {'lr': 0.0003479117804799532, 'samples': 10952256, 'steps': 57042, 'loss/train': 1.2753196954727173} -08/30/2021 23:28:17 - INFO - __main__ - Step 57044: {'lr': 0.00034790689764017046, 'samples': 10952448, 'steps': 57043, 'loss/train': 2.989809036254883} -08/30/2021 23:28:17 - INFO - __main__ - Step 57045: {'lr': 0.00034790201475627246, 'samples': 10952640, 'steps': 57044, 'loss/train': 1.1062965393066406} -08/30/2021 23:28:18 - INFO - __main__ - Step 57046: {'lr': 0.00034789713182826126, 'samples': 10952832, 'steps': 57045, 'loss/train': 0.4613654911518097} -08/30/2021 23:28:18 - INFO - __main__ - Step 57047: {'lr': 0.0003478922488561392, 'samples': 10953024, 'steps': 57046, 'loss/train': 1.091480016708374} -08/30/2021 23:28:18 - INFO - __main__ - Step 57048: {'lr': 0.0003478873658399084, 'samples': 10953216, 'steps': 57047, 'loss/train': 1.351733684539795} -08/30/2021 23:28:19 - INFO - __main__ - Step 57049: {'lr': 0.000347882482779571, 'samples': 10953408, 'steps': 57048, 'loss/train': 1.7358691692352295} -08/30/2021 23:28:20 - INFO - __main__ - Step 57050: {'lr': 0.00034787759967512923, 'samples': 10953600, 'steps': 57049, 'loss/train': 1.3204859495162964} -08/30/2021 23:28:21 - INFO - __main__ - Step 57051: {'lr': 0.00034787271652658534, 'samples': 10953792, 'steps': 57050, 'loss/train': 0.9837892651557922} -08/30/2021 23:28:21 - INFO - __main__ - Step 57052: {'lr': 0.0003478678333339416, 'samples': 10953984, 'steps': 57051, 'loss/train': 1.5108966827392578} -08/30/2021 23:28:21 - INFO - __main__ - Step 57053: {'lr': 0.0003478629500972, 'samples': 10954176, 'steps': 57052, 'loss/train': 2.1211483478546143} -08/30/2021 23:28:22 - INFO - __main__ - Step 57054: {'lr': 0.0003478580668163631, 'samples': 10954368, 'steps': 57053, 'loss/train': 0.46269649267196655} -08/30/2021 23:28:23 - INFO - __main__ - Step 57055: {'lr': 0.0003478531834914326, 'samples': 10954560, 'steps': 57054, 'loss/train': 1.3709542751312256} -08/30/2021 23:28:24 - INFO - __main__ - Step 57056: {'lr': 0.0003478483001224111, 'samples': 10954752, 'steps': 57055, 'loss/train': 0.7645677924156189} -08/30/2021 23:28:24 - INFO - __main__ - Step 57057: {'lr': 0.00034784341670930066, 'samples': 10954944, 'steps': 57056, 'loss/train': 1.2185145616531372} -08/30/2021 23:28:24 - INFO - __main__ - Step 57058: {'lr': 0.00034783853325210344, 'samples': 10955136, 'steps': 57057, 'loss/train': 1.0981371402740479} -08/30/2021 23:28:25 - INFO - __main__ - Step 57059: {'lr': 0.0003478336497508217, 'samples': 10955328, 'steps': 57058, 'loss/train': 1.5518289804458618} -08/30/2021 23:28:27 - INFO - __main__ - Step 57060: {'lr': 0.0003478287662054576, 'samples': 10955520, 'steps': 57059, 'loss/train': 1.1390094757080078} -08/30/2021 23:28:27 - INFO - __main__ - Step 57061: {'lr': 0.0003478238826160135, 'samples': 10955712, 'steps': 57060, 'loss/train': 1.8684204816818237} -08/30/2021 23:28:27 - INFO - __main__ - Step 57062: {'lr': 0.00034781899898249136, 'samples': 10955904, 'steps': 57061, 'loss/train': 1.1276425123214722} -08/30/2021 23:28:28 - INFO - __main__ - Step 57063: {'lr': 0.0003478141153048935, 'samples': 10956096, 'steps': 57062, 'loss/train': 1.4150640964508057} -08/30/2021 23:28:28 - INFO - __main__ - Step 57064: {'lr': 0.0003478092315832221, 'samples': 10956288, 'steps': 57063, 'loss/train': 0.06745883077383041} -08/30/2021 23:28:30 - INFO - __main__ - Step 57065: {'lr': 0.00034780434781747936, 'samples': 10956480, 'steps': 57064, 'loss/train': 1.5051709413528442} -08/30/2021 23:28:31 - INFO - __main__ - Step 57066: {'lr': 0.0003477994640076675, 'samples': 10956672, 'steps': 57065, 'loss/train': 1.1805298328399658} -08/30/2021 23:28:31 - INFO - __main__ - Step 57067: {'lr': 0.00034779458015378874, 'samples': 10956864, 'steps': 57066, 'loss/train': 1.2429498434066772} -08/30/2021 23:28:31 - INFO - __main__ - Step 57068: {'lr': 0.00034778969625584523, 'samples': 10957056, 'steps': 57067, 'loss/train': 1.4781283140182495} -08/30/2021 23:28:32 - INFO - __main__ - Step 57069: {'lr': 0.0003477848123138392, 'samples': 10957248, 'steps': 57068, 'loss/train': 1.6229937076568604} -08/30/2021 23:28:33 - INFO - __main__ - Step 57070: {'lr': 0.0003477799283277728, 'samples': 10957440, 'steps': 57069, 'loss/train': 1.5744439363479614} -08/30/2021 23:28:34 - INFO - __main__ - Step 57071: {'lr': 0.0003477750442976483, 'samples': 10957632, 'steps': 57070, 'loss/train': 1.632590413093567} -08/30/2021 23:28:34 - INFO - __main__ - Step 57072: {'lr': 0.0003477701602234679, 'samples': 10957824, 'steps': 57071, 'loss/train': 1.1744002103805542} -08/30/2021 23:28:34 - INFO - __main__ - Step 57073: {'lr': 0.00034776527610523377, 'samples': 10958016, 'steps': 57072, 'loss/train': 0.2698575556278229} -08/30/2021 23:28:35 - INFO - __main__ - Step 57074: {'lr': 0.00034776039194294806, 'samples': 10958208, 'steps': 57073, 'loss/train': 1.3911490440368652} -08/30/2021 23:28:35 - INFO - __main__ - Step 57075: {'lr': 0.0003477555077366131, 'samples': 10958400, 'steps': 57074, 'loss/train': 1.7398079633712769} -08/30/2021 23:28:37 - INFO - __main__ - Step 57076: {'lr': 0.000347750623486231, 'samples': 10958592, 'steps': 57075, 'loss/train': 1.3328917026519775} -08/30/2021 23:28:37 - INFO - __main__ - Step 57077: {'lr': 0.00034774573919180396, 'samples': 10958784, 'steps': 57076, 'loss/train': 1.9911900758743286} -08/30/2021 23:28:37 - INFO - __main__ - Step 57078: {'lr': 0.0003477408548533342, 'samples': 10958976, 'steps': 57077, 'loss/train': 1.19882071018219} -08/30/2021 23:28:38 - INFO - __main__ - Step 57079: {'lr': 0.0003477359704708239, 'samples': 10959168, 'steps': 57078, 'loss/train': 0.9224775433540344} -08/30/2021 23:28:38 - INFO - __main__ - Step 57080: {'lr': 0.00034773108604427527, 'samples': 10959360, 'steps': 57079, 'loss/train': 0.20800741016864777} -08/30/2021 23:28:40 - INFO - __main__ - Step 57081: {'lr': 0.0003477262015736906, 'samples': 10959552, 'steps': 57080, 'loss/train': 1.3875374794006348} -08/30/2021 23:28:40 - INFO - __main__ - Step 57082: {'lr': 0.000347721317059072, 'samples': 10959744, 'steps': 57081, 'loss/train': 1.4149136543273926} -08/30/2021 23:28:41 - INFO - __main__ - Step 57083: {'lr': 0.00034771643250042163, 'samples': 10959936, 'steps': 57082, 'loss/train': 1.4568796157836914} -08/30/2021 23:28:41 - INFO - __main__ - Step 57084: {'lr': 0.0003477115478977417, 'samples': 10960128, 'steps': 57083, 'loss/train': 1.1072320938110352} -08/30/2021 23:28:42 - INFO - __main__ - Step 57085: {'lr': 0.0003477066632510346, 'samples': 10960320, 'steps': 57084, 'loss/train': 1.9716097116470337} -08/30/2021 23:28:43 - INFO - __main__ - Step 57086: {'lr': 0.00034770177856030223, 'samples': 10960512, 'steps': 57085, 'loss/train': 1.5158183574676514} -08/30/2021 23:28:43 - INFO - __main__ - Step 57087: {'lr': 0.00034769689382554704, 'samples': 10960704, 'steps': 57086, 'loss/train': 1.1423659324645996} -08/30/2021 23:28:44 - INFO - __main__ - Step 57088: {'lr': 0.0003476920090467711, 'samples': 10960896, 'steps': 57087, 'loss/train': 1.2910465002059937} -08/30/2021 23:28:44 - INFO - __main__ - Step 57089: {'lr': 0.0003476871242239767, 'samples': 10961088, 'steps': 57088, 'loss/train': 1.1581976413726807} -08/30/2021 23:28:44 - INFO - __main__ - Step 57090: {'lr': 0.0003476822393571659, 'samples': 10961280, 'steps': 57089, 'loss/train': 0.948721706867218} -08/30/2021 23:28:46 - INFO - __main__ - Step 57091: {'lr': 0.00034767735444634105, 'samples': 10961472, 'steps': 57090, 'loss/train': 1.1170225143432617} -08/30/2021 23:28:46 - INFO - __main__ - Step 57092: {'lr': 0.00034767246949150425, 'samples': 10961664, 'steps': 57091, 'loss/train': 1.2649356126785278} -08/30/2021 23:28:47 - INFO - __main__ - Step 57093: {'lr': 0.0003476675844926578, 'samples': 10961856, 'steps': 57092, 'loss/train': 0.8574861288070679} -08/30/2021 23:28:47 - INFO - __main__ - Step 57094: {'lr': 0.0003476626994498038, 'samples': 10962048, 'steps': 57093, 'loss/train': 1.4239813089370728} -08/30/2021 23:28:48 - INFO - __main__ - Step 57095: {'lr': 0.0003476578143629445, 'samples': 10962240, 'steps': 57094, 'loss/train': 1.4719583988189697} -08/30/2021 23:28:49 - INFO - __main__ - Step 57096: {'lr': 0.0003476529292320821, 'samples': 10962432, 'steps': 57095, 'loss/train': 0.0870312973856926} -08/30/2021 23:28:50 - INFO - __main__ - Step 57097: {'lr': 0.00034764804405721885, 'samples': 10962624, 'steps': 57096, 'loss/train': 1.0821385383605957} -08/30/2021 23:28:50 - INFO - __main__ - Step 57098: {'lr': 0.0003476431588383568, 'samples': 10962816, 'steps': 57097, 'loss/train': 0.9208717942237854} -08/30/2021 23:28:51 - INFO - __main__ - Step 57099: {'lr': 0.0003476382735754983, 'samples': 10963008, 'steps': 57098, 'loss/train': 2.2821109294891357} -08/30/2021 23:28:51 - INFO - __main__ - Step 57100: {'lr': 0.00034763338826864556, 'samples': 10963200, 'steps': 57099, 'loss/train': 1.2312923669815063} -08/30/2021 23:28:51 - INFO - __main__ - Step 57101: {'lr': 0.0003476285029178006, 'samples': 10963392, 'steps': 57100, 'loss/train': 1.197237253189087} -08/30/2021 23:28:53 - INFO - __main__ - Step 57102: {'lr': 0.0003476236175229659, 'samples': 10963584, 'steps': 57101, 'loss/train': 1.3694525957107544} -08/30/2021 23:28:53 - INFO - __main__ - Step 57103: {'lr': 0.0003476187320841434, 'samples': 10963776, 'steps': 57102, 'loss/train': 0.8848452568054199} -08/30/2021 23:28:54 - INFO - __main__ - Step 57104: {'lr': 0.0003476138466013354, 'samples': 10963968, 'steps': 57103, 'loss/train': 1.741289734840393} -08/30/2021 23:28:54 - INFO - __main__ - Step 57105: {'lr': 0.00034760896107454407, 'samples': 10964160, 'steps': 57104, 'loss/train': 1.1370725631713867} -08/30/2021 23:28:54 - INFO - __main__ - Step 57106: {'lr': 0.0003476040755037717, 'samples': 10964352, 'steps': 57105, 'loss/train': 0.9621631503105164} -08/30/2021 23:28:56 - INFO - __main__ - Step 57107: {'lr': 0.00034759918988902045, 'samples': 10964544, 'steps': 57106, 'loss/train': 1.4363473653793335} -08/30/2021 23:28:56 - INFO - __main__ - Step 57108: {'lr': 0.00034759430423029255, 'samples': 10964736, 'steps': 57107, 'loss/train': 1.2451115846633911} -08/30/2021 23:28:56 - INFO - __main__ - Step 57109: {'lr': 0.0003475894185275901, 'samples': 10964928, 'steps': 57108, 'loss/train': 1.2458856105804443} -08/30/2021 23:28:57 - INFO - __main__ - Step 57110: {'lr': 0.00034758453278091537, 'samples': 10965120, 'steps': 57109, 'loss/train': 1.2270549535751343} -08/30/2021 23:28:57 - INFO - __main__ - Step 57111: {'lr': 0.00034757964699027054, 'samples': 10965312, 'steps': 57110, 'loss/train': 0.7215399146080017} -08/30/2021 23:28:59 - INFO - __main__ - Step 57112: {'lr': 0.0003475747611556579, 'samples': 10965504, 'steps': 57111, 'loss/train': 1.2529476881027222} -08/30/2021 23:28:59 - INFO - __main__ - Step 57113: {'lr': 0.0003475698752770795, 'samples': 10965696, 'steps': 57112, 'loss/train': 1.3845411539077759} -08/30/2021 23:29:00 - INFO - __main__ - Step 57114: {'lr': 0.0003475649893545376, 'samples': 10965888, 'steps': 57113, 'loss/train': 1.965736985206604} -08/30/2021 23:29:00 - INFO - __main__ - Step 57115: {'lr': 0.0003475601033880346, 'samples': 10966080, 'steps': 57114, 'loss/train': 1.243262529373169} -08/30/2021 23:29:00 - INFO - __main__ - Step 57116: {'lr': 0.00034755521737757237, 'samples': 10966272, 'steps': 57115, 'loss/train': 0.61931973695755} -08/30/2021 23:29:02 - INFO - __main__ - Step 57117: {'lr': 0.0003475503313231533, 'samples': 10966464, 'steps': 57116, 'loss/train': 1.5781577825546265} -08/30/2021 23:29:03 - INFO - __main__ - Step 57118: {'lr': 0.0003475454452247795, 'samples': 10966656, 'steps': 57117, 'loss/train': 1.2548880577087402} -08/30/2021 23:29:03 - INFO - __main__ - Step 57119: {'lr': 0.00034754055908245326, 'samples': 10966848, 'steps': 57118, 'loss/train': 1.4524797201156616} -08/30/2021 23:29:03 - INFO - __main__ - Step 57120: {'lr': 0.0003475356728961767, 'samples': 10967040, 'steps': 57119, 'loss/train': 0.4162448048591614} -08/30/2021 23:29:04 - INFO - __main__ - Step 57121: {'lr': 0.0003475307866659522, 'samples': 10967232, 'steps': 57120, 'loss/train': 1.1524730920791626} -08/30/2021 23:29:04 - INFO - __main__ - Step 57122: {'lr': 0.00034752590039178175, 'samples': 10967424, 'steps': 57121, 'loss/train': 1.103222131729126} -08/30/2021 23:29:06 - INFO - __main__ - Step 57123: {'lr': 0.00034752101407366763, 'samples': 10967616, 'steps': 57122, 'loss/train': 1.4923452138900757} -08/30/2021 23:29:06 - INFO - __main__ - Step 57124: {'lr': 0.00034751612771161214, 'samples': 10967808, 'steps': 57123, 'loss/train': 0.8017433285713196} -08/30/2021 23:29:07 - INFO - __main__ - Step 57125: {'lr': 0.0003475112413056173, 'samples': 10968000, 'steps': 57124, 'loss/train': 1.3620872497558594} -08/30/2021 23:29:07 - INFO - __main__ - Step 57126: {'lr': 0.0003475063548556854, 'samples': 10968192, 'steps': 57125, 'loss/train': 1.1595778465270996} -08/30/2021 23:29:07 - INFO - __main__ - Step 57127: {'lr': 0.0003475014683618186, 'samples': 10968384, 'steps': 57126, 'loss/train': 1.7068578004837036} -08/30/2021 23:29:09 - INFO - __main__ - Step 57128: {'lr': 0.00034749658182401923, 'samples': 10968576, 'steps': 57127, 'loss/train': 1.121332049369812} -08/30/2021 23:29:09 - INFO - __main__ - Step 57129: {'lr': 0.00034749169524228937, 'samples': 10968768, 'steps': 57128, 'loss/train': 1.7508058547973633} -08/30/2021 23:29:10 - INFO - __main__ - Step 57130: {'lr': 0.0003474868086166312, 'samples': 10968960, 'steps': 57129, 'loss/train': 1.5395227670669556} -08/30/2021 23:29:10 - INFO - __main__ - Step 57131: {'lr': 0.0003474819219470471, 'samples': 10969152, 'steps': 57130, 'loss/train': 0.41437631845474243} -08/30/2021 23:29:10 - INFO - __main__ - Step 57132: {'lr': 0.0003474770352335391, 'samples': 10969344, 'steps': 57131, 'loss/train': 1.6383030414581299} -08/30/2021 23:29:12 - INFO - __main__ - Step 57133: {'lr': 0.00034747214847610943, 'samples': 10969536, 'steps': 57132, 'loss/train': 1.3294097185134888} -08/30/2021 23:29:13 - INFO - __main__ - Step 57134: {'lr': 0.00034746726167476027, 'samples': 10969728, 'steps': 57133, 'loss/train': 1.0824010372161865} -08/30/2021 23:29:13 - INFO - __main__ - Step 57135: {'lr': 0.00034746237482949393, 'samples': 10969920, 'steps': 57134, 'loss/train': 1.1900538206100464} -08/30/2021 23:29:13 - INFO - __main__ - Step 57136: {'lr': 0.0003474574879403126, 'samples': 10970112, 'steps': 57135, 'loss/train': 1.5479648113250732} -08/30/2021 23:29:14 - INFO - __main__ - Step 57137: {'lr': 0.0003474526010072183, 'samples': 10970304, 'steps': 57136, 'loss/train': 1.5143964290618896} -08/30/2021 23:29:15 - INFO - __main__ - Step 57138: {'lr': 0.0003474477140302134, 'samples': 10970496, 'steps': 57137, 'loss/train': 1.0015833377838135} -08/30/2021 23:29:16 - INFO - __main__ - Step 57139: {'lr': 0.0003474428270093001, 'samples': 10970688, 'steps': 57138, 'loss/train': 1.3740386962890625} -08/30/2021 23:29:16 - INFO - __main__ - Step 57140: {'lr': 0.00034743793994448057, 'samples': 10970880, 'steps': 57139, 'loss/train': 0.6994947195053101} -08/30/2021 23:29:16 - INFO - __main__ - Step 57141: {'lr': 0.000347433052835757, 'samples': 10971072, 'steps': 57140, 'loss/train': 1.0940190553665161} -08/30/2021 23:29:17 - INFO - __main__ - Step 57142: {'lr': 0.00034742816568313165, 'samples': 10971264, 'steps': 57141, 'loss/train': 1.4684149026870728} -08/30/2021 23:29:18 - INFO - __main__ - Step 57143: {'lr': 0.0003474232784866066, 'samples': 10971456, 'steps': 57142, 'loss/train': 1.1760928630828857} -08/30/2021 23:29:19 - INFO - __main__ - Step 57144: {'lr': 0.0003474183912461841, 'samples': 10971648, 'steps': 57143, 'loss/train': 2.027261257171631} -08/30/2021 23:29:19 - INFO - __main__ - Step 57145: {'lr': 0.00034741350396186646, 'samples': 10971840, 'steps': 57144, 'loss/train': 1.074097990989685} -08/30/2021 23:29:19 - INFO - __main__ - Step 57146: {'lr': 0.0003474086166336557, 'samples': 10972032, 'steps': 57145, 'loss/train': 1.24247407913208} -08/30/2021 23:29:20 - INFO - __main__ - Step 57147: {'lr': 0.0003474037292615542, 'samples': 10972224, 'steps': 57146, 'loss/train': 0.44781938195228577} -08/30/2021 23:29:20 - INFO - __main__ - Step 57148: {'lr': 0.000347398841845564, 'samples': 10972416, 'steps': 57147, 'loss/train': 2.132817029953003} -08/30/2021 23:29:22 - INFO - __main__ - Step 57149: {'lr': 0.0003473939543856875, 'samples': 10972608, 'steps': 57148, 'loss/train': 2.1498522758483887} -08/30/2021 23:29:22 - INFO - __main__ - Step 57150: {'lr': 0.00034738906688192673, 'samples': 10972800, 'steps': 57149, 'loss/train': 1.2391046285629272} -08/30/2021 23:29:22 - INFO - __main__ - Step 57151: {'lr': 0.0003473841793342839, 'samples': 10972992, 'steps': 57150, 'loss/train': 1.5860317945480347} -08/30/2021 23:29:23 - INFO - __main__ - Step 57152: {'lr': 0.00034737929174276133, 'samples': 10973184, 'steps': 57151, 'loss/train': 0.9298214912414551} -08/30/2021 23:29:23 - INFO - __main__ - Step 57153: {'lr': 0.0003473744041073611, 'samples': 10973376, 'steps': 57152, 'loss/train': 1.6825424432754517} -08/30/2021 23:29:25 - INFO - __main__ - Step 57154: {'lr': 0.0003473695164280855, 'samples': 10973568, 'steps': 57153, 'loss/train': 1.3954739570617676} -08/30/2021 23:29:25 - INFO - __main__ - Step 57155: {'lr': 0.0003473646287049368, 'samples': 10973760, 'steps': 57154, 'loss/train': 1.3306450843811035} -08/30/2021 23:29:25 - INFO - __main__ - Step 57156: {'lr': 0.00034735974093791697, 'samples': 10973952, 'steps': 57155, 'loss/train': 0.9474577307701111} -08/30/2021 23:29:26 - INFO - __main__ - Step 57157: {'lr': 0.00034735485312702835, 'samples': 10974144, 'steps': 57156, 'loss/train': 1.37650465965271} -08/30/2021 23:29:26 - INFO - __main__ - Step 57158: {'lr': 0.00034734996527227313, 'samples': 10974336, 'steps': 57157, 'loss/train': 1.4231430292129517} -08/30/2021 23:29:28 - INFO - __main__ - Step 57159: {'lr': 0.0003473450773736536, 'samples': 10974528, 'steps': 57158, 'loss/train': 1.218062400817871} -08/30/2021 23:29:29 - INFO - __main__ - Step 57160: {'lr': 0.00034734018943117183, 'samples': 10974720, 'steps': 57159, 'loss/train': 0.9181489944458008} -08/30/2021 23:29:29 - INFO - __main__ - Step 57161: {'lr': 0.00034733530144483003, 'samples': 10974912, 'steps': 57160, 'loss/train': 1.6676217317581177} -08/30/2021 23:29:29 - INFO - __main__ - Step 57162: {'lr': 0.0003473304134146305, 'samples': 10975104, 'steps': 57161, 'loss/train': 1.4537638425827026} -08/30/2021 23:29:30 - INFO - __main__ - Step 57163: {'lr': 0.0003473255253405754, 'samples': 10975296, 'steps': 57162, 'loss/train': 1.1282438039779663} -08/30/2021 23:29:30 - INFO - __main__ - Step 57164: {'lr': 0.0003473206372226668, 'samples': 10975488, 'steps': 57163, 'loss/train': 0.19694505631923676} -08/30/2021 23:29:32 - INFO - __main__ - Step 57165: {'lr': 0.0003473157490609071, 'samples': 10975680, 'steps': 57164, 'loss/train': 1.4446901082992554} -08/30/2021 23:29:32 - INFO - __main__ - Step 57166: {'lr': 0.0003473108608552985, 'samples': 10975872, 'steps': 57165, 'loss/train': 1.3291525840759277} -08/30/2021 23:29:32 - INFO - __main__ - Step 57167: {'lr': 0.00034730597260584304, 'samples': 10976064, 'steps': 57166, 'loss/train': 1.3511080741882324} -08/30/2021 23:29:33 - INFO - __main__ - Step 57168: {'lr': 0.0003473010843125431, 'samples': 10976256, 'steps': 57167, 'loss/train': 0.6470757126808167} -08/30/2021 23:29:33 - INFO - __main__ - Step 57169: {'lr': 0.0003472961959754007, 'samples': 10976448, 'steps': 57168, 'loss/train': 1.8624001741409302} -08/30/2021 23:29:35 - INFO - __main__ - Step 57170: {'lr': 0.0003472913075944182, 'samples': 10976640, 'steps': 57169, 'loss/train': 1.0622985363006592} -08/30/2021 23:29:36 - INFO - __main__ - Step 57171: {'lr': 0.00034728641916959767, 'samples': 10976832, 'steps': 57170, 'loss/train': 1.5070276260375977} -08/30/2021 23:29:36 - INFO - __main__ - Step 57172: {'lr': 0.00034728153070094143, 'samples': 10977024, 'steps': 57171, 'loss/train': 0.49868151545524597} -08/30/2021 23:29:36 - INFO - __main__ - Step 57173: {'lr': 0.0003472766421884516, 'samples': 10977216, 'steps': 57172, 'loss/train': 1.0507540702819824} -08/30/2021 23:29:37 - INFO - __main__ - Step 57174: {'lr': 0.00034727175363213046, 'samples': 10977408, 'steps': 57173, 'loss/train': 0.611548900604248} -08/30/2021 23:29:38 - INFO - __main__ - Step 57175: {'lr': 0.0003472668650319801, 'samples': 10977600, 'steps': 57174, 'loss/train': 1.2241181135177612} -08/30/2021 23:29:39 - INFO - __main__ - Step 57176: {'lr': 0.0003472619763880029, 'samples': 10977792, 'steps': 57175, 'loss/train': 0.6720014214515686} -08/30/2021 23:29:39 - INFO - __main__ - Step 57177: {'lr': 0.00034725708770020085, 'samples': 10977984, 'steps': 57176, 'loss/train': 1.5641393661499023} -08/30/2021 23:29:39 - INFO - __main__ - Step 57178: {'lr': 0.0003472521989685763, 'samples': 10978176, 'steps': 57177, 'loss/train': 1.117599606513977} -08/30/2021 23:29:40 - INFO - __main__ - Step 57179: {'lr': 0.00034724731019313145, 'samples': 10978368, 'steps': 57178, 'loss/train': 0.8109197020530701} -08/30/2021 23:29:41 - INFO - __main__ - Step 57180: {'lr': 0.0003472424213738684, 'samples': 10978560, 'steps': 57179, 'loss/train': 1.2628936767578125} -08/30/2021 23:29:42 - INFO - __main__ - Step 57181: {'lr': 0.0003472375325107894, 'samples': 10978752, 'steps': 57180, 'loss/train': 2.362213611602783} -08/30/2021 23:29:42 - INFO - __main__ - Step 57182: {'lr': 0.00034723264360389674, 'samples': 10978944, 'steps': 57181, 'loss/train': 1.6982719898223877} -08/30/2021 23:29:43 - INFO - __main__ - Step 57183: {'lr': 0.0003472277546531925, 'samples': 10979136, 'steps': 57182, 'loss/train': 1.5797861814498901} -08/30/2021 23:29:43 - INFO - __main__ - Step 57184: {'lr': 0.00034722286565867897, 'samples': 10979328, 'steps': 57183, 'loss/train': 0.6407620310783386} -08/30/2021 23:29:43 - INFO - __main__ - Step 57185: {'lr': 0.00034721797662035824, 'samples': 10979520, 'steps': 57184, 'loss/train': 1.0531861782073975} -08/30/2021 23:29:45 - INFO - __main__ - Step 57186: {'lr': 0.00034721308753823266, 'samples': 10979712, 'steps': 57185, 'loss/train': 1.7869772911071777} -08/30/2021 23:29:46 - INFO - __main__ - Step 57187: {'lr': 0.00034720819841230433, 'samples': 10979904, 'steps': 57186, 'loss/train': 1.6745402812957764} -08/30/2021 23:29:46 - INFO - __main__ - Step 57188: {'lr': 0.0003472033092425755, 'samples': 10980096, 'steps': 57187, 'loss/train': 0.025158895179629326} -08/30/2021 23:29:46 - INFO - __main__ - Step 57189: {'lr': 0.00034719842002904844, 'samples': 10980288, 'steps': 57188, 'loss/train': 2.543149709701538} -08/30/2021 23:29:47 - INFO - __main__ - Step 57190: {'lr': 0.00034719353077172516, 'samples': 10980480, 'steps': 57189, 'loss/train': 1.196667194366455} -08/30/2021 23:29:47 - INFO - __main__ - Step 57191: {'lr': 0.00034718864147060803, 'samples': 10980672, 'steps': 57190, 'loss/train': 1.6503345966339111} -08/30/2021 23:29:47 - INFO - __main__ - Step 57192: {'lr': 0.00034718375212569916, 'samples': 10980864, 'steps': 57191, 'loss/train': 1.6431115865707397} -08/30/2021 23:29:49 - INFO - __main__ - Step 57193: {'lr': 0.0003471788627370008, 'samples': 10981056, 'steps': 57192, 'loss/train': 1.0220423936843872} -08/30/2021 23:29:49 - INFO - __main__ - Step 57194: {'lr': 0.0003471739733045151, 'samples': 10981248, 'steps': 57193, 'loss/train': 1.6716105937957764} -08/30/2021 23:29:50 - INFO - __main__ - Step 57195: {'lr': 0.00034716908382824435, 'samples': 10981440, 'steps': 57194, 'loss/train': 0.39487341046333313} -08/30/2021 23:29:50 - INFO - __main__ - Step 57196: {'lr': 0.0003471641943081908, 'samples': 10981632, 'steps': 57195, 'loss/train': 1.2871283292770386} -08/30/2021 23:29:50 - INFO - __main__ - Step 57197: {'lr': 0.0003471593047443564, 'samples': 10981824, 'steps': 57196, 'loss/train': 0.6628235578536987} -08/30/2021 23:29:52 - INFO - __main__ - Step 57198: {'lr': 0.00034715441513674363, 'samples': 10982016, 'steps': 57197, 'loss/train': 1.3066422939300537} -08/30/2021 23:29:52 - INFO - __main__ - Step 57199: {'lr': 0.00034714952548535455, 'samples': 10982208, 'steps': 57198, 'loss/train': 2.057615041732788} -08/30/2021 23:29:53 - INFO - __main__ - Step 57200: {'lr': 0.0003471446357901914, 'samples': 10982400, 'steps': 57199, 'loss/train': 1.4142051935195923} -08/30/2021 23:29:53 - INFO - __main__ - Step 57201: {'lr': 0.0003471397460512563, 'samples': 10982592, 'steps': 57200, 'loss/train': 1.210719347000122} -08/30/2021 23:29:53 - INFO - __main__ - Step 57202: {'lr': 0.0003471348562685517, 'samples': 10982784, 'steps': 57201, 'loss/train': 0.9110336303710938} -08/30/2021 23:29:55 - INFO - __main__ - Step 57203: {'lr': 0.0003471299664420795, 'samples': 10982976, 'steps': 57202, 'loss/train': 0.9891413450241089} -08/30/2021 23:29:56 - INFO - __main__ - Step 57204: {'lr': 0.00034712507657184207, 'samples': 10983168, 'steps': 57203, 'loss/train': 1.6618365049362183} -08/30/2021 23:29:56 - INFO - __main__ - Step 57205: {'lr': 0.00034712018665784155, 'samples': 10983360, 'steps': 57204, 'loss/train': 0.1505172848701477} -08/30/2021 23:29:56 - INFO - __main__ - Step 57206: {'lr': 0.0003471152967000802, 'samples': 10983552, 'steps': 57205, 'loss/train': 1.5891050100326538} -08/30/2021 23:29:57 - INFO - __main__ - Step 57207: {'lr': 0.0003471104066985602, 'samples': 10983744, 'steps': 57206, 'loss/train': 1.4278366565704346} -08/30/2021 23:29:59 - INFO - __main__ - Step 57208: {'lr': 0.0003471055166532837, 'samples': 10983936, 'steps': 57207, 'loss/train': 1.1990008354187012} -08/30/2021 23:29:59 - INFO - __main__ - Step 57209: {'lr': 0.00034710062656425304, 'samples': 10984128, 'steps': 57208, 'loss/train': 1.2362653017044067} -08/30/2021 23:29:59 - INFO - __main__ - Step 57210: {'lr': 0.0003470957364314703, 'samples': 10984320, 'steps': 57209, 'loss/train': 1.130739688873291} -08/30/2021 23:30:00 - INFO - __main__ - Step 57211: {'lr': 0.0003470908462549377, 'samples': 10984512, 'steps': 57210, 'loss/train': 0.7444148063659668} -08/30/2021 23:30:00 - INFO - __main__ - Step 57212: {'lr': 0.00034708595603465743, 'samples': 10984704, 'steps': 57211, 'loss/train': 1.5857688188552856} -08/30/2021 23:30:02 - INFO - __main__ - Step 57213: {'lr': 0.0003470810657706318, 'samples': 10984896, 'steps': 57212, 'loss/train': 0.6763535141944885} -08/30/2021 23:30:03 - INFO - __main__ - Step 57214: {'lr': 0.0003470761754628629, 'samples': 10985088, 'steps': 57213, 'loss/train': 1.6995245218276978} -08/30/2021 23:30:03 - INFO - __main__ - Step 57215: {'lr': 0.000347071285111353, 'samples': 10985280, 'steps': 57214, 'loss/train': 1.137797236442566} -08/30/2021 23:30:03 - INFO - __main__ - Step 57216: {'lr': 0.00034706639471610424, 'samples': 10985472, 'steps': 57215, 'loss/train': 1.124526858329773} -08/30/2021 23:30:04 - INFO - __main__ - Step 57217: {'lr': 0.0003470615042771189, 'samples': 10985664, 'steps': 57216, 'loss/train': 0.02836763486266136} -08/30/2021 23:30:04 - INFO - __main__ - Step 57218: {'lr': 0.00034705661379439914, 'samples': 10985856, 'steps': 57217, 'loss/train': 0.025227637961506844} -08/30/2021 23:30:04 - INFO - __main__ - Step 57219: {'lr': 0.0003470517232679471, 'samples': 10986048, 'steps': 57218, 'loss/train': 1.5040104389190674} -08/30/2021 23:30:06 - INFO - __main__ - Step 57220: {'lr': 0.0003470468326977651, 'samples': 10986240, 'steps': 57219, 'loss/train': 0.09342114627361298} -08/30/2021 23:30:06 - INFO - __main__ - Step 57221: {'lr': 0.0003470419420838553, 'samples': 10986432, 'steps': 57220, 'loss/train': 1.388344645500183} -08/30/2021 23:30:07 - INFO - __main__ - Step 57222: {'lr': 0.0003470370514262199, 'samples': 10986624, 'steps': 57221, 'loss/train': 1.7109969854354858} -08/30/2021 23:30:07 - INFO - __main__ - Step 57223: {'lr': 0.0003470321607248611, 'samples': 10986816, 'steps': 57222, 'loss/train': 1.293199896812439} -08/30/2021 23:30:07 - INFO - __main__ - Step 57224: {'lr': 0.0003470272699797811, 'samples': 10987008, 'steps': 57223, 'loss/train': 1.299668788909912} -08/30/2021 23:30:09 - INFO - __main__ - Step 57225: {'lr': 0.0003470223791909821, 'samples': 10987200, 'steps': 57224, 'loss/train': 1.9548366069793701} -08/30/2021 23:30:09 - INFO - __main__ - Step 57226: {'lr': 0.0003470174883584664, 'samples': 10987392, 'steps': 57225, 'loss/train': 4.906742572784424} -08/30/2021 23:30:10 - INFO - __main__ - Step 57227: {'lr': 0.00034701259748223595, 'samples': 10987584, 'steps': 57226, 'loss/train': 1.3088277578353882} -08/30/2021 23:30:10 - INFO - __main__ - Step 57228: {'lr': 0.00034700770656229324, 'samples': 10987776, 'steps': 57227, 'loss/train': 1.0579522848129272} -08/30/2021 23:30:11 - INFO - __main__ - Step 57229: {'lr': 0.00034700281559864034, 'samples': 10987968, 'steps': 57228, 'loss/train': 1.9059362411499023} -08/30/2021 23:30:11 - INFO - __main__ - Step 57230: {'lr': 0.00034699792459127945, 'samples': 10988160, 'steps': 57229, 'loss/train': 1.5767570734024048} -08/30/2021 23:30:13 - INFO - __main__ - Step 57231: {'lr': 0.00034699303354021285, 'samples': 10988352, 'steps': 57230, 'loss/train': 0.7629421353340149} -08/30/2021 23:30:14 - INFO - __main__ - Step 57232: {'lr': 0.0003469881424454426, 'samples': 10988544, 'steps': 57231, 'loss/train': 1.4237111806869507} -08/30/2021 23:30:14 - INFO - __main__ - Step 57233: {'lr': 0.000346983251306971, 'samples': 10988736, 'steps': 57232, 'loss/train': 1.1473923921585083} -08/30/2021 23:30:14 - INFO - __main__ - Step 57234: {'lr': 0.0003469783601248002, 'samples': 10988928, 'steps': 57233, 'loss/train': 0.9404387474060059} -08/30/2021 23:30:15 - INFO - __main__ - Step 57235: {'lr': 0.0003469734688989326, 'samples': 10989120, 'steps': 57234, 'loss/train': 0.8312382698059082} -08/30/2021 23:30:16 - INFO - __main__ - Step 57236: {'lr': 0.0003469685776293702, 'samples': 10989312, 'steps': 57235, 'loss/train': 1.2217953205108643} -08/30/2021 23:30:17 - INFO - __main__ - Step 57237: {'lr': 0.0003469636863161152, 'samples': 10989504, 'steps': 57236, 'loss/train': 1.2138937711715698} -08/30/2021 23:30:17 - INFO - __main__ - Step 57238: {'lr': 0.0003469587949591698, 'samples': 10989696, 'steps': 57237, 'loss/train': 1.8392994403839111} -08/30/2021 23:30:17 - INFO - __main__ - Step 57239: {'lr': 0.0003469539035585364, 'samples': 10989888, 'steps': 57238, 'loss/train': 0.6179540753364563} -08/30/2021 23:30:18 - INFO - __main__ - Step 57240: {'lr': 0.00034694901211421695, 'samples': 10990080, 'steps': 57239, 'loss/train': 1.163027048110962} -08/30/2021 23:30:19 - INFO - __main__ - Step 57241: {'lr': 0.00034694412062621384, 'samples': 10990272, 'steps': 57240, 'loss/train': 1.2579842805862427} -08/30/2021 23:30:20 - INFO - __main__ - Step 57242: {'lr': 0.0003469392290945292, 'samples': 10990464, 'steps': 57241, 'loss/train': 1.4809110164642334} -08/30/2021 23:30:20 - INFO - __main__ - Step 57243: {'lr': 0.00034693433751916525, 'samples': 10990656, 'steps': 57242, 'loss/train': 1.5301992893218994} -08/30/2021 23:30:20 - INFO - __main__ - Step 57244: {'lr': 0.0003469294459001242, 'samples': 10990848, 'steps': 57243, 'loss/train': 0.4008890986442566} -08/30/2021 23:30:21 - INFO - __main__ - Step 57245: {'lr': 0.0003469245542374082, 'samples': 10991040, 'steps': 57244, 'loss/train': 0.9658870697021484} -08/30/2021 23:30:22 - INFO - __main__ - Step 57246: {'lr': 0.00034691966253101947, 'samples': 10991232, 'steps': 57245, 'loss/train': 1.5814244747161865} -08/30/2021 23:30:23 - INFO - __main__ - Step 57247: {'lr': 0.00034691477078096025, 'samples': 10991424, 'steps': 57246, 'loss/train': 0.972419023513794} -08/30/2021 23:30:23 - INFO - __main__ - Step 57248: {'lr': 0.0003469098789872327, 'samples': 10991616, 'steps': 57247, 'loss/train': 1.6710761785507202} -08/30/2021 23:30:23 - INFO - __main__ - Step 57249: {'lr': 0.0003469049871498392, 'samples': 10991808, 'steps': 57248, 'loss/train': 0.604178786277771} -08/30/2021 23:30:24 - INFO - __main__ - Step 57250: {'lr': 0.0003469000952687817, 'samples': 10992000, 'steps': 57249, 'loss/train': 1.6566071510314941} -08/30/2021 23:30:24 - INFO - __main__ - Step 57251: {'lr': 0.0003468952033440625, 'samples': 10992192, 'steps': 57250, 'loss/train': 0.11098971962928772} -08/30/2021 23:30:26 - INFO - __main__ - Step 57252: {'lr': 0.00034689031137568384, 'samples': 10992384, 'steps': 57251, 'loss/train': 1.3981941938400269} -08/30/2021 23:30:26 - INFO - __main__ - Step 57253: {'lr': 0.0003468854193636479, 'samples': 10992576, 'steps': 57252, 'loss/train': 1.324788212776184} -08/30/2021 23:30:26 - INFO - __main__ - Step 57254: {'lr': 0.00034688052730795683, 'samples': 10992768, 'steps': 57253, 'loss/train': 1.0446434020996094} -08/30/2021 23:30:27 - INFO - __main__ - Step 57255: {'lr': 0.00034687563520861294, 'samples': 10992960, 'steps': 57254, 'loss/train': 1.1589691638946533} -08/30/2021 23:30:27 - INFO - __main__ - Step 57256: {'lr': 0.0003468707430656184, 'samples': 10993152, 'steps': 57255, 'loss/train': 1.2001605033874512} -08/30/2021 23:30:29 - INFO - __main__ - Step 57257: {'lr': 0.00034686585087897537, 'samples': 10993344, 'steps': 57256, 'loss/train': 1.5355124473571777} -08/30/2021 23:30:29 - INFO - __main__ - Step 57258: {'lr': 0.0003468609586486861, 'samples': 10993536, 'steps': 57257, 'loss/train': 1.371069073677063} -08/30/2021 23:30:29 - INFO - __main__ - Step 57259: {'lr': 0.00034685606637475274, 'samples': 10993728, 'steps': 57258, 'loss/train': 1.434818148612976} -08/30/2021 23:30:30 - INFO - __main__ - Step 57260: {'lr': 0.0003468511740571776, 'samples': 10993920, 'steps': 57259, 'loss/train': 0.7995344400405884} -08/30/2021 23:30:30 - INFO - __main__ - Step 57261: {'lr': 0.00034684628169596277, 'samples': 10994112, 'steps': 57260, 'loss/train': 1.8994543552398682} -08/30/2021 23:30:32 - INFO - __main__ - Step 57262: {'lr': 0.0003468413892911105, 'samples': 10994304, 'steps': 57261, 'loss/train': 2.1002390384674072} -08/30/2021 23:30:32 - INFO - __main__ - Step 57263: {'lr': 0.00034683649684262303, 'samples': 10994496, 'steps': 57262, 'loss/train': 1.83897066116333} -08/30/2021 23:30:32 - INFO - __main__ - Step 57264: {'lr': 0.0003468316043505025, 'samples': 10994688, 'steps': 57263, 'loss/train': 1.3655487298965454} -08/30/2021 23:30:33 - INFO - __main__ - Step 57265: {'lr': 0.00034682671181475113, 'samples': 10994880, 'steps': 57264, 'loss/train': 0.42163142561912537} -08/30/2021 23:30:33 - INFO - __main__ - Step 57266: {'lr': 0.00034682181923537114, 'samples': 10995072, 'steps': 57265, 'loss/train': 1.3709806203842163} -08/30/2021 23:30:35 - INFO - __main__ - Step 57267: {'lr': 0.0003468169266123647, 'samples': 10995264, 'steps': 57266, 'loss/train': 1.3205724954605103} -08/30/2021 23:30:35 - INFO - __main__ - Step 57268: {'lr': 0.0003468120339457341, 'samples': 10995456, 'steps': 57267, 'loss/train': 1.3158334493637085} -08/30/2021 23:30:35 - INFO - __main__ - Step 57269: {'lr': 0.00034680714123548146, 'samples': 10995648, 'steps': 57268, 'loss/train': 0.8541487455368042} -08/30/2021 23:30:36 - INFO - __main__ - Step 57270: {'lr': 0.0003468022484816091, 'samples': 10995840, 'steps': 57269, 'loss/train': 0.060717690736055374} -08/30/2021 23:30:36 - INFO - __main__ - Step 57271: {'lr': 0.0003467973556841191, 'samples': 10996032, 'steps': 57270, 'loss/train': 1.8877067565917969} -08/30/2021 23:30:38 - INFO - __main__ - Step 57272: {'lr': 0.00034679246284301365, 'samples': 10996224, 'steps': 57271, 'loss/train': 0.3249967396259308} -08/30/2021 23:30:38 - INFO - __main__ - Step 57273: {'lr': 0.000346787569958295, 'samples': 10996416, 'steps': 57272, 'loss/train': 1.5828485488891602} -08/30/2021 23:30:38 - INFO - __main__ - Step 57274: {'lr': 0.0003467826770299654, 'samples': 10996608, 'steps': 57273, 'loss/train': 1.472226619720459} -08/30/2021 23:30:39 - INFO - __main__ - Step 57275: {'lr': 0.000346777784058027, 'samples': 10996800, 'steps': 57274, 'loss/train': 1.2954763174057007} -08/30/2021 23:30:39 - INFO - __main__ - Step 57276: {'lr': 0.0003467728910424821, 'samples': 10996992, 'steps': 57275, 'loss/train': 1.5763912200927734} -08/30/2021 23:30:40 - INFO - __main__ - Step 57277: {'lr': 0.0003467679979833328, 'samples': 10997184, 'steps': 57276, 'loss/train': 1.3015037775039673} -08/30/2021 23:30:41 - INFO - __main__ - Step 57278: {'lr': 0.00034676310488058126, 'samples': 10997376, 'steps': 57277, 'loss/train': 1.4174572229385376} -08/30/2021 23:30:41 - INFO - __main__ - Step 57279: {'lr': 0.00034675821173422983, 'samples': 10997568, 'steps': 57278, 'loss/train': 0.16137470304965973} -08/30/2021 23:30:42 - INFO - __main__ - Step 57280: {'lr': 0.0003467533185442806, 'samples': 10997760, 'steps': 57279, 'loss/train': 1.961804747581482} -08/30/2021 23:30:42 - INFO - __main__ - Step 57281: {'lr': 0.00034674842531073587, 'samples': 10997952, 'steps': 57280, 'loss/train': 1.2561326026916504} -08/30/2021 23:30:44 - INFO - __main__ - Step 57282: {'lr': 0.0003467435320335978, 'samples': 10998144, 'steps': 57281, 'loss/train': 1.0557690858840942} -08/30/2021 23:30:44 - INFO - __main__ - Step 57283: {'lr': 0.00034673863871286854, 'samples': 10998336, 'steps': 57282, 'loss/train': 0.20197616517543793} -08/30/2021 23:30:45 - INFO - __main__ - Step 57284: {'lr': 0.00034673374534855035, 'samples': 10998528, 'steps': 57283, 'loss/train': 0.9004855155944824} -08/30/2021 23:30:45 - INFO - __main__ - Step 57285: {'lr': 0.0003467288519406454, 'samples': 10998720, 'steps': 57284, 'loss/train': 1.4420886039733887} -08/30/2021 23:30:46 - INFO - __main__ - Step 57286: {'lr': 0.00034672395848915594, 'samples': 10998912, 'steps': 57285, 'loss/train': 0.196761816740036} -08/30/2021 23:30:46 - INFO - __main__ - Step 57287: {'lr': 0.00034671906499408417, 'samples': 10999104, 'steps': 57286, 'loss/train': 1.5899916887283325} -08/30/2021 23:30:47 - INFO - __main__ - Step 57288: {'lr': 0.0003467141714554323, 'samples': 10999296, 'steps': 57287, 'loss/train': 0.96351557970047} -08/30/2021 23:30:48 - INFO - __main__ - Step 57289: {'lr': 0.0003467092778732025, 'samples': 10999488, 'steps': 57288, 'loss/train': 1.1077650785446167} -08/30/2021 23:30:48 - INFO - __main__ - Step 57290: {'lr': 0.00034670438424739695, 'samples': 10999680, 'steps': 57289, 'loss/train': 1.1022433042526245} -08/30/2021 23:30:49 - INFO - __main__ - Step 57291: {'lr': 0.000346699490578018, 'samples': 10999872, 'steps': 57290, 'loss/train': 1.5361850261688232} -08/30/2021 23:30:49 - INFO - __main__ - Step 57292: {'lr': 0.00034669459686506766, 'samples': 11000064, 'steps': 57291, 'loss/train': 0.9836366176605225} -08/30/2021 23:30:50 - INFO - __main__ - Step 57293: {'lr': 0.0003466897031085482, 'samples': 11000256, 'steps': 57292, 'loss/train': 0.29051727056503296} -08/30/2021 23:30:51 - INFO - __main__ - Step 57294: {'lr': 0.000346684809308462, 'samples': 11000448, 'steps': 57293, 'loss/train': 1.387253999710083} -08/30/2021 23:30:51 - INFO - __main__ - Step 57295: {'lr': 0.00034667991546481096, 'samples': 11000640, 'steps': 57294, 'loss/train': 0.2907862067222595} -08/30/2021 23:30:52 - INFO - __main__ - Step 57296: {'lr': 0.0003466750215775975, 'samples': 11000832, 'steps': 57295, 'loss/train': 1.8339520692825317} -08/30/2021 23:30:52 - INFO - __main__ - Step 57297: {'lr': 0.0003466701276468238, 'samples': 11001024, 'steps': 57296, 'loss/train': 1.5265629291534424} -08/30/2021 23:30:53 - INFO - __main__ - Step 57298: {'lr': 0.00034666523367249196, 'samples': 11001216, 'steps': 57297, 'loss/train': 1.4608943462371826} -08/30/2021 23:30:54 - INFO - __main__ - Step 57299: {'lr': 0.0003466603396546043, 'samples': 11001408, 'steps': 57298, 'loss/train': 1.4062610864639282} -08/30/2021 23:30:54 - INFO - __main__ - Step 57300: {'lr': 0.00034665544559316303, 'samples': 11001600, 'steps': 57299, 'loss/train': 1.1037054061889648} -08/30/2021 23:30:55 - INFO - __main__ - Step 57301: {'lr': 0.0003466505514881703, 'samples': 11001792, 'steps': 57300, 'loss/train': 1.4081497192382812} -08/30/2021 23:30:55 - INFO - __main__ - Step 57302: {'lr': 0.00034664565733962823, 'samples': 11001984, 'steps': 57301, 'loss/train': 1.5334961414337158} -08/30/2021 23:30:56 - INFO - __main__ - Step 57303: {'lr': 0.0003466407631475392, 'samples': 11002176, 'steps': 57302, 'loss/train': 1.279776692390442} -08/30/2021 23:30:57 - INFO - __main__ - Step 57304: {'lr': 0.00034663586891190524, 'samples': 11002368, 'steps': 57303, 'loss/train': 1.3260341882705688} -08/30/2021 23:30:57 - INFO - __main__ - Step 57305: {'lr': 0.0003466309746327288, 'samples': 11002560, 'steps': 57304, 'loss/train': 1.4453420639038086} -08/30/2021 23:30:58 - INFO - __main__ - Step 57306: {'lr': 0.0003466260803100118, 'samples': 11002752, 'steps': 57305, 'loss/train': 1.8678979873657227} -08/30/2021 23:30:58 - INFO - __main__ - Step 57307: {'lr': 0.0003466211859437566, 'samples': 11002944, 'steps': 57306, 'loss/train': 1.5966711044311523} -08/30/2021 23:30:59 - INFO - __main__ - Step 57308: {'lr': 0.00034661629153396543, 'samples': 11003136, 'steps': 57307, 'loss/train': 0.9747397303581238} -08/30/2021 23:31:00 - INFO - __main__ - Step 57309: {'lr': 0.00034661139708064043, 'samples': 11003328, 'steps': 57308, 'loss/train': 1.411629557609558} -08/30/2021 23:31:00 - INFO - __main__ - Step 57310: {'lr': 0.00034660650258378384, 'samples': 11003520, 'steps': 57309, 'loss/train': 1.2113087177276611} -08/30/2021 23:31:00 - INFO - __main__ - Step 57311: {'lr': 0.00034660160804339784, 'samples': 11003712, 'steps': 57310, 'loss/train': 0.812248945236206} -08/30/2021 23:31:01 - INFO - __main__ - Step 57312: {'lr': 0.0003465967134594847, 'samples': 11003904, 'steps': 57311, 'loss/train': 1.4831023216247559} -08/30/2021 23:31:02 - INFO - __main__ - Step 57313: {'lr': 0.0003465918188320465, 'samples': 11004096, 'steps': 57312, 'loss/train': 1.0299956798553467} -08/30/2021 23:31:03 - INFO - __main__ - Step 57314: {'lr': 0.0003465869241610855, 'samples': 11004288, 'steps': 57313, 'loss/train': 1.2239888906478882} -08/30/2021 23:31:03 - INFO - __main__ - Step 57315: {'lr': 0.00034658202944660396, 'samples': 11004480, 'steps': 57314, 'loss/train': 0.9121844172477722} -08/30/2021 23:31:03 - INFO - __main__ - Step 57316: {'lr': 0.000346577134688604, 'samples': 11004672, 'steps': 57315, 'loss/train': 0.7463312149047852} -08/30/2021 23:31:04 - INFO - __main__ - Step 57317: {'lr': 0.00034657223988708796, 'samples': 11004864, 'steps': 57316, 'loss/train': 1.2851439714431763} -08/30/2021 23:31:05 - INFO - __main__ - Step 57318: {'lr': 0.0003465673450420579, 'samples': 11005056, 'steps': 57317, 'loss/train': 1.7752279043197632} -08/30/2021 23:31:06 - INFO - __main__ - Step 57319: {'lr': 0.0003465624501535161, 'samples': 11005248, 'steps': 57318, 'loss/train': 0.5596683025360107} -08/30/2021 23:31:06 - INFO - __main__ - Step 57320: {'lr': 0.0003465575552214648, 'samples': 11005440, 'steps': 57319, 'loss/train': 0.9630799293518066} -08/30/2021 23:31:06 - INFO - __main__ - Step 57321: {'lr': 0.00034655266024590604, 'samples': 11005632, 'steps': 57320, 'loss/train': 0.9939124584197998} -08/30/2021 23:31:07 - INFO - __main__ - Step 57322: {'lr': 0.0003465477652268422, 'samples': 11005824, 'steps': 57321, 'loss/train': 1.6171754598617554} -08/30/2021 23:31:07 - INFO - __main__ - Step 57323: {'lr': 0.0003465428701642755, 'samples': 11006016, 'steps': 57322, 'loss/train': 1.4679523706436157} -08/30/2021 23:31:09 - INFO - __main__ - Step 57324: {'lr': 0.00034653797505820795, 'samples': 11006208, 'steps': 57323, 'loss/train': 1.0676627159118652} -08/30/2021 23:31:09 - INFO - __main__ - Step 57325: {'lr': 0.000346533079908642, 'samples': 11006400, 'steps': 57324, 'loss/train': 1.207576036453247} -08/30/2021 23:31:09 - INFO - __main__ - Step 57326: {'lr': 0.0003465281847155796, 'samples': 11006592, 'steps': 57325, 'loss/train': 0.9534304141998291} -08/30/2021 23:31:10 - INFO - __main__ - Step 57327: {'lr': 0.00034652328947902317, 'samples': 11006784, 'steps': 57326, 'loss/train': 0.3770281672477722} -08/30/2021 23:31:10 - INFO - __main__ - Step 57328: {'lr': 0.0003465183941989748, 'samples': 11006976, 'steps': 57327, 'loss/train': 2.1630043983459473} -08/30/2021 23:31:12 - INFO - __main__ - Step 57329: {'lr': 0.00034651349887543674, 'samples': 11007168, 'steps': 57328, 'loss/train': 1.3944100141525269} -08/30/2021 23:31:13 - INFO - __main__ - Step 57330: {'lr': 0.00034650860350841125, 'samples': 11007360, 'steps': 57329, 'loss/train': 1.5637726783752441} -08/30/2021 23:31:13 - INFO - __main__ - Step 57331: {'lr': 0.0003465037080979004, 'samples': 11007552, 'steps': 57330, 'loss/train': 1.1711291074752808} -08/30/2021 23:31:13 - INFO - __main__ - Step 57332: {'lr': 0.0003464988126439065, 'samples': 11007744, 'steps': 57331, 'loss/train': 1.5800998210906982} -08/30/2021 23:31:14 - INFO - __main__ - Step 57333: {'lr': 0.0003464939171464317, 'samples': 11007936, 'steps': 57332, 'loss/train': 1.5062569379806519} -08/30/2021 23:31:15 - INFO - __main__ - Step 57334: {'lr': 0.0003464890216054782, 'samples': 11008128, 'steps': 57333, 'loss/train': 0.6435001492500305} -08/30/2021 23:31:16 - INFO - __main__ - Step 57335: {'lr': 0.0003464841260210483, 'samples': 11008320, 'steps': 57334, 'loss/train': 1.5605562925338745} -08/30/2021 23:31:16 - INFO - __main__ - Step 57336: {'lr': 0.0003464792303931441, 'samples': 11008512, 'steps': 57335, 'loss/train': 1.2090848684310913} -08/30/2021 23:31:16 - INFO - __main__ - Step 57337: {'lr': 0.0003464743347217679, 'samples': 11008704, 'steps': 57336, 'loss/train': 1.2363115549087524} -08/30/2021 23:31:17 - INFO - __main__ - Step 57338: {'lr': 0.00034646943900692187, 'samples': 11008896, 'steps': 57337, 'loss/train': 1.659374713897705} -08/30/2021 23:31:17 - INFO - __main__ - Step 57339: {'lr': 0.0003464645432486081, 'samples': 11009088, 'steps': 57338, 'loss/train': 1.7757110595703125} -08/30/2021 23:31:18 - INFO - __main__ - Step 57340: {'lr': 0.000346459647446829, 'samples': 11009280, 'steps': 57339, 'loss/train': 0.7484453320503235} -08/30/2021 23:31:19 - INFO - __main__ - Step 57341: {'lr': 0.0003464547516015866, 'samples': 11009472, 'steps': 57340, 'loss/train': 1.7045379877090454} -08/30/2021 23:31:19 - INFO - __main__ - Step 57342: {'lr': 0.0003464498557128832, 'samples': 11009664, 'steps': 57341, 'loss/train': 0.5957180261611938} -08/30/2021 23:31:20 - INFO - __main__ - Step 57343: {'lr': 0.00034644495978072094, 'samples': 11009856, 'steps': 57342, 'loss/train': 1.2689871788024902} -08/30/2021 23:31:20 - INFO - __main__ - Step 57344: {'lr': 0.00034644006380510215, 'samples': 11010048, 'steps': 57343, 'loss/train': 1.3786475658416748} -08/30/2021 23:31:22 - INFO - __main__ - Step 57345: {'lr': 0.0003464351677860289, 'samples': 11010240, 'steps': 57344, 'loss/train': 1.326842188835144} -08/30/2021 23:31:22 - INFO - __main__ - Step 57346: {'lr': 0.00034643027172350345, 'samples': 11010432, 'steps': 57345, 'loss/train': 0.49562159180641174} -08/30/2021 23:31:23 - INFO - __main__ - Step 57347: {'lr': 0.000346425375617528, 'samples': 11010624, 'steps': 57346, 'loss/train': 0.0715513676404953} -08/30/2021 23:31:23 - INFO - __main__ - Step 57348: {'lr': 0.00034642047946810477, 'samples': 11010816, 'steps': 57347, 'loss/train': 1.4194996356964111} -08/30/2021 23:31:23 - INFO - __main__ - Step 57349: {'lr': 0.000346415583275236, 'samples': 11011008, 'steps': 57348, 'loss/train': 2.7789392471313477} -08/30/2021 23:31:25 - INFO - __main__ - Step 57350: {'lr': 0.00034641068703892387, 'samples': 11011200, 'steps': 57349, 'loss/train': 1.1572437286376953} -08/30/2021 23:31:26 - INFO - __main__ - Step 57351: {'lr': 0.00034640579075917053, 'samples': 11011392, 'steps': 57350, 'loss/train': 1.1089028120040894} -08/30/2021 23:31:26 - INFO - __main__ - Step 57352: {'lr': 0.0003464008944359782, 'samples': 11011584, 'steps': 57351, 'loss/train': 1.3850922584533691} -08/30/2021 23:31:26 - INFO - __main__ - Step 57353: {'lr': 0.00034639599806934917, 'samples': 11011776, 'steps': 57352, 'loss/train': 0.5813507437705994} -08/30/2021 23:31:27 - INFO - __main__ - Step 57354: {'lr': 0.0003463911016592856, 'samples': 11011968, 'steps': 57353, 'loss/train': 1.7996010780334473} -08/30/2021 23:31:27 - INFO - __main__ - Step 57355: {'lr': 0.0003463862052057896, 'samples': 11012160, 'steps': 57354, 'loss/train': 1.597270131111145} -08/30/2021 23:31:29 - INFO - __main__ - Step 57356: {'lr': 0.00034638130870886353, 'samples': 11012352, 'steps': 57355, 'loss/train': 1.2265816926956177} -08/30/2021 23:31:29 - INFO - __main__ - Step 57357: {'lr': 0.0003463764121685096, 'samples': 11012544, 'steps': 57356, 'loss/train': 2.6046159267425537} -08/30/2021 23:31:30 - INFO - __main__ - Step 57358: {'lr': 0.0003463715155847298, 'samples': 11012736, 'steps': 57357, 'loss/train': 1.6963657140731812} -08/30/2021 23:31:30 - INFO - __main__ - Step 57359: {'lr': 0.00034636661895752653, 'samples': 11012928, 'steps': 57358, 'loss/train': 1.3072112798690796} -08/30/2021 23:31:30 - INFO - __main__ - Step 57360: {'lr': 0.000346361722286902, 'samples': 11013120, 'steps': 57359, 'loss/train': 2.336559534072876} -08/30/2021 23:31:32 - INFO - __main__ - Step 57361: {'lr': 0.0003463568255728583, 'samples': 11013312, 'steps': 57360, 'loss/train': 1.2347654104232788} -08/30/2021 23:31:33 - INFO - __main__ - Step 57362: {'lr': 0.0003463519288153977, 'samples': 11013504, 'steps': 57361, 'loss/train': 1.929038643836975} -08/30/2021 23:31:33 - INFO - __main__ - Step 57363: {'lr': 0.00034634703201452243, 'samples': 11013696, 'steps': 57362, 'loss/train': 1.1651383638381958} -08/30/2021 23:31:33 - INFO - __main__ - Step 57364: {'lr': 0.00034634213517023473, 'samples': 11013888, 'steps': 57363, 'loss/train': 1.8477355241775513} -08/30/2021 23:31:34 - INFO - __main__ - Step 57365: {'lr': 0.0003463372382825367, 'samples': 11014080, 'steps': 57364, 'loss/train': 1.1793138980865479} -08/30/2021 23:31:34 - INFO - __main__ - Step 57366: {'lr': 0.0003463323413514306, 'samples': 11014272, 'steps': 57365, 'loss/train': 1.0213637351989746} -08/30/2021 23:31:35 - INFO - __main__ - Step 57367: {'lr': 0.0003463274443769186, 'samples': 11014464, 'steps': 57366, 'loss/train': 1.834344744682312} -08/30/2021 23:31:36 - INFO - __main__ - Step 57368: {'lr': 0.000346322547359003, 'samples': 11014656, 'steps': 57367, 'loss/train': 1.634212851524353} -08/30/2021 23:31:36 - INFO - __main__ - Step 57369: {'lr': 0.00034631765029768594, 'samples': 11014848, 'steps': 57368, 'loss/train': 1.4976794719696045} -08/30/2021 23:31:37 - INFO - __main__ - Step 57370: {'lr': 0.0003463127531929696, 'samples': 11015040, 'steps': 57369, 'loss/train': 1.355198621749878} -08/30/2021 23:31:37 - INFO - __main__ - Step 57371: {'lr': 0.0003463078560448562, 'samples': 11015232, 'steps': 57370, 'loss/train': 0.6016204953193665} -08/30/2021 23:31:39 - INFO - __main__ - Step 57372: {'lr': 0.000346302958853348, 'samples': 11015424, 'steps': 57371, 'loss/train': 1.2660144567489624} -08/30/2021 23:31:39 - INFO - __main__ - Step 57373: {'lr': 0.0003462980616184472, 'samples': 11015616, 'steps': 57372, 'loss/train': 1.4212183952331543} -08/30/2021 23:31:40 - INFO - __main__ - Step 57374: {'lr': 0.0003462931643401559, 'samples': 11015808, 'steps': 57373, 'loss/train': 0.12295351922512054} -08/30/2021 23:31:40 - INFO - __main__ - Step 57375: {'lr': 0.00034628826701847644, 'samples': 11016000, 'steps': 57374, 'loss/train': 0.24981556832790375} -08/30/2021 23:31:40 - INFO - __main__ - Step 57376: {'lr': 0.000346283369653411, 'samples': 11016192, 'steps': 57375, 'loss/train': 1.6498953104019165} -08/30/2021 23:31:41 - INFO - __main__ - Step 57377: {'lr': 0.0003462784722449617, 'samples': 11016384, 'steps': 57376, 'loss/train': 1.4843896627426147} -08/30/2021 23:31:42 - INFO - __main__ - Step 57378: {'lr': 0.00034627357479313087, 'samples': 11016576, 'steps': 57377, 'loss/train': 1.4692051410675049} -08/30/2021 23:31:43 - INFO - __main__ - Step 57379: {'lr': 0.0003462686772979206, 'samples': 11016768, 'steps': 57378, 'loss/train': 1.530622959136963} -08/30/2021 23:31:43 - INFO - __main__ - Step 57380: {'lr': 0.00034626377975933314, 'samples': 11016960, 'steps': 57379, 'loss/train': 1.1929035186767578} -08/30/2021 23:31:43 - INFO - __main__ - Step 57381: {'lr': 0.00034625888217737076, 'samples': 11017152, 'steps': 57380, 'loss/train': 1.2990503311157227} -08/30/2021 23:31:44 - INFO - __main__ - Step 57382: {'lr': 0.0003462539845520356, 'samples': 11017344, 'steps': 57381, 'loss/train': 1.8029626607894897} -08/30/2021 23:31:45 - INFO - __main__ - Step 57383: {'lr': 0.0003462490868833298, 'samples': 11017536, 'steps': 57382, 'loss/train': 1.5081582069396973} -08/30/2021 23:31:46 - INFO - __main__ - Step 57384: {'lr': 0.00034624418917125575, 'samples': 11017728, 'steps': 57383, 'loss/train': 0.750413715839386} -08/30/2021 23:31:46 - INFO - __main__ - Step 57385: {'lr': 0.00034623929141581555, 'samples': 11017920, 'steps': 57384, 'loss/train': 1.3719102144241333} -08/30/2021 23:31:46 - INFO - __main__ - Step 57386: {'lr': 0.0003462343936170114, 'samples': 11018112, 'steps': 57385, 'loss/train': 0.7519006133079529} -08/30/2021 23:31:47 - INFO - __main__ - Step 57387: {'lr': 0.0003462294957748455, 'samples': 11018304, 'steps': 57386, 'loss/train': 1.6113674640655518} -08/30/2021 23:31:49 - INFO - __main__ - Step 57388: {'lr': 0.00034622459788932004, 'samples': 11018496, 'steps': 57387, 'loss/train': 1.7479612827301025} -08/30/2021 23:31:50 - INFO - __main__ - Step 57389: {'lr': 0.00034621969996043725, 'samples': 11018688, 'steps': 57388, 'loss/train': 1.1651045083999634} -08/30/2021 23:31:50 - INFO - __main__ - Step 57390: {'lr': 0.0003462148019881994, 'samples': 11018880, 'steps': 57389, 'loss/train': 1.542141318321228} -08/30/2021 23:31:50 - INFO - __main__ - Step 57391: {'lr': 0.0003462099039726087, 'samples': 11019072, 'steps': 57390, 'loss/train': 1.809544563293457} -08/30/2021 23:31:51 - INFO - __main__ - Step 57392: {'lr': 0.0003462050059136672, 'samples': 11019264, 'steps': 57391, 'loss/train': 0.29521748423576355} -08/30/2021 23:31:51 - INFO - __main__ - Step 57393: {'lr': 0.00034620010781137724, 'samples': 11019456, 'steps': 57392, 'loss/train': 0.07345857471227646} -08/30/2021 23:31:52 - INFO - __main__ - Step 57394: {'lr': 0.000346195209665741, 'samples': 11019648, 'steps': 57393, 'loss/train': 0.1919942945241928} -08/30/2021 23:31:53 - INFO - __main__ - Step 57395: {'lr': 0.0003461903114767607, 'samples': 11019840, 'steps': 57394, 'loss/train': 1.1142783164978027} -08/30/2021 23:31:53 - INFO - __main__ - Step 57396: {'lr': 0.00034618541324443844, 'samples': 11020032, 'steps': 57395, 'loss/train': 1.2094385623931885} -08/30/2021 23:31:54 - INFO - __main__ - Step 57397: {'lr': 0.0003461805149687767, 'samples': 11020224, 'steps': 57396, 'loss/train': 1.3354653120040894} -08/30/2021 23:31:54 - INFO - __main__ - Step 57398: {'lr': 0.0003461756166497773, 'samples': 11020416, 'steps': 57397, 'loss/train': 1.1025032997131348} -08/30/2021 23:31:55 - INFO - __main__ - Step 57399: {'lr': 0.00034617071828744274, 'samples': 11020608, 'steps': 57398, 'loss/train': 1.3498547077178955} -08/30/2021 23:31:56 - INFO - __main__ - Step 57400: {'lr': 0.00034616581988177516, 'samples': 11020800, 'steps': 57399, 'loss/train': 1.1205404996871948} -08/30/2021 23:31:56 - INFO - __main__ - Step 57401: {'lr': 0.00034616092143277674, 'samples': 11020992, 'steps': 57400, 'loss/train': 1.4811197519302368} -08/30/2021 23:31:57 - INFO - __main__ - Step 57402: {'lr': 0.0003461560229404497, 'samples': 11021184, 'steps': 57401, 'loss/train': 1.1703927516937256} -08/30/2021 23:31:57 - INFO - __main__ - Step 57403: {'lr': 0.0003461511244047962, 'samples': 11021376, 'steps': 57402, 'loss/train': 1.2746347188949585} -08/30/2021 23:31:58 - INFO - __main__ - Step 57404: {'lr': 0.0003461462258258185, 'samples': 11021568, 'steps': 57403, 'loss/train': 1.725419044494629} -08/30/2021 23:31:59 - INFO - __main__ - Step 57405: {'lr': 0.00034614132720351884, 'samples': 11021760, 'steps': 57404, 'loss/train': 1.8319494724273682} -08/30/2021 23:31:59 - INFO - __main__ - Step 57406: {'lr': 0.00034613642853789927, 'samples': 11021952, 'steps': 57405, 'loss/train': 1.7207472324371338} -08/30/2021 23:32:00 - INFO - __main__ - Step 57407: {'lr': 0.00034613152982896224, 'samples': 11022144, 'steps': 57406, 'loss/train': 1.7767510414123535} -08/30/2021 23:32:00 - INFO - __main__ - Step 57408: {'lr': 0.0003461266310767097, 'samples': 11022336, 'steps': 57407, 'loss/train': 1.6346405744552612} -08/30/2021 23:32:01 - INFO - __main__ - Step 57409: {'lr': 0.00034612173228114405, 'samples': 11022528, 'steps': 57408, 'loss/train': 1.8527367115020752} -08/30/2021 23:32:02 - INFO - __main__ - Step 57410: {'lr': 0.00034611683344226745, 'samples': 11022720, 'steps': 57409, 'loss/train': 1.2960453033447266} -08/30/2021 23:32:02 - INFO - __main__ - Step 57411: {'lr': 0.0003461119345600821, 'samples': 11022912, 'steps': 57410, 'loss/train': 1.781599998474121} -08/30/2021 23:32:03 - INFO - __main__ - Step 57412: {'lr': 0.0003461070356345902, 'samples': 11023104, 'steps': 57411, 'loss/train': 1.507386565208435} -08/30/2021 23:32:03 - INFO - __main__ - Step 57413: {'lr': 0.0003461021366657939, 'samples': 11023296, 'steps': 57412, 'loss/train': 1.5147545337677002} -08/30/2021 23:32:05 - INFO - __main__ - Step 57414: {'lr': 0.00034609723765369546, 'samples': 11023488, 'steps': 57413, 'loss/train': 0.9106054902076721} -08/30/2021 23:32:05 - INFO - __main__ - Step 57415: {'lr': 0.00034609233859829707, 'samples': 11023680, 'steps': 57414, 'loss/train': 1.2979462146759033} -08/30/2021 23:32:06 - INFO - __main__ - Step 57416: {'lr': 0.00034608743949960096, 'samples': 11023872, 'steps': 57415, 'loss/train': 1.0761560201644897} -08/30/2021 23:32:06 - INFO - __main__ - Step 57417: {'lr': 0.00034608254035760946, 'samples': 11024064, 'steps': 57416, 'loss/train': 1.3184657096862793} -08/30/2021 23:32:06 - INFO - __main__ - Step 57418: {'lr': 0.0003460776411723245, 'samples': 11024256, 'steps': 57417, 'loss/train': 0.8684802651405334} -08/30/2021 23:32:07 - INFO - __main__ - Step 57419: {'lr': 0.00034607274194374847, 'samples': 11024448, 'steps': 57418, 'loss/train': 1.115295171737671} -08/30/2021 23:32:07 - INFO - __main__ - Step 57420: {'lr': 0.00034606784267188364, 'samples': 11024640, 'steps': 57419, 'loss/train': 0.036703579127788544} -08/30/2021 23:32:09 - INFO - __main__ - Step 57421: {'lr': 0.000346062943356732, 'samples': 11024832, 'steps': 57420, 'loss/train': 0.02843855880200863} -08/30/2021 23:32:09 - INFO - __main__ - Step 57422: {'lr': 0.00034605804399829595, 'samples': 11025024, 'steps': 57421, 'loss/train': 0.05390862002968788} -08/30/2021 23:32:10 - INFO - __main__ - Step 57423: {'lr': 0.00034605314459657763, 'samples': 11025216, 'steps': 57422, 'loss/train': 0.08192064613103867} -08/30/2021 23:32:10 - INFO - __main__ - Step 57424: {'lr': 0.00034604824515157916, 'samples': 11025408, 'steps': 57423, 'loss/train': 1.0345810651779175} -08/30/2021 23:32:10 - INFO - __main__ - Step 57425: {'lr': 0.0003460433456633029, 'samples': 11025600, 'steps': 57424, 'loss/train': 1.5606253147125244} -08/30/2021 23:32:11 - INFO - __main__ - Step 57426: {'lr': 0.000346038446131751, 'samples': 11025792, 'steps': 57425, 'loss/train': 0.9615251421928406} -08/30/2021 23:32:12 - INFO - __main__ - Step 57427: {'lr': 0.0003460335465569256, 'samples': 11025984, 'steps': 57426, 'loss/train': 1.2716492414474487} -08/30/2021 23:32:13 - INFO - __main__ - Step 57428: {'lr': 0.0003460286469388291, 'samples': 11026176, 'steps': 57427, 'loss/train': 1.3033071756362915} -08/30/2021 23:32:13 - INFO - __main__ - Step 57429: {'lr': 0.0003460237472774634, 'samples': 11026368, 'steps': 57428, 'loss/train': 0.9254215359687805} -08/30/2021 23:32:14 - INFO - __main__ - Step 57430: {'lr': 0.000346018847572831, 'samples': 11026560, 'steps': 57429, 'loss/train': 1.2488702535629272} -08/30/2021 23:32:14 - INFO - __main__ - Step 57431: {'lr': 0.00034601394782493393, 'samples': 11026752, 'steps': 57430, 'loss/train': 1.6453608274459839} -08/30/2021 23:32:16 - INFO - __main__ - Step 57432: {'lr': 0.00034600904803377454, 'samples': 11026944, 'steps': 57431, 'loss/train': 1.4031685590744019} -08/30/2021 23:32:16 - INFO - __main__ - Step 57433: {'lr': 0.0003460041481993549, 'samples': 11027136, 'steps': 57432, 'loss/train': 0.7683749794960022} -08/30/2021 23:32:17 - INFO - __main__ - Step 57434: {'lr': 0.0003459992483216773, 'samples': 11027328, 'steps': 57433, 'loss/train': 0.18001098930835724} -08/30/2021 23:32:17 - INFO - __main__ - Step 57435: {'lr': 0.0003459943484007438, 'samples': 11027520, 'steps': 57434, 'loss/train': 1.100398302078247} -08/30/2021 23:32:17 - INFO - __main__ - Step 57436: {'lr': 0.0003459894484365568, 'samples': 11027712, 'steps': 57435, 'loss/train': 0.6147298812866211} -08/30/2021 23:32:18 - INFO - __main__ - Step 57437: {'lr': 0.0003459845484291185, 'samples': 11027904, 'steps': 57436, 'loss/train': 1.4119763374328613} -08/30/2021 23:32:19 - INFO - __main__ - Step 57438: {'lr': 0.00034597964837843097, 'samples': 11028096, 'steps': 57437, 'loss/train': 0.039573926478624344} -08/30/2021 23:32:20 - INFO - __main__ - Step 57439: {'lr': 0.00034597474828449646, 'samples': 11028288, 'steps': 57438, 'loss/train': 1.083383321762085} -08/30/2021 23:32:20 - INFO - __main__ - Step 57440: {'lr': 0.00034596984814731736, 'samples': 11028480, 'steps': 57439, 'loss/train': 1.9350773096084595} -08/30/2021 23:32:20 - INFO - __main__ - Step 57441: {'lr': 0.0003459649479668956, 'samples': 11028672, 'steps': 57440, 'loss/train': 0.753420889377594} -08/30/2021 23:32:21 - INFO - __main__ - Step 57442: {'lr': 0.00034596004774323355, 'samples': 11028864, 'steps': 57441, 'loss/train': 1.6271330118179321} -08/30/2021 23:32:21 - INFO - __main__ - Step 57443: {'lr': 0.0003459551474763334, 'samples': 11029056, 'steps': 57442, 'loss/train': 1.282515048980713} -08/30/2021 23:32:24 - INFO - __main__ - Step 57444: {'lr': 0.00034595024716619726, 'samples': 11029248, 'steps': 57443, 'loss/train': 1.2012004852294922} -08/30/2021 23:32:24 - INFO - __main__ - Step 57445: {'lr': 0.0003459453468128276, 'samples': 11029440, 'steps': 57444, 'loss/train': 1.1732220649719238} -08/30/2021 23:32:24 - INFO - __main__ - Step 57446: {'lr': 0.0003459404464162263, 'samples': 11029632, 'steps': 57445, 'loss/train': 1.3930153846740723} -08/30/2021 23:32:25 - INFO - __main__ - Step 57447: {'lr': 0.0003459355459763957, 'samples': 11029824, 'steps': 57446, 'loss/train': 1.8122808933258057} -08/30/2021 23:32:25 - INFO - __main__ - Step 57448: {'lr': 0.0003459306454933381, 'samples': 11030016, 'steps': 57447, 'loss/train': 0.04777875915169716} -08/30/2021 23:32:25 - INFO - __main__ - Step 57449: {'lr': 0.0003459257449670555, 'samples': 11030208, 'steps': 57448, 'loss/train': 1.219847559928894} -08/30/2021 23:32:27 - INFO - __main__ - Step 57450: {'lr': 0.0003459208443975504, 'samples': 11030400, 'steps': 57449, 'loss/train': 1.7973581552505493} -08/30/2021 23:32:27 - INFO - __main__ - Step 57451: {'lr': 0.00034591594378482484, 'samples': 11030592, 'steps': 57450, 'loss/train': 1.3826237916946411} -08/30/2021 23:32:28 - INFO - __main__ - Step 57452: {'lr': 0.00034591104312888096, 'samples': 11030784, 'steps': 57451, 'loss/train': 1.0369007587432861} -08/30/2021 23:32:28 - INFO - __main__ - Step 57453: {'lr': 0.00034590614242972106, 'samples': 11030976, 'steps': 57452, 'loss/train': 1.347379207611084} -08/30/2021 23:32:28 - INFO - __main__ - Step 57454: {'lr': 0.00034590124168734735, 'samples': 11031168, 'steps': 57453, 'loss/train': 1.9416102170944214} -08/30/2021 23:32:30 - INFO - __main__ - Step 57455: {'lr': 0.00034589634090176195, 'samples': 11031360, 'steps': 57454, 'loss/train': 0.7941985130310059} -08/30/2021 23:32:30 - INFO - __main__ - Step 57456: {'lr': 0.0003458914400729672, 'samples': 11031552, 'steps': 57455, 'loss/train': 2.0067849159240723} -08/30/2021 23:32:31 - INFO - __main__ - Step 57457: {'lr': 0.00034588653920096524, 'samples': 11031744, 'steps': 57456, 'loss/train': 0.9747812151908875} -08/30/2021 23:32:31 - INFO - __main__ - Step 57458: {'lr': 0.00034588163828575837, 'samples': 11031936, 'steps': 57457, 'loss/train': 0.9822937250137329} -08/30/2021 23:32:31 - INFO - __main__ - Step 57459: {'lr': 0.0003458767373273486, 'samples': 11032128, 'steps': 57458, 'loss/train': 1.1482160091400146} -08/30/2021 23:32:32 - INFO - __main__ - Step 57460: {'lr': 0.00034587183632573825, 'samples': 11032320, 'steps': 57459, 'loss/train': 1.1093323230743408} -08/30/2021 23:32:33 - INFO - __main__ - Step 57461: {'lr': 0.00034586693528092954, 'samples': 11032512, 'steps': 57460, 'loss/train': 1.3924261331558228} -08/30/2021 23:32:34 - INFO - __main__ - Step 57462: {'lr': 0.0003458620341929247, 'samples': 11032704, 'steps': 57461, 'loss/train': 1.6451566219329834} -08/30/2021 23:32:34 - INFO - __main__ - Step 57463: {'lr': 0.0003458571330617259, 'samples': 11032896, 'steps': 57462, 'loss/train': 1.2803077697753906} -08/30/2021 23:32:34 - INFO - __main__ - Step 57464: {'lr': 0.00034585223188733535, 'samples': 11033088, 'steps': 57463, 'loss/train': 1.0794323682785034} -08/30/2021 23:32:35 - INFO - __main__ - Step 57465: {'lr': 0.0003458473306697553, 'samples': 11033280, 'steps': 57464, 'loss/train': 1.2126712799072266} -08/30/2021 23:32:36 - INFO - __main__ - Step 57466: {'lr': 0.0003458424294089879, 'samples': 11033472, 'steps': 57465, 'loss/train': 1.098444938659668} -08/30/2021 23:32:37 - INFO - __main__ - Step 57467: {'lr': 0.00034583752810503533, 'samples': 11033664, 'steps': 57466, 'loss/train': 1.3321839570999146} -08/30/2021 23:32:37 - INFO - __main__ - Step 57468: {'lr': 0.0003458326267578999, 'samples': 11033856, 'steps': 57467, 'loss/train': 0.8548885583877563} -08/30/2021 23:32:38 - INFO - __main__ - Step 57469: {'lr': 0.0003458277253675837, 'samples': 11034048, 'steps': 57468, 'loss/train': 1.1701687574386597} -08/30/2021 23:32:38 - INFO - __main__ - Step 57470: {'lr': 0.0003458228239340891, 'samples': 11034240, 'steps': 57469, 'loss/train': 1.7661478519439697} -08/30/2021 23:32:39 - INFO - __main__ - Step 57471: {'lr': 0.0003458179224574182, 'samples': 11034432, 'steps': 57470, 'loss/train': 1.9364041090011597} -08/30/2021 23:32:40 - INFO - __main__ - Step 57472: {'lr': 0.00034581302093757317, 'samples': 11034624, 'steps': 57471, 'loss/train': 0.749711811542511} -08/30/2021 23:32:40 - INFO - __main__ - Step 57473: {'lr': 0.0003458081193745563, 'samples': 11034816, 'steps': 57472, 'loss/train': 0.73874431848526} -08/30/2021 23:32:41 - INFO - __main__ - Step 57474: {'lr': 0.00034580321776836974, 'samples': 11035008, 'steps': 57473, 'loss/train': 1.2635341882705688} -08/30/2021 23:32:41 - INFO - __main__ - Step 57475: {'lr': 0.0003457983161190158, 'samples': 11035200, 'steps': 57474, 'loss/train': 1.393290400505066} -08/30/2021 23:32:43 - INFO - __main__ - Step 57476: {'lr': 0.00034579341442649654, 'samples': 11035392, 'steps': 57475, 'loss/train': 1.0002593994140625} -08/30/2021 23:32:43 - INFO - __main__ - Step 57477: {'lr': 0.00034578851269081426, 'samples': 11035584, 'steps': 57476, 'loss/train': 0.9912737607955933} -08/30/2021 23:32:44 - INFO - __main__ - Step 57478: {'lr': 0.0003457836109119712, 'samples': 11035776, 'steps': 57477, 'loss/train': 1.3044018745422363} -08/30/2021 23:32:44 - INFO - __main__ - Step 57479: {'lr': 0.0003457787090899695, 'samples': 11035968, 'steps': 57478, 'loss/train': 0.8418999910354614} -08/30/2021 23:32:44 - INFO - __main__ - Step 57480: {'lr': 0.00034577380722481137, 'samples': 11036160, 'steps': 57479, 'loss/train': 2.2630624771118164} -08/30/2021 23:32:45 - INFO - __main__ - Step 57481: {'lr': 0.00034576890531649905, 'samples': 11036352, 'steps': 57480, 'loss/train': 1.2399497032165527} -08/30/2021 23:32:46 - INFO - __main__ - Step 57482: {'lr': 0.0003457640033650348, 'samples': 11036544, 'steps': 57481, 'loss/train': 1.7686729431152344} -08/30/2021 23:32:47 - INFO - __main__ - Step 57483: {'lr': 0.00034575910137042064, 'samples': 11036736, 'steps': 57482, 'loss/train': 1.6249058246612549} -08/30/2021 23:32:47 - INFO - __main__ - Step 57484: {'lr': 0.000345754199332659, 'samples': 11036928, 'steps': 57483, 'loss/train': 1.4051047563552856} -08/30/2021 23:32:47 - INFO - __main__ - Step 57485: {'lr': 0.00034574929725175203, 'samples': 11037120, 'steps': 57484, 'loss/train': 1.0107982158660889} -08/30/2021 23:32:48 - INFO - __main__ - Step 57486: {'lr': 0.0003457443951277018, 'samples': 11037312, 'steps': 57485, 'loss/train': 1.4943259954452515} -08/30/2021 23:32:49 - INFO - __main__ - Step 57487: {'lr': 0.00034573949296051065, 'samples': 11037504, 'steps': 57486, 'loss/train': 1.3099762201309204} -08/30/2021 23:32:50 - INFO - __main__ - Step 57488: {'lr': 0.0003457345907501808, 'samples': 11037696, 'steps': 57487, 'loss/train': 2.354846239089966} -08/30/2021 23:32:50 - INFO - __main__ - Step 57489: {'lr': 0.0003457296884967144, 'samples': 11037888, 'steps': 57488, 'loss/train': 0.8203210234642029} -08/30/2021 23:32:50 - INFO - __main__ - Step 57490: {'lr': 0.0003457247862001137, 'samples': 11038080, 'steps': 57489, 'loss/train': 1.1483343839645386} -08/30/2021 23:32:51 - INFO - __main__ - Step 57491: {'lr': 0.0003457198838603809, 'samples': 11038272, 'steps': 57490, 'loss/train': 0.8238843083381653} -08/30/2021 23:32:51 - INFO - __main__ - Step 57492: {'lr': 0.0003457149814775182, 'samples': 11038464, 'steps': 57491, 'loss/train': 1.485921025276184} -08/30/2021 23:32:53 - INFO - __main__ - Step 57493: {'lr': 0.00034571007905152774, 'samples': 11038656, 'steps': 57492, 'loss/train': 0.8518865704536438} -08/30/2021 23:32:53 - INFO - __main__ - Step 57494: {'lr': 0.00034570517658241186, 'samples': 11038848, 'steps': 57493, 'loss/train': 1.4750962257385254} -08/30/2021 23:32:53 - INFO - __main__ - Step 57495: {'lr': 0.00034570027407017264, 'samples': 11039040, 'steps': 57494, 'loss/train': 1.601528286933899} -08/30/2021 23:32:54 - INFO - __main__ - Step 57496: {'lr': 0.0003456953715148124, 'samples': 11039232, 'steps': 57495, 'loss/train': 1.5654919147491455} -08/30/2021 23:32:54 - INFO - __main__ - Step 57497: {'lr': 0.0003456904689163333, 'samples': 11039424, 'steps': 57496, 'loss/train': 1.1852360963821411} -08/30/2021 23:32:56 - INFO - __main__ - Step 57498: {'lr': 0.0003456855662747376, 'samples': 11039616, 'steps': 57497, 'loss/train': 1.0496329069137573} -08/30/2021 23:32:56 - INFO - __main__ - Step 57499: {'lr': 0.0003456806635900274, 'samples': 11039808, 'steps': 57498, 'loss/train': 1.67026948928833} -08/30/2021 23:32:57 - INFO - __main__ - Step 57500: {'lr': 0.00034567576086220493, 'samples': 11040000, 'steps': 57499, 'loss/train': 1.298622727394104} -08/30/2021 23:32:57 - INFO - __main__ - Step 57501: {'lr': 0.0003456708580912725, 'samples': 11040192, 'steps': 57500, 'loss/train': 1.5156292915344238} -08/30/2021 23:32:57 - INFO - __main__ - Step 57502: {'lr': 0.0003456659552772322, 'samples': 11040384, 'steps': 57501, 'loss/train': 1.4259544610977173} -08/30/2021 23:32:59 - INFO - __main__ - Step 57503: {'lr': 0.0003456610524200863, 'samples': 11040576, 'steps': 57502, 'loss/train': 1.458237886428833} -08/30/2021 23:33:00 - INFO - __main__ - Step 57504: {'lr': 0.00034565614951983706, 'samples': 11040768, 'steps': 57503, 'loss/train': 0.942168653011322} -08/30/2021 23:33:00 - INFO - __main__ - Step 57505: {'lr': 0.00034565124657648665, 'samples': 11040960, 'steps': 57504, 'loss/train': 1.7458330392837524} -08/30/2021 23:33:00 - INFO - __main__ - Step 57506: {'lr': 0.0003456463435900372, 'samples': 11041152, 'steps': 57505, 'loss/train': 0.35200047492980957} -08/30/2021 23:33:01 - INFO - __main__ - Step 57507: {'lr': 0.0003456414405604911, 'samples': 11041344, 'steps': 57506, 'loss/train': 1.487480640411377} -08/30/2021 23:33:02 - INFO - __main__ - Step 57508: {'lr': 0.0003456365374878503, 'samples': 11041536, 'steps': 57507, 'loss/train': 1.1866015195846558} -08/30/2021 23:33:03 - INFO - __main__ - Step 57509: {'lr': 0.00034563163437211717, 'samples': 11041728, 'steps': 57508, 'loss/train': 1.4239046573638916} -08/30/2021 23:33:03 - INFO - __main__ - Step 57510: {'lr': 0.000345626731213294, 'samples': 11041920, 'steps': 57509, 'loss/train': 1.2445242404937744} -08/30/2021 23:33:03 - INFO - __main__ - Step 57511: {'lr': 0.00034562182801138277, 'samples': 11042112, 'steps': 57510, 'loss/train': 1.2954127788543701} -08/30/2021 23:33:04 - INFO - __main__ - Step 57512: {'lr': 0.00034561692476638595, 'samples': 11042304, 'steps': 57511, 'loss/train': 1.1406797170639038} -08/30/2021 23:33:05 - INFO - __main__ - Step 57513: {'lr': 0.00034561202147830554, 'samples': 11042496, 'steps': 57512, 'loss/train': 1.5891255140304565} -08/30/2021 23:33:06 - INFO - __main__ - Step 57514: {'lr': 0.00034560711814714387, 'samples': 11042688, 'steps': 57513, 'loss/train': 0.9233707785606384} -08/30/2021 23:33:06 - INFO - __main__ - Step 57515: {'lr': 0.0003456022147729031, 'samples': 11042880, 'steps': 57514, 'loss/train': 1.3124396800994873} -08/30/2021 23:33:06 - INFO - __main__ - Step 57516: {'lr': 0.00034559731135558536, 'samples': 11043072, 'steps': 57515, 'loss/train': 0.9970801472663879} -08/30/2021 23:33:07 - INFO - __main__ - Step 57517: {'lr': 0.000345592407895193, 'samples': 11043264, 'steps': 57516, 'loss/train': 1.049660563468933} -08/30/2021 23:33:08 - INFO - __main__ - Step 57518: {'lr': 0.00034558750439172826, 'samples': 11043456, 'steps': 57517, 'loss/train': 0.8449531197547913} -08/30/2021 23:33:09 - INFO - __main__ - Step 57519: {'lr': 0.0003455826008451932, 'samples': 11043648, 'steps': 57518, 'loss/train': 1.3629741668701172} -08/30/2021 23:33:09 - INFO - __main__ - Step 57520: {'lr': 0.00034557769725559014, 'samples': 11043840, 'steps': 57519, 'loss/train': 1.1600923538208008} -08/30/2021 23:33:09 - INFO - __main__ - Step 57521: {'lr': 0.00034557279362292117, 'samples': 11044032, 'steps': 57520, 'loss/train': 0.5266602635383606} -08/30/2021 23:33:10 - INFO - __main__ - Step 57522: {'lr': 0.00034556788994718855, 'samples': 11044224, 'steps': 57521, 'loss/train': 1.2160521745681763} -08/30/2021 23:33:10 - INFO - __main__ - Step 57523: {'lr': 0.00034556298622839463, 'samples': 11044416, 'steps': 57522, 'loss/train': 1.2337080240249634} -08/30/2021 23:33:12 - INFO - __main__ - Step 57524: {'lr': 0.0003455580824665414, 'samples': 11044608, 'steps': 57523, 'loss/train': 1.113364338874817} -08/30/2021 23:33:12 - INFO - __main__ - Step 57525: {'lr': 0.0003455531786616313, 'samples': 11044800, 'steps': 57524, 'loss/train': 1.587162733078003} -08/30/2021 23:33:12 - INFO - __main__ - Step 57526: {'lr': 0.0003455482748136663, 'samples': 11044992, 'steps': 57525, 'loss/train': 0.8753715753555298} -08/30/2021 23:33:13 - INFO - __main__ - Step 57527: {'lr': 0.00034554337092264874, 'samples': 11045184, 'steps': 57526, 'loss/train': 1.1568371057510376} -08/30/2021 23:33:13 - INFO - __main__ - Step 57528: {'lr': 0.00034553846698858083, 'samples': 11045376, 'steps': 57527, 'loss/train': 2.292367935180664} -08/30/2021 23:33:15 - INFO - __main__ - Step 57529: {'lr': 0.00034553356301146473, 'samples': 11045568, 'steps': 57528, 'loss/train': 1.4185253381729126} -08/30/2021 23:33:15 - INFO - __main__ - Step 57530: {'lr': 0.0003455286589913027, 'samples': 11045760, 'steps': 57529, 'loss/train': 1.5858784914016724} -08/30/2021 23:33:15 - INFO - __main__ - Step 57531: {'lr': 0.0003455237549280969, 'samples': 11045952, 'steps': 57530, 'loss/train': 0.8337659239768982} -08/30/2021 23:33:16 - INFO - __main__ - Step 57532: {'lr': 0.0003455188508218496, 'samples': 11046144, 'steps': 57531, 'loss/train': 1.371749758720398} -08/30/2021 23:33:16 - INFO - __main__ - Step 57533: {'lr': 0.000345513946672563, 'samples': 11046336, 'steps': 57532, 'loss/train': 1.3756765127182007} -08/30/2021 23:33:18 - INFO - __main__ - Step 57534: {'lr': 0.0003455090424802393, 'samples': 11046528, 'steps': 57533, 'loss/train': 1.0895546674728394} -08/30/2021 23:33:18 - INFO - __main__ - Step 57535: {'lr': 0.00034550413824488066, 'samples': 11046720, 'steps': 57534, 'loss/train': 1.26651930809021} -08/30/2021 23:33:19 - INFO - __main__ - Step 57536: {'lr': 0.0003454992339664893, 'samples': 11046912, 'steps': 57535, 'loss/train': 1.100299596786499} -08/30/2021 23:33:19 - INFO - __main__ - Step 57537: {'lr': 0.00034549432964506755, 'samples': 11047104, 'steps': 57536, 'loss/train': 1.2957290410995483} -08/30/2021 23:33:19 - INFO - __main__ - Step 57538: {'lr': 0.0003454894252806175, 'samples': 11047296, 'steps': 57537, 'loss/train': 0.0267304889857769} -08/30/2021 23:33:20 - INFO - __main__ - Step 57539: {'lr': 0.00034548452087314135, 'samples': 11047488, 'steps': 57538, 'loss/train': 0.022666100412607193} -08/30/2021 23:33:22 - INFO - __main__ - Step 57540: {'lr': 0.0003454796164226414, 'samples': 11047680, 'steps': 57539, 'loss/train': 1.9569488763809204} -08/30/2021 23:33:22 - INFO - __main__ - Step 57541: {'lr': 0.00034547471192911973, 'samples': 11047872, 'steps': 57540, 'loss/train': 1.228626012802124} -08/30/2021 23:33:22 - INFO - __main__ - Step 57542: {'lr': 0.0003454698073925787, 'samples': 11048064, 'steps': 57541, 'loss/train': 1.2397302389144897} -08/30/2021 23:33:23 - INFO - __main__ - Step 57543: {'lr': 0.00034546490281302033, 'samples': 11048256, 'steps': 57542, 'loss/train': 0.6691275835037231} -08/30/2021 23:33:23 - INFO - __main__ - Step 57544: {'lr': 0.000345459998190447, 'samples': 11048448, 'steps': 57543, 'loss/train': 1.49228036403656} -08/30/2021 23:33:25 - INFO - __main__ - Step 57545: {'lr': 0.000345455093524861, 'samples': 11048640, 'steps': 57544, 'loss/train': 1.1912755966186523} -08/30/2021 23:33:25 - INFO - __main__ - Step 57546: {'lr': 0.00034545018881626435, 'samples': 11048832, 'steps': 57545, 'loss/train': 1.4535815715789795} -08/30/2021 23:33:26 - INFO - __main__ - Step 57547: {'lr': 0.00034544528406465927, 'samples': 11049024, 'steps': 57546, 'loss/train': 1.5673638582229614} -08/30/2021 23:33:26 - INFO - __main__ - Step 57548: {'lr': 0.000345440379270048, 'samples': 11049216, 'steps': 57547, 'loss/train': 1.0576817989349365} -08/30/2021 23:33:26 - INFO - __main__ - Step 57549: {'lr': 0.0003454354744324328, 'samples': 11049408, 'steps': 57548, 'loss/train': 1.4908499717712402} -08/30/2021 23:33:27 - INFO - __main__ - Step 57550: {'lr': 0.00034543056955181584, 'samples': 11049600, 'steps': 57549, 'loss/train': 1.5017606019973755} -08/30/2021 23:33:28 - INFO - __main__ - Step 57551: {'lr': 0.0003454256646281993, 'samples': 11049792, 'steps': 57550, 'loss/train': 1.3556101322174072} -08/30/2021 23:33:29 - INFO - __main__ - Step 57552: {'lr': 0.0003454207596615855, 'samples': 11049984, 'steps': 57551, 'loss/train': 1.4647105932235718} -08/30/2021 23:33:29 - INFO - __main__ - Step 57553: {'lr': 0.00034541585465197653, 'samples': 11050176, 'steps': 57552, 'loss/train': 1.4885293245315552} -08/30/2021 23:33:29 - INFO - __main__ - Step 57554: {'lr': 0.0003454109495993747, 'samples': 11050368, 'steps': 57553, 'loss/train': 0.9432709217071533} -08/30/2021 23:33:30 - INFO - __main__ - Step 57555: {'lr': 0.0003454060445037821, 'samples': 11050560, 'steps': 57554, 'loss/train': 0.7419079542160034} -08/30/2021 23:33:32 - INFO - __main__ - Step 57556: {'lr': 0.0003454011393652011, 'samples': 11050752, 'steps': 57555, 'loss/train': 1.0104891061782837} -08/30/2021 23:33:32 - INFO - __main__ - Step 57557: {'lr': 0.0003453962341836337, 'samples': 11050944, 'steps': 57556, 'loss/train': 0.6945191621780396} -08/30/2021 23:33:33 - INFO - __main__ - Step 57558: {'lr': 0.0003453913289590823, 'samples': 11051136, 'steps': 57557, 'loss/train': 1.7103712558746338} -08/30/2021 23:33:33 - INFO - __main__ - Step 57559: {'lr': 0.00034538642369154907, 'samples': 11051328, 'steps': 57558, 'loss/train': 1.8439635038375854} -08/30/2021 23:33:33 - INFO - __main__ - Step 57560: {'lr': 0.00034538151838103614, 'samples': 11051520, 'steps': 57559, 'loss/train': 1.214728832244873} -08/30/2021 23:33:35 - INFO - __main__ - Step 57561: {'lr': 0.00034537661302754577, 'samples': 11051712, 'steps': 57560, 'loss/train': 1.7380664348602295} -08/30/2021 23:33:35 - INFO - __main__ - Step 57562: {'lr': 0.00034537170763108017, 'samples': 11051904, 'steps': 57561, 'loss/train': 0.4132211208343506} -08/30/2021 23:33:36 - INFO - __main__ - Step 57563: {'lr': 0.00034536680219164156, 'samples': 11052096, 'steps': 57562, 'loss/train': 1.7337266206741333} -08/30/2021 23:33:36 - INFO - __main__ - Step 57564: {'lr': 0.0003453618967092322, 'samples': 11052288, 'steps': 57563, 'loss/train': 0.9239173531532288} -08/30/2021 23:33:37 - INFO - __main__ - Step 57565: {'lr': 0.00034535699118385413, 'samples': 11052480, 'steps': 57564, 'loss/train': 0.8764766454696655} -08/30/2021 23:33:38 - INFO - __main__ - Step 57566: {'lr': 0.00034535208561550974, 'samples': 11052672, 'steps': 57565, 'loss/train': 1.3058198690414429} -08/30/2021 23:33:38 - INFO - __main__ - Step 57567: {'lr': 0.00034534718000420113, 'samples': 11052864, 'steps': 57566, 'loss/train': 1.596453309059143} -08/30/2021 23:33:39 - INFO - __main__ - Step 57568: {'lr': 0.0003453422743499306, 'samples': 11053056, 'steps': 57567, 'loss/train': 1.6370819807052612} -08/30/2021 23:33:39 - INFO - __main__ - Step 57569: {'lr': 0.00034533736865270025, 'samples': 11053248, 'steps': 57568, 'loss/train': 1.4883334636688232} -08/30/2021 23:33:39 - INFO - __main__ - Step 57570: {'lr': 0.0003453324629125124, 'samples': 11053440, 'steps': 57569, 'loss/train': 1.3380407094955444} -08/30/2021 23:33:41 - INFO - __main__ - Step 57571: {'lr': 0.00034532755712936926, 'samples': 11053632, 'steps': 57570, 'loss/train': 1.3347805738449097} -08/30/2021 23:33:42 - INFO - __main__ - Step 57572: {'lr': 0.0003453226513032729, 'samples': 11053824, 'steps': 57571, 'loss/train': 0.980475664138794} -08/30/2021 23:33:42 - INFO - __main__ - Step 57573: {'lr': 0.00034531774543422567, 'samples': 11054016, 'steps': 57572, 'loss/train': 1.2035059928894043} -08/30/2021 23:33:42 - INFO - __main__ - Step 57574: {'lr': 0.00034531283952222975, 'samples': 11054208, 'steps': 57573, 'loss/train': 1.177834153175354} -08/30/2021 23:33:43 - INFO - __main__ - Step 57575: {'lr': 0.00034530793356728727, 'samples': 11054400, 'steps': 57574, 'loss/train': 1.4501341581344604} -08/30/2021 23:33:44 - INFO - __main__ - Step 57576: {'lr': 0.0003453030275694006, 'samples': 11054592, 'steps': 57575, 'loss/train': 1.279768466949463} -08/30/2021 23:33:45 - INFO - __main__ - Step 57577: {'lr': 0.0003452981215285718, 'samples': 11054784, 'steps': 57576, 'loss/train': 1.2387789487838745} -08/30/2021 23:33:45 - INFO - __main__ - Step 57578: {'lr': 0.0003452932154448031, 'samples': 11054976, 'steps': 57577, 'loss/train': 1.4210563898086548} -08/30/2021 23:33:45 - INFO - __main__ - Step 57579: {'lr': 0.0003452883093180968, 'samples': 11055168, 'steps': 57578, 'loss/train': 1.2626224756240845} -08/30/2021 23:33:46 - INFO - __main__ - Step 57580: {'lr': 0.0003452834031484551, 'samples': 11055360, 'steps': 57579, 'loss/train': 0.8644973635673523} -08/30/2021 23:33:47 - INFO - __main__ - Step 57581: {'lr': 0.0003452784969358801, 'samples': 11055552, 'steps': 57580, 'loss/train': 1.5270440578460693} -08/30/2021 23:33:48 - INFO - __main__ - Step 57582: {'lr': 0.0003452735906803741, 'samples': 11055744, 'steps': 57581, 'loss/train': 1.7835882902145386} -08/30/2021 23:33:48 - INFO - __main__ - Step 57583: {'lr': 0.0003452686843819393, 'samples': 11055936, 'steps': 57582, 'loss/train': 1.4282037019729614} -08/30/2021 23:33:49 - INFO - __main__ - Step 57584: {'lr': 0.0003452637780405778, 'samples': 11056128, 'steps': 57583, 'loss/train': 1.4931445121765137} -08/30/2021 23:33:49 - INFO - __main__ - Step 57585: {'lr': 0.000345258871656292, 'samples': 11056320, 'steps': 57584, 'loss/train': 1.939090371131897} -08/30/2021 23:33:49 - INFO - __main__ - Step 57586: {'lr': 0.0003452539652290841, 'samples': 11056512, 'steps': 57585, 'loss/train': 1.1673301458358765} -08/30/2021 23:33:51 - INFO - __main__ - Step 57587: {'lr': 0.00034524905875895614, 'samples': 11056704, 'steps': 57586, 'loss/train': 1.9163360595703125} -08/30/2021 23:33:51 - INFO - __main__ - Step 57588: {'lr': 0.00034524415224591046, 'samples': 11056896, 'steps': 57587, 'loss/train': 1.6837005615234375} -08/30/2021 23:33:52 - INFO - __main__ - Step 57589: {'lr': 0.00034523924568994913, 'samples': 11057088, 'steps': 57588, 'loss/train': 1.4500340223312378} -08/30/2021 23:33:52 - INFO - __main__ - Step 57590: {'lr': 0.00034523433909107454, 'samples': 11057280, 'steps': 57589, 'loss/train': 1.8550750017166138} -08/30/2021 23:33:52 - INFO - __main__ - Step 57591: {'lr': 0.00034522943244928885, 'samples': 11057472, 'steps': 57590, 'loss/train': 1.1731996536254883} -08/30/2021 23:33:54 - INFO - __main__ - Step 57592: {'lr': 0.0003452245257645943, 'samples': 11057664, 'steps': 57591, 'loss/train': 0.8706366419792175} -08/30/2021 23:33:54 - INFO - __main__ - Step 57593: {'lr': 0.00034521961903699296, 'samples': 11057856, 'steps': 57592, 'loss/train': 1.7030678987503052} -08/30/2021 23:33:55 - INFO - __main__ - Step 57594: {'lr': 0.00034521471226648716, 'samples': 11058048, 'steps': 57593, 'loss/train': 1.2411733865737915} -08/30/2021 23:33:55 - INFO - __main__ - Step 57595: {'lr': 0.000345209805453079, 'samples': 11058240, 'steps': 57594, 'loss/train': 1.1184347867965698} -08/30/2021 23:33:55 - INFO - __main__ - Step 57596: {'lr': 0.00034520489859677083, 'samples': 11058432, 'steps': 57595, 'loss/train': 1.0869066715240479} -08/30/2021 23:33:57 - INFO - __main__ - Step 57597: {'lr': 0.0003451999916975648, 'samples': 11058624, 'steps': 57596, 'loss/train': 1.3778116703033447} -08/30/2021 23:33:58 - INFO - __main__ - Step 57598: {'lr': 0.00034519508475546314, 'samples': 11058816, 'steps': 57597, 'loss/train': 2.072032928466797} -08/30/2021 23:33:58 - INFO - __main__ - Step 57599: {'lr': 0.0003451901777704681, 'samples': 11059008, 'steps': 57598, 'loss/train': 0.8535974025726318} -08/30/2021 23:33:58 - INFO - __main__ - Step 57600: {'lr': 0.00034518527074258175, 'samples': 11059200, 'steps': 57599, 'loss/train': 1.1968071460723877} -08/30/2021 23:33:59 - INFO - __main__ - Step 57601: {'lr': 0.00034518036367180637, 'samples': 11059392, 'steps': 57600, 'loss/train': 0.21868842840194702} -08/30/2021 23:34:00 - INFO - __main__ - Step 57602: {'lr': 0.00034517545655814424, 'samples': 11059584, 'steps': 57601, 'loss/train': 1.3872748613357544} -08/30/2021 23:34:01 - INFO - __main__ - Step 57603: {'lr': 0.0003451705494015975, 'samples': 11059776, 'steps': 57602, 'loss/train': 1.2841793298721313} -08/30/2021 23:34:01 - INFO - __main__ - Step 57604: {'lr': 0.0003451656422021684, 'samples': 11059968, 'steps': 57603, 'loss/train': 1.5994257926940918} -08/30/2021 23:34:01 - INFO - __main__ - Step 57605: {'lr': 0.0003451607349598591, 'samples': 11060160, 'steps': 57604, 'loss/train': 1.85781991481781} -08/30/2021 23:34:02 - INFO - __main__ - Step 57606: {'lr': 0.0003451558276746719, 'samples': 11060352, 'steps': 57605, 'loss/train': 1.6756277084350586} -08/30/2021 23:34:03 - INFO - __main__ - Step 57607: {'lr': 0.0003451509203466089, 'samples': 11060544, 'steps': 57606, 'loss/train': 1.3493287563323975} -08/30/2021 23:34:04 - INFO - __main__ - Step 57608: {'lr': 0.00034514601297567235, 'samples': 11060736, 'steps': 57607, 'loss/train': 1.264882206916809} -08/30/2021 23:34:04 - INFO - __main__ - Step 57609: {'lr': 0.00034514110556186446, 'samples': 11060928, 'steps': 57608, 'loss/train': 1.5122637748718262} -08/30/2021 23:34:04 - INFO - __main__ - Step 57610: {'lr': 0.0003451361981051875, 'samples': 11061120, 'steps': 57609, 'loss/train': 0.8713572025299072} -08/30/2021 23:34:05 - INFO - __main__ - Step 57611: {'lr': 0.00034513129060564365, 'samples': 11061312, 'steps': 57610, 'loss/train': 1.1754547357559204} -08/30/2021 23:34:05 - INFO - __main__ - Step 57612: {'lr': 0.00034512638306323506, 'samples': 11061504, 'steps': 57611, 'loss/train': 1.165854573249817} -08/30/2021 23:34:07 - INFO - __main__ - Step 57613: {'lr': 0.000345121475477964, 'samples': 11061696, 'steps': 57612, 'loss/train': 1.0446141958236694} -08/30/2021 23:34:08 - INFO - __main__ - Step 57614: {'lr': 0.0003451165678498327, 'samples': 11061888, 'steps': 57613, 'loss/train': 1.2917474508285522} -08/30/2021 23:34:08 - INFO - __main__ - Step 57615: {'lr': 0.00034511166017884334, 'samples': 11062080, 'steps': 57614, 'loss/train': 0.7459553480148315} -08/30/2021 23:34:08 - INFO - __main__ - Step 57616: {'lr': 0.0003451067524649981, 'samples': 11062272, 'steps': 57615, 'loss/train': 0.8307577967643738} -08/30/2021 23:34:09 - INFO - __main__ - Step 57617: {'lr': 0.00034510184470829924, 'samples': 11062464, 'steps': 57616, 'loss/train': 0.6022247672080994} -08/30/2021 23:34:10 - INFO - __main__ - Step 57618: {'lr': 0.000345096936908749, 'samples': 11062656, 'steps': 57617, 'loss/train': 1.2412227392196655} -08/30/2021 23:34:11 - INFO - __main__ - Step 57619: {'lr': 0.0003450920290663495, 'samples': 11062848, 'steps': 57618, 'loss/train': 0.7889207601547241} -08/30/2021 23:34:11 - INFO - __main__ - Step 57620: {'lr': 0.000345087121181103, 'samples': 11063040, 'steps': 57619, 'loss/train': 1.3664442300796509} -08/30/2021 23:34:11 - INFO - __main__ - Step 57621: {'lr': 0.0003450822132530117, 'samples': 11063232, 'steps': 57620, 'loss/train': 0.8068606853485107} -08/30/2021 23:34:12 - INFO - __main__ - Step 57622: {'lr': 0.0003450773052820779, 'samples': 11063424, 'steps': 57621, 'loss/train': 1.3867192268371582} -08/30/2021 23:34:13 - INFO - __main__ - Step 57623: {'lr': 0.0003450723972683036, 'samples': 11063616, 'steps': 57622, 'loss/train': 1.0013068914413452} -08/30/2021 23:34:14 - INFO - __main__ - Step 57624: {'lr': 0.00034506748921169124, 'samples': 11063808, 'steps': 57623, 'loss/train': 0.9682133793830872} -08/30/2021 23:34:14 - INFO - __main__ - Step 57625: {'lr': 0.00034506258111224294, 'samples': 11064000, 'steps': 57624, 'loss/train': 1.3219531774520874} -08/30/2021 23:34:15 - INFO - __main__ - Step 57626: {'lr': 0.00034505767296996086, 'samples': 11064192, 'steps': 57625, 'loss/train': 1.5804495811462402} -08/30/2021 23:34:15 - INFO - __main__ - Step 57627: {'lr': 0.0003450527647848473, 'samples': 11064384, 'steps': 57626, 'loss/train': 1.340441346168518} -08/30/2021 23:34:16 - INFO - __main__ - Step 57628: {'lr': 0.0003450478565569044, 'samples': 11064576, 'steps': 57627, 'loss/train': 0.831775426864624} -08/30/2021 23:34:17 - INFO - __main__ - Step 57629: {'lr': 0.0003450429482861344, 'samples': 11064768, 'steps': 57628, 'loss/train': 1.503279685974121} -08/30/2021 23:34:17 - INFO - __main__ - Step 57630: {'lr': 0.0003450380399725396, 'samples': 11064960, 'steps': 57629, 'loss/train': 1.498227596282959} -08/30/2021 23:34:18 - INFO - __main__ - Step 57631: {'lr': 0.000345033131616122, 'samples': 11065152, 'steps': 57630, 'loss/train': 1.1055716276168823} -08/30/2021 23:34:18 - INFO - __main__ - Step 57632: {'lr': 0.000345028223216884, 'samples': 11065344, 'steps': 57631, 'loss/train': 1.2551686763763428} -08/30/2021 23:34:19 - INFO - __main__ - Step 57633: {'lr': 0.0003450233147748278, 'samples': 11065536, 'steps': 57632, 'loss/train': 1.4205131530761719} -08/30/2021 23:34:20 - INFO - __main__ - Step 57634: {'lr': 0.00034501840628995545, 'samples': 11065728, 'steps': 57633, 'loss/train': 1.5272709131240845} -08/30/2021 23:34:20 - INFO - __main__ - Step 57635: {'lr': 0.0003450134977622693, 'samples': 11065920, 'steps': 57634, 'loss/train': 0.944395899772644} -08/30/2021 23:34:21 - INFO - __main__ - Step 57636: {'lr': 0.0003450085891917716, 'samples': 11066112, 'steps': 57635, 'loss/train': 1.1037479639053345} -08/30/2021 23:34:21 - INFO - __main__ - Step 57637: {'lr': 0.00034500368057846444, 'samples': 11066304, 'steps': 57636, 'loss/train': 1.895972728729248} -08/30/2021 23:34:22 - INFO - __main__ - Step 57638: {'lr': 0.00034499877192235005, 'samples': 11066496, 'steps': 57637, 'loss/train': 0.9974783062934875} -08/30/2021 23:34:23 - INFO - __main__ - Step 57639: {'lr': 0.00034499386322343087, 'samples': 11066688, 'steps': 57638, 'loss/train': 1.1062231063842773} -08/30/2021 23:34:23 - INFO - __main__ - Step 57640: {'lr': 0.00034498895448170874, 'samples': 11066880, 'steps': 57639, 'loss/train': 1.6630113124847412} -08/30/2021 23:34:23 - INFO - __main__ - Step 57641: {'lr': 0.0003449840456971861, 'samples': 11067072, 'steps': 57640, 'loss/train': 0.5174520015716553} -08/30/2021 23:34:24 - INFO - __main__ - Step 57642: {'lr': 0.0003449791368698651, 'samples': 11067264, 'steps': 57641, 'loss/train': 1.4498767852783203} -08/30/2021 23:34:26 - INFO - __main__ - Step 57643: {'lr': 0.000344974227999748, 'samples': 11067456, 'steps': 57642, 'loss/train': 0.5241720080375671} -08/30/2021 23:34:26 - INFO - __main__ - Step 57644: {'lr': 0.0003449693190868369, 'samples': 11067648, 'steps': 57643, 'loss/train': 0.9886839389801025} -08/30/2021 23:34:26 - INFO - __main__ - Step 57645: {'lr': 0.0003449644101311341, 'samples': 11067840, 'steps': 57644, 'loss/train': 1.1314173936843872} -08/30/2021 23:34:27 - INFO - __main__ - Step 57646: {'lr': 0.00034495950113264194, 'samples': 11068032, 'steps': 57645, 'loss/train': 1.3463867902755737} -08/30/2021 23:34:27 - INFO - __main__ - Step 57647: {'lr': 0.0003449545920913624, 'samples': 11068224, 'steps': 57646, 'loss/train': 0.8864731788635254} -08/30/2021 23:34:27 - INFO - __main__ - Step 57648: {'lr': 0.0003449496830072978, 'samples': 11068416, 'steps': 57647, 'loss/train': 0.8631796836853027} -08/30/2021 23:34:29 - INFO - __main__ - Step 57649: {'lr': 0.0003449447738804503, 'samples': 11068608, 'steps': 57648, 'loss/train': 0.43476948142051697} -08/30/2021 23:34:30 - INFO - __main__ - Step 57650: {'lr': 0.00034493986471082215, 'samples': 11068800, 'steps': 57649, 'loss/train': 1.7842961549758911} -08/30/2021 23:34:30 - INFO - __main__ - Step 57651: {'lr': 0.0003449349554984156, 'samples': 11068992, 'steps': 57650, 'loss/train': 1.1075594425201416} -08/30/2021 23:34:30 - INFO - __main__ - Step 57652: {'lr': 0.0003449300462432328, 'samples': 11069184, 'steps': 57651, 'loss/train': 1.211912751197815} -08/30/2021 23:34:31 - INFO - __main__ - Step 57653: {'lr': 0.0003449251369452761, 'samples': 11069376, 'steps': 57652, 'loss/train': 1.6299463510513306} -08/30/2021 23:34:32 - INFO - __main__ - Step 57654: {'lr': 0.00034492022760454743, 'samples': 11069568, 'steps': 57653, 'loss/train': 1.9488661289215088} -08/30/2021 23:34:33 - INFO - __main__ - Step 57655: {'lr': 0.00034491531822104923, 'samples': 11069760, 'steps': 57654, 'loss/train': 1.3055777549743652} -08/30/2021 23:34:33 - INFO - __main__ - Step 57656: {'lr': 0.00034491040879478364, 'samples': 11069952, 'steps': 57655, 'loss/train': 2.427436113357544} -08/30/2021 23:34:33 - INFO - __main__ - Step 57657: {'lr': 0.0003449054993257529, 'samples': 11070144, 'steps': 57656, 'loss/train': 1.5588815212249756} -08/30/2021 23:34:34 - INFO - __main__ - Step 57658: {'lr': 0.0003449005898139592, 'samples': 11070336, 'steps': 57657, 'loss/train': 1.192208170890808} -08/30/2021 23:34:34 - INFO - __main__ - Step 57659: {'lr': 0.0003448956802594048, 'samples': 11070528, 'steps': 57658, 'loss/train': 0.7147905826568604} -08/30/2021 23:34:35 - INFO - __main__ - Step 57660: {'lr': 0.00034489077066209185, 'samples': 11070720, 'steps': 57659, 'loss/train': 1.7572073936462402} -08/30/2021 23:34:36 - INFO - __main__ - Step 57661: {'lr': 0.0003448858610220226, 'samples': 11070912, 'steps': 57660, 'loss/train': 1.4784742593765259} -08/30/2021 23:34:36 - INFO - __main__ - Step 57662: {'lr': 0.00034488095133919914, 'samples': 11071104, 'steps': 57661, 'loss/train': 1.6818466186523438} -08/30/2021 23:34:37 - INFO - __main__ - Step 57663: {'lr': 0.0003448760416136239, 'samples': 11071296, 'steps': 57662, 'loss/train': 1.5901094675064087} -08/30/2021 23:34:37 - INFO - __main__ - Step 57664: {'lr': 0.00034487113184529896, 'samples': 11071488, 'steps': 57663, 'loss/train': 1.5783939361572266} -08/30/2021 23:34:39 - INFO - __main__ - Step 57665: {'lr': 0.0003448662220342265, 'samples': 11071680, 'steps': 57664, 'loss/train': 2.082850217819214} -08/30/2021 23:34:39 - INFO - __main__ - Step 57666: {'lr': 0.0003448613121804088, 'samples': 11071872, 'steps': 57665, 'loss/train': 1.508696436882019} -08/30/2021 23:34:40 - INFO - __main__ - Step 57667: {'lr': 0.0003448564022838481, 'samples': 11072064, 'steps': 57666, 'loss/train': 1.1992400884628296} -08/30/2021 23:34:40 - INFO - __main__ - Step 57668: {'lr': 0.0003448514923445466, 'samples': 11072256, 'steps': 57667, 'loss/train': 1.7660138607025146} -08/30/2021 23:34:40 - INFO - __main__ - Step 57669: {'lr': 0.00034484658236250636, 'samples': 11072448, 'steps': 57668, 'loss/train': 0.876061201095581} -08/30/2021 23:34:42 - INFO - __main__ - Step 57670: {'lr': 0.0003448416723377298, 'samples': 11072640, 'steps': 57669, 'loss/train': 1.0351300239562988} -08/30/2021 23:34:43 - INFO - __main__ - Step 57671: {'lr': 0.00034483676227021906, 'samples': 11072832, 'steps': 57670, 'loss/train': 1.0887587070465088} -08/30/2021 23:34:43 - INFO - __main__ - Step 57672: {'lr': 0.00034483185215997624, 'samples': 11073024, 'steps': 57671, 'loss/train': 1.7450810670852661} -08/30/2021 23:34:43 - INFO - __main__ - Step 57673: {'lr': 0.00034482694200700377, 'samples': 11073216, 'steps': 57672, 'loss/train': 1.477314829826355} -08/30/2021 23:34:44 - INFO - __main__ - Step 57674: {'lr': 0.00034482203181130365, 'samples': 11073408, 'steps': 57673, 'loss/train': 0.24988338351249695} -08/30/2021 23:34:45 - INFO - __main__ - Step 57675: {'lr': 0.00034481712157287826, 'samples': 11073600, 'steps': 57674, 'loss/train': 1.4812304973602295} -08/30/2021 23:34:45 - INFO - __main__ - Step 57676: {'lr': 0.00034481221129172967, 'samples': 11073792, 'steps': 57675, 'loss/train': 0.9994809031486511} -08/30/2021 23:34:46 - INFO - __main__ - Step 57677: {'lr': 0.0003448073009678602, 'samples': 11073984, 'steps': 57676, 'loss/train': 1.4245047569274902} -08/30/2021 23:34:46 - INFO - __main__ - Step 57678: {'lr': 0.00034480239060127204, 'samples': 11074176, 'steps': 57677, 'loss/train': 1.153174877166748} -08/30/2021 23:34:47 - INFO - __main__ - Step 57679: {'lr': 0.00034479748019196734, 'samples': 11074368, 'steps': 57678, 'loss/train': 1.445250391960144} -08/30/2021 23:34:48 - INFO - __main__ - Step 57680: {'lr': 0.00034479256973994843, 'samples': 11074560, 'steps': 57679, 'loss/train': 0.6847001314163208} -08/30/2021 23:34:48 - INFO - __main__ - Step 57681: {'lr': 0.0003447876592452174, 'samples': 11074752, 'steps': 57680, 'loss/train': 1.2577377557754517} -08/30/2021 23:34:49 - INFO - __main__ - Step 57682: {'lr': 0.00034478274870777646, 'samples': 11074944, 'steps': 57681, 'loss/train': 1.187567114830017} -08/30/2021 23:34:49 - INFO - __main__ - Step 57683: {'lr': 0.00034477783812762795, 'samples': 11075136, 'steps': 57682, 'loss/train': 1.3287125825881958} -08/30/2021 23:34:49 - INFO - __main__ - Step 57684: {'lr': 0.00034477292750477396, 'samples': 11075328, 'steps': 57683, 'loss/train': 1.7312740087509155} -08/30/2021 23:34:51 - INFO - __main__ - Step 57685: {'lr': 0.00034476801683921683, 'samples': 11075520, 'steps': 57684, 'loss/train': 1.308159589767456} -08/30/2021 23:34:51 - INFO - __main__ - Step 57686: {'lr': 0.00034476310613095867, 'samples': 11075712, 'steps': 57685, 'loss/train': 0.866007387638092} -08/30/2021 23:34:52 - INFO - __main__ - Step 57687: {'lr': 0.0003447581953800017, 'samples': 11075904, 'steps': 57686, 'loss/train': 1.1797256469726562} -08/30/2021 23:34:52 - INFO - __main__ - Step 57688: {'lr': 0.00034475328458634814, 'samples': 11076096, 'steps': 57687, 'loss/train': 1.34390127658844} -08/30/2021 23:34:52 - INFO - __main__ - Step 57689: {'lr': 0.00034474837375000016, 'samples': 11076288, 'steps': 57688, 'loss/train': 1.7094366550445557} -08/30/2021 23:34:55 - INFO - __main__ - Step 57690: {'lr': 0.0003447434628709601, 'samples': 11076480, 'steps': 57689, 'loss/train': 1.3257652521133423} -08/30/2021 23:34:55 - INFO - __main__ - Step 57691: {'lr': 0.00034473855194923006, 'samples': 11076672, 'steps': 57690, 'loss/train': 0.8218780755996704} -08/30/2021 23:34:55 - INFO - __main__ - Step 57692: {'lr': 0.0003447336409848124, 'samples': 11076864, 'steps': 57691, 'loss/train': 1.311018466949463} -08/30/2021 23:34:56 - INFO - __main__ - Step 57693: {'lr': 0.0003447287299777091, 'samples': 11077056, 'steps': 57692, 'loss/train': 0.5102701187133789} -08/30/2021 23:34:56 - INFO - __main__ - Step 57694: {'lr': 0.0003447238189279225, 'samples': 11077248, 'steps': 57693, 'loss/train': 2.0247859954833984} -08/30/2021 23:34:56 - INFO - __main__ - Step 57695: {'lr': 0.0003447189078354548, 'samples': 11077440, 'steps': 57694, 'loss/train': 1.5504810810089111} -08/30/2021 23:34:58 - INFO - __main__ - Step 57696: {'lr': 0.00034471399670030824, 'samples': 11077632, 'steps': 57695, 'loss/train': 0.8103264570236206} -08/30/2021 23:34:58 - INFO - __main__ - Step 57697: {'lr': 0.00034470908552248504, 'samples': 11077824, 'steps': 57696, 'loss/train': 0.17652305960655212} -08/30/2021 23:34:59 - INFO - __main__ - Step 57698: {'lr': 0.00034470417430198743, 'samples': 11078016, 'steps': 57697, 'loss/train': 0.7908549308776855} -08/30/2021 23:34:59 - INFO - __main__ - Step 57699: {'lr': 0.00034469926303881747, 'samples': 11078208, 'steps': 57698, 'loss/train': 1.545953631401062} -08/30/2021 23:34:59 - INFO - __main__ - Step 57700: {'lr': 0.0003446943517329776, 'samples': 11078400, 'steps': 57699, 'loss/train': 0.47651827335357666} -08/30/2021 23:35:01 - INFO - __main__ - Step 57701: {'lr': 0.0003446894403844698, 'samples': 11078592, 'steps': 57700, 'loss/train': 1.7272061109542847} -08/30/2021 23:35:02 - INFO - __main__ - Step 57702: {'lr': 0.0003446845289932965, 'samples': 11078784, 'steps': 57701, 'loss/train': 1.343973159790039} -08/30/2021 23:35:02 - INFO - __main__ - Step 57703: {'lr': 0.0003446796175594598, 'samples': 11078976, 'steps': 57702, 'loss/train': 1.253000020980835} -08/30/2021 23:35:02 - INFO - __main__ - Step 57704: {'lr': 0.00034467470608296185, 'samples': 11079168, 'steps': 57703, 'loss/train': 1.3533598184585571} -08/30/2021 23:35:03 - INFO - __main__ - Step 57705: {'lr': 0.00034466979456380497, 'samples': 11079360, 'steps': 57704, 'loss/train': 5.671090126037598} -08/30/2021 23:35:03 - INFO - __main__ - Step 57706: {'lr': 0.0003446648830019914, 'samples': 11079552, 'steps': 57705, 'loss/train': 2.1126325130462646} -08/30/2021 23:35:05 - INFO - __main__ - Step 57707: {'lr': 0.00034465997139752327, 'samples': 11079744, 'steps': 57706, 'loss/train': 1.5409153699874878} -08/30/2021 23:35:05 - INFO - __main__ - Step 57708: {'lr': 0.00034465505975040273, 'samples': 11079936, 'steps': 57707, 'loss/train': 1.7867683172225952} -08/30/2021 23:35:06 - INFO - __main__ - Step 57709: {'lr': 0.0003446501480606322, 'samples': 11080128, 'steps': 57708, 'loss/train': 1.0364409685134888} -08/30/2021 23:35:06 - INFO - __main__ - Step 57710: {'lr': 0.0003446452363282137, 'samples': 11080320, 'steps': 57709, 'loss/train': 1.5341821908950806} -08/30/2021 23:35:06 - INFO - __main__ - Step 57711: {'lr': 0.00034464032455314955, 'samples': 11080512, 'steps': 57710, 'loss/train': 1.1671291589736938} -08/30/2021 23:35:08 - INFO - __main__ - Step 57712: {'lr': 0.0003446354127354419, 'samples': 11080704, 'steps': 57711, 'loss/train': 1.4817571640014648} -08/30/2021 23:35:08 - INFO - __main__ - Step 57713: {'lr': 0.000344630500875093, 'samples': 11080896, 'steps': 57712, 'loss/train': 1.438253402709961} -08/30/2021 23:35:08 - INFO - __main__ - Step 57714: {'lr': 0.0003446255889721051, 'samples': 11081088, 'steps': 57713, 'loss/train': 1.4417246580123901} -08/30/2021 23:35:09 - INFO - __main__ - Step 57715: {'lr': 0.00034462067702648036, 'samples': 11081280, 'steps': 57714, 'loss/train': 1.0315977334976196} -08/30/2021 23:35:09 - INFO - __main__ - Step 57716: {'lr': 0.000344615765038221, 'samples': 11081472, 'steps': 57715, 'loss/train': 1.712326169013977} -08/30/2021 23:35:12 - INFO - __main__ - Step 57717: {'lr': 0.0003446108530073292, 'samples': 11081664, 'steps': 57716, 'loss/train': 1.1476267576217651} -08/30/2021 23:35:12 - INFO - __main__ - Step 57718: {'lr': 0.0003446059409338072, 'samples': 11081856, 'steps': 57717, 'loss/train': 1.0954937934875488} -08/30/2021 23:35:12 - INFO - __main__ - Step 57719: {'lr': 0.00034460102881765723, 'samples': 11082048, 'steps': 57718, 'loss/train': 1.0650982856750488} -08/30/2021 23:35:13 - INFO - __main__ - Step 57720: {'lr': 0.0003445961166588816, 'samples': 11082240, 'steps': 57719, 'loss/train': 1.8287652730941772} -08/30/2021 23:35:13 - INFO - __main__ - Step 57721: {'lr': 0.0003445912044574823, 'samples': 11082432, 'steps': 57720, 'loss/train': 1.3199036121368408} -08/30/2021 23:35:14 - INFO - __main__ - Step 57722: {'lr': 0.00034458629221346173, 'samples': 11082624, 'steps': 57721, 'loss/train': 1.1869730949401855} -08/30/2021 23:35:15 - INFO - __main__ - Step 57723: {'lr': 0.000344581379926822, 'samples': 11082816, 'steps': 57722, 'loss/train': 0.5886616706848145} -08/30/2021 23:35:15 - INFO - __main__ - Step 57724: {'lr': 0.00034457646759756535, 'samples': 11083008, 'steps': 57723, 'loss/train': 1.2401893138885498} -08/30/2021 23:35:16 - INFO - __main__ - Step 57725: {'lr': 0.00034457155522569393, 'samples': 11083200, 'steps': 57724, 'loss/train': 0.4214799106121063} -08/30/2021 23:35:16 - INFO - __main__ - Step 57726: {'lr': 0.00034456664281121017, 'samples': 11083392, 'steps': 57725, 'loss/train': 1.436943769454956} -08/30/2021 23:35:16 - INFO - __main__ - Step 57727: {'lr': 0.00034456173035411606, 'samples': 11083584, 'steps': 57726, 'loss/train': 1.079527497291565} -08/30/2021 23:35:18 - INFO - __main__ - Step 57728: {'lr': 0.00034455681785441395, 'samples': 11083776, 'steps': 57727, 'loss/train': 1.3954976797103882} -08/30/2021 23:35:18 - INFO - __main__ - Step 57729: {'lr': 0.00034455190531210595, 'samples': 11083968, 'steps': 57728, 'loss/train': 0.8561622500419617} -08/30/2021 23:35:19 - INFO - __main__ - Step 57730: {'lr': 0.0003445469927271944, 'samples': 11084160, 'steps': 57729, 'loss/train': 1.1404969692230225} -08/30/2021 23:35:19 - INFO - __main__ - Step 57731: {'lr': 0.0003445420800996813, 'samples': 11084352, 'steps': 57730, 'loss/train': 1.301236629486084} -08/30/2021 23:35:19 - INFO - __main__ - Step 57732: {'lr': 0.0003445371674295691, 'samples': 11084544, 'steps': 57731, 'loss/train': 1.877077579498291} -08/30/2021 23:35:21 - INFO - __main__ - Step 57733: {'lr': 0.0003445322547168599, 'samples': 11084736, 'steps': 57732, 'loss/train': 1.3867772817611694} -08/30/2021 23:35:21 - INFO - __main__ - Step 57734: {'lr': 0.0003445273419615559, 'samples': 11084928, 'steps': 57733, 'loss/train': 1.3879948854446411} -08/30/2021 23:35:22 - INFO - __main__ - Step 57735: {'lr': 0.00034452242916365935, 'samples': 11085120, 'steps': 57734, 'loss/train': 1.122413992881775} -08/30/2021 23:35:22 - INFO - __main__ - Step 57736: {'lr': 0.0003445175163231724, 'samples': 11085312, 'steps': 57735, 'loss/train': 1.109182357788086} -08/30/2021 23:35:23 - INFO - __main__ - Step 57737: {'lr': 0.00034451260344009737, 'samples': 11085504, 'steps': 57736, 'loss/train': 0.9724215865135193} -08/30/2021 23:35:24 - INFO - __main__ - Step 57738: {'lr': 0.00034450769051443635, 'samples': 11085696, 'steps': 57737, 'loss/train': 1.587076187133789} -08/30/2021 23:35:24 - INFO - __main__ - Step 57739: {'lr': 0.0003445027775461917, 'samples': 11085888, 'steps': 57738, 'loss/train': 1.295042872428894} -08/30/2021 23:35:25 - INFO - __main__ - Step 57740: {'lr': 0.0003444978645353656, 'samples': 11086080, 'steps': 57739, 'loss/train': 1.1635597944259644} -08/30/2021 23:35:25 - INFO - __main__ - Step 57741: {'lr': 0.0003444929514819601, 'samples': 11086272, 'steps': 57740, 'loss/train': 1.6778360605239868} -08/30/2021 23:35:26 - INFO - __main__ - Step 57742: {'lr': 0.00034448803838597766, 'samples': 11086464, 'steps': 57741, 'loss/train': 1.3427680730819702} -08/30/2021 23:35:27 - INFO - __main__ - Step 57743: {'lr': 0.00034448312524742027, 'samples': 11086656, 'steps': 57742, 'loss/train': 1.3636891841888428} -08/30/2021 23:35:27 - INFO - __main__ - Step 57744: {'lr': 0.00034447821206629026, 'samples': 11086848, 'steps': 57743, 'loss/train': 0.6368964314460754} -08/30/2021 23:35:28 - INFO - __main__ - Step 57745: {'lr': 0.0003444732988425898, 'samples': 11087040, 'steps': 57744, 'loss/train': 0.5811021327972412} -08/30/2021 23:35:28 - INFO - __main__ - Step 57746: {'lr': 0.0003444683855763212, 'samples': 11087232, 'steps': 57745, 'loss/train': 1.5221400260925293} -08/30/2021 23:35:28 - INFO - __main__ - Step 57747: {'lr': 0.0003444634722674866, 'samples': 11087424, 'steps': 57746, 'loss/train': 1.543156385421753} -08/30/2021 23:35:29 - INFO - __main__ - Step 57748: {'lr': 0.0003444585589160882, 'samples': 11087616, 'steps': 57747, 'loss/train': 1.1631295680999756} -08/30/2021 23:35:30 - INFO - __main__ - Step 57749: {'lr': 0.0003444536455221282, 'samples': 11087808, 'steps': 57748, 'loss/train': 1.7758017778396606} -08/30/2021 23:35:31 - INFO - __main__ - Step 57750: {'lr': 0.00034444873208560884, 'samples': 11088000, 'steps': 57749, 'loss/train': 0.3763757050037384} -08/30/2021 23:35:31 - INFO - __main__ - Step 57751: {'lr': 0.00034444381860653233, 'samples': 11088192, 'steps': 57750, 'loss/train': 1.2167519330978394} -08/30/2021 23:35:31 - INFO - __main__ - Step 57752: {'lr': 0.00034443890508490093, 'samples': 11088384, 'steps': 57751, 'loss/train': 1.0028660297393799} -08/30/2021 23:35:32 - INFO - __main__ - Step 57753: {'lr': 0.0003444339915207168, 'samples': 11088576, 'steps': 57752, 'loss/train': 1.0443212985992432} -08/30/2021 23:35:33 - INFO - __main__ - Step 57754: {'lr': 0.0003444290779139823, 'samples': 11088768, 'steps': 57753, 'loss/train': 1.092671513557434} -08/30/2021 23:35:34 - INFO - __main__ - Step 57755: {'lr': 0.00034442416426469936, 'samples': 11088960, 'steps': 57754, 'loss/train': 0.5585522651672363} -08/30/2021 23:35:34 - INFO - __main__ - Step 57756: {'lr': 0.0003444192505728704, 'samples': 11089152, 'steps': 57755, 'loss/train': 0.9616211652755737} -08/30/2021 23:35:35 - INFO - __main__ - Step 57757: {'lr': 0.0003444143368384975, 'samples': 11089344, 'steps': 57756, 'loss/train': 0.5474900603294373} -08/30/2021 23:35:35 - INFO - __main__ - Step 57758: {'lr': 0.000344409423061583, 'samples': 11089536, 'steps': 57757, 'loss/train': 0.8820144534111023} -08/30/2021 23:35:36 - INFO - __main__ - Step 57759: {'lr': 0.00034440450924212913, 'samples': 11089728, 'steps': 57758, 'loss/train': 0.8886938095092773} -08/30/2021 23:35:37 - INFO - __main__ - Step 57760: {'lr': 0.00034439959538013805, 'samples': 11089920, 'steps': 57759, 'loss/train': 1.1811778545379639} -08/30/2021 23:35:37 - INFO - __main__ - Step 57761: {'lr': 0.0003443946814756119, 'samples': 11090112, 'steps': 57760, 'loss/train': 1.266503930091858} -08/30/2021 23:35:38 - INFO - __main__ - Step 57762: {'lr': 0.000344389767528553, 'samples': 11090304, 'steps': 57761, 'loss/train': 1.295312523841858} -08/30/2021 23:35:38 - INFO - __main__ - Step 57763: {'lr': 0.0003443848535389635, 'samples': 11090496, 'steps': 57762, 'loss/train': 1.5202609300613403} -08/30/2021 23:35:39 - INFO - __main__ - Step 57764: {'lr': 0.00034437993950684566, 'samples': 11090688, 'steps': 57763, 'loss/train': 1.4758069515228271} -08/30/2021 23:35:40 - INFO - __main__ - Step 57765: {'lr': 0.00034437502543220166, 'samples': 11090880, 'steps': 57764, 'loss/train': 1.0895005464553833} -08/30/2021 23:35:40 - INFO - __main__ - Step 57766: {'lr': 0.0003443701113150337, 'samples': 11091072, 'steps': 57765, 'loss/train': 1.5651397705078125} -08/30/2021 23:35:41 - INFO - __main__ - Step 57767: {'lr': 0.00034436519715534415, 'samples': 11091264, 'steps': 57766, 'loss/train': 0.9641022086143494} -08/30/2021 23:35:41 - INFO - __main__ - Step 57768: {'lr': 0.00034436028295313503, 'samples': 11091456, 'steps': 57767, 'loss/train': 1.4775365591049194} -08/30/2021 23:35:43 - INFO - __main__ - Step 57769: {'lr': 0.00034435536870840855, 'samples': 11091648, 'steps': 57768, 'loss/train': 1.7708853483200073} -08/30/2021 23:35:43 - INFO - __main__ - Step 57770: {'lr': 0.0003443504544211671, 'samples': 11091840, 'steps': 57769, 'loss/train': 1.1335792541503906} -08/30/2021 23:35:44 - INFO - __main__ - Step 57771: {'lr': 0.0003443455400914127, 'samples': 11092032, 'steps': 57770, 'loss/train': 0.9590129256248474} -08/30/2021 23:35:44 - INFO - __main__ - Step 57772: {'lr': 0.0003443406257191477, 'samples': 11092224, 'steps': 57771, 'loss/train': 1.0170713663101196} -08/30/2021 23:35:45 - INFO - __main__ - Step 57773: {'lr': 0.0003443357113043743, 'samples': 11092416, 'steps': 57772, 'loss/train': 1.997900128364563} -08/30/2021 23:35:45 - INFO - __main__ - Step 57774: {'lr': 0.00034433079684709466, 'samples': 11092608, 'steps': 57773, 'loss/train': 0.973318338394165} -08/30/2021 23:35:46 - INFO - __main__ - Step 57775: {'lr': 0.000344325882347311, 'samples': 11092800, 'steps': 57774, 'loss/train': 0.6636830568313599} -08/30/2021 23:35:47 - INFO - __main__ - Step 57776: {'lr': 0.00034432096780502564, 'samples': 11092992, 'steps': 57775, 'loss/train': 1.1859796047210693} -08/30/2021 23:35:47 - INFO - __main__ - Step 57777: {'lr': 0.0003443160532202406, 'samples': 11093184, 'steps': 57776, 'loss/train': 0.8080893754959106} -08/30/2021 23:35:48 - INFO - __main__ - Step 57778: {'lr': 0.00034431113859295827, 'samples': 11093376, 'steps': 57777, 'loss/train': 1.5912752151489258} -08/30/2021 23:35:48 - INFO - __main__ - Step 57779: {'lr': 0.00034430622392318073, 'samples': 11093568, 'steps': 57778, 'loss/train': 1.5313411951065063} -08/30/2021 23:35:49 - INFO - __main__ - Step 57780: {'lr': 0.0003443013092109103, 'samples': 11093760, 'steps': 57779, 'loss/train': 1.464087724685669} -08/30/2021 23:35:50 - INFO - __main__ - Step 57781: {'lr': 0.0003442963944561492, 'samples': 11093952, 'steps': 57780, 'loss/train': 1.627342939376831} -08/30/2021 23:35:50 - INFO - __main__ - Step 57782: {'lr': 0.0003442914796588995, 'samples': 11094144, 'steps': 57781, 'loss/train': 1.3642815351486206} -08/30/2021 23:35:51 - INFO - __main__ - Step 57783: {'lr': 0.00034428656481916357, 'samples': 11094336, 'steps': 57782, 'loss/train': 1.1529780626296997} -08/30/2021 23:35:51 - INFO - __main__ - Step 57784: {'lr': 0.00034428164993694356, 'samples': 11094528, 'steps': 57783, 'loss/train': 1.4525541067123413} -08/30/2021 23:35:51 - INFO - __main__ - Step 57785: {'lr': 0.0003442767350122417, 'samples': 11094720, 'steps': 57784, 'loss/train': 1.0132561922073364} -08/30/2021 23:35:53 - INFO - __main__ - Step 57786: {'lr': 0.0003442718200450602, 'samples': 11094912, 'steps': 57785, 'loss/train': 1.0175509452819824} -08/30/2021 23:35:53 - INFO - __main__ - Step 57787: {'lr': 0.0003442669050354013, 'samples': 11095104, 'steps': 57786, 'loss/train': 1.4026432037353516} -08/30/2021 23:35:54 - INFO - __main__ - Step 57788: {'lr': 0.00034426198998326713, 'samples': 11095296, 'steps': 57787, 'loss/train': 1.24473237991333} -08/30/2021 23:35:54 - INFO - __main__ - Step 57789: {'lr': 0.00034425707488866, 'samples': 11095488, 'steps': 57788, 'loss/train': 1.5531615018844604} -08/30/2021 23:35:54 - INFO - __main__ - Step 57790: {'lr': 0.0003442521597515821, 'samples': 11095680, 'steps': 57789, 'loss/train': 1.4984086751937866} -08/30/2021 23:35:57 - INFO - __main__ - Step 57791: {'lr': 0.00034424724457203553, 'samples': 11095872, 'steps': 57790, 'loss/train': 0.32216769456863403} -08/30/2021 23:35:57 - INFO - __main__ - Step 57792: {'lr': 0.0003442423293500227, 'samples': 11096064, 'steps': 57791, 'loss/train': 0.3440251648426056} -08/30/2021 23:35:58 - INFO - __main__ - Step 57793: {'lr': 0.0003442374140855457, 'samples': 11096256, 'steps': 57792, 'loss/train': 1.1713815927505493} -08/30/2021 23:35:58 - INFO - __main__ - Step 57794: {'lr': 0.00034423249877860683, 'samples': 11096448, 'steps': 57793, 'loss/train': 5.887346267700195} -08/30/2021 23:35:58 - INFO - __main__ - Step 57795: {'lr': 0.0003442275834292082, 'samples': 11096640, 'steps': 57794, 'loss/train': 5.646505832672119} -08/30/2021 23:35:59 - INFO - __main__ - Step 57796: {'lr': 0.0003442226680373521, 'samples': 11096832, 'steps': 57795, 'loss/train': 5.670462131500244} -08/30/2021 23:35:59 - INFO - __main__ - Step 57797: {'lr': 0.00034421775260304067, 'samples': 11097024, 'steps': 57796, 'loss/train': 5.702449798583984} -08/30/2021 23:36:01 - INFO - __main__ - Step 57798: {'lr': 0.0003442128371262762, 'samples': 11097216, 'steps': 57797, 'loss/train': 1.6899532079696655} -08/30/2021 23:36:01 - INFO - __main__ - Step 57799: {'lr': 0.00034420792160706087, 'samples': 11097408, 'steps': 57798, 'loss/train': 1.3607299327850342} -08/30/2021 23:36:01 - INFO - __main__ - Step 57800: {'lr': 0.0003442030060453969, 'samples': 11097600, 'steps': 57799, 'loss/train': 1.086534857749939} -08/30/2021 23:36:02 - INFO - __main__ - Step 57801: {'lr': 0.0003441980904412866, 'samples': 11097792, 'steps': 57800, 'loss/train': 1.604187250137329} -08/30/2021 23:36:02 - INFO - __main__ - Step 57802: {'lr': 0.000344193174794732, 'samples': 11097984, 'steps': 57801, 'loss/train': 1.3944400548934937} -08/30/2021 23:36:04 - INFO - __main__ - Step 57803: {'lr': 0.00034418825910573545, 'samples': 11098176, 'steps': 57802, 'loss/train': 1.3489320278167725} -08/30/2021 23:36:04 - INFO - __main__ - Step 57804: {'lr': 0.00034418334337429907, 'samples': 11098368, 'steps': 57803, 'loss/train': 1.7557225227355957} -08/30/2021 23:36:04 - INFO - __main__ - Step 57805: {'lr': 0.00034417842760042517, 'samples': 11098560, 'steps': 57804, 'loss/train': 1.3637171983718872} -08/30/2021 23:36:05 - INFO - __main__ - Step 57806: {'lr': 0.0003441735117841159, 'samples': 11098752, 'steps': 57805, 'loss/train': 1.4032765626907349} -08/30/2021 23:36:05 - INFO - __main__ - Step 57807: {'lr': 0.0003441685959253736, 'samples': 11098944, 'steps': 57806, 'loss/train': 1.4107378721237183} -08/30/2021 23:36:07 - INFO - __main__ - Step 57808: {'lr': 0.0003441636800242003, 'samples': 11099136, 'steps': 57807, 'loss/train': 1.7993744611740112} -08/30/2021 23:36:07 - INFO - __main__ - Step 57809: {'lr': 0.0003441587640805983, 'samples': 11099328, 'steps': 57808, 'loss/train': 0.7229326963424683} -08/30/2021 23:36:08 - INFO - __main__ - Step 57810: {'lr': 0.0003441538480945697, 'samples': 11099520, 'steps': 57809, 'loss/train': 1.1483817100524902} -08/30/2021 23:36:08 - INFO - __main__ - Step 57811: {'lr': 0.00034414893206611695, 'samples': 11099712, 'steps': 57810, 'loss/train': 1.3096764087677002} -08/30/2021 23:36:08 - INFO - __main__ - Step 57812: {'lr': 0.0003441440159952422, 'samples': 11099904, 'steps': 57811, 'loss/train': 1.5808639526367188} -08/30/2021 23:36:09 - INFO - __main__ - Step 57813: {'lr': 0.00034413909988194753, 'samples': 11100096, 'steps': 57812, 'loss/train': 1.2514926195144653} -08/30/2021 23:36:10 - INFO - __main__ - Step 57814: {'lr': 0.0003441341837262353, 'samples': 11100288, 'steps': 57813, 'loss/train': 0.10937996953725815} -08/30/2021 23:36:11 - INFO - __main__ - Step 57815: {'lr': 0.00034412926752810756, 'samples': 11100480, 'steps': 57814, 'loss/train': 0.21634015440940857} -08/30/2021 23:36:11 - INFO - __main__ - Step 57816: {'lr': 0.0003441243512875667, 'samples': 11100672, 'steps': 57815, 'loss/train': 1.3703187704086304} -08/30/2021 23:36:11 - INFO - __main__ - Step 57817: {'lr': 0.00034411943500461484, 'samples': 11100864, 'steps': 57816, 'loss/train': 1.9440540075302124} -08/30/2021 23:36:12 - INFO - __main__ - Step 57818: {'lr': 0.0003441145186792542, 'samples': 11101056, 'steps': 57817, 'loss/train': 1.3769536018371582} -08/30/2021 23:36:13 - INFO - __main__ - Step 57819: {'lr': 0.000344109602311487, 'samples': 11101248, 'steps': 57818, 'loss/train': 1.109779715538025} -08/30/2021 23:36:14 - INFO - __main__ - Step 57820: {'lr': 0.0003441046859013155, 'samples': 11101440, 'steps': 57819, 'loss/train': 1.5465869903564453} -08/30/2021 23:36:14 - INFO - __main__ - Step 57821: {'lr': 0.00034409976944874186, 'samples': 11101632, 'steps': 57820, 'loss/train': 0.7728293538093567} -08/30/2021 23:36:14 - INFO - __main__ - Step 57822: {'lr': 0.0003440948529537683, 'samples': 11101824, 'steps': 57821, 'loss/train': 1.0767645835876465} -08/30/2021 23:36:15 - INFO - __main__ - Step 57823: {'lr': 0.00034408993641639707, 'samples': 11102016, 'steps': 57822, 'loss/train': 1.489098072052002} -08/30/2021 23:36:17 - INFO - __main__ - Step 57824: {'lr': 0.0003440850198366304, 'samples': 11102208, 'steps': 57823, 'loss/train': 0.8877474069595337} -08/30/2021 23:36:17 - INFO - __main__ - Step 57825: {'lr': 0.0003440801032144704, 'samples': 11102400, 'steps': 57824, 'loss/train': 0.616609513759613} -08/30/2021 23:36:18 - INFO - __main__ - Step 57826: {'lr': 0.00034407518654991945, 'samples': 11102592, 'steps': 57825, 'loss/train': 0.9271731972694397} -08/30/2021 23:36:18 - INFO - __main__ - Step 57827: {'lr': 0.00034407026984297964, 'samples': 11102784, 'steps': 57826, 'loss/train': 0.9796440601348877} -08/30/2021 23:36:19 - INFO - __main__ - Step 57828: {'lr': 0.00034406535309365317, 'samples': 11102976, 'steps': 57827, 'loss/train': 0.7911518812179565} -08/30/2021 23:36:19 - INFO - __main__ - Step 57829: {'lr': 0.0003440604363019423, 'samples': 11103168, 'steps': 57828, 'loss/train': 0.47116604447364807} -08/30/2021 23:36:21 - INFO - __main__ - Step 57830: {'lr': 0.0003440555194678493, 'samples': 11103360, 'steps': 57829, 'loss/train': 0.5575730800628662} -08/30/2021 23:36:22 - INFO - __main__ - Step 57831: {'lr': 0.0003440506025913763, 'samples': 11103552, 'steps': 57830, 'loss/train': 1.621256947517395} -08/30/2021 23:36:22 - INFO - __main__ - Step 57832: {'lr': 0.0003440456856725256, 'samples': 11103744, 'steps': 57831, 'loss/train': 1.3650532960891724} -08/30/2021 23:36:22 - INFO - __main__ - Step 57833: {'lr': 0.0003440407687112993, 'samples': 11103936, 'steps': 57832, 'loss/train': 1.0273456573486328} -08/30/2021 23:36:23 - INFO - __main__ - Step 57834: {'lr': 0.0003440358517076997, 'samples': 11104128, 'steps': 57833, 'loss/train': 1.679181694984436} -08/30/2021 23:36:24 - INFO - __main__ - Step 57835: {'lr': 0.00034403093466172903, 'samples': 11104320, 'steps': 57834, 'loss/train': 1.6843326091766357} -08/30/2021 23:36:25 - INFO - __main__ - Step 57836: {'lr': 0.00034402601757338946, 'samples': 11104512, 'steps': 57835, 'loss/train': 0.2866305112838745} -08/30/2021 23:36:25 - INFO - __main__ - Step 57837: {'lr': 0.00034402110044268327, 'samples': 11104704, 'steps': 57836, 'loss/train': 1.659409761428833} -08/30/2021 23:36:25 - INFO - __main__ - Step 57838: {'lr': 0.00034401618326961253, 'samples': 11104896, 'steps': 57837, 'loss/train': 1.2834805250167847} -08/30/2021 23:36:26 - INFO - __main__ - Step 57839: {'lr': 0.0003440112660541795, 'samples': 11105088, 'steps': 57838, 'loss/train': 0.12566542625427246} -08/30/2021 23:36:27 - INFO - __main__ - Step 57840: {'lr': 0.0003440063487963866, 'samples': 11105280, 'steps': 57839, 'loss/train': 1.818826675415039} -08/30/2021 23:36:28 - INFO - __main__ - Step 57841: {'lr': 0.00034400143149623574, 'samples': 11105472, 'steps': 57840, 'loss/train': 1.8270034790039062} -08/30/2021 23:36:28 - INFO - __main__ - Step 57842: {'lr': 0.0003439965141537294, 'samples': 11105664, 'steps': 57841, 'loss/train': 1.3017204999923706} -08/30/2021 23:36:28 - INFO - __main__ - Step 57843: {'lr': 0.00034399159676886965, 'samples': 11105856, 'steps': 57842, 'loss/train': 1.2645552158355713} -08/30/2021 23:36:29 - INFO - __main__ - Step 57844: {'lr': 0.00034398667934165873, 'samples': 11106048, 'steps': 57843, 'loss/train': 1.4458588361740112} -08/30/2021 23:36:30 - INFO - __main__ - Step 57845: {'lr': 0.00034398176187209887, 'samples': 11106240, 'steps': 57844, 'loss/train': 0.04177282005548477} -08/30/2021 23:36:31 - INFO - __main__ - Step 57846: {'lr': 0.0003439768443601923, 'samples': 11106432, 'steps': 57845, 'loss/train': 1.368549108505249} -08/30/2021 23:36:31 - INFO - __main__ - Step 57847: {'lr': 0.0003439719268059411, 'samples': 11106624, 'steps': 57846, 'loss/train': 0.920562744140625} -08/30/2021 23:36:31 - INFO - __main__ - Step 57848: {'lr': 0.0003439670092093478, 'samples': 11106816, 'steps': 57847, 'loss/train': 0.9704640507698059} -08/30/2021 23:36:32 - INFO - __main__ - Step 57849: {'lr': 0.00034396209157041424, 'samples': 11107008, 'steps': 57848, 'loss/train': 1.2088522911071777} -08/30/2021 23:36:33 - INFO - __main__ - Step 57850: {'lr': 0.0003439571738891428, 'samples': 11107200, 'steps': 57849, 'loss/train': 1.0287530422210693} -08/30/2021 23:36:34 - INFO - __main__ - Step 57851: {'lr': 0.00034395225616553585, 'samples': 11107392, 'steps': 57850, 'loss/train': 1.0662367343902588} -08/30/2021 23:36:34 - INFO - __main__ - Step 57852: {'lr': 0.00034394733839959534, 'samples': 11107584, 'steps': 57851, 'loss/train': 0.16599543392658234} -08/30/2021 23:36:34 - INFO - __main__ - Step 57853: {'lr': 0.0003439424205913236, 'samples': 11107776, 'steps': 57852, 'loss/train': 0.8803872466087341} -08/30/2021 23:36:35 - INFO - __main__ - Step 57854: {'lr': 0.000343937502740723, 'samples': 11107968, 'steps': 57853, 'loss/train': 1.306980848312378} -08/30/2021 23:36:35 - INFO - __main__ - Step 57855: {'lr': 0.00034393258484779555, 'samples': 11108160, 'steps': 57854, 'loss/train': 1.2254265546798706} -08/30/2021 23:36:37 - INFO - __main__ - Step 57856: {'lr': 0.0003439276669125435, 'samples': 11108352, 'steps': 57855, 'loss/train': 1.018570065498352} -08/30/2021 23:36:37 - INFO - __main__ - Step 57857: {'lr': 0.00034392274893496903, 'samples': 11108544, 'steps': 57856, 'loss/train': 1.033927083015442} -08/30/2021 23:36:37 - INFO - __main__ - Step 57858: {'lr': 0.0003439178309150745, 'samples': 11108736, 'steps': 57857, 'loss/train': 1.6335034370422363} -08/30/2021 23:36:38 - INFO - __main__ - Step 57859: {'lr': 0.000343912912852862, 'samples': 11108928, 'steps': 57858, 'loss/train': 0.8771165013313293} -08/30/2021 23:36:38 - INFO - __main__ - Step 57860: {'lr': 0.00034390799474833385, 'samples': 11109120, 'steps': 57859, 'loss/train': 1.149033784866333} -08/30/2021 23:36:39 - INFO - __main__ - Step 57861: {'lr': 0.0003439030766014922, 'samples': 11109312, 'steps': 57860, 'loss/train': 1.5801451206207275} -08/30/2021 23:36:40 - INFO - __main__ - Step 57862: {'lr': 0.0003438981584123392, 'samples': 11109504, 'steps': 57861, 'loss/train': 1.4704382419586182} -08/30/2021 23:36:40 - INFO - __main__ - Step 57863: {'lr': 0.0003438932401808772, 'samples': 11109696, 'steps': 57862, 'loss/train': 1.1314772367477417} -08/30/2021 23:36:41 - INFO - __main__ - Step 57864: {'lr': 0.0003438883219071083, 'samples': 11109888, 'steps': 57863, 'loss/train': 1.182839035987854} -08/30/2021 23:36:41 - INFO - __main__ - Step 57865: {'lr': 0.00034388340359103485, 'samples': 11110080, 'steps': 57864, 'loss/train': 1.3338888883590698} -08/30/2021 23:36:43 - INFO - __main__ - Step 57866: {'lr': 0.0003438784852326589, 'samples': 11110272, 'steps': 57865, 'loss/train': 1.6208808422088623} -08/30/2021 23:36:43 - INFO - __main__ - Step 57867: {'lr': 0.0003438735668319828, 'samples': 11110464, 'steps': 57866, 'loss/train': 1.4217983484268188} -08/30/2021 23:36:43 - INFO - __main__ - Step 57868: {'lr': 0.00034386864838900877, 'samples': 11110656, 'steps': 57867, 'loss/train': 1.821641445159912} -08/30/2021 23:36:44 - INFO - __main__ - Step 57869: {'lr': 0.00034386372990373893, 'samples': 11110848, 'steps': 57868, 'loss/train': 1.2849440574645996} -08/30/2021 23:36:44 - INFO - __main__ - Step 57870: {'lr': 0.0003438588113761755, 'samples': 11111040, 'steps': 57869, 'loss/train': 1.7026925086975098} -08/30/2021 23:36:46 - INFO - __main__ - Step 57871: {'lr': 0.00034385389280632077, 'samples': 11111232, 'steps': 57870, 'loss/train': 1.6099143028259277} -08/30/2021 23:36:46 - INFO - __main__ - Step 57872: {'lr': 0.00034384897419417694, 'samples': 11111424, 'steps': 57871, 'loss/train': 0.5960713028907776} -08/30/2021 23:36:46 - INFO - __main__ - Step 57873: {'lr': 0.0003438440555397462, 'samples': 11111616, 'steps': 57872, 'loss/train': 2.930335760116577} -08/30/2021 23:36:47 - INFO - __main__ - Step 57874: {'lr': 0.00034383913684303075, 'samples': 11111808, 'steps': 57873, 'loss/train': 1.212746500968933} -08/30/2021 23:36:47 - INFO - __main__ - Step 57875: {'lr': 0.00034383421810403294, 'samples': 11112000, 'steps': 57874, 'loss/train': 1.3006385564804077} -08/30/2021 23:36:49 - INFO - __main__ - Step 57876: {'lr': 0.00034382929932275476, 'samples': 11112192, 'steps': 57875, 'loss/train': 1.3369630575180054} -08/30/2021 23:36:49 - INFO - __main__ - Step 57877: {'lr': 0.0003438243804991986, 'samples': 11112384, 'steps': 57876, 'loss/train': 1.265333890914917} -08/30/2021 23:36:50 - INFO - __main__ - Step 57878: {'lr': 0.0003438194616333666, 'samples': 11112576, 'steps': 57877, 'loss/train': 1.7464908361434937} -08/30/2021 23:36:50 - INFO - __main__ - Step 57879: {'lr': 0.00034381454272526096, 'samples': 11112768, 'steps': 57878, 'loss/train': 0.16650265455245972} -08/30/2021 23:36:50 - INFO - __main__ - Step 57880: {'lr': 0.000343809623774884, 'samples': 11112960, 'steps': 57879, 'loss/train': 1.6911827325820923} -08/30/2021 23:36:52 - INFO - __main__ - Step 57881: {'lr': 0.0003438047047822379, 'samples': 11113152, 'steps': 57880, 'loss/train': 0.08717140555381775} -08/30/2021 23:36:53 - INFO - __main__ - Step 57882: {'lr': 0.0003437997857473248, 'samples': 11113344, 'steps': 57881, 'loss/train': 0.9880353808403015} -08/30/2021 23:36:53 - INFO - __main__ - Step 57883: {'lr': 0.0003437948666701469, 'samples': 11113536, 'steps': 57882, 'loss/train': 1.7614012956619263} -08/30/2021 23:36:54 - INFO - __main__ - Step 57884: {'lr': 0.00034378994755070657, 'samples': 11113728, 'steps': 57883, 'loss/train': 1.565075159072876} -08/30/2021 23:36:54 - INFO - __main__ - Step 57885: {'lr': 0.00034378502838900587, 'samples': 11113920, 'steps': 57884, 'loss/train': 1.5057799816131592} -08/30/2021 23:36:54 - INFO - __main__ - Step 57886: {'lr': 0.00034378010918504714, 'samples': 11114112, 'steps': 57885, 'loss/train': 1.13325834274292} -08/30/2021 23:36:56 - INFO - __main__ - Step 57887: {'lr': 0.0003437751899388325, 'samples': 11114304, 'steps': 57886, 'loss/train': 1.3970110416412354} -08/30/2021 23:36:56 - INFO - __main__ - Step 57888: {'lr': 0.00034377027065036423, 'samples': 11114496, 'steps': 57887, 'loss/train': 1.3978787660598755} -08/30/2021 23:36:57 - INFO - __main__ - Step 57889: {'lr': 0.0003437653513196446, 'samples': 11114688, 'steps': 57888, 'loss/train': 1.4013556241989136} -08/30/2021 23:36:57 - INFO - __main__ - Step 57890: {'lr': 0.0003437604319466756, 'samples': 11114880, 'steps': 57889, 'loss/train': 1.4467740058898926} -08/30/2021 23:36:57 - INFO - __main__ - Step 57891: {'lr': 0.0003437555125314597, 'samples': 11115072, 'steps': 57890, 'loss/train': 1.6815907955169678} -08/30/2021 23:36:59 - INFO - __main__ - Step 57892: {'lr': 0.00034375059307399896, 'samples': 11115264, 'steps': 57891, 'loss/train': 1.770148754119873} -08/30/2021 23:36:59 - INFO - __main__ - Step 57893: {'lr': 0.00034374567357429563, 'samples': 11115456, 'steps': 57892, 'loss/train': 1.8611518144607544} -08/30/2021 23:37:00 - INFO - __main__ - Step 57894: {'lr': 0.000343740754032352, 'samples': 11115648, 'steps': 57893, 'loss/train': 1.2542556524276733} -08/30/2021 23:37:00 - INFO - __main__ - Step 57895: {'lr': 0.00034373583444817024, 'samples': 11115840, 'steps': 57894, 'loss/train': 1.2793387174606323} -08/30/2021 23:37:00 - INFO - __main__ - Step 57896: {'lr': 0.0003437309148217526, 'samples': 11116032, 'steps': 57895, 'loss/train': 1.2916450500488281} -08/30/2021 23:37:02 - INFO - __main__ - Step 57897: {'lr': 0.00034372599515310117, 'samples': 11116224, 'steps': 57896, 'loss/train': 0.9101265668869019} -08/30/2021 23:37:03 - INFO - __main__ - Step 57898: {'lr': 0.00034372107544221824, 'samples': 11116416, 'steps': 57897, 'loss/train': 1.8328304290771484} -08/30/2021 23:37:03 - INFO - __main__ - Step 57899: {'lr': 0.00034371615568910607, 'samples': 11116608, 'steps': 57898, 'loss/train': 1.337120771408081} -08/30/2021 23:37:03 - INFO - __main__ - Step 57900: {'lr': 0.00034371123589376683, 'samples': 11116800, 'steps': 57899, 'loss/train': 0.08235103636980057} -08/30/2021 23:37:04 - INFO - __main__ - Step 57901: {'lr': 0.00034370631605620285, 'samples': 11116992, 'steps': 57900, 'loss/train': 1.3802589178085327} -08/30/2021 23:37:05 - INFO - __main__ - Step 57902: {'lr': 0.0003437013961764162, 'samples': 11117184, 'steps': 57901, 'loss/train': 1.0558006763458252} -08/30/2021 23:37:06 - INFO - __main__ - Step 57903: {'lr': 0.00034369647625440906, 'samples': 11117376, 'steps': 57902, 'loss/train': 1.6199114322662354} -08/30/2021 23:37:06 - INFO - __main__ - Step 57904: {'lr': 0.00034369155629018376, 'samples': 11117568, 'steps': 57903, 'loss/train': 2.112682342529297} -08/30/2021 23:37:06 - INFO - __main__ - Step 57905: {'lr': 0.00034368663628374255, 'samples': 11117760, 'steps': 57904, 'loss/train': 1.5754579305648804} -08/30/2021 23:37:07 - INFO - __main__ - Step 57906: {'lr': 0.0003436817162350876, 'samples': 11117952, 'steps': 57905, 'loss/train': 1.8452544212341309} -08/30/2021 23:37:07 - INFO - __main__ - Step 57907: {'lr': 0.00034367679614422103, 'samples': 11118144, 'steps': 57906, 'loss/train': 1.4249106645584106} -08/30/2021 23:37:08 - INFO - __main__ - Step 57908: {'lr': 0.0003436718760111452, 'samples': 11118336, 'steps': 57907, 'loss/train': 1.1053876876831055} -08/30/2021 23:37:09 - INFO - __main__ - Step 57909: {'lr': 0.0003436669558358623, 'samples': 11118528, 'steps': 57908, 'loss/train': 1.2126071453094482} -08/30/2021 23:37:09 - INFO - __main__ - Step 57910: {'lr': 0.00034366203561837446, 'samples': 11118720, 'steps': 57909, 'loss/train': 0.7809210419654846} -08/30/2021 23:37:10 - INFO - __main__ - Step 57911: {'lr': 0.00034365711535868396, 'samples': 11118912, 'steps': 57910, 'loss/train': 1.4636561870574951} -08/30/2021 23:37:10 - INFO - __main__ - Step 57912: {'lr': 0.000343652195056793, 'samples': 11119104, 'steps': 57911, 'loss/train': 1.1502405405044556} -08/30/2021 23:37:11 - INFO - __main__ - Step 57913: {'lr': 0.0003436472747127038, 'samples': 11119296, 'steps': 57912, 'loss/train': 1.3437775373458862} -08/30/2021 23:37:12 - INFO - __main__ - Step 57914: {'lr': 0.0003436423543264186, 'samples': 11119488, 'steps': 57913, 'loss/train': 0.23785971105098724} -08/30/2021 23:37:12 - INFO - __main__ - Step 57915: {'lr': 0.00034363743389793965, 'samples': 11119680, 'steps': 57914, 'loss/train': 1.0402017831802368} -08/30/2021 23:37:13 - INFO - __main__ - Step 57916: {'lr': 0.0003436325134272691, 'samples': 11119872, 'steps': 57915, 'loss/train': 0.9781309366226196} -08/30/2021 23:37:13 - INFO - __main__ - Step 57917: {'lr': 0.0003436275929144091, 'samples': 11120064, 'steps': 57916, 'loss/train': 1.1634918451309204} -08/30/2021 23:37:15 - INFO - __main__ - Step 57918: {'lr': 0.000343622672359362, 'samples': 11120256, 'steps': 57917, 'loss/train': 1.6962443590164185} -08/30/2021 23:37:15 - INFO - __main__ - Step 57919: {'lr': 0.0003436177517621299, 'samples': 11120448, 'steps': 57918, 'loss/train': 0.9304451942443848} -08/30/2021 23:37:15 - INFO - __main__ - Step 57920: {'lr': 0.0003436128311227152, 'samples': 11120640, 'steps': 57919, 'loss/train': 1.8049160242080688} -08/30/2021 23:37:16 - INFO - __main__ - Step 57921: {'lr': 0.00034360791044111996, 'samples': 11120832, 'steps': 57920, 'loss/train': 0.9886671304702759} -08/30/2021 23:37:16 - INFO - __main__ - Step 57922: {'lr': 0.00034360298971734647, 'samples': 11121024, 'steps': 57921, 'loss/train': 1.065738320350647} -08/30/2021 23:37:17 - INFO - __main__ - Step 57923: {'lr': 0.00034359806895139686, 'samples': 11121216, 'steps': 57922, 'loss/train': 0.43623223900794983} -08/30/2021 23:37:18 - INFO - __main__ - Step 57924: {'lr': 0.0003435931481432735, 'samples': 11121408, 'steps': 57923, 'loss/train': 1.290938138961792} -08/30/2021 23:37:18 - INFO - __main__ - Step 57925: {'lr': 0.00034358822729297847, 'samples': 11121600, 'steps': 57924, 'loss/train': 1.566215991973877} -08/30/2021 23:37:19 - INFO - __main__ - Step 57926: {'lr': 0.00034358330640051396, 'samples': 11121792, 'steps': 57925, 'loss/train': 2.0767035484313965} -08/30/2021 23:37:19 - INFO - __main__ - Step 57927: {'lr': 0.0003435783854658823, 'samples': 11121984, 'steps': 57926, 'loss/train': 0.6464002728462219} -08/30/2021 23:37:21 - INFO - __main__ - Step 57928: {'lr': 0.00034357346448908566, 'samples': 11122176, 'steps': 57927, 'loss/train': 0.6116719245910645} -08/30/2021 23:37:21 - INFO - __main__ - Step 57929: {'lr': 0.00034356854347012626, 'samples': 11122368, 'steps': 57928, 'loss/train': 0.2873060703277588} -08/30/2021 23:37:22 - INFO - __main__ - Step 57930: {'lr': 0.00034356362240900635, 'samples': 11122560, 'steps': 57929, 'loss/train': 1.1154003143310547} -08/30/2021 23:37:22 - INFO - __main__ - Step 57931: {'lr': 0.0003435587013057281, 'samples': 11122752, 'steps': 57930, 'loss/train': 1.5685776472091675} -08/30/2021 23:37:22 - INFO - __main__ - Step 57932: {'lr': 0.0003435537801602937, 'samples': 11122944, 'steps': 57931, 'loss/train': 1.1144810914993286} -08/30/2021 23:37:23 - INFO - __main__ - Step 57933: {'lr': 0.00034354885897270546, 'samples': 11123136, 'steps': 57932, 'loss/train': 1.18936288356781} -08/30/2021 23:37:24 - INFO - __main__ - Step 57934: {'lr': 0.0003435439377429655, 'samples': 11123328, 'steps': 57933, 'loss/train': 1.4783251285552979} -08/30/2021 23:37:25 - INFO - __main__ - Step 57935: {'lr': 0.00034353901647107615, 'samples': 11123520, 'steps': 57934, 'loss/train': 1.7091912031173706} -08/30/2021 23:37:25 - INFO - __main__ - Step 57936: {'lr': 0.0003435340951570395, 'samples': 11123712, 'steps': 57935, 'loss/train': 0.7045174241065979} -08/30/2021 23:37:25 - INFO - __main__ - Step 57937: {'lr': 0.00034352917380085784, 'samples': 11123904, 'steps': 57936, 'loss/train': 0.8868584632873535} -08/30/2021 23:37:26 - INFO - __main__ - Step 57938: {'lr': 0.00034352425240253344, 'samples': 11124096, 'steps': 57937, 'loss/train': 1.1050552129745483} -08/30/2021 23:37:28 - INFO - __main__ - Step 57939: {'lr': 0.0003435193309620684, 'samples': 11124288, 'steps': 57938, 'loss/train': 0.7417891025543213} -08/30/2021 23:37:29 - INFO - __main__ - Step 57940: {'lr': 0.000343514409479465, 'samples': 11124480, 'steps': 57939, 'loss/train': 0.11086741089820862} -08/30/2021 23:37:29 - INFO - __main__ - Step 57941: {'lr': 0.00034350948795472543, 'samples': 11124672, 'steps': 57940, 'loss/train': 1.1636950969696045} -08/30/2021 23:37:29 - INFO - __main__ - Step 57942: {'lr': 0.000343504566387852, 'samples': 11124864, 'steps': 57941, 'loss/train': 1.2470804452896118} -08/30/2021 23:37:30 - INFO - __main__ - Step 57943: {'lr': 0.0003434996447788468, 'samples': 11125056, 'steps': 57942, 'loss/train': 0.9283044934272766} -08/30/2021 23:37:31 - INFO - __main__ - Step 57944: {'lr': 0.0003434947231277121, 'samples': 11125248, 'steps': 57943, 'loss/train': 0.2703121304512024} -08/30/2021 23:37:32 - INFO - __main__ - Step 57945: {'lr': 0.0003434898014344501, 'samples': 11125440, 'steps': 57944, 'loss/train': 1.449692726135254} -08/30/2021 23:37:32 - INFO - __main__ - Step 57946: {'lr': 0.00034348487969906307, 'samples': 11125632, 'steps': 57945, 'loss/train': 0.9957125186920166} -08/30/2021 23:37:32 - INFO - __main__ - Step 57947: {'lr': 0.00034347995792155316, 'samples': 11125824, 'steps': 57946, 'loss/train': 0.34559452533721924} -08/30/2021 23:37:33 - INFO - __main__ - Step 57948: {'lr': 0.00034347503610192265, 'samples': 11126016, 'steps': 57947, 'loss/train': 0.7299861907958984} -08/30/2021 23:37:34 - INFO - __main__ - Step 57949: {'lr': 0.0003434701142401738, 'samples': 11126208, 'steps': 57948, 'loss/train': 1.3295950889587402} -08/30/2021 23:37:35 - INFO - __main__ - Step 57950: {'lr': 0.0003434651923363087, 'samples': 11126400, 'steps': 57949, 'loss/train': 1.3353164196014404} -08/30/2021 23:37:35 - INFO - __main__ - Step 57951: {'lr': 0.0003434602703903296, 'samples': 11126592, 'steps': 57950, 'loss/train': 1.6220121383666992} -08/30/2021 23:37:35 - INFO - __main__ - Step 57952: {'lr': 0.0003434553484022388, 'samples': 11126784, 'steps': 57951, 'loss/train': 1.4216296672821045} -08/30/2021 23:37:36 - INFO - __main__ - Step 57953: {'lr': 0.0003434504263720384, 'samples': 11126976, 'steps': 57952, 'loss/train': 1.7862017154693604} -08/30/2021 23:37:36 - INFO - __main__ - Step 57954: {'lr': 0.0003434455042997307, 'samples': 11127168, 'steps': 57953, 'loss/train': 1.262322187423706} -08/30/2021 23:37:38 - INFO - __main__ - Step 57955: {'lr': 0.00034344058218531794, 'samples': 11127360, 'steps': 57954, 'loss/train': 1.8173655271530151} -08/30/2021 23:37:38 - INFO - __main__ - Step 57956: {'lr': 0.0003434356600288023, 'samples': 11127552, 'steps': 57955, 'loss/train': 1.0475902557373047} -08/30/2021 23:37:38 - INFO - __main__ - Step 57957: {'lr': 0.00034343073783018593, 'samples': 11127744, 'steps': 57956, 'loss/train': 1.4100340604782104} -08/30/2021 23:37:39 - INFO - __main__ - Step 57958: {'lr': 0.00034342581558947113, 'samples': 11127936, 'steps': 57957, 'loss/train': 1.584753155708313} -08/30/2021 23:37:39 - INFO - __main__ - Step 57959: {'lr': 0.00034342089330666, 'samples': 11128128, 'steps': 57958, 'loss/train': 1.344902515411377} -08/30/2021 23:37:41 - INFO - __main__ - Step 57960: {'lr': 0.00034341597098175503, 'samples': 11128320, 'steps': 57959, 'loss/train': 0.5916837453842163} -08/30/2021 23:37:41 - INFO - __main__ - Step 57961: {'lr': 0.0003434110486147582, 'samples': 11128512, 'steps': 57960, 'loss/train': 1.376560926437378} -08/30/2021 23:37:41 - INFO - __main__ - Step 57962: {'lr': 0.0003434061262056718, 'samples': 11128704, 'steps': 57961, 'loss/train': 0.968560516834259} -08/30/2021 23:37:42 - INFO - __main__ - Step 57963: {'lr': 0.0003434012037544981, 'samples': 11128896, 'steps': 57962, 'loss/train': 0.9626744985580444} -08/30/2021 23:37:42 - INFO - __main__ - Step 57964: {'lr': 0.0003433962812612391, 'samples': 11129088, 'steps': 57963, 'loss/train': 1.3924027681350708} -08/30/2021 23:37:44 - INFO - __main__ - Step 57965: {'lr': 0.0003433913587258973, 'samples': 11129280, 'steps': 57964, 'loss/train': 1.6076587438583374} -08/30/2021 23:37:44 - INFO - __main__ - Step 57966: {'lr': 0.0003433864361484748, 'samples': 11129472, 'steps': 57965, 'loss/train': 0.9695044755935669} -08/30/2021 23:37:44 - INFO - __main__ - Step 57967: {'lr': 0.00034338151352897376, 'samples': 11129664, 'steps': 57966, 'loss/train': 1.0120548009872437} -08/30/2021 23:37:45 - INFO - __main__ - Step 57968: {'lr': 0.00034337659086739646, 'samples': 11129856, 'steps': 57967, 'loss/train': 0.5006092190742493} -08/30/2021 23:37:45 - INFO - __main__ - Step 57969: {'lr': 0.0003433716681637451, 'samples': 11130048, 'steps': 57968, 'loss/train': 0.7030481696128845} -08/30/2021 23:37:47 - INFO - __main__ - Step 57970: {'lr': 0.0003433667454180219, 'samples': 11130240, 'steps': 57969, 'loss/train': 1.6818792819976807} -08/30/2021 23:37:47 - INFO - __main__ - Step 57971: {'lr': 0.00034336182263022916, 'samples': 11130432, 'steps': 57970, 'loss/train': 1.3140954971313477} -08/30/2021 23:37:47 - INFO - __main__ - Step 57972: {'lr': 0.000343356899800369, 'samples': 11130624, 'steps': 57971, 'loss/train': 2.077301263809204} -08/30/2021 23:37:48 - INFO - __main__ - Step 57973: {'lr': 0.0003433519769284436, 'samples': 11130816, 'steps': 57972, 'loss/train': 1.0022573471069336} -08/30/2021 23:37:48 - INFO - __main__ - Step 57974: {'lr': 0.00034334705401445527, 'samples': 11131008, 'steps': 57973, 'loss/train': 0.963807225227356} -08/30/2021 23:37:48 - INFO - __main__ - Step 57975: {'lr': 0.00034334213105840616, 'samples': 11131200, 'steps': 57974, 'loss/train': 1.4510246515274048} -08/30/2021 23:37:50 - INFO - __main__ - Step 57976: {'lr': 0.00034333720806029863, 'samples': 11131392, 'steps': 57975, 'loss/train': 0.7574708461761475} -08/30/2021 23:37:51 - INFO - __main__ - Step 57977: {'lr': 0.00034333228502013473, 'samples': 11131584, 'steps': 57976, 'loss/train': 1.8057149648666382} -08/30/2021 23:37:51 - INFO - __main__ - Step 57978: {'lr': 0.00034332736193791675, 'samples': 11131776, 'steps': 57977, 'loss/train': 0.050422124564647675} -08/30/2021 23:37:51 - INFO - __main__ - Step 57979: {'lr': 0.0003433224388136469, 'samples': 11131968, 'steps': 57978, 'loss/train': 1.2794603109359741} -08/30/2021 23:37:52 - INFO - __main__ - Step 57980: {'lr': 0.0003433175156473274, 'samples': 11132160, 'steps': 57979, 'loss/train': 0.64133620262146} -08/30/2021 23:37:53 - INFO - __main__ - Step 57981: {'lr': 0.0003433125924389604, 'samples': 11132352, 'steps': 57980, 'loss/train': 0.9147558808326721} -08/30/2021 23:37:54 - INFO - __main__ - Step 57982: {'lr': 0.00034330766918854827, 'samples': 11132544, 'steps': 57981, 'loss/train': 1.220578908920288} -08/30/2021 23:37:54 - INFO - __main__ - Step 57983: {'lr': 0.0003433027458960932, 'samples': 11132736, 'steps': 57982, 'loss/train': 0.924926221370697} -08/30/2021 23:37:54 - INFO - __main__ - Step 57984: {'lr': 0.00034329782256159724, 'samples': 11132928, 'steps': 57983, 'loss/train': 0.9357183575630188} -08/30/2021 23:37:55 - INFO - __main__ - Step 57985: {'lr': 0.00034329289918506276, 'samples': 11133120, 'steps': 57984, 'loss/train': 0.48311126232147217} -08/30/2021 23:37:56 - INFO - __main__ - Step 57986: {'lr': 0.0003432879757664919, 'samples': 11133312, 'steps': 57985, 'loss/train': 1.353756070137024} -08/30/2021 23:37:57 - INFO - __main__ - Step 57987: {'lr': 0.00034328305230588694, 'samples': 11133504, 'steps': 57986, 'loss/train': 1.4232285022735596} -08/30/2021 23:37:57 - INFO - __main__ - Step 57988: {'lr': 0.0003432781288032501, 'samples': 11133696, 'steps': 57987, 'loss/train': 1.144094467163086} -08/30/2021 23:37:57 - INFO - __main__ - Step 57989: {'lr': 0.00034327320525858357, 'samples': 11133888, 'steps': 57988, 'loss/train': 1.37705659866333} -08/30/2021 23:37:58 - INFO - __main__ - Step 57990: {'lr': 0.00034326828167188957, 'samples': 11134080, 'steps': 57989, 'loss/train': 1.6144942045211792} -08/30/2021 23:38:00 - INFO - __main__ - Step 57991: {'lr': 0.0003432633580431703, 'samples': 11134272, 'steps': 57990, 'loss/train': 0.28187695145606995} -08/30/2021 23:38:00 - INFO - __main__ - Step 57992: {'lr': 0.00034325843437242804, 'samples': 11134464, 'steps': 57991, 'loss/train': 1.456911325454712} -08/30/2021 23:38:01 - INFO - __main__ - Step 57993: {'lr': 0.0003432535106596649, 'samples': 11134656, 'steps': 57992, 'loss/train': 1.2609857320785522} -08/30/2021 23:38:01 - INFO - __main__ - Step 57994: {'lr': 0.00034324858690488324, 'samples': 11134848, 'steps': 57993, 'loss/train': 1.2759424448013306} -08/30/2021 23:38:01 - INFO - __main__ - Step 57995: {'lr': 0.0003432436631080851, 'samples': 11135040, 'steps': 57994, 'loss/train': 0.049883775413036346} -08/30/2021 23:38:03 - INFO - __main__ - Step 57996: {'lr': 0.00034323873926927296, 'samples': 11135232, 'steps': 57995, 'loss/train': 1.5175528526306152} -08/30/2021 23:38:04 - INFO - __main__ - Step 57997: {'lr': 0.00034323381538844884, 'samples': 11135424, 'steps': 57996, 'loss/train': 1.4376996755599976} -08/30/2021 23:38:04 - INFO - __main__ - Step 57998: {'lr': 0.0003432288914656149, 'samples': 11135616, 'steps': 57997, 'loss/train': 1.3499665260314941} -08/30/2021 23:38:04 - INFO - __main__ - Step 57999: {'lr': 0.00034322396750077354, 'samples': 11135808, 'steps': 57998, 'loss/train': 0.4412687420845032} -08/30/2021 23:38:05 - INFO - __main__ - Step 58000: {'lr': 0.0003432190434939269, 'samples': 11136000, 'steps': 57999, 'loss/train': 0.8755688071250916} -08/30/2021 23:38:05 - INFO - __main__ - Step 58001: {'lr': 0.0003432141194450772, 'samples': 11136192, 'steps': 58000, 'loss/train': 1.8476886749267578} -08/30/2021 23:38:06 - INFO - __main__ - Step 58002: {'lr': 0.0003432091953542267, 'samples': 11136384, 'steps': 58001, 'loss/train': 1.8664937019348145} -08/30/2021 23:38:07 - INFO - __main__ - Step 58003: {'lr': 0.00034320427122137745, 'samples': 11136576, 'steps': 58002, 'loss/train': 1.1659661531448364} -08/30/2021 23:38:07 - INFO - __main__ - Step 58004: {'lr': 0.0003431993470465319, 'samples': 11136768, 'steps': 58003, 'loss/train': 1.7013026475906372} -08/30/2021 23:38:08 - INFO - __main__ - Step 58005: {'lr': 0.00034319442282969206, 'samples': 11136960, 'steps': 58004, 'loss/train': 1.0599287748336792} -08/30/2021 23:38:08 - INFO - __main__ - Step 58006: {'lr': 0.0003431894985708603, 'samples': 11137152, 'steps': 58005, 'loss/train': 0.33406367897987366} -08/30/2021 23:38:10 - INFO - __main__ - Step 58007: {'lr': 0.0003431845742700388, 'samples': 11137344, 'steps': 58006, 'loss/train': 1.542755365371704} -08/30/2021 23:38:10 - INFO - __main__ - Step 58008: {'lr': 0.00034317964992722975, 'samples': 11137536, 'steps': 58007, 'loss/train': 1.7368049621582031} -08/30/2021 23:38:10 - INFO - __main__ - Step 58009: {'lr': 0.00034317472554243545, 'samples': 11137728, 'steps': 58008, 'loss/train': 1.5427500009536743} -08/30/2021 23:38:11 - INFO - __main__ - Step 58010: {'lr': 0.00034316980111565796, 'samples': 11137920, 'steps': 58009, 'loss/train': 0.0430852472782135} -08/30/2021 23:38:11 - INFO - __main__ - Step 58011: {'lr': 0.00034316487664689974, 'samples': 11138112, 'steps': 58010, 'loss/train': 0.23498308658599854} -08/30/2021 23:38:13 - INFO - __main__ - Step 58012: {'lr': 0.00034315995213616266, 'samples': 11138304, 'steps': 58011, 'loss/train': 1.2453813552856445} -08/30/2021 23:38:13 - INFO - __main__ - Step 58013: {'lr': 0.0003431550275834493, 'samples': 11138496, 'steps': 58012, 'loss/train': 1.4866456985473633} -08/30/2021 23:38:13 - INFO - __main__ - Step 58014: {'lr': 0.0003431501029887617, 'samples': 11138688, 'steps': 58013, 'loss/train': 0.29162171483039856} -08/30/2021 23:38:14 - INFO - __main__ - Step 58015: {'lr': 0.00034314517835210207, 'samples': 11138880, 'steps': 58014, 'loss/train': 1.2801259756088257} -08/30/2021 23:38:14 - INFO - __main__ - Step 58016: {'lr': 0.00034314025367347266, 'samples': 11139072, 'steps': 58015, 'loss/train': 1.3407461643218994} -08/30/2021 23:38:15 - INFO - __main__ - Step 58017: {'lr': 0.00034313532895287574, 'samples': 11139264, 'steps': 58016, 'loss/train': 1.511190414428711} -08/30/2021 23:38:16 - INFO - __main__ - Step 58018: {'lr': 0.00034313040419031336, 'samples': 11139456, 'steps': 58017, 'loss/train': 1.372041940689087} -08/30/2021 23:38:16 - INFO - __main__ - Step 58019: {'lr': 0.00034312547938578796, 'samples': 11139648, 'steps': 58018, 'loss/train': 0.784022331237793} -08/30/2021 23:38:17 - INFO - __main__ - Step 58020: {'lr': 0.0003431205545393016, 'samples': 11139840, 'steps': 58019, 'loss/train': 0.9925459027290344} -08/30/2021 23:38:17 - INFO - __main__ - Step 58021: {'lr': 0.00034311562965085664, 'samples': 11140032, 'steps': 58020, 'loss/train': 0.5568354725837708} -08/30/2021 23:38:19 - INFO - __main__ - Step 58022: {'lr': 0.0003431107047204552, 'samples': 11140224, 'steps': 58021, 'loss/train': 1.1519273519515991} -08/30/2021 23:38:19 - INFO - __main__ - Step 58023: {'lr': 0.00034310577974809944, 'samples': 11140416, 'steps': 58022, 'loss/train': 0.3109199106693268} -08/30/2021 23:38:20 - INFO - __main__ - Step 58024: {'lr': 0.0003431008547337917, 'samples': 11140608, 'steps': 58023, 'loss/train': 1.9225962162017822} -08/30/2021 23:38:20 - INFO - __main__ - Step 58025: {'lr': 0.0003430959296775341, 'samples': 11140800, 'steps': 58024, 'loss/train': 1.2298303842544556} -08/30/2021 23:38:20 - INFO - __main__ - Step 58026: {'lr': 0.00034309100457932895, 'samples': 11140992, 'steps': 58025, 'loss/train': 1.7570264339447021} -08/30/2021 23:38:22 - INFO - __main__ - Step 58027: {'lr': 0.0003430860794391784, 'samples': 11141184, 'steps': 58026, 'loss/train': 1.6850838661193848} -08/30/2021 23:38:22 - INFO - __main__ - Step 58028: {'lr': 0.00034308115425708477, 'samples': 11141376, 'steps': 58027, 'loss/train': 1.1719732284545898} -08/30/2021 23:38:23 - INFO - __main__ - Step 58029: {'lr': 0.0003430762290330501, 'samples': 11141568, 'steps': 58028, 'loss/train': 1.4778354167938232} -08/30/2021 23:38:23 - INFO - __main__ - Step 58030: {'lr': 0.00034307130376707684, 'samples': 11141760, 'steps': 58029, 'loss/train': 0.5399166345596313} -08/30/2021 23:38:23 - INFO - __main__ - Step 58031: {'lr': 0.000343066378459167, 'samples': 11141952, 'steps': 58030, 'loss/train': 0.8089847564697266} -08/30/2021 23:38:25 - INFO - __main__ - Step 58032: {'lr': 0.00034306145310932293, 'samples': 11142144, 'steps': 58031, 'loss/train': 1.3842999935150146} -08/30/2021 23:38:25 - INFO - __main__ - Step 58033: {'lr': 0.0003430565277175468, 'samples': 11142336, 'steps': 58032, 'loss/train': 2.5330135822296143} -08/30/2021 23:38:26 - INFO - __main__ - Step 58034: {'lr': 0.0003430516022838408, 'samples': 11142528, 'steps': 58033, 'loss/train': 1.1577410697937012} -08/30/2021 23:38:26 - INFO - __main__ - Step 58035: {'lr': 0.00034304667680820714, 'samples': 11142720, 'steps': 58034, 'loss/train': 1.5663037300109863} -08/30/2021 23:38:26 - INFO - __main__ - Step 58036: {'lr': 0.0003430417512906482, 'samples': 11142912, 'steps': 58035, 'loss/train': 0.8629599213600159} -08/30/2021 23:38:28 - INFO - __main__ - Step 58037: {'lr': 0.0003430368257311661, 'samples': 11143104, 'steps': 58036, 'loss/train': 0.31418338418006897} -08/30/2021 23:38:28 - INFO - __main__ - Step 58038: {'lr': 0.0003430319001297629, 'samples': 11143296, 'steps': 58037, 'loss/train': 1.5538597106933594} -08/30/2021 23:38:29 - INFO - __main__ - Step 58039: {'lr': 0.00034302697448644105, 'samples': 11143488, 'steps': 58038, 'loss/train': 1.2497516870498657} -08/30/2021 23:38:29 - INFO - __main__ - Step 58040: {'lr': 0.00034302204880120267, 'samples': 11143680, 'steps': 58039, 'loss/train': 1.4606926441192627} -08/30/2021 23:38:29 - INFO - __main__ - Step 58041: {'lr': 0.00034301712307404996, 'samples': 11143872, 'steps': 58040, 'loss/train': 0.864867091178894} -08/30/2021 23:38:30 - INFO - __main__ - Step 58042: {'lr': 0.00034301219730498524, 'samples': 11144064, 'steps': 58041, 'loss/train': 1.0711973905563354} -08/30/2021 23:38:32 - INFO - __main__ - Step 58043: {'lr': 0.00034300727149401064, 'samples': 11144256, 'steps': 58042, 'loss/train': 1.1949002742767334} -08/30/2021 23:38:32 - INFO - __main__ - Step 58044: {'lr': 0.00034300234564112837, 'samples': 11144448, 'steps': 58043, 'loss/train': 0.9533157348632812} -08/30/2021 23:38:33 - INFO - __main__ - Step 58045: {'lr': 0.0003429974197463407, 'samples': 11144640, 'steps': 58044, 'loss/train': 1.811410665512085} -08/30/2021 23:38:33 - INFO - __main__ - Step 58046: {'lr': 0.00034299249380964977, 'samples': 11144832, 'steps': 58045, 'loss/train': 1.1357166767120361} -08/30/2021 23:38:33 - INFO - __main__ - Step 58047: {'lr': 0.0003429875678310579, 'samples': 11145024, 'steps': 58046, 'loss/train': 0.8524813652038574} -08/30/2021 23:38:34 - INFO - __main__ - Step 58048: {'lr': 0.0003429826418105673, 'samples': 11145216, 'steps': 58047, 'loss/train': 0.9991881847381592} -08/30/2021 23:38:35 - INFO - __main__ - Step 58049: {'lr': 0.0003429777157481801, 'samples': 11145408, 'steps': 58048, 'loss/train': 0.9006020426750183} -08/30/2021 23:38:36 - INFO - __main__ - Step 58050: {'lr': 0.0003429727896438986, 'samples': 11145600, 'steps': 58049, 'loss/train': 1.8354930877685547} -08/30/2021 23:38:36 - INFO - __main__ - Step 58051: {'lr': 0.00034296786349772494, 'samples': 11145792, 'steps': 58050, 'loss/train': 1.11492121219635} -08/30/2021 23:38:37 - INFO - __main__ - Step 58052: {'lr': 0.0003429629373096615, 'samples': 11145984, 'steps': 58051, 'loss/train': 0.3116246163845062} -08/30/2021 23:38:37 - INFO - __main__ - Step 58053: {'lr': 0.0003429580110797103, 'samples': 11146176, 'steps': 58052, 'loss/train': 0.9807584881782532} -08/30/2021 23:38:38 - INFO - __main__ - Step 58054: {'lr': 0.0003429530848078737, 'samples': 11146368, 'steps': 58053, 'loss/train': 0.9870104193687439} -08/30/2021 23:38:39 - INFO - __main__ - Step 58055: {'lr': 0.0003429481584941538, 'samples': 11146560, 'steps': 58054, 'loss/train': 1.261991262435913} -08/30/2021 23:38:39 - INFO - __main__ - Step 58056: {'lr': 0.0003429432321385531, 'samples': 11146752, 'steps': 58055, 'loss/train': 0.07171699404716492} -08/30/2021 23:38:40 - INFO - __main__ - Step 58057: {'lr': 0.00034293830574107345, 'samples': 11146944, 'steps': 58056, 'loss/train': 1.0180670022964478} -08/30/2021 23:38:40 - INFO - __main__ - Step 58058: {'lr': 0.0003429333793017173, 'samples': 11147136, 'steps': 58057, 'loss/train': 0.8893603086471558} -08/30/2021 23:38:42 - INFO - __main__ - Step 58059: {'lr': 0.00034292845282048667, 'samples': 11147328, 'steps': 58058, 'loss/train': 1.1295841932296753} -08/30/2021 23:38:42 - INFO - __main__ - Step 58060: {'lr': 0.00034292352629738406, 'samples': 11147520, 'steps': 58059, 'loss/train': 0.6821733713150024} -08/30/2021 23:38:42 - INFO - __main__ - Step 58061: {'lr': 0.00034291859973241146, 'samples': 11147712, 'steps': 58060, 'loss/train': 1.295778751373291} -08/30/2021 23:38:43 - INFO - __main__ - Step 58062: {'lr': 0.0003429136731255712, 'samples': 11147904, 'steps': 58061, 'loss/train': 1.119515299797058} -08/30/2021 23:38:43 - INFO - __main__ - Step 58063: {'lr': 0.0003429087464768655, 'samples': 11148096, 'steps': 58062, 'loss/train': 4.730381488800049} -08/30/2021 23:38:45 - INFO - __main__ - Step 58064: {'lr': 0.00034290381978629655, 'samples': 11148288, 'steps': 58063, 'loss/train': 1.125172734260559} -08/30/2021 23:38:45 - INFO - __main__ - Step 58065: {'lr': 0.00034289889305386654, 'samples': 11148480, 'steps': 58064, 'loss/train': 1.5220035314559937} -08/30/2021 23:38:45 - INFO - __main__ - Step 58066: {'lr': 0.0003428939662795777, 'samples': 11148672, 'steps': 58065, 'loss/train': 1.163615107536316} -08/30/2021 23:38:46 - INFO - __main__ - Step 58067: {'lr': 0.0003428890394634323, 'samples': 11148864, 'steps': 58066, 'loss/train': 1.710109829902649} -08/30/2021 23:38:46 - INFO - __main__ - Step 58068: {'lr': 0.0003428841126054326, 'samples': 11149056, 'steps': 58067, 'loss/train': 1.0260673761367798} -08/30/2021 23:38:48 - INFO - __main__ - Step 58069: {'lr': 0.0003428791857055806, 'samples': 11149248, 'steps': 58068, 'loss/train': 1.0518882274627686} -08/30/2021 23:38:48 - INFO - __main__ - Step 58070: {'lr': 0.0003428742587638788, 'samples': 11149440, 'steps': 58069, 'loss/train': 1.4251055717468262} -08/30/2021 23:38:48 - INFO - __main__ - Step 58071: {'lr': 0.0003428693317803293, 'samples': 11149632, 'steps': 58070, 'loss/train': 1.4703441858291626} -08/30/2021 23:38:49 - INFO - __main__ - Step 58072: {'lr': 0.00034286440475493423, 'samples': 11149824, 'steps': 58071, 'loss/train': 0.5448579788208008} -08/30/2021 23:38:49 - INFO - __main__ - Step 58073: {'lr': 0.0003428594776876959, 'samples': 11150016, 'steps': 58072, 'loss/train': 1.0383001565933228} -08/30/2021 23:38:51 - INFO - __main__ - Step 58074: {'lr': 0.0003428545505786166, 'samples': 11150208, 'steps': 58073, 'loss/train': 1.2746344804763794} -08/30/2021 23:38:51 - INFO - __main__ - Step 58075: {'lr': 0.0003428496234276984, 'samples': 11150400, 'steps': 58074, 'loss/train': 1.3985235691070557} -08/30/2021 23:38:51 - INFO - __main__ - Step 58076: {'lr': 0.0003428446962349437, 'samples': 11150592, 'steps': 58075, 'loss/train': 1.4720648527145386} -08/30/2021 23:38:52 - INFO - __main__ - Step 58077: {'lr': 0.0003428397690003545, 'samples': 11150784, 'steps': 58076, 'loss/train': 1.631380558013916} -08/30/2021 23:38:52 - INFO - __main__ - Step 58078: {'lr': 0.00034283484172393315, 'samples': 11150976, 'steps': 58077, 'loss/train': 2.1027185916900635} -08/30/2021 23:38:52 - INFO - __main__ - Step 58079: {'lr': 0.0003428299144056818, 'samples': 11151168, 'steps': 58078, 'loss/train': 1.1716820001602173} -08/30/2021 23:38:54 - INFO - __main__ - Step 58080: {'lr': 0.00034282498704560284, 'samples': 11151360, 'steps': 58079, 'loss/train': 1.6995404958724976} -08/30/2021 23:38:54 - INFO - __main__ - Step 58081: {'lr': 0.0003428200596436983, 'samples': 11151552, 'steps': 58080, 'loss/train': 0.9309347867965698} -08/30/2021 23:38:55 - INFO - __main__ - Step 58082: {'lr': 0.00034281513219997054, 'samples': 11151744, 'steps': 58081, 'loss/train': 1.289864182472229} -08/30/2021 23:38:55 - INFO - __main__ - Step 58083: {'lr': 0.0003428102047144217, 'samples': 11151936, 'steps': 58082, 'loss/train': 1.2866483926773071} -08/30/2021 23:38:55 - INFO - __main__ - Step 58084: {'lr': 0.00034280527718705397, 'samples': 11152128, 'steps': 58083, 'loss/train': 1.8010245561599731} -08/30/2021 23:38:57 - INFO - __main__ - Step 58085: {'lr': 0.0003428003496178696, 'samples': 11152320, 'steps': 58084, 'loss/train': 1.253327488899231} -08/30/2021 23:38:58 - INFO - __main__ - Step 58086: {'lr': 0.00034279542200687087, 'samples': 11152512, 'steps': 58085, 'loss/train': 1.142523169517517} -08/30/2021 23:38:58 - INFO - __main__ - Step 58087: {'lr': 0.0003427904943540599, 'samples': 11152704, 'steps': 58086, 'loss/train': 0.3590722680091858} -08/30/2021 23:38:59 - INFO - __main__ - Step 58088: {'lr': 0.000342785566659439, 'samples': 11152896, 'steps': 58087, 'loss/train': 0.9169415235519409} -08/30/2021 23:38:59 - INFO - __main__ - Step 58089: {'lr': 0.00034278063892301036, 'samples': 11153088, 'steps': 58088, 'loss/train': 1.6978827714920044} -08/30/2021 23:39:00 - INFO - __main__ - Step 58090: {'lr': 0.00034277571114477623, 'samples': 11153280, 'steps': 58089, 'loss/train': 1.3921388387680054} -08/30/2021 23:39:01 - INFO - __main__ - Step 58091: {'lr': 0.0003427707833247388, 'samples': 11153472, 'steps': 58090, 'loss/train': 1.1821303367614746} -08/30/2021 23:39:01 - INFO - __main__ - Step 58092: {'lr': 0.0003427658554629002, 'samples': 11153664, 'steps': 58091, 'loss/train': 1.3248728513717651} -08/30/2021 23:39:02 - INFO - __main__ - Step 58093: {'lr': 0.00034276092755926275, 'samples': 11153856, 'steps': 58092, 'loss/train': 1.3602943420410156} -08/30/2021 23:39:02 - INFO - __main__ - Step 58094: {'lr': 0.0003427559996138287, 'samples': 11154048, 'steps': 58093, 'loss/train': 1.1875736713409424} -08/30/2021 23:39:04 - INFO - __main__ - Step 58095: {'lr': 0.00034275107162660024, 'samples': 11154240, 'steps': 58094, 'loss/train': 2.1526896953582764} -08/30/2021 23:39:04 - INFO - __main__ - Step 58096: {'lr': 0.0003427461435975796, 'samples': 11154432, 'steps': 58095, 'loss/train': 1.4964807033538818} -08/30/2021 23:39:04 - INFO - __main__ - Step 58097: {'lr': 0.0003427412155267688, 'samples': 11154624, 'steps': 58096, 'loss/train': 1.0730723142623901} -08/30/2021 23:39:05 - INFO - __main__ - Step 58098: {'lr': 0.00034273628741417043, 'samples': 11154816, 'steps': 58097, 'loss/train': 1.528784990310669} -08/30/2021 23:39:05 - INFO - __main__ - Step 58099: {'lr': 0.0003427313592597865, 'samples': 11155008, 'steps': 58098, 'loss/train': 1.0968055725097656} -08/30/2021 23:39:05 - INFO - __main__ - Step 58100: {'lr': 0.00034272643106361916, 'samples': 11155200, 'steps': 58099, 'loss/train': 0.8010907173156738} -08/30/2021 23:39:07 - INFO - __main__ - Step 58101: {'lr': 0.00034272150282567084, 'samples': 11155392, 'steps': 58100, 'loss/train': 0.555972695350647} -08/30/2021 23:39:08 - INFO - __main__ - Step 58102: {'lr': 0.00034271657454594355, 'samples': 11155584, 'steps': 58101, 'loss/train': 1.4861379861831665} -08/30/2021 23:39:08 - INFO - __main__ - Step 58103: {'lr': 0.0003427116462244396, 'samples': 11155776, 'steps': 58102, 'loss/train': 1.5160166025161743} -08/30/2021 23:39:09 - INFO - __main__ - Step 58104: {'lr': 0.00034270671786116127, 'samples': 11155968, 'steps': 58103, 'loss/train': 1.2457619905471802} -08/30/2021 23:39:09 - INFO - __main__ - Step 58105: {'lr': 0.00034270178945611067, 'samples': 11156160, 'steps': 58104, 'loss/train': 1.4042640924453735} -08/30/2021 23:39:10 - INFO - __main__ - Step 58106: {'lr': 0.00034269686100929015, 'samples': 11156352, 'steps': 58105, 'loss/train': 1.5230947732925415} -08/30/2021 23:39:11 - INFO - __main__ - Step 58107: {'lr': 0.0003426919325207018, 'samples': 11156544, 'steps': 58106, 'loss/train': 1.4654512405395508} -08/30/2021 23:39:11 - INFO - __main__ - Step 58108: {'lr': 0.0003426870039903479, 'samples': 11156736, 'steps': 58107, 'loss/train': 1.616666555404663} -08/30/2021 23:39:12 - INFO - __main__ - Step 58109: {'lr': 0.00034268207541823066, 'samples': 11156928, 'steps': 58108, 'loss/train': 0.9702644944190979} -08/30/2021 23:39:12 - INFO - __main__ - Step 58110: {'lr': 0.0003426771468043523, 'samples': 11157120, 'steps': 58109, 'loss/train': 1.0503275394439697} -08/30/2021 23:39:14 - INFO - __main__ - Step 58111: {'lr': 0.00034267221814871505, 'samples': 11157312, 'steps': 58110, 'loss/train': 1.0737967491149902} -08/30/2021 23:39:14 - INFO - __main__ - Step 58112: {'lr': 0.0003426672894513212, 'samples': 11157504, 'steps': 58111, 'loss/train': 0.12731744349002838} -08/30/2021 23:39:15 - INFO - __main__ - Step 58113: {'lr': 0.00034266236071217284, 'samples': 11157696, 'steps': 58112, 'loss/train': 0.9806870222091675} -08/30/2021 23:39:15 - INFO - __main__ - Step 58114: {'lr': 0.00034265743193127217, 'samples': 11157888, 'steps': 58113, 'loss/train': 1.0589088201522827} -08/30/2021 23:39:15 - INFO - __main__ - Step 58115: {'lr': 0.00034265250310862164, 'samples': 11158080, 'steps': 58114, 'loss/train': 1.0427807569503784} -08/30/2021 23:39:17 - INFO - __main__ - Step 58116: {'lr': 0.0003426475742442232, 'samples': 11158272, 'steps': 58115, 'loss/train': 0.7752166986465454} -08/30/2021 23:39:17 - INFO - __main__ - Step 58117: {'lr': 0.0003426426453380793, 'samples': 11158464, 'steps': 58116, 'loss/train': 1.6357320547103882} -08/30/2021 23:39:18 - INFO - __main__ - Step 58118: {'lr': 0.000342637716390192, 'samples': 11158656, 'steps': 58117, 'loss/train': 1.2135121822357178} -08/30/2021 23:39:18 - INFO - __main__ - Step 58119: {'lr': 0.0003426327874005636, 'samples': 11158848, 'steps': 58118, 'loss/train': 0.7144802808761597} -08/30/2021 23:39:18 - INFO - __main__ - Step 58120: {'lr': 0.00034262785836919617, 'samples': 11159040, 'steps': 58119, 'loss/train': 1.4486844539642334} -08/30/2021 23:39:19 - INFO - __main__ - Step 58121: {'lr': 0.00034262292929609217, 'samples': 11159232, 'steps': 58120, 'loss/train': 0.778864860534668} -08/30/2021 23:39:20 - INFO - __main__ - Step 58122: {'lr': 0.0003426180001812537, 'samples': 11159424, 'steps': 58121, 'loss/train': 1.2206759452819824} -08/30/2021 23:39:21 - INFO - __main__ - Step 58123: {'lr': 0.000342613071024683, 'samples': 11159616, 'steps': 58122, 'loss/train': 1.220629096031189} -08/30/2021 23:39:21 - INFO - __main__ - Step 58124: {'lr': 0.0003426081418263823, 'samples': 11159808, 'steps': 58123, 'loss/train': 0.3379243016242981} -08/30/2021 23:39:21 - INFO - __main__ - Step 58125: {'lr': 0.00034260321258635377, 'samples': 11160000, 'steps': 58124, 'loss/train': 1.3498263359069824} -08/30/2021 23:39:22 - INFO - __main__ - Step 58126: {'lr': 0.0003425982833045996, 'samples': 11160192, 'steps': 58125, 'loss/train': 1.2787257432937622} -08/30/2021 23:39:23 - INFO - __main__ - Step 58127: {'lr': 0.0003425933539811221, 'samples': 11160384, 'steps': 58126, 'loss/train': 1.6527032852172852} -08/30/2021 23:39:24 - INFO - __main__ - Step 58128: {'lr': 0.0003425884246159235, 'samples': 11160576, 'steps': 58127, 'loss/train': 1.2861199378967285} -08/30/2021 23:39:24 - INFO - __main__ - Step 58129: {'lr': 0.00034258349520900595, 'samples': 11160768, 'steps': 58128, 'loss/train': 1.4614211320877075} -08/30/2021 23:39:24 - INFO - __main__ - Step 58130: {'lr': 0.0003425785657603718, 'samples': 11160960, 'steps': 58129, 'loss/train': 0.9837599396705627} -08/30/2021 23:39:25 - INFO - __main__ - Step 58131: {'lr': 0.0003425736362700231, 'samples': 11161152, 'steps': 58130, 'loss/train': 2.0948567390441895} -08/30/2021 23:39:26 - INFO - __main__ - Step 58132: {'lr': 0.00034256870673796217, 'samples': 11161344, 'steps': 58131, 'loss/train': 1.559877872467041} -08/30/2021 23:39:27 - INFO - __main__ - Step 58133: {'lr': 0.0003425637771641911, 'samples': 11161536, 'steps': 58132, 'loss/train': 1.761301875114441} -08/30/2021 23:39:27 - INFO - __main__ - Step 58134: {'lr': 0.00034255884754871233, 'samples': 11161728, 'steps': 58133, 'loss/train': 0.8404830098152161} -08/30/2021 23:39:27 - INFO - __main__ - Step 58135: {'lr': 0.000342553917891528, 'samples': 11161920, 'steps': 58134, 'loss/train': 1.1599462032318115} -08/30/2021 23:39:28 - INFO - __main__ - Step 58136: {'lr': 0.0003425489881926402, 'samples': 11162112, 'steps': 58135, 'loss/train': 1.2159727811813354} -08/30/2021 23:39:29 - INFO - __main__ - Step 58137: {'lr': 0.0003425440584520514, 'samples': 11162304, 'steps': 58136, 'loss/train': 1.6771095991134644} -08/30/2021 23:39:30 - INFO - __main__ - Step 58138: {'lr': 0.00034253912866976353, 'samples': 11162496, 'steps': 58137, 'loss/train': 1.4760503768920898} -08/30/2021 23:39:30 - INFO - __main__ - Step 58139: {'lr': 0.000342534198845779, 'samples': 11162688, 'steps': 58138, 'loss/train': 1.6011906862258911} -08/30/2021 23:39:30 - INFO - __main__ - Step 58140: {'lr': 0.0003425292689801, 'samples': 11162880, 'steps': 58139, 'loss/train': 1.0824955701828003} -08/30/2021 23:39:31 - INFO - __main__ - Step 58141: {'lr': 0.00034252433907272875, 'samples': 11163072, 'steps': 58140, 'loss/train': 1.5095313787460327} -08/30/2021 23:39:31 - INFO - __main__ - Step 58142: {'lr': 0.0003425194091236674, 'samples': 11163264, 'steps': 58141, 'loss/train': 1.1028271913528442} -08/30/2021 23:39:33 - INFO - __main__ - Step 58143: {'lr': 0.0003425144791329183, 'samples': 11163456, 'steps': 58142, 'loss/train': 2.8132710456848145} -08/30/2021 23:39:33 - INFO - __main__ - Step 58144: {'lr': 0.00034250954910048357, 'samples': 11163648, 'steps': 58143, 'loss/train': 1.0607272386550903} -08/30/2021 23:39:33 - INFO - __main__ - Step 58145: {'lr': 0.0003425046190263655, 'samples': 11163840, 'steps': 58144, 'loss/train': 0.9200980067253113} -08/30/2021 23:39:34 - INFO - __main__ - Step 58146: {'lr': 0.00034249968891056625, 'samples': 11164032, 'steps': 58145, 'loss/train': 0.7144595980644226} -08/30/2021 23:39:34 - INFO - __main__ - Step 58147: {'lr': 0.00034249475875308813, 'samples': 11164224, 'steps': 58146, 'loss/train': 2.6284947395324707} -08/30/2021 23:39:36 - INFO - __main__ - Step 58148: {'lr': 0.00034248982855393317, 'samples': 11164416, 'steps': 58147, 'loss/train': 1.1523993015289307} -08/30/2021 23:39:36 - INFO - __main__ - Step 58149: {'lr': 0.0003424848983131038, 'samples': 11164608, 'steps': 58148, 'loss/train': 0.9722750186920166} -08/30/2021 23:39:36 - INFO - __main__ - Step 58150: {'lr': 0.0003424799680306022, 'samples': 11164800, 'steps': 58149, 'loss/train': 1.4469280242919922} -08/30/2021 23:39:37 - INFO - __main__ - Step 58151: {'lr': 0.0003424750377064305, 'samples': 11164992, 'steps': 58150, 'loss/train': 1.351000189781189} -08/30/2021 23:39:37 - INFO - __main__ - Step 58152: {'lr': 0.000342470107340591, 'samples': 11165184, 'steps': 58151, 'loss/train': 1.644476056098938} -08/30/2021 23:39:40 - INFO - __main__ - Step 58153: {'lr': 0.0003424651769330859, 'samples': 11165376, 'steps': 58152, 'loss/train': 0.9190403819084167} -08/30/2021 23:39:40 - INFO - __main__ - Step 58154: {'lr': 0.0003424602464839173, 'samples': 11165568, 'steps': 58153, 'loss/train': 1.2978562116622925} -08/30/2021 23:39:40 - INFO - __main__ - Step 58155: {'lr': 0.0003424553159930877, 'samples': 11165760, 'steps': 58154, 'loss/train': 0.713495671749115} -08/30/2021 23:39:41 - INFO - __main__ - Step 58156: {'lr': 0.00034245038546059904, 'samples': 11165952, 'steps': 58155, 'loss/train': 1.877809762954712} -08/30/2021 23:39:41 - INFO - __main__ - Step 58157: {'lr': 0.0003424454548864538, 'samples': 11166144, 'steps': 58156, 'loss/train': 0.409132182598114} -08/30/2021 23:39:43 - INFO - __main__ - Step 58158: {'lr': 0.00034244052427065397, 'samples': 11166336, 'steps': 58157, 'loss/train': 1.1318840980529785} -08/30/2021 23:39:43 - INFO - __main__ - Step 58159: {'lr': 0.00034243559361320187, 'samples': 11166528, 'steps': 58158, 'loss/train': 1.2086416482925415} -08/30/2021 23:39:44 - INFO - __main__ - Step 58160: {'lr': 0.00034243066291409977, 'samples': 11166720, 'steps': 58159, 'loss/train': 1.0776487588882446} -08/30/2021 23:39:44 - INFO - __main__ - Step 58161: {'lr': 0.0003424257321733497, 'samples': 11166912, 'steps': 58160, 'loss/train': 1.3231314420700073} -08/30/2021 23:39:44 - INFO - __main__ - Step 58162: {'lr': 0.00034242080139095416, 'samples': 11167104, 'steps': 58161, 'loss/train': 0.48137930035591125} -08/30/2021 23:39:45 - INFO - __main__ - Step 58163: {'lr': 0.0003424158705669152, 'samples': 11167296, 'steps': 58162, 'loss/train': 1.2340216636657715} -08/30/2021 23:39:46 - INFO - __main__ - Step 58164: {'lr': 0.0003424109397012351, 'samples': 11167488, 'steps': 58163, 'loss/train': 1.5349849462509155} -08/30/2021 23:39:47 - INFO - __main__ - Step 58165: {'lr': 0.000342406008793916, 'samples': 11167680, 'steps': 58164, 'loss/train': 1.677738070487976} -08/30/2021 23:39:47 - INFO - __main__ - Step 58166: {'lr': 0.00034240107784496023, 'samples': 11167872, 'steps': 58165, 'loss/train': 0.9596205949783325} -08/30/2021 23:39:48 - INFO - __main__ - Step 58167: {'lr': 0.00034239614685436994, 'samples': 11168064, 'steps': 58166, 'loss/train': 0.029650403186678886} -08/30/2021 23:39:48 - INFO - __main__ - Step 58168: {'lr': 0.0003423912158221473, 'samples': 11168256, 'steps': 58167, 'loss/train': 0.7860967516899109} -08/30/2021 23:39:48 - INFO - __main__ - Step 58169: {'lr': 0.0003423862847482947, 'samples': 11168448, 'steps': 58168, 'loss/train': 1.541067123413086} -08/30/2021 23:39:50 - INFO - __main__ - Step 58170: {'lr': 0.0003423813536328143, 'samples': 11168640, 'steps': 58169, 'loss/train': 1.5356074571609497} -08/30/2021 23:39:50 - INFO - __main__ - Step 58171: {'lr': 0.00034237642247570815, 'samples': 11168832, 'steps': 58170, 'loss/train': 1.2269033193588257} -08/30/2021 23:39:51 - INFO - __main__ - Step 58172: {'lr': 0.0003423714912769787, 'samples': 11169024, 'steps': 58171, 'loss/train': 1.423087239265442} -08/30/2021 23:39:51 - INFO - __main__ - Step 58173: {'lr': 0.000342366560036628, 'samples': 11169216, 'steps': 58172, 'loss/train': 1.5837994813919067} -08/30/2021 23:39:52 - INFO - __main__ - Step 58174: {'lr': 0.0003423616287546585, 'samples': 11169408, 'steps': 58173, 'loss/train': 1.5073819160461426} -08/30/2021 23:39:53 - INFO - __main__ - Step 58175: {'lr': 0.00034235669743107214, 'samples': 11169600, 'steps': 58174, 'loss/train': 0.06718748062849045} -08/30/2021 23:39:54 - INFO - __main__ - Step 58176: {'lr': 0.0003423517660658713, 'samples': 11169792, 'steps': 58175, 'loss/train': 1.3589560985565186} -08/30/2021 23:39:54 - INFO - __main__ - Step 58177: {'lr': 0.0003423468346590583, 'samples': 11169984, 'steps': 58176, 'loss/train': 1.500417947769165} -08/30/2021 23:39:54 - INFO - __main__ - Step 58178: {'lr': 0.00034234190321063516, 'samples': 11170176, 'steps': 58177, 'loss/train': 1.2618979215621948} -08/30/2021 23:39:55 - INFO - __main__ - Step 58179: {'lr': 0.00034233697172060415, 'samples': 11170368, 'steps': 58178, 'loss/train': 1.6957918405532837} -08/30/2021 23:39:55 - INFO - __main__ - Step 58180: {'lr': 0.00034233204018896754, 'samples': 11170560, 'steps': 58179, 'loss/train': 1.4949250221252441} -08/30/2021 23:39:56 - INFO - __main__ - Step 58181: {'lr': 0.00034232710861572754, 'samples': 11170752, 'steps': 58180, 'loss/train': 1.021200180053711} -08/30/2021 23:39:57 - INFO - __main__ - Step 58182: {'lr': 0.0003423221770008864, 'samples': 11170944, 'steps': 58181, 'loss/train': 1.15692138671875} -08/30/2021 23:39:57 - INFO - __main__ - Step 58183: {'lr': 0.0003423172453444462, 'samples': 11171136, 'steps': 58182, 'loss/train': 1.4904612302780151} -08/30/2021 23:39:58 - INFO - __main__ - Step 58184: {'lr': 0.00034231231364640946, 'samples': 11171328, 'steps': 58183, 'loss/train': 1.2064727544784546} -08/30/2021 23:39:58 - INFO - __main__ - Step 58185: {'lr': 0.0003423073819067781, 'samples': 11171520, 'steps': 58184, 'loss/train': 1.015325665473938} -08/30/2021 23:40:00 - INFO - __main__ - Step 58186: {'lr': 0.00034230245012555445, 'samples': 11171712, 'steps': 58185, 'loss/train': 1.2468750476837158} -08/30/2021 23:40:00 - INFO - __main__ - Step 58187: {'lr': 0.00034229751830274077, 'samples': 11171904, 'steps': 58186, 'loss/train': 1.3481324911117554} -08/30/2021 23:40:00 - INFO - __main__ - Step 58188: {'lr': 0.0003422925864383392, 'samples': 11172096, 'steps': 58187, 'loss/train': 1.331291675567627} -08/30/2021 23:40:01 - INFO - __main__ - Step 58189: {'lr': 0.00034228765453235213, 'samples': 11172288, 'steps': 58188, 'loss/train': 1.913342833518982} -08/30/2021 23:40:01 - INFO - __main__ - Step 58190: {'lr': 0.0003422827225847816, 'samples': 11172480, 'steps': 58189, 'loss/train': 1.7874317169189453} -08/30/2021 23:40:02 - INFO - __main__ - Step 58191: {'lr': 0.0003422777905956299, 'samples': 11172672, 'steps': 58190, 'loss/train': 1.4271373748779297} -08/30/2021 23:40:03 - INFO - __main__ - Step 58192: {'lr': 0.0003422728585648992, 'samples': 11172864, 'steps': 58191, 'loss/train': 0.4440106451511383} -08/30/2021 23:40:03 - INFO - __main__ - Step 58193: {'lr': 0.00034226792649259184, 'samples': 11173056, 'steps': 58192, 'loss/train': 0.7758225202560425} -08/30/2021 23:40:04 - INFO - __main__ - Step 58194: {'lr': 0.00034226299437870993, 'samples': 11173248, 'steps': 58193, 'loss/train': 1.1746567487716675} -08/30/2021 23:40:04 - INFO - __main__ - Step 58195: {'lr': 0.0003422580622232558, 'samples': 11173440, 'steps': 58194, 'loss/train': 1.041857361793518} -08/30/2021 23:40:05 - INFO - __main__ - Step 58196: {'lr': 0.0003422531300262316, 'samples': 11173632, 'steps': 58195, 'loss/train': 0.7676185965538025} -08/30/2021 23:40:06 - INFO - __main__ - Step 58197: {'lr': 0.00034224819778763953, 'samples': 11173824, 'steps': 58196, 'loss/train': 0.8987600207328796} -08/30/2021 23:40:06 - INFO - __main__ - Step 58198: {'lr': 0.0003422432655074819, 'samples': 11174016, 'steps': 58197, 'loss/train': 1.578316569328308} -08/30/2021 23:40:07 - INFO - __main__ - Step 58199: {'lr': 0.0003422383331857608, 'samples': 11174208, 'steps': 58198, 'loss/train': 1.4160542488098145} -08/30/2021 23:40:07 - INFO - __main__ - Step 58200: {'lr': 0.00034223340082247856, 'samples': 11174400, 'steps': 58199, 'loss/train': 1.7254291772842407} -08/30/2021 23:40:09 - INFO - __main__ - Step 58201: {'lr': 0.0003422284684176374, 'samples': 11174592, 'steps': 58200, 'loss/train': 2.102698564529419} -08/30/2021 23:40:09 - INFO - __main__ - Step 58202: {'lr': 0.00034222353597123946, 'samples': 11174784, 'steps': 58201, 'loss/train': 1.5819694995880127} -08/30/2021 23:40:10 - INFO - __main__ - Step 58203: {'lr': 0.00034221860348328703, 'samples': 11174976, 'steps': 58202, 'loss/train': 0.9942245483398438} -08/30/2021 23:40:10 - INFO - __main__ - Step 58204: {'lr': 0.0003422136709537824, 'samples': 11175168, 'steps': 58203, 'loss/train': 0.6993240118026733} -08/30/2021 23:40:10 - INFO - __main__ - Step 58205: {'lr': 0.00034220873838272767, 'samples': 11175360, 'steps': 58204, 'loss/train': 0.020276373252272606} -08/30/2021 23:40:11 - INFO - __main__ - Step 58206: {'lr': 0.00034220380577012506, 'samples': 11175552, 'steps': 58205, 'loss/train': 1.6438995599746704} -08/30/2021 23:40:13 - INFO - __main__ - Step 58207: {'lr': 0.00034219887311597686, 'samples': 11175744, 'steps': 58206, 'loss/train': 0.9736303687095642} -08/30/2021 23:40:13 - INFO - __main__ - Step 58208: {'lr': 0.0003421939404202853, 'samples': 11175936, 'steps': 58207, 'loss/train': 1.4000822305679321} -08/30/2021 23:40:14 - INFO - __main__ - Step 58209: {'lr': 0.0003421890076830525, 'samples': 11176128, 'steps': 58208, 'loss/train': 1.3235080242156982} -08/30/2021 23:40:14 - INFO - __main__ - Step 58210: {'lr': 0.00034218407490428085, 'samples': 11176320, 'steps': 58209, 'loss/train': 1.377208948135376} -08/30/2021 23:40:14 - INFO - __main__ - Step 58211: {'lr': 0.0003421791420839724, 'samples': 11176512, 'steps': 58210, 'loss/train': 2.112405776977539} -08/30/2021 23:40:15 - INFO - __main__ - Step 58212: {'lr': 0.00034217420922212947, 'samples': 11176704, 'steps': 58211, 'loss/train': 1.55793297290802} -08/30/2021 23:40:16 - INFO - __main__ - Step 58213: {'lr': 0.0003421692763187543, 'samples': 11176896, 'steps': 58212, 'loss/train': 1.438162922859192} -08/30/2021 23:40:17 - INFO - __main__ - Step 58214: {'lr': 0.00034216434337384905, 'samples': 11177088, 'steps': 58213, 'loss/train': 1.5120490789413452} -08/30/2021 23:40:17 - INFO - __main__ - Step 58215: {'lr': 0.000342159410387416, 'samples': 11177280, 'steps': 58214, 'loss/train': 1.5225783586502075} -08/30/2021 23:40:18 - INFO - __main__ - Step 58216: {'lr': 0.0003421544773594573, 'samples': 11177472, 'steps': 58215, 'loss/train': 0.18304598331451416} -08/30/2021 23:40:18 - INFO - __main__ - Step 58217: {'lr': 0.0003421495442899753, 'samples': 11177664, 'steps': 58216, 'loss/train': 0.8368443250656128} -08/30/2021 23:40:20 - INFO - __main__ - Step 58218: {'lr': 0.0003421446111789721, 'samples': 11177856, 'steps': 58217, 'loss/train': 0.056102342903614044} -08/30/2021 23:40:20 - INFO - __main__ - Step 58219: {'lr': 0.00034213967802644986, 'samples': 11178048, 'steps': 58218, 'loss/train': 0.07792620360851288} -08/30/2021 23:40:21 - INFO - __main__ - Step 58220: {'lr': 0.000342134744832411, 'samples': 11178240, 'steps': 58219, 'loss/train': 1.8799257278442383} -08/30/2021 23:40:21 - INFO - __main__ - Step 58221: {'lr': 0.0003421298115968576, 'samples': 11178432, 'steps': 58220, 'loss/train': 1.6056959629058838} -08/30/2021 23:40:21 - INFO - __main__ - Step 58222: {'lr': 0.0003421248783197919, 'samples': 11178624, 'steps': 58221, 'loss/train': 1.4657942056655884} -08/30/2021 23:40:23 - INFO - __main__ - Step 58223: {'lr': 0.0003421199450012162, 'samples': 11178816, 'steps': 58222, 'loss/train': 1.5119634866714478} -08/30/2021 23:40:23 - INFO - __main__ - Step 58224: {'lr': 0.00034211501164113276, 'samples': 11179008, 'steps': 58223, 'loss/train': 0.9850744009017944} -08/30/2021 23:40:24 - INFO - __main__ - Step 58225: {'lr': 0.0003421100782395436, 'samples': 11179200, 'steps': 58224, 'loss/train': 1.5450838804244995} -08/30/2021 23:40:24 - INFO - __main__ - Step 58226: {'lr': 0.000342105144796451, 'samples': 11179392, 'steps': 58225, 'loss/train': 1.1443885564804077} -08/30/2021 23:40:24 - INFO - __main__ - Step 58227: {'lr': 0.0003421002113118574, 'samples': 11179584, 'steps': 58226, 'loss/train': 0.7151418924331665} -08/30/2021 23:40:26 - INFO - __main__ - Step 58228: {'lr': 0.00034209527778576477, 'samples': 11179776, 'steps': 58227, 'loss/train': 1.2697087526321411} -08/30/2021 23:40:26 - INFO - __main__ - Step 58229: {'lr': 0.0003420903442181755, 'samples': 11179968, 'steps': 58228, 'loss/train': 1.485098123550415} -08/30/2021 23:40:27 - INFO - __main__ - Step 58230: {'lr': 0.0003420854106090917, 'samples': 11180160, 'steps': 58229, 'loss/train': 1.1717568635940552} -08/30/2021 23:40:27 - INFO - __main__ - Step 58231: {'lr': 0.00034208047695851563, 'samples': 11180352, 'steps': 58230, 'loss/train': 1.856194257736206} -08/30/2021 23:40:27 - INFO - __main__ - Step 58232: {'lr': 0.0003420755432664495, 'samples': 11180544, 'steps': 58231, 'loss/train': 1.4531867504119873} -08/30/2021 23:40:29 - INFO - __main__ - Step 58233: {'lr': 0.0003420706095328956, 'samples': 11180736, 'steps': 58232, 'loss/train': 1.579209566116333} -08/30/2021 23:40:29 - INFO - __main__ - Step 58234: {'lr': 0.0003420656757578561, 'samples': 11180928, 'steps': 58233, 'loss/train': 1.068538784980774} -08/30/2021 23:40:30 - INFO - __main__ - Step 58235: {'lr': 0.00034206074194133323, 'samples': 11181120, 'steps': 58234, 'loss/train': 1.6517542600631714} -08/30/2021 23:40:30 - INFO - __main__ - Step 58236: {'lr': 0.00034205580808332916, 'samples': 11181312, 'steps': 58235, 'loss/train': 1.0482072830200195} -08/30/2021 23:40:30 - INFO - __main__ - Step 58237: {'lr': 0.0003420508741838462, 'samples': 11181504, 'steps': 58236, 'loss/train': 0.9779049158096313} -08/30/2021 23:40:32 - INFO - __main__ - Step 58238: {'lr': 0.0003420459402428865, 'samples': 11181696, 'steps': 58237, 'loss/train': 0.3572382628917694} -08/30/2021 23:40:32 - INFO - __main__ - Step 58239: {'lr': 0.00034204100626045235, 'samples': 11181888, 'steps': 58238, 'loss/train': 0.6780773997306824} -08/30/2021 23:40:33 - INFO - __main__ - Step 58240: {'lr': 0.00034203607223654594, 'samples': 11182080, 'steps': 58239, 'loss/train': 1.6863313913345337} -08/30/2021 23:40:33 - INFO - __main__ - Step 58241: {'lr': 0.00034203113817116957, 'samples': 11182272, 'steps': 58240, 'loss/train': 0.5363484621047974} -08/30/2021 23:40:33 - INFO - __main__ - Step 58242: {'lr': 0.0003420262040643253, 'samples': 11182464, 'steps': 58241, 'loss/train': 1.9159166812896729} -08/30/2021 23:40:35 - INFO - __main__ - Step 58243: {'lr': 0.0003420212699160154, 'samples': 11182656, 'steps': 58242, 'loss/train': 1.2834962606430054} -08/30/2021 23:40:35 - INFO - __main__ - Step 58244: {'lr': 0.00034201633572624216, 'samples': 11182848, 'steps': 58243, 'loss/train': 0.8463221788406372} -08/30/2021 23:40:36 - INFO - __main__ - Step 58245: {'lr': 0.00034201140149500784, 'samples': 11183040, 'steps': 58244, 'loss/train': 1.6710035800933838} -08/30/2021 23:40:36 - INFO - __main__ - Step 58246: {'lr': 0.0003420064672223146, 'samples': 11183232, 'steps': 58245, 'loss/train': 1.238175630569458} -08/30/2021 23:40:36 - INFO - __main__ - Step 58247: {'lr': 0.0003420015329081647, 'samples': 11183424, 'steps': 58246, 'loss/train': 0.28725066781044006} -08/30/2021 23:40:38 - INFO - __main__ - Step 58248: {'lr': 0.00034199659855256023, 'samples': 11183616, 'steps': 58247, 'loss/train': 1.1709293127059937} -08/30/2021 23:40:38 - INFO - __main__ - Step 58249: {'lr': 0.00034199166415550353, 'samples': 11183808, 'steps': 58248, 'loss/train': 1.6371533870697021} -08/30/2021 23:40:38 - INFO - __main__ - Step 58250: {'lr': 0.0003419867297169968, 'samples': 11184000, 'steps': 58249, 'loss/train': 1.169621467590332} -08/30/2021 23:40:39 - INFO - __main__ - Step 58251: {'lr': 0.00034198179523704233, 'samples': 11184192, 'steps': 58250, 'loss/train': 0.8364565968513489} -08/30/2021 23:40:39 - INFO - __main__ - Step 58252: {'lr': 0.0003419768607156423, 'samples': 11184384, 'steps': 58251, 'loss/train': 1.2661550045013428} -08/30/2021 23:40:40 - INFO - __main__ - Step 58253: {'lr': 0.0003419719261527988, 'samples': 11184576, 'steps': 58252, 'loss/train': 1.004204511642456} -08/30/2021 23:40:41 - INFO - __main__ - Step 58254: {'lr': 0.0003419669915485142, 'samples': 11184768, 'steps': 58253, 'loss/train': 0.036508191376924515} -08/30/2021 23:40:41 - INFO - __main__ - Step 58255: {'lr': 0.00034196205690279076, 'samples': 11184960, 'steps': 58254, 'loss/train': 1.972454309463501} -08/30/2021 23:40:42 - INFO - __main__ - Step 58256: {'lr': 0.00034195712221563057, 'samples': 11185152, 'steps': 58255, 'loss/train': 1.0577110052108765} -08/30/2021 23:40:42 - INFO - __main__ - Step 58257: {'lr': 0.00034195218748703596, 'samples': 11185344, 'steps': 58256, 'loss/train': 1.7430599927902222} -08/30/2021 23:40:42 - INFO - __main__ - Step 58258: {'lr': 0.00034194725271700915, 'samples': 11185536, 'steps': 58257, 'loss/train': 1.645064353942871} -08/30/2021 23:40:44 - INFO - __main__ - Step 58259: {'lr': 0.0003419423179055523, 'samples': 11185728, 'steps': 58258, 'loss/train': 0.9579575657844543} -08/30/2021 23:40:44 - INFO - __main__ - Step 58260: {'lr': 0.0003419373830526676, 'samples': 11185920, 'steps': 58259, 'loss/train': 0.7023940682411194} -08/30/2021 23:40:45 - INFO - __main__ - Step 58261: {'lr': 0.0003419324481583574, 'samples': 11186112, 'steps': 58260, 'loss/train': 1.455538272857666} -08/30/2021 23:40:45 - INFO - __main__ - Step 58262: {'lr': 0.00034192751322262375, 'samples': 11186304, 'steps': 58261, 'loss/train': 1.2937004566192627} -08/30/2021 23:40:45 - INFO - __main__ - Step 58263: {'lr': 0.0003419225782454691, 'samples': 11186496, 'steps': 58262, 'loss/train': 0.028503045439720154} -08/30/2021 23:40:48 - INFO - __main__ - Step 58264: {'lr': 0.00034191764322689553, 'samples': 11186688, 'steps': 58263, 'loss/train': 1.3785802125930786} -08/30/2021 23:40:48 - INFO - __main__ - Step 58265: {'lr': 0.00034191270816690526, 'samples': 11186880, 'steps': 58264, 'loss/train': 1.3031697273254395} -08/30/2021 23:40:49 - INFO - __main__ - Step 58266: {'lr': 0.0003419077730655006, 'samples': 11187072, 'steps': 58265, 'loss/train': 1.474822998046875} -08/30/2021 23:40:49 - INFO - __main__ - Step 58267: {'lr': 0.00034190283792268365, 'samples': 11187264, 'steps': 58266, 'loss/train': 1.697913646697998} -08/30/2021 23:40:49 - INFO - __main__ - Step 58268: {'lr': 0.0003418979027384567, 'samples': 11187456, 'steps': 58267, 'loss/train': 1.3406145572662354} -08/30/2021 23:40:51 - INFO - __main__ - Step 58269: {'lr': 0.00034189296751282203, 'samples': 11187648, 'steps': 58268, 'loss/train': 0.7187969088554382} -08/30/2021 23:40:51 - INFO - __main__ - Step 58270: {'lr': 0.0003418880322457817, 'samples': 11187840, 'steps': 58269, 'loss/train': 1.5781772136688232} -08/30/2021 23:40:52 - INFO - __main__ - Step 58271: {'lr': 0.0003418830969373382, 'samples': 11188032, 'steps': 58270, 'loss/train': 1.324567437171936} -08/30/2021 23:40:52 - INFO - __main__ - Step 58272: {'lr': 0.00034187816158749354, 'samples': 11188224, 'steps': 58271, 'loss/train': 1.1467859745025635} -08/30/2021 23:40:52 - INFO - __main__ - Step 58273: {'lr': 0.00034187322619624996, 'samples': 11188416, 'steps': 58272, 'loss/train': 1.5315423011779785} -08/30/2021 23:40:54 - INFO - __main__ - Step 58274: {'lr': 0.0003418682907636097, 'samples': 11188608, 'steps': 58273, 'loss/train': 0.8884255290031433} -08/30/2021 23:40:54 - INFO - __main__ - Step 58275: {'lr': 0.000341863355289575, 'samples': 11188800, 'steps': 58274, 'loss/train': 1.6121199131011963} -08/30/2021 23:40:55 - INFO - __main__ - Step 58276: {'lr': 0.0003418584197741481, 'samples': 11188992, 'steps': 58275, 'loss/train': 1.1168267726898193} -08/30/2021 23:40:55 - INFO - __main__ - Step 58277: {'lr': 0.00034185348421733125, 'samples': 11189184, 'steps': 58276, 'loss/train': 1.1643896102905273} -08/30/2021 23:40:55 - INFO - __main__ - Step 58278: {'lr': 0.0003418485486191267, 'samples': 11189376, 'steps': 58277, 'loss/train': 0.6503121256828308} -08/30/2021 23:40:56 - INFO - __main__ - Step 58279: {'lr': 0.0003418436129795365, 'samples': 11189568, 'steps': 58278, 'loss/train': 0.6299277544021606} -08/30/2021 23:40:58 - INFO - __main__ - Step 58280: {'lr': 0.000341838677298563, 'samples': 11189760, 'steps': 58279, 'loss/train': 1.1273937225341797} -08/30/2021 23:40:58 - INFO - __main__ - Step 58281: {'lr': 0.00034183374157620847, 'samples': 11189952, 'steps': 58280, 'loss/train': 1.6415847539901733} -08/30/2021 23:40:59 - INFO - __main__ - Step 58282: {'lr': 0.000341828805812475, 'samples': 11190144, 'steps': 58281, 'loss/train': 0.8988140821456909} -08/30/2021 23:40:59 - INFO - __main__ - Step 58283: {'lr': 0.0003418238700073649, 'samples': 11190336, 'steps': 58282, 'loss/train': 1.3404672145843506} -08/30/2021 23:40:59 - INFO - __main__ - Step 58284: {'lr': 0.0003418189341608804, 'samples': 11190528, 'steps': 58283, 'loss/train': 0.4190874397754669} -08/30/2021 23:41:00 - INFO - __main__ - Step 58285: {'lr': 0.0003418139982730237, 'samples': 11190720, 'steps': 58284, 'loss/train': 0.07678170502185822} -08/30/2021 23:41:02 - INFO - __main__ - Step 58286: {'lr': 0.0003418090623437971, 'samples': 11190912, 'steps': 58285, 'loss/train': 0.20437584817409515} -08/30/2021 23:41:02 - INFO - __main__ - Step 58287: {'lr': 0.00034180412637320267, 'samples': 11191104, 'steps': 58286, 'loss/train': 0.07539796084165573} -08/30/2021 23:41:02 - INFO - __main__ - Step 58288: {'lr': 0.0003417991903612427, 'samples': 11191296, 'steps': 58287, 'loss/train': 1.7511036396026611} -08/30/2021 23:41:03 - INFO - __main__ - Step 58289: {'lr': 0.0003417942543079195, 'samples': 11191488, 'steps': 58288, 'loss/train': 1.6025481224060059} -08/30/2021 23:41:03 - INFO - __main__ - Step 58290: {'lr': 0.00034178931821323517, 'samples': 11191680, 'steps': 58289, 'loss/train': 1.0312312841415405} -08/30/2021 23:41:05 - INFO - __main__ - Step 58291: {'lr': 0.0003417843820771921, 'samples': 11191872, 'steps': 58290, 'loss/train': 1.3161014318466187} -08/30/2021 23:41:05 - INFO - __main__ - Step 58292: {'lr': 0.00034177944589979225, 'samples': 11192064, 'steps': 58291, 'loss/train': 0.8433822393417358} -08/30/2021 23:41:05 - INFO - __main__ - Step 58293: {'lr': 0.0003417745096810381, 'samples': 11192256, 'steps': 58292, 'loss/train': 1.5228179693222046} -08/30/2021 23:41:06 - INFO - __main__ - Step 58294: {'lr': 0.00034176957342093174, 'samples': 11192448, 'steps': 58293, 'loss/train': 1.3527491092681885} -08/30/2021 23:41:06 - INFO - __main__ - Step 58295: {'lr': 0.0003417646371194754, 'samples': 11192640, 'steps': 58294, 'loss/train': 1.499741792678833} -08/30/2021 23:41:07 - INFO - __main__ - Step 58296: {'lr': 0.00034175970077667136, 'samples': 11192832, 'steps': 58295, 'loss/train': 1.403458833694458} -08/30/2021 23:41:08 - INFO - __main__ - Step 58297: {'lr': 0.00034175476439252177, 'samples': 11193024, 'steps': 58296, 'loss/train': 0.5339193940162659} -08/30/2021 23:41:08 - INFO - __main__ - Step 58298: {'lr': 0.00034174982796702895, 'samples': 11193216, 'steps': 58297, 'loss/train': 1.1196876764297485} -08/30/2021 23:41:09 - INFO - __main__ - Step 58299: {'lr': 0.00034174489150019506, 'samples': 11193408, 'steps': 58298, 'loss/train': 1.637571096420288} -08/30/2021 23:41:09 - INFO - __main__ - Step 58300: {'lr': 0.0003417399549920224, 'samples': 11193600, 'steps': 58299, 'loss/train': 1.0556622743606567} -08/30/2021 23:41:11 - INFO - __main__ - Step 58301: {'lr': 0.00034173501844251305, 'samples': 11193792, 'steps': 58300, 'loss/train': 1.6106003522872925} -08/30/2021 23:41:11 - INFO - __main__ - Step 58302: {'lr': 0.0003417300818516693, 'samples': 11193984, 'steps': 58301, 'loss/train': 0.8166095614433289} -08/30/2021 23:41:11 - INFO - __main__ - Step 58303: {'lr': 0.00034172514521949336, 'samples': 11194176, 'steps': 58302, 'loss/train': 0.6534811854362488} -08/30/2021 23:41:12 - INFO - __main__ - Step 58304: {'lr': 0.0003417202085459876, 'samples': 11194368, 'steps': 58303, 'loss/train': 1.320803165435791} -08/30/2021 23:41:12 - INFO - __main__ - Step 58305: {'lr': 0.00034171527183115413, 'samples': 11194560, 'steps': 58304, 'loss/train': 0.17822426557540894} -08/30/2021 23:41:14 - INFO - __main__ - Step 58306: {'lr': 0.0003417103350749951, 'samples': 11194752, 'steps': 58305, 'loss/train': 0.942302942276001} -08/30/2021 23:41:14 - INFO - __main__ - Step 58307: {'lr': 0.00034170539827751284, 'samples': 11194944, 'steps': 58306, 'loss/train': 1.3024427890777588} -08/30/2021 23:41:14 - INFO - __main__ - Step 58308: {'lr': 0.0003417004614387095, 'samples': 11195136, 'steps': 58307, 'loss/train': 1.1807435750961304} -08/30/2021 23:41:15 - INFO - __main__ - Step 58309: {'lr': 0.0003416955245585874, 'samples': 11195328, 'steps': 58308, 'loss/train': 1.454353928565979} -08/30/2021 23:41:15 - INFO - __main__ - Step 58310: {'lr': 0.00034169058763714865, 'samples': 11195520, 'steps': 58309, 'loss/train': 0.9266914129257202} -08/30/2021 23:41:17 - INFO - __main__ - Step 58311: {'lr': 0.0003416856506743956, 'samples': 11195712, 'steps': 58310, 'loss/train': 1.1807876825332642} -08/30/2021 23:41:17 - INFO - __main__ - Step 58312: {'lr': 0.00034168071367033043, 'samples': 11195904, 'steps': 58311, 'loss/train': 1.4732695817947388} -08/30/2021 23:41:18 - INFO - __main__ - Step 58313: {'lr': 0.0003416757766249553, 'samples': 11196096, 'steps': 58312, 'loss/train': 1.3171892166137695} -08/30/2021 23:41:18 - INFO - __main__ - Step 58314: {'lr': 0.0003416708395382725, 'samples': 11196288, 'steps': 58313, 'loss/train': 1.5048414468765259} -08/30/2021 23:41:18 - INFO - __main__ - Step 58315: {'lr': 0.00034166590241028425, 'samples': 11196480, 'steps': 58314, 'loss/train': 1.036845326423645} -08/30/2021 23:41:20 - INFO - __main__ - Step 58316: {'lr': 0.00034166096524099264, 'samples': 11196672, 'steps': 58315, 'loss/train': 1.2998428344726562} -08/30/2021 23:41:20 - INFO - __main__ - Step 58317: {'lr': 0.00034165602803040013, 'samples': 11196864, 'steps': 58316, 'loss/train': 1.593919277191162} -08/30/2021 23:41:20 - INFO - __main__ - Step 58318: {'lr': 0.00034165109077850884, 'samples': 11197056, 'steps': 58317, 'loss/train': 1.820627212524414} -08/30/2021 23:41:21 - INFO - __main__ - Step 58319: {'lr': 0.00034164615348532094, 'samples': 11197248, 'steps': 58318, 'loss/train': 1.5240626335144043} -08/30/2021 23:41:21 - INFO - __main__ - Step 58320: {'lr': 0.0003416412161508387, 'samples': 11197440, 'steps': 58319, 'loss/train': 1.3691742420196533} -08/30/2021 23:41:23 - INFO - __main__ - Step 58321: {'lr': 0.0003416362787750643, 'samples': 11197632, 'steps': 58320, 'loss/train': 1.2240175008773804} -08/30/2021 23:41:24 - INFO - __main__ - Step 58322: {'lr': 0.00034163134135800004, 'samples': 11197824, 'steps': 58321, 'loss/train': 1.71846342086792} -08/30/2021 23:41:24 - INFO - __main__ - Step 58323: {'lr': 0.00034162640389964814, 'samples': 11198016, 'steps': 58322, 'loss/train': 1.1008986234664917} -08/30/2021 23:41:24 - INFO - __main__ - Step 58324: {'lr': 0.0003416214664000108, 'samples': 11198208, 'steps': 58323, 'loss/train': 1.53416907787323} -08/30/2021 23:41:25 - INFO - __main__ - Step 58325: {'lr': 0.00034161652885909025, 'samples': 11198400, 'steps': 58324, 'loss/train': 0.2563075125217438} -08/30/2021 23:41:25 - INFO - __main__ - Step 58326: {'lr': 0.0003416115912768887, 'samples': 11198592, 'steps': 58325, 'loss/train': 0.9635010361671448} -08/30/2021 23:41:27 - INFO - __main__ - Step 58327: {'lr': 0.0003416066536534083, 'samples': 11198784, 'steps': 58326, 'loss/train': 1.0989446640014648} -08/30/2021 23:41:27 - INFO - __main__ - Step 58328: {'lr': 0.0003416017159886514, 'samples': 11198976, 'steps': 58327, 'loss/train': 0.6972031593322754} -08/30/2021 23:41:27 - INFO - __main__ - Step 58329: {'lr': 0.0003415967782826202, 'samples': 11199168, 'steps': 58328, 'loss/train': 1.3485358953475952} -08/30/2021 23:41:28 - INFO - __main__ - Step 58330: {'lr': 0.0003415918405353169, 'samples': 11199360, 'steps': 58329, 'loss/train': 1.6061773300170898} -08/30/2021 23:41:28 - INFO - __main__ - Step 58331: {'lr': 0.0003415869027467437, 'samples': 11199552, 'steps': 58330, 'loss/train': 1.1461906433105469} -08/30/2021 23:41:29 - INFO - __main__ - Step 58332: {'lr': 0.000341581964916903, 'samples': 11199744, 'steps': 58331, 'loss/train': 1.0337737798690796} -08/30/2021 23:41:30 - INFO - __main__ - Step 58333: {'lr': 0.00034157702704579667, 'samples': 11199936, 'steps': 58332, 'loss/train': 1.602339506149292} -08/30/2021 23:41:30 - INFO - __main__ - Step 58334: {'lr': 0.00034157208913342726, 'samples': 11200128, 'steps': 58333, 'loss/train': 0.9502540230751038} -08/30/2021 23:41:31 - INFO - __main__ - Step 58335: {'lr': 0.00034156715117979685, 'samples': 11200320, 'steps': 58334, 'loss/train': 1.6734758615493774} -08/30/2021 23:41:31 - INFO - __main__ - Step 58336: {'lr': 0.00034156221318490767, 'samples': 11200512, 'steps': 58335, 'loss/train': 0.8886157870292664} -08/30/2021 23:41:33 - INFO - __main__ - Step 58337: {'lr': 0.000341557275148762, 'samples': 11200704, 'steps': 58336, 'loss/train': 1.6553969383239746} -08/30/2021 23:41:33 - INFO - __main__ - Step 58338: {'lr': 0.0003415523370713621, 'samples': 11200896, 'steps': 58337, 'loss/train': 0.9717940092086792} -08/30/2021 23:41:33 - INFO - __main__ - Step 58339: {'lr': 0.00034154739895271005, 'samples': 11201088, 'steps': 58338, 'loss/train': 1.4921331405639648} -08/30/2021 23:41:34 - INFO - __main__ - Step 58340: {'lr': 0.00034154246079280817, 'samples': 11201280, 'steps': 58339, 'loss/train': 1.2828714847564697} -08/30/2021 23:41:34 - INFO - __main__ - Step 58341: {'lr': 0.0003415375225916586, 'samples': 11201472, 'steps': 58340, 'loss/train': 1.5482741594314575} -08/30/2021 23:41:36 - INFO - __main__ - Step 58342: {'lr': 0.0003415325843492637, 'samples': 11201664, 'steps': 58341, 'loss/train': 0.8064612150192261} -08/30/2021 23:41:36 - INFO - __main__ - Step 58343: {'lr': 0.00034152764606562564, 'samples': 11201856, 'steps': 58342, 'loss/train': 1.6249662637710571} -08/30/2021 23:41:36 - INFO - __main__ - Step 58344: {'lr': 0.0003415227077407466, 'samples': 11202048, 'steps': 58343, 'loss/train': 1.5568772554397583} -08/30/2021 23:41:37 - INFO - __main__ - Step 58345: {'lr': 0.00034151776937462895, 'samples': 11202240, 'steps': 58344, 'loss/train': 1.4553463459014893} -08/30/2021 23:41:37 - INFO - __main__ - Step 58346: {'lr': 0.0003415128309672747, 'samples': 11202432, 'steps': 58345, 'loss/train': 3.9053075313568115} -08/30/2021 23:41:39 - INFO - __main__ - Step 58347: {'lr': 0.0003415078925186862, 'samples': 11202624, 'steps': 58346, 'loss/train': 1.044439673423767} -08/30/2021 23:41:39 - INFO - __main__ - Step 58348: {'lr': 0.00034150295402886566, 'samples': 11202816, 'steps': 58347, 'loss/train': 1.4932725429534912} -08/30/2021 23:41:39 - INFO - __main__ - Step 58349: {'lr': 0.0003414980154978153, 'samples': 11203008, 'steps': 58348, 'loss/train': 1.1157665252685547} -08/30/2021 23:41:40 - INFO - __main__ - Step 58350: {'lr': 0.00034149307692553734, 'samples': 11203200, 'steps': 58349, 'loss/train': 1.2668721675872803} -08/30/2021 23:41:40 - INFO - __main__ - Step 58351: {'lr': 0.000341488138312034, 'samples': 11203392, 'steps': 58350, 'loss/train': 1.0727137327194214} -08/30/2021 23:41:42 - INFO - __main__ - Step 58352: {'lr': 0.00034148319965730757, 'samples': 11203584, 'steps': 58351, 'loss/train': 2.1890830993652344} -08/30/2021 23:41:42 - INFO - __main__ - Step 58353: {'lr': 0.0003414782609613602, 'samples': 11203776, 'steps': 58352, 'loss/train': 1.31967031955719} -08/30/2021 23:41:43 - INFO - __main__ - Step 58354: {'lr': 0.0003414733222241941, 'samples': 11203968, 'steps': 58353, 'loss/train': 1.557159423828125} -08/30/2021 23:41:43 - INFO - __main__ - Step 58355: {'lr': 0.00034146838344581155, 'samples': 11204160, 'steps': 58354, 'loss/train': 1.4454480409622192} -08/30/2021 23:41:43 - INFO - __main__ - Step 58356: {'lr': 0.00034146344462621477, 'samples': 11204352, 'steps': 58355, 'loss/train': 1.3503144979476929} -08/30/2021 23:41:44 - INFO - __main__ - Step 58357: {'lr': 0.00034145850576540595, 'samples': 11204544, 'steps': 58356, 'loss/train': 0.9911277890205383} -08/30/2021 23:41:45 - INFO - __main__ - Step 58358: {'lr': 0.00034145356686338736, 'samples': 11204736, 'steps': 58357, 'loss/train': 1.2887252569198608} -08/30/2021 23:41:46 - INFO - __main__ - Step 58359: {'lr': 0.00034144862792016123, 'samples': 11204928, 'steps': 58358, 'loss/train': 1.0167911052703857} -08/30/2021 23:41:46 - INFO - __main__ - Step 58360: {'lr': 0.00034144368893572973, 'samples': 11205120, 'steps': 58359, 'loss/train': 1.5796236991882324} -08/30/2021 23:41:46 - INFO - __main__ - Step 58361: {'lr': 0.00034143874991009513, 'samples': 11205312, 'steps': 58360, 'loss/train': 1.3113913536071777} -08/30/2021 23:41:47 - INFO - __main__ - Step 58362: {'lr': 0.0003414338108432596, 'samples': 11205504, 'steps': 58361, 'loss/train': 1.3880691528320312} -08/30/2021 23:41:48 - INFO - __main__ - Step 58363: {'lr': 0.0003414288717352254, 'samples': 11205696, 'steps': 58362, 'loss/train': 0.9511662125587463} -08/30/2021 23:41:49 - INFO - __main__ - Step 58364: {'lr': 0.00034142393258599485, 'samples': 11205888, 'steps': 58363, 'loss/train': 1.5379542112350464} -08/30/2021 23:41:49 - INFO - __main__ - Step 58365: {'lr': 0.00034141899339557003, 'samples': 11206080, 'steps': 58364, 'loss/train': 1.3214648962020874} -08/30/2021 23:41:50 - INFO - __main__ - Step 58366: {'lr': 0.0003414140541639532, 'samples': 11206272, 'steps': 58365, 'loss/train': 0.6372202634811401} -08/30/2021 23:41:50 - INFO - __main__ - Step 58367: {'lr': 0.0003414091148911466, 'samples': 11206464, 'steps': 58366, 'loss/train': 0.2655096650123596} -08/30/2021 23:41:50 - INFO - __main__ - Step 58368: {'lr': 0.00034140417557715255, 'samples': 11206656, 'steps': 58367, 'loss/train': 0.029668845236301422} -08/30/2021 23:41:52 - INFO - __main__ - Step 58369: {'lr': 0.0003413992362219731, 'samples': 11206848, 'steps': 58368, 'loss/train': 0.02448113076388836} -08/30/2021 23:41:52 - INFO - __main__ - Step 58370: {'lr': 0.0003413942968256106, 'samples': 11207040, 'steps': 58369, 'loss/train': 1.6676126718521118} -08/30/2021 23:41:53 - INFO - __main__ - Step 58371: {'lr': 0.00034138935738806727, 'samples': 11207232, 'steps': 58370, 'loss/train': 1.2436788082122803} -08/30/2021 23:41:53 - INFO - __main__ - Step 58372: {'lr': 0.0003413844179093453, 'samples': 11207424, 'steps': 58371, 'loss/train': 1.169629454612732} -08/30/2021 23:41:53 - INFO - __main__ - Step 58373: {'lr': 0.0003413794783894468, 'samples': 11207616, 'steps': 58372, 'loss/train': 1.327942132949829} -08/30/2021 23:41:56 - INFO - __main__ - Step 58374: {'lr': 0.0003413745388283742, 'samples': 11207808, 'steps': 58373, 'loss/train': 1.7049061059951782} -08/30/2021 23:41:56 - INFO - __main__ - Step 58375: {'lr': 0.00034136959922612977, 'samples': 11208000, 'steps': 58374, 'loss/train': 0.10986167192459106} -08/30/2021 23:41:56 - INFO - __main__ - Step 58376: {'lr': 0.00034136465958271546, 'samples': 11208192, 'steps': 58375, 'loss/train': 1.5120428800582886} -08/30/2021 23:41:57 - INFO - __main__ - Step 58377: {'lr': 0.00034135971989813363, 'samples': 11208384, 'steps': 58376, 'loss/train': 0.8108828067779541} -08/30/2021 23:41:57 - INFO - __main__ - Step 58378: {'lr': 0.0003413547801723866, 'samples': 11208576, 'steps': 58377, 'loss/train': 1.3272757530212402} -08/30/2021 23:41:58 - INFO - __main__ - Step 58379: {'lr': 0.00034134984040547645, 'samples': 11208768, 'steps': 58378, 'loss/train': 1.148912787437439} -08/30/2021 23:42:00 - INFO - __main__ - Step 58380: {'lr': 0.0003413449005974055, 'samples': 11208960, 'steps': 58379, 'loss/train': 1.270913004875183} -08/30/2021 23:42:00 - INFO - __main__ - Step 58381: {'lr': 0.00034133996074817597, 'samples': 11209152, 'steps': 58380, 'loss/train': 1.4343620538711548} -08/30/2021 23:42:00 - INFO - __main__ - Step 58382: {'lr': 0.00034133502085779006, 'samples': 11209344, 'steps': 58381, 'loss/train': 1.547174096107483} -08/30/2021 23:42:01 - INFO - __main__ - Step 58383: {'lr': 0.00034133008092624995, 'samples': 11209536, 'steps': 58382, 'loss/train': 1.1758009195327759} -08/30/2021 23:42:01 - INFO - __main__ - Step 58384: {'lr': 0.0003413251409535579, 'samples': 11209728, 'steps': 58383, 'loss/train': 0.631420910358429} -08/30/2021 23:42:02 - INFO - __main__ - Step 58385: {'lr': 0.0003413202009397163, 'samples': 11209920, 'steps': 58384, 'loss/train': 0.18398058414459229} -08/30/2021 23:42:03 - INFO - __main__ - Step 58386: {'lr': 0.0003413152608847271, 'samples': 11210112, 'steps': 58385, 'loss/train': 1.3006185293197632} -08/30/2021 23:42:03 - INFO - __main__ - Step 58387: {'lr': 0.0003413103207885927, 'samples': 11210304, 'steps': 58386, 'loss/train': 0.7882906794548035} -08/30/2021 23:42:04 - INFO - __main__ - Step 58388: {'lr': 0.00034130538065131524, 'samples': 11210496, 'steps': 58387, 'loss/train': 1.257989764213562} -08/30/2021 23:42:04 - INFO - __main__ - Step 58389: {'lr': 0.000341300440472897, 'samples': 11210688, 'steps': 58388, 'loss/train': 1.9831308126449585} -08/30/2021 23:42:06 - INFO - __main__ - Step 58390: {'lr': 0.00034129550025334014, 'samples': 11210880, 'steps': 58389, 'loss/train': 1.1269623041152954} -08/30/2021 23:42:06 - INFO - __main__ - Step 58391: {'lr': 0.00034129055999264704, 'samples': 11211072, 'steps': 58390, 'loss/train': 1.4731924533843994} -08/30/2021 23:42:06 - INFO - __main__ - Step 58392: {'lr': 0.0003412856196908198, 'samples': 11211264, 'steps': 58391, 'loss/train': 0.9884055852890015} -08/30/2021 23:42:07 - INFO - __main__ - Step 58393: {'lr': 0.00034128067934786064, 'samples': 11211456, 'steps': 58392, 'loss/train': 1.8362431526184082} -08/30/2021 23:42:07 - INFO - __main__ - Step 58394: {'lr': 0.0003412757389637718, 'samples': 11211648, 'steps': 58393, 'loss/train': 0.9452770352363586} -08/30/2021 23:42:08 - INFO - __main__ - Step 58395: {'lr': 0.00034127079853855545, 'samples': 11211840, 'steps': 58394, 'loss/train': 1.2396337985992432} -08/30/2021 23:42:09 - INFO - __main__ - Step 58396: {'lr': 0.00034126585807221397, 'samples': 11212032, 'steps': 58395, 'loss/train': 1.246291160583496} -08/30/2021 23:42:09 - INFO - __main__ - Step 58397: {'lr': 0.0003412609175647495, 'samples': 11212224, 'steps': 58396, 'loss/train': 1.094338297843933} -08/30/2021 23:42:10 - INFO - __main__ - Step 58398: {'lr': 0.0003412559770161643, 'samples': 11212416, 'steps': 58397, 'loss/train': 0.86078280210495} -08/30/2021 23:42:10 - INFO - __main__ - Step 58399: {'lr': 0.0003412510364264606, 'samples': 11212608, 'steps': 58398, 'loss/train': 0.33593595027923584} -08/30/2021 23:42:10 - INFO - __main__ - Step 58400: {'lr': 0.0003412460957956405, 'samples': 11212800, 'steps': 58399, 'loss/train': 1.7203713655471802} -08/30/2021 23:42:12 - INFO - __main__ - Step 58401: {'lr': 0.00034124115512370636, 'samples': 11212992, 'steps': 58400, 'loss/train': 1.215850830078125} -08/30/2021 23:42:12 - INFO - __main__ - Step 58402: {'lr': 0.0003412362144106603, 'samples': 11213184, 'steps': 58401, 'loss/train': 2.255078077316284} -08/30/2021 23:42:13 - INFO - __main__ - Step 58403: {'lr': 0.00034123127365650463, 'samples': 11213376, 'steps': 58402, 'loss/train': 0.6384060382843018} -08/30/2021 23:42:13 - INFO - __main__ - Step 58404: {'lr': 0.0003412263328612416, 'samples': 11213568, 'steps': 58403, 'loss/train': 0.7852904796600342} -08/30/2021 23:42:13 - INFO - __main__ - Step 58405: {'lr': 0.00034122139202487334, 'samples': 11213760, 'steps': 58404, 'loss/train': 1.2657862901687622} -08/30/2021 23:42:15 - INFO - __main__ - Step 58406: {'lr': 0.00034121645114740224, 'samples': 11213952, 'steps': 58405, 'loss/train': 1.1440041065216064} -08/30/2021 23:42:16 - INFO - __main__ - Step 58407: {'lr': 0.00034121151022883033, 'samples': 11214144, 'steps': 58406, 'loss/train': 0.7610243558883667} -08/30/2021 23:42:16 - INFO - __main__ - Step 58408: {'lr': 0.00034120656926915995, 'samples': 11214336, 'steps': 58407, 'loss/train': 1.120870590209961} -08/30/2021 23:42:16 - INFO - __main__ - Step 58409: {'lr': 0.0003412016282683932, 'samples': 11214528, 'steps': 58408, 'loss/train': 1.2031358480453491} -08/30/2021 23:42:17 - INFO - __main__ - Step 58410: {'lr': 0.0003411966872265325, 'samples': 11214720, 'steps': 58409, 'loss/train': 0.04337947070598602} -08/30/2021 23:42:18 - INFO - __main__ - Step 58411: {'lr': 0.00034119174614357994, 'samples': 11214912, 'steps': 58410, 'loss/train': 1.2732492685317993} -08/30/2021 23:42:19 - INFO - __main__ - Step 58412: {'lr': 0.00034118680501953784, 'samples': 11215104, 'steps': 58411, 'loss/train': 1.3456593751907349} -08/30/2021 23:42:19 - INFO - __main__ - Step 58413: {'lr': 0.00034118186385440833, 'samples': 11215296, 'steps': 58412, 'loss/train': 1.5052320957183838} -08/30/2021 23:42:19 - INFO - __main__ - Step 58414: {'lr': 0.00034117692264819374, 'samples': 11215488, 'steps': 58413, 'loss/train': 0.8616198301315308} -08/30/2021 23:42:20 - INFO - __main__ - Step 58415: {'lr': 0.0003411719814008961, 'samples': 11215680, 'steps': 58414, 'loss/train': 1.5524102449417114} -08/30/2021 23:42:20 - INFO - __main__ - Step 58416: {'lr': 0.0003411670401125179, 'samples': 11215872, 'steps': 58415, 'loss/train': 1.472939133644104} -08/30/2021 23:42:21 - INFO - __main__ - Step 58417: {'lr': 0.00034116209878306116, 'samples': 11216064, 'steps': 58416, 'loss/train': 1.1102699041366577} -08/30/2021 23:42:22 - INFO - __main__ - Step 58418: {'lr': 0.00034115715741252824, 'samples': 11216256, 'steps': 58417, 'loss/train': 0.19590973854064941} -08/30/2021 23:42:22 - INFO - __main__ - Step 58419: {'lr': 0.0003411522160009213, 'samples': 11216448, 'steps': 58418, 'loss/train': 1.494523048400879} -08/30/2021 23:42:23 - INFO - __main__ - Step 58420: {'lr': 0.00034114727454824257, 'samples': 11216640, 'steps': 58419, 'loss/train': 1.3751004934310913} -08/30/2021 23:42:23 - INFO - __main__ - Step 58421: {'lr': 0.00034114233305449426, 'samples': 11216832, 'steps': 58420, 'loss/train': 1.1613978147506714} -08/30/2021 23:42:24 - INFO - __main__ - Step 58422: {'lr': 0.00034113739151967864, 'samples': 11217024, 'steps': 58421, 'loss/train': 0.4387499690055847} -08/30/2021 23:42:25 - INFO - __main__ - Step 58423: {'lr': 0.00034113244994379794, 'samples': 11217216, 'steps': 58422, 'loss/train': 1.5585343837738037} -08/30/2021 23:42:25 - INFO - __main__ - Step 58424: {'lr': 0.00034112750832685434, 'samples': 11217408, 'steps': 58423, 'loss/train': 1.387988567352295} -08/30/2021 23:42:26 - INFO - __main__ - Step 58425: {'lr': 0.0003411225666688501, 'samples': 11217600, 'steps': 58424, 'loss/train': 1.0463138818740845} -08/30/2021 23:42:26 - INFO - __main__ - Step 58426: {'lr': 0.0003411176249697875, 'samples': 11217792, 'steps': 58425, 'loss/train': 1.821783423423767} -08/30/2021 23:42:28 - INFO - __main__ - Step 58427: {'lr': 0.0003411126832296686, 'samples': 11217984, 'steps': 58426, 'loss/train': 1.3335225582122803} -08/30/2021 23:42:29 - INFO - __main__ - Step 58428: {'lr': 0.00034110774144849575, 'samples': 11218176, 'steps': 58427, 'loss/train': 1.253514289855957} -08/30/2021 23:42:29 - INFO - __main__ - Step 58429: {'lr': 0.00034110279962627115, 'samples': 11218368, 'steps': 58428, 'loss/train': 1.5873173475265503} -08/30/2021 23:42:29 - INFO - __main__ - Step 58430: {'lr': 0.0003410978577629971, 'samples': 11218560, 'steps': 58429, 'loss/train': 0.23265917599201202} -08/30/2021 23:42:30 - INFO - __main__ - Step 58431: {'lr': 0.0003410929158586757, 'samples': 11218752, 'steps': 58430, 'loss/train': 1.1849981546401978} -08/30/2021 23:42:31 - INFO - __main__ - Step 58432: {'lr': 0.0003410879739133093, 'samples': 11218944, 'steps': 58431, 'loss/train': 1.8296526670455933} -08/30/2021 23:42:32 - INFO - __main__ - Step 58433: {'lr': 0.00034108303192690003, 'samples': 11219136, 'steps': 58432, 'loss/train': 1.786566972732544} -08/30/2021 23:42:32 - INFO - __main__ - Step 58434: {'lr': 0.0003410780898994501, 'samples': 11219328, 'steps': 58433, 'loss/train': 1.3981993198394775} -08/30/2021 23:42:32 - INFO - __main__ - Step 58435: {'lr': 0.00034107314783096183, 'samples': 11219520, 'steps': 58434, 'loss/train': 1.4601951837539673} -08/30/2021 23:42:33 - INFO - __main__ - Step 58436: {'lr': 0.0003410682057214374, 'samples': 11219712, 'steps': 58435, 'loss/train': 2.132354497909546} -08/30/2021 23:42:34 - INFO - __main__ - Step 58437: {'lr': 0.00034106326357087905, 'samples': 11219904, 'steps': 58436, 'loss/train': 1.478259801864624} -08/30/2021 23:42:35 - INFO - __main__ - Step 58438: {'lr': 0.000341058321379289, 'samples': 11220096, 'steps': 58437, 'loss/train': 1.3704030513763428} -08/30/2021 23:42:35 - INFO - __main__ - Step 58439: {'lr': 0.0003410533791466695, 'samples': 11220288, 'steps': 58438, 'loss/train': 1.217626929283142} -08/30/2021 23:42:35 - INFO - __main__ - Step 58440: {'lr': 0.0003410484368730227, 'samples': 11220480, 'steps': 58439, 'loss/train': 1.5148245096206665} -08/30/2021 23:42:36 - INFO - __main__ - Step 58441: {'lr': 0.00034104349455835094, 'samples': 11220672, 'steps': 58440, 'loss/train': 1.871681571006775} -08/30/2021 23:42:36 - INFO - __main__ - Step 58442: {'lr': 0.0003410385522026563, 'samples': 11220864, 'steps': 58441, 'loss/train': 1.5324757099151611} -08/30/2021 23:42:37 - INFO - __main__ - Step 58443: {'lr': 0.0003410336098059412, 'samples': 11221056, 'steps': 58442, 'loss/train': 1.0603808164596558} -08/30/2021 23:42:38 - INFO - __main__ - Step 58444: {'lr': 0.0003410286673682077, 'samples': 11221248, 'steps': 58443, 'loss/train': 1.6743876934051514} -08/30/2021 23:42:38 - INFO - __main__ - Step 58445: {'lr': 0.0003410237248894581, 'samples': 11221440, 'steps': 58444, 'loss/train': 1.8098150491714478} -08/30/2021 23:42:39 - INFO - __main__ - Step 58446: {'lr': 0.00034101878236969464, 'samples': 11221632, 'steps': 58445, 'loss/train': 1.6807851791381836} -08/30/2021 23:42:39 - INFO - __main__ - Step 58447: {'lr': 0.0003410138398089195, 'samples': 11221824, 'steps': 58446, 'loss/train': 1.5474516153335571} -08/30/2021 23:42:40 - INFO - __main__ - Step 58448: {'lr': 0.0003410088972071349, 'samples': 11222016, 'steps': 58447, 'loss/train': 0.9095951914787292} -08/30/2021 23:42:41 - INFO - __main__ - Step 58449: {'lr': 0.0003410039545643431, 'samples': 11222208, 'steps': 58448, 'loss/train': 1.4669469594955444} -08/30/2021 23:42:41 - INFO - __main__ - Step 58450: {'lr': 0.0003409990118805463, 'samples': 11222400, 'steps': 58449, 'loss/train': 1.2733420133590698} -08/30/2021 23:42:42 - INFO - __main__ - Step 58451: {'lr': 0.0003409940691557468, 'samples': 11222592, 'steps': 58450, 'loss/train': 1.3465402126312256} -08/30/2021 23:42:42 - INFO - __main__ - Step 58452: {'lr': 0.0003409891263899467, 'samples': 11222784, 'steps': 58451, 'loss/train': 1.3954256772994995} -08/30/2021 23:42:44 - INFO - __main__ - Step 58453: {'lr': 0.0003409841835831484, 'samples': 11222976, 'steps': 58452, 'loss/train': 0.5714172720909119} -08/30/2021 23:42:44 - INFO - __main__ - Step 58454: {'lr': 0.000340979240735354, 'samples': 11223168, 'steps': 58453, 'loss/train': 1.2832716703414917} -08/30/2021 23:42:44 - INFO - __main__ - Step 58455: {'lr': 0.00034097429784656574, 'samples': 11223360, 'steps': 58454, 'loss/train': 0.8252901434898376} -08/30/2021 23:42:45 - INFO - __main__ - Step 58456: {'lr': 0.00034096935491678595, 'samples': 11223552, 'steps': 58455, 'loss/train': 1.4410642385482788} -08/30/2021 23:42:45 - INFO - __main__ - Step 58457: {'lr': 0.0003409644119460166, 'samples': 11223744, 'steps': 58456, 'loss/train': 1.3467967510223389} -08/30/2021 23:42:47 - INFO - __main__ - Step 58458: {'lr': 0.00034095946893426024, 'samples': 11223936, 'steps': 58457, 'loss/train': 1.1955325603485107} -08/30/2021 23:42:47 - INFO - __main__ - Step 58459: {'lr': 0.0003409545258815189, 'samples': 11224128, 'steps': 58458, 'loss/train': 2.233649969100952} -08/30/2021 23:42:47 - INFO - __main__ - Step 58460: {'lr': 0.00034094958278779486, 'samples': 11224320, 'steps': 58459, 'loss/train': 1.1679543256759644} -08/30/2021 23:42:48 - INFO - __main__ - Step 58461: {'lr': 0.00034094463965309035, 'samples': 11224512, 'steps': 58460, 'loss/train': 1.3892271518707275} -08/30/2021 23:42:48 - INFO - __main__ - Step 58462: {'lr': 0.00034093969647740755, 'samples': 11224704, 'steps': 58461, 'loss/train': 1.3748226165771484} -08/30/2021 23:42:50 - INFO - __main__ - Step 58463: {'lr': 0.00034093475326074874, 'samples': 11224896, 'steps': 58462, 'loss/train': 1.650243878364563} -08/30/2021 23:42:50 - INFO - __main__ - Step 58464: {'lr': 0.00034092981000311614, 'samples': 11225088, 'steps': 58463, 'loss/train': 0.25024887919425964} -08/30/2021 23:42:51 - INFO - __main__ - Step 58465: {'lr': 0.00034092486670451197, 'samples': 11225280, 'steps': 58464, 'loss/train': 0.8582757115364075} -08/30/2021 23:42:51 - INFO - __main__ - Step 58466: {'lr': 0.0003409199233649385, 'samples': 11225472, 'steps': 58465, 'loss/train': 1.2698558568954468} -08/30/2021 23:42:51 - INFO - __main__ - Step 58467: {'lr': 0.0003409149799843979, 'samples': 11225664, 'steps': 58466, 'loss/train': 1.504538655281067} -08/30/2021 23:42:52 - INFO - __main__ - Step 58468: {'lr': 0.00034091003656289235, 'samples': 11225856, 'steps': 58467, 'loss/train': 1.4923176765441895} -08/30/2021 23:42:53 - INFO - __main__ - Step 58469: {'lr': 0.00034090509310042414, 'samples': 11226048, 'steps': 58468, 'loss/train': 1.2800734043121338} -08/30/2021 23:42:54 - INFO - __main__ - Step 58470: {'lr': 0.00034090014959699554, 'samples': 11226240, 'steps': 58469, 'loss/train': 1.1687654256820679} -08/30/2021 23:42:54 - INFO - __main__ - Step 58471: {'lr': 0.0003408952060526087, 'samples': 11226432, 'steps': 58470, 'loss/train': 1.4248583316802979} -08/30/2021 23:42:54 - INFO - __main__ - Step 58472: {'lr': 0.00034089026246726596, 'samples': 11226624, 'steps': 58471, 'loss/train': 1.5376399755477905} -08/30/2021 23:42:55 - INFO - __main__ - Step 58473: {'lr': 0.00034088531884096944, 'samples': 11226816, 'steps': 58472, 'loss/train': 1.5004537105560303} -08/30/2021 23:42:56 - INFO - __main__ - Step 58474: {'lr': 0.0003408803751737214, 'samples': 11227008, 'steps': 58473, 'loss/train': 1.8636672496795654} -08/30/2021 23:42:57 - INFO - __main__ - Step 58475: {'lr': 0.00034087543146552404, 'samples': 11227200, 'steps': 58474, 'loss/train': 1.744942307472229} -08/30/2021 23:42:57 - INFO - __main__ - Step 58476: {'lr': 0.0003408704877163796, 'samples': 11227392, 'steps': 58475, 'loss/train': 1.6072520017623901} -08/30/2021 23:42:57 - INFO - __main__ - Step 58477: {'lr': 0.00034086554392629033, 'samples': 11227584, 'steps': 58476, 'loss/train': 0.9681432843208313} -08/30/2021 23:42:58 - INFO - __main__ - Step 58478: {'lr': 0.00034086060009525844, 'samples': 11227776, 'steps': 58477, 'loss/train': 1.4817302227020264} -08/30/2021 23:43:00 - INFO - __main__ - Step 58479: {'lr': 0.0003408556562232862, 'samples': 11227968, 'steps': 58478, 'loss/train': 1.2142415046691895} -08/30/2021 23:43:00 - INFO - __main__ - Step 58480: {'lr': 0.00034085071231037585, 'samples': 11228160, 'steps': 58479, 'loss/train': 1.4783388376235962} -08/30/2021 23:43:00 - INFO - __main__ - Step 58481: {'lr': 0.0003408457683565295, 'samples': 11228352, 'steps': 58480, 'loss/train': 1.5649255514144897} -08/30/2021 23:43:01 - INFO - __main__ - Step 58482: {'lr': 0.00034084082436174946, 'samples': 11228544, 'steps': 58481, 'loss/train': 1.256433367729187} -08/30/2021 23:43:01 - INFO - __main__ - Step 58483: {'lr': 0.0003408358803260379, 'samples': 11228736, 'steps': 58482, 'loss/train': 1.355131983757019} -08/30/2021 23:43:01 - INFO - __main__ - Step 58484: {'lr': 0.00034083093624939716, 'samples': 11228928, 'steps': 58483, 'loss/train': 1.467124342918396} -08/30/2021 23:43:03 - INFO - __main__ - Step 58485: {'lr': 0.00034082599213182933, 'samples': 11229120, 'steps': 58484, 'loss/train': 1.0623458623886108} -08/30/2021 23:43:04 - INFO - __main__ - Step 58486: {'lr': 0.0003408210479733368, 'samples': 11229312, 'steps': 58485, 'loss/train': 0.13869057595729828} -08/30/2021 23:43:04 - INFO - __main__ - Step 58487: {'lr': 0.0003408161037739217, 'samples': 11229504, 'steps': 58486, 'loss/train': 1.1083955764770508} -08/30/2021 23:43:05 - INFO - __main__ - Step 58488: {'lr': 0.0003408111595335862, 'samples': 11229696, 'steps': 58487, 'loss/train': 1.5257197618484497} -08/30/2021 23:43:05 - INFO - __main__ - Step 58489: {'lr': 0.00034080621525233264, 'samples': 11229888, 'steps': 58488, 'loss/train': 1.21271550655365} -08/30/2021 23:43:06 - INFO - __main__ - Step 58490: {'lr': 0.0003408012709301632, 'samples': 11230080, 'steps': 58489, 'loss/train': 1.4456794261932373} -08/30/2021 23:43:07 - INFO - __main__ - Step 58491: {'lr': 0.00034079632656708005, 'samples': 11230272, 'steps': 58490, 'loss/train': 1.403703212738037} -08/30/2021 23:43:07 - INFO - __main__ - Step 58492: {'lr': 0.00034079138216308553, 'samples': 11230464, 'steps': 58491, 'loss/train': 1.660502314567566} -08/30/2021 23:43:08 - INFO - __main__ - Step 58493: {'lr': 0.00034078643771818184, 'samples': 11230656, 'steps': 58492, 'loss/train': 1.5445058345794678} -08/30/2021 23:43:08 - INFO - __main__ - Step 58494: {'lr': 0.00034078149323237114, 'samples': 11230848, 'steps': 58493, 'loss/train': 1.618409514427185} -08/30/2021 23:43:10 - INFO - __main__ - Step 58495: {'lr': 0.00034077654870565566, 'samples': 11231040, 'steps': 58494, 'loss/train': 0.9836156368255615} -08/30/2021 23:43:10 - INFO - __main__ - Step 58496: {'lr': 0.00034077160413803774, 'samples': 11231232, 'steps': 58495, 'loss/train': 1.3215492963790894} -08/30/2021 23:43:10 - INFO - __main__ - Step 58497: {'lr': 0.0003407666595295195, 'samples': 11231424, 'steps': 58496, 'loss/train': 0.4603157639503479} -08/30/2021 23:43:11 - INFO - __main__ - Step 58498: {'lr': 0.0003407617148801033, 'samples': 11231616, 'steps': 58497, 'loss/train': 1.0663371086120605} -08/30/2021 23:43:11 - INFO - __main__ - Step 58499: {'lr': 0.0003407567701897911, 'samples': 11231808, 'steps': 58498, 'loss/train': 1.4457542896270752} -08/30/2021 23:43:13 - INFO - __main__ - Step 58500: {'lr': 0.0003407518254585854, 'samples': 11232000, 'steps': 58499, 'loss/train': 0.9328857660293579} -08/30/2021 23:43:13 - INFO - __main__ - Step 58501: {'lr': 0.0003407468806864883, 'samples': 11232192, 'steps': 58500, 'loss/train': 1.7675741910934448} -08/30/2021 23:43:13 - INFO - __main__ - Step 58502: {'lr': 0.0003407419358735021, 'samples': 11232384, 'steps': 58501, 'loss/train': 0.7371501922607422} -08/30/2021 23:43:14 - INFO - __main__ - Step 58503: {'lr': 0.0003407369910196289, 'samples': 11232576, 'steps': 58502, 'loss/train': 1.3097244501113892} -08/30/2021 23:43:14 - INFO - __main__ - Step 58504: {'lr': 0.0003407320461248711, 'samples': 11232768, 'steps': 58503, 'loss/train': 0.7195886373519897} -08/30/2021 23:43:16 - INFO - __main__ - Step 58505: {'lr': 0.00034072710118923086, 'samples': 11232960, 'steps': 58504, 'loss/train': 0.927277684211731} -08/30/2021 23:43:16 - INFO - __main__ - Step 58506: {'lr': 0.0003407221562127103, 'samples': 11233152, 'steps': 58505, 'loss/train': 1.2948977947235107} -08/30/2021 23:43:16 - INFO - __main__ - Step 58507: {'lr': 0.0003407172111953117, 'samples': 11233344, 'steps': 58506, 'loss/train': 1.105934977531433} -08/30/2021 23:43:17 - INFO - __main__ - Step 58508: {'lr': 0.00034071226613703744, 'samples': 11233536, 'steps': 58507, 'loss/train': 1.422202467918396} -08/30/2021 23:43:17 - INFO - __main__ - Step 58509: {'lr': 0.0003407073210378897, 'samples': 11233728, 'steps': 58508, 'loss/train': 1.1649856567382812} -08/30/2021 23:43:17 - INFO - __main__ - Step 58510: {'lr': 0.00034070237589787047, 'samples': 11233920, 'steps': 58509, 'loss/train': 1.3617955446243286} -08/30/2021 23:43:19 - INFO - __main__ - Step 58511: {'lr': 0.00034069743071698215, 'samples': 11234112, 'steps': 58510, 'loss/train': 1.4471343755722046} -08/30/2021 23:43:19 - INFO - __main__ - Step 58512: {'lr': 0.000340692485495227, 'samples': 11234304, 'steps': 58511, 'loss/train': 1.0367512702941895} -08/30/2021 23:43:20 - INFO - __main__ - Step 58513: {'lr': 0.0003406875402326073, 'samples': 11234496, 'steps': 58512, 'loss/train': 1.8381812572479248} -08/30/2021 23:43:20 - INFO - __main__ - Step 58514: {'lr': 0.00034068259492912514, 'samples': 11234688, 'steps': 58513, 'loss/train': 1.0300136804580688} -08/30/2021 23:43:21 - INFO - __main__ - Step 58515: {'lr': 0.00034067764958478283, 'samples': 11234880, 'steps': 58514, 'loss/train': 1.3457248210906982} -08/30/2021 23:43:22 - INFO - __main__ - Step 58516: {'lr': 0.0003406727041995825, 'samples': 11235072, 'steps': 58515, 'loss/train': 1.3284367322921753} -08/30/2021 23:43:22 - INFO - __main__ - Step 58517: {'lr': 0.00034066775877352644, 'samples': 11235264, 'steps': 58516, 'loss/train': 0.7124446034431458} -08/30/2021 23:43:23 - INFO - __main__ - Step 58518: {'lr': 0.00034066281330661697, 'samples': 11235456, 'steps': 58517, 'loss/train': 0.8736456632614136} -08/30/2021 23:43:23 - INFO - __main__ - Step 58519: {'lr': 0.0003406578677988562, 'samples': 11235648, 'steps': 58518, 'loss/train': 1.5253947973251343} -08/30/2021 23:43:23 - INFO - __main__ - Step 58520: {'lr': 0.00034065292225024643, 'samples': 11235840, 'steps': 58519, 'loss/train': 1.394162893295288} -08/30/2021 23:43:25 - INFO - __main__ - Step 58521: {'lr': 0.0003406479766607898, 'samples': 11236032, 'steps': 58520, 'loss/train': 0.8299336433410645} -08/30/2021 23:43:25 - INFO - __main__ - Step 58522: {'lr': 0.00034064303103048863, 'samples': 11236224, 'steps': 58521, 'loss/train': 1.7708333730697632} -08/30/2021 23:43:26 - INFO - __main__ - Step 58523: {'lr': 0.000340638085359345, 'samples': 11236416, 'steps': 58522, 'loss/train': 1.3864572048187256} -08/30/2021 23:43:26 - INFO - __main__ - Step 58524: {'lr': 0.00034063313964736135, 'samples': 11236608, 'steps': 58523, 'loss/train': 1.2743518352508545} -08/30/2021 23:43:26 - INFO - __main__ - Step 58525: {'lr': 0.0003406281938945398, 'samples': 11236800, 'steps': 58524, 'loss/train': 1.696038842201233} -08/30/2021 23:43:28 - INFO - __main__ - Step 58526: {'lr': 0.0003406232481008825, 'samples': 11236992, 'steps': 58525, 'loss/train': 1.4155510663986206} -08/30/2021 23:43:28 - INFO - __main__ - Step 58527: {'lr': 0.0003406183022663919, 'samples': 11237184, 'steps': 58526, 'loss/train': 0.8133142590522766} -08/30/2021 23:43:29 - INFO - __main__ - Step 58528: {'lr': 0.00034061335639107006, 'samples': 11237376, 'steps': 58527, 'loss/train': 1.2449642419815063} -08/30/2021 23:43:29 - INFO - __main__ - Step 58529: {'lr': 0.0003406084104749192, 'samples': 11237568, 'steps': 58528, 'loss/train': 1.313981533050537} -08/30/2021 23:43:29 - INFO - __main__ - Step 58530: {'lr': 0.00034060346451794156, 'samples': 11237760, 'steps': 58529, 'loss/train': 1.017622947692871} -08/30/2021 23:43:31 - INFO - __main__ - Step 58531: {'lr': 0.0003405985185201394, 'samples': 11237952, 'steps': 58530, 'loss/train': 1.13120698928833} -08/30/2021 23:43:32 - INFO - __main__ - Step 58532: {'lr': 0.000340593572481515, 'samples': 11238144, 'steps': 58531, 'loss/train': 1.9550281763076782} -08/30/2021 23:43:32 - INFO - __main__ - Step 58533: {'lr': 0.0003405886264020706, 'samples': 11238336, 'steps': 58532, 'loss/train': 1.1073040962219238} -08/30/2021 23:43:32 - INFO - __main__ - Step 58534: {'lr': 0.0003405836802818082, 'samples': 11238528, 'steps': 58533, 'loss/train': 0.8942179679870605} -08/30/2021 23:43:33 - INFO - __main__ - Step 58535: {'lr': 0.00034057873412073026, 'samples': 11238720, 'steps': 58534, 'loss/train': 0.8154551982879639} -08/30/2021 23:43:35 - INFO - __main__ - Step 58536: {'lr': 0.0003405737879188389, 'samples': 11238912, 'steps': 58535, 'loss/train': 0.7828736305236816} -08/30/2021 23:43:35 - INFO - __main__ - Step 58537: {'lr': 0.0003405688416761364, 'samples': 11239104, 'steps': 58536, 'loss/train': 1.2096621990203857} -08/30/2021 23:43:36 - INFO - __main__ - Step 58538: {'lr': 0.00034056389539262506, 'samples': 11239296, 'steps': 58537, 'loss/train': 1.1198557615280151} -08/30/2021 23:43:36 - INFO - __main__ - Step 58539: {'lr': 0.000340558949068307, 'samples': 11239488, 'steps': 58538, 'loss/train': 1.1630693674087524} -08/30/2021 23:43:37 - INFO - __main__ - Step 58540: {'lr': 0.0003405540027031845, 'samples': 11239680, 'steps': 58539, 'loss/train': 1.561592698097229} -08/30/2021 23:43:38 - INFO - __main__ - Step 58541: {'lr': 0.00034054905629725965, 'samples': 11239872, 'steps': 58540, 'loss/train': 1.2983131408691406} -08/30/2021 23:43:39 - INFO - __main__ - Step 58542: {'lr': 0.00034054410985053483, 'samples': 11240064, 'steps': 58541, 'loss/train': 1.3339262008666992} -08/30/2021 23:43:39 - INFO - __main__ - Step 58543: {'lr': 0.00034053916336301225, 'samples': 11240256, 'steps': 58542, 'loss/train': 1.4180879592895508} -08/30/2021 23:43:39 - INFO - __main__ - Step 58544: {'lr': 0.00034053421683469416, 'samples': 11240448, 'steps': 58543, 'loss/train': 1.3751170635223389} -08/30/2021 23:43:40 - INFO - __main__ - Step 58545: {'lr': 0.00034052927026558265, 'samples': 11240640, 'steps': 58544, 'loss/train': 0.98646080493927} -08/30/2021 23:43:40 - INFO - __main__ - Step 58546: {'lr': 0.00034052432365568015, 'samples': 11240832, 'steps': 58545, 'loss/train': 0.5625841021537781} -08/30/2021 23:43:41 - INFO - __main__ - Step 58547: {'lr': 0.0003405193770049888, 'samples': 11241024, 'steps': 58546, 'loss/train': 1.4577291011810303} -08/30/2021 23:43:42 - INFO - __main__ - Step 58548: {'lr': 0.0003405144303135108, 'samples': 11241216, 'steps': 58547, 'loss/train': 1.2476330995559692} -08/30/2021 23:43:42 - INFO - __main__ - Step 58549: {'lr': 0.00034050948358124836, 'samples': 11241408, 'steps': 58548, 'loss/train': 1.0030964612960815} -08/30/2021 23:43:43 - INFO - __main__ - Step 58550: {'lr': 0.00034050453680820373, 'samples': 11241600, 'steps': 58549, 'loss/train': 1.7929127216339111} -08/30/2021 23:43:43 - INFO - __main__ - Step 58551: {'lr': 0.0003404995899943791, 'samples': 11241792, 'steps': 58550, 'loss/train': 1.6089800596237183} -08/30/2021 23:43:44 - INFO - __main__ - Step 58552: {'lr': 0.00034049464313977684, 'samples': 11241984, 'steps': 58551, 'loss/train': 1.3833897113800049} -08/30/2021 23:43:45 - INFO - __main__ - Step 58553: {'lr': 0.0003404896962443991, 'samples': 11242176, 'steps': 58552, 'loss/train': 1.0605577230453491} -08/30/2021 23:43:45 - INFO - __main__ - Step 58554: {'lr': 0.0003404847493082481, 'samples': 11242368, 'steps': 58553, 'loss/train': 0.8979097604751587} -08/30/2021 23:43:46 - INFO - __main__ - Step 58555: {'lr': 0.000340479802331326, 'samples': 11242560, 'steps': 58554, 'loss/train': 4.266524791717529} -08/30/2021 23:43:46 - INFO - __main__ - Step 58556: {'lr': 0.0003404748553136351, 'samples': 11242752, 'steps': 58555, 'loss/train': 1.3507206439971924} -08/30/2021 23:43:47 - INFO - __main__ - Step 58557: {'lr': 0.00034046990825517765, 'samples': 11242944, 'steps': 58556, 'loss/train': 1.5242642164230347} -08/30/2021 23:43:48 - INFO - __main__ - Step 58558: {'lr': 0.0003404649611559559, 'samples': 11243136, 'steps': 58557, 'loss/train': 1.3444191217422485} -08/30/2021 23:43:48 - INFO - __main__ - Step 58559: {'lr': 0.0003404600140159719, 'samples': 11243328, 'steps': 58558, 'loss/train': 1.7055398225784302} -08/30/2021 23:43:49 - INFO - __main__ - Step 58560: {'lr': 0.0003404550668352282, 'samples': 11243520, 'steps': 58559, 'loss/train': 0.5438639521598816} -08/30/2021 23:43:49 - INFO - __main__ - Step 58561: {'lr': 0.00034045011961372676, 'samples': 11243712, 'steps': 58560, 'loss/train': 1.2897387742996216} -08/30/2021 23:43:50 - INFO - __main__ - Step 58562: {'lr': 0.0003404451723514699, 'samples': 11243904, 'steps': 58561, 'loss/train': 1.2012020349502563} -08/30/2021 23:43:51 - INFO - __main__ - Step 58563: {'lr': 0.00034044022504845986, 'samples': 11244096, 'steps': 58562, 'loss/train': 1.4125726222991943} -08/30/2021 23:43:51 - INFO - __main__ - Step 58564: {'lr': 0.00034043527770469874, 'samples': 11244288, 'steps': 58563, 'loss/train': 1.2554422616958618} -08/30/2021 23:43:52 - INFO - __main__ - Step 58565: {'lr': 0.00034043033032018897, 'samples': 11244480, 'steps': 58564, 'loss/train': 1.2383854389190674} -08/30/2021 23:43:52 - INFO - __main__ - Step 58566: {'lr': 0.00034042538289493266, 'samples': 11244672, 'steps': 58565, 'loss/train': 2.2003026008605957} -08/30/2021 23:43:54 - INFO - __main__ - Step 58567: {'lr': 0.00034042043542893214, 'samples': 11244864, 'steps': 58566, 'loss/train': 0.8212010860443115} -08/30/2021 23:43:54 - INFO - __main__ - Step 58568: {'lr': 0.0003404154879221895, 'samples': 11245056, 'steps': 58567, 'loss/train': 1.3356879949569702} -08/30/2021 23:43:54 - INFO - __main__ - Step 58569: {'lr': 0.00034041054037470703, 'samples': 11245248, 'steps': 58568, 'loss/train': 1.1337552070617676} -08/30/2021 23:43:55 - INFO - __main__ - Step 58570: {'lr': 0.00034040559278648695, 'samples': 11245440, 'steps': 58569, 'loss/train': 1.671465516090393} -08/30/2021 23:43:55 - INFO - __main__ - Step 58571: {'lr': 0.00034040064515753154, 'samples': 11245632, 'steps': 58570, 'loss/train': 2.649855852127075} -08/30/2021 23:43:57 - INFO - __main__ - Step 58572: {'lr': 0.000340395697487843, 'samples': 11245824, 'steps': 58571, 'loss/train': 1.4615247249603271} -08/30/2021 23:43:57 - INFO - __main__ - Step 58573: {'lr': 0.00034039074977742356, 'samples': 11246016, 'steps': 58572, 'loss/train': 1.5947604179382324} -08/30/2021 23:43:57 - INFO - __main__ - Step 58574: {'lr': 0.00034038580202627543, 'samples': 11246208, 'steps': 58573, 'loss/train': 0.818996787071228} -08/30/2021 23:43:58 - INFO - __main__ - Step 58575: {'lr': 0.0003403808542344009, 'samples': 11246400, 'steps': 58574, 'loss/train': 1.6902351379394531} -08/30/2021 23:43:58 - INFO - __main__ - Step 58576: {'lr': 0.00034037590640180205, 'samples': 11246592, 'steps': 58575, 'loss/train': 1.5108747482299805} -08/30/2021 23:44:00 - INFO - __main__ - Step 58577: {'lr': 0.00034037095852848125, 'samples': 11246784, 'steps': 58576, 'loss/train': 1.452622890472412} -08/30/2021 23:44:00 - INFO - __main__ - Step 58578: {'lr': 0.00034036601061444074, 'samples': 11246976, 'steps': 58577, 'loss/train': 1.2887787818908691} -08/30/2021 23:44:01 - INFO - __main__ - Step 58579: {'lr': 0.00034036106265968263, 'samples': 11247168, 'steps': 58578, 'loss/train': 1.8293622732162476} -08/30/2021 23:44:01 - INFO - __main__ - Step 58580: {'lr': 0.00034035611466420927, 'samples': 11247360, 'steps': 58579, 'loss/train': 1.3499797582626343} -08/30/2021 23:44:01 - INFO - __main__ - Step 58581: {'lr': 0.00034035116662802287, 'samples': 11247552, 'steps': 58580, 'loss/train': 1.6696134805679321} -08/30/2021 23:44:02 - INFO - __main__ - Step 58582: {'lr': 0.0003403462185511256, 'samples': 11247744, 'steps': 58581, 'loss/train': 1.1487683057785034} -08/30/2021 23:44:03 - INFO - __main__ - Step 58583: {'lr': 0.0003403412704335196, 'samples': 11247936, 'steps': 58582, 'loss/train': 1.540053367614746} -08/30/2021 23:44:04 - INFO - __main__ - Step 58584: {'lr': 0.0003403363222752074, 'samples': 11248128, 'steps': 58583, 'loss/train': 0.6843742728233337} -08/30/2021 23:44:04 - INFO - __main__ - Step 58585: {'lr': 0.0003403313740761909, 'samples': 11248320, 'steps': 58584, 'loss/train': 0.9619364738464355} -08/30/2021 23:44:04 - INFO - __main__ - Step 58586: {'lr': 0.00034032642583647254, 'samples': 11248512, 'steps': 58585, 'loss/train': 1.7156606912612915} -08/30/2021 23:44:05 - INFO - __main__ - Step 58587: {'lr': 0.0003403214775560545, 'samples': 11248704, 'steps': 58586, 'loss/train': 0.714686393737793} -08/30/2021 23:44:07 - INFO - __main__ - Step 58588: {'lr': 0.000340316529234939, 'samples': 11248896, 'steps': 58587, 'loss/train': 0.9419745802879333} -08/30/2021 23:44:07 - INFO - __main__ - Step 58589: {'lr': 0.00034031158087312823, 'samples': 11249088, 'steps': 58588, 'loss/train': 0.6213420033454895} -08/30/2021 23:44:08 - INFO - __main__ - Step 58590: {'lr': 0.0003403066324706245, 'samples': 11249280, 'steps': 58589, 'loss/train': 1.5234297513961792} -08/30/2021 23:44:08 - INFO - __main__ - Step 58591: {'lr': 0.00034030168402742996, 'samples': 11249472, 'steps': 58590, 'loss/train': 1.1701195240020752} -08/30/2021 23:44:08 - INFO - __main__ - Step 58592: {'lr': 0.0003402967355435469, 'samples': 11249664, 'steps': 58591, 'loss/train': 1.2197644710540771} -08/30/2021 23:44:10 - INFO - __main__ - Step 58593: {'lr': 0.00034029178701897744, 'samples': 11249856, 'steps': 58592, 'loss/train': 1.5269335508346558} -08/30/2021 23:44:11 - INFO - __main__ - Step 58594: {'lr': 0.00034028683845372407, 'samples': 11250048, 'steps': 58593, 'loss/train': 1.262350082397461} -08/30/2021 23:44:11 - INFO - __main__ - Step 58595: {'lr': 0.00034028188984778867, 'samples': 11250240, 'steps': 58594, 'loss/train': 0.04223304241895676} -08/30/2021 23:44:11 - INFO - __main__ - Step 58596: {'lr': 0.0003402769412011737, 'samples': 11250432, 'steps': 58595, 'loss/train': 0.06784778833389282} -08/30/2021 23:44:12 - INFO - __main__ - Step 58597: {'lr': 0.00034027199251388137, 'samples': 11250624, 'steps': 58596, 'loss/train': 1.508138656616211} -08/30/2021 23:44:12 - INFO - __main__ - Step 58598: {'lr': 0.0003402670437859138, 'samples': 11250816, 'steps': 58597, 'loss/train': 0.7740739583969116} -08/30/2021 23:44:14 - INFO - __main__ - Step 58599: {'lr': 0.0003402620950172733, 'samples': 11251008, 'steps': 58598, 'loss/train': 1.517117977142334} -08/30/2021 23:44:15 - INFO - __main__ - Step 58600: {'lr': 0.00034025714620796225, 'samples': 11251200, 'steps': 58599, 'loss/train': 0.7694681882858276} -08/30/2021 23:44:15 - INFO - __main__ - Step 58601: {'lr': 0.0003402521973579826, 'samples': 11251392, 'steps': 58600, 'loss/train': 1.7149394750595093} -08/30/2021 23:44:15 - INFO - __main__ - Step 58602: {'lr': 0.00034024724846733667, 'samples': 11251584, 'steps': 58601, 'loss/train': 1.1592369079589844} -08/30/2021 23:44:16 - INFO - __main__ - Step 58603: {'lr': 0.0003402422995360268, 'samples': 11251776, 'steps': 58602, 'loss/train': 1.1043370962142944} -08/30/2021 23:44:16 - INFO - __main__ - Step 58604: {'lr': 0.00034023735056405507, 'samples': 11251968, 'steps': 58603, 'loss/train': 1.4269009828567505} -08/30/2021 23:44:18 - INFO - __main__ - Step 58605: {'lr': 0.00034023240155142383, 'samples': 11252160, 'steps': 58604, 'loss/train': 0.9237139821052551} -08/30/2021 23:44:18 - INFO - __main__ - Step 58606: {'lr': 0.00034022745249813523, 'samples': 11252352, 'steps': 58605, 'loss/train': 1.3100820779800415} -08/30/2021 23:44:19 - INFO - __main__ - Step 58607: {'lr': 0.0003402225034041916, 'samples': 11252544, 'steps': 58606, 'loss/train': 1.4197008609771729} -08/30/2021 23:44:19 - INFO - __main__ - Step 58608: {'lr': 0.000340217554269595, 'samples': 11252736, 'steps': 58607, 'loss/train': 4.563615798950195} -08/30/2021 23:44:19 - INFO - __main__ - Step 58609: {'lr': 0.00034021260509434784, 'samples': 11252928, 'steps': 58608, 'loss/train': 1.6371595859527588} -08/30/2021 23:44:21 - INFO - __main__ - Step 58610: {'lr': 0.0003402076558784522, 'samples': 11253120, 'steps': 58609, 'loss/train': 1.1750199794769287} -08/30/2021 23:44:21 - INFO - __main__ - Step 58611: {'lr': 0.00034020270662191046, 'samples': 11253312, 'steps': 58610, 'loss/train': 1.3374089002609253} -08/30/2021 23:44:22 - INFO - __main__ - Step 58612: {'lr': 0.00034019775732472467, 'samples': 11253504, 'steps': 58611, 'loss/train': 5.810057640075684} -08/30/2021 23:44:22 - INFO - __main__ - Step 58613: {'lr': 0.0003401928079868973, 'samples': 11253696, 'steps': 58612, 'loss/train': 2.313693046569824} -08/30/2021 23:44:23 - INFO - __main__ - Step 58614: {'lr': 0.0003401878586084304, 'samples': 11253888, 'steps': 58613, 'loss/train': 1.7675833702087402} -08/30/2021 23:44:23 - INFO - __main__ - Step 58615: {'lr': 0.0003401829091893262, 'samples': 11254080, 'steps': 58614, 'loss/train': 1.431160569190979} -08/30/2021 23:44:25 - INFO - __main__ - Step 58616: {'lr': 0.000340177959729587, 'samples': 11254272, 'steps': 58615, 'loss/train': 3.1185641288757324} -08/30/2021 23:44:25 - INFO - __main__ - Step 58617: {'lr': 0.000340173010229215, 'samples': 11254464, 'steps': 58616, 'loss/train': 2.082977056503296} -08/30/2021 23:44:25 - INFO - __main__ - Step 58618: {'lr': 0.0003401680606882124, 'samples': 11254656, 'steps': 58617, 'loss/train': 1.5103776454925537} -08/30/2021 23:44:26 - INFO - __main__ - Step 58619: {'lr': 0.0003401631111065815, 'samples': 11254848, 'steps': 58618, 'loss/train': 1.5038206577301025} -08/30/2021 23:44:26 - INFO - __main__ - Step 58620: {'lr': 0.0003401581614843244, 'samples': 11255040, 'steps': 58619, 'loss/train': 1.5555760860443115} -08/30/2021 23:44:26 - INFO - __main__ - Step 58621: {'lr': 0.00034015321182144357, 'samples': 11255232, 'steps': 58620, 'loss/train': 1.083202838897705} -08/30/2021 23:44:28 - INFO - __main__ - Step 58622: {'lr': 0.00034014826211794104, 'samples': 11255424, 'steps': 58621, 'loss/train': 0.03790397197008133} -08/30/2021 23:44:28 - INFO - __main__ - Step 58623: {'lr': 0.0003401433123738191, 'samples': 11255616, 'steps': 58622, 'loss/train': 1.2019463777542114} -08/30/2021 23:44:29 - INFO - __main__ - Step 58624: {'lr': 0.00034013836258907994, 'samples': 11255808, 'steps': 58623, 'loss/train': 1.3544248342514038} -08/30/2021 23:44:29 - INFO - __main__ - Step 58625: {'lr': 0.0003401334127637258, 'samples': 11256000, 'steps': 58624, 'loss/train': 1.3162786960601807} -08/30/2021 23:44:29 - INFO - __main__ - Step 58626: {'lr': 0.000340128462897759, 'samples': 11256192, 'steps': 58625, 'loss/train': 1.0081450939178467} -08/30/2021 23:44:31 - INFO - __main__ - Step 58627: {'lr': 0.0003401235129911817, 'samples': 11256384, 'steps': 58626, 'loss/train': 1.1143519878387451} -08/30/2021 23:44:31 - INFO - __main__ - Step 58628: {'lr': 0.0003401185630439961, 'samples': 11256576, 'steps': 58627, 'loss/train': 1.4830524921417236} -08/30/2021 23:44:32 - INFO - __main__ - Step 58629: {'lr': 0.0003401136130562045, 'samples': 11256768, 'steps': 58628, 'loss/train': 1.7404817342758179} -08/30/2021 23:44:32 - INFO - __main__ - Step 58630: {'lr': 0.0003401086630278091, 'samples': 11256960, 'steps': 58629, 'loss/train': 2.3203773498535156} -08/30/2021 23:44:33 - INFO - __main__ - Step 58631: {'lr': 0.00034010371295881207, 'samples': 11257152, 'steps': 58630, 'loss/train': 1.4743072986602783} -08/30/2021 23:44:33 - INFO - __main__ - Step 58632: {'lr': 0.00034009876284921576, 'samples': 11257344, 'steps': 58631, 'loss/train': 1.2115086317062378} -08/30/2021 23:44:34 - INFO - __main__ - Step 58633: {'lr': 0.00034009381269902236, 'samples': 11257536, 'steps': 58632, 'loss/train': 1.8946534395217896} -08/30/2021 23:44:35 - INFO - __main__ - Step 58634: {'lr': 0.000340088862508234, 'samples': 11257728, 'steps': 58633, 'loss/train': 1.355635643005371} -08/30/2021 23:44:35 - INFO - __main__ - Step 58635: {'lr': 0.00034008391227685305, 'samples': 11257920, 'steps': 58634, 'loss/train': 1.6156717538833618} -08/30/2021 23:44:35 - INFO - __main__ - Step 58636: {'lr': 0.00034007896200488163, 'samples': 11258112, 'steps': 58635, 'loss/train': 1.2679417133331299} -08/30/2021 23:44:36 - INFO - __main__ - Step 58637: {'lr': 0.0003400740116923221, 'samples': 11258304, 'steps': 58636, 'loss/train': 1.526999831199646} -08/30/2021 23:44:37 - INFO - __main__ - Step 58638: {'lr': 0.00034006906133917655, 'samples': 11258496, 'steps': 58637, 'loss/train': 1.8030425310134888} -08/30/2021 23:44:38 - INFO - __main__ - Step 58639: {'lr': 0.0003400641109454473, 'samples': 11258688, 'steps': 58638, 'loss/train': 1.4153028726577759} -08/30/2021 23:44:38 - INFO - __main__ - Step 58640: {'lr': 0.0003400591605111364, 'samples': 11258880, 'steps': 58639, 'loss/train': 1.526519775390625} -08/30/2021 23:44:38 - INFO - __main__ - Step 58641: {'lr': 0.0003400542100362464, 'samples': 11259072, 'steps': 58640, 'loss/train': 1.9305524826049805} -08/30/2021 23:44:39 - INFO - __main__ - Step 58642: {'lr': 0.0003400492595207793, 'samples': 11259264, 'steps': 58641, 'loss/train': 1.3647828102111816} -08/30/2021 23:44:41 - INFO - __main__ - Step 58643: {'lr': 0.00034004430896473743, 'samples': 11259456, 'steps': 58642, 'loss/train': 1.3243318796157837} -08/30/2021 23:44:41 - INFO - __main__ - Step 58644: {'lr': 0.000340039358368123, 'samples': 11259648, 'steps': 58643, 'loss/train': 1.6915072202682495} -08/30/2021 23:44:42 - INFO - __main__ - Step 58645: {'lr': 0.00034003440773093817, 'samples': 11259840, 'steps': 58644, 'loss/train': 1.0202341079711914} -08/30/2021 23:44:42 - INFO - __main__ - Step 58646: {'lr': 0.0003400294570531852, 'samples': 11260032, 'steps': 58645, 'loss/train': 2.145146608352661} -08/30/2021 23:44:42 - INFO - __main__ - Step 58647: {'lr': 0.0003400245063348664, 'samples': 11260224, 'steps': 58646, 'loss/train': 1.1356542110443115} -08/30/2021 23:44:44 - INFO - __main__ - Step 58648: {'lr': 0.000340019555575984, 'samples': 11260416, 'steps': 58647, 'loss/train': 1.5575954914093018} -08/30/2021 23:44:45 - INFO - __main__ - Step 58649: {'lr': 0.00034001460477654013, 'samples': 11260608, 'steps': 58648, 'loss/train': 0.9656021595001221} -08/30/2021 23:44:45 - INFO - __main__ - Step 58650: {'lr': 0.00034000965393653703, 'samples': 11260800, 'steps': 58649, 'loss/train': 0.6885381937026978} -08/30/2021 23:44:45 - INFO - __main__ - Step 58651: {'lr': 0.00034000470305597697, 'samples': 11260992, 'steps': 58650, 'loss/train': 1.862221360206604} -08/30/2021 23:44:46 - INFO - __main__ - Step 58652: {'lr': 0.0003399997521348622, 'samples': 11261184, 'steps': 58651, 'loss/train': 0.7823901176452637} -08/30/2021 23:44:47 - INFO - __main__ - Step 58653: {'lr': 0.00033999480117319494, 'samples': 11261376, 'steps': 58652, 'loss/train': 1.2422887086868286} -08/30/2021 23:44:48 - INFO - __main__ - Step 58654: {'lr': 0.0003399898501709774, 'samples': 11261568, 'steps': 58653, 'loss/train': 1.086638331413269} -08/30/2021 23:44:48 - INFO - __main__ - Step 58655: {'lr': 0.00033998489912821187, 'samples': 11261760, 'steps': 58654, 'loss/train': 1.4552615880966187} -08/30/2021 23:44:48 - INFO - __main__ - Step 58656: {'lr': 0.00033997994804490047, 'samples': 11261952, 'steps': 58655, 'loss/train': 1.1426972150802612} -08/30/2021 23:44:49 - INFO - __main__ - Step 58657: {'lr': 0.0003399749969210455, 'samples': 11262144, 'steps': 58656, 'loss/train': 1.7824389934539795} -08/30/2021 23:44:50 - INFO - __main__ - Step 58658: {'lr': 0.0003399700457566492, 'samples': 11262336, 'steps': 58657, 'loss/train': 2.321087121963501} -08/30/2021 23:44:51 - INFO - __main__ - Step 58659: {'lr': 0.00033996509455171375, 'samples': 11262528, 'steps': 58658, 'loss/train': 1.4311717748641968} -08/30/2021 23:44:51 - INFO - __main__ - Step 58660: {'lr': 0.0003399601433062415, 'samples': 11262720, 'steps': 58659, 'loss/train': 1.6147359609603882} -08/30/2021 23:44:51 - INFO - __main__ - Step 58661: {'lr': 0.00033995519202023453, 'samples': 11262912, 'steps': 58660, 'loss/train': 1.6489475965499878} -08/30/2021 23:44:52 - INFO - __main__ - Step 58662: {'lr': 0.00033995024069369517, 'samples': 11263104, 'steps': 58661, 'loss/train': 1.4745396375656128} -08/30/2021 23:44:53 - INFO - __main__ - Step 58663: {'lr': 0.0003399452893266256, 'samples': 11263296, 'steps': 58662, 'loss/train': 0.812257707118988} -08/30/2021 23:44:54 - INFO - __main__ - Step 58664: {'lr': 0.000339940337919028, 'samples': 11263488, 'steps': 58663, 'loss/train': 0.9347754120826721} -08/30/2021 23:44:54 - INFO - __main__ - Step 58665: {'lr': 0.0003399353864709048, 'samples': 11263680, 'steps': 58664, 'loss/train': 0.5399097204208374} -08/30/2021 23:44:54 - INFO - __main__ - Step 58666: {'lr': 0.000339930434982258, 'samples': 11263872, 'steps': 58665, 'loss/train': 1.2221934795379639} -08/30/2021 23:44:55 - INFO - __main__ - Step 58667: {'lr': 0.00033992548345309, 'samples': 11264064, 'steps': 58666, 'loss/train': 1.701217532157898} -08/30/2021 23:44:56 - INFO - __main__ - Step 58668: {'lr': 0.000339920531883403, 'samples': 11264256, 'steps': 58667, 'loss/train': 1.641194224357605} -08/30/2021 23:44:57 - INFO - __main__ - Step 58669: {'lr': 0.0003399155802731991, 'samples': 11264448, 'steps': 58668, 'loss/train': 1.5220270156860352} -08/30/2021 23:44:57 - INFO - __main__ - Step 58670: {'lr': 0.0003399106286224807, 'samples': 11264640, 'steps': 58669, 'loss/train': 1.4254704713821411} -08/30/2021 23:44:57 - INFO - __main__ - Step 58671: {'lr': 0.0003399056769312499, 'samples': 11264832, 'steps': 58670, 'loss/train': 1.2846100330352783} -08/30/2021 23:44:58 - INFO - __main__ - Step 58672: {'lr': 0.000339900725199509, 'samples': 11265024, 'steps': 58671, 'loss/train': 1.6533279418945312} -08/30/2021 23:44:59 - INFO - __main__ - Step 58673: {'lr': 0.0003398957734272602, 'samples': 11265216, 'steps': 58672, 'loss/train': 0.9581900835037231} -08/30/2021 23:45:00 - INFO - __main__ - Step 58674: {'lr': 0.00033989082161450584, 'samples': 11265408, 'steps': 58673, 'loss/train': 0.7161738872528076} -08/30/2021 23:45:00 - INFO - __main__ - Step 58675: {'lr': 0.000339885869761248, 'samples': 11265600, 'steps': 58674, 'loss/train': 1.6511728763580322} -08/30/2021 23:45:00 - INFO - __main__ - Step 58676: {'lr': 0.000339880917867489, 'samples': 11265792, 'steps': 58675, 'loss/train': 1.2187076807022095} -08/30/2021 23:45:01 - INFO - __main__ - Step 58677: {'lr': 0.00033987596593323103, 'samples': 11265984, 'steps': 58676, 'loss/train': 1.5846315622329712} -08/30/2021 23:45:02 - INFO - __main__ - Step 58678: {'lr': 0.00033987101395847636, 'samples': 11266176, 'steps': 58677, 'loss/train': 1.285315990447998} -08/30/2021 23:45:03 - INFO - __main__ - Step 58679: {'lr': 0.00033986606194322716, 'samples': 11266368, 'steps': 58678, 'loss/train': 1.5435011386871338} -08/30/2021 23:45:03 - INFO - __main__ - Step 58680: {'lr': 0.00033986110988748567, 'samples': 11266560, 'steps': 58679, 'loss/train': 1.130240797996521} -08/30/2021 23:45:03 - INFO - __main__ - Step 58681: {'lr': 0.00033985615779125427, 'samples': 11266752, 'steps': 58680, 'loss/train': 1.0424315929412842} -08/30/2021 23:45:04 - INFO - __main__ - Step 58682: {'lr': 0.00033985120565453497, 'samples': 11266944, 'steps': 58681, 'loss/train': 1.1715854406356812} -08/30/2021 23:45:04 - INFO - __main__ - Step 58683: {'lr': 0.00033984625347733015, 'samples': 11267136, 'steps': 58682, 'loss/train': 1.004608154296875} -08/30/2021 23:45:06 - INFO - __main__ - Step 58684: {'lr': 0.000339841301259642, 'samples': 11267328, 'steps': 58683, 'loss/train': 1.897889256477356} -08/30/2021 23:45:06 - INFO - __main__ - Step 58685: {'lr': 0.0003398363490014727, 'samples': 11267520, 'steps': 58684, 'loss/train': 1.8558295965194702} -08/30/2021 23:45:06 - INFO - __main__ - Step 58686: {'lr': 0.0003398313967028245, 'samples': 11267712, 'steps': 58685, 'loss/train': 1.3434743881225586} -08/30/2021 23:45:07 - INFO - __main__ - Step 58687: {'lr': 0.00033982644436369975, 'samples': 11267904, 'steps': 58686, 'loss/train': 0.8997907638549805} -08/30/2021 23:45:07 - INFO - __main__ - Step 58688: {'lr': 0.00033982149198410057, 'samples': 11268096, 'steps': 58687, 'loss/train': 1.4189918041229248} -08/30/2021 23:45:09 - INFO - __main__ - Step 58689: {'lr': 0.0003398165395640292, 'samples': 11268288, 'steps': 58688, 'loss/train': 0.751264750957489} -08/30/2021 23:45:09 - INFO - __main__ - Step 58690: {'lr': 0.00033981158710348787, 'samples': 11268480, 'steps': 58689, 'loss/train': 0.5940876007080078} -08/30/2021 23:45:09 - INFO - __main__ - Step 58691: {'lr': 0.0003398066346024788, 'samples': 11268672, 'steps': 58690, 'loss/train': 1.5481352806091309} -08/30/2021 23:45:10 - INFO - __main__ - Step 58692: {'lr': 0.0003398016820610043, 'samples': 11268864, 'steps': 58691, 'loss/train': 1.2806178331375122} -08/30/2021 23:45:10 - INFO - __main__ - Step 58693: {'lr': 0.00033979672947906646, 'samples': 11269056, 'steps': 58692, 'loss/train': 1.1124917268753052} -08/30/2021 23:45:12 - INFO - __main__ - Step 58694: {'lr': 0.0003397917768566677, 'samples': 11269248, 'steps': 58693, 'loss/train': 1.04927396774292} -08/30/2021 23:45:13 - INFO - __main__ - Step 58695: {'lr': 0.0003397868241938101, 'samples': 11269440, 'steps': 58694, 'loss/train': 2.4703054428100586} -08/30/2021 23:45:13 - INFO - __main__ - Step 58696: {'lr': 0.00033978187149049597, 'samples': 11269632, 'steps': 58695, 'loss/train': 0.9833458662033081} -08/30/2021 23:45:13 - INFO - __main__ - Step 58697: {'lr': 0.0003397769187467275, 'samples': 11269824, 'steps': 58696, 'loss/train': 1.6109654903411865} -08/30/2021 23:45:14 - INFO - __main__ - Step 58698: {'lr': 0.0003397719659625069, 'samples': 11270016, 'steps': 58697, 'loss/train': 1.714380145072937} -08/30/2021 23:45:16 - INFO - __main__ - Step 58699: {'lr': 0.0003397670131378365, 'samples': 11270208, 'steps': 58698, 'loss/train': 1.5342620611190796} -08/30/2021 23:45:17 - INFO - __main__ - Step 58700: {'lr': 0.0003397620602727184, 'samples': 11270400, 'steps': 58699, 'loss/train': 1.062547206878662} -08/30/2021 23:45:17 - INFO - __main__ - Step 58701: {'lr': 0.00033975710736715504, 'samples': 11270592, 'steps': 58700, 'loss/train': 1.8590065240859985} -08/30/2021 23:45:17 - INFO - __main__ - Step 58702: {'lr': 0.00033975215442114836, 'samples': 11270784, 'steps': 58701, 'loss/train': 0.4686267673969269} -08/30/2021 23:45:18 - INFO - __main__ - Step 58703: {'lr': 0.00033974720143470084, 'samples': 11270976, 'steps': 58702, 'loss/train': 0.417143851518631} -08/30/2021 23:45:18 - INFO - __main__ - Step 58704: {'lr': 0.00033974224840781453, 'samples': 11271168, 'steps': 58703, 'loss/train': 0.34511134028434753} -08/30/2021 23:45:19 - INFO - __main__ - Step 58705: {'lr': 0.0003397372953404918, 'samples': 11271360, 'steps': 58704, 'loss/train': 0.9673738479614258} -08/30/2021 23:45:20 - INFO - __main__ - Step 58706: {'lr': 0.0003397323422327348, 'samples': 11271552, 'steps': 58705, 'loss/train': 1.2641791105270386} -08/30/2021 23:45:20 - INFO - __main__ - Step 58707: {'lr': 0.0003397273890845458, 'samples': 11271744, 'steps': 58706, 'loss/train': 1.498709797859192} -08/30/2021 23:45:21 - INFO - __main__ - Step 58708: {'lr': 0.0003397224358959271, 'samples': 11271936, 'steps': 58707, 'loss/train': 1.4560626745224} -08/30/2021 23:45:21 - INFO - __main__ - Step 58709: {'lr': 0.0003397174826668808, 'samples': 11272128, 'steps': 58708, 'loss/train': 1.497673511505127} -08/30/2021 23:45:23 - INFO - __main__ - Step 58710: {'lr': 0.00033971252939740915, 'samples': 11272320, 'steps': 58709, 'loss/train': 1.4968241453170776} -08/30/2021 23:45:23 - INFO - __main__ - Step 58711: {'lr': 0.00033970757608751446, 'samples': 11272512, 'steps': 58710, 'loss/train': 1.7436162233352661} -08/30/2021 23:45:23 - INFO - __main__ - Step 58712: {'lr': 0.0003397026227371989, 'samples': 11272704, 'steps': 58711, 'loss/train': 1.6594783067703247} -08/30/2021 23:45:24 - INFO - __main__ - Step 58713: {'lr': 0.0003396976693464647, 'samples': 11272896, 'steps': 58712, 'loss/train': 1.2630974054336548} -08/30/2021 23:45:24 - INFO - __main__ - Step 58714: {'lr': 0.0003396927159153141, 'samples': 11273088, 'steps': 58713, 'loss/train': 1.672326683998108} -08/30/2021 23:45:26 - INFO - __main__ - Step 58715: {'lr': 0.0003396877624437495, 'samples': 11273280, 'steps': 58714, 'loss/train': 1.6367125511169434} -08/30/2021 23:45:26 - INFO - __main__ - Step 58716: {'lr': 0.0003396828089317728, 'samples': 11273472, 'steps': 58715, 'loss/train': 1.2915154695510864} -08/30/2021 23:45:26 - INFO - __main__ - Step 58717: {'lr': 0.0003396778553793865, 'samples': 11273664, 'steps': 58716, 'loss/train': 1.3781403303146362} -08/30/2021 23:45:27 - INFO - __main__ - Step 58718: {'lr': 0.00033967290178659273, 'samples': 11273856, 'steps': 58717, 'loss/train': 1.4711723327636719} -08/30/2021 23:45:27 - INFO - __main__ - Step 58719: {'lr': 0.0003396679481533937, 'samples': 11274048, 'steps': 58718, 'loss/train': 1.56981360912323} -08/30/2021 23:45:29 - INFO - __main__ - Step 58720: {'lr': 0.0003396629944797917, 'samples': 11274240, 'steps': 58719, 'loss/train': 1.521945595741272} -08/30/2021 23:45:29 - INFO - __main__ - Step 58721: {'lr': 0.0003396580407657889, 'samples': 11274432, 'steps': 58720, 'loss/train': 1.1058169603347778} -08/30/2021 23:45:30 - INFO - __main__ - Step 58722: {'lr': 0.0003396530870113877, 'samples': 11274624, 'steps': 58721, 'loss/train': 1.5603090524673462} -08/30/2021 23:45:30 - INFO - __main__ - Step 58723: {'lr': 0.0003396481332165901, 'samples': 11274816, 'steps': 58722, 'loss/train': 0.8087930083274841} -08/30/2021 23:45:31 - INFO - __main__ - Step 58724: {'lr': 0.00033964317938139845, 'samples': 11275008, 'steps': 58723, 'loss/train': 1.806008219718933} -08/30/2021 23:45:31 - INFO - __main__ - Step 58725: {'lr': 0.00033963822550581494, 'samples': 11275200, 'steps': 58724, 'loss/train': 1.690191388130188} -08/30/2021 23:45:32 - INFO - __main__ - Step 58726: {'lr': 0.0003396332715898418, 'samples': 11275392, 'steps': 58725, 'loss/train': 1.7882498502731323} -08/30/2021 23:45:33 - INFO - __main__ - Step 58727: {'lr': 0.00033962831763348133, 'samples': 11275584, 'steps': 58726, 'loss/train': 1.1820712089538574} -08/30/2021 23:45:33 - INFO - __main__ - Step 58728: {'lr': 0.00033962336363673585, 'samples': 11275776, 'steps': 58727, 'loss/train': 0.594863772392273} -08/30/2021 23:45:34 - INFO - __main__ - Step 58729: {'lr': 0.00033961840959960735, 'samples': 11275968, 'steps': 58728, 'loss/train': 1.3980870246887207} -08/30/2021 23:45:34 - INFO - __main__ - Step 58730: {'lr': 0.0003396134555220982, 'samples': 11276160, 'steps': 58729, 'loss/train': 0.8610799312591553} -08/30/2021 23:45:36 - INFO - __main__ - Step 58731: {'lr': 0.0003396085014042105, 'samples': 11276352, 'steps': 58730, 'loss/train': 1.176416277885437} -08/30/2021 23:45:37 - INFO - __main__ - Step 58732: {'lr': 0.00033960354724594665, 'samples': 11276544, 'steps': 58731, 'loss/train': 1.1247687339782715} -08/30/2021 23:45:37 - INFO - __main__ - Step 58733: {'lr': 0.0003395985930473089, 'samples': 11276736, 'steps': 58732, 'loss/train': 1.7837703227996826} -08/30/2021 23:45:37 - INFO - __main__ - Step 58734: {'lr': 0.00033959363880829935, 'samples': 11276928, 'steps': 58733, 'loss/train': 1.5966030359268188} -08/30/2021 23:45:38 - INFO - __main__ - Step 58735: {'lr': 0.00033958868452892035, 'samples': 11277120, 'steps': 58734, 'loss/train': 1.230141520500183} -08/30/2021 23:45:38 - INFO - __main__ - Step 58736: {'lr': 0.000339583730209174, 'samples': 11277312, 'steps': 58735, 'loss/train': 1.9571155309677124} -08/30/2021 23:45:40 - INFO - __main__ - Step 58737: {'lr': 0.0003395787758490626, 'samples': 11277504, 'steps': 58736, 'loss/train': 0.08838306367397308} -08/30/2021 23:45:40 - INFO - __main__ - Step 58738: {'lr': 0.0003395738214485884, 'samples': 11277696, 'steps': 58737, 'loss/train': 1.3713037967681885} -08/30/2021 23:45:40 - INFO - __main__ - Step 58739: {'lr': 0.0003395688670077536, 'samples': 11277888, 'steps': 58738, 'loss/train': 2.0473649501800537} -08/30/2021 23:45:41 - INFO - __main__ - Step 58740: {'lr': 0.0003395639125265605, 'samples': 11278080, 'steps': 58739, 'loss/train': 1.5242501497268677} -08/30/2021 23:45:41 - INFO - __main__ - Step 58741: {'lr': 0.00033955895800501126, 'samples': 11278272, 'steps': 58740, 'loss/train': 0.818575382232666} -08/30/2021 23:45:43 - INFO - __main__ - Step 58742: {'lr': 0.0003395540034431082, 'samples': 11278464, 'steps': 58741, 'loss/train': 1.6052708625793457} -08/30/2021 23:45:43 - INFO - __main__ - Step 58743: {'lr': 0.0003395490488408534, 'samples': 11278656, 'steps': 58742, 'loss/train': 1.3403186798095703} -08/30/2021 23:45:44 - INFO - __main__ - Step 58744: {'lr': 0.00033954409419824924, 'samples': 11278848, 'steps': 58743, 'loss/train': 0.07083722949028015} -08/30/2021 23:45:44 - INFO - __main__ - Step 58745: {'lr': 0.0003395391395152978, 'samples': 11279040, 'steps': 58744, 'loss/train': 1.3406776189804077} -08/30/2021 23:45:44 - INFO - __main__ - Step 58746: {'lr': 0.0003395341847920015, 'samples': 11279232, 'steps': 58745, 'loss/train': 1.767698049545288} -08/30/2021 23:45:45 - INFO - __main__ - Step 58747: {'lr': 0.00033952923002836244, 'samples': 11279424, 'steps': 58746, 'loss/train': 1.6017245054244995} -08/30/2021 23:45:46 - INFO - __main__ - Step 58748: {'lr': 0.0003395242752243829, 'samples': 11279616, 'steps': 58747, 'loss/train': 1.5462589263916016} -08/30/2021 23:45:47 - INFO - __main__ - Step 58749: {'lr': 0.00033951932038006513, 'samples': 11279808, 'steps': 58748, 'loss/train': 3.0614047050476074} -08/30/2021 23:45:47 - INFO - __main__ - Step 58750: {'lr': 0.00033951436549541124, 'samples': 11280000, 'steps': 58749, 'loss/train': 1.471692442893982} -08/30/2021 23:45:47 - INFO - __main__ - Step 58751: {'lr': 0.0003395094105704236, 'samples': 11280192, 'steps': 58750, 'loss/train': 1.6002084016799927} -08/30/2021 23:45:48 - INFO - __main__ - Step 58752: {'lr': 0.00033950445560510445, 'samples': 11280384, 'steps': 58751, 'loss/train': 1.1745747327804565} -08/30/2021 23:45:50 - INFO - __main__ - Step 58753: {'lr': 0.00033949950059945593, 'samples': 11280576, 'steps': 58752, 'loss/train': 5.314432621002197} -08/30/2021 23:45:50 - INFO - __main__ - Step 58754: {'lr': 0.00033949454555348035, 'samples': 11280768, 'steps': 58753, 'loss/train': 1.212120771408081} -08/30/2021 23:45:51 - INFO - __main__ - Step 58755: {'lr': 0.0003394895904671799, 'samples': 11280960, 'steps': 58754, 'loss/train': 1.1921107769012451} -08/30/2021 23:45:51 - INFO - __main__ - Step 58756: {'lr': 0.00033948463534055683, 'samples': 11281152, 'steps': 58755, 'loss/train': 1.5529626607894897} -08/30/2021 23:45:51 - INFO - __main__ - Step 58757: {'lr': 0.0003394796801736133, 'samples': 11281344, 'steps': 58756, 'loss/train': 1.4435099363327026} -08/30/2021 23:45:53 - INFO - __main__ - Step 58758: {'lr': 0.0003394747249663517, 'samples': 11281536, 'steps': 58757, 'loss/train': 1.6918872594833374} -08/30/2021 23:45:53 - INFO - __main__ - Step 58759: {'lr': 0.0003394697697187741, 'samples': 11281728, 'steps': 58758, 'loss/train': 1.1807827949523926} -08/30/2021 23:45:54 - INFO - __main__ - Step 58760: {'lr': 0.00033946481443088286, 'samples': 11281920, 'steps': 58759, 'loss/train': 1.160259485244751} -08/30/2021 23:45:54 - INFO - __main__ - Step 58761: {'lr': 0.00033945985910268007, 'samples': 11282112, 'steps': 58760, 'loss/train': 1.1233793497085571} -08/30/2021 23:45:54 - INFO - __main__ - Step 58762: {'lr': 0.0003394549037341681, 'samples': 11282304, 'steps': 58761, 'loss/train': 1.3589684963226318} -08/30/2021 23:45:55 - INFO - __main__ - Step 58763: {'lr': 0.00033944994832534915, 'samples': 11282496, 'steps': 58762, 'loss/train': 1.213646411895752} -08/30/2021 23:45:56 - INFO - __main__ - Step 58764: {'lr': 0.0003394449928762254, 'samples': 11282688, 'steps': 58763, 'loss/train': 1.695613145828247} -08/30/2021 23:45:57 - INFO - __main__ - Step 58765: {'lr': 0.0003394400373867991, 'samples': 11282880, 'steps': 58764, 'loss/train': 1.9866008758544922} -08/30/2021 23:45:57 - INFO - __main__ - Step 58766: {'lr': 0.00033943508185707257, 'samples': 11283072, 'steps': 58765, 'loss/train': 0.10850531607866287} -08/30/2021 23:45:57 - INFO - __main__ - Step 58767: {'lr': 0.0003394301262870479, 'samples': 11283264, 'steps': 58766, 'loss/train': 0.7525590658187866} -08/30/2021 23:45:58 - INFO - __main__ - Step 58768: {'lr': 0.00033942517067672744, 'samples': 11283456, 'steps': 58767, 'loss/train': 1.0791841745376587} -08/30/2021 23:45:59 - INFO - __main__ - Step 58769: {'lr': 0.00033942021502611334, 'samples': 11283648, 'steps': 58768, 'loss/train': 2.1386630535125732} -08/30/2021 23:46:00 - INFO - __main__ - Step 58770: {'lr': 0.0003394152593352079, 'samples': 11283840, 'steps': 58769, 'loss/train': 1.8796067237854004} -08/30/2021 23:46:00 - INFO - __main__ - Step 58771: {'lr': 0.0003394103036040133, 'samples': 11284032, 'steps': 58770, 'loss/train': 1.3748698234558105} -08/30/2021 23:46:00 - INFO - __main__ - Step 58772: {'lr': 0.00033940534783253185, 'samples': 11284224, 'steps': 58771, 'loss/train': 1.4511990547180176} -08/30/2021 23:46:01 - INFO - __main__ - Step 58773: {'lr': 0.00033940039202076574, 'samples': 11284416, 'steps': 58772, 'loss/train': 1.3540029525756836} -08/30/2021 23:46:02 - INFO - __main__ - Step 58774: {'lr': 0.0003393954361687172, 'samples': 11284608, 'steps': 58773, 'loss/train': 2.319308042526245} -08/30/2021 23:46:03 - INFO - __main__ - Step 58775: {'lr': 0.0003393904802763883, 'samples': 11284800, 'steps': 58774, 'loss/train': 1.7409207820892334} -08/30/2021 23:46:03 - INFO - __main__ - Step 58776: {'lr': 0.00033938552434378155, 'samples': 11284992, 'steps': 58775, 'loss/train': 1.778612732887268} -08/30/2021 23:46:03 - INFO - __main__ - Step 58777: {'lr': 0.00033938056837089903, 'samples': 11285184, 'steps': 58776, 'loss/train': 2.207735776901245} -08/30/2021 23:46:04 - INFO - __main__ - Step 58778: {'lr': 0.00033937561235774307, 'samples': 11285376, 'steps': 58777, 'loss/train': 1.5242668390274048} -08/30/2021 23:46:05 - INFO - __main__ - Step 58779: {'lr': 0.00033937065630431577, 'samples': 11285568, 'steps': 58778, 'loss/train': 1.7153576612472534} -08/30/2021 23:46:06 - INFO - __main__ - Step 58780: {'lr': 0.00033936570021061947, 'samples': 11285760, 'steps': 58779, 'loss/train': 0.9997885823249817} -08/30/2021 23:46:06 - INFO - __main__ - Step 58781: {'lr': 0.0003393607440766563, 'samples': 11285952, 'steps': 58780, 'loss/train': 1.0471984148025513} -08/30/2021 23:46:06 - INFO - __main__ - Step 58782: {'lr': 0.0003393557879024286, 'samples': 11286144, 'steps': 58781, 'loss/train': 1.6037567853927612} -08/30/2021 23:46:07 - INFO - __main__ - Step 58783: {'lr': 0.00033935083168793855, 'samples': 11286336, 'steps': 58782, 'loss/train': 1.3418024778366089} -08/30/2021 23:46:08 - INFO - __main__ - Step 58784: {'lr': 0.00033934587543318846, 'samples': 11286528, 'steps': 58783, 'loss/train': 0.46251997351646423} -08/30/2021 23:46:09 - INFO - __main__ - Step 58785: {'lr': 0.00033934091913818043, 'samples': 11286720, 'steps': 58784, 'loss/train': 0.38408803939819336} -08/30/2021 23:46:09 - INFO - __main__ - Step 58786: {'lr': 0.0003393359628029168, 'samples': 11286912, 'steps': 58785, 'loss/train': 1.3493787050247192} -08/30/2021 23:46:10 - INFO - __main__ - Step 58787: {'lr': 0.0003393310064273997, 'samples': 11287104, 'steps': 58786, 'loss/train': 1.2061803340911865} -08/30/2021 23:46:10 - INFO - __main__ - Step 58788: {'lr': 0.0003393260500116315, 'samples': 11287296, 'steps': 58787, 'loss/train': 1.2767568826675415} -08/30/2021 23:46:10 - INFO - __main__ - Step 58789: {'lr': 0.0003393210935556143, 'samples': 11287488, 'steps': 58788, 'loss/train': 0.4508485794067383} -08/30/2021 23:46:12 - INFO - __main__ - Step 58790: {'lr': 0.00033931613705935046, 'samples': 11287680, 'steps': 58789, 'loss/train': 0.9270490407943726} -08/30/2021 23:46:13 - INFO - __main__ - Step 58791: {'lr': 0.000339311180522842, 'samples': 11287872, 'steps': 58790, 'loss/train': 1.1681022644042969} -08/30/2021 23:46:13 - INFO - __main__ - Step 58792: {'lr': 0.00033930622394609143, 'samples': 11288064, 'steps': 58791, 'loss/train': 1.6185396909713745} -08/30/2021 23:46:14 - INFO - __main__ - Step 58793: {'lr': 0.00033930126732910083, 'samples': 11288256, 'steps': 58792, 'loss/train': 0.310821533203125} -08/30/2021 23:46:14 - INFO - __main__ - Step 58794: {'lr': 0.0003392963106718725, 'samples': 11288448, 'steps': 58793, 'loss/train': 0.33043384552001953} -08/30/2021 23:46:15 - INFO - __main__ - Step 58795: {'lr': 0.00033929135397440857, 'samples': 11288640, 'steps': 58794, 'loss/train': 1.2291858196258545} -08/30/2021 23:46:16 - INFO - __main__ - Step 58796: {'lr': 0.0003392863972367114, 'samples': 11288832, 'steps': 58795, 'loss/train': 1.4721119403839111} -08/30/2021 23:46:16 - INFO - __main__ - Step 58797: {'lr': 0.0003392814404587831, 'samples': 11289024, 'steps': 58796, 'loss/train': 0.9029848575592041} -08/30/2021 23:46:17 - INFO - __main__ - Step 58798: {'lr': 0.00033927648364062593, 'samples': 11289216, 'steps': 58797, 'loss/train': 1.0951250791549683} -08/30/2021 23:46:17 - INFO - __main__ - Step 58799: {'lr': 0.00033927152678224216, 'samples': 11289408, 'steps': 58798, 'loss/train': 0.37975120544433594} -08/30/2021 23:46:19 - INFO - __main__ - Step 58800: {'lr': 0.00033926656988363406, 'samples': 11289600, 'steps': 58799, 'loss/train': 1.0550575256347656} -08/30/2021 23:46:20 - INFO - __main__ - Step 58801: {'lr': 0.00033926161294480384, 'samples': 11289792, 'steps': 58800, 'loss/train': 1.6219799518585205} -08/30/2021 23:46:20 - INFO - __main__ - Step 58802: {'lr': 0.00033925665596575374, 'samples': 11289984, 'steps': 58801, 'loss/train': 1.3891360759735107} -08/30/2021 23:46:20 - INFO - __main__ - Step 58803: {'lr': 0.00033925169894648586, 'samples': 11290176, 'steps': 58802, 'loss/train': 1.2500232458114624} -08/30/2021 23:46:21 - INFO - __main__ - Step 58804: {'lr': 0.0003392467418870026, 'samples': 11290368, 'steps': 58803, 'loss/train': 1.4036320447921753} -08/30/2021 23:46:23 - INFO - __main__ - Step 58805: {'lr': 0.0003392417847873061, 'samples': 11290560, 'steps': 58804, 'loss/train': 0.954932689666748} -08/30/2021 23:46:23 - INFO - __main__ - Step 58806: {'lr': 0.00033923682764739867, 'samples': 11290752, 'steps': 58805, 'loss/train': 1.85524582862854} -08/30/2021 23:46:24 - INFO - __main__ - Step 58807: {'lr': 0.0003392318704672825, 'samples': 11290944, 'steps': 58806, 'loss/train': 1.5074431896209717} -08/30/2021 23:46:24 - INFO - __main__ - Step 58808: {'lr': 0.00033922691324695975, 'samples': 11291136, 'steps': 58807, 'loss/train': 2.3309195041656494} -08/30/2021 23:46:24 - INFO - __main__ - Step 58809: {'lr': 0.00033922195598643293, 'samples': 11291328, 'steps': 58808, 'loss/train': 0.2112676203250885} -08/30/2021 23:46:25 - INFO - __main__ - Step 58810: {'lr': 0.0003392169986857039, 'samples': 11291520, 'steps': 58809, 'loss/train': 1.3284920454025269} -08/30/2021 23:46:26 - INFO - __main__ - Step 58811: {'lr': 0.0003392120413447751, 'samples': 11291712, 'steps': 58810, 'loss/train': 1.4437609910964966} -08/30/2021 23:46:27 - INFO - __main__ - Step 58812: {'lr': 0.0003392070839636487, 'samples': 11291904, 'steps': 58811, 'loss/train': 1.9267053604125977} -08/30/2021 23:46:27 - INFO - __main__ - Step 58813: {'lr': 0.000339202126542327, 'samples': 11292096, 'steps': 58812, 'loss/train': 1.9604454040527344} -08/30/2021 23:46:27 - INFO - __main__ - Step 58814: {'lr': 0.00033919716908081224, 'samples': 11292288, 'steps': 58813, 'loss/train': 1.5966546535491943} -08/30/2021 23:46:28 - INFO - __main__ - Step 58815: {'lr': 0.0003391922115791065, 'samples': 11292480, 'steps': 58814, 'loss/train': 1.403215765953064} -08/30/2021 23:46:29 - INFO - __main__ - Step 58816: {'lr': 0.0003391872540372123, 'samples': 11292672, 'steps': 58815, 'loss/train': 0.7499516606330872} -08/30/2021 23:46:30 - INFO - __main__ - Step 58817: {'lr': 0.00033918229645513154, 'samples': 11292864, 'steps': 58816, 'loss/train': 1.1831259727478027} -08/30/2021 23:46:30 - INFO - __main__ - Step 58818: {'lr': 0.0003391773388328667, 'samples': 11293056, 'steps': 58817, 'loss/train': 0.07153192162513733} -08/30/2021 23:46:31 - INFO - __main__ - Step 58819: {'lr': 0.0003391723811704199, 'samples': 11293248, 'steps': 58818, 'loss/train': 1.3652219772338867} -08/30/2021 23:46:31 - INFO - __main__ - Step 58820: {'lr': 0.0003391674234677934, 'samples': 11293440, 'steps': 58819, 'loss/train': 0.9032937288284302} -08/30/2021 23:46:32 - INFO - __main__ - Step 58821: {'lr': 0.0003391624657249894, 'samples': 11293632, 'steps': 58820, 'loss/train': 1.301866054534912} -08/30/2021 23:46:33 - INFO - __main__ - Step 58822: {'lr': 0.0003391575079420102, 'samples': 11293824, 'steps': 58821, 'loss/train': 2.0473484992980957} -08/30/2021 23:46:33 - INFO - __main__ - Step 58823: {'lr': 0.00033915255011885803, 'samples': 11294016, 'steps': 58822, 'loss/train': 1.455654501914978} -08/30/2021 23:46:34 - INFO - __main__ - Step 58824: {'lr': 0.000339147592255535, 'samples': 11294208, 'steps': 58823, 'loss/train': 1.7569061517715454} -08/30/2021 23:46:34 - INFO - __main__ - Step 58825: {'lr': 0.00033914263435204356, 'samples': 11294400, 'steps': 58824, 'loss/train': 0.42737406492233276} -08/30/2021 23:46:35 - INFO - __main__ - Step 58826: {'lr': 0.0003391376764083858, 'samples': 11294592, 'steps': 58825, 'loss/train': 1.7902110815048218} -08/30/2021 23:46:36 - INFO - __main__ - Step 58827: {'lr': 0.00033913271842456394, 'samples': 11294784, 'steps': 58826, 'loss/train': 1.0986599922180176} -08/30/2021 23:46:36 - INFO - __main__ - Step 58828: {'lr': 0.0003391277604005802, 'samples': 11294976, 'steps': 58827, 'loss/train': 1.656203269958496} -08/30/2021 23:46:37 - INFO - __main__ - Step 58829: {'lr': 0.00033912280233643706, 'samples': 11295168, 'steps': 58828, 'loss/train': 1.275792121887207} -08/30/2021 23:46:37 - INFO - __main__ - Step 58830: {'lr': 0.00033911784423213645, 'samples': 11295360, 'steps': 58829, 'loss/train': 1.1996405124664307} -08/30/2021 23:46:37 - INFO - __main__ - Step 58831: {'lr': 0.00033911288608768063, 'samples': 11295552, 'steps': 58830, 'loss/train': 1.6678252220153809} -08/30/2021 23:46:39 - INFO - __main__ - Step 58832: {'lr': 0.000339107927903072, 'samples': 11295744, 'steps': 58831, 'loss/train': 1.1973662376403809} -08/30/2021 23:46:39 - INFO - __main__ - Step 58833: {'lr': 0.00033910296967831267, 'samples': 11295936, 'steps': 58832, 'loss/train': 1.5865659713745117} -08/30/2021 23:46:40 - INFO - __main__ - Step 58834: {'lr': 0.00033909801141340497, 'samples': 11296128, 'steps': 58833, 'loss/train': 1.3550770282745361} -08/30/2021 23:46:40 - INFO - __main__ - Step 58835: {'lr': 0.00033909305310835105, 'samples': 11296320, 'steps': 58834, 'loss/train': 1.2268120050430298} -08/30/2021 23:46:40 - INFO - __main__ - Step 58836: {'lr': 0.00033908809476315325, 'samples': 11296512, 'steps': 58835, 'loss/train': 1.1937689781188965} -08/30/2021 23:46:42 - INFO - __main__ - Step 58837: {'lr': 0.0003390831363778136, 'samples': 11296704, 'steps': 58836, 'loss/train': 1.7368097305297852} -08/30/2021 23:46:42 - INFO - __main__ - Step 58838: {'lr': 0.00033907817795233454, 'samples': 11296896, 'steps': 58837, 'loss/train': 1.6836061477661133} -08/30/2021 23:46:43 - INFO - __main__ - Step 58839: {'lr': 0.0003390732194867182, 'samples': 11297088, 'steps': 58838, 'loss/train': 1.6274300813674927} -08/30/2021 23:46:43 - INFO - __main__ - Step 58840: {'lr': 0.00033906826098096686, 'samples': 11297280, 'steps': 58839, 'loss/train': 1.0285338163375854} -08/30/2021 23:46:43 - INFO - __main__ - Step 58841: {'lr': 0.0003390633024350827, 'samples': 11297472, 'steps': 58840, 'loss/train': 1.7333099842071533} -08/30/2021 23:46:45 - INFO - __main__ - Step 58842: {'lr': 0.000339058343849068, 'samples': 11297664, 'steps': 58841, 'loss/train': 1.0773276090621948} -08/30/2021 23:46:46 - INFO - __main__ - Step 58843: {'lr': 0.00033905338522292514, 'samples': 11297856, 'steps': 58842, 'loss/train': 0.7455134391784668} -08/30/2021 23:46:46 - INFO - __main__ - Step 58844: {'lr': 0.00033904842655665604, 'samples': 11298048, 'steps': 58843, 'loss/train': 0.9754507541656494} -08/30/2021 23:46:47 - INFO - __main__ - Step 58845: {'lr': 0.00033904346785026306, 'samples': 11298240, 'steps': 58844, 'loss/train': 1.5566054582595825} -08/30/2021 23:46:47 - INFO - __main__ - Step 58846: {'lr': 0.0003390385091037486, 'samples': 11298432, 'steps': 58845, 'loss/train': 1.260424256324768} -08/30/2021 23:46:49 - INFO - __main__ - Step 58847: {'lr': 0.0003390335503171146, 'samples': 11298624, 'steps': 58846, 'loss/train': 0.07344728708267212} -08/30/2021 23:46:49 - INFO - __main__ - Step 58848: {'lr': 0.0003390285914903636, 'samples': 11298816, 'steps': 58847, 'loss/train': 1.616707444190979} -08/30/2021 23:46:49 - INFO - __main__ - Step 58849: {'lr': 0.0003390236326234977, 'samples': 11299008, 'steps': 58848, 'loss/train': 1.1169241666793823} -08/30/2021 23:46:50 - INFO - __main__ - Step 58850: {'lr': 0.000339018673716519, 'samples': 11299200, 'steps': 58849, 'loss/train': 0.04388076066970825} -08/30/2021 23:46:50 - INFO - __main__ - Step 58851: {'lr': 0.0003390137147694299, 'samples': 11299392, 'steps': 58850, 'loss/train': 2.0828006267547607} -08/30/2021 23:46:52 - INFO - __main__ - Step 58852: {'lr': 0.0003390087557822326, 'samples': 11299584, 'steps': 58851, 'loss/train': 2.091796398162842} -08/30/2021 23:46:52 - INFO - __main__ - Step 58853: {'lr': 0.00033900379675492933, 'samples': 11299776, 'steps': 58852, 'loss/train': 1.4529201984405518} -08/30/2021 23:46:53 - INFO - __main__ - Step 58854: {'lr': 0.00033899883768752234, 'samples': 11299968, 'steps': 58853, 'loss/train': 1.5650910139083862} -08/30/2021 23:46:53 - INFO - __main__ - Step 58855: {'lr': 0.00033899387858001386, 'samples': 11300160, 'steps': 58854, 'loss/train': 1.2085142135620117} -08/30/2021 23:46:53 - INFO - __main__ - Step 58856: {'lr': 0.0003389889194324061, 'samples': 11300352, 'steps': 58855, 'loss/train': 1.4862236976623535} -08/30/2021 23:46:54 - INFO - __main__ - Step 58857: {'lr': 0.0003389839602447013, 'samples': 11300544, 'steps': 58856, 'loss/train': 1.5161347389221191} -08/30/2021 23:46:55 - INFO - __main__ - Step 58858: {'lr': 0.0003389790010169017, 'samples': 11300736, 'steps': 58857, 'loss/train': 1.302025556564331} -08/30/2021 23:46:56 - INFO - __main__ - Step 58859: {'lr': 0.00033897404174900955, 'samples': 11300928, 'steps': 58858, 'loss/train': 1.1080756187438965} -08/30/2021 23:46:56 - INFO - __main__ - Step 58860: {'lr': 0.000338969082441027, 'samples': 11301120, 'steps': 58859, 'loss/train': 0.7732256054878235} -08/30/2021 23:46:56 - INFO - __main__ - Step 58861: {'lr': 0.00033896412309295643, 'samples': 11301312, 'steps': 58860, 'loss/train': 1.7619364261627197} -08/30/2021 23:46:57 - INFO - __main__ - Step 58862: {'lr': 0.00033895916370479994, 'samples': 11301504, 'steps': 58861, 'loss/train': 1.0133110284805298} -08/30/2021 23:46:59 - INFO - __main__ - Step 58863: {'lr': 0.00033895420427655995, 'samples': 11301696, 'steps': 58862, 'loss/train': 0.7115636467933655} -08/30/2021 23:46:59 - INFO - __main__ - Step 58864: {'lr': 0.0003389492448082384, 'samples': 11301888, 'steps': 58863, 'loss/train': 0.5410496592521667} -08/30/2021 23:47:00 - INFO - __main__ - Step 58865: {'lr': 0.0003389442852998378, 'samples': 11302080, 'steps': 58864, 'loss/train': 1.9697915315628052} -08/30/2021 23:47:00 - INFO - __main__ - Step 58866: {'lr': 0.0003389393257513602, 'samples': 11302272, 'steps': 58865, 'loss/train': 1.2539417743682861} -08/30/2021 23:47:00 - INFO - __main__ - Step 58867: {'lr': 0.00033893436616280796, 'samples': 11302464, 'steps': 58866, 'loss/train': 1.4076707363128662} -08/30/2021 23:47:01 - INFO - __main__ - Step 58868: {'lr': 0.0003389294065341833, 'samples': 11302656, 'steps': 58867, 'loss/train': 0.05458477884531021} -08/30/2021 23:47:02 - INFO - __main__ - Step 58869: {'lr': 0.0003389244468654884, 'samples': 11302848, 'steps': 58868, 'loss/train': 0.03862815350294113} -08/30/2021 23:47:03 - INFO - __main__ - Step 58870: {'lr': 0.0003389194871567255, 'samples': 11303040, 'steps': 58869, 'loss/train': 2.052201747894287} -08/30/2021 23:47:03 - INFO - __main__ - Step 58871: {'lr': 0.00033891452740789687, 'samples': 11303232, 'steps': 58870, 'loss/train': 1.4117408990859985} -08/30/2021 23:47:03 - INFO - __main__ - Step 58872: {'lr': 0.0003389095676190047, 'samples': 11303424, 'steps': 58871, 'loss/train': 1.2843350172042847} -08/30/2021 23:47:04 - INFO - __main__ - Step 58873: {'lr': 0.00033890460779005126, 'samples': 11303616, 'steps': 58872, 'loss/train': 1.5725042819976807} -08/30/2021 23:47:05 - INFO - __main__ - Step 58874: {'lr': 0.0003388996479210388, 'samples': 11303808, 'steps': 58873, 'loss/train': 1.3877595663070679} -08/30/2021 23:47:06 - INFO - __main__ - Step 58875: {'lr': 0.0003388946880119695, 'samples': 11304000, 'steps': 58874, 'loss/train': 0.31325653195381165} -08/30/2021 23:47:06 - INFO - __main__ - Step 58876: {'lr': 0.0003388897280628457, 'samples': 11304192, 'steps': 58875, 'loss/train': 1.5564548969268799} -08/30/2021 23:47:06 - INFO - __main__ - Step 58877: {'lr': 0.00033888476807366946, 'samples': 11304384, 'steps': 58876, 'loss/train': 0.035363029688596725} -08/30/2021 23:47:07 - INFO - __main__ - Step 58878: {'lr': 0.00033887980804444314, 'samples': 11304576, 'steps': 58877, 'loss/train': 0.7051045894622803} -08/30/2021 23:47:08 - INFO - __main__ - Step 58879: {'lr': 0.00033887484797516895, 'samples': 11304768, 'steps': 58878, 'loss/train': 1.4129315614700317} -08/30/2021 23:47:09 - INFO - __main__ - Step 58880: {'lr': 0.00033886988786584914, 'samples': 11304960, 'steps': 58879, 'loss/train': 1.2098859548568726} -08/30/2021 23:47:09 - INFO - __main__ - Step 58881: {'lr': 0.0003388649277164859, 'samples': 11305152, 'steps': 58880, 'loss/train': 1.4665073156356812} -08/30/2021 23:47:09 - INFO - __main__ - Step 58882: {'lr': 0.0003388599675270815, 'samples': 11305344, 'steps': 58881, 'loss/train': 1.6331019401550293} -08/30/2021 23:47:10 - INFO - __main__ - Step 58883: {'lr': 0.00033885500729763824, 'samples': 11305536, 'steps': 58882, 'loss/train': 1.9003345966339111} -08/30/2021 23:47:10 - INFO - __main__ - Step 58884: {'lr': 0.00033885004702815825, 'samples': 11305728, 'steps': 58883, 'loss/train': 1.5604912042617798} -08/30/2021 23:47:12 - INFO - __main__ - Step 58885: {'lr': 0.00033884508671864377, 'samples': 11305920, 'steps': 58884, 'loss/train': 1.8833619356155396} -08/30/2021 23:47:12 - INFO - __main__ - Step 58886: {'lr': 0.0003388401263690971, 'samples': 11306112, 'steps': 58885, 'loss/train': 0.11321484297513962} -08/30/2021 23:47:12 - INFO - __main__ - Step 58887: {'lr': 0.00033883516597952033, 'samples': 11306304, 'steps': 58886, 'loss/train': 1.7042204141616821} -08/30/2021 23:47:13 - INFO - __main__ - Step 58888: {'lr': 0.00033883020554991594, 'samples': 11306496, 'steps': 58887, 'loss/train': 1.1117045879364014} -08/30/2021 23:47:13 - INFO - __main__ - Step 58889: {'lr': 0.000338825245080286, 'samples': 11306688, 'steps': 58888, 'loss/train': 1.708659052848816} -08/30/2021 23:47:15 - INFO - __main__ - Step 58890: {'lr': 0.0003388202845706328, 'samples': 11306880, 'steps': 58889, 'loss/train': 1.3224077224731445} -08/30/2021 23:47:15 - INFO - __main__ - Step 58891: {'lr': 0.0003388153240209585, 'samples': 11307072, 'steps': 58890, 'loss/train': 1.2200595140457153} -08/30/2021 23:47:16 - INFO - __main__ - Step 58892: {'lr': 0.0003388103634312654, 'samples': 11307264, 'steps': 58891, 'loss/train': 1.4970959424972534} -08/30/2021 23:47:16 - INFO - __main__ - Step 58893: {'lr': 0.0003388054028015557, 'samples': 11307456, 'steps': 58892, 'loss/train': 1.5872451066970825} -08/30/2021 23:47:16 - INFO - __main__ - Step 58894: {'lr': 0.00033880044213183163, 'samples': 11307648, 'steps': 58893, 'loss/train': 1.0694379806518555} -08/30/2021 23:47:18 - INFO - __main__ - Step 58895: {'lr': 0.00033879548142209546, 'samples': 11307840, 'steps': 58894, 'loss/train': 1.3389191627502441} -08/30/2021 23:47:18 - INFO - __main__ - Step 58896: {'lr': 0.0003387905206723496, 'samples': 11308032, 'steps': 58895, 'loss/train': 1.2320886850357056} -08/30/2021 23:47:18 - INFO - __main__ - Step 58897: {'lr': 0.00033878555988259583, 'samples': 11308224, 'steps': 58896, 'loss/train': 1.192296028137207} -08/30/2021 23:47:19 - INFO - __main__ - Step 58898: {'lr': 0.0003387805990528368, 'samples': 11308416, 'steps': 58897, 'loss/train': 1.6647263765335083} -08/30/2021 23:47:19 - INFO - __main__ - Step 58899: {'lr': 0.0003387756381830746, 'samples': 11308608, 'steps': 58898, 'loss/train': 0.4628666043281555} -08/30/2021 23:47:21 - INFO - __main__ - Step 58900: {'lr': 0.00033877067727331145, 'samples': 11308800, 'steps': 58899, 'loss/train': 1.670591950416565} -08/30/2021 23:47:21 - INFO - __main__ - Step 58901: {'lr': 0.00033876571632354956, 'samples': 11308992, 'steps': 58900, 'loss/train': 1.3814274072647095} -08/30/2021 23:47:21 - INFO - __main__ - Step 58902: {'lr': 0.0003387607553337913, 'samples': 11309184, 'steps': 58901, 'loss/train': 1.4355747699737549} -08/30/2021 23:47:22 - INFO - __main__ - Step 58903: {'lr': 0.00033875579430403877, 'samples': 11309376, 'steps': 58902, 'loss/train': 1.0601228475570679} -08/30/2021 23:47:22 - INFO - __main__ - Step 58904: {'lr': 0.00033875083323429425, 'samples': 11309568, 'steps': 58903, 'loss/train': 1.3985990285873413} -08/30/2021 23:47:24 - INFO - __main__ - Step 58905: {'lr': 0.0003387458721245599, 'samples': 11309760, 'steps': 58904, 'loss/train': 3.1908650398254395} -08/30/2021 23:47:25 - INFO - __main__ - Step 58906: {'lr': 0.0003387409109748381, 'samples': 11309952, 'steps': 58905, 'loss/train': 1.2943027019500732} -08/30/2021 23:47:25 - INFO - __main__ - Step 58907: {'lr': 0.0003387359497851311, 'samples': 11310144, 'steps': 58906, 'loss/train': 1.2246050834655762} -08/30/2021 23:47:25 - INFO - __main__ - Step 58908: {'lr': 0.00033873098855544093, 'samples': 11310336, 'steps': 58907, 'loss/train': 1.6925221681594849} -08/30/2021 23:47:26 - INFO - __main__ - Step 58909: {'lr': 0.00033872602728576997, 'samples': 11310528, 'steps': 58908, 'loss/train': 1.3939054012298584} -08/30/2021 23:47:27 - INFO - __main__ - Step 58910: {'lr': 0.0003387210659761204, 'samples': 11310720, 'steps': 58909, 'loss/train': 1.2687801122665405} -08/30/2021 23:47:28 - INFO - __main__ - Step 58911: {'lr': 0.00033871610462649456, 'samples': 11310912, 'steps': 58910, 'loss/train': 1.27236807346344} -08/30/2021 23:47:28 - INFO - __main__ - Step 58912: {'lr': 0.00033871114323689457, 'samples': 11311104, 'steps': 58911, 'loss/train': 1.5317920446395874} -08/30/2021 23:47:29 - INFO - __main__ - Step 58913: {'lr': 0.0003387061818073227, 'samples': 11311296, 'steps': 58912, 'loss/train': 1.1287299394607544} -08/30/2021 23:47:29 - INFO - __main__ - Step 58914: {'lr': 0.00033870122033778123, 'samples': 11311488, 'steps': 58913, 'loss/train': 1.429857850074768} -08/30/2021 23:47:29 - INFO - __main__ - Step 58915: {'lr': 0.00033869625882827233, 'samples': 11311680, 'steps': 58914, 'loss/train': 1.5617824792861938} -08/30/2021 23:47:31 - INFO - __main__ - Step 58916: {'lr': 0.00033869129727879827, 'samples': 11311872, 'steps': 58915, 'loss/train': 1.4296057224273682} -08/30/2021 23:47:31 - INFO - __main__ - Step 58917: {'lr': 0.0003386863356893612, 'samples': 11312064, 'steps': 58916, 'loss/train': 3.536475419998169} -08/30/2021 23:47:32 - INFO - __main__ - Step 58918: {'lr': 0.00033868137405996363, 'samples': 11312256, 'steps': 58917, 'loss/train': 0.32338494062423706} -08/30/2021 23:47:32 - INFO - __main__ - Step 58919: {'lr': 0.0003386764123906075, 'samples': 11312448, 'steps': 58918, 'loss/train': 1.9184119701385498} -08/30/2021 23:47:32 - INFO - __main__ - Step 58920: {'lr': 0.00033867145068129515, 'samples': 11312640, 'steps': 58919, 'loss/train': 0.4450545907020569} -08/30/2021 23:47:34 - INFO - __main__ - Step 58921: {'lr': 0.0003386664889320287, 'samples': 11312832, 'steps': 58920, 'loss/train': 1.4108160734176636} -08/30/2021 23:47:34 - INFO - __main__ - Step 58922: {'lr': 0.0003386615271428106, 'samples': 11313024, 'steps': 58921, 'loss/train': 1.092791199684143} -08/30/2021 23:47:35 - INFO - __main__ - Step 58923: {'lr': 0.000338656565313643, 'samples': 11313216, 'steps': 58922, 'loss/train': 1.4416844844818115} -08/30/2021 23:47:35 - INFO - __main__ - Step 58924: {'lr': 0.0003386516034445281, 'samples': 11313408, 'steps': 58923, 'loss/train': 1.1677485704421997} -08/30/2021 23:47:35 - INFO - __main__ - Step 58925: {'lr': 0.0003386466415354682, 'samples': 11313600, 'steps': 58924, 'loss/train': 1.599466323852539} -08/30/2021 23:47:37 - INFO - __main__ - Step 58926: {'lr': 0.00033864167958646543, 'samples': 11313792, 'steps': 58925, 'loss/train': 1.5058428049087524} -08/30/2021 23:47:37 - INFO - __main__ - Step 58927: {'lr': 0.00033863671759752206, 'samples': 11313984, 'steps': 58926, 'loss/train': 0.9152516722679138} -08/30/2021 23:47:38 - INFO - __main__ - Step 58928: {'lr': 0.0003386317555686404, 'samples': 11314176, 'steps': 58927, 'loss/train': 1.6576542854309082} -08/30/2021 23:47:38 - INFO - __main__ - Step 58929: {'lr': 0.0003386267934998226, 'samples': 11314368, 'steps': 58928, 'loss/train': 0.9393288493156433} -08/30/2021 23:47:38 - INFO - __main__ - Step 58930: {'lr': 0.00033862183139107106, 'samples': 11314560, 'steps': 58929, 'loss/train': 0.2901025414466858} -08/30/2021 23:47:40 - INFO - __main__ - Step 58931: {'lr': 0.0003386168692423878, 'samples': 11314752, 'steps': 58930, 'loss/train': 1.3556660413742065} -08/30/2021 23:47:40 - INFO - __main__ - Step 58932: {'lr': 0.0003386119070537751, 'samples': 11314944, 'steps': 58931, 'loss/train': 1.1427834033966064} -08/30/2021 23:47:41 - INFO - __main__ - Step 58933: {'lr': 0.0003386069448252353, 'samples': 11315136, 'steps': 58932, 'loss/train': 1.4643630981445312} -08/30/2021 23:47:41 - INFO - __main__ - Step 58934: {'lr': 0.00033860198255677054, 'samples': 11315328, 'steps': 58933, 'loss/train': 1.835627555847168} -08/30/2021 23:47:41 - INFO - __main__ - Step 58935: {'lr': 0.0003385970202483831, 'samples': 11315520, 'steps': 58934, 'loss/train': 1.5601670742034912} -08/30/2021 23:47:43 - INFO - __main__ - Step 58936: {'lr': 0.0003385920579000752, 'samples': 11315712, 'steps': 58935, 'loss/train': 1.200656533241272} -08/30/2021 23:47:43 - INFO - __main__ - Step 58937: {'lr': 0.0003385870955118492, 'samples': 11315904, 'steps': 58936, 'loss/train': 1.4566508531570435} -08/30/2021 23:47:44 - INFO - __main__ - Step 58938: {'lr': 0.0003385821330837071, 'samples': 11316096, 'steps': 58937, 'loss/train': 1.1573736667633057} -08/30/2021 23:47:44 - INFO - __main__ - Step 58939: {'lr': 0.0003385771706156513, 'samples': 11316288, 'steps': 58938, 'loss/train': 1.4861280918121338} -08/30/2021 23:47:44 - INFO - __main__ - Step 58940: {'lr': 0.00033857220810768395, 'samples': 11316480, 'steps': 58939, 'loss/train': 0.06638515740633011} -08/30/2021 23:47:46 - INFO - __main__ - Step 58941: {'lr': 0.00033856724555980736, 'samples': 11316672, 'steps': 58940, 'loss/train': 1.3598262071609497} -08/30/2021 23:47:46 - INFO - __main__ - Step 58942: {'lr': 0.00033856228297202373, 'samples': 11316864, 'steps': 58941, 'loss/train': 1.0139168500900269} -08/30/2021 23:47:47 - INFO - __main__ - Step 58943: {'lr': 0.0003385573203443354, 'samples': 11317056, 'steps': 58942, 'loss/train': 1.6325628757476807} -08/30/2021 23:47:47 - INFO - __main__ - Step 58944: {'lr': 0.0003385523576767444, 'samples': 11317248, 'steps': 58943, 'loss/train': 1.5046268701553345} -08/30/2021 23:47:47 - INFO - __main__ - Step 58945: {'lr': 0.0003385473949692531, 'samples': 11317440, 'steps': 58944, 'loss/train': 1.1434009075164795} -08/30/2021 23:47:48 - INFO - __main__ - Step 58946: {'lr': 0.0003385424322218637, 'samples': 11317632, 'steps': 58945, 'loss/train': 1.1483182907104492} -08/30/2021 23:47:49 - INFO - __main__ - Step 58947: {'lr': 0.0003385374694345784, 'samples': 11317824, 'steps': 58946, 'loss/train': 1.209281086921692} -08/30/2021 23:47:50 - INFO - __main__ - Step 58948: {'lr': 0.00033853250660739954, 'samples': 11318016, 'steps': 58947, 'loss/train': 1.050894021987915} -08/30/2021 23:47:50 - INFO - __main__ - Step 58949: {'lr': 0.00033852754374032927, 'samples': 11318208, 'steps': 58948, 'loss/train': 1.9154123067855835} -08/30/2021 23:47:50 - INFO - __main__ - Step 58950: {'lr': 0.00033852258083336996, 'samples': 11318400, 'steps': 58949, 'loss/train': 1.8694238662719727} -08/30/2021 23:47:51 - INFO - __main__ - Step 58951: {'lr': 0.0003385176178865236, 'samples': 11318592, 'steps': 58950, 'loss/train': 0.9341641068458557} -08/30/2021 23:47:52 - INFO - __main__ - Step 58952: {'lr': 0.00033851265489979267, 'samples': 11318784, 'steps': 58951, 'loss/train': 1.2058618068695068} -08/30/2021 23:47:53 - INFO - __main__ - Step 58953: {'lr': 0.00033850769187317923, 'samples': 11318976, 'steps': 58952, 'loss/train': 1.5634336471557617} -08/30/2021 23:47:53 - INFO - __main__ - Step 58954: {'lr': 0.00033850272880668565, 'samples': 11319168, 'steps': 58953, 'loss/train': 2.0675899982452393} -08/30/2021 23:47:53 - INFO - __main__ - Step 58955: {'lr': 0.000338497765700314, 'samples': 11319360, 'steps': 58954, 'loss/train': 1.2280032634735107} -08/30/2021 23:47:54 - INFO - __main__ - Step 58956: {'lr': 0.00033849280255406674, 'samples': 11319552, 'steps': 58955, 'loss/train': 0.1917537897825241} -08/30/2021 23:47:55 - INFO - __main__ - Step 58957: {'lr': 0.000338487839367946, 'samples': 11319744, 'steps': 58956, 'loss/train': 1.537724256515503} -08/30/2021 23:47:56 - INFO - __main__ - Step 58958: {'lr': 0.00033848287614195394, 'samples': 11319936, 'steps': 58957, 'loss/train': 0.9597919583320618} -08/30/2021 23:47:56 - INFO - __main__ - Step 58959: {'lr': 0.00033847791287609287, 'samples': 11320128, 'steps': 58958, 'loss/train': 1.011679768562317} -08/30/2021 23:47:56 - INFO - __main__ - Step 58960: {'lr': 0.00033847294957036503, 'samples': 11320320, 'steps': 58959, 'loss/train': 1.364578127861023} -08/30/2021 23:47:57 - INFO - __main__ - Step 58961: {'lr': 0.0003384679862247726, 'samples': 11320512, 'steps': 58960, 'loss/train': 1.002401351928711} -08/30/2021 23:47:59 - INFO - __main__ - Step 58962: {'lr': 0.0003384630228393179, 'samples': 11320704, 'steps': 58961, 'loss/train': 0.7703489661216736} -08/30/2021 23:47:59 - INFO - __main__ - Step 58963: {'lr': 0.0003384580594140031, 'samples': 11320896, 'steps': 58962, 'loss/train': 1.4097155332565308} -08/30/2021 23:48:00 - INFO - __main__ - Step 58964: {'lr': 0.00033845309594883054, 'samples': 11321088, 'steps': 58963, 'loss/train': 1.8449395895004272} -08/30/2021 23:48:00 - INFO - __main__ - Step 58965: {'lr': 0.0003384481324438023, 'samples': 11321280, 'steps': 58964, 'loss/train': 1.6552140712738037} -08/30/2021 23:48:00 - INFO - __main__ - Step 58966: {'lr': 0.00033844316889892074, 'samples': 11321472, 'steps': 58965, 'loss/train': 1.1037263870239258} -08/30/2021 23:48:01 - INFO - __main__ - Step 58967: {'lr': 0.000338438205314188, 'samples': 11321664, 'steps': 58966, 'loss/train': 1.5210975408554077} -08/30/2021 23:48:02 - INFO - __main__ - Step 58968: {'lr': 0.00033843324168960644, 'samples': 11321856, 'steps': 58967, 'loss/train': 1.3310660123825073} -08/30/2021 23:48:03 - INFO - __main__ - Step 58969: {'lr': 0.0003384282780251782, 'samples': 11322048, 'steps': 58968, 'loss/train': 1.5004477500915527} -08/30/2021 23:48:03 - INFO - __main__ - Step 58970: {'lr': 0.0003384233143209056, 'samples': 11322240, 'steps': 58969, 'loss/train': 1.1517926454544067} -08/30/2021 23:48:03 - INFO - __main__ - Step 58971: {'lr': 0.0003384183505767907, 'samples': 11322432, 'steps': 58970, 'loss/train': 0.8498528003692627} -08/30/2021 23:48:04 - INFO - __main__ - Step 58972: {'lr': 0.0003384133867928359, 'samples': 11322624, 'steps': 58971, 'loss/train': 1.4209383726119995} -08/30/2021 23:48:05 - INFO - __main__ - Step 58973: {'lr': 0.0003384084229690434, 'samples': 11322816, 'steps': 58972, 'loss/train': 1.0733853578567505} -08/30/2021 23:48:06 - INFO - __main__ - Step 58974: {'lr': 0.0003384034591054154, 'samples': 11323008, 'steps': 58973, 'loss/train': 1.5427162647247314} -08/30/2021 23:48:06 - INFO - __main__ - Step 58975: {'lr': 0.0003383984952019542, 'samples': 11323200, 'steps': 58974, 'loss/train': 1.3531625270843506} -08/30/2021 23:48:06 - INFO - __main__ - Step 58976: {'lr': 0.00033839353125866194, 'samples': 11323392, 'steps': 58975, 'loss/train': 1.6280808448791504} -08/30/2021 23:48:07 - INFO - __main__ - Step 58977: {'lr': 0.00033838856727554106, 'samples': 11323584, 'steps': 58976, 'loss/train': 1.229718565940857} -08/30/2021 23:48:08 - INFO - __main__ - Step 58978: {'lr': 0.00033838360325259354, 'samples': 11323776, 'steps': 58977, 'loss/train': 1.2192788124084473} -08/30/2021 23:48:09 - INFO - __main__ - Step 58979: {'lr': 0.00033837863918982175, 'samples': 11323968, 'steps': 58978, 'loss/train': 0.9179202318191528} -08/30/2021 23:48:09 - INFO - __main__ - Step 58980: {'lr': 0.0003383736750872279, 'samples': 11324160, 'steps': 58979, 'loss/train': 1.4866210222244263} -08/30/2021 23:48:10 - INFO - __main__ - Step 58981: {'lr': 0.00033836871094481433, 'samples': 11324352, 'steps': 58980, 'loss/train': 1.1453936100006104} -08/30/2021 23:48:10 - INFO - __main__ - Step 58982: {'lr': 0.0003383637467625831, 'samples': 11324544, 'steps': 58981, 'loss/train': 1.502899408340454} -08/30/2021 23:48:11 - INFO - __main__ - Step 58983: {'lr': 0.00033835878254053647, 'samples': 11324736, 'steps': 58982, 'loss/train': 1.1553280353546143} -08/30/2021 23:48:12 - INFO - __main__ - Step 58984: {'lr': 0.00033835381827867686, 'samples': 11324928, 'steps': 58983, 'loss/train': 1.4467045068740845} -08/30/2021 23:48:12 - INFO - __main__ - Step 58985: {'lr': 0.00033834885397700633, 'samples': 11325120, 'steps': 58984, 'loss/train': 0.916881799697876} -08/30/2021 23:48:13 - INFO - __main__ - Step 58986: {'lr': 0.00033834388963552715, 'samples': 11325312, 'steps': 58985, 'loss/train': 1.1837950944900513} -08/30/2021 23:48:13 - INFO - __main__ - Step 58987: {'lr': 0.0003383389252542416, 'samples': 11325504, 'steps': 58986, 'loss/train': 1.0867846012115479} -08/30/2021 23:48:14 - INFO - __main__ - Step 58988: {'lr': 0.0003383339608331519, 'samples': 11325696, 'steps': 58987, 'loss/train': 1.5615942478179932} -08/30/2021 23:48:15 - INFO - __main__ - Step 58989: {'lr': 0.00033832899637226024, 'samples': 11325888, 'steps': 58988, 'loss/train': 1.42579185962677} -08/30/2021 23:48:15 - INFO - __main__ - Step 58990: {'lr': 0.0003383240318715689, 'samples': 11326080, 'steps': 58989, 'loss/train': 1.702448844909668} -08/30/2021 23:48:16 - INFO - __main__ - Step 58991: {'lr': 0.0003383190673310802, 'samples': 11326272, 'steps': 58990, 'loss/train': 1.080240249633789} -08/30/2021 23:48:16 - INFO - __main__ - Step 58992: {'lr': 0.0003383141027507962, 'samples': 11326464, 'steps': 58991, 'loss/train': 1.2901581525802612} -08/30/2021 23:48:18 - INFO - __main__ - Step 58993: {'lr': 0.0003383091381307193, 'samples': 11326656, 'steps': 58992, 'loss/train': 1.146825909614563} -08/30/2021 23:48:18 - INFO - __main__ - Step 58994: {'lr': 0.0003383041734708516, 'samples': 11326848, 'steps': 58993, 'loss/train': 0.5573970675468445} -08/30/2021 23:48:18 - INFO - __main__ - Step 58995: {'lr': 0.0003382992087711954, 'samples': 11327040, 'steps': 58994, 'loss/train': 1.556983470916748} -08/30/2021 23:48:19 - INFO - __main__ - Step 58996: {'lr': 0.00033829424403175297, 'samples': 11327232, 'steps': 58995, 'loss/train': 1.2523374557495117} -08/30/2021 23:48:19 - INFO - __main__ - Step 58997: {'lr': 0.00033828927925252657, 'samples': 11327424, 'steps': 58996, 'loss/train': 1.083922028541565} -08/30/2021 23:48:19 - INFO - __main__ - Step 58998: {'lr': 0.0003382843144335183, 'samples': 11327616, 'steps': 58997, 'loss/train': 1.3436797857284546} -08/30/2021 23:48:21 - INFO - __main__ - Step 58999: {'lr': 0.0003382793495747305, 'samples': 11327808, 'steps': 58998, 'loss/train': 1.4055079221725464} -08/30/2021 23:48:21 - INFO - __main__ - Step 59000: {'lr': 0.0003382743846761654, 'samples': 11328000, 'steps': 58999, 'loss/train': 1.1837085485458374} -08/30/2021 23:48:22 - INFO - __main__ - Step 59001: {'lr': 0.0003382694197378252, 'samples': 11328192, 'steps': 59000, 'loss/train': 1.110337495803833} -08/30/2021 23:48:22 - INFO - __main__ - Step 59002: {'lr': 0.00033826445475971216, 'samples': 11328384, 'steps': 59001, 'loss/train': 0.901333749294281} -08/30/2021 23:48:22 - INFO - __main__ - Step 59003: {'lr': 0.0003382594897418285, 'samples': 11328576, 'steps': 59002, 'loss/train': 0.9534628391265869} -08/30/2021 23:48:24 - INFO - __main__ - Step 59004: {'lr': 0.0003382545246841766, 'samples': 11328768, 'steps': 59003, 'loss/train': 1.4020612239837646} -08/30/2021 23:48:24 - INFO - __main__ - Step 59005: {'lr': 0.00033824955958675843, 'samples': 11328960, 'steps': 59004, 'loss/train': 1.4572243690490723} -08/30/2021 23:48:25 - INFO - __main__ - Step 59006: {'lr': 0.00033824459444957645, 'samples': 11329152, 'steps': 59005, 'loss/train': 0.939325213432312} -08/30/2021 23:48:25 - INFO - __main__ - Step 59007: {'lr': 0.0003382396292726328, 'samples': 11329344, 'steps': 59006, 'loss/train': 1.294857144355774} -08/30/2021 23:48:25 - INFO - __main__ - Step 59008: {'lr': 0.00033823466405592974, 'samples': 11329536, 'steps': 59007, 'loss/train': 1.5731358528137207} -08/30/2021 23:48:27 - INFO - __main__ - Step 59009: {'lr': 0.00033822969879946947, 'samples': 11329728, 'steps': 59008, 'loss/train': 1.6323109865188599} -08/30/2021 23:48:27 - INFO - __main__ - Step 59010: {'lr': 0.0003382247335032542, 'samples': 11329920, 'steps': 59009, 'loss/train': 0.602820873260498} -08/30/2021 23:48:28 - INFO - __main__ - Step 59011: {'lr': 0.0003382197681672864, 'samples': 11330112, 'steps': 59010, 'loss/train': 1.5404332876205444} -08/30/2021 23:48:28 - INFO - __main__ - Step 59012: {'lr': 0.000338214802791568, 'samples': 11330304, 'steps': 59011, 'loss/train': 0.7720848321914673} -08/30/2021 23:48:28 - INFO - __main__ - Step 59013: {'lr': 0.00033820983737610147, 'samples': 11330496, 'steps': 59012, 'loss/train': 1.432164192199707} -08/30/2021 23:48:30 - INFO - __main__ - Step 59014: {'lr': 0.00033820487192088883, 'samples': 11330688, 'steps': 59013, 'loss/train': 1.2767586708068848} -08/30/2021 23:48:31 - INFO - __main__ - Step 59015: {'lr': 0.0003381999064259325, 'samples': 11330880, 'steps': 59014, 'loss/train': 0.8357781767845154} -08/30/2021 23:48:31 - INFO - __main__ - Step 59016: {'lr': 0.00033819494089123466, 'samples': 11331072, 'steps': 59015, 'loss/train': 1.465734601020813} -08/30/2021 23:48:32 - INFO - __main__ - Step 59017: {'lr': 0.00033818997531679756, 'samples': 11331264, 'steps': 59016, 'loss/train': 1.323067307472229} -08/30/2021 23:48:32 - INFO - __main__ - Step 59018: {'lr': 0.0003381850097026234, 'samples': 11331456, 'steps': 59017, 'loss/train': 1.5994404554367065} -08/30/2021 23:48:34 - INFO - __main__ - Step 59019: {'lr': 0.0003381800440487144, 'samples': 11331648, 'steps': 59018, 'loss/train': 1.5859649181365967} -08/30/2021 23:48:34 - INFO - __main__ - Step 59020: {'lr': 0.00033817507835507283, 'samples': 11331840, 'steps': 59019, 'loss/train': 1.1988579034805298} -08/30/2021 23:48:34 - INFO - __main__ - Step 59021: {'lr': 0.00033817011262170097, 'samples': 11332032, 'steps': 59020, 'loss/train': 1.52346932888031} -08/30/2021 23:48:35 - INFO - __main__ - Step 59022: {'lr': 0.000338165146848601, 'samples': 11332224, 'steps': 59021, 'loss/train': 1.3233613967895508} -08/30/2021 23:48:35 - INFO - __main__ - Step 59023: {'lr': 0.0003381601810357752, 'samples': 11332416, 'steps': 59022, 'loss/train': 1.3584074974060059} -08/30/2021 23:48:35 - INFO - __main__ - Step 59024: {'lr': 0.00033815521518322576, 'samples': 11332608, 'steps': 59023, 'loss/train': 1.6075634956359863} -08/30/2021 23:48:37 - INFO - __main__ - Step 59025: {'lr': 0.00033815024929095496, 'samples': 11332800, 'steps': 59024, 'loss/train': 1.31549870967865} -08/30/2021 23:48:37 - INFO - __main__ - Step 59026: {'lr': 0.000338145283358965, 'samples': 11332992, 'steps': 59025, 'loss/train': 1.880662202835083} -08/30/2021 23:48:38 - INFO - __main__ - Step 59027: {'lr': 0.0003381403173872581, 'samples': 11333184, 'steps': 59026, 'loss/train': 1.2815799713134766} -08/30/2021 23:48:38 - INFO - __main__ - Step 59028: {'lr': 0.00033813535137583656, 'samples': 11333376, 'steps': 59027, 'loss/train': 0.9613404870033264} -08/30/2021 23:48:38 - INFO - __main__ - Step 59029: {'lr': 0.0003381303853247026, 'samples': 11333568, 'steps': 59028, 'loss/train': 1.2405524253845215} -08/30/2021 23:48:40 - INFO - __main__ - Step 59030: {'lr': 0.0003381254192338585, 'samples': 11333760, 'steps': 59029, 'loss/train': 1.5383808612823486} -08/30/2021 23:48:40 - INFO - __main__ - Step 59031: {'lr': 0.00033812045310330636, 'samples': 11333952, 'steps': 59030, 'loss/train': 1.4398000240325928} -08/30/2021 23:48:41 - INFO - __main__ - Step 59032: {'lr': 0.0003381154869330485, 'samples': 11334144, 'steps': 59031, 'loss/train': 1.3044570684432983} -08/30/2021 23:48:41 - INFO - __main__ - Step 59033: {'lr': 0.00033811052072308724, 'samples': 11334336, 'steps': 59032, 'loss/train': 1.601513385772705} -08/30/2021 23:48:41 - INFO - __main__ - Step 59034: {'lr': 0.0003381055544734247, 'samples': 11334528, 'steps': 59033, 'loss/train': 1.3422828912734985} -08/30/2021 23:48:43 - INFO - __main__ - Step 59035: {'lr': 0.00033810058818406307, 'samples': 11334720, 'steps': 59034, 'loss/train': 1.0054799318313599} -08/30/2021 23:48:43 - INFO - __main__ - Step 59036: {'lr': 0.0003380956218550049, 'samples': 11334912, 'steps': 59035, 'loss/train': 1.39080810546875} -08/30/2021 23:48:44 - INFO - __main__ - Step 59037: {'lr': 0.000338090655486252, 'samples': 11335104, 'steps': 59036, 'loss/train': 1.2374229431152344} -08/30/2021 23:48:44 - INFO - __main__ - Step 59038: {'lr': 0.00033808568907780687, 'samples': 11335296, 'steps': 59037, 'loss/train': 1.4884473085403442} -08/30/2021 23:48:44 - INFO - __main__ - Step 59039: {'lr': 0.00033808072262967164, 'samples': 11335488, 'steps': 59038, 'loss/train': 1.3518229722976685} -08/30/2021 23:48:46 - INFO - __main__ - Step 59040: {'lr': 0.00033807575614184864, 'samples': 11335680, 'steps': 59039, 'loss/train': 1.1372982263565063} -08/30/2021 23:48:46 - INFO - __main__ - Step 59041: {'lr': 0.0003380707896143401, 'samples': 11335872, 'steps': 59040, 'loss/train': 1.4580377340316772} -08/30/2021 23:48:47 - INFO - __main__ - Step 59042: {'lr': 0.0003380658230471482, 'samples': 11336064, 'steps': 59041, 'loss/train': 1.2731351852416992} -08/30/2021 23:48:47 - INFO - __main__ - Step 59043: {'lr': 0.0003380608564402752, 'samples': 11336256, 'steps': 59042, 'loss/train': 1.2429674863815308} -08/30/2021 23:48:47 - INFO - __main__ - Step 59044: {'lr': 0.0003380558897937233, 'samples': 11336448, 'steps': 59043, 'loss/train': 1.0650434494018555} -08/30/2021 23:48:48 - INFO - __main__ - Step 59045: {'lr': 0.0003380509231074948, 'samples': 11336640, 'steps': 59044, 'loss/train': 5.785302639007568} -08/30/2021 23:48:49 - INFO - __main__ - Step 59046: {'lr': 0.0003380459563815919, 'samples': 11336832, 'steps': 59045, 'loss/train': 1.0075180530548096} -08/30/2021 23:48:50 - INFO - __main__ - Step 59047: {'lr': 0.0003380409896160169, 'samples': 11337024, 'steps': 59046, 'loss/train': 1.0697202682495117} -08/30/2021 23:48:50 - INFO - __main__ - Step 59048: {'lr': 0.00033803602281077194, 'samples': 11337216, 'steps': 59047, 'loss/train': 1.5564501285552979} -08/30/2021 23:48:51 - INFO - __main__ - Step 59049: {'lr': 0.0003380310559658593, 'samples': 11337408, 'steps': 59048, 'loss/train': 1.1588890552520752} -08/30/2021 23:48:51 - INFO - __main__ - Step 59050: {'lr': 0.00033802608908128126, 'samples': 11337600, 'steps': 59049, 'loss/train': 1.327578067779541} -08/30/2021 23:48:53 - INFO - __main__ - Step 59051: {'lr': 0.00033802112215704, 'samples': 11337792, 'steps': 59050, 'loss/train': 1.9613319635391235} -08/30/2021 23:48:53 - INFO - __main__ - Step 59052: {'lr': 0.0003380161551931378, 'samples': 11337984, 'steps': 59051, 'loss/train': 1.2050180435180664} -08/30/2021 23:48:53 - INFO - __main__ - Step 59053: {'lr': 0.00033801118818957686, 'samples': 11338176, 'steps': 59052, 'loss/train': 0.047572895884513855} -08/30/2021 23:48:54 - INFO - __main__ - Step 59054: {'lr': 0.00033800622114635943, 'samples': 11338368, 'steps': 59053, 'loss/train': 1.2006944417953491} -08/30/2021 23:48:54 - INFO - __main__ - Step 59055: {'lr': 0.0003380012540634878, 'samples': 11338560, 'steps': 59054, 'loss/train': 1.3729872703552246} -08/30/2021 23:48:56 - INFO - __main__ - Step 59056: {'lr': 0.00033799628694096407, 'samples': 11338752, 'steps': 59055, 'loss/train': 0.04436753690242767} -08/30/2021 23:48:56 - INFO - __main__ - Step 59057: {'lr': 0.0003379913197787907, 'samples': 11338944, 'steps': 59056, 'loss/train': 1.5208933353424072} -08/30/2021 23:48:56 - INFO - __main__ - Step 59058: {'lr': 0.00033798635257696976, 'samples': 11339136, 'steps': 59057, 'loss/train': 2.2768805027008057} -08/30/2021 23:48:57 - INFO - __main__ - Step 59059: {'lr': 0.0003379813853355034, 'samples': 11339328, 'steps': 59058, 'loss/train': 1.1997323036193848} -08/30/2021 23:48:57 - INFO - __main__ - Step 59060: {'lr': 0.0003379764180543941, 'samples': 11339520, 'steps': 59059, 'loss/train': 0.6003795266151428} -08/30/2021 23:48:59 - INFO - __main__ - Step 59061: {'lr': 0.000337971450733644, 'samples': 11339712, 'steps': 59060, 'loss/train': 0.8755113482475281} -08/30/2021 23:48:59 - INFO - __main__ - Step 59062: {'lr': 0.00033796648337325525, 'samples': 11339904, 'steps': 59061, 'loss/train': 1.215303659439087} -08/30/2021 23:48:59 - INFO - __main__ - Step 59063: {'lr': 0.0003379615159732302, 'samples': 11340096, 'steps': 59062, 'loss/train': 1.6083595752716064} -08/30/2021 23:49:00 - INFO - __main__ - Step 59064: {'lr': 0.00033795654853357104, 'samples': 11340288, 'steps': 59063, 'loss/train': 1.7363594770431519} -08/30/2021 23:49:00 - INFO - __main__ - Step 59065: {'lr': 0.00033795158105428, 'samples': 11340480, 'steps': 59064, 'loss/train': 1.5962884426116943} -08/30/2021 23:49:00 - INFO - __main__ - Step 59066: {'lr': 0.0003379466135353594, 'samples': 11340672, 'steps': 59065, 'loss/train': 1.250943899154663} -08/30/2021 23:49:03 - INFO - __main__ - Step 59067: {'lr': 0.0003379416459768114, 'samples': 11340864, 'steps': 59066, 'loss/train': 1.5900511741638184} -08/30/2021 23:49:03 - INFO - __main__ - Step 59068: {'lr': 0.00033793667837863815, 'samples': 11341056, 'steps': 59067, 'loss/train': 0.9030623435974121} -08/30/2021 23:49:04 - INFO - __main__ - Step 59069: {'lr': 0.0003379317107408421, 'samples': 11341248, 'steps': 59068, 'loss/train': 0.7467013597488403} -08/30/2021 23:49:04 - INFO - __main__ - Step 59070: {'lr': 0.0003379267430634253, 'samples': 11341440, 'steps': 59069, 'loss/train': 2.026566982269287} -08/30/2021 23:49:04 - INFO - __main__ - Step 59071: {'lr': 0.00033792177534639015, 'samples': 11341632, 'steps': 59070, 'loss/train': 1.216873288154602} -08/30/2021 23:49:06 - INFO - __main__ - Step 59072: {'lr': 0.00033791680758973874, 'samples': 11341824, 'steps': 59071, 'loss/train': 1.1709107160568237} -08/30/2021 23:49:06 - INFO - __main__ - Step 59073: {'lr': 0.0003379118397934734, 'samples': 11342016, 'steps': 59072, 'loss/train': 0.9876223206520081} -08/30/2021 23:49:07 - INFO - __main__ - Step 59074: {'lr': 0.00033790687195759636, 'samples': 11342208, 'steps': 59073, 'loss/train': 1.1833842992782593} -08/30/2021 23:49:07 - INFO - __main__ - Step 59075: {'lr': 0.00033790190408210973, 'samples': 11342400, 'steps': 59074, 'loss/train': 1.0073257684707642} -08/30/2021 23:49:08 - INFO - __main__ - Step 59076: {'lr': 0.000337896936167016, 'samples': 11342592, 'steps': 59075, 'loss/train': 1.2722294330596924} -08/30/2021 23:49:09 - INFO - __main__ - Step 59077: {'lr': 0.00033789196821231717, 'samples': 11342784, 'steps': 59076, 'loss/train': 1.9959516525268555} -08/30/2021 23:49:10 - INFO - __main__ - Step 59078: {'lr': 0.00033788700021801564, 'samples': 11342976, 'steps': 59077, 'loss/train': 0.9849477410316467} -08/30/2021 23:49:10 - INFO - __main__ - Step 59079: {'lr': 0.00033788203218411357, 'samples': 11343168, 'steps': 59078, 'loss/train': 1.8005661964416504} -08/30/2021 23:49:10 - INFO - __main__ - Step 59080: {'lr': 0.0003378770641106132, 'samples': 11343360, 'steps': 59079, 'loss/train': 0.6836938858032227} -08/30/2021 23:49:11 - INFO - __main__ - Step 59081: {'lr': 0.00033787209599751676, 'samples': 11343552, 'steps': 59080, 'loss/train': 0.7835308909416199} -08/30/2021 23:49:11 - INFO - __main__ - Step 59082: {'lr': 0.0003378671278448265, 'samples': 11343744, 'steps': 59081, 'loss/train': 1.1010427474975586} -08/30/2021 23:49:12 - INFO - __main__ - Step 59083: {'lr': 0.00033786215965254474, 'samples': 11343936, 'steps': 59082, 'loss/train': 1.2064543962478638} -08/30/2021 23:49:13 - INFO - __main__ - Step 59084: {'lr': 0.00033785719142067364, 'samples': 11344128, 'steps': 59083, 'loss/train': 1.5590165853500366} -08/30/2021 23:49:13 - INFO - __main__ - Step 59085: {'lr': 0.0003378522231492154, 'samples': 11344320, 'steps': 59084, 'loss/train': 1.6903339624404907} -08/30/2021 23:49:13 - INFO - __main__ - Step 59086: {'lr': 0.0003378472548381723, 'samples': 11344512, 'steps': 59085, 'loss/train': 1.6603060960769653} -08/30/2021 23:49:14 - INFO - __main__ - Step 59087: {'lr': 0.0003378422864875466, 'samples': 11344704, 'steps': 59086, 'loss/train': 0.8950554728507996} -08/30/2021 23:49:15 - INFO - __main__ - Step 59088: {'lr': 0.0003378373180973405, 'samples': 11344896, 'steps': 59087, 'loss/train': 1.310755968093872} -08/30/2021 23:49:16 - INFO - __main__ - Step 59089: {'lr': 0.0003378323496675563, 'samples': 11345088, 'steps': 59088, 'loss/train': 1.4918195009231567} -08/30/2021 23:49:16 - INFO - __main__ - Step 59090: {'lr': 0.0003378273811981961, 'samples': 11345280, 'steps': 59089, 'loss/train': 1.6184768676757812} -08/30/2021 23:49:16 - INFO - __main__ - Step 59091: {'lr': 0.00033782241268926237, 'samples': 11345472, 'steps': 59090, 'loss/train': 1.0371448993682861} -08/30/2021 23:49:17 - INFO - __main__ - Step 59092: {'lr': 0.00033781744414075723, 'samples': 11345664, 'steps': 59091, 'loss/train': 1.642082691192627} -08/30/2021 23:49:19 - INFO - __main__ - Step 59093: {'lr': 0.0003378124755526828, 'samples': 11345856, 'steps': 59092, 'loss/train': 3.4553022384643555} -08/30/2021 23:49:19 - INFO - __main__ - Step 59094: {'lr': 0.0003378075069250414, 'samples': 11346048, 'steps': 59093, 'loss/train': 1.6642855405807495} -08/30/2021 23:49:19 - INFO - __main__ - Step 59095: {'lr': 0.00033780253825783533, 'samples': 11346240, 'steps': 59094, 'loss/train': 1.227319359779358} -08/30/2021 23:49:20 - INFO - __main__ - Step 59096: {'lr': 0.0003377975695510668, 'samples': 11346432, 'steps': 59095, 'loss/train': 1.1008540391921997} -08/30/2021 23:49:20 - INFO - __main__ - Step 59097: {'lr': 0.0003377926008047381, 'samples': 11346624, 'steps': 59096, 'loss/train': 1.3149657249450684} -08/30/2021 23:49:22 - INFO - __main__ - Step 59098: {'lr': 0.0003377876320188514, 'samples': 11346816, 'steps': 59097, 'loss/train': 0.7430916428565979} -08/30/2021 23:49:22 - INFO - __main__ - Step 59099: {'lr': 0.0003377826631934089, 'samples': 11347008, 'steps': 59098, 'loss/train': 1.5956075191497803} -08/30/2021 23:49:22 - INFO - __main__ - Step 59100: {'lr': 0.0003377776943284129, 'samples': 11347200, 'steps': 59099, 'loss/train': 1.4470906257629395} -08/30/2021 23:49:23 - INFO - __main__ - Step 59101: {'lr': 0.00033777272542386564, 'samples': 11347392, 'steps': 59100, 'loss/train': 0.04764091223478317} -08/30/2021 23:49:23 - INFO - __main__ - Step 59102: {'lr': 0.0003377677564797693, 'samples': 11347584, 'steps': 59101, 'loss/train': 0.8679090142250061} -08/30/2021 23:49:25 - INFO - __main__ - Step 59103: {'lr': 0.00033776278749612617, 'samples': 11347776, 'steps': 59102, 'loss/train': 0.6373335719108582} -08/30/2021 23:49:25 - INFO - __main__ - Step 59104: {'lr': 0.00033775781847293846, 'samples': 11347968, 'steps': 59103, 'loss/train': 0.9824668169021606} -08/30/2021 23:49:25 - INFO - __main__ - Step 59105: {'lr': 0.00033775284941020854, 'samples': 11348160, 'steps': 59104, 'loss/train': 1.4114757776260376} -08/30/2021 23:49:26 - INFO - __main__ - Step 59106: {'lr': 0.0003377478803079385, 'samples': 11348352, 'steps': 59105, 'loss/train': 1.3459184169769287} -08/30/2021 23:49:26 - INFO - __main__ - Step 59107: {'lr': 0.00033774291116613054, 'samples': 11348544, 'steps': 59106, 'loss/train': 1.4335577487945557} -08/30/2021 23:49:28 - INFO - __main__ - Step 59108: {'lr': 0.000337737941984787, 'samples': 11348736, 'steps': 59107, 'loss/train': 1.279528260231018} -08/30/2021 23:49:28 - INFO - __main__ - Step 59109: {'lr': 0.00033773297276391015, 'samples': 11348928, 'steps': 59108, 'loss/train': 1.2339500188827515} -08/30/2021 23:49:28 - INFO - __main__ - Step 59110: {'lr': 0.00033772800350350215, 'samples': 11349120, 'steps': 59109, 'loss/train': 1.626023530960083} -08/30/2021 23:49:29 - INFO - __main__ - Step 59111: {'lr': 0.0003377230342035653, 'samples': 11349312, 'steps': 59110, 'loss/train': 1.2343449592590332} -08/30/2021 23:49:29 - INFO - __main__ - Step 59112: {'lr': 0.00033771806486410176, 'samples': 11349504, 'steps': 59111, 'loss/train': 1.349181056022644} -08/30/2021 23:49:29 - INFO - __main__ - Step 59113: {'lr': 0.0003377130954851138, 'samples': 11349696, 'steps': 59112, 'loss/train': 1.0913158655166626} -08/30/2021 23:49:31 - INFO - __main__ - Step 59114: {'lr': 0.0003377081260666037, 'samples': 11349888, 'steps': 59113, 'loss/train': 1.4126912355422974} -08/30/2021 23:49:31 - INFO - __main__ - Step 59115: {'lr': 0.00033770315660857367, 'samples': 11350080, 'steps': 59114, 'loss/train': 1.5371184349060059} -08/30/2021 23:49:32 - INFO - __main__ - Step 59116: {'lr': 0.00033769818711102594, 'samples': 11350272, 'steps': 59115, 'loss/train': 1.3325474262237549} -08/30/2021 23:49:32 - INFO - __main__ - Step 59117: {'lr': 0.0003376932175739628, 'samples': 11350464, 'steps': 59116, 'loss/train': 1.24488365650177} -08/30/2021 23:49:33 - INFO - __main__ - Step 59118: {'lr': 0.00033768824799738646, 'samples': 11350656, 'steps': 59117, 'loss/train': 1.6751515865325928} -08/30/2021 23:49:34 - INFO - __main__ - Step 59119: {'lr': 0.0003376832783812991, 'samples': 11350848, 'steps': 59118, 'loss/train': 0.6848888397216797} -08/30/2021 23:49:35 - INFO - __main__ - Step 59120: {'lr': 0.000337678308725703, 'samples': 11351040, 'steps': 59119, 'loss/train': 1.3367704153060913} -08/30/2021 23:49:35 - INFO - __main__ - Step 59121: {'lr': 0.0003376733390306004, 'samples': 11351232, 'steps': 59120, 'loss/train': 1.1341562271118164} -08/30/2021 23:49:35 - INFO - __main__ - Step 59122: {'lr': 0.00033766836929599353, 'samples': 11351424, 'steps': 59121, 'loss/train': 0.6218701004981995} -08/30/2021 23:49:36 - INFO - __main__ - Step 59123: {'lr': 0.00033766339952188474, 'samples': 11351616, 'steps': 59122, 'loss/train': 0.9765797853469849} -08/30/2021 23:49:38 - INFO - __main__ - Step 59124: {'lr': 0.0003376584297082761, 'samples': 11351808, 'steps': 59123, 'loss/train': 1.1154900789260864} -08/30/2021 23:49:38 - INFO - __main__ - Step 59125: {'lr': 0.00033765345985517, 'samples': 11352000, 'steps': 59124, 'loss/train': 1.4942351579666138} -08/30/2021 23:49:39 - INFO - __main__ - Step 59126: {'lr': 0.0003376484899625685, 'samples': 11352192, 'steps': 59125, 'loss/train': 0.7903887629508972} -08/30/2021 23:49:39 - INFO - __main__ - Step 59127: {'lr': 0.00033764352003047397, 'samples': 11352384, 'steps': 59126, 'loss/train': 1.0410959720611572} -08/30/2021 23:49:39 - INFO - __main__ - Step 59128: {'lr': 0.00033763855005888865, 'samples': 11352576, 'steps': 59127, 'loss/train': 1.1598892211914062} -08/30/2021 23:49:41 - INFO - __main__ - Step 59129: {'lr': 0.00033763358004781474, 'samples': 11352768, 'steps': 59128, 'loss/train': 1.5421558618545532} -08/30/2021 23:49:41 - INFO - __main__ - Step 59130: {'lr': 0.00033762860999725456, 'samples': 11352960, 'steps': 59129, 'loss/train': 1.5244030952453613} -08/30/2021 23:49:42 - INFO - __main__ - Step 59131: {'lr': 0.0003376236399072101, 'samples': 11353152, 'steps': 59130, 'loss/train': 1.486205816268921} -08/30/2021 23:49:42 - INFO - __main__ - Step 59132: {'lr': 0.000337618669777684, 'samples': 11353344, 'steps': 59131, 'loss/train': 1.4284369945526123} -08/30/2021 23:49:42 - INFO - __main__ - Step 59133: {'lr': 0.0003376136996086782, 'samples': 11353536, 'steps': 59132, 'loss/train': 1.327958106994629} -08/30/2021 23:49:44 - INFO - __main__ - Step 59134: {'lr': 0.00033760872940019496, 'samples': 11353728, 'steps': 59133, 'loss/train': 0.91539466381073} -08/30/2021 23:49:44 - INFO - __main__ - Step 59135: {'lr': 0.00033760375915223664, 'samples': 11353920, 'steps': 59134, 'loss/train': 1.392862319946289} -08/30/2021 23:49:45 - INFO - __main__ - Step 59136: {'lr': 0.00033759878886480534, 'samples': 11354112, 'steps': 59135, 'loss/train': 1.9612127542495728} -08/30/2021 23:49:45 - INFO - __main__ - Step 59137: {'lr': 0.00033759381853790344, 'samples': 11354304, 'steps': 59136, 'loss/train': 1.0899419784545898} -08/30/2021 23:49:45 - INFO - __main__ - Step 59138: {'lr': 0.0003375888481715331, 'samples': 11354496, 'steps': 59137, 'loss/train': 1.32756507396698} -08/30/2021 23:49:47 - INFO - __main__ - Step 59139: {'lr': 0.0003375838777656966, 'samples': 11354688, 'steps': 59138, 'loss/train': 1.245195746421814} -08/30/2021 23:49:47 - INFO - __main__ - Step 59140: {'lr': 0.00033757890732039617, 'samples': 11354880, 'steps': 59139, 'loss/train': 1.583940029144287} -08/30/2021 23:49:48 - INFO - __main__ - Step 59141: {'lr': 0.000337573936835634, 'samples': 11355072, 'steps': 59140, 'loss/train': 1.5980420112609863} -08/30/2021 23:49:48 - INFO - __main__ - Step 59142: {'lr': 0.0003375689663114123, 'samples': 11355264, 'steps': 59141, 'loss/train': 1.2343775033950806} -08/30/2021 23:49:48 - INFO - __main__ - Step 59143: {'lr': 0.00033756399574773343, 'samples': 11355456, 'steps': 59142, 'loss/train': 1.2602927684783936} -08/30/2021 23:49:49 - INFO - __main__ - Step 59144: {'lr': 0.00033755902514459964, 'samples': 11355648, 'steps': 59143, 'loss/train': 0.9806532263755798} -08/30/2021 23:49:50 - INFO - __main__ - Step 59145: {'lr': 0.0003375540545020131, 'samples': 11355840, 'steps': 59144, 'loss/train': 1.2947758436203003} -08/30/2021 23:49:51 - INFO - __main__ - Step 59146: {'lr': 0.00033754908381997595, 'samples': 11356032, 'steps': 59145, 'loss/train': 1.7343069314956665} -08/30/2021 23:49:51 - INFO - __main__ - Step 59147: {'lr': 0.00033754411309849065, 'samples': 11356224, 'steps': 59146, 'loss/train': 1.4165982007980347} -08/30/2021 23:49:51 - INFO - __main__ - Step 59148: {'lr': 0.0003375391423375592, 'samples': 11356416, 'steps': 59147, 'loss/train': 0.9391774535179138} -08/30/2021 23:49:52 - INFO - __main__ - Step 59149: {'lr': 0.00033753417153718405, 'samples': 11356608, 'steps': 59148, 'loss/train': 1.4960434436798096} -08/30/2021 23:49:53 - INFO - __main__ - Step 59150: {'lr': 0.0003375292006973673, 'samples': 11356800, 'steps': 59149, 'loss/train': 1.2977248430252075} -08/30/2021 23:49:54 - INFO - __main__ - Step 59151: {'lr': 0.0003375242298181113, 'samples': 11356992, 'steps': 59150, 'loss/train': 1.2777845859527588} -08/30/2021 23:49:54 - INFO - __main__ - Step 59152: {'lr': 0.0003375192588994183, 'samples': 11357184, 'steps': 59151, 'loss/train': 1.3735532760620117} -08/30/2021 23:49:55 - INFO - __main__ - Step 59153: {'lr': 0.0003375142879412903, 'samples': 11357376, 'steps': 59152, 'loss/train': 0.027669517323374748} -08/30/2021 23:49:55 - INFO - __main__ - Step 59154: {'lr': 0.0003375093169437298, 'samples': 11357568, 'steps': 59153, 'loss/train': 0.028685377910733223} -08/30/2021 23:49:57 - INFO - __main__ - Step 59155: {'lr': 0.00033750434590673893, 'samples': 11357760, 'steps': 59154, 'loss/train': 0.8482067584991455} -08/30/2021 23:49:57 - INFO - __main__ - Step 59156: {'lr': 0.00033749937483031994, 'samples': 11357952, 'steps': 59155, 'loss/train': 1.3036620616912842} -08/30/2021 23:49:57 - INFO - __main__ - Step 59157: {'lr': 0.00033749440371447513, 'samples': 11358144, 'steps': 59156, 'loss/train': 1.0252490043640137} -08/30/2021 23:49:58 - INFO - __main__ - Step 59158: {'lr': 0.00033748943255920667, 'samples': 11358336, 'steps': 59157, 'loss/train': 1.1696373224258423} -08/30/2021 23:49:58 - INFO - __main__ - Step 59159: {'lr': 0.00033748446136451683, 'samples': 11358528, 'steps': 59158, 'loss/train': 1.4819964170455933} -08/30/2021 23:49:58 - INFO - __main__ - Step 59160: {'lr': 0.00033747949013040784, 'samples': 11358720, 'steps': 59159, 'loss/train': 1.4724578857421875} -08/30/2021 23:50:00 - INFO - __main__ - Step 59161: {'lr': 0.000337474518856882, 'samples': 11358912, 'steps': 59160, 'loss/train': 0.4776204526424408} -08/30/2021 23:50:00 - INFO - __main__ - Step 59162: {'lr': 0.0003374695475439413, 'samples': 11359104, 'steps': 59161, 'loss/train': 1.6590086221694946} -08/30/2021 23:50:01 - INFO - __main__ - Step 59163: {'lr': 0.0003374645761915883, 'samples': 11359296, 'steps': 59162, 'loss/train': 1.0549745559692383} -08/30/2021 23:50:01 - INFO - __main__ - Step 59164: {'lr': 0.00033745960479982515, 'samples': 11359488, 'steps': 59163, 'loss/train': 1.7718043327331543} -08/30/2021 23:50:01 - INFO - __main__ - Step 59165: {'lr': 0.00033745463336865407, 'samples': 11359680, 'steps': 59164, 'loss/train': 0.9100641012191772} -08/30/2021 23:50:03 - INFO - __main__ - Step 59166: {'lr': 0.0003374496618980772, 'samples': 11359872, 'steps': 59165, 'loss/train': 0.932635486125946} -08/30/2021 23:50:03 - INFO - __main__ - Step 59167: {'lr': 0.0003374446903880969, 'samples': 11360064, 'steps': 59166, 'loss/train': 0.7368623614311218} -08/30/2021 23:50:04 - INFO - __main__ - Step 59168: {'lr': 0.0003374397188387153, 'samples': 11360256, 'steps': 59167, 'loss/train': 1.3862361907958984} -08/30/2021 23:50:04 - INFO - __main__ - Step 59169: {'lr': 0.0003374347472499348, 'samples': 11360448, 'steps': 59168, 'loss/train': 0.9291672110557556} -08/30/2021 23:50:04 - INFO - __main__ - Step 59170: {'lr': 0.00033742977562175756, 'samples': 11360640, 'steps': 59169, 'loss/train': 0.8995817303657532} -08/30/2021 23:50:06 - INFO - __main__ - Step 59171: {'lr': 0.00033742480395418574, 'samples': 11360832, 'steps': 59170, 'loss/train': 1.3394420146942139} -08/30/2021 23:50:06 - INFO - __main__ - Step 59172: {'lr': 0.0003374198322472217, 'samples': 11361024, 'steps': 59171, 'loss/train': 1.3764405250549316} -08/30/2021 23:50:07 - INFO - __main__ - Step 59173: {'lr': 0.00033741486050086763, 'samples': 11361216, 'steps': 59172, 'loss/train': 0.6670469045639038} -08/30/2021 23:50:07 - INFO - __main__ - Step 59174: {'lr': 0.00033740988871512574, 'samples': 11361408, 'steps': 59173, 'loss/train': 1.5665777921676636} -08/30/2021 23:50:07 - INFO - __main__ - Step 59175: {'lr': 0.0003374049168899983, 'samples': 11361600, 'steps': 59174, 'loss/train': 1.2131277322769165} -08/30/2021 23:50:10 - INFO - __main__ - Step 59176: {'lr': 0.00033739994502548766, 'samples': 11361792, 'steps': 59175, 'loss/train': 1.4755932092666626} -08/30/2021 23:50:10 - INFO - __main__ - Step 59177: {'lr': 0.0003373949731215958, 'samples': 11361984, 'steps': 59176, 'loss/train': 1.3366997241973877} -08/30/2021 23:50:11 - INFO - __main__ - Step 59178: {'lr': 0.0003373900011783252, 'samples': 11362176, 'steps': 59177, 'loss/train': 1.3102545738220215} -08/30/2021 23:50:11 - INFO - __main__ - Step 59179: {'lr': 0.000337385029195678, 'samples': 11362368, 'steps': 59178, 'loss/train': 1.5608906745910645} -08/30/2021 23:50:11 - INFO - __main__ - Step 59180: {'lr': 0.00033738005717365646, 'samples': 11362560, 'steps': 59179, 'loss/train': 0.5504551529884338} -08/30/2021 23:50:12 - INFO - __main__ - Step 59181: {'lr': 0.00033737508511226283, 'samples': 11362752, 'steps': 59180, 'loss/train': 0.8778849840164185} -08/30/2021 23:50:13 - INFO - __main__ - Step 59182: {'lr': 0.00033737011301149933, 'samples': 11362944, 'steps': 59181, 'loss/train': 1.2649993896484375} -08/30/2021 23:50:14 - INFO - __main__ - Step 59183: {'lr': 0.0003373651408713682, 'samples': 11363136, 'steps': 59182, 'loss/train': 1.1484754085540771} -08/30/2021 23:50:14 - INFO - __main__ - Step 59184: {'lr': 0.00033736016869187165, 'samples': 11363328, 'steps': 59183, 'loss/train': 1.557829737663269} -08/30/2021 23:50:14 - INFO - __main__ - Step 59185: {'lr': 0.0003373551964730119, 'samples': 11363520, 'steps': 59184, 'loss/train': 1.0870318412780762} -08/30/2021 23:50:15 - INFO - __main__ - Step 59186: {'lr': 0.00033735022421479136, 'samples': 11363712, 'steps': 59185, 'loss/train': 1.6649073362350464} -08/30/2021 23:50:17 - INFO - __main__ - Step 59187: {'lr': 0.00033734525191721215, 'samples': 11363904, 'steps': 59186, 'loss/train': 0.9039666056632996} -08/30/2021 23:50:17 - INFO - __main__ - Step 59188: {'lr': 0.00033734027958027646, 'samples': 11364096, 'steps': 59187, 'loss/train': 1.5094884634017944} -08/30/2021 23:50:17 - INFO - __main__ - Step 59189: {'lr': 0.00033733530720398666, 'samples': 11364288, 'steps': 59188, 'loss/train': 1.1415201425552368} -08/30/2021 23:50:18 - INFO - __main__ - Step 59190: {'lr': 0.00033733033478834483, 'samples': 11364480, 'steps': 59189, 'loss/train': 1.6091244220733643} -08/30/2021 23:50:18 - INFO - __main__ - Step 59191: {'lr': 0.00033732536233335334, 'samples': 11364672, 'steps': 59190, 'loss/train': 1.1276490688323975} -08/30/2021 23:50:18 - INFO - __main__ - Step 59192: {'lr': 0.0003373203898390145, 'samples': 11364864, 'steps': 59191, 'loss/train': 1.5039596557617188} -08/30/2021 23:50:19 - INFO - __main__ - Step 59193: {'lr': 0.0003373154173053303, 'samples': 11365056, 'steps': 59192, 'loss/train': 0.027178999036550522} -08/30/2021 23:50:20 - INFO - __main__ - Step 59194: {'lr': 0.0003373104447323031, 'samples': 11365248, 'steps': 59193, 'loss/train': 1.0749531984329224} -08/30/2021 23:50:21 - INFO - __main__ - Step 59195: {'lr': 0.00033730547211993525, 'samples': 11365440, 'steps': 59194, 'loss/train': 1.5997252464294434} -08/30/2021 23:50:21 - INFO - __main__ - Step 59196: {'lr': 0.00033730049946822883, 'samples': 11365632, 'steps': 59195, 'loss/train': 0.8369849324226379} -08/30/2021 23:50:21 - INFO - __main__ - Step 59197: {'lr': 0.0003372955267771862, 'samples': 11365824, 'steps': 59196, 'loss/train': 0.8300724625587463} -08/30/2021 23:50:22 - INFO - __main__ - Step 59198: {'lr': 0.00033729055404680953, 'samples': 11366016, 'steps': 59197, 'loss/train': 1.1340458393096924} -08/30/2021 23:50:23 - INFO - __main__ - Step 59199: {'lr': 0.00033728558127710115, 'samples': 11366208, 'steps': 59198, 'loss/train': 1.2824549674987793} -08/30/2021 23:50:24 - INFO - __main__ - Step 59200: {'lr': 0.0003372806084680632, 'samples': 11366400, 'steps': 59199, 'loss/train': 1.3560410737991333} -08/30/2021 23:50:24 - INFO - __main__ - Step 59201: {'lr': 0.0003372756356196979, 'samples': 11366592, 'steps': 59200, 'loss/train': 1.1852643489837646} -08/30/2021 23:50:24 - INFO - __main__ - Step 59202: {'lr': 0.0003372706627320076, 'samples': 11366784, 'steps': 59201, 'loss/train': 0.07068157941102982} -08/30/2021 23:50:25 - INFO - __main__ - Step 59203: {'lr': 0.0003372656898049944, 'samples': 11366976, 'steps': 59202, 'loss/train': 1.2502074241638184} -08/30/2021 23:50:26 - INFO - __main__ - Step 59204: {'lr': 0.0003372607168386607, 'samples': 11367168, 'steps': 59203, 'loss/train': 1.4712998867034912} -08/30/2021 23:50:27 - INFO - __main__ - Step 59205: {'lr': 0.00033725574383300865, 'samples': 11367360, 'steps': 59204, 'loss/train': 1.6538299322128296} -08/30/2021 23:50:27 - INFO - __main__ - Step 59206: {'lr': 0.0003372507707880406, 'samples': 11367552, 'steps': 59205, 'loss/train': 1.634321689605713} -08/30/2021 23:50:27 - INFO - __main__ - Step 59207: {'lr': 0.0003372457977037586, 'samples': 11367744, 'steps': 59206, 'loss/train': 1.3178449869155884} -08/30/2021 23:50:28 - INFO - __main__ - Step 59208: {'lr': 0.000337240824580165, 'samples': 11367936, 'steps': 59207, 'loss/train': 0.8513045310974121} -08/30/2021 23:50:29 - INFO - __main__ - Step 59209: {'lr': 0.00033723585141726196, 'samples': 11368128, 'steps': 59208, 'loss/train': 1.4241957664489746} -08/30/2021 23:50:30 - INFO - __main__ - Step 59210: {'lr': 0.0003372308782150519, 'samples': 11368320, 'steps': 59209, 'loss/train': 0.6088467836380005} -08/30/2021 23:50:30 - INFO - __main__ - Step 59211: {'lr': 0.0003372259049735369, 'samples': 11368512, 'steps': 59210, 'loss/train': 1.6015602350234985} -08/30/2021 23:50:31 - INFO - __main__ - Step 59212: {'lr': 0.00033722093169271934, 'samples': 11368704, 'steps': 59211, 'loss/train': 1.5628141164779663} -08/30/2021 23:50:31 - INFO - __main__ - Step 59213: {'lr': 0.00033721595837260125, 'samples': 11368896, 'steps': 59212, 'loss/train': 1.4928135871887207} -08/30/2021 23:50:32 - INFO - __main__ - Step 59214: {'lr': 0.00033721098501318506, 'samples': 11369088, 'steps': 59213, 'loss/train': 1.8468180894851685} -08/30/2021 23:50:33 - INFO - __main__ - Step 59215: {'lr': 0.00033720601161447294, 'samples': 11369280, 'steps': 59214, 'loss/train': 1.0922880172729492} -08/30/2021 23:50:33 - INFO - __main__ - Step 59216: {'lr': 0.0003372010381764671, 'samples': 11369472, 'steps': 59215, 'loss/train': 1.5723910331726074} -08/30/2021 23:50:34 - INFO - __main__ - Step 59217: {'lr': 0.00033719606469916985, 'samples': 11369664, 'steps': 59216, 'loss/train': 1.4356945753097534} -08/30/2021 23:50:34 - INFO - __main__ - Step 59218: {'lr': 0.0003371910911825834, 'samples': 11369856, 'steps': 59217, 'loss/train': 1.427831768989563} -08/30/2021 23:50:35 - INFO - __main__ - Step 59219: {'lr': 0.00033718611762671003, 'samples': 11370048, 'steps': 59218, 'loss/train': 1.24912428855896} -08/30/2021 23:50:36 - INFO - __main__ - Step 59220: {'lr': 0.0003371811440315519, 'samples': 11370240, 'steps': 59219, 'loss/train': 1.1611627340316772} -08/30/2021 23:50:36 - INFO - __main__ - Step 59221: {'lr': 0.0003371761703971113, 'samples': 11370432, 'steps': 59220, 'loss/train': 1.7564440965652466} -08/30/2021 23:50:37 - INFO - __main__ - Step 59222: {'lr': 0.0003371711967233905, 'samples': 11370624, 'steps': 59221, 'loss/train': 1.4979043006896973} -08/30/2021 23:50:37 - INFO - __main__ - Step 59223: {'lr': 0.00033716622301039164, 'samples': 11370816, 'steps': 59222, 'loss/train': 1.5645051002502441} -08/30/2021 23:50:39 - INFO - __main__ - Step 59224: {'lr': 0.000337161249258117, 'samples': 11371008, 'steps': 59223, 'loss/train': 0.06679113954305649} -08/30/2021 23:50:40 - INFO - __main__ - Step 59225: {'lr': 0.0003371562754665689, 'samples': 11371200, 'steps': 59224, 'loss/train': 0.7724702954292297} -08/30/2021 23:50:40 - INFO - __main__ - Step 59226: {'lr': 0.0003371513016357496, 'samples': 11371392, 'steps': 59225, 'loss/train': 1.2717159986495972} -08/30/2021 23:50:40 - INFO - __main__ - Step 59227: {'lr': 0.0003371463277656611, 'samples': 11371584, 'steps': 59226, 'loss/train': 2.083587169647217} -08/30/2021 23:50:41 - INFO - __main__ - Step 59228: {'lr': 0.00033714135385630597, 'samples': 11371776, 'steps': 59227, 'loss/train': 1.528214693069458} -08/30/2021 23:50:41 - INFO - __main__ - Step 59229: {'lr': 0.0003371363799076862, 'samples': 11371968, 'steps': 59228, 'loss/train': 0.02398977428674698} -08/30/2021 23:50:42 - INFO - __main__ - Step 59230: {'lr': 0.00033713140591980407, 'samples': 11372160, 'steps': 59229, 'loss/train': 0.7743310332298279} -08/30/2021 23:50:43 - INFO - __main__ - Step 59231: {'lr': 0.00033712643189266197, 'samples': 11372352, 'steps': 59230, 'loss/train': 1.37897789478302} -08/30/2021 23:50:43 - INFO - __main__ - Step 59232: {'lr': 0.00033712145782626205, 'samples': 11372544, 'steps': 59231, 'loss/train': 1.1560449600219727} -08/30/2021 23:50:44 - INFO - __main__ - Step 59233: {'lr': 0.0003371164837206065, 'samples': 11372736, 'steps': 59232, 'loss/train': 1.9193859100341797} -08/30/2021 23:50:44 - INFO - __main__ - Step 59234: {'lr': 0.00033711150957569763, 'samples': 11372928, 'steps': 59233, 'loss/train': 1.3624557256698608} -08/30/2021 23:50:46 - INFO - __main__ - Step 59235: {'lr': 0.00033710653539153763, 'samples': 11373120, 'steps': 59234, 'loss/train': 1.0654305219650269} -08/30/2021 23:50:47 - INFO - __main__ - Step 59236: {'lr': 0.0003371015611681288, 'samples': 11373312, 'steps': 59235, 'loss/train': 1.335206151008606} -08/30/2021 23:50:47 - INFO - __main__ - Step 59237: {'lr': 0.0003370965869054733, 'samples': 11373504, 'steps': 59236, 'loss/train': 0.5567643046379089} -08/30/2021 23:50:47 - INFO - __main__ - Step 59238: {'lr': 0.0003370916126035735, 'samples': 11373696, 'steps': 59237, 'loss/train': 1.6595019102096558} -08/30/2021 23:50:48 - INFO - __main__ - Step 59239: {'lr': 0.0003370866382624315, 'samples': 11373888, 'steps': 59238, 'loss/train': 0.995984673500061} -08/30/2021 23:50:48 - INFO - __main__ - Step 59240: {'lr': 0.00033708166388204963, 'samples': 11374080, 'steps': 59239, 'loss/train': 1.346091628074646} -08/30/2021 23:50:50 - INFO - __main__ - Step 59241: {'lr': 0.0003370766894624301, 'samples': 11374272, 'steps': 59240, 'loss/train': 1.6816624402999878} -08/30/2021 23:50:50 - INFO - __main__ - Step 59242: {'lr': 0.00033707171500357516, 'samples': 11374464, 'steps': 59241, 'loss/train': 0.720859706401825} -08/30/2021 23:50:51 - INFO - __main__ - Step 59243: {'lr': 0.000337066740505487, 'samples': 11374656, 'steps': 59242, 'loss/train': 2.220306873321533} -08/30/2021 23:50:51 - INFO - __main__ - Step 59244: {'lr': 0.00033706176596816795, 'samples': 11374848, 'steps': 59243, 'loss/train': 0.36801525950431824} -08/30/2021 23:50:51 - INFO - __main__ - Step 59245: {'lr': 0.0003370567913916203, 'samples': 11375040, 'steps': 59244, 'loss/train': 1.36960768699646} -08/30/2021 23:50:53 - INFO - __main__ - Step 59246: {'lr': 0.0003370518167758461, 'samples': 11375232, 'steps': 59245, 'loss/train': 1.4784328937530518} -08/30/2021 23:50:54 - INFO - __main__ - Step 59247: {'lr': 0.00033704684212084774, 'samples': 11375424, 'steps': 59246, 'loss/train': 0.7090513706207275} -08/30/2021 23:50:54 - INFO - __main__ - Step 59248: {'lr': 0.0003370418674266273, 'samples': 11375616, 'steps': 59247, 'loss/train': 1.4179662466049194} -08/30/2021 23:50:54 - INFO - __main__ - Step 59249: {'lr': 0.00033703689269318725, 'samples': 11375808, 'steps': 59248, 'loss/train': 1.3202729225158691} -08/30/2021 23:50:55 - INFO - __main__ - Step 59250: {'lr': 0.00033703191792052974, 'samples': 11376000, 'steps': 59249, 'loss/train': 0.5380207300186157} -08/30/2021 23:50:56 - INFO - __main__ - Step 59251: {'lr': 0.00033702694310865696, 'samples': 11376192, 'steps': 59250, 'loss/train': 1.65398108959198} -08/30/2021 23:50:56 - INFO - __main__ - Step 59252: {'lr': 0.00033702196825757114, 'samples': 11376384, 'steps': 59251, 'loss/train': 1.7687321901321411} -08/30/2021 23:50:57 - INFO - __main__ - Step 59253: {'lr': 0.00033701699336727465, 'samples': 11376576, 'steps': 59252, 'loss/train': 0.9318382143974304} -08/30/2021 23:50:57 - INFO - __main__ - Step 59254: {'lr': 0.00033701201843776957, 'samples': 11376768, 'steps': 59253, 'loss/train': 1.4884229898452759} -08/30/2021 23:50:57 - INFO - __main__ - Step 59255: {'lr': 0.0003370070434690583, 'samples': 11376960, 'steps': 59254, 'loss/train': 1.2110114097595215} -08/30/2021 23:50:59 - INFO - __main__ - Step 59256: {'lr': 0.0003370020684611429, 'samples': 11377152, 'steps': 59255, 'loss/train': 1.1395328044891357} -08/30/2021 23:50:59 - INFO - __main__ - Step 59257: {'lr': 0.0003369970934140257, 'samples': 11377344, 'steps': 59256, 'loss/train': 1.4840216636657715} -08/30/2021 23:51:00 - INFO - __main__ - Step 59258: {'lr': 0.00033699211832770906, 'samples': 11377536, 'steps': 59257, 'loss/train': 1.5603110790252686} -08/30/2021 23:51:00 - INFO - __main__ - Step 59259: {'lr': 0.000336987143202195, 'samples': 11377728, 'steps': 59258, 'loss/train': 1.1304256916046143} -08/30/2021 23:51:00 - INFO - __main__ - Step 59260: {'lr': 0.000336982168037486, 'samples': 11377920, 'steps': 59259, 'loss/train': 1.4614261388778687} -08/30/2021 23:51:03 - INFO - __main__ - Step 59261: {'lr': 0.0003369771928335841, 'samples': 11378112, 'steps': 59260, 'loss/train': 1.1103240251541138} -08/30/2021 23:51:03 - INFO - __main__ - Step 59262: {'lr': 0.00033697221759049163, 'samples': 11378304, 'steps': 59261, 'loss/train': 1.5771194696426392} -08/30/2021 23:51:03 - INFO - __main__ - Step 59263: {'lr': 0.0003369672423082108, 'samples': 11378496, 'steps': 59262, 'loss/train': 0.5105088949203491} -08/30/2021 23:51:04 - INFO - __main__ - Step 59264: {'lr': 0.00033696226698674386, 'samples': 11378688, 'steps': 59263, 'loss/train': 2.739560127258301} -08/30/2021 23:51:04 - INFO - __main__ - Step 59265: {'lr': 0.0003369572916260931, 'samples': 11378880, 'steps': 59264, 'loss/train': 2.1617205142974854} -08/30/2021 23:51:04 - INFO - __main__ - Step 59266: {'lr': 0.0003369523162262608, 'samples': 11379072, 'steps': 59265, 'loss/train': 1.4375048875808716} -08/30/2021 23:51:05 - INFO - __main__ - Step 59267: {'lr': 0.00033694734078724904, 'samples': 11379264, 'steps': 59266, 'loss/train': 1.400809407234192} -08/30/2021 23:51:07 - INFO - __main__ - Step 59268: {'lr': 0.00033694236530906014, 'samples': 11379456, 'steps': 59267, 'loss/train': 1.6229270696640015} -08/30/2021 23:51:07 - INFO - __main__ - Step 59269: {'lr': 0.00033693738979169636, 'samples': 11379648, 'steps': 59268, 'loss/train': 1.2574315071105957} -08/30/2021 23:51:07 - INFO - __main__ - Step 59270: {'lr': 0.0003369324142351599, 'samples': 11379840, 'steps': 59269, 'loss/train': 1.1877094507217407} -08/30/2021 23:51:08 - INFO - __main__ - Step 59271: {'lr': 0.0003369274386394531, 'samples': 11380032, 'steps': 59270, 'loss/train': 1.8981167078018188} -08/30/2021 23:51:08 - INFO - __main__ - Step 59272: {'lr': 0.0003369224630045781, 'samples': 11380224, 'steps': 59271, 'loss/train': 1.360382080078125} -08/30/2021 23:51:10 - INFO - __main__ - Step 59273: {'lr': 0.0003369174873305373, 'samples': 11380416, 'steps': 59272, 'loss/train': 1.6627168655395508} -08/30/2021 23:51:10 - INFO - __main__ - Step 59274: {'lr': 0.0003369125116173327, 'samples': 11380608, 'steps': 59273, 'loss/train': 1.6665995121002197} -08/30/2021 23:51:10 - INFO - __main__ - Step 59275: {'lr': 0.00033690753586496666, 'samples': 11380800, 'steps': 59274, 'loss/train': 0.9362266063690186} -08/30/2021 23:51:11 - INFO - __main__ - Step 59276: {'lr': 0.00033690256007344144, 'samples': 11380992, 'steps': 59275, 'loss/train': 1.3537232875823975} -08/30/2021 23:51:11 - INFO - __main__ - Step 59277: {'lr': 0.0003368975842427592, 'samples': 11381184, 'steps': 59276, 'loss/train': 0.5287055969238281} -08/30/2021 23:51:12 - INFO - __main__ - Step 59278: {'lr': 0.00033689260837292234, 'samples': 11381376, 'steps': 59277, 'loss/train': 0.8119242787361145} -08/30/2021 23:51:13 - INFO - __main__ - Step 59279: {'lr': 0.000336887632463933, 'samples': 11381568, 'steps': 59278, 'loss/train': 1.715207815170288} -08/30/2021 23:51:13 - INFO - __main__ - Step 59280: {'lr': 0.00033688265651579354, 'samples': 11381760, 'steps': 59279, 'loss/train': 1.3267779350280762} -08/30/2021 23:51:14 - INFO - __main__ - Step 59281: {'lr': 0.0003368776805285059, 'samples': 11381952, 'steps': 59280, 'loss/train': 1.1703482866287231} -08/30/2021 23:51:14 - INFO - __main__ - Step 59282: {'lr': 0.0003368727045020726, 'samples': 11382144, 'steps': 59281, 'loss/train': 1.4100213050842285} -08/30/2021 23:51:16 - INFO - __main__ - Step 59283: {'lr': 0.00033686772843649583, 'samples': 11382336, 'steps': 59282, 'loss/train': 1.1155202388763428} -08/30/2021 23:51:17 - INFO - __main__ - Step 59284: {'lr': 0.00033686275233177777, 'samples': 11382528, 'steps': 59283, 'loss/train': 0.8511165380477905} -08/30/2021 23:51:17 - INFO - __main__ - Step 59285: {'lr': 0.00033685777618792066, 'samples': 11382720, 'steps': 59284, 'loss/train': 1.948175072669983} -08/30/2021 23:51:17 - INFO - __main__ - Step 59286: {'lr': 0.0003368528000049269, 'samples': 11382912, 'steps': 59285, 'loss/train': 1.2594410181045532} -08/30/2021 23:51:18 - INFO - __main__ - Step 59287: {'lr': 0.00033684782378279847, 'samples': 11383104, 'steps': 59286, 'loss/train': 1.8910175561904907} -08/30/2021 23:51:18 - INFO - __main__ - Step 59288: {'lr': 0.0003368428475215378, 'samples': 11383296, 'steps': 59287, 'loss/train': 1.1009361743927002} -08/30/2021 23:51:20 - INFO - __main__ - Step 59289: {'lr': 0.00033683787122114713, 'samples': 11383488, 'steps': 59288, 'loss/train': 3.395280361175537} -08/30/2021 23:51:20 - INFO - __main__ - Step 59290: {'lr': 0.0003368328948816286, 'samples': 11383680, 'steps': 59289, 'loss/train': 0.5369886755943298} -08/30/2021 23:51:21 - INFO - __main__ - Step 59291: {'lr': 0.0003368279185029845, 'samples': 11383872, 'steps': 59290, 'loss/train': 1.105175495147705} -08/30/2021 23:51:21 - INFO - __main__ - Step 59292: {'lr': 0.0003368229420852171, 'samples': 11384064, 'steps': 59291, 'loss/train': 1.9590833187103271} -08/30/2021 23:51:22 - INFO - __main__ - Step 59293: {'lr': 0.00033681796562832865, 'samples': 11384256, 'steps': 59292, 'loss/train': 1.5062144994735718} -08/30/2021 23:51:23 - INFO - __main__ - Step 59294: {'lr': 0.0003368129891323213, 'samples': 11384448, 'steps': 59293, 'loss/train': 1.5120887756347656} -08/30/2021 23:51:24 - INFO - __main__ - Step 59295: {'lr': 0.0003368080125971974, 'samples': 11384640, 'steps': 59294, 'loss/train': 1.087343692779541} -08/30/2021 23:51:24 - INFO - __main__ - Step 59296: {'lr': 0.00033680303602295913, 'samples': 11384832, 'steps': 59295, 'loss/train': 1.5824439525604248} -08/30/2021 23:51:24 - INFO - __main__ - Step 59297: {'lr': 0.00033679805940960877, 'samples': 11385024, 'steps': 59296, 'loss/train': 0.4324478507041931} -08/30/2021 23:51:25 - INFO - __main__ - Step 59298: {'lr': 0.0003367930827571485, 'samples': 11385216, 'steps': 59297, 'loss/train': 1.225721836090088} -08/30/2021 23:51:27 - INFO - __main__ - Step 59299: {'lr': 0.00033678810606558077, 'samples': 11385408, 'steps': 59298, 'loss/train': 0.47869542241096497} -08/30/2021 23:51:27 - INFO - __main__ - Step 59300: {'lr': 0.00033678312933490753, 'samples': 11385600, 'steps': 59299, 'loss/train': 1.7402771711349487} -08/30/2021 23:51:28 - INFO - __main__ - Step 59301: {'lr': 0.00033677815256513114, 'samples': 11385792, 'steps': 59300, 'loss/train': 1.4555498361587524} -08/30/2021 23:51:28 - INFO - __main__ - Step 59302: {'lr': 0.0003367731757562538, 'samples': 11385984, 'steps': 59301, 'loss/train': 0.8659315705299377} -08/30/2021 23:51:28 - INFO - __main__ - Step 59303: {'lr': 0.0003367681989082779, 'samples': 11386176, 'steps': 59302, 'loss/train': 0.028186127543449402} -08/30/2021 23:51:29 - INFO - __main__ - Step 59304: {'lr': 0.0003367632220212056, 'samples': 11386368, 'steps': 59303, 'loss/train': 1.7209151983261108} -08/30/2021 23:51:30 - INFO - __main__ - Step 59305: {'lr': 0.0003367582450950391, 'samples': 11386560, 'steps': 59304, 'loss/train': 1.6405874490737915} -08/30/2021 23:51:31 - INFO - __main__ - Step 59306: {'lr': 0.0003367532681297807, 'samples': 11386752, 'steps': 59305, 'loss/train': 0.9548050165176392} -08/30/2021 23:51:31 - INFO - __main__ - Step 59307: {'lr': 0.0003367482911254325, 'samples': 11386944, 'steps': 59306, 'loss/train': 1.6253842115402222} -08/30/2021 23:51:31 - INFO - __main__ - Step 59308: {'lr': 0.000336743314081997, 'samples': 11387136, 'steps': 59307, 'loss/train': 0.05865844339132309} -08/30/2021 23:51:32 - INFO - __main__ - Step 59309: {'lr': 0.0003367383369994762, 'samples': 11387328, 'steps': 59308, 'loss/train': 2.0783345699310303} -08/30/2021 23:51:33 - INFO - __main__ - Step 59310: {'lr': 0.0003367333598778725, 'samples': 11387520, 'steps': 59309, 'loss/train': 1.1801239252090454} -08/30/2021 23:51:34 - INFO - __main__ - Step 59311: {'lr': 0.0003367283827171881, 'samples': 11387712, 'steps': 59310, 'loss/train': 1.1335481405258179} -08/30/2021 23:51:34 - INFO - __main__ - Step 59312: {'lr': 0.0003367234055174252, 'samples': 11387904, 'steps': 59311, 'loss/train': 0.7261341214179993} -08/30/2021 23:51:34 - INFO - __main__ - Step 59313: {'lr': 0.00033671842827858605, 'samples': 11388096, 'steps': 59312, 'loss/train': 1.2450182437896729} -08/30/2021 23:51:35 - INFO - __main__ - Step 59314: {'lr': 0.000336713451000673, 'samples': 11388288, 'steps': 59313, 'loss/train': 0.8941906690597534} -08/30/2021 23:51:36 - INFO - __main__ - Step 59315: {'lr': 0.00033670847368368805, 'samples': 11388480, 'steps': 59314, 'loss/train': 0.6869674921035767} -08/30/2021 23:51:37 - INFO - __main__ - Step 59316: {'lr': 0.00033670349632763377, 'samples': 11388672, 'steps': 59315, 'loss/train': 1.5804328918457031} -08/30/2021 23:51:37 - INFO - __main__ - Step 59317: {'lr': 0.0003366985189325121, 'samples': 11388864, 'steps': 59316, 'loss/train': 0.6346843242645264} -08/30/2021 23:51:37 - INFO - __main__ - Step 59318: {'lr': 0.00033669354149832556, 'samples': 11389056, 'steps': 59317, 'loss/train': 1.1809628009796143} -08/30/2021 23:51:38 - INFO - __main__ - Step 59319: {'lr': 0.0003366885640250761, 'samples': 11389248, 'steps': 59318, 'loss/train': 1.1110634803771973} -08/30/2021 23:51:39 - INFO - __main__ - Step 59320: {'lr': 0.00033668358651276614, 'samples': 11389440, 'steps': 59319, 'loss/train': 1.554908275604248} -08/30/2021 23:51:40 - INFO - __main__ - Step 59321: {'lr': 0.000336678608961398, 'samples': 11389632, 'steps': 59320, 'loss/train': 1.4517171382904053} -08/30/2021 23:51:40 - INFO - __main__ - Step 59322: {'lr': 0.00033667363137097374, 'samples': 11389824, 'steps': 59321, 'loss/train': 0.8605591654777527} -08/30/2021 23:51:40 - INFO - __main__ - Step 59323: {'lr': 0.0003366686537414957, 'samples': 11390016, 'steps': 59322, 'loss/train': 0.647480309009552} -08/30/2021 23:51:41 - INFO - __main__ - Step 59324: {'lr': 0.00033666367607296607, 'samples': 11390208, 'steps': 59323, 'loss/train': 1.4006738662719727} -08/30/2021 23:51:41 - INFO - __main__ - Step 59325: {'lr': 0.0003366586983653871, 'samples': 11390400, 'steps': 59324, 'loss/train': 0.8329690098762512} -08/30/2021 23:51:42 - INFO - __main__ - Step 59326: {'lr': 0.0003366537206187611, 'samples': 11390592, 'steps': 59325, 'loss/train': 0.9495279788970947} -08/30/2021 23:51:43 - INFO - __main__ - Step 59327: {'lr': 0.0003366487428330903, 'samples': 11390784, 'steps': 59326, 'loss/train': 1.6387280225753784} -08/30/2021 23:51:43 - INFO - __main__ - Step 59328: {'lr': 0.0003366437650083768, 'samples': 11390976, 'steps': 59327, 'loss/train': 1.099772334098816} -08/30/2021 23:51:44 - INFO - __main__ - Step 59329: {'lr': 0.0003366387871446231, 'samples': 11391168, 'steps': 59328, 'loss/train': 1.3461673259735107} -08/30/2021 23:51:44 - INFO - __main__ - Step 59330: {'lr': 0.00033663380924183123, 'samples': 11391360, 'steps': 59329, 'loss/train': 1.021415114402771} -08/30/2021 23:51:46 - INFO - __main__ - Step 59331: {'lr': 0.0003366288313000035, 'samples': 11391552, 'steps': 59330, 'loss/train': 2.0180437564849854} -08/30/2021 23:51:46 - INFO - __main__ - Step 59332: {'lr': 0.00033662385331914216, 'samples': 11391744, 'steps': 59331, 'loss/train': 1.7529054880142212} -08/30/2021 23:51:46 - INFO - __main__ - Step 59333: {'lr': 0.0003366188752992495, 'samples': 11391936, 'steps': 59332, 'loss/train': 1.6668756008148193} -08/30/2021 23:51:47 - INFO - __main__ - Step 59334: {'lr': 0.00033661389724032765, 'samples': 11392128, 'steps': 59333, 'loss/train': 0.9454957842826843} -08/30/2021 23:51:47 - INFO - __main__ - Step 59335: {'lr': 0.0003366089191423789, 'samples': 11392320, 'steps': 59334, 'loss/train': 1.3477146625518799} -08/30/2021 23:51:49 - INFO - __main__ - Step 59336: {'lr': 0.00033660394100540553, 'samples': 11392512, 'steps': 59335, 'loss/train': 1.110459804534912} -08/30/2021 23:51:49 - INFO - __main__ - Step 59337: {'lr': 0.00033659896282940975, 'samples': 11392704, 'steps': 59336, 'loss/train': 1.854459285736084} -08/30/2021 23:51:50 - INFO - __main__ - Step 59338: {'lr': 0.0003365939846143938, 'samples': 11392896, 'steps': 59337, 'loss/train': 1.4341622591018677} -08/30/2021 23:51:50 - INFO - __main__ - Step 59339: {'lr': 0.00033658900636036, 'samples': 11393088, 'steps': 59338, 'loss/train': 0.17963233590126038} -08/30/2021 23:51:50 - INFO - __main__ - Step 59340: {'lr': 0.00033658402806731054, 'samples': 11393280, 'steps': 59339, 'loss/train': 1.1999081373214722} -08/30/2021 23:51:51 - INFO - __main__ - Step 59341: {'lr': 0.00033657904973524754, 'samples': 11393472, 'steps': 59340, 'loss/train': 1.6364575624465942} -08/30/2021 23:51:53 - INFO - __main__ - Step 59342: {'lr': 0.00033657407136417343, 'samples': 11393664, 'steps': 59341, 'loss/train': 1.584562063217163} -08/30/2021 23:51:53 - INFO - __main__ - Step 59343: {'lr': 0.0003365690929540904, 'samples': 11393856, 'steps': 59342, 'loss/train': 1.4495015144348145} -08/30/2021 23:51:54 - INFO - __main__ - Step 59344: {'lr': 0.0003365641145050006, 'samples': 11394048, 'steps': 59343, 'loss/train': 1.253187894821167} -08/30/2021 23:51:54 - INFO - __main__ - Step 59345: {'lr': 0.0003365591360169064, 'samples': 11394240, 'steps': 59344, 'loss/train': 1.6525559425354004} -08/30/2021 23:51:54 - INFO - __main__ - Step 59346: {'lr': 0.00033655415748981, 'samples': 11394432, 'steps': 59345, 'loss/train': 1.1778801679611206} -08/30/2021 23:51:56 - INFO - __main__ - Step 59347: {'lr': 0.00033654917892371363, 'samples': 11394624, 'steps': 59346, 'loss/train': 0.9295195937156677} -08/30/2021 23:51:56 - INFO - __main__ - Step 59348: {'lr': 0.00033654420031861953, 'samples': 11394816, 'steps': 59347, 'loss/train': 1.1585581302642822} -08/30/2021 23:51:57 - INFO - __main__ - Step 59349: {'lr': 0.0003365392216745299, 'samples': 11395008, 'steps': 59348, 'loss/train': 1.3422008752822876} -08/30/2021 23:51:57 - INFO - __main__ - Step 59350: {'lr': 0.0003365342429914471, 'samples': 11395200, 'steps': 59349, 'loss/train': 0.6726939082145691} -08/30/2021 23:51:57 - INFO - __main__ - Step 59351: {'lr': 0.0003365292642693733, 'samples': 11395392, 'steps': 59350, 'loss/train': 0.6640406847000122} -08/30/2021 23:51:59 - INFO - __main__ - Step 59352: {'lr': 0.0003365242855083107, 'samples': 11395584, 'steps': 59351, 'loss/train': 1.1594438552856445} -08/30/2021 23:51:59 - INFO - __main__ - Step 59353: {'lr': 0.00033651930670826157, 'samples': 11395776, 'steps': 59352, 'loss/train': 1.3292087316513062} -08/30/2021 23:52:00 - INFO - __main__ - Step 59354: {'lr': 0.0003365143278692283, 'samples': 11395968, 'steps': 59353, 'loss/train': 1.1059421300888062} -08/30/2021 23:52:00 - INFO - __main__ - Step 59355: {'lr': 0.0003365093489912129, 'samples': 11396160, 'steps': 59354, 'loss/train': 1.8915578126907349} -08/30/2021 23:52:00 - INFO - __main__ - Step 59356: {'lr': 0.00033650437007421775, 'samples': 11396352, 'steps': 59355, 'loss/train': 1.1315854787826538} -08/30/2021 23:52:01 - INFO - __main__ - Step 59357: {'lr': 0.0003364993911182451, 'samples': 11396544, 'steps': 59356, 'loss/train': 1.7106071710586548} -08/30/2021 23:52:02 - INFO - __main__ - Step 59358: {'lr': 0.0003364944121232971, 'samples': 11396736, 'steps': 59357, 'loss/train': 1.3781297206878662} -08/30/2021 23:52:03 - INFO - __main__ - Step 59359: {'lr': 0.0003364894330893761, 'samples': 11396928, 'steps': 59358, 'loss/train': 1.326269268989563} -08/30/2021 23:52:03 - INFO - __main__ - Step 59360: {'lr': 0.0003364844540164843, 'samples': 11397120, 'steps': 59359, 'loss/train': 1.568508267402649} -08/30/2021 23:52:03 - INFO - __main__ - Step 59361: {'lr': 0.00033647947490462386, 'samples': 11397312, 'steps': 59360, 'loss/train': 1.4494833946228027} -08/30/2021 23:52:04 - INFO - __main__ - Step 59362: {'lr': 0.0003364744957537972, 'samples': 11397504, 'steps': 59361, 'loss/train': 1.247589111328125} -08/30/2021 23:52:05 - INFO - __main__ - Step 59363: {'lr': 0.00033646951656400635, 'samples': 11397696, 'steps': 59362, 'loss/train': 1.2490839958190918} -08/30/2021 23:52:06 - INFO - __main__ - Step 59364: {'lr': 0.0003364645373352538, 'samples': 11397888, 'steps': 59363, 'loss/train': 1.6518312692642212} -08/30/2021 23:52:06 - INFO - __main__ - Step 59365: {'lr': 0.00033645955806754156, 'samples': 11398080, 'steps': 59364, 'loss/train': 1.267189621925354} -08/30/2021 23:52:06 - INFO - __main__ - Step 59366: {'lr': 0.00033645457876087205, 'samples': 11398272, 'steps': 59365, 'loss/train': 1.0230413675308228} -08/30/2021 23:52:07 - INFO - __main__ - Step 59367: {'lr': 0.0003364495994152474, 'samples': 11398464, 'steps': 59366, 'loss/train': 1.295203685760498} -08/30/2021 23:52:08 - INFO - __main__ - Step 59368: {'lr': 0.00033644462003066996, 'samples': 11398656, 'steps': 59367, 'loss/train': 0.8491498827934265} -08/30/2021 23:52:09 - INFO - __main__ - Step 59369: {'lr': 0.00033643964060714183, 'samples': 11398848, 'steps': 59368, 'loss/train': 1.7447905540466309} -08/30/2021 23:52:09 - INFO - __main__ - Step 59370: {'lr': 0.00033643466114466537, 'samples': 11399040, 'steps': 59369, 'loss/train': 1.0838088989257812} -08/30/2021 23:52:09 - INFO - __main__ - Step 59371: {'lr': 0.0003364296816432428, 'samples': 11399232, 'steps': 59370, 'loss/train': 1.4862943887710571} -08/30/2021 23:52:10 - INFO - __main__ - Step 59372: {'lr': 0.0003364247021028763, 'samples': 11399424, 'steps': 59371, 'loss/train': 2.0120232105255127} -08/30/2021 23:52:11 - INFO - __main__ - Step 59373: {'lr': 0.0003364197225235682, 'samples': 11399616, 'steps': 59372, 'loss/train': 0.9148479700088501} -08/30/2021 23:52:12 - INFO - __main__ - Step 59374: {'lr': 0.0003364147429053207, 'samples': 11399808, 'steps': 59373, 'loss/train': 0.7984991073608398} -08/30/2021 23:52:12 - INFO - __main__ - Step 59375: {'lr': 0.00033640976324813605, 'samples': 11400000, 'steps': 59374, 'loss/train': 1.5747536420822144} -08/30/2021 23:52:12 - INFO - __main__ - Step 59376: {'lr': 0.00033640478355201646, 'samples': 11400192, 'steps': 59375, 'loss/train': 1.3024396896362305} -08/30/2021 23:52:13 - INFO - __main__ - Step 59377: {'lr': 0.00033639980381696425, 'samples': 11400384, 'steps': 59376, 'loss/train': 0.5121721625328064} -08/30/2021 23:52:14 - INFO - __main__ - Step 59378: {'lr': 0.0003363948240429816, 'samples': 11400576, 'steps': 59377, 'loss/train': 1.3542097806930542} -08/30/2021 23:52:15 - INFO - __main__ - Step 59379: {'lr': 0.0003363898442300708, 'samples': 11400768, 'steps': 59378, 'loss/train': 0.9155076146125793} -08/30/2021 23:52:15 - INFO - __main__ - Step 59380: {'lr': 0.0003363848643782341, 'samples': 11400960, 'steps': 59379, 'loss/train': 1.4796979427337646} -08/30/2021 23:52:16 - INFO - __main__ - Step 59381: {'lr': 0.00033637988448747365, 'samples': 11401152, 'steps': 59380, 'loss/train': 0.8945176601409912} -08/30/2021 23:52:16 - INFO - __main__ - Step 59382: {'lr': 0.00033637490455779175, 'samples': 11401344, 'steps': 59381, 'loss/train': 1.4898449182510376} -08/30/2021 23:52:16 - INFO - __main__ - Step 59383: {'lr': 0.0003363699245891907, 'samples': 11401536, 'steps': 59382, 'loss/train': 1.3867021799087524} -08/30/2021 23:52:17 - INFO - __main__ - Step 59384: {'lr': 0.00033636494458167267, 'samples': 11401728, 'steps': 59383, 'loss/train': 5.8033928871154785} -08/30/2021 23:52:18 - INFO - __main__ - Step 59385: {'lr': 0.00033635996453523987, 'samples': 11401920, 'steps': 59384, 'loss/train': 0.8983581066131592} -08/30/2021 23:52:19 - INFO - __main__ - Step 59386: {'lr': 0.0003363549844498947, 'samples': 11402112, 'steps': 59385, 'loss/train': 1.5056425333023071} -08/30/2021 23:52:19 - INFO - __main__ - Step 59387: {'lr': 0.00033635000432563926, 'samples': 11402304, 'steps': 59386, 'loss/train': 0.9520968198776245} -08/30/2021 23:52:19 - INFO - __main__ - Step 59388: {'lr': 0.0003363450241624759, 'samples': 11402496, 'steps': 59387, 'loss/train': 1.5993014574050903} -08/30/2021 23:52:20 - INFO - __main__ - Step 59389: {'lr': 0.00033634004396040673, 'samples': 11402688, 'steps': 59388, 'loss/train': 0.9830499291419983} -08/30/2021 23:52:21 - INFO - __main__ - Step 59390: {'lr': 0.0003363350637194341, 'samples': 11402880, 'steps': 59389, 'loss/train': 1.2680844068527222} -08/30/2021 23:52:22 - INFO - __main__ - Step 59391: {'lr': 0.0003363300834395602, 'samples': 11403072, 'steps': 59390, 'loss/train': 1.7563400268554688} -08/30/2021 23:52:22 - INFO - __main__ - Step 59392: {'lr': 0.0003363251031207873, 'samples': 11403264, 'steps': 59391, 'loss/train': 1.650937557220459} -08/30/2021 23:52:22 - INFO - __main__ - Step 59393: {'lr': 0.00033632012276311763, 'samples': 11403456, 'steps': 59392, 'loss/train': 1.5559488534927368} -08/30/2021 23:52:23 - INFO - __main__ - Step 59394: {'lr': 0.00033631514236655345, 'samples': 11403648, 'steps': 59393, 'loss/train': 1.7367321252822876} -08/30/2021 23:52:25 - INFO - __main__ - Step 59395: {'lr': 0.00033631016193109704, 'samples': 11403840, 'steps': 59394, 'loss/train': 1.3136630058288574} -08/30/2021 23:52:25 - INFO - __main__ - Step 59396: {'lr': 0.00033630518145675057, 'samples': 11404032, 'steps': 59395, 'loss/train': 1.7318987846374512} -08/30/2021 23:52:26 - INFO - __main__ - Step 59397: {'lr': 0.0003363002009435163, 'samples': 11404224, 'steps': 59396, 'loss/train': 1.2763962745666504} -08/30/2021 23:52:26 - INFO - __main__ - Step 59398: {'lr': 0.00033629522039139656, 'samples': 11404416, 'steps': 59397, 'loss/train': 0.9393520951271057} -08/30/2021 23:52:26 - INFO - __main__ - Step 59399: {'lr': 0.00033629023980039346, 'samples': 11404608, 'steps': 59398, 'loss/train': 0.5364485383033752} -08/30/2021 23:52:28 - INFO - __main__ - Step 59400: {'lr': 0.00033628525917050935, 'samples': 11404800, 'steps': 59399, 'loss/train': 0.8415135741233826} -08/30/2021 23:52:28 - INFO - __main__ - Step 59401: {'lr': 0.0003362802785017464, 'samples': 11404992, 'steps': 59400, 'loss/train': 1.508277416229248} -08/30/2021 23:52:29 - INFO - __main__ - Step 59402: {'lr': 0.00033627529779410695, 'samples': 11405184, 'steps': 59401, 'loss/train': 0.9456004500389099} -08/30/2021 23:52:29 - INFO - __main__ - Step 59403: {'lr': 0.0003362703170475931, 'samples': 11405376, 'steps': 59402, 'loss/train': 1.3428499698638916} -08/30/2021 23:52:29 - INFO - __main__ - Step 59404: {'lr': 0.00033626533626220724, 'samples': 11405568, 'steps': 59403, 'loss/train': 1.3293548822402954} -08/30/2021 23:52:31 - INFO - __main__ - Step 59405: {'lr': 0.0003362603554379515, 'samples': 11405760, 'steps': 59404, 'loss/train': 0.9952874183654785} -08/30/2021 23:52:31 - INFO - __main__ - Step 59406: {'lr': 0.0003362553745748281, 'samples': 11405952, 'steps': 59405, 'loss/train': 1.782294511795044} -08/30/2021 23:52:32 - INFO - __main__ - Step 59407: {'lr': 0.00033625039367283957, 'samples': 11406144, 'steps': 59406, 'loss/train': 1.5301787853240967} -08/30/2021 23:52:32 - INFO - __main__ - Step 59408: {'lr': 0.00033624541273198785, 'samples': 11406336, 'steps': 59407, 'loss/train': 1.4580206871032715} -08/30/2021 23:52:32 - INFO - __main__ - Step 59409: {'lr': 0.0003362404317522752, 'samples': 11406528, 'steps': 59408, 'loss/train': 1.8322279453277588} -08/30/2021 23:52:34 - INFO - __main__ - Step 59410: {'lr': 0.000336235450733704, 'samples': 11406720, 'steps': 59409, 'loss/train': 0.08567579835653305} -08/30/2021 23:52:35 - INFO - __main__ - Step 59411: {'lr': 0.00033623046967627647, 'samples': 11406912, 'steps': 59410, 'loss/train': 0.27010083198547363} -08/30/2021 23:52:35 - INFO - __main__ - Step 59412: {'lr': 0.00033622548857999477, 'samples': 11407104, 'steps': 59411, 'loss/train': 0.9477778673171997} -08/30/2021 23:52:35 - INFO - __main__ - Step 59413: {'lr': 0.00033622050744486117, 'samples': 11407296, 'steps': 59412, 'loss/train': 1.8144454956054688} -08/30/2021 23:52:36 - INFO - __main__ - Step 59414: {'lr': 0.000336215526270878, 'samples': 11407488, 'steps': 59413, 'loss/train': 1.3649078607559204} -08/30/2021 23:52:37 - INFO - __main__ - Step 59415: {'lr': 0.00033621054505804745, 'samples': 11407680, 'steps': 59414, 'loss/train': 0.09282448887825012} -08/30/2021 23:52:38 - INFO - __main__ - Step 59416: {'lr': 0.0003362055638063717, 'samples': 11407872, 'steps': 59415, 'loss/train': 1.3905246257781982} -08/30/2021 23:52:38 - INFO - __main__ - Step 59417: {'lr': 0.00033620058251585314, 'samples': 11408064, 'steps': 59416, 'loss/train': 0.6932212114334106} -08/30/2021 23:52:38 - INFO - __main__ - Step 59418: {'lr': 0.00033619560118649383, 'samples': 11408256, 'steps': 59417, 'loss/train': 1.1944527626037598} -08/30/2021 23:52:39 - INFO - __main__ - Step 59419: {'lr': 0.0003361906198182961, 'samples': 11408448, 'steps': 59418, 'loss/train': 1.8040827512741089} -08/30/2021 23:52:39 - INFO - __main__ - Step 59420: {'lr': 0.0003361856384112623, 'samples': 11408640, 'steps': 59419, 'loss/train': 1.327609896659851} -08/30/2021 23:52:41 - INFO - __main__ - Step 59421: {'lr': 0.00033618065696539457, 'samples': 11408832, 'steps': 59420, 'loss/train': 1.1794135570526123} -08/30/2021 23:52:41 - INFO - __main__ - Step 59422: {'lr': 0.00033617567548069517, 'samples': 11409024, 'steps': 59421, 'loss/train': 0.27892613410949707} -08/30/2021 23:52:41 - INFO - __main__ - Step 59423: {'lr': 0.00033617069395716626, 'samples': 11409216, 'steps': 59422, 'loss/train': 1.4374927282333374} -08/30/2021 23:52:42 - INFO - __main__ - Step 59424: {'lr': 0.0003361657123948103, 'samples': 11409408, 'steps': 59423, 'loss/train': 1.213124394416809} -08/30/2021 23:52:42 - INFO - __main__ - Step 59425: {'lr': 0.00033616073079362923, 'samples': 11409600, 'steps': 59424, 'loss/train': 0.9420284032821655} -08/30/2021 23:52:44 - INFO - __main__ - Step 59426: {'lr': 0.00033615574915362556, 'samples': 11409792, 'steps': 59425, 'loss/train': 2.133023262023926} -08/30/2021 23:52:44 - INFO - __main__ - Step 59427: {'lr': 0.0003361507674748015, 'samples': 11409984, 'steps': 59426, 'loss/train': 1.1065961122512817} -08/30/2021 23:52:45 - INFO - __main__ - Step 59428: {'lr': 0.00033614578575715914, 'samples': 11410176, 'steps': 59427, 'loss/train': 1.06520676612854} -08/30/2021 23:52:45 - INFO - __main__ - Step 59429: {'lr': 0.0003361408040007008, 'samples': 11410368, 'steps': 59428, 'loss/train': 0.032700277864933014} -08/30/2021 23:52:45 - INFO - __main__ - Step 59430: {'lr': 0.00033613582220542884, 'samples': 11410560, 'steps': 59429, 'loss/train': 1.1022206544876099} -08/30/2021 23:52:47 - INFO - __main__ - Step 59431: {'lr': 0.00033613084037134534, 'samples': 11410752, 'steps': 59430, 'loss/train': 1.8937164545059204} -08/30/2021 23:52:48 - INFO - __main__ - Step 59432: {'lr': 0.00033612585849845256, 'samples': 11410944, 'steps': 59431, 'loss/train': 1.244881510734558} -08/30/2021 23:52:48 - INFO - __main__ - Step 59433: {'lr': 0.00033612087658675287, 'samples': 11411136, 'steps': 59432, 'loss/train': 1.126632809638977} -08/30/2021 23:52:48 - INFO - __main__ - Step 59434: {'lr': 0.0003361158946362485, 'samples': 11411328, 'steps': 59433, 'loss/train': 0.6648529767990112} -08/30/2021 23:52:49 - INFO - __main__ - Step 59435: {'lr': 0.00033611091264694156, 'samples': 11411520, 'steps': 59434, 'loss/train': 1.1737480163574219} -08/30/2021 23:52:49 - INFO - __main__ - Step 59436: {'lr': 0.0003361059306188344, 'samples': 11411712, 'steps': 59435, 'loss/train': 0.9358706474304199} -08/30/2021 23:52:51 - INFO - __main__ - Step 59437: {'lr': 0.0003361009485519292, 'samples': 11411904, 'steps': 59436, 'loss/train': 0.14283666014671326} -08/30/2021 23:52:51 - INFO - __main__ - Step 59438: {'lr': 0.0003360959664462282, 'samples': 11412096, 'steps': 59437, 'loss/train': 0.18070244789123535} -08/30/2021 23:52:52 - INFO - __main__ - Step 59439: {'lr': 0.0003360909843017338, 'samples': 11412288, 'steps': 59438, 'loss/train': 0.04775748774409294} -08/30/2021 23:52:52 - INFO - __main__ - Step 59440: {'lr': 0.0003360860021184481, 'samples': 11412480, 'steps': 59439, 'loss/train': 1.5097215175628662} -08/30/2021 23:52:52 - INFO - __main__ - Step 59441: {'lr': 0.0003360810198963733, 'samples': 11412672, 'steps': 59440, 'loss/train': 1.2952772378921509} -08/30/2021 23:52:54 - INFO - __main__ - Step 59442: {'lr': 0.0003360760376355118, 'samples': 11412864, 'steps': 59441, 'loss/train': 1.2062057256698608} -08/30/2021 23:52:54 - INFO - __main__ - Step 59443: {'lr': 0.00033607105533586573, 'samples': 11413056, 'steps': 59442, 'loss/train': 1.3953914642333984} -08/30/2021 23:52:55 - INFO - __main__ - Step 59444: {'lr': 0.0003360660729974374, 'samples': 11413248, 'steps': 59443, 'loss/train': 1.484487533569336} -08/30/2021 23:52:55 - INFO - __main__ - Step 59445: {'lr': 0.00033606109062022906, 'samples': 11413440, 'steps': 59444, 'loss/train': 0.9972631931304932} -08/30/2021 23:52:55 - INFO - __main__ - Step 59446: {'lr': 0.0003360561082042428, 'samples': 11413632, 'steps': 59445, 'loss/train': 1.2883492708206177} -08/30/2021 23:52:56 - INFO - __main__ - Step 59447: {'lr': 0.00033605112574948106, 'samples': 11413824, 'steps': 59446, 'loss/train': 1.44814133644104} -08/30/2021 23:52:58 - INFO - __main__ - Step 59448: {'lr': 0.000336046143255946, 'samples': 11414016, 'steps': 59447, 'loss/train': 1.2546206712722778} -08/30/2021 23:52:58 - INFO - __main__ - Step 59449: {'lr': 0.0003360411607236399, 'samples': 11414208, 'steps': 59448, 'loss/train': 0.024742096662521362} -08/30/2021 23:52:58 - INFO - __main__ - Step 59450: {'lr': 0.0003360361781525649, 'samples': 11414400, 'steps': 59449, 'loss/train': 0.09804750978946686} -08/30/2021 23:52:59 - INFO - __main__ - Step 59451: {'lr': 0.00033603119554272343, 'samples': 11414592, 'steps': 59450, 'loss/train': 0.9889927506446838} -08/30/2021 23:52:59 - INFO - __main__ - Step 59452: {'lr': 0.0003360262128941176, 'samples': 11414784, 'steps': 59451, 'loss/train': 0.8895063400268555} -08/30/2021 23:52:59 - INFO - __main__ - Step 59453: {'lr': 0.00033602123020674965, 'samples': 11414976, 'steps': 59452, 'loss/train': 0.8405062556266785} -08/30/2021 23:53:01 - INFO - __main__ - Step 59454: {'lr': 0.0003360162474806219, 'samples': 11415168, 'steps': 59453, 'loss/train': 1.0882436037063599} -08/30/2021 23:53:02 - INFO - __main__ - Step 59455: {'lr': 0.0003360112647157366, 'samples': 11415360, 'steps': 59454, 'loss/train': 1.3447877168655396} -08/30/2021 23:53:02 - INFO - __main__ - Step 59456: {'lr': 0.0003360062819120958, 'samples': 11415552, 'steps': 59455, 'loss/train': 1.5456767082214355} -08/30/2021 23:53:02 - INFO - __main__ - Step 59457: {'lr': 0.000336001299069702, 'samples': 11415744, 'steps': 59456, 'loss/train': 1.0125421285629272} -08/30/2021 23:53:03 - INFO - __main__ - Step 59458: {'lr': 0.0003359963161885573, 'samples': 11415936, 'steps': 59457, 'loss/train': 1.1881515979766846} -08/30/2021 23:53:04 - INFO - __main__ - Step 59459: {'lr': 0.000335991333268664, 'samples': 11416128, 'steps': 59458, 'loss/train': 1.4432138204574585} -08/30/2021 23:53:05 - INFO - __main__ - Step 59460: {'lr': 0.0003359863503100244, 'samples': 11416320, 'steps': 59459, 'loss/train': 1.9680920839309692} -08/30/2021 23:53:05 - INFO - __main__ - Step 59461: {'lr': 0.0003359813673126406, 'samples': 11416512, 'steps': 59460, 'loss/train': 1.1212599277496338} -08/30/2021 23:53:06 - INFO - __main__ - Step 59462: {'lr': 0.000335976384276515, 'samples': 11416704, 'steps': 59461, 'loss/train': 1.3377097845077515} -08/30/2021 23:53:06 - INFO - __main__ - Step 59463: {'lr': 0.0003359714012016497, 'samples': 11416896, 'steps': 59462, 'loss/train': 1.8361855745315552} -08/30/2021 23:53:07 - INFO - __main__ - Step 59464: {'lr': 0.000335966418088047, 'samples': 11417088, 'steps': 59463, 'loss/train': 1.5688608884811401} -08/30/2021 23:53:08 - INFO - __main__ - Step 59465: {'lr': 0.0003359614349357092, 'samples': 11417280, 'steps': 59464, 'loss/train': 1.2281084060668945} -08/30/2021 23:53:08 - INFO - __main__ - Step 59466: {'lr': 0.00033595645174463843, 'samples': 11417472, 'steps': 59465, 'loss/train': 1.424838900566101} -08/30/2021 23:53:09 - INFO - __main__ - Step 59467: {'lr': 0.0003359514685148371, 'samples': 11417664, 'steps': 59466, 'loss/train': 0.48817774653434753} -08/30/2021 23:53:09 - INFO - __main__ - Step 59468: {'lr': 0.0003359464852463074, 'samples': 11417856, 'steps': 59467, 'loss/train': 1.618391752243042} -08/30/2021 23:53:11 - INFO - __main__ - Step 59469: {'lr': 0.00033594150193905144, 'samples': 11418048, 'steps': 59468, 'loss/train': 1.1780403852462769} -08/30/2021 23:53:11 - INFO - __main__ - Step 59470: {'lr': 0.0003359365185930716, 'samples': 11418240, 'steps': 59469, 'loss/train': 1.3403642177581787} -08/30/2021 23:53:12 - INFO - __main__ - Step 59471: {'lr': 0.00033593153520837006, 'samples': 11418432, 'steps': 59470, 'loss/train': 1.5577113628387451} -08/30/2021 23:53:12 - INFO - __main__ - Step 59472: {'lr': 0.0003359265517849491, 'samples': 11418624, 'steps': 59471, 'loss/train': 1.8197662830352783} -08/30/2021 23:53:12 - INFO - __main__ - Step 59473: {'lr': 0.000335921568322811, 'samples': 11418816, 'steps': 59472, 'loss/train': 1.2587448358535767} -08/30/2021 23:53:13 - INFO - __main__ - Step 59474: {'lr': 0.00033591658482195796, 'samples': 11419008, 'steps': 59473, 'loss/train': 1.377042531967163} -08/30/2021 23:53:14 - INFO - __main__ - Step 59475: {'lr': 0.0003359116012823923, 'samples': 11419200, 'steps': 59474, 'loss/train': 0.890034019947052} -08/30/2021 23:53:15 - INFO - __main__ - Step 59476: {'lr': 0.0003359066177041161, 'samples': 11419392, 'steps': 59475, 'loss/train': 0.7871702313423157} -08/30/2021 23:53:15 - INFO - __main__ - Step 59477: {'lr': 0.0003359016340871317, 'samples': 11419584, 'steps': 59476, 'loss/train': 1.1494500637054443} -08/30/2021 23:53:15 - INFO - __main__ - Step 59478: {'lr': 0.0003358966504314414, 'samples': 11419776, 'steps': 59477, 'loss/train': 1.4305261373519897} -08/30/2021 23:53:16 - INFO - __main__ - Step 59479: {'lr': 0.00033589166673704735, 'samples': 11419968, 'steps': 59478, 'loss/train': 1.5579413175582886} -08/30/2021 23:53:17 - INFO - __main__ - Step 59480: {'lr': 0.0003358866830039519, 'samples': 11420160, 'steps': 59479, 'loss/train': 0.15474049746990204} -08/30/2021 23:53:18 - INFO - __main__ - Step 59481: {'lr': 0.0003358816992321572, 'samples': 11420352, 'steps': 59480, 'loss/train': 1.7838441133499146} -08/30/2021 23:53:18 - INFO - __main__ - Step 59482: {'lr': 0.0003358767154216655, 'samples': 11420544, 'steps': 59481, 'loss/train': 1.1977540254592896} -08/30/2021 23:53:18 - INFO - __main__ - Step 59483: {'lr': 0.00033587173157247915, 'samples': 11420736, 'steps': 59482, 'loss/train': 0.8217096328735352} -08/30/2021 23:53:19 - INFO - __main__ - Step 59484: {'lr': 0.00033586674768460025, 'samples': 11420928, 'steps': 59483, 'loss/train': 0.8427931666374207} -08/30/2021 23:53:20 - INFO - __main__ - Step 59485: {'lr': 0.0003358617637580311, 'samples': 11421120, 'steps': 59484, 'loss/train': 1.143505573272705} -08/30/2021 23:53:21 - INFO - __main__ - Step 59486: {'lr': 0.00033585677979277407, 'samples': 11421312, 'steps': 59485, 'loss/train': 1.8316614627838135} -08/30/2021 23:53:21 - INFO - __main__ - Step 59487: {'lr': 0.00033585179578883123, 'samples': 11421504, 'steps': 59486, 'loss/train': 1.2786799669265747} -08/30/2021 23:53:21 - INFO - __main__ - Step 59488: {'lr': 0.00033584681174620497, 'samples': 11421696, 'steps': 59487, 'loss/train': 1.5275200605392456} -08/30/2021 23:53:22 - INFO - __main__ - Step 59489: {'lr': 0.00033584182766489736, 'samples': 11421888, 'steps': 59488, 'loss/train': 1.025773286819458} -08/30/2021 23:53:22 - INFO - __main__ - Step 59490: {'lr': 0.0003358368435449108, 'samples': 11422080, 'steps': 59489, 'loss/train': 1.2890390157699585} -08/30/2021 23:53:24 - INFO - __main__ - Step 59491: {'lr': 0.0003358318593862474, 'samples': 11422272, 'steps': 59490, 'loss/train': 1.0115821361541748} -08/30/2021 23:53:24 - INFO - __main__ - Step 59492: {'lr': 0.0003358268751889096, 'samples': 11422464, 'steps': 59491, 'loss/train': 1.2791686058044434} -08/30/2021 23:53:24 - INFO - __main__ - Step 59493: {'lr': 0.0003358218909528995, 'samples': 11422656, 'steps': 59492, 'loss/train': 1.580369234085083} -08/30/2021 23:53:25 - INFO - __main__ - Step 59494: {'lr': 0.00033581690667821933, 'samples': 11422848, 'steps': 59493, 'loss/train': 0.8855935335159302} -08/30/2021 23:53:25 - INFO - __main__ - Step 59495: {'lr': 0.00033581192236487153, 'samples': 11423040, 'steps': 59494, 'loss/train': 1.394609808921814} -08/30/2021 23:53:27 - INFO - __main__ - Step 59496: {'lr': 0.00033580693801285805, 'samples': 11423232, 'steps': 59495, 'loss/train': 1.3154865503311157} -08/30/2021 23:53:27 - INFO - __main__ - Step 59497: {'lr': 0.0003358019536221814, 'samples': 11423424, 'steps': 59496, 'loss/train': 1.1394550800323486} -08/30/2021 23:53:27 - INFO - __main__ - Step 59498: {'lr': 0.00033579696919284357, 'samples': 11423616, 'steps': 59497, 'loss/train': 1.101121425628662} -08/30/2021 23:53:28 - INFO - __main__ - Step 59499: {'lr': 0.00033579198472484707, 'samples': 11423808, 'steps': 59498, 'loss/train': 0.9729105830192566} -08/30/2021 23:53:28 - INFO - __main__ - Step 59500: {'lr': 0.000335787000218194, 'samples': 11424000, 'steps': 59499, 'loss/train': 0.8507187962532043} -08/30/2021 23:53:30 - INFO - __main__ - Step 59501: {'lr': 0.0003357820156728866, 'samples': 11424192, 'steps': 59500, 'loss/train': 1.3423972129821777} -08/30/2021 23:53:30 - INFO - __main__ - Step 59502: {'lr': 0.0003357770310889272, 'samples': 11424384, 'steps': 59501, 'loss/train': 1.171541452407837} -08/30/2021 23:53:30 - INFO - __main__ - Step 59503: {'lr': 0.0003357720464663179, 'samples': 11424576, 'steps': 59502, 'loss/train': 1.242734432220459} -08/30/2021 23:53:31 - INFO - __main__ - Step 59504: {'lr': 0.0003357670618050611, 'samples': 11424768, 'steps': 59503, 'loss/train': 1.0610122680664062} -08/30/2021 23:53:31 - INFO - __main__ - Step 59505: {'lr': 0.000335762077105159, 'samples': 11424960, 'steps': 59504, 'loss/train': 1.6891008615493774} -08/30/2021 23:53:33 - INFO - __main__ - Step 59506: {'lr': 0.0003357570923666138, 'samples': 11425152, 'steps': 59505, 'loss/train': 1.1201844215393066} -08/30/2021 23:53:34 - INFO - __main__ - Step 59507: {'lr': 0.0003357521075894278, 'samples': 11425344, 'steps': 59506, 'loss/train': 0.989077627658844} -08/30/2021 23:53:34 - INFO - __main__ - Step 59508: {'lr': 0.00033574712277360325, 'samples': 11425536, 'steps': 59507, 'loss/train': 1.706749439239502} -08/30/2021 23:53:34 - INFO - __main__ - Step 59509: {'lr': 0.00033574213791914235, 'samples': 11425728, 'steps': 59508, 'loss/train': 1.0681970119476318} -08/30/2021 23:53:35 - INFO - __main__ - Step 59510: {'lr': 0.00033573715302604736, 'samples': 11425920, 'steps': 59509, 'loss/train': 1.2094299793243408} -08/30/2021 23:53:35 - INFO - __main__ - Step 59511: {'lr': 0.0003357321680943205, 'samples': 11426112, 'steps': 59510, 'loss/train': 1.408000111579895} -08/30/2021 23:53:37 - INFO - __main__ - Step 59512: {'lr': 0.00033572718312396404, 'samples': 11426304, 'steps': 59511, 'loss/train': 1.633359670639038} -08/30/2021 23:53:38 - INFO - __main__ - Step 59513: {'lr': 0.0003357221981149803, 'samples': 11426496, 'steps': 59512, 'loss/train': 1.8050627708435059} -08/30/2021 23:53:38 - INFO - __main__ - Step 59514: {'lr': 0.0003357172130673714, 'samples': 11426688, 'steps': 59513, 'loss/train': 0.9116045236587524} -08/30/2021 23:53:39 - INFO - __main__ - Step 59515: {'lr': 0.00033571222798113977, 'samples': 11426880, 'steps': 59514, 'loss/train': 1.1150002479553223} -08/30/2021 23:53:39 - INFO - __main__ - Step 59516: {'lr': 0.0003357072428562874, 'samples': 11427072, 'steps': 59515, 'loss/train': 1.2428091764450073} -08/30/2021 23:53:39 - INFO - __main__ - Step 59517: {'lr': 0.0003357022576928167, 'samples': 11427264, 'steps': 59516, 'loss/train': 1.238661289215088} -08/30/2021 23:53:40 - INFO - __main__ - Step 59518: {'lr': 0.0003356972724907299, 'samples': 11427456, 'steps': 59517, 'loss/train': 1.9126455783843994} -08/30/2021 23:53:41 - INFO - __main__ - Step 59519: {'lr': 0.0003356922872500292, 'samples': 11427648, 'steps': 59518, 'loss/train': 2.0081751346588135} -08/30/2021 23:53:42 - INFO - __main__ - Step 59520: {'lr': 0.0003356873019707169, 'samples': 11427840, 'steps': 59519, 'loss/train': 1.8880316019058228} -08/30/2021 23:53:42 - INFO - __main__ - Step 59521: {'lr': 0.0003356823166527952, 'samples': 11428032, 'steps': 59520, 'loss/train': 1.7752128839492798} -08/30/2021 23:53:42 - INFO - __main__ - Step 59522: {'lr': 0.00033567733129626645, 'samples': 11428224, 'steps': 59521, 'loss/train': 0.9479182362556458} -08/30/2021 23:53:43 - INFO - __main__ - Step 59523: {'lr': 0.00033567234590113274, 'samples': 11428416, 'steps': 59522, 'loss/train': 1.2158397436141968} -08/30/2021 23:53:45 - INFO - __main__ - Step 59524: {'lr': 0.00033566736046739643, 'samples': 11428608, 'steps': 59523, 'loss/train': 1.3037676811218262} -08/30/2021 23:53:45 - INFO - __main__ - Step 59525: {'lr': 0.0003356623749950597, 'samples': 11428800, 'steps': 59524, 'loss/train': 1.5904158353805542} -08/30/2021 23:53:46 - INFO - __main__ - Step 59526: {'lr': 0.0003356573894841248, 'samples': 11428992, 'steps': 59525, 'loss/train': 0.08511671423912048} -08/30/2021 23:53:46 - INFO - __main__ - Step 59527: {'lr': 0.0003356524039345941, 'samples': 11429184, 'steps': 59526, 'loss/train': 1.3012559413909912} -08/30/2021 23:53:46 - INFO - __main__ - Step 59528: {'lr': 0.00033564741834646967, 'samples': 11429376, 'steps': 59527, 'loss/train': 1.6012877225875854} -08/30/2021 23:53:48 - INFO - __main__ - Step 59529: {'lr': 0.0003356424327197539, 'samples': 11429568, 'steps': 59528, 'loss/train': 1.9932719469070435} -08/30/2021 23:53:48 - INFO - __main__ - Step 59530: {'lr': 0.00033563744705444886, 'samples': 11429760, 'steps': 59529, 'loss/train': 2.1074087619781494} -08/30/2021 23:53:48 - INFO - __main__ - Step 59531: {'lr': 0.000335632461350557, 'samples': 11429952, 'steps': 59530, 'loss/train': 1.8902236223220825} -08/30/2021 23:53:49 - INFO - __main__ - Step 59532: {'lr': 0.00033562747560808044, 'samples': 11430144, 'steps': 59531, 'loss/train': 1.0934573411941528} -08/30/2021 23:53:49 - INFO - __main__ - Step 59533: {'lr': 0.00033562248982702144, 'samples': 11430336, 'steps': 59532, 'loss/train': 1.6786918640136719} -08/30/2021 23:53:51 - INFO - __main__ - Step 59534: {'lr': 0.0003356175040073823, 'samples': 11430528, 'steps': 59533, 'loss/train': 1.8935232162475586} -08/30/2021 23:53:51 - INFO - __main__ - Step 59535: {'lr': 0.0003356125181491653, 'samples': 11430720, 'steps': 59534, 'loss/train': 5.017116546630859} -08/30/2021 23:53:51 - INFO - __main__ - Step 59536: {'lr': 0.0003356075322523725, 'samples': 11430912, 'steps': 59535, 'loss/train': 1.4133442640304565} -08/30/2021 23:53:52 - INFO - __main__ - Step 59537: {'lr': 0.00033560254631700634, 'samples': 11431104, 'steps': 59536, 'loss/train': 1.377843976020813} -08/30/2021 23:53:52 - INFO - __main__ - Step 59538: {'lr': 0.0003355975603430689, 'samples': 11431296, 'steps': 59537, 'loss/train': 1.8543263673782349} -08/30/2021 23:53:52 - INFO - __main__ - Step 59539: {'lr': 0.0003355925743305626, 'samples': 11431488, 'steps': 59538, 'loss/train': 1.44297194480896} -08/30/2021 23:53:54 - INFO - __main__ - Step 59540: {'lr': 0.0003355875882794896, 'samples': 11431680, 'steps': 59539, 'loss/train': 1.0738028287887573} -08/30/2021 23:53:54 - INFO - __main__ - Step 59541: {'lr': 0.00033558260218985214, 'samples': 11431872, 'steps': 59540, 'loss/train': 1.1790761947631836} -08/30/2021 23:53:55 - INFO - __main__ - Step 59542: {'lr': 0.00033557761606165253, 'samples': 11432064, 'steps': 59541, 'loss/train': 1.3438873291015625} -08/30/2021 23:53:55 - INFO - __main__ - Step 59543: {'lr': 0.00033557262989489294, 'samples': 11432256, 'steps': 59542, 'loss/train': 1.1743943691253662} -08/30/2021 23:53:55 - INFO - __main__ - Step 59544: {'lr': 0.0003355676436895756, 'samples': 11432448, 'steps': 59543, 'loss/train': 1.444443702697754} -08/30/2021 23:53:57 - INFO - __main__ - Step 59545: {'lr': 0.0003355626574457029, 'samples': 11432640, 'steps': 59544, 'loss/train': 1.572969675064087} -08/30/2021 23:53:57 - INFO - __main__ - Step 59546: {'lr': 0.00033555767116327686, 'samples': 11432832, 'steps': 59545, 'loss/train': 1.5157380104064941} -08/30/2021 23:53:58 - INFO - __main__ - Step 59547: {'lr': 0.00033555268484229987, 'samples': 11433024, 'steps': 59546, 'loss/train': 1.563647747039795} -08/30/2021 23:53:58 - INFO - __main__ - Step 59548: {'lr': 0.0003355476984827743, 'samples': 11433216, 'steps': 59547, 'loss/train': 1.581427812576294} -08/30/2021 23:53:58 - INFO - __main__ - Step 59549: {'lr': 0.0003355427120847021, 'samples': 11433408, 'steps': 59548, 'loss/train': 1.9217238426208496} -08/30/2021 23:54:00 - INFO - __main__ - Step 59550: {'lr': 0.0003355377256480858, 'samples': 11433600, 'steps': 59549, 'loss/train': 1.5115524530410767} -08/30/2021 23:54:00 - INFO - __main__ - Step 59551: {'lr': 0.00033553273917292744, 'samples': 11433792, 'steps': 59550, 'loss/train': 1.2947574853897095} -08/30/2021 23:54:01 - INFO - __main__ - Step 59552: {'lr': 0.0003355277526592293, 'samples': 11433984, 'steps': 59551, 'loss/train': 1.548445224761963} -08/30/2021 23:54:01 - INFO - __main__ - Step 59553: {'lr': 0.00033552276610699375, 'samples': 11434176, 'steps': 59552, 'loss/train': 1.0060101747512817} -08/30/2021 23:54:01 - INFO - __main__ - Step 59554: {'lr': 0.00033551777951622297, 'samples': 11434368, 'steps': 59553, 'loss/train': 1.2337366342544556} -08/30/2021 23:54:03 - INFO - __main__ - Step 59555: {'lr': 0.0003355127928869192, 'samples': 11434560, 'steps': 59554, 'loss/train': 1.2919800281524658} -08/30/2021 23:54:03 - INFO - __main__ - Step 59556: {'lr': 0.0003355078062190847, 'samples': 11434752, 'steps': 59555, 'loss/train': 1.3907957077026367} -08/30/2021 23:54:04 - INFO - __main__ - Step 59557: {'lr': 0.00033550281951272163, 'samples': 11434944, 'steps': 59556, 'loss/train': 0.7404875755310059} -08/30/2021 23:54:04 - INFO - __main__ - Step 59558: {'lr': 0.0003354978327678323, 'samples': 11435136, 'steps': 59557, 'loss/train': 1.3297829627990723} -08/30/2021 23:54:04 - INFO - __main__ - Step 59559: {'lr': 0.00033549284598441897, 'samples': 11435328, 'steps': 59558, 'loss/train': 1.1501740217208862} -08/30/2021 23:54:06 - INFO - __main__ - Step 59560: {'lr': 0.0003354878591624839, 'samples': 11435520, 'steps': 59559, 'loss/train': 1.3025771379470825} -08/30/2021 23:54:06 - INFO - __main__ - Step 59561: {'lr': 0.0003354828723020294, 'samples': 11435712, 'steps': 59560, 'loss/train': 1.3005484342575073} -08/30/2021 23:54:07 - INFO - __main__ - Step 59562: {'lr': 0.0003354778854030576, 'samples': 11435904, 'steps': 59561, 'loss/train': 1.8889622688293457} -08/30/2021 23:54:07 - INFO - __main__ - Step 59563: {'lr': 0.0003354728984655708, 'samples': 11436096, 'steps': 59562, 'loss/train': 0.100043386220932} -08/30/2021 23:54:08 - INFO - __main__ - Step 59564: {'lr': 0.0003354679114895711, 'samples': 11436288, 'steps': 59563, 'loss/train': 1.8457481861114502} -08/30/2021 23:54:10 - INFO - __main__ - Step 59565: {'lr': 0.000335462924475061, 'samples': 11436480, 'steps': 59564, 'loss/train': 1.0684540271759033} -08/30/2021 23:54:11 - INFO - __main__ - Step 59566: {'lr': 0.00033545793742204255, 'samples': 11436672, 'steps': 59565, 'loss/train': 1.7257028818130493} -08/30/2021 23:54:11 - INFO - __main__ - Step 59567: {'lr': 0.00033545295033051814, 'samples': 11436864, 'steps': 59566, 'loss/train': 2.5105414390563965} -08/30/2021 23:54:11 - INFO - __main__ - Step 59568: {'lr': 0.00033544796320048996, 'samples': 11437056, 'steps': 59567, 'loss/train': 0.9362022280693054} -08/30/2021 23:54:12 - INFO - __main__ - Step 59569: {'lr': 0.0003354429760319602, 'samples': 11437248, 'steps': 59568, 'loss/train': 1.3529255390167236} -08/30/2021 23:54:12 - INFO - __main__ - Step 59570: {'lr': 0.00033543798882493123, 'samples': 11437440, 'steps': 59569, 'loss/train': 0.2671198844909668} -08/30/2021 23:54:13 - INFO - __main__ - Step 59571: {'lr': 0.0003354330015794051, 'samples': 11437632, 'steps': 59570, 'loss/train': 0.12280721217393875} -08/30/2021 23:54:14 - INFO - __main__ - Step 59572: {'lr': 0.00033542801429538424, 'samples': 11437824, 'steps': 59571, 'loss/train': 1.2619775533676147} -08/30/2021 23:54:14 - INFO - __main__ - Step 59573: {'lr': 0.0003354230269728709, 'samples': 11438016, 'steps': 59572, 'loss/train': 0.9547221660614014} -08/30/2021 23:54:15 - INFO - __main__ - Step 59574: {'lr': 0.0003354180396118671, 'samples': 11438208, 'steps': 59573, 'loss/train': 1.591331958770752} -08/30/2021 23:54:15 - INFO - __main__ - Step 59575: {'lr': 0.0003354130522123754, 'samples': 11438400, 'steps': 59574, 'loss/train': 0.8355203866958618} -08/30/2021 23:54:16 - INFO - __main__ - Step 59576: {'lr': 0.0003354080647743978, 'samples': 11438592, 'steps': 59575, 'loss/train': 1.5975719690322876} -08/30/2021 23:54:17 - INFO - __main__ - Step 59577: {'lr': 0.0003354030772979367, 'samples': 11438784, 'steps': 59576, 'loss/train': 0.4746231734752655} -08/30/2021 23:54:17 - INFO - __main__ - Step 59578: {'lr': 0.00033539808978299423, 'samples': 11438976, 'steps': 59577, 'loss/train': 1.2841274738311768} -08/30/2021 23:54:18 - INFO - __main__ - Step 59579: {'lr': 0.0003353931022295728, 'samples': 11439168, 'steps': 59578, 'loss/train': 1.2729490995407104} -08/30/2021 23:54:18 - INFO - __main__ - Step 59580: {'lr': 0.0003353881146376745, 'samples': 11439360, 'steps': 59579, 'loss/train': 1.0510896444320679} -08/30/2021 23:54:19 - INFO - __main__ - Step 59581: {'lr': 0.0003353831270073016, 'samples': 11439552, 'steps': 59580, 'loss/train': 0.9666589498519897} -08/30/2021 23:54:20 - INFO - __main__ - Step 59582: {'lr': 0.0003353781393384564, 'samples': 11439744, 'steps': 59581, 'loss/train': 1.0285776853561401} -08/30/2021 23:54:20 - INFO - __main__ - Step 59583: {'lr': 0.0003353731516311411, 'samples': 11439936, 'steps': 59582, 'loss/train': 1.6774648427963257} -08/30/2021 23:54:20 - INFO - __main__ - Step 59584: {'lr': 0.00033536816388535814, 'samples': 11440128, 'steps': 59583, 'loss/train': 1.4264315366744995} -08/30/2021 23:54:21 - INFO - __main__ - Step 59585: {'lr': 0.0003353631761011094, 'samples': 11440320, 'steps': 59584, 'loss/train': 1.6628700494766235} -08/30/2021 23:54:22 - INFO - __main__ - Step 59586: {'lr': 0.00033535818827839744, 'samples': 11440512, 'steps': 59585, 'loss/train': 1.84689462184906} -08/30/2021 23:54:23 - INFO - __main__ - Step 59587: {'lr': 0.0003353532004172244, 'samples': 11440704, 'steps': 59586, 'loss/train': 2.0278661251068115} -08/30/2021 23:54:23 - INFO - __main__ - Step 59588: {'lr': 0.00033534821251759246, 'samples': 11440896, 'steps': 59587, 'loss/train': 1.2155430316925049} -08/30/2021 23:54:24 - INFO - __main__ - Step 59589: {'lr': 0.00033534322457950396, 'samples': 11441088, 'steps': 59588, 'loss/train': 1.6607884168624878} -08/30/2021 23:54:24 - INFO - __main__ - Step 59590: {'lr': 0.00033533823660296115, 'samples': 11441280, 'steps': 59589, 'loss/train': 2.0612988471984863} -08/30/2021 23:54:26 - INFO - __main__ - Step 59591: {'lr': 0.00033533324858796623, 'samples': 11441472, 'steps': 59590, 'loss/train': 1.382971167564392} -08/30/2021 23:54:26 - INFO - __main__ - Step 59592: {'lr': 0.00033532826053452145, 'samples': 11441664, 'steps': 59591, 'loss/train': 0.9431319236755371} -08/30/2021 23:54:26 - INFO - __main__ - Step 59593: {'lr': 0.00033532327244262906, 'samples': 11441856, 'steps': 59592, 'loss/train': 0.8664615750312805} -08/30/2021 23:54:27 - INFO - __main__ - Step 59594: {'lr': 0.0003353182843122913, 'samples': 11442048, 'steps': 59593, 'loss/train': 1.3683347702026367} -08/30/2021 23:54:27 - INFO - __main__ - Step 59595: {'lr': 0.0003353132961435105, 'samples': 11442240, 'steps': 59594, 'loss/train': 2.2648630142211914} -08/30/2021 23:54:28 - INFO - __main__ - Step 59596: {'lr': 0.00033530830793628886, 'samples': 11442432, 'steps': 59595, 'loss/train': 1.2228997945785522} -08/30/2021 23:54:29 - INFO - __main__ - Step 59597: {'lr': 0.00033530331969062853, 'samples': 11442624, 'steps': 59596, 'loss/train': 0.13200846314430237} -08/30/2021 23:54:30 - INFO - __main__ - Step 59598: {'lr': 0.00033529833140653187, 'samples': 11442816, 'steps': 59597, 'loss/train': 0.8539416193962097} -08/30/2021 23:54:30 - INFO - __main__ - Step 59599: {'lr': 0.0003352933430840011, 'samples': 11443008, 'steps': 59598, 'loss/train': 1.2471369504928589} -08/30/2021 23:54:30 - INFO - __main__ - Step 59600: {'lr': 0.0003352883547230385, 'samples': 11443200, 'steps': 59599, 'loss/train': 1.1926660537719727} -08/30/2021 23:54:31 - INFO - __main__ - Step 59601: {'lr': 0.00033528336632364624, 'samples': 11443392, 'steps': 59600, 'loss/train': 1.6726816892623901} -08/30/2021 23:54:32 - INFO - __main__ - Step 59602: {'lr': 0.00033527837788582663, 'samples': 11443584, 'steps': 59601, 'loss/train': 2.3026862144470215} -08/30/2021 23:54:33 - INFO - __main__ - Step 59603: {'lr': 0.00033527338940958197, 'samples': 11443776, 'steps': 59602, 'loss/train': 1.251391887664795} -08/30/2021 23:54:33 - INFO - __main__ - Step 59604: {'lr': 0.00033526840089491433, 'samples': 11443968, 'steps': 59603, 'loss/train': 1.8059701919555664} -08/30/2021 23:54:34 - INFO - __main__ - Step 59605: {'lr': 0.00033526341234182613, 'samples': 11444160, 'steps': 59604, 'loss/train': 1.0970380306243896} -08/30/2021 23:54:34 - INFO - __main__ - Step 59606: {'lr': 0.00033525842375031946, 'samples': 11444352, 'steps': 59605, 'loss/train': 1.2555947303771973} -08/30/2021 23:54:35 - INFO - __main__ - Step 59607: {'lr': 0.00033525343512039673, 'samples': 11444544, 'steps': 59606, 'loss/train': 1.5133765935897827} -08/30/2021 23:54:36 - INFO - __main__ - Step 59608: {'lr': 0.0003352484464520601, 'samples': 11444736, 'steps': 59607, 'loss/train': 1.4554907083511353} -08/30/2021 23:54:36 - INFO - __main__ - Step 59609: {'lr': 0.0003352434577453119, 'samples': 11444928, 'steps': 59608, 'loss/train': 1.9755858182907104} -08/30/2021 23:54:37 - INFO - __main__ - Step 59610: {'lr': 0.00033523846900015427, 'samples': 11445120, 'steps': 59609, 'loss/train': 1.738843321800232} -08/30/2021 23:54:37 - INFO - __main__ - Step 59611: {'lr': 0.00033523348021658947, 'samples': 11445312, 'steps': 59610, 'loss/train': 0.053249672055244446} -08/30/2021 23:54:39 - INFO - __main__ - Step 59612: {'lr': 0.00033522849139461973, 'samples': 11445504, 'steps': 59611, 'loss/train': 1.449386477470398} -08/30/2021 23:54:39 - INFO - __main__ - Step 59613: {'lr': 0.0003352235025342475, 'samples': 11445696, 'steps': 59612, 'loss/train': 0.05001894012093544} -08/30/2021 23:54:39 - INFO - __main__ - Step 59614: {'lr': 0.00033521851363547473, 'samples': 11445888, 'steps': 59613, 'loss/train': 1.0461491346359253} -08/30/2021 23:54:40 - INFO - __main__ - Step 59615: {'lr': 0.0003352135246983039, 'samples': 11446080, 'steps': 59614, 'loss/train': 1.3499770164489746} -08/30/2021 23:54:40 - INFO - __main__ - Step 59616: {'lr': 0.0003352085357227372, 'samples': 11446272, 'steps': 59615, 'loss/train': 1.6037282943725586} -08/30/2021 23:54:42 - INFO - __main__ - Step 59617: {'lr': 0.00033520354670877673, 'samples': 11446464, 'steps': 59616, 'loss/train': 0.32540133595466614} -08/30/2021 23:54:43 - INFO - __main__ - Step 59618: {'lr': 0.00033519855765642493, 'samples': 11446656, 'steps': 59617, 'loss/train': 1.161939263343811} -08/30/2021 23:54:43 - INFO - __main__ - Step 59619: {'lr': 0.00033519356856568397, 'samples': 11446848, 'steps': 59618, 'loss/train': 1.3406963348388672} -08/30/2021 23:54:43 - INFO - __main__ - Step 59620: {'lr': 0.00033518857943655607, 'samples': 11447040, 'steps': 59619, 'loss/train': 1.1450269222259521} -08/30/2021 23:54:44 - INFO - __main__ - Step 59621: {'lr': 0.00033518359026904357, 'samples': 11447232, 'steps': 59620, 'loss/train': 1.5163629055023193} -08/30/2021 23:54:45 - INFO - __main__ - Step 59622: {'lr': 0.00033517860106314863, 'samples': 11447424, 'steps': 59621, 'loss/train': 1.7235796451568604} -08/30/2021 23:54:46 - INFO - __main__ - Step 59623: {'lr': 0.00033517361181887353, 'samples': 11447616, 'steps': 59622, 'loss/train': 0.22339722514152527} -08/30/2021 23:54:46 - INFO - __main__ - Step 59624: {'lr': 0.0003351686225362205, 'samples': 11447808, 'steps': 59623, 'loss/train': 2.0765442848205566} -08/30/2021 23:54:46 - INFO - __main__ - Step 59625: {'lr': 0.00033516363321519185, 'samples': 11448000, 'steps': 59624, 'loss/train': 1.6375408172607422} -08/30/2021 23:54:47 - INFO - __main__ - Step 59626: {'lr': 0.0003351586438557897, 'samples': 11448192, 'steps': 59625, 'loss/train': 1.228614330291748} -08/30/2021 23:54:47 - INFO - __main__ - Step 59627: {'lr': 0.00033515365445801635, 'samples': 11448384, 'steps': 59626, 'loss/train': 1.0468555688858032} -08/30/2021 23:54:49 - INFO - __main__ - Step 59628: {'lr': 0.00033514866502187417, 'samples': 11448576, 'steps': 59627, 'loss/train': 1.2167309522628784} -08/30/2021 23:54:49 - INFO - __main__ - Step 59629: {'lr': 0.0003351436755473654, 'samples': 11448768, 'steps': 59628, 'loss/train': 1.053054690361023} -08/30/2021 23:54:50 - INFO - __main__ - Step 59630: {'lr': 0.00033513868603449203, 'samples': 11448960, 'steps': 59629, 'loss/train': 1.5874356031417847} -08/30/2021 23:54:50 - INFO - __main__ - Step 59631: {'lr': 0.00033513369648325653, 'samples': 11449152, 'steps': 59630, 'loss/train': 0.7195480465888977} -08/30/2021 23:54:50 - INFO - __main__ - Step 59632: {'lr': 0.00033512870689366114, 'samples': 11449344, 'steps': 59631, 'loss/train': 1.3263505697250366} -08/30/2021 23:54:52 - INFO - __main__ - Step 59633: {'lr': 0.0003351237172657081, 'samples': 11449536, 'steps': 59632, 'loss/train': 1.3192288875579834} -08/30/2021 23:54:52 - INFO - __main__ - Step 59634: {'lr': 0.00033511872759939954, 'samples': 11449728, 'steps': 59633, 'loss/train': 1.0848983526229858} -08/30/2021 23:54:52 - INFO - __main__ - Step 59635: {'lr': 0.0003351137378947378, 'samples': 11449920, 'steps': 59634, 'loss/train': 2.0865628719329834} -08/30/2021 23:54:53 - INFO - __main__ - Step 59636: {'lr': 0.00033510874815172523, 'samples': 11450112, 'steps': 59635, 'loss/train': 1.2444217205047607} -08/30/2021 23:54:53 - INFO - __main__ - Step 59637: {'lr': 0.00033510375837036386, 'samples': 11450304, 'steps': 59636, 'loss/train': 1.2617526054382324} -08/30/2021 23:54:55 - INFO - __main__ - Step 59638: {'lr': 0.0003350987685506561, 'samples': 11450496, 'steps': 59637, 'loss/train': 1.1474472284317017} -08/30/2021 23:54:55 - INFO - __main__ - Step 59639: {'lr': 0.0003350937786926041, 'samples': 11450688, 'steps': 59638, 'loss/train': 0.5737676024436951} -08/30/2021 23:54:55 - INFO - __main__ - Step 59640: {'lr': 0.0003350887887962102, 'samples': 11450880, 'steps': 59639, 'loss/train': 1.4543455839157104} -08/30/2021 23:54:56 - INFO - __main__ - Step 59641: {'lr': 0.00033508379886147655, 'samples': 11451072, 'steps': 59640, 'loss/train': 1.3561283349990845} -08/30/2021 23:54:56 - INFO - __main__ - Step 59642: {'lr': 0.00033507880888840547, 'samples': 11451264, 'steps': 59641, 'loss/train': 1.263848066329956} -08/30/2021 23:54:58 - INFO - __main__ - Step 59643: {'lr': 0.00033507381887699927, 'samples': 11451456, 'steps': 59642, 'loss/train': 1.8754993677139282} -08/30/2021 23:54:58 - INFO - __main__ - Step 59644: {'lr': 0.0003350688288272601, 'samples': 11451648, 'steps': 59643, 'loss/train': 2.172424077987671} -08/30/2021 23:54:59 - INFO - __main__ - Step 59645: {'lr': 0.00033506383873919016, 'samples': 11451840, 'steps': 59644, 'loss/train': 2.2921624183654785} -08/30/2021 23:54:59 - INFO - __main__ - Step 59646: {'lr': 0.0003350588486127918, 'samples': 11452032, 'steps': 59645, 'loss/train': 1.8611721992492676} -08/30/2021 23:54:59 - INFO - __main__ - Step 59647: {'lr': 0.0003350538584480672, 'samples': 11452224, 'steps': 59646, 'loss/train': 1.0862886905670166} -08/30/2021 23:55:01 - INFO - __main__ - Step 59648: {'lr': 0.0003350488682450187, 'samples': 11452416, 'steps': 59647, 'loss/train': 1.4954073429107666} -08/30/2021 23:55:01 - INFO - __main__ - Step 59649: {'lr': 0.00033504387800364856, 'samples': 11452608, 'steps': 59648, 'loss/train': 1.7261111736297607} -08/30/2021 23:55:02 - INFO - __main__ - Step 59650: {'lr': 0.00033503888772395886, 'samples': 11452800, 'steps': 59649, 'loss/train': 1.1935325860977173} -08/30/2021 23:55:02 - INFO - __main__ - Step 59651: {'lr': 0.0003350338974059519, 'samples': 11452992, 'steps': 59650, 'loss/train': 1.6750245094299316} -08/30/2021 23:55:02 - INFO - __main__ - Step 59652: {'lr': 0.0003350289070496301, 'samples': 11453184, 'steps': 59651, 'loss/train': 1.7220368385314941} -08/30/2021 23:55:04 - INFO - __main__ - Step 59653: {'lr': 0.0003350239166549955, 'samples': 11453376, 'steps': 59652, 'loss/train': 1.2379019260406494} -08/30/2021 23:55:04 - INFO - __main__ - Step 59654: {'lr': 0.0003350189262220504, 'samples': 11453568, 'steps': 59653, 'loss/train': 1.7653824090957642} -08/30/2021 23:55:05 - INFO - __main__ - Step 59655: {'lr': 0.0003350139357507972, 'samples': 11453760, 'steps': 59654, 'loss/train': 1.6006726026535034} -08/30/2021 23:55:05 - INFO - __main__ - Step 59656: {'lr': 0.00033500894524123796, 'samples': 11453952, 'steps': 59655, 'loss/train': 1.2506486177444458} -08/30/2021 23:55:05 - INFO - __main__ - Step 59657: {'lr': 0.0003350039546933751, 'samples': 11454144, 'steps': 59656, 'loss/train': 0.8107120394706726} -08/30/2021 23:55:06 - INFO - __main__ - Step 59658: {'lr': 0.00033499896410721066, 'samples': 11454336, 'steps': 59657, 'loss/train': 1.5907068252563477} -08/30/2021 23:55:07 - INFO - __main__ - Step 59659: {'lr': 0.000334993973482747, 'samples': 11454528, 'steps': 59658, 'loss/train': 1.9400674104690552} -08/30/2021 23:55:08 - INFO - __main__ - Step 59660: {'lr': 0.0003349889828199864, 'samples': 11454720, 'steps': 59659, 'loss/train': 1.310667634010315} -08/30/2021 23:55:08 - INFO - __main__ - Step 59661: {'lr': 0.000334983992118931, 'samples': 11454912, 'steps': 59660, 'loss/train': 0.6708696484565735} -08/30/2021 23:55:08 - INFO - __main__ - Step 59662: {'lr': 0.00033497900137958325, 'samples': 11455104, 'steps': 59661, 'loss/train': 1.6113548278808594} -08/30/2021 23:55:09 - INFO - __main__ - Step 59663: {'lr': 0.00033497401060194525, 'samples': 11455296, 'steps': 59662, 'loss/train': 1.5807186365127563} -08/30/2021 23:55:10 - INFO - __main__ - Step 59664: {'lr': 0.00033496901978601924, 'samples': 11455488, 'steps': 59663, 'loss/train': 1.902320384979248} -08/30/2021 23:55:11 - INFO - __main__ - Step 59665: {'lr': 0.0003349640289318075, 'samples': 11455680, 'steps': 59664, 'loss/train': 1.3955453634262085} -08/30/2021 23:55:11 - INFO - __main__ - Step 59666: {'lr': 0.0003349590380393123, 'samples': 11455872, 'steps': 59665, 'loss/train': 1.8161306381225586} -08/30/2021 23:55:12 - INFO - __main__ - Step 59667: {'lr': 0.0003349540471085358, 'samples': 11456064, 'steps': 59666, 'loss/train': 1.3871043920516968} -08/30/2021 23:55:12 - INFO - __main__ - Step 59668: {'lr': 0.00033494905613948035, 'samples': 11456256, 'steps': 59667, 'loss/train': 1.646823525428772} -08/30/2021 23:55:14 - INFO - __main__ - Step 59669: {'lr': 0.00033494406513214826, 'samples': 11456448, 'steps': 59668, 'loss/train': 1.4401887655258179} -08/30/2021 23:55:15 - INFO - __main__ - Step 59670: {'lr': 0.0003349390740865416, 'samples': 11456640, 'steps': 59669, 'loss/train': 1.7677853107452393} -08/30/2021 23:55:15 - INFO - __main__ - Step 59671: {'lr': 0.0003349340830026627, 'samples': 11456832, 'steps': 59670, 'loss/train': 0.047431644052267075} -08/30/2021 23:55:16 - INFO - __main__ - Step 59672: {'lr': 0.0003349290918805138, 'samples': 11457024, 'steps': 59671, 'loss/train': 0.036663372069597244} -08/30/2021 23:55:16 - INFO - __main__ - Step 59673: {'lr': 0.0003349241007200972, 'samples': 11457216, 'steps': 59672, 'loss/train': 1.2027740478515625} -08/30/2021 23:55:16 - INFO - __main__ - Step 59674: {'lr': 0.0003349191095214151, 'samples': 11457408, 'steps': 59673, 'loss/train': 1.6536368131637573} -08/30/2021 23:55:18 - INFO - __main__ - Step 59675: {'lr': 0.00033491411828446974, 'samples': 11457600, 'steps': 59674, 'loss/train': 0.9581016302108765} -08/30/2021 23:55:18 - INFO - __main__ - Step 59676: {'lr': 0.00033490912700926345, 'samples': 11457792, 'steps': 59675, 'loss/train': 2.5357964038848877} -08/30/2021 23:55:19 - INFO - __main__ - Step 59677: {'lr': 0.00033490413569579837, 'samples': 11457984, 'steps': 59676, 'loss/train': 1.1402490139007568} -08/30/2021 23:55:19 - INFO - __main__ - Step 59678: {'lr': 0.00033489914434407683, 'samples': 11458176, 'steps': 59677, 'loss/train': 1.1416606903076172} -08/30/2021 23:55:19 - INFO - __main__ - Step 59679: {'lr': 0.00033489415295410096, 'samples': 11458368, 'steps': 59678, 'loss/train': 2.04219126701355} -08/30/2021 23:55:21 - INFO - __main__ - Step 59680: {'lr': 0.0003348891615258732, 'samples': 11458560, 'steps': 59679, 'loss/train': 1.275970697402954} -08/30/2021 23:55:21 - INFO - __main__ - Step 59681: {'lr': 0.0003348841700593956, 'samples': 11458752, 'steps': 59680, 'loss/train': 0.6447604298591614} -08/30/2021 23:55:22 - INFO - __main__ - Step 59682: {'lr': 0.00033487917855467056, 'samples': 11458944, 'steps': 59681, 'loss/train': 1.9180761575698853} -08/30/2021 23:55:22 - INFO - __main__ - Step 59683: {'lr': 0.0003348741870117003, 'samples': 11459136, 'steps': 59682, 'loss/train': 1.2197058200836182} -08/30/2021 23:55:22 - INFO - __main__ - Step 59684: {'lr': 0.000334869195430487, 'samples': 11459328, 'steps': 59683, 'loss/train': 1.4845428466796875} -08/30/2021 23:55:23 - INFO - __main__ - Step 59685: {'lr': 0.0003348642038110329, 'samples': 11459520, 'steps': 59684, 'loss/train': 0.928158700466156} -08/30/2021 23:55:24 - INFO - __main__ - Step 59686: {'lr': 0.0003348592121533404, 'samples': 11459712, 'steps': 59685, 'loss/train': 1.0008618831634521} -08/30/2021 23:55:25 - INFO - __main__ - Step 59687: {'lr': 0.00033485422045741154, 'samples': 11459904, 'steps': 59686, 'loss/train': 0.965795636177063} -08/30/2021 23:55:25 - INFO - __main__ - Step 59688: {'lr': 0.00033484922872324875, 'samples': 11460096, 'steps': 59687, 'loss/train': 1.744931697845459} -08/30/2021 23:55:26 - INFO - __main__ - Step 59689: {'lr': 0.0003348442369508542, 'samples': 11460288, 'steps': 59688, 'loss/train': 1.3161970376968384} -08/30/2021 23:55:26 - INFO - __main__ - Step 59690: {'lr': 0.0003348392451402302, 'samples': 11460480, 'steps': 59689, 'loss/train': 1.1430429220199585} -08/30/2021 23:55:27 - INFO - __main__ - Step 59691: {'lr': 0.00033483425329137886, 'samples': 11460672, 'steps': 59690, 'loss/train': 1.626570463180542} -08/30/2021 23:55:28 - INFO - __main__ - Step 59692: {'lr': 0.00033482926140430253, 'samples': 11460864, 'steps': 59691, 'loss/train': 1.1314787864685059} -08/30/2021 23:55:28 - INFO - __main__ - Step 59693: {'lr': 0.00033482426947900346, 'samples': 11461056, 'steps': 59692, 'loss/train': 0.9415705800056458} -08/30/2021 23:55:29 - INFO - __main__ - Step 59694: {'lr': 0.0003348192775154839, 'samples': 11461248, 'steps': 59693, 'loss/train': 1.9621731042861938} -08/30/2021 23:55:29 - INFO - __main__ - Step 59695: {'lr': 0.000334814285513746, 'samples': 11461440, 'steps': 59694, 'loss/train': 1.3592627048492432} -08/30/2021 23:55:31 - INFO - __main__ - Step 59696: {'lr': 0.0003348092934737922, 'samples': 11461632, 'steps': 59695, 'loss/train': 1.2920070886611938} -08/30/2021 23:55:31 - INFO - __main__ - Step 59697: {'lr': 0.00033480430139562456, 'samples': 11461824, 'steps': 59696, 'loss/train': 1.2732104063034058} -08/30/2021 23:55:31 - INFO - __main__ - Step 59698: {'lr': 0.00033479930927924543, 'samples': 11462016, 'steps': 59697, 'loss/train': 1.5100641250610352} -08/30/2021 23:55:32 - INFO - __main__ - Step 59699: {'lr': 0.000334794317124657, 'samples': 11462208, 'steps': 59698, 'loss/train': 1.5801640748977661} -08/30/2021 23:55:32 - INFO - __main__ - Step 59700: {'lr': 0.00033478932493186163, 'samples': 11462400, 'steps': 59699, 'loss/train': 0.9741455316543579} -08/30/2021 23:55:34 - INFO - __main__ - Step 59701: {'lr': 0.0003347843327008615, 'samples': 11462592, 'steps': 59700, 'loss/train': 1.263201355934143} -08/30/2021 23:55:34 - INFO - __main__ - Step 59702: {'lr': 0.0003347793404316589, 'samples': 11462784, 'steps': 59701, 'loss/train': 1.4084205627441406} -08/30/2021 23:55:34 - INFO - __main__ - Step 59703: {'lr': 0.00033477434812425596, 'samples': 11462976, 'steps': 59702, 'loss/train': 1.3989253044128418} -08/30/2021 23:55:35 - INFO - __main__ - Step 59704: {'lr': 0.00033476935577865497, 'samples': 11463168, 'steps': 59703, 'loss/train': 1.5004475116729736} -08/30/2021 23:55:35 - INFO - __main__ - Step 59705: {'lr': 0.0003347643633948583, 'samples': 11463360, 'steps': 59704, 'loss/train': 1.8358335494995117} -08/30/2021 23:55:37 - INFO - __main__ - Step 59706: {'lr': 0.00033475937097286805, 'samples': 11463552, 'steps': 59705, 'loss/train': 1.3572688102722168} -08/30/2021 23:55:37 - INFO - __main__ - Step 59707: {'lr': 0.00033475437851268657, 'samples': 11463744, 'steps': 59706, 'loss/train': 1.1815388202667236} -08/30/2021 23:55:38 - INFO - __main__ - Step 59708: {'lr': 0.0003347493860143161, 'samples': 11463936, 'steps': 59707, 'loss/train': 0.8684139847755432} -08/30/2021 23:55:38 - INFO - __main__ - Step 59709: {'lr': 0.0003347443934777589, 'samples': 11464128, 'steps': 59708, 'loss/train': 1.5310202836990356} -08/30/2021 23:55:38 - INFO - __main__ - Step 59710: {'lr': 0.0003347394009030171, 'samples': 11464320, 'steps': 59709, 'loss/train': 0.36027631163597107} -08/30/2021 23:55:39 - INFO - __main__ - Step 59711: {'lr': 0.00033473440829009303, 'samples': 11464512, 'steps': 59710, 'loss/train': 1.3714977502822876} -08/30/2021 23:55:40 - INFO - __main__ - Step 59712: {'lr': 0.00033472941563898897, 'samples': 11464704, 'steps': 59711, 'loss/train': 0.7579142451286316} -08/30/2021 23:55:41 - INFO - __main__ - Step 59713: {'lr': 0.00033472442294970716, 'samples': 11464896, 'steps': 59712, 'loss/train': 0.32478347420692444} -08/30/2021 23:55:41 - INFO - __main__ - Step 59714: {'lr': 0.00033471943022224984, 'samples': 11465088, 'steps': 59713, 'loss/train': 0.04143539443612099} -08/30/2021 23:55:42 - INFO - __main__ - Step 59715: {'lr': 0.0003347144374566192, 'samples': 11465280, 'steps': 59714, 'loss/train': 0.5237289071083069} -08/30/2021 23:55:42 - INFO - __main__ - Step 59716: {'lr': 0.00033470944465281753, 'samples': 11465472, 'steps': 59715, 'loss/train': 1.9920235872268677} -08/30/2021 23:55:44 - INFO - __main__ - Step 59717: {'lr': 0.00033470445181084716, 'samples': 11465664, 'steps': 59716, 'loss/train': 1.4423717260360718} -08/30/2021 23:55:44 - INFO - __main__ - Step 59718: {'lr': 0.0003346994589307102, 'samples': 11465856, 'steps': 59717, 'loss/train': 1.4636828899383545} -08/30/2021 23:55:44 - INFO - __main__ - Step 59719: {'lr': 0.00033469446601240907, 'samples': 11466048, 'steps': 59718, 'loss/train': 1.0583508014678955} -08/30/2021 23:55:45 - INFO - __main__ - Step 59720: {'lr': 0.00033468947305594586, 'samples': 11466240, 'steps': 59719, 'loss/train': 1.0116227865219116} -08/30/2021 23:55:45 - INFO - __main__ - Step 59721: {'lr': 0.0003346844800613229, 'samples': 11466432, 'steps': 59720, 'loss/train': 1.2756251096725464} -08/30/2021 23:55:46 - INFO - __main__ - Step 59722: {'lr': 0.00033467948702854233, 'samples': 11466624, 'steps': 59721, 'loss/train': 1.3189589977264404} -08/30/2021 23:55:47 - INFO - __main__ - Step 59723: {'lr': 0.00033467449395760656, 'samples': 11466816, 'steps': 59722, 'loss/train': 1.0390872955322266} -08/30/2021 23:55:47 - INFO - __main__ - Step 59724: {'lr': 0.0003346695008485179, 'samples': 11467008, 'steps': 59723, 'loss/train': 1.437348484992981} -08/30/2021 23:55:48 - INFO - __main__ - Step 59725: {'lr': 0.00033466450770127824, 'samples': 11467200, 'steps': 59724, 'loss/train': 1.2895927429199219} -08/30/2021 23:55:48 - INFO - __main__ - Step 59726: {'lr': 0.0003346595145158902, 'samples': 11467392, 'steps': 59725, 'loss/train': 1.1519036293029785} -08/30/2021 23:55:50 - INFO - __main__ - Step 59727: {'lr': 0.00033465452129235584, 'samples': 11467584, 'steps': 59726, 'loss/train': 1.6210496425628662} -08/30/2021 23:55:51 - INFO - __main__ - Step 59728: {'lr': 0.00033464952803067746, 'samples': 11467776, 'steps': 59727, 'loss/train': 1.3351916074752808} -08/30/2021 23:55:51 - INFO - __main__ - Step 59729: {'lr': 0.0003346445347308573, 'samples': 11467968, 'steps': 59728, 'loss/train': 1.0022586584091187} -08/30/2021 23:55:51 - INFO - __main__ - Step 59730: {'lr': 0.0003346395413928977, 'samples': 11468160, 'steps': 59729, 'loss/train': 0.0895194411277771} -08/30/2021 23:55:52 - INFO - __main__ - Step 59731: {'lr': 0.0003346345480168007, 'samples': 11468352, 'steps': 59730, 'loss/train': 1.2002934217453003} -08/30/2021 23:55:52 - INFO - __main__ - Step 59732: {'lr': 0.00033462955460256876, 'samples': 11468544, 'steps': 59731, 'loss/train': 1.5982295274734497} -08/30/2021 23:55:53 - INFO - __main__ - Step 59733: {'lr': 0.00033462456115020405, 'samples': 11468736, 'steps': 59732, 'loss/train': 1.6238337755203247} -08/30/2021 23:55:54 - INFO - __main__ - Step 59734: {'lr': 0.0003346195676597088, 'samples': 11468928, 'steps': 59733, 'loss/train': 1.6143372058868408} -08/30/2021 23:55:54 - INFO - __main__ - Step 59735: {'lr': 0.00033461457413108524, 'samples': 11469120, 'steps': 59734, 'loss/train': 1.692519187927246} -08/30/2021 23:55:55 - INFO - __main__ - Step 59736: {'lr': 0.00033460958056433574, 'samples': 11469312, 'steps': 59735, 'loss/train': 0.8821504712104797} -08/30/2021 23:55:55 - INFO - __main__ - Step 59737: {'lr': 0.00033460458695946244, 'samples': 11469504, 'steps': 59736, 'loss/train': 1.8254777193069458} -08/30/2021 23:55:57 - INFO - __main__ - Step 59738: {'lr': 0.0003345995933164676, 'samples': 11469696, 'steps': 59737, 'loss/train': 1.6471219062805176} -08/30/2021 23:55:57 - INFO - __main__ - Step 59739: {'lr': 0.0003345945996353535, 'samples': 11469888, 'steps': 59738, 'loss/train': 1.2928080558776855} -08/30/2021 23:55:57 - INFO - __main__ - Step 59740: {'lr': 0.0003345896059161224, 'samples': 11470080, 'steps': 59739, 'loss/train': 0.8101669549942017} -08/30/2021 23:55:58 - INFO - __main__ - Step 59741: {'lr': 0.00033458461215877644, 'samples': 11470272, 'steps': 59740, 'loss/train': 1.3493016958236694} -08/30/2021 23:55:58 - INFO - __main__ - Step 59742: {'lr': 0.000334579618363318, 'samples': 11470464, 'steps': 59741, 'loss/train': 1.7585716247558594} -08/30/2021 23:55:59 - INFO - __main__ - Step 59743: {'lr': 0.0003345746245297494, 'samples': 11470656, 'steps': 59742, 'loss/train': 0.2537163496017456} -08/30/2021 23:56:00 - INFO - __main__ - Step 59744: {'lr': 0.00033456963065807264, 'samples': 11470848, 'steps': 59743, 'loss/train': 1.1767010688781738} -08/30/2021 23:56:00 - INFO - __main__ - Step 59745: {'lr': 0.0003345646367482902, 'samples': 11471040, 'steps': 59744, 'loss/train': 1.826465368270874} -08/30/2021 23:56:01 - INFO - __main__ - Step 59746: {'lr': 0.00033455964280040417, 'samples': 11471232, 'steps': 59745, 'loss/train': 1.0680867433547974} -08/30/2021 23:56:01 - INFO - __main__ - Step 59747: {'lr': 0.0003345546488144169, 'samples': 11471424, 'steps': 59746, 'loss/train': 1.2335466146469116} -08/30/2021 23:56:03 - INFO - __main__ - Step 59748: {'lr': 0.0003345496547903306, 'samples': 11471616, 'steps': 59747, 'loss/train': 1.3852471113204956} -08/30/2021 23:56:03 - INFO - __main__ - Step 59749: {'lr': 0.0003345446607281475, 'samples': 11471808, 'steps': 59748, 'loss/train': 1.362723469734192} -08/30/2021 23:56:03 - INFO - __main__ - Step 59750: {'lr': 0.00033453966662786995, 'samples': 11472000, 'steps': 59749, 'loss/train': 1.731467604637146} -08/30/2021 23:56:04 - INFO - __main__ - Step 59751: {'lr': 0.0003345346724895001, 'samples': 11472192, 'steps': 59750, 'loss/train': 0.04695221409201622} -08/30/2021 23:56:04 - INFO - __main__ - Step 59752: {'lr': 0.0003345296783130402, 'samples': 11472384, 'steps': 59751, 'loss/train': 0.7827739715576172} -08/30/2021 23:56:06 - INFO - __main__ - Step 59753: {'lr': 0.0003345246840984926, 'samples': 11472576, 'steps': 59752, 'loss/train': 1.3239326477050781} -08/30/2021 23:56:06 - INFO - __main__ - Step 59754: {'lr': 0.0003345196898458594, 'samples': 11472768, 'steps': 59753, 'loss/train': 0.9566469192504883} -08/30/2021 23:56:07 - INFO - __main__ - Step 59755: {'lr': 0.00033451469555514294, 'samples': 11472960, 'steps': 59754, 'loss/train': 1.815759301185608} -08/30/2021 23:56:07 - INFO - __main__ - Step 59756: {'lr': 0.0003345097012263456, 'samples': 11473152, 'steps': 59755, 'loss/train': 1.2994920015335083} -08/30/2021 23:56:07 - INFO - __main__ - Step 59757: {'lr': 0.0003345047068594694, 'samples': 11473344, 'steps': 59756, 'loss/train': 1.2464489936828613} -08/30/2021 23:56:08 - INFO - __main__ - Step 59758: {'lr': 0.0003344997124545166, 'samples': 11473536, 'steps': 59757, 'loss/train': 0.05283069238066673} -08/30/2021 23:56:09 - INFO - __main__ - Step 59759: {'lr': 0.00033449471801148963, 'samples': 11473728, 'steps': 59758, 'loss/train': 2.0384433269500732} -08/30/2021 23:56:10 - INFO - __main__ - Step 59760: {'lr': 0.00033448972353039065, 'samples': 11473920, 'steps': 59759, 'loss/train': 1.4910094738006592} -08/30/2021 23:56:10 - INFO - __main__ - Step 59761: {'lr': 0.00033448472901122185, 'samples': 11474112, 'steps': 59760, 'loss/train': 1.7265764474868774} -08/30/2021 23:56:10 - INFO - __main__ - Step 59762: {'lr': 0.0003344797344539855, 'samples': 11474304, 'steps': 59761, 'loss/train': 1.7909163236618042} -08/30/2021 23:56:11 - INFO - __main__ - Step 59763: {'lr': 0.000334474739858684, 'samples': 11474496, 'steps': 59762, 'loss/train': 1.116208791732788} -08/30/2021 23:56:12 - INFO - __main__ - Step 59764: {'lr': 0.0003344697452253195, 'samples': 11474688, 'steps': 59763, 'loss/train': 1.0572972297668457} -08/30/2021 23:56:13 - INFO - __main__ - Step 59765: {'lr': 0.00033446475055389413, 'samples': 11474880, 'steps': 59764, 'loss/train': 1.1873688697814941} -08/30/2021 23:56:13 - INFO - __main__ - Step 59766: {'lr': 0.00033445975584441023, 'samples': 11475072, 'steps': 59765, 'loss/train': 1.6671496629714966} -08/30/2021 23:56:14 - INFO - __main__ - Step 59767: {'lr': 0.00033445476109687013, 'samples': 11475264, 'steps': 59766, 'loss/train': 1.2718393802642822} -08/30/2021 23:56:14 - INFO - __main__ - Step 59768: {'lr': 0.000334449766311276, 'samples': 11475456, 'steps': 59767, 'loss/train': 1.464003086090088} -08/30/2021 23:56:15 - INFO - __main__ - Step 59769: {'lr': 0.00033444477148763006, 'samples': 11475648, 'steps': 59768, 'loss/train': 0.8690761923789978} -08/30/2021 23:56:16 - INFO - __main__ - Step 59770: {'lr': 0.0003344397766259348, 'samples': 11475840, 'steps': 59769, 'loss/train': 1.0399092435836792} -08/30/2021 23:56:16 - INFO - __main__ - Step 59771: {'lr': 0.0003344347817261921, 'samples': 11476032, 'steps': 59770, 'loss/train': 1.2288081645965576} -08/30/2021 23:56:17 - INFO - __main__ - Step 59772: {'lr': 0.0003344297867884044, 'samples': 11476224, 'steps': 59771, 'loss/train': 1.487261414527893} -08/30/2021 23:56:17 - INFO - __main__ - Step 59773: {'lr': 0.000334424791812574, 'samples': 11476416, 'steps': 59772, 'loss/train': 1.0129410028457642} -08/30/2021 23:56:18 - INFO - __main__ - Step 59774: {'lr': 0.00033441979679870305, 'samples': 11476608, 'steps': 59773, 'loss/train': 1.3561673164367676} -08/30/2021 23:56:19 - INFO - __main__ - Step 59775: {'lr': 0.00033441480174679385, 'samples': 11476800, 'steps': 59774, 'loss/train': 1.1367835998535156} -08/30/2021 23:56:19 - INFO - __main__ - Step 59776: {'lr': 0.00033440980665684866, 'samples': 11476992, 'steps': 59775, 'loss/train': 1.3179066181182861} -08/30/2021 23:56:20 - INFO - __main__ - Step 59777: {'lr': 0.00033440481152886977, 'samples': 11477184, 'steps': 59776, 'loss/train': 0.6363301277160645} -08/30/2021 23:56:20 - INFO - __main__ - Step 59778: {'lr': 0.00033439981636285935, 'samples': 11477376, 'steps': 59777, 'loss/train': 0.5855116844177246} -08/30/2021 23:56:22 - INFO - __main__ - Step 59779: {'lr': 0.0003343948211588196, 'samples': 11477568, 'steps': 59778, 'loss/train': 1.2617617845535278} -08/30/2021 23:56:22 - INFO - __main__ - Step 59780: {'lr': 0.00033438982591675284, 'samples': 11477760, 'steps': 59779, 'loss/train': 0.06369766592979431} -08/30/2021 23:56:23 - INFO - __main__ - Step 59781: {'lr': 0.00033438483063666136, 'samples': 11477952, 'steps': 59780, 'loss/train': 1.5154879093170166} -08/30/2021 23:56:23 - INFO - __main__ - Step 59782: {'lr': 0.0003343798353185474, 'samples': 11478144, 'steps': 59781, 'loss/train': 1.9766372442245483} -08/30/2021 23:56:24 - INFO - __main__ - Step 59783: {'lr': 0.0003343748399624131, 'samples': 11478336, 'steps': 59782, 'loss/train': 1.3903272151947021} -08/30/2021 23:56:25 - INFO - __main__ - Step 59784: {'lr': 0.00033436984456826097, 'samples': 11478528, 'steps': 59783, 'loss/train': 1.8117170333862305} -08/30/2021 23:56:25 - INFO - __main__ - Step 59785: {'lr': 0.000334364849136093, 'samples': 11478720, 'steps': 59784, 'loss/train': 1.3325172662734985} -08/30/2021 23:56:26 - INFO - __main__ - Step 59786: {'lr': 0.0003343598536659115, 'samples': 11478912, 'steps': 59785, 'loss/train': 1.488703966140747} -08/30/2021 23:56:26 - INFO - __main__ - Step 59787: {'lr': 0.00033435485815771875, 'samples': 11479104, 'steps': 59786, 'loss/train': 1.30879807472229} -08/30/2021 23:56:27 - INFO - __main__ - Step 59788: {'lr': 0.00033434986261151705, 'samples': 11479296, 'steps': 59787, 'loss/train': 0.7776273488998413} -08/30/2021 23:56:28 - INFO - __main__ - Step 59789: {'lr': 0.0003343448670273086, 'samples': 11479488, 'steps': 59788, 'loss/train': 1.7939506769180298} -08/30/2021 23:56:28 - INFO - __main__ - Step 59790: {'lr': 0.00033433987140509566, 'samples': 11479680, 'steps': 59789, 'loss/train': 1.5992141962051392} -08/30/2021 23:56:29 - INFO - __main__ - Step 59791: {'lr': 0.0003343348757448804, 'samples': 11479872, 'steps': 59790, 'loss/train': 1.2350643873214722} -08/30/2021 23:56:29 - INFO - __main__ - Step 59792: {'lr': 0.0003343298800466652, 'samples': 11480064, 'steps': 59791, 'loss/train': 0.997530460357666} -08/30/2021 23:56:29 - INFO - __main__ - Step 59793: {'lr': 0.0003343248843104523, 'samples': 11480256, 'steps': 59792, 'loss/train': 1.1343399286270142} -08/30/2021 23:56:31 - INFO - __main__ - Step 59794: {'lr': 0.00033431988853624384, 'samples': 11480448, 'steps': 59793, 'loss/train': 1.1660022735595703} -08/30/2021 23:56:31 - INFO - __main__ - Step 59795: {'lr': 0.00033431489272404215, 'samples': 11480640, 'steps': 59794, 'loss/train': 1.2844220399856567} -08/30/2021 23:56:32 - INFO - __main__ - Step 59796: {'lr': 0.0003343098968738495, 'samples': 11480832, 'steps': 59795, 'loss/train': 0.9138148427009583} -08/30/2021 23:56:32 - INFO - __main__ - Step 59797: {'lr': 0.00033430490098566813, 'samples': 11481024, 'steps': 59796, 'loss/train': 1.4196208715438843} -08/30/2021 23:56:32 - INFO - __main__ - Step 59798: {'lr': 0.00033429990505950025, 'samples': 11481216, 'steps': 59797, 'loss/train': 1.470782995223999} -08/30/2021 23:56:33 - INFO - __main__ - Step 59799: {'lr': 0.0003342949090953481, 'samples': 11481408, 'steps': 59798, 'loss/train': 1.1563445329666138} -08/30/2021 23:56:35 - INFO - __main__ - Step 59800: {'lr': 0.000334289913093214, 'samples': 11481600, 'steps': 59799, 'loss/train': 0.7588146924972534} -08/30/2021 23:56:35 - INFO - __main__ - Step 59801: {'lr': 0.0003342849170531001, 'samples': 11481792, 'steps': 59800, 'loss/train': 1.3940439224243164} -08/30/2021 23:56:35 - INFO - __main__ - Step 59802: {'lr': 0.00033427992097500876, 'samples': 11481984, 'steps': 59801, 'loss/train': 1.6214178800582886} -08/30/2021 23:56:36 - INFO - __main__ - Step 59803: {'lr': 0.00033427492485894216, 'samples': 11482176, 'steps': 59802, 'loss/train': 1.1407142877578735} -08/30/2021 23:56:36 - INFO - __main__ - Step 59804: {'lr': 0.0003342699287049027, 'samples': 11482368, 'steps': 59803, 'loss/train': 1.1118789911270142} -08/30/2021 23:56:37 - INFO - __main__ - Step 59805: {'lr': 0.0003342649325128924, 'samples': 11482560, 'steps': 59804, 'loss/train': 1.1539078950881958} -08/30/2021 23:56:38 - INFO - __main__ - Step 59806: {'lr': 0.00033425993628291367, 'samples': 11482752, 'steps': 59805, 'loss/train': 0.8938167095184326} -08/30/2021 23:56:38 - INFO - __main__ - Step 59807: {'lr': 0.0003342549400149687, 'samples': 11482944, 'steps': 59806, 'loss/train': 1.771031141281128} -08/30/2021 23:56:39 - INFO - __main__ - Step 59808: {'lr': 0.0003342499437090597, 'samples': 11483136, 'steps': 59807, 'loss/train': 1.3330076932907104} -08/30/2021 23:56:39 - INFO - __main__ - Step 59809: {'lr': 0.000334244947365189, 'samples': 11483328, 'steps': 59808, 'loss/train': 1.23978853225708} -08/30/2021 23:56:40 - INFO - __main__ - Step 59810: {'lr': 0.00033423995098335886, 'samples': 11483520, 'steps': 59809, 'loss/train': 1.120497226715088} -08/30/2021 23:56:41 - INFO - __main__ - Step 59811: {'lr': 0.00033423495456357156, 'samples': 11483712, 'steps': 59810, 'loss/train': 1.323451280593872} -08/30/2021 23:56:41 - INFO - __main__ - Step 59812: {'lr': 0.00033422995810582917, 'samples': 11483904, 'steps': 59811, 'loss/train': 1.096530795097351} -08/30/2021 23:56:42 - INFO - __main__ - Step 59813: {'lr': 0.0003342249616101341, 'samples': 11484096, 'steps': 59812, 'loss/train': 1.330569863319397} -08/30/2021 23:56:42 - INFO - __main__ - Step 59814: {'lr': 0.0003342199650764886, 'samples': 11484288, 'steps': 59813, 'loss/train': 1.453934669494629} -08/30/2021 23:56:44 - INFO - __main__ - Step 59815: {'lr': 0.0003342149685048949, 'samples': 11484480, 'steps': 59814, 'loss/train': 1.1754119396209717} -08/30/2021 23:56:44 - INFO - __main__ - Step 59816: {'lr': 0.0003342099718953551, 'samples': 11484672, 'steps': 59815, 'loss/train': 1.1980715990066528} -08/30/2021 23:56:44 - INFO - __main__ - Step 59817: {'lr': 0.00033420497524787177, 'samples': 11484864, 'steps': 59816, 'loss/train': 1.5578720569610596} -08/30/2021 23:56:45 - INFO - __main__ - Step 59818: {'lr': 0.0003341999785624468, 'samples': 11485056, 'steps': 59817, 'loss/train': 0.9726073145866394} -08/30/2021 23:56:45 - INFO - __main__ - Step 59819: {'lr': 0.0003341949818390827, 'samples': 11485248, 'steps': 59818, 'loss/train': 1.4954408407211304} -08/30/2021 23:56:45 - INFO - __main__ - Step 59820: {'lr': 0.00033418998507778164, 'samples': 11485440, 'steps': 59819, 'loss/train': 1.964455246925354} -08/30/2021 23:56:47 - INFO - __main__ - Step 59821: {'lr': 0.00033418498827854587, 'samples': 11485632, 'steps': 59820, 'loss/train': 0.9344597458839417} -08/30/2021 23:56:47 - INFO - __main__ - Step 59822: {'lr': 0.0003341799914413776, 'samples': 11485824, 'steps': 59821, 'loss/train': 1.8223085403442383} -08/30/2021 23:56:48 - INFO - __main__ - Step 59823: {'lr': 0.0003341749945662792, 'samples': 11486016, 'steps': 59822, 'loss/train': 1.943886160850525} -08/30/2021 23:56:48 - INFO - __main__ - Step 59824: {'lr': 0.00033416999765325286, 'samples': 11486208, 'steps': 59823, 'loss/train': 1.70814847946167} -08/30/2021 23:56:48 - INFO - __main__ - Step 59825: {'lr': 0.0003341650007023008, 'samples': 11486400, 'steps': 59824, 'loss/train': 0.05768867954611778} -08/30/2021 23:56:50 - INFO - __main__ - Step 59826: {'lr': 0.0003341600037134252, 'samples': 11486592, 'steps': 59825, 'loss/train': 1.1454423666000366} -08/30/2021 23:56:50 - INFO - __main__ - Step 59827: {'lr': 0.00033415500668662845, 'samples': 11486784, 'steps': 59826, 'loss/train': 1.0220969915390015} -08/30/2021 23:56:51 - INFO - __main__ - Step 59828: {'lr': 0.00033415000962191277, 'samples': 11486976, 'steps': 59827, 'loss/train': 1.5042085647583008} -08/30/2021 23:56:51 - INFO - __main__ - Step 59829: {'lr': 0.0003341450125192804, 'samples': 11487168, 'steps': 59828, 'loss/train': 1.5808707475662231} -08/30/2021 23:56:51 - INFO - __main__ - Step 59830: {'lr': 0.0003341400153787336, 'samples': 11487360, 'steps': 59829, 'loss/train': 1.0826679468154907} -08/30/2021 23:56:53 - INFO - __main__ - Step 59831: {'lr': 0.00033413501820027456, 'samples': 11487552, 'steps': 59830, 'loss/train': 1.0123571157455444} -08/30/2021 23:56:53 - INFO - __main__ - Step 59832: {'lr': 0.00033413002098390567, 'samples': 11487744, 'steps': 59831, 'loss/train': 1.1429065465927124} -08/30/2021 23:56:54 - INFO - __main__ - Step 59833: {'lr': 0.00033412502372962894, 'samples': 11487936, 'steps': 59832, 'loss/train': 1.335215449333191} -08/30/2021 23:56:54 - INFO - __main__ - Step 59834: {'lr': 0.0003341200264374469, 'samples': 11488128, 'steps': 59833, 'loss/train': 1.3216681480407715} -08/30/2021 23:56:54 - INFO - __main__ - Step 59835: {'lr': 0.0003341150291073616, 'samples': 11488320, 'steps': 59834, 'loss/train': 1.0301731824874878} -08/30/2021 23:56:57 - INFO - __main__ - Step 59836: {'lr': 0.0003341100317393754, 'samples': 11488512, 'steps': 59835, 'loss/train': 1.4344308376312256} -08/30/2021 23:56:57 - INFO - __main__ - Step 59837: {'lr': 0.00033410503433349055, 'samples': 11488704, 'steps': 59836, 'loss/train': 0.5759755969047546} -08/30/2021 23:56:57 - INFO - __main__ - Step 59838: {'lr': 0.00033410003688970927, 'samples': 11488896, 'steps': 59837, 'loss/train': 1.4586576223373413} -08/30/2021 23:56:58 - INFO - __main__ - Step 59839: {'lr': 0.0003340950394080337, 'samples': 11489088, 'steps': 59838, 'loss/train': 1.195893406867981} -08/30/2021 23:56:58 - INFO - __main__ - Step 59840: {'lr': 0.0003340900418884663, 'samples': 11489280, 'steps': 59839, 'loss/train': 0.9461076855659485} -08/30/2021 23:56:59 - INFO - __main__ - Step 59841: {'lr': 0.00033408504433100916, 'samples': 11489472, 'steps': 59840, 'loss/train': 1.8688420057296753} -08/30/2021 23:57:00 - INFO - __main__ - Step 59842: {'lr': 0.0003340800467356647, 'samples': 11489664, 'steps': 59841, 'loss/train': 1.3909554481506348} -08/30/2021 23:57:00 - INFO - __main__ - Step 59843: {'lr': 0.00033407504910243504, 'samples': 11489856, 'steps': 59842, 'loss/train': 0.9482306241989136} -08/30/2021 23:57:01 - INFO - __main__ - Step 59844: {'lr': 0.0003340700514313224, 'samples': 11490048, 'steps': 59843, 'loss/train': 1.2253609895706177} -08/30/2021 23:57:01 - INFO - __main__ - Step 59845: {'lr': 0.0003340650537223291, 'samples': 11490240, 'steps': 59844, 'loss/train': 0.9642473459243774} -08/30/2021 23:57:02 - INFO - __main__ - Step 59846: {'lr': 0.0003340600559754574, 'samples': 11490432, 'steps': 59845, 'loss/train': 1.307847023010254} -08/30/2021 23:57:03 - INFO - __main__ - Step 59847: {'lr': 0.0003340550581907095, 'samples': 11490624, 'steps': 59846, 'loss/train': 1.3682631254196167} -08/30/2021 23:57:03 - INFO - __main__ - Step 59848: {'lr': 0.0003340500603680878, 'samples': 11490816, 'steps': 59847, 'loss/train': 1.4190080165863037} -08/30/2021 23:57:04 - INFO - __main__ - Step 59849: {'lr': 0.00033404506250759436, 'samples': 11491008, 'steps': 59848, 'loss/train': 1.7067573070526123} -08/30/2021 23:57:04 - INFO - __main__ - Step 59850: {'lr': 0.0003340400646092315, 'samples': 11491200, 'steps': 59849, 'loss/train': 1.9834634065628052} -08/30/2021 23:57:06 - INFO - __main__ - Step 59851: {'lr': 0.0003340350666730015, 'samples': 11491392, 'steps': 59850, 'loss/train': 0.5499975085258484} -08/30/2021 23:57:06 - INFO - __main__ - Step 59852: {'lr': 0.0003340300686989066, 'samples': 11491584, 'steps': 59851, 'loss/train': 0.4791135787963867} -08/30/2021 23:57:07 - INFO - __main__ - Step 59853: {'lr': 0.0003340250706869491, 'samples': 11491776, 'steps': 59852, 'loss/train': 0.043618444353342056} -08/30/2021 23:57:07 - INFO - __main__ - Step 59854: {'lr': 0.00033402007263713115, 'samples': 11491968, 'steps': 59853, 'loss/train': 0.031721729785203934} -08/30/2021 23:57:07 - INFO - __main__ - Step 59855: {'lr': 0.000334015074549455, 'samples': 11492160, 'steps': 59854, 'loss/train': 1.2451456785202026} -08/30/2021 23:57:08 - INFO - __main__ - Step 59856: {'lr': 0.000334010076423923, 'samples': 11492352, 'steps': 59855, 'loss/train': 1.618203043937683} -08/30/2021 23:57:09 - INFO - __main__ - Step 59857: {'lr': 0.00033400507826053733, 'samples': 11492544, 'steps': 59856, 'loss/train': 1.1706225872039795} -08/30/2021 23:57:10 - INFO - __main__ - Step 59858: {'lr': 0.0003340000800593004, 'samples': 11492736, 'steps': 59857, 'loss/train': 1.5623292922973633} -08/30/2021 23:57:10 - INFO - __main__ - Step 59859: {'lr': 0.0003339950818202142, 'samples': 11492928, 'steps': 59858, 'loss/train': 1.1343538761138916} -08/30/2021 23:57:10 - INFO - __main__ - Step 59860: {'lr': 0.00033399008354328106, 'samples': 11493120, 'steps': 59859, 'loss/train': 1.705298662185669} -08/30/2021 23:57:11 - INFO - __main__ - Step 59861: {'lr': 0.0003339850852285034, 'samples': 11493312, 'steps': 59860, 'loss/train': 1.181028962135315} -08/30/2021 23:57:12 - INFO - __main__ - Step 59862: {'lr': 0.00033398008687588333, 'samples': 11493504, 'steps': 59861, 'loss/train': 1.382114052772522} -08/30/2021 23:57:13 - INFO - __main__ - Step 59863: {'lr': 0.00033397508848542306, 'samples': 11493696, 'steps': 59862, 'loss/train': 1.5730162858963013} -08/30/2021 23:57:13 - INFO - __main__ - Step 59864: {'lr': 0.000333970090057125, 'samples': 11493888, 'steps': 59863, 'loss/train': 0.9286319613456726} -08/30/2021 23:57:13 - INFO - __main__ - Step 59865: {'lr': 0.00033396509159099133, 'samples': 11494080, 'steps': 59864, 'loss/train': 1.2114009857177734} -08/30/2021 23:57:14 - INFO - __main__ - Step 59866: {'lr': 0.00033396009308702426, 'samples': 11494272, 'steps': 59865, 'loss/train': 1.3148281574249268} -08/30/2021 23:57:14 - INFO - __main__ - Step 59867: {'lr': 0.000333955094545226, 'samples': 11494464, 'steps': 59866, 'loss/train': 1.6499541997909546} -08/30/2021 23:57:15 - INFO - __main__ - Step 59868: {'lr': 0.00033395009596559887, 'samples': 11494656, 'steps': 59867, 'loss/train': 0.9818961024284363} -08/30/2021 23:57:16 - INFO - __main__ - Step 59869: {'lr': 0.00033394509734814516, 'samples': 11494848, 'steps': 59868, 'loss/train': 1.1983884572982788} -08/30/2021 23:57:16 - INFO - __main__ - Step 59870: {'lr': 0.0003339400986928671, 'samples': 11495040, 'steps': 59869, 'loss/train': 1.9102174043655396} -08/30/2021 23:57:17 - INFO - __main__ - Step 59871: {'lr': 0.000333935099999767, 'samples': 11495232, 'steps': 59870, 'loss/train': 1.401785135269165} -08/30/2021 23:57:17 - INFO - __main__ - Step 59872: {'lr': 0.00033393010126884696, 'samples': 11495424, 'steps': 59871, 'loss/train': 1.3177196979522705} -08/30/2021 23:57:18 - INFO - __main__ - Step 59873: {'lr': 0.00033392510250010926, 'samples': 11495616, 'steps': 59872, 'loss/train': 1.6992017030715942} -08/30/2021 23:57:19 - INFO - __main__ - Step 59874: {'lr': 0.00033392010369355627, 'samples': 11495808, 'steps': 59873, 'loss/train': 0.8227543830871582} -08/30/2021 23:57:19 - INFO - __main__ - Step 59875: {'lr': 0.00033391510484919015, 'samples': 11496000, 'steps': 59874, 'loss/train': 1.7897945642471313} -08/30/2021 23:57:20 - INFO - __main__ - Step 59876: {'lr': 0.00033391010596701314, 'samples': 11496192, 'steps': 59875, 'loss/train': 1.1453529596328735} -08/30/2021 23:57:20 - INFO - __main__ - Step 59877: {'lr': 0.0003339051070470276, 'samples': 11496384, 'steps': 59876, 'loss/train': 0.8803033232688904} -08/30/2021 23:57:22 - INFO - __main__ - Step 59878: {'lr': 0.00033390010808923573, 'samples': 11496576, 'steps': 59877, 'loss/train': 1.0257887840270996} -08/30/2021 23:57:22 - INFO - __main__ - Step 59879: {'lr': 0.00033389510909363974, 'samples': 11496768, 'steps': 59878, 'loss/train': 1.421064853668213} -08/30/2021 23:57:23 - INFO - __main__ - Step 59880: {'lr': 0.00033389011006024183, 'samples': 11496960, 'steps': 59879, 'loss/train': 0.3296405076980591} -08/30/2021 23:57:23 - INFO - __main__ - Step 59881: {'lr': 0.0003338851109890444, 'samples': 11497152, 'steps': 59880, 'loss/train': 0.059413522481918335} -08/30/2021 23:57:23 - INFO - __main__ - Step 59882: {'lr': 0.00033388011188004965, 'samples': 11497344, 'steps': 59881, 'loss/train': 0.3087981641292572} -08/30/2021 23:57:25 - INFO - __main__ - Step 59883: {'lr': 0.00033387511273325976, 'samples': 11497536, 'steps': 59882, 'loss/train': 1.4966094493865967} -08/30/2021 23:57:25 - INFO - __main__ - Step 59884: {'lr': 0.0003338701135486771, 'samples': 11497728, 'steps': 59883, 'loss/train': 1.114499807357788} -08/30/2021 23:57:26 - INFO - __main__ - Step 59885: {'lr': 0.0003338651143263038, 'samples': 11497920, 'steps': 59884, 'loss/train': 0.1135730892419815} -08/30/2021 23:57:26 - INFO - __main__ - Step 59886: {'lr': 0.0003338601150661423, 'samples': 11498112, 'steps': 59885, 'loss/train': 0.5827957391738892} -08/30/2021 23:57:26 - INFO - __main__ - Step 59887: {'lr': 0.0003338551157681946, 'samples': 11498304, 'steps': 59886, 'loss/train': 0.7452296018600464} -08/30/2021 23:57:28 - INFO - __main__ - Step 59888: {'lr': 0.00033385011643246313, 'samples': 11498496, 'steps': 59887, 'loss/train': 1.2587543725967407} -08/30/2021 23:57:29 - INFO - __main__ - Step 59889: {'lr': 0.00033384511705895003, 'samples': 11498688, 'steps': 59888, 'loss/train': 1.1873503923416138} -08/30/2021 23:57:29 - INFO - __main__ - Step 59890: {'lr': 0.00033384011764765764, 'samples': 11498880, 'steps': 59889, 'loss/train': 1.2524337768554688} -08/30/2021 23:57:30 - INFO - __main__ - Step 59891: {'lr': 0.0003338351181985882, 'samples': 11499072, 'steps': 59890, 'loss/train': 0.9410980939865112} -08/30/2021 23:57:30 - INFO - __main__ - Step 59892: {'lr': 0.000333830118711744, 'samples': 11499264, 'steps': 59891, 'loss/train': 1.0223844051361084} -08/30/2021 23:57:30 - INFO - __main__ - Step 59893: {'lr': 0.00033382511918712723, 'samples': 11499456, 'steps': 59892, 'loss/train': 1.0214662551879883} -08/30/2021 23:57:32 - INFO - __main__ - Step 59894: {'lr': 0.00033382011962474004, 'samples': 11499648, 'steps': 59893, 'loss/train': 1.7625105381011963} -08/30/2021 23:57:32 - INFO - __main__ - Step 59895: {'lr': 0.0003338151200245849, 'samples': 11499840, 'steps': 59894, 'loss/train': 1.229467511177063} -08/30/2021 23:57:33 - INFO - __main__ - Step 59896: {'lr': 0.000333810120386664, 'samples': 11500032, 'steps': 59895, 'loss/train': 1.0320736169815063} -08/30/2021 23:57:33 - INFO - __main__ - Step 59897: {'lr': 0.00033380512071097947, 'samples': 11500224, 'steps': 59896, 'loss/train': 1.7375085353851318} -08/30/2021 23:57:33 - INFO - __main__ - Step 59898: {'lr': 0.00033380012099753364, 'samples': 11500416, 'steps': 59897, 'loss/train': 1.5975598096847534} -08/30/2021 23:57:35 - INFO - __main__ - Step 59899: {'lr': 0.00033379512124632885, 'samples': 11500608, 'steps': 59898, 'loss/train': 1.06941819190979} -08/30/2021 23:57:35 - INFO - __main__ - Step 59900: {'lr': 0.0003337901214573672, 'samples': 11500800, 'steps': 59899, 'loss/train': 1.3083606958389282} -08/30/2021 23:57:36 - INFO - __main__ - Step 59901: {'lr': 0.000333785121630651, 'samples': 11500992, 'steps': 59900, 'loss/train': 1.334172248840332} -08/30/2021 23:57:36 - INFO - __main__ - Step 59902: {'lr': 0.0003337801217661826, 'samples': 11501184, 'steps': 59901, 'loss/train': 1.0839506387710571} -08/30/2021 23:57:36 - INFO - __main__ - Step 59903: {'lr': 0.0003337751218639641, 'samples': 11501376, 'steps': 59902, 'loss/train': 1.4798659086227417} -08/30/2021 23:57:38 - INFO - __main__ - Step 59904: {'lr': 0.0003337701219239978, 'samples': 11501568, 'steps': 59903, 'loss/train': 1.450107216835022} -08/30/2021 23:57:38 - INFO - __main__ - Step 59905: {'lr': 0.00033376512194628605, 'samples': 11501760, 'steps': 59904, 'loss/train': 1.417326807975769} -08/30/2021 23:57:39 - INFO - __main__ - Step 59906: {'lr': 0.000333760121930831, 'samples': 11501952, 'steps': 59905, 'loss/train': 1.63825261592865} -08/30/2021 23:57:39 - INFO - __main__ - Step 59907: {'lr': 0.0003337551218776349, 'samples': 11502144, 'steps': 59906, 'loss/train': 1.145716905593872} -08/30/2021 23:57:39 - INFO - __main__ - Step 59908: {'lr': 0.0003337501217867001, 'samples': 11502336, 'steps': 59907, 'loss/train': 1.6498032808303833} -08/30/2021 23:57:41 - INFO - __main__ - Step 59909: {'lr': 0.00033374512165802874, 'samples': 11502528, 'steps': 59908, 'loss/train': 1.8988059759140015} -08/30/2021 23:57:41 - INFO - __main__ - Step 59910: {'lr': 0.00033374012149162314, 'samples': 11502720, 'steps': 59909, 'loss/train': 0.2469071000814438} -08/30/2021 23:57:42 - INFO - __main__ - Step 59911: {'lr': 0.0003337351212874856, 'samples': 11502912, 'steps': 59910, 'loss/train': 0.5788956880569458} -08/30/2021 23:57:42 - INFO - __main__ - Step 59912: {'lr': 0.00033373012104561815, 'samples': 11503104, 'steps': 59911, 'loss/train': 1.4770945310592651} -08/30/2021 23:57:42 - INFO - __main__ - Step 59913: {'lr': 0.0003337251207660233, 'samples': 11503296, 'steps': 59912, 'loss/train': 1.744764804840088} -08/30/2021 23:57:44 - INFO - __main__ - Step 59914: {'lr': 0.00033372012044870317, 'samples': 11503488, 'steps': 59913, 'loss/train': 1.0111316442489624} -08/30/2021 23:57:44 - INFO - __main__ - Step 59915: {'lr': 0.00033371512009366006, 'samples': 11503680, 'steps': 59914, 'loss/train': 1.3482054471969604} -08/30/2021 23:57:45 - INFO - __main__ - Step 59916: {'lr': 0.0003337101197008962, 'samples': 11503872, 'steps': 59915, 'loss/train': 0.8457168936729431} -08/30/2021 23:57:45 - INFO - __main__ - Step 59917: {'lr': 0.00033370511927041386, 'samples': 11504064, 'steps': 59916, 'loss/train': 1.6057029962539673} -08/30/2021 23:57:45 - INFO - __main__ - Step 59918: {'lr': 0.0003337001188022153, 'samples': 11504256, 'steps': 59917, 'loss/train': 1.407637357711792} -08/30/2021 23:57:46 - INFO - __main__ - Step 59919: {'lr': 0.0003336951182963027, 'samples': 11504448, 'steps': 59918, 'loss/train': 1.4570865631103516} -08/30/2021 23:57:48 - INFO - __main__ - Step 59920: {'lr': 0.0003336901177526784, 'samples': 11504640, 'steps': 59919, 'loss/train': 1.4743255376815796} -08/30/2021 23:57:48 - INFO - __main__ - Step 59921: {'lr': 0.0003336851171713447, 'samples': 11504832, 'steps': 59920, 'loss/train': 1.1863462924957275} -08/30/2021 23:57:49 - INFO - __main__ - Step 59922: {'lr': 0.00033368011655230366, 'samples': 11505024, 'steps': 59921, 'loss/train': 1.4263556003570557} -08/30/2021 23:57:49 - INFO - __main__ - Step 59923: {'lr': 0.0003336751158955577, 'samples': 11505216, 'steps': 59922, 'loss/train': 0.6447646021842957} -08/30/2021 23:57:49 - INFO - __main__ - Step 59924: {'lr': 0.00033367011520110906, 'samples': 11505408, 'steps': 59923, 'loss/train': 1.1414626836776733} -08/30/2021 23:57:51 - INFO - __main__ - Step 59925: {'lr': 0.00033366511446896, 'samples': 11505600, 'steps': 59924, 'loss/train': 1.3145540952682495} -08/30/2021 23:57:51 - INFO - __main__ - Step 59926: {'lr': 0.0003336601136991126, 'samples': 11505792, 'steps': 59925, 'loss/train': 0.9927424192428589} -08/30/2021 23:57:52 - INFO - __main__ - Step 59927: {'lr': 0.0003336551128915693, 'samples': 11505984, 'steps': 59926, 'loss/train': 1.2483415603637695} -08/30/2021 23:57:52 - INFO - __main__ - Step 59928: {'lr': 0.00033365011204633234, 'samples': 11506176, 'steps': 59927, 'loss/train': 1.9663574695587158} -08/30/2021 23:57:52 - INFO - __main__ - Step 59929: {'lr': 0.0003336451111634038, 'samples': 11506368, 'steps': 59928, 'loss/train': 1.0541672706604004} -08/30/2021 23:57:54 - INFO - __main__ - Step 59930: {'lr': 0.00033364011024278616, 'samples': 11506560, 'steps': 59929, 'loss/train': 1.6667582988739014} -08/30/2021 23:57:54 - INFO - __main__ - Step 59931: {'lr': 0.0003336351092844816, 'samples': 11506752, 'steps': 59930, 'loss/train': 0.2971011996269226} -08/30/2021 23:57:55 - INFO - __main__ - Step 59932: {'lr': 0.0003336301082884924, 'samples': 11506944, 'steps': 59931, 'loss/train': 1.9761375188827515} -08/30/2021 23:57:55 - INFO - __main__ - Step 59933: {'lr': 0.00033362510725482063, 'samples': 11507136, 'steps': 59932, 'loss/train': 1.3288410902023315} -08/30/2021 23:57:55 - INFO - __main__ - Step 59934: {'lr': 0.0003336201061834687, 'samples': 11507328, 'steps': 59933, 'loss/train': 1.4965769052505493} -08/30/2021 23:57:57 - INFO - __main__ - Step 59935: {'lr': 0.0003336151050744389, 'samples': 11507520, 'steps': 59934, 'loss/train': 1.2845549583435059} -08/30/2021 23:57:57 - INFO - __main__ - Step 59936: {'lr': 0.00033361010392773336, 'samples': 11507712, 'steps': 59935, 'loss/train': 0.32606035470962524} -08/30/2021 23:57:57 - INFO - __main__ - Step 59937: {'lr': 0.0003336051027433544, 'samples': 11507904, 'steps': 59936, 'loss/train': 1.5637669563293457} -08/30/2021 23:57:58 - INFO - __main__ - Step 59938: {'lr': 0.00033360010152130436, 'samples': 11508096, 'steps': 59937, 'loss/train': 1.0551283359527588} -08/30/2021 23:57:58 - INFO - __main__ - Step 59939: {'lr': 0.00033359510026158534, 'samples': 11508288, 'steps': 59938, 'loss/train': 1.6106975078582764} -08/30/2021 23:58:01 - INFO - __main__ - Step 59940: {'lr': 0.00033359009896419966, 'samples': 11508480, 'steps': 59939, 'loss/train': 1.4372414350509644} -08/30/2021 23:58:01 - INFO - __main__ - Step 59941: {'lr': 0.00033358509762914957, 'samples': 11508672, 'steps': 59940, 'loss/train': 1.8201642036437988} -08/30/2021 23:58:01 - INFO - __main__ - Step 59942: {'lr': 0.0003335800962564374, 'samples': 11508864, 'steps': 59941, 'loss/train': 1.0826791524887085} -08/30/2021 23:58:02 - INFO - __main__ - Step 59943: {'lr': 0.0003335750948460652, 'samples': 11509056, 'steps': 59942, 'loss/train': 0.5303946137428284} -08/30/2021 23:58:02 - INFO - __main__ - Step 59944: {'lr': 0.0003335700933980354, 'samples': 11509248, 'steps': 59943, 'loss/train': 0.4935438334941864} -08/30/2021 23:58:02 - INFO - __main__ - Step 59945: {'lr': 0.0003335650919123503, 'samples': 11509440, 'steps': 59944, 'loss/train': 0.03718230128288269} -08/30/2021 23:58:04 - INFO - __main__ - Step 59946: {'lr': 0.0003335600903890119, 'samples': 11509632, 'steps': 59945, 'loss/train': 0.03926106169819832} -08/30/2021 23:58:04 - INFO - __main__ - Step 59947: {'lr': 0.0003335550888280227, 'samples': 11509824, 'steps': 59946, 'loss/train': 1.1444340944290161} -08/30/2021 23:58:05 - INFO - __main__ - Step 59948: {'lr': 0.00033355008722938485, 'samples': 11510016, 'steps': 59947, 'loss/train': 1.2942636013031006} -08/30/2021 23:58:05 - INFO - __main__ - Step 59949: {'lr': 0.0003335450855931006, 'samples': 11510208, 'steps': 59948, 'loss/train': 1.9871902465820312} -08/30/2021 23:58:06 - INFO - __main__ - Step 59950: {'lr': 0.00033354008391917224, 'samples': 11510400, 'steps': 59949, 'loss/train': 1.2428416013717651} -08/30/2021 23:58:07 - INFO - __main__ - Step 59951: {'lr': 0.00033353508220760204, 'samples': 11510592, 'steps': 59950, 'loss/train': 1.0078407526016235} -08/30/2021 23:58:08 - INFO - __main__ - Step 59952: {'lr': 0.00033353008045839224, 'samples': 11510784, 'steps': 59951, 'loss/train': 0.8023725152015686} -08/30/2021 23:58:08 - INFO - __main__ - Step 59953: {'lr': 0.000333525078671545, 'samples': 11510976, 'steps': 59952, 'loss/train': 1.3900474309921265} -08/30/2021 23:58:08 - INFO - __main__ - Step 59954: {'lr': 0.0003335200768470627, 'samples': 11511168, 'steps': 59953, 'loss/train': 1.2211180925369263} -08/30/2021 23:58:09 - INFO - __main__ - Step 59955: {'lr': 0.0003335150749849475, 'samples': 11511360, 'steps': 59954, 'loss/train': 0.9000880122184753} -08/30/2021 23:58:10 - INFO - __main__ - Step 59956: {'lr': 0.0003335100730852017, 'samples': 11511552, 'steps': 59955, 'loss/train': 1.6677347421646118} -08/30/2021 23:58:10 - INFO - __main__ - Step 59957: {'lr': 0.0003335050711478276, 'samples': 11511744, 'steps': 59956, 'loss/train': 1.5843745470046997} -08/30/2021 23:58:11 - INFO - __main__ - Step 59958: {'lr': 0.0003335000691728273, 'samples': 11511936, 'steps': 59957, 'loss/train': 0.874744176864624} -08/30/2021 23:58:11 - INFO - __main__ - Step 59959: {'lr': 0.0003334950671602033, 'samples': 11512128, 'steps': 59958, 'loss/train': 1.0463758707046509} -08/30/2021 23:58:12 - INFO - __main__ - Step 59960: {'lr': 0.00033349006510995766, 'samples': 11512320, 'steps': 59959, 'loss/train': 0.8631131052970886} -08/30/2021 23:58:12 - INFO - __main__ - Step 59961: {'lr': 0.00033348506302209265, 'samples': 11512512, 'steps': 59960, 'loss/train': 1.395923376083374} -08/30/2021 23:58:13 - INFO - __main__ - Step 59962: {'lr': 0.00033348006089661055, 'samples': 11512704, 'steps': 59961, 'loss/train': 1.5277764797210693} -08/30/2021 23:58:14 - INFO - __main__ - Step 59963: {'lr': 0.0003334750587335136, 'samples': 11512896, 'steps': 59962, 'loss/train': 1.312781810760498} -08/30/2021 23:58:14 - INFO - __main__ - Step 59964: {'lr': 0.00033347005653280414, 'samples': 11513088, 'steps': 59963, 'loss/train': 1.4424299001693726} -08/30/2021 23:58:14 - INFO - __main__ - Step 59965: {'lr': 0.0003334650542944844, 'samples': 11513280, 'steps': 59964, 'loss/train': 1.5940728187561035} -08/30/2021 23:58:15 - INFO - __main__ - Step 59966: {'lr': 0.00033346005201855656, 'samples': 11513472, 'steps': 59965, 'loss/train': 1.9113858938217163} -08/30/2021 23:58:16 - INFO - __main__ - Step 59967: {'lr': 0.00033345504970502284, 'samples': 11513664, 'steps': 59966, 'loss/train': 1.5821585655212402} -08/30/2021 23:58:17 - INFO - __main__ - Step 59968: {'lr': 0.0003334500473538856, 'samples': 11513856, 'steps': 59967, 'loss/train': 1.1747950315475464} -08/30/2021 23:58:17 - INFO - __main__ - Step 59969: {'lr': 0.00033344504496514703, 'samples': 11514048, 'steps': 59968, 'loss/train': 1.3834439516067505} -08/30/2021 23:58:17 - INFO - __main__ - Step 59970: {'lr': 0.0003334400425388095, 'samples': 11514240, 'steps': 59969, 'loss/train': 1.16960608959198} -08/30/2021 23:58:18 - INFO - __main__ - Step 59971: {'lr': 0.00033343504007487515, 'samples': 11514432, 'steps': 59970, 'loss/train': 1.699402093887329} -08/30/2021 23:58:19 - INFO - __main__ - Step 59972: {'lr': 0.00033343003757334625, 'samples': 11514624, 'steps': 59971, 'loss/train': 1.7500873804092407} -08/30/2021 23:58:20 - INFO - __main__ - Step 59973: {'lr': 0.000333425035034225, 'samples': 11514816, 'steps': 59972, 'loss/train': 1.920077919960022} -08/30/2021 23:58:20 - INFO - __main__ - Step 59974: {'lr': 0.00033342003245751374, 'samples': 11515008, 'steps': 59973, 'loss/train': 1.5325719118118286} -08/30/2021 23:58:20 - INFO - __main__ - Step 59975: {'lr': 0.0003334150298432147, 'samples': 11515200, 'steps': 59974, 'loss/train': 1.2195863723754883} -08/30/2021 23:58:21 - INFO - __main__ - Step 59976: {'lr': 0.00033341002719133016, 'samples': 11515392, 'steps': 59975, 'loss/train': 0.8065526485443115} -08/30/2021 23:58:22 - INFO - __main__ - Step 59977: {'lr': 0.0003334050245018624, 'samples': 11515584, 'steps': 59976, 'loss/train': 1.0746419429779053} -08/30/2021 23:58:23 - INFO - __main__ - Step 59978: {'lr': 0.00033340002177481353, 'samples': 11515776, 'steps': 59977, 'loss/train': 1.3480299711227417} -08/30/2021 23:58:23 - INFO - __main__ - Step 59979: {'lr': 0.00033339501901018595, 'samples': 11515968, 'steps': 59978, 'loss/train': 0.912415087223053} -08/30/2021 23:58:24 - INFO - __main__ - Step 59980: {'lr': 0.0003333900162079818, 'samples': 11516160, 'steps': 59979, 'loss/train': 0.5242136120796204} -08/30/2021 23:58:24 - INFO - __main__ - Step 59981: {'lr': 0.00033338501336820347, 'samples': 11516352, 'steps': 59980, 'loss/train': 1.3247582912445068} -08/30/2021 23:58:26 - INFO - __main__ - Step 59982: {'lr': 0.0003333800104908531, 'samples': 11516544, 'steps': 59981, 'loss/train': 2.3978195190429688} -08/30/2021 23:58:26 - INFO - __main__ - Step 59983: {'lr': 0.00033337500757593306, 'samples': 11516736, 'steps': 59982, 'loss/train': 0.7306232452392578} -08/30/2021 23:58:26 - INFO - __main__ - Step 59984: {'lr': 0.0003333700046234454, 'samples': 11516928, 'steps': 59983, 'loss/train': 1.4217044115066528} -08/30/2021 23:58:27 - INFO - __main__ - Step 59985: {'lr': 0.00033336500163339255, 'samples': 11517120, 'steps': 59984, 'loss/train': 2.6274688243865967} -08/30/2021 23:58:27 - INFO - __main__ - Step 59986: {'lr': 0.00033335999860577677, 'samples': 11517312, 'steps': 59985, 'loss/train': 2.3362929821014404} -08/30/2021 23:58:29 - INFO - __main__ - Step 59987: {'lr': 0.0003333549955406002, 'samples': 11517504, 'steps': 59986, 'loss/train': 0.8453044891357422} -08/30/2021 23:58:29 - INFO - __main__ - Step 59988: {'lr': 0.0003333499924378652, 'samples': 11517696, 'steps': 59987, 'loss/train': 1.0473734140396118} -08/30/2021 23:58:29 - INFO - __main__ - Step 59989: {'lr': 0.00033334498929757394, 'samples': 11517888, 'steps': 59988, 'loss/train': 1.5850181579589844} -08/30/2021 23:58:30 - INFO - __main__ - Step 59990: {'lr': 0.0003333399861197287, 'samples': 11518080, 'steps': 59989, 'loss/train': 1.8422579765319824} -08/30/2021 23:58:30 - INFO - __main__ - Step 59991: {'lr': 0.00033333498290433184, 'samples': 11518272, 'steps': 59990, 'loss/train': 1.579368233680725} -08/30/2021 23:58:30 - INFO - __main__ - Step 59992: {'lr': 0.00033332997965138545, 'samples': 11518464, 'steps': 59991, 'loss/train': 1.1963123083114624} -08/30/2021 23:58:32 - INFO - __main__ - Step 59993: {'lr': 0.0003333249763608919, 'samples': 11518656, 'steps': 59992, 'loss/train': 1.4305427074432373} -08/30/2021 23:58:32 - INFO - __main__ - Step 59994: {'lr': 0.00033331997303285334, 'samples': 11518848, 'steps': 59993, 'loss/train': 1.2449132204055786} -08/30/2021 23:58:33 - INFO - __main__ - Step 59995: {'lr': 0.00033331496966727207, 'samples': 11519040, 'steps': 59994, 'loss/train': 1.3063499927520752} -08/30/2021 23:58:33 - INFO - __main__ - Step 59996: {'lr': 0.00033330996626415046, 'samples': 11519232, 'steps': 59995, 'loss/train': 0.9000343680381775} -08/30/2021 23:58:33 - INFO - __main__ - Step 59997: {'lr': 0.0003333049628234906, 'samples': 11519424, 'steps': 59996, 'loss/train': 1.6371190547943115} -08/30/2021 23:58:36 - INFO - __main__ - Step 59998: {'lr': 0.0003332999593452948, 'samples': 11519616, 'steps': 59997, 'loss/train': 1.5421613454818726} -08/30/2021 23:58:36 - INFO - __main__ - Step 59999: {'lr': 0.0003332949558295654, 'samples': 11519808, 'steps': 59998, 'loss/train': 1.0983376502990723} -08/30/2021 23:58:36 - INFO - __main__ - Step 60000: {'lr': 0.0003332899522763045, 'samples': 11520000, 'steps': 59999, 'loss/train': 1.3309777975082397} -08/30/2021 23:58:37 - INFO - __main__ - Evaluating model checkpoint -08/31/2021 00:07:18 - INFO - __main__ - Step 60000: {'loss/eval': 1.1882071495056152, 'perplexity': 3.281193256378174} -08/31/2021 00:07:18 - INFO - __main__ - Saving model checkpoint +version https://git-lfs.github.com/spec/v1 +oid sha256:7f51d46c136e473cc41bc6ddc1e830c3b4cb96f28fd852056d0e3632cad160ed +size 11445768